| Elliott Hughes | f1ada79 | 2014-05-02 17:56:56 -0700 | [diff] [blame] | 1 | /*	$OpenBSD: vfwscanf.c,v 1.4 2014/03/19 05:17:01 guenther Exp $ */ | 
| Elliott Hughes | 01ae00f | 2014-04-29 16:28:56 -0700 | [diff] [blame] | 2 | /*- | 
 | 3 |  * Copyright (c) 1990, 1993 | 
 | 4 |  *	The Regents of the University of California.  All rights reserved. | 
 | 5 |  * | 
 | 6 |  * This code is derived from software contributed to Berkeley by | 
 | 7 |  * Chris Torek. | 
 | 8 |  * | 
 | 9 |  * Redistribution and use in source and binary forms, with or without | 
 | 10 |  * modification, are permitted provided that the following conditions | 
 | 11 |  * are met: | 
 | 12 |  * 1. Redistributions of source code must retain the above copyright | 
 | 13 |  *    notice, this list of conditions and the following disclaimer. | 
 | 14 |  * 2. Redistributions in binary form must reproduce the above copyright | 
 | 15 |  *    notice, this list of conditions and the following disclaimer in the | 
 | 16 |  *    documentation and/or other materials provided with the distribution. | 
 | 17 |  * 3. Neither the name of the University nor the names of its contributors | 
 | 18 |  *    may be used to endorse or promote products derived from this software | 
 | 19 |  *    without specific prior written permission. | 
 | 20 |  * | 
 | 21 |  * THIS SOFTWARE IS PROVIDED BY THE REGENTS AND CONTRIBUTORS ``AS IS'' AND | 
 | 22 |  * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE | 
 | 23 |  * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE | 
 | 24 |  * ARE DISCLAIMED.  IN NO EVENT SHALL THE REGENTS OR CONTRIBUTORS BE LIABLE | 
 | 25 |  * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL | 
 | 26 |  * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS | 
 | 27 |  * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) | 
 | 28 |  * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT | 
 | 29 |  * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY | 
 | 30 |  * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF | 
 | 31 |  * SUCH DAMAGE. | 
 | 32 |  */ | 
 | 33 |  | 
| Elliott Hughes | 01ae00f | 2014-04-29 16:28:56 -0700 | [diff] [blame] | 34 | #include <inttypes.h> | 
 | 35 | #include <limits.h> | 
 | 36 | #include <locale.h> | 
 | 37 | #include <stdarg.h> | 
 | 38 | #include <stddef.h> | 
 | 39 | #include <stdio.h> | 
 | 40 | #include <stdlib.h> | 
 | 41 | #include <string.h> | 
 | 42 | #include <wctype.h> | 
 | 43 | #include "local.h" | 
 | 44 |  | 
/*
 * Size, in wide characters, of the scratch buffer used for numeric
 * conversions.  The scanner caps the field width at BUF - 1 so that there is
 * always room for the terminating L'\0'.
 */
#define BUF 513 /* Maximum length of numeric string. */

/*
 * Flags used during conversion.
 *
 * These are OR-ed into the per-directive `flags' word while the length
 * modifiers and the conversion letter of a single % directive are parsed.
 */
#define LONG 0x00001       /* l: long or double */
#define LONGDBL 0x00002    /* L: long double */
#define SHORT 0x00004      /* h: short */
#define SHORTSHORT 0x00008 /* hh: 8 bit integer */
#define LLONG 0x00010      /* ll: long long (+ deprecated q: quad) */
#define POINTER 0x00020    /* p: void * (as hex) */
#define SIZEINT 0x00040    /* z: (signed) size_t */
#define MAXINT 0x00080     /* j: intmax_t */
#define PTRINT 0x00100     /* t: ptrdiff_t */
#define NOSKIP 0x00200     /* [ or c: do not skip blanks */
#define SUPPRESS 0x00400   /* *: suppress assignment */
#define UNSIGNED 0x00800   /* %[oupxX] conversions */

/*
 * The following are used in numeric conversions only:
 * SIGNOK, HAVESIGN, NDIGITS, DPTOK, and EXPOK are for floating point;
 * SIGNOK, HAVESIGN, NDIGITS, PFXOK, and NZDIGITS are for integral.
 *
 * Note that DPTOK/EXPOK and PFXOK/NZDIGITS intentionally share the same bit
 * values (0x08000 and 0x10000): a single conversion is either floating point
 * or integral, never both, so the two pairs cannot collide.
 */
#define SIGNOK 0x01000   /* +/- is (still) legal */
#define HAVESIGN 0x02000 /* sign detected */
#define NDIGITS 0x04000  /* no digits detected */

/* Floating-point-only state bits (alias the integral-only bits below). */
#define DPTOK 0x08000 /* (float) decimal point is still legal */
#define EXPOK 0x10000 /* (float) exponent (e+3, etc) still legal */

/* Integral-only state bits (alias the floating-point-only bits above). */
#define PFXOK 0x08000    /* 0x prefix is (still) legal */
#define NZDIGITS 0x10000 /* no zero digits detected */

/*
 * Conversion types.
 *
 * Once the conversion letter has been decoded, the scanner replaces the
 * format character with one of these codes and dispatches on it.
 */
#define CT_CHAR 0   /* %c conversion */
#define CT_CCL 1    /* %[...] conversion */
#define CT_STRING 2 /* %s conversion */
#define CT_INT 3    /* integer, i.e., strtoimax or strtoumax */
#define CT_FLOAT 4  /* floating, i.e., strtod */
| Elliott Hughes | 01ae00f | 2014-04-29 16:28:56 -0700 | [diff] [blame] | 86 |  | 
// Interpretive counterpart of __sccl from vfscanf.c: rather than expanding the
// scanset into a lookup table (far too large for the wchar_t range), the set
// text is re-read for every candidate character.
//
// `ccl` points just past the '[' of a %[...] directive; the set ends at the
// first unescaped ']' or at the end of the format string. Returns true when
// `wc` is accepted by the set (taking a leading '^' negation into account).
static inline bool in_ccl(wchar_t wc, const wchar_t* ccl) {
  const wchar_t* cur = ccl;

  // A leading '^' inverts the sense of the whole set.
  bool on_hit = true;
  if (*cur == '^') {
    on_hit = false;
    ++cur;
  }

  // In first position, ']' and '-' are ordinary members.
  if (*cur == '-' || *cur == ']') {
    if (*cur == wc) return on_hit;
    ++cur;
  }

  for (; *cur != '\0' && *cur != ']'; ++cur) {
    // A '-' only introduces a range when something other than the end of the
    // set follows it; a trailing '-' is an ordinary member.
    bool range_op = (*cur == '-') && cur[1] != '\0' && cur[1] != ']';
    if (range_op) {
      wchar_t lo = cur[-1];
      wchar_t hi = cur[1];
      if (lo <= hi) {
        if (lo <= wc && wc <= hi) return on_hit;
        // Skip the range's upper bound too (the loop step skips the '-').
        ++cur;
        continue;
      }
      // Descending "range": the '-' is treated as a plain character, so fall
      // through to the literal comparison below.
    }
    if (*cur == wc) return on_hit;
  }

  // Ran off the end of the set without a hit.
  return !on_hit;
}
| Elliott Hughes | 01ae00f | 2014-04-29 16:28:56 -0700 | [diff] [blame] | 124 |  | 
| Elliott Hughes | 7f0849f | 2016-08-26 16:17:17 -0700 | [diff] [blame] | 125 | #pragma GCC diagnostic push | 
 | 126 | #pragma GCC diagnostic ignored "-Wframe-larger-than=" | 
 | 127 |  | 
| Elliott Hughes | 01ae00f | 2014-04-29 16:28:56 -0700 | [diff] [blame] | 128 | /* | 
 | 129 |  * vfwscanf | 
 | 130 |  */ | 
| Elliott Hughes | c8f2c52 | 2017-10-31 13:07:51 -0700 | [diff] [blame] | 131 | int __vfwscanf(FILE* __restrict fp, const wchar_t* __restrict fmt, __va_list ap) { | 
 | 132 |   wint_t c;               /* character from format, or conversion */ | 
 | 133 |   size_t width;           /* field width, or 0 */ | 
 | 134 |   wchar_t* p;             /* points into all kinds of strings */ | 
 | 135 |   int n;                  /* handy integer */ | 
 | 136 |   int flags;              /* flags as defined above */ | 
 | 137 |   wchar_t* p0;            /* saves original value of p when necessary */ | 
 | 138 |   int nassigned;          /* number of fields assigned */ | 
 | 139 |   int nconversions;       /* number of conversions */ | 
 | 140 |   int nread;              /* number of characters consumed from fp */ | 
 | 141 |   int base;               /* base argument to strtoimax/strtouimax */ | 
 | 142 |   wchar_t buf[BUF];       /* buffer for numeric conversions */ | 
| Elliott Hughes | 0d3ba1f | 2017-12-06 16:41:35 -0800 | [diff] [blame] | 143 |   const wchar_t* ccl; | 
| Elliott Hughes | c8f2c52 | 2017-10-31 13:07:51 -0700 | [diff] [blame] | 144 |   wint_t wi;              /* handy wint_t */ | 
 | 145 |   char* mbp;              /* multibyte string pointer for %c %s %[ */ | 
 | 146 |   size_t nconv;           /* number of bytes in mb. conversion */ | 
 | 147 |   char mbbuf[MB_LEN_MAX]; /* temporary mb. character buffer */ | 
 | 148 |   mbstate_t mbs; | 
| Elliott Hughes | 01ae00f | 2014-04-29 16:28:56 -0700 | [diff] [blame] | 149 |  | 
| Elliott Hughes | c8f2c52 | 2017-10-31 13:07:51 -0700 | [diff] [blame] | 150 |   /* `basefix' is used to avoid `if' tests in the integer scanner */ | 
 | 151 |   static short basefix[17] = { 10, 1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16 }; | 
| Elliott Hughes | 01ae00f | 2014-04-29 16:28:56 -0700 | [diff] [blame] | 152 |  | 
| Elliott Hughes | c8f2c52 | 2017-10-31 13:07:51 -0700 | [diff] [blame] | 153 |   _SET_ORIENTATION(fp, 1); | 
| Elliott Hughes | 01ae00f | 2014-04-29 16:28:56 -0700 | [diff] [blame] | 154 |  | 
| Elliott Hughes | c8f2c52 | 2017-10-31 13:07:51 -0700 | [diff] [blame] | 155 |   nassigned = 0; | 
 | 156 |   nconversions = 0; | 
 | 157 |   nread = 0; | 
 | 158 |   base = 0; /* XXX just to keep gcc happy */ | 
| Elliott Hughes | c8f2c52 | 2017-10-31 13:07:51 -0700 | [diff] [blame] | 159 |   for (;;) { | 
 | 160 |     c = *fmt++; | 
 | 161 |     if (c == 0) { | 
 | 162 |       return (nassigned); | 
 | 163 |     } | 
 | 164 |     if (iswspace(c)) { | 
 | 165 |       while ((c = __fgetwc_unlock(fp)) != WEOF && iswspace(c)) | 
 | 166 |         ; | 
 | 167 |       if (c != WEOF) __ungetwc(c, fp); | 
 | 168 |       continue; | 
 | 169 |     } | 
 | 170 |     if (c != '%') goto literal; | 
 | 171 |     width = 0; | 
 | 172 |     flags = 0; | 
 | 173 |     /* | 
 | 174 |      * switch on the format.  continue if done; | 
 | 175 |      * break once format type is derived. | 
 | 176 |      */ | 
 | 177 |   again: | 
 | 178 |     c = *fmt++; | 
 | 179 |     switch (c) { | 
 | 180 |       case '%': | 
 | 181 |       literal: | 
 | 182 |         if ((wi = __fgetwc_unlock(fp)) == WEOF) goto input_failure; | 
 | 183 |         if (wi != c) { | 
 | 184 |           __ungetwc(wi, fp); | 
| Elliott Hughes | bf9cb9e | 2017-12-11 12:39:01 -0800 | [diff] [blame] | 185 |           goto match_failure; | 
| Elliott Hughes | c8f2c52 | 2017-10-31 13:07:51 -0700 | [diff] [blame] | 186 |         } | 
 | 187 |         nread++; | 
 | 188 |         continue; | 
| Elliott Hughes | 01ae00f | 2014-04-29 16:28:56 -0700 | [diff] [blame] | 189 |  | 
| Elliott Hughes | c8f2c52 | 2017-10-31 13:07:51 -0700 | [diff] [blame] | 190 |       case '*': | 
 | 191 |         flags |= SUPPRESS; | 
 | 192 |         goto again; | 
 | 193 |       case 'j': | 
 | 194 |         flags |= MAXINT; | 
 | 195 |         goto again; | 
 | 196 |       case 'L': | 
 | 197 |         flags |= LONGDBL; | 
 | 198 |         goto again; | 
 | 199 |       case 'h': | 
 | 200 |         if (*fmt == 'h') { | 
 | 201 |           fmt++; | 
 | 202 |           flags |= SHORTSHORT; | 
 | 203 |         } else { | 
 | 204 |           flags |= SHORT; | 
 | 205 |         } | 
 | 206 |         goto again; | 
 | 207 |       case 'l': | 
 | 208 |         if (*fmt == 'l') { | 
 | 209 |           fmt++; | 
 | 210 |           flags |= LLONG; | 
 | 211 |         } else { | 
 | 212 |           flags |= LONG; | 
 | 213 |         } | 
 | 214 |         goto again; | 
 | 215 |       case 'q': | 
 | 216 |         flags |= LLONG; /* deprecated */ | 
 | 217 |         goto again; | 
 | 218 |       case 't': | 
 | 219 |         flags |= PTRINT; | 
 | 220 |         goto again; | 
 | 221 |       case 'z': | 
 | 222 |         flags |= SIZEINT; | 
 | 223 |         goto again; | 
| Elliott Hughes | 01ae00f | 2014-04-29 16:28:56 -0700 | [diff] [blame] | 224 |  | 
| Elliott Hughes | c8f2c52 | 2017-10-31 13:07:51 -0700 | [diff] [blame] | 225 |       case '0': | 
 | 226 |       case '1': | 
 | 227 |       case '2': | 
 | 228 |       case '3': | 
 | 229 |       case '4': | 
 | 230 |       case '5': | 
 | 231 |       case '6': | 
 | 232 |       case '7': | 
 | 233 |       case '8': | 
 | 234 |       case '9': | 
 | 235 |         width = width * 10 + c - '0'; | 
 | 236 |         goto again; | 
| Elliott Hughes | 01ae00f | 2014-04-29 16:28:56 -0700 | [diff] [blame] | 237 |  | 
| Elliott Hughes | c8f2c52 | 2017-10-31 13:07:51 -0700 | [diff] [blame] | 238 |       /* | 
 | 239 |        * Conversions. | 
 | 240 |        * Those marked `compat' are for 4.[123]BSD compatibility. | 
| Elliott Hughes | c8f2c52 | 2017-10-31 13:07:51 -0700 | [diff] [blame] | 241 |        */ | 
 | 242 |       case 'D': /* compat */ | 
 | 243 |         flags |= LONG; | 
 | 244 |         /* FALLTHROUGH */ | 
 | 245 |       case 'd': | 
 | 246 |         c = CT_INT; | 
 | 247 |         base = 10; | 
 | 248 |         break; | 
| Elliott Hughes | 01ae00f | 2014-04-29 16:28:56 -0700 | [diff] [blame] | 249 |  | 
| Elliott Hughes | c8f2c52 | 2017-10-31 13:07:51 -0700 | [diff] [blame] | 250 |       case 'i': | 
 | 251 |         c = CT_INT; | 
 | 252 |         base = 0; | 
 | 253 |         break; | 
| Elliott Hughes | 01ae00f | 2014-04-29 16:28:56 -0700 | [diff] [blame] | 254 |  | 
| Elliott Hughes | c8f2c52 | 2017-10-31 13:07:51 -0700 | [diff] [blame] | 255 |       case 'O': /* compat */ | 
 | 256 |         flags |= LONG; | 
 | 257 |         /* FALLTHROUGH */ | 
 | 258 |       case 'o': | 
 | 259 |         c = CT_INT; | 
 | 260 |         flags |= UNSIGNED; | 
 | 261 |         base = 8; | 
 | 262 |         break; | 
| Elliott Hughes | 01ae00f | 2014-04-29 16:28:56 -0700 | [diff] [blame] | 263 |  | 
| Elliott Hughes | c8f2c52 | 2017-10-31 13:07:51 -0700 | [diff] [blame] | 264 |       case 'u': | 
 | 265 |         c = CT_INT; | 
 | 266 |         flags |= UNSIGNED; | 
 | 267 |         base = 10; | 
 | 268 |         break; | 
| Elliott Hughes | 01ae00f | 2014-04-29 16:28:56 -0700 | [diff] [blame] | 269 |  | 
| Elliott Hughes | c8f2c52 | 2017-10-31 13:07:51 -0700 | [diff] [blame] | 270 |       case 'X': | 
 | 271 |       case 'x': | 
 | 272 |         flags |= PFXOK; /* enable 0x prefixing */ | 
 | 273 |         c = CT_INT; | 
 | 274 |         flags |= UNSIGNED; | 
 | 275 |         base = 16; | 
 | 276 |         break; | 
| Elliott Hughes | 01ae00f | 2014-04-29 16:28:56 -0700 | [diff] [blame] | 277 |  | 
| Elliott Hughes | c8f2c52 | 2017-10-31 13:07:51 -0700 | [diff] [blame] | 278 |       case 'e': | 
 | 279 |       case 'E': | 
 | 280 |       case 'f': | 
 | 281 |       case 'F': | 
 | 282 |       case 'g': | 
 | 283 |       case 'G': | 
 | 284 |       case 'a': | 
 | 285 |       case 'A': | 
 | 286 |         c = CT_FLOAT; | 
 | 287 |         break; | 
| Elliott Hughes | 01ae00f | 2014-04-29 16:28:56 -0700 | [diff] [blame] | 288 |  | 
| Elliott Hughes | c8f2c52 | 2017-10-31 13:07:51 -0700 | [diff] [blame] | 289 |       case 's': | 
 | 290 |         c = CT_STRING; | 
 | 291 |         break; | 
| Elliott Hughes | 01ae00f | 2014-04-29 16:28:56 -0700 | [diff] [blame] | 292 |  | 
| Elliott Hughes | c8f2c52 | 2017-10-31 13:07:51 -0700 | [diff] [blame] | 293 |       case '[': | 
| Elliott Hughes | 0d3ba1f | 2017-12-06 16:41:35 -0800 | [diff] [blame] | 294 |         ccl = fmt; | 
 | 295 |         if (*fmt == '^') fmt++; | 
| Elliott Hughes | c8f2c52 | 2017-10-31 13:07:51 -0700 | [diff] [blame] | 296 |         if (*fmt == ']') fmt++; | 
 | 297 |         while (*fmt != '\0' && *fmt != ']') fmt++; | 
| Elliott Hughes | c8f2c52 | 2017-10-31 13:07:51 -0700 | [diff] [blame] | 298 |         fmt++; | 
 | 299 |         flags |= NOSKIP; | 
 | 300 |         c = CT_CCL; | 
 | 301 |         break; | 
| Elliott Hughes | 01ae00f | 2014-04-29 16:28:56 -0700 | [diff] [blame] | 302 |  | 
| Elliott Hughes | c8f2c52 | 2017-10-31 13:07:51 -0700 | [diff] [blame] | 303 |       case 'c': | 
 | 304 |         flags |= NOSKIP; | 
 | 305 |         c = CT_CHAR; | 
 | 306 |         break; | 
| Elliott Hughes | 01ae00f | 2014-04-29 16:28:56 -0700 | [diff] [blame] | 307 |  | 
| Elliott Hughes | c8f2c52 | 2017-10-31 13:07:51 -0700 | [diff] [blame] | 308 |       case 'p': /* pointer format is like hex */ | 
 | 309 |         flags |= POINTER | PFXOK; | 
 | 310 |         c = CT_INT; | 
 | 311 |         flags |= UNSIGNED; | 
 | 312 |         base = 16; | 
 | 313 |         break; | 
| Elliott Hughes | 01ae00f | 2014-04-29 16:28:56 -0700 | [diff] [blame] | 314 |  | 
| Elliott Hughes | c8f2c52 | 2017-10-31 13:07:51 -0700 | [diff] [blame] | 315 |       case 'n': | 
 | 316 |         nconversions++; | 
 | 317 |         if (flags & SUPPRESS) continue; | 
 | 318 |         if (flags & SHORTSHORT) | 
 | 319 |           *va_arg(ap, signed char*) = nread; | 
 | 320 |         else if (flags & SHORT) | 
 | 321 |           *va_arg(ap, short*) = nread; | 
 | 322 |         else if (flags & LONG) | 
 | 323 |           *va_arg(ap, long*) = nread; | 
 | 324 |         else if (flags & SIZEINT) | 
 | 325 |           *va_arg(ap, ssize_t*) = nread; | 
 | 326 |         else if (flags & PTRINT) | 
 | 327 |           *va_arg(ap, ptrdiff_t*) = nread; | 
 | 328 |         else if (flags & LLONG) | 
 | 329 |           *va_arg(ap, long long*) = nread; | 
 | 330 |         else if (flags & MAXINT) | 
 | 331 |           *va_arg(ap, intmax_t*) = nread; | 
 | 332 |         else | 
 | 333 |           *va_arg(ap, int*) = nread; | 
 | 334 |         continue; | 
| Elliott Hughes | 01ae00f | 2014-04-29 16:28:56 -0700 | [diff] [blame] | 335 |  | 
| Elliott Hughes | c8f2c52 | 2017-10-31 13:07:51 -0700 | [diff] [blame] | 336 |       /* | 
 | 337 |        * Disgusting backwards compatibility hacks.	XXX | 
 | 338 |        */ | 
 | 339 |       case '\0': /* compat */ | 
 | 340 |         return (EOF); | 
| Elliott Hughes | 01ae00f | 2014-04-29 16:28:56 -0700 | [diff] [blame] | 341 |  | 
| Elliott Hughes | c8f2c52 | 2017-10-31 13:07:51 -0700 | [diff] [blame] | 342 |       default: /* compat */ | 
 | 343 |         if (iswupper(c)) flags |= LONG; | 
 | 344 |         c = CT_INT; | 
 | 345 |         base = 10; | 
 | 346 |         break; | 
 | 347 |     } | 
| Elliott Hughes | 01ae00f | 2014-04-29 16:28:56 -0700 | [diff] [blame] | 348 |  | 
| Elliott Hughes | c8f2c52 | 2017-10-31 13:07:51 -0700 | [diff] [blame] | 349 |     /* | 
 | 350 |      * Consume leading white space, except for formats | 
 | 351 |      * that suppress this. | 
 | 352 |      */ | 
 | 353 |     if ((flags & NOSKIP) == 0) { | 
 | 354 |       while ((wi = __fgetwc_unlock(fp)) != WEOF && iswspace(wi)) nread++; | 
 | 355 |       if (wi == WEOF) goto input_failure; | 
 | 356 |       __ungetwc(wi, fp); | 
 | 357 |     } | 
| Elliott Hughes | 01ae00f | 2014-04-29 16:28:56 -0700 | [diff] [blame] | 358 |  | 
| Elliott Hughes | c8f2c52 | 2017-10-31 13:07:51 -0700 | [diff] [blame] | 359 |     /* | 
 | 360 |      * Do the conversion. | 
 | 361 |      */ | 
 | 362 |     switch (c) { | 
 | 363 |       case CT_CHAR: | 
 | 364 |         /* scan arbitrary characters (sets NOSKIP) */ | 
 | 365 |         if (width == 0) width = 1; | 
 | 366 |         if (flags & LONG) { | 
 | 367 |           if (!(flags & SUPPRESS)) p = va_arg(ap, wchar_t*); | 
 | 368 |           n = 0; | 
 | 369 |           while (width-- != 0 && (wi = __fgetwc_unlock(fp)) != WEOF) { | 
 | 370 |             if (!(flags & SUPPRESS)) *p++ = (wchar_t)wi; | 
 | 371 |             n++; | 
 | 372 |           } | 
 | 373 |           if (n == 0) goto input_failure; | 
 | 374 |           nread += n; | 
 | 375 |           if (!(flags & SUPPRESS)) nassigned++; | 
 | 376 |         } else { | 
 | 377 |           if (!(flags & SUPPRESS)) mbp = va_arg(ap, char*); | 
 | 378 |           n = 0; | 
 | 379 |           memset(&mbs, 0, sizeof(mbs)); | 
 | 380 |           while (width != 0 && (wi = __fgetwc_unlock(fp)) != WEOF) { | 
 | 381 |             if (width >= MB_CUR_MAX && !(flags & SUPPRESS)) { | 
 | 382 |               nconv = wcrtomb(mbp, wi, &mbs); | 
 | 383 |               if (nconv == (size_t)-1) goto input_failure; | 
 | 384 |             } else { | 
 | 385 |               nconv = wcrtomb(mbbuf, wi, &mbs); | 
 | 386 |               if (nconv == (size_t)-1) goto input_failure; | 
 | 387 |               if (nconv > width) { | 
 | 388 |                 __ungetwc(wi, fp); | 
 | 389 |                 break; | 
 | 390 |               } | 
 | 391 |               if (!(flags & SUPPRESS)) memcpy(mbp, mbbuf, nconv); | 
 | 392 |             } | 
 | 393 |             if (!(flags & SUPPRESS)) mbp += nconv; | 
 | 394 |             width -= nconv; | 
 | 395 |             n++; | 
 | 396 |           } | 
 | 397 |           if (n == 0) goto input_failure; | 
 | 398 |           nread += n; | 
 | 399 |           if (!(flags & SUPPRESS)) nassigned++; | 
 | 400 |         } | 
 | 401 |         nconversions++; | 
 | 402 |         break; | 
| Elliott Hughes | 01ae00f | 2014-04-29 16:28:56 -0700 | [diff] [blame] | 403 |  | 
| Elliott Hughes | c8f2c52 | 2017-10-31 13:07:51 -0700 | [diff] [blame] | 404 |       case CT_CCL: | 
| Elliott Hughes | bf9cb9e | 2017-12-11 12:39:01 -0800 | [diff] [blame] | 405 |       case CT_STRING: | 
 | 406 |         // CT_CCL: scan a (nonempty) character class (sets NOSKIP). | 
 | 407 |         // CT_STRING: like CCL, but zero-length string OK, & no NOSKIP. | 
 | 408 |         if (width == 0) width = (size_t)~0; // 'infinity'. | 
| Elliott Hughes | c8f2c52 | 2017-10-31 13:07:51 -0700 | [diff] [blame] | 409 |         if ((flags & SUPPRESS) && (flags & LONG)) { | 
 | 410 |           n = 0; | 
| Elliott Hughes | bf9cb9e | 2017-12-11 12:39:01 -0800 | [diff] [blame] | 411 |           while ((wi = __fgetwc_unlock(fp)) != WEOF && width-- != 0 && ((c == CT_CCL && in_ccl(wi, ccl)) || (c == CT_STRING && !iswspace(wi)))) n++; | 
| Elliott Hughes | c8f2c52 | 2017-10-31 13:07:51 -0700 | [diff] [blame] | 412 |           if (wi != WEOF) __ungetwc(wi, fp); | 
| Elliott Hughes | c8f2c52 | 2017-10-31 13:07:51 -0700 | [diff] [blame] | 413 |         } else if (flags & LONG) { | 
 | 414 |           p0 = p = va_arg(ap, wchar_t*); | 
| Elliott Hughes | bf9cb9e | 2017-12-11 12:39:01 -0800 | [diff] [blame] | 415 |           while ((wi = __fgetwc_unlock(fp)) != WEOF && width-- != 0 && ((c == CT_CCL && in_ccl(wi, ccl)) || (c == CT_STRING && !iswspace(wi)))) { | 
| Elliott Hughes | c8f2c52 | 2017-10-31 13:07:51 -0700 | [diff] [blame] | 416 |             *p++ = (wchar_t)wi; | 
| Elliott Hughes | bf9cb9e | 2017-12-11 12:39:01 -0800 | [diff] [blame] | 417 |           } | 
| Elliott Hughes | c8f2c52 | 2017-10-31 13:07:51 -0700 | [diff] [blame] | 418 |           if (wi != WEOF) __ungetwc(wi, fp); | 
 | 419 |           n = p - p0; | 
| Elliott Hughes | c8f2c52 | 2017-10-31 13:07:51 -0700 | [diff] [blame] | 420 |         } else { | 
 | 421 |           if (!(flags & SUPPRESS)) mbp = va_arg(ap, char*); | 
 | 422 |           n = 0; | 
 | 423 |           memset(&mbs, 0, sizeof(mbs)); | 
| Elliott Hughes | bf9cb9e | 2017-12-11 12:39:01 -0800 | [diff] [blame] | 424 |           while ((wi = __fgetwc_unlock(fp)) != WEOF && width != 0 && ((c == CT_CCL && in_ccl(wi, ccl)) || (c == CT_STRING && !iswspace(wi)))) { | 
| Elliott Hughes | c8f2c52 | 2017-10-31 13:07:51 -0700 | [diff] [blame] | 425 |             if (width >= MB_CUR_MAX && !(flags & SUPPRESS)) { | 
 | 426 |               nconv = wcrtomb(mbp, wi, &mbs); | 
 | 427 |               if (nconv == (size_t)-1) goto input_failure; | 
 | 428 |             } else { | 
 | 429 |               nconv = wcrtomb(mbbuf, wi, &mbs); | 
 | 430 |               if (nconv == (size_t)-1) goto input_failure; | 
 | 431 |               if (nconv > width) break; | 
 | 432 |               if (!(flags & SUPPRESS)) memcpy(mbp, mbbuf, nconv); | 
 | 433 |             } | 
 | 434 |             if (!(flags & SUPPRESS)) mbp += nconv; | 
 | 435 |             width -= nconv; | 
 | 436 |             n++; | 
 | 437 |           } | 
 | 438 |           if (wi != WEOF) __ungetwc(wi, fp); | 
| Elliott Hughes | bf9cb9e | 2017-12-11 12:39:01 -0800 | [diff] [blame] | 439 |         } | 
 | 440 |         if (c == CT_CCL && n == 0) goto match_failure; | 
 | 441 |         if (!(flags & SUPPRESS)) { | 
 | 442 |           if (flags & LONG) { | 
 | 443 |             *p = L'\0'; | 
 | 444 |           } else { | 
 | 445 |             *mbp = '\0'; | 
| Elliott Hughes | c8f2c52 | 2017-10-31 13:07:51 -0700 | [diff] [blame] | 446 |           } | 
| Elliott Hughes | bf9cb9e | 2017-12-11 12:39:01 -0800 | [diff] [blame] | 447 |           ++nassigned; | 
| Elliott Hughes | c8f2c52 | 2017-10-31 13:07:51 -0700 | [diff] [blame] | 448 |         } | 
 | 449 |         nread += n; | 
 | 450 |         nconversions++; | 
 | 451 |         break; | 
| Elliott Hughes | 01ae00f | 2014-04-29 16:28:56 -0700 | [diff] [blame] | 452 |  | 
| Elliott Hughes | c8f2c52 | 2017-10-31 13:07:51 -0700 | [diff] [blame] | 453 |       case CT_INT: | 
 | 454 |         /* scan an integer as if by strtoimax/strtoumax */ | 
 | 455 |         if (width == 0 || width > sizeof(buf) / sizeof(*buf) - 1) | 
 | 456 |           width = sizeof(buf) / sizeof(*buf) - 1; | 
 | 457 |         flags |= SIGNOK | NDIGITS | NZDIGITS; | 
 | 458 |         for (p = buf; width; width--) { | 
 | 459 |           c = __fgetwc_unlock(fp); | 
 | 460 |           /* | 
 | 461 |            * Switch on the character; `goto ok' | 
 | 462 |            * if we accept it as a part of number. | 
 | 463 |            */ | 
 | 464 |           switch (c) { | 
 | 465 |             /* | 
 | 466 |              * The digit 0 is always legal, but is | 
 | 467 |              * special.  For %i conversions, if no | 
 | 468 |              * digits (zero or nonzero) have been | 
 | 469 |              * scanned (only signs), we will have | 
 | 470 |              * base==0.  In that case, we should set | 
 | 471 |              * it to 8 and enable 0x prefixing. | 
 | 472 |              * Also, if we have not scanned zero digits | 
 | 473 |              * before this, do not turn off prefixing | 
 | 474 |              * (someone else will turn it off if we | 
 | 475 |              * have scanned any nonzero digits). | 
 | 476 |              */ | 
 | 477 |             case '0': | 
 | 478 |               if (base == 0) { | 
 | 479 |                 base = 8; | 
 | 480 |                 flags |= PFXOK; | 
 | 481 |               } | 
 | 482 |               if (flags & NZDIGITS) | 
 | 483 |                 flags &= ~(SIGNOK | NZDIGITS | NDIGITS); | 
 | 484 |               else | 
 | 485 |                 flags &= ~(SIGNOK | PFXOK | NDIGITS); | 
 | 486 |               goto ok; | 
| Elliott Hughes | 01ae00f | 2014-04-29 16:28:56 -0700 | [diff] [blame] | 487 |  | 
| Elliott Hughes | c8f2c52 | 2017-10-31 13:07:51 -0700 | [diff] [blame] | 488 |             /* 1 through 7 always legal */ | 
 | 489 |             case '1': | 
 | 490 |             case '2': | 
 | 491 |             case '3': | 
 | 492 |             case '4': | 
 | 493 |             case '5': | 
 | 494 |             case '6': | 
 | 495 |             case '7': | 
 | 496 |               base = basefix[base]; | 
 | 497 |               flags &= ~(SIGNOK | PFXOK | NDIGITS); | 
 | 498 |               goto ok; | 
| Elliott Hughes | 01ae00f | 2014-04-29 16:28:56 -0700 | [diff] [blame] | 499 |  | 
| Elliott Hughes | c8f2c52 | 2017-10-31 13:07:51 -0700 | [diff] [blame] | 500 |             /* digits 8 and 9 ok iff decimal or hex */ | 
 | 501 |             case '8': | 
 | 502 |             case '9': | 
 | 503 |               base = basefix[base]; | 
 | 504 |               if (base <= 8) break; /* not legal here */ | 
 | 505 |               flags &= ~(SIGNOK | PFXOK | NDIGITS); | 
 | 506 |               goto ok; | 
| Elliott Hughes | 01ae00f | 2014-04-29 16:28:56 -0700 | [diff] [blame] | 507 |  | 
| Elliott Hughes | c8f2c52 | 2017-10-31 13:07:51 -0700 | [diff] [blame] | 508 |             /* letters ok iff hex */ | 
 | 509 |             case 'A': | 
 | 510 |             case 'B': | 
 | 511 |             case 'C': | 
 | 512 |             case 'D': | 
 | 513 |             case 'E': | 
 | 514 |             case 'F': | 
 | 515 |             case 'a': | 
 | 516 |             case 'b': | 
 | 517 |             case 'c': | 
 | 518 |             case 'd': | 
 | 519 |             case 'e': | 
 | 520 |             case 'f': | 
 | 521 |               /* no need to fix base here */ | 
 | 522 |               if (base <= 10) break; /* not legal here */ | 
 | 523 |               flags &= ~(SIGNOK | PFXOK | NDIGITS); | 
 | 524 |               goto ok; | 
| Elliott Hughes | 01ae00f | 2014-04-29 16:28:56 -0700 | [diff] [blame] | 525 |  | 
| Elliott Hughes | c8f2c52 | 2017-10-31 13:07:51 -0700 | [diff] [blame] | 526 |             /* sign ok only as first character */ | 
 | 527 |             case '+': | 
 | 528 |             case '-': | 
 | 529 |               if (flags & SIGNOK) { | 
 | 530 |                 flags &= ~SIGNOK; | 
 | 531 |                 flags |= HAVESIGN; | 
 | 532 |                 goto ok; | 
 | 533 |               } | 
 | 534 |               break; | 
| Elliott Hughes | 01ae00f | 2014-04-29 16:28:56 -0700 | [diff] [blame] | 535 |  | 
| Elliott Hughes | c8f2c52 | 2017-10-31 13:07:51 -0700 | [diff] [blame] | 536 |             /* | 
 | 537 |              * x ok iff flag still set and 2nd char (or | 
 | 538 |              * 3rd char if we have a sign). | 
 | 539 |              */ | 
 | 540 |             case 'x': | 
 | 541 |             case 'X': | 
 | 542 |               if ((flags & PFXOK) && p == buf + 1 + !!(flags & HAVESIGN)) { | 
 | 543 |                 base = 16; /* if %i */ | 
 | 544 |                 flags &= ~PFXOK; | 
 | 545 |                 goto ok; | 
 | 546 |               } | 
 | 547 |               break; | 
 | 548 |           } | 
| Elliott Hughes | 01ae00f | 2014-04-29 16:28:56 -0700 | [diff] [blame] | 549 |  | 
| Elliott Hughes | c8f2c52 | 2017-10-31 13:07:51 -0700 | [diff] [blame] | 550 |           /* | 
 | 551 |            * If we got here, c is not a legal character | 
 | 552 |            * for a number.  Stop accumulating digits. | 
 | 553 |            */ | 
 | 554 |           if (c != WEOF) __ungetwc(c, fp); | 
 | 555 |           break; | 
 | 556 |         ok: | 
 | 557 |           /* | 
 | 558 |            * c is legal: store it and look at the next. | 
 | 559 |            */ | 
 | 560 |           *p++ = (wchar_t)c; | 
 | 561 |         } | 
 | 562 |         /* | 
 | 563 |          * If we had only a sign, it is no good; push | 
 | 564 |          * back the sign.  If the number ends in `x', | 
 | 565 |          * it was [sign] '0' 'x', so push back the x | 
 | 566 |          * and treat it as [sign] '0'. | 
 | 567 |          */ | 
 | 568 |         if (flags & NDIGITS) { | 
 | 569 |           if (p > buf) __ungetwc(*--p, fp); | 
 | 570 |           goto match_failure; | 
 | 571 |         } | 
 | 572 |         c = p[-1]; | 
 | 573 |         if (c == 'x' || c == 'X') { | 
 | 574 |           --p; | 
 | 575 |           __ungetwc(c, fp); | 
 | 576 |         } | 
 | 577 |         if ((flags & SUPPRESS) == 0) { | 
 | 578 |           uintmax_t res; | 
| Elliott Hughes | 01ae00f | 2014-04-29 16:28:56 -0700 | [diff] [blame] | 579 |  | 
| Elliott Hughes | c8f2c52 | 2017-10-31 13:07:51 -0700 | [diff] [blame] | 580 |           *p = '\0'; | 
 | 581 |           if (flags & UNSIGNED) | 
 | 582 |             res = wcstoimax(buf, NULL, base); | 
 | 583 |           else | 
 | 584 |             res = wcstoumax(buf, NULL, base); | 
 | 585 |           if (flags & POINTER) | 
 | 586 |             *va_arg(ap, void**) = (void*)(uintptr_t)res; | 
 | 587 |           else if (flags & MAXINT) | 
 | 588 |             *va_arg(ap, intmax_t*) = res; | 
 | 589 |           else if (flags & LLONG) | 
 | 590 |             *va_arg(ap, long long*) = res; | 
 | 591 |           else if (flags & SIZEINT) | 
 | 592 |             *va_arg(ap, ssize_t*) = res; | 
 | 593 |           else if (flags & PTRINT) | 
 | 594 |             *va_arg(ap, ptrdiff_t*) = res; | 
 | 595 |           else if (flags & LONG) | 
 | 596 |             *va_arg(ap, long*) = res; | 
 | 597 |           else if (flags & SHORT) | 
 | 598 |             *va_arg(ap, short*) = res; | 
 | 599 |           else if (flags & SHORTSHORT) | 
 | 600 |             *va_arg(ap, signed char*) = res; | 
 | 601 |           else | 
 | 602 |             *va_arg(ap, int*) = res; | 
 | 603 |           nassigned++; | 
 | 604 |         } | 
 | 605 |         nread += p - buf; | 
 | 606 |         nconversions++; | 
 | 607 |         break; | 
| Elliott Hughes | 01ae00f | 2014-04-29 16:28:56 -0700 | [diff] [blame] | 608 |  | 
| Elliott Hughes | c8f2c52 | 2017-10-31 13:07:51 -0700 | [diff] [blame] | 609 |       case CT_FLOAT: | 
 | 610 |         /* scan a floating point number as if by strtod */ | 
 | 611 |         if (width == 0 || width > sizeof(buf) / sizeof(*buf) - 1) | 
 | 612 |           width = sizeof(buf) / sizeof(*buf) - 1; | 
 | 613 |         if ((width = wparsefloat(fp, buf, buf + width)) == 0) goto match_failure; | 
 | 614 |         if ((flags & SUPPRESS) == 0) { | 
 | 615 |           if (flags & LONGDBL) { | 
 | 616 |             long double res = wcstold(buf, &p); | 
 | 617 |             *va_arg(ap, long double*) = res; | 
 | 618 |           } else if (flags & LONG) { | 
 | 619 |             double res = wcstod(buf, &p); | 
 | 620 |             *va_arg(ap, double*) = res; | 
 | 621 |           } else { | 
 | 622 |             float res = wcstof(buf, &p); | 
 | 623 |             *va_arg(ap, float*) = res; | 
 | 624 |           } | 
 | 625 |           if (p - buf != (ptrdiff_t)width) abort(); | 
 | 626 |           nassigned++; | 
 | 627 |         } | 
 | 628 |         nread += width; | 
 | 629 |         nconversions++; | 
 | 630 |         break; | 
 | 631 |     } | 
 | 632 |   } | 
| Elliott Hughes | 01ae00f | 2014-04-29 16:28:56 -0700 | [diff] [blame] | 633 | input_failure: | 
| Elliott Hughes | c8f2c52 | 2017-10-31 13:07:51 -0700 | [diff] [blame] | 634 |   return (nconversions != 0 ? nassigned : EOF); | 
| Elliott Hughes | 01ae00f | 2014-04-29 16:28:56 -0700 | [diff] [blame] | 635 | match_failure: | 
| Elliott Hughes | c8f2c52 | 2017-10-31 13:07:51 -0700 | [diff] [blame] | 636 |   return (nassigned); | 
| Elliott Hughes | 01ae00f | 2014-04-29 16:28:56 -0700 | [diff] [blame] | 637 | } | 
| Elliott Hughes | 7f0849f | 2016-08-26 16:17:17 -0700 | [diff] [blame] | 638 | #pragma GCC diagnostic pop |