123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455456457458459460461462463464465466467468469470471472473474475476477478479480481482483484485486487488489490491492493494495496497498499500501502503504505506507508509510511512513514515516517518519520521522523524525526527528529530531532533534535536537538539540541542543544545546547548549550551552553554555556557558559560561562563564565566567568569570571572573574575576577578579580581582583584585586587588589590591592593594595596597598599600601602603604605606607608609610611612613614615616617618619620621622623624625626627628629630631632633634635636637638639640641642643644645646647648649650651652653654655656657658659660661662663664665666667668669670671672673674675676677678679680681682683684685686687688689690691692693694695696697698699700701702703704705706707708709710711712713714715716717718719720721722723724725726727728729730731732733734735736737738739740741742743744745746747748749750751752753754755756757 |
- /*
- * Modified by Manuel Novoa III Mar 13, 2001
- *
- * The vfscanf routine was completely rewritten to add features and remove
- * bugs. The function __strtold, based on my strtod code in stdlib, was
- * added to provide floating point support for the scanf functions.
- *
- * So far they pass the test cases from glibc-2.1.3, except in two instances.
- * In one case, the test appears to be broken. The other case is something
- * I need to research further. This version of scanf assumes it can only
- * peek one character ahead. Apparently, glibc looks further. The difference
- * can be seen when parsing a floating point value in the character
- * sequence "100ergs". glibc is able to back up before the 'e' and return
- * a value of 100, whereas this scanf reports a bad match with the stream
- * pointer at 'r'. A similar situation can also happen when parsing hex
- * values prefixed by 0x or 0X; a failure would occur for "0xg". In order to
- * fix this, I need to rework the "ungetc" machinery in stdio.c again.
- * I do have one reference though, that seems to imply scanf has a single
- * character of lookahead.
- *
- * May 20, 2001
- *
- * Quote from ANSI/ISO C99 standard:
- *
- * fscanf pushes back at most one input character onto the input stream.
- * Therefore, some sequences that are acceptable to strtod, strtol, etc.,
- * are unacceptable to fscanf.
- *
- * So uClibc's *scanf functions conform to the standard, and glibc's
- * implementation doesn't for the "100ergs" case mentioned above.
- */
- #define _GNU_SOURCE
- #include <features.h>
- #if defined(__UCLIBC__) && !defined(__USE_ISOC99)
- #define __USE_ISOC99
- #endif
- #define _STDIO_UTILITY
- #include <stdio.h>
- #include <stdlib.h>
- #include <unistd.h>
- #include <ctype.h>
- #include <string.h>
- #include <stdarg.h>
- #ifdef __STDIO_THREADSAFE
- #include <pthread.h>
- #endif /* __STDIO_THREADSAFE */
- #ifdef L_scanf
- #ifdef __STDC__
- int scanf(const char *fmt, ...)
- #else
- int scanf(fmt, va_alist)
- __const char *fmt;
- va_dcl
- #endif
- {
- va_list ptr;
- int rv;
- va_start(ptr, fmt);
- rv = vfscanf(stdin, fmt, ptr);
- va_end(ptr);
- return rv;
- }
- #endif
- #ifdef L_sscanf
- #if !defined(__STDIO_BUFFERS) && !defined(__STDIO_GLIBC_CUSTOM_STREAMS)
- #warning skipping sscanf since no buffering and no custom streams!
- #else
- int sscanf(const char *sp, const char *fmt, ...)
- {
- va_list ptr;
- int rv;
- va_start(ptr, fmt);
- rv = vsscanf(sp, fmt, ptr);
- va_end(ptr);
- return rv;
- }
- #endif
- #endif
- #ifdef L_fscanf
- #ifdef __STDC__
- int fscanf(FILE * fp, const char *fmt, ...)
- #else
- int fscanf(fp, fmt, va_alist)
- FILE *fp;
- __const char *fmt;
- va_dcl
- #endif
- {
- va_list ptr;
- int rv;
- va_start(ptr, fmt);
- rv = vfscanf(fp, fmt, ptr);
- va_end(ptr);
- return rv;
- }
- #endif
- #ifdef L_vscanf
- int vscanf(fmt, ap)
- __const char *fmt;
- va_list ap;
- {
- return vfscanf(stdin, fmt, ap);
- }
- #endif
- #ifdef L_vsscanf
- #ifdef __STDIO_BUFFERS
- int vsscanf(__const char *sp, __const char *fmt, va_list ap)
- {
- FILE string[1];
- string->filedes = -2; /* for debugging */
- string->modeflags = (__FLAG_NARROW|__FLAG_READONLY);
- string->bufstart = string->bufrpos = (unsigned char *) ((void *) sp);
- string->bufgetc = (char *) ((unsigned) -1);
- #ifdef __STDIO_THREADSAFE
- __stdio_init_mutex(&string->lock);
- #endif
- return vfscanf(string, fmt, ap);
- }
- #else /* __STDIO_BUFFERS */
- #ifdef __STDIO_GLIBC_CUSTOM_STREAMS
- int vsscanf(__const char *sp, __const char *fmt, va_list ap)
- {
- FILE *f;
- int rv;
- if ((f = fmemopen((char *)sp, strlen(sp), "r")) == NULL) {
- return -1;
- }
- rv = vfscanf(f, fmt, ap);
- fclose(f);
- return rv;
- }
- #else /* __STDIO_GLIBC_CUSTOM_STREAMS */
- #warning skipping vsscanf since no buffering and no custom streams!
- #endif /* __STDIO_GLIBC_CUSTOM_STREAMS */
- #endif /* __STDIO_BUFFERS */
- #endif
- #ifdef L_vfscanf
- #include <assert.h>
- #include <ctype.h>
- #include <limits.h>
- static int valid_digit(char c, char base)
- {
- if (base == 16) {
- return isxdigit(c);
- } else {
- return (__isdigit(c) && (c < '0' + base));
- }
- }
- extern unsigned long
- _stdlib_strto_l(register const char * __restrict str,
- char ** __restrict endptr, int base, int sflag);
- extern unsigned long long
- _stdlib_strto_ll(register const char * __restrict str,
- char ** __restrict endptr, int base, int sflag);
- struct scan_cookie {
- FILE *fp;
- int nread;
- int width;
- int width_flag;
- int ungot_char;
- int ungot_flag;
- int app_ungot;
- };
- #ifdef __UCLIBC_HAS_LONG_LONG__
- static const char qual[] = "hl" /* "jtz" */ "Lq";
- /* char = -2, short = -1, int = 0, long = 1, long long = 2 */
- static const char qsz[] = { -1, 1, 2, 2 };
- #else
- static const char qual[] = "hl" /* "jtz" */;
- static const char qsz[] = { -1, 1, };
- #endif
- #ifdef __UCLIBC_HAS_FLOATS__
- static int __strtold(long double *ld, struct scan_cookie *sc);
- /*01234567890123456 */
- static const char spec[] = "%n[csoupxXidfeEgG";
- #else
- static const char spec[] = "%n[csoupxXid";
- #endif
- /* radix[i] <-> spec[i+5] o u p x X i d */
- static const char radix[] = { 8, 10, 16, 16, 16, 0, 10 };
- static void init_scan_cookie(struct scan_cookie *sc, FILE *fp)
- {
- sc->fp = fp;
- sc->nread = 0;
- sc->width_flag = 0;
- sc->ungot_flag = 0;
- sc->app_ungot = ((fp->modeflags & __MASK_UNGOT) ? fp->ungot[1] : 0);
- }
- /* TODO -- what about literal '\0' chars in a file??? */
- static int scan_getc_nw(struct scan_cookie *sc)
- {
- if (sc->ungot_flag == 0) {
- sc->ungot_char = getc(sc->fp);
- } else {
- sc->ungot_flag = 0;
- }
- if (sc->ungot_char > 0) {
- ++sc->nread;
- }
- sc->width_flag = 0;
- return sc->ungot_char;
- }
- static int scan_getc(struct scan_cookie *sc)
- {
- if (sc->ungot_flag == 0) {
- sc->ungot_char = getc(sc->fp);
- }
- sc->width_flag = 1;
- if (--sc->width < 0) {
- sc->ungot_flag = 1;
- return 0;
- }
- sc->ungot_flag = 0;
- if (sc->ungot_char > 0) {
- ++sc->nread;
- }
- return sc->ungot_char;
- }
- static void scan_ungetc(struct scan_cookie *sc)
- {
- if (sc->ungot_flag != 0) {
- assert(sc->width < 0);
- return;
- }
- if (sc->width_flag) {
- ++sc->width;
- }
- sc->ungot_flag = 1;
- if (sc->ungot_char > 0) { /* not EOF or EOS */
- --sc->nread;
- }
- }
- static void kill_scan_cookie(struct scan_cookie *sc)
- {
- if (sc->ungot_flag) {
- ungetc(sc->ungot_char,sc->fp);
- /* Deal with distiction between user and scanf ungots. */
- if (sc->nread == 0) { /* Only one char was read... app ungot? */
- sc->fp->ungot[1] = sc->app_ungot; /* restore ungot state. */
- }
- }
- }
- int vfscanf(fp, format, ap)
- FILE *fp;
- const char *format;
- va_list ap;
- {
- #ifdef __UCLIBC_HAS_LONG_LONG__
- #define STRTO_L_(s,e,b,sf) _stdlib_strto_ll(s,e,b,sf)
- #define MAX_DIGITS 64
- #define UV_TYPE unsigned long long
- #define V_TYPE long long
- #else
- #define STRTO_L_(s,e,b,sf) _stdlib_strto_l(s,e,b,sf)
- #define MAX_DIGITS 32
- #define UV_TYPE unsigned long
- #define V_TYPE long
- #endif
- #ifdef __UCLIBC_HAS_FLOATS__
- long double ld;
- #endif
- UV_TYPE uv;
- struct scan_cookie sc;
- unsigned const char *fmt;
- const char *p;
- unsigned char *b;
- void *vp;
- int cc, i, cnt;
- signed char lval;
- unsigned char store, usflag, base, invert, r0, r1;
- unsigned char buf[MAX_DIGITS+2];
- unsigned char scanset[UCHAR_MAX + 1];
- __STDIO_THREADLOCK(fp);
- init_scan_cookie(&sc,fp);
- fmt = (unsigned const char *) format;
- cnt = 0;
- while (*fmt) {
- store = 1;
- lval = 0;
- sc.width = INT_MAX;
- if (*fmt == '%') { /* Conversion specification. */
- ++fmt;
- if (*fmt == '*') { /* Suppress assignment. */
- store = 0;
- ++fmt;
- }
- for (i = 0 ; __isdigit(*fmt) ; sc.width = i) {
- i = (i * 10) + (*fmt++ - '0'); /* Get specified width. */
- }
- for (i = 0 ; i < sizeof(qual) ; i++) { /* Optional qualifier. */
- if (qual[i] == *fmt) {
- ++fmt;
- lval += qsz[i];
- if ((i < 2) && (qual[i] == *fmt)) { /* Double h or l. */
- ++fmt;
- lval += qsz[i];
- }
- break;
- }
- }
- for (p = spec ; *p ; p++) { /* Process format specifier. */
- if (*fmt != *p) continue;
- if (p-spec < 1) { /* % - match a '%'*/
- goto matchchar;
- }
- if (p-spec < 2) { /* n - store number of chars read */
- *(va_arg(ap, int *)) = sc.nread;
- scan_getc_nw(&sc);
- goto nextfmt;
- }
- if (p-spec > 3) { /* skip white space if not c or [ */
- do {
- i = scan_getc_nw(&sc);
- } while (__isspace(i));
- scan_ungetc(&sc);
- }
- if (p-spec < 5) { /* [,c,s - string conversions */
- invert = 0;
- if (*p == 'c') {
- invert = 1;
- if (sc.width == INT_MAX) {
- sc.width = 1;
- }
- }
- for (i=0 ; i<= UCHAR_MAX ; i++) {
- scanset[i] = ((*p == 's') ? (__isspace(i) == 0) : 0);
- }
- if (*p == '[') { /* need to build a scanset */
- if (*++fmt == '^') {
- invert = 1;
- ++fmt;
- }
- if (*fmt == ']') {
- scanset[(int)']'] = 1;
- ++fmt;
- }
- r0 = 0;
- while (*fmt && *fmt !=']') { /* build scanset */
- if ((*fmt == '-') && r0 && (fmt[1] != ']')) {
- /* range */
- ++fmt;
- if (*fmt < r0) {
- r1 = r0;
- r0 = *fmt;
- } else {
- r1 = *fmt;
- }
- for (i=r0 ; i<= r1 ; i++) {
- scanset[i] = 1;
- }
- r0 = 0;
- } else {
- r0 = *fmt;
- scanset[r0] = 1;
- }
- ++fmt;
- }
- if (!*fmt) { /* format string exhausted! */
- goto done;
- }
- }
- /* ok -- back to common work */
- if (sc.width <= 0) {
- goto done;
- }
- if (store) {
- b = va_arg(ap, unsigned char *);
- } else {
- b = buf;
- }
- cc = scan_getc(&sc);
- if (cc <= 0) {
- scan_ungetc(&sc);
- goto done; /* return EOF if cnt == 0 */
- }
- i = 0;
- while ((cc>0) && (scanset[cc] != invert)) {
- i = 1; /* yes, we stored something */
- *b = cc;
- b += store;
- cc = scan_getc(&sc);
- }
- if (i==0) {
- scan_ungetc(&sc);
- goto done; /* return cnt */
- }
- if (*p != 'c') { /* nul-terminate the stored string */
- *b = 0;
- }
- cnt += store;
- goto nextfmt;
- }
- if (p-spec < 12) { /* o,u,p,x,X,i,d - (un)signed integer */
- if (*p == 'p') {
- /* assume pointer same size as int or long. */
- lval = (sizeof(char *) == sizeof(long));
- }
- usflag = ((p-spec) < 10); /* (1)0 if (un)signed */
- base = radix[(int)(p-spec) - 5];
- b = buf;
- if (sc.width <= 0) {
- goto done;
- }
- cc = scan_getc(&sc);
- if ((cc == '+') || (cc == '-')) { /* Handle leading sign.*/
- *b++ = cc;
- cc = scan_getc(&sc);
- }
- if (cc == '0') { /* Possibly set base and handle prefix. */
- if ((base == 0) || (base == 16)) {
- cc = scan_getc(&sc);
- if ((cc == 'x') || (cc == 'X')) {
- /* We're committed to base 16 now. */
- base = 16;
- cc = scan_getc(&sc);
- } else { /* oops... back up */
- scan_ungetc(&sc);
- cc = '0';
- if (base == 0) {
- base = 8;
- }
- }
- }
- }
- if (base == 0) { /* Default to base 10 */
- base = 10;
- }
- /* At this point, we're ready to start reading digits. */
- if (cc == '0') {
- *b++ = cc; /* Store first leading 0 */
- do { /* but ignore others. */
- cc = scan_getc(&sc);
- } while (cc == '0');
- }
- while (valid_digit(cc,base)) { /* Now for nonzero digits.*/
- if (b - buf < MAX_DIGITS) {
- *b++ = cc;
- }
- cc = scan_getc(&sc);
- }
- *b = 0; /* null-terminate */
- if ((b == buf) || (*--b == '+') || (*b == '-')) {
- scan_ungetc(&sc);
- goto done; /* No digits! */
- }
- if (store) {
- if (*buf == '-') {
- usflag = 0;
- }
- uv = STRTO_L_(buf, NULL, base, 1-usflag);
- vp = va_arg(ap, void *);
- switch (lval) {
- case 2: /* If no long long, treat as long . */
- #ifdef __UCLIBC_HAS_LONG_LONG__
- *((unsigned long long *)vp) = uv;
- break;
- #endif
- case 1:
- #if ULONG_MAX == UINT_MAX
- case 0: /* int and long int are the same */
- #endif
- #ifdef __UCLIBC_HAS_LONG_LONG__
- if (usflag) {
- if (uv > ULONG_MAX) {
- uv = ULONG_MAX;
- }
- } else if (((V_TYPE)uv) > LONG_MAX) {
- uv = LONG_MAX;
- } else if (((V_TYPE)uv) < LONG_MIN) {
- uv = (UV_TYPE) LONG_MIN;
- }
- #endif
- *((unsigned long *)vp) = (unsigned long)uv;
- break;
- #if ULONG_MAX != UINT_MAX
- case 0: /* int and long int are different */
- if (usflag) {
- if (uv > UINT_MAX) {
- uv = UINT_MAX;
- }
- } else if (((V_TYPE)uv) > INT_MAX) {
- uv = INT_MAX;
- } else if (((V_TYPE)uv) < INT_MIN) {
- uv = (UV_TYPE) INT_MIN;
- }
- *((unsigned int *)vp) = (unsigned int)uv;
- break;
- #endif
- case -1:
- if (usflag) {
- if (uv > USHRT_MAX) {
- uv = USHRT_MAX;
- }
- } else if (((V_TYPE)uv) > SHRT_MAX) {
- uv = SHRT_MAX;
- } else if (((V_TYPE)uv) < SHRT_MIN) {
- uv = (UV_TYPE) SHRT_MIN;
- }
- *((unsigned short *)vp) = (unsigned short)uv;
- break;
- case -2:
- if (usflag) {
- if (uv > UCHAR_MAX) {
- uv = UCHAR_MAX;
- }
- } else if (((V_TYPE)uv) > CHAR_MAX) {
- uv = CHAR_MAX;
- } else if (((V_TYPE)uv) < CHAR_MIN) {
- uv = (UV_TYPE) CHAR_MIN;
- }
- *((unsigned char *)vp) = (unsigned char) uv;
- break;
- default:
- assert(0);
- }
- ++cnt;
- }
- goto nextfmt;
- }
- #ifdef __UCLIBC_HAS_FLOATS__
- else { /* floating point */
- if (sc.width <= 0) {
- goto done;
- }
- if (__strtold(&ld, &sc)) { /* Success! */
- if (store) {
- vp = va_arg(ap, void *);
- switch (lval) {
- case 2:
- *((long double *)vp) = ld;
- break;
- case 1:
- *((double *)vp) = (double) ld;
- break;
- case 0:
- *((float *)vp) = (float) ld;
- break;
- default: /* Illegal qualifier! */
- assert(0);
- goto done;
- }
- ++cnt;
- }
- goto nextfmt;
- }
- }
- #else
- assert(0);
- #endif
- goto done;
- }
- /* Unrecognized specifier! */
- goto RETURN_cnt;
- } if (__isspace(*fmt)) { /* Consume all whitespace. */
- do {
- i = scan_getc_nw(&sc);
- } while (__isspace(i));
- } else { /* Match the current fmt char. */
- matchchar:
- if (scan_getc_nw(&sc) != *fmt) {
- goto done;
- }
- scan_getc_nw(&sc);
- }
- nextfmt:
- scan_ungetc(&sc);
- ++fmt;
- }
- done: /* end of scan */
- kill_scan_cookie(&sc);
- if ((sc.ungot_char <= 0) && (cnt == 0) && (*fmt)) {
- cnt = EOF;
- }
- RETURN_cnt:
- __STDIO_THREADUNLOCK(fp);
- return (cnt);
- }
- /*****************************************************************************/
- #ifdef __UCLIBC_HAS_FLOATS__
- #include <float.h>
- #define MAX_SIG_DIGITS 20
- #define MAX_IGNORED_DIGITS 2000
- #define MAX_ALLOWED_EXP (MAX_SIG_DIGITS + MAX_IGNORED_DIGITS + LDBL_MAX_10_EXP)
- #if LDBL_DIG > MAX_SIG_DIGITS
- #error need to adjust MAX_SIG_DIGITS
- #endif
- #include <limits.h>
- #if MAX_ALLOWED_EXP > INT_MAX
- #error size assumption violated for MAX_ALLOWED_EXP
- #endif
- int __strtold(long double *ld, struct scan_cookie *sc)
- {
- long double number;
- long double p10;
- int exponent_power;
- int exponent_temp;
- int negative;
- int num_digits;
- int since_decimal;
- int c;
- c = scan_getc(sc); /* Decrements width. */
- negative = 0;
- switch(c) { /* Handle optional sign. */
- case '-': negative = 1; /* Fall through to get next char. */
- case '+': c = scan_getc(sc);
- }
- number = 0.;
- num_digits = -1;
- exponent_power = 0;
- since_decimal = INT_MIN;
- LOOP:
- while (__isdigit(c)) { /* Process string of digits. */
- ++since_decimal;
- if (num_digits < 0) { /* First time through? */
- ++num_digits; /* We've now seen a digit. */
- }
- if (num_digits || (c != '0')) { /* had/have nonzero */
- ++num_digits;
- if (num_digits <= MAX_SIG_DIGITS) { /* Is digit significant? */
- number = number * 10. + (c - '0');
- }
- }
- c = scan_getc(sc);
- }
- if ((c == '.') && (since_decimal < 0)) { /* If no previous decimal pt, */
- since_decimal = 0; /* save position of decimal point */
- c = scan_getc(sc); /* and process rest of digits */
- goto LOOP;
- }
- if (num_digits<0) { /* Must have at least one digit. */
- goto FAIL;
- }
- if (num_digits > MAX_SIG_DIGITS) { /* Adjust exp for skipped digits. */
- exponent_power += num_digits - MAX_SIG_DIGITS;
- }
- if (since_decimal >= 0) { /* Adjust exponent for decimal point. */
- exponent_power -= since_decimal;
- }
- if (negative) { /* Correct for sign. */
- number = -number;
- negative = 0; /* Reset for exponent processing below. */
- }
- /* Process an exponent string. */
- if (c == 'e' || c == 'E') {
- c = scan_getc(sc);
- switch(c) { /* Handle optional sign. */
- case '-': negative = 1; /* Fall through to get next char. */
- case '+': c = scan_getc(sc);
- }
- num_digits = 0;
- exponent_temp = 0;
- while (__isdigit(c)) { /* Process string of digits. */
- if (exponent_temp < MAX_ALLOWED_EXP) { /* overflow check */
- exponent_temp = exponent_temp * 10 + (c - '0');
- }
- c = scan_getc(sc);
- ++num_digits;
- }
- if (num_digits == 0) { /* Were there no exp digits? */
- goto FAIL;
- } /* else */
- if (negative) {
- exponent_power -= exponent_temp;
- } else {
- exponent_power += exponent_temp;
- }
- }
- if (number != 0.) {
- /* Now scale the result. */
- exponent_temp = exponent_power;
- p10 = 10.;
- if (exponent_temp < 0) {
- exponent_temp = -exponent_temp;
- }
- while (exponent_temp) {
- if (exponent_temp & 1) {
- if (exponent_power < 0) {
- number /= p10;
- } else {
- number *= p10;
- }
- }
- exponent_temp >>= 1;
- p10 *= p10;
- }
- }
- *ld = number;
- return 1;
- FAIL:
- scan_ungetc(sc);
- return 0;
- }
- #endif /* __UCLIBC_HAS_FLOATS__ */
- #endif
|