/* * vsscanf.c * * vsscanf(), from which the rest of the scanf() * family is built */ #include <ctype.h> #include <stdarg.h> #include <stddef.h> #include <inttypes.h> #include <string.h> #include <limits.h> #include <stdio.h> #include <sys/bitops.h> #ifndef LONG_BIT #define LONG_BIT (CHAR_BIT*sizeof(long)) #endif enum flags { FL_SPLAT = 0x01, /* Drop the value, do not assign */ FL_WIDTH = 0x02, /* Field width specified */ FL_MINUS = 0x04, /* Negative number */ }; enum ranks { rank_char = -2, rank_short = -1, rank_int = 0, rank_long = 1, rank_longlong = 2, rank_ptr = INT_MAX /* Special value used for pointers */ }; #define MIN_RANK rank_char #define MAX_RANK rank_longlong #define INTMAX_RANK rank_longlong #define SIZE_T_RANK rank_long #define PTRDIFF_T_RANK rank_long enum bail { bail_none = 0, /* No error condition */ bail_eof, /* Hit EOF */ bail_err /* Conversion mismatch */ }; int vsscanf(const char *buffer, const char *format, va_list ap) { const char *p = format; char ch; const char *q = buffer; const char *qq; uintmax_t val = 0; int rank = rank_int; /* Default rank */ unsigned int width = UINT_MAX; int base; enum flags flags = 0; enum { st_normal, /* Ground state */ st_flags, /* Special flags */ st_width, /* Field width */ st_modifiers, /* Length or conversion modifiers */ st_match_init, /* Initial state of %[ sequence */ st_match, /* Main state of %[ sequence */ st_match_range, /* After - in a %[ sequence */ } state = st_normal; char *sarg = NULL; /* %s %c or %[ string argument */ enum bail bail = bail_none; int converted = 0; /* Successful conversions */ unsigned long matchmap[((1 << CHAR_BIT) + (LONG_BIT - 1)) / LONG_BIT]; int matchinv = 0; /* Is match map inverted? */ unsigned char range_start = 0; while ((ch = *p++) && !bail) { switch (state) { case st_normal: if (ch == '%') { state = st_flags; flags = 0; rank = rank_int; width = UINT_MAX; } else if (isspace((unsigned char)ch)) { q = skipspace(q); } else { if (*q == ch) q++; else bail = bail_err; /* Match failure */ } break; case st_flags: switch (ch) { case '*': flags |= FL_SPLAT; break; case '0' ... '9': width = (ch - '0'); state = st_width; flags |= FL_WIDTH; break; default: state = st_modifiers; p--; /* Process this character again */ break; } break; case st_width: if (ch >= '0' && ch <= '9') { width = width * 10 + (ch - '0'); } else { state = st_modifiers; p--; /* Process this character again */ } break; case st_modifiers: switch (ch) { /* Length modifiers - nonterminal sequences */ case 'h': rank--; /* Shorter rank */ break; case 'l': rank++; /* Longer rank */ break; case 'j': rank = INTMAX_RANK; break; case 'z': rank = SIZE_T_RANK; break; case 't': rank = PTRDIFF_T_RANK; break; case 'L': case 'q': rank = rank_longlong; /* long double/long long */ break; default: /* Output modifiers - terminal sequences */ state = st_normal; /* Next state will be normal */ if (rank < MIN_RANK) /* Canonicalize rank */ rank = MIN_RANK; else if (rank > MAX_RANK) rank = MAX_RANK; switch (ch) { case 'P': /* Upper case pointer */ case 'p': /* Pointer */ #if 0 /* Enable this to allow null pointers by name */ q = skipspace(q); if (!isdigit((unsigned char)*q)) { static const char *const nullnames[] = { "null", "nul", "nil", "(null)", "(nul)", "(nil)", 0 }; const char *const *np; /* Check to see if it's a null pointer by name */ for (np = nullnames; *np; np++) { if (!strncasecmp(q, *np, strlen(*np))) { val = (uintmax_t) ((void *)NULL); goto set_integer; } } /* Failure */ bail = bail_err; break; } /* else */ #endif rank = rank_ptr; base = 0; goto scan_int; case 'i': /* Base-independent integer */ base = 0; goto scan_int; case 'd': /* Decimal integer */ base = 10; goto scan_int; case 'o': /* Octal integer */ base = 8; goto scan_int; case 'u': /* Unsigned decimal integer */ base = 10; goto scan_int; case 'x': /* Hexadecimal integer */ case 'X': base = 16; goto scan_int; case 'n': /* Number of characters consumed */ val = (q - buffer); goto set_integer; scan_int: q = skipspace(q); if (!*q) { bail = bail_eof; break; } val = strntoumax(q, (char **)&qq, base, width); if (qq == q) { bail = bail_err; break; } q = qq; converted++; /* fall through */ set_integer: if (!(flags & FL_SPLAT)) { switch (rank) { case rank_char: *va_arg(ap, unsigned char *) = (unsigned char)val; break; case rank_short: *va_arg(ap, unsigned short *) = (unsigned short)val; break; case rank_int: *va_arg(ap, unsigned int *) = (unsigned int)val; break; case rank_long: *va_arg(ap, unsigned long *) = (unsigned long)val; break; case rank_longlong: *va_arg(ap, unsigned long long *) = (unsigned long long)val; break; case rank_ptr: *va_arg(ap, void **) = (void *)(uintptr_t) val; break; } } break; case 'c': /* Character */ width = (flags & FL_WIDTH) ? width : 1; /* Default width == 1 */ sarg = va_arg(ap, char *); while (width--) { if (!*q) { bail = bail_eof; break; } *sarg++ = *q++; } if (!bail) converted++; break; case 's': /* String */ { char *sp; sp = sarg = va_arg(ap, char *); while (width-- && *q && !isspace((unsigned char)*q)) { *sp++ = *q++; } if (sarg != sp) { *sp = '\0'; /* Terminate output */ converted++; } else { bail = bail_eof; } } break; case '[': /* Character range */ sarg = va_arg(ap, char *); state = st_match_init; matchinv = 0; memset(matchmap, 0, sizeof matchmap); break; case '%': /* %% sequence */ if (*q == '%') q++; else bail = bail_err; break; default: /* Anything else */ bail = bail_err; /* Unknown sequence */ break; } } break; case st_match_init: /* Initial state for %[ match */ if (ch == '^' && !matchinv) { matchinv = 1; } else { range_start = (unsigned char)ch; set_bit((unsigned char)ch, matchmap); state = st_match; } break; case st_match: /* Main state for %[ match */ if (ch == ']') { goto match_run; } else if (ch == '-') { state = st_match_range; } else { range_start = (unsigned char)ch; set_bit((unsigned char)ch, matchmap); } break; case st_match_range: /* %[ match after - */ if (ch == ']') { set_bit((unsigned char)'-', matchmap); /* - was last character */ goto match_run; } else { int i; for (i = range_start; i <= (unsigned char)ch; i++) set_bit(i, matchmap); state = st_match; } break; match_run: /* Match expression finished */ qq = q; while (width && *q && test_bit((unsigned char)*q, matchmap) ^ matchinv) { *sarg++ = *q++; } if (q != qq) { *sarg = '\0'; converted++; } else { bail = *q ? bail_err : bail_eof; } break; } } if (bail == bail_eof && !converted) converted = -1; /* Return EOF (-1) */ return converted; }