/*
 * general implementation of scanf used by scanf, sscanf, fscanf,
 * _cscanf, wscanf, swscanf and fwscanf
 *
 * Copyright 1996,1998 Marcus Meissner
 * Copyright 1996 Jukka Iivonen
 * Copyright 1997,2000 Uwe Bonnes
 * Copyright 2000 Jon Griffiths
 * Copyright 2002 Daniel Gudbjartsson
 *
 * This library is free software; you can redistribute it and/or
 * modify it under the terms of the GNU Lesser General Public
 * License as published by the Free Software Foundation; either
 * version 2.1 of the License, or (at your option) any later version.
 *
 * This library is distributed in the hope that it will be useful,
 * but WITHOUT ANY WARRANTY; without even the implied warranty of
 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the GNU
 * Lesser General Public License for more details.
 *
 * You should have received a copy of the GNU Lesser General Public
 * License along with this library; if not, write to the Free Software
 * Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA  02111-1307  USA
 */

/*
 * Character-type configuration.
 *
 *  _L_(x)            character/string literal of the scanned character type
 *  _CHAR_            scanned character type
 *  _EOF_             value of the lookahead that marks end of input
 *  _ISSPACE_(c)      whitespace classification
 *  _ISDIGIT_(c)      decimal digit classification
 *  _CONVERT_(c)      placeholder for char <-> WCHAR conversion (identity)
 *  _CHAR2DIGIT_(c,b) digit value of c in base b, as returned by the
 *                    char2digit()/wchar2digit() helpers of the including file
 */
#ifdef WIDE_SCANF
#define _L_(x) L##x
#define _CHAR_ WCHAR
#define _EOF_ MSVCRT_WEOF
#define _ISSPACE_(c) MSVCRT_iswspace(c)
#define _ISDIGIT_(c) MSVCRT_iswdigit(c)
#define _CONVERT_(c) (c) /*** FIXME ***/
#define _CHAR2DIGIT_(c, base) wchar2digit((c), (base))
#else /* WIDE_SCANF */
#define _L_(x) x
#define _CHAR_ char
#define _EOF_ MSVCRT_EOF
/* <ctype.h> classifiers are only defined for unsigned char values and EOF;
 * plain char may be negative, so narrow it to unsigned char first. */
#define _ISSPACE_(c) isspace((unsigned char)(c))
#define _ISDIGIT_(c) isdigit((unsigned char)(c))
#define _CONVERT_(c) (c) /*** FIXME ***/
#define _CHAR2DIGIT_(c, base) char2digit((c), (base))
#endif /* WIDE_SCANF */

/*
 * Input-source configuration.
 *
 *  _GETC_(file)         fetch the next input character
 *  _UNGETC_(nch, file)  give the lookahead character back to the source
 *  _FUNCTION_           name and parameter list of the generated function
 */
#ifdef CONSOLE
#define _GETC_(file) _getch()
#define _UNGETC_(nch, file) _ungetch(nch)
#define _FUNCTION_ _cscanf(const _CHAR_ *format, ...)
#else
#ifdef STRING
/* When scanning a string, 'file' is the read pointer and the terminating
 * NUL plays the role of end-of-file. */
#undef _EOF_
#define _EOF_ 0
#define _UNGETC_(nch, file) ((file)--)
#ifdef WIDE_SCANF
#define _GETC_(file) (*(file)++)
#define _FUNCTION_ MSVCRT_swscanf(const WCHAR *file, const WCHAR *format, ...)
#else /* WIDE_SCANF */
/* Read bytes as unsigned so that characters >= 0x80 give the same
 * non-negative values that fgetc() produces in the stream variant. */
#define _GETC_(file) ((unsigned char)*(file)++)
#define _FUNCTION_ MSVCRT_sscanf(const char *file, const char *format, ...)
#endif /* WIDE_SCANF */
#else /* STRING */
#ifdef WIDE_SCANF
#define _GETC_(file) MSVCRT_fgetwc(file)
#define _UNGETC_(nch, file) MSVCRT_ungetwc(nch, file)
#define _FUNCTION_ MSVCRT_fwscanf(MSVCRT_FILE* file, const WCHAR *format, ...)
#else /* WIDE_SCANF */
#define _GETC_(file) MSVCRT_fgetc(file)
#define _UNGETC_(nch, file) MSVCRT_ungetc(nch, file)
#define _FUNCTION_ MSVCRT_fscanf(MSVCRT_FILE* file, const char *format, ...)
#endif /* WIDE_SCANF */
#endif /* STRING */
#endif /* CONSOLE */

/*********************************************************************
|
|
* Implemented based on
|
|
* http://msdn.microsoft.com/library/default.asp?url=/library/en-us/vccore98/html/_crt_format_specification_fields_.2d_.scanf_and_wscanf_functions.asp
|
|
* Extended by C. Scott Ananian <cananian@alumni.princeton.edu> to handle
|
|
* more types of format spec.
|
|
*/
|
|
int _FUNCTION_ {
|
|
int rd = 0;
|
|
int nch;
|
|
va_list ap;
|
|
if (!*format) return 0;
|
|
#ifndef WIDE_SCANF
|
|
#ifdef CONSOLE
|
|
WARN("(\"%s\"): semi-stub\n", format);
|
|
#else /* CONSOLE */
|
|
#ifdef STRING
|
|
WARN("%s (\"%s\"): semi-stub\n", file, format);
|
|
#else /* STRING */
|
|
WARN("%p (\"%s\"): semi-stub\n", file, format);
|
|
#endif /* STRING */
|
|
#endif /* CONSOLE */
|
|
#endif /* WIDE_SCANF */
|
|
nch = _GETC_(file);
|
|
va_start(ap, format);
|
|
while (*format) {
|
|
/* a whitespace character in the format string causes scanf to read,
|
|
* but not store, all consecutive white-space characters in the input
|
|
* up to the next non-white-space character. One white space character
|
|
* in the input matches any number (including zero) and combination of
|
|
* white-space characters in the input. */
|
|
if (_ISSPACE_(*format)) {
|
|
/* skip whitespace */
|
|
while ((nch!=_EOF_) && _ISSPACE_(nch))
|
|
nch = _GETC_(file);
|
|
}
|
|
/* a format specification causes scanf to read and convert characters
|
|
* in the input into values of a specified type. The value is assigned
|
|
* to an argument in the argument list. Format specifications have
|
|
* the form %[*][width][{h | l | I64 | L}]type */
|
|
else if (*format == _L_('%')) {
|
|
int st = 0; int suppress = 0; int width = 0;
|
|
int base, number_signed;
|
|
int h_prefix = 0;
|
|
int l_prefix = 0;
|
|
int L_prefix = 0;
|
|
int w_prefix = 0;
|
|
int prefix_finished = 0;
|
|
/* int I64_prefix = 0; */
|
|
format++;
|
|
/* look for leading asterisk, which means 'suppress assignment of
|
|
* this field'. */
|
|
if (*format==_L_('*')) {
|
|
format++;
|
|
suppress=1;
|
|
}
|
|
/* look for width specification */
|
|
while (_ISDIGIT_(*format)) {
|
|
width*=10;
|
|
width+=*format++ - _L_('0');
|
|
}
|
|
if (width==0) width=-1; /* no width spec seen */
|
|
/* read prefix (if any) */
|
|
while (!prefix_finished) {
|
|
switch(*format) {
|
|
case _L_('h'): h_prefix = 1; break;
|
|
case _L_('l'): l_prefix = 1; break;
|
|
case _L_('w'): w_prefix = 1; break;
|
|
case _L_('L'): L_prefix = 1; break;
|
|
case _L_('I'):
|
|
if (*(format + 1) == _L_('6') &&
|
|
*(format + 2) == _L_('4')) {
|
|
/* I64_prefix = 1; */
|
|
format += 2;
|
|
FIXME("I64 prefix currently not implemented in fscanf/fwscanf");
|
|
}
|
|
break;
|
|
default:
|
|
prefix_finished = 1;
|
|
}
|
|
if (!prefix_finished) format++;
|
|
}
|
|
/* read type */
|
|
switch(*format) {
|
|
case _L_('%'): { /* read a percent symbol */
|
|
while ((nch!=_EOF_) && _ISSPACE_(nch))
|
|
nch = _GETC_(file);
|
|
if (nch==_L_('%')) {
|
|
suppress = 1; /* whoops no field to be read */
|
|
st = 1; /* but we got what we expected */
|
|
nch = _GETC_(file);
|
|
}
|
|
}
|
|
break;
|
|
case _L_('x'):
|
|
case _L_('X'): /* hexadecimal integer. */
|
|
base = 16; number_signed = 0;
|
|
goto number;
|
|
case _L_('o'): /* octal integer */
|
|
base = 8; number_signed = 0;
|
|
goto number;
|
|
case _L_('u'): /* unsigned decimal integer */
|
|
base = 10; number_signed = 0;
|
|
goto number;
|
|
case _L_('d'): /* signed decimal integer */
|
|
base = 10; number_signed = 1;
|
|
goto number;
|
|
case _L_('i'): /* generic integer */
|
|
base = 0; number_signed = 1;
|
|
number: {
|
|
/* read an integer */
|
|
long unsigned int cur = 0;
|
|
int negative = 0;
|
|
int seendigit=0;
|
|
/* skip initial whitespace */
|
|
while ((nch!=_EOF_) && _ISSPACE_(nch))
|
|
nch = _GETC_(file);
|
|
/* get sign */
|
|
if (number_signed && (nch == _L_('-') ||
|
|
nch == _L_('+'))) {
|
|
negative = (nch==_L_('-'));
|
|
nch = _GETC_(file);
|
|
if (width>0) width--;
|
|
}
|
|
/* look for leading indication of base */
|
|
if (width!=0 && nch == _L_('0')) {
|
|
nch = _GETC_(file);
|
|
if (width>0) width--;
|
|
seendigit=1;
|
|
if (width!=0 && (nch==_L_('x') || nch==_L_('X'))) {
|
|
if (base==0)
|
|
base=16;
|
|
if (base==16) {
|
|
nch = _GETC_(file);
|
|
if (width>0) width--;
|
|
seendigit=0;
|
|
}
|
|
} else if (base==0)
|
|
base = 8;
|
|
}
|
|
/* throw away leading zeros */
|
|
while (width!=0 && nch==_L_('0')) {
|
|
nch = _GETC_(file);
|
|
if (width>0) width--;
|
|
seendigit=1;
|
|
}
|
|
if (width!=0 && _CHAR2DIGIT_(nch, base)!=-1) {
|
|
cur = _CHAR2DIGIT_(nch, base);
|
|
nch = _GETC_(file);
|
|
if (width>0) width--;
|
|
seendigit=1;
|
|
}
|
|
/* read until no more digits */
|
|
while (width!=0 && (nch!=_EOF_) && _CHAR2DIGIT_(nch, base)!=-1) {
|
|
cur = cur*base + _CHAR2DIGIT_(nch, base);
|
|
nch = _GETC_(file);
|
|
if (width>0) width--;
|
|
seendigit=1;
|
|
}
|
|
/* okay, done! */
|
|
if (!seendigit) break; /* not a valid number */
|
|
st = 1;
|
|
if (!suppress) {
|
|
#define _SET_NUMBER_(type) *va_arg(ap, type*) = negative ? -cur : cur
|
|
if (number_signed) {
|
|
if (l_prefix) _SET_NUMBER_(long int);
|
|
else if (h_prefix) _SET_NUMBER_(short int);
|
|
else _SET_NUMBER_(int);
|
|
} else {
|
|
if (negative) {
|
|
WARN("Dropping sign in reading a negative number into an unsigned value");
|
|
negative = 0;
|
|
}
|
|
if (l_prefix) _SET_NUMBER_(unsigned long int);
|
|
else if (h_prefix)
|
|
_SET_NUMBER_(unsigned short int);
|
|
else _SET_NUMBER_(unsigned int);
|
|
}
|
|
}
|
|
}
|
|
break;
|
|
case _L_('e'):
|
|
case _L_('E'):
|
|
case _L_('f'):
|
|
case _L_('g'):
|
|
case _L_('G'): { /* read a float */
|
|
long double cur = 0;
|
|
int negative = 0;
|
|
/* skip initial whitespace */
|
|
while ((nch!=_EOF_) && _ISSPACE_(nch))
|
|
nch = _GETC_(file);
|
|
/* get sign. */
|
|
if (nch == _L_('-') || nch == _L_('+')) {
|
|
negative = (nch==_L_('-'));
|
|
if (width>0) width--;
|
|
if (width==0) break;
|
|
nch = _GETC_(file);
|
|
}
|
|
/* get first digit. */
|
|
if (!_ISDIGIT_(nch)) break;
|
|
cur = (nch - _L_('0')) * (negative ? -1 : 1);
|
|
nch = _GETC_(file);
|
|
if (width>0) width--;
|
|
/* read until no more digits */
|
|
while (width!=0 && (nch!=_EOF_) && _ISDIGIT_(nch)) {
|
|
cur = cur*10 + (nch - _L_('0'));
|
|
nch = _GETC_(file);
|
|
if (width>0) width--;
|
|
}
|
|
/* handle decimals */
|
|
if (width!=0 && nch == _L_('.')) {
|
|
float dec = 1;
|
|
nch = _GETC_(file);
|
|
if (width>0) width--;
|
|
while (width!=0 && (nch!=_EOF_) && _ISDIGIT_(nch)) {
|
|
dec /= 10;
|
|
cur += dec * (nch - _L_('0'));
|
|
nch = _GETC_(file);
|
|
if (width>0) width--;
|
|
}
|
|
}
|
|
/* handle exponent */
|
|
if (width!=0 && (nch == _L_('e') || nch == _L_('E'))) {
|
|
int exponent = 0, negexp = 0;
|
|
float expcnt;
|
|
nch = _GETC_(file);
|
|
if (width>0) width--;
|
|
/* possible sign on the exponent */
|
|
if (width!=0 && (nch==_L_('+') || nch==_L_('-'))) {
|
|
negexp = (nch==_L_('-'));
|
|
nch = _GETC_(file);
|
|
if (width>0) width--;
|
|
}
|
|
/* exponent digits */
|
|
while (width!=0 && (nch!=_EOF_) && _ISDIGIT_(nch)) {
|
|
exponent *= 10;
|
|
exponent += (nch - _L_('0'));
|
|
nch = _GETC_(file);
|
|
if (width>0) width--;
|
|
}
|
|
/* update 'cur' with this exponent. */
|
|
expcnt = negexp ? .1 : 10;
|
|
while (exponent!=0) {
|
|
if (exponent&1)
|
|
cur*=expcnt;
|
|
exponent/=2;
|
|
expcnt=expcnt*expcnt;
|
|
}
|
|
}
|
|
st = 1;
|
|
if (!suppress) {
|
|
if (L_prefix) _SET_NUMBER_(long double);
|
|
else if (l_prefix) _SET_NUMBER_(double);
|
|
else _SET_NUMBER_(float);
|
|
}
|
|
}
|
|
break;
|
|
/* According to
|
|
* http://msdn.microsoft.com/library/default.asp?url=/library/en-us/vclib/html/_crt_scanf_type_field_characters.asp
|
|
* 's' reads a character string in a call to fscanf
|
|
* and 'S' a wide character string and vice versa in a
|
|
* call to fwscanf. The 'h', 'w' and 'l' prefixes override
|
|
* this behaviour. 'h' forces reading char * but 'l' and 'w'
|
|
* force reading WCHAR. */
|
|
case _L_('s'):
|
|
if (w_prefix || l_prefix) goto widecharstring;
|
|
else if (h_prefix) goto charstring;
|
|
#ifdef WIDE_SCANF
|
|
else goto widecharstring;
|
|
#else /* WIDE_SCANF */
|
|
else goto charstring;
|
|
#endif /* WIDE_SCANF */
|
|
case _L_('S'):
|
|
if (w_prefix || l_prefix) goto widecharstring;
|
|
else if (h_prefix) goto charstring;
|
|
#ifdef WIDE_SCANF
|
|
else goto charstring;
|
|
#else /* WIDE_SCANF */
|
|
else goto widecharstring;
|
|
#endif /* WIDE_SCANF */
|
|
charstring: { /* read a word into a char */
|
|
char*str = suppress ? NULL : va_arg(ap, char*);
|
|
char*sptr = str;
|
|
/* skip initial whitespace */
|
|
while ((nch!=_EOF_) && _ISSPACE_(nch))
|
|
nch = _GETC_(file);
|
|
/* read until whitespace */
|
|
while (width!=0 && (nch!=_EOF_) && !_ISSPACE_(nch)) {
|
|
#ifdef WIDE_SCANF
|
|
if (!suppress) *sptr++ = _CONVERT_(nch);
|
|
#else /* WIDE_SCANF */
|
|
if (!suppress) *sptr++ = nch;
|
|
#endif /* WIDE_SCANF */
|
|
st++;
|
|
nch = _GETC_(file);
|
|
if (width>0) width--;
|
|
}
|
|
/* terminate */
|
|
if (!suppress) *sptr = 0;
|
|
}
|
|
break;
|
|
widecharstring: { /* read a word into a WCHAR * */
|
|
WCHAR*str =
|
|
suppress ? NULL : va_arg(ap, WCHAR*);
|
|
WCHAR*sptr = str;
|
|
/* skip initial whitespace */
|
|
while ((nch!=_EOF_) && _ISSPACE_(nch))
|
|
nch = _GETC_(file);
|
|
/* read until whitespace */
|
|
while (width!=0 && (nch!=_EOF_) && !_ISSPACE_(nch)) {
|
|
#ifdef WIDE_SCANF
|
|
if (!suppress) *sptr++ = nch;
|
|
#else /* WIDE_SCANF */
|
|
if (!suppress) *sptr++ = _CONVERT_(nch);
|
|
#endif /* WIDE_SCANF */
|
|
st++;
|
|
nch = _GETC_(file);
|
|
if (width>0) width--;
|
|
}
|
|
/* terminate */
|
|
if (!suppress) *sptr = 0;
|
|
}
|
|
break;
|
|
/* 'c' and 'C work analogously to 's' and 'S' as described
|
|
* above */
|
|
case _L_('c'):
|
|
if (w_prefix || l_prefix) goto widecharacter;
|
|
else if (h_prefix) goto character;
|
|
#ifdef WIDE_SCANF
|
|
else goto widecharacter;
|
|
#else /* WIDE_SCANF */
|
|
else goto character;
|
|
#endif /* WIDE_SCANF */
|
|
case _L_('C'):
|
|
if (w_prefix || l_prefix) goto widecharacter;
|
|
else if (h_prefix) goto character;
|
|
#ifdef WIDE_SCANF
|
|
else goto character;
|
|
#else /* WIDE_SCANF */
|
|
else goto widecharacter;
|
|
#endif /* WIDE_SCANF */
|
|
character: { /* read single character into char */
|
|
if (!suppress) {
|
|
char*c = va_arg(ap, char*);
|
|
#ifdef WIDE_SCANF
|
|
*c = _CONVERT_(nch);
|
|
#else /* WIDE_SCANF */
|
|
*c = nch;
|
|
#endif /* WIDE_SCANF */
|
|
st = 1;
|
|
}
|
|
nch = _GETC_(file);
|
|
}
|
|
break;
|
|
widecharacter: {
|
|
if (!suppress) { /* read single character into WCHAR */
|
|
WCHAR*c = va_arg(ap, WCHAR*);
|
|
#ifdef WIDE_SCANF
|
|
*c = nch;
|
|
#else /* WIDE_SCANF */
|
|
*c = _CONVERT_(nch);
|
|
#endif /* WIDE_SCANF */
|
|
st = 1;
|
|
}
|
|
nch = _GETC_(file);
|
|
}
|
|
break;
|
|
case _L_('n'): {
|
|
if (!suppress) {
|
|
int*n = va_arg(ap, int*);
|
|
*n = rd;
|
|
}
|
|
}
|
|
break;
|
|
case _L_('['): {
|
|
_CHAR_ *str = suppress ? NULL : va_arg(ap, _CHAR_*);
|
|
_CHAR_ *sptr = str;
|
|
RTL_BITMAP bitMask;
|
|
LPBYTE Mask;
|
|
int invert = 0; /* Set if we are NOT to find the chars */
|
|
|
|
/* Init our bitmap */
|
|
#ifdef WIDE_SCANF
|
|
Mask = HeapAlloc(GetProcessHeap(), HEAP_ZERO_MEMORY, 65536/8);
|
|
RtlInitializeBitMap(&bitMask, Mask, 65536);
|
|
#else /* WIDE_SCANF */
|
|
Mask = HeapAlloc(GetProcessHeap(), HEAP_ZERO_MEMORY, 256/8);
|
|
RtlInitializeBitMap(&bitMask, Mask, 256);
|
|
#endif /* WIDE_SCANF */
|
|
|
|
/* Read the format */
|
|
format++;
|
|
if(*format == '^') {
|
|
invert = 1;
|
|
format++;
|
|
}
|
|
if(*format == ']') {
|
|
RtlSetBits(&bitMask, ']', 1);
|
|
format++;
|
|
}
|
|
while(*format && (*format != ']')) {
|
|
if((*format == '-') && (*(format + 1) != ']')) {
|
|
int n = 0;
|
|
for(;(n + *(format - 1)) < *(format + 1); n++)
|
|
RtlSetBits(&bitMask, n + *(format - 1), 1);
|
|
format++;
|
|
}
|
|
RtlSetBits(&bitMask, *format, 1);
|
|
format++;
|
|
}
|
|
/* read until char is not suitable */
|
|
while ((width != 0) && (nch != _EOF_)) {
|
|
if(!invert) {
|
|
if(RtlAreBitsSet(&bitMask, nch, 1)) {
|
|
#ifdef WIDE_SCANF
|
|
if (!suppress) *sptr++ = _CONVERT_(nch);
|
|
#else /* WIDE_SCANF */
|
|
if (!suppress) *sptr++ = nch;
|
|
#endif /* WIDE_SCANF */
|
|
} else
|
|
break;
|
|
} else {
|
|
if(RtlAreBitsClear(&bitMask, nch, 1)) {
|
|
#ifdef WIDE_SCANF
|
|
if (!suppress) *sptr++ = _CONVERT_(nch);
|
|
#else /* WIDE_SCANF */
|
|
if (!suppress) *sptr++ = nch;
|
|
#endif /* WIDE_SCANF */
|
|
} else
|
|
break;
|
|
}
|
|
st++;
|
|
nch = _GETC_(file);
|
|
if (width>0) width--;
|
|
}
|
|
/* terminate */
|
|
if (!suppress) *sptr = 0;
|
|
HeapFree(GetProcessHeap(), 0, Mask);
|
|
}
|
|
break;
|
|
default: FIXME("unhandled: %%%c\n", *format);
|
|
/* From spec: "if a percent sign is followed by a character
|
|
* that has no meaning as a format-control character, that
|
|
* character and the following characters are treated as
|
|
* an ordinary sequence of characters, that is, a sequence
|
|
* of characters that must match the input. For example,
|
|
* to specify that a percent-sign character is to be input,
|
|
* use %%."
|
|
* LEAVING AS-IS because we catch bugs better that way. */
|
|
}
|
|
if (st && !suppress) rd++;
|
|
else if (!st) break;
|
|
}
|
|
/* a non-white-space character causes scanf to read, but not store,
|
|
* a matching non-white-space character. */
|
|
else {
|
|
/* check for character match */
|
|
if (nch == *format) {
|
|
nch = _GETC_(file);
|
|
} else break;
|
|
}
|
|
format++;
|
|
}
|
|
if (nch!=_EOF_) {
|
|
_UNGETC_(nch, file);
|
|
}
|
|
va_end(ap);
|
|
TRACE("returning %d\n", rd);
|
|
return rd;
|
|
}
|
|
|
|
/* Remove every macro this template defines, so that nothing leaks into the
 * including file and a following inclusion can set up another variant.
 * _SET_NUMBER_ is the store helper defined for the scanning function. */
#undef _L_
#undef _CHAR_
#undef _EOF_
#undef _ISSPACE_
#undef _ISDIGIT_
#undef _CONVERT_
#undef _CHAR2DIGIT_
#undef _GETC_
#undef _UNGETC_
#undef _FUNCTION_
#undef _SET_NUMBER_