vfwscanf.c revision 117250
1/*-
2 * Copyright (c) 1990, 1993
3 *	The Regents of the University of California.  All rights reserved.
4 *
5 * This code is derived from software contributed to Berkeley by
6 * Chris Torek.
7 *
8 * Redistribution and use in source and binary forms, with or without
9 * modification, are permitted provided that the following conditions
10 * are met:
11 * 1. Redistributions of source code must retain the above copyright
12 *    notice, this list of conditions and the following disclaimer.
13 * 2. Redistributions in binary form must reproduce the above copyright
14 *    notice, this list of conditions and the following disclaimer in the
15 *    documentation and/or other materials provided with the distribution.
16 * 3. All advertising materials mentioning features or use of this software
17 *    must display the following acknowledgement:
18 *	This product includes software developed by the University of
19 *	California, Berkeley and its contributors.
20 * 4. Neither the name of the University nor the names of its contributors
21 *    may be used to endorse or promote products derived from this software
22 *    without specific prior written permission.
23 *
24 * THIS SOFTWARE IS PROVIDED BY THE REGENTS AND CONTRIBUTORS ``AS IS'' AND
25 * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
26 * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
27 * ARE DISCLAIMED.  IN NO EVENT SHALL THE REGENTS OR CONTRIBUTORS BE LIABLE
28 * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
29 * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
30 * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
31 * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
32 * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
33 * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
34 * SUCH DAMAGE.
35 */
36
37#include <sys/cdefs.h>
38#if 0
39#if defined(LIBC_SCCS) && !defined(lint)
40static char sccsid[] = "@(#)vfscanf.c	8.1 (Berkeley) 6/4/93";
41#endif /* LIBC_SCCS and not lint */
42__FBSDID("FreeBSD: src/lib/libc/stdio/vfscanf.c,v 1.32 2003/06/28 09:03:05 das Exp ");
43#endif
44__FBSDID("$FreeBSD: head/lib/libc/stdio/vfwscanf.c 117250 2003-07-05 03:39:23Z tjr $");
45
46#include "namespace.h"
47#include <ctype.h>
48#include <inttypes.h>
49#include <stdio.h>
50#include <stdlib.h>
51#include <stddef.h>
52#include <stdarg.h>
53#include <string.h>
54#include <wchar.h>
55#include <wctype.h>
56#include "un-namespace.h"
57
58#include "libc_private.h"
59#include "local.h"
60
61#define FLOATING_POINT
62
63#ifdef FLOATING_POINT
64#include <locale.h>
65#endif
66
67#define	BUF		513	/* Maximum length of numeric string. */
68
69/*
70 * Flags used during conversion.
71 */
72#define	LONG		0x01	/* l: long or double */
73#define	LONGDBL		0x02	/* L: long double */
74#define	SHORT		0x04	/* h: short */
75#define	SUPPRESS	0x08	/* *: suppress assignment */
76#define	POINTER		0x10	/* p: void * (as hex) */
77#define	NOSKIP		0x20	/* [ or c: do not skip blanks */
78#define	LONGLONG	0x400	/* ll: long long (+ deprecated q: quad) */
79#define	INTMAXT		0x800	/* j: intmax_t */
80#define	PTRDIFFT	0x1000	/* t: ptrdiff_t */
81#define	SIZET		0x2000	/* z: size_t */
82#define	SHORTSHORT	0x4000	/* hh: char */
83#define	UNSIGNED	0x8000	/* %[oupxX] conversions */
84
85/*
86 * The following are used in integral conversions only:
87 * SIGNOK, NDIGITS, PFXOK, and NZDIGITS
88 */
89#define	SIGNOK		0x40	/* +/- is (still) legal */
90#define	NDIGITS		0x80	/* no digits detected */
91#define	PFXOK		0x100	/* 0x prefix is (still) legal */
92#define	NZDIGITS	0x200	/* no zero digits detected */
93
94/*
95 * Conversion types.
96 */
97#define	CT_CHAR		0	/* %c conversion */
98#define	CT_CCL		1	/* %[...] conversion */
99#define	CT_STRING	2	/* %s conversion */
100#define	CT_INT		3	/* %[dioupxX] conversion */
101#define	CT_FLOAT	4	/* %[efgEFG] conversion */
102
103static int parsefloat(FILE *, wchar_t *, wchar_t *);
104
105extern int __scanfdebug;
106
107#define	INCCL(_c)	\
108	(cclcompl ? (wmemchr(ccls, (_c), ccle - ccls) == NULL) : \
109	(wmemchr(ccls, (_c), ccle - ccls) != NULL))
110
111/*
112 * MT-safe version.
113 */
114int
115vfwscanf(FILE * __restrict fp, const wchar_t * __restrict fmt, va_list ap)
116{
117	int ret;
118
119	FLOCKFILE(fp);
120	ORIENT(fp, 1);
121	ret = __vfwscanf(fp, fmt, ap);
122	FUNLOCKFILE(fp);
123	return (ret);
124}
125
126/*
127 * Non-MT-safe version.
128 */
129int
130__vfwscanf(FILE * __restrict fp, const wchar_t * __restrict fmt, va_list ap)
131{
132	wint_t c;		/* character from format, or conversion */
133	size_t width;		/* field width, or 0 */
134	wchar_t *p;		/* points into all kinds of strings */
135	int n;			/* handy integer */
136	int flags;		/* flags as defined above */
137	wchar_t *p0;		/* saves original value of p when necessary */
138	int nassigned;		/* number of fields assigned */
139	int nconversions;	/* number of conversions */
140	int nread;		/* number of characters consumed from fp */
141	int base;		/* base argument to conversion function */
142	wchar_t buf[BUF];	/* buffer for numeric conversions */
143	const wchar_t *ccls;	/* character class start */
144	const wchar_t *ccle;	/* character class end */
145	int cclcompl;		/* ccl is complemented? */
146	wint_t wi;		/* handy wint_t */
147	char *mbp;		/* multibyte string pointer for %c %s %[ */
148	size_t nconv;		/* number of bytes in mb. conversion */
149	mbstate_t mbs;		/* multibyte state */
150	char mbbuf[MB_LEN_MAX];	/* temporary mb. character buffer */
151
152	/* `basefix' is used to avoid `if' tests in the integer scanner */
153	static short basefix[17] =
154		{ 10, 1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16 };
155
156	nassigned = 0;
157	nconversions = 0;
158	nread = 0;
159	ccls = ccle = NULL;
160	for (;;) {
161		c = *fmt++;
162		if (c == 0)
163			return (nassigned);
164		if (iswspace(c)) {
165			while ((c = __fgetwc(fp)) != WEOF &&
166			    iswspace(c))
167				;
168			if (c != WEOF)
169				__ungetwc(c, fp);
170			continue;
171		}
172		if (c != '%')
173			goto literal;
174		width = 0;
175		flags = 0;
176		/*
177		 * switch on the format.  continue if done;
178		 * break once format type is derived.
179		 */
180again:		c = *fmt++;
181		switch (c) {
182		case '%':
183literal:
184			if ((wi = __fgetwc(fp)) == WEOF)
185				goto input_failure;
186			if (wi != c) {
187				__ungetwc(wi, fp);
188				goto input_failure;
189			}
190			nread++;
191			continue;
192
193		case '*':
194			flags |= SUPPRESS;
195			goto again;
196		case 'j':
197			flags |= INTMAXT;
198			goto again;
199		case 'l':
200			if (flags & LONG) {
201				flags &= ~LONG;
202				flags |= LONGLONG;
203			} else
204				flags |= LONG;
205			goto again;
206		case 'q':
207			flags |= LONGLONG;	/* not quite */
208			goto again;
209		case 't':
210			flags |= PTRDIFFT;
211			goto again;
212		case 'z':
213			flags |= SIZET;
214			goto again;
215		case 'L':
216			flags |= LONGDBL;
217			goto again;
218		case 'h':
219			if (flags & SHORT) {
220				flags &= ~SHORT;
221				flags |= SHORTSHORT;
222			} else
223				flags |= SHORT;
224			goto again;
225
226		case '0': case '1': case '2': case '3': case '4':
227		case '5': case '6': case '7': case '8': case '9':
228			width = width * 10 + c - '0';
229			goto again;
230
231		/*
232		 * Conversions.
233		 */
234		case 'd':
235			c = CT_INT;
236			base = 10;
237			break;
238
239		case 'i':
240			c = CT_INT;
241			base = 0;
242			break;
243
244		case 'o':
245			c = CT_INT;
246			flags |= UNSIGNED;
247			base = 8;
248			break;
249
250		case 'u':
251			c = CT_INT;
252			flags |= UNSIGNED;
253			base = 10;
254			break;
255
256		case 'X':
257		case 'x':
258			flags |= PFXOK;	/* enable 0x prefixing */
259			c = CT_INT;
260			flags |= UNSIGNED;
261			base = 16;
262			break;
263
264#ifdef FLOATING_POINT
265		case 'A': case 'E': case 'F': case 'G':
266		case 'a': case 'e': case 'f': case 'g':
267			c = CT_FLOAT;
268			break;
269#endif
270
271		case 'S':
272			flags |= LONG;
273			/* FALLTHROUGH */
274		case 's':
275			c = CT_STRING;
276			break;
277
278		case '[':
279			ccls = fmt;
280			if (*fmt == '^') {
281				cclcompl = 1;
282				fmt++;
283			} else
284				cclcompl = 0;
285			if (*fmt == ']')
286				fmt++;
287			while (*fmt != '\0' && *fmt != ']')
288				fmt++;
289			ccle = fmt;
290			fmt++;
291			flags |= NOSKIP;
292			c = CT_CCL;
293			break;
294
295		case 'C':
296			flags |= LONG;
297			/* FALLTHROUGH */
298		case 'c':
299			flags |= NOSKIP;
300			c = CT_CHAR;
301			break;
302
303		case 'p':	/* pointer format is like hex */
304			flags |= POINTER | PFXOK;
305			c = CT_INT;		/* assumes sizeof(uintmax_t) */
306			flags |= UNSIGNED;	/*      >= sizeof(uintptr_t) */
307			base = 16;
308			break;
309
310		case 'n':
311			nconversions++;
312			if (flags & SUPPRESS)	/* ??? */
313				continue;
314			if (flags & SHORTSHORT)
315				*va_arg(ap, char *) = nread;
316			else if (flags & SHORT)
317				*va_arg(ap, short *) = nread;
318			else if (flags & LONG)
319				*va_arg(ap, long *) = nread;
320			else if (flags & LONGLONG)
321				*va_arg(ap, long long *) = nread;
322			else if (flags & INTMAXT)
323				*va_arg(ap, intmax_t *) = nread;
324			else if (flags & SIZET)
325				*va_arg(ap, size_t *) = nread;
326			else if (flags & PTRDIFFT)
327				*va_arg(ap, ptrdiff_t *) = nread;
328			else
329				*va_arg(ap, int *) = nread;
330			continue;
331
332		default:
333			goto match_failure;
334
335		/*
336		 * Disgusting backwards compatibility hack.	XXX
337		 */
338		case '\0':	/* compat */
339			return (EOF);
340		}
341
342		/*
343		 * Consume leading white space, except for formats
344		 * that suppress this.
345		 */
346		if ((flags & NOSKIP) == 0) {
347			while ((wi = __fgetwc(fp)) != WEOF && iswspace(wi))
348				nread++;
349			if (wi == WEOF)
350				goto input_failure;
351			__ungetwc(wi, fp);
352		}
353
354		/*
355		 * Do the conversion.
356		 */
357		switch (c) {
358
359		case CT_CHAR:
360			/* scan arbitrary characters (sets NOSKIP) */
361			if (width == 0)
362				width = 1;
363			if (flags & LONG) {
364				if (!(flags & SUPPRESS))
365					p = va_arg(ap, wchar_t *);
366				n = 0;
367				while (width-- != 0 &&
368				    (wi = __fgetwc(fp)) != WEOF) {
369					if (!(flags & SUPPRESS))
370						*p++ = (wchar_t)wi;
371					n++;
372				}
373				if (n == 0)
374					goto input_failure;
375				nread += n;
376				if (!(flags & SUPPRESS))
377					nassigned++;
378			} else {
379				if (!(flags & SUPPRESS))
380					mbp = va_arg(ap, char *);
381				n = 0;
382				memset(&mbs, 0, sizeof(mbs));
383				while (width != 0 &&
384				    (wi = __fgetwc(fp)) != WEOF) {
385					if (width >= MB_CUR_MAX &&
386					    !(flags & SUPPRESS)) {
387						nconv = wcrtomb(mbp, wi, &mbs);
388						if (nconv == (size_t)-1)
389							goto input_failure;
390					} else {
391						nconv = wcrtomb(mbbuf, wi,
392						    &mbs);
393						if (nconv == (size_t)-1)
394							goto input_failure;
395						if (nconv > width) {
396							__ungetwc(wi, fp);
397							break;
398						}
399						if (!(flags & SUPPRESS))
400							memcpy(mbp, mbbuf,
401							    nconv);
402					}
403					if (!(flags & SUPPRESS))
404						mbp += nconv;
405					width -= nconv;
406					n++;
407				}
408				if (n == 0)
409					goto input_failure;
410				nread += n;
411				if (!(flags & SUPPRESS))
412					nassigned++;
413			}
414			nconversions++;
415			break;
416
417		case CT_CCL:
418			/* scan a (nonempty) character class (sets NOSKIP) */
419			if (width == 0)
420				width = (size_t)~0;	/* `infinity' */
421			/* take only those things in the class */
422			if ((flags & SUPPRESS) && (flags & LONG)) {
423				n = 0;
424				while ((wi = __fgetwc(fp)) != WEOF &&
425				    width-- != 0 && INCCL(wi))
426					n++;
427				if (wi != WEOF)
428					__ungetwc(wi, fp);
429				if (n == 0)
430					goto match_failure;
431			} else if (flags & LONG) {
432				p0 = p = va_arg(ap, wchar_t *);
433				while ((wi = __fgetwc(fp)) != WEOF &&
434				    width-- != 0 && INCCL(wi))
435					*p++ = (wchar_t)wi;
436				if (wi != WEOF)
437					__ungetwc(wi, fp);
438				n = p - p0;
439				if (n == 0)
440					goto match_failure;
441				*p = 0;
442				nassigned++;
443			} else {
444				if (!(flags & SUPPRESS))
445					mbp = va_arg(ap, char *);
446				n = 0;
447				memset(&mbs, 0, sizeof(mbs));
448				while ((wi = __fgetwc(fp)) != WEOF &&
449				    width != 0 && INCCL(wi)) {
450					if (width >= MB_CUR_MAX &&
451					   !(flags & SUPPRESS)) {
452						nconv = wcrtomb(mbp, wi, &mbs);
453						if (nconv == (size_t)-1)
454							goto input_failure;
455					} else {
456						nconv = wcrtomb(mbbuf, wi,
457						    &mbs);
458						if (nconv == (size_t)-1)
459							goto input_failure;
460						if (nconv > width)
461							break;
462						if (!(flags & SUPPRESS))
463							memcpy(mbp, mbbuf,
464							    nconv);
465					}
466					if (!(flags & SUPPRESS))
467						mbp += nconv;
468					width -= nconv;
469					n++;
470				}
471				if (wi != WEOF)
472					__ungetwc(wi, fp);
473				if (!(flags & SUPPRESS)) {
474					*mbp = 0;
475					nassigned++;
476				}
477			}
478			nread += n;
479			nconversions++;
480			break;
481
482		case CT_STRING:
483			/* like CCL, but zero-length string OK, & no NOSKIP */
484			if (width == 0)
485				width = (size_t)~0;
486			if ((flags & SUPPRESS) && (flags & LONG)) {
487				while ((wi = __fgetwc(fp)) != WEOF &&
488				    width-- != 0 &&
489				    !iswspace(wi))
490					nread++;
491				if (wi != WEOF)
492					__ungetwc(wi, fp);
493			} else if (flags & LONG) {
494				p0 = p = va_arg(ap, wchar_t *);
495				while ((wi = __fgetwc(fp)) != WEOF &&
496				    width-- != 0 &&
497				    !iswspace(wi)) {
498					*p++ = (wchar_t)wi;
499					nread++;
500				}
501				if (wi != WEOF)
502					__ungetwc(wi, fp);
503				*p = '\0';
504				nassigned++;
505			} else {
506				if (!(flags & SUPPRESS))
507					mbp = va_arg(ap, char *);
508				memset(&mbs, 0, sizeof(mbs));
509				while ((wi = __fgetwc(fp)) != WEOF &&
510				    width != 0 &&
511				    !iswspace(wi)) {
512					if (width >= MB_CUR_MAX &&
513					    !(flags & SUPPRESS)) {
514						nconv = wcrtomb(mbp, wi, &mbs);
515						if (nconv == (size_t)-1)
516							goto input_failure;
517					} else {
518						nconv = wcrtomb(mbbuf, wi,
519						    &mbs);
520						if (nconv == (size_t)-1)
521							goto input_failure;
522						if (nconv > width)
523							break;
524						if (!(flags & SUPPRESS))
525							memcpy(mbp, mbbuf,
526							    nconv);
527					}
528					if (!(flags & SUPPRESS))
529						mbp += nconv;
530					width -= nconv;
531					nread++;
532				}
533				if (wi != WEOF)
534					__ungetwc(wi, fp);
535				if (!(flags & SUPPRESS)) {
536					*mbp = 0;
537					nassigned++;
538				}
539			}
540			nconversions++;
541			continue;
542
543		case CT_INT:
544			/* scan an integer as if by the conversion function */
545			if (width == 0 || width > sizeof(buf) /
546			    sizeof(*buf) - 1)
547				width = sizeof(buf) / sizeof(*buf) - 1;
548			flags |= SIGNOK | NDIGITS | NZDIGITS;
549			for (p = buf; width; width--) {
550				c = __fgetwc(fp);
551				/*
552				 * Switch on the character; `goto ok'
553				 * if we accept it as a part of number.
554				 */
555				switch (c) {
556
557				/*
558				 * The digit 0 is always legal, but is
559				 * special.  For %i conversions, if no
560				 * digits (zero or nonzero) have been
561				 * scanned (only signs), we will have
562				 * base==0.  In that case, we should set
563				 * it to 8 and enable 0x prefixing.
564				 * Also, if we have not scanned zero digits
565				 * before this, do not turn off prefixing
566				 * (someone else will turn it off if we
567				 * have scanned any nonzero digits).
568				 */
569				case '0':
570					if (base == 0) {
571						base = 8;
572						flags |= PFXOK;
573					}
574					if (flags & NZDIGITS)
575					    flags &= ~(SIGNOK|NZDIGITS|NDIGITS);
576					else
577					    flags &= ~(SIGNOK|PFXOK|NDIGITS);
578					goto ok;
579
580				/* 1 through 7 always legal */
581				case '1': case '2': case '3':
582				case '4': case '5': case '6': case '7':
583					base = basefix[base];
584					flags &= ~(SIGNOK | PFXOK | NDIGITS);
585					goto ok;
586
587				/* digits 8 and 9 ok iff decimal or hex */
588				case '8': case '9':
589					base = basefix[base];
590					if (base <= 8)
591						break;	/* not legal here */
592					flags &= ~(SIGNOK | PFXOK | NDIGITS);
593					goto ok;
594
595				/* letters ok iff hex */
596				case 'A': case 'B': case 'C':
597				case 'D': case 'E': case 'F':
598				case 'a': case 'b': case 'c':
599				case 'd': case 'e': case 'f':
600					/* no need to fix base here */
601					if (base <= 10)
602						break;	/* not legal here */
603					flags &= ~(SIGNOK | PFXOK | NDIGITS);
604					goto ok;
605
606				/* sign ok only as first character */
607				case '+': case '-':
608					if (flags & SIGNOK) {
609						flags &= ~SIGNOK;
610						goto ok;
611					}
612					break;
613
614				/* x ok iff flag still set & 2nd char */
615				case 'x': case 'X':
616					if (flags & PFXOK && p == buf + 1) {
617						base = 16;	/* if %i */
618						flags &= ~PFXOK;
619						goto ok;
620					}
621					break;
622				}
623
624				/*
625				 * If we got here, c is not a legal character
626				 * for a number.  Stop accumulating digits.
627				 */
628				if (c != WEOF)
629					__ungetwc(c, fp);
630				break;
631		ok:
632				/*
633				 * c is legal: store it and look at the next.
634				 */
635				*p++ = (wchar_t)c;
636			}
637			/*
638			 * If we had only a sign, it is no good; push
639			 * back the sign.  If the number ends in `x',
640			 * it was [sign] '0' 'x', so push back the x
641			 * and treat it as [sign] '0'.
642			 */
643			if (flags & NDIGITS) {
644				if (p > buf)
645					__ungetwc(*--p, fp);
646				goto match_failure;
647			}
648			c = p[-1];
649			if (c == 'x' || c == 'X') {
650				--p;
651				__ungetwc(c, fp);
652			}
653			if ((flags & SUPPRESS) == 0) {
654				uintmax_t res;
655
656				*p = 0;
657				if ((flags & UNSIGNED) == 0)
658				    res = wcstoimax(buf, NULL, base);
659				else
660				    res = wcstoumax(buf, NULL, base);
661				if (flags & POINTER)
662					*va_arg(ap, void **) =
663							(void *)(uintptr_t)res;
664				else if (flags & SHORTSHORT)
665					*va_arg(ap, char *) = res;
666				else if (flags & SHORT)
667					*va_arg(ap, short *) = res;
668				else if (flags & LONG)
669					*va_arg(ap, long *) = res;
670				else if (flags & LONGLONG)
671					*va_arg(ap, long long *) = res;
672				else if (flags & INTMAXT)
673					*va_arg(ap, intmax_t *) = res;
674				else if (flags & PTRDIFFT)
675					*va_arg(ap, ptrdiff_t *) = res;
676				else if (flags & SIZET)
677					*va_arg(ap, size_t *) = res;
678				else
679					*va_arg(ap, int *) = res;
680				nassigned++;
681			}
682			nread += p - buf;
683			nconversions++;
684			break;
685
686#ifdef FLOATING_POINT
687		case CT_FLOAT:
688			/* scan a floating point number as if by strtod */
689			if (width == 0 || width > sizeof(buf) /
690			    sizeof(*buf) - 1)
691				width = sizeof(buf) / sizeof(*buf) - 1;
692			if ((width = parsefloat(fp, buf, buf + width)) == 0)
693				goto match_failure;
694			if ((flags & SUPPRESS) == 0) {
695				if (flags & LONGDBL) {
696					long double res = wcstold(buf, &p);
697					*va_arg(ap, long double *) = res;
698				} else if (flags & LONG) {
699					double res = wcstod(buf, &p);
700					*va_arg(ap, double *) = res;
701				} else {
702					float res = wcstof(buf, &p);
703					*va_arg(ap, float *) = res;
704				}
705				if (__scanfdebug && p - buf != width)
706					abort();
707				nassigned++;
708			}
709			nread += width;
710			nconversions++;
711			break;
712#endif /* FLOATING_POINT */
713		}
714	}
715input_failure:
716	return (nconversions != 0 ? nassigned : EOF);
717match_failure:
718	return (nassigned);
719}
720
721#ifdef FLOATING_POINT
722static int
723parsefloat(FILE *fp, wchar_t *buf, wchar_t *end)
724{
725	wchar_t *commit, *p;
726	int infnanpos = 0;
727	enum {
728		S_START, S_GOTSIGN, S_INF, S_NAN, S_MAYBEHEX,
729		S_DIGITS, S_FRAC, S_EXP, S_EXPDIGITS
730	} state = S_START;
731	wchar_t c;
732	wchar_t decpt = (wchar_t)(unsigned char)*localeconv()->decimal_point;
733	_Bool gotmantdig = 0, ishex = 0;
734
735	/*
736	 * We set commit = p whenever the string we have read so far
737	 * constitutes a valid representation of a floating point
738	 * number by itself.  At some point, the parse will complete
739	 * or fail, and we will ungetc() back to the last commit point.
740	 * To ensure that the file offset gets updated properly, it is
741	 * always necessary to read at least one character that doesn't
742	 * match; thus, we can't short-circuit "infinity" or "nan(...)".
743	 */
744	commit = buf - 1;
745	c = WEOF;
746	for (p = buf; p < end; ) {
747		if ((c = __fgetwc(fp)) == WEOF)
748			break;
749reswitch:
750		switch (state) {
751		case S_START:
752			state = S_GOTSIGN;
753			if (c == '-' || c == '+')
754				break;
755			else
756				goto reswitch;
757		case S_GOTSIGN:
758			switch (c) {
759			case '0':
760				state = S_MAYBEHEX;
761				commit = p;
762				break;
763			case 'I':
764			case 'i':
765				state = S_INF;
766				break;
767			case 'N':
768			case 'n':
769				state = S_NAN;
770				break;
771			default:
772				state = S_DIGITS;
773				goto reswitch;
774			}
775			break;
776		case S_INF:
777			if (infnanpos > 6 ||
778			    (c != "nfinity"[infnanpos] &&
779			     c != "NFINITY"[infnanpos]))
780				goto parsedone;
781			if (infnanpos == 1 || infnanpos == 6)
782				commit = p;	/* inf or infinity */
783			infnanpos++;
784			break;
785		case S_NAN:
786			switch (infnanpos) {
787			case -1:	/* XXX kludge to deal with nan(...) */
788				goto parsedone;
789			case 0:
790				if (c != 'A' && c != 'a')
791					goto parsedone;
792				break;
793			case 1:
794				if (c != 'N' && c != 'n')
795					goto parsedone;
796				else
797					commit = p;
798				break;
799			case 2:
800				if (c != '(')
801					goto parsedone;
802				break;
803			default:
804				if (c == ')') {
805					commit = p;
806					infnanpos = -2;
807				} else if (!iswalnum(c) && c != '_')
808					goto parsedone;
809				break;
810			}
811			infnanpos++;
812			break;
813		case S_MAYBEHEX:
814			state = S_DIGITS;
815			if (c == 'X' || c == 'x') {
816				ishex = 1;
817				break;
818			} else {	/* we saw a '0', but no 'x' */
819				gotmantdig = 1;
820				goto reswitch;
821			}
822		case S_DIGITS:
823			if (ishex && iswxdigit(c) || iswdigit(c))
824				gotmantdig = 1;
825			else {
826				state = S_FRAC;
827				if (c != decpt)
828					goto reswitch;
829			}
830			if (gotmantdig)
831				commit = p;
832			break;
833		case S_FRAC:
834			if ((c == 'E' || c == 'e') && !ishex ||
835			    (c == 'P' || c == 'p') && ishex) {
836				if (!gotmantdig)
837					goto parsedone;
838				else
839					state = S_EXP;
840			} else if (ishex && iswxdigit(c) || iswdigit(c)) {
841				commit = p;
842				gotmantdig = 1;
843			} else
844				goto parsedone;
845			break;
846		case S_EXP:
847			state = S_EXPDIGITS;
848			if (c == '-' || c == '+')
849				break;
850			else
851				goto reswitch;
852		case S_EXPDIGITS:
853			if (iswdigit(c))
854				commit = p;
855			else
856				goto parsedone;
857			break;
858		default:
859			abort();
860		}
861		*p++ = c;
862		c = WEOF;
863	}
864
865parsedone:
866	if (c != WEOF)
867		__ungetwc(c, fp);
868	while (commit < --p)
869		__ungetwc(*p, fp);
870	*++commit = '\0';
871	return (commit - buf);
872}
873#endif
874