master
  1#include "stdio_impl.h"
  2#include <errno.h>
  3#include <ctype.h>
  4#include <limits.h>
  5#include <string.h>
  6#include <stdarg.h>
  7#include <stddef.h>
  8#include <stdlib.h>
  9#include <wchar.h>
 10#include <inttypes.h>
 11#ifdef __wasilibc_unmodified_upstream // Changes to optimize printf/scanf when long double isn't needed
 12#else
 13#include "printscan.h"
 14#endif
 15
 16/* Convenient bit representation for modifier flags, which all fall
 17 * within 31 codepoints of the space character. */
 18
 19#define ALT_FORM   (1U<<'#'-' ')
 20#define ZERO_PAD   (1U<<'0'-' ')
 21#define LEFT_ADJ   (1U<<'-'-' ')
 22#define PAD_POS    (1U<<' '-' ')
 23#define MARK_POS   (1U<<'+'-' ')
 24#define GROUPED    (1U<<'\''-' ')
 25
 26#define FLAGMASK (ALT_FORM|ZERO_PAD|LEFT_ADJ|PAD_POS|MARK_POS|GROUPED)
 27
 28/* State machine to accept length modifiers + conversion specifiers.
 29 * Result is 0 on failure, or an argument type to pop on success. */
 30
 31enum {
 32	BARE, LPRE, LLPRE, HPRE, HHPRE, BIGLPRE,
 33	ZTPRE, JPRE,
 34	STOP,
 35	PTR, INT, UINT, ULLONG,
 36	LONG, ULONG,
 37	SHORT, USHORT, CHAR, UCHAR,
 38	LLONG, SIZET, IMAX, UMAX, PDIFF, UIPTR,
 39	DBL, LDBL,
 40	NOARG,
 41	MAXSTATE
 42};
 43
 44#define S(x) [(x)-'A']
 45
 46static const unsigned char states[]['z'-'A'+1] = {
 47	{ /* 0: bare types */
 48		S('d') = INT, S('i') = INT,
 49		S('o') = UINT, S('u') = UINT, S('x') = UINT, S('X') = UINT,
 50		S('e') = DBL, S('f') = DBL, S('g') = DBL, S('a') = DBL,
 51		S('E') = DBL, S('F') = DBL, S('G') = DBL, S('A') = DBL,
 52		S('c') = INT, S('C') = UINT,
 53		S('s') = PTR, S('S') = PTR, S('p') = UIPTR, S('n') = PTR,
 54		S('m') = NOARG,
 55		S('l') = LPRE, S('h') = HPRE, S('L') = BIGLPRE,
 56		S('z') = ZTPRE, S('j') = JPRE, S('t') = ZTPRE,
 57	}, { /* 1: l-prefixed */
 58		S('d') = LONG, S('i') = LONG,
 59		S('o') = ULONG, S('u') = ULONG, S('x') = ULONG, S('X') = ULONG,
 60		S('e') = DBL, S('f') = DBL, S('g') = DBL, S('a') = DBL,
 61		S('E') = DBL, S('F') = DBL, S('G') = DBL, S('A') = DBL,
 62		S('c') = UINT, S('s') = PTR, S('n') = PTR,
 63		S('l') = LLPRE,
 64	}, { /* 2: ll-prefixed */
 65		S('d') = LLONG, S('i') = LLONG,
 66		S('o') = ULLONG, S('u') = ULLONG,
 67		S('x') = ULLONG, S('X') = ULLONG,
 68		S('n') = PTR,
 69	}, { /* 3: h-prefixed */
 70		S('d') = SHORT, S('i') = SHORT,
 71		S('o') = USHORT, S('u') = USHORT,
 72		S('x') = USHORT, S('X') = USHORT,
 73		S('n') = PTR,
 74		S('h') = HHPRE,
 75	}, { /* 4: hh-prefixed */
 76		S('d') = CHAR, S('i') = CHAR,
 77		S('o') = UCHAR, S('u') = UCHAR,
 78		S('x') = UCHAR, S('X') = UCHAR,
 79		S('n') = PTR,
 80	}, { /* 5: L-prefixed */
 81		S('e') = LDBL, S('f') = LDBL, S('g') = LDBL, S('a') = LDBL,
 82		S('E') = LDBL, S('F') = LDBL, S('G') = LDBL, S('A') = LDBL,
 83		S('n') = PTR,
 84	}, { /* 6: z- or t-prefixed (assumed to be same size) */
 85		S('d') = PDIFF, S('i') = PDIFF,
 86		S('o') = SIZET, S('u') = SIZET,
 87		S('x') = SIZET, S('X') = SIZET,
 88		S('n') = PTR,
 89	}, { /* 7: j-prefixed */
 90		S('d') = IMAX, S('i') = IMAX,
 91		S('o') = UMAX, S('u') = UMAX,
 92		S('x') = UMAX, S('X') = UMAX,
 93		S('n') = PTR,
 94	}
 95};
 96
 97#define OOB(x) ((unsigned)(x)-'A' > 'z'-'A')
 98
 99union arg
100{
101	uintmax_t i;
102#if !defined(__wasilibc_printscan_no_floating_point)
103#if defined(__wasilibc_printscan_no_long_double)
104	long_double f;
105#else
106	long double f;
107#endif
108#endif
109	void *p;
110};
111
112static void pop_arg(union arg *arg, int type, va_list *ap)
113{
114	switch (type) {
115	       case PTR:	arg->p = va_arg(*ap, void *);
116	break; case INT:	arg->i = va_arg(*ap, int);
117	break; case UINT:	arg->i = va_arg(*ap, unsigned int);
118	break; case LONG:	arg->i = va_arg(*ap, long);
119	break; case ULONG:	arg->i = va_arg(*ap, unsigned long);
120	break; case ULLONG:	arg->i = va_arg(*ap, unsigned long long);
121	break; case SHORT:	arg->i = (short)va_arg(*ap, int);
122	break; case USHORT:	arg->i = (unsigned short)va_arg(*ap, int);
123	break; case CHAR:	arg->i = (signed char)va_arg(*ap, int);
124	break; case UCHAR:	arg->i = (unsigned char)va_arg(*ap, int);
125	break; case LLONG:	arg->i = va_arg(*ap, long long);
126	break; case SIZET:	arg->i = va_arg(*ap, size_t);
127	break; case IMAX:	arg->i = va_arg(*ap, intmax_t);
128	break; case UMAX:	arg->i = va_arg(*ap, uintmax_t);
129	break; case PDIFF:	arg->i = va_arg(*ap, ptrdiff_t);
130	break; case UIPTR:	arg->i = (uintptr_t)va_arg(*ap, void *);
131#if defined(__wasilibc_printscan_no_floating_point)
132	break; case DBL:
133	break; case LDBL:	floating_point_not_supported();
134#else
135	break; case DBL:	arg->f = va_arg(*ap, double);
136#if defined(__wasilibc_printscan_no_long_double)
137	break; case LDBL:	long_double_not_supported();
138#else
139	break; case LDBL:	arg->f = va_arg(*ap, long double);
140#endif
141#endif
142	}
143}
144
/* Write the first l wide characters of s to f, one fputwc call per
 * character, giving up as soon as the stream's error indicator is set. */
static void out(FILE *f, const wchar_t *s, size_t l)
{
	for (; l && !ferror(f); l--, s++)
		fputwc(*s, f);
}
149
150static void pad(FILE *f, int n, int fl)
151{
152	if ((fl & LEFT_ADJ) || !n || ferror(f)) return;
153	fprintf(f, "%*s", n, "");
154}
155
/* Parse the run of decimal digits at **s as a non-negative int and
 * advance *s past every digit consumed.  Returns 0 when there are no
 * digits.  If the value does not fit in an int the result is -1; the
 * remaining digits are still skipped and the -1 is sticky. */
static int getint(wchar_t **s) {
	int value = 0;

	while (iswdigit(**s)) {
		int digit = **s - '0';

		if (value < 0 || value > INT_MAX/10 || digit > INT_MAX - 10*value)
			value = -1;
		else
			value = 10*value + digit;
		++*s;
	}
	return value;
}
164
/* Length modifier placed in front of the conversion character when a
 * numeric directive is rebuilt as a narrow format string.  Indexed by
 * the lower-cased conversion letter minus 'a'; letters not listed map
 * to 0. */
static const char sizeprefix['y'-'a'] = {
	/* floating-point conversions */
	['a'-'a'] = 'L',
	['e'-'a'] = 'L',
	['f'-'a'] = 'L',
	['g'-'a'] = 'L',
	/* integer and pointer conversions */
	['d'-'a'] = 'j',
	['i'-'a'] = 'j',
	['o'-'a'] = 'j',
	['p'-'a'] = 'j',
	['u'-'a'] = 'j',
	['x'-'a'] = 'j',
};
170
171static int wprintf_core(FILE *f, const wchar_t *fmt, va_list *ap, union arg *nl_arg, int *nl_type)
172{
173	wchar_t *a, *z, *s=(wchar_t *)fmt;
174	unsigned l10n=0, fl;
175	int w, p, xp;
176	union arg arg;
177	int argpos;
178	unsigned st, ps;
179	int cnt=0, l=0;
180	int i;
181	int t;
182	char *bs;
183	char charfmt[16];
184	wchar_t wc;
185
186	for (;;) {
187		/* This error is only specified for snprintf, but since it's
188		 * unspecified for other forms, do the same. Stop immediately
189		 * on overflow; otherwise %n could produce wrong results. */
190		if (l > INT_MAX - cnt) goto overflow;
191
192		/* Update output count, end loop when fmt is exhausted */
193		cnt += l;
194		if (!*s) break;
195
196		/* Handle literal text and %% format specifiers */
197		for (a=s; *s && *s!='%'; s++);
198		for (z=s; s[0]=='%' && s[1]=='%'; z++, s+=2);
199		if (z-a > INT_MAX-cnt) goto overflow;
200		l = z-a;
201		if (f) out(f, a, l);
202		if (l) continue;
203
204		if (iswdigit(s[1]) && s[2]=='$') {
205			l10n=1;
206			argpos = s[1]-'0';
207			s+=3;
208		} else {
209			argpos = -1;
210			s++;
211		}
212
213		/* Read modifier flags */
214		for (fl=0; (unsigned)*s-' '<32 && (FLAGMASK&(1U<<*s-' ')); s++)
215			fl |= 1U<<*s-' ';
216
217		/* Read field width */
218		if (*s=='*') {
219			if (iswdigit(s[1]) && s[2]=='$') {
220				l10n=1;
221				nl_type[s[1]-'0'] = INT;
222				w = nl_arg[s[1]-'0'].i;
223				s+=3;
224			} else if (!l10n) {
225				w = f ? va_arg(*ap, int) : 0;
226				s++;
227			} else goto inval;
228			if (w<0) fl|=LEFT_ADJ, w=-w;
229		} else if ((w=getint(&s))<0) goto overflow;
230
231		/* Read precision */
232		if (*s=='.' && s[1]=='*') {
233			if (isdigit(s[2]) && s[3]=='$') {
234				nl_type[s[2]-'0'] = INT;
235				p = nl_arg[s[2]-'0'].i;
236				s+=4;
237			} else if (!l10n) {
238				p = f ? va_arg(*ap, int) : 0;
239				s+=2;
240			} else goto inval;
241			xp = (p>=0);
242		} else if (*s=='.') {
243			s++;
244			p = getint(&s);
245			xp = 1;
246		} else {
247			p = -1;
248			xp = 0;
249		}
250
251		/* Format specifier state machine */
252		st=0;
253		do {
254			if (OOB(*s)) goto inval;
255			ps=st;
256			st=states[st]S(*s++);
257		} while (st-1<STOP);
258		if (!st) goto inval;
259
260		/* Check validity of argument type (nl/normal) */
261		if (st==NOARG) {
262			if (argpos>=0) goto inval;
263		} else {
264			if (argpos>=0) nl_type[argpos]=st, arg=nl_arg[argpos];
265			else if (f) pop_arg(&arg, st, ap);
266			else return 0;
267		}
268
269		if (!f) continue;
270
271		/* Do not process any new directives once in error state. */
272		if (ferror(f)) return -1;
273
274		t = s[-1];
275		if (ps && (t&15)==3) t&=~32;
276
277		switch (t) {
278		case 'n':
279			switch(ps) {
280			case BARE: *(int *)arg.p = cnt; break;
281			case LPRE: *(long *)arg.p = cnt; break;
282			case LLPRE: *(long long *)arg.p = cnt; break;
283			case HPRE: *(unsigned short *)arg.p = cnt; break;
284			case HHPRE: *(unsigned char *)arg.p = cnt; break;
285			case ZTPRE: *(size_t *)arg.p = cnt; break;
286			case JPRE: *(uintmax_t *)arg.p = cnt; break;
287			}
288			continue;
289		case 'c':
290		case 'C':
291			if (w<1) w=1;
292			pad(f, w-1, fl);
293			out(f, &(wchar_t){t=='C' ? arg.i : btowc(arg.i)}, 1);
294			pad(f, w-1, fl^LEFT_ADJ);
295			l = w;
296			continue;
297		case 'S':
298			a = arg.p;
299			z = a + wcsnlen(a, p<0 ? INT_MAX : p);
300			if (p<0 && *z) goto overflow;
301			p = z-a;
302			if (w<p) w=p;
303			pad(f, w-p, fl);
304			out(f, a, p);
305			pad(f, w-p, fl^LEFT_ADJ);
306			l=w;
307			continue;
308		case 'm':
309			arg.p = strerror(errno);
310		case 's':
311			if (!arg.p) arg.p = "(null)";
312			bs = arg.p;
313			for (i=l=0; l<(p<0?INT_MAX:p) && (i=mbtowc(&wc, bs, MB_LEN_MAX))>0; bs+=i, l++);
314			if (i<0) return -1;
315			if (p<0 && *bs) goto overflow;
316			p=l;
317			if (w<p) w=p;
318			pad(f, w-p, fl);
319			bs = arg.p;
320			while (l--) {
321				i=mbtowc(&wc, bs, MB_LEN_MAX);
322				bs+=i;
323				out(f, &wc, 1);
324			}
325			pad(f, w-p, fl^LEFT_ADJ);
326			l=w;
327			continue;
328		}
329
330		if (xp && p<0) goto overflow;
331#if defined(__wasilibc_printscan_no_long_double)
332		// Omit the 'L' modifier for floating-point cases.
333		switch (t|32) {
334		case 'a': case 'e': case 'f': case 'g':
335			snprintf(charfmt, sizeof charfmt, "%%%s%s%s%s%s*.*%c",
336				"#"+!(fl & ALT_FORM),
337				"+"+!(fl & MARK_POS),
338				"-"+!(fl & LEFT_ADJ),
339				" "+!(fl & PAD_POS),
340				"0"+!(fl & ZERO_PAD),
341				t);
342
343			l = fprintf(f, charfmt, w, p, arg.f);
344			break;
345		case 'd': case 'i': case 'o': case 'u': case 'x': case 'p':
346			snprintf(charfmt, sizeof charfmt, "%%%s%s%s%s%s*.*%c%c",
347				"#"+!(fl & ALT_FORM),
348				"+"+!(fl & MARK_POS),
349				"-"+!(fl & LEFT_ADJ),
350				" "+!(fl & PAD_POS),
351				"0"+!(fl & ZERO_PAD),
352				sizeprefix[(t|32)-'a'], t);
353
354			l = fprintf(f, charfmt, w, p, arg.i);
355			break;
356		}
357#else
358		snprintf(charfmt, sizeof charfmt, "%%%s%s%s%s%s*.*%c%c",
359			"#"+!(fl & ALT_FORM),
360			"+"+!(fl & MARK_POS),
361			"-"+!(fl & LEFT_ADJ),
362			" "+!(fl & PAD_POS),
363			"0"+!(fl & ZERO_PAD),
364			sizeprefix[(t|32)-'a'], t);
365
366		switch (t|32) {
367#if !defined(__wasilibc_printscan_no_floating_point)
368		case 'a': case 'e': case 'f': case 'g':
369			l = fprintf(f, charfmt, w, p, arg.f);
370			break;
371#endif
372		case 'd': case 'i': case 'o': case 'u': case 'x': case 'p':
373			l = fprintf(f, charfmt, w, p, arg.i);
374			break;
375		}
376#endif
377	}
378
379	if (f) return cnt;
380	if (!l10n) return 0;
381
382	for (i=1; i<=NL_ARGMAX && nl_type[i]; i++)
383		pop_arg(nl_arg+i, nl_type[i], ap);
384	for (; i<=NL_ARGMAX && !nl_type[i]; i++);
385	if (i<=NL_ARGMAX) return -1;
386	return 1;
387
388inval:
389	errno = EINVAL;
390	return -1;
391overflow:
392	errno = EOVERFLOW;
393	return -1;
394}
395
396int vfwprintf(FILE *restrict f, const wchar_t *restrict fmt, va_list ap)
397{
398	va_list ap2;
399	int nl_type[NL_ARGMAX+1] = {0};
400	union arg nl_arg[NL_ARGMAX+1];
401	int olderr;
402	int ret;
403
404	/* the copy allows passing va_list* even if va_list is an array */
405	va_copy(ap2, ap);
406	if (wprintf_core(0, fmt, &ap2, nl_arg, nl_type) < 0) {
407		va_end(ap2);
408		return -1;
409	}
410
411	FLOCK(f);
412	fwide(f, 1);
413	olderr = f->flags & F_ERR;
414	f->flags &= ~F_ERR;
415	ret = wprintf_core(f, fmt, &ap2, nl_arg, nl_type);
416	if (ferror(f)) ret = -1;
417	f->flags |= olderr;
418	FUNLOCK(f);
419	va_end(ap2);
420	return ret;
421}