434
|
/* Formatted output to strings.
   Copyright (C) 1999-2000, 2002-2003, 2006-2010 Free Software Foundation, Inc.

   This program is free software; you can redistribute it and/or modify
   it under the terms of the GNU General Public License as published by
   the Free Software Foundation; either version 3, or (at your option)
   any later version.

   This program is distributed in the hope that it will be useful,
   but WITHOUT ANY WARRANTY; without even the implied warranty of
   MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
   GNU General Public License for more details.

   You should have received a copy of the GNU General Public License along
   with this program; if not, write to the Free Software Foundation,
   Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301, USA.  */
|
|
17
|
|
/* This file can be parametrized with the following macros:
     CHAR_T             The element type of the format string.
     CHAR_T_ONLY_ASCII  Set to 1 to enable verification that all characters
                        in the format string are ASCII.
     DIRECTIVE          Structure denoting a format directive.
                        Depends on CHAR_T.
     DIRECTIVES         Structure denoting the set of format directives of a
                        format string.  Depends on CHAR_T.
     PRINTF_PARSE       Function that parses a format string.
                        Depends on CHAR_T.
     STATIC             Set to 'static' to declare the function static.
     ENABLE_UNISTDIO    Set to 1 to enable the unistdio extensions.  */
|
|
30
|
|
31 #ifndef PRINTF_PARSE
|
|
32 # include <config.h>
|
|
33 #endif
|
|
34
|
|
35 /* Specification. */
|
|
36 #ifndef PRINTF_PARSE
|
|
37 # include "printf-parse.h"
|
|
38 #endif
|
|
39
|
|
40 /* Default parameters. */
|
|
41 #ifndef PRINTF_PARSE
|
|
42 # define PRINTF_PARSE printf_parse
|
|
43 # define CHAR_T char
|
|
44 # define DIRECTIVE char_directive
|
|
45 # define DIRECTIVES char_directives
|
|
46 #endif
|
|
47
|
|
48 /* Get size_t, NULL. */
|
|
49 #include <stddef.h>
|
|
50
|
|
51 /* Get intmax_t. */
|
|
52 #if defined IN_LIBINTL || defined IN_LIBASPRINTF
|
|
53 # if HAVE_STDINT_H_WITH_UINTMAX
|
|
54 # include <stdint.h>
|
|
55 # endif
|
|
56 # if HAVE_INTTYPES_H_WITH_UINTMAX
|
|
57 # include <inttypes.h>
|
|
58 # endif
|
|
59 #else
|
|
60 # include <stdint.h>
|
|
61 #endif
|
|
62
|
|
63 /* malloc(), realloc(), free(). */
|
|
64 #include <stdlib.h>
|
|
65
|
|
66 /* errno. */
|
|
67 #include <errno.h>
|
|
68
|
|
69 /* Checked size_t computations. */
|
|
70 #include "xsize.h"
|
|
71
|
|
72 #if CHAR_T_ONLY_ASCII
|
|
73 /* c_isascii(). */
|
|
74 # include "c-ctype.h"
|
|
75 #endif
|
|
76
|
|
77 #ifdef STATIC
|
|
78 STATIC
|
|
79 #endif
|
|
80 int
|
|
81 PRINTF_PARSE (const CHAR_T *format, DIRECTIVES *d, arguments *a)
|
|
82 {
|
|
83 const CHAR_T *cp = format; /* pointer into format */
|
|
84 size_t arg_posn = 0; /* number of regular arguments consumed */
|
|
85 size_t d_allocated; /* allocated elements of d->dir */
|
|
86 size_t a_allocated; /* allocated elements of a->arg */
|
|
87 size_t max_width_length = 0;
|
|
88 size_t max_precision_length = 0;
|
|
89
|
|
90 d->count = 0;
|
|
91 d_allocated = 1;
|
|
92 d->dir = (DIRECTIVE *) malloc (d_allocated * sizeof (DIRECTIVE));
|
|
93 if (d->dir == NULL)
|
|
94 /* Out of memory. */
|
|
95 goto out_of_memory_1;
|
|
96
|
|
97 a->count = 0;
|
|
98 a_allocated = 0;
|
|
99 a->arg = NULL;
|
|
100
|
|
101 #define REGISTER_ARG(_index_,_type_) \
|
|
102 { \
|
|
103 size_t n = (_index_); \
|
|
104 if (n >= a_allocated) \
|
|
105 { \
|
|
106 size_t memory_size; \
|
|
107 argument *memory; \
|
|
108 \
|
|
109 a_allocated = xtimes (a_allocated, 2); \
|
|
110 if (a_allocated <= n) \
|
|
111 a_allocated = xsum (n, 1); \
|
|
112 memory_size = xtimes (a_allocated, sizeof (argument)); \
|
|
113 if (size_overflow_p (memory_size)) \
|
|
114 /* Overflow, would lead to out of memory. */ \
|
|
115 goto out_of_memory; \
|
|
116 memory = (argument *) (a->arg \
|
|
117 ? realloc (a->arg, memory_size) \
|
|
118 : malloc (memory_size)); \
|
|
119 if (memory == NULL) \
|
|
120 /* Out of memory. */ \
|
|
121 goto out_of_memory; \
|
|
122 a->arg = memory; \
|
|
123 } \
|
|
124 while (a->count <= n) \
|
|
125 a->arg[a->count++].type = TYPE_NONE; \
|
|
126 if (a->arg[n].type == TYPE_NONE) \
|
|
127 a->arg[n].type = (_type_); \
|
|
128 else if (a->arg[n].type != (_type_)) \
|
|
129 /* Ambiguous type for positional argument. */ \
|
|
130 goto error; \
|
|
131 }
|
|
132
|
|
133 while (*cp != '\0')
|
|
134 {
|
|
135 CHAR_T c = *cp++;
|
|
136 if (c == '%')
|
|
137 {
|
|
138 size_t arg_index = ARG_NONE;
|
|
139 DIRECTIVE *dp = &d->dir[d->count]; /* pointer to next directive */
|
|
140
|
|
141 /* Initialize the next directive. */
|
|
142 dp->dir_start = cp - 1;
|
|
143 dp->flags = 0;
|
|
144 dp->width_start = NULL;
|
|
145 dp->width_end = NULL;
|
|
146 dp->width_arg_index = ARG_NONE;
|
|
147 dp->precision_start = NULL;
|
|
148 dp->precision_end = NULL;
|
|
149 dp->precision_arg_index = ARG_NONE;
|
|
150 dp->arg_index = ARG_NONE;
|
|
151
|
|
152 /* Test for positional argument. */
|
|
153 if (*cp >= '0' && *cp <= '9')
|
|
154 {
|
|
155 const CHAR_T *np;
|
|
156
|
|
157 for (np = cp; *np >= '0' && *np <= '9'; np++)
|
|
158 ;
|
|
159 if (*np == '$')
|
|
160 {
|
|
161 size_t n = 0;
|
|
162
|
|
163 for (np = cp; *np >= '0' && *np <= '9'; np++)
|
|
164 n = xsum (xtimes (n, 10), *np - '0');
|
|
165 if (n == 0)
|
|
166 /* Positional argument 0. */
|
|
167 goto error;
|
|
168 if (size_overflow_p (n))
|
|
169 /* n too large, would lead to out of memory later. */
|
|
170 goto error;
|
|
171 arg_index = n - 1;
|
|
172 cp = np + 1;
|
|
173 }
|
|
174 }
|
|
175
|
|
176 /* Read the flags. */
|
|
177 for (;;)
|
|
178 {
|
|
179 if (*cp == '\'')
|
|
180 {
|
|
181 dp->flags |= FLAG_GROUP;
|
|
182 cp++;
|
|
183 }
|
|
184 else if (*cp == '-')
|
|
185 {
|
|
186 dp->flags |= FLAG_LEFT;
|
|
187 cp++;
|
|
188 }
|
|
189 else if (*cp == '+')
|
|
190 {
|
|
191 dp->flags |= FLAG_SHOWSIGN;
|
|
192 cp++;
|
|
193 }
|
|
194 else if (*cp == ' ')
|
|
195 {
|
|
196 dp->flags |= FLAG_SPACE;
|
|
197 cp++;
|
|
198 }
|
|
199 else if (*cp == '#')
|
|
200 {
|
|
201 dp->flags |= FLAG_ALT;
|
|
202 cp++;
|
|
203 }
|
|
204 else if (*cp == '0')
|
|
205 {
|
|
206 dp->flags |= FLAG_ZERO;
|
|
207 cp++;
|
|
208 }
|
|
209 else
|
|
210 break;
|
|
211 }
|
|
212
|
|
213 /* Parse the field width. */
|
|
214 if (*cp == '*')
|
|
215 {
|
|
216 dp->width_start = cp;
|
|
217 cp++;
|
|
218 dp->width_end = cp;
|
|
219 if (max_width_length < 1)
|
|
220 max_width_length = 1;
|
|
221
|
|
222 /* Test for positional argument. */
|
|
223 if (*cp >= '0' && *cp <= '9')
|
|
224 {
|
|
225 const CHAR_T *np;
|
|
226
|
|
227 for (np = cp; *np >= '0' && *np <= '9'; np++)
|
|
228 ;
|
|
229 if (*np == '$')
|
|
230 {
|
|
231 size_t n = 0;
|
|
232
|
|
233 for (np = cp; *np >= '0' && *np <= '9'; np++)
|
|
234 n = xsum (xtimes (n, 10), *np - '0');
|
|
235 if (n == 0)
|
|
236 /* Positional argument 0. */
|
|
237 goto error;
|
|
238 if (size_overflow_p (n))
|
|
239 /* n too large, would lead to out of memory later. */
|
|
240 goto error;
|
|
241 dp->width_arg_index = n - 1;
|
|
242 cp = np + 1;
|
|
243 }
|
|
244 }
|
|
245 if (dp->width_arg_index == ARG_NONE)
|
|
246 {
|
|
247 dp->width_arg_index = arg_posn++;
|
|
248 if (dp->width_arg_index == ARG_NONE)
|
|
249 /* arg_posn wrapped around. */
|
|
250 goto error;
|
|
251 }
|
|
252 REGISTER_ARG (dp->width_arg_index, TYPE_INT);
|
|
253 }
|
|
254 else if (*cp >= '0' && *cp <= '9')
|
|
255 {
|
|
256 size_t width_length;
|
|
257
|
|
258 dp->width_start = cp;
|
|
259 for (; *cp >= '0' && *cp <= '9'; cp++)
|
|
260 ;
|
|
261 dp->width_end = cp;
|
|
262 width_length = dp->width_end - dp->width_start;
|
|
263 if (max_width_length < width_length)
|
|
264 max_width_length = width_length;
|
|
265 }
|
|
266
|
|
267 /* Parse the precision. */
|
|
268 if (*cp == '.')
|
|
269 {
|
|
270 cp++;
|
|
271 if (*cp == '*')
|
|
272 {
|
|
273 dp->precision_start = cp - 1;
|
|
274 cp++;
|
|
275 dp->precision_end = cp;
|
|
276 if (max_precision_length < 2)
|
|
277 max_precision_length = 2;
|
|
278
|
|
279 /* Test for positional argument. */
|
|
280 if (*cp >= '0' && *cp <= '9')
|
|
281 {
|
|
282 const CHAR_T *np;
|
|
283
|
|
284 for (np = cp; *np >= '0' && *np <= '9'; np++)
|
|
285 ;
|
|
286 if (*np == '$')
|
|
287 {
|
|
288 size_t n = 0;
|
|
289
|
|
290 for (np = cp; *np >= '0' && *np <= '9'; np++)
|
|
291 n = xsum (xtimes (n, 10), *np - '0');
|
|
292 if (n == 0)
|
|
293 /* Positional argument 0. */
|
|
294 goto error;
|
|
295 if (size_overflow_p (n))
|
|
296 /* n too large, would lead to out of memory
|
|
297 later. */
|
|
298 goto error;
|
|
299 dp->precision_arg_index = n - 1;
|
|
300 cp = np + 1;
|
|
301 }
|
|
302 }
|
|
303 if (dp->precision_arg_index == ARG_NONE)
|
|
304 {
|
|
305 dp->precision_arg_index = arg_posn++;
|
|
306 if (dp->precision_arg_index == ARG_NONE)
|
|
307 /* arg_posn wrapped around. */
|
|
308 goto error;
|
|
309 }
|
|
310 REGISTER_ARG (dp->precision_arg_index, TYPE_INT);
|
|
311 }
|
|
312 else
|
|
313 {
|
|
314 size_t precision_length;
|
|
315
|
|
316 dp->precision_start = cp - 1;
|
|
317 for (; *cp >= '0' && *cp <= '9'; cp++)
|
|
318 ;
|
|
319 dp->precision_end = cp;
|
|
320 precision_length = dp->precision_end - dp->precision_start;
|
|
321 if (max_precision_length < precision_length)
|
|
322 max_precision_length = precision_length;
|
|
323 }
|
|
324 }
|
|
325
|
|
326 {
|
|
327 arg_type type;
|
|
328
|
|
329 /* Parse argument type/size specifiers. */
|
|
330 {
|
|
331 int flags = 0;
|
|
332
|
|
333 for (;;)
|
|
334 {
|
|
335 if (*cp == 'h')
|
|
336 {
|
|
337 flags |= (1 << (flags & 1));
|
|
338 cp++;
|
|
339 }
|
|
340 else if (*cp == 'L')
|
|
341 {
|
|
342 flags |= 4;
|
|
343 cp++;
|
|
344 }
|
|
345 else if (*cp == 'l')
|
|
346 {
|
|
347 flags += 8;
|
|
348 cp++;
|
|
349 }
|
|
350 else if (*cp == 'j')
|
|
351 {
|
|
352 if (sizeof (intmax_t) > sizeof (long))
|
|
353 {
|
|
354 /* intmax_t = long long */
|
|
355 flags += 16;
|
|
356 }
|
|
357 else if (sizeof (intmax_t) > sizeof (int))
|
|
358 {
|
|
359 /* intmax_t = long */
|
|
360 flags += 8;
|
|
361 }
|
|
362 cp++;
|
|
363 }
|
|
364 else if (*cp == 'z' || *cp == 'Z')
|
|
365 {
|
|
366 /* 'z' is standardized in ISO C 99, but glibc uses 'Z'
|
|
367 because the warning facility in gcc-2.95.2 understands
|
|
368 only 'Z' (see gcc-2.95.2/gcc/c-common.c:1784). */
|
|
369 if (sizeof (size_t) > sizeof (long))
|
|
370 {
|
|
371 /* size_t = long long */
|
|
372 flags += 16;
|
|
373 }
|
|
374 else if (sizeof (size_t) > sizeof (int))
|
|
375 {
|
|
376 /* size_t = long */
|
|
377 flags += 8;
|
|
378 }
|
|
379 cp++;
|
|
380 }
|
|
381 else if (*cp == 't')
|
|
382 {
|
|
383 if (sizeof (ptrdiff_t) > sizeof (long))
|
|
384 {
|
|
385 /* ptrdiff_t = long long */
|
|
386 flags += 16;
|
|
387 }
|
|
388 else if (sizeof (ptrdiff_t) > sizeof (int))
|
|
389 {
|
|
390 /* ptrdiff_t = long */
|
|
391 flags += 8;
|
|
392 }
|
|
393 cp++;
|
|
394 }
|
|
395 #if defined __APPLE__ && defined __MACH__
|
|
396 /* On MacOS X 10.3, PRIdMAX is defined as "qd".
|
|
397 We cannot change it to "lld" because PRIdMAX must also
|
|
398 be understood by the system's printf routines. */
|
|
399 else if (*cp == 'q')
|
|
400 {
|
|
401 if (64 / 8 > sizeof (long))
|
|
402 {
|
|
403 /* int64_t = long long */
|
|
404 flags += 16;
|
|
405 }
|
|
406 else
|
|
407 {
|
|
408 /* int64_t = long */
|
|
409 flags += 8;
|
|
410 }
|
|
411 cp++;
|
|
412 }
|
|
413 #endif
|
|
414 #if (defined _WIN32 || defined __WIN32__) && ! defined __CYGWIN__
|
|
415 /* On native Win32, PRIdMAX is defined as "I64d".
|
|
416 We cannot change it to "lld" because PRIdMAX must also
|
|
417 be understood by the system's printf routines. */
|
|
418 else if (*cp == 'I' && cp[1] == '6' && cp[2] == '4')
|
|
419 {
|
|
420 if (64 / 8 > sizeof (long))
|
|
421 {
|
|
422 /* __int64 = long long */
|
|
423 flags += 16;
|
|
424 }
|
|
425 else
|
|
426 {
|
|
427 /* __int64 = long */
|
|
428 flags += 8;
|
|
429 }
|
|
430 cp += 3;
|
|
431 }
|
|
432 #endif
|
|
433 else
|
|
434 break;
|
|
435 }
|
|
436
|
|
437 /* Read the conversion character. */
|
|
438 c = *cp++;
|
|
439 switch (c)
|
|
440 {
|
|
441 case 'd': case 'i':
|
|
442 #if HAVE_LONG_LONG_INT
|
|
443 /* If 'long long' exists and is larger than 'long': */
|
|
444 if (flags >= 16 || (flags & 4))
|
|
445 type = TYPE_LONGLONGINT;
|
|
446 else
|
|
447 #endif
|
|
448 /* If 'long long' exists and is the same as 'long', we parse
|
|
449 "lld" into TYPE_LONGINT. */
|
|
450 if (flags >= 8)
|
|
451 type = TYPE_LONGINT;
|
|
452 else if (flags & 2)
|
|
453 type = TYPE_SCHAR;
|
|
454 else if (flags & 1)
|
|
455 type = TYPE_SHORT;
|
|
456 else
|
|
457 type = TYPE_INT;
|
|
458 break;
|
|
459 case 'o': case 'u': case 'x': case 'X':
|
|
460 #if HAVE_LONG_LONG_INT
|
|
461 /* If 'long long' exists and is larger than 'long': */
|
|
462 if (flags >= 16 || (flags & 4))
|
|
463 type = TYPE_ULONGLONGINT;
|
|
464 else
|
|
465 #endif
|
|
466 /* If 'unsigned long long' exists and is the same as
|
|
467 'unsigned long', we parse "llu" into TYPE_ULONGINT. */
|
|
468 if (flags >= 8)
|
|
469 type = TYPE_ULONGINT;
|
|
470 else if (flags & 2)
|
|
471 type = TYPE_UCHAR;
|
|
472 else if (flags & 1)
|
|
473 type = TYPE_USHORT;
|
|
474 else
|
|
475 type = TYPE_UINT;
|
|
476 break;
|
|
477 case 'f': case 'F': case 'e': case 'E': case 'g': case 'G':
|
|
478 case 'a': case 'A':
|
|
479 if (flags >= 16 || (flags & 4))
|
|
480 type = TYPE_LONGDOUBLE;
|
|
481 else
|
|
482 type = TYPE_DOUBLE;
|
|
483 break;
|
|
484 case 'c':
|
|
485 if (flags >= 8)
|
|
486 #if HAVE_WINT_T
|
|
487 type = TYPE_WIDE_CHAR;
|
|
488 #else
|
|
489 goto error;
|
|
490 #endif
|
|
491 else
|
|
492 type = TYPE_CHAR;
|
|
493 break;
|
|
494 #if HAVE_WINT_T
|
|
495 case 'C':
|
|
496 type = TYPE_WIDE_CHAR;
|
|
497 c = 'c';
|
|
498 break;
|
|
499 #endif
|
|
500 case 's':
|
|
501 if (flags >= 8)
|
|
502 #if HAVE_WCHAR_T
|
|
503 type = TYPE_WIDE_STRING;
|
|
504 #else
|
|
505 goto error;
|
|
506 #endif
|
|
507 else
|
|
508 type = TYPE_STRING;
|
|
509 break;
|
|
510 #if HAVE_WCHAR_T
|
|
511 case 'S':
|
|
512 type = TYPE_WIDE_STRING;
|
|
513 c = 's';
|
|
514 break;
|
|
515 #endif
|
|
516 case 'p':
|
|
517 type = TYPE_POINTER;
|
|
518 break;
|
|
519 case 'n':
|
|
520 #if HAVE_LONG_LONG_INT
|
|
521 /* If 'long long' exists and is larger than 'long': */
|
|
522 if (flags >= 16 || (flags & 4))
|
|
523 type = TYPE_COUNT_LONGLONGINT_POINTER;
|
|
524 else
|
|
525 #endif
|
|
526 /* If 'long long' exists and is the same as 'long', we parse
|
|
527 "lln" into TYPE_COUNT_LONGINT_POINTER. */
|
|
528 if (flags >= 8)
|
|
529 type = TYPE_COUNT_LONGINT_POINTER;
|
|
530 else if (flags & 2)
|
|
531 type = TYPE_COUNT_SCHAR_POINTER;
|
|
532 else if (flags & 1)
|
|
533 type = TYPE_COUNT_SHORT_POINTER;
|
|
534 else
|
|
535 type = TYPE_COUNT_INT_POINTER;
|
|
536 break;
|
|
537 #if ENABLE_UNISTDIO
|
|
538 /* The unistdio extensions. */
|
|
539 case 'U':
|
|
540 if (flags >= 16)
|
|
541 type = TYPE_U32_STRING;
|
|
542 else if (flags >= 8)
|
|
543 type = TYPE_U16_STRING;
|
|
544 else
|
|
545 type = TYPE_U8_STRING;
|
|
546 break;
|
|
547 #endif
|
|
548 case '%':
|
|
549 type = TYPE_NONE;
|
|
550 break;
|
|
551 default:
|
|
552 /* Unknown conversion character. */
|
|
553 goto error;
|
|
554 }
|
|
555 }
|
|
556
|
|
557 if (type != TYPE_NONE)
|
|
558 {
|
|
559 dp->arg_index = arg_index;
|
|
560 if (dp->arg_index == ARG_NONE)
|
|
561 {
|
|
562 dp->arg_index = arg_posn++;
|
|
563 if (dp->arg_index == ARG_NONE)
|
|
564 /* arg_posn wrapped around. */
|
|
565 goto error;
|
|
566 }
|
|
567 REGISTER_ARG (dp->arg_index, type);
|
|
568 }
|
|
569 dp->conversion = c;
|
|
570 dp->dir_end = cp;
|
|
571 }
|
|
572
|
|
573 d->count++;
|
|
574 if (d->count >= d_allocated)
|
|
575 {
|
|
576 size_t memory_size;
|
|
577 DIRECTIVE *memory;
|
|
578
|
|
579 d_allocated = xtimes (d_allocated, 2);
|
|
580 memory_size = xtimes (d_allocated, sizeof (DIRECTIVE));
|
|
581 if (size_overflow_p (memory_size))
|
|
582 /* Overflow, would lead to out of memory. */
|
|
583 goto out_of_memory;
|
|
584 memory = (DIRECTIVE *) realloc (d->dir, memory_size);
|
|
585 if (memory == NULL)
|
|
586 /* Out of memory. */
|
|
587 goto out_of_memory;
|
|
588 d->dir = memory;
|
|
589 }
|
|
590 }
|
|
591 #if CHAR_T_ONLY_ASCII
|
|
592 else if (!c_isascii (c))
|
|
593 {
|
|
594 /* Non-ASCII character. Not supported. */
|
|
595 goto error;
|
|
596 }
|
|
597 #endif
|
|
598 }
|
|
599 d->dir[d->count].dir_start = cp;
|
|
600
|
|
601 d->max_width_length = max_width_length;
|
|
602 d->max_precision_length = max_precision_length;
|
|
603 return 0;
|
|
604
|
|
605 error:
|
|
606 if (a->arg)
|
|
607 free (a->arg);
|
|
608 if (d->dir)
|
|
609 free (d->dir);
|
|
610 errno = EINVAL;
|
|
611 return -1;
|
|
612
|
|
613 out_of_memory:
|
|
614 if (a->arg)
|
|
615 free (a->arg);
|
|
616 if (d->dir)
|
|
617 free (d->dir);
|
|
618 out_of_memory_1:
|
|
619 errno = ENOMEM;
|
|
620 return -1;
|
|
621 }
|
|
622
|
|
623 #undef PRINTF_PARSE
|
|
624 #undef DIRECTIVES
|
|
625 #undef DIRECTIVE
|
|
626 #undef CHAR_T_ONLY_ASCII
|
|
627 #undef CHAR_T
|