printf-parse.c 12 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455456457458459460461462463464465466467468469470471472473474475476477478479480481482483484485486487488489490491492493494495496497498499500501502503504505506507508509510511512513514515516517518519520521522523524525526527528529530531532533534535536537538539540541542543544
  1. /* Formatted output to strings.
  2. Copyright (C) 1999-2000, 2002-2003, 2006 Free Software Foundation, Inc.
  3. This program is free software; you can redistribute it and/or modify it
  4. under the terms of the GNU Library General Public License as published
  5. by the Free Software Foundation; either version 2, or (at your option)
  6. any later version.
  7. This program is distributed in the hope that it will be useful,
  8. but WITHOUT ANY WARRANTY; without even the implied warranty of
  9. MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
  10. Library General Public License for more details.
  11. You should have received a copy of the GNU Library General Public
  12. License along with this program; if not, write to the Free Software
  13. Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301,
  14. USA. */
  15. #include <config.h>
  16. /* Specification. */
  17. #if WIDE_CHAR_VERSION
  18. # include "wprintf-parse.h"
  19. #else
  20. # include "printf-parse.h"
  21. #endif
  22. /* Get size_t, NULL. */
  23. #include <stddef.h>
  24. /* Get intmax_t. */
  25. #if HAVE_STDINT_H_WITH_UINTMAX
  26. # include <stdint.h>
  27. #endif
  28. #if HAVE_INTTYPES_H_WITH_UINTMAX
  29. # include <inttypes.h>
  30. #endif
  31. /* malloc(), realloc(), free(). */
  32. #include <stdlib.h>
  33. /* Checked size_t computations. */
  34. #include "xsize.h"
  35. #if WIDE_CHAR_VERSION
  36. # define PRINTF_PARSE wprintf_parse
  37. # define CHAR_T wchar_t
  38. # define DIRECTIVE wchar_t_directive
  39. # define DIRECTIVES wchar_t_directives
  40. #else
  41. # define PRINTF_PARSE printf_parse
  42. # define CHAR_T char
  43. # define DIRECTIVE char_directive
  44. # define DIRECTIVES char_directives
  45. #endif
  46. #ifdef STATIC
  47. STATIC
  48. #endif
  49. int
  50. PRINTF_PARSE (const CHAR_T *format, DIRECTIVES *d, arguments *a)
  51. {
  52. const CHAR_T *cp = format; /* pointer into format */
  53. size_t arg_posn = 0; /* number of regular arguments consumed */
  54. size_t d_allocated; /* allocated elements of d->dir */
  55. size_t a_allocated; /* allocated elements of a->arg */
  56. size_t max_width_length = 0;
  57. size_t max_precision_length = 0;
  58. d->count = 0;
  59. d_allocated = 1;
  60. d->dir = malloc (d_allocated * sizeof (DIRECTIVE));
  61. if (d->dir == NULL)
  62. /* Out of memory. */
  63. return -1;
  64. a->count = 0;
  65. a_allocated = 0;
  66. a->arg = NULL;
  67. #define REGISTER_ARG(_index_,_type_) \
  68. { \
  69. size_t n = (_index_); \
  70. if (n >= a_allocated) \
  71. { \
  72. size_t memory_size; \
  73. argument *memory; \
  74. \
  75. a_allocated = xtimes (a_allocated, 2); \
  76. if (a_allocated <= n) \
  77. a_allocated = xsum (n, 1); \
  78. memory_size = xtimes (a_allocated, sizeof (argument)); \
  79. if (size_overflow_p (memory_size)) \
  80. /* Overflow, would lead to out of memory. */ \
  81. goto error; \
  82. memory = (a->arg \
  83. ? realloc (a->arg, memory_size) \
  84. : malloc (memory_size)); \
  85. if (memory == NULL) \
  86. /* Out of memory. */ \
  87. goto error; \
  88. a->arg = memory; \
  89. } \
  90. while (a->count <= n) \
  91. a->arg[a->count++].type = TYPE_NONE; \
  92. if (a->arg[n].type == TYPE_NONE) \
  93. a->arg[n].type = (_type_); \
  94. else if (a->arg[n].type != (_type_)) \
  95. /* Ambiguous type for positional argument. */ \
  96. goto error; \
  97. }
  98. while (*cp != '\0')
  99. {
  100. CHAR_T c = *cp++;
  101. if (c == '%')
  102. {
  103. size_t arg_index = ARG_NONE;
  104. DIRECTIVE *dp = &d->dir[d->count];/* pointer to next directive */
  105. /* Initialize the next directive. */
  106. dp->dir_start = cp - 1;
  107. dp->flags = 0;
  108. dp->width_start = NULL;
  109. dp->width_end = NULL;
  110. dp->width_arg_index = ARG_NONE;
  111. dp->precision_start = NULL;
  112. dp->precision_end = NULL;
  113. dp->precision_arg_index = ARG_NONE;
  114. dp->arg_index = ARG_NONE;
  115. /* Test for positional argument. */
  116. if (*cp >= '0' && *cp <= '9')
  117. {
  118. const CHAR_T *np;
  119. for (np = cp; *np >= '0' && *np <= '9'; np++)
  120. ;
  121. if (*np == '$')
  122. {
  123. size_t n = 0;
  124. for (np = cp; *np >= '0' && *np <= '9'; np++)
  125. n = xsum (xtimes (n, 10), *np - '0');
  126. if (n == 0)
  127. /* Positional argument 0. */
  128. goto error;
  129. if (size_overflow_p (n))
  130. /* n too large, would lead to out of memory later. */
  131. goto error;
  132. arg_index = n - 1;
  133. cp = np + 1;
  134. }
  135. }
  136. /* Read the flags. */
  137. for (;;)
  138. {
  139. if (*cp == '\'')
  140. {
  141. dp->flags |= FLAG_GROUP;
  142. cp++;
  143. }
  144. else if (*cp == '-')
  145. {
  146. dp->flags |= FLAG_LEFT;
  147. cp++;
  148. }
  149. else if (*cp == '+')
  150. {
  151. dp->flags |= FLAG_SHOWSIGN;
  152. cp++;
  153. }
  154. else if (*cp == ' ')
  155. {
  156. dp->flags |= FLAG_SPACE;
  157. cp++;
  158. }
  159. else if (*cp == '#')
  160. {
  161. dp->flags |= FLAG_ALT;
  162. cp++;
  163. }
  164. else if (*cp == '0')
  165. {
  166. dp->flags |= FLAG_ZERO;
  167. cp++;
  168. }
  169. else
  170. break;
  171. }
  172. /* Parse the field width. */
  173. if (*cp == '*')
  174. {
  175. dp->width_start = cp;
  176. cp++;
  177. dp->width_end = cp;
  178. if (max_width_length < 1)
  179. max_width_length = 1;
  180. /* Test for positional argument. */
  181. if (*cp >= '0' && *cp <= '9')
  182. {
  183. const CHAR_T *np;
  184. for (np = cp; *np >= '0' && *np <= '9'; np++)
  185. ;
  186. if (*np == '$')
  187. {
  188. size_t n = 0;
  189. for (np = cp; *np >= '0' && *np <= '9'; np++)
  190. n = xsum (xtimes (n, 10), *np - '0');
  191. if (n == 0)
  192. /* Positional argument 0. */
  193. goto error;
  194. if (size_overflow_p (n))
  195. /* n too large, would lead to out of memory later. */
  196. goto error;
  197. dp->width_arg_index = n - 1;
  198. cp = np + 1;
  199. }
  200. }
  201. if (dp->width_arg_index == ARG_NONE)
  202. {
  203. dp->width_arg_index = arg_posn++;
  204. if (dp->width_arg_index == ARG_NONE)
  205. /* arg_posn wrapped around. */
  206. goto error;
  207. }
  208. REGISTER_ARG (dp->width_arg_index, TYPE_INT);
  209. }
  210. else if (*cp >= '0' && *cp <= '9')
  211. {
  212. size_t width_length;
  213. dp->width_start = cp;
  214. for (; *cp >= '0' && *cp <= '9'; cp++)
  215. ;
  216. dp->width_end = cp;
  217. width_length = dp->width_end - dp->width_start;
  218. if (max_width_length < width_length)
  219. max_width_length = width_length;
  220. }
  221. /* Parse the precision. */
  222. if (*cp == '.')
  223. {
  224. cp++;
  225. if (*cp == '*')
  226. {
  227. dp->precision_start = cp - 1;
  228. cp++;
  229. dp->precision_end = cp;
  230. if (max_precision_length < 2)
  231. max_precision_length = 2;
  232. /* Test for positional argument. */
  233. if (*cp >= '0' && *cp <= '9')
  234. {
  235. const CHAR_T *np;
  236. for (np = cp; *np >= '0' && *np <= '9'; np++)
  237. ;
  238. if (*np == '$')
  239. {
  240. size_t n = 0;
  241. for (np = cp; *np >= '0' && *np <= '9'; np++)
  242. n = xsum (xtimes (n, 10), *np - '0');
  243. if (n == 0)
  244. /* Positional argument 0. */
  245. goto error;
  246. if (size_overflow_p (n))
  247. /* n too large, would lead to out of memory
  248. later. */
  249. goto error;
  250. dp->precision_arg_index = n - 1;
  251. cp = np + 1;
  252. }
  253. }
  254. if (dp->precision_arg_index == ARG_NONE)
  255. {
  256. dp->precision_arg_index = arg_posn++;
  257. if (dp->precision_arg_index == ARG_NONE)
  258. /* arg_posn wrapped around. */
  259. goto error;
  260. }
  261. REGISTER_ARG (dp->precision_arg_index, TYPE_INT);
  262. }
  263. else
  264. {
  265. size_t precision_length;
  266. dp->precision_start = cp - 1;
  267. for (; *cp >= '0' && *cp <= '9'; cp++)
  268. ;
  269. dp->precision_end = cp;
  270. precision_length = dp->precision_end - dp->precision_start;
  271. if (max_precision_length < precision_length)
  272. max_precision_length = precision_length;
  273. }
  274. }
  275. {
  276. arg_type type;
  277. /* Parse argument type/size specifiers. */
  278. {
  279. int flags = 0;
  280. for (;;)
  281. {
  282. if (*cp == 'h')
  283. {
  284. flags |= (1 << (flags & 1));
  285. cp++;
  286. }
  287. else if (*cp == 'L')
  288. {
  289. flags |= 4;
  290. cp++;
  291. }
  292. else if (*cp == 'l')
  293. {
  294. flags += 8;
  295. cp++;
  296. }
  297. #ifdef HAVE_INTMAX_T
  298. else if (*cp == 'j')
  299. {
  300. if (sizeof (intmax_t) > sizeof (long))
  301. {
  302. /* intmax_t = long long */
  303. flags += 16;
  304. }
  305. else if (sizeof (intmax_t) > sizeof (int))
  306. {
  307. /* intmax_t = long */
  308. flags += 8;
  309. }
  310. cp++;
  311. }
  312. #endif
  313. else if (*cp == 'z' || *cp == 'Z')
  314. {
  315. /* 'z' is standardized in ISO C 99, but glibc uses 'Z'
  316. because the warning facility in gcc-2.95.2 understands
  317. only 'Z' (see gcc-2.95.2/gcc/c-common.c:1784). */
  318. if (sizeof (size_t) > sizeof (long))
  319. {
  320. /* size_t = long long */
  321. flags += 16;
  322. }
  323. else if (sizeof (size_t) > sizeof (int))
  324. {
  325. /* size_t = long */
  326. flags += 8;
  327. }
  328. cp++;
  329. }
  330. else if (*cp == 't')
  331. {
  332. if (sizeof (ptrdiff_t) > sizeof (long))
  333. {
  334. /* ptrdiff_t = long long */
  335. flags += 16;
  336. }
  337. else if (sizeof (ptrdiff_t) > sizeof (int))
  338. {
  339. /* ptrdiff_t = long */
  340. flags += 8;
  341. }
  342. cp++;
  343. }
  344. else
  345. break;
  346. }
  347. /* Read the conversion character. */
  348. c = *cp++;
  349. switch (c)
  350. {
  351. case 'd': case 'i':
  352. #ifdef HAVE_LONG_LONG_INT
  353. /* If 'long long' exists and is larger than 'long': */
  354. if (flags >= 16 || (flags & 4))
  355. type = TYPE_LONGLONGINT;
  356. else
  357. #endif
  358. /* If 'long long' exists and is the same as 'long', we parse
  359. "lld" into TYPE_LONGINT. */
  360. if (flags >= 8)
  361. type = TYPE_LONGINT;
  362. else if (flags & 2)
  363. type = TYPE_SCHAR;
  364. else if (flags & 1)
  365. type = TYPE_SHORT;
  366. else
  367. type = TYPE_INT;
  368. break;
  369. case 'o': case 'u': case 'x': case 'X':
  370. #ifdef HAVE_LONG_LONG_INT
  371. /* If 'long long' exists and is larger than 'long': */
  372. if (flags >= 16 || (flags & 4))
  373. type = TYPE_ULONGLONGINT;
  374. else
  375. #endif
  376. /* If 'unsigned long long' exists and is the same as
  377. 'unsigned long', we parse "llu" into TYPE_ULONGINT. */
  378. if (flags >= 8)
  379. type = TYPE_ULONGINT;
  380. else if (flags & 2)
  381. type = TYPE_UCHAR;
  382. else if (flags & 1)
  383. type = TYPE_USHORT;
  384. else
  385. type = TYPE_UINT;
  386. break;
  387. case 'f': case 'F': case 'e': case 'E': case 'g': case 'G':
  388. case 'a': case 'A':
  389. #ifdef HAVE_LONG_DOUBLE
  390. if (flags >= 16 || (flags & 4))
  391. type = TYPE_LONGDOUBLE;
  392. else
  393. #endif
  394. type = TYPE_DOUBLE;
  395. break;
  396. case 'c':
  397. if (flags >= 8)
  398. #ifdef HAVE_WINT_T
  399. type = TYPE_WIDE_CHAR;
  400. #else
  401. goto error;
  402. #endif
  403. else
  404. type = TYPE_CHAR;
  405. break;
  406. #ifdef HAVE_WINT_T
  407. case 'C':
  408. type = TYPE_WIDE_CHAR;
  409. c = 'c';
  410. break;
  411. #endif
  412. case 's':
  413. if (flags >= 8)
  414. #ifdef HAVE_WCHAR_T
  415. type = TYPE_WIDE_STRING;
  416. #else
  417. goto error;
  418. #endif
  419. else
  420. type = TYPE_STRING;
  421. break;
  422. #ifdef HAVE_WCHAR_T
  423. case 'S':
  424. type = TYPE_WIDE_STRING;
  425. c = 's';
  426. break;
  427. #endif
  428. case 'p':
  429. type = TYPE_POINTER;
  430. break;
  431. case 'n':
  432. #ifdef HAVE_LONG_LONG_INT
  433. /* If 'long long' exists and is larger than 'long': */
  434. if (flags >= 16 || (flags & 4))
  435. type = TYPE_COUNT_LONGLONGINT_POINTER;
  436. else
  437. #endif
  438. /* If 'long long' exists and is the same as 'long', we parse
  439. "lln" into TYPE_COUNT_LONGINT_POINTER. */
  440. if (flags >= 8)
  441. type = TYPE_COUNT_LONGINT_POINTER;
  442. else if (flags & 2)
  443. type = TYPE_COUNT_SCHAR_POINTER;
  444. else if (flags & 1)
  445. type = TYPE_COUNT_SHORT_POINTER;
  446. else
  447. type = TYPE_COUNT_INT_POINTER;
  448. break;
  449. case '%':
  450. type = TYPE_NONE;
  451. break;
  452. default:
  453. /* Unknown conversion character. */
  454. goto error;
  455. }
  456. }
  457. if (type != TYPE_NONE)
  458. {
  459. dp->arg_index = arg_index;
  460. if (dp->arg_index == ARG_NONE)
  461. {
  462. dp->arg_index = arg_posn++;
  463. if (dp->arg_index == ARG_NONE)
  464. /* arg_posn wrapped around. */
  465. goto error;
  466. }
  467. REGISTER_ARG (dp->arg_index, type);
  468. }
  469. dp->conversion = c;
  470. dp->dir_end = cp;
  471. }
  472. d->count++;
  473. if (d->count >= d_allocated)
  474. {
  475. size_t memory_size;
  476. DIRECTIVE *memory;
  477. d_allocated = xtimes (d_allocated, 2);
  478. memory_size = xtimes (d_allocated, sizeof (DIRECTIVE));
  479. if (size_overflow_p (memory_size))
  480. /* Overflow, would lead to out of memory. */
  481. goto error;
  482. memory = realloc (d->dir, memory_size);
  483. if (memory == NULL)
  484. /* Out of memory. */
  485. goto error;
  486. d->dir = memory;
  487. }
  488. }
  489. }
  490. d->dir[d->count].dir_start = cp;
  491. d->max_width_length = max_width_length;
  492. d->max_precision_length = max_precision_length;
  493. return 0;
  494. error:
  495. if (a->arg)
  496. free (a->arg);
  497. if (d->dir)
  498. free (d->dir);
  499. return -1;
  500. }
  501. #undef DIRECTIVES
  502. #undef DIRECTIVE
  503. #undef CHAR_T
  504. #undef PRINTF_PARSE