Sync usage with man page.
[netbsd-mini2440.git] / gnu / dist / gettext / gettext-tools / src / format-awk.c
blobd2a9423a4b0453bafc20e4b93551fb8ebc4beecd
1 /* awk format strings.
2 Copyright (C) 2001-2004 Free Software Foundation, Inc.
3 Written by Bruno Haible <haible@clisp.cons.org>, 2002.
5 This program is free software; you can redistribute it and/or modify
6 it under the terms of the GNU General Public License as published by
7 the Free Software Foundation; either version 2, or (at your option)
8 any later version.
10 This program is distributed in the hope that it will be useful,
11 but WITHOUT ANY WARRANTY; without even the implied warranty of
12 MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
13 GNU General Public License for more details.
15 You should have received a copy of the GNU General Public License
16 along with this program; if not, write to the Free Software Foundation,
17 Inc., 59 Temple Place - Suite 330, Boston, MA 02111-1307, USA. */
19 #ifdef HAVE_CONFIG_H
20 # include <config.h>
21 #endif
23 #include <stdbool.h>
24 #include <stdlib.h>
26 #include "format.h"
27 #include "c-ctype.h"
28 #include "xalloc.h"
29 #include "xerror.h"
30 #include "format-invalid.h"
31 #include "gettext.h"
33 #define _(str) gettext (str)
/* awk format strings are described in the gawk-3.1 documentation and
   implemented in gawk-3.1.0/builtin.c: format_tree().
   A directive
   - starts with '%' or '%m$' where m is a positive integer,
   - is optionally followed by any of the characters '#', '0', '-', ' ', '+',
     each of which acts as a flag,
   - is optionally followed by a width specification: '*' (reads an argument)
     or '*m$' or a nonempty digit sequence,
   - is optionally followed by '.' and a precision specification: '*' (reads
     an argument) or '*m$' or a nonempty digit sequence,
   - is finished by a specifier
       - '%', that needs no argument,
       - 'c', that needs a character argument,
       - 's', that needs a string argument,
       - 'i', 'd', that need a signed integer argument,
       - 'o', 'u', 'x', 'X', that need an unsigned integer argument,
       - 'e', 'E', 'f', 'g', 'G', that need a floating-point argument.
   Numbered ('%m$' or '*m$') and unnumbered argument specifications cannot
   be used in the same string.
 */
/* Kind of value that a directive's argument must have.  The mapping from
   conversion specifiers to these constants is done in format_parse.  */
enum format_arg_type
{
  FAT_NONE,               /* '%': the directive consumes no argument */
  FAT_CHARACTER,          /* 'c' */
  FAT_STRING,             /* 's' */
  FAT_INTEGER,            /* 'i', 'd', and '*' width/precision arguments */
  FAT_UNSIGNED_INTEGER,   /* 'u', 'o', 'x', 'X' */
  FAT_FLOAT               /* 'e', 'E', 'f', 'g', 'G' */
};
66 struct numbered_arg
68 unsigned int number;
69 enum format_arg_type type;
/* Parsed description of a format string, as returned by format_parse.  */
struct spec
{
  /* Number of '%' directives seen (including '%%').  */
  unsigned int directives;
  /* Number of valid entries in NUMBERED.  */
  unsigned int numbered_arg_count;
  /* Number of entries for which NUMBERED has room.  */
  unsigned int allocated;
  /* Heap-allocated argument array, or NULL when nothing was allocated.  */
  struct numbered_arg *numbered;
};
/* Locale independent test for a decimal digit.
   Argument can be 'char' or 'unsigned char'.  (Whereas the argument of
   <ctype.h> isdigit must be an 'unsigned char'.)
   The subtraction maps '0'..'9' to 0..9; every other value, once converted
   to unsigned, lands at 10 or above, so one comparison covers both bounds
   and the argument is evaluated only once.  */
#undef isdigit
#define isdigit(c) ((unsigned int) ((c) - '0') < 10)
87 static int
88 numbered_arg_compare (const void *p1, const void *p2)
90 unsigned int n1 = ((const struct numbered_arg *) p1)->number;
91 unsigned int n2 = ((const struct numbered_arg *) p2)->number;
93 return (n1 > n2 ? 1 : n1 < n2 ? -1 : 0);
96 static void *
97 format_parse (const char *format, bool translated, char **invalid_reason)
99 struct spec spec;
100 unsigned int unnumbered_arg_count;
101 struct spec *result;
103 spec.directives = 0;
104 spec.numbered_arg_count = 0;
105 spec.allocated = 0;
106 spec.numbered = NULL;
107 unnumbered_arg_count = 0;
109 for (; *format != '\0';)
110 if (*format++ == '%')
112 /* A directive. */
113 unsigned int number = 0;
114 enum format_arg_type type;
116 spec.directives++;
118 if (isdigit (*format))
120 const char *f = format;
121 unsigned int m = 0;
125 m = 10 * m + (*f - '0');
126 f++;
128 while (isdigit (*f));
130 if (*f == '$')
132 if (m == 0)
134 *invalid_reason = INVALID_ARGNO_0 (spec.directives);
135 goto bad_format;
137 number = m;
138 format = ++f;
142 /* Parse flags. */
143 while (*format == ' ' || *format == '+' || *format == '-'
144 || *format == '#' || *format == '0')
145 format++;
147 /* Parse width. */
148 if (*format == '*')
150 unsigned int width_number = 0;
152 format++;
154 if (isdigit (*format))
156 const char *f = format;
157 unsigned int m = 0;
161 m = 10 * m + (*f - '0');
162 f++;
164 while (isdigit (*f));
166 if (*f == '$')
168 if (m == 0)
170 *invalid_reason =
171 INVALID_WIDTH_ARGNO_0 (spec.directives);
172 goto bad_format;
174 width_number = m;
175 format = ++f;
179 if (width_number)
181 /* Numbered argument. */
183 /* Numbered and unnumbered specifications are exclusive. */
184 if (unnumbered_arg_count > 0)
186 *invalid_reason = INVALID_MIXES_NUMBERED_UNNUMBERED ();
187 goto bad_format;
190 if (spec.allocated == spec.numbered_arg_count)
192 spec.allocated = 2 * spec.allocated + 1;
193 spec.numbered = (struct numbered_arg *) xrealloc (spec.numbered, spec.allocated * sizeof (struct numbered_arg));
195 spec.numbered[spec.numbered_arg_count].number = width_number;
196 spec.numbered[spec.numbered_arg_count].type = FAT_INTEGER;
197 spec.numbered_arg_count++;
199 else
201 /* Unnumbered argument. */
203 /* Numbered and unnumbered specifications are exclusive. */
204 if (spec.numbered_arg_count > 0)
206 *invalid_reason = INVALID_MIXES_NUMBERED_UNNUMBERED ();
207 goto bad_format;
210 if (spec.allocated == unnumbered_arg_count)
212 spec.allocated = 2 * spec.allocated + 1;
213 spec.numbered = (struct numbered_arg *) xrealloc (spec.numbered, spec.allocated * sizeof (struct numbered_arg));
215 spec.numbered[unnumbered_arg_count].number = unnumbered_arg_count + 1;
216 spec.numbered[unnumbered_arg_count].type = FAT_INTEGER;
217 unnumbered_arg_count++;
220 else if (isdigit (*format))
222 do format++; while (isdigit (*format));
225 /* Parse precision. */
226 if (*format == '.')
228 format++;
230 if (*format == '*')
232 unsigned int precision_number = 0;
234 format++;
236 if (isdigit (*format))
238 const char *f = format;
239 unsigned int m = 0;
243 m = 10 * m + (*f - '0');
244 f++;
246 while (isdigit (*f));
248 if (*f == '$')
250 if (m == 0)
252 *invalid_reason =
253 INVALID_PRECISION_ARGNO_0 (spec.directives);
254 goto bad_format;
256 precision_number = m;
257 format = ++f;
261 if (precision_number)
263 /* Numbered argument. */
265 /* Numbered and unnumbered specifications are exclusive. */
266 if (unnumbered_arg_count > 0)
268 *invalid_reason = INVALID_MIXES_NUMBERED_UNNUMBERED ();
269 goto bad_format;
272 if (spec.allocated == spec.numbered_arg_count)
274 spec.allocated = 2 * spec.allocated + 1;
275 spec.numbered = (struct numbered_arg *) xrealloc (spec.numbered, spec.allocated * sizeof (struct numbered_arg));
277 spec.numbered[spec.numbered_arg_count].number = precision_number;
278 spec.numbered[spec.numbered_arg_count].type = FAT_INTEGER;
279 spec.numbered_arg_count++;
281 else
283 /* Unnumbered argument. */
285 /* Numbered and unnumbered specifications are exclusive. */
286 if (spec.numbered_arg_count > 0)
288 *invalid_reason = INVALID_MIXES_NUMBERED_UNNUMBERED ();
289 goto bad_format;
292 if (spec.allocated == unnumbered_arg_count)
294 spec.allocated = 2 * spec.allocated + 1;
295 spec.numbered = (struct numbered_arg *) xrealloc (spec.numbered, spec.allocated * sizeof (struct numbered_arg));
297 spec.numbered[unnumbered_arg_count].type = unnumbered_arg_count + 1;
298 spec.numbered[unnumbered_arg_count].type = FAT_INTEGER;
299 unnumbered_arg_count++;
302 else if (isdigit (*format))
304 do format++; while (isdigit (*format));
308 switch (*format)
310 case '%':
311 type = FAT_NONE;
312 break;
313 case 'c':
314 type = FAT_CHARACTER;
315 break;
316 case 's':
317 type = FAT_STRING;
318 break;
319 case 'i': case 'd':
320 type = FAT_INTEGER;
321 break;
322 case 'u': case 'o': case 'x': case 'X':
323 type = FAT_UNSIGNED_INTEGER;
324 break;
325 case 'e': case 'E': case 'f': case 'g': case 'G':
326 type = FAT_FLOAT;
327 break;
328 default:
329 *invalid_reason =
330 (*format == '\0'
331 ? INVALID_UNTERMINATED_DIRECTIVE ()
332 : INVALID_CONVERSION_SPECIFIER (spec.directives, *format));
333 goto bad_format;
336 if (type != FAT_NONE)
338 if (number)
340 /* Numbered argument. */
342 /* Numbered and unnumbered specifications are exclusive. */
343 if (unnumbered_arg_count > 0)
345 *invalid_reason = INVALID_MIXES_NUMBERED_UNNUMBERED ();
346 goto bad_format;
349 if (spec.allocated == spec.numbered_arg_count)
351 spec.allocated = 2 * spec.allocated + 1;
352 spec.numbered = (struct numbered_arg *) xrealloc (spec.numbered, spec.allocated * sizeof (struct numbered_arg));
354 spec.numbered[spec.numbered_arg_count].number = number;
355 spec.numbered[spec.numbered_arg_count].type = type;
356 spec.numbered_arg_count++;
358 else
360 /* Unnumbered argument. */
362 /* Numbered and unnumbered specifications are exclusive. */
363 if (spec.numbered_arg_count > 0)
365 *invalid_reason = INVALID_MIXES_NUMBERED_UNNUMBERED ();
366 goto bad_format;
369 if (spec.allocated == unnumbered_arg_count)
371 spec.allocated = 2 * spec.allocated + 1;
372 spec.numbered = (struct numbered_arg *) xrealloc (spec.numbered, spec.allocated * sizeof (struct numbered_arg));
374 spec.numbered[unnumbered_arg_count].number = unnumbered_arg_count + 1;
375 spec.numbered[unnumbered_arg_count].type = type;
376 unnumbered_arg_count++;
380 format++;
383 /* Convert the unnumbered argument array to numbered arguments. */
384 if (unnumbered_arg_count > 0)
385 spec.numbered_arg_count = unnumbered_arg_count;
386 /* Sort the numbered argument array, and eliminate duplicates. */
387 else if (spec.numbered_arg_count > 1)
389 unsigned int i, j;
390 bool err;
392 qsort (spec.numbered, spec.numbered_arg_count,
393 sizeof (struct numbered_arg), numbered_arg_compare);
395 /* Remove duplicates: Copy from i to j, keeping 0 <= j <= i. */
396 err = false;
397 for (i = j = 0; i < spec.numbered_arg_count; i++)
398 if (j > 0 && spec.numbered[i].number == spec.numbered[j-1].number)
400 enum format_arg_type type1 = spec.numbered[i].type;
401 enum format_arg_type type2 = spec.numbered[j-1].type;
402 enum format_arg_type type_both;
404 if (type1 == type2)
405 type_both = type1;
406 else
408 /* Incompatible types. */
409 type_both = FAT_NONE;
410 if (!err)
411 *invalid_reason =
412 INVALID_INCOMPATIBLE_ARG_TYPES (spec.numbered[i].number);
413 err = true;
416 spec.numbered[j-1].type = type_both;
418 else
420 if (j < i)
422 spec.numbered[j].number = spec.numbered[i].number;
423 spec.numbered[j].type = spec.numbered[i].type;
425 j++;
427 spec.numbered_arg_count = j;
428 if (err)
429 /* *invalid_reason has already been set above. */
430 goto bad_format;
433 result = (struct spec *) xmalloc (sizeof (struct spec));
434 *result = spec;
435 return result;
437 bad_format:
438 if (spec.numbered != NULL)
439 free (spec.numbered);
440 return NULL;
443 static void
444 format_free (void *descr)
446 struct spec *spec = (struct spec *) descr;
448 if (spec->numbered != NULL)
449 free (spec->numbered);
450 free (spec);
453 static int
454 format_get_number_of_directives (void *descr)
456 struct spec *spec = (struct spec *) descr;
458 return spec->directives;
461 static bool
462 format_check (void *msgid_descr, void *msgstr_descr, bool equality,
463 formatstring_error_logger_t error_logger,
464 const char *pretty_msgstr)
466 struct spec *spec1 = (struct spec *) msgid_descr;
467 struct spec *spec2 = (struct spec *) msgstr_descr;
468 bool err = false;
470 if (spec1->numbered_arg_count + spec2->numbered_arg_count > 0)
472 unsigned int i, j;
473 unsigned int n1 = spec1->numbered_arg_count;
474 unsigned int n2 = spec2->numbered_arg_count;
476 /* Check the argument names are the same.
477 Both arrays are sorted. We search for the first difference. */
478 for (i = 0, j = 0; i < n1 || j < n2; )
480 int cmp = (i >= n1 ? 1 :
481 j >= n2 ? -1 :
482 spec1->numbered[i].number > spec2->numbered[j].number ? 1 :
483 spec1->numbered[i].number < spec2->numbered[j].number ? -1 :
486 if (cmp > 0)
488 if (error_logger)
489 error_logger (_("a format specification for argument %u, as in '%s', doesn't exist in 'msgid'"),
490 spec2->numbered[j].number, pretty_msgstr);
491 err = true;
492 break;
494 else if (cmp < 0)
496 if (equality)
498 if (error_logger)
499 error_logger (_("a format specification for argument %u doesn't exist in '%s'"),
500 spec1->numbered[i].number, pretty_msgstr);
501 err = true;
502 break;
504 else
505 i++;
507 else
508 j++, i++;
510 /* Check the argument types are the same. */
511 if (!err)
512 for (i = 0, j = 0; j < n2; )
514 if (spec1->numbered[i].number == spec2->numbered[j].number)
516 if (spec1->numbered[i].type != spec2->numbered[j].type)
518 if (error_logger)
519 error_logger (_("format specifications in 'msgid' and '%s' for argument %u are not the same"),
520 pretty_msgstr, spec2->numbered[j].number);
521 err = true;
522 break;
524 j++, i++;
526 else
527 i++;
531 return err;
535 struct formatstring_parser formatstring_awk =
537 format_parse,
538 format_free,
539 format_get_number_of_directives,
540 format_check
544 #ifdef TEST
546 /* Test program: Print the argument list specification returned by
547 format_parse for strings read from standard input. */
549 #include <stdio.h>
550 #include "getline.h"
552 static void
553 format_print (void *descr)
555 struct spec *spec = (struct spec *) descr;
556 unsigned int last;
557 unsigned int i;
559 if (spec == NULL)
561 printf ("INVALID");
562 return;
565 printf ("(");
566 last = 1;
567 for (i = 0; i < spec->numbered_arg_count; i++)
569 unsigned int number = spec->numbered[i].number;
571 if (i > 0)
572 printf (" ");
573 if (number < last)
574 abort ();
575 for (; last < number; last++)
576 printf ("_ ");
577 switch (spec->numbered[i].type)
579 case FAT_CHARACTER:
580 printf ("c");
581 break;
582 case FAT_STRING:
583 printf ("s");
584 break;
585 case FAT_INTEGER:
586 printf ("i");
587 break;
588 case FAT_UNSIGNED_INTEGER:
589 printf ("[unsigned]i");
590 break;
591 case FAT_FLOAT:
592 printf ("f");
593 break;
594 default:
595 abort ();
597 last = number + 1;
599 printf (")");
/* Test driver: reads format strings from standard input, one per line,
   and prints for each the argument list found by format_parse, followed
   by the reason for rejection if the string is invalid.  Stops at end of
   input or on a read error.  */
int
main (void)
{
  for (;;)
    {
      char *line = NULL;
      size_t line_size = 0;
      int line_len;
      char *invalid_reason;
      void *descr;

      line_len = getline (&line, &line_size, stdin);
      if (line_len < 0)
        {
          /* getline may have allocated a buffer even though it failed.  */
          free (line);
          break;
        }
      /* Strip the trailing newline, if any.  */
      if (line_len > 0 && line[line_len - 1] == '\n')
        line[--line_len] = '\0';

      invalid_reason = NULL;
      descr = format_parse (line, false, &invalid_reason);

      format_print (descr);
      printf ("\n");
      if (descr == NULL)
        printf ("%s\n", invalid_reason);
      else
        /* Release the descriptor so the loop does not leak one per line.  */
        format_free (descr);

      free (invalid_reason);
      free (line);
    }

  return 0;
}
/*
 * For Emacs M-x compile
 * Local Variables:
 * compile-command: "/bin/sh ../libtool --mode=link gcc -o a.out -static -O -g -Wall -I.. -I../lib -I../intl -DHAVE_CONFIG_H -DTEST format-awk.c ../lib/libgettextlib.la"
 * End:
 */
641 #endif /* TEST */