diff options
author | Bruno Haible <bruno@clisp.org> | 2010-11-08 01:12:06 +0100 |
---|---|---|
committer | Bruno Haible <bruno@clisp.org> | 2011-06-07 23:38:48 +0200 |
commit | 8a5368eaf0daab888ad5a770a7689e170f33be96 (patch) | |
tree | 0f2941a543a1e23e4336c6b02f05cd237525dec6 | |
parent | ee68315931a8eed630ddd9913ae4e9f743780957 (diff) | |
download | external_gettext-8a5368eaf0daab888ad5a770a7689e170f33be96.zip external_gettext-8a5368eaf0daab888ad5a770a7689e170f33be96.tar.gz external_gettext-8a5368eaf0daab888ad5a770a7689e170f33be96.tar.bz2 |
format-c.c: Share code with libintlext.
-rw-r--r-- | gettext-tools/po/ChangeLog | 4 | ||||
-rw-r--r-- | gettext-tools/po/POTFILES.in | 1 | ||||
-rw-r--r-- | gettext-tools/src/ChangeLog | 9 | ||||
-rw-r--r-- | gettext-tools/src/FILES | 1 | ||||
-rw-r--r-- | gettext-tools/src/Makefile.am | 30 | ||||
-rw-r--r-- | gettext-tools/src/format-c-parse.h | 853 | ||||
-rw-r--r-- | gettext-tools/src/format-c.c | 837 |
7 files changed, 894 insertions, 841 deletions
diff --git a/gettext-tools/po/ChangeLog b/gettext-tools/po/ChangeLog index 90c06c4..714a45d 100644 --- a/gettext-tools/po/ChangeLog +++ b/gettext-tools/po/ChangeLog @@ -1,3 +1,7 @@ +2011-06-02 Bruno Haible <bruno@clisp.org> + + * POTFILES.in: Add src/format-c-parse.h. + 2010-10-10 Bruno Haible <bruno@clisp.org> * bg.po: Update from Roumen Petrov <transl@roumenpetrov.info>. diff --git a/gettext-tools/po/POTFILES.in b/gettext-tools/po/POTFILES.in index fb7ccc6..fc66f5d 100644 --- a/gettext-tools/po/POTFILES.in +++ b/gettext-tools/po/POTFILES.in @@ -31,6 +31,7 @@ src/format.c src/format-awk.c src/format-boost.c src/format-c.c +src/format-c-parse.h src/format-csharp.c src/format-elisp.c src/format-gcc-internal.c diff --git a/gettext-tools/src/ChangeLog b/gettext-tools/src/ChangeLog index c951dab..91e300d 100644 --- a/gettext-tools/src/ChangeLog +++ b/gettext-tools/src/ChangeLog @@ -1,5 +1,14 @@ 2010-11-07 Bruno Haible <bruno@clisp.org> + format-c.c: Share code with libintlext. + * format-c-parse.h: New file, extracted from format-c.c. + * format-c.c: Include it. + (format_parse_entrails): Remove function. + * Makefile.am (FORMAT_SOURCE): Add format-c-parse.h. + * FILES: Update. + +2010-11-07 Bruno Haible <bruno@clisp.org> + format-c.c: Prepare for sharing code with libintlext. * format-c.c: Move INVALID_* macros. (IF_OOM): New macro. diff --git a/gettext-tools/src/FILES b/gettext-tools/src/FILES index d2147d4..9a41f48 100644 --- a/gettext-tools/src/FILES +++ b/gettext-tools/src/FILES @@ -211,6 +211,7 @@ plural-table.c format.h Declarations of the language dependent format string handlers. format-invalid.h Declarations of some error messages for invalid strings. format-c.c Format string handling for C. +format-c-parse.h Format string handling for C, parsing routine. format-sh.c Format string handling for Shell. format-python.c Format string handling for Python. format-lisp.c Format string handling for Common Lisp. diff --git a/gettext-tools/src/Makefile.am b/gettext-tools/src/Makefile.am index a37f7c7..188a0e6 100644 --- a/gettext-tools/src/Makefile.am +++ b/gettext-tools/src/Makefile.am @@ -112,12 +112,30 @@ FORMAT_SOURCE = format.c else FORMAT_SOURCE = ../woe32dll/c++format.cc endif -FORMAT_SOURCE += format-invalid.h \ -format-c.c format-sh.c format-python.c format-lisp.c format-elisp.c \ -format-librep.c format-scheme.c format-java.c format-csharp.c format-awk.c \ -format-pascal.c format-ycp.c format-tcl.c format-perl.c format-perl-brace.c \ -format-php.c format-gcc-internal.c format-gfc-internal.c \ -format-qt.c format-qt-plural.c format-kde.c format-boost.c +FORMAT_SOURCE += \ + format-invalid.h \ + format-c.c format-c-parse.h \ + format-sh.c \ + format-python.c \ + format-lisp.c \ + format-elisp.c \ + format-librep.c \ + format-scheme.c \ + format-java.c \ + format-csharp.c \ + format-awk.c \ + format-pascal.c \ + format-ycp.c \ + format-tcl.c \ + format-perl.c \ + format-perl-brace.c \ + format-php.c \ + format-gcc-internal.c \ + format-gfc-internal.c \ + format-qt.c \ + format-qt-plural.c \ + format-kde.c \ + format-boost.c # libgettextsrc contains all code that is needed by at least two programs. libgettextsrc_la_SOURCES = \ diff --git a/gettext-tools/src/format-c-parse.h b/gettext-tools/src/format-c-parse.h new file mode 100644 index 0000000..a585ccd --- /dev/null +++ b/gettext-tools/src/format-c-parse.h @@ -0,0 +1,853 @@ +/* Parsing C format strings. + Copyright (C) 2001-2004, 2006-2007, 2009 Free Software Foundation, Inc. + Written by Bruno Haible <haible@clisp.cons.org>, 2001. + + This program is free software: you can redistribute it and/or modify + it under the terms of the GNU General Public License as published by + the Free Software Foundation; either version 3 of the License, or + (at your option) any later version. + + This program is distributed in the hope that it will be useful, + but WITHOUT ANY WARRANTY; without even the implied warranty of + MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the + GNU General Public License for more details. + + You should have received a copy of the GNU General Public License + along with this program. If not, see <http://www.gnu.org/licenses/>. */ + + +/* C format strings are described in POSIX (IEEE P1003.1 2001), section + XSH 3 fprintf(). See also Linux fprintf(3) manual page. + A directive + - starts with '%' or '%m$' where m is a positive integer, + - is optionally followed by any of the characters '#', '0', '-', ' ', '+', + "'", or - only in msgstr strings - the string "I", each of which acts as + a flag, + - is optionally followed by a width specification: '*' (reads an argument) + or '*m$' or a nonempty digit sequence, + - is optionally followed by '.' and a precision specification: '*' (reads + an argument) or '*m$' or a nonempty digit sequence, + - is either continued like this: + - is optionally followed by a size specifier, one of 'hh' 'h' 'l' 'll' + 'L' 'q' 'j' 'z' 't', + - is finished by a specifier + - '%', that needs no argument, + - 'c', 'C', that need a character argument, + - 's', 'S', that need a string argument, + - 'i', 'd', that need a signed integer argument, + - 'o', 'u', 'x', 'X', that need an unsigned integer argument, + - 'e', 'E', 'f', 'F', 'g', 'G', 'a', 'A', that need a floating-point + argument, + - 'p', that needs a 'void *' argument, + - 'n', that needs a pointer to integer. + or is finished by a specifier '<' inttypes-macro '>' where inttypes-macro + is an ISO C 99 section 7.8.1 format directive. + Numbered ('%m$' or '*m$') and unnumbered argument specifications cannot + be used in the same string. When numbered argument specifications are + used, specifying the Nth argument requires that all the leading arguments, + from the first to the (N-1)th, are specified in the format string. + */ + +enum format_arg_type +{ + FAT_NONE = 0, + /* Basic types */ + FAT_INTEGER = 1, + FAT_DOUBLE = 2, + FAT_CHAR = 3, + FAT_STRING = 4, + FAT_OBJC_OBJECT = 5, + FAT_POINTER = 6, + FAT_COUNT_POINTER = 7, + /* Flags */ + FAT_UNSIGNED = 1 << 3, + FAT_SIZE_SHORT = 1 << 4, + FAT_SIZE_CHAR = 2 << 4, + FAT_SIZE_LONG = 1 << 6, + FAT_SIZE_LONGLONG = 2 << 6, + FAT_SIZE_8_T = 1 << 8, + FAT_SIZE_16_T = 1 << 9, + FAT_SIZE_32_T = 1 << 10, + FAT_SIZE_64_T = 1 << 11, + FAT_SIZE_LEAST8_T = 1 << 12, + FAT_SIZE_LEAST16_T = 1 << 13, + FAT_SIZE_LEAST32_T = 1 << 14, + FAT_SIZE_LEAST64_T = 1 << 15, + FAT_SIZE_FAST8_T = 1 << 16, + FAT_SIZE_FAST16_T = 1 << 17, + FAT_SIZE_FAST32_T = 1 << 18, + FAT_SIZE_FAST64_T = 1 << 19, + FAT_SIZE_INTMAX_T = 1 << 20, + FAT_SIZE_INTPTR_T = 1 << 21, + FAT_SIZE_SIZE_T = 1 << 22, + FAT_SIZE_PTRDIFF_T = 1 << 23, + FAT_WIDE = FAT_SIZE_LONG, + /* Meaningful combinations of basic types and flags: + 'signed char' = FAT_INTEGER | FAT_SIZE_CHAR, + 'unsigned char' = FAT_INTEGER | FAT_SIZE_CHAR | FAT_UNSIGNED, + 'short' = FAT_INTEGER | FAT_SIZE_SHORT, + 'unsigned short' = FAT_INTEGER | FAT_SIZE_SHORT | FAT_UNSIGNED, + 'int' = FAT_INTEGER, + 'unsigned int' = FAT_INTEGER | FAT_UNSIGNED, + 'long int' = FAT_INTEGER | FAT_SIZE_LONG, + 'unsigned long int' = FAT_INTEGER | FAT_SIZE_LONG | FAT_UNSIGNED, + 'long long int' = FAT_INTEGER | FAT_SIZE_LONGLONG, + 'unsigned long long int' = FAT_INTEGER | FAT_SIZE_LONGLONG | FAT_UNSIGNED, + 'double' = FAT_DOUBLE, + 'long double' = FAT_DOUBLE | FAT_SIZE_LONGLONG, + 'char'/'int' = FAT_CHAR, + 'wchar_t'/'wint_t' = FAT_CHAR | FAT_SIZE_LONG, + 'const char *' = FAT_STRING, + 'const wchar_t *' = FAT_STRING | FAT_SIZE_LONG, + 'void *' = FAT_POINTER, + FAT_COUNT_SCHAR_POINTER = FAT_COUNT_POINTER | FAT_SIZE_CHAR, + FAT_COUNT_SHORT_POINTER = FAT_COUNT_POINTER | FAT_SIZE_SHORT, + FAT_COUNT_INT_POINTER = FAT_COUNT_POINTER, + FAT_COUNT_LONGINT_POINTER = FAT_COUNT_POINTER | FAT_SIZE_LONG, + FAT_COUNT_LONGLONGINT_POINTER = FAT_COUNT_POINTER | FAT_SIZE_LONGLONG, + */ + /* Bitmasks */ + FAT_BASIC_MASK = (FAT_INTEGER | FAT_DOUBLE | FAT_CHAR | FAT_STRING + | FAT_OBJC_OBJECT | FAT_POINTER | FAT_COUNT_POINTER), + FAT_SIZE_MASK = (FAT_SIZE_SHORT | FAT_SIZE_CHAR + | FAT_SIZE_LONG | FAT_SIZE_LONGLONG + | FAT_SIZE_8_T | FAT_SIZE_16_T + | FAT_SIZE_32_T | FAT_SIZE_64_T + | FAT_SIZE_LEAST8_T | FAT_SIZE_LEAST16_T + | FAT_SIZE_LEAST32_T | FAT_SIZE_LEAST64_T + | FAT_SIZE_FAST8_T | FAT_SIZE_FAST16_T + | FAT_SIZE_FAST32_T | FAT_SIZE_FAST64_T + | FAT_SIZE_INTMAX_T | FAT_SIZE_INTPTR_T + | FAT_SIZE_SIZE_T | FAT_SIZE_PTRDIFF_T) +}; +#ifdef __cplusplus +typedef int format_arg_type_t; +#else +typedef enum format_arg_type format_arg_type_t; +#endif + +struct numbered_arg +{ + unsigned int number; + format_arg_type_t type; +}; + +struct unnumbered_arg +{ + format_arg_type_t type; +}; + +struct spec +{ + unsigned int directives; + unsigned int unnumbered_arg_count; + unsigned int allocated; + struct unnumbered_arg *unnumbered; + bool unlikely_intentional; + unsigned int sysdep_directives_count; + const char **sysdep_directives; +}; + +/* Locale independent test for a decimal digit. + Argument can be 'char' or 'unsigned char'. (Whereas the argument of + <ctype.h> isdigit must be an 'unsigned char'.) */ +#undef isdigit +#define isdigit(c) ((unsigned int) ((c) - '0') < 10) + +/* Whether to recognize the 'I' flag. */ +#if SYSDEP_SEGMENTS_PROCESSED +/* The 'I' flag can only occur in glibc >= 2.2. On other platforms, gettext() + filters it away even if it is present in the msgstr in the .mo file. */ +# define HANDLE_I_FLAG \ + (__GLIBC__ > 2 || (__GLIBC__ == 2 && __GLIBC_MINOR__ >= 2)) +#else +# define HANDLE_I_FLAG 1 +#endif + + +static int +numbered_arg_compare (const void *p1, const void *p2) +{ + unsigned int n1 = ((const struct numbered_arg *) p1)->number; + unsigned int n2 = ((const struct numbered_arg *) p2)->number; + + return (n1 > n2 ? 1 : n1 < n2 ? -1 : 0); +} + +static struct spec * +format_parse_entrails (const char *format, bool translated, + bool objc_extensions, char *fdi, char **invalid_reason, + struct spec *result) +{ + const char *const format_start = format; + struct spec spec; + unsigned int numbered_arg_count; + struct numbered_arg *numbered; + + spec.directives = 0; + numbered_arg_count = 0; + spec.unnumbered_arg_count = 0; + spec.allocated = 0; + numbered = NULL; + spec.unnumbered = NULL; + spec.unlikely_intentional = false; + spec.sysdep_directives_count = 0; + spec.sysdep_directives = NULL; + + for (; *format != '\0';) + if (*format++ == '%') + { + /* A directive. */ + unsigned int number = 0; + format_arg_type_t type; + format_arg_type_t size; + + FDI_SET (format - 1, FMTDIR_START); + spec.directives++; + + if (isdigit (*format)) + { + const char *f = format; + unsigned int m = 0; + + do + { + m = 10 * m + (*f - '0'); + f++; + } + while (isdigit (*f)); + + if (*f == '$') + { + if (m == 0) + { + *invalid_reason = INVALID_ARGNO_0 (spec.directives); + FDI_SET (f, FMTDIR_ERROR); + goto bad_format; + } + number = m; + format = ++f; + } + } + + /* Parse flags. */ + for (;;) + { + if (*format == ' ' || *format == '+' || *format == '-' + || *format == '#' || *format == '0' || *format == '\'') + format++; +#if HANDLE_I_FLAG + else if (translated && *format == 'I') + { + spec.sysdep_directives = + (const char **) + xrealloc (spec.sysdep_directives, + 2 * (spec.sysdep_directives_count + 1) + * sizeof (const char *)); + IF_OOM (spec.sysdep_directives, goto bad_format;) + spec.sysdep_directives[2 * spec.sysdep_directives_count] = format; + spec.sysdep_directives[2 * spec.sysdep_directives_count + 1] = format + 1; + spec.sysdep_directives_count++; + format++; + } +#endif + else + break; + } + + /* Parse width. */ + if (*format == '*') + { + unsigned int width_number = 0; + + format++; + + if (isdigit (*format)) + { + const char *f = format; + unsigned int m = 0; + + do + { + m = 10 * m + (*f - '0'); + f++; + } + while (isdigit (*f)); + + if (*f == '$') + { + if (m == 0) + { + *invalid_reason = + INVALID_WIDTH_ARGNO_0 (spec.directives); + FDI_SET (f, FMTDIR_ERROR); + goto bad_format; + } + width_number = m; + format = ++f; + } + } + + if (width_number) + { + /* Numbered argument. */ + + /* Numbered and unnumbered specifications are exclusive. */ + if (spec.unnumbered_arg_count > 0) + { + *invalid_reason = INVALID_MIXES_NUMBERED_UNNUMBERED (); + FDI_SET (format - 1, FMTDIR_ERROR); + goto bad_format; + } + + if (spec.allocated == numbered_arg_count) + { + spec.allocated = 2 * spec.allocated + 1; + numbered = (struct numbered_arg *) xrealloc (numbered, spec.allocated * sizeof (struct numbered_arg)); + IF_OOM (numbered, goto bad_format;) + } + numbered[numbered_arg_count].number = width_number; + numbered[numbered_arg_count].type = FAT_INTEGER; + numbered_arg_count++; + } + else + { + /* Unnumbered argument. */ + + /* Numbered and unnumbered specifications are exclusive. */ + if (numbered_arg_count > 0) + { + *invalid_reason = INVALID_MIXES_NUMBERED_UNNUMBERED (); + FDI_SET (format - 1, FMTDIR_ERROR); + goto bad_format; + } + + if (spec.allocated == spec.unnumbered_arg_count) + { + spec.allocated = 2 * spec.allocated + 1; + spec.unnumbered = (struct unnumbered_arg *) xrealloc (spec.unnumbered, spec.allocated * sizeof (struct unnumbered_arg)); + IF_OOM (spec.unnumbered, goto bad_format;) + } + spec.unnumbered[spec.unnumbered_arg_count].type = FAT_INTEGER; + spec.unnumbered_arg_count++; + } + } + else if (isdigit (*format)) + { + do format++; while (isdigit (*format)); + } + + /* Parse precision. */ + if (*format == '.') + { + format++; + + if (*format == '*') + { + unsigned int precision_number = 0; + + format++; + + if (isdigit (*format)) + { + const char *f = format; + unsigned int m = 0; + + do + { + m = 10 * m + (*f - '0'); + f++; + } + while (isdigit (*f)); + + if (*f == '$') + { + if (m == 0) + { + *invalid_reason = + INVALID_PRECISION_ARGNO_0 (spec.directives); + FDI_SET (f, FMTDIR_ERROR); + goto bad_format; + } + precision_number = m; + format = ++f; + } + } + + if (precision_number) + { + /* Numbered argument. */ + + /* Numbered and unnumbered specifications are exclusive. */ + if (spec.unnumbered_arg_count > 0) + { + *invalid_reason = INVALID_MIXES_NUMBERED_UNNUMBERED (); + FDI_SET (format - 1, FMTDIR_ERROR); + goto bad_format; + } + + if (spec.allocated == numbered_arg_count) + { + spec.allocated = 2 * spec.allocated + 1; + numbered = (struct numbered_arg *) xrealloc (numbered, spec.allocated * sizeof (struct numbered_arg)); + IF_OOM (numbered, goto bad_format;) + } + numbered[numbered_arg_count].number = precision_number; + numbered[numbered_arg_count].type = FAT_INTEGER; + numbered_arg_count++; + } + else + { + /* Unnumbered argument. */ + + /* Numbered and unnumbered specifications are exclusive. */ + if (numbered_arg_count > 0) + { + *invalid_reason = INVALID_MIXES_NUMBERED_UNNUMBERED (); + FDI_SET (format - 1, FMTDIR_ERROR); + goto bad_format; + } + + if (spec.allocated == spec.unnumbered_arg_count) + { + spec.allocated = 2 * spec.allocated + 1; + spec.unnumbered = (struct unnumbered_arg *) xrealloc (spec.unnumbered, spec.allocated * sizeof (struct unnumbered_arg)); + IF_OOM (spec.unnumbered, goto bad_format;) + } + spec.unnumbered[spec.unnumbered_arg_count].type = FAT_INTEGER; + spec.unnumbered_arg_count++; + } + } + else if (isdigit (*format)) + { + do format++; while (isdigit (*format)); + } + } + + if (!SYSDEP_SEGMENTS_PROCESSED && *format == '<') + { + spec.sysdep_directives = + (const char **) + xrealloc (spec.sysdep_directives, + 2 * (spec.sysdep_directives_count + 1) + * sizeof (const char *)); + IF_OOM (spec.sysdep_directives, goto bad_format;) + spec.sysdep_directives[2 * spec.sysdep_directives_count] = format; + + format++; + /* Parse ISO C 99 section 7.8.1 format string directive. + Syntax: + P R I { d | i | o | u | x | X } + { { | LEAST | FAST } { 8 | 16 | 32 | 64 } | MAX | PTR } */ + if (*format != 'P') + { + *invalid_reason = INVALID_C99_MACRO (spec.directives); + FDI_SET (*format == '\0' ? format - 1 : format, FMTDIR_ERROR); + goto bad_format; + } + format++; + if (*format != 'R') + { + *invalid_reason = INVALID_C99_MACRO (spec.directives); + FDI_SET (*format == '\0' ? format - 1 : format, FMTDIR_ERROR); + goto bad_format; + } + format++; + if (*format != 'I') + { + *invalid_reason = INVALID_C99_MACRO (spec.directives); + FDI_SET (*format == '\0' ? format - 1 : format, FMTDIR_ERROR); + goto bad_format; + } + format++; + + switch (*format) + { + case 'i': case 'd': + type = FAT_INTEGER; + break; + case 'u': case 'o': case 'x': case 'X': + type = FAT_INTEGER | FAT_UNSIGNED; + break; + default: + *invalid_reason = INVALID_C99_MACRO (spec.directives); + FDI_SET (*format == '\0' ? format - 1 : format, FMTDIR_ERROR); + goto bad_format; + } + format++; + + if (format[0] == 'M' && format[1] == 'A' && format[2] == 'X') + { + type |= FAT_SIZE_INTMAX_T; + format += 3; + } + else if (format[0] == 'P' && format[1] == 'T' && format[2] == 'R') + { + type |= FAT_SIZE_INTPTR_T; + format += 3; + } + else + { + if (format[0] == 'L' && format[1] == 'E' && format[2] == 'A' + && format[3] == 'S' && format[4] == 'T') + { + format += 5; + if (format[0] == '8') + { + type |= FAT_SIZE_LEAST8_T; + format++; + } + else if (format[0] == '1' && format[1] == '6') + { + type |= FAT_SIZE_LEAST16_T; + format += 2; + } + else if (format[0] == '3' && format[1] == '2') + { + type |= FAT_SIZE_LEAST32_T; + format += 2; + } + else if (format[0] == '6' && format[1] == '4') + { + type |= FAT_SIZE_LEAST64_T; + format += 2; + } + else + { + *invalid_reason = INVALID_C99_MACRO (spec.directives); + FDI_SET (*format == '\0' ? format - 1 : format, + FMTDIR_ERROR); + goto bad_format; + } + } + else if (format[0] == 'F' && format[1] == 'A' + && format[2] == 'S' && format[3] == 'T') + { + format += 4; + if (format[0] == '8') + { + type |= FAT_SIZE_FAST8_T; + format++; + } + else if (format[0] == '1' && format[1] == '6') + { + type |= FAT_SIZE_FAST16_T; + format += 2; + } + else if (format[0] == '3' && format[1] == '2') + { + type |= FAT_SIZE_FAST32_T; + format += 2; + } + else if (format[0] == '6' && format[1] == '4') + { + type |= FAT_SIZE_FAST64_T; + format += 2; + } + else + { + *invalid_reason = INVALID_C99_MACRO (spec.directives); + FDI_SET (*format == '\0' ? format - 1 : format, + FMTDIR_ERROR); + goto bad_format; + } + } + else + { + if (format[0] == '8') + { + type |= FAT_SIZE_8_T; + format++; + } + else if (format[0] == '1' && format[1] == '6') + { + type |= FAT_SIZE_16_T; + format += 2; + } + else if (format[0] == '3' && format[1] == '2') + { + type |= FAT_SIZE_32_T; + format += 2; + } + else if (format[0] == '6' && format[1] == '4') + { + type |= FAT_SIZE_64_T; + format += 2; + } + else + { + *invalid_reason = INVALID_C99_MACRO (spec.directives); + FDI_SET (*format == '\0' ? format - 1 : format, + FMTDIR_ERROR); + goto bad_format; + } + } + } + + if (*format != '>') + { + *invalid_reason = INVALID_ANGLE_BRACKET (spec.directives); + FDI_SET (*format == '\0' ? format - 1 : format, FMTDIR_ERROR); + goto bad_format; + } + + spec.sysdep_directives[2 * spec.sysdep_directives_count + 1] = format + 1; + spec.sysdep_directives_count++; + } + else + { + /* Parse size. */ + size = 0; + for (;; format++) + { + if (*format == 'h') + { + if (size & (FAT_SIZE_SHORT | FAT_SIZE_CHAR)) + size = FAT_SIZE_CHAR; + else + size = FAT_SIZE_SHORT; + } + else if (*format == 'l') + { + if (size & (FAT_SIZE_LONG | FAT_SIZE_LONGLONG)) + size = FAT_SIZE_LONGLONG; + else + size = FAT_SIZE_LONG; + } + else if (*format == 'L') + size = FAT_SIZE_LONGLONG; + else if (*format == 'q') + /* Old BSD 4.4 convention. */ + size = FAT_SIZE_LONGLONG; + else if (*format == 'j') + size = FAT_SIZE_INTMAX_T; + else if (*format == 'z' || *format == 'Z') + /* 'z' is standardized in ISO C 99, but glibc uses 'Z' + because the warning facility in gcc-2.95.2 understands + only 'Z' (see gcc-2.95.2/gcc/c-common.c:1784). */ + size = FAT_SIZE_SIZE_T; + else if (*format == 't') + size = FAT_SIZE_PTRDIFF_T; +#if (defined _WIN32 || defined __WIN32__) && ! defined __CYGWIN__ + else if (SYSDEP_SEGMENTS_PROCESSED + && *format == 'I' + && format[1] == '6' + && format[2] == '4') + { + size = FAT_SIZE_64_T; + format += 2; + } +#endif + else + break; + } + + switch (*format) + { + case '%': + /* Programmers writing _("%2%") most often will not want to + use this string as a c-format string, but rather as a + literal or as a different kind of format string. */ + if (format[-1] != '%') + spec.unlikely_intentional = true; + type = FAT_NONE; + break; + case 'm': /* glibc extension */ + type = FAT_NONE; + break; + case 'c': + type = FAT_CHAR; + type |= (size & (FAT_SIZE_LONG | FAT_SIZE_LONGLONG) + ? FAT_WIDE : 0); + break; + case 'C': /* obsolete */ + type = FAT_CHAR | FAT_WIDE; + break; + case 's': + type = FAT_STRING; + type |= (size & (FAT_SIZE_LONG | FAT_SIZE_LONGLONG) + ? FAT_WIDE : 0); + break; + case 'S': /* obsolete */ + type = FAT_STRING | FAT_WIDE; + break; + case 'i': case 'd': + type = FAT_INTEGER; + type |= (size & FAT_SIZE_MASK); + break; + case 'u': case 'o': case 'x': case 'X': + type = FAT_INTEGER | FAT_UNSIGNED; + type |= (size & FAT_SIZE_MASK); + break; + case 'e': case 'E': case 'f': case 'F': case 'g': case 'G': + case 'a': case 'A': + type = FAT_DOUBLE; + type |= (size & FAT_SIZE_LONGLONG); + break; + case '@': + if (objc_extensions) + { + type = FAT_OBJC_OBJECT; + break; + } + goto other; + case 'p': + type = FAT_POINTER; + break; + case 'n': + type = FAT_COUNT_POINTER; + type |= (size & FAT_SIZE_MASK); + break; + other: + default: + if (*format == '\0') + { + *invalid_reason = INVALID_UNTERMINATED_DIRECTIVE (); + FDI_SET (format - 1, FMTDIR_ERROR); + } + else + { + *invalid_reason = + INVALID_CONVERSION_SPECIFIER (spec.directives, *format); + FDI_SET (format, FMTDIR_ERROR); + } + goto bad_format; + } + } + + if (type != FAT_NONE) + { + if (number) + { + /* Numbered argument. */ + + /* Numbered and unnumbered specifications are exclusive. */ + if (spec.unnumbered_arg_count > 0) + { + *invalid_reason = INVALID_MIXES_NUMBERED_UNNUMBERED (); + FDI_SET (format, FMTDIR_ERROR); + goto bad_format; + } + + if (spec.allocated == numbered_arg_count) + { + spec.allocated = 2 * spec.allocated + 1; + numbered = (struct numbered_arg *) xrealloc (numbered, spec.allocated * sizeof (struct numbered_arg)); + IF_OOM (numbered, goto bad_format;) + } + numbered[numbered_arg_count].number = number; + numbered[numbered_arg_count].type = type; + numbered_arg_count++; + } + else + { + /* Unnumbered argument. */ + + /* Numbered and unnumbered specifications are exclusive. */ + if (numbered_arg_count > 0) + { + *invalid_reason = INVALID_MIXES_NUMBERED_UNNUMBERED (); + FDI_SET (format, FMTDIR_ERROR); + goto bad_format; + } + + if (spec.allocated == spec.unnumbered_arg_count) + { + spec.allocated = 2 * spec.allocated + 1; + spec.unnumbered = (struct unnumbered_arg *) xrealloc (spec.unnumbered, spec.allocated * sizeof (struct unnumbered_arg)); + IF_OOM (spec.unnumbered, goto bad_format;) + } + spec.unnumbered[spec.unnumbered_arg_count].type = type; + spec.unnumbered_arg_count++; + } + } + + FDI_SET (format, FMTDIR_END); + + format++; + } + + /* Sort the numbered argument array, and eliminate duplicates. */ + if (numbered_arg_count > 1) + { + unsigned int i, j; + bool err; + + qsort (numbered, numbered_arg_count, + sizeof (struct numbered_arg), numbered_arg_compare); + + /* Remove duplicates: Copy from i to j, keeping 0 <= j <= i. */ + err = false; + for (i = j = 0; i < numbered_arg_count; i++) + if (j > 0 && numbered[i].number == numbered[j-1].number) + { + format_arg_type_t type1 = numbered[i].type; + format_arg_type_t type2 = numbered[j-1].type; + format_arg_type_t type_both; + + if (type1 == type2) + type_both = type1; + else + { + /* Incompatible types. */ + type_both = FAT_NONE; + if (!err) + *invalid_reason = + INVALID_INCOMPATIBLE_ARG_TYPES (numbered[i].number); + err = true; + } + + numbered[j-1].type = type_both; + } + else + { + if (j < i) + { + numbered[j].number = numbered[i].number; + numbered[j].type = numbered[i].type; + } + j++; + } + numbered_arg_count = j; + if (err) + /* *invalid_reason has already been set above. */ + goto bad_format; + } + + /* Verify that the format strings uses all arguments up to the highest + numbered one. */ + if (numbered_arg_count > 0) + { + unsigned int i; + + for (i = 0; i < numbered_arg_count; i++) + if (numbered[i].number != i + 1) + { + *invalid_reason = INVALID_IGNORED_ARGUMENT (numbered[i].number, i + 1); + goto bad_format; + } + + /* So now the numbered arguments array is equivalent to a sequence + of unnumbered arguments. */ + spec.unnumbered_arg_count = numbered_arg_count; + spec.allocated = spec.unnumbered_arg_count; + spec.unnumbered = XNMALLOC (spec.allocated, struct unnumbered_arg); + IF_OOM (spec.unnumbered, goto bad_format;) + for (i = 0; i < spec.unnumbered_arg_count; i++) + spec.unnumbered[i].type = numbered[i].type; + free (numbered); + numbered_arg_count = 0; + } + + *result = spec; + return result; + + bad_format: + if (numbered != NULL) + free (numbered); + if (spec.unnumbered != NULL) + free (spec.unnumbered); + if (spec.sysdep_directives != NULL) + free (spec.sysdep_directives); + return NULL; +} diff --git a/gettext-tools/src/format-c.c b/gettext-tools/src/format-c.c index 93c9517..d88f8de 100644 --- a/gettext-tools/src/format-c.c +++ b/gettext-tools/src/format-c.c @@ -54,841 +54,8 @@ only on glibc >= 2.2 platforms. */ #define SYSDEP_SEGMENTS_PROCESSED false -/* C format strings are described in POSIX (IEEE P1003.1 2001), section - XSH 3 fprintf(). See also Linux fprintf(3) manual page. - A directive - - starts with '%' or '%m$' where m is a positive integer, - - is optionally followed by any of the characters '#', '0', '-', ' ', '+', - "'", or - only in msgstr strings - the string "I", each of which acts as - a flag, - - is optionally followed by a width specification: '*' (reads an argument) - or '*m$' or a nonempty digit sequence, - - is optionally followed by '.' and a precision specification: '*' (reads - an argument) or '*m$' or a nonempty digit sequence, - - is either continued like this: - - is optionally followed by a size specifier, one of 'hh' 'h' 'l' 'll' - 'L' 'q' 'j' 'z' 't', - - is finished by a specifier - - '%', that needs no argument, - - 'c', 'C', that need a character argument, - - 's', 'S', that need a string argument, - - 'i', 'd', that need a signed integer argument, - - 'o', 'u', 'x', 'X', that need an unsigned integer argument, - - 'e', 'E', 'f', 'F', 'g', 'G', 'a', 'A', that need a floating-point - argument, - - 'p', that needs a 'void *' argument, - - 'n', that needs a pointer to integer. - or is finished by a specifier '<' inttypes-macro '>' where inttypes-macro - is an ISO C 99 section 7.8.1 format directive. - Numbered ('%m$' or '*m$') and unnumbered argument specifications cannot - be used in the same string. When numbered argument specifications are - used, specifying the Nth argument requires that all the leading arguments, - from the first to the (N-1)th, are specified in the format string. - */ - -enum format_arg_type -{ - FAT_NONE = 0, - /* Basic types */ - FAT_INTEGER = 1, - FAT_DOUBLE = 2, - FAT_CHAR = 3, - FAT_STRING = 4, - FAT_OBJC_OBJECT = 5, - FAT_POINTER = 6, - FAT_COUNT_POINTER = 7, - /* Flags */ - FAT_UNSIGNED = 1 << 3, - FAT_SIZE_SHORT = 1 << 4, - FAT_SIZE_CHAR = 2 << 4, - FAT_SIZE_LONG = 1 << 6, - FAT_SIZE_LONGLONG = 2 << 6, - FAT_SIZE_8_T = 1 << 8, - FAT_SIZE_16_T = 1 << 9, - FAT_SIZE_32_T = 1 << 10, - FAT_SIZE_64_T = 1 << 11, - FAT_SIZE_LEAST8_T = 1 << 12, - FAT_SIZE_LEAST16_T = 1 << 13, - FAT_SIZE_LEAST32_T = 1 << 14, - FAT_SIZE_LEAST64_T = 1 << 15, - FAT_SIZE_FAST8_T = 1 << 16, - FAT_SIZE_FAST16_T = 1 << 17, - FAT_SIZE_FAST32_T = 1 << 18, - FAT_SIZE_FAST64_T = 1 << 19, - FAT_SIZE_INTMAX_T = 1 << 20, - FAT_SIZE_INTPTR_T = 1 << 21, - FAT_SIZE_SIZE_T = 1 << 22, - FAT_SIZE_PTRDIFF_T = 1 << 23, - FAT_WIDE = FAT_SIZE_LONG, - /* Meaningful combinations of basic types and flags: - 'signed char' = FAT_INTEGER | FAT_SIZE_CHAR, - 'unsigned char' = FAT_INTEGER | FAT_SIZE_CHAR | FAT_UNSIGNED, - 'short' = FAT_INTEGER | FAT_SIZE_SHORT, - 'unsigned short' = FAT_INTEGER | FAT_SIZE_SHORT | FAT_UNSIGNED, - 'int' = FAT_INTEGER, - 'unsigned int' = FAT_INTEGER | FAT_UNSIGNED, - 'long int' = FAT_INTEGER | FAT_SIZE_LONG, - 'unsigned long int' = FAT_INTEGER | FAT_SIZE_LONG | FAT_UNSIGNED, - 'long long int' = FAT_INTEGER | FAT_SIZE_LONGLONG, - 'unsigned long long int' = FAT_INTEGER | FAT_SIZE_LONGLONG | FAT_UNSIGNED, - 'double' = FAT_DOUBLE, - 'long double' = FAT_DOUBLE | FAT_SIZE_LONGLONG, - 'char'/'int' = FAT_CHAR, - 'wchar_t'/'wint_t' = FAT_CHAR | FAT_SIZE_LONG, - 'const char *' = FAT_STRING, - 'const wchar_t *' = FAT_STRING | FAT_SIZE_LONG, - 'void *' = FAT_POINTER, - FAT_COUNT_SCHAR_POINTER = FAT_COUNT_POINTER | FAT_SIZE_CHAR, - FAT_COUNT_SHORT_POINTER = FAT_COUNT_POINTER | FAT_SIZE_SHORT, - FAT_COUNT_INT_POINTER = FAT_COUNT_POINTER, - FAT_COUNT_LONGINT_POINTER = FAT_COUNT_POINTER | FAT_SIZE_LONG, - FAT_COUNT_LONGLONGINT_POINTER = FAT_COUNT_POINTER | FAT_SIZE_LONGLONG, - */ - /* Bitmasks */ - FAT_BASIC_MASK = (FAT_INTEGER | FAT_DOUBLE | FAT_CHAR | FAT_STRING - | FAT_OBJC_OBJECT | FAT_POINTER | FAT_COUNT_POINTER), - FAT_SIZE_MASK = (FAT_SIZE_SHORT | FAT_SIZE_CHAR - | FAT_SIZE_LONG | FAT_SIZE_LONGLONG - | FAT_SIZE_8_T | FAT_SIZE_16_T - | FAT_SIZE_32_T | FAT_SIZE_64_T - | FAT_SIZE_LEAST8_T | FAT_SIZE_LEAST16_T - | FAT_SIZE_LEAST32_T | FAT_SIZE_LEAST64_T - | FAT_SIZE_FAST8_T | FAT_SIZE_FAST16_T - | FAT_SIZE_FAST32_T | FAT_SIZE_FAST64_T - | FAT_SIZE_INTMAX_T | FAT_SIZE_INTPTR_T - | FAT_SIZE_SIZE_T | FAT_SIZE_PTRDIFF_T) -}; -#ifdef __cplusplus -typedef int format_arg_type_t; -#else -typedef enum format_arg_type format_arg_type_t; -#endif - -struct numbered_arg -{ - unsigned int number; - format_arg_type_t type; -}; - -struct unnumbered_arg -{ - format_arg_type_t type; -}; - -struct spec -{ - unsigned int directives; - unsigned int unnumbered_arg_count; - unsigned int allocated; - struct unnumbered_arg *unnumbered; - bool unlikely_intentional; - unsigned int sysdep_directives_count; - const char **sysdep_directives; -}; - -/* Locale independent test for a decimal digit. - Argument can be 'char' or 'unsigned char'. (Whereas the argument of - <ctype.h> isdigit must be an 'unsigned char'.) */ -#undef isdigit -#define isdigit(c) ((unsigned int) ((c) - '0') < 10) - -/* Whether to recognize the 'I' flag. */ -#if SYSDEP_SEGMENTS_PROCESSED -/* The 'I' flag can only occur in glibc >= 2.2. On other platforms, gettext() - filters it away even if it is present in the msgstr in the .mo file. */ -# define HANDLE_I_FLAG \ - (__GLIBC__ > 2 || (__GLIBC__ == 2 && __GLIBC_MINOR__ >= 2)) -#else -# define HANDLE_I_FLAG 1 -#endif - - -static int -numbered_arg_compare (const void *p1, const void *p2) -{ - unsigned int n1 = ((const struct numbered_arg *) p1)->number; - unsigned int n2 = ((const struct numbered_arg *) p2)->number; - - return (n1 > n2 ? 1 : n1 < n2 ? -1 : 0); -} - -static struct spec * -format_parse_entrails (const char *format, bool translated, - bool objc_extensions, char *fdi, char **invalid_reason, - struct spec *result) -{ - const char *const format_start = format; - struct spec spec; - unsigned int numbered_arg_count; - struct numbered_arg *numbered; - - spec.directives = 0; - numbered_arg_count = 0; - spec.unnumbered_arg_count = 0; - spec.allocated = 0; - numbered = NULL; - spec.unnumbered = NULL; - spec.unlikely_intentional = false; - spec.sysdep_directives_count = 0; - spec.sysdep_directives = NULL; - - for (; *format != '\0';) - if (*format++ == '%') - { - /* A directive. */ - unsigned int number = 0; - format_arg_type_t type; - format_arg_type_t size; - - FDI_SET (format - 1, FMTDIR_START); - spec.directives++; - - if (isdigit (*format)) - { - const char *f = format; - unsigned int m = 0; - - do - { - m = 10 * m + (*f - '0'); - f++; - } - while (isdigit (*f)); - - if (*f == '$') - { - if (m == 0) - { - *invalid_reason = INVALID_ARGNO_0 (spec.directives); - FDI_SET (f, FMTDIR_ERROR); - goto bad_format; - } - number = m; - format = ++f; - } - } - - /* Parse flags. */ - for (;;) - { - if (*format == ' ' || *format == '+' || *format == '-' - || *format == '#' || *format == '0' || *format == '\'') - format++; -#if HANDLE_I_FLAG - else if (translated && *format == 'I') - { - spec.sysdep_directives = - (const char **) - xrealloc (spec.sysdep_directives, - 2 * (spec.sysdep_directives_count + 1) - * sizeof (const char *)); - IF_OOM (spec.sysdep_directives, goto bad_format;) - spec.sysdep_directives[2 * spec.sysdep_directives_count] = format; - spec.sysdep_directives[2 * spec.sysdep_directives_count + 1] = format + 1; - spec.sysdep_directives_count++; - format++; - } -#endif - else - break; - } - - /* Parse width. */ - if (*format == '*') - { - unsigned int width_number = 0; - - format++; - - if (isdigit (*format)) - { - const char *f = format; - unsigned int m = 0; - - do - { - m = 10 * m + (*f - '0'); - f++; - } - while (isdigit (*f)); - - if (*f == '$') - { - if (m == 0) - { - *invalid_reason = - INVALID_WIDTH_ARGNO_0 (spec.directives); - FDI_SET (f, FMTDIR_ERROR); - goto bad_format; - } - width_number = m; - format = ++f; - } - } - - if (width_number) - { - /* Numbered argument. */ - - /* Numbered and unnumbered specifications are exclusive. */ - if (spec.unnumbered_arg_count > 0) - { - *invalid_reason = INVALID_MIXES_NUMBERED_UNNUMBERED (); - FDI_SET (format - 1, FMTDIR_ERROR); - goto bad_format; - } - - if (spec.allocated == numbered_arg_count) - { - spec.allocated = 2 * spec.allocated + 1; - numbered = (struct numbered_arg *) xrealloc (numbered, spec.allocated * sizeof (struct numbered_arg)); - IF_OOM (numbered, goto bad_format;) - } - numbered[numbered_arg_count].number = width_number; - numbered[numbered_arg_count].type = FAT_INTEGER; - numbered_arg_count++; - } - else - { - /* Unnumbered argument. */ - - /* Numbered and unnumbered specifications are exclusive. */ - if (numbered_arg_count > 0) - { - *invalid_reason = INVALID_MIXES_NUMBERED_UNNUMBERED (); - FDI_SET (format - 1, FMTDIR_ERROR); - goto bad_format; - } - - if (spec.allocated == spec.unnumbered_arg_count) - { - spec.allocated = 2 * spec.allocated + 1; - spec.unnumbered = (struct unnumbered_arg *) xrealloc (spec.unnumbered, spec.allocated * sizeof (struct unnumbered_arg)); - IF_OOM (spec.unnumbered, goto bad_format;) - } - spec.unnumbered[spec.unnumbered_arg_count].type = FAT_INTEGER; - spec.unnumbered_arg_count++; - } - } - else if (isdigit (*format)) - { - do format++; while (isdigit (*format)); - } - - /* Parse precision. */ - if (*format == '.') - { - format++; - - if (*format == '*') - { - unsigned int precision_number = 0; - - format++; - - if (isdigit (*format)) - { - const char *f = format; - unsigned int m = 0; - - do - { - m = 10 * m + (*f - '0'); - f++; - } - while (isdigit (*f)); - - if (*f == '$') - { - if (m == 0) - { - *invalid_reason = - INVALID_PRECISION_ARGNO_0 (spec.directives); - FDI_SET (f, FMTDIR_ERROR); - goto bad_format; - } - precision_number = m; - format = ++f; - } - } - - if (precision_number) - { - /* Numbered argument. */ - - /* Numbered and unnumbered specifications are exclusive. */ - if (spec.unnumbered_arg_count > 0) - { - *invalid_reason = INVALID_MIXES_NUMBERED_UNNUMBERED (); - FDI_SET (format - 1, FMTDIR_ERROR); - goto bad_format; - } - - if (spec.allocated == numbered_arg_count) - { - spec.allocated = 2 * spec.allocated + 1; - numbered = (struct numbered_arg *) xrealloc (numbered, spec.allocated * sizeof (struct numbered_arg)); - IF_OOM (numbered, goto bad_format;) - } - numbered[numbered_arg_count].number = precision_number; - numbered[numbered_arg_count].type = FAT_INTEGER; - numbered_arg_count++; - } - else - { - /* Unnumbered argument. */ - - /* Numbered and unnumbered specifications are exclusive. */ - if (numbered_arg_count > 0) - { - *invalid_reason = INVALID_MIXES_NUMBERED_UNNUMBERED (); - FDI_SET (format - 1, FMTDIR_ERROR); - goto bad_format; - } - - if (spec.allocated == spec.unnumbered_arg_count) - { - spec.allocated = 2 * spec.allocated + 1; - spec.unnumbered = (struct unnumbered_arg *) xrealloc (spec.unnumbered, spec.allocated * sizeof (struct unnumbered_arg)); - IF_OOM (spec.unnumbered, goto bad_format;) - } - spec.unnumbered[spec.unnumbered_arg_count].type = FAT_INTEGER; - spec.unnumbered_arg_count++; - } - } - else if (isdigit (*format)) - { - do format++; while (isdigit (*format)); - } - } - - if (!SYSDEP_SEGMENTS_PROCESSED && *format == '<') - { - spec.sysdep_directives = - (const char **) - xrealloc (spec.sysdep_directives, - 2 * (spec.sysdep_directives_count + 1) - * sizeof (const char *)); - IF_OOM (spec.sysdep_directives, goto bad_format;) - spec.sysdep_directives[2 * spec.sysdep_directives_count] = format; - - format++; - /* Parse ISO C 99 section 7.8.1 format string directive. - Syntax: - P R I { d | i | o | u | x | X } - { { | LEAST | FAST } { 8 | 16 | 32 | 64 } | MAX | PTR } */ - if (*format != 'P') - { - *invalid_reason = INVALID_C99_MACRO (spec.directives); - FDI_SET (*format == '\0' ? format - 1 : format, FMTDIR_ERROR); - goto bad_format; - } - format++; - if (*format != 'R') - { - *invalid_reason = INVALID_C99_MACRO (spec.directives); - FDI_SET (*format == '\0' ? format - 1 : format, FMTDIR_ERROR); - goto bad_format; - } - format++; - if (*format != 'I') - { - *invalid_reason = INVALID_C99_MACRO (spec.directives); - FDI_SET (*format == '\0' ? format - 1 : format, FMTDIR_ERROR); - goto bad_format; - } - format++; - - switch (*format) - { - case 'i': case 'd': - type = FAT_INTEGER; - break; - case 'u': case 'o': case 'x': case 'X': - type = FAT_INTEGER | FAT_UNSIGNED; - break; - default: - *invalid_reason = INVALID_C99_MACRO (spec.directives); - FDI_SET (*format == '\0' ? format - 1 : format, FMTDIR_ERROR); - goto bad_format; - } - format++; - - if (format[0] == 'M' && format[1] == 'A' && format[2] == 'X') - { - type |= FAT_SIZE_INTMAX_T; - format += 3; - } - else if (format[0] == 'P' && format[1] == 'T' && format[2] == 'R') - { - type |= FAT_SIZE_INTPTR_T; - format += 3; - } - else - { - if (format[0] == 'L' && format[1] == 'E' && format[2] == 'A' - && format[3] == 'S' && format[4] == 'T') - { - format += 5; - if (format[0] == '8') - { - type |= FAT_SIZE_LEAST8_T; - format++; - } - else if (format[0] == '1' && format[1] == '6') - { - type |= FAT_SIZE_LEAST16_T; - format += 2; - } - else if (format[0] == '3' && format[1] == '2') - { - type |= FAT_SIZE_LEAST32_T; - format += 2; - } - else if (format[0] == '6' && format[1] == '4') - { - type |= FAT_SIZE_LEAST64_T; - format += 2; - } - else - { - *invalid_reason = INVALID_C99_MACRO (spec.directives); - FDI_SET (*format == '\0' ? format - 1 : format, - FMTDIR_ERROR); - goto bad_format; - } - } - else if (format[0] == 'F' && format[1] == 'A' - && format[2] == 'S' && format[3] == 'T') - { - format += 4; - if (format[0] == '8') - { - type |= FAT_SIZE_FAST8_T; - format++; - } - else if (format[0] == '1' && format[1] == '6') - { - type |= FAT_SIZE_FAST16_T; - format += 2; - } - else if (format[0] == '3' && format[1] == '2') - { - type |= FAT_SIZE_FAST32_T; - format += 2; - } - else if (format[0] == '6' && format[1] == '4') - { - type |= FAT_SIZE_FAST64_T; - format += 2; - } - else - { - *invalid_reason = INVALID_C99_MACRO (spec.directives); - FDI_SET (*format == '\0' ? format - 1 : format, - FMTDIR_ERROR); - goto bad_format; - } - } - else - { - if (format[0] == '8') - { - type |= FAT_SIZE_8_T; - format++; - } - else if (format[0] == '1' && format[1] == '6') - { - type |= FAT_SIZE_16_T; - format += 2; - } - else if (format[0] == '3' && format[1] == '2') - { - type |= FAT_SIZE_32_T; - format += 2; - } - else if (format[0] == '6' && format[1] == '4') - { - type |= FAT_SIZE_64_T; - format += 2; - } - else - { - *invalid_reason = INVALID_C99_MACRO (spec.directives); - FDI_SET (*format == '\0' ? format - 1 : format, - FMTDIR_ERROR); - goto bad_format; - } - } - } - - if (*format != '>') - { - *invalid_reason = INVALID_ANGLE_BRACKET (spec.directives); - FDI_SET (*format == '\0' ? format - 1 : format, FMTDIR_ERROR); - goto bad_format; - } - - spec.sysdep_directives[2 * spec.sysdep_directives_count + 1] = format + 1; - spec.sysdep_directives_count++; - } - else - { - /* Parse size. */ - size = 0; - for (;; format++) - { - if (*format == 'h') - { - if (size & (FAT_SIZE_SHORT | FAT_SIZE_CHAR)) - size = FAT_SIZE_CHAR; - else - size = FAT_SIZE_SHORT; - } - else if (*format == 'l') - { - if (size & (FAT_SIZE_LONG | FAT_SIZE_LONGLONG)) - size = FAT_SIZE_LONGLONG; - else - size = FAT_SIZE_LONG; - } - else if (*format == 'L') - size = FAT_SIZE_LONGLONG; - else if (*format == 'q') - /* Old BSD 4.4 convention. */ - size = FAT_SIZE_LONGLONG; - else if (*format == 'j') - size = FAT_SIZE_INTMAX_T; - else if (*format == 'z' || *format == 'Z') - /* 'z' is standardized in ISO C 99, but glibc uses 'Z' - because the warning facility in gcc-2.95.2 understands - only 'Z' (see gcc-2.95.2/gcc/c-common.c:1784). */ - size = FAT_SIZE_SIZE_T; - else if (*format == 't') - size = FAT_SIZE_PTRDIFF_T; -#if (defined _WIN32 || defined __WIN32__) && ! defined __CYGWIN__ - else if (SYSDEP_SEGMENTS_PROCESSED - && *format == 'I' - && format[1] == '6' - && format[2] == '4') - { - size = FAT_SIZE_64_T; - format += 2; - } -#endif - else - break; - } - - switch (*format) - { - case '%': - /* Programmers writing _("%2%") most often will not want to - use this string as a c-format string, but rather as a - literal or as a different kind of format string. */ - if (format[-1] != '%') - spec.unlikely_intentional = true; - type = FAT_NONE; - break; - case 'm': /* glibc extension */ - type = FAT_NONE; - break; - case 'c': - type = FAT_CHAR; - type |= (size & (FAT_SIZE_LONG | FAT_SIZE_LONGLONG) - ? FAT_WIDE : 0); - break; - case 'C': /* obsolete */ - type = FAT_CHAR | FAT_WIDE; - break; - case 's': - type = FAT_STRING; - type |= (size & (FAT_SIZE_LONG | FAT_SIZE_LONGLONG) - ? FAT_WIDE : 0); - break; - case 'S': /* obsolete */ - type = FAT_STRING | FAT_WIDE; - break; - case 'i': case 'd': - type = FAT_INTEGER; - type |= (size & FAT_SIZE_MASK); - break; - case 'u': case 'o': case 'x': case 'X': - type = FAT_INTEGER | FAT_UNSIGNED; - type |= (size & FAT_SIZE_MASK); - break; - case 'e': case 'E': case 'f': case 'F': case 'g': case 'G': - case 'a': case 'A': - type = FAT_DOUBLE; - type |= (size & FAT_SIZE_LONGLONG); - break; - case '@': - if (objc_extensions) - { - type = FAT_OBJC_OBJECT; - break; - } - goto other; - case 'p': - type = FAT_POINTER; - break; - case 'n': - type = FAT_COUNT_POINTER; - type |= (size & FAT_SIZE_MASK); - break; - other: - default: - if (*format == '\0') - { - *invalid_reason = INVALID_UNTERMINATED_DIRECTIVE (); - FDI_SET (format - 1, FMTDIR_ERROR); - } - else - { - *invalid_reason = - INVALID_CONVERSION_SPECIFIER (spec.directives, *format); - FDI_SET (format, FMTDIR_ERROR); - } - goto bad_format; - } - } - - if (type != FAT_NONE) - { - if (number) - { - /* Numbered argument. */ - - /* Numbered and unnumbered specifications are exclusive. */ - if (spec.unnumbered_arg_count > 0) - { - *invalid_reason = INVALID_MIXES_NUMBERED_UNNUMBERED (); - FDI_SET (format, FMTDIR_ERROR); - goto bad_format; - } - - if (spec.allocated == numbered_arg_count) - { - spec.allocated = 2 * spec.allocated + 1; - numbered = (struct numbered_arg *) xrealloc (numbered, spec.allocated * sizeof (struct numbered_arg)); - IF_OOM (numbered, goto bad_format;) - } - numbered[numbered_arg_count].number = number; - numbered[numbered_arg_count].type = type; - numbered_arg_count++; - } - else - { - /* Unnumbered argument. */ - - /* Numbered and unnumbered specifications are exclusive. */ - if (numbered_arg_count > 0) - { - *invalid_reason = INVALID_MIXES_NUMBERED_UNNUMBERED (); - FDI_SET (format, FMTDIR_ERROR); - goto bad_format; - } - - if (spec.allocated == spec.unnumbered_arg_count) - { - spec.allocated = 2 * spec.allocated + 1; - spec.unnumbered = (struct unnumbered_arg *) xrealloc (spec.unnumbered, spec.allocated * sizeof (struct unnumbered_arg)); - IF_OOM (spec.unnumbered, goto bad_format;) - } - spec.unnumbered[spec.unnumbered_arg_count].type = type; - spec.unnumbered_arg_count++; - } - } - - FDI_SET (format, FMTDIR_END); - - format++; - } - - /* Sort the numbered argument array, and eliminate duplicates. */ - if (numbered_arg_count > 1) - { - unsigned int i, j; - bool err; - - qsort (numbered, numbered_arg_count, - sizeof (struct numbered_arg), numbered_arg_compare); - - /* Remove duplicates: Copy from i to j, keeping 0 <= j <= i. */ - err = false; - for (i = j = 0; i < numbered_arg_count; i++) - if (j > 0 && numbered[i].number == numbered[j-1].number) - { - format_arg_type_t type1 = numbered[i].type; - format_arg_type_t type2 = numbered[j-1].type; - format_arg_type_t type_both; - - if (type1 == type2) - type_both = type1; - else - { - /* Incompatible types. */ - type_both = FAT_NONE; - if (!err) - *invalid_reason = - INVALID_INCOMPATIBLE_ARG_TYPES (numbered[i].number); - err = true; - } - - numbered[j-1].type = type_both; - } - else - { - if (j < i) - { - numbered[j].number = numbered[i].number; - numbered[j].type = numbered[i].type; - } - j++; - } - numbered_arg_count = j; - if (err) - /* *invalid_reason has already been set above. */ - goto bad_format; - } - - /* Verify that the format strings uses all arguments up to the highest - numbered one. */ - if (numbered_arg_count > 0) - { - unsigned int i; - - for (i = 0; i < numbered_arg_count; i++) - if (numbered[i].number != i + 1) - { - *invalid_reason = INVALID_IGNORED_ARGUMENT (numbered[i].number, i + 1); - goto bad_format; - } - - /* So now the numbered arguments array is equivalent to a sequence - of unnumbered arguments. */ - spec.unnumbered_arg_count = numbered_arg_count; - spec.allocated = spec.unnumbered_arg_count; - spec.unnumbered = XNMALLOC (spec.allocated, struct unnumbered_arg); - IF_OOM (spec.unnumbered, goto bad_format;) - for (i = 0; i < spec.unnumbered_arg_count; i++) - spec.unnumbered[i].type = numbered[i].type; - free (numbered); - numbered_arg_count = 0; - } - - *result = spec; - return result; - - bad_format: - if (numbered != NULL) - free (numbered); - if (spec.unnumbered != NULL) - free (spec.unnumbered); - if (spec.sysdep_directives != NULL) - free (spec.sysdep_directives); - return NULL; -} +/* Include the bulk of the C format string parsing code. */ +#include "format-c-parse.h" static void * format_parse (const char *format, bool translated, bool objc_extensions, |