| /* Ruby format strings. |
| Copyright (C) 2001-2004, 2006-2009, 2019-2020 Free Software Foundation, Inc. |
| Written by Bruno Haible <bruno@clisp.org>, 2020. |
| |
| This program is free software: you can redistribute it and/or modify |
| it under the terms of the GNU General Public License as published by |
| the Free Software Foundation; either version 3 of the License, or |
| (at your option) any later version. |
| |
| This program is distributed in the hope that it will be useful, |
| but WITHOUT ANY WARRANTY; without even the implied warranty of |
| MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the |
| GNU General Public License for more details. |
| |
| You should have received a copy of the GNU General Public License |
| along with this program. If not, see <https://www.gnu.org/licenses/>. */ |
| |
| #ifdef HAVE_CONFIG_H |
| # include <config.h> |
| #endif |
| |
| #include <limits.h> |
| #include <stdbool.h> |
| #include <stdlib.h> |
| #include <string.h> |
| |
| #include "format.h" |
| #include "c-ctype.h" |
| #include "xalloc.h" |
| #include "xvasprintf.h" |
| #include "format-invalid.h" |
| #include "gettext.h" |
| |
| #define _(str) gettext (str) |
| |
| /* Ruby format strings are described in |
| https://ruby-doc.org/core-2.7.1/Kernel.html#method-i-sprintf |
| and are implemented in ruby-2.7.1/sprintf.c . |
| A format string consists of literal text and directives. |
| A directive |
| - starts with '%', |
| - is optionally followed by a sequence of the following: |
| - any of the characters ' ', '#', '+', '-', '0', each of which acts as a |
| flag, |
| - a digit sequence starting with a non-zero digit, followed by '$', at |
| most once per directive, indicating a positional argument to consume, |
| - '<' KEY '>', at most once per directive, indicating a hash table element |
| to consume, |
| - a digit sequence starting with a non-zero digit, specifying a width, |
| - '*', indicating a width, taken from the argument list, |
| - '*' and a digit sequence, followed by '$', indicating a width, taken |
| from a positional argument, |
| - '.' and a digit sequence, indicating a precision, |
| - '.' '*', indicating a precision, taken from the argument list, |
| - '.' '*' and a digit sequence, followed by '$', indicating a precision, |
| taken from a positional argument. |
| This sequence is in any order, except that |
| - flags must occur before width and precision, |
| - width must occur before precision. |
| - is finished by a specifier |
| - 's', that takes an object to print without double-quote delimiters, |
| - 'p', that takes an object to print with double-quote delimiters (in case |
| of a string), |
| - '{' KEY '}', indicating a hash table element to consume and to print |
| like with 's', |
| - 'c', that takes a character, |
| - 'd', 'i', 'u', 'o', 'x', 'X', 'b', 'B', that take an integer, |
| - 'f', 'g', 'G', 'e', 'E', 'a', 'A', that take a floating-point number. |
| Additionally there are the directives '%%' '%<newline>', which take no |
| argument. |
| Numbered, unnumbered, and named argument specifications cannot be used in |
| the same string; either all arguments are numbered, or all arguments are |
| unnumbered, or all arguments are named. |
| */ |
| |
/* Classification of the value a directive consumes.  The enumerators keep
   their implicit values; they are merely spelled out here.  */
enum format_arg_type
{
  FAT_NONE        = 0,  /* no argument ('%%', '%<newline>'); also used to
                           mark an argument referenced with clashing types */
  FAT_ANY         = 1,  /* 's' and '{KEY}': any object */
  FAT_ESCAPED_ANY = 2,  /* 'p': any object */
  FAT_CHARACTER   = 3,  /* 'c' */
  FAT_INTEGER     = 4,  /* 'd' 'i' 'u' 'o' 'x' 'X' 'b' 'B', widths, precisions */
  FAT_FLOAT       = 5   /* 'f' 'g' 'G' 'e' 'E' 'a' 'A' */
};
| |
| struct named_arg |
| { |
| char *name; |
| enum format_arg_type type; |
| }; |
| |
| struct numbered_arg |
| { |
| unsigned int number; |
| enum format_arg_type type; |
| }; |
| |
/* Result of parsing one format string.  */
struct spec
{
  unsigned int directives;          /* number of '%' directives seen */
  unsigned int named_arg_count;     /* number of elements in NAMED */
  unsigned int numbered_arg_count;  /* number of elements in NUMBERED */
  struct named_arg *named;          /* named arguments, or NULL */
  struct numbered_arg *numbered;    /* positional arguments, or NULL */
};
| |
/* Decimal digit test that does not depend on the locale.
   Unlike <ctype.h> isdigit, whose argument must be an 'unsigned char',
   this accepts both 'char' and 'unsigned char'.  The argument is evaluated
   exactly once; values below '0' wrap around to large unsigned numbers and
   therefore fail the comparison.  */
#undef isdigit
#define isdigit(c) ((unsigned int) (c) - (unsigned int) '0' < 10u)
| |
| |
| static int |
| named_arg_compare (const void *p1, const void *p2) |
| { |
| return strcmp (((const struct named_arg *) p1)->name, |
| ((const struct named_arg *) p2)->name); |
| } |
| |
| static int |
| numbered_arg_compare (const void *p1, const void *p2) |
| { |
| unsigned int n1 = ((const struct numbered_arg *) p1)->number; |
| unsigned int n2 = ((const struct numbered_arg *) p2)->number; |
| |
| return (n1 > n2 ? 1 : n1 < n2 ? -1 : 0); |
| } |
| |
/* Diagnostics used by format_parse.  Each macro expands to an xstrdup or
   xasprintf call that produces the translated message; the macros taking
   DIRECTIVE_NUMBER insert it through the '%u' conversion.  */

/* Named arguments combined with numbered or unnumbered ones.  */
#define INVALID_MIXES_NAMED_UNNAMED() \
  xstrdup (_("The string refers to arguments both through argument names and through unnamed argument specifications."))

/* '<KEY>' or '{KEY}' given although the directive already has a name.  */
#define INVALID_TWO_ARG_NAMES(directive_number) \
  xasprintf (_("In the directive number %u, two names are given for the same argument."), \
             (directive_number))

/* 'N$' given although the directive already has an argument number.  */
#define INVALID_TWO_ARG_NUMBERS(directive_number) \
  xasprintf (_("In the directive number %u, two numbers are given for the same argument."), \
             (directive_number))

/* Ordering violations.  */
#define INVALID_FLAG_AFTER_WIDTH(directive_number) \
  xasprintf (_("In the directive number %u, a flag is given after the width."), \
             (directive_number))

#define INVALID_FLAG_AFTER_PRECISION(directive_number) \
  xasprintf (_("In the directive number %u, a flag is given after the precision."), \
             (directive_number))

#define INVALID_WIDTH_AFTER_PRECISION(directive_number) \
  xasprintf (_("In the directive number %u, the width is given after the precision."), \
             (directive_number))

/* Repetitions.  */
#define INVALID_WIDTH_TWICE(directive_number) \
  xasprintf (_("In the directive number %u, a width is given twice."), \
             (directive_number))

#define INVALID_PRECISION_TWICE(directive_number) \
  xasprintf (_("In the directive number %u, a precision is given twice."), \
             (directive_number))
| |
| static void * |
| format_parse (const char *format, bool translated, char *fdi, |
| char **invalid_reason) |
| { |
| const char *const format_start = format; |
| struct spec spec; |
| unsigned int unnumbered_arg_count; |
| unsigned int allocated; |
| struct spec *result; |
| |
| spec.directives = 0; |
| spec.named_arg_count = 0; |
| spec.numbered_arg_count = 0; |
| spec.named = NULL; |
| spec.numbered = NULL; |
| unnumbered_arg_count = 0; |
| allocated = 0; |
| |
| for (; *format != '\0';) |
| if (*format++ == '%') |
| { |
| /* A directive. */ |
| char *name = NULL; |
| unsigned int number = 0; |
| |
| bool seen_width = false; |
| unsigned int width_number = 0; |
| bool width_takenext = false; |
| |
| bool seen_precision = false; |
| unsigned int precision_number = 0; |
| bool precision_takenext = false; |
| |
| enum format_arg_type type; |
| |
| FDI_SET (format - 1, FMTDIR_START); |
| spec.directives++; |
| |
| for (;;) |
| { |
| if (*format == ' ' |
| || *format == '#' |
| || *format == '+' |
| || *format == '-' |
| || *format == '0') |
| { |
| /* A flag. */ |
| if (seen_width) |
| { |
| *invalid_reason = INVALID_FLAG_AFTER_WIDTH (spec.directives); |
| FDI_SET (format, FMTDIR_ERROR); |
| goto bad_format; |
| } |
| if (seen_precision) |
| { |
| *invalid_reason = INVALID_FLAG_AFTER_PRECISION (spec.directives); |
| FDI_SET (format, FMTDIR_ERROR); |
| goto bad_format; |
| } |
| format++; |
| continue; |
| } |
| |
| if (*format == '<') |
| { |
| const char *name_start; |
| const char *name_end; |
| size_t n; |
| |
| if ((spec.numbered_arg_count > 0 |
| || number > 0 || width_number > 0 || precision_number > 0) |
| || (unnumbered_arg_count > 0 |
| || width_takenext || precision_takenext)) |
| { |
| *invalid_reason = INVALID_MIXES_NAMED_UNNAMED (); |
| FDI_SET (format, FMTDIR_ERROR); |
| goto bad_format; |
| } |
| if (name != NULL) |
| { |
| *invalid_reason = INVALID_TWO_ARG_NAMES (spec.directives); |
| FDI_SET (format, FMTDIR_ERROR); |
| goto bad_format; |
| } |
| |
| name_start = ++format; |
| for (; *format != '\0'; format++) |
| if (*format == '>') |
| break; |
| if (*format == '\0') |
| { |
| *invalid_reason = INVALID_UNTERMINATED_DIRECTIVE (); |
| FDI_SET (format - 1, FMTDIR_ERROR); |
| goto bad_format; |
| } |
| name_end = format++; |
| |
| n = name_end - name_start; |
| name = XNMALLOC (n + 1, char); |
| memcpy (name, name_start, n); |
| name[n] = '\0'; |
| |
| continue; |
| } |
| |
| if (isdigit (*format)) |
| { |
| unsigned int m = 0; |
| |
| do |
| { |
| if (m < UINT_MAX / 10) |
| m = 10 * m + (*format - '0'); |
| else |
| m = UINT_MAX - 1; |
| format++; |
| } |
| while (isdigit (*format)); |
| |
| if (*format == '$') |
| { |
| if (spec.named_arg_count > 0 || name != NULL) |
| { |
| *invalid_reason = INVALID_MIXES_NAMED_UNNAMED (); |
| FDI_SET (format, FMTDIR_ERROR); |
| goto bad_format; |
| } |
| if (unnumbered_arg_count > 0 |
| || width_takenext || precision_takenext) |
| { |
| *invalid_reason = INVALID_MIXES_NUMBERED_UNNUMBERED (); |
| FDI_SET (format, FMTDIR_ERROR); |
| goto bad_format; |
| } |
| if (number > 0) |
| { |
| *invalid_reason = INVALID_TWO_ARG_NUMBERS (spec.directives); |
| FDI_SET (format, FMTDIR_ERROR); |
| goto bad_format; |
| } |
| number = m; |
| format++; |
| } |
| else |
| { |
| /* Seen a constant width. */ |
| if (seen_precision) |
| { |
| *invalid_reason = INVALID_WIDTH_AFTER_PRECISION (spec.directives); |
| FDI_SET (format, FMTDIR_ERROR); |
| goto bad_format; |
| } |
| if (seen_width) |
| { |
| *invalid_reason = INVALID_WIDTH_TWICE (spec.directives); |
| FDI_SET (format, FMTDIR_ERROR); |
| goto bad_format; |
| } |
| seen_width = true; |
| } |
| continue; |
| } |
| |
| if (*format == '*') |
| { |
| /* Parse width. */ |
| format++; |
| |
| if (isdigit (*format)) |
| { |
| const char *f = format; |
| unsigned int m = 0; |
| |
| do |
| { |
| if (m < UINT_MAX / 10) |
| m = 10 * m + (*f - '0'); |
| else |
| m = UINT_MAX - 1; |
| f++; |
| } |
| while (isdigit (*f)); |
| |
| if (*f == '$') |
| { |
| format = f; |
| if (spec.named_arg_count > 0 || name != NULL) |
| { |
| *invalid_reason = INVALID_MIXES_NAMED_UNNAMED (); |
| FDI_SET (format, FMTDIR_ERROR); |
| goto bad_format; |
| } |
| if (unnumbered_arg_count > 0 |
| || width_takenext || precision_takenext) |
| { |
| *invalid_reason = INVALID_MIXES_NUMBERED_UNNUMBERED (); |
| FDI_SET (format, FMTDIR_ERROR); |
| goto bad_format; |
| } |
| if (seen_precision) |
| { |
| *invalid_reason = INVALID_WIDTH_AFTER_PRECISION (spec.directives); |
| FDI_SET (format, FMTDIR_ERROR); |
| goto bad_format; |
| } |
| if (seen_width) |
| { |
| *invalid_reason = INVALID_WIDTH_TWICE (spec.directives); |
| FDI_SET (format, FMTDIR_ERROR); |
| goto bad_format; |
| } |
| if (m == 0) |
| { |
| *invalid_reason = INVALID_ARGNO_0 (spec.directives); |
| FDI_SET (format, FMTDIR_ERROR); |
| goto bad_format; |
| } |
| seen_width = true; |
| width_number = m; |
| format++; |
| continue; |
| } |
| } |
| |
| if (spec.named_arg_count > 0 || name != NULL) |
| { |
| *invalid_reason = INVALID_MIXES_NAMED_UNNAMED (); |
| FDI_SET (format - 1, FMTDIR_ERROR); |
| goto bad_format; |
| } |
| if (spec.numbered_arg_count > 0 |
| || number > 0 || width_number > 0 || precision_number > 0) |
| { |
| *invalid_reason = INVALID_MIXES_NUMBERED_UNNUMBERED (); |
| FDI_SET (format - 1, FMTDIR_ERROR); |
| goto bad_format; |
| } |
| if (seen_precision) |
| { |
| *invalid_reason = INVALID_WIDTH_AFTER_PRECISION (spec.directives); |
| FDI_SET (format - 1, FMTDIR_ERROR); |
| goto bad_format; |
| } |
| if (seen_width) |
| { |
| *invalid_reason = INVALID_WIDTH_TWICE (spec.directives); |
| FDI_SET (format - 1, FMTDIR_ERROR); |
| goto bad_format; |
| } |
| seen_width = true; |
| width_takenext = true; |
| continue; |
| } |
| |
| if (*format == '.') |
| { |
| /* Parse precision. */ |
| format++; |
| |
| if (*format == '*') |
| { |
| format++; |
| |
| if (isdigit (*format)) |
| { |
| const char *f = format; |
| unsigned int m = 0; |
| |
| do |
| { |
| if (m < UINT_MAX / 10) |
| m = 10 * m + (*f - '0'); |
| else |
| m = UINT_MAX - 1; |
| f++; |
| } |
| while (isdigit (*f)); |
| |
| if (*f == '$') |
| { |
| format = f; |
| if (spec.named_arg_count > 0 || name != NULL) |
| { |
| *invalid_reason = INVALID_MIXES_NAMED_UNNAMED (); |
| FDI_SET (format, FMTDIR_ERROR); |
| goto bad_format; |
| } |
| if (unnumbered_arg_count > 0 |
| || width_takenext || precision_takenext) |
| { |
| *invalid_reason = INVALID_MIXES_NUMBERED_UNNUMBERED (); |
| FDI_SET (format, FMTDIR_ERROR); |
| goto bad_format; |
| } |
| if (seen_precision) |
| { |
| *invalid_reason = INVALID_PRECISION_TWICE (spec.directives); |
| FDI_SET (format, FMTDIR_ERROR); |
| goto bad_format; |
| } |
| if (m == 0) |
| { |
| *invalid_reason = INVALID_ARGNO_0 (spec.directives); |
| FDI_SET (format, FMTDIR_ERROR); |
| goto bad_format; |
| } |
| seen_precision = true; |
| precision_number = m; |
| format++; |
| continue; |
| } |
| } |
| |
| if (spec.named_arg_count > 0 || name != NULL) |
| { |
| *invalid_reason = INVALID_MIXES_NAMED_UNNAMED (); |
| FDI_SET (format - 1, FMTDIR_ERROR); |
| goto bad_format; |
| } |
| if (spec.numbered_arg_count > 0 |
| || number > 0 || width_number > 0 || precision_number > 0) |
| { |
| *invalid_reason = INVALID_MIXES_NUMBERED_UNNUMBERED (); |
| FDI_SET (format - 1, FMTDIR_ERROR); |
| goto bad_format; |
| } |
| if (seen_precision) |
| { |
| *invalid_reason = INVALID_PRECISION_TWICE (spec.directives); |
| FDI_SET (format - 1, FMTDIR_ERROR); |
| goto bad_format; |
| } |
| seen_precision = true; |
| precision_takenext = true; |
| continue; |
| } |
| |
| while (isdigit (*format)) |
| format++; |
| |
| /* Seen a constant precision. */ |
| if (seen_precision) |
| { |
| *invalid_reason = INVALID_PRECISION_TWICE (spec.directives); |
| FDI_SET (format, FMTDIR_ERROR); |
| goto bad_format; |
| } |
| seen_precision = true; |
| continue; |
| } |
| |
| break; |
| } |
| |
| switch (*format) |
| { |
| case '%': |
| case '\n': |
| type = FAT_NONE; |
| break; |
| case 's': |
| type = FAT_ANY; |
| break; |
| case 'p': |
| type = FAT_ESCAPED_ANY; |
| break; |
| case 'c': |
| type = FAT_CHARACTER; |
| break; |
| case 'd': |
| case 'i': |
| case 'u': |
| case 'o': |
| case 'x': |
| case 'X': |
| case 'b': |
| case 'B': |
| type = FAT_INTEGER; |
| break; |
| case 'f': |
| case 'g': |
| case 'G': |
| case 'e': |
| case 'E': |
| case 'a': |
| case 'A': |
| type = FAT_FLOAT; |
| break; |
| case '{': |
| { |
| const char *name_start; |
| const char *name_end; |
| size_t n; |
| |
| if ((spec.numbered_arg_count > 0 |
| || number > 0 || width_number > 0 || precision_number > 0) |
| || (unnumbered_arg_count > 0 |
| || width_takenext || precision_takenext)) |
| { |
| *invalid_reason = INVALID_MIXES_NAMED_UNNAMED (); |
| FDI_SET (format, FMTDIR_ERROR); |
| goto bad_format; |
| } |
| if (name != NULL) |
| { |
| *invalid_reason = INVALID_TWO_ARG_NAMES (spec.directives); |
| FDI_SET (format, FMTDIR_ERROR); |
| goto bad_format; |
| } |
| |
| name_start = ++format; |
| for (; *format != '\0'; format++) |
| if (*format == '}') |
| break; |
| if (*format == '\0') |
| { |
| *invalid_reason = INVALID_UNTERMINATED_DIRECTIVE (); |
| FDI_SET (format - 1, FMTDIR_ERROR); |
| goto bad_format; |
| } |
| name_end = format; |
| |
| n = name_end - name_start; |
| name = XNMALLOC (n + 1, char); |
| memcpy (name, name_start, n); |
| name[n] = '\0'; |
| } |
| type = FAT_ANY; |
| break; |
| |
| default: |
| if (*format == '\0') |
| { |
| *invalid_reason = INVALID_UNTERMINATED_DIRECTIVE (); |
| FDI_SET (format - 1, FMTDIR_ERROR); |
| } |
| else |
| { |
| *invalid_reason = |
| INVALID_CONVERSION_SPECIFIER (spec.directives, *format); |
| FDI_SET (format, FMTDIR_ERROR); |
| } |
| goto bad_format; |
| } |
| |
| if (seen_width) |
| { |
| /* Register the argument specification for the width. */ |
| if (width_number > 0) |
| { |
| if (allocated == spec.numbered_arg_count) |
| { |
| allocated = 2 * allocated + 1; |
| spec.numbered = (struct numbered_arg *) xrealloc (spec.numbered, allocated * sizeof (struct numbered_arg)); |
| } |
| spec.numbered[spec.numbered_arg_count].number = width_number; |
| spec.numbered[spec.numbered_arg_count].type = FAT_INTEGER; |
| spec.numbered_arg_count++; |
| } |
| else if (width_takenext) |
| { |
| if (allocated == unnumbered_arg_count) |
| { |
| allocated = 2 * allocated + 1; |
| spec.numbered = (struct numbered_arg *) xrealloc (spec.numbered, allocated * sizeof (struct numbered_arg)); |
| } |
| spec.numbered[unnumbered_arg_count].number = unnumbered_arg_count + 1; |
| spec.numbered[unnumbered_arg_count].type = FAT_INTEGER; |
| unnumbered_arg_count++; |
| } |
| } |
| |
| if (seen_precision) |
| { |
| /* Register the argument specification for the precision. */ |
| if (precision_number > 0) |
| { |
| if (allocated == spec.numbered_arg_count) |
| { |
| allocated = 2 * allocated + 1; |
| spec.numbered = (struct numbered_arg *) xrealloc (spec.numbered, allocated * sizeof (struct numbered_arg)); |
| } |
| spec.numbered[spec.numbered_arg_count].number = precision_number; |
| spec.numbered[spec.numbered_arg_count].type = FAT_INTEGER; |
| spec.numbered_arg_count++; |
| } |
| else if (precision_takenext) |
| { |
| if (allocated == unnumbered_arg_count) |
| { |
| allocated = 2 * allocated + 1; |
| spec.numbered = (struct numbered_arg *) xrealloc (spec.numbered, allocated * sizeof (struct numbered_arg)); |
| } |
| spec.numbered[unnumbered_arg_count].number = unnumbered_arg_count + 1; |
| spec.numbered[unnumbered_arg_count].type = FAT_INTEGER; |
| unnumbered_arg_count++; |
| } |
| } |
| |
| if (type != FAT_NONE) |
| { |
| /* Register the argument specification for the value. */ |
| if (name != NULL) |
| { |
| if (allocated == spec.named_arg_count) |
| { |
| allocated = 2 * allocated + 1; |
| spec.named = (struct named_arg *) xrealloc (spec.named, allocated * sizeof (struct named_arg)); |
| } |
| spec.named[spec.named_arg_count].name = name; |
| spec.named[spec.named_arg_count].type = type; |
| spec.named_arg_count++; |
| } |
| else if (number > 0) |
| { |
| if (allocated == spec.numbered_arg_count) |
| { |
| allocated = 2 * allocated + 1; |
| spec.numbered = (struct numbered_arg *) xrealloc (spec.numbered, allocated * sizeof (struct numbered_arg)); |
| } |
| spec.numbered[spec.numbered_arg_count].number = number; |
| spec.numbered[spec.numbered_arg_count].type = type; |
| spec.numbered_arg_count++; |
| } |
| else |
| { |
| if (spec.named_arg_count > 0) |
| { |
| *invalid_reason = INVALID_MIXES_NAMED_UNNAMED (); |
| FDI_SET (format, FMTDIR_ERROR); |
| goto bad_format; |
| } |
| if (spec.numbered_arg_count > 0) |
| { |
| *invalid_reason = INVALID_MIXES_NUMBERED_UNNUMBERED (); |
| FDI_SET (format, FMTDIR_ERROR); |
| goto bad_format; |
| } |
| if (allocated == unnumbered_arg_count) |
| { |
| allocated = 2 * allocated + 1; |
| spec.numbered = (struct numbered_arg *) xrealloc (spec.numbered, allocated * sizeof (struct numbered_arg)); |
| } |
| spec.numbered[unnumbered_arg_count].number = unnumbered_arg_count + 1; |
| spec.numbered[unnumbered_arg_count].type = type; |
| unnumbered_arg_count++; |
| } |
| } |
| |
| FDI_SET (format, FMTDIR_END); |
| |
| format++; |
| } |
| |
| /* Verify that either all arguments are numbered, or all arguments are |
| unnumbered, or all arguments are named. */ |
| if ((spec.numbered_arg_count > 0) |
| + (unnumbered_arg_count > 0) |
| + (spec.named_arg_count > 0) |
| > 1) |
| abort (); |
| |
| /* Convert the unnumbered argument array to numbered arguments. */ |
| if (unnumbered_arg_count > 0) |
| spec.numbered_arg_count = unnumbered_arg_count; |
| /* Sort the numbered argument array, and eliminate duplicates. */ |
| else if (spec.numbered_arg_count > 1) |
| { |
| unsigned int i, j; |
| bool err; |
| |
| qsort (spec.numbered, spec.numbered_arg_count, |
| sizeof (struct numbered_arg), numbered_arg_compare); |
| |
| /* Remove duplicates: Copy from i to j, keeping 0 <= j <= i. */ |
| err = false; |
| for (i = j = 0; i < spec.numbered_arg_count; i++) |
| if (j > 0 && spec.numbered[i].number == spec.numbered[j-1].number) |
| { |
| enum format_arg_type type1 = spec.numbered[i].type; |
| enum format_arg_type type2 = spec.numbered[j-1].type; |
| enum format_arg_type type_both; |
| |
| if (type1 == type2) |
| type_both = type1; |
| else |
| { |
| /* Incompatible types. */ |
| type_both = FAT_NONE; |
| if (!err) |
| *invalid_reason = |
| INVALID_INCOMPATIBLE_ARG_TYPES (spec.numbered[i].number); |
| err = true; |
| } |
| |
| spec.numbered[j-1].type = type_both; |
| } |
| else |
| { |
| if (j < i) |
| { |
| spec.numbered[j].number = spec.numbered[i].number; |
| spec.numbered[j].type = spec.numbered[i].type; |
| } |
| j++; |
| } |
| spec.numbered_arg_count = j; |
| if (err) |
| /* *invalid_reason has already been set above. */ |
| goto bad_format; |
| } |
| |
| /* Sort the named argument array, and eliminate duplicates. */ |
| if (spec.named_arg_count > 1) |
| { |
| unsigned int i, j; |
| bool err; |
| |
| qsort (spec.named, spec.named_arg_count, sizeof (struct named_arg), |
| named_arg_compare); |
| |
| /* Remove duplicates: Copy from i to j, keeping 0 <= j <= i. */ |
| err = false; |
| for (i = j = 0; i < spec.named_arg_count; i++) |
| if (j > 0 && strcmp (spec.named[i].name, spec.named[j-1].name) == 0) |
| { |
| enum format_arg_type type1 = spec.named[i].type; |
| enum format_arg_type type2 = spec.named[j-1].type; |
| enum format_arg_type type_both; |
| |
| if (type1 == type2) |
| type_both = type1; |
| else |
| { |
| /* Incompatible types. */ |
| type_both = FAT_NONE; |
| if (!err) |
| *invalid_reason = |
| xasprintf (_("The string refers to the argument named '%s' in incompatible ways."), spec.named[i].name); |
| err = true; |
| } |
| |
| spec.named[j-1].type = type_both; |
| free (spec.named[i].name); |
| } |
| else |
| { |
| if (j < i) |
| { |
| spec.named[j].name = spec.named[i].name; |
| spec.named[j].type = spec.named[i].type; |
| } |
| j++; |
| } |
| spec.named_arg_count = j; |
| if (err) |
| /* *invalid_reason has already been set above. */ |
| goto bad_format; |
| } |
| |
| result = XMALLOC (struct spec); |
| *result = spec; |
| return result; |
| |
| bad_format: |
| if (spec.named != NULL) |
| { |
| unsigned int i; |
| for (i = 0; i < spec.named_arg_count; i++) |
| free (spec.named[i].name); |
| free (spec.named); |
| } |
| if (spec.numbered != NULL) |
| free (spec.numbered); |
| return NULL; |
| } |
| |
| static void |
| format_free (void *descr) |
| { |
| struct spec *spec = (struct spec *) descr; |
| |
| if (spec->named != NULL) |
| { |
| unsigned int i; |
| for (i = 0; i < spec->named_arg_count; i++) |
| free (spec->named[i].name); |
| free (spec->named); |
| } |
| if (spec->numbered != NULL) |
| free (spec->numbered); |
| free (spec); |
| } |
| |
| static int |
| format_get_number_of_directives (void *descr) |
| { |
| struct spec *spec = (struct spec *) descr; |
| |
| return spec->directives; |
| } |
| |
| static bool |
| format_check (void *msgid_descr, void *msgstr_descr, bool equality, |
| formatstring_error_logger_t error_logger, |
| const char *pretty_msgid, const char *pretty_msgstr) |
| { |
| struct spec *spec1 = (struct spec *) msgid_descr; |
| struct spec *spec2 = (struct spec *) msgstr_descr; |
| bool err = false; |
| |
| if (spec1->named_arg_count > 0 && spec2->numbered_arg_count > 0) |
| { |
| if (error_logger) |
| error_logger (_("format specifications in '%s' expect a hash table, those in '%s' expect individual arguments"), |
| pretty_msgid, pretty_msgstr); |
| err = true; |
| } |
| else if (spec1->numbered_arg_count > 0 && spec2->named_arg_count > 0) |
| { |
| if (error_logger) |
| error_logger (_("format specifications in '%s' expect individual arguments, those in '%s' expect a hash table"), |
| pretty_msgid, pretty_msgstr); |
| err = true; |
| } |
| else |
| { |
| if (spec1->named_arg_count + spec2->named_arg_count > 0) |
| { |
| unsigned int i, j; |
| unsigned int n1 = spec1->named_arg_count; |
| unsigned int n2 = spec2->named_arg_count; |
| |
| /* Check the argument names are the same. |
| Both arrays are sorted. We search for the first difference. */ |
| for (i = 0, j = 0; i < n1 || j < n2; ) |
| { |
| int cmp = (i >= n1 ? 1 : |
| j >= n2 ? -1 : |
| strcmp (spec1->named[i].name, spec2->named[j].name)); |
| |
| if (cmp > 0) |
| { |
| if (error_logger) |
| error_logger (_("a format specification for argument '%s', as in '%s', doesn't exist in '%s'"), |
| spec2->named[j].name, pretty_msgstr, |
| pretty_msgid); |
| err = true; |
| break; |
| } |
| else if (cmp < 0) |
| { |
| if (equality) |
| { |
| if (error_logger) |
| error_logger (_("a format specification for argument '%s' doesn't exist in '%s'"), |
| spec1->named[i].name, pretty_msgstr); |
| err = true; |
| break; |
| } |
| else |
| i++; |
| } |
| else |
| j++, i++; |
| } |
| /* Check the argument types are the same. */ |
| if (!err) |
| for (i = 0, j = 0; j < n2; ) |
| { |
| if (strcmp (spec1->named[i].name, spec2->named[j].name) == 0) |
| { |
| if (!(spec1->named[i].type == spec2->named[j].type)) |
| { |
| if (error_logger) |
| error_logger (_("format specifications in '%s' and '%s' for argument '%s' are not the same"), |
| pretty_msgid, pretty_msgstr, |
| spec2->named[j].name); |
| err = true; |
| break; |
| } |
| j++, i++; |
| } |
| else |
| i++; |
| } |
| } |
| |
| if (spec1->numbered_arg_count + spec2->numbered_arg_count > 0) |
| { |
| unsigned int i; |
| |
| /* Check the argument types are the same. */ |
| if (spec1->numbered_arg_count != spec2->numbered_arg_count) |
| { |
| if (error_logger) |
| error_logger (_("number of format specifications in '%s' and '%s' does not match"), |
| pretty_msgid, pretty_msgstr); |
| err = true; |
| } |
| else |
| for (i = 0; i < spec2->numbered_arg_count; i++) |
| if (!(spec1->numbered[i].type == spec2->numbered[i].type)) |
| { |
| if (error_logger) |
| error_logger (_("format specifications in '%s' and '%s' for argument %u are not the same"), |
| pretty_msgid, pretty_msgstr, i + 1); |
| err = true; |
| } |
| } |
| } |
| |
| return err; |
| } |
| |
| |
| struct formatstring_parser formatstring_ruby = |
| { |
| format_parse, |
| format_free, |
| format_get_number_of_directives, |
| NULL, |
| format_check |
| }; |
| |
| |
| #ifdef TEST |
| |
| /* Test program: Print the argument list specification returned by |
| format_parse for strings read from standard input. */ |
| |
| #include <stdio.h> |
| |
| static void |
| format_print (void *descr) |
| { |
| struct spec *spec = (struct spec *) descr; |
| unsigned int i; |
| |
| if (spec == NULL) |
| { |
| printf ("INVALID"); |
| return; |
| } |
| |
| if (spec->named_arg_count > 0) |
| { |
| if (spec->numbered_arg_count > 0) |
| abort (); |
| |
| printf ("({"); |
| for (i = 0; i < spec->named_arg_count; i++) |
| { |
| if (i > 0) |
| printf (", "); |
| printf (":%s => ", spec->named[i].name); |
| switch (spec->named[i].type) |
| { |
| case FAT_ANY: |
| printf ("s"); |
| break; |
| case FAT_ESCAPED_ANY: |
| printf ("p"); |
| break; |
| case FAT_CHARACTER: |
| printf ("c"); |
| break; |
| case FAT_INTEGER: |
| printf ("i"); |
| break; |
| case FAT_FLOAT: |
| printf ("f"); |
| break; |
| default: |
| abort (); |
| } |
| } |
| printf ("})"); |
| } |
| else |
| { |
| unsigned int last; |
| |
| printf ("("); |
| last = 1; |
| for (i = 0; i < spec->numbered_arg_count; i++) |
| { |
| unsigned int number = spec->numbered[i].number; |
| |
| if (i > 0) |
| printf (" "); |
| if (number < last) |
| abort (); |
| for (; last < number; last++) |
| printf ("_ "); |
| switch (spec->numbered[i].type) |
| { |
| case FAT_ANY: |
| printf ("s"); |
| break; |
| case FAT_ESCAPED_ANY: |
| printf ("p"); |
| break; |
| case FAT_CHARACTER: |
| printf ("c"); |
| break; |
| case FAT_INTEGER: |
| printf ("i"); |
| break; |
| case FAT_FLOAT: |
| printf ("f"); |
| break; |
| default: |
| abort (); |
| } |
| last = number + 1; |
| } |
| printf (")"); |
| } |
| } |
| |
/* Test driver: read format strings from standard input, one per line,
   and print for each the argument list found by format_parse, followed by
   the reason on a separate line when the string is invalid.  */
int
main (void)
{
  for (;;)
    {
      char *line = NULL;
      size_t line_size = 0;
      int line_len;
      char *invalid_reason;
      void *descr;

      line_len = getline (&line, &line_size, stdin);
      if (line_len < 0)
        {
          /* getline may have allocated a buffer even though it failed.  */
          free (line);
          break;
        }
      /* Strip the trailing newline, if any.  */
      if (line_len > 0 && line[line_len - 1] == '\n')
        line[--line_len] = '\0';

      invalid_reason = NULL;
      descr = format_parse (line, false, NULL, &invalid_reason);

      format_print (descr);
      printf ("\n");
      if (descr == NULL)
        printf ("%s\n", invalid_reason);
      else
        /* Release the parse result before handling the next line.  */
        format_free (descr);

      free (invalid_reason);
      free (line);
    }

  return 0;
}
| |
| /* |
| * For Emacs M-x compile |
| * Local Variables: |
| * compile-command: "/bin/sh ../libtool --tag=CC --mode=link gcc -o a.out -static -O -g -Wall -I.. -I../gnulib-lib -I../../gettext-runtime/intl -DHAVE_CONFIG_H -DTEST format-ruby.c ../gnulib-lib/libgettextlib.la" |
| * End: |
| */ |
| |
| #endif /* TEST */ |