#ifdef HAVE_CONFIG_H
# include <config.h>
#endif
#include <alloca.h>
#include <stdbool.h>
#include <stdlib.h>
#include <string.h>
#include "format.h"
#include "c-ctype.h"
#include "xalloc.h"
#include "xerror.h"
#include "format-invalid.h"
#include "error.h"
#include "error-progname.h"
#include "gettext.h"
#define _(str) gettext (str)
enum format_arg_type
{
FAT_NONE,
FAT_OBJECT,
FAT_NUMBER,
FAT_DATE
};
/* One argument reference found in a format string.  */
struct numbered_arg
{
/* The argument number written after '{'.  */
unsigned int number;
/* The type implied by the directive's format type.  */
enum format_arg_type type;
};
/* Result of parsing one format string.  */
struct spec
{
/* Number of directives encountered; incremented once per '{' that opens a
   directive, including directives nested inside a choice format.  */
unsigned int directives;
/* Number of entries of NUMBERED that are in use.  */
unsigned int numbered_arg_count;
/* Number of entries for which NUMBERED has room.  */
unsigned int allocated;
/* Heap-allocated array of argument references, or NULL while empty.
   format_parse sorts it by argument number and merges duplicates.  */
struct numbered_arg *numbered;
};
/* Forward declarations: message_format_parse calls these three parsers
   before their definitions appear, and choice_format_parse in turn calls
   back into message_format_parse.  */
static bool date_format_parse (const char *format);
static bool number_format_parse (const char *format);
static bool choice_format_parse (const char *format, struct spec *spec,
char **invalid_reason);
/* Quote handling shared by all parsers in this file.
   Expects two variables in the enclosing scope: 'format' (the read position)
   and 'quoting' (whether the read position is inside a quoted section).
   If 'format' points at an apostrophe, the macro steps over it; unless the
   next character is an apostrophe too, the quoting state is toggled.  For a
   doubled apostrophe, 'format' is left pointing at the second one and the
   quoting state is unchanged.
   Wrapped in do { } while (0) so that "HANDLE_QUOTE;" is a single statement
   and stays correct when used as the body of an if/else.  */
#define HANDLE_QUOTE \
  do \
    { \
      if (*format == '\'' && *++format != '\'') \
        quoting = !quoting; \
    } \
  while (0)
static bool
message_format_parse (const char *format, struct spec *spec,
char **invalid_reason)
{
bool quoting = false;
for (;;)
{
HANDLE_QUOTE;
if (!quoting && *format == '{')
{
unsigned int depth;
const char *element_start;
const char *element_end;
size_t n;
char *element;
unsigned int number;
enum format_arg_type type;
spec->directives++;
element_start = ++format;
depth = 0;
for (; *format != '\0'; format++)
{
if (*format == '{')
depth++;
else if (*format == '}')
{
if (depth == 0)
break;
else
depth--;
}
}
if (*format == '\0')
{
*invalid_reason =
xstrdup (_("The string ends in the middle of a directive: found '{' without matching '}'."));
return false;
}
element_end = format++;
n = element_end - element_start;
element = (char *) alloca (n + 1);
memcpy (element, element_start, n);
element[n] = '\0';
if (!c_isdigit (*element))
{
*invalid_reason =
xasprintf (_("In the directive number %u, '{' is not followed by an argument number."), spec->directives);
return false;
}
number = 0;
do
{
number = 10 * number + (*element - '0');
element++;
}
while (c_isdigit (*element));
type = FAT_OBJECT;
if (*element == '\0')
;
else if (strncmp (element, ",time", 5) == 0
|| strncmp (element, ",date", 5) == 0)
{
type = FAT_DATE;
element += 5;
if (*element == '\0')
;
else if (*element == ',')
{
element++;
if (strcmp (element, "short") == 0
|| strcmp (element, "medium") == 0
|| strcmp (element, "long") == 0
|| strcmp (element, "full") == 0
|| date_format_parse (element))
;
else
{
*invalid_reason =
xasprintf (_("In the directive number %u, the substring \"%s\" is not a valid date/time style."), spec->directives, element);
return false;
}
}
else
{
*element = '\0';
element -= 4;
*invalid_reason =
xasprintf (_("In the directive number %u, \"%s\" is not followed by a comma."), spec->directives, element);
return false;
}
}
else if (strncmp (element, ",number", 7) == 0)
{
type = FAT_NUMBER;
element += 7;
if (*element == '\0')
;
else if (*element == ',')
{
element++;
if (strcmp (element, "currency") == 0
|| strcmp (element, "percent") == 0
|| strcmp (element, "integer") == 0
|| number_format_parse (element))
;
else
{
*invalid_reason =
xasprintf (_("In the directive number %u, the substring \"%s\" is not a valid number style."), spec->directives, element);
return false;
}
}
else
{
*element = '\0';
element -= 6;
*invalid_reason =
xasprintf (_("In the directive number %u, \"%s\" is not followed by a comma."), spec->directives, element);
return false;
}
}
else if (strncmp (element, ",choice", 7) == 0)
{
type = FAT_NUMBER;
element += 7;
if (*element == '\0')
;
else if (*element == ',')
{
element++;
if (choice_format_parse (element, spec, invalid_reason))
;
else
return false;
}
else
{
*element = '\0';
element -= 6;
*invalid_reason =
xasprintf (_("In the directive number %u, \"%s\" is not followed by a comma."), spec->directives, element);
return false;
}
}
else
{
*invalid_reason =
xasprintf (_("In the directive number %u, the argument number is not followed by a comma and one of \"%s\", \"%s\", \"%s\", \"%s\"."), spec->directives, "time", "date", "number", "choice");
return false;
}
if (spec->allocated == spec->numbered_arg_count)
{
spec->allocated = 2 * spec->allocated + 1;
spec->numbered = (struct numbered_arg *) xrealloc (spec->numbered, spec->allocated * sizeof (struct numbered_arg));
}
spec->numbered[spec->numbered_arg_count].number = number;
spec->numbered[spec->numbered_arg_count].type = type;
spec->numbered_arg_count++;
}
else if (!quoting && *format == '}')
{
*invalid_reason =
xstrdup (_("The string starts in the middle of a directive: found '}' without matching '{'."));
return false;
}
else if (*format != '\0')
format++;
else
break;
}
return true;
}
/* Validates FORMAT as a date/time pattern.
   No checking is performed: every pattern is reported as valid.  */
static bool
date_format_parse (const char *format)
{
  (void) format;
  return true;
}
/* Returns the position after the literal character at FORMAT, which must not
   be the end of the string.  A backslash followed by 'u' and four hex digits
   counts as one character (6 bytes); any other backslash pair counts as 2
   bytes.  A backslash that is the very last character is stepped over alone,
   so that the result never lies beyond the terminating NUL.  */
static const char *
number_format_skip_char (const char *format)
{
  if (format[0] == '\\')
    {
      if (format[1] == 'u'
          && c_isxdigit (format[2])
          && c_isxdigit (format[3])
          && c_isxdigit (format[4])
          && c_isxdigit (format[5]))
        return format + 6;
      if (format[1] != '\0')
        return format + 2;
    }
  return format + 1;
}

/* Checks FORMAT as a number pattern: one or more sub-patterns separated by
   an unquoted ';', each consisting of a prefix, a number part and a suffix.
   The number part is a run of '#' followed by a run of '0' (each may be
   followed by ','), an optional '.' with '0's then '#'s, and an optional
   'E' followed by at least one '0'.
   Returns true if FORMAT matches this shape, false otherwise.  */
static bool
number_format_parse (const char *format)
{
  bool quoting = false;
  /* NOTE(review): nothing in this function ever sets seen_semicolon to true,
     so the tests on it below are always false.  Left as is, because the
     intended handling of a second ';' is not evident from this file.  */
  bool seen_semicolon = false;

  HANDLE_QUOTE;
  for (;;)
    {
      /* Prefix: everything up to the first unquoted '0' or '#'.  */
      while (*format != '\0'
             && !(!quoting && (*format == '0' || *format == '#')))
        {
          format = number_format_skip_char (format);
          HANDLE_QUOTE;
        }

      /* A number part is mandatory.  */
      if (!(!quoting && (*format == '0' || *format == '#')))
        return false;

      /* Integer part: '#'s, then '0's, with optional grouping commas.  */
      while (!quoting && *format == '#')
        {
          format++;
          HANDLE_QUOTE;
          if (!quoting && *format == ',')
            {
              format++;
              HANDLE_QUOTE;
            }
        }
      while (!quoting && *format == '0')
        {
          format++;
          HANDLE_QUOTE;
          if (!quoting && *format == ',')
            {
              format++;
              HANDLE_QUOTE;
            }
        }

      /* Fraction part: '.', then '0's, then '#'s.  */
      if (!quoting && *format == '.')
        {
          format++;
          HANDLE_QUOTE;
          while (!quoting && *format == '0')
            {
              format++;
              HANDLE_QUOTE;
            }
          while (!quoting && *format == '#')
            {
              format++;
              HANDLE_QUOTE;
            }
        }

      /* Exponent: 'E' followed by one or more '0'.  */
      if (!quoting && *format == 'E')
        {
          const char *format_save = format;
          format++;
          HANDLE_QUOTE;
          if (!quoting && *format == '0')
            {
              do
                {
                  format++;
                  HANDLE_QUOTE;
                }
              while (!quoting && *format == '0');
            }
          else
            {
              /* Not an exponent after all: rewind, so that the 'E' is
                 consumed as part of the suffix.  */
              format = format_save;
              quoting = false;
            }
        }

      /* Suffix: everything up to an unquoted ';' or the end.  */
      while (*format != '\0'
             && (seen_semicolon || !(!quoting && *format == ';')))
        {
          format = number_format_skip_char (format);
          HANDLE_QUOTE;
        }

      /* Stop unless an unquoted ';' introduces another sub-pattern; the ';'
         itself is consumed by the prefix loop of the next round.  */
      if (seen_semicolon || !(!quoting && *format == ';'))
        break;
    }

  return (*format == '\0');
}
/* Checks FORMAT as a choice pattern: a list of choices separated by an
   unquoted '|', each made of a non-empty number, one of the comparison
   signs '<', '#' or "\u2264", and a message.  Every message is parsed with
   message_format_parse, which adds the arguments it uses to SPEC.
   An empty FORMAT is accepted.
   Returns true if FORMAT is valid.  Otherwise stores a message in
   *INVALID_REASON and returns false.  */
static bool
choice_format_parse (const char *format, struct spec *spec,
                     char **invalid_reason)
{
  bool quoting = false;

  HANDLE_QUOTE;
  if (*format == '\0')
    return true;
  for (;;)
    {
      bool number_nonempty;
      char *msgformat;
      char *mp;
      bool msgformat_valid;

      /* Skip the number: everything up to an unquoted comparison sign or
         an unquoted '|'.  */
      number_nonempty = false;
      while (*format != '\0'
             && !(!quoting && (*format == '<' || *format == '#'
                               || strncmp (format, "\\u2264", 6) == 0
                               || *format == '|')))
        {
          if (format[0] == '\\')
            {
              if (format[1] == 'u'
                  && c_isxdigit (format[2])
                  && c_isxdigit (format[3])
                  && c_isxdigit (format[4])
                  && c_isxdigit (format[5]))
                format += 6;
              else if (format[1] != '\0')
                format += 2;
              else
                /* A backslash at the very end escapes nothing; advancing by
                   2 here would step past the terminating NUL.  */
                format += 1;
            }
          else
            format += 1;
          number_nonempty = true;
          HANDLE_QUOTE;
        }

      /* A number that runs to the end of the string ends the parse.  */
      if (*format == '\0')
        break;

      if (!number_nonempty)
        {
          *invalid_reason =
            xasprintf (_("In the directive number %u, a choice contains no number."), spec->directives);
          return false;
        }

      /* Step over the comparison sign.  */
      if (*format == '<' || *format == '#')
        format += 1;
      else if (strncmp (format, "\\u2264", 6) == 0)
        format += 6;
      else
        {
          *invalid_reason =
            xasprintf (_("In the directive number %u, a choice contains a number that is not followed by '<', '#' or '%s'."), spec->directives, "\\u2264");
          return false;
        }
      HANDLE_QUOTE;

      /* Copy the message of this choice, up to the next unquoted '|'.
         Apostrophes that HANDLE_QUOTE steps over are not copied.  The copy
         lives on the heap, since its size is dictated by the input and this
         code runs once per choice and recursively for nested choices.  */
      msgformat = xmalloc (strlen (format) + 1);
      mp = msgformat;
      while (*format != '\0' && !(!quoting && *format == '|'))
        {
          *mp++ = *format++;
          HANDLE_QUOTE;
        }
      *mp = '\0';

      msgformat_valid = message_format_parse (msgformat, spec, invalid_reason);
      free (msgformat);
      if (!msgformat_valid)
        return false;

      if (*format == '\0')
        break;

      /* Step over the '|' and continue with the next choice.  */
      format++;
      HANDLE_QUOTE;
    }

  return true;
}
/* qsort comparison function: orders two 'struct numbered_arg' objects by
   ascending argument number.  Returns 1, -1 or 0.  */
static int
numbered_arg_compare (const void *p1, const void *p2)
{
  const struct numbered_arg *lhs = (const struct numbered_arg *) p1;
  const struct numbered_arg *rhs = (const struct numbered_arg *) p2;

  if (lhs->number > rhs->number)
    return 1;
  if (lhs->number < rhs->number)
    return -1;
  return 0;
}
static void *
format_parse (const char *format, char **invalid_reason)
{
struct spec spec;
struct spec *result;
spec.directives = 0;
spec.numbered_arg_count = 0;
spec.allocated = 0;
spec.numbered = NULL;
if (!message_format_parse (format, &spec, invalid_reason))
goto bad_format;
if (spec.numbered_arg_count > 1)
{
unsigned int i, j;
bool err;
qsort (spec.numbered, spec.numbered_arg_count,
sizeof (struct numbered_arg), numbered_arg_compare);
err = false;
for (i = j = 0; i < spec.numbered_arg_count; i++)
if (j > 0 && spec.numbered[i].number == spec.numbered[j-1].number)
{
enum format_arg_type type1 = spec.numbered[i].type;
enum format_arg_type type2 = spec.numbered[j-1].type;
enum format_arg_type type_both;
if (type1 == type2 || type2 == FAT_OBJECT)
type_both = type1;
else if (type1 == FAT_OBJECT)
type_both = type2;
else
{
type_both = FAT_NONE;
if (!err)
*invalid_reason =
INVALID_INCOMPATIBLE_ARG_TYPES (spec.numbered[i].number);
err = true;
}
spec.numbered[j-1].type = type_both;
}
else
{
if (j < i)
{
spec.numbered[j].number = spec.numbered[i].number;
spec.numbered[j].type = spec.numbered[i].type;
}
j++;
}
spec.numbered_arg_count = j;
if (err)
goto bad_format;
}
result = (struct spec *) xmalloc (sizeof (struct spec));
*result = spec;
return result;
bad_format:
if (spec.numbered != NULL)
free (spec.numbered);
return NULL;
}
/* Releases a descriptor returned by format_parse: first its argument array,
   then the descriptor itself.  DESCR must not be NULL.  */
static void
format_free (void *descr)
{
  struct spec *parsed = (struct spec *) descr;

  /* free (NULL) is a no-op, so an empty argument array needs no check.  */
  free (parsed->numbered);
  free (parsed);
}
/* Returns the directive count stored in the descriptor DESCR, which must
   have been returned by format_parse.  */
static int
format_get_number_of_directives (void *descr)
{
  return ((struct spec *) descr)->directives;
}
static bool
format_check (const lex_pos_ty *pos, void *msgid_descr, void *msgstr_descr,
bool equality, bool noisy, const char *pretty_msgstr)
{
struct spec *spec1 = (struct spec *) msgid_descr;
struct spec *spec2 = (struct spec *) msgstr_descr;
bool err = false;
if (spec1->numbered_arg_count + spec2->numbered_arg_count > 0)
{
unsigned int i, j;
unsigned int n1 = spec1->numbered_arg_count;
unsigned int n2 = spec2->numbered_arg_count;
for (i = 0, j = 0; i < n1 || j < n2; )
{
int cmp = (i >= n1 ? 1 :
j >= n2 ? -1 :
spec1->numbered[i].number > spec2->numbered[j].number ? 1 :
spec1->numbered[i].number < spec2->numbered[j].number ? -1 :
0);
if (cmp > 0)
{
if (noisy)
{
error_with_progname = false;
error_at_line (0, 0, pos->file_name, pos->line_number,
_("a format specification for argument {%u}, as in '%s', doesn't exist in 'msgid'"),
spec2->numbered[j].number, pretty_msgstr);
error_with_progname = true;
}
err = true;
break;
}
else if (cmp < 0)
{
if (equality)
{
if (noisy)
{
error_with_progname = false;
error_at_line (0, 0, pos->file_name, pos->line_number,
_("a format specification for argument {%u} doesn't exist in '%s'"),
spec1->numbered[i].number, pretty_msgstr);
error_with_progname = true;
}
err = true;
break;
}
else
i++;
}
else
j++, i++;
}
if (!err)
for (i = 0, j = 0; j < n2; )
{
if (spec1->numbered[i].number == spec2->numbered[j].number)
{
if (spec1->numbered[i].type != spec2->numbered[j].type)
{
if (noisy)
{
error_with_progname = false;
error_at_line (0, 0, pos->file_name, pos->line_number,
_("format specifications in 'msgid' and '%s' for argument {%u} are not the same"),
pretty_msgstr,
spec2->numbered[j].number);
error_with_progname = true;
}
err = true;
break;
}
j++, i++;
}
else
i++;
}
}
return err;
}
/* Table of this file's entry points: parse, free, directive count and
   msgid/msgstr check, in that order.  'struct formatstring_parser' is
   declared outside this file (presumably in format.h - verify the member
   order there before changing this initializer).  */
struct formatstring_parser formatstring_java =
{
format_parse,
format_free,
format_get_number_of_directives,
format_check
};
#ifdef TEST
#include <stdio.h>
#include "getline.h"
static void
format_print (void *descr)
{
struct spec *spec = (struct spec *) descr;
unsigned int last;
unsigned int i;
if (spec == NULL)
{
printf ("INVALID");
return;
}
printf ("(");
last = 0;
for (i = 0; i < spec->numbered_arg_count; i++)
{
unsigned int number = spec->numbered[i].number;
if (i > 0)
printf (" ");
if (number < last)
abort ();
for (; last < number; last++)
printf ("_ ");
switch (spec->numbered[i].type)
{
case FAT_OBJECT:
printf ("*");
break;
case FAT_NUMBER:
printf ("Number");
break;
case FAT_DATE:
printf ("Date");
break;
default:
abort ();
}
last = number + 1;
}
printf (")");
}
/* Test driver: reads format strings from stdin, one per line, and prints
   for each the parse result, followed by the reason on a line of its own if
   the string is invalid.  */
int
main (void)
{
  /* One buffer is handed to getline for every line and released once at
     the end, including when the loop is left at end of input.  */
  char *line = NULL;
  size_t line_size = 0;

  for (;;)
    {
      int line_len;
      char *invalid_reason;
      void *descr;

      line_len = getline (&line, &line_size, stdin);
      if (line_len < 0)
        break;
      /* Strip the trailing newline.  */
      if (line_len > 0 && line[line_len - 1] == '\n')
        line[--line_len] = '\0';

      invalid_reason = NULL;
      descr = format_parse (line, &invalid_reason);

      format_print (descr);
      printf ("\n");
      if (descr == NULL)
        printf ("%s\n", invalid_reason);
      else
        /* Release the descriptor; it is not needed after printing.  */
        format_free (descr);

      free (invalid_reason);
    }

  free (line);
  return 0;
}
#endif