#ifdef HAVE_CONFIG_H
# include "config.h"
#endif
#include <alloca.h>
#include <errno.h>
#include <getopt.h>
#include <limits.h>
#include <locale.h>
#include <stdio.h>
#include <stdlib.h>
#include <string.h>
#ifdef HAVE_UNISTD_H
# include <unistd.h>
#elif defined _MSC_VER || defined __MINGW32__
# include <io.h>
#endif
#include <fnmatch.h>
#include "closeout.h"
#include "dir-list.h"
#include "error.h"
#include "error-progname.h"
#include "progname.h"
#include "relocatable.h"
#include "basename.h"
#include "message.h"
#include "read-po.h"
#include "write-po.h"
#include "str-list.h"
#include "msgl-charset.h"
#include "xalloc.h"
#include "exit.h"
#include "full-write.h"
#include "findprog.h"
#include "pipe.h"
#include "wait-process.h"
#include "gettext.h"
#define _(str) gettext (str)
/* Set to 1 by the --force-po long option (via the flag pointer in
   long_options); passed on to msgdomain_list_print in main.  */
static int force_po;
/* Filename patterns collected from -N/--location.  A message is selected
   when one of its file positions matches one of these patterns.  */
static string_list_ty *location_files;
/* Domain names collected from -M/--domain.  Message lists belonging to one
   of these domains are left unfiltered.  */
static string_list_ty *domain_names;
/* grep command-line arguments, one list per pass.  Index 0 is selected by
   -K (msgid), index 1 by -T (msgstr), index 2 by -C (translator comment).  */
static string_list_ty *grep_args[3];
/* Path of the grep program to execute; assigned in main from find_in_path
   when at least one pass has arguments.  */
static const char *grep_path;
/* NULL-terminated argv vectors for the grep subprocess, one per pass.  Only
   the entries whose grep_args list is non-empty are filled in by main.  */
static char **grep_argv[3];
/* Long options handed to getopt_long in main.
   Entries with a NULL third field make getopt_long return the fourth field:
   either a short option letter or a CHAR_MAX + n code for options that have
   no short form.  Entries with a non-NULL third field store the fourth field
   into the pointed-to int instead, and getopt_long returns 0 for them.
   NOTE(review): line_comment is not declared in the visible part of this
   file; presumably it comes from one of the included project headers.  */
static const struct option long_options[] =
{
{ "add-location", no_argument, &line_comment, 1 },
{ "comment", no_argument, NULL, 'C' },
{ "directory", required_argument, NULL, 'D' },
{ "domain", required_argument, NULL, 'M' },
{ "escape", no_argument, NULL, CHAR_MAX + 1 },
{ "extended-regexp", no_argument, NULL, 'E' },
{ "file", required_argument, NULL, 'f' },
{ "fixed-strings", no_argument, NULL, 'F' },
{ "force-po", no_argument, &force_po, 1 },
{ "help", no_argument, NULL, 'h' },
{ "ignore-case", no_argument, NULL, 'i' },
{ "indent", no_argument, NULL, CHAR_MAX + 2 },
{ "location", required_argument, NULL, 'N' },
{ "msgid", no_argument, NULL, 'K' },
{ "msgstr", no_argument, NULL, 'T' },
{ "no-escape", no_argument, NULL, CHAR_MAX + 3 },
{ "no-location", no_argument, &line_comment, 0 },
{ "no-wrap", no_argument, NULL, CHAR_MAX + 6 },
{ "output-file", required_argument, NULL, 'o' },
{ "properties-input", no_argument, NULL, 'P' },
{ "properties-output", no_argument, NULL, 'p' },
{ "regexp", required_argument, NULL, 'e' },
{ "sort-by-file", no_argument, NULL, CHAR_MAX + 4 },
{ "sort-output", no_argument, NULL, CHAR_MAX + 5 },
/* 'S' is not in the short option string passed to getopt_long in main, so
   --strict is reachable through its long name only.  */
{ "strict", no_argument, NULL, 'S' },
{ "stringtable-input", no_argument, NULL, CHAR_MAX + 7 },
{ "stringtable-output", no_argument, NULL, CHAR_MAX + 8 },
{ "version", no_argument, NULL, 'V' },
{ "width", required_argument, NULL, 'w' },
/* Terminating all-zero entry required by getopt_long.  */
{ NULL, 0, NULL, 0 }
};
/* Forward declarations of functions defined further down in this file.  */

/* Reports that option OPT was given before any of -K, -T or -C, then exits
   through usage.  Marked noreturn for GCC 2.5 and newer.  */
static void no_pass (int opt)
#if defined __GNUC__ && ((__GNUC__ == 2 && __GNUC_MINOR__ >= 5) || __GNUC__ > 2)
__attribute__ ((noreturn))
#endif
;
/* Prints either a short hint or the full help text and exits with STATUS.
   Marked noreturn for GCC 2.5 and newer.  */
static void usage (int status)
#if defined __GNUC__ && ((__GNUC__ == 2 && __GNUC_MINOR__ >= 5) || __GNUC__ > 2)
__attribute__ ((noreturn))
#endif
;
/* Filters every message list of MDLP in place and returns MDLP.  */
static msgdomain_list_ty *process_msgdomain_list (msgdomain_list_ty *mdlp);
/* Program entry point.
   Parses the command line, reads one PO file (or standard input), keeps only
   the messages selected by the -N/-M/-K/-T/-C criteria, optionally sorts the
   result and prints it.  Never returns normally: every path ends in exit,
   either directly or through usage/error.  */
int
main (int argc, char **argv)
{
int opt;
bool do_help;
bool do_version;
char *output_file;
const char *input_file;
/* Index into grep_args of the pass currently being configured by the
   option loop, or -1 while none of -K/-T/-C has been seen yet.  Reused
   later as a plain loop counter.  */
int grep_pass;
msgdomain_list_ty *result;
bool sort_by_filepos = false;
bool sort_by_msgid = false;
/* Program name and error-reporting hook.  */
set_program_name (argv[0]);
error_print_progname = maybe_print_progname;
#ifdef HAVE_SETLOCALE
/* Adopt the locale from the environment.  */
setlocale (LC_ALL, "");
#endif
/* Select the message catalog used by the _() macro.  */
bindtextdomain (PACKAGE, relocate (LOCALEDIR));
textdomain (PACKAGE);
/* Have close_stdout run when the process exits.  */
atexit (close_stdout);
/* Defaults for everything the option loop may set.  */
do_help = false;
do_version = false;
output_file = NULL;
input_file = NULL;
grep_pass = -1;
location_files = string_list_alloc ();
domain_names = string_list_alloc ();
grep_args[0] = string_list_alloc ();
grep_args[1] = string_list_alloc ();
grep_args[2] = string_list_alloc ();
/* Option loop.  -K, -T and -C switch the current pass; -e, -E, -f, -F and
   -i are appended to the argument list of the current pass and are rejected
   through no_pass when no pass has been chosen yet.  */
while ((opt = getopt_long (argc, argv, "CD:e:Ef:FhiKM:N:o:pPTVw:",
long_options, NULL))
!= EOF)
switch (opt)
{
/* A long option that stored its value through a flag pointer.  */
case '\0':
break;
case 'C':
grep_pass = 2;
break;
case 'D':
dir_list_append (optarg);
break;
case 'e':
if (grep_pass < 0)
no_pass (opt);
string_list_append (grep_args[grep_pass], "-e");
string_list_append (grep_args[grep_pass], optarg);
break;
case 'E':
if (grep_pass < 0)
no_pass (opt);
string_list_append (grep_args[grep_pass], "-E");
break;
case 'f':
if (grep_pass < 0)
no_pass (opt);
string_list_append (grep_args[grep_pass], "-f");
string_list_append (grep_args[grep_pass], optarg);
break;
case 'F':
if (grep_pass < 0)
no_pass (opt);
string_list_append (grep_args[grep_pass], "-F");
break;
case 'h':
do_help = true;
break;
case 'i':
if (grep_pass < 0)
no_pass (opt);
string_list_append (grep_args[grep_pass], "-i");
break;
case 'K':
grep_pass = 0;
break;
case 'M':
string_list_append (domain_names, optarg);
break;
case 'N':
string_list_append (location_files, optarg);
break;
case 'o':
output_file = optarg;
break;
case 'p':
message_print_syntax_properties ();
break;
case 'P':
input_syntax = syntax_properties;
break;
case 'S':
message_print_style_uniforum ();
break;
case 'T':
grep_pass = 1;
break;
case 'V':
do_version = true;
break;
case 'w':
{
/* The width is applied only if strtol consumed at least one character;
   otherwise the option is silently ignored.  Trailing characters after the
   number are not rejected, and the long result is narrowed to int.  */
int value;
char *endp;
value = strtol (optarg, &endp, 10);
if (endp != optarg)
message_page_width_set (value);
}
break;
/* The CHAR_MAX + n codes below belong to long options without a short
   form; see long_options for the mapping.  */
case CHAR_MAX + 1:
message_print_style_escape (true);
break;
case CHAR_MAX + 2:
message_print_style_indent ();
break;
case CHAR_MAX + 3:
message_print_style_escape (false);
break;
case CHAR_MAX + 4:
sort_by_filepos = true;
break;
case CHAR_MAX + 5:
sort_by_msgid = true;
break;
case CHAR_MAX + 6:
message_page_width_ignore ();
break;
case CHAR_MAX + 7:
input_syntax = syntax_stringtable;
break;
case CHAR_MAX + 8:
message_print_syntax_stringtable ();
break;
default:
usage (EXIT_FAILURE);
break;
}
/* --version is handled before --help and before any argument checks.  */
if (do_version)
{
printf ("%s (GNU %s) %s\n", basename (program_name), PACKAGE, VERSION);
printf (_("Copyright (C) %s Free Software Foundation, Inc.\n\
This is free software; see the source for copying conditions.  There is NO\n\
warranty; not even for MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.\n\
"),
"2001-2003");
printf (_("Written by %s.\n"), "Bruno Haible");
exit (EXIT_SUCCESS);
}
if (do_help)
usage (EXIT_SUCCESS);
/* Zero non-option arguments selects "-" as the input file, one names the
   input file, more than one is an error.  */
if (optind == argc)
input_file = "-";
else if (optind + 1 == argc)
input_file = argv[optind];
else
{
/* A status of EXIT_SUCCESS makes error only print the message; the
   process then exits through usage.  */
error (EXIT_SUCCESS, 0, _("at most one input file allowed"));
usage (EXIT_FAILURE);
}
/* Reject contradictory option combinations.  */
if (!line_comment && sort_by_filepos)
error (EXIT_FAILURE, 0, _("%s and %s are mutually exclusive"),
"--no-location", "--sort-by-file");
if (sort_by_msgid && sort_by_filepos)
error (EXIT_FAILURE, 0, _("%s and %s are mutually exclusive"),
"--sort-output", "--sort-by-file");
result = read_po_file (input_file);
/* The charset comparison and the search for the grep program are needed
   only when at least one pass has arguments.  */
if (grep_args[0]->nitems > 0
|| grep_args[1]->nitems > 0
|| grep_args[2]->nitems > 0)
{
compare_po_locale_charsets (result);
grep_path = find_in_path ("grep");
#if (defined (sun) || defined (__sun)) && defined (__SVR4)
/* On sun systems with __SVR4 defined, replace /usr/bin/grep or /bin/grep by
   /usr/xpg4/bin/grep when the latter is executable.  */
if ((strcmp (grep_path, "/usr/bin/grep") == 0
|| strcmp (grep_path, "/bin/grep") == 0)
&& access ("/usr/xpg4/bin/grep", X_OK) == 0)
grep_path = "/usr/xpg4/bin/grep";
#endif
}
/* Build the argv vector of each pass that has arguments:
   grep_path, optionally "-q", the collected arguments, then NULL.  */
for (grep_pass = 0; grep_pass < 3; grep_pass++)
if (grep_args[grep_pass]->nitems > 0)
{
string_list_ty *args = grep_args[grep_pass];
size_t option_q;
size_t i, j;
/* "-q" is left out on sun systems where __SVR4 is not defined --
   presumably because the grep there does not support it; TODO confirm.  */
#if (defined (sun) || defined (__sun)) && !defined (__SVR4)
option_q = 0;
#else
option_q = 1;
#endif
grep_argv[grep_pass] =
(char **) xmalloc ((1 + option_q + args->nitems + 1)
* sizeof (char *));
grep_argv[grep_pass][0] = (char *) grep_path;
j = 1;
if (option_q)
grep_argv[grep_pass][j++] = "-q";
for (i = 0; i < args->nitems; i++)
grep_argv[grep_pass][j++] = (char *) args->item[i];
grep_argv[grep_pass][j] = NULL;
}
/* Filter, optionally sort (by file position takes precedence over by
   msgid), and write out the result.  */
result = process_msgdomain_list (result);
if (sort_by_filepos)
msgdomain_list_sort_by_filepos (result);
else if (sort_by_msgid)
msgdomain_list_sort_by_msgid (result);
msgdomain_list_print (result, output_file, force_po, false);
exit (EXIT_SUCCESS);
}
/* Complain that option OPT, which configures a grep pass, was given before
   any of -K, -T or -C selected a pass.  The message is printed without
   exiting (status EXIT_SUCCESS); the process then terminates through
   usage (EXIT_FAILURE).  */
static void
no_pass (int opt)
{
  const char *format =
    _("option '%c' cannot be used before 'K' or 'T' or 'C' has been specified");

  error (EXIT_SUCCESS, 0, format, opt);
  usage (EXIT_FAILURE);
}
/* Print usage information and terminate the process with exit code STATUS.
   When STATUS is not EXIT_SUCCESS, only a one-line hint pointing at --help
   is written to stderr.  Otherwise the complete help text is written to
   stdout.  Every text passes through the _() translation macro, so the
   string literals below must not be reworded or re-wrapped casually.  */
static void
usage (int status)
{
if (status != EXIT_SUCCESS)
fprintf (stderr, _("Try `%s --help' for more information.\n"),
program_name);
else
{
/* Synopsis and one-paragraph description.  */
printf (_("\
Usage: %s [OPTION] [INPUTFILE]\n\
"), program_name);
printf ("\n");
printf (_("\
Extracts all messages of a translation catalog that match a given pattern\n\
or belong to some given source files.\n\
"));
printf ("\n");
printf (_("\
Mandatory arguments to long options are mandatory for short options too.\n"));
printf ("\n");
/* Input file location.  */
printf (_("\
Input file location:\n"));
printf (_("\
INPUTFILE                   input PO file\n"));
printf (_("\
-D, --directory=DIRECTORY   add DIRECTORY to list for input files search\n"));
printf (_("\
If no input file is given or if it is -, standard input is read.\n"));
printf ("\n");
/* Output file location.  */
printf (_("\
Output file location:\n"));
printf (_("\
-o, --output-file=FILE      write output to specified file\n"));
printf (_("\
The results are written to standard output if no output file is specified\n\
or if it is -.\n"));
printf ("\n");
/* Message selection: emitted as one single translatable string.  */
printf (_("\
Message selection:\n\
[-N SOURCEFILE]... [-M DOMAINNAME]...\n\
[-K MSGID-PATTERN] [-T MSGSTR-PATTERN] [-C COMMENT-PATTERN]\n\
A message is selected if it comes from one of the specified source files,\n\
or if it comes from one of the specified domains,\n\
or if -K is given and its key (msgid or msgid_plural) matches MSGID-PATTERN,\n\
or if -T is given and its translation (msgstr) matches MSGSTR-PATTERN,\n\
or if -C is given and the translator's comment matches COMMENT-PATTERN.\n\
\n\
When more than one selection criterion is specified, the set of selected\n\
messages is the union of the selected messages of each criterion.\n\
\n\
MSGID-PATTERN or MSGSTR-PATTERN syntax:\n\
[-E | -F] [-e PATTERN | -f FILE]...\n\
PATTERNs are basic regular expressions by default, or extended regular\n\
expressions if -E is given, or fixed strings if -F is given.\n\
\n\
-N, --location=SOURCEFILE   select messages extracted from SOURCEFILE\n\
-M, --domain=DOMAINNAME     select messages belonging to domain DOMAINNAME\n\
-K, --msgid                 start of patterns for the msgid\n\
-T, --msgstr                start of patterns for the msgstr\n\
-C, --comment               start of patterns for the translator's comment\n\
-E, --extended-regexp       PATTERN is an extended regular expression\n\
-F, --fixed-strings         PATTERN is a set of newline-separated strings\n\
-e, --regexp=PATTERN        use PATTERN as a regular expression\n\
-f, --file=FILE             obtain PATTERN from FILE\n\
-i, --ignore-case           ignore case distinctions\n\
"));
printf ("\n");
/* Input file syntax.  */
printf (_("\
Input file syntax:\n"));
printf (_("\
-P, --properties-input      input file is in Java .properties syntax\n"));
printf (_("\
--stringtable-input     input file is in NeXTstep/GNUstep .strings syntax\n"));
printf ("\n");
/* Output details.  */
printf (_("\
Output details:\n"));
printf (_("\
--no-escape             do not use C escapes in output (default)\n"));
printf (_("\
--escape                use C escapes in output, no extended chars\n"));
printf (_("\
--force-po              write PO file even if empty\n"));
printf (_("\
--indent                indented output style\n"));
printf (_("\
--no-location           suppress '#: filename:line' lines\n"));
printf (_("\
--add-location          preserve '#: filename:line' lines (default)\n"));
printf (_("\
--strict                strict Uniforum output style\n"));
printf (_("\
-p, --properties-output     write out a Java .properties file\n"));
printf (_("\
--stringtable-output    write out a NeXTstep/GNUstep .strings file\n"));
printf (_("\
-w, --width=NUMBER          set output page width\n"));
printf (_("\
--no-wrap               do not break long message lines, longer than\n\
the output page width, into several lines\n"));
printf (_("\
--sort-output           generate sorted output\n"));
printf (_("\
--sort-by-file          sort output by file location\n"));
printf ("\n");
/* Informative output and bug-report address.  */
printf (_("\
Informative output:\n"));
printf (_("\
-h, --help                  display this help and exit\n"));
printf (_("\
-V, --version               output version information and exit\n"));
printf ("\n");
fputs (_("Report bugs to <bug-gnu-gettext@gnu.org>.\n"),
stdout);
}
/* Both branches end here; this function never returns.  */
exit (status);
}
/* Return true if FILENAME matches at least one of the shell wildcard
   patterns stored in SLP, false otherwise (including when SLP is empty).
   Matching is done by fnmatch with FNM_PATHNAME.  */
static bool
filename_list_match (const string_list_ty *slp, const char *filename)
{
  size_t idx = 0;

  while (idx < slp->nitems)
    {
      const char *pattern = slp->item[idx];

      if (fnmatch (pattern, filename, FNM_PATHNAME) == 0)
        return true;
      idx++;
    }

  return false;
}
#ifdef EINTR
/* Close file descriptor FD, repeating the close() call for as long as it
   fails with errno == EINTR.  Returns the result of the last close() call:
   a non-negative value on success, or a negative value with errno set to
   something other than EINTR on failure.  */
static inline int
nonintr_close (int fd)
{
  for (;;)
    {
      int rc = close (fd);

      /* Stop on success or on any failure that is not an interruption.  */
      if (rc >= 0 || errno != EINTR)
        return rc;
    }
}
/* From this point on, close() calls in this file go through the wrapper.  */
#define close nonintr_close
#endif
/* Test the LEN bytes at STR against the grep arguments of pass GREP_PASS.
   Returns false right away when that pass has no arguments.  Otherwise a
   grep subprocess is started with grep_argv[GREP_PASS], the bytes are
   written to the descriptor returned in the fd array by create_pipe_out,
   and the result is true exactly when wait_subprocess reports exit status
   0.  A short write terminates the program through error.  */
static bool
is_string_selected (int grep_pass, const char *str, size_t len)
{
  pid_t grep_pid;
  int pipe_fd[1];
  int status;

  /* Nothing configured for this pass: nothing can match.  */
  if (!(grep_args[grep_pass]->nitems > 0))
    return false;

  /* Start grep and feed it the string.  */
  grep_pid = create_pipe_out ("grep", grep_path, grep_argv[grep_pass],
                              DEV_NULL, false, true, true, pipe_fd);

  if (full_write (pipe_fd[0], str, len) < len)
    error (EXIT_FAILURE, errno,
           _("write to grep subprocess failed"));

  close (pipe_fd[0]);

  /* Collect the subprocess and turn its exit status into the verdict.  */
  status = wait_subprocess (grep_pid, "grep", false, true, true);

  return status == 0;
}
/* Decide whether message MP is kept in the output.
   Returns true if any of the following holds, tested in this order:
     - the msgid is empty (presumably the PO header entry; it is always
       kept),
     - one of the message's file positions matches a pattern in
       location_files,
     - the msgid or, if present, the msgid_plural is selected by pass 0,
     - one of the NUL-separated strings in msgstr is selected by pass 1,
     - pass 2 has arguments and the translator comment lines, joined with a
       newline after each line, are selected by pass 2.
   Returns false otherwise.  */
static bool
is_message_selected (const message_ty *mp)
{
  size_t i;
  const char *msgstr;
  size_t msgstr_len;
  const char *p;

  if (mp->msgid[0] == '\0')
    return true;

  /* Source file locations, checked against the -N patterns.  */
  for (i = 0; i < mp->filepos_count; i++)
    if (filename_list_match (location_files, mp->filepos[i].file_name))
      return true;

  /* msgid and msgid_plural, checked by pass 0.  */
  if (is_string_selected (0, mp->msgid, strlen (mp->msgid)))
    return true;
  if (mp->msgid_plural != NULL
      && is_string_selected (0, mp->msgid_plural, strlen (mp->msgid_plural)))
    return true;

  /* msgstr holds msgstr_len bytes made of consecutive NUL-terminated
     strings; each one is checked separately by pass 1.  */
  msgstr = mp->msgstr;
  msgstr_len = mp->msgstr_len;
  for (p = msgstr; p < msgstr + msgstr_len; )
    {
      size_t length = strlen (p);

      if (is_string_selected (1, p, length))
        return true;
      p += length + 1;
    }

  /* Translator comments, checked by pass 2.  The buffer is only built when
     that pass has arguments and there is at least one comment line.  */
  if (grep_args[2]->nitems > 0
      && mp->comment != NULL && mp->comment->nitems > 0)
    {
      size_t length;
      char *total_comment;
      char *q;
      size_t j;
      bool selected;

      /* Each line contributes its length plus one byte for the newline.  */
      length = 0;
      for (j = 0; j < mp->comment->nitems; j++)
        length += strlen (mp->comment->item[j]) + 1;

      /* The size comes from the input file, so the buffer lives on the heap:
         an alloca of unbounded size could overflow the stack.  xmalloc is
         the allocator main already uses for the grep argv vectors.  */
      total_comment = (char *) xmalloc (length);

      q = total_comment;
      for (j = 0; j < mp->comment->nitems; j++)
        {
          size_t l = strlen (mp->comment->item[j]);

          memcpy (q, mp->comment->item[j], l);
          q += l;
          *q++ = '\n';
        }
      /* Consistency check: exactly LENGTH bytes must have been written.  */
      if (q != total_comment + length)
        abort ();

      selected = is_string_selected (2, total_comment, length);
      free (total_comment);
      if (selected)
        return true;
    }

  return false;
}
/* Filter the message list MLP, which belongs to DOMAIN, in place.
   If DOMAIN is listed in domain_names the list is left untouched;
   otherwise every message for which is_message_selected returns false is
   removed through message_list_remove_if_not.  */
static void
process_message_list (const char *domain, message_list_ty *mlp)
{
  if (!string_list_member (domain_names, domain))
    message_list_remove_if_not (mlp, is_message_selected);
}
/* Apply process_message_list to every domain contained in MDLP, in index
   order, passing each item's domain name and message list.  The filtering
   happens in place; the same MDLP pointer is returned.  */
static msgdomain_list_ty *
process_msgdomain_list (msgdomain_list_ty *mdlp)
{
  size_t idx = 0;

  while (idx < mdlp->nitems)
    {
      process_message_list (mdlp->item[idx]->domain,
                            mdlp->item[idx]->messages);
      idx++;
    }

  return mdlp;
}