%x string s_name charmap defn nchar subs subs2 ldef elem
%{
/*-
* Copyright (c) 1995 Alex Tatmanjants <alex@elvisti.kiev.ua>
* at Electronni Visti IA, Kiev, Ukraine.
* All rights reserved.
*
* Redistribution and use in source and binary forms, with or without
* modification, are permitted provided that the following conditions
* are met:
* 1. Redistributions of source code must retain the above copyright
* notice, this list of conditions and the following disclaimer.
* 2. Redistributions in binary form must reproduce the above copyright
* notice, this list of conditions and the following disclaimer in the
* documentation and/or other materials provided with the distribution.
*
* THIS SOFTWARE IS PROVIDED BY THE AUTHOR ``AS IS'' AND
* ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
* IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
* ARE DISCLAIMED. IN NO EVENT SHALL THE AUTHOR BE LIABLE
* FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
* DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
* OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
* HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
* LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
* OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
* SUCH DAMAGE.
*/
#include <sys/cdefs.h>
__FBSDID("$FreeBSD: src/usr.bin/colldef/scan.l,v 1.19 2002/08/23 04:18:26 ache Exp $");
#include <ctype.h>
#include <err.h>
#include <limits.h>
#include <unistd.h>
#include <string.h>
#include <wchar.h>
#include <sysexits.h>
#include <sys/types.h>
#include "collate.h"
#include "common.h"
#ifdef __APPLE__
#include "parse.h"
#else /* !__APPLE__ */
#include "y.tab.h"
#endif /* __APPLE__ */
int line_no = 1, save_no, fromsubs;
wchar_t buf0[BUFSIZE], *ptr;
wchar_t *buf = buf0;
wchar_t bufstr[BUFSIZE], *ptrsave;
FILE *map_fp;
YY_BUFFER_STATE main_buf, map_buf;
#ifdef FLEX_DEBUG
YYSTYPE yylval;
#endif /* FLEX_DEBUG */
int yylex(void);
static int localedefmode = 0;
static orderpass = 0;
%}
%%
<INITIAL,charmap,nchar,subs,subs2,ldef>[ \t]+ ;
<subs2,ldef>\" { ptr = buf; BEGIN(string); }
<string>\< {
if(localedefmode) {
ptrsave = ptr;
ptr = buf = bufstr;
BEGIN(s_name);
} else {
if(ptr >= buf + BUFSIZE - 1)
errx(EX_UNAVAILABLE, "string buffer overflow near line %u, character '<'",
line_no);
*ptr++ = '<';
}
}
<subs>\< { ptr = buf; fromsubs = 1; BEGIN(s_name); }
<ldef>[,;] return *yytext;
<ldef>forward { yylval.ch = DIRECTIVE_FORWARD; return ORDER_DIRECTIVE; }
<ldef>backward { yylval.ch = DIRECTIVE_BACKWARD; return ORDER_DIRECTIVE; }
<ldef>position { yylval.ch = DIRECTIVE_POSITION; return ORDER_DIRECTIVE; }
<ldef>collating[-_]element return COLLATING_ELEMENT;
<ldef>collating[-_]symbol return COLLATING_SYMBOL;
<ldef>from return FROM;
<ldef>\.\.\. return ELLIPSIS;
<ldef>IGNORE return IGNORE;
<ldef>UNDEFINED return UNDEFINED;
<ldef>order[-_]start return ORDER_START;
<ldef>order[-_]end {
char line[YY_BUF_SIZE];
if (orderpass)
return ORDER_END;
/* The first pass only defined the left-most symbol. We reread the
* order lines, and forward references should now be resolved. */
orderpass++;
YY_FLUSH_BUFFER;
rewind(yyin);
for(;;) {
if (fgets(line, sizeof(line), yyin) == NULL)
errx(EX_UNAVAILABLE, "EOF rescanning for order_start");
if (*line == '#')
continue;
if (strstr(line, "order_start") != NULL)
break;
}
return ORDER_SECOND_PASS;
}
<ldef>END[ \t]+LC_COLLATE return END_LC_COLLATE;
<ldef>\n {
line_no++;
return '\n';
}
<ldef>\< { ptr = buf; BEGIN(elem); }
<INITIAL>\< { ptr = buf; fromsubs = 0; BEGIN(s_name); }
<*>^#.*\n line_no++;
^\n line_no++;
<INITIAL>\\\n line_no++;
<INITIAL,nchar,subs>\\t { yylval.ch = '\t'; return CHAR; }
<INITIAL,nchar,subs>\\n { yylval.ch = '\n'; return CHAR; }
<INITIAL,nchar,subs>\\b { yylval.ch = '\b'; return CHAR; }
<INITIAL,nchar,subs>\\f { yylval.ch = '\f'; return CHAR; }
<INITIAL,nchar,subs>\\v { yylval.ch = '\v'; return CHAR; }
<INITIAL,nchar,subs>\\r { yylval.ch = '\r'; return CHAR; }
<INITIAL,nchar,subs>\\a { yylval.ch = '\a'; return CHAR; }
<subs2>\n {
line_no++;
BEGIN(INITIAL);
return '\n';
}
<INITIAL,nchar>\n {
line_no++;
if (map_fp != NULL) {
ptr = buf;
BEGIN(defn);
}
return '\n';
}
<INITIAL>[;,{}()] return *yytext;
<INITIAL>substitute { BEGIN(subs); return SUBSTITUTE; }
<INITIAL>LC_COLLATE { BEGIN(ldef); localedefmode++; return START_LC_COLLATE; }
<subs>with { BEGIN(subs2); return WITH; }
<INITIAL>order return ORDER;
<INITIAL,ldef>charmap BEGIN(charmap);
<INITIAL>;[ \t]*\.\.\.[ \t]*; return RANGE;
<INITIAL,nchar,subs>\\([0-7]{3}) {
u_int v;
sscanf(&yytext[1], "%o", &v);
yylval.ch = v;
return CHAR;
}
<INITIAL,nchar,subs>\\x\{([0-9a-fA-F]{2,8})\} {
u_int v;
sscanf(&yytext[3], "%x", &v);
yylval.ch = v;
return CHAR;
}
<INITIAL,nchar,subs>\\x([0-9a-fA-F]{2}) {
u_int v;
sscanf(&yytext[2], "%x", &v);
yylval.ch = v;
return CHAR;
}
<INITIAL,nchar,subs>\\. { yylval.ch = yytext[1]; return CHAR; }
<INITIAL,nchar,subs>. { yylval.ch = *(u_char *)yytext; return CHAR; }
<defn>^\n line_no++;
<defn>[ \t]+ {
if (ptr == buf)
errx(EX_UNAVAILABLE, "map expected near line %u of %s",
line_no, map_name);
*ptr = 0;
if (localedefmode && *buf == '<' && ptr[-1] == '>') {
if (ptr == buf + 2)
errx(EX_UNAVAILABLE, "map expected near line %u of %s",
line_no, map_name);
*--ptr = 0;
wcscpy(yylval.str, buf + 1);
} else
wcscpy(yylval.str, buf);
BEGIN(nchar);
return DEFN;
}
<s_name,elem>\/\/ {
if(ptr >= buf + BUFSIZE - 1)
errx(EX_UNAVAILABLE, "name buffer overflow near line %u, character '/'",
line_no);
*ptr++ = '/';
}
<s_name,elem>\/\> {
if(ptr >= buf + BUFSIZE - 1)
errx(EX_UNAVAILABLE, "name buffer overflow near line %u, character '>'",
line_no);
*ptr++ = '>';
}
<string>\\\" {
if(ptr >= buf + BUFSIZE - 1)
errx(EX_UNAVAILABLE, "string buffer overflow near line %u, character '\"'",
line_no);
*ptr++ = '"';
}
<elem>\> {
if (ptr == buf)
errx(EX_UNAVAILABLE, "non-empty name expected near line %u",
line_no);
*ptr = 0;
wcscpy(yylval.str, buf);
BEGIN(ldef);
return ELEM;
}
<s_name>\> {
struct symbol *s;
if (ptr == buf)
errx(EX_UNAVAILABLE, "non-empty name expected near line %u",
line_no);
*ptr = 0;
s = getsymbol(buf, EXISTS);
switch (s->type) {
case SYMBOL_CHAR:
break;
case SYMBOL_CHAIN:
errx(EX_UNAVAILABLE, "name <%s> is chain type near line %u",
showwcs(buf, CHARMAP_SYMBOL_LEN), line_no);
case SYMBOL_SYMBOL:
errx(EX_UNAVAILABLE, "name <%s> is symbol type near line %u",
showwcs(buf, CHARMAP_SYMBOL_LEN), line_no);
default:
errx(EX_UNAVAILABLE, "name <%s>: unknown symbol type (%d) near line %u",
showwcs(buf, CHARMAP_SYMBOL_LEN), s->type, line_no);
}
if (localedefmode) {
ptr = ptrsave;
buf = buf0;
if(ptr >= buf + BUFSIZE - 1)
errx(EX_UNAVAILABLE, "string buffer overflow near line %u, character <%s>",
line_no, showwcs(bufstr, CHARMAP_SYMBOL_LEN));
*ptr++ = s->u.wc;
BEGIN(string);
} else {
yylval.ch = s->u.wc;
if (fromsubs)
BEGIN(subs);
else
BEGIN(INITIAL);
return CHAR;
}
}
<string>\" {
*ptr = 0;
wcscpy(yylval.str, buf);
if (localedefmode)
BEGIN(ldef);
else
BEGIN(subs2);
return STRING;
}
<s_name,defn,elem>. {
const char *s = (map_fp != NULL) ? map_name : "input";
if (!isascii(*yytext) || !isprint(*yytext))
errx(EX_UNAVAILABLE, "non-ASCII or non-printable character 0x%02x not allowed in the map/name near line %u of %s",
*yytext, line_no, s);
if(ptr >= buf + BUFSIZE - 1)
errx(EX_UNAVAILABLE, "map/name buffer overflow near line %u of %s, character '%c'",
line_no, s, *yytext);
*ptr++ = *yytext;
}
<string>\\t {
if(ptr >= buf + BUFSIZE - 1)
errx(EX_UNAVAILABLE, "string buffer overflow near line %u, character '\\t'",
line_no);
*ptr++ = '\t';
}
<string>\\b {
if(ptr >= buf + BUFSIZE - 1)
errx(EX_UNAVAILABLE, "string buffer overflow near line %u, character '\\b'",
line_no);
*ptr++ = '\b';
}
<string>\\f {
if(ptr >= buf + BUFSIZE - 1)
errx(EX_UNAVAILABLE, "string buffer overflow near line %u, character '\\f'",
line_no);
*ptr++ = '\f';
}
<string>\\v {
if(ptr >= buf + BUFSIZE - 1)
errx(EX_UNAVAILABLE, "string buffer overflow near line %u, character '\\v'",
line_no);
*ptr++ = '\v';
}
<string>\\n {
if(ptr >= buf + BUFSIZE - 1)
errx(EX_UNAVAILABLE, "string buffer overflow near line %u, character '\\n'",
line_no);
*ptr++ = '\n';
}
<string>\\r {
if(ptr >= buf + BUFSIZE - 1)
errx(EX_UNAVAILABLE, "string buffer overflow near line %u, character '\\r'",
line_no);
*ptr++ = '\r';
}
<string>\\a {
if(ptr >= buf + BUFSIZE - 1)
errx(EX_UNAVAILABLE, "string buffer overflow near line %u, character '\\a'",
line_no);
*ptr++ = '\a';
}
<s_name,string,defn,elem>\n {
const char *s = (map_fp != NULL) ? map_name : "input";
errx(EX_UNAVAILABLE, "unterminated map/name/string near line %u of %s", line_no, s);
}
<s_name,string,nchar,elem><<EOF>> {
const char *s = (map_fp != NULL) ? map_name : "input";
errx(EX_UNAVAILABLE, "premature EOF in the name/string/char near line %u of %s", line_no, s);
}
<string>\\x\{([0-9a-f]{2,8})\} {
u_int v;
sscanf(&yytext[3], "%x", &v);
*ptr++ = v;
}
<string>\\x([0-9a-f]{2}) {
u_int v;
sscanf(&yytext[2], "%x", &v);
*ptr++ = v;
}
<string>\\([0-7]{3}) {
u_int v;
sscanf(&yytext[1], "%o", &v);
*ptr++ = v;
}
<string>\\. {
if(ptr >= buf + BUFSIZE - 1)
errx(EX_UNAVAILABLE, "string buffer overflow near line %u, character '%c'",
line_no, yytext[1]);
*ptr++ = yytext[1];
}
<string>. {
if(ptr >= buf + BUFSIZE - 1)
errx(EX_UNAVAILABLE, "string buffer overflow near line %u, character '%c'",
line_no, *yytext);
*ptr++ = *yytext;
}
<charmap>[^ \t\n]+ {
if(*yytext == '/')
strcpy(map_name, yytext);
else {
strcat(map_name, "/");
strcat(map_name, yytext);
}
if((map_fp = fopen(map_name, "r")) == NULL)
err(EX_UNAVAILABLE, "can't open 'charmap' file %s",
map_name);
save_no = line_no;
line_no = 1;
map_buf = yy_new_buffer(map_fp, YY_BUF_SIZE);
main_buf = YY_CURRENT_BUFFER;
yy_switch_to_buffer(map_buf);
ptr = buf;
BEGIN(defn);
}
<charmap>\n {
errx(EX_UNAVAILABLE, "'charmap' file name expected near line %u",
line_no);
}
<charmap><<EOF>> {
errx(EX_UNAVAILABLE, "'charmap' file name expected near line %u",
line_no);
}
<INITIAL,defn><<EOF>> {
if(map_fp != NULL) {
if (ptr != buf)
errx(EX_UNAVAILABLE, "premature EOF in the map near line %u of %s", line_no, map_name);
yy_switch_to_buffer(main_buf);
yy_delete_buffer(map_buf);
fclose(map_fp);
map_fp = NULL;
line_no = save_no;
if (localedefmode)
BEGIN(ldef);
else
BEGIN(INITIAL);
} else
yyterminate();
}
%%
#ifdef FLEX_DEBUG
main()
{
while(yylex())
;
return 0;
}
#endif /* FLEX_DEBUG */