awk.lx.l revision dc5a8425272d2602e4c21b95b9eeac2b897f45a1
%{
/*
* CDDL HEADER START
*
* The contents of this file are subject to the terms of the
* Common Development and Distribution License, Version 1.0 only
* (the "License"). You may not use this file except in compliance
* with the License.
*
* You can obtain a copy of the license at usr/src/OPENSOLARIS.LICENSE
* or http://www.opensolaris.org/os/licensing.
* See the License for the specific language governing permissions
* and limitations under the License.
*
* When distributing Covered Code, include this CDDL HEADER in each
* file and include the License file at usr/src/OPENSOLARIS.LICENSE.
* If applicable, add the following below this CDDL HEADER, with the
* fields enclosed by brackets "[]" replaced with your own identifying
* information: Portions Copyright [yyyy] [name of copyright owner]
*
* CDDL HEADER END
*/
/*
* Copyright 1996 Sun Microsystems, Inc. All rights reserved.
* Use is subject to license terms.
*/
%}
%{
/* Copyright (c) 1984, 1986, 1987, 1988, 1989 AT&T */
%}
%{
/* All Rights Reserved */
%}
%{
#pragma ident "%Z%%M% %I% %E% SMI"
%}
%Start A str chc sc reg comment
%{
#include "awk.h"
#include "awk.def"
#undef input /* defeat lex */
extern int yylval;
extern int mustfld;
long long lineno = 1;
#ifdef DEBUG
# define RETURN(x) {if (dbg) ptoken(x); return (x); }
#else
# define RETURN(x) return (x)
#endif
#define CADD { cbuf[clen++]=yytext[0]; if (clen>=CBUFLEN-1) { yyerror(\
"string too long", cbuf); BEGIN A; } }
#define CBUFLEN 150
wchar_t cbuf[CBUFLEN];
int clen, cflag;
%}
%a 50000
%o 50000
A [a-zA-Z_]
B [a-zA-Z0-9_]
D [0-9]
WS [ \t]
%%
switch (yybgin-yysvec-1) { /* witchcraft */
case 0:
BEGIN A;
break;
case sc:
BEGIN A;
RETURN('}');
}
<A>^\n lineno++;
<A>^{WS}*#.*\n lineno++; /* strip comment lines */
<A>{WS} /* dummy for cstyle */;
<A>"\\"\n lineno++;
<reg>"\\"\n lineno++;
<A>"||" RETURN(BOR);
<A>BEGIN RETURN(XBEGIN);
<A>END RETURN(XEND);
<A>PROGEND RETURN(EOF);
<A>"&&" RETURN(AND);
<A>"!" RETURN(NOT);
<A>"!=" { yylval = NE; RETURN(RELOP); }
<A>"~" { yylval = MATCH; RETURN(MATCHOP); }
<A>"!~" { yylval = NOTMATCH; RETURN(MATCHOP); }
<A>"<" { yylval = LT; RETURN(RELOP); }
<A>"<=" { yylval = LE; RETURN(RELOP); }
<A>"==" { yylval = EQ; RETURN(RELOP); }
<A>">=" { yylval = GE; RETURN(RELOP); }
<A>">" { yylval = GT; RETURN(RELOP); }
<A>">>" { yylval = APPEND; RETURN(RELOP); }
<A>"++" { yylval = INCR; RETURN(INCR); }
<A>"--" { yylval = DECR; RETURN(DECR); }
<A>"+=" { yylval = ADDEQ; RETURN(ASGNOP); }
<A>"-=" { yylval = SUBEQ; RETURN(ASGNOP); }
<A>"*=" { yylval = MULTEQ; RETURN(ASGNOP); }
<A>"/=" { yylval = DIVEQ; RETURN(ASGNOP); }
<A>"%=" { yylval = MODEQ; RETURN(ASGNOP); }
<A>"=" { yylval = ASSIGN; RETURN(ASGNOP); }
<A>"$"{D}+ {
static wchar_t L_record[] = L"$record";
if (watoi(yytext+1)==0) {
yylval = (int)lookup(L_record, symtab, 0);
RETURN(STRING);
} else {
yylval = fieldadr(watoi(yytext+1));
RETURN(FIELD);
}
}
<A>"$"{WS}* { RETURN(INDIRECT); }
<A>NF { mustfld=1;
yylval = (int)setsymtab(yytext, NULL, 0.0, NUM, symtab);
RETURN(VAR); }
<A>({D}+("."?){D}*|"."{D}+)((e|E)("+"|-)?{D}+)? {
yylval = (int)setsymtab(yytext, NULL, watof(yytext),
CON|NUM, symtab); RETURN(NUMBER); }
<A>"}"{WS}*\n { BEGIN sc; lineno++; RETURN(';'); }
<A>"}" { BEGIN sc; RETURN(';'); }
<A>";"\n { lineno++; RETURN(';'); }
<A>\n { lineno++; RETURN(NL); }
<A>while RETURN(WHILE);
<A>for RETURN(FOR);
<A>if RETURN(IF);
<A>else RETURN(ELSE);
<A>next RETURN(NEXT);
<A>exit RETURN(EXIT);
<A>break RETURN(BREAK);
<A>continue RETURN(CONTINUE);
<A>print { yylval = PRINT; RETURN(PRINT); }
<A>printf { yylval = PRINTF; RETURN(PRINTF); }
<A>sprintf { yylval = SPRINTF; RETURN(SPRINTF); }
<A>split { yylval = SPLIT; RETURN(SPLIT); }
<A>substr RETURN(SUBSTR);
<A>index RETURN(INDEX);
<A>in RETURN(IN);
<A>getline RETURN(GETLINE);
<A>length { yylval = FLENGTH; RETURN(FNCN); }
<A>log { yylval = FLOG; RETURN(FNCN); }
<A>int { yylval = FINT; RETURN(FNCN); }
<A>exp { yylval = FEXP; RETURN(FNCN); }
<A>sqrt { yylval = FSQRT; RETURN(FNCN); }
<A>{A}{B}* {
static wchar_t L_0[] = { 0 };
yylval = (int)setsymtab(yytext, tostring(L_0), 0.0, STR|NUM,
symtab);
RETURN(VAR);
}
<A>\" { BEGIN str; clen=0; }
<A># { BEGIN comment; }
<comment>\n { BEGIN A; lineno++; RETURN(NL); }
<comment>. /* dummy */;
<A>. { yylval = yytext[0]; RETURN(yytext[0]); }
<reg>"[" { BEGIN chc; clen=0; cflag=0; }
<reg>"[^" { BEGIN chc; clen=0; cflag=1; }
<reg>"?" RETURN(QUEST);
<reg>"+" RETURN(PLUS);
<reg>"*" RETURN(STAR);
<reg>"|" RETURN(OR);
<reg>"." RETURN(DOT);
<reg>"(" RETURN('(');
<reg>")" RETURN(')');
<reg>"^" RETURN('^');
<reg>"$" RETURN('$');
<reg>\\{D}{D}{D} { wsscanf(yytext+1, "%o", &yylval); RETURN(CHAR); }
<reg>\\. { if (yytext[1]=='n') yylval = '\n';
else if (yytext[1] == 't') yylval = '\t';
else if (yytext[1] == 'b') yylval = '\b';
else if (yytext[1] == 'r') yylval = '\r';
else if (yytext[1] == 'f') yylval = '\f';
else yylval = yytext[1];
RETURN(CHAR);
}
<reg>"/" { BEGIN A; unput('/'); }
<reg>\n { yyerror("newline in regular expression"); lineno++; BEGIN A; }
<reg>. { yylval = yytext[0]; RETURN(CHAR); }
<str>\" { wchar_t *s; BEGIN A; cbuf[clen]=0; s = tostring(cbuf);
cbuf[clen] = ' '; cbuf[++clen] = 0;
yylval = (int)setsymtab(cbuf, s, 0.0, CON|STR, symtab);
RETURN(STRING); }
<str>\n { yyerror("newline in string"); lineno++; BEGIN A; }
<str>"\\\"" { cbuf[clen++]='"'; }
<str>"\\"n { cbuf[clen++]='\n'; }
<chc>"\\"n { cbuf[clen++]='\n'; }
<str>"\\"t { cbuf[clen++]='\t'; }
<chc>"\\"t { cbuf[clen++]='\t'; }
<str>"\\"b { cbuf[clen++]='\b'; }
<chc>"\\"b { cbuf[clen++]='\b'; }
<str>"\\"r { cbuf[clen++]='\r'; }
<chc>"\\"r { cbuf[clen++]='\r'; }
<str>"\\"f { cbuf[clen++]='\f'; }
<chc>"\\"f { cbuf[clen++]='\f'; }
<str>"\\\\" { cbuf[clen++]='\\'; }
<chc>"\\\\" { cbuf[clen++]='\\'; }
<str>. { CADD; }
<chc>"\\""]" { cbuf[clen++]=']'; }
<chc>"]" { BEGIN reg; cbuf[clen]=0; yylval = (int)tostring(cbuf);
if (cflag==0) { RETURN(CCL); }
else { RETURN(NCCL); } }
<chc>\n { yyerror("newline in character class"); lineno++; BEGIN A; }
<chc>. { CADD; }
%%
int
input()
{
int c;
extern wchar_t *lexprog;
if (yysptr > yysbuf)
c = U(*--yysptr);
else if (yyin == NULL)
c = *lexprog++;
else
c = getwc(yyin);
if (c == '\n')
yylineno++;
else if (c == EOF)
c = 0;
return (c);
}
void
startreg()
{
BEGIN reg;
}