run.c revision 7c478bd95313f5f23a4c958a745db2134aa03244
/*
* CDDL HEADER START
*
* The contents of this file are subject to the terms of the
* Common Development and Distribution License, Version 1.0 only
* (the "License"). You may not use this file except in compliance
* with the License.
*
* You can obtain a copy of the license at usr/src/OPENSOLARIS.LICENSE
* or http://www.opensolaris.org/os/licensing.
* See the License for the specific language governing permissions
* and limitations under the License.
*
* When distributing Covered Code, include this CDDL HEADER in each
* file and include the License file at usr/src/OPENSOLARIS.LICENSE.
* If applicable, add the following below this CDDL HEADER, with the
* fields enclosed by brackets "[]" replaced with your own identifying
* information: Portions Copyright [yyyy] [name of copyright owner]
*
* CDDL HEADER END
*/
/* Copyright (c) 1984, 1986, 1987, 1988, 1989 AT&T */
/* All Rights Reserved */
/*
* Copyright 2003 Sun Microsystems, Inc. All rights reserved.
* Use is subject to license terms.
*/
#ident "%Z%%M% %I% %E% SMI"
#define DEBUG
#define tempfree(a) {if (istemp(a)) {xfree(a->sval); a->tval = 0; }}
#include "awk.def"
#include "math.h"
#include "awk.h"
#include "stdio.h"
#include "ctype.h"
#include "wctype.h"
#include "awktype.h"
#include <stdlib.h>
#define RECSIZE BUFSIZ
#define FILENUM 10
struct
{
FILE *fp;
int type;
wchar_t *fname;
} files[FILENUM];
FILE *popen();
extern CELL *execute(), *nodetoobj(), *fieldel(), *dopa2(), *gettemp();
#define PA2NUM 29
int pairstack[PA2NUM], paircnt;
NODE *winner = NULL;
#define MAXTMP 20
CELL tmps[MAXTMP];
static CELL truecell ={ OBOOL, BTRUE, 0, 0, 0.0, NUM, 0 };
CELL *true = &truecell;
static CELL falsecell ={ OBOOL, BFALSE, 0, 0, 0.0, NUM, 0 };
CELL *false = &falsecell;
static CELL breakcell ={ OJUMP, JBREAK, 0, 0, 0.0, NUM, 0 };
CELL *jbreak = &breakcell;
static CELL contcell ={ OJUMP, JCONT, 0, 0, 0.0, NUM, 0 };
CELL *jcont = &contcell;
static CELL nextcell ={ OJUMP, JNEXT, 0, 0, 0.0, NUM, 0 };
CELL *jnext = &nextcell;
static CELL exitcell ={ OJUMP, JEXIT, 0, 0, 0.0, NUM, 0 };
CELL *jexit = &exitcell;
static CELL tempcell ={ OCELL, CTEMP, 0, 0, 0.0, NUM, 0 };
run(a) NODE *a;
{
register int i;
execute(a);
/* Wait for children to complete if output to a pipe. */
for (i=0; i<FILENUM; i++)
if (files[i].fp && files[i].type == '|')
pclose(files[i].fp);
}
CELL *execute(u) NODE *u;
{
register CELL *(*proc)();
register CELL *x;
register NODE *a;
if (u == NULL)
return (true);
for (a = u; /* dummy */; a = a->nnext) {
if (cantexec(a))
return (nodetoobj(a));
if (notlegal(a->nobj))
error(FATAL, "illegal statement %o", a);
proc = proctab[a->nobj-FIRSTTOKEN];
x = (*proc)(a->narg, a->nobj);
if (isfld(x))
fldbld();
if (isexpr(a))
return (x);
/* a statement, goto next statement */
if (isjump(x))
return (x);
if (a->nnext == (NODE *)NULL)
return (x);
tempfree(x);
}
}
CELL *program(a, n) register NODE **a;
{
register CELL *x;
if (a[0] != NULL) {
x = execute(a[0]);
if (isexit(x))
return (true);
if (isjump(x))
error(FATAL, "unexpected break, continue or next");
tempfree(x);
}
while (getrec()) {
x = execute(a[1]);
if (isexit(x)) {
tempfree(x);
break;
}
tempfree(x);
}
if (a[2] != NULL) {
x = execute(a[2]);
if (isbreak(x) || isnext(x) || iscont(x))
error(FATAL, "unexpected break, continue or next");
tempfree(x);
}
return (true);
}
CELL *getline()
{
register CELL *x;
x = gettemp();
setfval(x, (awkfloat) getrec());
return (x);
}
CELL *array(a, n) register NODE **a;
{
register CELL *x, *y;
extern CELL *arrayel();
x = execute(a[1]);
y = arrayel(a[0], x);
tempfree(x);
return (y);
}
CELL *arrayel(a, b) NODE *a; CELL *b;
{
register wchar_t *s;
register CELL *x;
register int i;
register CELL *y;
s = getsval(b);
x = (CELL *) a;
if (!(x->tval&ARR)) {
xfree(x->sval);
x->tval &= ~STR;
x->tval |= ARR;
x->sval = (wchar_t *) makesymtab();
}
y = setsymtab(s, tostring(L_NULL), 0.0, STR|NUM, x->sval);
y->ctype = OCELL;
y->csub = CVAR;
return (y);
}
CELL *matchop(a, n) NODE **a;
{
register CELL *x;
register wchar_t *s;
register int i;
x = execute(a[0]);
s = getsval(x);
tempfree(x);
i = match(a[1], s);
if (n == MATCH && i == 1 || n == NOTMATCH && i == 0)
return (true);
else
return (false);
}
CELL *boolop(a, n) NODE **a;
{
register CELL *x, *y;
register int i;
x = execute(a[0]);
i = istrue(x);
tempfree(x);
switch (n) {
case BOR:
if (i) return (true);
y = execute(a[1]);
i = istrue(y);
tempfree(y);
if (i) return (true);
else return (false);
case AND:
if (!i) return (false);
y = execute(a[1]);
i = istrue(y);
tempfree(y);
if (i) return (true);
else return (false);
case NOT:
if (i) return (false);
else return (true);
default:
error(FATAL, "unknown boolean operator %d", n);
}
}
CELL *relop(a, n) NODE **a;
{
register int i;
register CELL *x, *y;
awkfloat j;
register wchar_t *xs, *ys;
x = execute(a[0]);
y = execute(a[1]);
if (x->tval&NUM && y->tval&NUM) {
j = x->fval - y->fval;
i = j<0? -1: (j>0? 1: 0);
} else {
xs = getsval(x);
ys = getsval(y);
if (xs && ys)
i = wscoll(xs, ys);
else
return (false);
}
tempfree(x);
tempfree(y);
switch (n) {
case LT: if (i<0) return (true);
else return (false);
case LE: if (i<=0) return (true);
else return (false);
case NE: if (i!=0) return (true);
else return (false);
case EQ: if (i == 0) return (true);
else return (false);
case GE: if (i>=0) return (true);
else return (false);
case GT: if (i>0) return (true);
else return (false);
default:
error(FATAL, "unknown relational operator %d", n);
}
}
CELL *gettemp()
{
register int i;
register CELL *x;
for (i=0; i<MAXTMP; i++)
if (tmps[i].tval == 0)
break;
if (i == MAXTMP)
error(FATAL, "out of temporaries in gettemp");
tmps[i] = tempcell;
x = &tmps[i];
return (x);
}
CELL *indirect(a, n) NODE **a;
{
register CELL *x;
register int m;
CELL *fieldadr();
x = execute(a[0]);
m = getfval(x);
tempfree(x);
x = fieldadr(m);
x->ctype = OCELL;
x->csub = CFLD;
return (x);
}
CELL *substr(a, nnn) NODE **a;
{
register int k, m, n;
register wchar_t *s, temp;
register CELL *x, *y;
y = execute(a[0]);
s = getsval(y);
k = wslen(s) + 1;
if (k <= 1) {
x = gettemp();
setsval(x, L_NULL);
return (x);
}
x = execute(a[1]);
m = getfval(x);
if (m <= 0)
m = 1;
else if (m > k)
m = k;
tempfree(x);
if (a[2] != 0) {
x = execute(a[2]);
n = getfval(x);
tempfree(x);
}
else
n = k - 1;
if (n < 0)
n = 0;
else if (n > k - m)
n = k - m;
dprintf("substr: m=%d, n=%d, s=%ws\n", m, n, s);
x = gettemp();
temp = s[n+m-1];
s[n+m-1] = (wchar_t)0x0;
setsval(x, s + m - 1);
s[n+m-1] = temp;
tempfree(y);
return (x);
}
CELL *sindex(a, nnn) NODE **a;
{
register CELL *x;
register wchar_t *s1, *s2, *p1, *p2, *q;
x = execute(a[0]);
s1 = getsval(x);
tempfree(x);
x = execute(a[1]);
s2 = getsval(x);
tempfree(x);
x = gettemp();
for (p1 = s1; *p1 != (wchar_t)0x0; p1++) {
for (q=p1, p2=s2; *p2 != (wchar_t)0x0 && *q == *p2; q++, p2++)
;
if (*p2 == (wchar_t)0x0) {
setfval(x, (awkfloat) (p1 - s1 + 1)); /* origin 1 */
return (x);
}
}
setfval(x, 0.0);
return (x);
}
wchar_t *format(s, a) register wchar_t *s; NODE *a;
{
register wchar_t *buf, *ep, *str;
register wchar_t *p;
register char *t;
wchar_t *os;
wchar_t tbuf[2*RECSIZE];
char fmt[200];
register CELL *x;
int flag = 0;
awkfloat xf;
os = s;
p = buf= (wchar_t *)malloc(RECSIZE * sizeof (wchar_t));
if (p == NULL)
error(FATAL, "out of space in format");
ep = p + RECSIZE;
while (*s) {
if (*s != '%') {
*p++ = *s++;
continue;
}
if (*(s+1) == '%') {
*p++ = '%';
s += 2;
continue;
}
for (t=fmt; *s != '\0'; s++)
{
if (*s == 's' || *s == 'c')
*t++ = 'w';
*t++ = *s;
if (*s >= 'a' && *s <= 'z' && *s != 'l')
break;
if (*s == '*') {
if (a == NULL) {
error(FATAL,
"not enough arguments in printf(%ws) or sprintf(%ws)",
os, os);
}
x = execute(a);
a = a->nnext;
sprintf(t-1, "%d", (int) getfval(x));
t = fmt + strlen(fmt);
tempfree(x);
}
}
*t = '\0';
if (t >= fmt + sizeof (fmt))
error(FATAL, "format item %.20ws... too long", os);
switch (*s) {
case 'f': case 'e': case 'g':
flag = 1;
break;
case 'd':
flag = 2;
if (*(s-1) == 'l') break;
*(t-1) = 'l';
*t = 'd';
*++t = '\0';
break;
case 'o': case 'x':
flag = *(s-1) == 'l' ? 2 : 3;
break;
case 'c':
flag = 3;
break;
case 's':
flag = 4;
break;
default:
flag = 0;
break;
}
if (flag == 0) {
wsprintf(p, "%s", fmt);
p += wslen(p);
continue;
}
if (a == NULL) {
error(FATAL,
"not enough arguments in printf(%ws) or sprintf(%ws)", os, os);
}
x = execute(a);
a = a->nnext;
/*
* Get the string to check length; %s is the usual problem;
* other conversions can cause overrun if they occur when
* the buffer is almost filled.
*/
if (flag == 4) { /* watch out for converting to numbers! */
str = getsval(x);
}
else {
xf = getfval(x);
if (flag == 1) wsprintf(tbuf, fmt, xf);
else if (flag == 2) wsprintf(tbuf, fmt, (long)xf);
else if (flag == 3) wsprintf(tbuf, fmt, (int)xf);
if (wslen(tbuf) >= RECSIZE)
error(FATAL, "formatted item %s... too long",
tbuf);
str = tbuf;
}
/*
* If string overruns the buffer, reallocate;
* consider length of format string
*/
if (p + wslen(str) + wslen(s) + 1 >= ep) {
int newlen, oldlen;
oldlen = p - buf;
/* Add RECSIZE for additional space */
newlen = oldlen + wslen(str) + RECSIZE;
buf = realloc(buf, (unsigned) newlen * sizeof(wchar_t));
if (buf == NULL)
error(FATAL, "out of format space");
p = buf + oldlen;
ep = buf + newlen;
}
/* Transfer string to buffer */
if (flag == 4)
wsprintf(p, fmt, str);
else
wscpy(p, str);
tempfree(x);
p += wslen(p);
if (p >= ep)
error(FATAL, "formatted string too long");
s++;
}
*p = '\0';
return (buf);
}
CELL *asprintf(a, n) NODE **a;
{
register CELL *x;
register NODE *y;
register wchar_t *s;
y = a[0]->nnext;
x = execute(a[0]);
s = format(getsval(x), y);
tempfree(x);
x = gettemp();
x->sval = s;
x->tval = STR;
return (x);
}
CELL *arith(a, n) NODE **a;
{
awkfloat i, j;
register CELL *x, *y, *z;
x = execute(a[0]);
i = getfval(x);
tempfree(x);
if (n != UMINUS) {
y = execute(a[1]);
j = getfval(y);
tempfree(y);
}
z = gettemp();
switch (n) {
case ADD:
i += j;
break;
case MINUS:
i -= j;
break;
case MULT:
i *= j;
break;
case DIVIDE:
if (j == 0)
error(FATAL, "division by zero");
i /= j;
break;
case MOD:
if (j == 0)
error(FATAL, "division by zero");
i = i - j*(long)(i/j);
break;
case UMINUS:
i = -i;
break;
default:
error(FATAL, "illegal arithmetic operator %d", n);
}
setfval(z, i);
return (z);
}
CELL *incrdecr(a, n) NODE **a;
{
register CELL *x, *z;
register int k;
awkfloat xf;
x = execute(a[0]);
xf = getfval(x);
k = (n == PREINCR || n == POSTINCR) ? 1 : -1;
if (n == PREINCR || n == PREDECR) {
setfval(x, xf + k);
return (x);
}
z = gettemp();
setfval(z, xf);
setfval(x, xf + k);
tempfree(x);
return (z);
}
CELL *assign(a, n) NODE **a;
{
register CELL *x, *y;
awkfloat xf, yf;
x = execute(a[0]);
y = execute(a[1]);
if (n == ASSIGN) { /* ordinary assignment */
if ((y->tval & (STR|NUM)) == (STR|NUM)) {
setsval(x, y->sval);
x->fval = y->fval;
x->tval |= NUM;
} else if (y->tval & STR)
setsval(x, y->sval);
else if (y->tval & NUM)
setfval(x, y->fval);
tempfree(y);
return (x);
}
xf = getfval(x);
yf = getfval(y);
switch (n) {
case ADDEQ:
xf += yf;
break;
case SUBEQ:
xf -= yf;
break;
case MULTEQ:
xf *= yf;
break;
case DIVEQ:
if (yf == 0)
error(FATAL, "division by zero");
xf /= yf;
break;
case MODEQ:
if (yf == 0)
error(FATAL, "division by zero");
xf = xf - yf*(long)(xf/yf);
break;
default:
error(FATAL, "illegal assignment operator %d", n);
break;
}
tempfree(y);
setfval(x, xf);
return (x);
}
CELL *cat(a, q) NODE **a;
{
register CELL *x, *y, *z;
register int n1, n2;
register wchar_t *s;
x = execute(a[0]);
y = execute(a[1]);
getsval(x);
getsval(y);
n1 = wslen(x->sval);
n2 = wslen(y->sval);
if ((s = (wchar_t *) malloc((n1 + n2 + 1) * sizeof (wchar_t))) == NULL)
error(FATAL, "out of space in cat");
wscpy(s, x->sval);
wscpy(s+n1, y->sval);
tempfree(y);
z = gettemp();
z->sval = s;
z->tval = STR;
tempfree(x);
return (z);
}
CELL *pastat(a, n) NODE **a;
{
register CELL *x;
if (a[0] == 0)
x = true;
else
x = execute(a[0]);
if (istrue(x)) {
tempfree(x);
x = execute(a[1]);
}
return (x);
}
CELL *dopa2(a, n) NODE **a;
{
register CELL *x;
register int pair;
pair = (int) a[3];
if (pairstack[pair] == 0) {
x = execute(a[0]);
if (istrue(x))
pairstack[pair] = 1;
tempfree(x);
}
if (pairstack[pair] == 1) {
x = execute(a[1]);
if (istrue(x))
pairstack[pair] = 0;
tempfree(x);
x = execute(a[2]);
return (x);
}
return (false);
}
CELL *aprintf(a, n) NODE **a;
{
register CELL *x;
x = asprintf(a, n);
if (a[1] == NULL) {
printf("%ws", x->sval);
tempfree(x);
return (true);
}
redirprint(x->sval, (int)a[1], a[2]);
return (x);
}
CELL *split(a, nnn) NODE **a;
{
register CELL *x;
register CELL *ap;
register wchar_t *s, *p, c;
wchar_t *t, temp, num[5];
register wchar_t sep;
int n, flag;
x = execute(a[0]);
s = getsval(x);
tempfree(x);
if (a[2] == 0)
sep = **FS;
else {
x = execute(a[2]);
sep = getsval(x)[0];
tempfree(x);
}
ap = (CELL *) a[1];
freesymtab(ap);
dprintf("split: s=|%ws|, a=%ws, sep=|%wc|\n", s, ap->nval, sep);
ap->tval &= ~STR;
ap->tval |= ARR;
ap->sval = (wchar_t *) makesymtab();
n = 0;
if (sep == ' ')
for (n = 0; /* dummy */; /* dummy */) {
c = *s;
while (iswblank(c) || c == '\t' || c == '\n')
c = *(++s);
if (*s == 0)
break;
n++;
t = s;
do
c = *(++s);
while (! iswblank(c) && c != '\t' &&
c != '\n' && c != '\0');
temp = c;
*s = (wchar_t)0x0;
wsprintf(num, "%d", n);
if (isanumber(t))
setsymtab(num, tostring(t),
watof(t), STR|NUM, ap->sval);
else
setsymtab(num, tostring(t), 0.0, STR, ap->sval);
*s = temp;
if (*s != 0)
s++;
} else if (*s != 0)
for (;;) {
n++;
t = s;
while ((c = *s) != sep && c != '\n' && c != '\0')
s++;
temp = c;
*s = (wchar_t)0x0;
wsprintf(num, "%d", n);
if (isanumber(t))
setsymtab(num, tostring(t),
watof(t), STR|NUM, ap->sval);
else
setsymtab(num, tostring(t), 0.0, STR, ap->sval);
*s = temp;
if (*s++ == 0)
break;
}
x = gettemp();
x->tval = NUM;
x->fval = n;
return (x);
}
CELL *ifstat(a, n) NODE **a;
{
register CELL *x;
x = execute(a[0]);
if (istrue(x)) {
tempfree(x);
x = execute(a[1]);
} else if (a[2] != 0) {
tempfree(x);
x = execute(a[2]);
}
return (x);
}
CELL *whilestat(a, n) NODE **a;
{
register CELL *x;
for (;;) {
x = execute(a[0]);
if (!istrue(x)) return (x);
tempfree(x);
x = execute(a[1]);
if (isbreak(x)) {
x = true;
return (x);
}
if (isnext(x) || isexit(x))
return (x);
tempfree(x);
}
}
CELL *forstat(a, n) NODE **a;
{
register CELL *x;
register CELL *z;
z = execute(a[0]);
tempfree(z);
for (;;) {
if (a[1]!=0) {
x = execute(a[1]);
if (!istrue(x)) return (x);
else tempfree(x);
}
x = execute(a[3]);
if (isbreak(x)) { /* turn off break */
x = true;
return (x);
}
if (isnext(x) || isexit(x))
return (x);
tempfree(x);
z = execute(a[2]);
tempfree(z);
}
}
CELL *instat(a, n) NODE **a;
{
register CELL *vp, *arrayp, *cp, **tp;
register CELL *x;
int i;
vp = (CELL *) a[0];
arrayp = (CELL *) a[1];
if (!(arrayp->tval & ARR))
error(FATAL, "%ws is not an array", arrayp->nval);
tp = (CELL **) arrayp->sval;
for (i = 0; i < MAXSYM; i++) { /* this routine knows too much */
for (cp = tp[i]; cp != NULL; cp = cp->nextval) {
setsval(vp, cp->nval);
x = execute(a[2]);
if (isbreak(x)) {
x = true;
return (x);
}
if (isnext(x) || isexit(x))
return (x);
tempfree(x);
}
}
return (true);
}
CELL *jump(a, n) NODE **a;
{
register CELL *y;
switch (n) {
case EXIT:
if (a[0] != 0) {
y = execute(a[0]);
errorflag = getfval(y);
}
return (jexit);
case NEXT:
return (jnext);
case BREAK:
return (jbreak);
case CONTINUE:
return (jcont);
default:
error(FATAL, "illegal jump type %d", n);
}
}
CELL *fncn(a, n) NODE **a;
{
register CELL *x;
awkfloat u;
register int t;
register wchar_t *wp;
t = (int) a[0];
x = execute(a[1]);
if (t == FLENGTH)
u = (awkfloat) wslen(getsval(x));
else if (t == FLOG)
u = log(getfval(x));
else if (t == FINT)
u = (awkfloat) (long) getfval(x);
else if (t == FEXP)
u = exp(getfval(x));
else if (t == FSQRT)
u = sqrt(getfval(x));
else
error(FATAL, "illegal function type %d", t);
tempfree(x);
x = gettemp();
setfval(x, u);
return (x);
}
CELL *print(a, n) NODE **a;
{
register NODE *x;
register CELL *y;
wchar_t s[RECSIZE];
wchar_t *ss, *bp, *ep;
s[0] = '\0';
bp = s;
ep = s + RECSIZE;
for (x=a[0]; x!=NULL; x=x->nnext) {
y = execute(x);
ss = getsval(y);
/* allocate larger buffer if needed */
if (ep < bp + wslen(bp) + wslen(ss)) {
int newlen;
wchar_t *oldbp;
newlen = wslen(bp) + wslen(ss) + 1 + 1;
oldbp = bp;
bp = malloc(newlen * sizeof(wchar_t));
if (bp == NULL)
error(FATAL, "out of space in print");
ep = bp + newlen;
wscpy(bp, oldbp);
if (oldbp != s)
free(oldbp);
}
if (ss)
wscat(bp, ss);
tempfree(y);
if (x->nnext == NULL)
wscat(bp, *ORS);
else
wscat(bp, *OFS);
}
if (a[1] == 0) {
printf("%ws", bp);
if (bp != s)
free(bp);
return (true);
}
redirprint(bp, (int)a[1], a[2]);
if (bp != s)
free(bp);
return (false);
}
CELL *nullproc() {}
CELL *nodetoobj(a) NODE *a;
{
register CELL *x;
x= (CELL *) a->nobj;
x->ctype = OCELL;
x->csub = a->subtype;
if (isfld(x))
fldbld();
return (x);
}
redirprint(s, a, b) wchar_t *s; NODE *b;
{
register int i;
register CELL *x;
x = execute(b);
getsval(x);
for (i=0; i<FILENUM; i++)
if (files[i].fname && wscmp(x->sval, files[i].fname) == 0)
goto doit;
for (i=0; i<FILENUM; i++)
if (files[i].fp == 0)
break;
if (i >= FILENUM)
error(FATAL, "too many output files %d", i);
if (a == '|') /* a pipe! */
files[i].fp = popen(toeuccode(x->sval), "w");
else if (a == APPEND)
files[i].fp = fopen(toeuccode(x->sval), "a");
else if (a == GT)
files[i].fp = fopen(toeuccode(x->sval), "w");
else
error(FATAL, "illegal redirection near line %lld", lineno);
if (files[i].fp == NULL)
error(FATAL, "can't open file %ws", x->sval);
files[i].fname = tostring(x->sval);
files[i].type = a;
doit:
fprintf(files[i].fp, "%ws", s);
#ifndef gcos
fflush(files[i].fp); /* in case someone is waiting for the output */
#endif
tempfree(x);
}