Submitted-By: Jawaid Bazyar (baz...@netcom.com)
Posting-number: Volume 1, Source 97
Archive-Name: gno/util/awk.04
Architecture: 2gs,UNIX
Version-Number: 1.00
=run.c
-/****************************************************************
-Copyright (C) AT&T 1993
-All Rights Reserved
-
-Permission to use, copy, modify, and distribute this software and
-its documentation for any purpose and without fee is hereby
-granted, provided that the above copyright notice appear in all
-copies and that both that the copyright notice and this
-permission notice and warranty disclaimer appear in supporting
-documentation, and that the name of AT&T or any of its entities
-not be used in advertising or publicity pertaining to
-distribution of the software without specific, written prior
-permission.
-
-AT&T DISCLAIMS ALL WARRANTIES WITH REGARD TO THIS SOFTWARE,
-INCLUDING ALL IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS.
-IN NO EVENT SHALL AT&T OR ANY OF ITS ENTITIES BE LIABLE FOR ANY
-SPECIAL, INDIRECT OR CONSEQUENTIAL DAMAGES OR ANY DAMAGES
-WHATSOEVER RESULTING FROM LOSS OF USE, DATA OR PROFITS, WHETHER
-IN AN ACTION OF CONTRACT, NEGLIGENCE OR OTHER TORTIOUS ACTION,
-ARISING OUT OF OR IN CONNECTION WITH THE USE OR PERFORMANCE OF
-THIS SOFTWARE.
-****************************************************************/
-
-#ifdef __ORCAC__
-segment "run";
-#endif
-
-#define tempfree(x) if (istemp(x)) tfree(x); else
-
-#define DEBUG
-#include <stdio.h>
-#include <ctype.h>
-#include <setjmp.h>
-#include <math.h>
-#include <string.h>
-#include <stdlib.h>
-#include <time.h>
-#include "awk.h"
-#include "y.tab.h"
-
-#ifdef __ORCAC__
-#undef FOPEN_MAX
-#define FOPEN_MAX 40
-#endif
-
-#ifdef _NFILE
-#ifndef FOPEN_MAX
-#define FOPEN_MAX _NFILE
-#endif
-#endif
-
-#ifndef FOPEN_MAX
-#define FOPEN_MAX 40 /* max number of open files */
-#endif
-
-#ifndef RAND_MAX
-#define RAND_MAX 32767 /* all that ansi guarantees */
-#endif
-
-jmp_buf env;
-
-/* an attempt to go a bit faster: */
-
-/* #define execute(p) (isvalue(p) ? (Cell *)((p)->narg[0]) : r_execute(p)) */
-#define execute(p) r_execute(p)
-#define getfval(p) (((p)->tval & (ARR|FLD|REC|NUM)) == NUM ? (p)->fval : r_getfval(p))
-#define getsval(p) (((p)->tval & (ARR|FLD|REC|STR)) == STR ? (p)->sval : r_getsval(p))
-
-
-#define PA2NUM 29 /* max number of pat,pat patterns allowed */
-int paircnt; /* number of them in use */
-int pairstack[PA2NUM]; /* state of each pat,pat */
-
-Node *winner = NULL; /* root of parse tree */
-Cell *tmps; /* free temporary cells for execution */
-
-static Cell truecell ={ OBOOL, BTRUE, 0, 0, 1.0, NUM };
-Cell *true = &truecell;
-static Cell falsecell ={ OBOOL, BFALSE, 0, 0, 0.0, NUM };
-Cell *false = &falsecell;
-static Cell breakcell ={ OJUMP, JBREAK, 0, 0, 0.0, NUM };
-Cell *jbreak = &breakcell;
-static Cell contcell ={ OJUMP, JCONT, 0, 0, 0.0, NUM };
-Cell *jcont = &contcell;
-static Cell nextcell ={ OJUMP, JNEXT, 0, 0, 0.0, NUM };
-Cell *jnext = &nextcell;
-static Cell exitcell ={ OJUMP, JEXIT, 0, 0, 0.0, NUM };
-Cell *jexit = &exitcell;
-static Cell retcell ={ OJUMP, JRET, 0, 0, 0.0, NUM };
-Cell *jret = &retcell;
-static Cell tempcell ={ OCELL, CTEMP, 0, 0, 0.0, NUM };
-
-Node *curnode = NULL; /* the node being executed, for debugging */
-
-void run(Node *a) /* execution of parse tree starts here */
-{
- execute(a);
- closeall();
-}
-
-Cell *r_execute(Node *u) /* execute a node of the parse tree */
-{
- register Cell *(*proc)(Node **, int);
- register Cell *x;
- register Node *a;
-
- if (u == NULL)
- return(true);
- for (a = u; ; a = a->nnext) {
- curnode = a;
- if (isvalue(a)) {
- x = (Cell *) (a->narg[0]);
- if ((x->tval & FLD) && !donefld)
- fldbld();
- else if ((x->tval & REC) && !donerec)
- recbld();
- return(x);
- }
- if (notlegal(a->nobj)) /* probably a Cell* but too risky to print */
- ERROR "illegal statement" FATAL;
- proc = proctab[a->nobj-FIRSTTOKEN];
- x = (*proc)(a->narg, a->nobj);
- if ((x->tval & FLD) && !donefld)
- fldbld();
- else if ((x->tval & REC) && !donerec)
- recbld();
- if (isexpr(a))
- return(x);
- if (isjump(x))
- return(x);
- if (a->nnext == NULL)
- return(x);
- tempfree(x);
- }
-}
-
-
-Cell *program(Node **a, int n) /* execute an awk program */
-{ /* a[0] = BEGIN, a[1] = body, a[2] = END */
- register Cell *x;
-
- if (setjmp(env) != 0)
- goto ex;
- if (a[0]) { /* BEGIN */
- x = execute(a[0]);
- if (isexit(x))
- return(true);
- if (isjump(x))
- ERROR "illegal break, continue or next from BEGIN" FATAL;
- tempfree(x);
- }
- loop:
- if (a[1] || a[2])
- while (getrec(record) > 0) {
- x = execute(a[1]);
- if (isexit(x))
- break;
- tempfree(x);
- }
- ex:
- if (setjmp(env) != 0) /* handles exit within END */
- goto ex1;
- if (a[2]) { /* END */
- x = execute(a[2]);
- if (isbreak(x) || isnext(x) || iscont(x))
- ERROR "illegal break, next, or continue from END" FATAL;
- tempfree(x);
- }
- ex1:
- return(true);
-}
-
-struct Frame { /* stack frame for awk function calls */
- int nargs; /* number of arguments in this call */
- Cell *fcncell; /* pointer to Cell for function */
- Cell **args; /* pointer to array of arguments after execute */
- Cell *retval; /* return value */
-};
-
-#define NARGS 50 /* max args in a call */
-
-struct Frame *frame = NULL; /* base of stack frames; dynamically allocated */
-int nframe = 0; /* number of frames allocated */
-struct Frame *fp = NULL; /* frame pointer. bottom level unused */
-
-Cell *call(Node **a, int n) /* function call. very kludgy and fragile */
-{
- static Cell newcopycell = { OCELL, CCOPY, 0, (uchar *) "", 0.0, NUM|STR|DONTFREE };
- int i, ncall, ndef;
- Node *x;
-#ifdef __ORCAC__
- Cell **args, **oargs, *y, *z, *fcn;
-#else
- Cell *args[NARGS], *oargs[NARGS], *y, *z, *fcn;
-#endif
- uchar *s;
-
-#ifdef __ORCAC__
- args = malloc(sizeof(Cell *) * NARGS);
- oargs = malloc(sizeof(Cell *) * NARGS);
-#endif
- fcn = execute(a[0]); /* the function itself */
- s = fcn->nval;
- if (!isfunc(fcn))
- ERROR "calling undefined function %s", s FATAL;
- if (frame == NULL) {
- fp = frame = (struct Frame *) calloc(nframe += 100, sizeof(struct Frame));
- if (frame == NULL)
- ERROR "out of space for stack frames calling %s", s FATAL;
- }
- for (ncall = 0, x = a[1]; x != NULL; x = x->nnext) /* args in call */
- ncall++;
- ndef = (int) fcn->fval; /* args in defn */
- dprintf( ("calling %s, %d args (%d in defn), fp=%d\n", s, (int)ncall, (int)ndef, fp-frame) );
- if (ncall > ndef)
- ERROR "function %s called with %d args, uses only %d",
- s, ncall, ndef WARNING;
- if (ncall + ndef > NARGS)
- ERROR "function %s has %d arguments, limit %d", s, ncall+ndef, NARGS FATAL;
- for (i = 0, x = a[1]; x != NULL; i++, x = x->nnext) { /* get call args */
- dprintf( ("evaluate args[%d], fp=%d:\n",(int) i, (int)fp-frame) );
- y = execute(x);
- oargs[i] = y;
- dprintf( ("args[%d]: %s %f <%s>, t=%o\n",
- (int)i, y->nval, y->fval, isarr(y) ? "(array)" : (char*) y->sval, y->tval) );
- if (isfunc(y))
- ERROR "can't use function %s as argument in %s", y->nval, s FATAL;
- if (isarr(y))
- args[i] = y; /* arrays by ref */
- else
- args[i] = copycell(y);
- tempfree(y);
- }
- for ( ; i < ndef; i++) { /* add null args for ones not provided */
- args[i] = gettemp();
- *args[i] = newcopycell;
- }
- fp++; /* now ok to up frame */
- if (fp >= frame + nframe) {
- int dfp = fp - frame; /* old index */
- frame = (struct Frame *)
- realloc((char *) frame, (nframe += 100) * sizeof(struct Frame));
- if (frame == NULL)
- ERROR "out of space for stack frames in %s", s FATAL;
- fp = frame + dfp;
- }
- fp->fcncell = fcn;
- fp->args = args;
- fp->nargs = ndef; /* number defined with (excess are locals) */
- fp->retval = gettemp();
-
- dprintf( ("start exec of %s, fp=%d\n", s, (int)fp-frame) );
- y = execute((Node *)(fcn->sval)); /* execute body */
- dprintf( ("finished exec of %s, fp=%d\n", s, (int)fp-frame) );
-
- for (i = 0; i < ndef; i++) {
- Cell *t = fp->args[i];
- if (isarr(t)) {
- if (t->csub == CCOPY) {
- if (i >= ncall) {
- freesymtab(t);
- t->csub = CTEMP;
- } else {
- oargs[i]->tval = t->tval;
- oargs[i]->tval &= ~(STR|NUM|DONTFREE);
- oargs[i]->sval = t->sval;
- tempfree(t);
- }
- }
- } else if (t != y) { /* kludge to prevent freeing twice */
- t->csub = CTEMP;
- tempfree(t);
- }
- }
- tempfree(fcn);
-#ifdef __ORCAC__
- if (isexit(y) || isnext(y)) {
- free(args); free(oargs); return y;
- }
-#else
- if (isexit(y) || isnext(y))
- return y;
-#endif
- tempfree(y); /* this can free twice! */
- z = fp->retval; /* return value */
- dprintf( ("%s returns %g |%s| %o\n", s, getfval(z), getsval(z), (int)z->tval) );
- fp--;
-#ifdef __ORCAC__
- free(args);
- free(oargs);
-#endif
- return(z);
-}
-
-Cell *copycell(Cell *x) /* make a copy of a cell in a temp */
-{
- Cell *y;
-
- y = gettemp();
- y->csub = CCOPY; /* prevents freeing until call is over */
- y->nval = x->nval;
- y->sval = x->sval ? tostring(x->sval) : NULL;
- y->fval = x->fval;
- y->tval = x->tval & ~(CON|FLD|REC|DONTFREE); /* copy is not constant or field */
- /* is DONTFREE right? */
- return y;
-}
-
-Cell *arg(Node **a, int n) /* nth argument of a function */
-{
-
- n = (int) a[0]; /* argument number, counting from 0 */
- dprintf( ("arg(%d), fp->nargs=%d\n", (int)n, (int)fp->nargs) );
- if (n+1 > fp->nargs)
- ERROR "argument #%d of function %s was not supplied",
- n+1, fp->fcncell->nval FATAL;
- return fp->args[n];
-}
-
-Cell *jump(Node **a, int n) /* break, continue, next, continue, return */
-{
- register Cell *y;
-
- switch (n) {
- case EXIT:
- if (a[0] != NULL) {
- y = execute(a[0]);
- errorflag = getfval(y);
- tempfree(y);
- }
- longjmp(env, 1);
- case RETURN:
- if (a[0] != NULL) {
- y = execute(a[0]);
- if ((y->tval & (STR|NUM)) == (STR|NUM)) {
- setsval(fp->retval, getsval(y));
- fp->retval->fval = getfval(y);
- fp->retval->tval |= NUM;
- }
- else if (y->tval & STR)
- setsval(fp->retval, getsval(y));
- else if (y->tval & NUM)
- setfval(fp->retval, getfval(y));
- else /* can't happen */
- ERROR "bad type variable %d", y->tval FATAL;
- tempfree(y);
- }
- return(jret);
- case NEXT:
- return(jnext);
- case BREAK:
- return(jbreak);
- case CONTINUE:
- return(jcont);
- default: /* can't happen */
- ERROR "illegal jump type %d", n FATAL;
- }
- return 0; /* not reached */
-}
-
-Cell *getline(Node **a, int n) /* get next line from specific input */
-{ /* a[0] is variable, a[1] is operator, a[2] is filename */
- register Cell *r, *x;
-#ifdef __ORCAC__
- static uchar *buf = NULL;
-#else
- uchar buf[RECSIZE];
-#endif
- FILE *fp;
-
-#ifdef __ORCAC__
- if (buf == NULL) {
- buf = malloc(RECSIZE);
- }
-#endif
- fflush(stdout); /* in case someone is waiting for a prompt */
- r = gettemp();
- if (a[1] != NULL) { /* getline < file */
- x = execute(a[2]); /* filename */
- if ((int) a[1] == '|') /* input pipe */
- a[1] = (Node *) LE; /* arbitrary flag */
- fp = openfile((int) a[1], getsval(x));
- tempfree(x);
- if (fp == NULL)
- n = -1;
- else
- n = readrec(buf, sizeof(buf), fp);
- if (n <= 0) {
- ;
- } else if (a[0] != NULL) { /* getline var <file */
- setsval(execute(a[0]), buf);
- } else { /* getline <file */
- if (!(recloc->tval & DONTFREE))
- xfree(recloc->sval);
- strcpy(record, buf);
- recloc->sval = record;
- recloc->tval = REC | STR | DONTFREE;
- if (isnumber(recloc->sval)) {
- recloc->fval = atof(recloc->sval);
- recloc->tval |= NUM;
- }
- donerec = 1; donefld = 0;
- }
- } else { /* bare getline; use current input */
- if (a[0] == NULL) /* getline */
- n = getrec(record);
- else { /* getline var */
- n = getrec(buf);
- setsval(execute(a[0]), buf);
- }
- }
- setfval(r, (Awkfloat) n);
- return r;
-}
-
-Cell *getnf(Node **a, int n) /* get NF */
-{
- if (donefld == 0)
- fldbld();
- return (Cell *) a[0];
-}
-
-Cell *array(Node **a, int n) /* a[0] is symtab, a[1] is list of subscripts */
-{
- register Cell *x, *y, *z;
- register uchar *s;
- register Node *np;
-#ifdef __ORCAC__
- static uchar *buf = NULL;
-#else
- uchar buf[RECSIZE];
-#endif
-
-#ifdef __ORCAC__
- if (buf == NULL) buf = malloc(RECSIZE);
-#endif
- x = execute(a[0]); /* Cell* for symbol table */
- buf[0] = 0;
- for (np = a[1]; np; np = np->nnext) {
- y = execute(np); /* subscript */
- s = getsval(y);
- strcat(buf, s);
- if (np->nnext)
- strcat(buf, *SUBSEP);
- tempfree(y);
- }
- if (!isarr(x)) {
- dprintf( ("making %s into an array\n", x->nval) );
- if (freeable(x))
- xfree(x->sval);
- x->tval &= ~(STR|NUM|DONTFREE);
- x->tval |= ARR;
- x->sval = (uchar *) makesymtab(NSYMTAB);
- }
- z = setsymtab(buf, "", 0.0, STR|NUM, (Array *) x->sval);
- z->ctype = OCELL;
- z->csub = CVAR;
- tempfree(x);
- return(z);
-}
-
-Cell *adelete(Node **a, int n) /* a[0] is symtab, a[1] is list of subscripts */
-{
- Cell *x, *y;
- Node *np;
-#ifdef __ORCAC__
- static uchar *buf = NULL;
- uchar *s;
-#else
- uchar buf[RECSIZE], *s;
-#endif
-
-#ifdef __ORCAC__
- if (buf == NULL) buf = malloc(RECSIZE);
-#endif
- x = execute(a[0]); /* Cell* for symbol table */
- if (!isarr(x))
- return true;
- buf[0] = 0;
- for (np = a[1]; np; np = np->nnext) {
- y = execute(np); /* subscript */
- s = getsval(y);
- strcat(buf, s);
- if (np->nnext)
- strcat(buf, *SUBSEP);
- tempfree(y);
- }
- freeelem(x, buf);
- tempfree(x);
- return true;
-}
-
-Cell *intest(Node **a, int n) /* a[0] is index (list), a[1] is symtab */
-{
- register Cell *x, *ap, *k;
- Node *p;
-#ifdef __ORCAC__
- static char *buf = NULL;
-#else
- char buf[RECSIZE];
-#endif
- uchar *s;
-
-#ifdef __ORCAC__
- if (buf == NULL) buf = malloc(RECSIZE);
-#endif
- ap = execute(a[1]); /* array name */
- if (!isarr(ap)) {
- dprintf( ("making %s into an array\n", ap->nval) );
- if (freeable(ap))
- xfree(ap->sval);
- ap->tval &= ~(STR|NUM|DONTFREE);
- ap->tval |= ARR;
- ap->sval = (uchar *) makesymtab(NSYMTAB);
- }
- buf[0] = 0;
- for (p = a[0]; p; p = p->nnext) {
- x = execute(p); /* expr */
- s = getsval(x);
- strcat(buf, s);
- tempfree(x);
- if (p->nnext)
- strcat(buf, *SUBSEP);
- }
- k = lookup(buf, (Array *) ap->sval);
- tempfree(ap);
- if (k == NULL)
- return(false);
- else
- return(true);
-}
-
-
-Cell *matchop(Node **a, int n) /* ~ and match() */
-{
- register Cell *x, *y;
- register uchar *s, *t;
- register int i;
- fa *pfa;
- int (*mf)(fa *, uchar *) = match, mode = 0;
-
- if (n == MATCHFCN) {
- mf = pmatch;
- mode = 1;
- }
- x = execute(a[1]); /* a[1] = target text */
- s = getsval(x);
- if (a[0] == 0) /* a[1] == 0: already-compiled reg expr */
- i = (*mf)((fa *) a[2], s);
- else {
- y = execute(a[2]); /* a[2] = regular expr */
- t = getsval(y);
- pfa = makedfa(t, mode);
- i = (*mf)(pfa, s);
- tempfree(y);
- }
- tempfree(x);
- if (n == MATCHFCN) {
- int start = patbeg - s + 1;
- if (patlen < 0)
- start = 0;
- setfval(rstartloc, (Awkfloat) start);
- setfval(rlengthloc, (Awkfloat) patlen);
- x = gettemp();
- x->tval = NUM;
- x->fval = start;
- return x;
- } else if (n == MATCH && i == 1 || n == NOTMATCH && i == 0)
- return(true);
- else
- return(false);
-}
-
-
-Cell *boolop(Node **a, int n) /* a[0] || a[1], a[0] && a[1], !a[0] */
-{
- register Cell *x, *y;
- register int i;
-
- x = execute(a[0]);
- i = istrue(x);
- tempfree(x);
- switch (n) {
- case BOR:
- if (i) return(true);
- y = execute(a[1]);
- i = istrue(y);
- tempfree(y);
- if (i) return(true);
- else return(false);
- case AND:
- if ( !i ) return(false);
- y = execute(a[1]);
- i = istrue(y);
- tempfree(y);
- if (i) return(true);
- else return(false);
- case NOT:
- if (i) return(false);
- else return(true);
- default: /* can't happen */
- ERROR "unknown boolean operator %d", n FATAL;
- }
- return 0; /*NOTREACHED*/
-}
-
-Cell *relop(Node **a, int n) /* a[0 < a[1], etc. */
-{
- register int i;
- register Cell *x, *y;
- Awkfloat j;
-
- x = execute(a[0]);
- y = execute(a[1]);
- if (x->tval&NUM && y->tval&NUM) {
- j = x->fval - y->fval;
- i = j<0? -1: (j>0? 1: 0);
- } else {
- i = strcmp(getsval(x), getsval(y));
- }
- tempfree(x);
- tempfree(y);
- switch (n) {
- case LT: if (i<0) return(true);
- else return(false);
- case LE: if (i<=0) return(true);
- else return(false);
- case NE: if (i!=0) return(true);
- else return(false);
- case EQ: if (i == 0) return(true);
- else return(false);
- case GE: if (i>=0) return(true);
- else return(false);
- case GT: if (i>0) return(true);
- else return(false);
- default: /* can't happen */
- ERROR "unknown relational operator %d", n FATAL;
- }
- return 0; /*NOTREACHED*/
-}
-
-void tfree(Cell *a) /* free a tempcell */
-{
- if (freeable(a))
- xfree(a->sval);
- if (a == tmps)
- ERROR "tempcell list is curdled" FATAL;
- a->cnext = tmps;
- tmps = a;
-}
-
-Cell *gettemp(void) /* get a tempcell */
-{ int i;
- register Cell *x;
-
- if (!tmps) {
- tmps = (Cell *) calloc(100, sizeof(Cell));
- if (!tmps)
- ERROR "out of space for temporaries" FATAL;
- for(i = 1; i < 100; i++)
- tmps[i-1].cnext = &tmps[i];
- tmps[i-1].cnext = 0;
- }
- x = tmps;
- tmps = x->cnext;
- *x = tempcell;
- return(x);
-}
-
-Cell *indirect(Node **a, int n) /* $( a[0] ) */
-{
- register Cell *x;
- register int m;
- register uchar *s;
-
- x = execute(a[0]);
- m = getfval(x);
- if (m == 0 && !isnumber(s = getsval(x))) /* suspicion! */
- ERROR "illegal field $(%s), name \"%s\"", s, x->nval FATAL;
- /* can x->nval ever be null??? */
- /* ERROR "illegal field $(%s)", s FATAL; */
- tempfree(x);
- x = fieldadr(m);
- x->ctype = OCELL;
- x->csub = CFLD;
- return(x);
-}
-
-Cell *substr(Node **a, int nnn) /* substr(a[0], a[1], a[2]) */
-{
- register int k, m, n;
- register uchar *s;
- int temp;
- register Cell *x, *y, *z;
-
- x = execute(a[0]);
- y = execute(a[1]);
- if (a[2] != 0)
- z = execute(a[2]);
- s = getsval(x);
- k = strlen(s) + 1;
- if (k <= 1) {
- tempfree(x);
- tempfree(y);
- if (a[2] != 0)
- tempfree(z);
- x = gettemp();
- setsval(x, "");
- return(x);
- }
- m = getfval(y);
- if (m <= 0)
- m = 1;
- else if (m > k)
- m = k;
- tempfree(y);
- if (a[2] != 0) {
- n = getfval(z);
- tempfree(z);
- } else
- n = k - 1;
- if (n < 0)
- n = 0;
- else if (n > k - m)
- n = k - m;
- dprintf( ("substr: m=%d, n=%d, s=%s\n", (int)m, (int)n, s) );
- y = gettemp();
- temp = s[n+m-1]; /* with thanks to John Linderman */
- s[n+m-1] = '\0';
- setsval(y, s + m - 1);
- s[n+m-1] = temp;
- tempfree(x);
- return(y);
-}
-
-Cell *sindex(Node **a, int nnn) /* index(a[0], a[1]) */
-{
- register Cell *x, *y, *z;
- register uchar *s1, *s2, *p1, *p2, *q;
- Awkfloat v = 0.0;
-
- x = execute(a[0]);
- s1 = getsval(x);
- y = execute(a[1]);
- s2 = getsval(y);
-
- z = gettemp();
- for (p1 = s1; *p1 != '\0'; p1++) {
- for (q=p1, p2=s2; *p2 != '\0' && *q == *p2; q++, p2++)
- ;
- if (*p2 == '\0') {
- v = (Awkfloat) (p1 - s1 + 1); /* origin 1 */
- break;
- }
- }
- tempfree(x);
- tempfree(y);
- setfval(z, v);
- return(z);
-}
-
-int format(uchar *buf, int bufsize, uchar *s, Node *a) /* printf-like conversions */
-{
-#ifdef __ORCAC__
- static uchar *fmt = NULL;
-#else
- uchar fmt[RECSIZE];
-#endif
- register uchar *p, *t, *os;
- register Cell *x;
- int flag = 0, n;
-
-#ifdef __ORCAC__
- if (fmt == NULL) fmt = malloc(RECSIZE);
-#endif
- os = s;
- p = buf;
- while (*s) {
- if (p - buf >= bufsize)
- return -1;
- if (*s != '%') {
- *p++ = *s++;
- continue;
- }
- if (*(s+1) == '%') {
- *p++ = '%';
- s += 2;
- continue;
- }
- for (t=fmt; (*t++ = *s) != '\0'; s++) {
- if (isalpha(*s) && *s != 'l' && *s != 'h' && *s != 'L')
- break; /* the ansi panoply */
- if (*s == '*') {
- x = execute(a);
- a = a->nnext;
- sprintf((char *)t-1, "%d", (int) getfval(x));
- t = fmt + strlen(fmt);
- tempfree(x);
- }
- }
- *t = '\0';
- if (t >= fmt + sizeof(fmt))
- ERROR "format item %.30s... too long", os FATAL;
- switch (*s) {
- case 'f': case 'e': case 'g': case 'E': case 'G':
- flag = 1;
- break;
- case 'd': case 'i':
- flag = 2;
- if(*(s-1) == 'l') break;
- *(t-1) = 'l';
- *t = 'd';
- *++t = '\0';
- break;
- case 'o': case 'x': case 'X': case 'u':
- flag = *(s-1) == 'l' ? 2 : 3;
- break;
- case 's':
- flag = 4;
- break;
- case 'c':
- flag = 5;
- break;
- default:
- ERROR "weird printf conversion %s", fmt WARNING;
- flag = 0;
- break;
- }
- if (a == NULL)
- ERROR "not enough args in printf(%s)", os FATAL;
- x = execute(a);
- a = a->nnext;
- switch (flag) {
- case 0: sprintf((char *)p, "%s", fmt); /* unknown, so dump it too */
- p += strlen(p);
- sprintf((char *)p, "%s", getsval(x));
- break;
- case 1: sprintf((char *)p, (char *)fmt, getfval(x)); break;
- case 2: sprintf((char *)p, (char *)fmt, (long) getfval(x)); break;
- case 3: sprintf((char *)p, (char *)fmt, (int) getfval(x)); break;
- case 4:
- t = getsval(x);
- n = strlen(t);
- if (n >= bufsize)
- ERROR "huge string (%d chars) in printf %.30s...",
- n, t FATAL;
- sprintf((char *)p, (char *)fmt, t);
- break;
- case 5:
- isnum(x) ? sprintf((char *)p, (char *)fmt, (int) getfval(x))
- : sprintf((char *)p, (char *)fmt, getsval(x)[0]);
- break;
- }
- tempfree(x);
- p += strlen(p);
- s++;
- }
- *p = '\0';
- for ( ; a; a = a->nnext) /* evaluate any remaining args */
- execute(a);
- return 0;
-}
-
-Cell *asprintf(Node **a, int n) /* sprintf(a[0]) */
-{
- register Cell *x;
- register Node *y;
-#ifdef __ORCAC__
- static uchar *buf = NULL;
-#else
- static uchar buf[3*RECSIZE];
-#endif
-
-#ifdef __ORCAC__
- if (buf == NULL) buf = malloc(3*RECSIZE);
-#endif
-
- y = a[0]->nnext;
- x = execute(a[0]);
- if (format(buf, sizeof buf, getsval(x), y) == -1)
- ERROR "sprintf string %.30s... too long", buf FATAL;
- tempfree(x);
- x = gettemp();
- x->sval = tostring(buf);
- x->tval = STR;
- return(x);
-}
-
-Cell *aprintf(Node **a, int n) /* printf */
-{ /* a[0] is list of args, starting with format string */
- /* a[1] is redirection operator, a[2] is redirection file */
- FILE *fp;
- register Cell *x;
- register Node *y;
-#ifndef __ORCAC__
- static uchar buf[3*RECSIZE];
-#else
- static uchar *buf = NULL;
-
- if (buf == NULL) buf = malloc(3*RECSIZE);
-#endif
-
- y = a[0]->nnext;
- x = execute(a[0]);
- if (format(buf, sizeof buf, getsval(x), y) == -1)
- ERROR "printf string %.30s... too long", buf FATAL;
- tempfree(x);
- if (a[1] == NULL) {
- fputs((char *)buf, stdout);
- if (ferror(stdout))
- ERROR "write error on stdout" FATAL;
- } else {
- fp = redirect((int)a[1], a[2]);
- fputs((char *)buf, fp);
- fflush(fp);
- if (ferror(fp))
- ERROR "write error on %s", filename(fp) FATAL;
- }
- return(true);
-}
-
-Cell *arith(Node **a, int n) /* a[0] + a[1], etc. also -a[0] */
-{
- Awkfloat i, j;
- int v;
- register Cell *x, *y, *z;
-
- x = execute(a[0]);
- i = getfval(x);
- tempfree(x);
- if (n != UMINUS) {
- y = execute(a[1]);
- j = getfval(y);
- tempfree(y);
- }
- z = gettemp();
- switch (n) {
- case ADD:
- i += j;
- break;
- case MINUS:
- i -= j;
- break;
- case MULT:
- i *= j;
- break;
- case DIVIDE:
- if (j == 0)
- ERROR "division by zero" FATAL;
- i /= j;
- break;
- case MOD:
- if (j == 0)
- ERROR "division by zero in mod" FATAL;
- modf((extended)i/j, &v);
- i = i - j * v;
- break;
- case UMINUS:
- i = -i;
- break;
- case POWER:
- if (j >= 0 && modf((extended)j, &v) == 0.0) /* pos integer exponent */
- i = ipow(i, (int) j);
- else
- i = errcheck(pow(i, j), "pow");
- break;
- default: /* can't happen */
- ERROR "illegal arithmetic operator %d", n FATAL;
- }
- setfval(z, i);
- return(z);
-}
-
-double ipow(double x, int n) /* x**n. ought to be done by pow, but isn't always */
-{
- double v;
-
- if (n <= 0)
- return 1;
- v = ipow(x, n/2);
- if (n % 2 == 0)
- return v * v;
- else
- return x * v * v;
-}
-
-Cell *incrdecr(Node **a, int n) /* a[0]++, etc. */
-{
- register Cell *x, *z;
- register int k;
- Awkfloat xf;
-
- x = execute(a[0]);
- xf = getfval(x);
- k = (n == PREINCR || n == POSTINCR) ? 1 : -1;
- if (n == PREINCR || n == PREDECR) {
- setfval(x, xf + k);
- return(x);
- }
- z = gettemp();
- setfval(z, xf);
- setfval(x, xf + k);
- tempfree(x);
- return(z);
-}
-
-Cell *assign(Node **a, int n) /* a[0] = a[1], a[0] += a[1], etc. */
-{ /* this is subtle; don't muck with it. */
- register Cell *x, *y;
- Awkfloat xf, yf;
- int v;
-
- y = execute(a[1]);
- x = execute(a[0]);
- if (n == ASSIGN) { /* ordinary assignment */
- if (x == y && !(x->tval & (FLD|REC))) /* self-assignment: */
- ; /* leave alone unless it's a field */
- else if ((y->tval & (STR|NUM)) == (STR|NUM)) {
- setsval(x, getsval(y));
- x->fval = getfval(y);
- x->tval |= NUM;
- }
- else if (y->tval & STR)
- setsval(x, getsval(y));
- else if (y->tval & NUM)
- setfval(x, getfval(y));
- else
- funnyvar(y, "read value of");
- tempfree(y);
- return(x);
- }
- xf = getfval(x);
- yf = getfval(y);
- switch (n) {
- case ADDEQ:
- xf += yf;
- break;
- case SUBEQ:
- xf -= yf;
- break;
- case MULTEQ:
- xf *= yf;
- break;
- case DIVEQ:
- if (yf == 0)
- ERROR "division by zero in /=" FATAL;
- xf /= yf;
- break;
- case MODEQ:
- if (yf == 0)
- ERROR "division by zero in %%=" FATAL;
- modf((extended)xf/yf, &v);
- xf = xf - yf * v;
- break;
- case POWEQ:
- if (yf >= 0 && modf((extended)yf, &v) == 0.0) /* pos integer exponent */
- xf = ipow(xf, (int) yf);
- else
- xf = errcheck(pow(xf, yf), "pow");
- break;
- default:
- ERROR "illegal assignment operator %d", n FATAL;
- break;
- }
- tempfree(y);
- setfval(x, xf);
- return(x);
-}
-
-Cell *cat(Node **a, int q) /* a[0] cat a[1] */
-{
- register Cell *x, *y, *z;
- register int n1, n2;
- register uchar *s;
-
- x = execute(a[0]);
- y = execute(a[1]);
- getsval(x);
- getsval(y);
- n1 = strlen(x->sval);
- n2 = strlen(y->sval);
- s = (uchar *) malloc(n1 + n2 + 1);
- if (s == NULL)
- ERROR "out of space concatenating %.15s... and %.15s...",
- x->sval, y->sval FATAL;
- strcpy(s, x->sval);
- strcpy(s+n1, y->sval);
- tempfree(y);
- z = gettemp();
- z->sval = s;
- z->tval = STR;
- tempfree(x);
- return(z);
-}
-
-Cell *pastat(Node **a, int n) /* a[0] { a[1] } */
-{
- register Cell *x;
-
- if (a[0] == 0)
- x = execute(a[1]);
- else {
- x = execute(a[0]);
- if (istrue(x)) {
- tempfree(x);
- x = execute(a[1]);
- }
- }
- return x;
-}
-
-Cell *dopa2(Node **a, int n) /* a[0], a[1] { a[2] } */
-{
- register Cell *x;
- register int pair;
-
- pair = (int) a[3];
- if (pairstack[pair] == 0) {
- x = execute(a[0]);
- if (istrue(x))
- pairstack[pair] = 1;
- tempfree(x);
- }
- if (pairstack[pair] == 1) {
- x = execute(a[1]);
- if (istrue(x))
- pairstack[pair] = 0;
- tempfree(x);
- x = execute(a[2]);
- return(x);
- }
- return(false);
-}
-
-Cell *split(Node **a, int nnn) /* split(a[0], a[1], a[2]); a[3] is type */
-{
- Cell *x, *y, *ap;
- register uchar *s;
- register int sep;
- uchar *t, temp, num[10], *fs;
- int n, tempstat;
-
- y = execute(a[0]); /* source string */
- s = getsval(y);
- if (a[2] == 0) /* fs string */
- fs = *FS;
- else if ((int) a[3] == STRING) { /* split(str,arr,"string") */
- x = execute(a[2]);
- fs = getsval(x);
- } else if ((int) a[3] == REGEXPR)
- fs = (uchar*) "(regexpr)"; /* split(str,arr,/regexpr/) */
- else
- ERROR "illegal type of split()" FATAL;
- sep = *fs;
- ap = execute(a[1]); /* array name */
- freesymtab(ap);
- dprintf( ("split: s=|%s|, a=%s, sep=|%s|\n", s, ap->nval, fs) );
- ap->tval &= ~STR;
- ap->tval |= ARR;
- ap->sval = (uchar *) makesymtab(NSYMTAB);
-
- n = 0;
- if (*s != '\0' && strlen(fs) > 1 || (int) a[3] == REGEXPR) { /* reg expr */
- fa *pfa;
- if ((int) a[3] == REGEXPR) { /* it's ready already */
- pfa = (fa *) a[2];
- } else {
- pfa = makedfa(fs, 1);
- }
- if (nematch(pfa,s)) {
- tempstat = pfa->initstat;
- pfa->initstat = 2;
- do {
- n++;
- sprintf((char *)num, "%d", n);
- temp = *patbeg;
- *patbeg = '\0';
- if (isnumber(s))
- setsymtab(num, s, atof((char *)s), STR|NUM, (Array *) ap->sval);
- else
- setsymtab(num, s, 0.0, STR, (Array *) ap->sval);
- *patbeg = temp;
- s = patbeg + patlen;
- if (*(patbeg+patlen-1) == 0 || *s == 0) {
- n++;
- sprintf((char *)num, "%d", n);
- setsymtab(num, "", 0.0, STR, (Array *) ap->sval);
- pfa->initstat = tempstat;
- goto spdone;
- }
- } while (nematch(pfa,s));
- }
- n++;
- sprintf((char *)num, "%d", n);
- if (isnumber(s))
- setsymtab(num, s, atof((char *)s), STR|NUM, (Array *) ap->sval);
- else
- setsymtab(num, s, 0.0, STR, (Array *) ap->sval);
- spdone:
- pfa = NULL;
- } else if (sep == ' ') {
- for (n = 0; ; ) {
- while (*s == ' ' || *s == '\t' || *s == '\n')
- s++;
- if (*s == 0)
- break;
- n++;
- t = s;
- do
- s++;
- while (*s!=' ' && *s!='\t' && *s!='\n' && *s!='\0');
- temp = *s;
- *s = '\0';
- sprintf((char *)num, "%d", n);
- if (isnumber(t))
- setsymtab(num, t, atof((char *)t), STR|NUM, (Array *) ap->sval);
- else
- setsymtab(num, t, 0.0, STR, (Array *) ap->sval);
- *s = temp;
- if (*s != 0)
- s++;
- }
- } else if (*s != 0) {
- for (;;) {
- n++;
- t = s;
- while (*s != sep && *s != '\n' && *s != '\0')
- s++;
- temp = *s;
- *s = '\0';
- sprintf((char *)num, "%d", n);
- if (isnumber(t))
- setsymtab(num, t, atof((char *)t), STR|NUM, (Array *) ap->sval);
- else
- setsymtab(num, t, 0.0, STR, (Array *) ap->sval);
- *s = temp;
- if (*s++ == 0)
- break;
- }
- }
- tempfree(ap);
- tempfree(y);
- if (a[2] != 0 && (int) a[3] == STRING)
- tempfree(x);
- x = gettemp();
- x->tval = NUM;
- x->fval = n;
- return(x);
-}
-
-Cell *condexpr(Node **a, int n) /* a[0] ? a[1] : a[2] */
-{
- register Cell *x;
-
- x = execute(a[0]);
- if (istrue(x)) {
- tempfree(x);
- x = execute(a[1]);
- } else {
- tempfree(x);
- x = execute(a[2]);
- }
- return(x);
-}
-
-Cell *ifstat(Node **a, int n) /* if (a[0]) a[1]; else a[2] */
-{
- register Cell *x;
-
- x = execute(a[0]);
- if (istrue(x)) {
- tempfree(x);
- x = execute(a[1]);
- } else if (a[2] != 0) {
- tempfree(x);
- x = execute(a[2]);
- }
- return(x);
-}
-
-Cell *whilestat(Node **a, int n) /* while (a[0]) a[1] */
-{
- register Cell *x;
-
- for (;;) {
- x = execute(a[0]);
- if (!istrue(x))
- return(x);
- tempfree(x);
- x = execute(a[1]);
- if (isbreak(x)) {
- x = true;
- return(x);
- }
- if (isnext(x) || isexit(x) || isret(x))
- return(x);
- tempfree(x);
- }
-}
-
-Cell *dostat(Node **a, int n) /* do a[0]; while(a[1]) */
-{
- register Cell *x;
-
- for (;;) {
- x = execute(a[0]);
- if (isbreak(x))
- return true;
- if (isnext(x) || isexit(x) || isret(x))
- return(x);
- tempfree(x);
- x = execute(a[1]);
- if (!istrue(x))
- return(x);
- tempfree(x);
- }
-}
-
-Cell *forstat(Node **a, int n) /* for (a[0]; a[1]; a[2]) a[3] */
-{
- register Cell *x;
-
- x = execute(a[0]);
- tempfree(x);
- for (;;) {
- if (a[1]!=0) {
- x = execute(a[1]);
- if (!istrue(x)) return(x);
- else tempfree(x);
- }
- x = execute(a[3]);
- if (isbreak(x)) /* turn off break */
- return true;
- if (isnext(x) || isexit(x) || isret(x))
- return(x);
- tempfree(x);
- x = execute(a[2]);
- tempfree(x);
- }
-}
-
-Cell *instat(Node **a, int n) /* for (a[0] in a[1]) a[2] */
-{
- register Cell *x, *vp, *arrayp, *cp, *ncp;
- Array *tp;
- int i;
-
- vp = execute(a[0]);
- arrayp = execute(a[1]);
- if (!isarr(arrayp)) {
- return true;
- }
- tp = (Array *) arrayp->sval;
- tempfree(arrayp);
- for (i = 0; i < tp->size; i++) { /* this routine knows too much */
- for (cp = tp->tab[i]; cp != NULL; cp = ncp) {
- setsval(vp, cp->nval);
- ncp = cp->cnext;
- x = execute(a[2]);
- if (isbreak(x)) {
- tempfree(vp);
- return true;
- }
- if (isnext(x) || isexit(x) || isret(x)) {
- tempfree(vp);
- return(x);
- }
- tempfree(x);
- }
- }
- return true;
-}
-
-/* if someone ever wants to run over the arrays in sorted order, */
-/* here it is. but it will likely run slower, not faster. */
-
-/*
- *int qstrcmp(p, q)
- * uchar **p, **q;
- *{
- * return strcmp(*p, *q);
- *}
- */
-
-/*Cell *instat(Node **a, int n) /* for (a[0] in a[1]) a[2] */
-/*{
-/* register Cell *x, *vp, *arrayp, *cp, *ncp, *ret;
-/* Array *tp;
-/* int i, ne;
-/*#define BIGENOUGH 1000
-/* uchar *elems[BIGENOUGH], **ep;
-/*
-/* vp = execute(a[0]);
-/* arrayp = execute(a[1]);
-/* if (!isarr(arrayp))
-/* ERROR "%s is not an array", arrayp->nval FATAL;
-/* tp = (Array *) arrayp->sval;
-/* tempfree(arrayp);
-/* ep = elems;
-/* ret = true;
-/* if (tp->nelem >= BIGENOUGH)
-/* ep = (uchar **) malloc(tp->nelem * sizeof(char *));
-/*
-/* for (i = ne = 0; i < tp->size; i++)
-/* for (cp = tp->tab[i]; cp != NULL; cp = cp->cnext)
-/* ep[ne++] = cp->nval;
-/* if (ne != tp->nelem)
-/* ERROR "can't happen: lost elems %d vs. %d", ne, tp->nelem FATAL;
-/* qsort(ep, ne, sizeof(char *), qstrcmp);
-/* for (i = 0; i < ne; i++) {
-/* setsval(vp, ep[i]);
-/* x = execute(a[2]);
-/* if (isbreak(x)) {
-/* tempfree(vp);
-/* break;
-/* }
-/* if (isnext(x) || isexit(x) || isret(x)) {
-/* tempfree(vp);
-/* ret = x;
-/* break;
-/* }
-/* tempfree(x);
-/* }
-/* if (ep != elems)
-/* free(ep);
-/* return ret;
-/*}
-*/
-
-
-Cell *bltin(Node **a, int n) /* builtin functions. a[0] is type, a[1] is arg list */
-{
- register Cell *x, *y;
- /*Awkfloat u;*/
- int u;
- register int t;
-#ifdef __ORCAC__
- uchar *p;
- static uchar *buf = NULL;
-#else
- uchar *p, buf[RECSIZE];
-#endif
- Node *nextarg;
- FILE *fp;
-
-#ifdef __ORCAC__
- if (buf == NULL) buf = malloc(RECSIZE);
-#endif
- t = (int) a[0];
- x = execute(a[1]);
- nextarg = a[1]->nnext;
- switch (t) {
- case FLENGTH:
- u = strlen(getsval(x)); break;
- case FLOG:
- u = errcheck(log(getfval(x)), "log"); break;
- case FINT:
- modf((extended)getfval(x), &u); break;
- case FEXP:
- u = errcheck(exp(getfval(x)), "exp"); break;
- case FSQRT:
- u = errcheck(sqrt(getfval(x)), "sqrt"); break;
- case FSIN:
- u = sin(getfval(x)); break;
- case FCOS:
- u = cos(getfval(x)); break;
- case FATAN:
- if (nextarg == 0) {
- ERROR "atan2 requires two arguments; returning 1.0" WARNING;
- u = 1.0;
- } else {
- y = execute(a[1]->nnext);
- u = atan2(getfval(x), getfval(y));
- tempfree(y);
- nextarg = nextarg->nnext;
- }
- break;
- case FSYSTEM:
- fflush(stdout); /* in case something is buffered already */
- u = (Awkfloat) system((char *)getsval(x)) / 256; /* 256 is unix-dep */
- break;
- case FRAND:
- /* in principle, rand() returns something in 0..RAND_MAX */
- u = (Awkfloat) (rand() % RAND_MAX) / RAND_MAX;
- break;
- case FSRAND:
- if (x->tval & REC) /* no argument provided */
- u = (int) time(NULL);
- else
- u = getfval(x);
- srand((int) u); u = (int) u;
- break;
- case FTOUPPER:
- case FTOLOWER:
- strcpy(buf, getsval(x));
- if (t == FTOUPPER) {
- for (p = buf; *p; p++)
- if (islower(*p))
- *p = toupper(*p);
- } else {
- for (p = buf; *p; p++)
- if (isupper(*p))
- *p = tolower(*p);
- }
- tempfree(x);
- x = gettemp();
- setsval(x, buf);
- return x;
- case FFLUSH:
- if ((fp = openfile(GT, getsval(x))) == NULL)
- u = EOF;
- else
- u = fflush(fp);
- break;
- default: /* can't happen */
- ERROR "illegal function type %d", t FATAL;
- break;
- }
- tempfree(x);
- x = gettemp();
- setfval(x, u);
- if (nextarg != 0) {
- ERROR "warning: function has too many arguments" WARNING;
- for ( ; nextarg; nextarg = nextarg->nnext)
- execute(nextarg);
- }
- return(x);
-}
-
-Cell *printstat(Node **a, int n) /* print a[0] */
-{
- register Node *x;
- register Cell *y;
- FILE *fp;
-
- if (a[1] == 0) /* a[1] is redirection operator, a[2] is file */
- fp = stdout;
- else
- fp = redirect((int)a[1], a[2]);
- for (x = a[0]; x != NULL; x = x->nnext) {
- y = execute(x);
- fputs((char *)getsval(y), fp);
- tempfree(y);
- if (x->nnext == NULL)
- fputs((char *)*ORS, fp);
- else
- fputs((char *)*OFS, fp);
- }
- if (a[1] != 0)
- fflush(fp);
- if (ferror(fp))
- ERROR "write error on %s", filename(fp) FATAL;
- return(true);
-}
-
-Cell *nullproc(Node **a, int n)
-{
- n;
- a;
- return 0;
-}
-
-
-FILE *redirect(int a, Node *b) /* set up all i/o redirections */
-{
- FILE *fp;
- Cell *x;
- uchar *fname;
-
- x = execute(b);
- fname = getsval(x);
- fp = openfile(a, fname);
- if (fp == NULL)
- ERROR "can't open file %s", fname FATAL;
- tempfree(x);
- return fp;
-}
-
-struct files {
- FILE *fp;
- uchar *fname;
- int mode; /* '|', 'a', 'w' => LE/LT, GT */
-} files[FOPEN_MAX] ={
- { NULL /*stdin*/, "/dev/stdin", LT }, /* watch out: don't free this! */
- { NULL /*stdout*/, "/dev/stdout", GT },
- { NULL /*stderr*/, "/dev/stderr", GT }
-};
-
-void initfiles(void)
-{
- files[0].fp = stdin;
- files[1].fp = stdout;
- files[2].fp = stderr;
-}
-
-FILE *openfile(int a, uchar *us)
-{
- char *s = us;
- register int i, m;
- register FILE *fp;
-
- if (*s == '\0')
- ERROR "null file name in print or getline" FATAL;
- for (i=0; i < FOPEN_MAX; i++)
- if (files[i].fname && strcmp(s, files[i].fname) == 0)
- if (a == files[i].mode || a==APPEND && files[i].mode==GT)
- return files[i].fp;
- for (i=0; i < FOPEN_MAX; i++)
- if (files[i].fp == 0)
- break;
- if (i >= FOPEN_MAX)
- ERROR "%s makes too many open files", s FATAL;
- fflush(stdout); /* force a semblance of order */
- m = a;
- if (a == GT) {
- fp = fopen(s, "w");
- } else if (a == APPEND) {
- fp = fopen(s, "a");
- m = GT; /* so can mix > and >> */
- } else if (a == '|') { /* output pipe */
- fp = popen(s, "w");
- } else if (a == LE) { /* input pipe */
- fp = popen(s, "r");
- } else if (a == LT) { /* getline <file */
- fp = strcmp(s, "-") == 0 ? stdin : fopen(s, "r"); /* "-" is stdin */
- } else /* can't happen */
- ERROR "illegal redirection %d", a FATAL;
- if (fp != NULL) {
- files[i].fname = tostring(s);
- files[i].fp = fp;
- files[i].mode = m;
- }
- return fp;
-}
-
-uchar *filename(FILE *fp)
-{
- int i;
-
- for (i = 0; i < FOPEN_MAX; i++)
- if (fp == files[i].fp)
- return files[i].fname;
- return "???";
-}
-
-Cell *closefile(Node **a, int n)
-{
- register Cell *x;
- int i, stat;
-
- n;
- x = execute(a[0]);
- getsval(x);
- for (i = 0; i < FOPEN_MAX; i++)
- if (files[i].fname && strcmp(x->sval, files[i].fname) == 0) {
- if (ferror(files[i].fp))
- ERROR "i/o error occurred on %s", files[i].fname WARNING;
- if (files[i].mode == '|' || files[i].mode == LE)
- stat = pclose(files[i].fp);
- else
- stat = fclose(files[i].fp);
- if (stat == EOF)
- ERROR "i/o error occurred closing %s", files[i].fname WARNING;
- if (i > 2) /* don't do /dev/std... */
- xfree(files[i].fname);
- files[i].fname = NULL; /* watch out for ref thru this */
- files[i].fp = NULL;
- }
- tempfree(x);
- return(true);
-}
-
-void closeall(void)
-{
- int i, stat;
-
- for (i = 0; i < FOPEN_MAX; i++)
- if (files[i].fp) {
- if (ferror(files[i].fp))
- ERROR "i/o error occurred on %s", files[i].fname WARNING;
- if (files[i].mode == '|' || files[i].mode == LE)
- stat = pclose(files[i].fp);
- else
- stat = fclose(files[i].fp);
- if (stat == EOF)
- ERROR "i/o error occurred while closing %s", files[i].fname WARNING;
- }
-}
-
-#define SUBSIZE (20 * RECSIZE)
-
-Cell *sub(Node **a, int nnn) /* substitute command */
-{
- register uchar *sptr, *pb, *q;
- register Cell *x, *y, *result;
-#ifdef __ORCAC__
- uchar *buf,*t;
-#else
- uchar buf[SUBSIZE], *t;
-#endif
- fa *pfa;
-
-#ifdef __ORCAC__
- buf = malloc(SUBSIZE);
-#endif
- x = execute(a[3]); /* target string */
- t = getsval(x);
- if (a[0] == 0) /* 0 => a[1] is already-compiled regexpr */
- pfa = (fa *) a[1]; /* regular expression */
- else {
- y = execute(a[1]);
- pfa = makedfa(getsval(y), 1);
- tempfree(y);
- }
- y = execute(a[2]); /* replacement string */
- result = false;
- if (pmatch(pfa, t)) {
- pb = buf;
- sptr = t;
- while (sptr < patbeg)
- *pb++ = *sptr++;
- sptr = getsval(y);
- while (*sptr != 0 && pb < buf + SUBSIZE - 1)
- if (*sptr == '\\' && *(sptr+1) == '&') {
- sptr++; /* skip \, */
- *pb++ = *sptr++; /* add & */
- } else if (*sptr == '&') {
- sptr++;
- for (q = patbeg; q < patbeg+patlen; )
- *pb++ = *q++;
- } else
- *pb++ = *sptr++;
- *pb = '\0';
- if (pb >= buf + SUBSIZE)
- ERROR "sub() result %30s too big", buf FATAL;
- sptr = patbeg + patlen;
- if ((patlen == 0 && *patbeg) || (patlen && *(sptr-1)))
- while (*pb++ = *sptr++)
- ;
- if (pb >= buf + SUBSIZE)
- ERROR "sub() result %.30s too big", buf FATAL;
- setsval(x, buf);
- result = true;;
- }
- tempfree(x);
- tempfree(y);
-#ifdef __ORCAC__
- free(buf);
-#endif
- return result;
-}
-
-Cell *gsub(Node **a, int nnn) /* global substitute */
-{
- register Cell *x, *y;
- register uchar *rptr, *sptr, *t, *pb;
-#ifdef __ORCAC__
- uchar *buf;
-#else
- uchar buf[SUBSIZE];
-#endif
- register fa *pfa;
- int mflag, tempstat, num;
-
-#ifdef __ORCAC__
- buf = malloc(SUBSIZE);
-#endif
- mflag = 0; /* if mflag == 0, can replace empty string */
- num = 0;
- x = execute(a[3]); /* target string */
- t = getsval(x);
- if (a[0] == 0) /* 0 => a[1] is already-compiled regexpr */
- pfa = (fa *) a[1]; /* regular expression */
- else {
- y = execute(a[1]);
- pfa = makedfa(getsval(y), 1);
- tempfree(y);
- }
- y = execute(a[2]); /* replacement string */
- if (pmatch(pfa, t)) {
- tempstat = pfa->initstat;
- pfa->initstat = 2;
- pb = buf;
- rptr = getsval(y);
- do {
- /*
- uchar *p;
- int i;
- printf("target string: %s, *patbeg = %o, patlen = %d\n",
- t, *patbeg, patlen);
- printf(" match found: ");
- p=patbeg;
- for (i=0; i<patlen; i++)
- printf("%c", *p++);
- printf("\n");
- */
- if (patlen == 0 && *patbeg != 0) { /* matched empty string */
- if (mflag == 0) { /* can replace empty */
- num++;
- sptr = rptr;
- while (*sptr != 0 && pb < buf + SUBSIZE-1)
- if (*sptr == '\\' && *(sptr+1) == '&') {
- sptr++;
- *pb++ = *sptr++;
- } else if (*sptr == '&') {
- uchar *q;
- sptr++;
- for (q = patbeg; q < patbeg+patlen; )
- *pb++ = *q++;
- } else
- *pb++ = *sptr++;
- }
- if (*t == 0) /* at end */
- goto done;
- *pb++ = *t++;
- if (pb >= buf + SUBSIZE-1)
- ERROR "gsub() result %.30s too big", buf FATAL;
- mflag = 0;
- }
- else { /* matched nonempty string */
- num++;
- sptr = t;
- while (sptr < patbeg && pb < buf + SUBSIZE-1)
- *pb++ = *sptr++;
- sptr = rptr;
- while (*sptr != 0 && pb < buf + SUBSIZE-1)
- if (*sptr == '\\' && *(sptr+1) == '&') {
- sptr++;
- *pb++ = *sptr++;
- } else if (*sptr == '&') {
- uchar *q;
- sptr++;
- for (q = patbeg; q < patbeg+patlen; )
- *pb++ = *q++;
- } else
- *pb++ = *sptr++;
- t = patbeg + patlen;
- if ((*(t-1) == 0) || (*t == 0))
- goto done;
- if (pb >= buf + SUBSIZE-1)
- ERROR "gsub() result %.30s too big", buf FATAL;
- mflag = 1;
- }
- } while (pmatch(pfa,t));
- sptr = t;
- while (*pb++ = *sptr++)
- ;
- done: if (pb >= buf + SUBSIZE-1)
- ERROR "gsub() result %.30s too big", buf FATAL;
- *pb = '\0';
- setsval(x, buf);
- pfa->initstat = tempstat;
- }
- tempfree(x);
- tempfree(y);
-#ifdef __ORCAC__
- free(buf);
-#endif
- x = gettemp();
- x->tval = NUM;
- x->fval = num;
- return(x);
-}
=awk.lx.l
-%Start A str sc reg comment
-
-%{
-/****************************************************************
-Copyright (C) AT&T 1993
-All Rights Reserved
-
-Permission to use, copy, modify, and distribute this software and
-its documentation for any purpose and without fee is hereby
-granted, provided that the above copyright notice appear in all
-copies and that both that the copyright notice and this
-permission notice and warranty disclaimer appear in supporting
-documentation, and that the name of AT&T or any of its entities
-not be used in advertising or publicity pertaining to
-distribution of the software without specific, written prior
-permission.
-
-AT&T DISCLAIMS ALL WARRANTIES WITH REGARD TO THIS SOFTWARE,
-INCLUDING ALL IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS.
-IN NO EVENT SHALL AT&T OR ANY OF ITS ENTITIES BE LIABLE FOR ANY
-SPECIAL, INDIRECT OR CONSEQUENTIAL DAMAGES OR ANY DAMAGES
-WHATSOEVER RESULTING FROM LOSS OF USE, DATA OR PROFITS, WHETHER
-IN AN ACTION OF CONTRACT, NEGLIGENCE OR OTHER TORTIOUS ACTION,
-ARISING OUT OF OR IN CONNECTION WITH THE USE OR PERFORMANCE OF
-THIS SOFTWARE.
-****************************************************************/
-
-/* some of this depends on behavior of lex that
- may not be preserved in other implementations of lex.
-*/
-
-#undef input /* defeat lex */
-#undef unput
-
-#include <stdlib.h>
-#include <string.h>
-#include "awk.h"
-#include "y.tab.h"
-
-extern YYSTYPE yylval;
-extern int infunc;
-
-int lineno = 1;
-int bracecnt = 0;
-int brackcnt = 0;
-int parencnt = 0;
-#define DEBUG
-#ifdef DEBUG
-# define RET(x) {if(dbg)printf("lex %s [%s]\n", tokname(x), yytext); return(x); }
-#else
-# define RET(x) return(x)
-#endif
-
-#define CADD cbuf[clen++] = yytext[0]; \
- if (clen >= CBUFLEN-1) { \
- ERROR "string/reg expr %.30s... too long", cbuf SYNTAX; \
- BEGIN A; \
- }
-
-uchar cbuf[CBUFLEN];
-uchar *s;
-int clen, cflag;
-%}
-
-A [a-zA-Z_]
-B [a-zA-Z0-9_]
-D [0-9]
-O [0-7]
-H [0-9a-fA-F]
-WS [ \t]
-
-%%
- switch (yybgin-yysvec-1) { /* witchcraft */
- case 0:
- BEGIN A;
- break;
- case sc:
- BEGIN A;
- RET('}');
- }
-
-<A>\n { lineno++; RET(NL); }
-<A>#.* { ; } /* strip comments */
-<A>{WS}+ { ; }
-<A>; { RET(';'); }
-
-<A>"\\"\n { lineno++; }
-<A>BEGIN { RET(XBEGIN); }
-<A>END { RET(XEND); }
-<A>func(tion)? { if (infunc) ERROR "illegal nested function" SYNTAX; RET(FUNC); }
-<A>return { if (!infunc) ERROR "return not in function" SYNTAX; RET(RETURN); }
-<A>"&&" { RET(AND); }
-<A>"||" { RET(BOR); }
-<A>"!" { RET(NOT); }
-<A>"!=" { yylval.i = NE; RET(NE); }
-<A>"~" { yylval.i = MATCH; RET(MATCHOP); }
-<A>"!~" { yylval.i = NOTMATCH; RET(MATCHOP); }
-<A>"<" { yylval.i = LT; RET(LT); }
-<A>"<=" { yylval.i = LE; RET(LE); }
-<A>"==" { yylval.i = EQ; RET(EQ); }
-<A>">=" { yylval.i = GE; RET(GE); }
-<A>">" { yylval.i = GT; RET(GT); }
-<A>">>" { yylval.i = APPEND; RET(APPEND); }
-<A>"++" { yylval.i = INCR; RET(INCR); }
-<A>"--" { yylval.i = DECR; RET(DECR); }
-<A>"+=" { yylval.i = ADDEQ; RET(ASGNOP); }
-<A>"-=" { yylval.i = SUBEQ; RET(ASGNOP); }
-<A>"*=" { yylval.i = MULTEQ; RET(ASGNOP); }
-<A>"/=" { yylval.i = DIVEQ; RET(ASGNOP); }
-<A>"%=" { yylval.i = MODEQ; RET(ASGNOP); }
-<A>"^=" { yylval.i = POWEQ; RET(ASGNOP); }
-<A>"**=" { yylval.i = POWEQ; RET(ASGNOP); }
-<A>"=" { yylval.i = ASSIGN; RET(ASGNOP); }
-<A>"**" { RET(POWER); }
-<A>"^" { RET(POWER); }
-
-<A>"$"{D}+ { yylval.cp = fieldadr(atoi(yytext+1)); RET(FIELD); }
-<A>"$NF" { unputstr("(NF)"); return(INDIRECT); }
-<A>"$"{A}{B}* { int c, n;
- c = input(); unput(c);
- if (c == '(' || c == '[' || infunc && (n=isarg(yytext+1)) >= 0) {
- unputstr(yytext+1);
- return(INDIRECT);
- } else {
- yylval.cp = setsymtab(yytext+1,"",0.0,STR|NUM,symtab);
- RET(IVAR);
- }
- }
-<A>"$" { RET(INDIRECT); }
-<A>NF { yylval.cp = setsymtab(yytext, "", 0.0, NUM, symtab); RET(VARNF); }
-
-<A>({D}+("."?){D}*|"."{D}+)((e|E)("+"|-)?{D}+)? {
- yylval.cp = setsymtab(yytext, tostring(yytext), atof(yytext), CON|NUM, symtab);
- /* should this also have STR set? */
- RET(NUMBER); }
-
-<A>while { RET(WHILE); }
-<A>for { RET(FOR); }
-<A>do { RET(DO); }
-<A>if { RET(IF); }
-<A>else { RET(ELSE); }
-<A>next { RET(NEXT); }
-<A>exit { RET(EXIT); }
-<A>break { RET(BREAK); }
-<A>continue { RET(CONTINUE); }
-<A>print { yylval.i = PRINT; RET(PRINT); }
-<A>printf { yylval.i = PRINTF; RET(PRINTF); }
-<A>sprintf { yylval.i = SPRINTF; RET(SPRINTF); }
-<A>split { yylval.i = SPLIT; RET(SPLIT); }
-<A>substr { RET(SUBSTR); }
-<A>sub { yylval.i = SUB; RET(SUB); }
-<A>gsub { yylval.i = GSUB; RET(GSUB); }
-<A>index { RET(INDEX); }
-<A>match { RET(MATCHFCN); }
-<A>in { RET(IN); }
-<A>getline { RET(GETLINE); }
-<A>close { RET(CLOSE); }
-<A>delete { RET(DELETE); }
-<A>length { yylval.i = FLENGTH; RET(BLTIN); }
-<A>log { yylval.i = FLOG; RET(BLTIN); }
-<A>int { yylval.i = FINT; RET(BLTIN); }
-<A>exp { yylval.i = FEXP; RET(BLTIN); }
-<A>sqrt { yylval.i = FSQRT; RET(BLTIN); }
-<A>sin { yylval.i = FSIN; RET(BLTIN); }
-<A>cos { yylval.i = FCOS; RET(BLTIN); }
-<A>atan2 { yylval.i = FATAN; RET(BLTIN); }
-<A>system { yylval.i = FSYSTEM; RET(BLTIN); }
-<A>rand { yylval.i = FRAND; RET(BLTIN); }
-<A>srand { yylval.i = FSRAND; RET(BLTIN); }
-<A>toupper { yylval.i = FTOUPPER; RET(BLTIN); }
-<A>tolower { yylval.i = FTOLOWER; RET(BLTIN); }
-<A>fflush { yylval.i = FFLUSH; RET(BLTIN); }
-
-<A>{A}{B}* { int n, c;
- c = input(); unput(c); /* look for '(' */
- if (c != '(' && infunc && (n=isarg(yytext)) >= 0) {
- yylval.i = n;
- RET(ARG);
- } else {
- yylval.cp = setsymtab(yytext,"",0.0,STR|NUM,symtab);
- if (c == '(') {
- RET(CALL);
- } else {
- RET(VAR);
- }
- }
- }
-<A>\" { BEGIN str; clen = 0; }
-
-<A>"}" { if (--bracecnt < 0) ERROR "extra }" SYNTAX; BEGIN sc; RET(';'); }
-<A>"]" { if (--brackcnt < 0) ERROR "extra ]" SYNTAX; RET(']'); }
-<A>")" { if (--parencnt < 0) ERROR "extra )" SYNTAX; RET(')'); }
-
-<A>. { if (yytext[0] == '{') bracecnt++;
- else if (yytext[0] == '[') brackcnt++;
- else if (yytext[0] == '(') parencnt++;
- RET(yylval.i = yytext[0]); /* everything else */ }
-
-<reg>\\. { cbuf[clen++] = '\\'; cbuf[clen++] = yytext[1]; }
-<reg>\n { ERROR "newline in regular expression %.10s...", cbuf SYNTAX; lineno++; BEGIN A; }
-<reg>"/" { BEGIN A;
- cbuf[clen] = 0;
- yylval.s = tostring(cbuf);
- unput('/');
- RET(REGEXPR); }
-<reg>. { CADD; }
-
-<str>\" { BEGIN A;
- cbuf[clen] = 0; s = tostring(cbuf);
- cbuf[clen] = ' '; cbuf[++clen] = 0;
- yylval.cp = setsymtab(cbuf, s, 0.0, CON|STR, symtab);
- RET(STRING); }
-<str>\n { ERROR "newline in string %.10s...", cbuf SYNTAX; lineno++; BEGIN A; }
-<str>"\\\"" { cbuf[clen++] = '"'; }
-<str>"\\"n { cbuf[clen++] = '\n'; }
-<str>"\\"t { cbuf[clen++] = '\t'; }
-<str>"\\"f { cbuf[clen++] = '\f'; }
-<str>"\\"r { cbuf[clen++] = '\r'; }
-<str>"\\"b { cbuf[clen++] = '\b'; }
-<str>"\\"v { cbuf[clen++] = '\v'; } /* these ANSIisms may not be known by */
-<str>"\\"a { cbuf[clen++] = '\007'; } /* your compiler. hence 007 for bell */
-<str>"\\\\" { cbuf[clen++] = '\\'; }
-<str>"\\"({O}{O}{O}|{O}{O}|{O}) { int n;
- sscanf(yytext+1, "%o", &n); cbuf[clen++] = n; }
-<str>"\\"x({H}+) { int n; /* ANSI permits any number! */
- sscanf(yytext+2, "%x", &n); cbuf[clen++] = n; }
-<str>"\\". { cbuf[clen++] = yytext[1]; }
-<str>. { CADD; }
-
-%%
-
-void startreg(void) /* start parsing a regular expression */
-{
- BEGIN reg;
- clen = 0;
-}
-
-/* input() and unput() are transcriptions of the standard lex
- macros for input and output with additions for error message
- printing. God help us all if someone changes how lex works.
-*/
-
-uchar ebuf[300];
-uchar *ep = ebuf;
-
-input(void) /* get next lexical input character */
-{
- register int c;
- extern uchar *lexprog;
-
- if (yysptr > yysbuf)
- c = U(*--yysptr);
- else if (lexprog != NULL) { /* awk '...' */
- if (c = *lexprog)
- lexprog++;
- } else /* awk -f ... */
- c = pgetc();
- if (c == '\n')
- yylineno++;
- else if (c == EOF)
- c = 0;
- if (ep >= ebuf + sizeof ebuf)
- ep = ebuf;
- return *ep++ = c;
-}
-
-void unput(int c) /* put lexical character back on input */
-{
- yytchar = c;
- if (yytchar == '\n')
- yylineno--;
- *yysptr++ = yytchar;
- if (--ep < ebuf)
- ep = ebuf + sizeof(ebuf) - 1;
-}
-
-
-void unputstr(char *s) /* put a string back on input */
-{
- int i;
-
- for (i = strlen(s)-1; i >= 0; i--)
- unput(s[i]);
-}
+ END OF ARCHIVE