Merge commit 'b31320a79e2054c6739b5229259dbf98f3afc547' into merges
[unleashed.git] / contrib / awk / run.c
blob6bf42c242d8454e10d5c2110b9d6be57c40a7739
1 /****************************************************************
2 Copyright (C) Lucent Technologies 1997
3 All Rights Reserved
5 Permission to use, copy, modify, and distribute this software and
6 its documentation for any purpose and without fee is hereby
7 granted, provided that the above copyright notice appear in all
8 copies and that both that the copyright notice and this
9 permission notice and warranty disclaimer appear in supporting
10 documentation, and that the name Lucent Technologies or any of
11 its entities not be used in advertising or publicity pertaining
12 to distribution of the software without specific, written prior
13 permission.
15 LUCENT DISCLAIMS ALL WARRANTIES WITH REGARD TO THIS SOFTWARE,
16 INCLUDING ALL IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS.
17 IN NO EVENT SHALL LUCENT OR ANY OF ITS ENTITIES BE LIABLE FOR ANY
18 SPECIAL, INDIRECT OR CONSEQUENTIAL DAMAGES OR ANY DAMAGES
19 WHATSOEVER RESULTING FROM LOSS OF USE, DATA OR PROFITS, WHETHER
20 IN AN ACTION OF CONTRACT, NEGLIGENCE OR OTHER TORTIOUS ACTION,
21 ARISING OUT OF OR IN CONNECTION WITH THE USE OR PERFORMANCE OF
22 THIS SOFTWARE.
23 ****************************************************************/
25 #define DEBUG
26 #include <stdio.h>
27 #include <ctype.h>
28 #include <setjmp.h>
29 #include <limits.h>
30 #include <math.h>
31 #include <string.h>
32 #include <stdlib.h>
33 #include <time.h>
34 #include "awk.h"
35 #include "ytab.h"
37 #define tempfree(x) if (istemp(x)) tfree(x); else
40 #undef tempfree
42 void tempfree(Cell *p) {
43 if (p->ctype == OCELL && (p->csub < CUNK || p->csub > CFREE)) {
44 WARNING("bad csub %d in Cell %d %s",
45 p->csub, p->ctype, p->sval);
47 if (istemp(p))
48 tfree(p);
52 /* do we really need these? */
53 /* #ifdef _NFILE */
54 /* #ifndef FOPEN_MAX */
55 /* #define FOPEN_MAX _NFILE */
56 /* #endif */
57 /* #endif */
58 /* */
59 /* #ifndef FOPEN_MAX */
60 /* #define FOPEN_MAX 40 */ /* max number of open files */
61 /* #endif */
62 /* */
63 /* #ifndef RAND_MAX */
64 /* #define RAND_MAX 32767 */ /* all that ansi guarantees */
65 /* #endif */
67 jmp_buf env;
68 extern int pairstack[];
69 extern Awkfloat srand_seed;
71 Node *winner = NULL; /* root of parse tree */
72 Cell *tmps; /* free temporary cells for execution */
74 static Cell truecell ={ OBOOL, BTRUE, 0, 0, 1.0, NUM };
75 Cell *True = &truecell;
76 static Cell falsecell ={ OBOOL, BFALSE, 0, 0, 0.0, NUM };
77 Cell *False = &falsecell;
78 static Cell breakcell ={ OJUMP, JBREAK, 0, 0, 0.0, NUM };
79 Cell *jbreak = &breakcell;
80 static Cell contcell ={ OJUMP, JCONT, 0, 0, 0.0, NUM };
81 Cell *jcont = &contcell;
82 static Cell nextcell ={ OJUMP, JNEXT, 0, 0, 0.0, NUM };
83 Cell *jnext = &nextcell;
84 static Cell nextfilecell ={ OJUMP, JNEXTFILE, 0, 0, 0.0, NUM };
85 Cell *jnextfile = &nextfilecell;
86 static Cell exitcell ={ OJUMP, JEXIT, 0, 0, 0.0, NUM };
87 Cell *jexit = &exitcell;
88 static Cell retcell ={ OJUMP, JRET, 0, 0, 0.0, NUM };
89 Cell *jret = &retcell;
90 static Cell tempcell ={ OCELL, CTEMP, 0, "", 0.0, NUM|STR|DONTFREE };
92 Node *curnode = NULL; /* the node being executed, for debugging */
94 /* buffer memory management */
95 int adjbuf(char **pbuf, int *psiz, int minlen, int quantum, char **pbptr,
96 const char *whatrtn)
97 /* pbuf: address of pointer to buffer being managed
98 * psiz: address of buffer size variable
99 * minlen: minimum length of buffer needed
100 * quantum: buffer size quantum
101 * pbptr: address of movable pointer into buffer, or 0 if none
102 * whatrtn: name of the calling routine if failure should cause fatal error
104 * return 0 for realloc failure, !=0 for success
107 if (minlen > *psiz) {
108 char *tbuf;
109 int rminlen = quantum ? minlen % quantum : 0;
110 int boff = pbptr ? *pbptr - *pbuf : 0;
111 /* round up to next multiple of quantum */
112 if (rminlen)
113 minlen += quantum - rminlen;
114 tbuf = (char *) realloc(*pbuf, minlen);
115 dprintf( ("adjbuf %s: %d %d (pbuf=%p, tbuf=%p)\n", whatrtn, *psiz, minlen, *pbuf, tbuf) );
116 if (tbuf == NULL) {
117 if (whatrtn)
118 FATAL("out of memory in %s", whatrtn);
119 return 0;
121 *pbuf = tbuf;
122 *psiz = minlen;
123 if (pbptr)
124 *pbptr = tbuf + boff;
126 return 1;
129 void run(Node *a) /* execution of parse tree starts here */
131 extern void stdinit(void);
133 stdinit();
134 execute(a);
135 closeall();
138 Cell *execute(Node *u) /* execute a node of the parse tree */
140 Cell *(*proc)(Node **, int);
141 Cell *x;
142 Node *a;
144 if (u == NULL)
145 return(True);
146 for (a = u; ; a = a->nnext) {
147 curnode = a;
148 if (isvalue(a)) {
149 x = (Cell *) (a->narg[0]);
150 if (isfld(x) && !donefld)
151 fldbld();
152 else if (isrec(x) && !donerec)
153 recbld();
154 return(x);
156 if (notlegal(a->nobj)) /* probably a Cell* but too risky to print */
157 FATAL("illegal statement");
158 proc = proctab[a->nobj-FIRSTTOKEN];
159 x = (*proc)(a->narg, a->nobj);
160 if (isfld(x) && !donefld)
161 fldbld();
162 else if (isrec(x) && !donerec)
163 recbld();
164 if (isexpr(a))
165 return(x);
166 if (isjump(x))
167 return(x);
168 if (a->nnext == NULL)
169 return(x);
170 tempfree(x);
175 Cell *program(Node **a, int n) /* execute an awk program */
176 { /* a[0] = BEGIN, a[1] = body, a[2] = END */
177 Cell *x;
179 if (setjmp(env) != 0)
180 goto ex;
181 if (a[0]) { /* BEGIN */
182 x = execute(a[0]);
183 if (isexit(x))
184 return(True);
185 if (isjump(x))
186 FATAL("illegal break, continue, next or nextfile from BEGIN");
187 tempfree(x);
189 if (a[1] || a[2])
190 while (getrec(&record, &recsize, 1) > 0) {
191 x = execute(a[1]);
192 if (isexit(x))
193 break;
194 tempfree(x);
197 if (setjmp(env) != 0) /* handles exit within END */
198 goto ex1;
199 if (a[2]) { /* END */
200 x = execute(a[2]);
201 if (isbreak(x) || isnext(x) || iscont(x))
202 FATAL("illegal break, continue, next or nextfile from END");
203 tempfree(x);
205 ex1:
206 return(True);
209 struct Frame { /* stack frame for awk function calls */
210 int nargs; /* number of arguments in this call */
211 Cell *fcncell; /* pointer to Cell for function */
212 Cell **args; /* pointer to array of arguments after execute */
213 Cell *retval; /* return value */
216 #define NARGS 50 /* max args in a call */
218 struct Frame *frame = NULL; /* base of stack frames; dynamically allocated */
219 int nframe = 0; /* number of frames allocated */
220 struct Frame *fp = NULL; /* frame pointer. bottom level unused */
222 Cell *call(Node **a, int n) /* function call. very kludgy and fragile */
224 static Cell newcopycell = { OCELL, CCOPY, 0, "", 0.0, NUM|STR|DONTFREE };
225 int i, ncall, ndef;
226 int freed = 0; /* handles potential double freeing when fcn & param share a tempcell */
227 Node *x;
228 Cell *args[NARGS], *oargs[NARGS]; /* BUG: fixed size arrays */
229 Cell *y, *z, *fcn;
230 char *s;
232 fcn = execute(a[0]); /* the function itself */
233 s = fcn->nval;
234 if (!isfcn(fcn))
235 FATAL("calling undefined function %s", s);
236 if (frame == NULL) {
237 fp = frame = (struct Frame *) calloc(nframe += 100, sizeof(struct Frame));
238 if (frame == NULL)
239 FATAL("out of space for stack frames calling %s", s);
241 for (ncall = 0, x = a[1]; x != NULL; x = x->nnext) /* args in call */
242 ncall++;
243 ndef = (int) fcn->fval; /* args in defn */
244 dprintf( ("calling %s, %d args (%d in defn), fp=%d\n", s, ncall, ndef, (int) (fp-frame)) );
245 if (ncall > ndef)
246 WARNING("function %s called with %d args, uses only %d",
247 s, ncall, ndef);
248 if (ncall + ndef > NARGS)
249 FATAL("function %s has %d arguments, limit %d", s, ncall+ndef, NARGS);
250 for (i = 0, x = a[1]; x != NULL; i++, x = x->nnext) { /* get call args */
251 dprintf( ("evaluate args[%d], fp=%d:\n", i, (int) (fp-frame)) );
252 y = execute(x);
253 oargs[i] = y;
254 dprintf( ("args[%d]: %s %f <%s>, t=%o\n",
255 i, NN(y->nval), y->fval, isarr(y) ? "(array)" : NN(y->sval), y->tval) );
256 if (isfcn(y))
257 FATAL("can't use function %s as argument in %s", y->nval, s);
258 if (isarr(y))
259 args[i] = y; /* arrays by ref */
260 else
261 args[i] = copycell(y);
262 tempfree(y);
264 for ( ; i < ndef; i++) { /* add null args for ones not provided */
265 args[i] = gettemp();
266 *args[i] = newcopycell;
268 fp++; /* now ok to up frame */
269 if (fp >= frame + nframe) {
270 int dfp = fp - frame; /* old index */
271 frame = (struct Frame *)
272 realloc((char *) frame, (nframe += 100) * sizeof(struct Frame));
273 if (frame == NULL)
274 FATAL("out of space for stack frames in %s", s);
275 fp = frame + dfp;
277 fp->fcncell = fcn;
278 fp->args = args;
279 fp->nargs = ndef; /* number defined with (excess are locals) */
280 fp->retval = gettemp();
282 dprintf( ("start exec of %s, fp=%d\n", s, (int) (fp-frame)) );
283 y = execute((Node *)(fcn->sval)); /* execute body */
284 dprintf( ("finished exec of %s, fp=%d\n", s, (int) (fp-frame)) );
286 for (i = 0; i < ndef; i++) {
287 Cell *t = fp->args[i];
288 if (isarr(t)) {
289 if (t->csub == CCOPY) {
290 if (i >= ncall) {
291 freesymtab(t);
292 t->csub = CTEMP;
293 tempfree(t);
294 } else {
295 oargs[i]->tval = t->tval;
296 oargs[i]->tval &= ~(STR|NUM|DONTFREE);
297 oargs[i]->sval = t->sval;
298 tempfree(t);
301 } else if (t != y) { /* kludge to prevent freeing twice */
302 t->csub = CTEMP;
303 tempfree(t);
304 } else if (t == y && t->csub == CCOPY) {
305 t->csub = CTEMP;
306 tempfree(t);
307 freed = 1;
310 tempfree(fcn);
311 if (isexit(y) || isnext(y))
312 return y;
313 if (freed == 0) {
314 tempfree(y); /* don't free twice! */
316 z = fp->retval; /* return value */
317 dprintf( ("%s returns %g |%s| %o\n", s, getfval(z), getsval(z), z->tval) );
318 fp--;
319 return(z);
322 Cell *copycell(Cell *x) /* make a copy of a cell in a temp */
324 Cell *y;
326 y = gettemp();
327 y->csub = CCOPY; /* prevents freeing until call is over */
328 y->nval = x->nval; /* BUG? */
329 if (isstr(x))
330 y->sval = tostring(x->sval);
331 y->fval = x->fval;
332 y->tval = x->tval & ~(CON|FLD|REC|DONTFREE); /* copy is not constant or field */
333 /* is DONTFREE right? */
334 return y;
337 Cell *arg(Node **a, int n) /* nth argument of a function */
340 n = ptoi(a[0]); /* argument number, counting from 0 */
341 dprintf( ("arg(%d), fp->nargs=%d\n", n, fp->nargs) );
342 if (n+1 > fp->nargs)
343 FATAL("argument #%d of function %s was not supplied",
344 n+1, fp->fcncell->nval);
345 return fp->args[n];
348 Cell *jump(Node **a, int n) /* break, continue, next, nextfile, return */
350 Cell *y;
352 switch (n) {
353 case EXIT:
354 if (a[0] != NULL) {
355 y = execute(a[0]);
356 errorflag = (int) getfval(y);
357 tempfree(y);
359 longjmp(env, 1);
360 case RETURN:
361 if (a[0] != NULL) {
362 y = execute(a[0]);
363 if ((y->tval & (STR|NUM)) == (STR|NUM)) {
364 setsval(fp->retval, getsval(y));
365 fp->retval->fval = getfval(y);
366 fp->retval->tval |= NUM;
368 else if (y->tval & STR)
369 setsval(fp->retval, getsval(y));
370 else if (y->tval & NUM)
371 setfval(fp->retval, getfval(y));
372 else /* can't happen */
373 FATAL("bad type variable %d", y->tval);
374 tempfree(y);
376 return(jret);
377 case NEXT:
378 return(jnext);
379 case NEXTFILE:
380 nextfile();
381 return(jnextfile);
382 case BREAK:
383 return(jbreak);
384 case CONTINUE:
385 return(jcont);
386 default: /* can't happen */
387 FATAL("illegal jump type %d", n);
389 return 0; /* not reached */
392 Cell *awkgetline(Node **a, int n) /* get next line from specific input */
393 { /* a[0] is variable, a[1] is operator, a[2] is filename */
394 Cell *r, *x;
395 extern Cell **fldtab;
396 FILE *fp;
397 char *buf;
398 int bufsize = recsize;
399 int mode;
401 if ((buf = (char *) malloc(bufsize)) == NULL)
402 FATAL("out of memory in getline");
404 fflush(stdout); /* in case someone is waiting for a prompt */
405 r = gettemp();
406 if (a[1] != NULL) { /* getline < file */
407 x = execute(a[2]); /* filename */
408 mode = ptoi(a[1]);
409 if (mode == '|') /* input pipe */
410 mode = LE; /* arbitrary flag */
411 fp = openfile(mode, getsval(x));
412 tempfree(x);
413 if (fp == NULL)
414 n = -1;
415 else
416 n = readrec(&buf, &bufsize, fp);
417 if (n <= 0) {
419 } else if (a[0] != NULL) { /* getline var <file */
420 x = execute(a[0]);
421 setsval(x, buf);
422 tempfree(x);
423 } else { /* getline <file */
424 setsval(fldtab[0], buf);
425 if (is_number(fldtab[0]->sval)) {
426 fldtab[0]->fval = atof(fldtab[0]->sval);
427 fldtab[0]->tval |= NUM;
430 } else { /* bare getline; use current input */
431 if (a[0] == NULL) /* getline */
432 n = getrec(&record, &recsize, 1);
433 else { /* getline var */
434 n = getrec(&buf, &bufsize, 0);
435 x = execute(a[0]);
436 setsval(x, buf);
437 tempfree(x);
440 setfval(r, (Awkfloat) n);
441 free(buf);
442 return r;
445 Cell *getnf(Node **a, int n) /* get NF */
447 if (donefld == 0)
448 fldbld();
449 return (Cell *) a[0];
452 Cell *array(Node **a, int n) /* a[0] is symtab, a[1] is list of subscripts */
454 Cell *x, *y, *z;
455 char *s;
456 Node *np;
457 char *buf;
458 int bufsz = recsize;
459 int nsub = strlen(*SUBSEP);
461 if ((buf = (char *) malloc(bufsz)) == NULL)
462 FATAL("out of memory in array");
464 x = execute(a[0]); /* Cell* for symbol table */
465 buf[0] = 0;
466 for (np = a[1]; np; np = np->nnext) {
467 y = execute(np); /* subscript */
468 s = getsval(y);
469 if (!adjbuf(&buf, &bufsz, strlen(buf)+strlen(s)+nsub+1, recsize, 0, "array"))
470 FATAL("out of memory for %s[%s...]", x->nval, buf);
471 strcat(buf, s);
472 if (np->nnext)
473 strcat(buf, *SUBSEP);
474 tempfree(y);
476 if (!isarr(x)) {
477 dprintf( ("making %s into an array\n", NN(x->nval)) );
478 if (freeable(x))
479 xfree(x->sval);
480 x->tval &= ~(STR|NUM|DONTFREE);
481 x->tval |= ARR;
482 x->sval = (char *) makesymtab(NSYMTAB);
484 z = setsymtab(buf, "", 0.0, STR|NUM, (Array *) x->sval);
485 z->ctype = OCELL;
486 z->csub = CVAR;
487 tempfree(x);
488 free(buf);
489 return(z);
492 Cell *awkdelete(Node **a, int n) /* a[0] is symtab, a[1] is list of subscripts */
494 Cell *x, *y;
495 Node *np;
496 char *s;
497 int nsub = strlen(*SUBSEP);
499 x = execute(a[0]); /* Cell* for symbol table */
500 if (!isarr(x))
501 return True;
502 if (a[1] == NULL) { /* delete the elements, not the table */
503 freesymtab(x);
504 x->tval &= ~STR;
505 x->tval |= ARR;
506 x->sval = (char *) makesymtab(NSYMTAB);
507 } else {
508 int bufsz = recsize;
509 char *buf;
510 if ((buf = (char *) malloc(bufsz)) == NULL)
511 FATAL("out of memory in adelete");
512 buf[0] = 0;
513 for (np = a[1]; np; np = np->nnext) {
514 y = execute(np); /* subscript */
515 s = getsval(y);
516 if (!adjbuf(&buf, &bufsz, strlen(buf)+strlen(s)+nsub+1, recsize, 0, "awkdelete"))
517 FATAL("out of memory deleting %s[%s...]", x->nval, buf);
518 strcat(buf, s);
519 if (np->nnext)
520 strcat(buf, *SUBSEP);
521 tempfree(y);
523 freeelem(x, buf);
524 free(buf);
526 tempfree(x);
527 return True;
530 Cell *intest(Node **a, int n) /* a[0] is index (list), a[1] is symtab */
532 Cell *x, *ap, *k;
533 Node *p;
534 char *buf;
535 char *s;
536 int bufsz = recsize;
537 int nsub = strlen(*SUBSEP);
539 ap = execute(a[1]); /* array name */
540 if (!isarr(ap)) {
541 dprintf( ("making %s into an array\n", ap->nval) );
542 if (freeable(ap))
543 xfree(ap->sval);
544 ap->tval &= ~(STR|NUM|DONTFREE);
545 ap->tval |= ARR;
546 ap->sval = (char *) makesymtab(NSYMTAB);
548 if ((buf = (char *) malloc(bufsz)) == NULL) {
549 FATAL("out of memory in intest");
551 buf[0] = 0;
552 for (p = a[0]; p; p = p->nnext) {
553 x = execute(p); /* expr */
554 s = getsval(x);
555 if (!adjbuf(&buf, &bufsz, strlen(buf)+strlen(s)+nsub+1, recsize, 0, "intest"))
556 FATAL("out of memory deleting %s[%s...]", x->nval, buf);
557 strcat(buf, s);
558 tempfree(x);
559 if (p->nnext)
560 strcat(buf, *SUBSEP);
562 k = lookup(buf, (Array *) ap->sval);
563 tempfree(ap);
564 free(buf);
565 if (k == NULL)
566 return(False);
567 else
568 return(True);
572 Cell *matchop(Node **a, int n) /* ~ and match() */
574 Cell *x, *y;
575 char *s, *t;
576 int i;
577 fa *pfa;
578 int (*mf)(fa *, const char *) = match, mode = 0;
580 if (n == MATCHFCN) {
581 mf = pmatch;
582 mode = 1;
584 x = execute(a[1]); /* a[1] = target text */
585 s = getsval(x);
586 if (a[0] == NULL) /* a[1] == 0: already-compiled reg expr */
587 i = (*mf)((fa *) a[2], s);
588 else {
589 y = execute(a[2]); /* a[2] = regular expr */
590 t = getsval(y);
591 pfa = makedfa(t, mode);
592 i = (*mf)(pfa, s);
593 tempfree(y);
595 tempfree(x);
596 if (n == MATCHFCN) {
597 int start = patbeg - s + 1;
598 if (patlen < 0)
599 start = 0;
600 setfval(rstartloc, (Awkfloat) start);
601 setfval(rlengthloc, (Awkfloat) patlen);
602 x = gettemp();
603 x->tval = NUM;
604 x->fval = start;
605 return x;
606 } else if ((n == MATCH && i == 1) || (n == NOTMATCH && i == 0))
607 return(True);
608 else
609 return(False);
613 Cell *boolop(Node **a, int n) /* a[0] || a[1], a[0] && a[1], !a[0] */
615 Cell *x, *y;
616 int i;
618 x = execute(a[0]);
619 i = istrue(x);
620 tempfree(x);
621 switch (n) {
622 case BOR:
623 if (i) return(True);
624 y = execute(a[1]);
625 i = istrue(y);
626 tempfree(y);
627 if (i) return(True);
628 else return(False);
629 case AND:
630 if ( !i ) return(False);
631 y = execute(a[1]);
632 i = istrue(y);
633 tempfree(y);
634 if (i) return(True);
635 else return(False);
636 case NOT:
637 if (i) return(False);
638 else return(True);
639 default: /* can't happen */
640 FATAL("unknown boolean operator %d", n);
642 return 0; /*NOTREACHED*/
645 Cell *relop(Node **a, int n) /* a[0 < a[1], etc. */
647 int i;
648 Cell *x, *y;
649 Awkfloat j;
651 x = execute(a[0]);
652 y = execute(a[1]);
653 if (x->tval&NUM && y->tval&NUM) {
654 j = x->fval - y->fval;
655 i = j<0? -1: (j>0? 1: 0);
656 } else {
657 i = strcoll(getsval(x), getsval(y));
659 tempfree(x);
660 tempfree(y);
661 switch (n) {
662 case LT: if (i<0) return(True);
663 else return(False);
664 case LE: if (i<=0) return(True);
665 else return(False);
666 case NE: if (i!=0) return(True);
667 else return(False);
668 case EQ: if (i == 0) return(True);
669 else return(False);
670 case GE: if (i>=0) return(True);
671 else return(False);
672 case GT: if (i>0) return(True);
673 else return(False);
674 default: /* can't happen */
675 FATAL("unknown relational operator %d", n);
677 return 0; /*NOTREACHED*/
680 void tfree(Cell *a) /* free a tempcell */
682 if (freeable(a)) {
683 dprintf( ("freeing %s %s %o\n", NN(a->nval), NN(a->sval), a->tval) );
684 xfree(a->sval);
686 if (a == tmps)
687 FATAL("tempcell list is curdled");
688 a->cnext = tmps;
689 tmps = a;
692 Cell *gettemp(void) /* get a tempcell */
693 { int i;
694 Cell *x;
696 if (!tmps) {
697 tmps = (Cell *) calloc(100, sizeof(Cell));
698 if (!tmps)
699 FATAL("out of space for temporaries");
700 for(i = 1; i < 100; i++)
701 tmps[i-1].cnext = &tmps[i];
702 tmps[i-1].cnext = NULL;
704 x = tmps;
705 tmps = x->cnext;
706 *x = tempcell;
707 return(x);
710 Cell *indirect(Node **a, int n) /* $( a[0] ) */
712 Awkfloat val;
713 Cell *x;
714 int m;
715 char *s;
717 x = execute(a[0]);
718 val = getfval(x); /* freebsd: defend against super large field numbers */
719 if ((Awkfloat)INT_MAX < val)
720 FATAL("trying to access out of range field %s", x->nval);
721 m = (int) val;
722 if (m == 0 && !is_number(s = getsval(x))) /* suspicion! */
723 FATAL("illegal field $(%s), name \"%s\"", s, x->nval);
724 /* BUG: can x->nval ever be null??? */
725 tempfree(x);
726 x = fieldadr(m);
727 x->ctype = OCELL; /* BUG? why are these needed? */
728 x->csub = CFLD;
729 return(x);
732 Cell *substr(Node **a, int nnn) /* substr(a[0], a[1], a[2]) */
734 int k, m, n;
735 char *s;
736 int temp;
737 Cell *x, *y, *z = NULL;
739 x = execute(a[0]);
740 y = execute(a[1]);
741 if (a[2] != NULL)
742 z = execute(a[2]);
743 s = getsval(x);
744 k = strlen(s) + 1;
745 if (k <= 1) {
746 tempfree(x);
747 tempfree(y);
748 if (a[2] != NULL) {
749 tempfree(z);
751 x = gettemp();
752 setsval(x, "");
753 return(x);
755 m = (int) getfval(y);
756 if (m <= 0)
757 m = 1;
758 else if (m > k)
759 m = k;
760 tempfree(y);
761 if (a[2] != NULL) {
762 n = (int) getfval(z);
763 tempfree(z);
764 } else
765 n = k - 1;
766 if (n < 0)
767 n = 0;
768 else if (n > k - m)
769 n = k - m;
770 dprintf( ("substr: m=%d, n=%d, s=%s\n", m, n, s) );
771 y = gettemp();
772 temp = s[n+m-1]; /* with thanks to John Linderman */
773 s[n+m-1] = '\0';
774 setsval(y, s + m - 1);
775 s[n+m-1] = temp;
776 tempfree(x);
777 return(y);
780 Cell *sindex(Node **a, int nnn) /* index(a[0], a[1]) */
782 Cell *x, *y, *z;
783 char *s1, *s2, *p1, *p2, *q;
784 Awkfloat v = 0.0;
786 x = execute(a[0]);
787 s1 = getsval(x);
788 y = execute(a[1]);
789 s2 = getsval(y);
791 z = gettemp();
792 for (p1 = s1; *p1 != '\0'; p1++) {
793 for (q=p1, p2=s2; *p2 != '\0' && *q == *p2; q++, p2++)
795 if (*p2 == '\0') {
796 v = (Awkfloat) (p1 - s1 + 1); /* origin 1 */
797 break;
800 tempfree(x);
801 tempfree(y);
802 setfval(z, v);
803 return(z);
806 #define MAXNUMSIZE 50
808 int format(char **pbuf, int *pbufsize, const char *s, Node *a) /* printf-like conversions */
810 char *fmt;
811 char *p, *t;
812 const char *os;
813 Cell *x;
814 int flag = 0, n;
815 int fmtwd; /* format width */
816 int fmtsz = recsize;
817 char *buf = *pbuf;
818 int bufsize = *pbufsize;
820 os = s;
821 p = buf;
822 if ((fmt = (char *) malloc(fmtsz)) == NULL)
823 FATAL("out of memory in format()");
824 while (*s) {
825 adjbuf(&buf, &bufsize, MAXNUMSIZE+1+p-buf, recsize, &p, "format1");
826 if (*s != '%') {
827 *p++ = *s++;
828 continue;
830 if (*(s+1) == '%') {
831 *p++ = '%';
832 s += 2;
833 continue;
835 /* have to be real careful in case this is a huge number, eg, %100000d */
836 fmtwd = atoi(s+1);
837 if (fmtwd < 0)
838 fmtwd = -fmtwd;
839 adjbuf(&buf, &bufsize, fmtwd+1+p-buf, recsize, &p, "format2");
840 for (t = fmt; (*t++ = *s) != '\0'; s++) {
841 if (!adjbuf(&fmt, &fmtsz, MAXNUMSIZE+1+t-fmt, recsize, &t, "format3"))
842 FATAL("format item %.30s... ran format() out of memory", os);
843 if (isalpha((uschar)*s) && *s != 'l' && *s != 'h' && *s != 'L')
844 break; /* the ansi panoply */
845 if (*s == '*') {
846 x = execute(a);
847 a = a->nnext;
848 sprintf(t-1, "%d", fmtwd=(int) getfval(x));
849 if (fmtwd < 0)
850 fmtwd = -fmtwd;
851 adjbuf(&buf, &bufsize, fmtwd+1+p-buf, recsize, &p, "format");
852 t = fmt + strlen(fmt);
853 tempfree(x);
856 *t = '\0';
857 if (fmtwd < 0)
858 fmtwd = -fmtwd;
859 adjbuf(&buf, &bufsize, fmtwd+1+p-buf, recsize, &p, "format4");
861 switch (*s) {
862 case 'f': case 'e': case 'g': case 'E': case 'G':
863 flag = 'f';
864 break;
865 case 'd': case 'i':
866 flag = 'd';
867 if(*(s-1) == 'l') break;
868 *(t-1) = 'l';
869 *t = 'd';
870 *++t = '\0';
871 break;
872 case 'o': case 'x': case 'X': case 'u':
873 flag = *(s-1) == 'l' ? 'd' : 'u';
874 break;
875 case 's':
876 flag = 's';
877 break;
878 case 'c':
879 flag = 'c';
880 break;
881 default:
882 WARNING("weird printf conversion %s", fmt);
883 flag = '?';
884 break;
886 if (a == NULL)
887 FATAL("not enough args in printf(%s)", os);
888 x = execute(a);
889 a = a->nnext;
890 n = MAXNUMSIZE;
891 if (fmtwd > n)
892 n = fmtwd;
893 adjbuf(&buf, &bufsize, 1+n+p-buf, recsize, &p, "format5");
894 switch (flag) {
895 case '?': sprintf(p, "%s", fmt); /* unknown, so dump it too */
896 t = getsval(x);
897 n = strlen(t);
898 if (fmtwd > n)
899 n = fmtwd;
900 adjbuf(&buf, &bufsize, 1+strlen(p)+n+p-buf, recsize, &p, "format6");
901 p += strlen(p);
902 sprintf(p, "%s", t);
903 break;
904 case 'f': sprintf(p, fmt, getfval(x)); break;
905 case 'd': sprintf(p, fmt, (long) getfval(x)); break;
906 case 'u': sprintf(p, fmt, (int) getfval(x)); break;
907 case 's':
908 t = getsval(x);
909 n = strlen(t);
910 if (fmtwd > n)
911 n = fmtwd;
912 if (!adjbuf(&buf, &bufsize, 1+n+p-buf, recsize, &p, "format7"))
913 FATAL("huge string/format (%d chars) in printf %.30s... ran format() out of memory", n, t);
914 sprintf(p, fmt, t);
915 break;
916 case 'c':
917 if (isnum(x)) {
918 if (getfval(x))
919 sprintf(p, fmt, (int) getfval(x));
920 else {
921 *p++ = '\0'; /* explicit null byte */
922 *p = '\0'; /* next output will start here */
924 } else
925 sprintf(p, fmt, getsval(x)[0]);
926 break;
927 default:
928 FATAL("can't happen: bad conversion %c in format()", flag);
930 tempfree(x);
931 p += strlen(p);
932 s++;
934 *p = '\0';
935 free(fmt);
936 for ( ; a; a = a->nnext) /* evaluate any remaining args */
937 execute(a);
938 *pbuf = buf;
939 *pbufsize = bufsize;
940 return p - buf;
943 Cell *awksprintf(Node **a, int n) /* sprintf(a[0]) */
945 Cell *x;
946 Node *y;
947 char *buf;
948 int bufsz=3*recsize;
950 if ((buf = (char *) malloc(bufsz)) == NULL)
951 FATAL("out of memory in awksprintf");
952 y = a[0]->nnext;
953 x = execute(a[0]);
954 if (format(&buf, &bufsz, getsval(x), y) == -1)
955 FATAL("sprintf string %.30s... too long. can't happen.", buf);
956 tempfree(x);
957 x = gettemp();
958 x->sval = buf;
959 x->tval = STR;
960 return(x);
963 Cell *awkprintf(Node **a, int n) /* printf */
964 { /* a[0] is list of args, starting with format string */
965 /* a[1] is redirection operator, a[2] is redirection file */
966 FILE *fp;
967 Cell *x;
968 Node *y;
969 char *buf;
970 int len;
971 int bufsz=3*recsize;
973 if ((buf = (char *) malloc(bufsz)) == NULL)
974 FATAL("out of memory in awkprintf");
975 y = a[0]->nnext;
976 x = execute(a[0]);
977 if ((len = format(&buf, &bufsz, getsval(x), y)) == -1)
978 FATAL("printf string %.30s... too long. can't happen.", buf);
979 tempfree(x);
980 if (a[1] == NULL) {
981 /* fputs(buf, stdout); */
982 fwrite(buf, len, 1, stdout);
983 if (ferror(stdout))
984 FATAL("write error on stdout");
985 } else {
986 fp = redirect(ptoi(a[1]), a[2]);
987 /* fputs(buf, fp); */
988 fwrite(buf, len, 1, fp);
989 fflush(fp);
990 if (ferror(fp))
991 FATAL("write error on %s", filename(fp));
993 free(buf);
994 return(True);
997 Cell *arith(Node **a, int n) /* a[0] + a[1], etc. also -a[0] */
999 Awkfloat i, j = 0;
1000 double v;
1001 Cell *x, *y, *z;
1003 x = execute(a[0]);
1004 i = getfval(x);
1005 tempfree(x);
1006 if (n != UMINUS) {
1007 y = execute(a[1]);
1008 j = getfval(y);
1009 tempfree(y);
1011 z = gettemp();
1012 switch (n) {
1013 case ADD:
1014 i += j;
1015 break;
1016 case MINUS:
1017 i -= j;
1018 break;
1019 case MULT:
1020 i *= j;
1021 break;
1022 case DIVIDE:
1023 if (j == 0)
1024 FATAL("division by zero");
1025 i /= j;
1026 break;
1027 case MOD:
1028 if (j == 0)
1029 FATAL("division by zero in mod");
1030 modf(i/j, &v);
1031 i = i - j * v;
1032 break;
1033 case UMINUS:
1034 i = -i;
1035 break;
1036 case POWER:
1037 if (j >= 0 && modf(j, &v) == 0.0) /* pos integer exponent */
1038 i = ipow(i, (int) j);
1039 else
1040 i = errcheck(pow(i, j), "pow");
1041 break;
1042 default: /* can't happen */
1043 FATAL("illegal arithmetic operator %d", n);
1045 setfval(z, i);
1046 return(z);
1049 double ipow(double x, int n) /* x**n. ought to be done by pow, but isn't always */
1051 double v;
1053 if (n <= 0)
1054 return 1;
1055 v = ipow(x, n/2);
1056 if (n % 2 == 0)
1057 return v * v;
1058 else
1059 return x * v * v;
1062 Cell *incrdecr(Node **a, int n) /* a[0]++, etc. */
1064 Cell *x, *z;
1065 int k;
1066 Awkfloat xf;
1068 x = execute(a[0]);
1069 xf = getfval(x);
1070 k = (n == PREINCR || n == POSTINCR) ? 1 : -1;
1071 if (n == PREINCR || n == PREDECR) {
1072 setfval(x, xf + k);
1073 return(x);
1075 z = gettemp();
1076 setfval(z, xf);
1077 setfval(x, xf + k);
1078 tempfree(x);
1079 return(z);
1082 Cell *assign(Node **a, int n) /* a[0] = a[1], a[0] += a[1], etc. */
1083 { /* this is subtle; don't muck with it. */
1084 Cell *x, *y;
1085 Awkfloat xf, yf;
1086 double v;
1088 y = execute(a[1]);
1089 x = execute(a[0]);
1090 if (n == ASSIGN) { /* ordinary assignment */
1091 if (x == y && !(x->tval & (FLD|REC))) /* self-assignment: */
1092 ; /* leave alone unless it's a field */
1093 else if ((y->tval & (STR|NUM)) == (STR|NUM)) {
1094 setsval(x, getsval(y));
1095 x->fval = getfval(y);
1096 x->tval |= NUM;
1098 else if (isstr(y))
1099 setsval(x, getsval(y));
1100 else if (isnum(y))
1101 setfval(x, getfval(y));
1102 else
1103 funnyvar(y, "read value of");
1104 tempfree(y);
1105 return(x);
1107 xf = getfval(x);
1108 yf = getfval(y);
1109 switch (n) {
1110 case ADDEQ:
1111 xf += yf;
1112 break;
1113 case SUBEQ:
1114 xf -= yf;
1115 break;
1116 case MULTEQ:
1117 xf *= yf;
1118 break;
1119 case DIVEQ:
1120 if (yf == 0)
1121 FATAL("division by zero in /=");
1122 xf /= yf;
1123 break;
1124 case MODEQ:
1125 if (yf == 0)
1126 FATAL("division by zero in %%=");
1127 modf(xf/yf, &v);
1128 xf = xf - yf * v;
1129 break;
1130 case POWEQ:
1131 if (yf >= 0 && modf(yf, &v) == 0.0) /* pos integer exponent */
1132 xf = ipow(xf, (int) yf);
1133 else
1134 xf = errcheck(pow(xf, yf), "pow");
1135 break;
1136 default:
1137 FATAL("illegal assignment operator %d", n);
1138 break;
1140 tempfree(y);
1141 setfval(x, xf);
1142 return(x);
1145 Cell *cat(Node **a, int q) /* a[0] cat a[1] */
1147 Cell *x, *y, *z;
1148 int n1, n2;
1149 char *s;
1151 x = execute(a[0]);
1152 y = execute(a[1]);
1153 getsval(x);
1154 getsval(y);
1155 n1 = strlen(x->sval);
1156 n2 = strlen(y->sval);
1157 s = (char *) malloc(n1 + n2 + 1);
1158 if (s == NULL)
1159 FATAL("out of space concatenating %.15s... and %.15s...",
1160 x->sval, y->sval);
1161 strcpy(s, x->sval);
1162 strcpy(s+n1, y->sval);
1163 tempfree(x);
1164 tempfree(y);
1165 z = gettemp();
1166 z->sval = s;
1167 z->tval = STR;
1168 return(z);
1171 Cell *pastat(Node **a, int n) /* a[0] { a[1] } */
1173 Cell *x;
1175 if (a[0] == NULL)
1176 x = execute(a[1]);
1177 else {
1178 x = execute(a[0]);
1179 if (istrue(x)) {
1180 tempfree(x);
1181 x = execute(a[1]);
1184 return x;
1187 Cell *dopa2(Node **a, int n) /* a[0], a[1] { a[2] } */
1189 Cell *x;
1190 int pair;
1192 pair = ptoi(a[3]);
1193 if (pairstack[pair] == 0) {
1194 x = execute(a[0]);
1195 if (istrue(x))
1196 pairstack[pair] = 1;
1197 tempfree(x);
1199 if (pairstack[pair] == 1) {
1200 x = execute(a[1]);
1201 if (istrue(x))
1202 pairstack[pair] = 0;
1203 tempfree(x);
1204 x = execute(a[2]);
1205 return(x);
1207 return(False);
1210 Cell *split(Node **a, int nnn) /* split(a[0], a[1], a[2]); a[3] is type */
1212 Cell *x = NULL, *y, *ap;
1213 char *s, *origs;
1214 int sep;
1215 char *t, temp, num[50], *fs = NULL;
1216 int n, tempstat, arg3type;
1218 y = execute(a[0]); /* source string */
1219 origs = s = strdup(getsval(y));
1220 arg3type = ptoi(a[3]);
1221 if (a[2] == NULL) /* fs string */
1222 fs = *FS;
1223 else if (arg3type == STRING) { /* split(str,arr,"string") */
1224 x = execute(a[2]);
1225 fs = getsval(x);
1226 } else if (arg3type == REGEXPR)
1227 fs = "(regexpr)"; /* split(str,arr,/regexpr/) */
1228 else
1229 FATAL("illegal type of split");
1230 sep = *fs;
1231 ap = execute(a[1]); /* array name */
1232 freesymtab(ap);
1233 dprintf( ("split: s=|%s|, a=%s, sep=|%s|\n", s, NN(ap->nval), fs) );
1234 ap->tval &= ~STR;
1235 ap->tval |= ARR;
1236 ap->sval = (char *) makesymtab(NSYMTAB);
1238 n = 0;
1239 if (arg3type == REGEXPR && strlen((char*)((fa*)a[2])->restr) == 0) {
1240 /* split(s, a, //); have to arrange that it looks like empty sep */
1241 arg3type = 0;
1242 fs = "";
1243 sep = 0;
1245 if (*s != '\0' && (strlen(fs) > 1 || arg3type == REGEXPR)) { /* reg expr */
1246 fa *pfa;
1247 if (arg3type == REGEXPR) { /* it's ready already */
1248 pfa = (fa *) a[2];
1249 } else {
1250 pfa = makedfa(fs, 1);
1252 if (nematch(pfa,s)) {
1253 tempstat = pfa->initstat;
1254 pfa->initstat = 2;
1255 do {
1256 n++;
1257 sprintf(num, "%d", n);
1258 temp = *patbeg;
1259 *patbeg = '\0';
1260 if (is_number(s))
1261 setsymtab(num, s, atof(s), STR|NUM, (Array *) ap->sval);
1262 else
1263 setsymtab(num, s, 0.0, STR, (Array *) ap->sval);
1264 *patbeg = temp;
1265 s = patbeg + patlen;
1266 if (*(patbeg+patlen-1) == 0 || *s == 0) {
1267 n++;
1268 sprintf(num, "%d", n);
1269 setsymtab(num, "", 0.0, STR, (Array *) ap->sval);
1270 pfa->initstat = tempstat;
1271 goto spdone;
1273 } while (nematch(pfa,s));
1274 pfa->initstat = tempstat; /* bwk: has to be here to reset */
1275 /* cf gsub and refldbld */
1277 n++;
1278 sprintf(num, "%d", n);
1279 if (is_number(s))
1280 setsymtab(num, s, atof(s), STR|NUM, (Array *) ap->sval);
1281 else
1282 setsymtab(num, s, 0.0, STR, (Array *) ap->sval);
1283 spdone:
1284 pfa = NULL;
1285 } else if (sep == ' ') {
1286 for (n = 0; ; ) {
1287 while (*s == ' ' || *s == '\t' || *s == '\n')
1288 s++;
1289 if (*s == 0)
1290 break;
1291 n++;
1292 t = s;
1294 s++;
1295 while (*s!=' ' && *s!='\t' && *s!='\n' && *s!='\0');
1296 temp = *s;
1297 *s = '\0';
1298 sprintf(num, "%d", n);
1299 if (is_number(t))
1300 setsymtab(num, t, atof(t), STR|NUM, (Array *) ap->sval);
1301 else
1302 setsymtab(num, t, 0.0, STR, (Array *) ap->sval);
1303 *s = temp;
1304 if (*s != 0)
1305 s++;
1307 } else if (sep == 0) { /* new: split(s, a, "") => 1 char/elem */
1308 for (n = 0; *s != 0; s++) {
1309 char buf[2];
1310 n++;
1311 sprintf(num, "%d", n);
1312 buf[0] = *s;
1313 buf[1] = 0;
1314 if (isdigit((uschar)buf[0]))
1315 setsymtab(num, buf, atof(buf), STR|NUM, (Array *) ap->sval);
1316 else
1317 setsymtab(num, buf, 0.0, STR, (Array *) ap->sval);
1319 } else if (*s != 0) {
1320 for (;;) {
1321 n++;
1322 t = s;
1323 while (*s != sep && *s != '\n' && *s != '\0')
1324 s++;
1325 temp = *s;
1326 *s = '\0';
1327 sprintf(num, "%d", n);
1328 if (is_number(t))
1329 setsymtab(num, t, atof(t), STR|NUM, (Array *) ap->sval);
1330 else
1331 setsymtab(num, t, 0.0, STR, (Array *) ap->sval);
1332 *s = temp;
1333 if (*s++ == 0)
1334 break;
1337 tempfree(ap);
1338 tempfree(y);
1339 free(origs);
1340 if (a[2] != NULL && arg3type == STRING) {
1341 tempfree(x);
1343 x = gettemp();
1344 x->tval = NUM;
1345 x->fval = n;
1346 return(x);
1349 Cell *condexpr(Node **a, int n) /* a[0] ? a[1] : a[2] */
1351 Cell *x;
1353 x = execute(a[0]);
1354 if (istrue(x)) {
1355 tempfree(x);
1356 x = execute(a[1]);
1357 } else {
1358 tempfree(x);
1359 x = execute(a[2]);
1361 return(x);
1364 Cell *ifstat(Node **a, int n) /* if (a[0]) a[1]; else a[2] */
1366 Cell *x;
1368 x = execute(a[0]);
1369 if (istrue(x)) {
1370 tempfree(x);
1371 x = execute(a[1]);
1372 } else if (a[2] != NULL) {
1373 tempfree(x);
1374 x = execute(a[2]);
1376 return(x);
1379 Cell *whilestat(Node **a, int n) /* while (a[0]) a[1] */
1381 Cell *x;
1383 for (;;) {
1384 x = execute(a[0]);
1385 if (!istrue(x))
1386 return(x);
1387 tempfree(x);
1388 x = execute(a[1]);
1389 if (isbreak(x)) {
1390 x = True;
1391 return(x);
1393 if (isnext(x) || isexit(x) || isret(x))
1394 return(x);
1395 tempfree(x);
1399 Cell *dostat(Node **a, int n) /* do a[0]; while(a[1]) */
1401 Cell *x;
1403 for (;;) {
1404 x = execute(a[0]);
1405 if (isbreak(x))
1406 return True;
1407 if (isnext(x) || isexit(x) || isret(x))
1408 return(x);
1409 tempfree(x);
1410 x = execute(a[1]);
1411 if (!istrue(x))
1412 return(x);
1413 tempfree(x);
1417 Cell *forstat(Node **a, int n) /* for (a[0]; a[1]; a[2]) a[3] */
1419 Cell *x;
1421 x = execute(a[0]);
1422 tempfree(x);
1423 for (;;) {
1424 if (a[1]!=NULL) {
1425 x = execute(a[1]);
1426 if (!istrue(x)) return(x);
1427 else tempfree(x);
1429 x = execute(a[3]);
1430 if (isbreak(x)) /* turn off break */
1431 return True;
1432 if (isnext(x) || isexit(x) || isret(x))
1433 return(x);
1434 tempfree(x);
1435 x = execute(a[2]);
1436 tempfree(x);
1440 Cell *instat(Node **a, int n) /* for (a[0] in a[1]) a[2] */
1442 Cell *x, *vp, *arrayp, *cp, *ncp;
1443 Array *tp;
1444 int i;
1446 vp = execute(a[0]);
1447 arrayp = execute(a[1]);
1448 if (!isarr(arrayp)) {
1449 return True;
1451 tp = (Array *) arrayp->sval;
1452 tempfree(arrayp);
1453 for (i = 0; i < tp->size; i++) { /* this routine knows too much */
1454 for (cp = tp->tab[i]; cp != NULL; cp = ncp) {
1455 setsval(vp, cp->nval);
1456 ncp = cp->cnext;
1457 x = execute(a[2]);
1458 if (isbreak(x)) {
1459 tempfree(vp);
1460 return True;
1462 if (isnext(x) || isexit(x) || isret(x)) {
1463 tempfree(vp);
1464 return(x);
1466 tempfree(x);
1469 return True;
1472 Cell *bltin(Node **a, int n) /* builtin functions. a[0] is type, a[1] is arg list */
1474 Cell *x, *y;
1475 Awkfloat u;
1476 int t;
1477 Awkfloat tmp;
1478 char *p, *buf;
1479 Node *nextarg;
1480 FILE *fp;
1481 void flush_all(void);
1483 t = ptoi(a[0]);
1484 x = execute(a[1]);
1485 nextarg = a[1]->nnext;
1486 switch (t) {
1487 case FLENGTH:
1488 if (isarr(x))
1489 u = ((Array *) x->sval)->nelem; /* GROT. should be function*/
1490 else
1491 u = strlen(getsval(x));
1492 break;
1493 case FLOG:
1494 u = errcheck(log(getfval(x)), "log"); break;
1495 case FINT:
1496 modf(getfval(x), &u); break;
1497 case FEXP:
1498 u = errcheck(exp(getfval(x)), "exp"); break;
1499 case FSQRT:
1500 u = errcheck(sqrt(getfval(x)), "sqrt"); break;
1501 case FSIN:
1502 u = sin(getfval(x)); break;
1503 case FCOS:
1504 u = cos(getfval(x)); break;
1505 case FATAN:
1506 if (nextarg == NULL) {
1507 WARNING("atan2 requires two arguments; returning 1.0");
1508 u = 1.0;
1509 } else {
1510 y = execute(a[1]->nnext);
1511 u = atan2(getfval(x), getfval(y));
1512 tempfree(y);
1513 nextarg = nextarg->nnext;
1515 break;
1516 case FSYSTEM:
1517 fflush(stdout); /* in case something is buffered already */
1518 u = (Awkfloat) system(getsval(x)) / 256; /* 256 is unix-dep */
1519 break;
1520 case FRAND:
1521 /* random() returns numbers in [0..2^31-1]
1522 * in order to get a number in [0, 1), divide it by 2^31
1524 u = (Awkfloat) random() / (0x7fffffffL + 0x1UL);
1525 break;
1526 case FSRAND:
1527 if (isrec(x)) /* no argument provided */
1528 u = time((time_t *)0);
1529 else
1530 u = getfval(x);
1531 tmp = u;
1532 srandom((unsigned long) u);
1533 u = srand_seed;
1534 srand_seed = tmp;
1535 break;
1536 case FTOUPPER:
1537 case FTOLOWER:
1538 buf = tostring(getsval(x));
1539 if (t == FTOUPPER) {
1540 for (p = buf; *p; p++)
1541 if (islower((uschar) *p))
1542 *p = toupper((uschar)*p);
1543 } else {
1544 for (p = buf; *p; p++)
1545 if (isupper((uschar) *p))
1546 *p = tolower((uschar)*p);
1548 tempfree(x);
1549 x = gettemp();
1550 setsval(x, buf);
1551 free(buf);
1552 return x;
1553 case FFLUSH:
1554 if (isrec(x) || strlen(getsval(x)) == 0) {
1555 flush_all(); /* fflush() or fflush("") -> all */
1556 u = 0;
1557 } else if ((fp = openfile(FFLUSH, getsval(x))) == NULL)
1558 u = EOF;
1559 else
1560 u = fflush(fp);
1561 break;
1562 default: /* can't happen */
1563 FATAL("illegal function type %d", t);
1564 break;
1566 tempfree(x);
1567 x = gettemp();
1568 setfval(x, u);
1569 if (nextarg != NULL) {
1570 WARNING("warning: function has too many arguments");
1571 for ( ; nextarg; nextarg = nextarg->nnext)
1572 execute(nextarg);
1574 return(x);
1577 Cell *printstat(Node **a, int n) /* print a[0] */
1579 Node *x;
1580 Cell *y;
1581 FILE *fp;
1583 if (a[1] == NULL) /* a[1] is redirection operator, a[2] is file */
1584 fp = stdout;
1585 else
1586 fp = redirect(ptoi(a[1]), a[2]);
1587 for (x = a[0]; x != NULL; x = x->nnext) {
1588 y = execute(x);
1589 fputs(getpssval(y), fp);
1590 tempfree(y);
1591 if (x->nnext == NULL)
1592 fputs(*ORS, fp);
1593 else
1594 fputs(*OFS, fp);
1596 if (a[1] != NULL)
1597 fflush(fp);
1598 if (ferror(fp))
1599 FATAL("write error on %s", filename(fp));
1600 return(True);
1603 Cell *nullproc(Node **a, int n)
1605 n = n;
1606 a = a;
1607 return 0;
1611 FILE *redirect(int a, Node *b) /* set up all i/o redirections */
1613 FILE *fp;
1614 Cell *x;
1615 char *fname;
1617 x = execute(b);
1618 fname = getsval(x);
1619 fp = openfile(a, fname);
1620 if (fp == NULL)
1621 FATAL("can't open file %s", fname);
1622 tempfree(x);
1623 return fp;
1626 struct files {
1627 FILE *fp;
1628 const char *fname;
1629 int mode; /* '|', 'a', 'w' => LE/LT, GT */
1630 } *files;
1632 int nfiles;
1634 void stdinit(void) /* in case stdin, etc., are not constants */
1636 nfiles = FOPEN_MAX;
1637 files = calloc(nfiles, sizeof(*files));
1638 if (files == NULL)
1639 FATAL("can't allocate file memory for %u files", nfiles);
1640 files[0].fp = stdin;
1641 files[0].fname = "/dev/stdin";
1642 files[0].mode = LT;
1643 files[1].fp = stdout;
1644 files[1].fname = "/dev/stdout";
1645 files[1].mode = GT;
1646 files[2].fp = stderr;
1647 files[2].fname = "/dev/stderr";
1648 files[2].mode = GT;
1651 FILE *openfile(int a, const char *us)
1653 const char *s = us;
1654 int i, m;
1655 FILE *fp = NULL;
1657 if (*s == '\0')
1658 FATAL("null file name in print or getline");
1659 for (i=0; i < nfiles; i++)
1660 if (files[i].fname && strcmp(s, files[i].fname) == 0) {
1661 if (a == files[i].mode || (a==APPEND && files[i].mode==GT))
1662 return files[i].fp;
1663 if (a == FFLUSH)
1664 return files[i].fp;
1666 if (a == FFLUSH) /* didn't find it, so don't create it! */
1667 return NULL;
1669 for (i=0; i < nfiles; i++)
1670 if (files[i].fp == NULL)
1671 break;
1672 if (i >= nfiles) {
1673 struct files *nf;
1674 int nnf = nfiles + FOPEN_MAX;
1675 nf = realloc(files, nnf * sizeof(*nf));
1676 if (nf == NULL)
1677 FATAL("cannot grow files for %s and %d files", s, nnf);
1678 memset(&nf[nfiles], 0, FOPEN_MAX * sizeof(*nf));
1679 nfiles = nnf;
1680 files = nf;
1682 fflush(stdout); /* force a semblance of order */
1683 m = a;
1684 if (a == GT) {
1685 fp = fopen(s, "w");
1686 } else if (a == APPEND) {
1687 fp = fopen(s, "a");
1688 m = GT; /* so can mix > and >> */
1689 } else if (a == '|') { /* output pipe */
1690 fp = popen(s, "w");
1691 } else if (a == LE) { /* input pipe */
1692 fp = popen(s, "r");
1693 } else if (a == LT) { /* getline <file */
1694 fp = strcmp(s, "-") == 0 ? stdin : fopen(s, "r"); /* "-" is stdin */
1695 } else /* can't happen */
1696 FATAL("illegal redirection %d", a);
1697 if (fp != NULL) {
1698 files[i].fname = tostring(s);
1699 files[i].fp = fp;
1700 files[i].mode = m;
1702 return fp;
1705 const char *filename(FILE *fp)
1707 int i;
1709 for (i = 0; i < nfiles; i++)
1710 if (fp == files[i].fp)
1711 return files[i].fname;
1712 return "???";
1715 Cell *closefile(Node **a, int n)
1717 Cell *x;
1718 int i, stat;
1720 n = n;
1721 x = execute(a[0]);
1722 getsval(x);
1723 stat = -1;
1724 for (i = 0; i < nfiles; i++) {
1725 if (files[i].fname && strcmp(x->sval, files[i].fname) == 0) {
1726 if (ferror(files[i].fp))
1727 WARNING( "i/o error occurred on %s", files[i].fname );
1728 if (files[i].mode == '|' || files[i].mode == LE)
1729 stat = pclose(files[i].fp);
1730 else
1731 stat = fclose(files[i].fp);
1732 if (stat == EOF)
1733 WARNING( "i/o error occurred closing %s", files[i].fname );
1734 if (i > 2) /* don't do /dev/std... */
1735 xfree(files[i].fname);
1736 files[i].fname = NULL; /* watch out for ref thru this */
1737 files[i].fp = NULL;
1740 tempfree(x);
1741 x = gettemp();
1742 setfval(x, (Awkfloat) stat);
1743 return(x);
1746 void closeall(void)
1748 int i, stat;
1750 for (i = 0; i < FOPEN_MAX; i++) {
1751 if (files[i].fp) {
1752 if (ferror(files[i].fp))
1753 WARNING( "i/o error occurred on %s", files[i].fname );
1754 if (files[i].mode == '|' || files[i].mode == LE)
1755 stat = pclose(files[i].fp);
1756 else
1757 stat = fclose(files[i].fp);
1758 if (stat == EOF)
1759 WARNING( "i/o error occurred while closing %s", files[i].fname );
1764 void flush_all(void)
1766 int i;
1768 for (i = 0; i < nfiles; i++)
1769 if (files[i].fp)
1770 fflush(files[i].fp);
1773 void backsub(char **pb_ptr, char **sptr_ptr);
1775 Cell *sub(Node **a, int nnn) /* substitute command */
1777 char *sptr, *pb, *q;
1778 Cell *x, *y, *result;
1779 char *t, *buf;
1780 fa *pfa;
1781 int bufsz = recsize;
1783 if ((buf = (char *) malloc(bufsz)) == NULL)
1784 FATAL("out of memory in sub");
1785 x = execute(a[3]); /* target string */
1786 t = getsval(x);
1787 if (a[0] == NULL) /* 0 => a[1] is already-compiled regexpr */
1788 pfa = (fa *) a[1]; /* regular expression */
1789 else {
1790 y = execute(a[1]);
1791 pfa = makedfa(getsval(y), 1);
1792 tempfree(y);
1794 y = execute(a[2]); /* replacement string */
1795 result = False;
1796 if (pmatch(pfa, t)) {
1797 sptr = t;
1798 adjbuf(&buf, &bufsz, 1+patbeg-sptr, recsize, 0, "sub");
1799 pb = buf;
1800 while (sptr < patbeg)
1801 *pb++ = *sptr++;
1802 sptr = getsval(y);
1803 while (*sptr != 0) {
1804 adjbuf(&buf, &bufsz, 5+pb-buf, recsize, &pb, "sub");
1805 if (*sptr == '\\') {
1806 backsub(&pb, &sptr);
1807 } else if (*sptr == '&') {
1808 sptr++;
1809 adjbuf(&buf, &bufsz, 1+patlen+pb-buf, recsize, &pb, "sub");
1810 for (q = patbeg; q < patbeg+patlen; )
1811 *pb++ = *q++;
1812 } else
1813 *pb++ = *sptr++;
1815 *pb = '\0';
1816 if (pb > buf + bufsz)
1817 FATAL("sub result1 %.30s too big; can't happen", buf);
1818 sptr = patbeg + patlen;
1819 if ((patlen == 0 && *patbeg) || (patlen && *(sptr-1))) {
1820 adjbuf(&buf, &bufsz, 1+strlen(sptr)+pb-buf, 0, &pb, "sub");
1821 while ((*pb++ = *sptr++) != 0)
1824 if (pb > buf + bufsz)
1825 FATAL("sub result2 %.30s too big; can't happen", buf);
1826 setsval(x, buf); /* BUG: should be able to avoid copy */
1827 result = True;
1829 tempfree(x);
1830 tempfree(y);
1831 free(buf);
1832 return result;
1835 Cell *gsub(Node **a, int nnn) /* global substitute */
1837 Cell *x, *y;
1838 char *rptr, *sptr, *t, *pb, *q;
1839 char *buf;
1840 fa *pfa;
1841 int mflag, tempstat, num;
1842 int bufsz = recsize;
1844 if ((buf = (char *) malloc(bufsz)) == NULL)
1845 FATAL("out of memory in gsub");
1846 mflag = 0; /* if mflag == 0, can replace empty string */
1847 num = 0;
1848 x = execute(a[3]); /* target string */
1849 t = getsval(x);
1850 if (a[0] == NULL) /* 0 => a[1] is already-compiled regexpr */
1851 pfa = (fa *) a[1]; /* regular expression */
1852 else {
1853 y = execute(a[1]);
1854 pfa = makedfa(getsval(y), 1);
1855 tempfree(y);
1857 y = execute(a[2]); /* replacement string */
1858 if (pmatch(pfa, t)) {
1859 tempstat = pfa->initstat;
1860 pfa->initstat = 2;
1861 pb = buf;
1862 rptr = getsval(y);
1863 do {
1864 if (patlen == 0 && *patbeg != 0) { /* matched empty string */
1865 if (mflag == 0) { /* can replace empty */
1866 num++;
1867 sptr = rptr;
1868 while (*sptr != 0) {
1869 adjbuf(&buf, &bufsz, 5+pb-buf, recsize, &pb, "gsub");
1870 if (*sptr == '\\') {
1871 backsub(&pb, &sptr);
1872 } else if (*sptr == '&') {
1873 sptr++;
1874 adjbuf(&buf, &bufsz, 1+patlen+pb-buf, recsize, &pb, "gsub");
1875 for (q = patbeg; q < patbeg+patlen; )
1876 *pb++ = *q++;
1877 } else
1878 *pb++ = *sptr++;
1881 if (*t == 0) /* at end */
1882 goto done;
1883 adjbuf(&buf, &bufsz, 2+pb-buf, recsize, &pb, "gsub");
1884 *pb++ = *t++;
1885 if (pb > buf + bufsz) /* BUG: not sure of this test */
1886 FATAL("gsub result0 %.30s too big; can't happen", buf);
1887 mflag = 0;
1889 else { /* matched nonempty string */
1890 num++;
1891 sptr = t;
1892 adjbuf(&buf, &bufsz, 1+(patbeg-sptr)+pb-buf, recsize, &pb, "gsub");
1893 while (sptr < patbeg)
1894 *pb++ = *sptr++;
1895 sptr = rptr;
1896 while (*sptr != 0) {
1897 adjbuf(&buf, &bufsz, 5+pb-buf, recsize, &pb, "gsub");
1898 if (*sptr == '\\') {
1899 backsub(&pb, &sptr);
1900 } else if (*sptr == '&') {
1901 sptr++;
1902 adjbuf(&buf, &bufsz, 1+patlen+pb-buf, recsize, &pb, "gsub");
1903 for (q = patbeg; q < patbeg+patlen; )
1904 *pb++ = *q++;
1905 } else
1906 *pb++ = *sptr++;
1908 t = patbeg + patlen;
1909 if (patlen == 0 || *t == 0 || *(t-1) == 0)
1910 goto done;
1911 if (pb > buf + bufsz)
1912 FATAL("gsub result1 %.30s too big; can't happen", buf);
1913 mflag = 1;
1915 } while (pmatch(pfa,t));
1916 sptr = t;
1917 adjbuf(&buf, &bufsz, 1+strlen(sptr)+pb-buf, 0, &pb, "gsub");
1918 while ((*pb++ = *sptr++) != 0)
1920 done: if (pb < buf + bufsz)
1921 *pb = '\0';
1922 else if (*(pb-1) != '\0')
1923 FATAL("gsub result2 %.30s truncated; can't happen", buf);
1924 setsval(x, buf); /* BUG: should be able to avoid copy + free */
1925 pfa->initstat = tempstat;
1927 tempfree(x);
1928 tempfree(y);
1929 x = gettemp();
1930 x->tval = NUM;
1931 x->fval = num;
1932 free(buf);
1933 return(x);
1936 void backsub(char **pb_ptr, char **sptr_ptr) /* handle \\& variations */
1937 { /* sptr[0] == '\\' */
1938 char *pb = *pb_ptr, *sptr = *sptr_ptr;
1940 if (sptr[1] == '\\') {
1941 if (sptr[2] == '\\' && sptr[3] == '&') { /* \\\& -> \& */
1942 *pb++ = '\\';
1943 *pb++ = '&';
1944 sptr += 4;
1945 } else if (sptr[2] == '&') { /* \\& -> \ + matched */
1946 *pb++ = '\\';
1947 sptr += 2;
1948 } else { /* \\x -> \\x */
1949 *pb++ = *sptr++;
1950 *pb++ = *sptr++;
1952 } else if (sptr[1] == '&') { /* literal & */
1953 sptr++;
1954 *pb++ = *sptr++;
1955 } else /* literal \ */
1956 *pb++ = *sptr++;
1958 *pb_ptr = pb;
1959 *sptr_ptr = sptr;