• Home
  • Line#
  • Scopes#
  • Navigate#
  • Raw
  • Download
1 /****************************************************************
2 Copyright (C) Lucent Technologies 1997
3 All Rights Reserved
4 
5 Permission to use, copy, modify, and distribute this software and
6 its documentation for any purpose and without fee is hereby
7 granted, provided that the above copyright notice appear in all
8 copies and that both that the copyright notice and this
9 permission notice and warranty disclaimer appear in supporting
10 documentation, and that the name Lucent Technologies or any of
11 its entities not be used in advertising or publicity pertaining
12 to distribution of the software without specific, written prior
13 permission.
14 
15 LUCENT DISCLAIMS ALL WARRANTIES WITH REGARD TO THIS SOFTWARE,
16 INCLUDING ALL IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS.
17 IN NO EVENT SHALL LUCENT OR ANY OF ITS ENTITIES BE LIABLE FOR ANY
18 SPECIAL, INDIRECT OR CONSEQUENTIAL DAMAGES OR ANY DAMAGES
19 WHATSOEVER RESULTING FROM LOSS OF USE, DATA OR PROFITS, WHETHER
20 IN AN ACTION OF CONTRACT, NEGLIGENCE OR OTHER TORTIOUS ACTION,
21 ARISING OUT OF OR IN CONNECTION WITH THE USE OR PERFORMANCE OF
22 THIS SOFTWARE.
23 ****************************************************************/
24 
25 #define DEBUG
26 #include <stdio.h>
27 #include <ctype.h>
28 #include <setjmp.h>
29 #include <limits.h>
30 #include <math.h>
31 #include <string.h>
32 #include <stdlib.h>
33 #include <time.h>
34 #include "awk.h"
35 #include "ytab.h"
36 
37 #define tempfree(x)	if (istemp(x)) tfree(x); else
38 
39 /*
40 #undef tempfree
41 
42 void tempfree(Cell *p) {
43 	if (p->ctype == OCELL && (p->csub < CUNK || p->csub > CFREE)) {
44 		WARNING("bad csub %d in Cell %d %s",
45 			p->csub, p->ctype, p->sval);
46 	}
47 	if (istemp(p))
48 		tfree(p);
49 }
50 */
51 
52 /* do we really need these? */
53 /* #ifdef _NFILE */
54 /* #ifndef FOPEN_MAX */
55 /* #define FOPEN_MAX _NFILE */
56 /* #endif */
57 /* #endif */
58 /*  */
59 /* #ifndef	FOPEN_MAX */
60 /* #define	FOPEN_MAX	40 */	/* max number of open files */
61 /* #endif */
62 /*  */
63 /* #ifndef RAND_MAX */
64 /* #define RAND_MAX	32767 */	/* all that ansi guarantees */
65 /* #endif */
66 
67 jmp_buf env;
68 extern	int	pairstack[];
69 extern	Awkfloat	srand_seed;
70 
71 Node	*winner = NULL;	/* root of parse tree */
72 Cell	*tmps;		/* free temporary cells for execution */
73 
74 static Cell	truecell	={ OBOOL, BTRUE, 0, 0, 1.0, NUM };
75 Cell	*True	= &truecell;
76 static Cell	falsecell	={ OBOOL, BFALSE, 0, 0, 0.0, NUM };
77 Cell	*False	= &falsecell;
78 static Cell	breakcell	={ OJUMP, JBREAK, 0, 0, 0.0, NUM };
79 Cell	*jbreak	= &breakcell;
80 static Cell	contcell	={ OJUMP, JCONT, 0, 0, 0.0, NUM };
81 Cell	*jcont	= &contcell;
82 static Cell	nextcell	={ OJUMP, JNEXT, 0, 0, 0.0, NUM };
83 Cell	*jnext	= &nextcell;
84 static Cell	nextfilecell	={ OJUMP, JNEXTFILE, 0, 0, 0.0, NUM };
85 Cell	*jnextfile	= &nextfilecell;
86 static Cell	exitcell	={ OJUMP, JEXIT, 0, 0, 0.0, NUM };
87 Cell	*jexit	= &exitcell;
88 static Cell	retcell		={ OJUMP, JRET, 0, 0, 0.0, NUM };
89 Cell	*jret	= &retcell;
90 static Cell	tempcell	={ OCELL, CTEMP, 0, "", 0.0, NUM|STR|DONTFREE };
91 
92 Node	*curnode = NULL;	/* the node being executed, for debugging */
93 
94 /* buffer memory management */
adjbuf(char ** pbuf,int * psiz,int minlen,int quantum,char ** pbptr,const char * whatrtn)95 int adjbuf(char **pbuf, int *psiz, int minlen, int quantum, char **pbptr,
96 	const char *whatrtn)
97 /* pbuf:    address of pointer to buffer being managed
98  * psiz:    address of buffer size variable
99  * minlen:  minimum length of buffer needed
100  * quantum: buffer size quantum
101  * pbptr:   address of movable pointer into buffer, or 0 if none
102  * whatrtn: name of the calling routine if failure should cause fatal error
103  *
104  * return   0 for realloc failure, !=0 for success
105  */
106 {
107 	if (minlen > *psiz) {
108 		char *tbuf;
109 		int rminlen = quantum ? minlen % quantum : 0;
110 		int boff = pbptr ? *pbptr - *pbuf : 0;
111 		/* round up to next multiple of quantum */
112 		if (rminlen)
113 			minlen += quantum - rminlen;
114 		tbuf = (char *) realloc(*pbuf, minlen);
115 		dprintf( ("adjbuf %s: %d %d (pbuf=%p, tbuf=%p)\n", whatrtn, *psiz, minlen, *pbuf, tbuf) );
116 		if (tbuf == NULL) {
117 			if (whatrtn)
118 				FATAL("out of memory in %s", whatrtn);
119 			return 0;
120 		}
121 		*pbuf = tbuf;
122 		*psiz = minlen;
123 		if (pbptr)
124 			*pbptr = tbuf + boff;
125 	}
126 	return 1;
127 }
128 
run(Node * a)129 void run(Node *a)	/* execution of parse tree starts here */
130 {
131 	extern void stdinit(void);
132 
133 	stdinit();
134 	execute(a);
135 	closeall();
136 }
137 
execute(Node * u)138 Cell *execute(Node *u)	/* execute a node of the parse tree */
139 {
140 	Cell *(*proc)(Node **, int);
141 	Cell *x;
142 	Node *a;
143 
144 	if (u == NULL)
145 		return(True);
146 	for (a = u; ; a = a->nnext) {
147 		curnode = a;
148 		if (isvalue(a)) {
149 			x = (Cell *) (a->narg[0]);
150 			if (isfld(x) && !donefld)
151 				fldbld();
152 			else if (isrec(x) && !donerec)
153 				recbld();
154 			return(x);
155 		}
156 		if (notlegal(a->nobj))	/* probably a Cell* but too risky to print */
157 			FATAL("illegal statement");
158 		proc = proctab[a->nobj-FIRSTTOKEN];
159 		x = (*proc)(a->narg, a->nobj);
160 		if (isfld(x) && !donefld)
161 			fldbld();
162 		else if (isrec(x) && !donerec)
163 			recbld();
164 		if (isexpr(a))
165 			return(x);
166 		if (isjump(x))
167 			return(x);
168 		if (a->nnext == NULL)
169 			return(x);
170 		tempfree(x);
171 	}
172 }
173 
174 
program(Node ** a,int n)175 Cell *program(Node **a, int n)	/* execute an awk program */
176 {				/* a[0] = BEGIN, a[1] = body, a[2] = END */
177 	Cell *x;
178 
179 	if (setjmp(env) != 0)
180 		goto ex;
181 	if (a[0]) {		/* BEGIN */
182 		x = execute(a[0]);
183 		if (isexit(x))
184 			return(True);
185 		if (isjump(x))
186 			FATAL("illegal break, continue, next or nextfile from BEGIN");
187 		tempfree(x);
188 	}
189 	if (a[1] || a[2])
190 		while (getrec(&record, &recsize, 1) > 0) {
191 			x = execute(a[1]);
192 			if (isexit(x))
193 				break;
194 			tempfree(x);
195 		}
196   ex:
197 	if (setjmp(env) != 0)	/* handles exit within END */
198 		goto ex1;
199 	if (a[2]) {		/* END */
200 		x = execute(a[2]);
201 		if (isbreak(x) || isnext(x) || iscont(x))
202 			FATAL("illegal break, continue, next or nextfile from END");
203 		tempfree(x);
204 	}
205   ex1:
206 	return(True);
207 }
208 
209 struct Frame {	/* stack frame for awk function calls */
210 	int nargs;	/* number of arguments in this call */
211 	Cell *fcncell;	/* pointer to Cell for function */
212 	Cell **args;	/* pointer to array of arguments after execute */
213 	Cell *retval;	/* return value */
214 };
215 
216 #define	NARGS	50	/* max args in a call */
217 
218 struct Frame *frame = NULL;	/* base of stack frames; dynamically allocated */
219 int	nframe = 0;		/* number of frames allocated */
220 struct Frame *fp = NULL;	/* frame pointer. bottom level unused */
221 
call(Node ** a,int n)222 Cell *call(Node **a, int n)	/* function call.  very kludgy and fragile */
223 {
224 	static Cell newcopycell = { OCELL, CCOPY, 0, "", 0.0, NUM|STR|DONTFREE };
225 	int i, ncall, ndef;
226 	int freed = 0; /* handles potential double freeing when fcn & param share a tempcell */
227 	Node *x;
228 	Cell *args[NARGS], *oargs[NARGS];	/* BUG: fixed size arrays */
229 	Cell *y, *z, *fcn;
230 	char *s;
231 
232 	fcn = execute(a[0]);	/* the function itself */
233 	s = fcn->nval;
234 	if (!isfcn(fcn))
235 		FATAL("calling undefined function %s", s);
236 	if (frame == NULL) {
237 		fp = frame = (struct Frame *) calloc(nframe += 100, sizeof(struct Frame));
238 		if (frame == NULL)
239 			FATAL("out of space for stack frames calling %s", s);
240 	}
241 	for (ncall = 0, x = a[1]; x != NULL; x = x->nnext)	/* args in call */
242 		ncall++;
243 	ndef = (int) fcn->fval;			/* args in defn */
244 	   dprintf( ("calling %s, %d args (%d in defn), fp=%d\n", s, ncall, ndef, (int) (fp-frame)) );
245 	if (ncall > ndef)
246 		WARNING("function %s called with %d args, uses only %d",
247 			s, ncall, ndef);
248 	if (ncall + ndef > NARGS)
249 		FATAL("function %s has %d arguments, limit %d", s, ncall+ndef, NARGS);
250 	for (i = 0, x = a[1]; x != NULL; i++, x = x->nnext) {	/* get call args */
251 		   dprintf( ("evaluate args[%d], fp=%d:\n", i, (int) (fp-frame)) );
252 		y = execute(x);
253 		oargs[i] = y;
254 		   dprintf( ("args[%d]: %s %f <%s>, t=%o\n",
255 			   i, NN(y->nval), y->fval, isarr(y) ? "(array)" : NN(y->sval), y->tval) );
256 		if (isfcn(y))
257 			FATAL("can't use function %s as argument in %s", y->nval, s);
258 		if (isarr(y))
259 			args[i] = y;	/* arrays by ref */
260 		else
261 			args[i] = copycell(y);
262 		tempfree(y);
263 	}
264 	for ( ; i < ndef; i++) {	/* add null args for ones not provided */
265 		args[i] = gettemp();
266 		*args[i] = newcopycell;
267 	}
268 	fp++;	/* now ok to up frame */
269 	if (fp >= frame + nframe) {
270 		int dfp = fp - frame;	/* old index */
271 		frame = (struct Frame *)
272 			realloc((char *) frame, (nframe += 100) * sizeof(struct Frame));
273 		if (frame == NULL)
274 			FATAL("out of space for stack frames in %s", s);
275 		fp = frame + dfp;
276 	}
277 	fp->fcncell = fcn;
278 	fp->args = args;
279 	fp->nargs = ndef;	/* number defined with (excess are locals) */
280 	fp->retval = gettemp();
281 
282 	   dprintf( ("start exec of %s, fp=%d\n", s, (int) (fp-frame)) );
283 	y = execute((Node *)(fcn->sval));	/* execute body */
284 	   dprintf( ("finished exec of %s, fp=%d\n", s, (int) (fp-frame)) );
285 
286 	for (i = 0; i < ndef; i++) {
287 		Cell *t = fp->args[i];
288 		if (isarr(t)) {
289 			if (t->csub == CCOPY) {
290 				if (i >= ncall) {
291 					freesymtab(t);
292 					t->csub = CTEMP;
293 					tempfree(t);
294 				} else {
295 					oargs[i]->tval = t->tval;
296 					oargs[i]->tval &= ~(STR|NUM|DONTFREE);
297 					oargs[i]->sval = t->sval;
298 					tempfree(t);
299 				}
300 			}
301 		} else if (t != y) {	/* kludge to prevent freeing twice */
302 			t->csub = CTEMP;
303 			tempfree(t);
304 		} else if (t == y && t->csub == CCOPY) {
305 			t->csub = CTEMP;
306 			tempfree(t);
307 			freed = 1;
308 		}
309 	}
310 	tempfree(fcn);
311 	if (isexit(y) || isnext(y))
312 		return y;
313 	if (freed == 0) {
314 		tempfree(y);	/* don't free twice! */
315 	}
316 	z = fp->retval;			/* return value */
317 	   dprintf( ("%s returns %g |%s| %o\n", s, getfval(z), getsval(z), z->tval) );
318 	fp--;
319 	return(z);
320 }
321 
copycell(Cell * x)322 Cell *copycell(Cell *x)	/* make a copy of a cell in a temp */
323 {
324 	Cell *y;
325 
326 	y = gettemp();
327 	y->csub = CCOPY;	/* prevents freeing until call is over */
328 	y->nval = x->nval;	/* BUG? */
329 	if (isstr(x))
330 		y->sval = tostring(x->sval);
331 	y->fval = x->fval;
332 	y->tval = x->tval & ~(CON|FLD|REC|DONTFREE);	/* copy is not constant or field */
333 							/* is DONTFREE right? */
334 	return y;
335 }
336 
arg(Node ** a,int n)337 Cell *arg(Node **a, int n)	/* nth argument of a function */
338 {
339 
340 	n = ptoi(a[0]);	/* argument number, counting from 0 */
341 	   dprintf( ("arg(%d), fp->nargs=%d\n", n, fp->nargs) );
342 	if (n+1 > fp->nargs)
343 		FATAL("argument #%d of function %s was not supplied",
344 			n+1, fp->fcncell->nval);
345 	return fp->args[n];
346 }
347 
jump(Node ** a,int n)348 Cell *jump(Node **a, int n)	/* break, continue, next, nextfile, return */
349 {
350 	Cell *y;
351 
352 	switch (n) {
353 	case EXIT:
354 		if (a[0] != NULL) {
355 			y = execute(a[0]);
356 			errorflag = (int) getfval(y);
357 			tempfree(y);
358 		}
359 		longjmp(env, 1);
360 	case RETURN:
361 		if (a[0] != NULL) {
362 			y = execute(a[0]);
363 			if ((y->tval & (STR|NUM)) == (STR|NUM)) {
364 				setsval(fp->retval, getsval(y));
365 				fp->retval->fval = getfval(y);
366 				fp->retval->tval |= NUM;
367 			}
368 			else if (y->tval & STR)
369 				setsval(fp->retval, getsval(y));
370 			else if (y->tval & NUM)
371 				setfval(fp->retval, getfval(y));
372 			else		/* can't happen */
373 				FATAL("bad type variable %d", y->tval);
374 			tempfree(y);
375 		}
376 		return(jret);
377 	case NEXT:
378 		return(jnext);
379 	case NEXTFILE:
380 		nextfile();
381 		return(jnextfile);
382 	case BREAK:
383 		return(jbreak);
384 	case CONTINUE:
385 		return(jcont);
386 	default:	/* can't happen */
387 		FATAL("illegal jump type %d", n);
388 	}
389 	return 0;	/* not reached */
390 }
391 
awkgetline(Node ** a,int n)392 Cell *awkgetline(Node **a, int n)	/* get next line from specific input */
393 {		/* a[0] is variable, a[1] is operator, a[2] is filename */
394 	Cell *r, *x;
395 	extern Cell **fldtab;
396 	FILE *fp;
397 	char *buf;
398 	int bufsize = recsize;
399 	int mode;
400 
401 	if ((buf = (char *) malloc(bufsize)) == NULL)
402 		FATAL("out of memory in getline");
403 
404 	fflush(stdout);	/* in case someone is waiting for a prompt */
405 	r = gettemp();
406 	if (a[1] != NULL) {		/* getline < file */
407 		x = execute(a[2]);		/* filename */
408 		mode = ptoi(a[1]);
409 		if (mode == '|')		/* input pipe */
410 			mode = LE;	/* arbitrary flag */
411 		fp = openfile(mode, getsval(x));
412 		tempfree(x);
413 		if (fp == NULL)
414 			n = -1;
415 		else
416 			n = readrec(&buf, &bufsize, fp);
417 		if (n <= 0) {
418 			;
419 		} else if (a[0] != NULL) {	/* getline var <file */
420 			x = execute(a[0]);
421 			setsval(x, buf);
422 			tempfree(x);
423 		} else {			/* getline <file */
424 			setsval(fldtab[0], buf);
425 			if (is_number(fldtab[0]->sval)) {
426 				fldtab[0]->fval = atof(fldtab[0]->sval);
427 				fldtab[0]->tval |= NUM;
428 			}
429 		}
430 	} else {			/* bare getline; use current input */
431 		if (a[0] == NULL)	/* getline */
432 			n = getrec(&record, &recsize, 1);
433 		else {			/* getline var */
434 			n = getrec(&buf, &bufsize, 0);
435 			x = execute(a[0]);
436 			setsval(x, buf);
437 			tempfree(x);
438 		}
439 	}
440 	setfval(r, (Awkfloat) n);
441 	free(buf);
442 	return r;
443 }
444 
getnf(Node ** a,int n)445 Cell *getnf(Node **a, int n)	/* get NF */
446 {
447 	if (donefld == 0)
448 		fldbld();
449 	return (Cell *) a[0];
450 }
451 
array(Node ** a,int n)452 Cell *array(Node **a, int n)	/* a[0] is symtab, a[1] is list of subscripts */
453 {
454 	Cell *x, *y, *z;
455 	char *s;
456 	Node *np;
457 	char *buf;
458 	int bufsz = recsize;
459 	int nsub = strlen(*SUBSEP);
460 
461 	if ((buf = (char *) malloc(bufsz)) == NULL)
462 		FATAL("out of memory in array");
463 
464 	x = execute(a[0]);	/* Cell* for symbol table */
465 	buf[0] = 0;
466 	for (np = a[1]; np; np = np->nnext) {
467 		y = execute(np);	/* subscript */
468 		s = getsval(y);
469 		if (!adjbuf(&buf, &bufsz, strlen(buf)+strlen(s)+nsub+1, recsize, 0, "array"))
470 			FATAL("out of memory for %s[%s...]", x->nval, buf);
471 		strcat(buf, s);
472 		if (np->nnext)
473 			strcat(buf, *SUBSEP);
474 		tempfree(y);
475 	}
476 	if (!isarr(x)) {
477 		   dprintf( ("making %s into an array\n", NN(x->nval)) );
478 		if (freeable(x))
479 			xfree(x->sval);
480 		x->tval &= ~(STR|NUM|DONTFREE);
481 		x->tval |= ARR;
482 		x->sval = (char *) makesymtab(NSYMTAB);
483 	}
484 	z = setsymtab(buf, "", 0.0, STR|NUM, (Array *) x->sval);
485 	z->ctype = OCELL;
486 	z->csub = CVAR;
487 	tempfree(x);
488 	free(buf);
489 	return(z);
490 }
491 
awkdelete(Node ** a,int n)492 Cell *awkdelete(Node **a, int n)	/* a[0] is symtab, a[1] is list of subscripts */
493 {
494 	Cell *x, *y;
495 	Node *np;
496 	char *s;
497 	int nsub = strlen(*SUBSEP);
498 
499 	x = execute(a[0]);	/* Cell* for symbol table */
500 	if (!isarr(x))
501 		return True;
502 	if (a[1] == 0) {	/* delete the elements, not the table */
503 		freesymtab(x);
504 		x->tval &= ~STR;
505 		x->tval |= ARR;
506 		x->sval = (char *) makesymtab(NSYMTAB);
507 	} else {
508 		int bufsz = recsize;
509 		char *buf;
510 		if ((buf = (char *) malloc(bufsz)) == NULL)
511 			FATAL("out of memory in adelete");
512 		buf[0] = 0;
513 		for (np = a[1]; np; np = np->nnext) {
514 			y = execute(np);	/* subscript */
515 			s = getsval(y);
516 			if (!adjbuf(&buf, &bufsz, strlen(buf)+strlen(s)+nsub+1, recsize, 0, "awkdelete"))
517 				FATAL("out of memory deleting %s[%s...]", x->nval, buf);
518 			strcat(buf, s);
519 			if (np->nnext)
520 				strcat(buf, *SUBSEP);
521 			tempfree(y);
522 		}
523 		freeelem(x, buf);
524 		free(buf);
525 	}
526 	tempfree(x);
527 	return True;
528 }
529 
intest(Node ** a,int n)530 Cell *intest(Node **a, int n)	/* a[0] is index (list), a[1] is symtab */
531 {
532 	Cell *x, *ap, *k;
533 	Node *p;
534 	char *buf;
535 	char *s;
536 	int bufsz = recsize;
537 	int nsub = strlen(*SUBSEP);
538 
539 	ap = execute(a[1]);	/* array name */
540 	if (!isarr(ap)) {
541 		   dprintf( ("making %s into an array\n", ap->nval) );
542 		if (freeable(ap))
543 			xfree(ap->sval);
544 		ap->tval &= ~(STR|NUM|DONTFREE);
545 		ap->tval |= ARR;
546 		ap->sval = (char *) makesymtab(NSYMTAB);
547 	}
548 	if ((buf = (char *) malloc(bufsz)) == NULL) {
549 		FATAL("out of memory in intest");
550 	}
551 	buf[0] = 0;
552 	for (p = a[0]; p; p = p->nnext) {
553 		x = execute(p);	/* expr */
554 		s = getsval(x);
555 		if (!adjbuf(&buf, &bufsz, strlen(buf)+strlen(s)+nsub+1, recsize, 0, "intest"))
556 			FATAL("out of memory deleting %s[%s...]", x->nval, buf);
557 		strcat(buf, s);
558 		tempfree(x);
559 		if (p->nnext)
560 			strcat(buf, *SUBSEP);
561 	}
562 	k = lookup(buf, (Array *) ap->sval);
563 	tempfree(ap);
564 	free(buf);
565 	if (k == NULL)
566 		return(False);
567 	else
568 		return(True);
569 }
570 
571 
matchop(Node ** a,int n)572 Cell *matchop(Node **a, int n)	/* ~ and match() */
573 {
574 	Cell *x, *y;
575 	char *s, *t;
576 	int i;
577 	fa *pfa;
578 	int (*mf)(fa *, const char *) = match, mode = 0;
579 
580 	if (n == MATCHFCN) {
581 		mf = pmatch;
582 		mode = 1;
583 	}
584 	x = execute(a[1]);	/* a[1] = target text */
585 	s = getsval(x);
586 	if (a[0] == 0)		/* a[1] == 0: already-compiled reg expr */
587 		i = (*mf)((fa *) a[2], s);
588 	else {
589 		y = execute(a[2]);	/* a[2] = regular expr */
590 		t = getsval(y);
591 		pfa = makedfa(t, mode);
592 		i = (*mf)(pfa, s);
593 		tempfree(y);
594 	}
595 	tempfree(x);
596 	if (n == MATCHFCN) {
597 		int start = patbeg - s + 1;
598 		if (patlen < 0)
599 			start = 0;
600 		setfval(rstartloc, (Awkfloat) start);
601 		setfval(rlengthloc, (Awkfloat) patlen);
602 		x = gettemp();
603 		x->tval = NUM;
604 		x->fval = start;
605 		return x;
606 	} else if ((n == MATCH && i == 1) || (n == NOTMATCH && i == 0))
607 		return(True);
608 	else
609 		return(False);
610 }
611 
612 
boolop(Node ** a,int n)613 Cell *boolop(Node **a, int n)	/* a[0] || a[1], a[0] && a[1], !a[0] */
614 {
615 	Cell *x, *y;
616 	int i;
617 
618 	x = execute(a[0]);
619 	i = istrue(x);
620 	tempfree(x);
621 	switch (n) {
622 	case BOR:
623 		if (i) return(True);
624 		y = execute(a[1]);
625 		i = istrue(y);
626 		tempfree(y);
627 		if (i) return(True);
628 		else return(False);
629 	case AND:
630 		if ( !i ) return(False);
631 		y = execute(a[1]);
632 		i = istrue(y);
633 		tempfree(y);
634 		if (i) return(True);
635 		else return(False);
636 	case NOT:
637 		if (i) return(False);
638 		else return(True);
639 	default:	/* can't happen */
640 		FATAL("unknown boolean operator %d", n);
641 	}
642 	return 0;	/*NOTREACHED*/
643 }
644 
relop(Node ** a,int n)645 Cell *relop(Node **a, int n)	/* a[0 < a[1], etc. */
646 {
647 	int i;
648 	Cell *x, *y;
649 	Awkfloat j;
650 
651 	x = execute(a[0]);
652 	y = execute(a[1]);
653 	if (x->tval&NUM && y->tval&NUM) {
654 		j = x->fval - y->fval;
655 		i = j<0? -1: (j>0? 1: 0);
656 	} else {
657 		i = strcmp(getsval(x), getsval(y));
658 	}
659 	tempfree(x);
660 	tempfree(y);
661 	switch (n) {
662 	case LT:	if (i<0) return(True);
663 			else return(False);
664 	case LE:	if (i<=0) return(True);
665 			else return(False);
666 	case NE:	if (i!=0) return(True);
667 			else return(False);
668 	case EQ:	if (i == 0) return(True);
669 			else return(False);
670 	case GE:	if (i>=0) return(True);
671 			else return(False);
672 	case GT:	if (i>0) return(True);
673 			else return(False);
674 	default:	/* can't happen */
675 		FATAL("unknown relational operator %d", n);
676 	}
677 	return 0;	/*NOTREACHED*/
678 }
679 
tfree(Cell * a)680 void tfree(Cell *a)	/* free a tempcell */
681 {
682 	if (freeable(a)) {
683 		   dprintf( ("freeing %s %s %o\n", NN(a->nval), NN(a->sval), a->tval) );
684 		xfree(a->sval);
685 	}
686 	if (a == tmps)
687 		FATAL("tempcell list is curdled");
688 	a->cnext = tmps;
689 	tmps = a;
690 }
691 
gettemp(void)692 Cell *gettemp(void)	/* get a tempcell */
693 {	int i;
694 	Cell *x;
695 
696 	if (!tmps) {
697 		tmps = (Cell *) calloc(100, sizeof(Cell));
698 		if (!tmps)
699 			FATAL("out of space for temporaries");
700 		for(i = 1; i < 100; i++)
701 			tmps[i-1].cnext = &tmps[i];
702 		tmps[i-1].cnext = 0;
703 	}
704 	x = tmps;
705 	tmps = x->cnext;
706 	*x = tempcell;
707 	return(x);
708 }
709 
indirect(Node ** a,int n)710 Cell *indirect(Node **a, int n)	/* $( a[0] ) */
711 {
712 	Awkfloat val;
713 	Cell *x;
714 	int m;
715 	char *s;
716 
717 	x = execute(a[0]);
718 	val = getfval(x);	/* freebsd: defend against super large field numbers */
719 	if ((Awkfloat)INT_MAX < val)
720 		FATAL("trying to access out of range field %s", x->nval);
721 	m = (int) val;
722 	if (m == 0 && !is_number(s = getsval(x)))	/* suspicion! */
723 		FATAL("illegal field $(%s), name \"%s\"", s, x->nval);
724 		/* BUG: can x->nval ever be null??? */
725 	tempfree(x);
726 	x = fieldadr(m);
727 	x->ctype = OCELL;	/* BUG?  why are these needed? */
728 	x->csub = CFLD;
729 	return(x);
730 }
731 
substr(Node ** a,int nnn)732 Cell *substr(Node **a, int nnn)		/* substr(a[0], a[1], a[2]) */
733 {
734 	int k, m, n;
735 	char *s;
736 	int temp;
737 	Cell *x, *y, *z = 0;
738 
739 	x = execute(a[0]);
740 	y = execute(a[1]);
741 	if (a[2] != 0)
742 		z = execute(a[2]);
743 	s = getsval(x);
744 	k = strlen(s) + 1;
745 	if (k <= 1) {
746 		tempfree(x);
747 		tempfree(y);
748 		if (a[2] != 0) {
749 			tempfree(z);
750 		}
751 		x = gettemp();
752 		setsval(x, "");
753 		return(x);
754 	}
755 	m = (int) getfval(y);
756 	if (m <= 0)
757 		m = 1;
758 	else if (m > k)
759 		m = k;
760 	tempfree(y);
761 	if (a[2] != 0) {
762 		n = (int) getfval(z);
763 		tempfree(z);
764 	} else
765 		n = k - 1;
766 	if (n < 0)
767 		n = 0;
768 	else if (n > k - m)
769 		n = k - m;
770 	   dprintf( ("substr: m=%d, n=%d, s=%s\n", m, n, s) );
771 	y = gettemp();
772 	temp = s[n+m-1];	/* with thanks to John Linderman */
773 	s[n+m-1] = '\0';
774 	setsval(y, s + m - 1);
775 	s[n+m-1] = temp;
776 	tempfree(x);
777 	return(y);
778 }
779 
sindex(Node ** a,int nnn)780 Cell *sindex(Node **a, int nnn)		/* index(a[0], a[1]) */
781 {
782 	Cell *x, *y, *z;
783 	char *s1, *s2, *p1, *p2, *q;
784 	Awkfloat v = 0.0;
785 
786 	x = execute(a[0]);
787 	s1 = getsval(x);
788 	y = execute(a[1]);
789 	s2 = getsval(y);
790 
791 	z = gettemp();
792 	for (p1 = s1; *p1 != '\0'; p1++) {
793 		for (q=p1, p2=s2; *p2 != '\0' && *q == *p2; q++, p2++)
794 			;
795 		if (*p2 == '\0') {
796 			v = (Awkfloat) (p1 - s1 + 1);	/* origin 1 */
797 			break;
798 		}
799 	}
800 	tempfree(x);
801 	tempfree(y);
802 	setfval(z, v);
803 	return(z);
804 }
805 
806 #define	MAXNUMSIZE	50
807 
format(char ** pbuf,int * pbufsize,const char * s,Node * a)808 int format(char **pbuf, int *pbufsize, const char *s, Node *a)	/* printf-like conversions */
809 {
810 	char *fmt;
811 	char *p, *t;
812 	const char *os;
813 	Cell *x;
814 	int flag = 0, n;
815 	int fmtwd; /* format width */
816 	int fmtsz = recsize;
817 	char *buf = *pbuf;
818 	int bufsize = *pbufsize;
819 
820 	os = s;
821 	p = buf;
822 	if ((fmt = (char *) malloc(fmtsz)) == NULL)
823 		FATAL("out of memory in format()");
824 	while (*s) {
825 		adjbuf(&buf, &bufsize, MAXNUMSIZE+1+p-buf, recsize, &p, "format1");
826 		if (*s != '%') {
827 			*p++ = *s++;
828 			continue;
829 		}
830 		if (*(s+1) == '%') {
831 			*p++ = '%';
832 			s += 2;
833 			continue;
834 		}
835 		/* have to be real careful in case this is a huge number, eg, %100000d */
836 		fmtwd = atoi(s+1);
837 		if (fmtwd < 0)
838 			fmtwd = -fmtwd;
839 		adjbuf(&buf, &bufsize, fmtwd+1+p-buf, recsize, &p, "format2");
840 		for (t = fmt; (*t++ = *s) != '\0'; s++) {
841 			if (!adjbuf(&fmt, &fmtsz, MAXNUMSIZE+1+t-fmt, recsize, &t, "format3"))
842 				FATAL("format item %.30s... ran format() out of memory", os);
843 			if (isalpha((uschar)*s) && *s != 'l' && *s != 'h' && *s != 'L')
844 				break;	/* the ansi panoply */
845 			if (*s == '*') {
846 				x = execute(a);
847 				a = a->nnext;
848 				sprintf(t-1, "%d", fmtwd=(int) getfval(x));
849 				if (fmtwd < 0)
850 					fmtwd = -fmtwd;
851 				adjbuf(&buf, &bufsize, fmtwd+1+p-buf, recsize, &p, "format");
852 				t = fmt + strlen(fmt);
853 				tempfree(x);
854 			}
855 		}
856 		*t = '\0';
857 		if (fmtwd < 0)
858 			fmtwd = -fmtwd;
859 		adjbuf(&buf, &bufsize, fmtwd+1+p-buf, recsize, &p, "format4");
860 
861 		switch (*s) {
862 		case 'f': case 'e': case 'g': case 'E': case 'G':
863 			flag = 'f';
864 			break;
865 		case 'd': case 'i':
866 			flag = 'd';
867 			if(*(s-1) == 'l') break;
868 			*(t-1) = 'l';
869 			*t = 'd';
870 			*++t = '\0';
871 			break;
872 		case 'o': case 'x': case 'X': case 'u':
873 			flag = *(s-1) == 'l' ? 'd' : 'u';
874 			break;
875 		case 's':
876 			flag = 's';
877 			break;
878 		case 'c':
879 			flag = 'c';
880 			break;
881 		default:
882 			WARNING("weird printf conversion %s", fmt);
883 			flag = '?';
884 			break;
885 		}
886 		if (a == NULL)
887 			FATAL("not enough args in printf(%s)", os);
888 		x = execute(a);
889 		a = a->nnext;
890 		n = MAXNUMSIZE;
891 		if (fmtwd > n)
892 			n = fmtwd;
893 		adjbuf(&buf, &bufsize, 1+n+p-buf, recsize, &p, "format5");
894 		switch (flag) {
895 		case '?':	sprintf(p, "%s", fmt);	/* unknown, so dump it too */
896 			t = getsval(x);
897 			n = strlen(t);
898 			if (fmtwd > n)
899 				n = fmtwd;
900 			adjbuf(&buf, &bufsize, 1+strlen(p)+n+p-buf, recsize, &p, "format6");
901 			p += strlen(p);
902 			sprintf(p, "%s", t);
903 			break;
904 		case 'f':	sprintf(p, fmt, getfval(x)); break;
905 		case 'd':	sprintf(p, fmt, (long) getfval(x)); break;
906 		case 'u':	sprintf(p, fmt, (int) getfval(x)); break;
907 		case 's':
908 			t = getsval(x);
909 			n = strlen(t);
910 			if (fmtwd > n)
911 				n = fmtwd;
912 			if (!adjbuf(&buf, &bufsize, 1+n+p-buf, recsize, &p, "format7"))
913 				FATAL("huge string/format (%d chars) in printf %.30s... ran format() out of memory", n, t);
914 			sprintf(p, fmt, t);
915 			break;
916 		case 'c':
917 			if (isnum(x)) {
918 				if (getfval(x))
919 					sprintf(p, fmt, (int) getfval(x));
920 				else {
921 					*p++ = '\0'; /* explicit null byte */
922 					*p = '\0';   /* next output will start here */
923 				}
924 			} else
925 				sprintf(p, fmt, getsval(x)[0]);
926 			break;
927 		default:
928 			FATAL("can't happen: bad conversion %c in format()", flag);
929 		}
930 		tempfree(x);
931 		p += strlen(p);
932 		s++;
933 	}
934 	*p = '\0';
935 	free(fmt);
936 	for ( ; a; a = a->nnext)		/* evaluate any remaining args */
937 		execute(a);
938 	*pbuf = buf;
939 	*pbufsize = bufsize;
940 	return p - buf;
941 }
942 
awksprintf(Node ** a,int n)943 Cell *awksprintf(Node **a, int n)		/* sprintf(a[0]) */
944 {
945 	Cell *x;
946 	Node *y;
947 	char *buf;
948 	int bufsz=3*recsize;
949 
950 	if ((buf = (char *) malloc(bufsz)) == NULL)
951 		FATAL("out of memory in awksprintf");
952 	y = a[0]->nnext;
953 	x = execute(a[0]);
954 	if (format(&buf, &bufsz, getsval(x), y) == -1)
955 		FATAL("sprintf string %.30s... too long.  can't happen.", buf);
956 	tempfree(x);
957 	x = gettemp();
958 	x->sval = buf;
959 	x->tval = STR;
960 	return(x);
961 }
962 
awkprintf(Node ** a,int n)963 Cell *awkprintf(Node **a, int n)		/* printf */
964 {	/* a[0] is list of args, starting with format string */
965 	/* a[1] is redirection operator, a[2] is redirection file */
966 	FILE *fp;
967 	Cell *x;
968 	Node *y;
969 	char *buf;
970 	int len;
971 	int bufsz=3*recsize;
972 
973 	if ((buf = (char *) malloc(bufsz)) == NULL)
974 		FATAL("out of memory in awkprintf");
975 	y = a[0]->nnext;
976 	x = execute(a[0]);
977 	if ((len = format(&buf, &bufsz, getsval(x), y)) == -1)
978 		FATAL("printf string %.30s... too long.  can't happen.", buf);
979 	tempfree(x);
980 	if (a[1] == NULL) {
981 		/* fputs(buf, stdout); */
982 		fwrite(buf, len, 1, stdout);
983 		if (ferror(stdout))
984 			FATAL("write error on stdout");
985 	} else {
986 		fp = redirect(ptoi(a[1]), a[2]);
987 		/* fputs(buf, fp); */
988 		fwrite(buf, len, 1, fp);
989 		fflush(fp);
990 		if (ferror(fp))
991 			FATAL("write error on %s", filename(fp));
992 	}
993 	free(buf);
994 	return(True);
995 }
996 
arith(Node ** a,int n)997 Cell *arith(Node **a, int n)	/* a[0] + a[1], etc.  also -a[0] */
998 {
999 	Awkfloat i, j = 0;
1000 	double v;
1001 	Cell *x, *y, *z;
1002 
1003 	x = execute(a[0]);
1004 	i = getfval(x);
1005 	tempfree(x);
1006 	if (n != UMINUS) {
1007 		y = execute(a[1]);
1008 		j = getfval(y);
1009 		tempfree(y);
1010 	}
1011 	z = gettemp();
1012 	switch (n) {
1013 	case ADD:
1014 		i += j;
1015 		break;
1016 	case MINUS:
1017 		i -= j;
1018 		break;
1019 	case MULT:
1020 		i *= j;
1021 		break;
1022 	case DIVIDE:
1023 		if (j == 0)
1024 			FATAL("division by zero");
1025 		i /= j;
1026 		break;
1027 	case MOD:
1028 		if (j == 0)
1029 			FATAL("division by zero in mod");
1030 		modf(i/j, &v);
1031 		i = i - j * v;
1032 		break;
1033 	case UMINUS:
1034 		i = -i;
1035 		break;
1036 	case POWER:
1037 		if (j >= 0 && modf(j, &v) == 0.0)	/* pos integer exponent */
1038 			i = ipow(i, (int) j);
1039 		else
1040 			i = errcheck(pow(i, j), "pow");
1041 		break;
1042 	default:	/* can't happen */
1043 		FATAL("illegal arithmetic operator %d", n);
1044 	}
1045 	setfval(z, i);
1046 	return(z);
1047 }
1048 
ipow(double x,int n)1049 double ipow(double x, int n)	/* x**n.  ought to be done by pow, but isn't always */
1050 {
1051 	double v;
1052 
1053 	if (n <= 0)
1054 		return 1;
1055 	v = ipow(x, n/2);
1056 	if (n % 2 == 0)
1057 		return v * v;
1058 	else
1059 		return x * v * v;
1060 }
1061 
incrdecr(Node ** a,int n)1062 Cell *incrdecr(Node **a, int n)		/* a[0]++, etc. */
1063 {
1064 	Cell *x, *z;
1065 	int k;
1066 	Awkfloat xf;
1067 
1068 	x = execute(a[0]);
1069 	xf = getfval(x);
1070 	k = (n == PREINCR || n == POSTINCR) ? 1 : -1;
1071 	if (n == PREINCR || n == PREDECR) {
1072 		setfval(x, xf + k);
1073 		return(x);
1074 	}
1075 	z = gettemp();
1076 	setfval(z, xf);
1077 	setfval(x, xf + k);
1078 	tempfree(x);
1079 	return(z);
1080 }
1081 
assign(Node ** a,int n)1082 Cell *assign(Node **a, int n)	/* a[0] = a[1], a[0] += a[1], etc. */
1083 {		/* this is subtle; don't muck with it. */
1084 	Cell *x, *y;
1085 	Awkfloat xf, yf;
1086 	double v;
1087 
1088 	y = execute(a[1]);
1089 	x = execute(a[0]);
1090 	if (n == ASSIGN) {	/* ordinary assignment */
1091 		if (x == y && !(x->tval & (FLD|REC)))	/* self-assignment: */
1092 			;		/* leave alone unless it's a field */
1093 		else if ((y->tval & (STR|NUM)) == (STR|NUM)) {
1094 			setsval(x, getsval(y));
1095 			x->fval = getfval(y);
1096 			x->tval |= NUM;
1097 		}
1098 		else if (isstr(y))
1099 			setsval(x, getsval(y));
1100 		else if (isnum(y))
1101 			setfval(x, getfval(y));
1102 		else
1103 			funnyvar(y, "read value of");
1104 		tempfree(y);
1105 		return(x);
1106 	}
1107 	xf = getfval(x);
1108 	yf = getfval(y);
1109 	switch (n) {
1110 	case ADDEQ:
1111 		xf += yf;
1112 		break;
1113 	case SUBEQ:
1114 		xf -= yf;
1115 		break;
1116 	case MULTEQ:
1117 		xf *= yf;
1118 		break;
1119 	case DIVEQ:
1120 		if (yf == 0)
1121 			FATAL("division by zero in /=");
1122 		xf /= yf;
1123 		break;
1124 	case MODEQ:
1125 		if (yf == 0)
1126 			FATAL("division by zero in %%=");
1127 		modf(xf/yf, &v);
1128 		xf = xf - yf * v;
1129 		break;
1130 	case POWEQ:
1131 		if (yf >= 0 && modf(yf, &v) == 0.0)	/* pos integer exponent */
1132 			xf = ipow(xf, (int) yf);
1133 		else
1134 			xf = errcheck(pow(xf, yf), "pow");
1135 		break;
1136 	default:
1137 		FATAL("illegal assignment operator %d", n);
1138 		break;
1139 	}
1140 	tempfree(y);
1141 	setfval(x, xf);
1142 	return(x);
1143 }
1144 
cat(Node ** a,int q)1145 Cell *cat(Node **a, int q)	/* a[0] cat a[1] */
1146 {
1147 	Cell *x, *y, *z;
1148 	int n1, n2;
1149 	char *s;
1150 
1151 	x = execute(a[0]);
1152 	y = execute(a[1]);
1153 	getsval(x);
1154 	getsval(y);
1155 	n1 = strlen(x->sval);
1156 	n2 = strlen(y->sval);
1157 	s = (char *) malloc(n1 + n2 + 1);
1158 	if (s == NULL)
1159 		FATAL("out of space concatenating %.15s... and %.15s...",
1160 			x->sval, y->sval);
1161 	strcpy(s, x->sval);
1162 	strcpy(s+n1, y->sval);
1163 	tempfree(x);
1164 	tempfree(y);
1165 	z = gettemp();
1166 	z->sval = s;
1167 	z->tval = STR;
1168 	return(z);
1169 }
1170 
pastat(Node ** a,int n)1171 Cell *pastat(Node **a, int n)	/* a[0] { a[1] } */
1172 {
1173 	Cell *x;
1174 
1175 	if (a[0] == 0)
1176 		x = execute(a[1]);
1177 	else {
1178 		x = execute(a[0]);
1179 		if (istrue(x)) {
1180 			tempfree(x);
1181 			x = execute(a[1]);
1182 		}
1183 	}
1184 	return x;
1185 }
1186 
dopa2(Node ** a,int n)1187 Cell *dopa2(Node **a, int n)	/* a[0], a[1] { a[2] } */
1188 {
1189 	Cell *x;
1190 	int pair;
1191 
1192 	pair = ptoi(a[3]);
1193 	if (pairstack[pair] == 0) {
1194 		x = execute(a[0]);
1195 		if (istrue(x))
1196 			pairstack[pair] = 1;
1197 		tempfree(x);
1198 	}
1199 	if (pairstack[pair] == 1) {
1200 		x = execute(a[1]);
1201 		if (istrue(x))
1202 			pairstack[pair] = 0;
1203 		tempfree(x);
1204 		x = execute(a[2]);
1205 		return(x);
1206 	}
1207 	return(False);
1208 }
1209 
split(Node ** a,int nnn)1210 Cell *split(Node **a, int nnn)	/* split(a[0], a[1], a[2]); a[3] is type */
1211 {
1212 	Cell *x = 0, *y, *ap;
1213 	char *s, *origs;
1214 	int sep;
1215 	char *t, temp, num[50], *fs = 0;
1216 	int n, tempstat, arg3type;
1217 
1218 	y = execute(a[0]);	/* source string */
1219 	origs = s = strdup(getsval(y));
1220 	arg3type = ptoi(a[3]);
1221 	if (a[2] == 0)		/* fs string */
1222 		fs = *FS;
1223 	else if (arg3type == STRING) {	/* split(str,arr,"string") */
1224 		x = execute(a[2]);
1225 		fs = getsval(x);
1226 	} else if (arg3type == REGEXPR)
1227 		fs = "(regexpr)";	/* split(str,arr,/regexpr/) */
1228 	else
1229 		FATAL("illegal type of split");
1230 	sep = *fs;
1231 	ap = execute(a[1]);	/* array name */
1232 	freesymtab(ap);
1233 	   dprintf( ("split: s=|%s|, a=%s, sep=|%s|\n", s, NN(ap->nval), fs) );
1234 	ap->tval &= ~STR;
1235 	ap->tval |= ARR;
1236 	ap->sval = (char *) makesymtab(NSYMTAB);
1237 
1238 	n = 0;
1239         if (arg3type == REGEXPR && strlen((char*)((fa*)a[2])->restr) == 0) {
1240 		/* split(s, a, //); have to arrange that it looks like empty sep */
1241 		arg3type = 0;
1242 		fs = "";
1243 		sep = 0;
1244 	}
1245 	if (*s != '\0' && (strlen(fs) > 1 || arg3type == REGEXPR)) {	/* reg expr */
1246 		fa *pfa;
1247 		if (arg3type == REGEXPR) {	/* it's ready already */
1248 			pfa = (fa *) a[2];
1249 		} else {
1250 			pfa = makedfa(fs, 1);
1251 		}
1252 		if (nematch(pfa,s)) {
1253 			tempstat = pfa->initstat;
1254 			pfa->initstat = 2;
1255 			do {
1256 				n++;
1257 				sprintf(num, "%d", n);
1258 				temp = *patbeg;
1259 				*patbeg = '\0';
1260 				if (is_number(s))
1261 					setsymtab(num, s, atof(s), STR|NUM, (Array *) ap->sval);
1262 				else
1263 					setsymtab(num, s, 0.0, STR, (Array *) ap->sval);
1264 				*patbeg = temp;
1265 				s = patbeg + patlen;
1266 				if (*(patbeg+patlen-1) == 0 || *s == 0) {
1267 					n++;
1268 					sprintf(num, "%d", n);
1269 					setsymtab(num, "", 0.0, STR, (Array *) ap->sval);
1270 					pfa->initstat = tempstat;
1271 					goto spdone;
1272 				}
1273 			} while (nematch(pfa,s));
1274 			pfa->initstat = tempstat; 	/* bwk: has to be here to reset */
1275 							/* cf gsub and refldbld */
1276 		}
1277 		n++;
1278 		sprintf(num, "%d", n);
1279 		if (is_number(s))
1280 			setsymtab(num, s, atof(s), STR|NUM, (Array *) ap->sval);
1281 		else
1282 			setsymtab(num, s, 0.0, STR, (Array *) ap->sval);
1283   spdone:
1284 		pfa = NULL;
1285 	} else if (sep == ' ') {
1286 		for (n = 0; ; ) {
1287 			while (*s == ' ' || *s == '\t' || *s == '\n')
1288 				s++;
1289 			if (*s == 0)
1290 				break;
1291 			n++;
1292 			t = s;
1293 			do
1294 				s++;
1295 			while (*s!=' ' && *s!='\t' && *s!='\n' && *s!='\0');
1296 			temp = *s;
1297 			*s = '\0';
1298 			sprintf(num, "%d", n);
1299 			if (is_number(t))
1300 				setsymtab(num, t, atof(t), STR|NUM, (Array *) ap->sval);
1301 			else
1302 				setsymtab(num, t, 0.0, STR, (Array *) ap->sval);
1303 			*s = temp;
1304 			if (*s != 0)
1305 				s++;
1306 		}
1307 	} else if (sep == 0) {	/* new: split(s, a, "") => 1 char/elem */
1308 		for (n = 0; *s != 0; s++) {
1309 			char buf[2];
1310 			n++;
1311 			sprintf(num, "%d", n);
1312 			buf[0] = *s;
1313 			buf[1] = 0;
1314 			if (isdigit((uschar)buf[0]))
1315 				setsymtab(num, buf, atof(buf), STR|NUM, (Array *) ap->sval);
1316 			else
1317 				setsymtab(num, buf, 0.0, STR, (Array *) ap->sval);
1318 		}
1319 	} else if (*s != 0) {
1320 		for (;;) {
1321 			n++;
1322 			t = s;
1323 			while (*s != sep && *s != '\n' && *s != '\0')
1324 				s++;
1325 			temp = *s;
1326 			*s = '\0';
1327 			sprintf(num, "%d", n);
1328 			if (is_number(t))
1329 				setsymtab(num, t, atof(t), STR|NUM, (Array *) ap->sval);
1330 			else
1331 				setsymtab(num, t, 0.0, STR, (Array *) ap->sval);
1332 			*s = temp;
1333 			if (*s++ == 0)
1334 				break;
1335 		}
1336 	}
1337 	tempfree(ap);
1338 	tempfree(y);
1339 	free(origs);
1340 	if (a[2] != 0 && arg3type == STRING) {
1341 		tempfree(x);
1342 	}
1343 	x = gettemp();
1344 	x->tval = NUM;
1345 	x->fval = n;
1346 	return(x);
1347 }
1348 
condexpr(Node ** a,int n)1349 Cell *condexpr(Node **a, int n)	/* a[0] ? a[1] : a[2] */
1350 {
1351 	Cell *x;
1352 
1353 	x = execute(a[0]);
1354 	if (istrue(x)) {
1355 		tempfree(x);
1356 		x = execute(a[1]);
1357 	} else {
1358 		tempfree(x);
1359 		x = execute(a[2]);
1360 	}
1361 	return(x);
1362 }
1363 
ifstat(Node ** a,int n)1364 Cell *ifstat(Node **a, int n)	/* if (a[0]) a[1]; else a[2] */
1365 {
1366 	Cell *x;
1367 
1368 	x = execute(a[0]);
1369 	if (istrue(x)) {
1370 		tempfree(x);
1371 		x = execute(a[1]);
1372 	} else if (a[2] != 0) {
1373 		tempfree(x);
1374 		x = execute(a[2]);
1375 	}
1376 	return(x);
1377 }
1378 
whilestat(Node ** a,int n)1379 Cell *whilestat(Node **a, int n)	/* while (a[0]) a[1] */
1380 {
1381 	Cell *x;
1382 
1383 	for (;;) {
1384 		x = execute(a[0]);
1385 		if (!istrue(x))
1386 			return(x);
1387 		tempfree(x);
1388 		x = execute(a[1]);
1389 		if (isbreak(x)) {
1390 			x = True;
1391 			return(x);
1392 		}
1393 		if (isnext(x) || isexit(x) || isret(x))
1394 			return(x);
1395 		tempfree(x);
1396 	}
1397 }
1398 
dostat(Node ** a,int n)1399 Cell *dostat(Node **a, int n)	/* do a[0]; while(a[1]) */
1400 {
1401 	Cell *x;
1402 
1403 	for (;;) {
1404 		x = execute(a[0]);
1405 		if (isbreak(x))
1406 			return True;
1407 		if (isnext(x) || isexit(x) || isret(x))
1408 			return(x);
1409 		tempfree(x);
1410 		x = execute(a[1]);
1411 		if (!istrue(x))
1412 			return(x);
1413 		tempfree(x);
1414 	}
1415 }
1416 
forstat(Node ** a,int n)1417 Cell *forstat(Node **a, int n)	/* for (a[0]; a[1]; a[2]) a[3] */
1418 {
1419 	Cell *x;
1420 
1421 	x = execute(a[0]);
1422 	tempfree(x);
1423 	for (;;) {
1424 		if (a[1]!=0) {
1425 			x = execute(a[1]);
1426 			if (!istrue(x)) return(x);
1427 			else tempfree(x);
1428 		}
1429 		x = execute(a[3]);
1430 		if (isbreak(x))		/* turn off break */
1431 			return True;
1432 		if (isnext(x) || isexit(x) || isret(x))
1433 			return(x);
1434 		tempfree(x);
1435 		x = execute(a[2]);
1436 		tempfree(x);
1437 	}
1438 }
1439 
instat(Node ** a,int n)1440 Cell *instat(Node **a, int n)	/* for (a[0] in a[1]) a[2] */
1441 {
1442 	Cell *x, *vp, *arrayp, *cp, *ncp;
1443 	Array *tp;
1444 	int i;
1445 
1446 	vp = execute(a[0]);
1447 	arrayp = execute(a[1]);
1448 	if (!isarr(arrayp)) {
1449 		return True;
1450 	}
1451 	tp = (Array *) arrayp->sval;
1452 	tempfree(arrayp);
1453 	for (i = 0; i < tp->size; i++) {	/* this routine knows too much */
1454 		for (cp = tp->tab[i]; cp != NULL; cp = ncp) {
1455 			setsval(vp, cp->nval);
1456 			ncp = cp->cnext;
1457 			x = execute(a[2]);
1458 			if (isbreak(x)) {
1459 				tempfree(vp);
1460 				return True;
1461 			}
1462 			if (isnext(x) || isexit(x) || isret(x)) {
1463 				tempfree(vp);
1464 				return(x);
1465 			}
1466 			tempfree(x);
1467 		}
1468 	}
1469 	return True;
1470 }
1471 
bltin(Node ** a,int n)1472 Cell *bltin(Node **a, int n)	/* builtin functions. a[0] is type, a[1] is arg list */
1473 {
1474 	Cell *x, *y;
1475 	Awkfloat u;
1476 	int t;
1477 	Awkfloat tmp;
1478 	char *p, *buf;
1479 	Node *nextarg;
1480 	FILE *fp;
1481 	void flush_all(void);
1482 
1483 	t = ptoi(a[0]);
1484 	x = execute(a[1]);
1485 	nextarg = a[1]->nnext;
1486 	switch (t) {
1487 	case FLENGTH:
1488 		if (isarr(x))
1489 			u = ((Array *) x->sval)->nelem;	/* GROT.  should be function*/
1490 		else
1491 			u = strlen(getsval(x));
1492 		break;
1493 	case FLOG:
1494 		u = errcheck(log(getfval(x)), "log"); break;
1495 	case FINT:
1496 		modf(getfval(x), &u); break;
1497 	case FEXP:
1498 		u = errcheck(exp(getfval(x)), "exp"); break;
1499 	case FSQRT:
1500 		u = errcheck(sqrt(getfval(x)), "sqrt"); break;
1501 	case FSIN:
1502 		u = sin(getfval(x)); break;
1503 	case FCOS:
1504 		u = cos(getfval(x)); break;
1505 	case FATAN:
1506 		if (nextarg == 0) {
1507 			WARNING("atan2 requires two arguments; returning 1.0");
1508 			u = 1.0;
1509 		} else {
1510 			y = execute(a[1]->nnext);
1511 			u = atan2(getfval(x), getfval(y));
1512 			tempfree(y);
1513 			nextarg = nextarg->nnext;
1514 		}
1515 		break;
1516 	case FSYSTEM:
1517 		fflush(stdout);		/* in case something is buffered already */
1518 		u = (Awkfloat) system(getsval(x)) / 256;   /* 256 is unix-dep */
1519 		break;
1520 	case FRAND:
1521 		/* in principle, rand() returns something in 0..RAND_MAX */
1522 		u = (Awkfloat) (rand() % RAND_MAX) / RAND_MAX;
1523 		break;
1524 	case FSRAND:
1525 		if (isrec(x))	/* no argument provided */
1526 			u = time((time_t *)0);
1527 		else
1528 			u = getfval(x);
1529 		tmp = u;
1530 		srand((unsigned int) u);
1531 		u = srand_seed;
1532 		srand_seed = tmp;
1533 		break;
1534 	case FTOUPPER:
1535 	case FTOLOWER:
1536 		buf = tostring(getsval(x));
1537 		if (t == FTOUPPER) {
1538 			for (p = buf; *p; p++)
1539 				if (islower((uschar) *p))
1540 					*p = toupper((uschar)*p);
1541 		} else {
1542 			for (p = buf; *p; p++)
1543 				if (isupper((uschar) *p))
1544 					*p = tolower((uschar)*p);
1545 		}
1546 		tempfree(x);
1547 		x = gettemp();
1548 		setsval(x, buf);
1549 		free(buf);
1550 		return x;
1551 	case FFLUSH:
1552 		if (isrec(x) || strlen(getsval(x)) == 0) {
1553 			flush_all();	/* fflush() or fflush("") -> all */
1554 			u = 0;
1555 		} else if ((fp = openfile(FFLUSH, getsval(x))) == NULL)
1556 			u = EOF;
1557 		else
1558 			u = fflush(fp);
1559 		break;
1560 	default:	/* can't happen */
1561 		FATAL("illegal function type %d", t);
1562 		break;
1563 	}
1564 	tempfree(x);
1565 	x = gettemp();
1566 	setfval(x, u);
1567 	if (nextarg != 0) {
1568 		WARNING("warning: function has too many arguments");
1569 		for ( ; nextarg; nextarg = nextarg->nnext)
1570 			execute(nextarg);
1571 	}
1572 	return(x);
1573 }
1574 
printstat(Node ** a,int n)1575 Cell *printstat(Node **a, int n)	/* print a[0] */
1576 {
1577 	Node *x;
1578 	Cell *y;
1579 	FILE *fp;
1580 
1581 	if (a[1] == 0)	/* a[1] is redirection operator, a[2] is file */
1582 		fp = stdout;
1583 	else
1584 		fp = redirect(ptoi(a[1]), a[2]);
1585 	for (x = a[0]; x != NULL; x = x->nnext) {
1586 		y = execute(x);
1587 		fputs(getpssval(y), fp);
1588 		tempfree(y);
1589 		if (x->nnext == NULL)
1590 			fputs(*ORS, fp);
1591 		else
1592 			fputs(*OFS, fp);
1593 	}
1594 	if (a[1] != 0)
1595 		fflush(fp);
1596 	if (ferror(fp))
1597 		FATAL("write error on %s", filename(fp));
1598 	return(True);
1599 }
1600 
nullproc(Node ** a,int n)1601 Cell *nullproc(Node **a, int n)
1602 {
1603 	n = n;
1604 	a = a;
1605 	return 0;
1606 }
1607 
1608 
redirect(int a,Node * b)1609 FILE *redirect(int a, Node *b)	/* set up all i/o redirections */
1610 {
1611 	FILE *fp;
1612 	Cell *x;
1613 	char *fname;
1614 
1615 	x = execute(b);
1616 	fname = getsval(x);
1617 	fp = openfile(a, fname);
1618 	if (fp == NULL)
1619 		FATAL("can't open file %s", fname);
1620 	tempfree(x);
1621 	return fp;
1622 }
1623 
1624 struct files {
1625 	FILE	*fp;
1626 	const char	*fname;
1627 	int	mode;	/* '|', 'a', 'w' => LE/LT, GT */
1628 } *files;
1629 
1630 int nfiles;
1631 
stdinit(void)1632 void stdinit(void)	/* in case stdin, etc., are not constants */
1633 {
1634 	nfiles = FOPEN_MAX;
1635 	files = calloc(nfiles, sizeof(*files));
1636 	if (files == NULL)
1637 		FATAL("can't allocate file memory for %u files", nfiles);
1638         files[0].fp = stdin;
1639 	files[0].fname = "/dev/stdin";
1640 	files[0].mode = LT;
1641         files[1].fp = stdout;
1642 	files[1].fname = "/dev/stdout";
1643 	files[1].mode = GT;
1644         files[2].fp = stderr;
1645 	files[2].fname = "/dev/stderr";
1646 	files[2].mode = GT;
1647 }
1648 
openfile(int a,const char * us)1649 FILE *openfile(int a, const char *us)
1650 {
1651 	const char *s = us;
1652 	int i, m;
1653 	FILE *fp = 0;
1654 
1655 	if (*s == '\0')
1656 		FATAL("null file name in print or getline");
1657 	for (i=0; i < nfiles; i++)
1658 		if (files[i].fname && strcmp(s, files[i].fname) == 0) {
1659 			if (a == files[i].mode || (a==APPEND && files[i].mode==GT))
1660 				return files[i].fp;
1661 			if (a == FFLUSH)
1662 				return files[i].fp;
1663 		}
1664 	if (a == FFLUSH)	/* didn't find it, so don't create it! */
1665 		return NULL;
1666 
1667 	for (i=0; i < nfiles; i++)
1668 		if (files[i].fp == 0)
1669 			break;
1670 	if (i >= nfiles) {
1671 		struct files *nf;
1672 		int nnf = nfiles + FOPEN_MAX;
1673 		nf = realloc(files, nnf * sizeof(*nf));
1674 		if (nf == NULL)
1675 			FATAL("cannot grow files for %s and %d files", s, nnf);
1676 		memset(&nf[nfiles], 0, FOPEN_MAX * sizeof(*nf));
1677 		nfiles = nnf;
1678 		files = nf;
1679 	}
1680 	fflush(stdout);	/* force a semblance of order */
1681 	m = a;
1682 	if (a == GT) {
1683 		fp = fopen(s, "w");
1684 	} else if (a == APPEND) {
1685 		fp = fopen(s, "a");
1686 		m = GT;	/* so can mix > and >> */
1687 	} else if (a == '|') {	/* output pipe */
1688 		fp = popen(s, "w");
1689 	} else if (a == LE) {	/* input pipe */
1690 		fp = popen(s, "r");
1691 	} else if (a == LT) {	/* getline <file */
1692 		fp = strcmp(s, "-") == 0 ? stdin : fopen(s, "r");	/* "-" is stdin */
1693 	} else	/* can't happen */
1694 		FATAL("illegal redirection %d", a);
1695 	if (fp != NULL) {
1696 		files[i].fname = tostring(s);
1697 		files[i].fp = fp;
1698 		files[i].mode = m;
1699 	}
1700 	return fp;
1701 }
1702 
filename(FILE * fp)1703 const char *filename(FILE *fp)
1704 {
1705 	int i;
1706 
1707 	for (i = 0; i < nfiles; i++)
1708 		if (fp == files[i].fp)
1709 			return files[i].fname;
1710 	return "???";
1711 }
1712 
closefile(Node ** a,int n)1713 Cell *closefile(Node **a, int n)
1714 {
1715 	Cell *x;
1716 	int i, stat;
1717 
1718 	n = n;
1719 	x = execute(a[0]);
1720 	getsval(x);
1721 	stat = -1;
1722 	for (i = 0; i < nfiles; i++) {
1723 		if (files[i].fname && strcmp(x->sval, files[i].fname) == 0) {
1724 			if (ferror(files[i].fp))
1725 				WARNING( "i/o error occurred on %s", files[i].fname );
1726 			if (files[i].mode == '|' || files[i].mode == LE)
1727 				stat = pclose(files[i].fp);
1728 			else
1729 				stat = fclose(files[i].fp);
1730 			if (stat == EOF)
1731 				WARNING( "i/o error occurred closing %s", files[i].fname );
1732 			if (i > 2)	/* don't do /dev/std... */
1733 				xfree(files[i].fname);
1734 			files[i].fname = NULL;	/* watch out for ref thru this */
1735 			files[i].fp = NULL;
1736 		}
1737 	}
1738 	tempfree(x);
1739 	x = gettemp();
1740 	setfval(x, (Awkfloat) stat);
1741 	return(x);
1742 }
1743 
closeall(void)1744 void closeall(void)
1745 {
1746 	int i, stat;
1747 
1748 	for (i = 0; i < FOPEN_MAX; i++) {
1749 		if (files[i].fp) {
1750 			if (ferror(files[i].fp))
1751 				WARNING( "i/o error occurred on %s", files[i].fname );
1752 			if (files[i].mode == '|' || files[i].mode == LE)
1753 				stat = pclose(files[i].fp);
1754 			else
1755 				stat = fclose(files[i].fp);
1756 			if (stat == EOF)
1757 				WARNING( "i/o error occurred while closing %s", files[i].fname );
1758 		}
1759 	}
1760 }
1761 
flush_all(void)1762 void flush_all(void)
1763 {
1764 	int i;
1765 
1766 	for (i = 0; i < nfiles; i++)
1767 		if (files[i].fp)
1768 			fflush(files[i].fp);
1769 }
1770 
1771 void backsub(char **pb_ptr, char **sptr_ptr);
1772 
sub(Node ** a,int nnn)1773 Cell *sub(Node **a, int nnn)	/* substitute command */
1774 {
1775 	char *sptr, *pb, *q;
1776 	Cell *x, *y, *result;
1777 	char *t, *buf;
1778 	fa *pfa;
1779 	int bufsz = recsize;
1780 
1781 	if ((buf = (char *) malloc(bufsz)) == NULL)
1782 		FATAL("out of memory in sub");
1783 	x = execute(a[3]);	/* target string */
1784 	t = getsval(x);
1785 	if (a[0] == 0)		/* 0 => a[1] is already-compiled regexpr */
1786 		pfa = (fa *) a[1];	/* regular expression */
1787 	else {
1788 		y = execute(a[1]);
1789 		pfa = makedfa(getsval(y), 1);
1790 		tempfree(y);
1791 	}
1792 	y = execute(a[2]);	/* replacement string */
1793 	result = False;
1794 	if (pmatch(pfa, t)) {
1795 		sptr = t;
1796 		adjbuf(&buf, &bufsz, 1+patbeg-sptr, recsize, 0, "sub");
1797 		pb = buf;
1798 		while (sptr < patbeg)
1799 			*pb++ = *sptr++;
1800 		sptr = getsval(y);
1801 		while (*sptr != 0) {
1802 			adjbuf(&buf, &bufsz, 5+pb-buf, recsize, &pb, "sub");
1803 			if (*sptr == '\\') {
1804 				backsub(&pb, &sptr);
1805 			} else if (*sptr == '&') {
1806 				sptr++;
1807 				adjbuf(&buf, &bufsz, 1+patlen+pb-buf, recsize, &pb, "sub");
1808 				for (q = patbeg; q < patbeg+patlen; )
1809 					*pb++ = *q++;
1810 			} else
1811 				*pb++ = *sptr++;
1812 		}
1813 		*pb = '\0';
1814 		if (pb > buf + bufsz)
1815 			FATAL("sub result1 %.30s too big; can't happen", buf);
1816 		sptr = patbeg + patlen;
1817 		if ((patlen == 0 && *patbeg) || (patlen && *(sptr-1))) {
1818 			adjbuf(&buf, &bufsz, 1+strlen(sptr)+pb-buf, 0, &pb, "sub");
1819 			while ((*pb++ = *sptr++) != 0)
1820 				;
1821 		}
1822 		if (pb > buf + bufsz)
1823 			FATAL("sub result2 %.30s too big; can't happen", buf);
1824 		setsval(x, buf);	/* BUG: should be able to avoid copy */
1825 		result = True;;
1826 	}
1827 	tempfree(x);
1828 	tempfree(y);
1829 	free(buf);
1830 	return result;
1831 }
1832 
gsub(Node ** a,int nnn)1833 Cell *gsub(Node **a, int nnn)	/* global substitute */
1834 {
1835 	Cell *x, *y;
1836 	char *rptr, *sptr, *t, *pb, *q;
1837 	char *buf;
1838 	fa *pfa;
1839 	int mflag, tempstat, num;
1840 	int bufsz = recsize;
1841 
1842 	if ((buf = (char *) malloc(bufsz)) == NULL)
1843 		FATAL("out of memory in gsub");
1844 	mflag = 0;	/* if mflag == 0, can replace empty string */
1845 	num = 0;
1846 	x = execute(a[3]);	/* target string */
1847 	t = getsval(x);
1848 	if (a[0] == 0)		/* 0 => a[1] is already-compiled regexpr */
1849 		pfa = (fa *) a[1];	/* regular expression */
1850 	else {
1851 		y = execute(a[1]);
1852 		pfa = makedfa(getsval(y), 1);
1853 		tempfree(y);
1854 	}
1855 	y = execute(a[2]);	/* replacement string */
1856 	if (pmatch(pfa, t)) {
1857 		tempstat = pfa->initstat;
1858 		pfa->initstat = 2;
1859 		pb = buf;
1860 		rptr = getsval(y);
1861 		do {
1862 			if (patlen == 0 && *patbeg != 0) {	/* matched empty string */
1863 				if (mflag == 0) {	/* can replace empty */
1864 					num++;
1865 					sptr = rptr;
1866 					while (*sptr != 0) {
1867 						adjbuf(&buf, &bufsz, 5+pb-buf, recsize, &pb, "gsub");
1868 						if (*sptr == '\\') {
1869 							backsub(&pb, &sptr);
1870 						} else if (*sptr == '&') {
1871 							sptr++;
1872 							adjbuf(&buf, &bufsz, 1+patlen+pb-buf, recsize, &pb, "gsub");
1873 							for (q = patbeg; q < patbeg+patlen; )
1874 								*pb++ = *q++;
1875 						} else
1876 							*pb++ = *sptr++;
1877 					}
1878 				}
1879 				if (*t == 0)	/* at end */
1880 					goto done;
1881 				adjbuf(&buf, &bufsz, 2+pb-buf, recsize, &pb, "gsub");
1882 				*pb++ = *t++;
1883 				if (pb > buf + bufsz)	/* BUG: not sure of this test */
1884 					FATAL("gsub result0 %.30s too big; can't happen", buf);
1885 				mflag = 0;
1886 			}
1887 			else {	/* matched nonempty string */
1888 				num++;
1889 				sptr = t;
1890 				adjbuf(&buf, &bufsz, 1+(patbeg-sptr)+pb-buf, recsize, &pb, "gsub");
1891 				while (sptr < patbeg)
1892 					*pb++ = *sptr++;
1893 				sptr = rptr;
1894 				while (*sptr != 0) {
1895 					adjbuf(&buf, &bufsz, 5+pb-buf, recsize, &pb, "gsub");
1896 					if (*sptr == '\\') {
1897 						backsub(&pb, &sptr);
1898 					} else if (*sptr == '&') {
1899 						sptr++;
1900 						adjbuf(&buf, &bufsz, 1+patlen+pb-buf, recsize, &pb, "gsub");
1901 						for (q = patbeg; q < patbeg+patlen; )
1902 							*pb++ = *q++;
1903 					} else
1904 						*pb++ = *sptr++;
1905 				}
1906 				t = patbeg + patlen;
1907 				if (patlen == 0 || *t == 0 || *(t-1) == 0)
1908 					goto done;
1909 				if (pb > buf + bufsz)
1910 					FATAL("gsub result1 %.30s too big; can't happen", buf);
1911 				mflag = 1;
1912 			}
1913 		} while (pmatch(pfa,t));
1914 		sptr = t;
1915 		adjbuf(&buf, &bufsz, 1+strlen(sptr)+pb-buf, 0, &pb, "gsub");
1916 		while ((*pb++ = *sptr++) != 0)
1917 			;
1918 	done:	if (pb < buf + bufsz)
1919 			*pb = '\0';
1920 		else if (*(pb-1) != '\0')
1921 			FATAL("gsub result2 %.30s truncated; can't happen", buf);
1922 		setsval(x, buf);	/* BUG: should be able to avoid copy + free */
1923 		pfa->initstat = tempstat;
1924 	}
1925 	tempfree(x);
1926 	tempfree(y);
1927 	x = gettemp();
1928 	x->tval = NUM;
1929 	x->fval = num;
1930 	free(buf);
1931 	return(x);
1932 }
1933 
backsub(char ** pb_ptr,char ** sptr_ptr)1934 void backsub(char **pb_ptr, char **sptr_ptr)	/* handle \\& variations */
1935 {						/* sptr[0] == '\\' */
1936 	char *pb = *pb_ptr, *sptr = *sptr_ptr;
1937 
1938 	if (sptr[1] == '\\') {
1939 		if (sptr[2] == '\\' && sptr[3] == '&') { /* \\\& -> \& */
1940 			*pb++ = '\\';
1941 			*pb++ = '&';
1942 			sptr += 4;
1943 		} else if (sptr[2] == '&') {	/* \\& -> \ + matched */
1944 			*pb++ = '\\';
1945 			sptr += 2;
1946 		} else {			/* \\x -> \\x */
1947 			*pb++ = *sptr++;
1948 			*pb++ = *sptr++;
1949 		}
1950 	} else if (sptr[1] == '&') {	/* literal & */
1951 		sptr++;
1952 		*pb++ = *sptr++;
1953 	} else				/* literal \ */
1954 		*pb++ = *sptr++;
1955 
1956 	*pb_ptr = pb;
1957 	*sptr_ptr = sptr;
1958 }
1959