xref: /openbsd/bin/ksh/expr.c (revision 0ac57757)
1 /*	$OpenBSD: expr.c,v 1.34 2019/02/20 23:59:17 schwarze Exp $	*/
2 
3 /*
4  * Korn expression evaluation
5  */
6 /*
7  * todo: better error handling: if in builtin, should be builtin error, etc.
8  */
9 
10 #include <ctype.h>
11 #include <limits.h>
12 #include <string.h>
13 
14 #include "sh.h"
15 
16 /* The order of these enums is constrained by the order of opinfo[] */
17 enum token {
18 	/* some (long) unary operators */
19 	O_PLUSPLUS = 0, O_MINUSMINUS,
20 	/* binary operators */
21 	O_EQ, O_NE,
22 	/* assignments are assumed to be in range O_ASN .. O_BORASN */
23 	O_ASN, O_TIMESASN, O_DIVASN, O_MODASN, O_PLUSASN, O_MINUSASN,
24 	O_LSHIFTASN, O_RSHIFTASN, O_BANDASN, O_BXORASN, O_BORASN,
25 	O_LSHIFT, O_RSHIFT,
26 	O_LE, O_GE, O_LT, O_GT,
27 	O_LAND,
28 	O_LOR,
29 	O_TIMES, O_DIV, O_MOD,
30 	O_PLUS, O_MINUS,
31 	O_BAND,
32 	O_BXOR,
33 	O_BOR,
34 	O_TERN,
35 	O_COMMA,
36 	/* things after this aren't used as binary operators */
37 	/* unary that are not also binaries */
38 	O_BNOT, O_LNOT,
39 	/* misc */
40 	OPEN_PAREN, CLOSE_PAREN, CTERN,
41 	/* things that don't appear in the opinfo[] table */
42 	VAR, LIT, END, BAD
43 };
44 #define IS_BINOP(op) (((int)op) >= (int)O_EQ && ((int)op) <= (int)O_COMMA)
45 #define IS_ASSIGNOP(op)	((int)(op) >= (int)O_ASN && (int)(op) <= (int)O_BORASN)
46 
47 enum prec {
48 	P_PRIMARY = 0,		/* VAR, LIT, (), ~ ! - + */
49 	P_MULT,			/* * / % */
50 	P_ADD,			/* + - */
51 	P_SHIFT,		/* << >> */
52 	P_RELATION,		/* < <= > >= */
53 	P_EQUALITY,		/* == != */
54 	P_BAND,			/* & */
55 	P_BXOR,			/* ^ */
56 	P_BOR,			/* | */
57 	P_LAND,			/* && */
58 	P_LOR,			/* || */
59 	P_TERN,			/* ?: */
60 	P_ASSIGN,		/* = *= /= %= += -= <<= >>= &= ^= |= */
61 	P_COMMA			/* , */
62 };
63 #define MAX_PREC	P_COMMA
64 
65 struct opinfo {
66 	char		name[4];
67 	int		len;	/* name length */
68 	enum prec	prec;	/* precedence: lower is higher */
69 };
70 
71 /* Tokens in this table must be ordered so the longest are first
72  * (eg, += before +).  If you change something, change the order
73  * of enum token too.
74  */
75 static const struct opinfo opinfo[] = {
76 	{ "++",	 2, P_PRIMARY },	/* before + */
77 	{ "--",	 2, P_PRIMARY },	/* before - */
78 	{ "==",	 2, P_EQUALITY },	/* before = */
79 	{ "!=",	 2, P_EQUALITY },	/* before ! */
80 	{ "=",	 1, P_ASSIGN },		/* keep assigns in a block */
81 	{ "*=",	 2, P_ASSIGN },
82 	{ "/=",	 2, P_ASSIGN },
83 	{ "%=",	 2, P_ASSIGN },
84 	{ "+=",	 2, P_ASSIGN },
85 	{ "-=",	 2, P_ASSIGN },
86 	{ "<<=", 3, P_ASSIGN },
87 	{ ">>=", 3, P_ASSIGN },
88 	{ "&=",	 2, P_ASSIGN },
89 	{ "^=",	 2, P_ASSIGN },
90 	{ "|=",	 2, P_ASSIGN },
91 	{ "<<",	 2, P_SHIFT },
92 	{ ">>",	 2, P_SHIFT },
93 	{ "<=",	 2, P_RELATION },
94 	{ ">=",	 2, P_RELATION },
95 	{ "<",	 1, P_RELATION },
96 	{ ">",	 1, P_RELATION },
97 	{ "&&",	 2, P_LAND },
98 	{ "||",	 2, P_LOR },
99 	{ "*",	 1, P_MULT },
100 	{ "/",	 1, P_MULT },
101 	{ "%",	 1, P_MULT },
102 	{ "+",	 1, P_ADD },
103 	{ "-",	 1, P_ADD },
104 	{ "&",	 1, P_BAND },
105 	{ "^",	 1, P_BXOR },
106 	{ "|",	 1, P_BOR },
107 	{ "?",	 1, P_TERN },
108 	{ ",",	 1, P_COMMA },
109 	{ "~",	 1, P_PRIMARY },
110 	{ "!",	 1, P_PRIMARY },
111 	{ "(",	 1, P_PRIMARY },
112 	{ ")",	 1, P_PRIMARY },
113 	{ ":",	 1, P_PRIMARY },
114 	{ "",	 0, P_PRIMARY } /* end of table */
115 };
116 
117 
118 typedef struct expr_state Expr_state;
119 struct expr_state {
120 	const char *expression;		/* expression being evaluated */
121 	const char *tokp;		/* lexical position */
122 	enum token  tok;		/* token from token() */
123 	int	    noassign;		/* don't do assigns (for ?:,&&,||) */
124 	bool	    arith;		/* true if evaluating an $(())
125 					 * expression
126 					 */
127 	struct tbl *val;		/* value from token() */
128 	struct tbl *evaling;		/* variable that is being recursively
129 					 * expanded (EXPRINEVAL flag set)
130 					 */
131 };
132 
133 enum error_type {
134 	ET_UNEXPECTED, ET_BADLIT, ET_RECURSIVE,
135 	ET_LVALUE, ET_RDONLY, ET_STR
136 };
137 
138 static void	   evalerr(Expr_state *, enum error_type, const char *)
139 		    __attribute__((__noreturn__));
140 static struct tbl *evalexpr(Expr_state *, enum prec);
141 static void	   token(Expr_state *);
142 static struct tbl *do_ppmm(Expr_state *, enum token, struct tbl *, bool);
143 static void	   assign_check(Expr_state *, enum token, struct tbl *);
144 static struct tbl *tempvar(void);
145 static struct tbl *intvar(Expr_state *, struct tbl *);
146 
147 /*
148  * parse and evaluate expression
149  */
150 int
evaluate(const char * expr,int64_t * rval,int error_ok,bool arith)151 evaluate(const char *expr, int64_t *rval, int error_ok, bool arith)
152 {
153 	struct tbl v;
154 	int ret;
155 
156 	v.flag = DEFINED|INTEGER;
157 	v.type = 0;
158 	ret = v_evaluate(&v, expr, error_ok, arith);
159 	*rval = v.val.i;
160 	return ret;
161 }
162 
163 /*
164  * parse and evaluate expression, storing result in vp.
165  */
166 int
v_evaluate(struct tbl * vp,const char * expr,volatile int error_ok,bool arith)167 v_evaluate(struct tbl *vp, const char *expr, volatile int error_ok,
168     bool arith)
169 {
170 	struct tbl *v;
171 	Expr_state curstate;
172 	Expr_state * const es = &curstate;
173 	int save_disable_subst;
174 	int i;
175 
176 	/* save state to allow recursive calls */
177 	curstate.expression = curstate.tokp = expr;
178 	curstate.noassign = 0;
179 	curstate.arith = arith;
180 	curstate.evaling = NULL;
181 	curstate.val = NULL;
182 
183 	newenv(E_ERRH);
184 	save_disable_subst = disable_subst;
185 	i = sigsetjmp(genv->jbuf, 0);
186 	if (i) {
187 		disable_subst = save_disable_subst;
188 		/* Clear EXPRINEVAL in of any variables we were playing with */
189 		if (curstate.evaling)
190 			curstate.evaling->flag &= ~EXPRINEVAL;
191 		quitenv(NULL);
192 		if (i == LAEXPR) {
193 			if (error_ok == KSH_RETURN_ERROR)
194 				return 0;
195 			errorf(NULL);
196 		}
197 		unwind(i);
198 		/* NOTREACHED */
199 	}
200 
201 	token(es);
202 #if 1 /* ifdef-out to disallow empty expressions to be treated as 0 */
203 	if (es->tok == END) {
204 		es->tok = LIT;
205 		es->val = tempvar();
206 	}
207 #endif /* 0 */
208 	v = intvar(es, evalexpr(es, MAX_PREC));
209 
210 	if (es->tok != END)
211 		evalerr(es, ET_UNEXPECTED, NULL);
212 
213 	if (vp->flag & INTEGER)
214 		setint_v(vp, v, es->arith);
215 	else
216 		/* can fail if readonly */
217 		setstr(vp, str_val(v), error_ok);
218 
219 	quitenv(NULL);
220 
221 	return 1;
222 }
223 
224 static void
evalerr(Expr_state * es,enum error_type type,const char * str)225 evalerr(Expr_state *es, enum error_type type, const char *str)
226 {
227 	char tbuf[2];
228 	const char *s;
229 
230 	es->arith = false;
231 	switch (type) {
232 	case ET_UNEXPECTED:
233 		switch (es->tok) {
234 		case VAR:
235 			s = es->val->name;
236 			break;
237 		case LIT:
238 			s = str_val(es->val);
239 			break;
240 		case END:
241 			s = "end of expression";
242 			break;
243 		case BAD:
244 			tbuf[0] = *es->tokp;
245 			tbuf[1] = '\0';
246 			s = tbuf;
247 			break;
248 		default:
249 			s = opinfo[(int)es->tok].name;
250 		}
251 		warningf(true, "%s: unexpected `%s'", es->expression, s);
252 		break;
253 
254 	case ET_BADLIT:
255 		warningf(true, "%s: bad number `%s'", es->expression, str);
256 		break;
257 
258 	case ET_RECURSIVE:
259 		warningf(true, "%s: expression recurses on parameter `%s'",
260 		    es->expression, str);
261 		break;
262 
263 	case ET_LVALUE:
264 		warningf(true, "%s: %s requires lvalue",
265 		    es->expression, str);
266 		break;
267 
268 	case ET_RDONLY:
269 		warningf(true, "%s: %s applied to read only variable",
270 		    es->expression, str);
271 		break;
272 
273 	default: /* keep gcc happy */
274 	case ET_STR:
275 		warningf(true, "%s: %s", es->expression, str);
276 		break;
277 	}
278 	unwind(LAEXPR);
279 }
280 
281 static struct tbl *
evalexpr(Expr_state * es,enum prec prec)282 evalexpr(Expr_state *es, enum prec prec)
283 {
284 	struct tbl *vl, *vr = NULL, *vasn;
285 	enum token op;
286 	int64_t res = 0;
287 
288 	if (prec == P_PRIMARY) {
289 		op = es->tok;
290 		if (op == O_BNOT || op == O_LNOT || op == O_MINUS ||
291 		    op == O_PLUS) {
292 			token(es);
293 			vl = intvar(es, evalexpr(es, P_PRIMARY));
294 			if (op == O_BNOT)
295 				vl->val.i = ~vl->val.i;
296 			else if (op == O_LNOT)
297 				vl->val.i = !vl->val.i;
298 			else if (op == O_MINUS)
299 				vl->val.i = -vl->val.i;
300 			/* op == O_PLUS is a no-op */
301 		} else if (op == OPEN_PAREN) {
302 			token(es);
303 			vl = evalexpr(es, MAX_PREC);
304 			if (es->tok != CLOSE_PAREN)
305 				evalerr(es, ET_STR, "missing )");
306 			token(es);
307 		} else if (op == O_PLUSPLUS || op == O_MINUSMINUS) {
308 			token(es);
309 			vl = do_ppmm(es, op, es->val, true);
310 			token(es);
311 		} else if (op == VAR || op == LIT) {
312 			vl = es->val;
313 			token(es);
314 		} else {
315 			evalerr(es, ET_UNEXPECTED, NULL);
316 			/* NOTREACHED */
317 		}
318 		if (es->tok == O_PLUSPLUS || es->tok == O_MINUSMINUS) {
319 			vl = do_ppmm(es, es->tok, vl, false);
320 			token(es);
321 		}
322 		return vl;
323 	}
324 	vl = evalexpr(es, ((int) prec) - 1);
325 	for (op = es->tok; IS_BINOP(op) && opinfo[(int) op].prec == prec;
326 	    op = es->tok) {
327 		token(es);
328 		vasn = vl;
329 		if (op != O_ASN) /* vl may not have a value yet */
330 			vl = intvar(es, vl);
331 		if (IS_ASSIGNOP(op)) {
332 			assign_check(es, op, vasn);
333 			vr = intvar(es, evalexpr(es, P_ASSIGN));
334 		} else if (op != O_TERN && op != O_LAND && op != O_LOR)
335 			vr = intvar(es, evalexpr(es, ((int) prec) - 1));
336 		if ((op == O_DIV || op == O_MOD || op == O_DIVASN ||
337 		    op == O_MODASN) && vr->val.i == 0) {
338 			if (es->noassign)
339 				vr->val.i = 1;
340 			else
341 				evalerr(es, ET_STR, "zero divisor");
342 		}
343 		switch ((int) op) {
344 		case O_TIMES:
345 		case O_TIMESASN:
346 			res = vl->val.i * vr->val.i;
347 			break;
348 		case O_DIV:
349 		case O_DIVASN:
350 			if (vl->val.i == LONG_MIN && vr->val.i == -1)
351 				res = LONG_MIN;
352 			else
353 				res = vl->val.i / vr->val.i;
354 			break;
355 		case O_MOD:
356 		case O_MODASN:
357 			if (vl->val.i == LONG_MIN && vr->val.i == -1)
358 				res = 0;
359 			else
360 				res = vl->val.i % vr->val.i;
361 			break;
362 		case O_PLUS:
363 		case O_PLUSASN:
364 			res = vl->val.i + vr->val.i;
365 			break;
366 		case O_MINUS:
367 		case O_MINUSASN:
368 			res = vl->val.i - vr->val.i;
369 			break;
370 		case O_LSHIFT:
371 		case O_LSHIFTASN:
372 			res = vl->val.i << vr->val.i;
373 			break;
374 		case O_RSHIFT:
375 		case O_RSHIFTASN:
376 			res = vl->val.i >> vr->val.i;
377 			break;
378 		case O_LT:
379 			res = vl->val.i < vr->val.i;
380 			break;
381 		case O_LE:
382 			res = vl->val.i <= vr->val.i;
383 			break;
384 		case O_GT:
385 			res = vl->val.i > vr->val.i;
386 			break;
387 		case O_GE:
388 			res = vl->val.i >= vr->val.i;
389 			break;
390 		case O_EQ:
391 			res = vl->val.i == vr->val.i;
392 			break;
393 		case O_NE:
394 			res = vl->val.i != vr->val.i;
395 			break;
396 		case O_BAND:
397 		case O_BANDASN:
398 			res = vl->val.i & vr->val.i;
399 			break;
400 		case O_BXOR:
401 		case O_BXORASN:
402 			res = vl->val.i ^ vr->val.i;
403 			break;
404 		case O_BOR:
405 		case O_BORASN:
406 			res = vl->val.i | vr->val.i;
407 			break;
408 		case O_LAND:
409 			if (!vl->val.i)
410 				es->noassign++;
411 			vr = intvar(es, evalexpr(es, ((int) prec) - 1));
412 			res = vl->val.i && vr->val.i;
413 			if (!vl->val.i)
414 				es->noassign--;
415 			break;
416 		case O_LOR:
417 			if (vl->val.i)
418 				es->noassign++;
419 			vr = intvar(es, evalexpr(es, ((int) prec) - 1));
420 			res = vl->val.i || vr->val.i;
421 			if (vl->val.i)
422 				es->noassign--;
423 			break;
424 		case O_TERN:
425 			{
426 				int e = vl->val.i != 0;
427 
428 				if (!e)
429 					es->noassign++;
430 				vl = evalexpr(es, MAX_PREC);
431 				if (!e)
432 					es->noassign--;
433 				if (es->tok != CTERN)
434 					evalerr(es, ET_STR, "missing :");
435 				token(es);
436 				if (e)
437 					es->noassign++;
438 				vr = evalexpr(es, P_TERN);
439 				if (e)
440 					es->noassign--;
441 				vl = e ? vl : vr;
442 			}
443 			break;
444 		case O_ASN:
445 			res = vr->val.i;
446 			break;
447 		case O_COMMA:
448 			res = vr->val.i;
449 			break;
450 		}
451 		if (IS_ASSIGNOP(op)) {
452 			vr->val.i = res;
453 			if (vasn->flag & INTEGER)
454 				setint_v(vasn, vr, es->arith);
455 			else
456 				setint(vasn, res);
457 			vl = vr;
458 		} else if (op != O_TERN)
459 			vl->val.i = res;
460 	}
461 	return vl;
462 }
463 
464 static void
token(Expr_state * es)465 token(Expr_state *es)
466 {
467 	const char *cp;
468 	int c;
469 	char *tvar;
470 
471 	/* skip white space */
472 	for (cp = es->tokp; (c = *cp), isspace((unsigned char)c); cp++)
473 		;
474 	es->tokp = cp;
475 
476 	if (c == '\0')
477 		es->tok = END;
478 	else if (letter(c)) {
479 		for (; letnum(c); c = *cp)
480 			cp++;
481 		if (c == '[') {
482 			int len;
483 
484 			len = array_ref_len(cp);
485 			if (len == 0)
486 				evalerr(es, ET_STR, "missing ]");
487 			cp += len;
488 		} else if (c == '(' /*)*/ ) {
489 			/* todo: add math functions (all take single argument):
490 			 * abs acos asin atan cos cosh exp int log sin sinh sqrt
491 			 * tan tanh
492 			 */
493 			;
494 		}
495 		if (es->noassign) {
496 			es->val = tempvar();
497 			es->val->flag |= EXPRLVALUE;
498 		} else {
499 			tvar = str_nsave(es->tokp, cp - es->tokp, ATEMP);
500 			es->val = global(tvar);
501 			afree(tvar, ATEMP);
502 		}
503 		es->tok = VAR;
504 	} else if (digit(c)) {
505 		for (; c != '_' && (letnum(c) || c == '#'); c = *cp++)
506 			;
507 		tvar = str_nsave(es->tokp, --cp - es->tokp, ATEMP);
508 		es->val = tempvar();
509 		es->val->flag &= ~INTEGER;
510 		es->val->type = 0;
511 		es->val->val.s = tvar;
512 		if (setint_v(es->val, es->val, es->arith) == NULL)
513 			evalerr(es, ET_BADLIT, tvar);
514 		afree(tvar, ATEMP);
515 		es->tok = LIT;
516 	} else {
517 		int i, n0;
518 
519 		for (i = 0; (n0 = opinfo[i].name[0]); i++)
520 			if (c == n0 &&
521 			    strncmp(cp, opinfo[i].name, opinfo[i].len) == 0) {
522 				es->tok = (enum token) i;
523 				cp += opinfo[i].len;
524 				break;
525 			}
526 		if (!n0)
527 			es->tok = BAD;
528 	}
529 	es->tokp = cp;
530 }
531 
532 /* Do a ++ or -- operation */
533 static struct tbl *
do_ppmm(Expr_state * es,enum token op,struct tbl * vasn,bool is_prefix)534 do_ppmm(Expr_state *es, enum token op, struct tbl *vasn, bool is_prefix)
535 {
536 	struct tbl *vl;
537 	int oval;
538 
539 	assign_check(es, op, vasn);
540 
541 	vl = intvar(es, vasn);
542 	oval = op == O_PLUSPLUS ? vl->val.i++ : vl->val.i--;
543 	if (vasn->flag & INTEGER)
544 		setint_v(vasn, vl, es->arith);
545 	else
546 		setint(vasn, vl->val.i);
547 	if (!is_prefix)		/* undo the inc/dec */
548 		vl->val.i = oval;
549 
550 	return vl;
551 }
552 
553 static void
assign_check(Expr_state * es,enum token op,struct tbl * vasn)554 assign_check(Expr_state *es, enum token op, struct tbl *vasn)
555 {
556 	if (es->tok == END || vasn == NULL ||
557 	    (vasn->name[0] == '\0' && !(vasn->flag & EXPRLVALUE)))
558 		evalerr(es, ET_LVALUE, opinfo[(int) op].name);
559 	else if (vasn->flag & RDONLY)
560 		evalerr(es, ET_RDONLY, opinfo[(int) op].name);
561 }
562 
563 static struct tbl *
tempvar(void)564 tempvar(void)
565 {
566 	struct tbl *vp;
567 
568 	vp = alloc(sizeof(struct tbl), ATEMP);
569 	vp->flag = ISSET|INTEGER;
570 	vp->type = 0;
571 	vp->areap = ATEMP;
572 	vp->val.i = 0;
573 	vp->name[0] = '\0';
574 	return vp;
575 }
576 
577 /* cast (string) variable to temporary integer variable */
578 static struct tbl *
intvar(Expr_state * es,struct tbl * vp)579 intvar(Expr_state *es, struct tbl *vp)
580 {
581 	struct tbl *vq;
582 
583 	/* try to avoid replacing a temp var with another temp var */
584 	if (vp->name[0] == '\0' &&
585 	    (vp->flag & (ISSET|INTEGER|EXPRLVALUE)) == (ISSET|INTEGER))
586 		return vp;
587 
588 	vq = tempvar();
589 	if (setint_v(vq, vp, es->arith) == NULL) {
590 		if (vp->flag & EXPRINEVAL)
591 			evalerr(es, ET_RECURSIVE, vp->name);
592 		es->evaling = vp;
593 		vp->flag |= EXPRINEVAL;
594 		disable_subst++;
595 		v_evaluate(vq, str_val(vp), KSH_UNWIND_ERROR, es->arith);
596 		disable_subst--;
597 		vp->flag &= ~EXPRINEVAL;
598 		es->evaling = NULL;
599 	}
600 	return vq;
601 }
602