xref: /aosp_15_r20/external/toybox/toys/pending/expr.c (revision cf5a6c84e2b8763fc1a7db14496fd4742913b199)
1*cf5a6c84SAndroid Build Coastguard Worker /* expr.c - evaluate expression
2*cf5a6c84SAndroid Build Coastguard Worker  *
3*cf5a6c84SAndroid Build Coastguard Worker  * Copyright 2016 Google Inc.
4*cf5a6c84SAndroid Build Coastguard Worker  * Copyright 2013 Daniel Verkamp <[email protected]>
5*cf5a6c84SAndroid Build Coastguard Worker  *
6*cf5a6c84SAndroid Build Coastguard Worker  * http://pubs.opengroup.org/onlinepubs/9699919799/utilities/expr.html
7*cf5a6c84SAndroid Build Coastguard Worker  *
8*cf5a6c84SAndroid Build Coastguard Worker  * The web standard is incomplete (precedence grouping missing), see:
9*cf5a6c84SAndroid Build Coastguard Worker  * http://permalink.gmane.org/gmane.comp.standards.posix.austin.general/10141
10*cf5a6c84SAndroid Build Coastguard Worker  *
11*cf5a6c84SAndroid Build Coastguard Worker  * eval_expr() uses the recursive "Precedence Climbing" algorithm:
12*cf5a6c84SAndroid Build Coastguard Worker  *
13*cf5a6c84SAndroid Build Coastguard Worker  * Clarke, Keith. "The top-down parsing of expressions." University of London.
14*cf5a6c84SAndroid Build Coastguard Worker  * Queen Mary College. Department of Computer Science and Statistics, 1986.
15*cf5a6c84SAndroid Build Coastguard Worker  *
16*cf5a6c84SAndroid Build Coastguard Worker  * http://www.antlr.org/papers/Clarke-expr-parsing-1986.pdf
17*cf5a6c84SAndroid Build Coastguard Worker  *
18*cf5a6c84SAndroid Build Coastguard Worker  * Nice explanation and Python implementation:
19*cf5a6c84SAndroid Build Coastguard Worker  * http://eli.thegreenplace.net/2012/08/02/parsing-expressions-by-precedence-climbing
20*cf5a6c84SAndroid Build Coastguard Worker 
21*cf5a6c84SAndroid Build Coastguard Worker USE_EXPR(NEWTOY(expr, 0, TOYFLAG_USR|TOYFLAG_BIN|TOYFLAG_ARGFAIL(2)))
22*cf5a6c84SAndroid Build Coastguard Worker 
23*cf5a6c84SAndroid Build Coastguard Worker config EXPR
24*cf5a6c84SAndroid Build Coastguard Worker   bool "expr"
25*cf5a6c84SAndroid Build Coastguard Worker   default n
26*cf5a6c84SAndroid Build Coastguard Worker   help
27*cf5a6c84SAndroid Build Coastguard Worker     usage: expr ARG1 OPERATOR ARG2...
28*cf5a6c84SAndroid Build Coastguard Worker 
29*cf5a6c84SAndroid Build Coastguard Worker     Evaluate expression and print result. For example, "expr 1 + 2" prints "3".
30*cf5a6c84SAndroid Build Coastguard Worker 
31*cf5a6c84SAndroid Build Coastguard Worker     The supported operators are (grouped from highest to lowest priority):
32*cf5a6c84SAndroid Build Coastguard Worker 
33*cf5a6c84SAndroid Build Coastguard Worker       ( )    :    * / %    + -    != <= < >= > =    &    |
34*cf5a6c84SAndroid Build Coastguard Worker 
35*cf5a6c84SAndroid Build Coastguard Worker     Each constant and operator must be a separate command line argument.
36*cf5a6c84SAndroid Build Coastguard Worker     All operators are infix, requiring a value on each side of the operator.
37*cf5a6c84SAndroid Build Coastguard Worker     Operators of the same priority are evaluated left to right. Parentheses
38*cf5a6c84SAndroid Build Coastguard Worker     elevate the priority of expression they contain. The & and | operators
39*cf5a6c84SAndroid Build Coastguard Worker     are logical (not bitwise).
40*cf5a6c84SAndroid Build Coastguard Worker 
41*cf5a6c84SAndroid Build Coastguard Worker     All operators yield integers, and most operators expect integer arguments.
42*cf5a6c84SAndroid Build Coastguard Worker     Comparisons may alphabetically compare strings, logical operators treat a
43*cf5a6c84SAndroid Build Coastguard Worker     blank string as false and nonblank as true, and the regex operator
44*cf5a6c84SAndroid Build Coastguard Worker     (str : pattern) yields the initial number of matching bytes. (So
45*cf5a6c84SAndroid Build Coastguard Worker     "abc : ab" is 2, but "abc : bc" is 0.)
46*cf5a6c84SAndroid Build Coastguard Worker 
47*cf5a6c84SAndroid Build Coastguard Worker     Calling expr from a command shell requires a lot of \( or '*' escaping
48*cf5a6c84SAndroid Build Coastguard Worker     to avoid interpreting shell control characters, vs the shell's "$((1+6/3))".
49*cf5a6c84SAndroid Build Coastguard Worker */
50*cf5a6c84SAndroid Build Coastguard Worker 
51*cf5a6c84SAndroid Build Coastguard Worker // TODO: int overflow checking
52*cf5a6c84SAndroid Build Coastguard Worker 
53*cf5a6c84SAndroid Build Coastguard Worker #define FOR_expr
54*cf5a6c84SAndroid Build Coastguard Worker #include "toys.h"
55*cf5a6c84SAndroid Build Coastguard Worker 
56*cf5a6c84SAndroid Build Coastguard Worker GLOBALS(
57*cf5a6c84SAndroid Build Coastguard Worker   char **tok, *delete;
58*cf5a6c84SAndroid Build Coastguard Worker )
59*cf5a6c84SAndroid Build Coastguard Worker 
60*cf5a6c84SAndroid Build Coastguard Worker // If s string, otherwise int.
61*cf5a6c84SAndroid Build Coastguard Worker struct value {
62*cf5a6c84SAndroid Build Coastguard Worker   char *s;
63*cf5a6c84SAndroid Build Coastguard Worker   long long i;
64*cf5a6c84SAndroid Build Coastguard Worker };
65*cf5a6c84SAndroid Build Coastguard Worker 
66*cf5a6c84SAndroid Build Coastguard Worker // Get the value as a string.
get_str(struct value * v)67*cf5a6c84SAndroid Build Coastguard Worker char *get_str(struct value *v)
68*cf5a6c84SAndroid Build Coastguard Worker {
69*cf5a6c84SAndroid Build Coastguard Worker   if (v->s) return v->s;
70*cf5a6c84SAndroid Build Coastguard Worker   else return xmprintf("%lld", v->i);
71*cf5a6c84SAndroid Build Coastguard Worker }
72*cf5a6c84SAndroid Build Coastguard Worker 
73*cf5a6c84SAndroid Build Coastguard Worker // Get the value as an integer and return 1, or return 0 on error.
get_int(struct value * v,long long * ret)74*cf5a6c84SAndroid Build Coastguard Worker int get_int(struct value *v, long long *ret)
75*cf5a6c84SAndroid Build Coastguard Worker {
76*cf5a6c84SAndroid Build Coastguard Worker   char *end;
77*cf5a6c84SAndroid Build Coastguard Worker 
78*cf5a6c84SAndroid Build Coastguard Worker   if (v->s) {
79*cf5a6c84SAndroid Build Coastguard Worker     *ret = strtoll(v->s, &end, 10); // base 10 or autodetect?
80*cf5a6c84SAndroid Build Coastguard Worker     if (*end) return 0;
81*cf5a6c84SAndroid Build Coastguard Worker   } else *ret = v->i;
82*cf5a6c84SAndroid Build Coastguard Worker 
83*cf5a6c84SAndroid Build Coastguard Worker   return 1;
84*cf5a6c84SAndroid Build Coastguard Worker }
85*cf5a6c84SAndroid Build Coastguard Worker 
86*cf5a6c84SAndroid Build Coastguard Worker // Preserve the invariant that v.s is NULL when the value is an integer.
assign_int(struct value * v,long long i)87*cf5a6c84SAndroid Build Coastguard Worker void assign_int(struct value *v, long long i)
88*cf5a6c84SAndroid Build Coastguard Worker {
89*cf5a6c84SAndroid Build Coastguard Worker   v->i = i;
90*cf5a6c84SAndroid Build Coastguard Worker   v->s = 0;
91*cf5a6c84SAndroid Build Coastguard Worker }
92*cf5a6c84SAndroid Build Coastguard Worker 
93*cf5a6c84SAndroid Build Coastguard Worker // Check if v is 0 or the empty string.
is_false(struct value * v)94*cf5a6c84SAndroid Build Coastguard Worker static int is_false(struct value *v)
95*cf5a6c84SAndroid Build Coastguard Worker {
96*cf5a6c84SAndroid Build Coastguard Worker   return get_int(v, &v->i) && !v->i;
97*cf5a6c84SAndroid Build Coastguard Worker }
98*cf5a6c84SAndroid Build Coastguard Worker 
99*cf5a6c84SAndroid Build Coastguard Worker // 'ret' is filled with a string capture or int match position.
re(char * target,char * pattern,struct value * ret)100*cf5a6c84SAndroid Build Coastguard Worker static void re(char *target, char *pattern, struct value *ret)
101*cf5a6c84SAndroid Build Coastguard Worker {
102*cf5a6c84SAndroid Build Coastguard Worker   regex_t pat;
103*cf5a6c84SAndroid Build Coastguard Worker   regmatch_t m[2];
104*cf5a6c84SAndroid Build Coastguard Worker 
105*cf5a6c84SAndroid Build Coastguard Worker   xregcomp(&pat, pattern, 0);
106*cf5a6c84SAndroid Build Coastguard Worker   // must match at pos 0
107*cf5a6c84SAndroid Build Coastguard Worker   if (!regexec(&pat, target, 2, m, 0) && !m[0].rm_so) {
108*cf5a6c84SAndroid Build Coastguard Worker     // Return first parenthesized subexpression as string, or length of match
109*cf5a6c84SAndroid Build Coastguard Worker     if (pat.re_nsub>0) {
110*cf5a6c84SAndroid Build Coastguard Worker       ret->s = xmprintf("%.*s", (int)(m[1].rm_eo-m[1].rm_so), target+m[1].rm_so);
111*cf5a6c84SAndroid Build Coastguard Worker       free(TT.delete);
112*cf5a6c84SAndroid Build Coastguard Worker       TT.delete = ret->s;
113*cf5a6c84SAndroid Build Coastguard Worker     } else assign_int(ret, m[0].rm_eo);
114*cf5a6c84SAndroid Build Coastguard Worker   } else {
115*cf5a6c84SAndroid Build Coastguard Worker     if (pat.re_nsub>0) ret->s = "";
116*cf5a6c84SAndroid Build Coastguard Worker     else assign_int(ret, 0);
117*cf5a6c84SAndroid Build Coastguard Worker   }
118*cf5a6c84SAndroid Build Coastguard Worker   regfree(&pat);
119*cf5a6c84SAndroid Build Coastguard Worker }
120*cf5a6c84SAndroid Build Coastguard Worker 
121*cf5a6c84SAndroid Build Coastguard Worker // 4 different signatures of operators.  S = string, I = int, SI = string or
122*cf5a6c84SAndroid Build Coastguard Worker // int.
123*cf5a6c84SAndroid Build Coastguard Worker enum { SI_TO_SI = 1, SI_TO_I, I_TO_I, S_TO_SI };
124*cf5a6c84SAndroid Build Coastguard Worker 
125*cf5a6c84SAndroid Build Coastguard Worker enum { OR = 1, AND, EQ, NE, GT, GTE, LT, LTE, ADD, SUB, MUL, DIVI, MOD, RE };
126*cf5a6c84SAndroid Build Coastguard Worker 
127*cf5a6c84SAndroid Build Coastguard Worker // operators grouped by precedence
128*cf5a6c84SAndroid Build Coastguard Worker static struct op_def {
129*cf5a6c84SAndroid Build Coastguard Worker   char *tok;
130*cf5a6c84SAndroid Build Coastguard Worker   char prec, sig, op; // precedence, signature for type coercion, operator ID
131*cf5a6c84SAndroid Build Coastguard Worker } OPS[] = {
132*cf5a6c84SAndroid Build Coastguard Worker   // logical ops, precedence 1 and 2, signature SI_TO_SI
133*cf5a6c84SAndroid Build Coastguard Worker   {"|", 1, SI_TO_SI, OR  },
134*cf5a6c84SAndroid Build Coastguard Worker   {"&", 2, SI_TO_SI, AND },
135*cf5a6c84SAndroid Build Coastguard Worker   // comparison ops, precedence 3, signature SI_TO_I
136*cf5a6c84SAndroid Build Coastguard Worker   {"=", 3, SI_TO_I, EQ }, {"==", 3, SI_TO_I, EQ  }, {"!=", 3, SI_TO_I, NE },
137*cf5a6c84SAndroid Build Coastguard Worker   {">", 3, SI_TO_I, GT }, {">=", 3, SI_TO_I, GTE },
138*cf5a6c84SAndroid Build Coastguard Worker   {"<", 3, SI_TO_I, LT }, {"<=", 3, SI_TO_I, LTE },
139*cf5a6c84SAndroid Build Coastguard Worker   // arithmetic ops, precedence 4 and 5, signature I_TO_I
140*cf5a6c84SAndroid Build Coastguard Worker   {"+", 4, I_TO_I, ADD }, {"-",  4, I_TO_I, SUB },
141*cf5a6c84SAndroid Build Coastguard Worker   {"*", 5, I_TO_I, MUL }, {"/",  5, I_TO_I, DIVI }, {"%", 5, I_TO_I, MOD },
142*cf5a6c84SAndroid Build Coastguard Worker   // regex match, precedence 6, signature S_TO_SI
143*cf5a6c84SAndroid Build Coastguard Worker   {":", 6, S_TO_SI, RE },
144*cf5a6c84SAndroid Build Coastguard Worker   {NULL, 0, 0, 0}, // sentinel
145*cf5a6c84SAndroid Build Coastguard Worker };
146*cf5a6c84SAndroid Build Coastguard Worker 
eval_op(struct op_def * o,struct value * ret,struct value * rhs)147*cf5a6c84SAndroid Build Coastguard Worker void eval_op(struct op_def *o, struct value *ret, struct value *rhs)
148*cf5a6c84SAndroid Build Coastguard Worker {
149*cf5a6c84SAndroid Build Coastguard Worker   long long cmp, a, b, x = 0; // x = a OP b for ints.
150*cf5a6c84SAndroid Build Coastguard Worker   char *s, *t; // string operands
151*cf5a6c84SAndroid Build Coastguard Worker 
152*cf5a6c84SAndroid Build Coastguard Worker   switch (o->sig) {
153*cf5a6c84SAndroid Build Coastguard Worker 
154*cf5a6c84SAndroid Build Coastguard Worker   case SI_TO_SI:
155*cf5a6c84SAndroid Build Coastguard Worker     switch (o->op) {
156*cf5a6c84SAndroid Build Coastguard Worker     case OR:  if (is_false(ret)) *ret = *rhs; break;
157*cf5a6c84SAndroid Build Coastguard Worker     case AND: if (is_false(ret) || is_false(rhs)) assign_int(ret, 0); break;
158*cf5a6c84SAndroid Build Coastguard Worker     }
159*cf5a6c84SAndroid Build Coastguard Worker     break;
160*cf5a6c84SAndroid Build Coastguard Worker 
161*cf5a6c84SAndroid Build Coastguard Worker   case SI_TO_I:
162*cf5a6c84SAndroid Build Coastguard Worker     if (get_int(ret, &a) && get_int(rhs, &b)) { // both are ints
163*cf5a6c84SAndroid Build Coastguard Worker       cmp = a - b;
164*cf5a6c84SAndroid Build Coastguard Worker     } else { // otherwise compare both as strings
165*cf5a6c84SAndroid Build Coastguard Worker       cmp = strcmp(s = get_str(ret), t = get_str(rhs));
166*cf5a6c84SAndroid Build Coastguard Worker       if (ret->s != s) free(s);
167*cf5a6c84SAndroid Build Coastguard Worker       if (rhs->s != t) free(t);
168*cf5a6c84SAndroid Build Coastguard Worker     }
169*cf5a6c84SAndroid Build Coastguard Worker     switch (o->op) {
170*cf5a6c84SAndroid Build Coastguard Worker     case EQ:  x = cmp == 0; break;
171*cf5a6c84SAndroid Build Coastguard Worker     case NE:  x = cmp != 0; break;
172*cf5a6c84SAndroid Build Coastguard Worker     case GT:  x = cmp >  0; break;
173*cf5a6c84SAndroid Build Coastguard Worker     case GTE: x = cmp >= 0; break;
174*cf5a6c84SAndroid Build Coastguard Worker     case LT:  x = cmp <  0; break;
175*cf5a6c84SAndroid Build Coastguard Worker     case LTE: x = cmp <= 0; break;
176*cf5a6c84SAndroid Build Coastguard Worker     }
177*cf5a6c84SAndroid Build Coastguard Worker     assign_int(ret, x);
178*cf5a6c84SAndroid Build Coastguard Worker     break;
179*cf5a6c84SAndroid Build Coastguard Worker 
180*cf5a6c84SAndroid Build Coastguard Worker   case I_TO_I:
181*cf5a6c84SAndroid Build Coastguard Worker     if (!get_int(ret, &a) || !get_int(rhs, &b))
182*cf5a6c84SAndroid Build Coastguard Worker       error_exit("non-integer argument");
183*cf5a6c84SAndroid Build Coastguard Worker     switch (o->op) {
184*cf5a6c84SAndroid Build Coastguard Worker     case ADD: x = a + b; break;
185*cf5a6c84SAndroid Build Coastguard Worker     case SUB: x = a - b; break;
186*cf5a6c84SAndroid Build Coastguard Worker     case MUL: x = a * b; break;
187*cf5a6c84SAndroid Build Coastguard Worker     case DIVI: if (b == 0) error_exit("division by zero"); x = a / b; break;
188*cf5a6c84SAndroid Build Coastguard Worker     case MOD:  if (b == 0) error_exit("division by zero"); x = a % b; break;
189*cf5a6c84SAndroid Build Coastguard Worker     }
190*cf5a6c84SAndroid Build Coastguard Worker     assign_int(ret, x);
191*cf5a6c84SAndroid Build Coastguard Worker     break;
192*cf5a6c84SAndroid Build Coastguard Worker 
193*cf5a6c84SAndroid Build Coastguard Worker   case S_TO_SI: // op == RE
194*cf5a6c84SAndroid Build Coastguard Worker     s = get_str(ret);
195*cf5a6c84SAndroid Build Coastguard Worker     cmp = ret->s!=s; // ret overwritten by re so check now
196*cf5a6c84SAndroid Build Coastguard Worker     re(s, t = get_str(rhs), ret);
197*cf5a6c84SAndroid Build Coastguard Worker     if (cmp) free(s);
198*cf5a6c84SAndroid Build Coastguard Worker     if (rhs->s!=t) free(t);
199*cf5a6c84SAndroid Build Coastguard Worker     break;
200*cf5a6c84SAndroid Build Coastguard Worker   }
201*cf5a6c84SAndroid Build Coastguard Worker }
202*cf5a6c84SAndroid Build Coastguard Worker 
203*cf5a6c84SAndroid Build Coastguard Worker // Recurive "Precedence Climbing" evaluation of compound expression, setting ret
eval_expr(struct value * ret,int min_prec)204*cf5a6c84SAndroid Build Coastguard Worker static void eval_expr(struct value *ret, int min_prec)
205*cf5a6c84SAndroid Build Coastguard Worker {
206*cf5a6c84SAndroid Build Coastguard Worker   struct value rhs;
207*cf5a6c84SAndroid Build Coastguard Worker 
208*cf5a6c84SAndroid Build Coastguard Worker   if (!*TT.tok) error_exit("need arg @%td", TT.tok-toys.optargs);
209*cf5a6c84SAndroid Build Coastguard Worker 
210*cf5a6c84SAndroid Build Coastguard Worker   // Everything is infix, so set ret to first value, handling parentheses
211*cf5a6c84SAndroid Build Coastguard Worker   if (!strcmp(*TT.tok, "(")) {
212*cf5a6c84SAndroid Build Coastguard Worker     TT.tok++;
213*cf5a6c84SAndroid Build Coastguard Worker     eval_expr(ret, 1);        // We're inside ( ), so min_prec = 1
214*cf5a6c84SAndroid Build Coastguard Worker     if (ret->s && !strcmp(ret->s, ")")) error_exit("empty ( )");
215*cf5a6c84SAndroid Build Coastguard Worker     if (!*TT.tok || strcmp(*TT.tok, ")"))
216*cf5a6c84SAndroid Build Coastguard Worker       error_exit("Expected ) @%td", TT.tok-toys.optargs);
217*cf5a6c84SAndroid Build Coastguard Worker   } else ret->s = *TT.tok;  // simple literal, all values start as strings
218*cf5a6c84SAndroid Build Coastguard Worker   TT.tok++;
219*cf5a6c84SAndroid Build Coastguard Worker 
220*cf5a6c84SAndroid Build Coastguard Worker   // Evaluate RHS and apply operator until precedence is too low.
221*cf5a6c84SAndroid Build Coastguard Worker   while (*TT.tok) {
222*cf5a6c84SAndroid Build Coastguard Worker     struct op_def *o = OPS;
223*cf5a6c84SAndroid Build Coastguard Worker 
224*cf5a6c84SAndroid Build Coastguard Worker     while (o->tok) { // Look up operator
225*cf5a6c84SAndroid Build Coastguard Worker       if (!strcmp(*TT.tok, o->tok)) break;
226*cf5a6c84SAndroid Build Coastguard Worker       o++;
227*cf5a6c84SAndroid Build Coastguard Worker     }
228*cf5a6c84SAndroid Build Coastguard Worker     if (!o->tok) break; // Not an operator (extra input will fail later)
229*cf5a6c84SAndroid Build Coastguard Worker     if (o->prec < min_prec) break; // Precedence too low, pop a stack frame
230*cf5a6c84SAndroid Build Coastguard Worker     TT.tok++;
231*cf5a6c84SAndroid Build Coastguard Worker 
232*cf5a6c84SAndroid Build Coastguard Worker     eval_expr(&rhs, o->prec + 1); // Evaluate RHS, with higher min precedence
233*cf5a6c84SAndroid Build Coastguard Worker     eval_op(o, ret, &rhs); // Apply operator, setting 'ret'
234*cf5a6c84SAndroid Build Coastguard Worker   }
235*cf5a6c84SAndroid Build Coastguard Worker }
236*cf5a6c84SAndroid Build Coastguard Worker 
expr_main(void)237*cf5a6c84SAndroid Build Coastguard Worker void expr_main(void)
238*cf5a6c84SAndroid Build Coastguard Worker {
239*cf5a6c84SAndroid Build Coastguard Worker   struct value ret = {0};
240*cf5a6c84SAndroid Build Coastguard Worker 
241*cf5a6c84SAndroid Build Coastguard Worker   TT.tok = toys.optargs; // initialize global token
242*cf5a6c84SAndroid Build Coastguard Worker   eval_expr(&ret, 1);
243*cf5a6c84SAndroid Build Coastguard Worker   if (*TT.tok) error_exit("Unexpected extra input '%s'\n", *TT.tok);
244*cf5a6c84SAndroid Build Coastguard Worker 
245*cf5a6c84SAndroid Build Coastguard Worker   if (ret.s) printf("%s\n", ret.s);
246*cf5a6c84SAndroid Build Coastguard Worker   else printf("%lld\n", ret.i);
247*cf5a6c84SAndroid Build Coastguard Worker 
248*cf5a6c84SAndroid Build Coastguard Worker   toys.exitval = is_false(&ret);
249*cf5a6c84SAndroid Build Coastguard Worker 
250*cf5a6c84SAndroid Build Coastguard Worker   if (CFG_TOYBOX_FREE && TT.delete) free(TT.delete);
251*cf5a6c84SAndroid Build Coastguard Worker }
252