/*- * Copyright (c) 2010 The NetBSD Foundation, Inc. * All rights reserved. * * This code is derived from software contributed to The NetBSD Foundation * by David A. Holland. * * Redistribution and use in source and binary forms, with or without * modification, are permitted provided that the following conditions * are met: * 1. Redistributions of source code must retain the above copyright * notice, this list of conditions and the following disclaimer. * 2. Redistributions in binary form must reproduce the above copyright * notice, this list of conditions and the following disclaimer in the * documentation and/or other materials provided with the distribution. * * THIS SOFTWARE IS PROVIDED BY THE NETBSD FOUNDATION, INC. AND CONTRIBUTORS * ``AS IS'' AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED * TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR * PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE FOUNDATION OR CONTRIBUTORS * BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR * CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF * SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS * INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN * CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) * ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE * POSSIBILITY OF SUCH DAMAGE. */ #include <stdlib.h> #include <string.h> #include <limits.h> #include <errno.h> //#define DEBUG #ifdef DEBUG #include <stdio.h> #endif #include "utils.h" #include "array.h" #include "mode.h" #include "place.h" #include "eval.h" /* * e ::= * e1 ? e2 : e3 * e1 || e2 * e1 && e2 * e1 | e2 * e1 ^ e2 * e1 & e2 * e1 == e2 | e1 != e2 * e1 < e2 | e1 <= e2 | e1 > e2 | e1 >= e2 * e1 << e2 | e1 >> e2 * e1 + e2 | e1 - e2 * e1 * e2 | e1 / e2 | e1 % e2 * !e | ~e | -e | +e * ( e ) | ident */ enum tokens { T_EOF, /* end of input */ T_VAL, /* value */ T_LPAREN, /* parens */ T_RPAREN, T_PIPEPIPE, /* operators */ T_AMPAMP, T_EQEQ, T_BANGEQ, T_LTEQ, T_GTEQ, T_LTLT, T_GTGT, T_QUES, T_COLON, T_PIPE, T_CARET, T_AMP, T_LT, T_GT, T_PLUS, T_MINUS, T_STAR, T_SLASH, T_PCT, T_BANG, T_TILDE, }; static const struct { char c1, c2; enum tokens tok; } tokens_2[] = { { '|', '|', T_PIPEPIPE }, { '&', '&', T_AMPAMP }, { '=', '=', T_EQEQ }, { '!', '=', T_BANGEQ }, { '<', '=', T_LTEQ }, { '>', '=', T_GTEQ }, { '<', '<', T_LTLT }, { '>', '>', T_GTGT }, }; static const unsigned num_tokens_2 = HOWMANY(tokens_2); static const struct { char c1; enum tokens tok; } tokens_1[] = { { '?', T_QUES }, { ':', T_COLON }, { '|', T_PIPE }, { '^', T_CARET }, { '&', T_AMP }, { '<', T_LT }, { '>', T_GT }, { '+', T_PLUS }, { '-', T_MINUS }, { '*', T_STAR }, { '/', T_SLASH }, { '%', T_PCT }, { '!', T_BANG }, { '~', T_TILDE }, { '(', T_LPAREN }, { ')', T_RPAREN }, }; static const unsigned num_tokens_1 = HOWMANY(tokens_1); struct token { struct place place; enum tokens tok; int val; }; DECLARRAY(token, static UNUSED); DEFARRAY(token, static); static struct tokenarray tokens; static struct token * token_create(const struct place *p, enum tokens tok, int val) { struct token *t; t = domalloc(sizeof(*t)); t->place = *p; t->tok = tok; t->val = val; return t; } static void token_destroy(struct token *t) { dofree(t, sizeof(*t)); } DESTROYALL_ARRAY(token, ); #ifdef DEBUG static void printtokens(void) { unsigned i, num; struct token *t; fprintf(stderr, "tokens:"); num = tokenarray_num(&tokens); for (i=0; i<num; i++) { t = tokenarray_get(&tokens, i); switch (t->tok) { case T_EOF: fprintf(stderr, " <eof>"); break; case T_VAL: fprintf(stderr, " %d", t->val); break; case T_LPAREN: fprintf(stderr, " ("); break; case T_RPAREN: fprintf(stderr, " )"); break; case T_PIPEPIPE: fprintf(stderr, " ||"); break; case T_AMPAMP: fprintf(stderr, " &&"); break; case T_EQEQ: fprintf(stderr, " =="); break; case T_BANGEQ: fprintf(stderr, " !="); break; case T_LTEQ: fprintf(stderr, " <="); break; case T_GTEQ: fprintf(stderr, " >="); break; case T_LTLT: fprintf(stderr, " <<"); break; case T_GTGT: fprintf(stderr, " >>"); break; case T_QUES: fprintf(stderr, " ?"); break; case T_COLON: fprintf(stderr, " :"); break; case T_PIPE: fprintf(stderr, " |"); break; case T_CARET: fprintf(stderr, " ^"); break; case T_AMP: fprintf(stderr, " &"); break; case T_LT: fprintf(stderr, " <"); break; case T_GT: fprintf(stderr, " >"); break; case T_PLUS: fprintf(stderr, " +"); break; case T_MINUS: fprintf(stderr, " -"); break; case T_STAR: fprintf(stderr, " *"); break; case T_SLASH: fprintf(stderr, " /"); break; case T_PCT: fprintf(stderr, " %%"); break; case T_BANG: fprintf(stderr, " !"); break; case T_TILDE: fprintf(stderr, " ~"); break; } } fprintf(stderr, "\n"); } #endif static bool isuop(enum tokens tok) { switch (tok) { case T_BANG: case T_TILDE: case T_MINUS: case T_PLUS: return true; default: break; } return false; } static bool isbop(enum tokens tok) { switch (tok) { case T_EOF: case T_VAL: case T_LPAREN: case T_RPAREN: case T_COLON: case T_QUES: case T_BANG: case T_TILDE: return false; default: break; } return true; } static bool isop(enum tokens tok) { switch (tok) { case T_EOF: case T_VAL: case T_LPAREN: case T_RPAREN: return false; default: break; } return true; } static int getprec(enum tokens tok) { switch (tok) { case T_BANG: case T_TILDE: return -1; case T_STAR: case T_SLASH: case T_PCT: return 0; case T_PLUS: case T_MINUS: return 1; case T_LTLT: case T_GTGT: return 2; case T_LT: case T_LTEQ: case T_GT: case T_GTEQ: return 3; case T_EQEQ: case T_BANGEQ: return 4; case T_AMP: return 5; case T_CARET: return 6; case T_PIPE: return 7; case T_AMPAMP: return 8; case T_PIPEPIPE: return 9; default: break; } return 10; } static bool looser(enum tokens t1, enum tokens t2) { return getprec(t1) >= getprec(t2); } static int eval_uop(enum tokens op, int val) { switch (op) { case T_BANG: val = !val; break; case T_TILDE: val = (int)~(unsigned)val; break; case T_MINUS: val = -val; break; case T_PLUS: break; default: assert(0); break; } return val; } static int eval_bop(struct place *p, int lv, enum tokens op, int rv) { unsigned mask; switch (op) { case T_PIPEPIPE: return lv || rv; case T_AMPAMP: return lv && rv; case T_PIPE: return (int)((unsigned)lv | (unsigned)rv); case T_CARET: return (int)((unsigned)lv ^ (unsigned)rv); case T_AMP: return (int)((unsigned)lv & (unsigned)rv); case T_EQEQ: return lv == rv; case T_BANGEQ: return lv != rv; case T_LT: return lv < rv; case T_GT: return lv > rv; case T_LTEQ: return lv <= rv; case T_GTEQ: return lv >= rv; case T_LTLT: case T_GTGT: if (rv < 0) { complain(p, "Negative bit-shift"); complain_fail(); rv = 0; } if ((unsigned)rv >= CHAR_BIT * sizeof(unsigned)) { complain(p, "Bit-shift farther than type width"); complain_fail(); rv = 0; } if (op == T_LTLT) { return (int)((unsigned)lv << (unsigned)rv); } mask = ((unsigned)-1) << (CHAR_BIT * sizeof(unsigned) - rv); lv = (int)(((unsigned)lv >> (unsigned)rv) | mask); return lv; case T_MINUS: if (rv == INT_MIN) { if (lv == INT_MIN) { return 0; } lv--; rv++; } rv = -rv; /* FALLTHROUGH */ case T_PLUS: if (rv > 0 && lv > (INT_MAX - rv)) { complain(p, "Integer overflow"); complain_fail(); return INT_MAX; } if (rv < 0 && lv < (INT_MIN - rv)) { complain(p, "Integer underflow"); complain_fail(); return INT_MIN; } return lv + rv; case T_STAR: if (rv == 0) { return 0; } if (rv == 1) { return lv; } if (rv == -1 && lv == INT_MIN) { lv++; lv = -lv; if (lv == INT_MAX) { complain(p, "Integer overflow"); complain_fail(); return INT_MAX; } lv++; return lv; } if (lv == INT_MIN && rv < 0) { complain(p, "Integer overflow"); complain_fail(); return INT_MAX; } if (lv == INT_MIN && rv > 0) { complain(p, "Integer underflow"); complain_fail(); return INT_MIN; } if (rv < 0) { rv = -rv; lv = -lv; } if (lv > 0 && lv > INT_MAX / rv) { complain(p, "Integer overflow"); complain_fail(); return INT_MAX; } if (lv < 0 && lv < INT_MIN / rv) { complain(p, "Integer underflow"); complain_fail(); return INT_MIN; } return lv * rv; case T_SLASH: if (rv == 0) { complain(p, "Division by zero"); complain_fail(); return 0; } return lv / rv; case T_PCT: if (rv == 0) { complain(p, "Modulus by zero"); complain_fail(); return 0; } return lv % rv; default: assert(0); break; } return 0; } static void tryreduce(void) { unsigned num; struct token *t1, *t2, *t3, *t4, *t5, *t6; while (1) { #ifdef DEBUG printtokens(); #endif num = tokenarray_num(&tokens); t1 = (num >= 1) ? tokenarray_get(&tokens, num-1) : NULL; t2 = (num >= 2) ? tokenarray_get(&tokens, num-2) : NULL; t3 = (num >= 3) ? tokenarray_get(&tokens, num-3) : NULL; if (num >= 3 && t3->tok == T_LPAREN && t2->tok == T_VAL && t1->tok == T_RPAREN) { /* (x) -> x */ t2->place = t3->place; token_destroy(t1); token_destroy(t3); tokenarray_remove(&tokens, num-1); tokenarray_remove(&tokens, num-3); continue; } if (num >= 2 && (num == 2 || isop(t3->tok) || t3->tok == T_LPAREN) && isuop(t2->tok) && t1->tok == T_VAL) { /* unary operator */ t1->val = eval_uop(t2->tok, t1->val); t1->place = t2->place; token_destroy(t2); tokenarray_remove(&tokens, num-2); continue; } if (num >= 2 && (num == 2 || isop(t3->tok) || t3->tok == T_LPAREN) && t2->tok != T_LPAREN && t2->tok != T_VAL && t1->tok == T_VAL) { complain(&t2->place, "Invalid unary operator"); complain_fail(); token_destroy(t2); tokenarray_remove(&tokens, num-2); continue; } t4 = (num >= 4) ? tokenarray_get(&tokens, num-4) : NULL; if (num >= 4 && t4->tok == T_VAL && isbop(t3->tok) && t2->tok == T_VAL) { /* binary operator */ if (looser(t1->tok, t3->tok)) { t4->val = eval_bop(&t3->place, t4->val, t3->tok, t2->val); token_destroy(t2); token_destroy(t3); tokenarray_remove(&tokens, num-2); tokenarray_remove(&tokens, num-3); continue; } break; } t5 = (num >= 5) ? tokenarray_get(&tokens, num-5) : NULL; t6 = (num >= 6) ? tokenarray_get(&tokens, num-6) : NULL; if (num >= 6 && t6->tok == T_VAL && t5->tok == T_QUES && t4->tok == T_VAL && t3->tok == T_COLON && t2->tok == T_VAL && !isop(t1->tok)) { /* conditional expression */ t6->val = t6->val ? t4->val : t2->val; token_destroy(t2); token_destroy(t3); token_destroy(t4); token_destroy(t5); tokenarray_remove(&tokens, num-2); tokenarray_remove(&tokens, num-3); tokenarray_remove(&tokens, num-4); tokenarray_remove(&tokens, num-5); continue; } if (num >= 2 && t2->tok == T_LPAREN && t1->tok == T_RPAREN) { complain(&t1->place, "Value expected within ()"); complain_fail(); t1->tok = T_VAL; t1->val = 0; token_destroy(t1); tokenarray_remove(&tokens, num-1); continue; } if (num >= 2 && t2->tok == T_VAL && t1->tok == T_VAL) { complain(&t1->place, "Operator expected"); complain_fail(); token_destroy(t1); tokenarray_remove(&tokens, num-1); continue; } if (num >= 2 && isop(t2->tok) && t1->tok == T_EOF) { complain(&t1->place, "Value expected after operator"); complain_fail(); token_destroy(t2); tokenarray_remove(&tokens, num-2); continue; } if (num == 2 && t2->tok == T_VAL && t1->tok == T_RPAREN) { complain(&t1->place, "Excess right parenthesis"); complain_fail(); token_destroy(t1); tokenarray_remove(&tokens, num-1); continue; } if (num == 3 && t3->tok == T_LPAREN && t2->tok == T_VAL && t1->tok == T_EOF) { complain(&t1->place, "Unclosed left parenthesis"); complain_fail(); token_destroy(t3); tokenarray_remove(&tokens, num-3); continue; } if (num == 2 && t2->tok == T_VAL && t1->tok == T_EOF) { /* accepting state */ break; } if (num >= 1 && t1->tok == T_EOF) { /* any other configuration at eof is an error */ complain(&t1->place, "Parse error"); complain_fail(); break; } /* otherwise, wait for more input */ break; } } static void token(struct place *p, enum tokens tok, int val) { struct token *t; t = token_create(p, tok, val); tokenarray_add(&tokens, t, NULL); tryreduce(); } static int wordval(struct place *p, char *word) { unsigned long val; char *t; if (word[0] >= '0' && word[0] <= '9') { errno = 0; val = strtoul(word, &t, 0); if (errno) { complain(p, "Invalid integer constant"); complain_fail(); return 0; } while (*t == 'U' || *t == 'L') { t++; } if (*t != '\0') { complain(p, "Trailing garbage after integer constant"); complain_fail(); return 0; } if (val > INT_MAX) { complain(p, "Integer constant too large"); complain_fail(); return INT_MAX; } return val; } /* if it's a symbol, warn and substitute 0. */ if (warns.undef) { complain(p, "Warning: value of undefined symbol %s is 0", word); if (mode.werror) { complain_fail(); } } debuglog(p, "Undefined symbol %s; substituting 0", word); return 0; } static bool check_word(struct place *p, char *expr, size_t pos, size_t *len_ret) { size_t len; int val; char tmp; if (!strchr(alnum, expr[pos])) { return false; } len = strspn(expr + pos, alnum); tmp = expr[pos + len]; expr[pos + len] = '\0'; val = wordval(p, expr + pos); expr[pos + len] = tmp; token(p, T_VAL, val); *len_ret = len; return true; } static bool check_tokens_2(struct place *p, char *expr, size_t pos) { unsigned i; for (i=0; i<num_tokens_2; i++) { if (expr[pos] == tokens_2[i].c1 && expr[pos+1] == tokens_2[i].c2) { token(p, tokens_2[i].tok, 0); return true; } } return false; } static bool check_tokens_1(struct place *p, char *expr, size_t pos) { unsigned i; for (i=0; i<num_tokens_1; i++) { if (expr[pos] == tokens_1[i].c1) { token(p, tokens_1[i].tok, 0); return true; } } return false; } static void tokenize(struct place *p, char *expr) { size_t pos, len; pos = 0; while (expr[pos] != '\0') { len = strspn(expr+pos, ws); pos += len; p->column += len; /* trailing whitespace is supposed to have been pruned */ assert(expr[pos] != '\0'); if (check_word(p, expr, pos, &len)) { pos += len; p->column += len; continue; } if (check_tokens_2(p, expr, pos)) { pos += 2; p->column += 2; continue; } if (check_tokens_1(p, expr, pos)) { pos++; p->column++; continue; } complain(p, "Invalid character %u in #if-expression", (unsigned char)expr[pos]); complain_fail(); pos++; p->column++; } token(p, T_EOF, 0); } bool eval(struct place *p, char *expr) { struct token *t1, *t2; unsigned num; bool result; #ifdef DEBUG fprintf(stderr, "eval: %s\n", expr); #endif debuglog(p, "eval: %s", expr); tokenarray_init(&tokens); tokenize(p, expr); result = false; num = tokenarray_num(&tokens); if (num == 2) { t1 = tokenarray_get(&tokens, num-1); t2 = tokenarray_get(&tokens, num-2); if (t2->tok == T_VAL && t1->tok == T_EOF) { result = t2->val != 0; } } tokenarray_destroyall(&tokens); tokenarray_cleanup(&tokens); return result; }