Edit

IABSD.fr/src/libexec/tradcpp/eval.c

Branch :

  • Show log

    Commit

  • Author : jsg
    Date : 2019-08-23 04:38:55
    Hash : 88157d21
    Message : update tradcpp to 0.5.3

  • libexec/tradcpp/eval.c
  • /*-
     * Copyright (c) 2010 The NetBSD Foundation, Inc.
     * All rights reserved.
     *
     * This code is derived from software contributed to The NetBSD Foundation
     * by David A. Holland.
     *
     * Redistribution and use in source and binary forms, with or without
     * modification, are permitted provided that the following conditions
     * are met:
     * 1. Redistributions of source code must retain the above copyright
     *    notice, this list of conditions and the following disclaimer.
     * 2. Redistributions in binary form must reproduce the above copyright
     *    notice, this list of conditions and the following disclaimer in the
     *    documentation and/or other materials provided with the distribution.
     *
     * THIS SOFTWARE IS PROVIDED BY THE NETBSD FOUNDATION, INC. AND CONTRIBUTORS
     * ``AS IS'' AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED
     * TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR
     * PURPOSE ARE DISCLAIMED.  IN NO EVENT SHALL THE FOUNDATION OR CONTRIBUTORS
     * BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
     * CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
     * SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS
     * INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN
     * CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE)
     * ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE
     * POSSIBILITY OF SUCH DAMAGE.
     */
    
    #include <stdlib.h>
    #include <string.h>
    #include <limits.h>
    #include <errno.h>
    
    //#define DEBUG
    #ifdef DEBUG
    #include <stdio.h>
    #endif
    
    #include "utils.h"
    #include "array.h"
    #include "mode.h"
    #include "place.h"
    #include "eval.h"
    
    /*
     * e ::=
     *    e1 ? e2 : e3
     *    e1 || e2
     *    e1 && e2
     *    e1 | e2
     *    e1 ^ e2
     *    e1 & e2
     *    e1 == e2  |  e1 != e2
     *    e1 < e2   |  e1 <= e2  |  e1 > e2  |  e1 >= e2
     *    e1 << e2  |  e1 >> e2
     *    e1 + e2   |  e1 - e2
     *    e1 * e2   |  e1 / e2   |  e1 % e2
     *    !e  |  ~e  |  -e  |  +e
     *    ( e )  |  ident
     */
    
    enum tokens {
    	T_EOF,		/* end of input */
    	T_VAL,		/* value */
    	T_LPAREN,	/* parens */
    	T_RPAREN,
    	T_PIPEPIPE,	/* operators */
    	T_AMPAMP,
    	T_EQEQ,
    	T_BANGEQ,
    	T_LTEQ,
    	T_GTEQ,
    	T_LTLT,
    	T_GTGT,
    	T_QUES,
    	T_COLON,
    	T_PIPE,
    	T_CARET,
    	T_AMP,
    	T_LT,
    	T_GT,
    	T_PLUS,
    	T_MINUS,
    	T_STAR,
    	T_SLASH,
    	T_PCT,
    	T_BANG,
    	T_TILDE,
    };
    
    static const struct {
    	char c1, c2;
    	enum tokens tok;
    } tokens_2[] = {
    	{ '|', '|', T_PIPEPIPE },
    	{ '&', '&', T_AMPAMP },
    	{ '=', '=', T_EQEQ },
    	{ '!', '=', T_BANGEQ },
    	{ '<', '=', T_LTEQ },
    	{ '>', '=', T_GTEQ },
    	{ '<', '<', T_LTLT },
    	{ '>', '>', T_GTGT },
    };
    static const unsigned num_tokens_2 = HOWMANY(tokens_2);
    
    static const struct {
    	char c1;
    	enum tokens tok;
    } tokens_1[] = {
    	{ '?', T_QUES },
    	{ ':', T_COLON },
    	{ '|', T_PIPE },
    	{ '^', T_CARET },
    	{ '&', T_AMP },
    	{ '<', T_LT },
    	{ '>', T_GT },
    	{ '+', T_PLUS },
    	{ '-', T_MINUS },
    	{ '*', T_STAR },
    	{ '/', T_SLASH },
    	{ '%', T_PCT },
    	{ '!', T_BANG },
    	{ '~', T_TILDE },
    	{ '(', T_LPAREN },
    	{ ')', T_RPAREN },
    };
    static const unsigned num_tokens_1 = HOWMANY(tokens_1);
    
    struct token {
    	struct place place;
    	enum tokens tok;
    	int val;
    };
    DECLARRAY(token, static UNUSED);
    DEFARRAY(token, static);
    
    static struct tokenarray tokens;
    
    static
    struct token *
    token_create(const struct place *p, enum tokens tok, int val)
    {
    	struct token *t;
    
    	t = domalloc(sizeof(*t));
    	t->place = *p;
    	t->tok = tok;
    	t->val = val;
    	return t;
    }
    
    static
    void
    token_destroy(struct token *t)
    {
    	dofree(t, sizeof(*t));
    }
    
    DESTROYALL_ARRAY(token, );
    
    #ifdef DEBUG
    static
    void
    printtokens(void)
    {
    	unsigned i, num;
    	struct token *t;
    
    	fprintf(stderr, "tokens:");
    	num = tokenarray_num(&tokens);
    	for (i=0; i<num; i++) {
    		t = tokenarray_get(&tokens, i);
    		switch (t->tok) {
    		    case T_EOF: fprintf(stderr, " <eof>"); break;
    		    case T_VAL: fprintf(stderr, " %d", t->val); break;
    		    case T_LPAREN: fprintf(stderr, " ("); break;
    		    case T_RPAREN: fprintf(stderr, " )"); break;
    		    case T_PIPEPIPE: fprintf(stderr, " ||"); break;
    		    case T_AMPAMP: fprintf(stderr, " &&"); break;
    		    case T_EQEQ: fprintf(stderr, " =="); break;
    		    case T_BANGEQ: fprintf(stderr, " !="); break;
    		    case T_LTEQ: fprintf(stderr, " <="); break;
    		    case T_GTEQ: fprintf(stderr, " >="); break;
    		    case T_LTLT: fprintf(stderr, " <<"); break;
    		    case T_GTGT: fprintf(stderr, " >>"); break;
    		    case T_QUES: fprintf(stderr, " ?"); break;
    		    case T_COLON: fprintf(stderr, " :"); break;
    		    case T_PIPE: fprintf(stderr, " |"); break;
    		    case T_CARET: fprintf(stderr, " ^"); break;
    		    case T_AMP: fprintf(stderr, " &"); break;
    		    case T_LT: fprintf(stderr, " <"); break;
    		    case T_GT: fprintf(stderr, " >"); break;
    		    case T_PLUS: fprintf(stderr, " +"); break;
    		    case T_MINUS: fprintf(stderr, " -"); break;
    		    case T_STAR: fprintf(stderr, " *"); break;
    		    case T_SLASH: fprintf(stderr, " /"); break;
    		    case T_PCT: fprintf(stderr, " %%"); break;
    		    case T_BANG: fprintf(stderr, " !"); break;
    		    case T_TILDE: fprintf(stderr, " ~"); break;
    		}
    	}
    	fprintf(stderr, "\n");
    }
    #endif
    
    static
    bool
    isuop(enum tokens tok)
    {
    	switch (tok) {
    	    case T_BANG:
    	    case T_TILDE:
    	    case T_MINUS:
    	    case T_PLUS:
    		return true;
    	    default:
    		break;
    	}
    	return false;
    }
    
    static
    bool
    isbop(enum tokens tok)
    {
    	switch (tok) {
    	    case T_EOF:
    	    case T_VAL:
    	    case T_LPAREN:
    	    case T_RPAREN:
    	    case T_COLON:
    	    case T_QUES:
    	    case T_BANG:
    	    case T_TILDE:
    		return false;
    	    default:
    		break;
    	}
    	return true;
    }
    
    static
    bool
    isop(enum tokens tok)
    {
    	switch (tok) {
    	    case T_EOF:
    	    case T_VAL:
    	    case T_LPAREN:
    	    case T_RPAREN:
    		return false;
    	    default:
    		break;
    	}
    	return true;
    }
    
    static
    int
    getprec(enum tokens tok)
    {
    	switch (tok) {
    	    case T_BANG: case T_TILDE: return -1;
    	    case T_STAR: case T_SLASH: case T_PCT: return 0;
    	    case T_PLUS: case T_MINUS: return 1;
    	    case T_LTLT: case T_GTGT: return 2;
    	    case T_LT: case T_LTEQ: case T_GT: case T_GTEQ: return 3;
    	    case T_EQEQ: case T_BANGEQ: return 4;
    	    case T_AMP: return 5;
    	    case T_CARET: return 6;
    	    case T_PIPE: return 7;
    	    case T_AMPAMP: return 8;
    	    case T_PIPEPIPE: return 9;
    	    default: break;
    	}
    	return 10;
    }
    
    static
    bool
    looser(enum tokens t1, enum tokens t2)
    {
    	return getprec(t1) >= getprec(t2);
    }
    
    static
    int
    eval_uop(enum tokens op, int val)
    {
    	switch (op) {
    	    case T_BANG: val = !val; break;
    	    case T_TILDE: val = (int)~(unsigned)val; break;
    	    case T_MINUS: val = -val; break;
    	    case T_PLUS: break;
    	    default: assert(0); break;
    	}
    	return val;
    }
    
    static
    int
    eval_bop(struct place *p, int lv, enum tokens op, int rv)
    {
    	unsigned mask;
    
    	switch (op) {
    	    case T_PIPEPIPE: return lv || rv;
    	    case T_AMPAMP:   return lv && rv;
    	    case T_PIPE:     return (int)((unsigned)lv | (unsigned)rv);
    	    case T_CARET:    return (int)((unsigned)lv ^ (unsigned)rv);
    	    case T_AMP:      return (int)((unsigned)lv & (unsigned)rv);
    	    case T_EQEQ:     return lv == rv;
    	    case T_BANGEQ:   return lv != rv;
    	    case T_LT:       return lv < rv;
    	    case T_GT:       return lv > rv;
    	    case T_LTEQ:     return lv <= rv;
    	    case T_GTEQ:     return lv >= rv;
    
    	    case T_LTLT:
    	    case T_GTGT:
    		if (rv < 0) {
    			complain(p, "Negative bit-shift");
    			complain_fail();
    			rv = 0;
    		}
    		if ((unsigned)rv >= CHAR_BIT * sizeof(unsigned)) {
    			complain(p, "Bit-shift farther than type width");
    			complain_fail();
    			rv = 0;
    		}
    		if (op == T_LTLT) {
    			return (int)((unsigned)lv << (unsigned)rv);
    		}
    		mask = ((unsigned)-1) << (CHAR_BIT * sizeof(unsigned) - rv);
    		lv = (int)(((unsigned)lv >> (unsigned)rv) | mask);
    		return lv;
    
    	    case T_MINUS:
    		if (rv == INT_MIN) {
    			if (lv == INT_MIN) {
    				return 0;
    			}
    			lv--;
    			rv++;
    		}
    		rv = -rv;
    		/* FALLTHROUGH */
    	    case T_PLUS:
    		if (rv > 0 && lv > (INT_MAX - rv)) {
    			complain(p, "Integer overflow");
    			complain_fail();
    			return INT_MAX;
    		}
    		if (rv < 0 && lv < (INT_MIN - rv)) {
    			complain(p, "Integer underflow");
    			complain_fail();
    			return INT_MIN;
    		}
    		return lv + rv;
    
    	    case T_STAR:
    		if (rv == 0) {
    			return 0;
    		}
    		if (rv == 1) {
    			return lv;
    		}
    		if (rv == -1 && lv == INT_MIN) {
    			lv++;
    			lv = -lv;
    			if (lv == INT_MAX) {
    				complain(p, "Integer overflow");
    				complain_fail();
    				return INT_MAX;
    			}
    			lv++;
    			return lv;
    		}
    		if (lv == INT_MIN && rv < 0) {
    			complain(p, "Integer overflow");
    			complain_fail();
    			return INT_MAX;
    		}
    		if (lv == INT_MIN && rv > 0) {
    			complain(p, "Integer underflow");
    			complain_fail();
    			return INT_MIN;
    		}
    		if (rv < 0) {
    			rv = -rv;
    			lv = -lv;
    		}
    		if (lv > 0 && lv > INT_MAX / rv) {
    			complain(p, "Integer overflow");
    			complain_fail();
    			return INT_MAX;
    		}
    		if (lv < 0 && lv < INT_MIN / rv) {
    			complain(p, "Integer underflow");
    			complain_fail();
    			return INT_MIN;
    		}
    		return lv * rv;
    
    	    case T_SLASH:
    		if (rv == 0) {
    			complain(p, "Division by zero");
    			complain_fail();
    			return 0;
    		}
    		return lv / rv;
    
    	    case T_PCT:
    		if (rv == 0) {
    			complain(p, "Modulus by zero");
    			complain_fail();
    			return 0;
    		}
    		return lv % rv;
    
    	    default: assert(0); break;
    	}
    	return 0;
    }
    
    static
    void
    tryreduce(void)
    {
    	unsigned num;
    	struct token *t1, *t2, *t3, *t4, *t5, *t6;
    
    	while (1) {
    #ifdef DEBUG
    		printtokens();
    #endif
    		num = tokenarray_num(&tokens);
    		t1 = (num >= 1) ? tokenarray_get(&tokens, num-1) : NULL;
    		t2 = (num >= 2) ? tokenarray_get(&tokens, num-2) : NULL;
    		t3 = (num >= 3) ? tokenarray_get(&tokens, num-3) : NULL;
    
    		if (num >= 3 &&
    		    t3->tok == T_LPAREN &&
    		    t2->tok == T_VAL &&
    		    t1->tok == T_RPAREN) {
    			/* (x) -> x */
    			t2->place = t3->place;
    			token_destroy(t1);
    			token_destroy(t3);
    			tokenarray_remove(&tokens, num-1);
    			tokenarray_remove(&tokens, num-3);
    			continue;
    		}
    
    		if (num >= 2 &&
    		    (num == 2 || isop(t3->tok) || t3->tok == T_LPAREN) &&
    		    isuop(t2->tok) &&
    		    t1->tok == T_VAL) {
    			/* unary operator */
    			t1->val = eval_uop(t2->tok, t1->val);
    			t1->place = t2->place;
    			token_destroy(t2);
    			tokenarray_remove(&tokens, num-2);
    			continue;
    		}
    		if (num >= 2 &&
    		    (num == 2 || isop(t3->tok) || t3->tok == T_LPAREN) &&
    		    t2->tok != T_LPAREN && t2->tok != T_VAL &&
    		    t1->tok == T_VAL) {
    			complain(&t2->place, "Invalid unary operator");
    			complain_fail();
    			token_destroy(t2);
    			tokenarray_remove(&tokens, num-2);
    			continue;
    		}
    
    			
    		t4 = (num >= 4) ? tokenarray_get(&tokens, num-4) : NULL;
    
    		if (num >= 4 &&
    		    t4->tok == T_VAL &&
    		    isbop(t3->tok) &&
    		    t2->tok == T_VAL) {
    			/* binary operator */
    			if (looser(t1->tok, t3->tok)) {
    				t4->val = eval_bop(&t3->place,
    						   t4->val, t3->tok, t2->val);
    				token_destroy(t2);
    				token_destroy(t3);
    				tokenarray_remove(&tokens, num-2);
    				tokenarray_remove(&tokens, num-3);
    				continue;
    			}
    			break;
    		}
    
    		t5 = (num >= 5) ? tokenarray_get(&tokens, num-5) : NULL;
    		t6 = (num >= 6) ? tokenarray_get(&tokens, num-6) : NULL;
    
    		if (num >= 6 &&
    		    t6->tok == T_VAL &&
    		    t5->tok == T_QUES &&
    		    t4->tok == T_VAL &&
    		    t3->tok == T_COLON &&
    		    t2->tok == T_VAL &&
    		    !isop(t1->tok)) {
    			/* conditional expression */
    			t6->val = t6->val ? t4->val : t2->val;
    			token_destroy(t2);
    			token_destroy(t3);
    			token_destroy(t4);
    			token_destroy(t5);
    			tokenarray_remove(&tokens, num-2);
    			tokenarray_remove(&tokens, num-3);
    			tokenarray_remove(&tokens, num-4);
    			tokenarray_remove(&tokens, num-5);
    			continue;
    		}
    
    		if (num >= 2 &&
    		    t2->tok == T_LPAREN &&
    		    t1->tok == T_RPAREN) {
    			complain(&t1->place, "Value expected within ()");
    			complain_fail();
    			t1->tok = T_VAL;
    			t1->val = 0;
    			token_destroy(t1);
    			tokenarray_remove(&tokens, num-1);
    			continue;
    		}
    
    		if (num >= 2 &&
    		    t2->tok == T_VAL &&
    		    t1->tok == T_VAL) {
    			complain(&t1->place, "Operator expected");
    			complain_fail();
    			token_destroy(t1);
    			tokenarray_remove(&tokens, num-1);
    			continue;
    		}
    
    		if (num >= 2 &&
    		    isop(t2->tok) &&
    		    t1->tok == T_EOF) {
    			complain(&t1->place, "Value expected after operator");
    			complain_fail();
    			token_destroy(t2);
    			tokenarray_remove(&tokens, num-2);
    			continue;
    		}
    
    		if (num == 2 &&
    		    t2->tok == T_VAL &&
    		    t1->tok == T_RPAREN) {
    			complain(&t1->place, "Excess right parenthesis");
    			complain_fail();
    			token_destroy(t1);
    			tokenarray_remove(&tokens, num-1);
    			continue;
    		}
    
    		if (num == 3 &&
    		    t3->tok == T_LPAREN &&
    		    t2->tok == T_VAL &&
    		    t1->tok == T_EOF) {
    			complain(&t1->place, "Unclosed left parenthesis");
    			complain_fail();
    			token_destroy(t3);
    			tokenarray_remove(&tokens, num-3);
    			continue;
    		}
    
    		if (num == 2 &&
    		    t2->tok == T_VAL &&
    		    t1->tok == T_EOF) {
    			/* accepting state */
    			break;
    		}
    
    		if (num >= 1 &&
    		    t1->tok == T_EOF) {
    			/* any other configuration at eof is an error */
    			complain(&t1->place, "Parse error");
    			complain_fail();
    			break;
    		}
    
    		/* otherwise, wait for more input */
    		break;
    	}
    }
    
    static
    void
    token(struct place *p, enum tokens tok, int val)
    {
    	struct token *t;
    
    	t = token_create(p, tok, val);
    
    	tokenarray_add(&tokens, t, NULL);
    	tryreduce();
    }
    
    static
    int
    wordval(struct place *p, char *word)
    {
    	unsigned long val;
    	char *t;
    
    	if (word[0] >= '0' && word[0] <= '9') {
    		errno = 0;
    		val = strtoul(word, &t, 0);
    		if (errno) {
    			complain(p, "Invalid integer constant");
    			complain_fail();
    			return 0;
    		}
    		while (*t == 'U' || *t == 'L') {
    			t++;
    		}
    		if (*t != '\0') {
    			complain(p, "Trailing garbage after integer constant");
    			complain_fail();
    			return 0;
    		}
    		if (val > INT_MAX) {
    			complain(p, "Integer constant too large");
    			complain_fail();
    			return INT_MAX;
    		}
    		return val;
    	}
    
    	/* if it's a symbol, warn and substitute 0. */
    	if (warns.undef) {
    		complain(p, "Warning: value of undefined symbol %s is 0",
    			 word);
    		if (mode.werror) {
    			complain_fail();
    		}
    	}
    	debuglog(p, "Undefined symbol %s; substituting 0", word);
    	return 0;
    }
    
    static
    bool
    check_word(struct place *p, char *expr, size_t pos, size_t *len_ret)
    {
    	size_t len;
    	int val;
    	char tmp;
    
    	if (!strchr(alnum, expr[pos])) {
    		return false;
    	}
    	len = strspn(expr + pos, alnum);
    	tmp = expr[pos + len];
    	expr[pos + len] = '\0';
    	val = wordval(p, expr + pos);
    	expr[pos + len] = tmp;
    	token(p, T_VAL, val);
    	*len_ret = len;
    	return true;
    }
    
    static
    bool
    check_tokens_2(struct place *p, char *expr, size_t pos)
    {
    	unsigned i;
    
    	for (i=0; i<num_tokens_2; i++) {
    		if (expr[pos] == tokens_2[i].c1 &&
    		    expr[pos+1] == tokens_2[i].c2) {
    			token(p, tokens_2[i].tok, 0);
    			return true;
    		}
    	}
    	return false;
    }
    
    static
    bool
    check_tokens_1(struct place *p, char *expr, size_t pos)
    {
    	unsigned i;
    
    	for (i=0; i<num_tokens_1; i++) {
    		if (expr[pos] == tokens_1[i].c1) {
    			token(p, tokens_1[i].tok, 0);
    			return true;
    		}
    	}
    	return false;
    }
    
    static
    void
    tokenize(struct place *p, char *expr)
    {
    	size_t pos, len;
    
    	pos = 0;
    	while (expr[pos] != '\0') {
    		len = strspn(expr+pos, ws);
    		pos += len;
    		place_addcolumns(p, len);
    		/* trailing whitespace is supposed to have been pruned */
    		assert(expr[pos] != '\0');
    		if (check_word(p, expr, pos, &len)) {
    			pos += len;
    			place_addcolumns(p, len);
    			continue;
    		}
    		if (check_tokens_2(p, expr, pos)) {
    			pos += 2;
    			place_addcolumns(p, 2);
    			continue;
    		}
    		if (check_tokens_1(p, expr, pos)) {
    			pos++;
    			place_addcolumns(p, 1);
    			continue;
    		}
    		complain(p, "Invalid character %u in #if-expression",
    			 (unsigned char)expr[pos]);
    		complain_fail();
    		pos++;
    		place_addcolumns(p, 1);
    	}
    	token(p, T_EOF, 0);
    }
    
    bool
    eval(struct place *p, char *expr)
    {
    	struct token *t1, *t2;
    	unsigned num;
    	bool result;
    
    #ifdef DEBUG
    	fprintf(stderr, "eval: %s\n", expr);
    #endif
    	debuglog(p, "eval: %s", expr);
    
    	tokenarray_init(&tokens);
    	tokenize(p, expr);
    
    	result = false;
    	num = tokenarray_num(&tokens);
    	if (num == 2) {
    		t1 = tokenarray_get(&tokens, num-1);
    		t2 = tokenarray_get(&tokens, num-2);
    		if (t2->tok == T_VAL &&
    		    t1->tok == T_EOF) {
    			result = t2->val != 0;
    		}
    	}
    
    	tokenarray_destroyall(&tokens);
    	tokenarray_cleanup(&tokens);
    	return result;
    }