src/qmasm/assertions.py

###################################
# Parse an !assert directive      #
# By Scott Pakin <pakin@lanl.gov> #
###################################

import qmasm
import re
import sys

class AST(object):
    "Represent an abstract syntax tree."

    def __init__(self, qmasm_obj, type, value, kids=[]):
        self.qmasm = qmasm_obj
        self.type = type
        self.value = value
        self.kids = kids
        self.code = lambda isb: self.qmasm.abend("Internal error: Attempt to evaluate an AST without compiling it first")     # Function that evaluates the AST given a mapping from identifiers to bits
        self._str = None   # Memoized string representation
        self.pin_parser = qmasm.parse.PinParser()

    def _needs_parens(self):
        "Return True if an AST node should be parenthesized."
        return self.type == "factor" and self.kids[0].type == "conn"

    def _str_helper(self):
        "Do most of the work for the __str__ method."
        # Conditionally parenthesize all child strings.
        nkids = len(self.kids)
        kids_str = [str(k) for k in self.kids]
        for i in range(nkids):
            if self.kids[i]._needs_parens():
                kids_str[i] = "(" + kids_str[i] + ")"

        # Return ourself as a string.
        if nkids == 0:
            return str(self.value)
        if nkids == 1:
            if self.type == "unary" and self.value != "id":
                return "%s%s" % (self.value, kids_str[0])
            return kids_str[0]
        if nkids == 2:
            if self.value in ["*", "/", "%", "&", "<<", ">>", "**"]:
                return "%s%s%s" % (kids_str[0], self.value, kids_str[1])
            else:
                return "%s %s %s" % (kids_str[0], self.value, kids_str[1])
        if nkids == 3:
            if self.type == "if_expr":
                return "if %s then %s else %s endif" % (str(self.kids[0]), str(self.kids[1]), str(self.kids[2]))
        raise Exception("Internal error parsing (%s, %s)" % (repr(self.type), repr(self.value)))

    def __str__(self):
        if self._str == None:
            self._str = self._str_helper()
        return self._str

    def prefix_identifiers(self, prefix, next_prefix):
        "Prefix every identifier with a given string."
        if self.type == "ident":
            self.value = self.qmasm.apply_prefix(self.value, prefix, next_prefix)
        else:
            for k in self.kids:
                k.prefix_identifiers(prefix, next_prefix)

    def replace_ident(self, old_ident, new_ident):
        "Replace every occurrence of one identifer with another."
        if self.type == "ident":
            if self.value == old_ident:
                self.value = new_ident
        else:
            for k in self.kids:
                k.replace_ident(old_ident, new_ident)

    class EvaluationError(Exception):
        "Represent an exception thrown during AST evaluation."
        pass

    def _evaluate_ident(self, i2b):
        "Evaluate a variable, including array variables."
        val = 0
        for v in self.pin_parser.parse_lhs(self.value):
            try:
                bit = i2b[v]
                if bit == None:
                    raise self.EvaluationError("Unused variable %s" % v)
                val = val*2 + bit
            except KeyError:
                raise self.EvaluationError("Undefined variable %s" % v)
        return val

    def _compile_unary(self, kvals):
        "Compile a unary expression."
        if self.value == "-":
            return lambda i2b: -kvals[0](i2b)
        elif self.value == "~":
            return lambda i2b: ~kvals[0](i2b)
        elif self.value == "!":
            return lambda i2b: int(kvals[0](i2b) == 0)
        elif self.value in ["+", "id"]:
            return lambda i2b: kvals[0](i2b)
        else:
            raise self.EvaluationError('Internal error compiling unary "%s"' % self.value)

    def _evaluate_power(self, base, exp):
        "Raise one integer to the power of another."
        if exp < 0:
            raise self.EvaluationError("Negative powers (%d) are not allowed" % exp)
        return base**exp

    def _compile_arith(self, kvals):
        "Compile an arithmetic expression."
        if self.value == "+":
            return lambda i2b: kvals[0](i2b) + kvals[1](i2b)
        elif self.value == "-":
            return lambda i2b: kvals[0](i2b) - kvals[1](i2b)
        elif self.value == "*":
            return lambda i2b: kvals[0](i2b) * kvals[1](i2b)
        elif self.value == "/":
            return lambda i2b: kvals[0](i2b) // kvals[1](i2b)
        elif self.value == "%":
            return lambda i2b: kvals[0](i2b) % kvals[1](i2b)
        elif self.value == "&":
            return lambda i2b: kvals[0](i2b) & kvals[1](i2b)
        elif self.value == "|":
            return lambda i2b: kvals[0](i2b) | kvals[1](i2b)
        elif self.value == "^":
            return lambda i2b: kvals[0](i2b) ^ kvals[1](i2b)
        elif self.value == "<<":
            return lambda i2b: kvals[0](i2b) << kvals[1](i2b)
        elif self.value == ">>":
            return lambda i2b: kvals[0](i2b) >> kvals[1](i2b)
        elif self.value == "**":
            return lambda i2b: self._evaluate_power(kvals[0](i2b), kvals[1](i2b))
        else:
            raise self.EvaluationError("Internal error compiling arithmetic operator %s" % self.value)

    def _compile_rel(self, kvals):
        "Compile a relational expression."
        if self.value == "=":
            return lambda i2b: kvals[0](i2b) == kvals[1](i2b)
        elif self.value == "/=":
            return lambda i2b: kvals[0](i2b) != kvals[1](i2b)
        elif self.value == "<":
            return lambda i2b: kvals[0](i2b) < kvals[1](i2b)
        elif self.value == "<=":
            return lambda i2b: kvals[0](i2b) <= kvals[1](i2b)
        elif self.value == ">":
            return lambda i2b: kvals[0](i2b) > kvals[1](i2b)
        elif self.value == ">=":
            return lambda i2b: kvals[0](i2b) >= kvals[1](i2b)
        else:
            raise self.EvaluationError("Internal error compiling relational operator %s" % self.value)

    def _compile_conn(self, kvals):
        "Compile a logical connective."
        if self.value == "&&":
            return lambda i2b: kvals[0](i2b) and kvals[1](i2b)
        elif self.value == "||":
            return lambda i2b: kvals[0](i2b) or kvals[1](i2b)
        else:
            raise self.EvaluationError("Internal error compiling logical connective %s" % self.value)

    def _evaluate_if_expr(self, i2b, kvals):
        if kvals[0](i2b):
            return kvals[1](i2b)
        else:
            return kvals[2](i2b)

    def _compile_if_expr(self, kvals):
        "Compile an if...then...else expression."
        return lambda i2b: self._evaluate_if_expr(i2b, kvals)

    def _compile_node(self):

        """Compile the AST to a function that returns either True or False
        given a mapping from identifiers to bits."""
        kvals = [k._compile_node() for k in self.kids]
        if self.type == "ident":
            # Variable
            return lambda i2b: self._evaluate_ident(i2b)
        elif self.type == "int":
            # Constant
            return lambda i2b: self.value
        elif self.type == "unary":
            # Unary expression
            return self._compile_unary(kvals)
        elif len(kvals) == 1:
            # All other single-child nodes return their child unmodified.
            return kvals[0]
        elif self.type in ["power", "term", "expr"]:
            return self._compile_arith(kvals)
        elif self.type == "rel":
            return self._compile_rel(kvals)
        elif self.type == "conn":
            return self._compile_conn(kvals)
        elif self.type == "if_expr":
            return self._compile_if_expr(kvals)
        else:
            raise self.EvaluationError("Internal error compiling AST node of type %s, value %s" % (repr(self.type), repr(self.value)))

    def compile(self):
        "Compile an AST for faster evaluation."
        self.code = self._compile_node()

    def evaluate(self, i2b):
        "Evaluate the AST to a value, given a mapping from identifiers to bits."
        try:
            return self.code(i2b)
        except self.EvaluationError as e:
            self.qmasm.abend("%s in assertion %s" % (e, self))

class AssertParser(object):
    int_re = re.compile(r'\d+')
    conn_re = re.compile(r'\|\||&&')
    rel_re = re.compile(r'/?=|[<>]=?')
    arith_re = re.compile(r'[-+/%&\|^~!]|>>|<<|\*\*?')
    keyword_re = re.compile(r'\b(if|then|else|endif)\b')

    def __init__(self, qmasm):
        self.qmasm = qmasm

    class ParseError(Exception):
        pass

    def lex(self, s):
        "Split a string into tokens (tuples of type and value)."
        tokens = []
        s = s.lstrip()
        while len(s) > 0:
            # Match parentheses.
            if s[0] == "(":
                tokens.append(("lparen", "("))
                s = s[1:].lstrip()
                continue
            if s[0] == ")":
                tokens.append(("rparen", ")"))
                s = s[1:].lstrip()
                continue

            # Match keywords.
            mo = self.keyword_re.match(s)
            if mo != None:
                match = mo.group(0)
                tokens.append((match, match))
                s = s[len(match):].lstrip()
                continue

            # Match positive integers.
            mo = self.int_re.match(s)
            if mo != None:
                match = mo.group(0)
                tokens.append(("int", int(match)))
                s = s[len(match):].lstrip()
                continue

            # Match connectives.
            mo = self.conn_re.match(s)
            if mo != None:
                match = mo.group(0)
                tokens.append(("conn", match))
                s = s[len(match):].lstrip()
                continue

            # Match "<<" and ">>" before we match "<" and ">".
            if len(s) >= 2 and (s[:2] == "<<" or s[:2] == ">>"):
                tokens.append(("arith", s[:2]))
                s = s[2:].lstrip()
                continue

            # Match relational operators.
            mo = self.rel_re.match(s)
            if mo != None:
                match = mo.group(0)
                tokens.append(("rel", match))
                s = s[len(match):].lstrip()
                continue

            # Match "**" before we match "*".
            if len(s) >= 2 and s[:2] == "**":
                tokens.append(("power", s[:2]))
                s = s[2:].lstrip()
                continue

            # Match arithmetic operators.
            mo = self.arith_re.match(s)
            if mo != None:
                match = mo.group(0)
                tokens.append(("arith", match))
                s = s[len(match):].lstrip()
                continue

            # Everything else is an identifier.
            mo = self.qmasm.ident_re.match(s)
            if mo != None:
                match = mo.group(0)
                tokens.append(("ident", match))
                s = s[len(match):].lstrip()
                continue
            raise self.ParseError("Failed to parse %s" % s)
        tokens.append(("EOF", "EOF"))
        return tokens

    def advance(self):
        "Advance to the next symbol."
        self.tokidx += 1
        self.sym = self.tokens[self.tokidx]

    def accept(self, ty):
        """Advance to the next token if the current token matches a given
        token type and return True.  Otherwise, return False."""
        if self.sym[0] == ty:
            self.advance()
            return True
        return False

    def expect(self, ty):
        """Advance to the next token if the current token matches a given
        token.  Otherwise, fail."""
        if not self.accept(ty):
            raise self.ParseError("Expected %s but saw %s" % (ty, repr(self.sym[1])))

    def generic_operator(self, return_type, child_method, sym_type, valid_ops):
        "Match one or more somethings to produce something else."
        # Produce a list of ASTs representing children.
        c = child_method()
        ops = [self.sym[1]]
        asts = [c]
        while self.sym[0] == sym_type and ops[-1] in valid_ops:
            self.advance()
            c = child_method()
            ops.append(self.sym[1])
            asts.append(c)

        # Handle the trivial case of the identity operation.
        if len(asts) == 1:
            return AST(self.qmasm, return_type, None, asts)

        # Merge the ASTs in a left-associative fashion into a single AST.
        ops.pop()
        while len(asts) > 1:
            asts = [AST(self.qmasm, return_type, ops[0], [asts[0], asts[1]])] + asts[2:]
            ops.pop(0)
        return asts[0]

    def if_expr(self):
        "Return an if...then...else expression."
        self.expect("if")
        cond = self.conjunction()
        self.expect("then")
        then_expr = self.expression()
        self.expect("else")
        else_expr = self.expression()
        self.expect("endif")
        return AST(self.qmasm, "if_expr", None, [cond, then_expr, else_expr])

    def factor(self):
        "Return a factor (variable, integer, or expression)."
        val = self.sym[1]
        if self.accept("ident"):
            child = AST(self.qmasm, "ident", val)
        elif self.accept("int"):
            child = AST(self.qmasm, "int", val)
        elif self.accept("lparen"):
            child = self.disjunction()
            self.expect("rparen")
        elif self.sym[0] == "arith":
            child = self.unary()
        elif self.sym[0] == "if":
            child = self.if_expr()
        elif val == "EOF":
            raise self.ParseError("Parse error at end of expression")
        else:
            raise self.ParseError('Parse error at "%s"' % val)
        return AST(self.qmasm, "factor", None, [child])

    def power(self):
        "Return a factor or a factor raised to the power of a second factor."
        f1 = self.factor()
        op = self.sym[1]
        if self.sym[0] == "power" and op == "**":
            self.advance()
            f2 = self.power()
            return AST(self.qmasm, "power", op, [f1, f2])
        return AST(self.qmasm, "power", None, [f1])

    def unary(self):
        "Return a unary operator applied to a power."
        op = self.sym[1]
        if op in ["+", "-", "~", "!"]:
            self.advance()
        else:
            op = "id"
        return AST(self.qmasm, "unary", op, [self.power()])

    def term(self):
        "Return a term (product of one or more unaries)."
        return self.generic_operator("term", self.unary, "arith", ["*", "/", "%", "&", "<<", ">>"])

    def expression(self):
        "Return an expression (sum of one or more terms)."
        return self.generic_operator("expr", self.term, "arith", ["+", "-", "|", "^"])

    def comparison(self):
        "Return a comparison of exactly two expressions."
        e1 = self.expression()
        op = self.sym[1]
        if self.sym[0] != "rel":
            return AST(self.qmasm, "rel", None, [e1])
        self.advance()
        e2 = self.expression()
        return AST(self.qmasm, "rel", op, [e1, e2])

    def conjunction(self):
        "Return a conjunction (logical AND of one or more comparisons)."
        return self.generic_operator("conn", self.comparison, "conn", ["&&"])

    def disjunction(self):
        "Return a disjunction (logical OR of one or more conjunctions)."
        return self.generic_operator("conn", self.conjunction, "conn", ["||"])

    def parse(self, s):
        "Parse a relational expression into an AST"
        self.tokens = self.lex(s)
        self.tokidx = -1
        self.advance()
        try:
            ast = self.disjunction()
            if self.sym[0] != "EOF":
                raise self.ParseError('Parse error at "%s"' % self.sym[1])
        except self.ParseError as e:
            qmasm.abend('%s in "%s"' % (e, s))
        return ast