This is not really AQA, I just put it here

calaldees · calaldees · commit 684cb47c53c0 · 2025-12-04T08:52:42.000Z
This is an attempt at an interpreter from the book "Crafting Interpriters".
I'm just a copy monkey that is stepping through the book like a chimpo
Pretty cool though! I have a working scanner and expression parser! and it parses! .. holy shit!
diff --git a/teachprogramming/static/language_reference/languages/aqa/AQA.py b/teachprogramming/static/language_reference/languages/aqa/AQA.py
@@ -0,0 +1,353 @@
+import enum
+from typing import NamedTuple, Self, Callable
+from collections.abc import Sequence,  MutableSequence, Mapping
+from functools import cached_property
+from pprint import pprint as pp
+import functools
+import logging
+
+
+log = logging.getLogger(__name__)
+
+# https://filestore.aqa.org.uk/resources/computing/AQA-8525-NG-PC.PDF
+
+# https://www.geeksforgeeks.org/compiler-design/recursive-descent-parser/
+# https://craftinginterpreters.com/parsing-expressions.html
+
+
+
+
+class TokenType(enum.StrEnum):
+    IDENTIFIER = enum.auto()
+    STRING = enum.auto()
+    NUMBER = enum.auto()
+    EOF = enum.auto()
+
+    BANG_EQUAL = '!='
+    EQUAL_EQUAL = '=='
+    LESS_EQUAL = '<='
+    GREATER_EQUAL = '>='
+
+    LEFT_PAREN = '('
+    RIGHT_PAREN = ')'
+    LEFT_BRACE = '{'
+    RIGHT_BRACE = '}'
+    COMMA = ','
+    DOT = '.'
+    MINUS = '-'
+    PLUS = '+'
+    SEMICOLON = ';'
+    STAR = '*'
+    BANG = '!'
+    GREATER = '>'
+    LESS = '<'
+    EQUAL = '='
+    SLASH = '/'
+
+    AND = enum.auto()
+    CLASS = enum.auto()
+    ELSE = enum.auto()
+    FALSE = enum.auto()
+    FOR = enum.auto()
+    IF = enum.auto()
+    NIL = enum.auto()
+    OR = enum.auto()
+    PRINT = enum.auto()
+    RETURN = enum.auto()
+    SUPER = enum.auto()
+    THIS = enum.auto()
+    TRUE = enum.auto()
+    VAR = enum.auto()
+    WHILE = enum.auto()
+
+# ------------------------------------------------------------------------------
+
+class TextLocation(NamedTuple):
+    line: int
+    col: int
+    def __str__(self) -> str:
+        return f'Line: {self.line} Col: {self.col}'
+class Token(NamedTuple):
+    location: TextLocation
+    lexeme: str
+    type: TokenType
+    literal: str
+class TokenError(NamedTuple):
+    location: TextLocation
+    message: str
+class MutableTextLocation():
+    line: int = 0
+    col: int = 0
+    @property
+    def immutable(self) -> TextLocation:
+        return TextLocation(self.line, self.col)
+    def newLine(self):
+        self.line += 1
+        self.col = 0
+
+type wasConsumed = bool | None
+TokenHandler = Callable[['Scanner'], wasConsumed]
+
+class Scanner():
+    def __init__(self, source: str, token_handlers: Sequence[TokenHandler]):
+        assert source
+        assert token_handlers
+        self.source = source
+        self.token_handlers = token_handlers
+        self.location = MutableTextLocation()
+        self.index_start: int = 0
+        self.index_current: int = 0
+        self._tokens: MutableSequence[Token] = []
+        self._errors: MutableSequence[TokenError] = []
+    @property
+    def isAtEnd(self) -> bool:
+        return self.index_current >= len(self.source)
+    def advance(self, inc=1) -> None:
+        self.index_current += inc
+        self.location.col += inc
+    def match(self, expected: str) -> bool:
+        if expected != self.peek(len(expected)): return False
+        self.advance(len(expected))
+        return True
+    def peek(self, offset:int=1) -> str:
+        return self.source[self.index_current : min(self.index_current+offset, len(self.source))]
+    def addToken(self, type: TokenType, literal: str = '') -> None:
+        self._tokens.append(Token(
+            location=self.location.immutable,
+            lexeme=self.source[self.index_start:self.index_current],
+            type=type,
+            literal=literal
+        ))
+    @cached_property
+    def tokens(self) -> Sequence[Token]:
+        while not self.isAtEnd:
+            self.index_start = self.index_current
+            if not any(token_handler(self) for token_handler in self.token_handlers):
+                self._errors.append(TokenError(self.location.immutable, f"Unexpected character {self.peek()}"))
+        self.addToken(TokenType.EOF, '')
+        return self._tokens
+
+
+
+
+def white_space(s: Scanner) -> wasConsumed:
+    return any((s.match(i) for i in (' ', '\t', '\r')))
+
+def new_line(s: Scanner) -> wasConsumed:
+    if s.match('\n'):
+        s.location.newLine()
+        return True
+
+def comment(s: Scanner) -> wasConsumed:
+    if s.match('#'):
+        while (s.peek() not in ('\n', '')):
+            s.advance()
+
+def string(s: Scanner) -> wasConsumed:
+    if s.match('"'):
+        while s.peek() != '"' and not s.isAtEnd:
+            s.advance()
+            if s.peek() == '\n': s.location.newLine()
+        s.advance()
+        if s.isAtEnd:
+            s._errors.append(TokenError(s.location.immutable, 'Unterminated string'))
+        s.addToken(TokenType.STRING, s.source[s.index_start+1:s.index_current-1])
+
+def number(s: Scanner) -> wasConsumed:
+    if s.peek().isdigit():
+        while s.peek().isdigit(): s.advance()
+        peek = s.peek(2)
+        if len(peek)==2 and peek[0] == '.' and peek[1].isdigit():
+            s.advance()  # consume the '.'
+            while s.peek().isdigit(): s.advance()
+        s.addToken(TokenType.NUMBER, s.source[s.index_start:s.index_current])
+
+KEYWORDS = frozenset((
+    TokenType.AND,
+    TokenType.CLASS,
+    TokenType.ELSE,
+    TokenType.FALSE,
+    TokenType.FOR,
+    TokenType.IF,
+    TokenType.NIL,
+    TokenType.OR,
+    TokenType.PRINT,
+    TokenType.RETURN,
+    TokenType.SUPER,
+    TokenType.THIS,
+    TokenType.TRUE,
+    TokenType.VAR,
+    TokenType.WHILE,
+))
+
+def identifier(s: Scanner) -> wasConsumed:
+    if s.peek().isalpha():
+        while s.peek().isalnum(): s.advance()
+        text = s.source[s.index_start:s.index_current]
+        s.addToken(TokenType(text) if text in KEYWORDS else TokenType.IDENTIFIER, text)
+
+def createDefaultTokenHandlerFor(t: str) -> TokenHandler:
+    def _t(s: Scanner) -> wasConsumed:
+        if s.match(t):
+            s.addToken(TokenType(t), t)
+            return True
+    return _t
+
+DEFAULT_TOKEN_HANDLERS: Sequence[TokenHandler] = (
+    white_space,
+    new_line,
+    comment,
+    string,
+    number,
+    identifier,
+    *map(createDefaultTokenHandlerFor, ('!=', '==', '<=', '>=', '(', ')', '{', '}', ',', '.', '-', '+', ';', '*', '!', '>', '<', '=', '/'))
+)
+
+
+def test_scanner():
+    tokens = Scanner('thing = ("test" + 1.23) # This is a comment', DEFAULT_TOKEN_HANDLERS).tokens
+    token_types = tuple(t.type for t in tokens)
+    assert token_types == (
+        TokenType.IDENTIFIER,
+        TokenType.EQUAL,
+        TokenType.LEFT_PAREN,
+        TokenType.STRING,
+        TokenType.PLUS,
+        TokenType.NUMBER,
+        TokenType.RIGHT_PAREN,
+        TokenType.EOF,
+    )
+
+
+# ------------------------------------------------------------------------------
+
+import abc
+
+class Expr(abc.ABC):
+    pass
+class Literal(Expr):
+    def __init__(self, literal: str|bool|None|int|float):
+        self.literal = literal
+    def __str__(self) -> str:
+        return str(self.literal)
+class Unary(Expr):
+    def __init__(self, operator: Token, expression: Expr):
+        self.operator = operator
+        self.expression = expression
+    def __str__(self) -> str:
+        return f'{self.operator.type.value}{self.expression}'
+class Binary(Expr):
+    def __init__(self, expression1: Expr, operator: Token, expression2: Expr):
+        self.expression1 = expression1
+        self.operator = operator
+        self.expression2 = expression2
+    def __str__(self) -> str:
+        return ''.join(map(str, (self.expression1, self.operator.type.value, self.expression2)))
+class Grouping(Expr):
+    def __init__(self, expression: Expr):
+        self.expression = expression
+    def __str__(self) -> str:
+        return f'({self.expression})'
+
+
+class Parser():
+    class ParseError(BaseException): ...
+
+    def __init__(self, tokens: Sequence[Token]):
+        self.tokens = tokens
+        self.index_current: int = 0
+
+    @property
+    def parse(self) -> Expr | None:
+        try:
+            return self.expression()
+        except self.ParseError as pe:
+            return None
+
+    @property
+    def peek(self) -> Token:
+        return self.tokens[self.index_current]
+    @property
+    def previous(self) -> Token:
+        return self.tokens[self.index_current - 1]
+    @property
+    def advance(self) -> Token:
+        if not self.isAtEnd: self.index_current += 1
+        return self.previous
+    @property
+    def isAtEnd(self) -> bool:
+        return self.peek.type == TokenType.EOF
+    def check(self, type: TokenType) -> bool:
+        if self.isAtEnd: return False
+        return self.peek.type == type
+    def match(self, *types: TokenType) -> Token | None:
+        for t in types:
+            if self.check(t):
+                return self.advance
+    def consume(self, type: TokenType, error_message: str) -> Token:
+        if self.check(type): return self.advance
+        raise self.error(self.peek, error_message)
+
+    def error(self, token: Token, error_message: str) -> 'Parser.ParseError':
+        log.error(f'{token.location} - {token.lexeme} - {error_message}')
+        return self.ParseError()
+    def synchronize(self) -> None:
+        # humm ... sure this can be python-ed and simplified
+        self.advance
+        while not self.isAtEnd:
+            if self.previous.type == TokenType.SEMICOLON: return
+            match self.peek.type:
+                case (TokenType.CLASS, TokenType.VAR, TokenType.FOR, TokenType.IF, TokenType.WHILE, TokenType.PRINT, TokenType.RETURN):
+                    return
+            self.advance
+    """
+    expression     → equality ;
+    equality       → comparison ( ( "!=" | "==" ) comparison )* ;
+    comparison     → term ( ( ">" | ">=" | "<" | "<=" ) term )* ;
+    term           → factor ( ( "-" | "+" ) factor )* ;
+    factor         → unary ( ( "/" | "*" ) unary )* ;
+    unary          → ( "!" | "-" ) unary | primary ;
+    primary        → NUMBER | STRING | "true" | "false" | "nil" | "(" expression ")" ;
+    """
+    def expression(self) -> Expr:
+        return self.equality()
+    def equality(self) -> Expr:
+        expr = self.comparison()
+        while operator := self.match(TokenType.BANG_EQUAL, TokenType.EQUAL_EQUAL):
+            expr = Binary(expr, operator, self.comparison())
+        return expr
+    def comparison(self) -> Expr:
+        expr = self.term()
+        while operator := self.match(TokenType.GREATER, TokenType.GREATER_EQUAL, TokenType.LESS, TokenType.LESS_EQUAL):
+            expr = Binary(expr, operator, self.term())
+        return expr
+    def term(self) -> Expr:
+        expr = self.factor()
+        while operator := self.match(TokenType.MINUS, TokenType.PLUS):
+            expr = Binary(expr, operator, self.factor())
+        return expr
+    def factor(self) -> Expr:
+        expr = self.unary()
+        while operator := self.match(TokenType.SLASH, TokenType.STAR):
+            expr = Binary(expr, operator, self.unary())
+        return expr
+    def unary(self) -> Expr:
+        if operator := self.match(TokenType.BANG, TokenType.MINUS):
+            return Unary(operator, self.unary())
+        return self.primary()
+    def primary(self) -> Expr:
+        if self.match(TokenType.FALSE): return Literal(False)
+        if self.match(TokenType.TRUE): return Literal(True)
+        if self.match(TokenType.NIL): return Literal(None)
+        if token := self.match(TokenType.NUMBER, TokenType.STRING): return Literal(token.literal)
+        if self.match(TokenType.LEFT_PAREN):
+            expr = self.expression()
+            self.consume(TokenType.RIGHT_PAREN, "Expect ')' after expression.")
+            return Grouping(expr)
+        raise self.error(self.peek, "Expect expression.")
+
+
+def test_parser():
+    tokens = Scanner('12.3 * (45 - "test") >= !10', DEFAULT_TOKEN_HANDLERS).tokens
+    expr = Parser(tokens).parse
+    assert False