agent-orchestrator-benchmark/calculators/builder-adversary-lean/run-05/calc/lexer.py

import re

_NUMBER_RE = re.compile(r'\d+\.?\d*|\.\d+')

_SINGLE = {
    '+': 'PLUS',
    '-': 'MINUS',
    '*': 'STAR',
    '/': 'SLASH',
    '(': 'LPAREN',
    ')': 'RPAREN',
}


class LexError(Exception):
    pass


class Token:
    __slots__ = ('kind', 'value')

    def __init__(self, kind: str, value):
        self.kind = kind
        self.value = value

    def __repr__(self):
        return f'Token({self.kind}, {self.value!r})'

    def __eq__(self, other):
        return isinstance(other, Token) and self.kind == other.kind and self.value == other.value


def tokenize(src: str) -> list:
    tokens = []
    i = 0
    while i < len(src):
        ch = src[i]
        if ch in ' \t':
            i += 1
            continue
        if ch in _SINGLE:
            tokens.append(Token(_SINGLE[ch], ch))
            i += 1
            continue
        m = _NUMBER_RE.match(src, i)
        if m:
            raw = m.group()
            value = float(raw) if '.' in raw else int(raw)
            tokens.append(Token('NUMBER', value))
            i = m.end()
            continue
        raise LexError(f"unexpected character {ch!r} at position {i}")
    tokens.append(Token('EOF', None))
    return tokens