Files
agent-orchestrator-benchmark/calculators/builder-adversary-lean/run-05/calc/lexer.py

55 lines
1.2 KiB
Python

import re
_NUMBER_RE = re.compile(r'\d+\.?\d*|\.\d+')
_SINGLE = {
'+': 'PLUS',
'-': 'MINUS',
'*': 'STAR',
'/': 'SLASH',
'(': 'LPAREN',
')': 'RPAREN',
}
class LexError(Exception):
pass
class Token:
__slots__ = ('kind', 'value')
def __init__(self, kind: str, value):
self.kind = kind
self.value = value
def __repr__(self):
return f'Token({self.kind}, {self.value!r})'
def __eq__(self, other):
return isinstance(other, Token) and self.kind == other.kind and self.value == other.value
def tokenize(src: str) -> list:
tokens = []
i = 0
while i < len(src):
ch = src[i]
if ch in ' \t':
i += 1
continue
if ch in _SINGLE:
tokens.append(Token(_SINGLE[ch], ch))
i += 1
continue
m = _NUMBER_RE.match(src, i)
if m:
raw = m.group()
value = float(raw) if '.' in raw else int(raw)
tokens.append(Token('NUMBER', value))
i = m.end()
continue
raise LexError(f"unexpected character {ch!r} at position {i}")
tokens.append(Token('EOF', None))
return tokens