Tokenizer functional, fragile parsing
This commit is contained in:
@@ -0,0 +1,51 @@
|
||||
import re
|
||||
from typing import Any
|
||||
import lisp
|
||||
import atom
|
||||
|
||||
|
||||
class Reader:
|
||||
tokens: list[str|Any]
|
||||
|
||||
def __init__(self):
|
||||
self.tokens = []
|
||||
self.interpreter = lisp.Lisp()
|
||||
|
||||
def tokenize(self, expression: str):
|
||||
self.tokens += re.findall(r"""[\s,]*[;.*]*([()']|"(?:\\.|[^\\"])*"?|[^\s()'",;]*)""", expression)
|
||||
while self.peek() != "":
|
||||
self.read_expression()
|
||||
self.consume()
|
||||
|
||||
def peek(self):
|
||||
return self.tokens[0]
|
||||
|
||||
def consume(self):
|
||||
token = self.tokens[0]
|
||||
self.tokens = self.tokens[1:]
|
||||
return token
|
||||
|
||||
def read_expression(self) -> atom.Atom | None:
|
||||
if len(self.tokens) == 0:
|
||||
return None
|
||||
if self.peek() == "(":
|
||||
self.consume()
|
||||
return self.read_list()
|
||||
else:
|
||||
return self.read_atom()
|
||||
|
||||
def read_list(self):
|
||||
token = self.peek()
|
||||
last = atom.Atom(None, None)
|
||||
first = last
|
||||
while token != ")":
|
||||
last.setval(self.read_expression())
|
||||
last.append(atom.Atom(None, None))
|
||||
last = last.cdr
|
||||
token = self.peek()
|
||||
self.consume()
|
||||
return first
|
||||
|
||||
def read_atom(self) -> atom.Atom:
|
||||
print(self.peek())
|
||||
return atom.Atom(self.consume(), None)
|
||||
Reference in New Issue
Block a user