jcmorrow · January 31, 2019 22:30
diff --git a/lisp_parser.py b/lisp_parser.py
 import re
 import click


 class Tokenizer:
    """Split a string of Lisp source into ``(kind, text)`` token tuples.

    ``TOKENS`` is an ordered list of ``(regex, kind)`` pairs. At every step the
    first pattern that matches at the start of the remaining code wins.
    """

    TOKENS = [
        (r"\(", "list_start"),
        (r"\)", "list_end"),
        # ``A-Z`` rather than ``A-z``: the latter range also spans the
        # punctuation between "Z" and "a" and would accept e.g. "a[b".
        (r"\b[a-zA-Z]+\b", "atom"),
        (r"\b[0-9]+\b", "integer"),
        # The trailing ``\B`` rejects an operator glued to a word character
        # (for example "+1").
        (r"\B[/+*-]\B", "operator"),
    ]

    def __init__(self, code):
        """Store ``code`` with leading and trailing whitespace removed."""
        self.code = code.strip()

    def run(self):
        """Tokenize the stored code.

        Returns:
            A list of ``(kind, text)`` tuples in source order.

        Raises:
            Exception: if no pattern in ``TOKENS`` matches the remaining code.
        """
        remaining = self.code
        tokens = []

        while remaining:
            (token, match) = self.next_token_from_code(remaining)
            if match is None:
                raise Exception("Unexpected Token: {}".format(remaining))
            tokens.append((token[1], match.group()))
            # Whitespace only separates tokens, so drop it before continuing.
            remaining = remaining[match.end():].strip()

        return tokens

    def next_token_from_code(self, code):
        """Return ``(token, match)`` for the first pattern matching at the start of ``code``.

        ``token`` is the matching ``(regex, kind)`` entry of ``TOKENS``; both
        elements are ``None`` when nothing matches.
        """
        for token in self.TOKENS:
            # ``re`` caches compiled patterns, so no explicit compile per call.
            match = re.match(token[0], code)
            if match:
                return (token, match)
        return (None, None)


 class Parser:
    """Turn a flat list of ``(kind, text)`` tokens into a nested-list AST.

    ``integer`` tokens become ``int`` values, ``atom`` and ``operator`` tokens
    stay strings, and every ``list_start`` ... ``list_end`` group becomes a
    nested Python list.
    """

    def __init__(self, tokens):
        self.tokens = tokens

    def run(self):
        """Parse ``self.tokens`` and return the top-level list of AST nodes.

        Raises:
            Exception: on an unterminated list, or on a ``list_end`` that has
                no matching ``list_start``.
        """
        (nodes, _) = self._parse_sequence(self.tokens or [], 0, False)
        return nodes

    def parse_inner_list(self, tokens):
        """Parse the contents of a list whose ``list_start`` was already consumed.

        Returns:
            ``(nodes, rest)`` where ``nodes`` is the parsed list and ``rest``
            holds the tokens following the closing ``list_end``.

        Raises:
            Exception: if ``tokens`` ends before the closing ``list_end``.
        """
        (nodes, position) = self._parse_sequence(tokens or [], 0, True)
        return (nodes, tokens[position:])

    def _parse_sequence(self, tokens, position, inside_list):
        """Parse nodes from ``tokens`` starting at ``position`` in one pass.

        Stops at the ``list_end`` closing the current list when ``inside_list``
        is true, otherwise at the end of ``tokens``. Returns
        ``(nodes, position)`` where ``position`` indexes the first token that
        was not consumed.
        """
        nodes = []
        total = len(tokens)
        while position < total:
            token = tokens[position]
            position += 1
            kind = token[0]
            if kind == "list_start":
                (child, position) = self._parse_sequence(tokens, position, True)
                nodes.append(child)
            elif kind == "list_end":
                if not inside_list:
                    # A closer with no opener used to be dropped silently.
                    raise Exception("Unexpected List End")
                return (nodes, position)
            elif kind == "integer":
                nodes.append(int(token[1]))
            elif kind in ("atom", "operator"):
                nodes.append(token[1])
            # Any other token kind is skipped.
        if inside_list:
            raise Exception("Unterminated List")
        return (nodes, position)


 def parse(code):
    """Tokenize ``code`` and parse the resulting tokens into a nested-list AST."""
    tokens = Tokenizer(code).run()
    return Parser(tokens).run()
  

 @click.command()
 @click.option('--code', default="", help='A line of lisp')
 def cli_parse(code):
    # Command-line entry point: parse the --code option and print the AST.
    # Documented with comments because click would show a docstring as the
    # command's help text.
    ast = parse(code)
    print(ast)


 # Run the command-line interface only when executed as a script, not on import.
 if __name__ == "__main__":
    cli_parse()
	import re
	import click


	class Tokenizer:
	    """Split a string of Lisp source into ``(kind, text)`` token tuples.

	    ``TOKENS`` is an ordered list of ``(regex, kind)`` pairs. At every step the
	    first pattern that matches at the start of the remaining code wins.
	    """

	    TOKENS = [
	        (r"\(", "list_start"),
	        (r"\)", "list_end"),
	        # ``A-Z`` rather than ``A-z``: the latter range also spans the
	        # punctuation between "Z" and "a" and would accept e.g. "a[b".
	        (r"\b[a-zA-Z]+\b", "atom"),
	        (r"\b[0-9]+\b", "integer"),
	        # The trailing ``\B`` rejects an operator glued to a word character
	        # (for example "+1").
	        (r"\B[/+*-]\B", "operator"),
	    ]

	    def __init__(self, code):
	        """Store ``code`` with leading and trailing whitespace removed."""
	        self.code = code.strip()

	    def run(self):
	        """Tokenize the stored code.

	        Returns:
	            A list of ``(kind, text)`` tuples in source order.

	        Raises:
	            Exception: if no pattern in ``TOKENS`` matches the remaining code.
	        """
	        remaining = self.code
	        tokens = []

	        while remaining:
	            (token, match) = self.next_token_from_code(remaining)
	            if match is None:
	                raise Exception("Unexpected Token: {}".format(remaining))
	            tokens.append((token[1], match.group()))
	            # Whitespace only separates tokens, so drop it before continuing.
	            remaining = remaining[match.end():].strip()

	        return tokens

	    def next_token_from_code(self, code):
	        """Return ``(token, match)`` for the first pattern matching at the start of ``code``.

	        ``token`` is the matching ``(regex, kind)`` entry of ``TOKENS``; both
	        elements are ``None`` when nothing matches.
	        """
	        for token in self.TOKENS:
	            # ``re`` caches compiled patterns, so no explicit compile per call.
	            match = re.match(token[0], code)
	            if match:
	                return (token, match)
	        return (None, None)


	class Parser:
	    """Turn a flat list of ``(kind, text)`` tokens into a nested-list AST.

	    ``integer`` tokens become ``int`` values, ``atom`` and ``operator`` tokens
	    stay strings, and every ``list_start`` ... ``list_end`` group becomes a
	    nested Python list.
	    """

	    def __init__(self, tokens):
	        self.tokens = tokens

	    def run(self):
	        """Parse ``self.tokens`` and return the top-level list of AST nodes.

	        Raises:
	            Exception: on an unterminated list, or on a ``list_end`` that has
	                no matching ``list_start``.
	        """
	        (nodes, _) = self._parse_sequence(self.tokens or [], 0, False)
	        return nodes

	    def parse_inner_list(self, tokens):
	        """Parse the contents of a list whose ``list_start`` was already consumed.

	        Returns:
	            ``(nodes, rest)`` where ``nodes`` is the parsed list and ``rest``
	            holds the tokens following the closing ``list_end``.

	        Raises:
	            Exception: if ``tokens`` ends before the closing ``list_end``.
	        """
	        (nodes, position) = self._parse_sequence(tokens or [], 0, True)
	        return (nodes, tokens[position:])

	    def _parse_sequence(self, tokens, position, inside_list):
	        """Parse nodes from ``tokens`` starting at ``position`` in one pass.

	        Stops at the ``list_end`` closing the current list when ``inside_list``
	        is true, otherwise at the end of ``tokens``. Returns
	        ``(nodes, position)`` where ``position`` indexes the first token that
	        was not consumed.
	        """
	        nodes = []
	        total = len(tokens)
	        while position < total:
	            token = tokens[position]
	            position += 1
	            kind = token[0]
	            if kind == "list_start":
	                (child, position) = self._parse_sequence(tokens, position, True)
	                nodes.append(child)
	            elif kind == "list_end":
	                if not inside_list:
	                    # A closer with no opener used to be dropped silently.
	                    raise Exception("Unexpected List End")
	                return (nodes, position)
	            elif kind == "integer":
	                nodes.append(int(token[1]))
	            elif kind in ("atom", "operator"):
	                nodes.append(token[1])
	            # Any other token kind is skipped.
	        if inside_list:
	            raise Exception("Unterminated List")
	        return (nodes, position)


	def parse(code):
	    """Tokenize ``code`` and parse the resulting tokens into a nested-list AST."""
	    return Parser(Tokenizer(code).run()).run()


	@click.command()
	@click.option('--code', default="", help='A line of lisp')
	def cli_parse(code):
	    # Command-line entry point: parse the --code option and print the AST.
	    # Documented with comments because click would show a docstring as the
	    # command's help text.
	    print(parse(code))


	# Run the command-line interface only when executed as a script, not on import.
	if __name__ == "__main__":
	    cli_parse()