Last active
April 13, 2023 02:34
-
-
Save oliver-ni/f2e99c847b367a89ea4905b44b4c93c3 to your computer and use it in GitHub Desktop.
Formats Scheme source code
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
import argparse | |
import sys | |
from dataclasses import dataclass | |
from typing import Callable, List, TypeVar, Union | |
T = TypeVar("T")


class SExpr(List[T]):
    """A list of elements that prints as a parenthesised S-expression.

    ``BEGIN`` and ``END`` are the opening and closing delimiter strings for
    this kind of list.
    """

    BEGIN = "("
    END = ")"

    def __init__(self, *args, **kwargs):
        # Plain pass-through to the list constructor.
        super().__init__(*args, **kwargs)

    def __str__(self) -> str:
        """Return the elements rendered with ``str`` and separated by one space."""
        rendered = " ".join(str(item) for item in self)
        return "(" + rendered + ")"
class QuotedSExpr(SExpr):
    """An S-expression opened with a quote, i.e. ``'(`` instead of ``(``."""

    BEGIN = "'("

    def __str__(self) -> str:
        """Return the parent class's rendering prefixed with a single quote."""
        unquoted = super().__str__()
        return "'" + unquoted
class TaggedExpr:
    """A token or list expression tagged with its span in the source text.

    Attributes:
        inner: The wrapped value: either a token string or a list of
            nested ``TaggedExpr`` objects.
        start_pos: The ``start`` value passed to the constructor.
        end_pos: The ``end`` value passed to the constructor.

    Truthiness and equality are delegated to ``inner``, so an instance can
    be compared directly against a token string such as ``")"`` or ``""``.
    """

    # The annotation is a string so it is not evaluated when the class is
    # defined (it refers to SExpr and to this class itself).
    def __init__(self, expr: "Union[str, SExpr[TaggedExpr]]", start: int, end: int):
        self.inner = expr
        self.start_pos = start
        self.end_pos = end

    def __repr__(self) -> str:
        """Return a constructor-style representation for error messages."""
        return (
            f"{type(self).__name__}"
            f"({self.inner!r}, {self.start_pos!r}, {self.end_pos!r})"
        )

    def __bool__(self) -> bool:
        """Return the truthiness of the wrapped value.

        Both an empty token string and an empty list are falsy, so
        truthiness alone cannot tell the two apart.
        """
        return bool(self.inner)

    def __eq__(self, value: object) -> bool:
        """Compare the wrapped value (not the span) against ``value``."""
        return self.inner == value

    # Defining __eq__ already makes instances unhashable; state it explicitly.
    __hash__ = None  # type: ignore[assignment]
@dataclass
class FormatOptions:
    """Settings that control how the formatter lays out its output."""

    # String emitted once per indentation level at the start of a
    # continuation line.
    # NOTE(review): the command-line entry point builds this from an indent
    # size that defaults to 2, while this default is a single space - confirm
    # which is intended.
    indent_seq: str = " "
class ParserFormatter:
    """Parse Scheme source into tagged S-expressions and re-emit it formatted.

    The parser is a hand-written cursor over ``code``. Tokens are split only
    on whitespace and on the delimiters in ``DELIMETERS``; there is no
    special handling of string literals or ``;`` comments.

    The formatter keeps the author's line breaks: two sibling elements are
    separated by a newline plus indentation if the original text between
    them contained a newline, otherwise by a single space.
    """

    # Spelling kept as-is because the name is part of the class interface.
    DELIMETERS = SExpr.BEGIN, QuotedSExpr.BEGIN, SExpr.END

    def __init__(self, code: str, options: Union[FormatOptions, None] = None):
        """Store the source text and formatting options.

        Args:
            code: The source text to parse.
            options: Formatting options. A fresh ``FormatOptions()`` is
                created per instance when omitted, so parsers never share
                one mutable default object.
        """
        self.code = code
        self.options = FormatOptions() if options is None else options
        self.pos = 0

    def cursor(self, length: int = 1):
        """Return up to ``length`` characters at the current position.

        The result is shorter than ``length`` (possibly empty) near the end
        of the input.
        """
        return self.code[self.pos : self.pos + length]

    def take(self, t: str):
        """Consume ``t`` if the input continues with it.

        Returns:
            ``t`` when it was consumed, otherwise ``None``.
        """
        if self.code.startswith(t, self.pos):
            self.pos += len(t)
            return t
        return None

    def take_until(self, f: Callable[[str], bool]):
        """Consume characters until ``f(current_char)`` is true or input ends.

        Returns:
            The consumed text (may be empty).
        """
        start_pos = self.pos
        while self.cursor() and not f(self.cursor()):
            self.pos += 1
        return self.code[start_pos : self.pos]

    def take_whitespace(self):
        """Consume and return any run of whitespace at the cursor."""
        return self.take_until(lambda s: not s.isspace())

    def take_token(self):
        """Consume and return the next token.

        A token is either one of the delimiters or a maximal run of
        characters that are neither whitespace nor the start of a delimiter.
        Returns ``""`` at end of input.
        """
        for delimiter in self.DELIMETERS:
            if self.take(delimiter):
                return delimiter
        return self.take_until(
            lambda s: s.isspace() or self.code.startswith(self.DELIMETERS, self.pos)
        )

    def parse_expr(self):
        """Parse one expression starting at the cursor.

        Returns:
            A ``TaggedExpr`` wrapping either a token string (``""`` at end of
            input, ``")"`` for a closing delimiter) or a list expression.

        Raises:
            ValueError: If the input ends before a list is closed.
        """
        self.take_whitespace()
        start_pos = self.pos
        t = self.take_token()

        if t == SExpr.BEGIN:
            expr = SExpr()
        elif t == QuotedSExpr.BEGIN:
            expr = QuotedSExpr()
        else:
            return TaggedExpr(t, start_pos, self.pos)

        while True:
            elem = self.parse_expr()
            # Only a *token* can terminate the list: "" means end of input
            # and expr.END closes it. Testing truthiness here would also
            # stop on an empty nested list such as `()` or `'()`, which is
            # falsy but is a perfectly valid element.
            if isinstance(elem.inner, str) and elem.inner in ("", expr.END):
                break
            expr.append(elem)

        if elem.inner != expr.END:
            raise ValueError(f"Expected ')', found {elem.inner!r}")
        return TaggedExpr(expr, start_pos, self.pos)

    def parse(self):
        """Yield top-level expressions until the input is exhausted."""
        while True:
            expr = self.parse_expr()
            # An empty token string marks end of input.
            if isinstance(expr.inner, str) and expr.inner == "":
                return
            yield expr

    def _fmt_expr(self, expr: TaggedExpr, indent: int):
        """Yield the output fragments for ``expr``.

        Args:
            expr: The expression to render.
            indent: Number of ``indent_seq`` repetitions used when one of
                this expression's elements starts on a new line.
        """
        if isinstance(expr.inner, str):
            yield expr.inner
            return

        yield expr.inner.BEGIN

        if expr.inner:
            yield from self._fmt_expr(expr.inner[0], indent=indent + 1)

        for prev, elem in zip(expr.inner, expr.inner[1:]):
            # Keep a line break wherever the original source had one between
            # these two siblings; otherwise join them with a single space.
            if "\n" in self.code[prev.end_pos : elem.start_pos]:
                yield "\n"
                yield self.options.indent_seq * indent
            else:
                yield " "
            yield from self._fmt_expr(elem, indent=indent + 1)

        yield expr.inner.END

    def fmt_expr(self, expr: TaggedExpr):
        """Return ``expr`` formatted as a single string."""
        return "".join(self._fmt_expr(expr, 1))

    def fmt(self):
        """Yield the formatted text of each top-level expression in turn."""
        for expr in self.parse():
            yield self.fmt_expr(expr)
if __name__ == "__main__":
    # Command-line entry point: format each given file in place (or write to
    # stdout when the input is stdin) and print a summary to stderr.

    # ANSI escape sequences used to style the status messages.
    BOLD = "\033[1m"
    RESET = "\033[0m"
    BLUE = "\033[94m"

    parser = argparse.ArgumentParser(
        prog="scheme-fmt", description="Formats scheme code"
    )
    parser.add_argument("--indent-with", choices=["tabs", "spaces"], default="spaces")
    parser.add_argument("--indent-size", type=int, default=2)
    parser.add_argument("files", nargs="+", type=argparse.FileType("r+"))
    args = parser.parse_args()

    indent_seq = "\t" if args.indent_with == "tabs" else " " * args.indent_size
    options = FormatOptions(indent_seq=indent_seq)

    # Start by assuming every file gets reformatted; decrement per unchanged file.
    num_fmt = len(args.files)

    try:
        for f in args.files:
            code = f.read()
            pf = ParserFormatter(code, options=options)
            result = "\n\n".join(pf.fmt()) + "\n"

            if f is sys.stdin:
                sys.stdout.write(result)
            elif code != result:
                # Overwrite in place, then drop any leftover tail of the old text.
                f.seek(0)
                f.write(result)
                f.truncate()
            f.close()

            if code == result:
                num_fmt -= 1
            else:
                print(f"{BOLD}reformatted {f.name}{RESET}", file=sys.stderr)
    finally:
        # argparse opened every file up front; make sure none stays open if
        # parsing one of them raises. Closing an already-closed file is a no-op.
        for handle in args.files:
            handle.close()

    if num_fmt > 0:
        print(file=sys.stderr)

    print(f"{BOLD}All done!{RESET} ✨ 🍰 ✨", file=sys.stderr)

    def file(n: int):
        """Return "file" for exactly one, "files" otherwise."""
        return "file" if n == 1 else "files"

    num_nofmt = len(args.files) - num_fmt

    fmt_text = f"{BOLD}{BLUE}{num_fmt}{RESET}{BOLD} {file(num_fmt)} reformatted{RESET}"
    nofmt_text = f"{BLUE}{num_nofmt}{RESET} {file(num_nofmt)} left unchanged"

    if num_fmt == 0 and num_nofmt == 0:
        # Defensive only: nargs="+" makes argparse reject an empty file list.
        print(f"{BOLD}No files given{RESET}.", file=sys.stderr)
    elif num_fmt == 0:
        print(nofmt_text, file=sys.stderr)
    elif num_nofmt == 0:
        print(fmt_text, file=sys.stderr)
    else:
        print(f"{fmt_text}, {nofmt_text}.", file=sys.stderr)
Sign up for free
to join this conversation on GitHub.
Already have an account?
Sign in to comment