Add document rendering to harness

This makes it easier to debug pretty-printing, where I'm noticing some weirdness!
This commit is contained in:
John Doty 2024-09-13 16:45:54 -07:00
parent 9cdfda6ec5
commit 265f07fd5a
2 changed files with 107 additions and 26 deletions

View file

@ -85,6 +85,7 @@ class FineGrammar(Grammar):
indent(nl, mark(opt(self.class_body), field="body")),
nl,
self.RCURLY,
nl, # Extra newline at the end of the class
)
@rule("ClassBody")
@ -93,7 +94,7 @@ class FineGrammar(Grammar):
@rule
def _class_members(self) -> Rule:
return self._class_member | seq(self._class_members, self._class_member)
return self._class_member | seq(self._class_members, nl, self._class_member)
@rule
def _class_member(self) -> Rule:
@ -101,7 +102,7 @@ class FineGrammar(Grammar):
@rule("FieldDecl")
def field_declaration(self) -> Rule:
return group(self.IDENTIFIER, self.COLON, sp, self.type_expression, self.SEMICOLON) + nl
return group(self.IDENTIFIER, self.COLON, sp, self.type_expression, self.SEMICOLON)
# Types
@rule("TypeExpression")
@ -138,10 +139,14 @@ class FineGrammar(Grammar):
sp,
mark(self.IDENTIFIER, field="name", highlight=highlight.entity.name.function),
sp,
mark(self.function_parameters, field="parameters"),
mark(opt(sp, self.ARROW, sp, self.type_expression), field="return_type"),
group(
mark(self.function_parameters, field="parameters"),
mark(opt(sp, group(self.ARROW, sp, self.type_expression)), field="return_type"),
),
),
sp,
mark(self.block, field="body"),
nl,
)
@rule("ParamList")
@ -177,7 +182,7 @@ class FineGrammar(Grammar):
def block(self) -> Rule:
return alt(
group(self.LCURLY, nl, self.RCURLY),
seq(self.LCURLY, indent(br, self.block_body), br, self.RCURLY),
seq(self.LCURLY, indent(nl, self.block_body), nl, self.RCURLY),
)
@rule("BlockBody")
@ -185,7 +190,7 @@ class FineGrammar(Grammar):
return alt(
self.expression,
self._statement_list,
seq(self._statement_list, br, self.expression),
seq(self._statement_list, nl, self.expression),
)
@rule
@ -338,15 +343,17 @@ class FineGrammar(Grammar):
@rule
def match_expression(self) -> Rule:
return group(group(self.MATCH, sp, self.expression), sp, self.match_body)
@rule("MatchBody")
def match_body(self) -> Rule:
return alt(
group(self.LCURLY, nl, self.RCURLY),
group(self.LCURLY, indent(nl, self._match_arms), nl, self.RCURLY),
return group(
group(self.MATCH, sp, self.expression, sp, self.LCURLY),
indent(sp, self.match_arms),
sp,
self.RCURLY,
)
@rule("MatchArms")
def match_arms(self) -> Rule:
    # Rule registered under the name "MatchArms"; it only forwards to the
    # private `_match_arms` rule.
    return self._match_arms
@rule
def _match_arms(self) -> Rule:
return (
@ -381,7 +388,7 @@ class FineGrammar(Grammar):
@rule
def object_constructor_expression(self) -> Rule:
return group(self.NEW, sp, self.type_identifier, self.field_list)
return group(self.NEW, sp, self.type_identifier, sp, self.field_list)
@rule
def field_list(self) -> Rule:

View file

@ -18,6 +18,7 @@ import typing
import parser
from parser import runtime
from parser import wadler
# from parser import Token, Grammar, rule, seq
@ -191,10 +192,28 @@ class DynamicLexerModule(DynamicModule[typing.Callable[[str], runtime.TokenStrea
return get_tokens
class DynamicPrinterModule(DynamicModule[wadler.Printer]):
    """Dynamic module whose value is a `wadler.Printer`.

    A candidate member is accepted when the base-class predicate accepts it
    and it has a truthy `build_table` attribute. The accepted member is
    called with no arguments and the result is wrapped in `wadler.Printer`.
    """

    def __init__(self, file_name, member_name):
        super().__init__(file_name, member_name)

    def _predicate(self, member) -> bool:
        # The base-class check runs first; `build_table` is only inspected
        # when that check passes.
        return bool(super()._predicate(member) and getattr(member, "build_table", None))

    def _transform(self, value):
        grammar = value()
        return wadler.Printer(grammar)
class DisplayMode(enum.Enum):
    """The view the harness is currently showing."""

    TREE = 0  # presumably the parse-tree view ("(t)ree" in the status line)
    ERRORS = 1  # presumably the error list ("(e)rrors" in the status line)
    LOG = 2  # selected with "l"; shows the captured log lines
    DOCUMENT = 3  # selected with "d"; shows the pretty-printer document dump
class ListHandler(logging.Handler):
@ -224,6 +243,7 @@ class Harness:
source: str | None
table: parser.ParseTable | None
tree: runtime.Tree | None
document: wadler.Document
mode: DisplayMode
log_handler: ListHandler
@ -252,6 +272,7 @@ class Harness:
self.table = None
self.tokens = None
self.tree = None
self.document = None
self.errors = []
self.state_count = 0
@ -267,6 +288,7 @@ class Harness:
)
self.lexer_module = DynamicLexerModule(self.lexer_file, self.grammar_member)
self.printer_module = DynamicPrinterModule(self.grammar_file, self.grammar_member)
self.log_handler = ListHandler()
logging.basicConfig(level=logging.INFO, handlers=[self.log_handler])
@ -287,6 +309,9 @@ class Harness:
elif k == "l":
self.mode = DisplayMode.LOG
self.lines = None
elif k == "d":
self.mode = DisplayMode.DOCUMENT
self.lines = None
elif k == "j":
self.line_start = self.line_start - 1
elif k == "k":
@ -301,6 +326,9 @@ class Harness:
def load_grammar(self) -> parser.ParseTable:
    """Return the parse table supplied by `self.grammar_module.get()`."""
    return self.grammar_module.get()
def load_printer(self) -> wadler.Printer:
    """Return the printer supplied by `self.printer_module.get()`."""
    return self.printer_module.get()
def update(self):
global VERSION
@ -337,6 +365,12 @@ class Harness:
self.average_entries = sum(len(row) for row in states) / len(states)
self.max_entries = max(len(row) for row in states)
printer = self.load_printer()
if self.tree is not None:
self.document = printer.convert_tree_to_document(self.tree)
else:
self.document = None
except Exception as e:
self.tree = None
self.errors = ["Error loading grammar:"] + [
@ -410,10 +444,14 @@ class Harness:
has_errors = "*" if self.errors else " "
has_tree = "*" if self.tree else " "
has_log = " " if self.log_handler.logs else " "
has_log = "*" if self.log_handler.logs else " "
has_document = "*" if self.document else " "
goto_cursor(0, rows - 1)
print(("\u2500" * cols) + "\r")
print(f"(e)rrors{has_errors} | (t)ree{has_tree} | (l)og{has_log} | (q)uit\r", end="")
print(
f"(e)rrors{has_errors} | (t)ree{has_tree} | (l)og{has_log} | (d)ocument{has_document} | (q)uit\r",
end="",
)
sys.stdout.flush()
sys.stdout.buffer.flush()
@ -433,6 +471,10 @@ class Harness:
case DisplayMode.LOG:
lines.extend(line for line in self.log_handler.logs)
case DisplayMode.DOCUMENT:
if self.document is not None:
self.format_document(lines, self.document)
case _:
typing.assert_never(self.mode)
@ -459,18 +501,50 @@ class Harness:
return lines
def format_node(self, lines, node: runtime.Tree | runtime.TokenValue, indent=0):
def format_node(self, lines, node: runtime.Tree):
"""Print out an indented concrete syntax tree, from parse()."""
match node:
case runtime.Tree(name=name, start=start, end=end, children=children):
lines.append((" " * indent) + f"{name or '???'} [{start}, {end})")
for child in children:
self.format_node(lines, child, indent + 2)
lines.extend(node.format_lines(self.source))
case runtime.TokenValue(kind=kind, start=start, end=end):
assert self.source is not None
value = self.source[start:end]
lines.append((" " * indent) + f"{kind}:'{value}' [{start}, {end})")
def format_document(self, lines: list[str], doc: wadler.Document, indent: int = 0):
def append(x: str):
lines.append((" " * indent) + x)
match doc:
case wadler.NewLine(replace):
append(f"newline {repr(replace)}")
case wadler.ForceBreak():
append(f"forced break")
case wadler.Indent():
append(f"indent {doc.amount}")
self.format_document(lines, doc.doc, indent + 1)
case wadler.Text(start, end):
if self.source is not None:
append(f"< {self.source[start:end]}")
else:
append(f"< ??? {start}:{end}")
case wadler.Literal(text):
append(f"' {text}")
case wadler.Group():
append("group")
self.format_document(lines, doc.child, indent + 1)
case wadler.Lazy():
self.format_document(lines, doc.resolve(), indent)
case wadler.Cons():
self.format_document(lines, doc.left, indent)
self.format_document(lines, doc.right, indent)
case None:
pass
case _:
typing.assert_never(doc)
def main(args: list[str]):