2020-04-22 19:29:27 -03:00
|
|
|
#!/usr/bin/env python3.8
|
|
|
|
|
|
|
|
"""pegen -- PEG Generator.

Search the web for PEG Parsers for reference.
"""
|
|
|
|
|
|
|
|
import argparse
|
|
|
|
import sys
|
|
|
|
import time
|
|
|
|
import token
|
|
|
|
import traceback
|
|
|
|
|
|
|
|
|
|
|
|
# Command-line interface for the ``pegen`` tool.  ``main()`` reads the parsed
# options from this module-level parser.
argparser = argparse.ArgumentParser(
    prog="pegen", description="Experimental PEG-like parser generator"
)
argparser.add_argument("-q", "--quiet", action="store_true", help="Don't print the parsed grammar")
# -v may be repeated; the resulting count selects how much debug output is shown.
argparser.add_argument(
    "-v",
    "--verbose",
    action="count",
    default=0,
    help="Print timing stats; repeat for more debug output",
)
argparser.add_argument(
    "-c", "--cpython", action="store_true", help="Generate C code for inclusion into CPython"
)
argparser.add_argument(
    "--compile-extension",
    action="store_true",
    help="Compile generated C code into an extension module",
)
# No default is set here, so args.output is None when -o is omitted.
argparser.add_argument(
    "-o",
    "--output",
    metavar="OUT",
    help="Where to write the generated parser (default parse.py or parse.c)",
)
argparser.add_argument("filename", help="Grammar description")
argparser.add_argument(
    "--optimized", action="store_true", help="Compile the extension in optimized mode"
)
argparser.add_argument(
    "--skip-actions", action="store_true", help="Suppress code emission for rule actions",
)
|
|
|
|
|
|
|
|
|
|
|
|
def main() -> None:
    """Run the pegen command line: build a parser from a grammar and report on it.

    Parses the command line with the module-level ``argparser``, calls
    ``build_parser_and_generator`` and then, depending on ``-q`` / ``-v``,
    prints the grammar, the first graph and its SCCs, and timing and cache
    statistics.

    If building fails and ``-v`` was not given, the exception is printed
    without a traceback and the process exits with status 1.  With ``-v``
    the exception propagates so the full traceback is shown.
    """
    # NOTE(review): these imports are local to main(); presumably so the
    # Python version check under ``__main__`` can run before any pegen code
    # is imported -- confirm.
    from pegen.build import build_parser_and_generator
    from pegen.testutil import print_memstats

    args = argparser.parse_args()
    verbose = args.verbose
    # The -v count selects tokenizer and parser debug output independently:
    # 2 -> parser only, 3 -> tokenizer only, 4 or more -> both.
    verbose_tokenizer = verbose >= 3
    verbose_parser = verbose == 2 or verbose >= 4
    # perf_counter() is a monotonic clock, so the elapsed time reported below
    # cannot be skewed by system clock adjustments.
    t0 = time.perf_counter()

    output_file = args.output
    if not output_file:
        # Default output name depends on the target language.
        output_file = "parse.c" if args.cpython else "parse.py"

    try:
        grammar, parser, tokenizer, gen = build_parser_and_generator(
            args.filename,
            output_file,
            args.compile_extension,
            verbose_tokenizer,
            verbose_parser,
            args.verbose,
            keep_asserts_in_extension=not args.optimized,
            skip_actions=args.skip_actions,
        )
    except Exception as err:
        if args.verbose:
            raise  # Show traceback
        # Passing None as the traceback prints only the exception itself.
        traceback.print_exception(err.__class__, err, None)
        sys.stderr.write("For full traceback, use -v\n")
        sys.exit(1)

    if not args.quiet:
        if args.verbose:
            print("Raw Grammar:")
            for line in repr(grammar).splitlines():
                print(" ", line)

        print("Clean Grammar:")
        for line in str(grammar).splitlines():
            print(" ", line)

    if args.verbose:
        print("First Graph:")
        for src, dsts in gen.first_graph.items():
            print(f" {src} -> {', '.join(dsts)}")
        print("First SCCS:")
        for scc in gen.first_sccs:
            print(" ", scc, end="")
            if len(scc) > 1:
                print(
                    " # Indirectly left-recursive; leaders:",
                    {name for name in scc if grammar.rules[name].leader},
                )
            else:
                # Single-rule component: it is left-recursive only if the
                # rule appears among its own first-graph successors.
                name = next(iter(scc))
                if name in gen.first_graph[name]:
                    print(" # Left-recursive")
                else:
                    print()

    t1 = time.perf_counter()

    if args.verbose:
        dt = t1 - t0
        diag = tokenizer.diagnose()
        # NOTE(review): diag.end[0] is presumably the line number of the last
        # token seen; an ENDMARKER token is not counted as a line -- confirm.
        nlines = diag.end[0]
        if diag.type == token.ENDMARKER:
            nlines -= 1
        print(f"Total time: {dt:.3f} sec; {nlines} lines", end="")
        if dt:  # Guard against division by zero.
            print(f"; {nlines / dt:.0f} lines/sec")
        else:
            print()
        print("Caches sizes:")
        print(f" token array : {len(tokenizer._tokens):10}")
        print(f" cache : {len(parser._cache):10}")
        if not print_memstats():
            print("(Can't find psutil; install it for memory stats.)")
|
|
|
|
|
|
|
|
|
|
|
|
if __name__ == "__main__":
    # Refuse to run on interpreters older than 3.8 with a clear message
    # on stderr and a non-zero exit status.
    if sys.version_info < (3, 8):
        print("ERROR: using pegen requires at least Python 3.8!", file=sys.stderr)
        sys.exit(1)
    main()
|