"""Generate the cases for the tier 2 interpreter.
Reads the instruction definitions from bytecodes.c.
Writes the cases to executor_cases.c.h, which is #included in ceval.c.
"""
|
|
|
|
|
|
|
|
import argparse
|
|
|
|
|
|
|
|
from analyzer import (
|
|
|
|
Analysis,
|
|
|
|
Instruction,
|
|
|
|
Uop,
|
|
|
|
analyze_files,
|
|
|
|
StackItem,
|
|
|
|
analysis_error,
|
|
|
|
)
|
|
|
|
from generators_common import (
|
|
|
|
DEFAULT_INPUT,
|
|
|
|
ROOT,
|
|
|
|
emit_to,
|
2024-08-06 09:04:33 -03:00
|
|
|
write_header,
|
2024-07-09 07:33:56 -03:00
|
|
|
type_and_null,
|
2024-08-08 06:57:59 -03:00
|
|
|
Emitter,
|
2024-10-07 10:56:39 -03:00
|
|
|
TokenIterator,
|
|
|
|
always_true,
|
2023-12-12 08:12:17 -04:00
|
|
|
)
|
|
|
|
from cwriter import CWriter
|
|
|
|
from typing import TextIO, Iterator
|
|
|
|
from lexer import Token
|
2024-10-07 10:56:39 -03:00
|
|
|
from stack import Local, Stack, StackError, Storage
|
2023-12-12 08:12:17 -04:00
|
|
|
|
|
|
|
# Default value of the ``-o/--output`` command-line option: the generated
# executor cases header, located relative to ROOT.
DEFAULT_OUTPUT = ROOT / "Python/executor_cases.c.h"
|
|
|
|
|
|
|
|
|
2024-02-20 06:50:59 -04:00
|
|
|
def declare_variable(
    var: StackItem, uop: Uop, required: set[str], out: CWriter
) -> None:
    """Emit the C declaration of a single stack variable, at most once.

    Nothing is written when ``var`` is not used or when its name is not in
    ``required``.  Otherwise the name is removed from ``required`` (so a
    second call for the same name does nothing) and the declaration is
    emitted to ``out``.

    Args:
        var: The stack item to declare.
        uop: The uop the variable belongs to; only ``uop.replicates`` is read.
        required: Names that still need a declaration.  Mutated in place.
        out: Writer receiving the generated C text.
    """
    if not (var.used and var.name in required):
        return
    required.remove(var.name)

    c_type, null_value = type_and_null(var)
    # Put a space between type and name only when the type text ends in an
    # alphanumeric character (i.e. not after something like a trailing "*").
    separator = "" if not c_type[-1].isalnum() else " "
    declaration = f"{c_type}{separator}{var.name}"

    if not var.condition:
        out.emit(f"{declaration};\n")
        return

    # Conditional variables are initialised to their null value.
    out.emit(f"{declaration} = {null_value};\n")
    if uop.replicates:
        # Replicas may not use all their conditional variables,
        # so avoid a compiler warning with a fake use.
        out.emit(f"(void){var.name};\n")
|
2024-02-20 06:50:59 -04:00
|
|
|
|
|
|
|
|
2023-12-12 08:12:17 -04:00
|
|
|
def declare_variables(uop: Uop, out: CWriter) -> None:
    """Emit declarations for the stack variables of ``uop``.

    A scratch ``Stack`` is driven through the uop's stack effect (inputs are
    popped in reverse order, outputs are pushed as undefined locals) to find
    out which names end up in ``Stack.defined``.  Those names, minus the
    placeholder ``"unused"``, are then declared via ``declare_variable``:
    first the inputs in reverse order, then the outputs.

    Args:
        uop: The uop whose ``stack.inputs`` / ``stack.outputs`` are declared.
        out: Writer receiving the generated C text.
    """
    inputs = uop.stack.inputs
    outputs = uop.stack.outputs

    scratch = Stack()
    for item in reversed(inputs):
        scratch.pop(item)
    for item in outputs:
        scratch.push(Local.undefined(item))

    # declare_variable() removes names from this set as it declares them.
    pending = set(scratch.defined) - {"unused"}

    for item in [*reversed(inputs), *outputs]:
        declare_variable(item, uop, pending, out)
|
2023-12-12 08:12:17 -04:00
|
|
|
|
2024-02-20 06:50:59 -04:00
|
|
|
|
2024-08-06 09:04:33 -03:00
|
|
|
class Tier2Emitter(Emitter):
    """``Emitter`` subclass producing the tier 2 form of special constructs.

    Every replacer method below shares one signature: ``tkn`` is the token
    that triggered the replacement, ``tkn_iter`` yields the tokens that follow
    it, and ``uop``, ``storage`` and ``inst`` describe the code being
    generated.  Each method consumes the tokens of the construct from
    ``tkn_iter``, writes the replacement C text and returns a bool.

    NOTE(review): the returned bool presumably tells the caller whether the
    code following the construct is still reachable -- confirm against
    ``Emitter``.
    """

    def __init__(self, out: CWriter):
        """Initialise the base emitter and register the ``oparg`` replacer."""
        super().__init__(out)
        self._replacers["oparg"] = self.oparg

    def error_if(
        self,
        tkn: Token,
        tkn_iter: TokenIterator,
        uop: Uop,
        storage: Storage,
        inst: Instruction | None,
    ) -> bool:
        """Emit ``if (<condition>) JUMP_TO_ERROR();``.

        Expects ``tkn_iter`` to yield ``( <condition> , <label> ) ;``.  The
        condition is copied to the output; the label is consumed and ignored.

        Returns:
            ``False`` when ``always_true`` accepts the first token of the
            condition, ``True`` otherwise.
        """
        self.out.emit_at("if ", tkn)
        lparen = next(tkn_iter)
        self.emit(lparen)
        assert lparen.kind == "LPAREN"
        first_tkn = next(tkn_iter)
        self.out.emit(first_tkn)
        emit_to(self.out, tkn_iter, "COMMA")
        next(tkn_iter)  # Label (not used: the jump target is always JUMP_TO_ERROR)
        next(tkn_iter)  # RPAREN
        next(tkn_iter)  # Semi colon
        self.emit(") JUMP_TO_ERROR();\n")
        return not always_true(first_tkn)

    def error_no_pop(
        self,
        tkn: Token,
        tkn_iter: TokenIterator,
        uop: Uop,
        storage: Storage,
        inst: Instruction | None,
    ) -> bool:
        """Emit an unconditional ``JUMP_TO_ERROR();`` at the position of ``tkn``.

        Consumes the ``( ) ;`` that follows ``tkn`` and always returns
        ``False``.
        """
        next(tkn_iter)  # LPAREN
        next(tkn_iter)  # RPAREN
        next(tkn_iter)  # Semi colon
        self.out.emit_at("JUMP_TO_ERROR();", tkn)
        return False

    def _emit_jump_to_target_if(self, tkn: Token, tkn_iter: TokenIterator) -> bool:
        """Shared body of ``deopt_if`` and ``exit_if``.

        Expects ``tkn_iter`` to yield ``( <condition> ) ;`` and emits::

            if (<condition>) {
                UOP_STAT_INC(uopcode, miss);
                JUMP_TO_JUMP_TARGET();
            }

        Returns:
            ``False`` when ``always_true`` accepts the first token of the
            condition, ``True`` otherwise.
        """
        self.out.emit_at("if ", tkn)
        lparen = next(tkn_iter)
        self.emit(lparen)
        assert lparen.kind == "LPAREN"
        # Peek rather than consume: emit_to() below copies the whole condition.
        first_tkn = tkn_iter.peek()
        emit_to(self.out, tkn_iter, "RPAREN")
        next(tkn_iter)  # Semi colon
        self.emit(") {\n")
        self.emit("UOP_STAT_INC(uopcode, miss);\n")
        self.emit("JUMP_TO_JUMP_TARGET();\n")
        self.emit("}\n")
        return not always_true(first_tkn)

    def deopt_if(
        self,
        tkn: Token,
        tkn_iter: TokenIterator,
        uop: Uop,
        storage: Storage,
        inst: Instruction | None,
    ) -> bool:
        """Emit a guarded ``JUMP_TO_JUMP_TARGET()`` that also counts a miss.

        See ``_emit_jump_to_target_if`` for the emitted text and return value.
        """
        return self._emit_jump_to_target_if(tkn, tkn_iter)

    def exit_if(  # type: ignore[override]
        self,
        tkn: Token,
        tkn_iter: TokenIterator,
        uop: Uop,
        storage: Storage,
        inst: Instruction | None,
    ) -> bool:
        """Emit a guarded ``JUMP_TO_JUMP_TARGET()`` that also counts a miss.

        Generates exactly the same text as ``deopt_if``; see
        ``_emit_jump_to_target_if`` for the emitted text and return value.
        """
        return self._emit_jump_to_target_if(tkn, tkn_iter)

    def oparg(
        self,
        tkn: Token,
        tkn_iter: TokenIterator,
        uop: Uop,
        storage: Storage,
        inst: Instruction | None,
    ) -> bool:
        """Emit ``oparg``, folding ``oparg & 1`` to a constant where possible.

        For a uop whose name ends in ``_0`` or ``_1``, the expression
        ``oparg & 1`` is replaced by that final digit of the name.  In every
        other case the consumed tokens are emitted unchanged.

        Returns:
            Always ``True``.
        """
        if not uop.name.endswith(("_0", "_1")):
            self.emit(tkn)
            return True
        amp = next(tkn_iter)
        if amp.text != "&":
            # Not an ``oparg & ...`` expression: pass both tokens through.
            self.emit(tkn)
            self.emit(amp)
            return True
        one = next(tkn_iter)
        assert one.text == "1"
        self.out.emit_at(uop.name[-1], tkn)
        return True
|
2024-08-06 09:04:33 -03:00
|
|
|
|
2024-08-08 06:57:59 -03:00
|
|
|
|
2024-10-07 10:56:39 -03:00
|
|
|
def write_uop(uop: Uop, emitter: Emitter, stack: Stack) -> Stack:
    """Emit the body of one tier 2 case for ``uop``.

    In order, this writes: the ``oparg`` setup (when the uop uses ``oparg`` or
    has a constant one), the code returned by ``Storage.for_uop``, one local
    per named cache entry read from ``CURRENT_OPERAND<idx>()``, and finally
    the uop's own tokens via ``emitter.emit_tokens``.

    Args:
        uop: The uop to generate code for.
        emitter: Emitter used for all output.
        stack: Stack state on entry to the uop.

    Returns:
        The stack held by the storage that ``emitter.emit_tokens`` returns.

    Raises:
        The error built by ``analysis_error`` (positioned at the first token
        of the uop body) when a ``StackError`` occurs during generation; the
        original exception context is suppressed.
    """
    try:
        emitter.out.start_line()
        if uop.properties.oparg:
            emitter.emit("oparg = CURRENT_OPARG();\n")
            assert uop.properties.const_oparg < 0
        elif uop.properties.const_oparg >= 0:
            emitter.emit(f"oparg = {uop.properties.const_oparg};\n")
            emitter.emit("assert(oparg == CURRENT_OPARG());\n")
        code_list, storage = Storage.for_uop(stack, uop)
        for code in code_list:
            emitter.emit(code)
        for idx, cache in enumerate(uop.caches):
            if cache.name == "unused":
                continue
            if cache.size == 4:
                c_type = cast = "PyObject *"
            else:
                # The trailing space separates the type from the variable
                # name in the declaration; the cast must not carry it.
                cast = f"uint{cache.size*16}_t"
                c_type = f"{cast} "
            emitter.emit(f"{c_type}{cache.name} = ({cast})CURRENT_OPERAND{idx}();\n")
        storage = emitter.emit_tokens(uop, storage, None)
    except StackError as ex:
        raise analysis_error(ex.args[0], uop.body[0]) from None
    return storage.stack
|
2023-12-12 08:12:17 -04:00
|
|
|
|
|
|
|
# NOTE(review): not referenced anywhere in the visible part of this file;
# presumably a list of uop names to skip -- confirm whether it is still needed.
SKIPS = ("_EXTENDED_ARG",)
|
|
|
|
|
|
|
|
|
|
|
|
def generate_tier2(
    filenames: list[str], analysis: Analysis, outfile: TextIO, lines: bool
) -> None:
    """Write the complete tier 2 cases file to ``outfile``.

    The output consists of the generated-file header, a preprocessor preamble
    that rejects ``TIER_ONE`` and defines ``TIER_TWO``, one ``case`` block per
    eligible uop, and a closing ``#undef TIER_TWO``.

    Uops are skipped when they are tier 1 only, are split on ``oparg & 1``,
    are super-instructions, or report a reason from ``why_not_viable()``; the
    second and last of these leave an explanatory C comment in the output.

    Args:
        filenames: Input file names, forwarded to ``write_header``.
        analysis: Analysis result whose ``uops`` are turned into cases.
        outfile: Text stream receiving the generated code.
        lines: Forwarded to ``CWriter``; the command line sets it from
            ``--emit-line-directives``.
    """
    write_header(__file__, filenames, outfile)
    # NOTE(review): leading whitespace inside this literal could not be
    # recovered from the flattened source -- confirm against the generated
    # header before applying.
    outfile.write(
        """
#ifdef TIER_ONE
#error "This file is for Tier 2 only"
#endif
#define TIER_TWO 2
"""
    )
    out = CWriter(outfile, 2, lines)
    emitter = Tier2Emitter(out)
    out.emit("\n")
    for uop in analysis.uops.values():
        props = uop.properties
        if props.tier == 1:
            continue
        if props.oparg_and_1:
            out.emit(f"/* {uop.name} is split on (oparg & 1) */\n\n")
            continue
        if uop.is_super():
            continue
        if (why_not_viable := uop.why_not_viable()) is not None:
            out.emit(
                f"/* {uop.name} is not a viable micro-op for tier 2 because it {why_not_viable} */\n\n"
            )
            continue

        out.emit(f"case {uop.name}: {{\n")
        declare_variables(uop, out)
        # Every case starts from an empty stack description.
        final_stack = write_uop(uop, emitter, Stack())
        out.start_line()
        if not uop.properties.always_exits:
            final_stack.flush(out)
            out.emit("break;\n")
        out.start_line()
        out.emit("}")
        out.emit("\n\n")
    outfile.write("#undef TIER_TWO\n")
|
|
|
|
|
|
|
|
|
|
|
|
# Command-line interface: output path, optional #line directives, and the
# instruction definition files to read.
arg_parser = argparse.ArgumentParser(
    description="Generate the code for the tier 2 interpreter.",
    formatter_class=argparse.ArgumentDefaultsHelpFormatter,
)

arg_parser.add_argument(
    "-o",
    "--output",
    type=str,
    help="Generated code",
    default=DEFAULT_OUTPUT,
)

arg_parser.add_argument(
    "-l",
    "--emit-line-directives",
    help="Emit #line directives",
    action="store_true",
)

arg_parser.add_argument(
    "input",
    nargs=argparse.REMAINDER,
    help="Instruction definition file(s)",
)

if __name__ == "__main__":
    args = arg_parser.parse_args()
    # Fall back to the default definitions file when none was given.
    if not args.input:
        args.input.append(DEFAULT_INPUT)
    data = analyze_files(args.input)
    with open(args.output, "w") as outfile:
        generate_tier2(args.input, data, outfile, args.emit_line_directives)
|