bytecode_to_cfg.py 15 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337
  1. """Converts bytecode IR to CFG IR."""
  2. import modelverse_jit.bytecode_ir as bytecode_ir
  3. import modelverse_jit.cfg_ir as cfg_ir
  4. import modelverse_jit.runtime as jit_runtime
  5. def emit_debug_info_trace(block, debug_info, function_name):
  6. """Appends a tracing instruction to the given block that prints
  7. the given debug information and function name."""
  8. if debug_info is not None or function_name is not None:
  9. block.append_definition(
  10. cfg_ir.create_print(
  11. block.append_definition(
  12. cfg_ir.Literal(jit_runtime.format_trace_message(
  13. debug_info, function_name, jit_runtime.FAST_JIT_ORIGIN_NAME)))))
  14. class AnalysisState(object):
  15. """State that is common to the bytecode->CFG transformation of a function."""
  16. def __init__(self, jit, function_name, param_dict):
  17. self.jit = jit
  18. self.function_name = function_name
  19. self.counter = cfg_ir.SharedCounter()
  20. self.analyzed_instructions = set()
  21. self.loop_instructions = {}
  22. self.entry_point = cfg_ir.BasicBlock(self.counter)
  23. self.current_block = self.entry_point
  24. self.root_node = None
  25. self.__write_prolog(param_dict)
  26. def __write_prolog(self, param_dict):
  27. # Write a prolog in CFG IR.
  28. # We want to create the following definition:
  29. #
  30. # !entry_point():
  31. # $jit_locals = alloc-root-node
  32. # $_ = declare-local var(...)
  33. # $param_1 = resolve-local var(...)
  34. # $arg_1 = function-parameter ...
  35. # $_ = store $param_1, $arg_1
  36. # ...
  37. #
  38. # We also want to store '$jit_locals' in an attribute, so we can
  39. # use it to shield locals from the GC.
  40. self.root_node = self.current_block.append_definition(cfg_ir.AllocateRootNode())
  41. for node_id, name in param_dict.items():
  42. variable = bytecode_ir.VariableNode(node_id, name)
  43. self.current_block.append_definition(cfg_ir.DeclareLocal(variable, self.root_node))
  44. param_i = self.current_block.append_definition(cfg_ir.ResolveLocal(variable))
  45. arg_i = self.current_block.append_definition(cfg_ir.FunctionParameter(name))
  46. self.current_block.append_definition(cfg_ir.StoreAtPointer(param_i, arg_i))
  47. def analyze(self, instruction):
  48. """Analyzes the given instruction as a basic block."""
  49. if instruction in self.analyzed_instructions:
  50. raise jit_runtime.JitCompilationFailedException(
  51. 'Cannot jit non-tree instruction graph.')
  52. self.analyzed_instructions.add(instruction)
  53. # Find an analyzer.
  54. instruction_type = type(instruction)
  55. if instruction_type in self.instruction_analyzers:
  56. if self.jit.tracing_enabled:
  57. emit_debug_info_trace(
  58. self.current_block, instruction.debug_information, self.function_name)
  59. # Analyze the instruction.
  60. result = self.instruction_analyzers[instruction_type](self, instruction)
  61. # Check if the instruction has a 'next' instruction. If so, analyze it!
  62. if instruction.next_instruction is not None:
  63. next_result = self.analyze(instruction.next_instruction)
  64. if next_result.value.has_value() or (not result.value.has_value()):
  65. result = next_result
  66. return result
  67. else:
  68. raise jit_runtime.JitCompilationFailedException(
  69. "Unknown instruction type: '%s'" % type(instruction))
  70. def emit_select(self, create_condition, create_if_body, create_else_body):
  71. """Emits a 'select' instruction."""
  72. # Create blocks that look like this:
  73. #
  74. # !current_block(...):
  75. # ...
  76. # $cond = <condition>
  77. # select $cond, !if_block(), !else_block()
  78. #
  79. # !if_block():
  80. # $if_result = <if-body>
  81. # jump !phi_block($if_result)
  82. #
  83. # !else_block():
  84. # $else_result = <else-body>
  85. # jump !phi_block($else_result)
  86. #
  87. # !phi_block($result = block-parameter):
  88. # ...
  89. #
  90. if_block = cfg_ir.BasicBlock(self.counter)
  91. else_block = cfg_ir.BasicBlock(self.counter)
  92. phi_block = cfg_ir.BasicBlock(self.counter)
  93. param_def = phi_block.append_parameter(cfg_ir.BlockParameter())
  94. condition = create_condition()
  95. self.current_block.flow = cfg_ir.SelectFlow(
  96. condition, cfg_ir.Branch(if_block), cfg_ir.Branch(else_block))
  97. self.current_block = if_block
  98. if_result = create_if_body()
  99. self.current_block.flow = cfg_ir.create_jump(phi_block, [if_result])
  100. self.current_block = else_block
  101. else_result = create_else_body()
  102. self.current_block.flow = cfg_ir.create_jump(phi_block, [else_result])
  103. self.current_block = phi_block
  104. return param_def
  105. def analyze_if(self, instruction):
  106. """Analyzes an 'if' instruction."""
  107. def __analyze_condition():
  108. condition_node = self.analyze(instruction.condition)
  109. return self.current_block.append_definition(cfg_ir.Read(condition_node))
  110. return self.emit_select(
  111. __analyze_condition,
  112. lambda: self.analyze(instruction.if_clause),
  113. lambda:
  114. self.current_block.append_definition(cfg_ir.Literal(None))
  115. if instruction.else_clause is None
  116. else self.analyze(instruction.else_clause))
  117. def analyze_while(self, instruction):
  118. """Analyzes a 'while' instruction."""
  119. # Create blocks that look like this:
  120. #
  121. # !current_block(...):
  122. # ...
  123. # jump !loop_condition()
  124. #
  125. # !loop_condition():
  126. # $condition_node = <condition>
  127. # $condition = read condition_node
  128. # select $condition, !loop_body(), !loop_exit()
  129. #
  130. # !loop_body():
  131. # $result = <body>
  132. # static if jit.nop_insertion_enabled:
  133. # $_ = direct-call ('macro-io', void) nop()
  134. # jump !loop_condition()
  135. #
  136. # !loop_exit():
  137. # $nothing = literal None
  138. # ...
  139. loop_condition_block = cfg_ir.BasicBlock(self.counter)
  140. loop_body_block = cfg_ir.BasicBlock(self.counter)
  141. loop_exit_block = cfg_ir.BasicBlock(self.counter)
  142. self.loop_instructions[instruction] = (loop_condition_block, loop_exit_block)
  143. self.current_block.flow = cfg_ir.create_jump(loop_condition_block)
  144. self.current_block = loop_condition_block
  145. condition_node = self.analyze(instruction.condition)
  146. condition = self.current_block.append_definition(cfg_ir.Read(condition_node))
  147. self.current_block.flow = cfg_ir.SelectFlow(
  148. condition, cfg_ir.Branch(loop_body_block), cfg_ir.Branch(loop_exit_block))
  149. self.current_block = loop_body_block
  150. self.analyze(instruction.body)
  151. if self.jit.nop_insertion_enabled:
  152. self.current_block.append_definition(cfg_ir.create_nop())
  153. self.current_block.flow = cfg_ir.create_jump(loop_condition_block)
  154. self.current_block = loop_exit_block
  155. return loop_exit_block.append_definition(cfg_ir.Literal(None))
  156. def analyze_return(self, instruction):
  157. """Analyzes a 'return' instruction."""
  158. if instruction.value is None:
  159. return_value = self.current_block.append_definition(cfg_ir.Literal(None))
  160. else:
  161. return_value = self.analyze(instruction.value)
  162. # Don't forget to deallocate the root node.
  163. self.current_block.append_definition(cfg_ir.DeallocateRootNode(self.root_node))
  164. self.current_block.flow = cfg_ir.ReturnFlow(return_value)
  165. self.current_block = cfg_ir.BasicBlock(self.counter)
  166. return self.current_block.append_definition(cfg_ir.Literal(None))
  167. def analyze_constant(self, instruction):
  168. """Analyzes a 'constant' instruction."""
  169. return self.current_block.append_definition(cfg_ir.Literal(instruction.constant_id))
  170. def analyze_resolve(self, instruction):
  171. """Analyzes a 'resolve' instruction."""
  172. def __resolve_global_carefully():
  173. # We might be resolving a global that does not exist. In that case, we
  174. # need to throw. We want to create the following blocks:
  175. #
  176. # !current_block(...):
  177. # ...
  178. # $resolved_global = resolve-global global
  179. # $nothing = literal None
  180. # $condition = binary $resolved_global, 'is', $nothing
  181. # select $condition, !no_global_block(), !global_exists_block()
  182. #
  183. # !no_global_block():
  184. # $message = literal <GLOBAL_NOT_FOUND_MESSAGE_FORMAT % instruction.variable.name>
  185. # $exception = direct-call "simple-positional" Exception(message=$message)
  186. # throw $exception
  187. #
  188. # !global_exists_block():
  189. # ...
  190. #
  191. no_global_block = cfg_ir.BasicBlock(self.counter)
  192. global_exists_block = cfg_ir.BasicBlock(self.counter)
  193. resolved_global = self.current_block.append_definition(
  194. cfg_ir.ResolveGlobal(instruction.variable))
  195. nothing = self.current_block.append_definition(cfg_ir.Literal(None))
  196. condition = self.current_block.append_definition(
  197. cfg_ir.Binary(resolved_global, 'is', nothing))
  198. self.current_block.flow = cfg_ir.SelectFlow(
  199. condition, cfg_ir.Branch(no_global_block), cfg_ir.Branch(global_exists_block))
  200. message = no_global_block.append_definition(
  201. cfg_ir.Literal(
  202. jit_runtime.GLOBAL_NOT_FOUND_MESSAGE_FORMAT % instruction.variable.name))
  203. exception = no_global_block.append_definition(
  204. cfg_ir.DirectFunctionCall(
  205. 'Exception',
  206. [('message', message)],
  207. cfg_ir.SIMPLE_POSITIONAL_CALLING_CONVENTION))
  208. no_global_block.flow = cfg_ir.ThrowFlow(exception)
  209. self.current_block = global_exists_block
  210. return resolved_global
  211. return self.emit_select(
  212. lambda:
  213. self.current_block.append_definition(
  214. cfg_ir.CheckLocalExists(instruction.variable)),
  215. lambda:
  216. self.current_block.append_definition(
  217. cfg_ir.ResolveLocal(instruction.variable)),
  218. __resolve_global_carefully)
  219. def analyze_declare(self, instruction):
  220. """Analyzes a 'declare' instruction."""
  221. return self.current_block.append_definition(
  222. cfg_ir.DeclareLocal(instruction.variable, self.root_node))
  223. def analyze_global(self, instruction):
  224. """Analyzes a 'global' instruction."""
  225. resolved_global = self.current_block.append_definition(
  226. cfg_ir.ResolveGlobal(instruction.variable))
  227. nothing = self.current_block.append_definition(cfg_ir.Literal(None))
  228. return self.emit_select(
  229. lambda:
  230. self.current_block.append_definition(
  231. cfg_ir.Binary(resolved_global, 'is', nothing)),
  232. lambda:
  233. self.current_block.append_definition(
  234. cfg_ir.DeclareGlobal(instruction.variable)),
  235. lambda: resolved_global)
  236. def analyze_assign(self, instruction):
  237. """Analyzes an 'assign' instruction."""
  238. pointer_result = self.analyze(instruction.pointer)
  239. value_result = self.analyze(instruction.value)
  240. return self.current_block.append_definition(
  241. cfg_ir.StoreAtPointer(pointer_result, value_result))
  242. def analyze_access(self, instruction):
  243. """Analyzes an 'access' instruction."""
  244. pointer_result = self.analyze(instruction.pointer)
  245. return self.current_block.append_definition(cfg_ir.LoadPointer(pointer_result))
  246. def analyze_output(self, instruction):
  247. """Analyzes an 'output' instruction."""
  248. value_result = self.analyze(instruction.value)
  249. return self.current_block.append_definition(cfg_ir.create_output(value_result))
  250. def analyze_input(self, _):
  251. """Analyzes an 'input' instruction."""
  252. return self.current_block.append_definition(cfg_ir.create_input())
  253. def analyze_break(self, instruction):
  254. """Analyzes a 'break' instruction."""
  255. if instruction.loop not in self.loop_instructions:
  256. raise jit_runtime.JitCompilationFailedException(
  257. "'break' instruction targets a 'while' loop that has not been defined yet.")
  258. _, exit_block = self.loop_instructions[instruction.loop]
  259. self.current_block.flow = cfg_ir.create_jump(exit_block)
  260. self.current_block = cfg_ir.BasicBlock(self.counter)
  261. return self.current_block.append_definition(cfg_ir.Literal(None))
  262. def analyze_continue(self, instruction):
  263. """Analyzes a 'continue' instruction."""
  264. if instruction.loop not in self.loop_instructions:
  265. raise jit_runtime.JitCompilationFailedException(
  266. "'continue' instruction targets a 'while' loop that has not been defined yet.")
  267. if self.jit.nop_insertion_enabled:
  268. self.current_block.append_definition(cfg_ir.create_nop())
  269. cond_block, _ = self.loop_instructions[instruction.loop]
  270. self.current_block.flow = cfg_ir.create_jump(cond_block)
  271. self.current_block = cfg_ir.BasicBlock(self.counter)
  272. return self.current_block.append_definition(cfg_ir.Literal(None))
  273. def analyze_call(self, instruction):
  274. """Analyzes the given 'call' instruction."""
  275. target = self.analyze(instruction.target)
  276. arg_list = []
  277. for key, arg_instruction in instruction.argument_list:
  278. arg_list.append((key, self.analyze(arg_instruction)))
  279. return self.current_block.append_definition(cfg_ir.IndirectFunctionCall(target, arg_list))
  280. instruction_analyzers = {
  281. bytecode_ir.SelectInstruction : analyze_if,
  282. bytecode_ir.WhileInstruction : analyze_while,
  283. bytecode_ir.ReturnInstruction : analyze_return,
  284. bytecode_ir.ConstantInstruction : analyze_constant,
  285. bytecode_ir.ResolveInstruction : analyze_resolve,
  286. bytecode_ir.DeclareInstruction : analyze_declare,
  287. bytecode_ir.GlobalInstruction : analyze_global,
  288. bytecode_ir.AssignInstruction : analyze_assign,
  289. bytecode_ir.AccessInstruction : analyze_access,
  290. bytecode_ir.OutputInstruction : analyze_output,
  291. bytecode_ir.InputInstruction : analyze_input,
  292. bytecode_ir.CallInstruction : analyze_call,
  293. bytecode_ir.BreakInstruction : analyze_break,
  294. bytecode_ir.ContinueInstruction : analyze_continue
  295. }