| 1 | """A pure-Python Python bytecode interpreter.""" | 
| 2 | # Based on: | 
| 3 | # pyvm2 by Paul Swartz (z3p), from http://www.twistedmatrix.com/users/z3p/ | 
| 4 |  | 
| 5 | from __future__ import print_function, division | 
| 6 | import linecache | 
| 7 | import operator | 
| 8 | import os | 
| 9 | import repr as repr_lib  # Don't conflict with builtin repr() | 
| 10 | import sys | 
| 11 | import traceback | 
| 12 | import types | 
| 13 |  | 
| 14 | # Function used in MAKE_FUNCTION, MAKE_CLOSURE | 
| 15 | # Generator used in YIELD_FROM, which we might not need. | 
| 16 | from pyobj import Frame, Block, Function, Generator | 
| 17 |  | 
| 18 | from opy.lib import dis | 
| 19 |  | 
# Create a repr that won't overflow: the Repr instance caps the length of the
# representation of "other" object types at 120 characters.
repr_obj = repr_lib.Repr()
repr_obj.maxother = 120
# Bounded stand-in for the builtin repr(); used by VirtualMachine.log_tick().
repper = repr_obj.repr

# Module-wide logging switch, read by debug() and used as the default for
# VirtualMachine(verbose=...).  Developer toggle: the last assignment wins, so
# logging is off unless the second line is removed.
VERBOSE = True
VERBOSE = False
| 27 |  | 
| 28 | # Different than log | 
def debug(msg, *args):
    """Log via debug1(), but only when the module-level VERBOSE flag is set.

    Args:
      msg: message, optionally a %-format string.
      *args: values interpolated into msg by debug1().
    """
    if VERBOSE:
        debug1(msg, *args)
| 34 |  | 
| 35 |  | 
def debug1(msg, *args):
    """Unconditionally write a message (plus newline) to stderr.

    Args:
      msg: message text; treated as a %-format string only when args is given,
        so a literal '%' is safe in a message without arguments.
      *args: values interpolated into msg.
    """
    text = (msg % args) if args else msg
    print(text, file=sys.stderr)
| 40 |  | 
| 41 |  | 
class VirtualMachineError(Exception):
    """Raised for errors in the operation of the VM itself.

    Used in this file for unknown bytecodes, leftover frames/stack data and
    inconsistent stack contents found by individual opcode handlers.
    """
| 45 |  | 
| 46 |  | 
class GuestException(Exception):
    """An error raised by the interpreted (guest) program.

    Carries the guest's own call stack so that its traceback is not conflated
    with the traceback of the host interpreter running this VM.
    """

    def __init__(self, exctype, value, frames):
        """
        Args:
          exctype: the guest exception type.
          value: the guest exception value; must not itself be a
            GuestException (AssertionError otherwise).
          frames: guest frames, in the order they should be printed.
        """
        self.exctype = exctype
        if isinstance(value, GuestException):
            raise AssertionError
        self.value = value
        self.frames = frames

    def __str__(self):
        """Render a traceback-like report of the guest frames and exception."""
        out = ['Guest Exception Traceback:', '']
        for frame in self.frames:
            code = frame.f_code
            path = code.co_filename
            num = frame.line_number()
            out.append(
                '- File "%s", line %d, in %s' % (path, num, code.co_name))
            # Refresh the cache so an edited source file is re-read.
            linecache.checkcache(path)
            src = linecache.getline(path, num, frame.f_globals)
            if src:
                out.append('    ' + src.strip())
        out.append('')
        out.append('exctype: %s' % self.exctype)
        out.append('value: %s' % self.value)
        return '\n'.join(out) + '\n'
| 80 |  | 
| 81 |  | 
def run_code(vm, code, f_globals=None):
    """Main entry point: run a code object on vm and return its result.

    Used by tests and by execfile.

    Args:
      vm: a VirtualMachine.
      code: the code object to execute.
      f_globals: optional globals dict for the new frame.

    Returns:
      Whatever vm.run_frame() returns.  The tick count is deliberately not
      returned, because that would break the unit tests.
    """
    result = vm.run_frame(vm.make_frame(code, f_globals=f_globals))
    vm.check_invariants()
    if os.getenv('BYTERUN_SUMMARY'):
        debug1('*** Byterun executed for %d ticks', vm.num_ticks)
    return result
| 94 |  | 
| 95 |  | 
| 96 | class VirtualMachine(object): | 
| 97 |  | 
def __init__(self, subset=False, verbose=VERBOSE):
    """Create an idle VM with an empty call stack.

    Args:
      subset: turn off bytecodes that OPy doesn't need (e.g. print
        statement, etc.)  Only stored on the instance here.
      verbose: turn on per-opcode logging (see run_frame / log_tick).
    """
    # Configuration.
    self.subset = subset
    self.verbose = verbose
    # When True, run_frame() wraps guest errors in GuestException and
    # call_function() produces a more detailed TypeError message.
    self.more_info = False
    # Some objects define __repr__, which means our debug() logging screws
    # things up!  Even though they don't have side effects, this somehow
    # matters.  log_tick() only uses repr() output while this is True.
    self.repr_ok = True

    # Execution state.
    self.frames = []  # The call stack of frames.
    self.frame = None  # The current frame.
    self.return_value = None
    self.last_exception = None
    self.except_frames = []  # Frames saved for GuestException

    # Bookkeeping for logging.
    self.cur_line = None  # current line number
    self.num_ticks = 0
| 124 |  | 
def top(self):
    """Return whatever the current frame's top() returns."""
    frame = self.frame
    return frame.top()
| 127 |  | 
def pop(self, i=0):
    """Delegate to the current frame's pop(), forwarding i as a keyword.

    Args:
      i: forwarded unchanged; presumably the depth from the top of the value
        stack (WITH_CLEANUP uses 1 and 2 to reach buried items) -- confirm
        against pyobj.Frame.pop.
    """
    frame = self.frame
    return frame.pop(i=i)
| 130 |  | 
def push(self, *vals):
    """Forward all of vals, in order, to the current frame's push()."""
    frame = self.frame
    frame.push(*vals)
| 133 |  | 
def popn(self, n):
    """Delegate to the current frame's popn(n) and return its result."""
    frame = self.frame
    return frame.popn(n)
| 136 |  | 
def peek(self, n):
    """Delegate to the current frame's peek(n) and return its result."""
    frame = self.frame
    return frame.peek(n)
| 139 |  | 
def jump(self, offset):
    """Ask the current frame to jump to the given bytecode offset."""
    frame = self.frame
    frame.jump(offset)
| 142 |  | 
def make_frame(self, code, callargs=None, f_globals=None, f_locals=None):
    """Build a Frame for code whose parent is the current frame.

    Called by run_code() and (per the original note) Function.__call__.

    Namespace selection:
      * f_globals given: use it; f_locals defaults to the same dict.
      * otherwise, if a frame is already running: share its globals and
        start with fresh, empty locals (any f_locals argument is ignored).
      * otherwise: create a new '__main__'-style namespace used for both.

    Args:
      code: the code object to execute.
      callargs: optional mapping of argument names to values, merged into
        the frame's locals.  Defaults to no arguments.
      f_globals: optional globals dict.
      f_locals: optional locals dict (only honoured together with f_globals).

    Returns:
      The new Frame (not yet pushed on the call stack).
    """
    # NOTE: repper causes problems running code!  See testdata/repr_method.py
    #debug("make_frame: code=%r, callargs=%s", code, repper(callargs))
    if f_globals is not None:
        if f_locals is None:
            f_locals = f_globals
    elif self.frames:
        f_globals = self.frame.f_globals
        f_locals = {}
    else:
        f_globals = f_locals = {
            '__builtins__': __builtins__,
            '__name__': '__main__',
            '__doc__': None,
            '__package__': None,
        }
    # callargs=None replaces the former shared mutable default ({}).
    if callargs:
        f_locals.update(callargs)
    return Frame(code, f_globals, f_locals, self.frame)
| 166 |  | 
def resume_frame(self, frame):
    """Run a suspended frame as a child of the current frame.

    Called by Generator.

    Args:
      frame: the frame to resume.

    Returns:
      The value produced by run_frame(frame).

    Raises:
      Whatever run_frame() raises.  The frame's f_back link is cleared in
      that case too, so a failed generator does not keep the caller's frame
      chain alive.
    """
    frame.f_back = self.frame
    try:
        return self.run_frame(frame)
    finally:
        frame.f_back = None
| 176 |  | 
def log_tick(self, byteName, arguments, opoffset, linestarts):
    """Log the opcode, its first argument and the value stack for one tick.

    Output goes through debug(), so it is additionally gated by the
    module-level VERBOSE flag.

    Args:
      byteName: name of the opcode about to be dispatched.
      arguments: decoded opcode arguments (only the first one is logged).
      opoffset: bytecode offset of the opcode.
      linestarts: dict mapping bytecode offset -> source line number.
    """
    depth = len(self.frames) - 1
    indent = "    " * depth

    # repr_lib is causing problems, so its output is replaced by plain repr()
    # whenever that is allowed.
    stack_rep = repper(self.frame.stack)
    if self.repr_ok:
        stack_rep = repr(self.frame.stack)

    if arguments and self.repr_ok:
        arg_str = ' %r' % (arguments[0],)
    else:
        arg_str = ''

    # TODO: Should increment

    # Remember the most recent source line this frame has reached.
    li = linestarts.get(opoffset, None)
    if not (li is None or self.cur_line == li):
        self.cur_line = li

    debug('%s%d: %s%s (line %s)', indent, opoffset, byteName, arg_str,
          self.cur_line)
    if self.repr_ok:
        debug('  %sval stack: %s', indent, stack_rep)
    debug('')
| 203 |  | 
def dispatch(self, byteName, arguments):
    """Execute one opcode by name.

    UNARY_*, BINARY_*, INPLACE_* and *SLICE+n opcodes go to the shared
    operator helpers; everything else goes to the byte_<NAME> method.

    Args:
      byteName: the opcode name.
      arguments: list of decoded arguments for a byte_* handler.

    Returns:
      The handler's "why" code (None to keep going), or 'exception' when
      anything at all was raised.  In that case the exception type and value
      are stored in self.last_exception (traceback slot set to None) and the
      current call stack is copied to self.except_frames.
    """
    why = None
    try:
        if byteName.startswith('UNARY_'):
            self.unaryOperator(byteName[len('UNARY_'):])
        elif byteName.startswith('BINARY_'):
            self.binaryOperator(byteName[len('BINARY_'):])
        elif byteName.startswith('INPLACE_'):
            self.inplaceOperator(byteName[len('INPLACE_'):])
        elif 'SLICE+' in byteName:
            self.sliceOperator(byteName)
        else:
            handler = getattr(self, 'byte_%s' % byteName, None)
            if not handler:            # pragma: no cover
                raise VirtualMachineError(
                    "unknown bytecode type: %s" % byteName
                )
            why = handler(*arguments)

    except:
        # Deliberately catches everything: any error while executing the op
        # becomes a guest exception.
        exc_type, exc_value = sys.exc_info()[:2]
        self.last_exception = (exc_type, exc_value, None)
        self.except_frames = list(self.frames)
        why = 'exception'

    return why
| 240 |  | 
| 241 | # Helpers for run_frame | 
| 242 | def _push_frame(self, frame): | 
| 243 | self.frames.append(frame) | 
| 244 | self.frame = frame | 
| 245 |  | 
| 246 | def _pop_frame(self): | 
| 247 | self.frames.pop() | 
| 248 | if self.frames: | 
| 249 | self.frame = self.frames[-1] | 
| 250 | else: | 
| 251 | self.frame = None | 
| 252 |  | 
def run_frame(self, frame):
    """Run a frame until it returns, yields, or raises an exception.

    Corresponds to PyEval_EvalFrameEx in ceval.c.

    The frame is pushed on the call stack, opcodes are decoded and dispatched
    one at a time, and after each one the frame's block stack is unwound for
    as long as there is a pending "why" code (except for 'yield', which
    leaves the blocks untouched).  The loop ends on the first "why" that
    survives unwinding; the frame is then popped again.

    Args:
      frame: the Frame to execute.

    Returns:
      self.return_value as left behind by the opcode that ended the loop.

    Raises:
      If the frame ended with 'exception': when self.more_info is set, a
      GuestException carrying self.except_frames (or the stored value itself
      if it already is a GuestException); otherwise the stored
      (type, value, traceback) triple is re-raised as is.
    """
    # bytecode offset -> line number
    #print('frame %s ' % frame)
    # NOTE: Also done in Frame.line_number()
    linestarts = dict(dis.findlinestarts(frame.f_code))
    #print('STARTS %s ' % linestarts)

    self._push_frame(frame)
    while True:
        self.num_ticks += 1

        opoffset = self.frame.f_lasti  # For logging only
        byteName, arguments = self.frame.decode_next()
        if self.verbose:
            self.log_tick(byteName, arguments, opoffset, linestarts)

        # When unwinding the block stack, we need to keep track of why we
        # are doing it.

        # NOTE: In addition to returning why == 'exception', this can also
        # RAISE GuestException from recursive call via call_function.

        why = self.dispatch(byteName, arguments)
        if why == 'exception':
            # TODO: ceval calls PyTraceBack_Here, not sure what that does.
            pass

        # 'reraise' (from END_FINALLY / RAISE_VARARGS) is unwound exactly
        # like a fresh exception.
        if why == 'reraise':
            why = 'exception'

        if why != 'yield':

            # NOTE: why is used in a frame INTERNALLY after bytecode dispatch.
            # But what about ACROSS frames.  We need to unwind the call
            # stack too!  How is that done?
            # I don't want it to be done with GuestException!

            # A block handler may consume the reason (returning a falsy
            # value), in which case execution simply continues.
            while why and frame.block_stack:
                debug('WHY %s', why)
                debug('STACK %s', frame.block_stack)
                why = self.frame.handle_block_stack(why, self)

        # Nothing in this frame handled it: leave the interpreter loop.
        if why:
            break

    # TODO: handle generator exception state

    self._pop_frame()

    if why == 'exception':
        exctype, value, tb = self.last_exception

        #debug('exctype: %s' % exctype)
        #debug('value: %s' % value)
        #debug('unused tb: %s' % tb)

        if self.more_info:
            # Recursive function calls can cause this I guess.
            if isinstance(value, GuestException):
                raise value
            else:
                # Raise an exception with the EMULATED (guest) stack frames.
                raise GuestException(exctype, value, self.except_frames)
        else:
            # Python 2 three-argument raise: propagate type, value and
            # traceback unchanged.
            raise exctype, value, tb

    #debug1('num_ticks: %d' % num_ticks)
    return self.return_value
| 331 |  | 
def check_invariants(self):
    """Verify that the VM is idle: no frames left and no stray stack data.

    Raises:
      VirtualMachineError: if the call stack is non-empty, or a current
        frame still has values on its stack.
    """
    if self.frames:            # pragma: no cover
        raise VirtualMachineError("Frames left over!")
    current = self.frame
    if current and current.stack:             # pragma: no cover
        raise VirtualMachineError("Data left on stack! %r" % current.stack)
| 338 |  | 
| 339 | ## Stack manipulation | 
| 340 |  | 
def byte_LOAD_CONST(self, const):
    """Push the (already decoded) constant onto the value stack."""
    value = const
    self.push(value)
| 343 |  | 
def byte_POP_TOP(self):
    """Discard the value on top of the stack."""
    self.pop()
    return None
| 346 |  | 
def byte_DUP_TOP(self):
    """Push a second reference to the value on top of the stack."""
    duplicate = self.top()
    self.push(duplicate)
| 349 |  | 
def byte_DUP_TOPX(self, count):
    """Duplicate the top `count` stack items as a group, keeping their order."""
    group = self.popn(count)
    # Put the group back, then push the copy on top of it.
    self.push(*group)
    self.push(*group)
| 354 |  | 
def byte_DUP_TOP_TWO(self):
    """Duplicate the top two stack items as a pair (Py3-only opcode)."""
    lower, upper = self.popn(2)
    self.push(lower, upper, lower, upper)
| 359 |  | 
def byte_ROT_TWO(self):
    """Swap the two topmost stack items."""
    below, above = self.popn(2)
    self.push(above, below)
| 363 |  | 
def byte_ROT_THREE(self):
    """Move the top item down two places; the two below it each move up."""
    third, second, first = self.popn(3)
    self.push(first, third, second)
| 367 |  | 
def byte_ROT_FOUR(self):
    """Move the top item down three places; the three below it each move up."""
    fourth, third, second, first = self.popn(4)
    self.push(first, fourth, third, second)
| 371 |  | 
| 372 | ## Names | 
| 373 |  | 
def byte_LOAD_NAME(self, name):
    """Push the value of name, searching locals, then globals, then builtins.

    Raises:
      NameError: if the name is in none of the three namespaces.
    """
    frame = self.frame
    # Namespaces are fetched lazily, in lookup order.
    for attr in ('f_locals', 'f_globals', 'f_builtins'):
        namespace = getattr(frame, attr)
        if name in namespace:
            self.push(namespace[name])
            return
    raise NameError("name '%s' is not defined" % name)
| 385 |  | 
def byte_STORE_NAME(self, name):
    """Pop the top of the stack and bind it to name in the frame's locals."""
    value = self.pop()
    self.frame.f_locals[name] = value
| 388 |  | 
def byte_DELETE_NAME(self, name):
    """Remove name from the frame's locals (KeyError if it is not bound)."""
    namespace = self.frame.f_locals
    del namespace[name]
| 391 |  | 
def byte_LOAD_FAST(self, name):
    """Push the local variable name.

    Raises:
      UnboundLocalError: if name is not in the frame's locals.
    """
    local_vars = self.frame.f_locals
    if name not in local_vars:
        raise UnboundLocalError(
            "local variable '%s' referenced before assignment" % name
        )
    self.push(local_vars[name])
| 400 |  | 
def byte_STORE_FAST(self, name):
    """Pop the top of the stack into the local variable name."""
    value = self.pop()
    self.frame.f_locals[name] = value
| 403 |  | 
def byte_DELETE_FAST(self, name):
    """Delete the local variable name (KeyError if it is not bound)."""
    local_vars = self.frame.f_locals
    del local_vars[name]
| 406 |  | 
def byte_LOAD_GLOBAL(self, name):
    """Push the value of name, searching globals and then builtins.

    Raises:
      NameError: if the name is in neither namespace.
    """
    frame = self.frame
    # Builtins are only consulted when the globals lookup misses.
    for attr in ('f_globals', 'f_builtins'):
        namespace = getattr(frame, attr)
        if name in namespace:
            self.push(namespace[name])
            return
    raise NameError("global name '%s' is not defined" % name)
| 416 |  | 
def byte_STORE_GLOBAL(self, name):
    """Pop the top of the stack and bind it to name in the frame's globals."""
    value = self.pop()
    self.frame.f_globals[name] = value
| 420 |  | 
def byte_LOAD_DEREF(self, name):
    """Push the contents of the frame's cell called name."""
    cell = self.frame.cells[name]
    self.push(cell.get())
| 423 |  | 
def byte_STORE_DEREF(self, name):
    """Pop the top of the stack into the frame's cell called name."""
    # The cell is looked up before popping, so a missing cell leaves the
    # stack untouched.
    cell = self.frame.cells[name]
    cell.set(self.pop())
| 426 |  | 
def byte_LOAD_LOCALS(self):
    """Push the frame's locals mapping itself (not a copy)."""
    namespace = self.frame.f_locals
    self.push(namespace)
| 429 |  | 
| 430 | ## Operators | 
| 431 |  | 
# Maps the suffix of a UNARY_* opcode name to the one-argument callable that
# implements it (see unaryOperator).
UNARY_OPERATORS = dict(
    POSITIVE=operator.pos,
    NEGATIVE=operator.neg,
    NOT=operator.not_,
    CONVERT=repr,  # backquote expression
    INVERT=operator.invert,
)
| 439 |  | 
def unaryOperator(self, op):
    """Execute a UNARY_* opcode: replace the top of stack with op(top).

    Args:
      op: opcode name without the 'UNARY_' prefix; a key of UNARY_OPERATORS.
    """
    operand = self.pop()
    handler = self.UNARY_OPERATORS[op]
    self.push(handler(operand))
| 443 |  | 
# Maps the suffix of a BINARY_* opcode name to the two-argument callable that
# implements it (see binaryOperator).
BINARY_OPERATORS = dict(
    POWER=pow,
    MULTIPLY=operator.mul,
    # Classic division only exists as operator.div; where it is missing the
    # placeholder yields None.
    DIVIDE=getattr(operator, 'div', lambda x, y: None),
    FLOOR_DIVIDE=operator.floordiv,
    TRUE_DIVIDE=operator.truediv,
    MODULO=operator.mod,
    ADD=operator.add,
    SUBTRACT=operator.sub,
    SUBSCR=operator.getitem,
    LSHIFT=operator.lshift,
    RSHIFT=operator.rshift,
    AND=operator.and_,
    XOR=operator.xor,
    OR=operator.or_,
)
| 460 |  | 
def binaryOperator(self, op):
    """Execute a BINARY_* opcode: pop two operands, push op(left, right).

    Args:
      op: opcode name without the 'BINARY_' prefix; a key of BINARY_OPERATORS.
    """
    left, right = self.popn(2)
    handler = self.BINARY_OPERATORS[op]
    self.push(handler(left, right))
| 464 |  | 
def inplaceOperator(self, op):
    """Execute an INPLACE_* opcode: pop x and y, push the result of x <op>= y.

    Args:
      op: opcode name without the 'INPLACE_' prefix (dispatch() strips it),
        e.g. 'ADD'.

    Raises:
      VirtualMachineError: if op is not a known in-place operator.
    """
    x, y = self.popn(2)
    if op == 'POWER':
        x **= y
    elif op == 'MULTIPLY':
        x *= y
    elif op == 'DIVIDE':
        # INPLACE_DIVIDE is *classic* division: it floors only for integer
        # operands (5.0 / 2 is 2.5, not 2.0).  A plain `/=` cannot be used
        # because this module enables true division, so go through
        # operator.idiv, which also honours __idiv__/__div__.
        classic_idiv = getattr(operator, 'idiv', None)
        if classic_idiv is not None:
            x = classic_idiv(x, y)
        elif isinstance(x, int) and isinstance(y, int):
            # Host without classic division: emulate it for integers...
            x //= y
        else:
            # ...and for everything else.
            x = operator.itruediv(x, y)
    elif op == 'FLOOR_DIVIDE':
        x //= y
    elif op == 'TRUE_DIVIDE':
        x /= y
    elif op == 'MODULO':
        x %= y
    elif op == 'ADD':
        x += y
    elif op == 'SUBTRACT':
        x -= y
    elif op == 'LSHIFT':
        x <<= y
    elif op == 'RSHIFT':
        x >>= y
    elif op == 'AND':
        x &= y
    elif op == 'XOR':
        x ^= y
    elif op == 'OR':
        x |= y
    else:           # pragma: no cover
        raise VirtualMachineError("Unknown in-place operator: %r" % op)
    self.push(x)
| 494 |  | 
def sliceOperator(self, op):
    """Execute SLICE+n, STORE_SLICE+n or DELETE_SLICE+n.

    The trailing digit says which bounds are on the stack: 0 none, 1 start
    only, 2 end only, 3 start and end.  A missing start is 0; a missing (or
    None) end is len(container).

    Args:
      op: the full opcode name, e.g. 'STORE_SLICE+2'.
    """
    opname, variant = op[:-2], int(op[-1])
    lower, upper = 0, None          # upper None is taken to mean "to the end"
    if variant == 1:
        lower = self.pop()
    elif variant == 2:
        upper = self.pop()
    elif variant == 3:
        upper = self.pop()
        lower = self.pop()
    container = self.pop()
    if upper is None:
        upper = len(container)
    if opname.startswith('STORE_'):
        container[lower:upper] = self.pop()
    elif opname.startswith('DELETE_'):
        del container[lower:upper]
    else:
        self.push(container[lower:upper])
| 515 |  | 
# Indexed by the COMPARE_OP argument; each entry takes the left and right
# operand in that order.
COMPARE_OPERATORS = [
    operator.lt,
    operator.le,
    operator.eq,
    operator.ne,
    operator.gt,
    operator.ge,
    lambda x, y: x in y,
    lambda x, y: x not in y,
    lambda x, y: x is y,
    lambda x, y: x is not y,
    # Exception match, used by `except` clauses (y may be a class or a tuple
    # of classes).  Tested against BaseException rather than Exception so
    # that handlers for KeyboardInterrupt, SystemExit and GeneratorExit match
    # too, consistent with END_FINALLY and WITH_CLEANUP.
    lambda x, y: issubclass(x, BaseException) and issubclass(x, y),
]
| 529 |  | 
def byte_COMPARE_OP(self, opnum):
    """Pop two operands and push the result of comparison number opnum.

    Args:
      opnum: index into COMPARE_OPERATORS.
    """
    left, right = self.popn(2)
    compare = self.COMPARE_OPERATORS[opnum]
    self.push(compare(left, right))
| 533 |  | 
| 534 | ## Attributes and indexing | 
| 535 |  | 
def byte_LOAD_ATTR(self, attr):
    """Replace the object on top of the stack with its attribute attr."""
    owner = self.pop()
    self.push(getattr(owner, attr))
| 542 |  | 
def byte_STORE_ATTR(self, name):
    """Pop a value and an object (object on top) and set object.name = value."""
    value, target = self.popn(2)
    setattr(target, name, value)
| 546 |  | 
def byte_DELETE_ATTR(self, name):
    """Pop an object and delete its attribute name."""
    target = self.pop()
    delattr(target, name)
| 550 |  | 
def byte_STORE_SUBSCR(self):
    """Pop value, container and key (key on top); do container[key] = value."""
    value, container, key = self.popn(3)
    container[key] = value
| 554 |  | 
def byte_DELETE_SUBSCR(self):
    """Pop container and key (key on top); do del container[key]."""
    container, key = self.popn(2)
    del container[key]
| 558 |  | 
| 559 | ## Building | 
| 560 |  | 
def byte_BUILD_TUPLE(self, count):
    """Pop count items and push them as one tuple, in stack order."""
    self.push(tuple(self.popn(count)))
| 564 |  | 
def byte_BUILD_LIST(self, count):
    """Pop count items and push them as one list, in stack order."""
    # The list handed back by popn() is pushed as is, without copying.
    self.push(self.popn(count))
| 568 |  | 
def byte_BUILD_SET(self, count):
    """Pop count items and push a set built from them."""
    # TODO: Not documented in Py2 docs.
    self.push(set(self.popn(count)))
| 573 |  | 
def byte_BUILD_MAP(self, size):
    """Push a new, empty dict.

    Args:
      size: ignored.
    """
    self.push(dict())
| 577 |  | 
def byte_STORE_MAP(self):
    """Pop map, value and key (key on top); set map[key] = value, re-push map."""
    mapping, value, key = self.popn(3)
    mapping[key] = value
    self.push(mapping)
| 582 |  | 
def byte_UNPACK_SEQUENCE(self, count):
    """Pop an iterable and push its count items, first item ending up on top.

    Works for any iterable (iterators, generators, sets, ...), not only for
    objects accepted by reversed().

    Args:
      count: the number of assignment targets, i.e. the exact number of items
        the iterable must produce.

    Raises:
      ValueError: if the iterable yields fewer or more than count items,
        with the same messages CPython 2 uses.
      TypeError: if the popped object is not iterable.
    """
    items = []
    for item in iter(self.pop()):
        # Stop at the first surplus item so that endless iterators still
        # fail promptly.
        if len(items) == count:
            raise ValueError('too many values to unpack')
        items.append(item)
    found = len(items)
    if found < count:
        raise ValueError('need more than %d value%s to unpack'
                         % (found, '' if found == 1 else 's'))
    for item in reversed(items):
        self.push(item)
| 587 |  | 
def byte_BUILD_SLICE(self, count):
    """Pop 2 or 3 items and push slice(start, stop[, step]).

    Raises:
      VirtualMachineError: if count is neither 2 nor 3.
    """
    if count not in (2, 3):           # pragma: no cover
        raise VirtualMachineError("Strange BUILD_SLICE count: %r" % count)
    bounds = self.popn(count)
    self.push(slice(*bounds))
| 597 |  | 
def byte_LIST_APPEND(self, count):
    """Pop a value and append it to the list found via peek(count)."""
    value = self.pop()
    target = self.peek(count)
    target.append(value)
| 602 |  | 
def byte_SET_ADD(self, count):
    """Pop a value and add it to the set found via peek(count)."""
    value = self.pop()
    target = self.peek(count)
    target.add(value)
| 607 |  | 
def byte_MAP_ADD(self, count):
    """Pop value and key (key on top); store them in the map at peek(count)."""
    value, key = self.popn(2)
    target = self.peek(count)
    target[key] = value
| 612 |  | 
| 613 | ## Printing | 
| 614 |  | 
if 0:   # Only used in the interactive interpreter, not in modules.
    # Disabled on purpose: with the constant-false guard this handler is
    # never defined, so dispatch() finds no method for PRINT_EXPR.
    def byte_PRINT_EXPR(self):
        # Pop the top of the stack and print it on the host's stdout.
        print(self.pop())
| 618 |  | 
def byte_PRINT_ITEM(self):
    """Pop a value and print it to the default stream via print_item()."""
    self.print_item(self.pop())
| 622 |  | 
def byte_PRINT_ITEM_TO(self):
    """Pop a stream and then a value; print the value to that stream."""
    stream = self.pop()
    value = self.pop()
    self.print_item(value, stream)
| 627 |  | 
def byte_PRINT_NEWLINE(self):
    """End the current print line on the default stream."""
    self.print_newline()
    return None
| 630 |  | 
def byte_PRINT_NEWLINE_TO(self):
    """Pop a stream and end the current print line on it."""
    self.print_newline(self.pop())
| 634 |  | 
def print_item(self, item, to=None):
    """Write one print-statement item, maintaining the stream's softspace.

    A single space is emitted first if the stream's softspace flag is set.
    Afterwards the flag is set again unless item is a string ending in a
    whitespace character other than ' ' (e.g. a newline).

    Args:
      item: the value to print.
      to: target stream with write() and a softspace attribute; defaults to
        sys.stdout.
    """
    out = sys.stdout if to is None else to
    if out.softspace:
        print(" ", end="", file=out)
        out.softspace = 0
    print(item, end="", file=out)
    # Only a string that already ends the line itself (trailing whitespace
    # that is not a plain space) leaves the flag untouched.
    ends_line = (
        isinstance(item, str) and item
        and item[-1].isspace() and item[-1] != " "
    )
    if not ends_line:
        out.softspace = 1
| 647 |  | 
def print_newline(self, to=None):
    """Write a newline to the stream and clear its softspace flag.

    Args:
      to: target stream; defaults to sys.stdout.
    """
    out = sys.stdout if to is None else to
    print("", file=out)
    out.softspace = 0
| 653 |  | 
| 654 | ## Jumps | 
| 655 |  | 
def byte_JUMP_FORWARD(self, jump):
    """Unconditionally continue at the given target.

    Args:
      jump: target handed to self.jump(); presumably already resolved to an
        absolute offset by the decoder -- confirm in Frame.decode_next.
    """
    target = jump
    self.jump(target)
| 658 |  | 
def byte_JUMP_ABSOLUTE(self, jump):
    """Unconditionally continue at bytecode offset jump."""
    target = jump
    self.jump(target)
| 661 |  | 
if 0:   # Not in py2.7
    # Disabled on purpose: with the constant-false guard these two handlers
    # are never defined.  Unlike the POP_JUMP_IF_* variants they leave the
    # tested value on the stack.
    def byte_JUMP_IF_TRUE(self, jump):
        # Jump when the top of the stack is truthy.
        val = self.top()
        if val:
            self.jump(jump)

    def byte_JUMP_IF_FALSE(self, jump):
        # Jump when the top of the stack is falsy.
        val = self.top()
        if not val:
            self.jump(jump)
| 672 |  | 
def byte_POP_JUMP_IF_TRUE(self, jump):
    """Pop the top of the stack and jump if it is truthy."""
    if self.pop():
        self.jump(jump)
| 677 |  | 
def byte_POP_JUMP_IF_FALSE(self, jump):
    """Pop the top of the stack and jump if it is falsy."""
    if not self.pop():
        self.jump(jump)
| 682 |  | 
def byte_JUMP_IF_TRUE_OR_POP(self, jump):
    """Jump, keeping the top of stack, if it is truthy; otherwise pop it."""
    if self.top():
        self.jump(jump)
        return
    self.pop()
| 689 |  | 
def byte_JUMP_IF_FALSE_OR_POP(self, jump):
    """Jump, keeping the top of stack, if it is falsy; otherwise pop it."""
    if self.top():
        self.pop()
    else:
        self.jump(jump)
| 696 |  | 
| 697 | ## Blocks | 
| 698 |  | 
def byte_SETUP_LOOP(self, dest):
    """Push a 'loop' block with handler target dest on the block stack."""
    frame = self.frame
    frame.push_block('loop', dest)
| 701 |  | 
def byte_GET_ITER(self):
    """Replace the top of the stack with iter() of it."""
    iterable = self.pop()
    self.push(iter(iterable))
| 704 |  | 
def byte_FOR_ITER(self, jump):
    """Advance the iterator on top of the stack.

    Pushes the next item above the iterator; when the iterator is exhausted,
    pops the iterator and jumps to `jump` instead.
    """
    try:
        self.push(next(self.top()))
    except StopIteration:
        # Loop finished: discard the iterator and leave the loop body.
        self.pop()
        self.jump(jump)
| 713 |  | 
def byte_BREAK_LOOP(self):
    """Return the 'break' reason so run_frame() unwinds the block stack."""
    why = 'break'
    return why
| 716 |  | 
def byte_CONTINUE_LOOP(self, dest):
    """Record the jump target and return the 'continue' reason.

    This is a trick with the return value.  While unrolling blocks, continue
    and return both have to preserve state as the finally blocks are
    executed: for continue it is where to jump to, for return it is the
    value to return.  It gets pushed on the stack for both, so continue
    stores the jump destination in self.return_value.
    """
    self.return_value = dest
    why = 'continue'
    return why
| 726 |  | 
def byte_SETUP_EXCEPT(self, dest):
    """Push a 'setup-except' block with handler target dest."""
    frame = self.frame
    frame.push_block('setup-except', dest)
| 729 |  | 
def byte_SETUP_FINALLY(self, dest):
    """Push a 'finally' block with handler target dest."""
    frame = self.frame
    frame.push_block('finally', dest)
| 732 |  | 
def byte_END_FINALLY(self):
    """Finish a finally/except block by resuming whatever was pending.

    The top of the stack says what to resume:
      * None: nothing was pending.
      * a string: a saved "why" code; for 'return' and 'continue' the saved
        value is popped into self.return_value as well.
      * an exception class: value and traceback are popped too and the
        exception is stored in self.last_exception.

    Returns:
      None, the saved "why" string, or 'reraise'.

    Raises:
      VirtualMachineError: if the top of the stack is a class that is not an
        exception class.
    """
    marker = self.pop()
    #debug('V %s', marker)
    if marker is None:
        return None
    if isinstance(marker, str):
        if marker in ('return', 'continue'):
            self.return_value = self.pop()
        return marker
    if issubclass(marker, BaseException):
        value = self.pop()
        trace = self.pop()
        self.last_exception = (marker, value, trace)
        return 'reraise'
    raise VirtualMachineError("Confused END_FINALLY")       # pragma: no cover
| 752 |  | 
def byte_POP_BLOCK(self):
    """Remove the innermost block from the frame's block stack."""
    frame = self.frame
    frame.pop_block()
| 755 |  | 
def byte_RAISE_VARARGS(self, argc):
    """Implement the raise statement with argc operands (0 to 3).

    With no operands the last exception is raised again.  Otherwise the
    operands are taken from the stack: traceback on top (argc == 3), then the
    value (argc >= 2), then the exception type or instance.

    Returns:
      'reraise' if a truthy traceback is involved, else 'exception'.  The
      exception itself is stored in self.last_exception.
    """
    # NOTE: the dis docs are completely wrong about the order of the
    # operands on the stack!
    exctype = val = tb = None
    if argc == 0:
        exctype, val, tb = self.last_exception
    elif argc in (1, 2, 3):
        if argc == 3:
            tb = self.pop()
        if argc >= 2:
            val = self.pop()
        exctype = self.pop()

    # There are a number of forms of "raise", normalize them somewhat:
    # `raise instance` becomes (type(instance), instance).
    if isinstance(exctype, BaseException):
        val = exctype
        exctype = type(val)

    self.last_exception = (exctype, val, tb)
    return 'reraise' if tb else 'exception'
| 783 |  | 
def byte_SETUP_WITH(self, dest):
    """Enter a with statement.

    Pops the context manager, pushes its bound __exit__, calls __enter__,
    opens a 'with' block targeting dest and finally pushes the value that
    __enter__ returned.
    """
    manager = self.pop()
    # __exit__ is stashed before __enter__ runs.
    self.push(manager.__exit__)
    entered = manager.__enter__()
    self.frame.push_block('with', dest)
    self.push(entered)
| 790 |  | 
def byte_WITH_CLEANUP(self):
    """Leave a with statement: call the stashed __exit__ function.

    The exit function is called as exit_func(u, v, w), where (u, v, w) is
    the pending exception triple or (None, None, None) when the block is
    left without an exception.  If an exception was pending and the exit
    function returns a true value, the exception is suppressed.

    Raises:
      VirtualMachineError: if the top of the stack is a class that is not an
        exception class.
    """
    # The code here does some weird stack manipulation: the exit function
    # is buried in the stack, and where depends on what's on top of it.
    # Pull out the exit function, and leave the rest in place.
    v = w = None
    u = self.top()
    if u is None:
        # Normal exit: pop(1) takes the exit function from under the None.
        exit_func = self.pop(1)
    elif isinstance(u, str):
        # A saved "why" code is on top.
        if u in ('return', 'continue'):
            # These carry one extra value, so the exit function is one
            # position deeper.
            exit_func = self.pop(2)
        else:
            exit_func = self.pop(1)
        # No exception is pending in either case.
        u = None
    elif issubclass(u, BaseException):
        # An exception triple is on top: lift it off, take the exit function
        # from underneath, and put the triple back unchanged.
        w, v, u = self.popn(3)
        exit_func = self.pop()
        self.push(w, v, u)
    else:       # pragma: no cover
        raise VirtualMachineError("Confused WITH_CLEANUP")
    exit_ret = exit_func(u, v, w)
    err = (u is not None) and bool(exit_ret)
    if err:
        # An error occurred, and was suppressed: replace the exception triple
        # with a single None.
        self.popn(3)
        self.push(None)
| 817 |  | 
| 818 | ## Functions | 
| 819 |  | 
def byte_MAKE_FUNCTION(self, argc):
    """Make a runtime object from a types.CodeObject, typically in a .pyc file.

    Pops the code object and then argc default values, and pushes a Function
    (no name, no closure) bound to the current frame's globals and this VM.
    """
    code = self.pop()
    defaults = self.popn(argc)
    fn = Function(None, code, self.frame.f_globals, defaults, None, self)
    self.push(fn)
| 828 |  | 
def byte_LOAD_CLOSURE(self, name):
    """Push the frame's cell object called name (the cell, not its contents)."""
    cell = self.frame.cells[name]
    self.push(cell)
| 831 |  | 
def byte_MAKE_CLOSURE(self, argc):
    """Like MAKE_FUNCTION, but the new Function also receives a closure.

    Pops the closure and code object (code on top) and then argc default
    values, and pushes the resulting unnamed Function.
    """
    closure, code = self.popn(2)
    defaults = self.popn(argc)
    fn = Function(None, code, self.frame.f_globals, defaults, closure, self)
    self.push(fn)
| 839 |  | 
def byte_CALL_FUNCTION(self, arg):
    """Call with only the arguments encoded in arg (no *args / **kwargs)."""
    extra_args, extra_kwargs = [], {}
    return self.call_function(arg, extra_args, extra_kwargs)
| 842 |  | 
def byte_CALL_FUNCTION_VAR(self, arg):
    """Call with an extra *args sequence popped from the top of the stack."""
    star_args = self.pop()
    return self.call_function(arg, star_args, {})
| 846 |  | 
def byte_CALL_FUNCTION_KW(self, arg):
    """Call with an extra **kwargs mapping popped from the top of the stack."""
    star_kwargs = self.pop()
    return self.call_function(arg, [], star_kwargs)
| 850 |  | 
def byte_CALL_FUNCTION_VAR_KW(self, arg):
    """Call with both *args and **kwargs popped from the stack (kwargs on top)."""
    star_args, star_kwargs = self.popn(2)
    return self.call_function(arg, star_args, star_kwargs)
| 854 |  | 
def call_function(self, arg, args, kwargs):
    """Shared implementation of the CALL_FUNCTION* opcodes.

    Pops the keyword pairs, the positional arguments and the callable from
    the stack, calls it, and pushes the result.

    Args:
      arg: opcode argument; the low byte is the number of positional
        arguments, the rest the number of keyword (name, value) pairs.
      args: extra positional arguments (from *args), appended after the
        positional arguments taken from the stack.
      kwargs: extra keyword arguments (from **kwargs); they override keyword
        pairs from the stack that have the same name.

    Returns:
      None; the call's result is pushed on the stack.

    Raises:
      TypeError: if an unbound method is called without an instance of its
        class as first argument (including with no arguments at all).
      Anything the callee raises.
    """
    len_kw, len_pos = divmod(arg, 256)
    namedargs = {}
    for _ in range(len_kw):
        key, val = self.popn(2)
        namedargs[key] = val
    namedargs.update(kwargs)
    posargs = self.popn(len_pos)
    posargs.extend(args)

    #debug('*** call_function stack = %s', self.frame.stack)

    func = self.pop()
    #debug1('*** call_function POPPED %s', func)
    # Sanity check: the VM's own decoder must never end up as a callee.
    if getattr(func, 'func_name', None) == 'decode_next':
        raise AssertionError('BAD: %s' % func)

    if hasattr(func, 'im_func'):
        # Methods get self as an implicit first parameter.
        if func.im_self is not None:
            posargs.insert(0, func.im_self)

        # TODO: We have the frame here, but I also want the location.
        # dis has it!

        # The first parameter must be the correct type.  An unbound method
        # called without any argument is reported the way CPython does
        # ("got nothing instead") rather than failing on posargs[0].
        if not posargs or not isinstance(posargs[0], func.im_class):
            if posargs:
                got = '%s instance' % type(posargs[0]).__name__
            else:
                got = 'nothing'
            # Must match Python interpreter to pass unit tests!
            if self.more_info:
                # More informative error that shows the frame.
                raise TypeError(
                    'unbound method %s() must be called with %s instance '
                    'as first argument, was called with %s '
                    '(frame: %s)' % (
                        func.im_func.func_name,
                        func.im_class.__name__,
                        got,
                        self.frame,
                    )
                )
            else:
                raise TypeError(
                    'unbound method %s() must be called with %s instance '
                    'as first argument (got %s instead)' % (
                        func.im_func.func_name,
                        func.im_class.__name__,
                        got,
                    )
                )
        func = func.im_func

    # BUG FIX: The callable must be a pyobj.Function, not a native Python
    # function (types.FunctionType).  The latter will be executed using the
    # HOST CPython interpreter rather than the byterun interpreter.

    # Cases:
    # 1. builtin functions like int().  We want to use the host here.
    # 2. User-defined functions from this module.  These are created with
    #    MAKE_FUNCTION, which properly turns them into pyobj.Function.
    # 3. User-defined function from another module.  These are created with
    #    __import__, which yields a native function.
    # 4. pyobj.Generator is on the stack, and you get its next() value.
    #    We should do something smarter.

    # Native functions (case 3) are wrapped so that they are interpreted by
    # this VM.  Hack for case #4: next() and send() are native functions
    # marked with a 'DO_NOT_INTERPRET' docstring; they must run on the host.
    do_wrap = (
        isinstance(func, types.FunctionType)
        and getattr(func, '__doc__', None) != 'DO_NOT_INTERPRET'
    )

    if do_wrap:
        defaults = func.func_defaults or ()
        byterun_func = Function(
            func.func_name, func.func_code, func.func_globals,
            defaults, func.func_closure, self)
    else:
        byterun_func = func

    #debug1('  Calling: %s', byterun_func)
    retval = byterun_func(*posargs, **namedargs)
    self.push(retval)
| 959 |  | 
def byte_RETURN_VALUE(self):
    """Pop the return value and end the frame with the 'return' reason.

    If the frame belongs to a generator, the generator is marked finished.
    """
    self.return_value = self.pop()
    generator = self.frame.generator
    if generator:
        generator.finished = True
    return "return"
| 965 |  | 
def byte_YIELD_VALUE(self):
    """Pop the yielded value and suspend the frame with the 'yield' reason."""
    yielded = self.pop()
    self.return_value = yielded
    return "yield"
| 969 |  | 
def byte_YIELD_FROM(self):
    """Delegate one step to the sub-iterator just below the top of the stack.

    Pops the value to send.  While the sub-iterator produces values, each one
    is stored in self.return_value and 'yield' is returned; once it is
    exhausted it is replaced on the stack by the StopIteration value and
    None is returned.
    """
    sent = self.pop()
    source = self.top()

    try:
        if isinstance(source, Generator) and sent is not None:
            result = source.send(sent)
        else:
            # Call next on iterators (and on generators when nothing is sent).
            result = next(source)
        self.return_value = result
    except StopIteration as stop:
        self.pop()
        self.push(stop.value)
    else:
        # YIELD_FROM decrements f_lasti, so that it will be called
        # repeatedly until a StopIteration is raised.
        self.jump(self.frame.f_lasti - 1)
        # Returning "yield" prevents the block stack cleanup code
        # from executing, suspending the frame in its current state.
        return "yield"
| 991 |  | 
| 992 | ## Importing | 
| 993 |  | 
def byte_IMPORT_NAME(self, name):
    """Import module name with the host's __import__ and push the result.

    Pops level and fromlist (fromlist on top).  The current frame's globals
    and locals are passed along as the import context.
    """
    level, fromlist = self.popn(2)
    current = self.frame

    # NOTE: This can read .pyc files not compiled with OPy!
    # TODO: Respect OPY_PATH

    module = __import__(
        name, current.f_globals, current.f_locals, fromlist, level)
    self.push(module)
| 1008 |  | 
def byte_IMPORT_STAR(self):
    """Implement `from module import *`.

    Pops the module and copies names into the frame's locals: exactly the
    names listed in the module's __all__ if it defines one (even names
    starting with an underscore), otherwise every attribute whose name does
    not start with an underscore.

    Raises:
      AttributeError: if __all__ lists a name the module does not have.
    """
    mod = self.pop()
    names = getattr(mod, '__all__', None)
    if names is None:
        names = [attr for attr in dir(mod) if not attr.startswith('_')]
    f_locals = self.frame.f_locals
    for attr in names:
        f_locals[attr] = getattr(mod, attr)
| 1015 |  | 
def byte_IMPORT_FROM(self, name):
    """Push attribute name of the module on top of the stack.

    The module itself stays on the stack underneath.
    """
    module = self.top()
    self.push(getattr(module, name))
| 1019 |  | 
| 1020 | ## And the rest... | 
| 1021 |  | 
def byte_EXEC_STMT(self):
    """Implement the exec statement for guest code.

    Pops the statement, globals and locals (locals on top).  Missing
    namespaces are filled in from the *guest* frame, following CPython's
    rules, instead of silently falling back to the host interpreter's own
    namespaces:
      * no globals: the frame's globals, and (if locals are missing too) the
        frame's locals;
      * globals but no locals: locals default to the given globals.

    The legacy tuple form `exec (code, globals[, locals])` is unpacked as
    CPython does.

    NOTE: the statement is executed by the host interpreter, not by this VM.
    """
    stmt, globs, locs = self.popn(3)
    if (isinstance(stmt, tuple) and globs is None and locs is None
            and len(stmt) in (2, 3)):
        # Backward-compatible tuple form: namespaces travel in the tuple.
        if len(stmt) == 3:
            stmt, globs, locs = stmt
        else:
            stmt, globs = stmt
    if globs is None:
        globs = self.frame.f_globals
        if locs is None:
            locs = self.frame.f_locals
    elif locs is None:
        locs = globs
    # Tuple form of exec: valid and equivalent in both Python 2 and 3.
    exec(stmt, globs, locs)
| 1025 |  | 
def byte_BUILD_CLASS(self):
    """Pop name, bases and namespace (namespace on top); push the new class.

    The class is always created with type(name, bases, namespace).
    """
    class_name, bases, namespace = self.popn(3)
    new_class = type(class_name, bases, namespace)
    self.push(new_class)