paul@4 | 1 | #!/usr/bin/env python |
paul@4 | 2 | |
paul@4 | 3 | """ |
paul@4 | 4 | Java bytecode conversion. Specification found at the following URL: |
paul@4 | 5 | http://java.sun.com/docs/books/vmspec/2nd-edition/html/Instructions2.doc.html |
paul@5 | 6 | |
paul@5 | 7 | NOTE: Synchronized constructs are not actually supported. |
paul@4 | 8 | """ |
paul@4 | 9 | |
paul@8 | 10 | from dis import opmap, cmp_op # for access to Python bytecode values and operators |
paul@6 | 11 | from UserDict import UserDict |
paul@4 | 12 | |
paul@5 | 13 | # Bytecode production classes. |
paul@5 | 14 | |
class BytecodeWriter:

    """
    A Python bytecode writer.

    Instructions are accumulated in 'output' as a list of integers (opcodes
    and operand bytes) and "lazy" subvalues whose final values are only read
    when 'get_output' is called. Operands are written as 16-bit values, low
    byte first. Opcode numbers are looked up by name in 'dis.opmap' when each
    instruction is written.
    """

    def __init__(self):
        # A stack of loop block or exception block start positions.
        self.blocks = []

        # A stack of exception block handler pointers.
        self.exception_handlers = []

        # A dictionary mapping labels to jump instructions referencing such labels.
        self.jumps = {}

        # The output values, including "lazy" subvalues which will need evaluating.
        self.output = []

        # The current Python bytecode instruction position.
        self.position = 0

        # Stack depth estimation.
        self.stack_depth = 0
        self.max_stack_depth = 0

        # Local variable estimation.
        self.max_locals = 0

        # Mapping from values to indexes.
        # NOTE: Values which compare equal (such as 1 and 1.0) share one entry.
        self.constants = {}

        # NOTE: A mapping from global names to indexes is not kept here since
        # NOTE: it may be acquired from elsewhere.

        # Mapping from names to indexes.
        self.names = {}

        # A list of constants used as exception handler return addresses.
        self.constants_for_exceptions = []

    def get_output(self):

        """
        Return the written bytecode as a string with one character per output
        value, reading the current value of each "lazy" subvalue.
        """

        output = []
        for element in self.output:
            if isinstance(element, LazySubValue):
                value = element.value
            else:
                value = element
            output.append(chr(value))
        return "".join(output)

    def get_constants(self):

        """
        Return the constants as a list ordered by index, replacing each "lazy"
        value with its current integer value.
        """

        result = []
        for constant in self._get_list(self._invert(self.constants)):
            if isinstance(constant, LazyValue):
                result.append(constant.get_value())
            else:
                result.append(constant)
        return result

    def get_names(self):

        "Return the names as a list ordered by index."

        return self._get_list(self._invert(self.names))

    def _invert(self, d):

        "Return a new dictionary mapping the values of 'd' to its keys."

        return dict([(v, k) for k, v in d.items()])

    def _get_list(self, d):

        """
        Return the values of 'd' as a list, where the keys of 'd' are the
        consecutive indexes 0, 1, 2, and so on.
        """

        return [d[i] for i in range(len(d))]

    # Administrative methods.

    def update_stack_depth(self, change):

        "Adjust the estimated stack depth by 'change', noting any new maximum."

        self.stack_depth += change
        if self.stack_depth > self.max_stack_depth:
            self.max_stack_depth = self.stack_depth

    def update_locals(self, index):

        "Record 'index' as the highest local variable index if it is a new maximum."

        if index > self.max_locals:
            self.max_locals = index

    # Special methods.

    def _write_opcode(self, name):

        "Append the opcode having the given 'name' and advance the position."

        self.output.append(opmap[name])
        self.position += 1

    def _write_instruction(self, name, argument=None, stack_change=0):

        """
        Write the opcode having the given 'name', followed by the 16-bit
        'argument' (unless None), and apply 'stack_change' to the stack depth
        estimate.
        """

        self._write_opcode(name)
        if argument is not None:
            self._write_value(argument)
        if stack_change:
            self.update_stack_depth(stack_change)

    def _write_value(self, value):

        """
        Append 'value' as a 16-bit operand, low byte first. A "lazy" value
        contributes its two subvalues instead of plain integers. A ValueError
        is raised for integers which do not fit into 16 bits.
        """

        if isinstance(value, LazyValue):
            # NOTE: Assume a 16-bit value.
            self.output.append(value.values[0])
            self.output.append(value.values[1])
        elif value <= 0xffff:
            self.output.append(value & 0xff)
            self.output.append((value & 0xff00) >> 8)
        else:
            # NOTE: EXTENDED_ARG not yet supported.
            raise ValueError(value)
        self.position += 2

    def _patch_value(self, instruction, value):

        """
        Overwrite the 16-bit operand of the instruction starting at output
        index 'instruction' with 'value', low byte first. A ValueError is
        raised if 'value' cannot be represented, rather than leaving output
        which would only fail later in 'get_output'.
        """

        if not 0 <= value <= 0xffff:
            # NOTE: EXTENDED_ARG not yet supported.
            raise ValueError(value)
        self.output[instruction + 1] = value & 0xff
        self.output[instruction + 2] = (value & 0xff00) >> 8

    def _name_index(self, name):

        "Return the index of 'name' in the names mapping, adding it if necessary."

        if name not in self.names:
            self.names[name] = len(self.names)
        return self.names[name]

    def setup_loop(self):
        self.blocks.append(self.position)
        self._write_instruction("SETUP_LOOP", 0) # To be filled in later

    def end_loop(self):
        current_loop_start = self.blocks.pop()
        self.jump_absolute(current_loop_start)
        # NOTE: Using 3 as the assumed length of the SETUP_LOOP instruction.
        self._patch_value(current_loop_start, self.position - current_loop_start - 3)
        self.pop_block()

    def jump_to_label(self, status, name):

        """
        Write a jump to the label 'name' which has not yet been started: an
        unconditional forward jump if 'status' is None, a jump-if-true if
        'status' is a true value, and a jump-if-false otherwise.
        """

        # Record the instruction using the jump.
        jump_instruction = self.position
        if status is None:
            self.jump_forward()
        elif status:
            self.jump_if_true()
        else:
            self.jump_if_false()
        # Record the following instruction, too.
        self.jumps.setdefault(name, []).append((jump_instruction, self.position))

    def start_label(self, name):

        """
        Start the label 'name' at the current position, filling in the relative
        offset of every jump recorded for it. A KeyError is raised if no jump
        refers to the label.
        """

        # Fill in all jump instructions.
        for jump_instruction, following_instruction in self.jumps[name]:
            self._patch_value(jump_instruction, self.position - following_instruction)
        del self.jumps[name]

    def load_const_ret(self, value):
        self.constants_for_exceptions.append(value)
        self.load_const(value)

    def ret(self, index):
        self.load_fast(index)
        # Previously, the constant stored on the stack by jsr/jsr_w was stored
        # in a local variable. In the JVM, extracting the value from the local
        # variable and jumping can be done at runtime. In the Python VM, any
        # jump target must be known in advance and written into the bytecode.
        for constant in self.constants_for_exceptions:
            self.dup_top()              # Stack: actual-address, actual-address
            self.load_const(constant)   # Stack: actual-address, actual-address, suggested-address
            self.compare_op("==")       # Stack: actual-address, result
            self.jump_to_label(0, "const")
            self.pop_top()              # Stack: actual-address
            self.pop_top()              # Stack:
            self.jump_absolute(constant)
            self.start_label("const")
            self.pop_top()              # Stack: actual-address
        # NOTE: If we get here, something is really wrong.
        self.pop_top()                  # Stack:

    def setup_except(self, target):
        self.blocks.append(self.position)
        self.exception_handlers.append(target)
        self._write_instruction("SETUP_EXCEPT", 0) # To be filled in later

    def setup_finally(self, target):
        self.blocks.append(self.position)
        self.exception_handlers.append(target)
        self._write_instruction("SETUP_FINALLY", 0) # To be filled in later

    def end_exception(self):
        current_exception_start = self.blocks.pop()
        # Convert the "lazy" absolute value.
        current_exception_target = self.exception_handlers.pop()
        target = current_exception_target.get_value()
        # NOTE: Using 3 as the assumed length of the SETUP_* instruction.
        self._patch_value(current_exception_start, target - current_exception_start - 3)

    def start_handler(self, exc_name):
        # Where handlers are begun, produce bytecode to test the type of
        # the exception.
        self.dup_top()                      # Stack: exception, exception
        self.load_global(str(exc_name))     # Stack: exception, exception, handled-exception
        self.compare_op("exception match")  # Stack: exception, result
        self.jump_to_label(1, "handler")
        self.pop_top()
        self.end_finally()
        self.start_label("handler")
        self.pop_top()

    # Complicated methods.

    def load_const(self, value):
        self._write_opcode("LOAD_CONST")
        if value not in self.constants:
            self.constants[value] = len(self.constants)
        self._write_value(self.constants[value])
        self.update_stack_depth(1)

    def load_global(self, name):
        self._write_instruction("LOAD_GLOBAL", self._name_index(name), 1)

    def load_attr(self, name):
        self._write_instruction("LOAD_ATTR", self._name_index(name))

    def load_name(self, name):
        self._write_instruction("LOAD_NAME", self._name_index(name), 1)

    def load_fast(self, index):
        self._write_instruction("LOAD_FAST", index, 1)
        self.update_locals(index)

    def store_attr(self, name):
        self._write_instruction("STORE_ATTR", self._name_index(name), -1)

    def store_fast(self, index):
        self._write_instruction("STORE_FAST", index, -1)
        self.update_locals(index)

    # Normal bytecode generators.

    def for_iter(self):
        self.blocks.append(self.position)
        self._write_instruction("FOR_ITER", 0, 1) # To be filled in later

    def jump_if_false(self, offset=0):
        self._write_instruction("JUMP_IF_FALSE", offset) # May be filled in later

    def jump_if_true(self, offset=0):
        self._write_instruction("JUMP_IF_TRUE", offset) # May be filled in later

    def jump_forward(self, offset=0):
        self._write_instruction("JUMP_FORWARD", offset) # May be filled in later

    def jump_absolute(self, address=0):
        self._write_instruction("JUMP_ABSOLUTE", address) # May be filled in later

    def build_tuple(self, count):
        self._write_instruction("BUILD_TUPLE", count, -(count - 1))

    def build_list(self, count):
        self._write_instruction("BUILD_LIST", count, -(count - 1))

    def pop_top(self):
        self._write_instruction("POP_TOP", None, -1)

    def dup_top(self):
        self._write_instruction("DUP_TOP", None, 1)

    def rot_two(self):
        self._write_instruction("ROT_TWO")

    def rot_three(self):
        self._write_instruction("ROT_THREE")

    def rot_four(self):
        self._write_instruction("ROT_FOUR")

    def call_function(self, count):
        self._write_instruction("CALL_FUNCTION", count, -count)

    def binary_subscr(self):
        self._write_instruction("BINARY_SUBSCR", None, -1)

    def binary_add(self):
        self._write_instruction("BINARY_ADD", None, -1)

    def binary_divide(self):
        self._write_instruction("BINARY_DIVIDE", None, -1)

    def binary_multiply(self):
        self._write_instruction("BINARY_MULTIPLY", None, -1)

    def binary_modulo(self):
        self._write_instruction("BINARY_MODULO", None, -1)

    def binary_subtract(self):
        self._write_instruction("BINARY_SUBTRACT", None, -1)

    def binary_and(self):
        self._write_instruction("BINARY_AND", None, -1)

    def binary_or(self):
        # This previously emitted BINARY_XOR, duplicating binary_xor.
        self._write_instruction("BINARY_OR", None, -1)

    def binary_lshift(self):
        self._write_instruction("BINARY_LSHIFT", None, -1)

    def binary_rshift(self):
        self._write_instruction("BINARY_RSHIFT", None, -1)

    def binary_xor(self):
        self._write_instruction("BINARY_XOR", None, -1)

    def compare_op(self, op):

        "Write a comparison using the operator 'op' as found in 'dis.cmp_op'."

        self._write_instruction("COMPARE_OP", list(cmp_op).index(op), -1)

    def return_value(self):
        self._write_instruction("RETURN_VALUE", None, -1)

    def raise_varargs(self, count):
        self._write_instruction("RAISE_VARARGS", count)

    def pop_block(self):
        self._write_instruction("POP_BLOCK")

    def end_finally(self):
        self._write_instruction("END_FINALLY")
paul@11 | 421 | |
paul@6 | 422 | # Utility classes and functions. |
paul@6 | 423 | |
class LazyDict(UserDict):

    """
    A dictionary whose missing entries are created on demand as "lazy" values.

    Reading an absent key stores and returns a new LazyValue for that key.
    Assigning to a key which currently holds a LazyValue sets that object's
    value instead of replacing it, so that references handed out earlier see
    the assigned value.
    """

    def __getitem__(self, key):
        if key not in self.data:
            # NOTE: Assume 16-bit value.
            self.data[key] = LazyValue(2)
        return self.data[key]

    def __setitem__(self, key, value):
        if key in self.data:
            existing_value = self.data[key]
            if isinstance(existing_value, LazyValue):
                # Fill in the placeholder, keeping the same object in place.
                existing_value.set_value(value)
                return
        self.data[key] = value
paul@6 | 437 | |
paul@6 | 438 | class LazyValue: |
paul@8 | 439 | def __init__(self, nvalues): |
paul@8 | 440 | self.values = [] |
paul@8 | 441 | for i in range(0, nvalues): |
paul@8 | 442 | self.values.append(LazySubValue()) |
paul@8 | 443 | def set_value(self, value): |
paul@8 | 444 | # NOTE: Assume at least 16-bit value. No "filling" performed. |
paul@8 | 445 | if value <= 0xffff: |
paul@8 | 446 | self.values[0].set_value(value & 0xff) |
paul@8 | 447 | self.values[1].set_value((value & 0xff00) >> 8) |
paul@8 | 448 | else: |
paul@8 | 449 | # NOTE: EXTENDED_ARG not yet supported. |
paul@8 | 450 | raise ValueError, value |
paul@8 | 451 | def get_value(self): |
paul@8 | 452 | value = 0 |
paul@11 | 453 | values = self.values[:] |
paul@11 | 454 | for i in range(0, len(values)): |
paul@11 | 455 | value = (value << 8) + values.pop().value |
paul@8 | 456 | return value |
paul@8 | 457 | |
class LazySubValue:

    """
    A holder for a single output value which starts at zero and may be set
    after the holder has been placed in the output.
    """

    def __init__(self):
        self.set_value(0)

    def set_value(self, value):

        "Replace the held value with 'value'."

        self.value = value
paul@6 | 463 | |
def signed(value, limit):

    """
    Interpret the unsigned 'value' as a signed integer. The 'limit' is one
    greater than the highest positive integer which can be represented: values
    from 'limit' up to (but excluding) twice 'limit' produce a negative result,
    and all other values are returned unchanged.
    """

    if value // limit != 1:
        return value

    # Flip every bit below twice the limit and negate.
    all_ones = limit * 2 - 1
    return -1 - (value ^ all_ones)
paul@6 | 478 | |
def signed2(value):

    "Return the unsigned 16-bit 'value' as a signed integer."

    limit = 0x8000
    return signed(value, limit)
paul@6 | 481 | |
def signed4(value):

    "Return the unsigned 32-bit 'value' as a signed integer."

    limit = 0x80000000
    return signed(value, limit)
paul@6 | 484 | |
paul@4 | 485 | # Bytecode conversion. |
paul@4 | 486 | |
class BytecodeReader:

    """
    A generic Java bytecode reader.

    Each instruction is dispatched to a method of this object named after the
    instruction's mnemonic. No such methods are defined in this class, so they
    are presumably supplied by subclasses.
    """

    def __init__(self, class_file):
        self.class_file = class_file

        # Mapping from Java bytecode positions to Python bytecode positions,
        # providing "lazy" values for positions not yet reached.
        self.position_mapping = LazyDict()

    def _index_exception_table(self, exception_table):

        """
        Return dictionaries mapping start, end and handler positions to lists
        of the 'exception_table' entries having those positions. Entries are
        listed in the reverse of their order in the table.
        """

        exception_block_start = {}
        exception_block_end = {}
        exception_block_handler = {}
        reversed_exception_table = exception_table[:]
        reversed_exception_table.reverse()

        # Later entries have wider coverage than earlier entries.
        for exception in reversed_exception_table:
            exception_block_start.setdefault(exception.start_pc, []).append(exception)
            exception_block_end.setdefault(exception.end_pc, []).append(exception)
            exception_block_handler.setdefault(exception.handler_pc, []).append(exception)

        return exception_block_start, exception_block_end, exception_block_handler

    def process(self, method, program):

        """
        Process the code of the given 'method', calling the handler for each
        Java instruction with 'program' as the recipient of generated
        instructions, and inserting exception handling constructs into
        'program' at the positions given by the method's exception table.
        """

        self.java_position = 0
        self.in_finally = 0
        self.method = method

        # NOTE: Not guaranteed.
        attribute = method.attributes[0]
        code, exception_table = attribute.code, attribute.exception_table

        # Produce a structure which permits fast access to exception details.
        exception_block_start, exception_block_end, exception_block_handler = \
            self._index_exception_table(exception_table)

        # Process each instruction in the code.
        while self.java_position < len(code):
            self.position_mapping[self.java_position] = program.position

            # Insert exception handling constructs.
            block_starts = exception_block_start.get(self.java_position, [])
            for exception in block_starts:
                # Note that the absolute position is used.
                if exception.catch_type == 0:
                    program.setup_finally(self.position_mapping[exception.handler_pc])
                else:
                    program.setup_except(self.position_mapping[exception.handler_pc])
            if block_starts:
                self.in_finally = 0

            # Insert exception handler details.
            # NOTE: Ensure that pop_block is reachable by possibly inserting it at the start of finally handlers.
            # NOTE: Insert a check for the correct exception at the start of each handler.
            for exception in exception_block_handler.get(self.java_position, []):
                program.end_exception()
                if exception.catch_type == 0:
                    self.in_finally = 1
                else:
                    program.start_handler(self.class_file.constants[exception.catch_type - 1].get_python_name())

            # Process the bytecode at the current position.
            bytecode = ord(code[self.java_position])
            mnemonic, number_of_arguments = self.java_bytecodes[bytecode]
            number_of_arguments = self.process_bytecode(mnemonic, number_of_arguments, code, program)
            next_java_position = self.java_position + 1 + number_of_arguments

            # Insert exception block end details.
            for exception in exception_block_end.get(next_java_position, []):
                # NOTE: Insert jump beyond handlers.
                # NOTE: program.jump_forward/absolute(...)
                # NOTE: Insert end finally at end of handlers as well as where "ret" occurs.
                if exception.catch_type != 0:
                    program.pop_block()

            # Only advance the JVM position after sneaking in extra Python
            # instructions.
            self.java_position = next_java_position

    def process_bytecode(self, mnemonic, number_of_arguments, code, program):

        """
        Call the handler method named 'mnemonic' for the instruction at the
        current Java position in 'code', returning the number of bytes which
        follow the instruction's opcode.

        Where 'number_of_arguments' is not None, the handler is given a list
        of that many byte values together with 'program'. Otherwise, the
        handler is given the remainder of 'code' after the opcode together
        with 'program', and the handler's own result is returned.
        """

        if number_of_arguments is None:
            # Call the handler, which determines the number of arguments.
            return getattr(self, mnemonic)(code[self.java_position+1:], program)

        first_argument = self.java_position + 1
        arguments = [ord(code[first_argument + j]) for j in range(0, number_of_arguments)]

        # Call the handler.
        getattr(self, mnemonic)(arguments, program)
        return number_of_arguments

    java_bytecodes = {
        # code : (mnemonic, number of following bytes or None where variable)
        0 : ("nop", 0),
        1 : ("aconst_null", 0),
        2 : ("iconst_m1", 0),
        3 : ("iconst_0", 0),
        4 : ("iconst_1", 0),
        5 : ("iconst_2", 0),
        6 : ("iconst_3", 0),
        7 : ("iconst_4", 0),
        8 : ("iconst_5", 0),
        9 : ("lconst_0", 0),
        10 : ("lconst_1", 0),
        11 : ("fconst_0", 0),
        12 : ("fconst_1", 0),
        13 : ("fconst_2", 0),
        14 : ("dconst_0", 0),
        15 : ("dconst_1", 0),
        16 : ("bipush", 1),
        17 : ("sipush", 2),
        18 : ("ldc", 1),
        19 : ("ldc_w", 2),
        20 : ("ldc2_w", 2),
        21 : ("iload", 1),
        22 : ("lload", 1),
        23 : ("fload", 1),
        24 : ("dload", 1),
        25 : ("aload", 1),
        26 : ("iload_0", 0),
        27 : ("iload_1", 0),
        28 : ("iload_2", 0),
        29 : ("iload_3", 0),
        30 : ("lload_0", 0),
        31 : ("lload_1", 0),
        32 : ("lload_2", 0),
        33 : ("lload_3", 0),
        34 : ("fload_0", 0),
        35 : ("fload_1", 0),
        36 : ("fload_2", 0),
        37 : ("fload_3", 0),
        38 : ("dload_0", 0),
        39 : ("dload_1", 0),
        40 : ("dload_2", 0),
        41 : ("dload_3", 0),
        42 : ("aload_0", 0),
        43 : ("aload_1", 0),
        44 : ("aload_2", 0),
        45 : ("aload_3", 0),
        46 : ("iaload", 0),
        47 : ("laload", 0),
        48 : ("faload", 0),
        49 : ("daload", 0),
        50 : ("aaload", 0),
        51 : ("baload", 0),
        52 : ("caload", 0),
        53 : ("saload", 0),
        54 : ("istore", 1),
        55 : ("lstore", 1),
        56 : ("fstore", 1),
        57 : ("dstore", 1),
        58 : ("astore", 1),
        59 : ("istore_0", 0),
        60 : ("istore_1", 0),
        61 : ("istore_2", 0),
        62 : ("istore_3", 0),
        63 : ("lstore_0", 0),
        64 : ("lstore_1", 0),
        65 : ("lstore_2", 0),
        66 : ("lstore_3", 0),
        67 : ("fstore_0", 0),
        68 : ("fstore_1", 0),
        69 : ("fstore_2", 0),
        70 : ("fstore_3", 0),
        71 : ("dstore_0", 0),
        72 : ("dstore_1", 0),
        73 : ("dstore_2", 0),
        74 : ("dstore_3", 0),
        75 : ("astore_0", 0),
        76 : ("astore_1", 0),
        77 : ("astore_2", 0),
        78 : ("astore_3", 0),
        79 : ("iastore", 0),
        80 : ("lastore", 0),
        81 : ("fastore", 0),
        82 : ("dastore", 0),
        83 : ("aastore", 0),
        84 : ("bastore", 0),
        85 : ("castore", 0),
        86 : ("sastore", 0),
        87 : ("pop", 0),
        88 : ("pop2", 0),
        89 : ("dup", 0),
        90 : ("dup_x1", 0),
        91 : ("dup_x2", 0),
        92 : ("dup2", 0),
        93 : ("dup2_x1", 0),
        94 : ("dup2_x2", 0),
        95 : ("swap", 0),
        96 : ("iadd", 0),
        97 : ("ladd", 0),
        98 : ("fadd", 0),
        99 : ("dadd", 0),
        100 : ("isub", 0),
        101 : ("lsub", 0),
        102 : ("fsub", 0),
        103 : ("dsub", 0),
        104 : ("imul", 0),
        105 : ("lmul", 0),
        106 : ("fmul", 0),
        107 : ("dmul", 0),
        108 : ("idiv", 0),
        109 : ("ldiv", 0),
        110 : ("fdiv", 0),
        111 : ("ddiv", 0),
        112 : ("irem", 0),
        113 : ("lrem", 0),
        114 : ("frem", 0),
        115 : ("drem", 0),
        116 : ("ineg", 0),
        117 : ("lneg", 0),
        118 : ("fneg", 0),
        119 : ("dneg", 0),
        120 : ("ishl", 0),
        121 : ("lshl", 0),
        122 : ("ishr", 0),
        123 : ("lshr", 0),
        124 : ("iushr", 0),
        125 : ("lushr", 0),
        126 : ("iand", 0),
        127 : ("land", 0),
        128 : ("ior", 0),
        129 : ("lor", 0),
        130 : ("ixor", 0),
        131 : ("lxor", 0),
        132 : ("iinc", 2),
        133 : ("i2l", 0),
        134 : ("i2f", 0),
        135 : ("i2d", 0),
        136 : ("l2i", 0),
        137 : ("l2f", 0),
        138 : ("l2d", 0),
        139 : ("f2i", 0),
        140 : ("f2l", 0),
        141 : ("f2d", 0),
        142 : ("d2i", 0),
        143 : ("d2l", 0),
        144 : ("d2f", 0),
        145 : ("i2b", 0),
        146 : ("i2c", 0),
        147 : ("i2s", 0),
        148 : ("lcmp", 0),
        149 : ("fcmpl", 0),
        150 : ("fcmpg", 0),
        151 : ("dcmpl", 0),
        152 : ("dcmpg", 0),
        153 : ("ifeq", 2),
        154 : ("ifne", 2),
        155 : ("iflt", 2),
        156 : ("ifge", 2),
        157 : ("ifgt", 2),
        158 : ("ifle", 2),
        159 : ("if_icmpeq", 2),
        160 : ("if_icmpne", 2),
        161 : ("if_icmplt", 2),
        162 : ("if_icmpge", 2),
        163 : ("if_icmpgt", 2),
        164 : ("if_icmple", 2),
        165 : ("if_acmpeq", 2),
        166 : ("if_acmpne", 2),
        167 : ("goto", 2),
        168 : ("jsr", 2),
        169 : ("ret", 1),
        170 : ("tableswitch", None), # variable number of arguments
        171 : ("lookupswitch", None), # variable number of arguments
        172 : ("ireturn", 0),
        173 : ("lreturn", 0),
        174 : ("freturn", 0),
        175 : ("dreturn", 0),
        176 : ("areturn", 0),
        177 : ("return_", 0),
        178 : ("getstatic", 2),
        179 : ("putstatic", 2),
        180 : ("getfield", 2),
        181 : ("putfield", 2),
        182 : ("invokevirtual", 2),
        183 : ("invokespecial", 2),
        184 : ("invokestatic", 2),
        185 : ("invokeinterface", 4),
        187 : ("new", 2),
        188 : ("newarray", 1),
        189 : ("anewarray", 2),
        190 : ("arraylength", 0),
        191 : ("athrow", 0),
        192 : ("checkcast", 2),
        193 : ("instanceof", 2),
        194 : ("monitorenter", 0),
        195 : ("monitorexit", 0),
        196 : ("wide", None), # 3 or 5 arguments, stack changes according to modified element
        197 : ("multianewarray", 3),
        198 : ("ifnull", 2),
        199 : ("ifnonnull", 2),
        200 : ("goto_w", 4),
        201 : ("jsr_w", 4),
        }
paul@5 | 786 | |
paul@7 | 787 | class BytecodeDisassembler(BytecodeReader): |
paul@7 | 788 | |
paul@7 | 789 | "A Java bytecode disassembler." |
paul@7 | 790 | |
paul@7 | 791 | bytecode_methods = [spec[0] for spec in BytecodeReader.java_bytecodes.values()] |
paul@7 | 792 | |
paul@7 | 793 | def __getattr__(self, name): |
paul@7 | 794 | if name in self.bytecode_methods: |
paul@18 | 795 | print "%5s %s" % (self.java_position, name), |
paul@7 | 796 | return self.generic |
paul@7 | 797 | else: |
paul@7 | 798 | raise AttributeError, name |
paul@7 | 799 | |
paul@7 | 800 | def generic(self, arguments, program): |
paul@7 | 801 | print arguments |
paul@7 | 802 | |
paul@7 | 803 | class BytecodeDisassemblerProgram: |
paul@7 | 804 | position = 0 |
paul@11 | 805 | def setup_except(self, target): |
paul@11 | 806 | print "(setup_except %s)" % target |
paul@11 | 807 | def setup_finally(self, target): |
paul@11 | 808 | print "(setup_finally %s)" % target |
paul@11 | 809 | def end_exception(self): |
paul@11 | 810 | print "(end_exception)" |
paul@24 | 811 | def start_handler(self, exc_name): |
paul@24 | 812 | print "(start_handler %s)" % exc_name |
paul@11 | 813 | def pop_block(self): |
paul@11 | 814 | print "(pop_block)" |
paul@7 | 815 | |
paul@7 | 816 | class BytecodeTranslator(BytecodeReader): |
paul@7 | 817 | |
paul@7 | 818 | "A Java bytecode translator which uses a Python bytecode writer." |
paul@7 | 819 | |
def aaload(self, arguments, program):
    "Translate an array element load into a Python subscript operation."
    # NOTE: Neither the array nor the index is type-checked.
    emit_subscript = program.binary_subscr
    emit_subscript()
paul@7 | 823 | |
def aastore(self, arguments, program):
    "Translate an array element store into a Python subscript assignment."
    # NOTE: Neither the array, the index nor the value is type-checked.
    # Incoming stack: arrayref, index, value
    program.rot_three()                 # Now: value, arrayref, index
    program.store_subscr()
paul@7 | 829 | |
def aconst_null(self, arguments, program):
    "Push None as the equivalent of the Java null reference."
    null_value = None
    program.load_const(null_value)
paul@7 | 832 | |
def aload(self, arguments, program):
    "Push the local variable whose index is given by the first argument."
    slot = arguments[0]
    program.load_fast(slot)
paul@7 | 835 | |
def aload_0(self, arguments, program):
    "Push local variable 0."
    slot = 0
    program.load_fast(slot)
paul@7 | 838 | |
def aload_1(self, arguments, program):
    "Push local variable 1."
    slot = 1
    program.load_fast(slot)
paul@7 | 841 | |
def aload_2(self, arguments, program):
    "Push local variable 2."
    slot = 2
    program.load_fast(slot)
paul@7 | 844 | |
def aload_3(self, arguments, program):
    "Push local variable 3."
    slot = 3
    program.load_fast(slot)
paul@7 | 847 | |
def anewarray(self, arguments, program):
    "Create a new array of references using the shared array-building code."
    # NOTE: NegativeArraySizeException is never raised.
    # NOTE: The constant pool index is decoded but not used to type the list/array.
    high, low = arguments[0], arguments[1]
    index = (high << 8) + low
    self._newarray(program)
paul@7 | 853 | |
def _newarray(self, program):
    "Emit code which builds a list and appends None to it once per value of range(0, count)."
    # The stack comments show the newest item last; the count is expected on
    # the stack before this code runs.
    program.build_list()                # Stack: count, list
    program.rot_two()                   # Stack: list, count
    program.setup_loop()
    program.load_global("range")
    program.load_const(0)               # Stack: list, count, range, 0
    program.rot_three()                 # Stack: list, 0, count, range
    program.rot_three()                 # Stack: list, range, 0, count
    program.call_function(2)            # Stack: list, range_list
    program.get_iter()                  # Stack: list, iter
    program.for_iter()                  # Stack: list, iter, value
    # The loop value itself is not needed; only the number of iterations matters.
    program.pop_top()                   # Stack: list, iter
    program.rot_two()                   # Stack: iter, list
    program.dup_top()                   # Stack: iter, list, list
    program.load_attr("append")         # Stack: iter, list, append
    program.load_const(None)            # Stack: iter, list, append, None
    program.call_function(1)            # Stack: iter, list, None
    program.pop_top()                   # Stack: iter, list
    # Restore the order expected at the top of the loop.
    program.rot_two()                   # Stack: list, iter
    program.end_loop()                  # Back to for_iter above
paul@7 | 874 | |
def areturn(self, arguments, program):
    "Return the value at the top of the stack."
    emit_return = program.return_value
    emit_return()
paul@7 | 877 | |
def arraylength(self, arguments, program):
    "Replace the array reference on the stack with the result of len()."
    builtin_name = "len"
    program.load_global(builtin_name)   # Stack: arrayref, len
    program.rot_two()                   # Stack: len, arrayref
    program.call_function(1)
paul@7 | 882 | |
def astore(self, arguments, program):
    "Store the top of the stack in the local variable given by the first argument."
    slot = arguments[0]
    program.store_fast(slot)
paul@7 | 885 | |
def astore_0(self, arguments, program):
    "Store the top of the stack in local variable 0."
    slot = 0
    program.store_fast(slot)
paul@7 | 888 | |
def astore_1(self, arguments, program):
    "Store the top of the stack in local variable 1."
    slot = 1
    program.store_fast(slot)
paul@7 | 891 | |
def astore_2(self, arguments, program):
    "Store the top of the stack in local variable 2."
    slot = 2
    program.store_fast(slot)
paul@7 | 894 | |
def astore_3(self, arguments, program):
    "Store the top of the stack in local variable 3."
    slot = 3
    program.store_fast(slot)
paul@7 | 897 | |
def athrow(self, arguments, program):
    "Raise the exception object found at the top of the stack."
    # NOTE: A null/None reference on the stack does not cause
    # NOTE: NullPointerException to be raised.
    if not self.in_finally:
        program.dup_top()
        program.raise_varargs(1)
    else:
        # Within a finally handler, end_finally is emitted in place of a raise.
        program.end_finally()
paul@7 | 906 | |
# The byte/boolean array instructions reuse the reference array translations.
baload = aaload
bastore = aastore
paul@7 | 909 | |
def bipush(self, arguments, program):

    """
    Push the byte operand as an integer constant.

    The operand is interpreted as a signed byte, so that raw values from 128
    to 255 become -128 to -1. Values which are already negative are left
    unchanged.
    """

    value = arguments[0]
    # Sign-extend: the operand of bipush is a signed byte in the Java
    # specification, whereas the raw operand appears to be an unsigned value
    # here (other instructions apply signed2/signed4 to their operands).
    if value >= 0x80:
        value -= 0x100
    program.load_const(value)
paul@7 | 912 | |
# The char array instructions reuse the reference array translations.
caload = aaload
castore = aastore
paul@7 | 915 | |
def checkcast(self, arguments, program):
    "Emit an isinstance() test of the object at the top of the stack against the referenced class."
    # The two argument bytes form an index into the constant pool.
    index = (arguments[0] << 8) + arguments[1]
    target_name = self.class_file.constants[index - 1].get_python_name()
    # NOTE: Using the string version of the name which may contain incompatible characters.
    target_components = str(target_name).split("/")

    program.dup_top()                   # Stack: objectref, objectref
    program.load_global("isinstance")   # Stack: objectref, objectref, isinstance
    program.rot_two()                   # Stack: objectref, isinstance, objectref
    # Load the class by following the name components as attributes.
    program.load_global(target_components[0])
    for target_component in target_components[1:]:
        program.load_attr(target_component)
    program.call_function(2)            # Stack: objectref, result
    # NOTE(review): The isinstance result is neither tested nor removed here, so
    # NOTE(review): no exception is raised for a failed cast and an extra value
    # NOTE(review): appears to remain on the stack - confirm against the writer.
paul@7 | 929 | |
def d2f(self, arguments, program):
    "Emit nothing: no conversion code is generated from double to float."
    return None
paul@7 | 932 | |
def d2i(self, arguments, program):
    "Convert the value at the top of the stack using int()."
    converter = "int"
    program.load_global(converter)      # Stack: value, int
    program.rot_two()                   # Stack: int, value
    program.call_function(1)            # Stack: result
paul@7 | 937 | |
# Conversion to long uses the same int() call as conversion to int.
d2l = d2i # Preserving Java semantics
paul@7 | 939 | |
def dadd(self, arguments, program):
    "Add the top two stack values."
    # NOTE: The operands are not type-checked.
    emit_add = program.binary_add
    emit_add()
paul@7 | 943 | |
# The double array instructions reuse the reference array translations.
daload = aaload
dastore = aastore
paul@7 | 946 | |
def dcmpg(self, arguments, program):
    "Compare the top two stack values using the '>' operator."
    # NOTE: The operands are not type-checked.
    operator = ">"
    program.compare_op(operator)
paul@7 | 950 | |
def dcmpl(self, arguments, program):
    "Compare the top two stack values using the '<' operator."
    # NOTE: The operands are not type-checked.
    operator = "<"
    program.compare_op(operator)
paul@7 | 954 | |
def dconst_0(self, arguments, program):
    "Push the floating point constant 0.0."
    value = 0.0
    program.load_const(value)
paul@7 | 957 | |
def dconst_1(self, arguments, program):
    "Push the floating point constant 1.0."
    value = 1.0
    program.load_const(value)
paul@7 | 960 | |
def ddiv(self, arguments, program):
    "Divide the second stack value by the top stack value."
    # NOTE: The operands are not type-checked.
    emit_divide = program.binary_divide
    emit_divide()
paul@7 | 964 | |
# Doubles are loaded from local variables exactly as references are.
dload = aload
dload_0 = aload_0
dload_1 = aload_1
dload_2 = aload_2
dload_3 = aload_3
paul@7 | 970 | |
def dmul(self, arguments, program):
    "Multiply the top two stack values."
    # NOTE: The operands are not type-checked.
    emit_multiply = program.binary_multiply
    emit_multiply()
paul@7 | 974 | |
def dneg(self, arguments, program):
    "Negate the value at the top of the stack."
    # NOTE: The operand is not type-checked.
    emit_negate = program.unary_negative
    emit_negate()
paul@7 | 978 | |
def drem(self, arguments, program):
    "Apply the modulo operation to the top two stack values."
    # NOTE: The operands are not type-checked.
    emit_modulo = program.binary_modulo
    emit_modulo()
paul@7 | 982 | |
# Doubles are returned and stored exactly as references are.
dreturn = areturn
dstore = astore
dstore_0 = astore_0
dstore_1 = astore_1
dstore_2 = astore_2
dstore_3 = astore_3
paul@7 | 989 | |
def dsub(self, arguments, program):
    "Subtract the top stack value from the second stack value."
    # NOTE: The operands are not type-checked.
    emit_subtract = program.binary_subtract
    emit_subtract()
paul@7 | 993 | |
def dup(self, arguments, program):
    "Duplicate the value at the top of the stack."
    emit_duplicate = program.dup_top
    emit_duplicate()
paul@7 | 996 | |
def dup_x1(self, arguments, program):
    "Duplicate the top stack value, placing the copy beneath the second value."
    # NOTE: Computational type categories are ignored.
    for emit in (program.dup_top, program.rot_three):
        emit()
paul@7 | 1001 | |
def dup_x2(self, arguments, program):
    "Duplicate the top stack value, placing the copy beneath the third value."
    # NOTE: Computational type categories are ignored.
    for emit in (program.dup_top, program.rot_four):
        emit()
paul@7 | 1006 | |
# The two-slot duplication instructions are mapped directly to their
# single-value counterparts.
dup2 = dup # Ignoring computational type categories
dup2_x1 = dup_x1 # Ignoring computational type categories
dup2_x2 = dup_x2 # Ignoring computational type categories
paul@7 | 1010 | |
def f2d(self, arguments, program):
    "Emit nothing: no conversion code is generated from float to double."
    # Preserving Java semantics
    return None
paul@7 | 1013 | |
def f2i(self, arguments, program):
    "Convert the value at the top of the stack using int()."
    converter = "int"
    program.load_global(converter)      # Stack: value, int
    program.rot_two()                   # Stack: int, value
    program.call_function(1)            # Stack: result
paul@7 | 1018 | |
# The float instructions below share the translations of their double (or
# int conversion) counterparts.
f2l = f2i # Preserving Java semantics
fadd = dadd
faload = daload
fastore = dastore
fcmpg = dcmpg
fcmpl = dcmpl
fconst_0 = dconst_0
fconst_1 = dconst_1
paul@7 | 1027 | |
def fconst_2(self, arguments, program):
    "Push the floating point constant 2.0."
    value = 2.0
    program.load_const(value)
paul@7 | 1030 | |
# The remaining float arithmetic, load, return and store instructions share
# the translations of their double counterparts.
fdiv = ddiv
fload = dload
fload_0 = dload_0
fload_1 = dload_1
fload_2 = dload_2
fload_3 = dload_3
fmul = dmul
fneg = dneg
frem = drem
freturn = dreturn
fstore = dstore
fstore_0 = dstore_0
fstore_1 = dstore_1
fstore_2 = dstore_2
fstore_3 = dstore_3
fsub = dsub
paul@7 | 1047 | |
def getfield(self, arguments, program):
    "Replace the object reference on the stack with the value of the referenced field."
    high, low = arguments[0], arguments[1]
    pool_index = (high << 8) + low
    field = self.class_file.constants[pool_index - 1]
    # NOTE: The string version of the name is used and may contain incompatible characters.
    program.load_attr(str(field.get_python_name()))
paul@7 | 1053 | |
def getstatic(self, arguments, program):
    "Push the value of the referenced static field, found via self.__class__."
    high, low = arguments[0], arguments[1]
    pool_index = (high << 8) + low
    field_name = self.class_file.constants[pool_index - 1].get_python_name()
    # The class of the current object provides access to the static field.
    program.load_name("self")
    program.load_attr("__class__")
    # NOTE: The string version of the name is used and may contain incompatible characters.
    program.load_attr(str(field_name))
paul@7 | 1061 | |
def goto(self, arguments, program):
    "Jump to the Python position corresponding to the signed 16-bit branch offset."
    raw_offset = (arguments[0] << 8) + arguments[1]
    destination = self.java_position + signed2(raw_offset)
    program.jump_absolute(self.position_mapping[destination])
paul@7 | 1066 | |
def goto_w(self, arguments, program):
    "Jump to the Python position corresponding to the signed 32-bit branch offset."
    raw_offset = (arguments[0] << 24) + (arguments[1] << 16) + (arguments[2] << 8) + arguments[3]
    destination = self.java_position + signed4(raw_offset)
    program.jump_absolute(self.position_mapping[destination])
paul@7 | 1071 | |
def i2b(self, arguments, program):
    "Emit nothing: no conversion code is generated from int to byte."
    return None
paul@7 | 1074 | |
def i2c(self, arguments, program):
    "Convert the value at the top of the stack using chr()."
    converter = "chr"
    program.load_global(converter)      # Stack: value, chr
    program.rot_two()                   # Stack: chr, value
    program.call_function(1)            # Stack: result
paul@7 | 1079 | |
def i2d(self, arguments, program):
    "Convert the value at the top of the stack using float()."
    converter = "float"
    program.load_global(converter)      # Stack: value, float
    program.rot_two()                   # Stack: float, value
    program.call_function(1)            # Stack: result
paul@7 | 1084 | |
# Conversion to float uses the same float() call as conversion to double.
i2f = i2d # Not distinguishing between float and double
paul@7 | 1086 | |
def i2l(self, arguments, program):
    "Emit nothing: no conversion code is generated from int to long."
    # Preserving Java semantics
    return None
paul@7 | 1089 | |
def i2s(self, arguments, program):
    "Emit nothing: no conversion code is generated from int to short."
    # Not distinguishing between int and short
    return None
paul@7 | 1092 | |
# Integer addition and array loading share the float translations.
iadd = fadd
iaload = faload
paul@7 | 1095 | |
def iand(self, arguments, program):
    "Combine the top two stack values using bitwise and."
    # NOTE: The operands are not type-checked.
    emit_and = program.binary_and
    emit_and()
paul@7 | 1099 | |
# Integer array storing shares the float translation.
iastore = fastore
paul@7 | 1101 | |
def iconst_m1(self, arguments, program):
    "Push the integer constant -1."
    value = -1
    program.load_const(value)
paul@7 | 1104 | |
def iconst_0(self, arguments, program):
    "Push the integer constant 0."
    value = 0
    program.load_const(value)
paul@7 | 1107 | |
def iconst_1(self, arguments, program):
    "Push the integer constant 1."
    value = 1
    program.load_const(value)
paul@7 | 1110 | |
def iconst_2(self, arguments, program):
    "Push the integer constant 2."
    value = 2
    program.load_const(value)
paul@7 | 1113 | |
def iconst_3(self, arguments, program):
    "Push the integer constant 3."
    value = 3
    program.load_const(value)
paul@7 | 1116 | |
def iconst_4(self, arguments, program):
    "Push the integer constant 4."
    value = 4
    program.load_const(value)
paul@7 | 1119 | |
def iconst_5(self, arguments, program):
    "Push the integer constant 5."
    value = 5
    program.load_const(value)
paul@7 | 1122 | |
# Integer division shares the float translation.
idiv = fdiv
paul@7 | 1124 | |
def _if_xcmpx(self, arguments, program, op):
    "Compare the top two stack values using 'op' and branch to the encoded target if the comparison holds."
    branch_offset = signed2((arguments[0] << 8) + arguments[1])
    destination = self.java_position + branch_offset
    program.compare_op(op)
    program.jump_to_label(0, "next")    # bypass the branch when the result is false
    # Branch taken: discard the comparison result before jumping.
    program.pop_top()
    program.jump_absolute(self.position_mapping[destination])
    # Branch not taken: discard the comparison result and continue.
    program.start_label("next")
    program.pop_top()
paul@7 | 1134 | |
def if_acmpeq(self, arguments, program):
    "Branch if the top two references are the same object."
    # NOTE: The operands are not type-checked.
    comparison = "is"
    self._if_xcmpx(arguments, program, comparison)
paul@7 | 1138 | |
def if_acmpne(self, arguments, program):
    "Branch if the top two references are not the same object."
    # NOTE: The operands are not type-checked.
    comparison = "is not"
    self._if_xcmpx(arguments, program, comparison)
paul@7 | 1142 | |
def if_icmpeq(self, arguments, program):
    "Branch if the top two values are equal."
    # NOTE: The operands are not type-checked.
    comparison = "=="
    self._if_xcmpx(arguments, program, comparison)
paul@7 | 1146 | |
def if_icmpne(self, arguments, program):
    "Branch if the top two values are not equal."
    # NOTE: The operands are not type-checked.
    comparison = "!="
    self._if_xcmpx(arguments, program, comparison)
paul@7 | 1150 | |
def if_icmplt(self, arguments, program):
    "Branch if the second value is less than the top value."
    # NOTE: The operands are not type-checked.
    comparison = "<"
    self._if_xcmpx(arguments, program, comparison)
paul@7 | 1154 | |
def if_icmpge(self, arguments, program):
    "Branch if the second value is greater than or equal to the top value."
    # NOTE: The operands are not type-checked.
    comparison = ">="
    self._if_xcmpx(arguments, program, comparison)
paul@7 | 1158 | |
def if_icmpgt(self, arguments, program):
    "Branch if the second value is greater than the top value."
    # NOTE: The operands are not type-checked.
    comparison = ">"
    self._if_xcmpx(arguments, program, comparison)
paul@7 | 1162 | |
def if_icmple(self, arguments, program):
    "Branch if the second value is less than or equal to the top value."
    # NOTE: The operands are not type-checked.
    comparison = "<="
    self._if_xcmpx(arguments, program, comparison)
paul@7 | 1166 | |
def ifeq(self, arguments, program):
    "Branch if the top value is equal to zero."
    # NOTE: The operand is not type-checked.
    zero = 0
    program.load_const(zero)
    self._if_xcmpx(arguments, program, "==")
paul@7 | 1171 | |
def ifne(self, arguments, program):
    "Branch if the top value is not equal to zero."
    # NOTE: The operand is not type-checked.
    zero = 0
    program.load_const(zero)
    self._if_xcmpx(arguments, program, "!=")
paul@7 | 1176 | |
def iflt(self, arguments, program):
    "Branch if the top value is less than zero."
    # NOTE: The operand is not type-checked.
    zero = 0
    program.load_const(zero)
    self._if_xcmpx(arguments, program, "<")
paul@7 | 1181 | |
def ifge(self, arguments, program):
    "Branch if the top value is greater than or equal to zero."
    # NOTE: The operand is not type-checked.
    zero = 0
    program.load_const(zero)
    self._if_xcmpx(arguments, program, ">=")
paul@7 | 1186 | |
def ifgt(self, arguments, program):
    "Branch if the top value is greater than zero."
    # NOTE: The operand is not type-checked.
    zero = 0
    program.load_const(zero)
    self._if_xcmpx(arguments, program, ">")
paul@7 | 1191 | |
def ifle(self, arguments, program):
    "Branch if the top value is less than or equal to zero."
    # NOTE: The operand is not type-checked.
    zero = 0
    program.load_const(zero)
    self._if_xcmpx(arguments, program, "<=")
paul@7 | 1196 | |
def ifnonnull(self, arguments, program):
    "Branch if the top value is not None."
    # NOTE: The operand is not type-checked.
    null_value = None
    program.load_const(null_value)
    self._if_xcmpx(arguments, program, "is not")
paul@7 | 1201 | |
def ifnull(self, arguments, program):
    "Branch if the top value is None."
    # NOTE: The operand is not type-checked.
    null_value = None
    program.load_const(null_value)
    self._if_xcmpx(arguments, program, "is")
paul@7 | 1206 | |
def iinc(self, arguments, program):

    """
    Increment a local variable by a constant, storing the result in the
    same variable.

    The first argument is the local variable index; the second is the
    increment, interpreted as a signed byte so that raw values from 128 to
    255 become -128 to -1.
    """

    # NOTE: No type checking performed.
    index = arguments[0]
    increment = arguments[1]
    # Sign-extend: the increment is a signed byte in the Java specification,
    # whereas the raw operand appears to be an unsigned value here (other
    # instructions apply signed2/signed4 to their operands).
    if increment >= 0x80:
        increment -= 0x100
    program.load_fast(index)
    program.load_const(increment)
    program.binary_add()
    # Write the sum back: iinc updates the variable and leaves the operand
    # stack unchanged, so the result must not remain on the stack.
    program.store_fast(index)
paul@7 | 1212 | |
# Integer loads, multiplication and negation share the float translations.
iload = fload
iload_0 = fload_0
iload_1 = fload_1
iload_2 = fload_2
iload_3 = fload_3
imul = fmul
ineg = fneg
paul@7 | 1220 | |
def instanceof(self, arguments, program):
    "Replace the object reference on the stack with the result of isinstance() for the referenced class."
    pool_index = (arguments[0] << 8) + arguments[1]
    class_name = self.class_file.constants[pool_index - 1].get_python_name()
    # NOTE: The string version of the name is used and may contain incompatible characters.
    components = str(class_name).split("/")
    first, rest = components[0], components[1:]

    program.load_global("isinstance")   # Stack: objectref, isinstance
    program.rot_two()                   # Stack: isinstance, objectref
    # Find the class by following the name components as attributes.
    program.load_global(first)
    for component in rest:
        program.load_attr(component)
    program.call_function(2)            # Stack: result
paul@7 | 1233 | |
paul@7 | 1234 | def _invoke(self, target_name, program): |
paul@7 | 1235 | # NOTE: Using the string version of the name which may contain incompatible characters. |
paul@7 | 1236 | program.load_attr(str(target_name)) # Stack: tuple, method |
paul@7 | 1237 | program.rot_two() # Stack: method, tuple |
paul@7 | 1238 | program.load_global("apply") # Stack: method, tuple, apply |
paul@7 | 1239 | program.rot_three() # Stack: apply, method, tuple |
paul@7 | 1240 | program.call_function(2) |
paul@7 | 1241 | |
def invokeinterface(self, arguments, program):

    """
    Invoke the referenced interface method on an object.

    The first two arguments form the constant pool index of the method; the
    third is the count operand. The method arguments on the stack are
    gathered into a tuple and the method is called via _invoke.
    """

    # NOTE: This implementation does not perform the necessary checks for
    # NOTE: signature-based polymorphism.
    # NOTE: Java rules not specifically obeyed.
    index = (arguments[0] << 8) + arguments[1]
    # The count operand includes the object reference itself, so the number
    # of values to gather into the argument tuple is one less. Using the
    # count directly would place the object reference inside the tuple.
    # NOTE(review): Long and double arguments occupy two units of the count
    # NOTE(review): in the Java specification; this is not accounted for.
    count = arguments[2] - 1
    target_name = self.class_file.constants[index - 1].get_python_name()
    # Stack: objectref, arg1, arg2, ...
    program.build_tuple(count)          # Stack: objectref, tuple
    program.rot_two()                   # Stack: tuple, objectref
    self._invoke(target_name, program)
paul@7 | 1253 | |
def invokespecial(self, arguments, program):

    """
    Invoke the referenced method, choosing one of three strategies:

    Within a method named "__init__", the method is looked up on the first
    base class of the current class, or nothing is called if the class has
    no bases. Otherwise, if the target is named "__init__", the class found
    on the stack is called with the arguments via apply(). Otherwise, the
    method is invoked on the object reference via _invoke.
    """

    # NOTE: This implementation does not perform the necessary checks for
    # NOTE: signature-based polymorphism.
    # NOTE: Java rules not specifically obeyed.
    index = (arguments[0] << 8) + arguments[1]
    target = self.class_file.constants[index - 1]
    target_name = target.get_python_name()
    # Get the number of parameters from the descriptor.
    count = len(target.get_descriptor()[0])

    # Check for the method name and invoke superclasses where appropriate.
    if str(self.method.get_python_name()) == "__init__":
        # The extra tuple element takes in the object reference along with the arguments.
        program.build_tuple(count + 1)  # Stack: tuple
        # Must use the actual class.
        # NOTE: Verify this.
        program.load_global(str(self.class_file.this_class.get_python_name()))
                                        # Stack: tuple, classref
        program.load_attr("__bases__")  # Stack: tuple, bases
        program.dup_top()               # Stack: tuple, bases, bases
        program.load_global("len")      # Stack: tuple, bases, bases, len
        program.rot_two()               # Stack: tuple, bases, len, bases
        program.call_function(1)        # Stack: tuple, bases, #bases
        program.load_const(0)           # Stack: tuple, bases, #bases, 0
        program.compare_op("==")        # Stack: tuple, bases, result
        # Presumably jumps when the result is true (no base classes) - confirm against the writer.
        program.jump_to_label(1, "next")
        program.pop_top()               # Stack: tuple, bases
        program.load_const(0)           # Stack: tuple, bases, 0
        program.binary_subscr()         # Stack: tuple, bases[0]
        self._invoke(target_name, program)
        program.jump_to_label(None, "next2")
        # No base classes: discard everything without calling anything.
        program.start_label("next")
        program.pop_top()               # Stack: tuple, bases
        program.pop_top()               # Stack: tuple
        program.pop_top()               # Stack:
        program.start_label("next2")

    elif str(target_name) == "__init__":
        # NOTE: Due to changes with the new instruction's implementation, the
        # NOTE: stack differs from that stated: objectref, arg1, arg2, ...
        # Stack: classref, arg1, arg2, ...
        program.build_tuple(count)      # Stack: classref, tuple
                                        # NOTE: Stack: objectref, tuple
        program.load_global("apply")    # Stack: classref, tuple, apply
        program.rot_three()             # Stack: apply, classref, tuple
        program.call_function(2)

    else:
        program.build_tuple(count)      # Stack: objectref, tuple
        program.rot_two()               # Stack: tuple, objectref
        self._invoke(target_name, program)
paul@15 | 1304 | |
paul@15 | 1305 | """ |
paul@15 | 1306 | def invokespecial(self, arguments, program): |
paul@15 | 1307 | # NOTE: This implementation does not perform the necessary checks for |
paul@15 | 1308 | # NOTE: signature-based polymorphism. |
paul@15 | 1309 | # NOTE: Java rules not specifically obeyed. |
paul@15 | 1310 | index = (arguments[0] << 8) + arguments[1] |
paul@15 | 1311 | target = self.class_file.constants[index - 1] |
paul@15 | 1312 | target_name = target.get_python_name() |
paul@15 | 1313 | # Get the number of parameters from the descriptor. |
paul@15 | 1314 | count = len(target.get_descriptor()[0]) |
paul@15 | 1315 | # Stack: objectref, arg1, arg2, ... |
paul@8 | 1316 | program.build_tuple(count + 1) # Stack: tuple |
paul@8 | 1317 | # Use the class to provide access to static methods. |
paul@8 | 1318 | program.load_name("self") # Stack: tuple, self |
paul@8 | 1319 | program.load_attr("__class__") # Stack: tuple, class |
paul@8 | 1320 | program.load_attr("__bases__") # Stack: tuple, base-classes |
paul@8 | 1321 | program.dup_top() # Stack: tuple, base-classes, base-classes |
paul@8 | 1322 | program.load_global("len") # Stack: tuple, base-classes, base-classes, len |
paul@8 | 1323 | program.rot_two() # Stack: tuple, base-classes, len, base-classes |
paul@8 | 1324 | program.call_function(1) # Stack: tuple, base-classes, count |
paul@8 | 1325 | program.load_const(0) # Stack: tuple, base-classes, count, 0 |
paul@8 | 1326 | program.compare_op("==") # Stack: tuple, base-classes, result |
paul@8 | 1327 | program.jump_to_label(1, "next") |
paul@8 | 1328 | program.pop_top() # Stack: tuple, base-classes |
paul@8 | 1329 | program.load_const(0) # Stack: tuple, base-classes, 0 |
paul@8 | 1330 | program.binary_subscr() # Stack: tuple, superclass |
paul@7 | 1331 | self._invoke(target_name, program) |
paul@8 | 1332 | program.jump_to_label(None, "next2") |
paul@8 | 1333 | program.start_label("next") |
paul@8 | 1334 | program.pop_top() # Stack: tuple, base-classes |
paul@8 | 1335 | program.pop_top() # Stack: tuple |
paul@8 | 1336 | program.pop_top() # Stack: |
paul@8 | 1337 | program.start_label("next2") |
paul@15 | 1338 | """ |
paul@7 | 1339 | |
def invokestatic(self, arguments, program):
    "Invoke the referenced static method, looking it up via self.__class__."
    # NOTE: The checks necessary for signature-based polymorphism are not
    # NOTE: performed by this implementation.
    # NOTE: Java rules not specifically obeyed.
    pool_index = (arguments[0] << 8) + arguments[1]
    method = self.class_file.constants[pool_index - 1]
    method_name = method.get_python_name()
    # The descriptor provides the number of parameters.
    parameters = method.get_descriptor()[0]
    # Stack: arg1, arg2, ...
    program.build_tuple(len(parameters))    # Stack: tuple
    # The class provides access to static methods.
    program.load_name("self")               # Stack: tuple, self
    program.load_attr("__class__")          # Stack: tuple, class
    self._invoke(method_name, program)
paul@7 | 1355 | |
def invokevirtual(self, arguments, program):
    "Invoke the referenced method on the object reference beneath the arguments."
    # NOTE: The checks necessary for signature-based polymorphism are not
    # NOTE: performed by this implementation.
    # NOTE: Java rules not specifically obeyed.
    pool_index = (arguments[0] << 8) + arguments[1]
    method = self.class_file.constants[pool_index - 1]
    method_name = method.get_python_name()
    # The descriptor provides the number of parameters.
    parameters = method.get_descriptor()[0]
    # Stack: objectref, arg1, arg2, ...
    program.build_tuple(len(parameters))    # Stack: objectref, tuple
    program.rot_two()                       # Stack: tuple, objectref
    self._invoke(method_name, program)
paul@7 | 1369 | |
def ior(self, arguments, program):
    "Combine the top two stack values using bitwise or."
    # NOTE: The operands are not type-checked.
    emit_or = program.binary_or
    emit_or()
paul@7 | 1373 | |
# Integer remainder and return share the float translations.
irem = frem
ireturn = freturn
paul@7 | 1376 | |
def ishl(self, arguments, program):
    "Shift the second stack value left by the top stack value."
    # NOTE: The operands are not type-checked.
    # NOTE: Not verified.
    emit_shift = program.binary_lshift
    emit_shift()
paul@7 | 1381 | |
def ishr(self, arguments, program):
    "Shift the second stack value right by the top stack value."
    # NOTE: The operands are not type-checked.
    # NOTE: Not verified.
    emit_shift = program.binary_rshift
    emit_shift()
paul@7 | 1386 | |
# Integer stores and subtraction share the float translations; the unsigned
# shift reuses the signed right shift.
istore = fstore
istore_0 = fstore_0
istore_1 = fstore_1
istore_2 = fstore_2
istore_3 = fstore_3
isub = fsub
iushr = ishr # Ignoring distinctions between arithmetic and logical shifts
paul@7 | 1394 | |
def ixor(self, arguments, program):
    "Combine the top two stack values using bitwise exclusive or."
    # NOTE: The operands are not type-checked.
    emit_xor = program.binary_xor
    emit_xor()
paul@7 | 1398 | |
def jsr(self, arguments, program):
    "Push the return address and jump to the subroutine at the signed 16-bit offset."
    raw_offset = (arguments[0] << 8) + arguments[1]
    subroutine = self.java_position + signed2(raw_offset)
    # The return address is that of the instruction following this one:
    # the opcode and its two argument bytes occupy three bytes.
    program.load_const_ret(self.position_mapping[self.java_position + 3])
    program.jump_absolute(self.position_mapping[subroutine])
paul@7 | 1405 | |
def jsr_w(self, arguments, program):
    "Push the return address and jump to the subroutine at the signed 32-bit offset."
    raw_offset = (arguments[0] << 24) + (arguments[1] << 16) + (arguments[2] << 8) + arguments[3]
    subroutine = self.java_position + signed4(raw_offset)
    # The return address is that of the instruction following this one:
    # the opcode and its four argument bytes occupy five bytes.
    program.load_const_ret(self.position_mapping[self.java_position + 5])
    program.jump_absolute(self.position_mapping[subroutine])
paul@7 | 1412 | |
# Long to floating point conversions share the int translations.
l2d = i2d
l2f = i2f
paul@7 | 1415 | |
def l2i(self, arguments, program):
    "Translate the Java 'l2i' instruction; no Python bytecode is produced."
    # Preserving Java semantics
    return None
paul@7 | 1418 | |
# The long add, array load, bitwise and, and array store instructions are
# bound to the handlers already defined for the int forms.
ladd = iadd
laload = iaload
land = iand
lastore = iastore
paul@7 | 1423 | |
def lcmp(self, arguments, program):
    """
    Translate the Java 'lcmp' instruction. The generated code compares the
    two topmost stack values and replaces them with 1, 0 or -1 according to
    whether the first is greater than, equal to, or less than the second.
    """
    # NOTE: No type checking performed.

    def settle(outcome):
        # Discard the comparison result and both operands, then push the
        # outcome of the whole instruction.
        for _unused in range(3):
            program.pop_top()
        program.load_const(outcome)

    # Test for "greater than" on copies of the operands.
    program.dup_topx(2)                 # Stack: value1, value2, value1, value2
    program.compare_op(">")             # Stack: value1, value2, result
    program.jump_to_label(0, "equals")
    settle(1)                           # Stack: 1
    program.jump_to_label(None, "next")

    # Not greater: drop the stale result and test for equality.
    program.start_label("equals")
    program.pop_top()                   # Stack: value1, value2
    program.dup_topx(2)                 # Stack: value1, value2, value1, value2
    program.compare_op("==")            # Stack: value1, value2, result
    program.jump_to_label(0, "less")
    settle(0)                           # Stack: 0
    program.jump_to_label(None, "next")

    # Neither greater nor equal.
    program.start_label("less")
    settle(-1)                          # Stack: -1
    program.start_label("next")
paul@7 | 1454 | |
# The long constant instructions are bound to the handlers already defined for
# the int constant instructions.
lconst_0 = iconst_0
lconst_1 = iconst_1
paul@7 | 1457 | |
def ldc(self, arguments, program):
    """
    Translate the Java 'ldc' instruction: load the class file constant
    selected by the single argument byte (a one-based index).
    """
    pool = self.class_file.constants
    entry = pool[arguments[0] - 1]
    program.load_const(entry)
paul@7 | 1460 | |
def ldc_w(self, arguments, program):
    """
    Translate the Java 'ldc_w' instruction: load the class file constant
    selected by the two argument bytes (a one-based, big-endian index).
    """
    pool_index = (arguments[0] << 8) + arguments[1]
    entry = self.class_file.constants[pool_index - 1]
    program.load_const(entry)
paul@7 | 1463 | |
# The two-word constant load shares the ldc_w handler defined above; the long
# divide, load, multiply and negate instructions are bound to the handlers
# already defined for the int forms.
ldc2_w = ldc_w
ldiv = idiv
lload = iload
lload_0 = iload_0
lload_1 = iload_1
lload_2 = iload_2
lload_3 = iload_3
lmul = imul
lneg = ineg
paul@7 | 1473 | |
def lookupswitch(self, arguments, program):
    """
    Translate the Java 'lookupswitch' instruction into a chain of equality
    tests against the key on top of the stack, each followed by a jump to
    the translated position of the matching branch target, and finally a
    jump to the default target.

    The 'arguments' are the bytes following the opcode: padding up to the
    next 4 byte boundary, then the default offset, the number of pairs, and
    the (match, offset) pairs themselves, all as big-endian signed 32-bit
    values. Offsets are relative to the position of this instruction.
    """

    def read_s4(values, index):
        # Decode a big-endian two's complement 32-bit integer.
        value = ((values[index] << 24) + (values[index + 1] << 16) +
            (values[index + 2] << 8) + values[index + 3])
        if value >= 0x80000000:
            value -= 0x100000000
        return value

    # Find the offset to the next 4 byte boundary in the code. The padding
    # starts at the byte after the opcode, hence the position plus one.
    # NOTE: This assumes that 'arguments' starts immediately after the opcode,
    # NOTE: as is the case for the fixed-length instructions.
    to_boundary = (4 - (self.java_position + 1) % 4) % 4

    # Get the pertinent arguments.
    table = arguments[to_boundary:]
    default = read_s4(table, 0)
    npairs = read_s4(table, 4)

    # Process the pairs.
    # NOTE: This is not the most optimal implementation.
    pair_index = 8
    for pair in range(0, npairs):
        # Match values are signed: "case -1" must compare against -1.
        match = read_s4(table, pair_index)
        offset = read_s4(table, pair_index + 4)

        # Calculate the branch target.
        java_absolute = self.java_position + offset

        # Generate branching code.
        program.dup_top()                   # Stack: key, key
        program.load_const(match)           # Stack: key, key, match
        program.compare_op("==")            # Stack: key, result
        program.jump_to_label(0, "end")
        program.pop_top()                   # Stack: key
        program.pop_top()                   # Stack:
        program.jump_absolute(self.position_mapping[java_absolute])

        # Generate the label for the end of the branching code.
        program.start_label("end")
        program.pop_top()                   # Stack: key

        # Update the index.
        pair_index += 8

    # Generate the default, discarding the key first since the Java
    # instruction consumes it whichever branch is taken.
    program.pop_top()                       # Stack:
    java_absolute = self.java_position + default
    program.jump_absolute(self.position_mapping[java_absolute])
paul@7 | 1508 | |
# The remaining long arithmetic, shift, store and return instructions are
# bound to the handlers already defined for the int forms.
lor = ior
lrem = irem
lreturn = ireturn
lshl = ishl
lshr = ishr
lstore = istore
lstore_0 = istore_0
lstore_1 = istore_1
lstore_2 = istore_2
lstore_3 = istore_3
lsub = isub
lushr = iushr
lxor = ixor
paul@7 | 1522 | |
def monitorenter(self, arguments, program):
    """
    Translate the Java 'monitorenter' instruction. No locking is performed,
    but the object reference which the Java instruction consumes is removed
    from the stack so that the stack stays balanced.
    """
    # NOTE: Synchronisation remains to be implemented.
    program.pop_top()
paul@7 | 1526 | |
def monitorexit(self, arguments, program):
    """
    Translate the Java 'monitorexit' instruction. No unlocking is performed,
    but the object reference which the Java instruction consumes is removed
    from the stack so that the stack stays balanced.
    """
    # NOTE: Synchronisation remains to be implemented.
    program.pop_top()
paul@7 | 1530 | |
def multianewarray(self, arguments, program):
    "Placeholder for the Java 'multianewarray' instruction; produces nothing."
    # NOTE: To be implemented.
    return None
paul@8 | 1534 | |
def new(self, arguments, program):
    """
    Translate the Java 'new' instruction by loading the global bearing the
    Python name of the class selected by the two argument bytes (a one-based,
    big-endian index into the class file constants).
    """
    # This operation is considered to be the same as the calling of the
    # initialisation method of the given class with no arguments.
    pool_index = (arguments[0] << 8) + arguments[1]
    class_constant = self.class_file.constants[pool_index - 1]
    python_name = class_constant.get_python_name()
    # NOTE: Using the string version of the name which may contain incompatible characters.
    program.load_global(str(python_name))
    # NOTE: Unlike Java, we do not provide an object reference. Instead, a
    # NOTE: class reference is provided, and the invokespecial method's
    # NOTE: behaviour is changed. Consequently, no call is generated here.
paul@8 | 1546 | |
def newarray(self, arguments, program):
    "Translate the Java 'newarray' instruction using the _newarray method."
    # NOTE: Does not raise NegativeArraySizeException.
    # NOTE: Not using the arguments to type the list/array.
    build_array = self._newarray
    build_array(program)
paul@8 | 1551 | |
def nop(self, arguments, program):
    "Translate the Java 'nop' instruction; no Python bytecode is produced."
    return None
paul@8 | 1554 | |
def pop(self, arguments, program):
    "Translate the Java 'pop' instruction by discarding the top stack value."
    discard = program.pop_top
    discard()
paul@8 | 1557 | |
# The 'pop2' instruction is bound to the 'pop' handler above, and therefore
# discards a single value from the Python stack.
pop2 = pop # ignoring Java stack value distinctions
paul@8 | 1559 | |
def putfield(self, arguments, program):
    """
    Translate the Java 'putfield' instruction: swap the two topmost stack
    values and store an attribute bearing the Python name of the field
    selected by the two argument bytes (a one-based, big-endian index into
    the class file constants).
    """
    pool_index = (arguments[0] << 8) + arguments[1]
    field_constant = self.class_file.constants[pool_index - 1]
    field_name = field_constant.get_python_name()
    # Exchange the two topmost values before the attribute store.
    program.rot_two()
    # NOTE: Using the string version of the name which may contain incompatible characters.
    program.store_attr(str(field_name))
paul@8 | 1566 | |
def putstatic(self, arguments, program):
    """
    Translate the Java 'putstatic' instruction: load the '__class__'
    attribute of 'self' and store on it an attribute bearing the Python name
    of the field selected by the two argument bytes (a one-based, big-endian
    index into the class file constants).
    """
    pool_index = (arguments[0] << 8) + arguments[1]
    field_constant = self.class_file.constants[pool_index - 1]
    field_name = field_constant.get_python_name()
    # Obtain the class through the instance.
    program.load_name("self")
    program.load_attr("__class__")
    # NOTE: Using the string version of the name which may contain incompatible characters.
    program.store_attr(str(field_name))
paul@8 | 1574 | |
def ret(self, arguments, program):
    """
    Translate the Java 'ret' instruction using the program's own 'ret'
    operation with the single argument byte, and clear the 'in_finally' flag.
    """
    variable_index = arguments[0]
    program.ret(variable_index)
    # Indicate that the finally handler is probably over.
    # NOTE: This is seemingly not guaranteed.
    self.in_finally = 0
paul@8 | 1580 | |
def return_(self, arguments, program):
    "Translate the Java 'return' instruction by returning the None constant."
    result = None
    program.load_const(result)
    program.return_value()
paul@8 | 1584 | |
# The short array load and store instructions are bound to the handlers used
# for the long forms.
saload = laload
sastore = lastore
paul@8 | 1587 | |
def sipush(self, arguments, program):
    """
    Translate the Java 'sipush' instruction by loading, as a constant, the
    signed 16-bit value formed from the two argument bytes (big-endian).
    """
    value = (arguments[0] << 8) + arguments[1]
    # The operand is a two's complement short, so values with the top bit set
    # denote negative numbers.
    if value >= 0x8000:
        value -= 0x10000
    program.load_const(value)
paul@8 | 1590 | |
def swap(self, arguments, program):
    "Translate the Java 'swap' instruction by exchanging the top two values."
    exchange = program.rot_two
    exchange()
paul@8 | 1593 | |
def tableswitch(self, arguments, program):
    """
    Translate the Java 'tableswitch' instruction into a chain of equality
    tests against the key on top of the stack, one for each value from 'low'
    to 'high' inclusive, each followed by a jump to the translated position
    of the corresponding branch target, and finally a jump to the default
    target.

    The 'arguments' are the bytes following the opcode: padding up to the
    next 4 byte boundary, then the default offset, the low and high values,
    and one offset per value in the range, all as big-endian signed 32-bit
    values. Offsets are relative to the position of this instruction.
    """

    def read_s4(values, index):
        # Decode a big-endian two's complement 32-bit integer.
        value = ((values[index] << 24) + (values[index + 1] << 16) +
            (values[index + 2] << 8) + values[index + 3])
        if value >= 0x80000000:
            value -= 0x100000000
        return value

    # Find the offset to the next 4 byte boundary in the code. The padding
    # starts at the byte after the opcode, hence the position plus one.
    # NOTE: This assumes that 'arguments' starts immediately after the opcode,
    # NOTE: as is the case for the fixed-length instructions.
    to_boundary = (4 - (self.java_position + 1) % 4) % 4

    # Get the pertinent arguments.
    table = arguments[to_boundary:]
    default = read_s4(table, 0)
    low = read_s4(table, 4)
    high = read_s4(table, 8)

    # Process the jump entries, which follow the three header values and
    # occupy four bytes each.
    # NOTE: This is not the most optimal implementation.
    jump_index = 12
    for jump in range(low, high + 1):
        offset = read_s4(table, jump_index)

        # Calculate the branch target.
        java_absolute = self.java_position + offset

        # Generate branching code.
        program.dup_top()                   # Stack: key, key
        program.load_const(jump)            # Stack: key, key, jump
        program.compare_op("==")            # Stack: key, result
        program.jump_to_label(0, "end")
        program.pop_top()                   # Stack: key
        program.pop_top()                   # Stack:
        program.jump_absolute(self.position_mapping[java_absolute])

        # Generate the label for the end of the branching code.
        program.start_label("end")
        program.pop_top()                   # Stack: key

        # Update the index.
        jump_index += 4

    # Generate the default, discarding the key first since the Java
    # instruction consumes it whichever branch is taken.
    program.pop_top()                       # Stack:
    java_absolute = self.java_position + default
    program.jump_absolute(self.position_mapping[java_absolute])
paul@7 | 1627 | |
def wide(self, code, program):
    """
    Placeholder for the Java 'wide' instruction, which is not supported.

    Raises NotImplementedError, since no translation can be produced and the
    length of the modified instruction is not determined here.
    """
    # NOTE: To be implemented.
    raise NotImplementedError("the 'wide' instruction is not supported")
paul@7 | 1631 | |
def disassemble(class_file, method):
    """
    Process the given 'method' of the given 'class_file' with a new
    BytecodeDisassembler, using a new BytecodeDisassemblerProgram as the
    program receiving the instructions.
    """
    BytecodeDisassembler(class_file).process(method, BytecodeDisassemblerProgram())
paul@7 | 1635 | |
def translate(class_file, method):
    """
    Process the given 'method' of the given 'class_file' with a new
    BytecodeTranslator writing to a new BytecodeWriter. Return a tuple
    containing the translator and the writer.
    """
    result = translator, writer = BytecodeTranslator(class_file), BytecodeWriter()
    translator.process(method, writer)
    return result
paul@7 | 1641 | |
def make_varnames(nlocals):
    """
    Return a list of 'nlocals' local variable names: "self" followed by
    "_l1", "_l2" and so on. An empty list is returned if 'nlocals' is zero.
    """
    names = ["self"] + ["_l%s" % number for number in range(1, nlocals)]
    # The slice removes "self" again when no locals at all are wanted.
    return names[:nlocals]
paul@15 | 1647 | |
if __name__ == "__main__":
    # Translate each class file named on the command line into a Python class
    # whose methods are built from the translated bytecode. Each class is
    # added to the globals shared by all generated functions, so that classes
    # from later files can refer to those from earlier ones.
    import sys
    import dis, new
    from classfile import ClassFile
    global_names = {}
    global_names.update(__builtins__.__dict__)
    for filename in sys.argv[1:]:
        # Read the class file, making sure that it is closed afterwards.
        f = open(filename, "rb")
        try:
            c = ClassFile(f.read())
        finally:
            f.close()
        namespace = {}
        for method in c.methods:
            # One more argument and local than Java declares, for "self".
            nargs = len(method.get_descriptor()[0]) + 1
            t, w = translate(c, method)
            nlocals = w.max_locals + 1
            # The name recorded in the code object, kept apart from the
            # name of the class file being read.
            source_filename = str(c.attributes[0].get_name())
            method_name = str(method.get_python_name())
            # NOTE: The flags value 67 presumably combines CO_OPTIMIZED,
            # NOTE: CO_NEWLOCALS and CO_NOFREE (1 + 2 + 64).
            code = new.code(nargs, nlocals, w.max_stack_depth, 67, w.get_output(), tuple(w.get_constants()), tuple(w.get_names()),
                tuple(make_varnames(nlocals)), source_filename, method_name, 0, "")
            # NOTE: May need more globals.
            fn = new.function(code, global_names)
            namespace[method_name] = fn
        # NOTE: Define superclasses properly.
        if str(c.super_class.get_name()) not in ("java/lang/Object", "java/lang/Exception"):
            bases = (global_names[str(c.super_class.get_python_name())],)
        else:
            bases = ()
        cls = new.classobj(str(c.this_class.get_python_name()), bases, namespace)
        global_names[cls.__name__] = cls
paul@4 | 1676 | |
paul@4 | 1677 | # vim: tabstop=4 expandtab shiftwidth=4 |