You've already forked python-uncompyle6
mirror of
https://github.com/rocky/python-uncompyle6.git
synced 2025-08-03 00:45:53 +08:00
148 lines
5.7 KiB
Python
148 lines
5.7 KiB
Python
# Copyright (c) 2019-2022 by Rocky Bernstein
|
|
#
|
|
# This program is free software: you can redistribute it and/or modify
|
|
# it under the terms of the GNU General Public License as published by
|
|
# the Free Software Foundation, either version 3 of the License, or
|
|
# (at your option) any later version.
|
|
#
|
|
# This program is distributed in the hope that it will be useful,
|
|
# but WITHOUT ANY WARRANTY; without even the implied warranty of
|
|
# MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
|
|
# GNU General Public License for more details.
|
|
#
|
|
# You should have received a copy of the GNU General Public License
|
|
# along with this program. If not, see <http://www.gnu.org/licenses/>.
|
|
"""
|
|
Python 3.8 bytecode decompiler scanner.
|
|
|
|
Does some additional massaging of xdis-disassembled instructions to
|
|
make things easier for decompilation.
|
|
|
|
This sets up Python 3.8's opcodes and calls a generalized
|
|
scanner routine for Python 3.7 and up.
|
|
"""
|
|
|
|
from uncompyle6.scanners.tok import off2int
|
|
from uncompyle6.scanners.scanner37 import Scanner37
|
|
from uncompyle6.scanners.scanner37base import Scanner37Base
|
|
|
|
# Opcode definitions for Python 3.8
|
|
from xdis.opcodes import opcode_38 as opc
|
|
|
|
# Bytecode verification, verify(), uses JUMP_OPs from here.
|
|
JUMP_OPs = opc.JUMP_OPS
|
|
|
|
|
|
class Scanner38(Scanner37):
    """Token scanner for Python 3.8 bytecode.

    Delegates tokenization to the parent scanner's ``ingest()`` and then
    post-processes the resulting token stream, relabelling selected
    ``JUMP_FORWARD``/``JUMP_ABSOLUTE`` tokens inside loops as ``BREAK_LOOP``.
    """

    def __init__(self, show_asm=None):
        """Set up the scanner for bytecode version (3, 8).

        ``show_asm`` is passed through unchanged to ``Scanner37Base.__init__``.
        """
        # Scanner37Base is initialized directly (not via Scanner37.__init__)
        # so that the version tuple given is (3, 8).
        Scanner37Base.__init__(self, (3, 8), show_asm)
        # When true, ingest() prints its loop bookkeeping to stdout.
        self.debug = False

    def ingest(self, co, classname=None, code_objects=None, show_asm=None):
        """Tokenize ``co`` and mark loop-exiting jumps as ``BREAK_LOOP``.

        All arguments are forwarded to the parent class's ``ingest()``.
        ``code_objects`` defaults to a fresh empty dict for each call (rather
        than one dict object shared by every call).

        Returns a ``(tokens, customize)`` pair.  ``customize`` is whatever the
        parent returned.  ``tokens`` is a new list holding the parent's token
        objects in the same order; tokens recognised as loop breaks have had
        their ``kind`` changed to ``"BREAK_LOOP"`` in place.
        """
        if code_objects is None:
            code_objects = {}

        tokens, customize = super(Scanner38, self).ingest(
            co, classname, code_objects, show_asm
        )

        # Nothing to scan: there can be no loops, and the sentinel below
        # needs at least one token.
        if not tokens:
            return [], customize

        # Hacky way to detect loop ranges.
        # The key in jump_back_targets is the start of the loop.
        # The value is where the loop ends. In current Python,
        # JUMP_BACKS are always to loops. And blocks are ordered so that the
        # JUMP_BACK with the highest offset will be where the range ends.
        # (A later JUMP_BACK to the same target overwrites an earlier one.)
        jump_back_targets = {
            token.attr: token.offset for token in tokens if token.kind == "JUMP_BACK"
        }

        if self.debug and jump_back_targets:
            print(jump_back_targets)

        # Sentinel "loop end" used while no loop is active: it lies beyond the
        # offset of the last token, so no token offset can equal it.
        no_loop_end = tokens[-1].off2int() + 10

        # Stack of end offsets for the loops currently open; next_end mirrors
        # its top, or is the sentinel when the stack is empty.
        loop_ends = []
        next_end = no_loop_end

        new_tokens = []
        for i, token in enumerate(tokens):
            opname = token.kind
            offset = token.offset

            # Reached the end of the innermost open loop: close it.
            if offset == next_end:
                loop_ends.pop()
                if self.debug:
                    print("%sremove loop offset %s" % (" " * len(loop_ends), offset))
                next_end = loop_ends[-1] if loop_ends else no_loop_end

            # things that smash new_tokens like BUILD_LIST have to come first.

            # This offset is the target of a JUMP_BACK, i.e. a loop starts here.
            if offset in jump_back_targets:
                next_end = off2int(jump_back_targets[offset], prefer_last=False)
                if self.debug:
                    print(
                        "%sadding loop offset %s ending at %s"
                        % (" " * len(loop_ends), offset, next_end)
                    )
                loop_ends.append(next_end)

            # Turn JUMP opcodes into "BREAK_LOOP" opcodes.
            # FIXME: this should be replaced by proper control flow.
            if opname in ("JUMP_FORWARD", "JUMP_ABSOLUTE") and loop_ends:
                jump_target = token.attr

                if opname == "JUMP_ABSOLUTE" and jump_target <= next_end:
                    # Not a forward-enough jump to break out of the next loop, so continue.
                    # FIXME: Do we need "continue" detection?
                    new_tokens.append(token)
                    continue

                # We also want to avoid confusing BREAK_LOOPS with parts of the
                # grammar rules for loops. (Perhaps we should change the grammar.)
                # Try to find an adjacent JUMP_BACK which is part of the normal loop end.
                #
                # NOTE(review): tokens are compared directly with opcode-name
                # strings below; presumably the token class's __eq__ supports
                # that -- confirm against the token implementation.
                if i + 1 < len(tokens) and tokens[i + 1] == "JUMP_BACK":
                    # Sometimes the jump back is after the "break" instruction..
                    jump_back_index = i + 1
                else:
                    # and sometimes, because of jump-to-jump optimization, it is before the
                    # jump target instruction.
                    jump_back_index = self.offset2tok_index[jump_target] - 1
                    while tokens[jump_back_index].kind.startswith("COME_FROM_"):
                        jump_back_index -= 1
                jump_back_token = tokens[jump_back_index]

                # Is this a forward jump not next to a JUMP_BACK ? ...
                break_loop = token.linestart and jump_back_token != "JUMP_BACK"

                # or if there is looping jump back, then that loop
                # should start before where the "break" instruction sits.
                if break_loop or (
                    jump_back_token == "JUMP_BACK"
                    and jump_back_token.attr < token.off2int()
                ):
                    token.kind = "BREAK_LOOP"

            new_tokens.append(token)

        return new_tokens, customize
|
|
|
|
|
|
if __name__ == "__main__":
    # Demo: when run as a script under Python 3.8, tokenize this module's own
    # code object and print each resulting token.
    from xdis.version_info import PYTHON_VERSION_TRIPLE, version_tuple_to_str

    running_38 = PYTHON_VERSION_TRIPLE[:2] == (3, 8)
    if not running_38:
        print("Need to be Python 3.8 to demo; I am version %s" % version_tuple_to_str())
    else:
        import inspect

        this_code = inspect.currentframe().f_code  # type: ignore
        demo_tokens, _demo_customize = Scanner38().ingest(this_code)
        for tok in demo_tokens:
            print(tok.format())
|