diff options
author | Bryan Bishop <kanzure@gmail.com> | 2012-06-07 01:07:48 -0500 |
---|---|---|
committer | Bryan Bishop <kanzure@gmail.com> | 2012-06-07 01:07:48 -0500 |
commit | e91193e3eab217ac2ea54068f4ac2e75dadc6ea9 (patch) | |
tree | b87d13aa1fe60666aba1fc8039c789a87f76f3d1 /romstr.py | |
parent | 96559874adc1d0c2b7d63ea75fc176327ec79299 (diff) |
almost complete new disassembler version
original-commit-id: 7dd0c86a6b6ebe03ed00dc7bd75d54d7b33db374
Diffstat (limited to 'romstr.py')
-rw-r--r-- | romstr.py | 176 |
1 files changed, 167 insertions, 9 deletions
@@ -1,17 +1,43 @@ +from gbz80disasm import opt_table, end_08_scripts_with, relative_jumps, relative_unconditional_jumps, call_commands + class RomStr(str): - """ Simple wrapper to prevent a giant rom from being shown on screen + """ Simple wrapper to prevent a giant rom from being shown on screen. """ + def __repr__(self): + """ Simplifies this object so that the output doesn't overflow stdout. + """ + return "RomStr(too long)" + + @classmethod + def load(cls, crystal=True, red=False): + """ Loads a ROM into a RomStr. + """ + if crystal and not red: + file_handler = open("../baserom.gbc", "r") + elif red and not crystal: + file_handler = open("../pokered-baserom.gbc", "r") + else: + raise Exception, "not sure which rom to load?" + bytes = file_handler.read() + file_handler.close() + return RomStr(bytes) + def length(self): - """len(self)""" + """ len(self) + """ return len(self) - def __repr__(self): - return "RomStr(too long)" + def len(self): + """ len(self) + """ + return self.length() def interval(self, offset, length, strings=True, debug=True): - """returns hex values for the rom starting at offset until offset+length""" - returnable = [] + """ returns hex values for the rom starting at offset until + offset+length + """ + returnable = [] for byte in self[offset:offset+length]: if strings: returnable.append(hex(ord(byte))) @@ -20,16 +46,148 @@ class RomStr(str): return returnable def until(self, offset, byte, strings=True, debug=False): - """returns hex values from rom starting at offset until the given byte""" + """ Returns hex values from rom starting at offset until the given + byte. + """ return self.interval(offset, self.find(chr(byte), offset) - offset, strings=strings) + def to_asm(self, address, end_address=None, size=None, max_size=0x4000, debug=None): + """ Disassembles ASM at some address. This will stop disassembling when + either the end_address or size is met. Also, there's a maximum size + that will be parsed, so that large patches of data aren't parsed as + code. + """ + start_address = address + if start_address == None: + raise Exception, "address must be given" + + if debug == None: + if not hasattr(self, "debug"): + debug = False + else: + debug = self.debug + + # this is probably a terrible idea.. why am i doing this? + if size != None and max_size < size: + raise Exception, "max_size must be greater than or equal to size" + elif end_address != None and (end_address - start_address) > max_size: + raise Exception, "end_address is out of bounds" + elif end_address != None and size != None: + if (end_address - start_address) >= size: + size = end_address - start_address + else: + end_address = start_address + size + elif end_address == None and size != None: + end_address = start_address + size + elif end_address != None and size == None: + size = end_address - start_address + + return Asm(start_address=start_address, end_address=end_address, size=size, max_size=max_size, debug=debug, rom=self) + +class Asm: + """ z80 disassembler + """ + + def __init__(self, start_address=None, end_address=None, size=None, max_size=0x4000, debug=True, rom=None): + assert start_address != None, "start_address must be given" + + if rom == None: + file_handler = open("../baserom.gbc", "r") + bytes = file_handler.read() + file_handler.close() + rom = RomStr(bytes) + + if debug not in [None, True, False]: + raise Exception, "debug param is invalid" + if debug == None: + debug = False + + # get end_address and size in sync with each other + if end_address == None and size != None: + end_address = start_address + size + elif end_address != None and size == None: + size = end_address - start_address + elif end_address != None and size != None: + size = max(end_address - start_address, size) + end_address = start_address + size + + # check that the bounds make sense + if end_address != None: + if end_address <= start_address: + raise Exception, "end_address is out of bounds" + elif (end_address - start_address) > max_size: + raise Exception, "end_address goes beyond max_size" + + # check more edge cases + if not start_address >= 0: + raise Exception, "start_address must be at least 0" + elif not end_address >= 0: + raise Exception, "end_address must be at least 0" + + self.rom = rom + self.start_address = start_address + self.end_address = end_address + self.size = size + self.max_size = max_size + self.debug = debug + + self.parse() + + def parse(self): + """ Disassembles stuff and things. + """ + + rom = self.rom + start_address = self.start_address + end_address = self.end_address + max_size = self.max_size + debug = self.debug + + bank_id = start_address / 0x4000 + + # [{"command": 0x20, "bytes": [0x20, 0x40, 0x50], + # "asm": "jp $5040", "label": "Unknown5040"}] + asm_commands = [] + + offset = start_address + + current_byte_number = 0 + + last_hl_address = None + last_a_address = None + used_3d97 = False + + keep_reading = True + + # for labeling future bytes (like for relative jumps) + byte_labels = {} + + while offset <= end_address and keep_reading: + current_byte = ord(rom[offset]) + + is_data = False + + maybe_byte = current_byte + + # stuff... + raise NotImplementedError, "o_______o" + + def __str__(self): + """ ASM pretty printer. + """ + raise NotImplementedError, "zzzzzz" + class AsmList(list): - """simple wrapper to prevent all asm lines from being shown on screen""" + """ Simple wrapper to prevent all asm lines from being shown on screen. + """ def length(self): - """len(self)""" + """ len(self) + """ return len(self) def __repr__(self): + """ Simplifies this object so that the output doesn't overflow stdout. + """ return "AsmList(too long)" |