Compare commits

...

3 Commits

Author SHA1 Message Date
Elliot Nunn f67194a889 Flattener: 32-bit 2022-03-31 11:00:01 +08:00
Elliot Nunn e568ef33af jump_table now a dict, and strip some junk 2022-03-31 10:12:52 +08:00
Elliot Nunn c6b92f627b Find more MacsBug strings 2022-03-31 09:49:21 +08:00
1 changed files with 129 additions and 52 deletions

View File

@ -34,15 +34,7 @@ if not resources or resources[0].id != 0:
jt_resource, *other_resources = resources
bigboy = bytearray()
for r in other_resources:
bigboy.extend(bytes(addr(r.id) - len(bigboy)))
bigboy.extend(r)
with open(args.dest, "wb") as f:
f.write(bigboy)
jump_table = [] # (a5_ofs, segnum, seg_ofs)
jump_table = {} # a5_ofs: (segnum, seg_ofs)
(jt_size, a5_offset_of_jt) = struct.unpack_from(">LL", jt_resource, 8)
thirtytwo = False
@ -58,11 +50,7 @@ for jt_ofs in range(16, 16 + jt_size, 8):
if be_a9f0 != 0xA9F0:
raise ValueError("32-bit jt")
rbyid = {r.id: r for r in resources}[segnum]
(adjust,) = struct.unpack_from(">L", r, 0x20)
# ofs += adjust
jump_table.append((jt_ofs - 16 + a5_offset_of_jt + 2, segnum, ofs))
jump_table[jt_ofs - 16 + a5_offset_of_jt + 2] = (segnum, ofs)
else:
ofs, be_3f3c, segnum, be_a9f0 = struct.unpack_from(">HHHH", jt_resource, jt_ofs)
@ -70,55 +58,136 @@ for jt_ofs in range(16, 16 + jt_size, 8):
if be_3f3c != 0x3F3C or be_a9f0 != 0xA9F0:
raise ValueError("16-bit jt")
jump_table.append((jt_ofs - 16 + a5_offset_of_jt + 2, segnum, ofs + 4))
jump_table[jt_ofs - 16 + a5_offset_of_jt + 2] = (segnum, ofs)
# From https://github.com/elliotnunn/mps/blob/master/stacktrace.go
def macsbug_syms(blob):
    """Scan *blob* for MacsBug symbol names that follow a procedure end.

    Every even offset is checked for an instruction that ends a procedure
    (RTS, JMP (A0) or RTD #<word>).  The bytes right after that instruction
    are then tested against the known MacsBug name encodings.

    Args:
        blob: bytes-like object containing the code to scan.

    Yields:
        ``(end_offset, name_offset, name)`` tuples, where ``end_offset`` is
        the offset of the procedure-ending instruction, ``name_offset`` is
        the offset of the first byte of the name, and ``name`` is the name
        decoded as ASCII.

    Names whose declared length runs past the end of *blob* are skipped
    instead of being reported truncated (or empty).
    """
    view = memoryview(blob)  # zero-copy slicing while scanning
    size = len(blob)

    for i in range(0, size - 2, 2):
        opcode = view[i : i + 2]
        # RTS or JMP(A0)
        if opcode == b"\x4e\x75" or opcode == b"\x4e\xd0":
            j = i + 2
        # RTD #<word>
        elif view[i : i + 3] == b"\x4e\x74\x00":
            j = i + 4
        # Not the end of a procedure
        else:
            continue

        # Every supported format needs at least two bytes at j (a header
        # byte plus either a length byte or the first character).
        if j + 2 > size:
            continue
        first = view[j]
        second = view[j + 1]

        # "Old style" MacsBug symbol format
        # Haven't done the MacApp format
        # NOTE(review): the name is read from j + 1, so the byte at j is not
        # part of the reported name -- confirm against the Go original.
        if 0x20 <= first & 0x7F <= 0x7F and 0x20 <= second <= 0x7F:
            k = j + 1
            ln = 8
        # Apple Compiler symbol with an explicit length byte
        elif first == 0x80 and second != 0:
            k = j + 2
            ln = second
        # Apple Compiler symbol with the length in the low bits of the header
        elif 0x81 <= first <= 0x9F:
            k = j + 1
            ln = first & 0x7F
        # No MacsBug string
        else:
            continue

        s = bytes(view[k : k + ln])
        # Reject names cut short by the end of the blob, then sanitise.
        if len(s) == ln and is_mxbg_str(s):
            yield i, k, s.decode("ascii")
# Byte values accepted in a MacsBug symbol name: ASCII letters, digits,
# space, "%" and "_".
_MXBG_NAME_BYTES = frozenset(
    b"abcdefghijklmnopqrstuvwxyz"
    b"ABCDEFGHIJKLMNOPQRSTUVWXYZ"
    b"0123456789"
    b" %_"
)


def is_mxbg_str(s):
    """Return True if every byte of *s* is acceptable in a MacsBug name.

    Args:
        s: bytes-like object (iterating it must produce integers).

    Returns:
        True when all bytes are ASCII letters, digits, space, "%" or "_";
        False as soon as any other byte is found.  An empty input is
        accepted (returns True).
    """
    return all(c in _MXBG_NAME_BYTES for c in s)
def unpack_relocs(blob):
    """Decode a packed relocation stream, yielding one integer per entry.

    Entries are variable-length and the stream ends at two zero bytes:

    * ``00 00``                  -- end of stream.
    * ``00`` then a byte with the top bit set -- five-byte entry; the four
      bytes after the leading zero form a big-endian value that is doubled
      and masked to 32 bits.
    * a byte with the top bit set -- two-byte entry; the big-endian pair is
      doubled and masked to 16 bits.
    * any other byte             -- one-byte entry; the byte doubled.

    Args:
        blob: indexable bytes-like object positioned at the first entry.

    Yields:
        The decoded integer for each entry, in stream order.

    Raises:
        IndexError: if the data ends before the ``00 00`` terminator.
    """
    # Walk the buffer with an index instead of re-slicing it after every
    # entry, which would copy the remaining data each time.
    pos = 0
    while blob[pos : pos + 2] != b"\x00\x00":
        lead = blob[pos]
        if lead == 0 and blob[pos + 1] & 0x80:
            yield (
                (blob[pos + 1] << 25)
                + (blob[pos + 2] << 17)
                + (blob[pos + 3] << 9)
                + (blob[pos + 4] << 1)
            ) & 0xFFFFFFFF
            pos += 5
        elif lead & 0x80:
            yield ((lead << 9) + (blob[pos + 1] << 1)) & 0xFFFF
            pos += 2
        else:
            yield lead << 1
            pos += 1
with open(args.dest + ".py", "w") as idascript:
# Find MacsBug symbols
namedict = {}
for r in other_resources:
targets = set(ofs for _, seg, ofs in jump_table if seg == r.id)
targets = set(ofs for seg, ofs in jump_table.values() if seg == r.id)
bugnames = []
lastfound = 0
for i in range(0, len(r) - 2, 2):
namelen = r[i + 2]
if r[i : i + 2] not in (b"\x4e\x75", b"\x4e\xd0"):
continue
if not (0x81 <= namelen < 0xB0):
continue
namelen &= 0x3F
if i + 3 + namelen > len(r):
continue
name = r[i + 3 : i + 3 + namelen].decode("latin-1")
if not all(c in OKCHARS for c in name):
continue
for rtsoffset, stringoffset, name in macsbug_syms(r):
print(f"idaapi.make_ascii_string({addr(r.id)+stringoffset:#X}, {(len(name)+2)&~1}, ASCSTR_C)", file=idascript)
print(f"set_cmt({addr(r.id)+stringoffset:#X}, 'MacsBug symbol', 0)", file=idascript)
print(f"idaapi.make_ascii_string(0x{addr(r.id)+i+2:X}, {(namelen+2)&~1}, ASCSTR_PASCAL)", file=idascript)
print(f"set_cmt(0x{addr(r.id)+i+2:X}, 'MacsBug symbol', 0)", file=idascript)
for funcoffset in reversed(range(0, rtsoffset, 2)):
inst = bytes(r[funcoffset : funcoffset + 2])
if inst in (b"\x4E\x75", b"\x4E\x74", b"\x4E\xD0"):
break # encountered a func-end
possibles = []
for j in reversed(range(lastfound, i, 2)):
if r[j : j + 2] == b"Nu":
break # stop looking after an RTS
if r[j : j + 2] == b"NV" or j in targets:
possibles.append(j)
lastfound = i
if len(possibles) > 3:
continue # don't bother with this name, too ambiguous
for j, p in enumerate(possibles, 1):
namedict[addr(r.id) + p] = name if len(possibles) == 1 else f"{name}?{j}"
if funcoffset in targets or inst == b"NV":
namedict[addr(r.id) + funcoffset] = name
break
interseg_calls = {}
for r in other_resources:
for i in range(0, len(r) - 3, 2):
if r[i : i + 2] in (b"\x4e\xad", b"\x48\x6d") or (r[i] == 0x41 and r[i + 1] & 0xF8 == 0xE8):
(targ,) = struct.unpack_from(">h", r, i + 2)
if targ > 0:
interseg_calls.setdefault(targ, []).append(addr(r.id) + i)
# 32-bit segment
if r[:2] == b"\xFF\xFF":
a5relocs, pcrelocs = struct.unpack_from(">LxxxxL", r, 0x14)
ofs = 0
for reloc in unpack_relocs(r[a5relocs:]):
ofs = (ofs + reloc) & 0xFFFFFFFF # reloc can be negative!
(a5offset,) = struct.unpack_from(">L", r, ofs)
# Instead of hacking IDA to treat xxxx(A5) as a function address,
# just stuff the actual function address in the JMP target
if a5offset in jump_table:
target_seg, target_seg_offset = jump_table[a5offset]
target_addr = addr(target_seg) + target_seg_offset
struct.pack_into(">L", r, ofs, target_addr)
ofs = 0
for reloc in unpack_relocs(r[pcrelocs:]):
ofs = (ofs + reloc) & 0xFFFFFFFF # reloc can be negative!
(target_addr,) = struct.unpack_from(">L", r, ofs)
target_addr += addr(r.id)
struct.pack_into(">L", r, ofs, target_addr)
# 16-bit segment
else:
for i in range(0, len(r) - 3, 2):
if r[i : i + 2] in (b"\x4e\xad", b"\x48\x6d") or (r[i] == 0x41 and r[i + 1] & 0xF8 == 0xE8):
(targ,) = struct.unpack_from(">h", r, i + 2)
if targ > 0:
interseg_calls.setdefault(targ, []).append(addr(r.id) + i)
# Make some neat names for the segments...
segnames = {}
@ -128,7 +197,7 @@ with open(args.dest + ".py", "w") as idascript:
else:
segnames[r.id] = f"seg_{r.id:X}"
for a5_ofs, segnum, ofs in jump_table:
for a5_ofs, (segnum, ofs) in jump_table.items():
bigboy_ofs = addr(segnum) + ofs
cool_name = f"{segnames[segnum]}$"
@ -146,3 +215,11 @@ with open(args.dest + ".py", "w") as idascript:
for bigboy_ofs, name in sorted(namedict.items()):
cool_name = f"{segnames[bigboy_ofs >> 20]}${name}"
print(f'MakeFunction(0x{bigboy_ofs:X}); MakeName(0x{bigboy_ofs:X}, "{cool_name}")', file=idascript)
bigboy = bytearray()
for r in other_resources:
bigboy.extend(bytes(addr(r.id) - len(bigboy)))
bigboy.extend(r)
with open(args.dest, "wb") as f:
f.write(bigboy)