mirror of
https://github.com/robmcmullen/atrcopy.git
synced 2025-02-02 20:30:56 +00:00
846a744bd1
* added -s flag to display segments * added optional name for segments
478 lines
16 KiB
Python
Executable File
478 lines
16 KiB
Python
Executable File
#!/usr/bin/env python
|
|
|
|
|
|
__version__ = "1.0.1"
|
|
|
|
|
|
import struct
|
|
from cStringIO import StringIO
|
|
|
|
class AtrError(RuntimeError):
|
|
pass
|
|
|
|
class InvalidAtrHeader(AtrError):
|
|
pass
|
|
|
|
class LastDirent(AtrError):
|
|
pass
|
|
|
|
class FileNumberMismatchError164(AtrError):
|
|
pass
|
|
|
|
class ByteNotInFile166(AtrError):
|
|
pass
|
|
|
|
class AtrHeader(object):
|
|
format = "<hhhBLLB"
|
|
file_format = "ATR"
|
|
|
|
def __init__(self, bytes=None):
|
|
self.size_in_bytes = 0
|
|
self.sector_size = 0
|
|
self.crc = 0
|
|
self.unused = 0
|
|
self.flags = 0
|
|
self.atr_header_offset = 0
|
|
self.initial_sector_size = 0
|
|
self.num_initial_sectors = 0
|
|
self.max_sectors = 0
|
|
if bytes is None:
|
|
return
|
|
|
|
if len(bytes) == 16:
|
|
values = struct.unpack(self.format, bytes)
|
|
if values[0] != 0x296:
|
|
raise InvalidAtrHeader
|
|
self.size_in_bytes = (values[3] * 256 * 256 + values[1]) * 16
|
|
self.sector_size = values[2]
|
|
self.crc = values[4]
|
|
self.unused = values[5]
|
|
self.flags = values[6]
|
|
self.atr_header_offset = 16
|
|
else:
|
|
raise InvalidAtrHeader
|
|
|
|
def __str__(self):
|
|
return "%s Disk Image (size=%d (%dx%db), crc=%d flags=%d unused=%d)" % (self.file_format, self.size_in_bytes, self.max_sectors, self.sector_size, self.crc, self.flags, self.unused)
|
|
|
|
def check_size(self, size):
|
|
if self.size_in_bytes == 0:
|
|
if size == 92160:
|
|
self.size_in_bytes = size
|
|
self.sector_size = 128
|
|
elif size == 184320:
|
|
self.size_in_bytes = size
|
|
self.sector_size = 256
|
|
self.initial_sector_size = self.sector_size
|
|
self.num_initial_sectors = 0
|
|
self.max_sectors = self.size_in_bytes / self.sector_size
|
|
|
|
def sector_is_valid(self, sector):
|
|
return sector >= 0 and sector < self.max_sectors
|
|
|
|
def get_pos(self, sector):
|
|
if not self.sector_is_valid(sector):
|
|
raise ByteNotInFile166("Sector %d out of range" % sector)
|
|
if sector <= self.num_initial_sectors:
|
|
pos = self.num_initial_sectors * (sector - 1)
|
|
size = self.initial_sector_size
|
|
else:
|
|
pos = self.num_initial_sectors * self.initial_sector_size + (sector - 1 - self.num_initial_sectors) * self.sector_size
|
|
size = self.sector_size
|
|
pos += self.atr_header_offset
|
|
return pos, size
|
|
|
|
class XfdHeader(AtrHeader):
|
|
file_format = "XFD"
|
|
|
|
def __str__(self):
|
|
return "%s Disk Image (size=%d (%dx%db)" % (self.file_format, self.size_in_bytes, self.max_sectors, self.sector_size)
|
|
|
|
class AtrDirent(object):
|
|
format = "<Bhh8s3s"
|
|
|
|
def __init__(self, disk, file_num=0, bytes=None):
|
|
self.file_num = file_num
|
|
self.flag = 0
|
|
self.opened_output = False
|
|
self.dos_2 = False
|
|
self.mydos = False
|
|
self.is_dir = False
|
|
self.locked = False
|
|
self.in_use = False
|
|
self.deleted = False
|
|
self.num_sectors = 0
|
|
self.starting_sector = 0
|
|
self.filename = ""
|
|
self.ext = ""
|
|
if bytes is None:
|
|
return
|
|
values = struct.unpack(self.format, bytes)
|
|
flag = values[0]
|
|
self.flag = flag
|
|
self.opened_output = (flag&0x01) > 0
|
|
self.dos_2 = (flag&0x02) > 0
|
|
self.mydos = (flag&0x04) > 0
|
|
self.is_dir = (flag&0x10) > 0
|
|
self.locked = (flag&0x20) > 0
|
|
self.in_use = (flag&0x40) > 0
|
|
self.deleted = (flag&0x80) > 0
|
|
self.num_sectors = values[1]
|
|
self.starting_sector = values[2]
|
|
self.filename = values[3].rstrip()
|
|
self.ext = values[4].rstrip()
|
|
self.current_sector = 0
|
|
self.is_sane = self.sanity_check(disk)
|
|
|
|
def __str__(self):
|
|
output = "o" if self.opened_output else "."
|
|
dos2 = "2" if self.dos_2 else "."
|
|
mydos = "m" if self.mydos else "."
|
|
in_use = "u" if self.in_use else "."
|
|
deleted = "d" if self.deleted else "."
|
|
locked = "*" if self.locked else " "
|
|
flags = "%s%s%s%s%s%s %03d" % (output, dos2, mydos, in_use, deleted, locked, self.starting_sector)
|
|
if self.in_use:
|
|
return "File #%-2d (%s) %-8s%-3s %03d" % (self.file_num, flags, self.filename, self.ext, self.num_sectors)
|
|
return
|
|
|
|
def sanity_check(self, disk):
|
|
if not self.in_use:
|
|
return True
|
|
if not disk.header.sector_is_valid(self.starting_sector):
|
|
return False
|
|
if self.num_sectors < 0 or self.num_sectors > disk.header.max_sectors:
|
|
return False
|
|
return True
|
|
|
|
def start_read(self):
|
|
self.current_sector = self.starting_sector
|
|
self.current_read = self.num_sectors
|
|
|
|
def read_sector(self, disk):
|
|
raw = disk.get_raw_bytes(self.current_sector)
|
|
bytes = self.process_raw_sector(disk, raw)
|
|
return (bytes, self.current_sector == 0)
|
|
|
|
def process_raw_sector(self, disk, raw):
|
|
file_num = ord(raw[-3]) >> 2
|
|
if file_num != self.file_num:
|
|
raise FileNumberMismatchError164()
|
|
self.current_sector = ((ord(raw[-3]) & 0x3) << 8) + ord(raw[-2])
|
|
num_bytes = ord(raw[-1])
|
|
return raw[0:num_bytes]
|
|
|
|
def get_filename(self):
|
|
ext = ("." + self.ext) if self.ext else ""
|
|
return self.filename + ext
|
|
|
|
class MydosDirent(AtrDirent):
|
|
def process_raw_sector(self, disk, raw):
|
|
self.current_read -= 1
|
|
if self.current_read == 0:
|
|
self.current_sector = 0
|
|
else:
|
|
self.current_sector += 1
|
|
if self.current_sector == disk.first_vtoc:
|
|
self.current_sector = disk.first_data_after_vtoc
|
|
return raw
|
|
|
|
|
|
class InvalidBinaryFile(AtrError):
|
|
pass
|
|
|
|
class ObjSegment(object):
|
|
def __init__(self, metadata_start, data_start, start_addr, end_addr, data, name="", error=None):
|
|
self.name = name
|
|
self.metadata_start = metadata_start
|
|
self.data_start = data_start
|
|
self.start_addr = start_addr
|
|
self.end_addr = end_addr
|
|
self.data = data
|
|
self.error = error
|
|
if name and not name.endswith(" "):
|
|
name += " "
|
|
self.name = name
|
|
|
|
def __str__(self):
|
|
s = "%s%04x-%04x (%04x @ %04x)" % (self.name, self.start_addr, self.end_addr, len(self.data), self.data_start)
|
|
if self.error:
|
|
s += " " + self.error
|
|
return s
|
|
|
|
def __len__(self):
|
|
return len(self.data)
|
|
|
|
def __getitem__(self, val):
|
|
return self.data[val]
|
|
|
|
class AtariDosFile(object):
|
|
"""Parse a binary chunk into segments according to the Atari DOS object
|
|
file format.
|
|
|
|
Ref: http://www.atarimax.com/jindroush.atari.org/afmtexe.html
|
|
"""
|
|
def __init__(self, data):
|
|
self.data = data
|
|
self.size = len(data)
|
|
self.segments = []
|
|
self.parse_segments()
|
|
|
|
def __str__(self):
|
|
return "\n".join(str(s) for s in self.segments) + "\n"
|
|
|
|
def parse_segments(self):
|
|
bytes = self.data
|
|
pos = 0
|
|
first = True
|
|
while pos < self.size:
|
|
header, = struct.unpack("<H", bytes[pos:pos+2])
|
|
if header == 0xffff:
|
|
# Apparently 0xffff header can appear in any segment, not just
|
|
# the first. Regardless, it is ignored everywhere.
|
|
pos += 2
|
|
elif first:
|
|
raise InvalidBinaryFile
|
|
first = False
|
|
if len(bytes[pos:pos + 4]) < 4:
|
|
self.segments.append(ObjSegment(0, 0, bytes[pos:pos + 4], "Short Segment Header"))
|
|
break
|
|
start, end = struct.unpack("<HH", bytes[pos:pos + 4])
|
|
count = end - start + 1
|
|
found = len(bytes[pos + 4:pos + 4 + count])
|
|
if found < count:
|
|
self.segments.append(ObjSegment(pos, pos + 4, start, end, bytes[pos + 4:pos + 4 + count], "Incomplete Data"))
|
|
break
|
|
self.segments.append(ObjSegment(pos, pos + 4, start, end, bytes[pos + 4:pos + 4 + count]))
|
|
pos += 4 + count
|
|
|
|
class AtrFileSegment(ObjSegment):
|
|
def __init__(self, dirent, data, error=None):
|
|
ObjSegment.__init__(self, 0, data, error)
|
|
self.dirent = dirent
|
|
|
|
def __str__(self):
|
|
s = str(self.dirent)
|
|
if self.error:
|
|
s += " " + self.error
|
|
return s
|
|
|
|
class AtrDiskImage(object):
|
|
def __init__(self, bytes):
|
|
self.bytes = bytes
|
|
self.header = None
|
|
self.first_vtoc = 360
|
|
self.first_data_after_vtoc = 369
|
|
self.total_sectors = 0
|
|
self.unused_sectors = 0
|
|
self.files = []
|
|
self.segments = []
|
|
self.all_sane = True
|
|
self.setup()
|
|
|
|
def __str__(self):
|
|
if self.all_sane:
|
|
return "%s %d usable sectors (%d free), %d files" % (self.header, self.total_sectors, self.unused_sectors, len(self.files))
|
|
else:
|
|
return "%s bad directory entries; possible boot disk? Use -f option to try to extract anyway" % self.header
|
|
|
|
def dir(self):
|
|
lines = []
|
|
lines.append(str(self))
|
|
for dirent in self.files:
|
|
if dirent.in_use:
|
|
lines.append(str(dirent))
|
|
return "\n".join(lines)
|
|
|
|
def setup(self):
|
|
self.size = len(self.bytes)
|
|
|
|
self.read_atr_header()
|
|
self.check_size()
|
|
self.get_vtoc()
|
|
self.get_directory()
|
|
|
|
def read_atr_header(self):
|
|
bytes = self.bytes[0:16]
|
|
try:
|
|
self.header = AtrHeader(bytes)
|
|
except InvalidAtrHeader:
|
|
self.header = XfdHeader()
|
|
|
|
def check_size(self):
|
|
self.header.check_size(self.size)
|
|
|
|
def get_raw_bytes(self, sector):
|
|
pos, size = self.header.get_pos(sector)
|
|
return self.bytes[pos:pos + size]
|
|
|
|
def get_sectors(self, start, end=None):
|
|
""" Get contiguous sectors
|
|
|
|
:param start: first sector number to read (note: numbering starts from 1)
|
|
:param end: last sector number to read
|
|
:returns: bytes
|
|
"""
|
|
pos, size = self.header.get_pos(start)
|
|
if end is None:
|
|
end = start
|
|
while start < end:
|
|
start += 1
|
|
_, more = self.header.get_pos(start)
|
|
size += more
|
|
return self.bytes[pos:pos + size]
|
|
|
|
def get_vtoc(self):
|
|
bytes = self.get_sectors(360)[0:5]
|
|
values = struct.unpack("<BHH", bytes)
|
|
code = values[0]
|
|
if code == 0 or code == 2:
|
|
num = 1
|
|
else:
|
|
num = (code * 2) - 3
|
|
self.first_vtoc = 360 - num + 1
|
|
self.total_sectors = values[1]
|
|
self.unused_sectors = values[2]
|
|
|
|
def get_directory(self):
|
|
dir_bytes = self.get_sectors(361, 368)
|
|
i = 0
|
|
num = 0
|
|
files = []
|
|
while i < len(dir_bytes):
|
|
dirent = AtrDirent(self, num, dir_bytes[i:i+16])
|
|
if dirent.mydos:
|
|
dirent = MydosDirent(self, num, dir_bytes[i:i+16])
|
|
|
|
if dirent.in_use:
|
|
files.append(dirent)
|
|
if not dirent.is_sane:
|
|
self.all_sane = False
|
|
elif dirent.flag == 0:
|
|
break
|
|
i += 16
|
|
num += 1
|
|
self.files = files
|
|
|
|
def get_file(self, dirent):
|
|
output = StringIO()
|
|
dirent.start_read()
|
|
while True:
|
|
bytes, last = dirent.read_sector(self)
|
|
output.write(bytes)
|
|
if last:
|
|
break
|
|
return output.getvalue()
|
|
|
|
def find_file(self, filename):
|
|
for dirent in self.files:
|
|
if filename == dirent.get_filename():
|
|
bytes = self.get_file(dirent)
|
|
return bytes
|
|
return ""
|
|
|
|
def get_boot_segments(self):
|
|
bytes = self.get_sectors(1)[0:20]
|
|
values = struct.unpack("<BBHHBHBBBHBHBH", bytes)
|
|
flag = values[0]
|
|
segments = []
|
|
if flag == 0:
|
|
num = values[1]
|
|
addr = values[2]
|
|
bytes = self.get_sectors(1, num)
|
|
header = ObjSegment(0, 0, addr, addr + 20, bytes[0:20], name="Boot Header")
|
|
sectors = ObjSegment(0, 0, addr, addr + len(bytes), bytes, name="Boot Sectors")
|
|
code = ObjSegment(0, 0, addr + 20, addr + len(bytes), bytes[20:], name="Boot Code")
|
|
segments = [sectors, header, code]
|
|
return segments
|
|
|
|
def parse_segments(self):
|
|
if self.header.size_in_bytes > 0:
|
|
self.segments.append(ObjSegment(0, 0, 0, self.header.atr_header_offset, self.bytes[0:self.header.atr_header_offset], name="%s Header" % self.header.file_format))
|
|
self.segments.append(ObjSegment(0, 0, 0, self.header.size_in_bytes, self.bytes[self.header.atr_header_offset:], name="Raw disk sectors"))
|
|
self.segments.extend(self.get_boot_segments())
|
|
|
|
|
|
# for dirent in self.atr.files:
|
|
# try:
|
|
# bytes = self.get_file(dirent)
|
|
# error = None
|
|
# except atrcopy.FileNumberMismatchError164:
|
|
# bytes = None
|
|
# error = "Error 164"
|
|
# except atrcopy.ByteNotInFile166:
|
|
# bytes = None
|
|
# error = "Invalid sector"
|
|
# a = AtrFileSegment(dirent, bytes, error)
|
|
# self.segments.append(AtrSegment(dirent))
|
|
|
|
def process(dirent, options):
|
|
skip = False
|
|
action = "copying to"
|
|
filename = dirent.get_filename()
|
|
outfilename = filename
|
|
if options.no_sys:
|
|
if dirent.ext == "SYS":
|
|
skip = True
|
|
action = "skipping system file"
|
|
if not skip:
|
|
if options.xex:
|
|
outfilename = "%s%s.XEX" % (dirent.filename, dirent.ext)
|
|
if options.lower:
|
|
outfilename = outfilename.lower()
|
|
|
|
if options.dry_run:
|
|
action = "DRY_RUN: %s" % action
|
|
skip = True
|
|
if not skip:
|
|
bytes = atr.get_file(dirent)
|
|
with open(outfilename, "wb") as fh:
|
|
fh.write(bytes)
|
|
if options.extract:
|
|
print "%s: %s %s" % (dirent, action, outfilename)
|
|
else:
|
|
print dirent
|
|
|
|
if __name__ == "__main__":
|
|
import sys
|
|
import argparse
|
|
|
|
parser = argparse.ArgumentParser(description="Extract images off ATR format disks")
|
|
parser.add_argument("-v", "--verbose", default=0, action="count")
|
|
parser.add_argument("-l", "--lower", action="store_true", default=False, help="convert filenames to lower case")
|
|
parser.add_argument("--dry-run", action="store_true", default=False, help="don't extract, just show what would have been extracted")
|
|
parser.add_argument("-n", "--no-sys", action="store_true", default=False, help="only extract things that look like games (no DOS or .SYS files)")
|
|
parser.add_argument("-x", "--extract", action="store_true", default=False, help="extract files")
|
|
parser.add_argument("--xex", action="store_true", default=False, help="add .xex extension")
|
|
parser.add_argument("-f", "--force", action="store_true", default=False, help="force operation on disk images that have bad directory entries or look like boot disks")
|
|
parser.add_argument("files", metavar="ATR", nargs="+", help="an ATR image file [or a list of them]")
|
|
parser.add_argument("-s", "--segments", action="store_true", default=False, help="display segments")
|
|
options, extra_args = parser.parse_known_args()
|
|
|
|
for filename in options.files:
|
|
with open(filename, "rb") as fh:
|
|
data = fh.read()
|
|
try:
|
|
atr = AtrDiskImage(data)
|
|
print "%s: %s" % (filename, atr)
|
|
except:
|
|
print "%s: Doesn't look like a supported disk image" % filename
|
|
try:
|
|
xex = AtariDosFile(data)
|
|
print xex
|
|
except InvalidBinaryFile:
|
|
print "%s: Doesn't look like an XEX either" % filename
|
|
continue
|
|
if options.segments:
|
|
atr.parse_segments()
|
|
print "\n".join([str(a) for a in atr.segments])
|
|
elif atr.all_sane or options.force:
|
|
for dirent in atr.files:
|
|
try:
|
|
process(dirent, options)
|
|
except FileNumberMismatchError164:
|
|
print "Error 164: %s" % str(dirent)
|
|
except ByteNotInFile166:
|
|
print "Invalid sector for: %s" % str(dirent)
|
|
|