#!/usr/bin/env python __version__ = "2.0.0" import types import numpy as np class AtrError(RuntimeError): pass class InvalidAtrHeader(AtrError): pass class LastDirent(AtrError): pass class FileNumberMismatchError164(AtrError): pass class ByteNotInFile166(AtrError): pass class AtrHeader(object): # ATR Format described in http://www.atarimax.com/jindroush.atari.org/afmtatr.html format = np.dtype([ ('wMagic', ' 0 and sector <= self.max_sectors def get_pos(self, sector): if not self.sector_is_valid(sector): raise ByteNotInFile166("Sector %d out of range" % sector) if sector <= self.num_initial_sectors: pos = self.num_initial_sectors * (sector - 1) size = self.initial_sector_size else: pos = self.num_initial_sectors * self.initial_sector_size + (sector - 1 - self.num_initial_sectors) * self.sector_size size = self.sector_size pos += self.atr_header_offset return pos, size class XfdHeader(AtrHeader): file_format = "XFD" def __str__(self): return "%s Disk Image (size=%d (%dx%db)" % (self.file_format, self.size_in_bytes, self.max_sectors, self.sector_size) class AtrDirent(object): # ATR Dirent structure described at http://atari.kensclassics.org/dos.htm format = np.dtype([ ('FLAG', 'u1'), ('COUNT', ' 0 self.dos_2 = (flag&0x02) > 0 self.mydos = (flag&0x04) > 0 self.is_dir = (flag&0x10) > 0 self.locked = (flag&0x20) > 0 self.in_use = (flag&0x40) > 0 self.deleted = (flag&0x80) > 0 self.num_sectors = int(values[1]) self.starting_sector = int(values[2]) self.filename = str(values[3]).rstrip() self.ext = str(values[4]).rstrip() self.current_sector = 0 self.is_sane = self.sanity_check(disk) def __str__(self): output = "o" if self.opened_output else "." dos2 = "2" if self.dos_2 else "." mydos = "m" if self.mydos else "." in_use = "u" if self.in_use else "." deleted = "d" if self.deleted else "." 
locked = "*" if self.locked else " " flags = "%s%s%s%s%s%s %03d" % (output, dos2, mydos, in_use, deleted, locked, self.starting_sector) if self.in_use: return "File #%-2d (%s) %-8s%-3s %03d" % (self.file_num, flags, self.filename, self.ext, self.num_sectors) return def sanity_check(self, disk): if not self.in_use: return True if not disk.header.sector_is_valid(self.starting_sector): return False if self.num_sectors < 0 or self.num_sectors > disk.header.max_sectors: return False return True def start_read(self): self.current_sector = self.starting_sector self.current_read = self.num_sectors def read_sector(self, disk): raw, pos, size = disk.get_raw_bytes(self.current_sector) bytes, num_data_bytes = self.process_raw_sector(disk, raw) return bytes, self.current_sector == 0, pos, num_data_bytes def process_raw_sector(self, disk, raw): try: file_num = ord(raw[-3]) >> 2 except TypeError: # if numpy data, don't need the ord() return self.process_raw_sector_numpy(disk, raw) if file_num != self.file_num: raise FileNumberMismatchError164() self.current_sector = ((ord(raw[-3]) & 0x3) << 8) + ord(raw[-2]) num_bytes = ord(raw[-1]) return raw[0:num_bytes], num_bytes def process_raw_sector_numpy(self, disk, raw): file_num = raw[-3] >> 2 if file_num != self.file_num: raise FileNumberMismatchError164() self.current_sector = ((raw[-3] & 0x3) << 8) + raw[-2] num_bytes = raw[-1] return raw[0:num_bytes], num_bytes def get_filename(self): ext = ("." 
+ self.ext) if self.ext else "" return self.filename + ext class MydosDirent(AtrDirent): def process_raw_sector(self, disk, raw): self.current_read -= 1 if self.current_read == 0: self.current_sector = 0 else: self.current_sector += 1 if self.current_sector == disk.first_vtoc: self.current_sector = disk.first_data_after_vtoc return raw class InvalidBinaryFile(AtrError): pass class DefaultSegment(object): debug = False def __init__(self, start_addr=0, data=None, name="All", error=None): self.start_addr = int(start_addr) # force python int to decouple from possibly being a numpy datatype if data is None: data = np.fromstring("", dtype=np.uint8) else: data = to_numpy(data) self.data = data self.style = np.zeros_like(self.data, dtype=np.uint8) if self.debug: self.style = np.arange(len(self), dtype=np.uint8) self.error = error self.name = name self.page_size = -1 self.map_width = 40 self._search_copy = None def __str__(self): return "%s (%d bytes)" % (self.name, len(self)) def __len__(self): return np.alen(self.data) def __getitem__(self, index): return self.data[index] def __setitem__(self, index, value): self.data[index] = value self._search_copy = None def byte_bounds_offset(self): return np.byte_bounds(self.data)[0] def tostring(self): return self.data.tostring() def get_style_bits(self, match=False, comment=False): style_bits = 0 if match: style_bits |= 1 if comment: style_bits |= 0x80 return style_bits def get_style_mask(self, match=False, comment=False): style_mask = 0xff if match: style_mask &= 0xfe if comment: style_mask &= 0x7f return style_mask def set_style_ranges(self, ranges, **kwargs): style_bits = self.get_style_bits(**kwargs) s = self.style for start, end in ranges: s[start:end] |= style_bits def clear_style_bits(self, **kwargs): style_mask = self.get_style_mask(**kwargs) self.style &= style_mask def label(self, index, lower_case=True): if lower_case: return "%04x" % (index + self.start_addr) else: return "%04X" % (index + self.start_addr) @property def 
search_copy(self): if self._search_copy is None: self._search_copy = self.data.tostring() return self._search_copy class ObjSegment(DefaultSegment): def __init__(self, metadata_start, data_start, start_addr, end_addr, data, name="", error=None): DefaultSegment.__init__(self, start_addr, data, name, error) self.metadata_start = metadata_start self.data_start = data_start def __str__(self): count = len(self) s = "%s $%04x-$%04x ($%04x @ $%04x)" % (self.name, self.start_addr, self.start_addr + count, count, self.data_start) if self.error: s += " " + self.error return s class RawSectorsSegment(DefaultSegment): def __init__(self, first_sector, num_sectors, count, data, **kwargs): DefaultSegment.__init__(self, 0, data, **kwargs) self.page_size = 128 self.first_sector = first_sector self.num_sectors = num_sectors def __str__(self): if self.num_sectors > 1: s = "%s (sectors %d-%d)" % (self.name, self.first_sector, self.first_sector + self.num_sectors - 1) else: s = "%s (sector %d)" % (self.name, self.first_sector) if self.error: s += " " + self.error return s def label(self, index, lower_case=True): sector, byte = divmod(index, self.page_size) if lower_case: return "s%03d:%02x" % (sector + self.first_sector, byte) return "s%03d:%02X" % (sector + self.first_sector, byte) class IndexedByteSegment(DefaultSegment): def __init__(self, byte_order, bytes, **kwargs): self.order = byte_order DefaultSegment.__init__(self, 0, bytes, **kwargs) def __str__(self): return "%s ($%x @ $%x)" % (self.name, len(self), self.order[0]) def __len__(self): return np.alen(self.order) def __getitem__(self, index): return self.data[self.order[index]] def __setitem__(self, index, value): self.data[self.order[index]] = value self._search_copy = None def byte_bounds_offset(self): return np.byte_bounds(self.data)[0] + self.order[0] def tostring(self): return self.data[self.order[:]].tostring() class AtariDosFile(object): """Parse a binary chunk into segments according to the Atari DOS object file format. 
Ref: http://www.atarimax.com/jindroush.atari.org/afmtexe.html """ def __init__(self, data): self.data = to_numpy(data) self.size = len(self.data) self.segments = [] self.parse_segments() def __str__(self): return "\n".join(str(s) for s in self.segments) + "\n" def get_obj_segment(self, metadata_start, data_start, start_addr, end_addr, data, name=""): """Subclass use: override this method to create a custom segment. By default uses an ObjSegment """ return ObjSegment(metadata_start, data_start, start_addr, end_addr, data, name) def parse_segments(self): bytes = self.data pos = 0 first = True while pos < self.size: header, = bytes[pos:pos+2].view(dtype=np.uint16) if header == 0xffff: # Apparently 0xffff header can appear in any segment, not just # the first. Regardless, it is ignored everywhere. pos += 2 elif first: raise InvalidBinaryFile first = False if len(bytes[pos:pos + 4]) < 4: self.segments.append(self.get_obj_segment(0, 0, bytes[pos:pos + 4], "Short Segment Header")) break start, end = bytes[pos:pos + 4].view(dtype=np.uint16) count = end - start + 1 found = len(bytes[pos + 4:pos + 4 + count]) if found < count: self.segments.append(self.get_obj_segment(pos, pos + 4, start, end, bytes[pos + 4:pos + 4 + count], "Incomplete Data")) break self.segments.append(self.get_obj_segment(pos, pos + 4, start, end, bytes[pos + 4:pos + 4 + count])) pos += 4 + count class AtrFileSegment(ObjSegment): def __init__(self, dirent, data, error=None): ObjSegment.__init__(self, 0, data, error) self.dirent = dirent def __str__(self): s = str(self.dirent) if self.error: s += " " + self.error return s class AtrDiskImage(object): def __init__(self, bytes): self.bytes = to_numpy(bytes) self.header = None self.first_vtoc = 360 self.num_vtoc = 1 self.first_data_after_vtoc = 369 self.total_sectors = 0 self.unused_sectors = 0 self.files = [] self.segments = [] self.all_sane = True self.setup() def __str__(self): if self.all_sane: return "%s %d usable sectors (%d free), %d files" % 
(self.header, self.total_sectors, self.unused_sectors, len(self.files)) else: return "%s bad directory entries; possible boot disk? Use -f option to try to extract anyway" % self.header def dir(self): lines = [] lines.append(str(self)) for dirent in self.files: if dirent.in_use: lines.append(str(dirent)) return "\n".join(lines) def setup(self): self.size = len(self.bytes) self.read_atr_header() self.check_size() self.get_vtoc() self.get_directory() def read_atr_header(self): bytes = self.bytes[0:16] try: self.header = AtrHeader(bytes) except InvalidAtrHeader: self.header = XfdHeader() def check_size(self): self.header.check_size(self.size) def get_raw_bytes(self, sector): pos, size = self.header.get_pos(sector) return self.bytes[pos:pos + size], pos, size def get_sectors(self, start, end=None): """ Get contiguous sectors :param start: first sector number to read (note: numbering starts from 1) :param end: last sector number to read :returns: bytes """ pos, size = self.header.get_pos(start) if end is None: end = start while start < end: start += 1 _, more = self.header.get_pos(start) size += more return self.bytes[pos:pos + size] vtoc_type = np.dtype([ ('code', 'u1'), ('total',' 0: self.segments.append(self.get_obj_segment(0, 0, 0, self.header.atr_header_offset, self.bytes[0:self.header.atr_header_offset], name="%s Header" % self.header.file_format)) self.segments.append(self.get_raw_sectors_segment(1, self.header.max_sectors, self.header.size_in_bytes, self.bytes[self.header.atr_header_offset:], name="Raw disk sectors")) self.segments.extend(self.get_boot_segments()) self.segments.extend(self.get_vtoc_segments()) self.segments.extend(self.get_directory_segments()) self.segments.extend(self.get_file_segments()) # for dirent in self.atr.files: # try: # bytes = self.get_file(dirent) # error = None # except atrcopy.FileNumberMismatchError164: # bytes = None # error = "Error 164" # except atrcopy.ByteNotInFile166: # bytes = None # error = "Invalid sector" # a = 
#             AtrFileSegment(dirent, bytes, error)
#             self.segments.append(AtrSegment(dirent))
# NOTE(review): the two lines above are the tail of a commented-out sketch
# that presumably closes AtrDiskImage's segment-building method; they are
# kept as comments, not live code -- confirm and delete the sketch if dead.


def to_numpy(value):
    """Return *value* as a numpy array of unsigned bytes.

    :param value: a numpy array (returned unchanged, no copy) or a byte
        string (``str`` on Python 2, ``bytes`` on Python 3) or ``bytearray``
    :returns: the array itself, or a new writable ``uint8`` array holding a
        copy of the bytes
    :raises TypeError: for any other input type
    """
    if isinstance(value, np.ndarray):
        return value
    if isinstance(value, (bytes, bytearray)):
        # frombuffer() yields a read-only view onto the immutable string;
        # copy so callers get an owned, writable array, which is what the
        # deprecated binary-mode np.fromstring() used to return.
        return np.frombuffer(value, dtype=np.uint8).copy()
    raise TypeError("Can't convert to numpy data")


def process(dirent, options, disk=None):
    """Report one directory entry and, when requested, extract it to disk.

    :param dirent: directory entry; must provide ``get_filename()``,
        ``filename`` and ``ext``
    :param options: parsed command-line options; the attributes read are
        ``no_sys``, ``xex``, ``lower``, ``dry_run`` and ``extract``
    :param disk: disk image whose ``get_file(dirent)`` supplies the file
        contents.  When omitted, the module-level ``atr`` set by the
        command-line script is used, as older callers expect.
    :returns: None

    Exceptions raised by ``get_file`` are not handled here; they propagate
    to the caller.
    """
    skip = False
    action = "copying to"
    outfilename = dirent.get_filename()
    if options.no_sys and dirent.ext == "SYS":
        skip = True
        action = "skipping system file"
    if not skip and options.xex:
        outfilename = "%s%s.XEX" % (dirent.filename, dirent.ext)
    if options.lower:
        outfilename = outfilename.lower()

    if options.dry_run:
        action = "DRY_RUN: %s" % action
        skip = True

    if not options.extract:
        # Listing mode: just show the entry.
        print(dirent)
        return

    print("%s: %s %s" % (dirent, action, outfilename))
    if skip:
        return
    # Resolve the fallback global only when data is actually needed, so
    # listing and dry runs never require it to exist.
    image = atr if disk is None else disk
    data = image.get_file(dirent)
    with open(outfilename, "wb") as fh:
        fh.write(data)


if __name__ == "__main__":
    import sys
    import argparse

    parser = argparse.ArgumentParser(description="Extract images off ATR format disks")
    parser.add_argument("-v", "--verbose", default=0, action="count")
    parser.add_argument("-l", "--lower", action="store_true", default=False, help="convert filenames to lower case")
    parser.add_argument("--dry-run", action="store_true", default=False, help="don't extract, just show what would have been extracted")
    parser.add_argument("-n", "--no-sys", action="store_true", default=False, help="only extract things that look like games (no DOS or .SYS files)")
    parser.add_argument("-x", "--extract", action="store_true", default=False, help="extract files")
    parser.add_argument("--xex", action="store_true", default=False, help="add .xex extension")
    parser.add_argument("-f", "--force", action="store_true", default=False, help="force operation on disk images that have bad directory entries or look like boot disks")
    parser.add_argument("files", metavar="ATR", nargs="+", help="an ATR image file [or a list of them]")
    parser.add_argument("-s", "--segments", action="store_true", default=False, help="display segments")
    options, extra_args = parser.parse_known_args()

    for filename in options.files:
        # Read everything up front so the file handle is released before
        # any parsing or extraction starts.
        with open(filename, "rb") as fh:
            data = fh.read()

        try:
            atr = AtrDiskImage(data)
            print("%s: %s" % (filename, atr))
        except Exception:
            # Any parse failure means "not a disk image"; Exception (rather
            # than a bare except) lets Ctrl-C and SystemExit through.
            print("%s: Doesn't look like a supported disk image" % filename)
            try:
                xex = AtariDosFile(data)
                print(xex)
            except InvalidBinaryFile:
                print("%s: Doesn't look like an XEX either" % filename)
            continue

        if options.segments:
            atr.parse_segments()
            print("\n".join([str(a) for a in atr.segments]))
        elif atr.all_sane or options.force:
            for dirent in atr.files:
                try:
                    process(dirent, options, atr)
                except FileNumberMismatchError164:
                    print("Error 164: %s" % str(dirent))
                except ByteNotInFile166:
                    print("Invalid sector for: %s" % str(dirent))