1
0
mirror of https://github.com/TomHarte/CLK.git synced 2024-11-26 23:52:26 +00:00
CLK/Storage/Disk/DiskImage/Formats/IPF.cpp

440 lines
14 KiB
C++
Raw Normal View History

2021-12-25 22:06:47 +00:00
//
// IPF.cpp
// Clock Signal
//
// Created by Thomas Harte on 25/12/2021.
// Copyright © 2021 Thomas Harte. All rights reserved.
//
#include "IPF.hpp"
#include "../../Encodings/MFM/Encoder.hpp"
2022-01-02 00:03:07 +00:00
#include <cassert>
2021-12-25 22:06:47 +00:00
using namespace Storage::Disk;
2021-12-26 00:36:54 +00:00
namespace {
2021-12-26 14:12:44 +00:00
constexpr uint32_t block(const char (& src)[5]) {
return uint32_t(
(uint32_t(src[0]) << 24) |
(uint32_t(src[1]) << 16) |
(uint32_t(src[2]) << 8) |
uint32_t(src[3])
);
2021-12-26 00:36:54 +00:00
}
size_t block_size(Storage::FileHolder &file, uint8_t header) {
2021-12-27 23:12:44 +00:00
uint8_t size_width = header >> 5;
size_t length = 0;
while(size_width--) {
length = (length << 8) | file.get8();
}
return length;
}
2021-12-26 00:36:54 +00:00
}
2021-12-25 22:06:47 +00:00
IPF::IPF(const std::string &file_name) : file_(file_name) {
2021-12-26 19:49:51 +00:00
std::map<uint32_t, Track::Address> tracks_by_data_key;
// For now, just build up a list of tracks that exist, noting the file position at which their data begins
// plus the other fields that'll be necessary to convert them into flux on demand later.
while(true) {
const auto start_of_block = file_.tell();
const uint32_t type = file_.get32be();
uint32_t length = file_.get32be(); // Can't be const because of the dumb encoding of DATA blocks.
[[maybe_unused]] const uint32_t crc = file_.get32be();
if(file_.eof()) break;
2021-12-25 22:32:29 +00:00
// Sanity check: the first thing in a file should be the CAPS record.
2021-12-26 00:36:54 +00:00
if(!start_of_block && type != block("CAPS")) {
2021-12-25 22:32:29 +00:00
throw Error::InvalidFormat;
}
switch(type) {
default:
printf("Ignoring %c%c%c%c, starting at %ld of length %d\n", (type >> 24), (type >> 16) & 0xff, (type >> 8) & 0xff, type & 0xff, start_of_block, length);
break;
2021-12-26 00:36:54 +00:00
case block("CAPS"):
2021-12-25 22:32:29 +00:00
// Analogously to the sanity check above, if a CAPS block is anywhere other
// than first then something is amiss.
if(start_of_block) {
throw Error::InvalidFormat;
}
break;
2021-12-26 00:36:54 +00:00
case block("INFO"): {
2021-12-25 23:17:13 +00:00
// There are a lot of useful archival fields in the info chunk, which for emulation
// aren't that interesting.
// Make sure this is a floppy disk.
const uint32_t media_type = file_.get32be();
if(media_type != 1) {
throw Error::InvalidFormat;
}
2021-12-27 23:12:44 +00:00
// Determine whether this is a newer SPS-style file.
is_sps_format_ = file_.get32be() > 1;
// Skip: revision, file key and revision, CRC of the original .ctr, and minimum track.
file_.seek(20, SEEK_CUR);
2021-12-25 23:17:13 +00:00
track_count_ = int(1 + file_.get32be());
// Skip: min side.
file_.seek(4, SEEK_CUR);
head_count_ = int(1 + file_.get32be());
// Skip: creation date, time.
file_.seek(8, SEEK_CUR);
platform_type_ = 0;
for(int c = 0; c < 4; c++) {
const uint8_t platform = file_.get8();
switch(platform) {
default: break;
case 1: platform_type_ |= TargetPlatform::Amiga; break;
case 2: platform_type_ |= TargetPlatform::AtariST; break;
/* Omitted: 3 -> IBM PC */
case 4: platform_type_ |= TargetPlatform::AmstradCPC; break;
case 5: platform_type_ |= TargetPlatform::ZXSpectrum; break;
/* Omitted: 6 -> Sam Coupé */
/* Omitted: 7 -> Archimedes */
/* Omitted: 8 -> C64 */
/* Omitted: 9 -> Atari 8-bit */
}
}
// If the file didn't declare anything, default to supporting everything.
if(!platform_type_) {
platform_type_ = ~0;
}
// Ignore: disk number, creator ID, reserved area.
} break;
2021-12-26 19:49:51 +00:00
case block("IMGE"): {
// Get track location.
const uint32_t track = file_.get32be();
const uint32_t side = file_.get32be();
const Track::Address address{int(side), HeadPosition(int(track))};
// Hence generate a TrackDescription.
auto pair = tracks_.emplace(address, TrackDescription());
TrackDescription &description = pair.first->second;
// Read those fields of interest...
// Bit density. I've no idea why the density can't just be given as a measurement.
description.density = TrackDescription::Density(file_.get32be());
if(description.density > TrackDescription::Density::Max) {
description.density = TrackDescription::Density::Unknown;
}
file_.seek(12, SEEK_CUR); // Skipped: signal type, track bytes, start byte position.
description.start_bit_pos = file_.get32be();
description.data_bits = file_.get32be();
description.gap_bits = file_.get32be();
file_.seek(4, SEEK_CUR); // Skipped: track bits, which is entirely redundant.
description.block_count = file_.get32be();
file_.seek(4, SEEK_CUR); // Skipped: encoder process.
description.has_fuzzy_bits = file_.get32be() & 1;
// For some reason the authors decided to introduce another primary key,
// in addition to that which naturally exists of (track, side). So set up
// a mapping from the one to the other.
const uint32_t data_key = file_.get32be();
tracks_by_data_key.emplace(data_key, address);
} break;
2021-12-26 14:12:44 +00:00
2021-12-26 00:36:54 +00:00
case block("DATA"): {
length += file_.get32be();
2021-12-26 19:49:51 +00:00
file_.seek(8, SEEK_CUR); // Skipped: bit size, CRC.
// Grab the data key and use that to establish the file starting
// position for this track.
//
// Assumed here: DATA records will come after corresponding IMGE records.
const uint32_t data_key = file_.get32be();
const auto pair = tracks_by_data_key.find(data_key);
if(pair == tracks_by_data_key.end()) {
break;
}
auto description = tracks_.find(pair->second);
if(description == tracks_.end()) {
break;
}
description->second.file_offset = file_.tell();
} break;
}
file_.seek(start_of_block + length, SEEK_SET);
}
2021-12-25 22:06:47 +00:00
}
HeadPosition IPF::get_maximum_head_position() {
2021-12-25 23:17:13 +00:00
return HeadPosition(track_count_);
2021-12-25 22:06:47 +00:00
}
int IPF::get_head_count() {
2021-12-25 23:17:13 +00:00
return head_count_;
2021-12-25 22:06:47 +00:00
}
std::shared_ptr<Track> IPF::get_track_at_position([[maybe_unused]] Track::Address address) {
2021-12-27 23:12:44 +00:00
// Get the track description, if it exists, and check either that the file has contents for the track.
auto pair = tracks_.find(address);
if(pair == tracks_.end()) {
return nullptr;
}
const TrackDescription &description = pair->second;
if(!description.file_offset) {
return nullptr;
}
// Seek to track content.
file_.seek(description.file_offset, SEEK_SET);
// Read the block descriptions up front.
//
// This is less efficient than just seeking for each block in turn,
// but is a useful crutch to comprehension of the file format on a
// first run through.
struct BlockDescriptor {
uint32_t data_bits = 0;
uint32_t gap_bits = 0;
uint32_t gap_offset = 0;
bool is_mfm = false;
bool has_forward_gap = false;
bool has_backwards_gap = false;
bool data_unit_is_bits = false;
uint32_t default_gap_value = 0;
uint32_t data_offset = 0;
};
std::vector<BlockDescriptor> blocks;
blocks.reserve(description.block_count);
for(uint32_t c = 0; c < description.block_count; c++) {
auto &block = blocks.emplace_back();
block.data_bits = file_.get32be();
block.gap_bits = file_.get32be();
if(is_sps_format_) {
block.gap_offset = file_.get32be();
file_.seek(4, SEEK_CUR); // Skip 'cell type' which appears to provide no content.
} else {
// Skip potlower-resolution copies of data_bits and gap_bits.
file_.seek(8, SEEK_CUR);
}
block.is_mfm = file_.get32be() == 1;
const uint32_t flags = file_.get32be();
block.has_forward_gap = flags & 1;
block.has_backwards_gap = flags & 2;
block.data_unit_is_bits = flags & 4;
block.default_gap_value = file_.get32be();
block.data_offset = file_.get32be();
}
std::vector<Storage::Disk::PCMSegment> segments;
int block_count = 0;
2021-12-27 23:12:44 +00:00
for(auto &block: blocks) {
const auto length_of_a_bit = bit_length(description.density, block_count);
2021-12-27 23:12:44 +00:00
if(block.gap_offset) {
file_.seek(description.file_offset + block.gap_offset, SEEK_SET);
while(true) {
const uint8_t gap_header = file_.get8();
if(!gap_header) break;
// Decompose the header and read the length.
enum class Type {
None, GapLength, SampleLength
} type = Type(gap_header & 0x1f);
const size_t length = block_size(file_, gap_header);
switch(type) {
case Type::GapLength:
printf("Adding gap length %zu bits\n", length);
add_gap(segments, length_of_a_bit, length, block.default_gap_value);
2021-12-27 23:12:44 +00:00
break;
default:
case Type::SampleLength:
printf("Adding sampled gap length %zu bits\n", length);
add_raw_data(segments, length_of_a_bit, length);
// file_.seek(long(length >> 3), SEEK_CUR);
2021-12-27 23:12:44 +00:00
break;
}
}
} else if(block.gap_bits) {
add_gap(segments, length_of_a_bit, block.gap_bits, block.default_gap_value);
2021-12-27 23:12:44 +00:00
}
if(block.data_offset) {
file_.seek(description.file_offset + block.data_offset, SEEK_SET);
while(true) {
const uint8_t data_header = file_.get8();
if(!data_header) break;
// Decompose the header and read the length.
enum class Type {
None, Sync, Data, Gap, Raw, Fuzzy
} type = Type(data_header & 0x1f);
const size_t length = block_size(file_, data_header) * (block.data_unit_is_bits ? 1 : 8);
#ifndef NDEBUG
const auto next_chunk = file_.tell() + long(length >> 3);
#endif
2021-12-27 23:12:44 +00:00
switch(type) {
case Type::Gap:
case Type::Data:
add_unencoded_data(segments, length_of_a_bit, length);
break;
case Type::Sync:
case Type::Raw:
add_raw_data(segments, length_of_a_bit, length);
break;
2021-12-27 23:12:44 +00:00
default:
2021-12-27 23:55:11 +00:00
printf("Unhandled data type %d, length %zu bits\n", int(type), length);
2021-12-27 23:12:44 +00:00
break;
}
assert(file_.tell() == next_chunk);
2021-12-27 23:12:44 +00:00
}
}
++block_count;
2021-12-27 23:12:44 +00:00
}
return std::make_shared<Storage::Disk::PCMTrack>(segments);
2021-12-25 22:06:47 +00:00
}
/// @returns The correct bit length for @c block on a track of @c density.
///
/// @discussion At least to me, this is the least well-designed part] of the IPF specification; rather than just dictating cell
/// densities (or, equivalently, lengths) in the file, densities are named according to their protection scheme and the decoder
/// is required to know all named protection schemes. Which makes IPF unable to handle arbitrary disks (or, indeed, disks
/// with multiple protection schemes on a single track).
Storage::Time IPF::bit_length(TrackDescription::Density density, int block) {
constexpr unsigned int us = 100'000'000;
static constexpr auto us170 = Storage::Time::simplified(170, us);
static constexpr auto us180 = Storage::Time::simplified(180, us);
static constexpr auto us189 = Storage::Time::simplified(189, us);
static constexpr auto us190 = Storage::Time::simplified(190, us);
static constexpr auto us199 = Storage::Time::simplified(199, us);
static constexpr auto us200 = Storage::Time::simplified(200, us);
static constexpr auto us209 = Storage::Time::simplified(209, us);
static constexpr auto us210 = Storage::Time::simplified(210, us);
static constexpr auto us220 = Storage::Time::simplified(220, us);
switch(density) {
default:
break;
case TrackDescription::Density::CopylockAmiga:
if(block == 4) return us189;
if(block == 5) return us199;
if(block == 6) return us209;
break;
case TrackDescription::Density::CopylockAmigaNew:
if(block == 0) return us189;
if(block == 1) return us199;
if(block == 2) return us209;
break;
case TrackDescription::Density::CopylockST:
if(block == 5) return us210;
break;
case TrackDescription::Density::SpeedlockAmiga:
if(block == 1) return us220;
if(block == 2) return us180;
break;
case TrackDescription::Density::OldSpeedlockAmiga:
if(block == 1) return us210;
break;
case TrackDescription::Density::AdamBrierleyAmiga:
if(block == 1) return us220;
if(block == 2) return us210;
if(block == 3) return us200;
if(block == 4) return us190;
if(block == 5) return us180;
if(block == 6) return us170;
break;
// TODO: AdamBrierleyDensityKeyAmiga.
}
return us200; // i.e. default to 2µs.
}
void IPF::add_gap(std::vector<Storage::Disk::PCMSegment> &track, Time bit_length, size_t num_bits, uint32_t value) {
auto &segment = track.emplace_back();
segment.length_of_a_bit = bit_length;
// Empirically, I think gaps require MFM encoding.
const auto byte_length = (num_bits + 7) >> 3;
segment.data.reserve(byte_length * 16);
auto encoder = Storage::Encodings::MFM::GetMFMEncoder(segment.data);
while(segment.data.size() < num_bits) {
encoder->add_byte(uint8_t(value >> 24));
value = (value << 8) | (value >> 24);
}
assert(segment.data.size() <= (byte_length * 16));
segment.data.resize(num_bits);
}
void IPF::add_unencoded_data(std::vector<Storage::Disk::PCMSegment> &track, Time bit_length, size_t num_bits) {
auto &segment = track.emplace_back();
segment.length_of_a_bit = bit_length;
// Length appears to be in pre-encoded bits; double that to get encoded bits.
2022-06-03 19:43:27 +00:00
#ifndef NDEBUG
const auto byte_length = (num_bits + 7) >> 3;
2022-06-03 19:43:27 +00:00
#endif
segment.data.reserve(num_bits * 16);
auto encoder = Storage::Encodings::MFM::GetMFMEncoder(segment.data);
for(size_t c = 0; c < num_bits; c += 8) {
encoder->add_byte(file_.get8());
}
assert(segment.data.size() <= (byte_length * 16));
segment.data.resize(num_bits * 2);
}
void IPF::add_raw_data(std::vector<Storage::Disk::PCMSegment> &track, Time bit_length, size_t num_bits) {
auto &segment = track.emplace_back();
segment.length_of_a_bit = bit_length;
const auto num_bits_ceiling = size_t(num_bits + 7) & size_t(~7);
segment.data.reserve(num_bits_ceiling);
for(size_t bit = 0; bit < num_bits; bit += 8) {
const uint8_t next = file_.get8();
segment.data.push_back(next & 0x80);
segment.data.push_back(next & 0x40);
segment.data.push_back(next & 0x20);
segment.data.push_back(next & 0x10);
segment.data.push_back(next & 0x08);
segment.data.push_back(next & 0x04);
segment.data.push_back(next & 0x02);
segment.data.push_back(next & 0x01);
}
assert(segment.data.size() <= num_bits_ceiling);
segment.data.resize(num_bits);
}