mirror of
https://github.com/TomHarte/CLK.git
synced 2025-02-21 20:29:06 +00:00
Begin a full-synchronous usage of the sequencer, at least exposing poor handling of the pipeline.
This commit is contained in:
parent
1ac0a4e924
commit
03d4960a03
@ -130,6 +130,7 @@ void Blitter::set_control(int index, uint16_t value) {
|
|||||||
channel_enables_[2] = value & 0x200;
|
channel_enables_[2] = value & 0x200;
|
||||||
channel_enables_[1] = value & 0x400;
|
channel_enables_[1] = value & 0x400;
|
||||||
channel_enables_[0] = value & 0x800;
|
channel_enables_[0] = value & 0x800;
|
||||||
|
sequencer_.set_control(value >> 8);
|
||||||
}
|
}
|
||||||
shifts_[index] = value >> 12;
|
shifts_[index] = value >> 12;
|
||||||
LOG("Set control " << index << " to " << PADHEX(4) << value);
|
LOG("Set control " << index << " to " << PADHEX(4) << value);
|
||||||
@ -335,89 +336,124 @@ bool Blitter::advance_dma() {
|
|||||||
// Copy mode.
|
// Copy mode.
|
||||||
|
|
||||||
// Quick hack: do the entire action atomically.
|
// Quick hack: do the entire action atomically.
|
||||||
|
sequencer_.begin();
|
||||||
a32_ = 0;
|
a32_ = 0;
|
||||||
b32_ = 0;
|
b32_ = 0;
|
||||||
|
|
||||||
for(int y = 0; y < height_; y++) {
|
y_ = 0;
|
||||||
bool fill_carry = fill_carry_;
|
x_ = 0;
|
||||||
|
int loop_index_ = -1;
|
||||||
|
write_phase_ = WritePhase::Starting;
|
||||||
|
stopping_ = false;
|
||||||
|
|
||||||
for(int x = 0; x < width_; x++) {
|
while(true) {
|
||||||
uint16_t a_mask = 0xffff;
|
const auto next = sequencer_.next();
|
||||||
if(x == 0) a_mask &= a_mask_[0];
|
|
||||||
if(x == width_ - 1) a_mask &= a_mask_[1];
|
|
||||||
|
|
||||||
if(channel_enables_[0]) {
|
// If this is the start of a new iteration, check for end of line,
|
||||||
a_data_ = ram_[pointer_[0] & ram_mask_];
|
// or of blit, and pick an appropriate mask for A based on location.
|
||||||
pointer_[0] += direction_;
|
if(next.second != loop_index_) {
|
||||||
}
|
transient_a_mask_ = 0xffff;
|
||||||
a32_ = (a32_ << 16) | (a_data_ & a_mask);
|
if(x_ == 0) transient_a_mask_ &= a_mask_[0];
|
||||||
|
if(x_ == width_ - 1) transient_a_mask_ &= a_mask_[1];
|
||||||
|
|
||||||
if(channel_enables_[1]) {
|
++x_;
|
||||||
b_data_ = ram_[pointer_[1] & ram_mask_];
|
if(x_ == width_) {
|
||||||
pointer_[1] += direction_;
|
x_ = 0;
|
||||||
}
|
++y_;
|
||||||
b32_ = (b32_ << 16) | b_data_;
|
if(y_ == height_) {
|
||||||
|
sequencer_.complete();
|
||||||
if(channel_enables_[2]) {
|
stopping_ = true;
|
||||||
c_data_ = ram_[pointer_[2] & ram_mask_];
|
|
||||||
pointer_[2] += direction_;
|
|
||||||
}
|
|
||||||
|
|
||||||
uint16_t a, b;
|
|
||||||
|
|
||||||
// The barrel shifter shifts to the right in ascending address mode,
|
|
||||||
// but to the left otherwise
|
|
||||||
if(!one_dot_) {
|
|
||||||
a = uint16_t(a32_ >> shifts_[0]);
|
|
||||||
b = uint16_t(b32_ >> shifts_[1]);
|
|
||||||
} else {
|
|
||||||
// TODO: there must be a neater solution than this.
|
|
||||||
a = uint16_t(
|
|
||||||
(a32_ << shifts_[0]) |
|
|
||||||
(a32_ >> (32 - shifts_[0]))
|
|
||||||
);
|
|
||||||
|
|
||||||
b = uint16_t(
|
|
||||||
(b32_ << shifts_[1]) |
|
|
||||||
(b32_ >> (32 - shifts_[1]))
|
|
||||||
);
|
|
||||||
}
|
|
||||||
|
|
||||||
uint16_t output =
|
|
||||||
apply_minterm<uint16_t>(
|
|
||||||
a,
|
|
||||||
b,
|
|
||||||
c_data_,
|
|
||||||
minterms_);
|
|
||||||
|
|
||||||
if(exclusive_fill_ || inclusive_fill_) {
|
|
||||||
// Use the fill tables nibble-by-nibble to figure out the filled word.
|
|
||||||
uint16_t fill_output = 0;
|
|
||||||
int ongoing_carry = fill_carry;
|
|
||||||
const int type_mask = exclusive_fill_ ? (1 << 5) : 0;
|
|
||||||
for(int c = 0; c < 16; c += 4) {
|
|
||||||
const int total_index = (output & 0xf) | (ongoing_carry << 4) | type_mask;
|
|
||||||
fill_output |= ((fill_values[total_index >> 3] >> ((total_index & 7) * 4)) & 0xf) << c;
|
|
||||||
ongoing_carry = (fill_carries[total_index >> 5] >> (total_index & 31)) & 1;
|
|
||||||
output >>= 4;
|
|
||||||
}
|
}
|
||||||
|
pointer_[0] += modulos_[0] * channel_enables_[0] * direction_;
|
||||||
output = fill_output;
|
pointer_[1] += modulos_[1] * channel_enables_[1] * direction_;
|
||||||
fill_carry = ongoing_carry;
|
pointer_[2] += modulos_[2] * channel_enables_[2] * direction_;
|
||||||
}
|
pointer_[3] += modulos_[3] * channel_enables_[3] * direction_;
|
||||||
|
|
||||||
not_zero_flag_ |= output;
|
|
||||||
|
|
||||||
if(channel_enables_[3]) {
|
|
||||||
ram_[pointer_[3] & ram_mask_] = output;
|
|
||||||
pointer_[3] += direction_;
|
|
||||||
}
|
}
|
||||||
|
++loop_index_;
|
||||||
}
|
}
|
||||||
|
|
||||||
pointer_[0] += modulos_[0] * channel_enables_[0] * direction_;
|
using Channel = BlitterSequencer::Channel;
|
||||||
pointer_[1] += modulos_[1] * channel_enables_[1] * direction_;
|
switch(next.first) {
|
||||||
pointer_[2] += modulos_[2] * channel_enables_[2] * direction_;
|
case Channel::A:
|
||||||
pointer_[3] += modulos_[3] * channel_enables_[3] * direction_;
|
a_data_ = ram_[pointer_[0] & ram_mask_];
|
||||||
|
pointer_[0] += direction_;
|
||||||
|
continue;
|
||||||
|
case Channel::B:
|
||||||
|
b_data_ = ram_[pointer_[1] & ram_mask_];
|
||||||
|
pointer_[1] += direction_;
|
||||||
|
continue;
|
||||||
|
case Channel::C:
|
||||||
|
c_data_ = ram_[pointer_[2] & ram_mask_];
|
||||||
|
pointer_[2] += direction_;
|
||||||
|
continue;
|
||||||
|
case Channel::None:
|
||||||
|
continue;
|
||||||
|
case Channel::Write: break;
|
||||||
|
}
|
||||||
|
|
||||||
|
|
||||||
|
|
||||||
|
a32_ = (a32_ << 16) | (a_data_ & transient_a_mask_);
|
||||||
|
b32_ = (b32_ << 16) | b_data_;
|
||||||
|
|
||||||
|
uint16_t a, b;
|
||||||
|
|
||||||
|
// The barrel shifter shifts to the right in ascending address mode,
|
||||||
|
// but to the left otherwise.
|
||||||
|
if(!one_dot_) {
|
||||||
|
a = uint16_t(a32_ >> shifts_[0]);
|
||||||
|
b = uint16_t(b32_ >> shifts_[1]);
|
||||||
|
} else {
|
||||||
|
// TODO: there must be a neater solution than this.
|
||||||
|
a = uint16_t(
|
||||||
|
(a32_ << shifts_[0]) |
|
||||||
|
(a32_ >> (32 - shifts_[0]))
|
||||||
|
);
|
||||||
|
|
||||||
|
b = uint16_t(
|
||||||
|
(b32_ << shifts_[1]) |
|
||||||
|
(b32_ >> (32 - shifts_[1]))
|
||||||
|
);
|
||||||
|
}
|
||||||
|
|
||||||
|
uint16_t output =
|
||||||
|
apply_minterm<uint16_t>(
|
||||||
|
a,
|
||||||
|
b,
|
||||||
|
c_data_,
|
||||||
|
minterms_);
|
||||||
|
|
||||||
|
if(exclusive_fill_ || inclusive_fill_) {
|
||||||
|
// Use the fill tables nibble-by-nibble to figure out the filled word.
|
||||||
|
uint16_t fill_output = 0;
|
||||||
|
int ongoing_carry = fill_carry_;
|
||||||
|
const int type_mask = exclusive_fill_ ? (1 << 5) : 0;
|
||||||
|
for(int c = 0; c < 16; c += 4) {
|
||||||
|
const int total_index = (output & 0xf) | (ongoing_carry << 4) | type_mask;
|
||||||
|
fill_output |= ((fill_values[total_index >> 3] >> ((total_index & 7) * 4)) & 0xf) << c;
|
||||||
|
ongoing_carry = (fill_carries[total_index >> 5] >> (total_index & 31)) & 1;
|
||||||
|
output >>= 4;
|
||||||
|
}
|
||||||
|
|
||||||
|
output = fill_output;
|
||||||
|
fill_carry_ = ongoing_carry;
|
||||||
|
}
|
||||||
|
|
||||||
|
not_zero_flag_ |= output;
|
||||||
|
|
||||||
|
switch(write_phase_) {
|
||||||
|
case WritePhase::Full:
|
||||||
|
ram_[write_address_ & ram_mask_] = output;
|
||||||
|
[[fallthrough]];
|
||||||
|
|
||||||
|
case WritePhase::Starting:
|
||||||
|
write_phase_ = WritePhase::Full;
|
||||||
|
write_address_ = pointer_[3];
|
||||||
|
write_value_ = output;
|
||||||
|
continue;
|
||||||
|
|
||||||
|
default: break;
|
||||||
|
}
|
||||||
}
|
}
|
||||||
}
|
}
|
||||||
|
|
||||||
|
@ -27,8 +27,9 @@ class BlitterSequencer {
|
|||||||
public:
|
public:
|
||||||
enum class Channel {
|
enum class Channel {
|
||||||
/// Tells the caller to calculate and load a new piece of output
|
/// Tells the caller to calculate and load a new piece of output
|
||||||
/// into the output pipeline if any new inputs have been provided
|
/// into the output pipeline,
|
||||||
/// if any inputs are enabled then a two-stage output pipeline applies:
|
///
|
||||||
|
/// If any inputs are enabled then a two-stage output pipeline applies:
|
||||||
/// if anything is already in the pipeline then it should now be written.
|
/// if anything is already in the pipeline then it should now be written.
|
||||||
/// Then the new value should be placed into the pipeline ready for the
|
/// Then the new value should be placed into the pipeline ready for the
|
||||||
/// next write slot.
|
/// next write slot.
|
||||||
@ -205,6 +206,16 @@ class Blitter: public DMADevice<4, 4> {
|
|||||||
uint16_t a_data_ = 0, b_data_ = 0, c_data_ = 0;
|
uint16_t a_data_ = 0, b_data_ = 0, c_data_ = 0;
|
||||||
|
|
||||||
bool not_zero_flag_ = false;
|
bool not_zero_flag_ = false;
|
||||||
|
|
||||||
|
BlitterSequencer sequencer_;
|
||||||
|
uint32_t write_address_ = 0xffff'ffff;
|
||||||
|
uint16_t write_value_ = 0;
|
||||||
|
enum WritePhase {
|
||||||
|
Starting, Full, Stopped
|
||||||
|
} write_phase_;
|
||||||
|
int y_, x_;
|
||||||
|
uint16_t transient_a_mask_;
|
||||||
|
bool stopping_;
|
||||||
};
|
};
|
||||||
|
|
||||||
}
|
}
|
||||||
|
Loading…
x
Reference in New Issue
Block a user