Begin a full-synchronous usage of the sequencer, at least exposing poor handling of the pipeline.

2025-02-21 20:29:06 +00:00 · 2022-07-29 16:15:18 -04:00 · 2022-07-29 16:15:18 -04:00 · 03d4960a03
commit 03d4960a03
parent 1ac0a4e924
2 changed files with 122 additions and 75 deletions
--- a/Machines/Amiga/Blitter.cpp
+++ b/Machines/Amiga/Blitter.cpp
@ -130,6 +130,7 @@ void Blitter::set_control(int index, uint16_t value) {
 		channel_enables_[2] = value & 0x200;
 		channel_enables_[1] = value & 0x400;
 		channel_enables_[0] = value & 0x800;
 		sequencer_.set_control(value >> 8);
 	}
 	shifts_[index] = value >> 12;
 	LOG("Set control " << index << " to " << PADHEX(4) << value);
@ -335,89 +336,124 @@ bool Blitter::advance_dma() {
 		// Copy mode.
 		// Quick hack: do the entire action atomically.
 		sequencer_.begin();
 		a32_ = 0;
 		b32_ = 0;
-		for(int y = 0; y < height_; y++) {
+		y_ = 0;
-			bool fill_carry = fill_carry_;
+		x_ = 0;
 		int loop_index_ = -1;
 		write_phase_ = WritePhase::Starting;
 		stopping_ = false;
-			for(int x = 0; x < width_; x++) {
+		while(true) {
-				uint16_t a_mask = 0xffff;
+			const auto next = sequencer_.next();
 				if(x == 0) a_mask &= a_mask_[0];
 				if(x == width_ - 1) a_mask &= a_mask_[1];
-				if(channel_enables_[0]) {
+			// If this is the start of a new iteration, check for end of line,
-					a_data_ = ram_[pointer_[0] & ram_mask_];
+			// or of blit, and pick an appropriate mask for A based on location.
-					pointer_[0] += direction_;
+			if(next.second != loop_index_) {
-				}
+				transient_a_mask_ = 0xffff;
-				a32_ = (a32_ << 16) | (a_data_ & a_mask);
+				if(x_ == 0) transient_a_mask_ &= a_mask_[0];
 				if(x_ == width_ - 1) transient_a_mask_ &= a_mask_[1];
-				if(channel_enables_[1]) {
+				++x_;
-					b_data_ = ram_[pointer_[1] & ram_mask_];
+				if(x_ == width_) {
-					pointer_[1] += direction_;
+					x_ = 0;
-				}
+					++y_;
-				b32_ = (b32_ << 16) | b_data_;
+					if(y_ == height_) {
-
+						sequencer_.complete();
-				if(channel_enables_[2]) {
+						stopping_ = true;
 					c_data_ = ram_[pointer_[2] & ram_mask_];
 					pointer_[2] += direction_;
 				}
 				uint16_t a, b;
 				// The barrel shifter shifts to the right in ascending address mode,
 				// but to the left otherwise
 				if(!one_dot_) {
 					a = uint16_t(a32_ >> shifts_[0]);
 					b = uint16_t(b32_ >> shifts_[1]);
 				} else {
 					// TODO: there must be a neater solution than this.
 					a = uint16_t(
 						(a32_ << shifts_[0]) |
 						(a32_ >> (32 - shifts_[0]))
 					);
 					b = uint16_t(
 						(b32_ << shifts_[1]) |
 						(b32_ >> (32 - shifts_[1]))
 					);
 				}
 				uint16_t output =
 					apply_minterm<uint16_t>(
 						a,
 						b,
 						c_data_,
 						minterms_);
 				if(exclusive_fill_ || inclusive_fill_) {
 					// Use the fill tables nibble-by-nibble to figure out the filled word.
 					uint16_t fill_output = 0;
 					int ongoing_carry = fill_carry;
 					const int type_mask = exclusive_fill_ ? (1 << 5) : 0;
 					for(int c = 0; c < 16; c += 4) {
 						const int total_index = (output & 0xf) | (ongoing_carry << 4) | type_mask;
 						fill_output |= ((fill_values[total_index >> 3] >> ((total_index & 7) * 4)) & 0xf) << c;
 						ongoing_carry = (fill_carries[total_index >> 5] >> (total_index & 31)) & 1;
 						output >>= 4;
 					}
-
+					pointer_[0] += modulos_[0] * channel_enables_[0] * direction_;
-					output = fill_output;
+					pointer_[1] += modulos_[1] * channel_enables_[1] * direction_;
-					fill_carry = ongoing_carry;
+					pointer_[2] += modulos_[2] * channel_enables_[2] * direction_;
-				}
+					pointer_[3] += modulos_[3] * channel_enables_[3] * direction_;
 				not_zero_flag_ |= output;
 				if(channel_enables_[3]) {
 					ram_[pointer_[3] & ram_mask_] = output;
 					pointer_[3] += direction_;
 				}
 				++loop_index_;
 			}
-			pointer_[0] += modulos_[0] * channel_enables_[0] * direction_;
+			using Channel = BlitterSequencer::Channel;
-			pointer_[1] += modulos_[1] * channel_enables_[1] * direction_;
+			switch(next.first) {
-			pointer_[2] += modulos_[2] * channel_enables_[2] * direction_;
+				case Channel::A:
-			pointer_[3] += modulos_[3] * channel_enables_[3] * direction_;
+					a_data_ = ram_[pointer_[0] & ram_mask_];
 					pointer_[0] += direction_;
 				continue;
 				case Channel::B:
 					b_data_ = ram_[pointer_[1] & ram_mask_];
 					pointer_[1] += direction_;
 				continue;
 				case Channel::C:
 					c_data_ = ram_[pointer_[2] & ram_mask_];
 					pointer_[2] += direction_;
 				continue;
 				case Channel::None:
 				continue;
 				case Channel::Write: break;
 			}
 			a32_ = (a32_ << 16) | (a_data_ & transient_a_mask_);
 			b32_ = (b32_ << 16) | b_data_;
 			uint16_t a, b;
 			// The barrel shifter shifts to the right in ascending address mode,
 			// but to the left otherwise.
 			if(!one_dot_) {
 				a = uint16_t(a32_ >> shifts_[0]);
 				b = uint16_t(b32_ >> shifts_[1]);
 			} else {
 				// TODO: there must be a neater solution than this.
 				a = uint16_t(
 					(a32_ << shifts_[0]) |
 					(a32_ >> (32 - shifts_[0]))
 				);
 				b = uint16_t(
 					(b32_ << shifts_[1]) |
 					(b32_ >> (32 - shifts_[1]))
 				);
 			}
 			uint16_t output =
 				apply_minterm<uint16_t>(
 					a,
 					b,
 					c_data_,
 					minterms_);
 			if(exclusive_fill_ || inclusive_fill_) {
 				// Use the fill tables nibble-by-nibble to figure out the filled word.
 				uint16_t fill_output = 0;
 				int ongoing_carry = fill_carry_;
 				const int type_mask = exclusive_fill_ ? (1 << 5) : 0;
 				for(int c = 0; c < 16; c += 4) {
 					const int total_index = (output & 0xf) | (ongoing_carry << 4) | type_mask;
 					fill_output |= ((fill_values[total_index >> 3] >> ((total_index & 7) * 4)) & 0xf) << c;
 					ongoing_carry = (fill_carries[total_index >> 5] >> (total_index & 31)) & 1;
 					output >>= 4;
 				}
 				output = fill_output;
 				fill_carry_ = ongoing_carry;
 			}
 			not_zero_flag_ |= output;
 			switch(write_phase_) {
 				case WritePhase::Full:
 					ram_[write_address_ & ram_mask_] = output;
 					[[fallthrough]];
 				case WritePhase::Starting:
 					write_phase_ = WritePhase::Full;
 					write_address_ = pointer_[3];
 					write_value_ = output;
 				continue;
 				default: break;
 			}
 		}
 	}
--- a/Machines/Amiga/Blitter.hpp
+++ b/Machines/Amiga/Blitter.hpp
@ -27,8 +27,9 @@ class BlitterSequencer {
 	public:
 		enum class Channel {
 			/// Tells the caller to calculate and load a new piece of output
-			/// into the output pipeline if any new inputs have been provided
+			/// into the output pipeline,
-			/// if any inputs are enabled then a two-stage output pipeline applies:
+			///
 			/// If any inputs are enabled then a two-stage output pipeline applies:
 			/// if anything is already in the pipeline then it should now be written.
 			/// Then the new value should be placed into the pipeline ready for the
 			/// next write slot.
@ -205,6 +206,16 @@ class Blitter: public DMADevice<4, 4> {
 		uint16_t a_data_ = 0, b_data_ = 0, c_data_ = 0;
 		bool not_zero_flag_ = false;
 		BlitterSequencer sequencer_;
 		uint32_t write_address_ = 0xffff'ffff;
 		uint16_t write_value_ = 0;
 		enum WritePhase {
 			Starting, Full, Stopped
 		} write_phase_;
 		int y_, x_;
 		uint16_t transient_a_mask_;
 		bool stopping_;
 };
 }