iigs-game-engine/src/blitter/Horz.s

714 lines
26 KiB
ArmAsm

; Subroutines that deal with the horizontal scrolling. The primary function of
; these routines are to adjust tables and patch in new values into the code field
; when the virtual X-position of the play field changes.
; Simple function that restores the saved opcode that are stashed in _applyBG0Xpos. It is
; very important that opcodes are restored before new ones are inserted, because there is
; only one, fixed storage location and old values will be overwritten if operations are not
; performed in order.
;
; Experimental -- this is a parameterized version that does not rely on direct page
; state variables for input and attempts to be more optimized.
;
; A = starting virtual line in the code field (0 - 207)
; X = number of lines to render (0 - 200)
_RestoreBG0Opcodes
:virt_line_x2 equ tmp1
:lines_left_x2 equ tmp2
:draw_count_x2 equ tmp3
:exit_offset equ tmp4
:stk_save equ tmp5
phb ; Save data bank
asl
sta :virt_line_x2 ; Keep track of it
txa
asl
sta :lines_left_x2
lda LastPatchOffset ; If zero, there are no saved opcodes
sta :exit_offset
tsc
sta :stk_save
:loop
ldx :virt_line_x2
ldal BTableLow,x ; Get the address of the first code field line
tay
ldal BTableHigh,x ; This intentionally leaks one byte on the stack
pha
plb ; This is the bank that will receive the updates
txa ; lda :virt_line_x2
and #$001E
eor #$FFFF
sec
adc #32
min :lines_left_x2
sta :draw_count_x2 ; Do half of this many lines
; y is already set to :base_address
tax ; :draw_count * 2
clc
adc :virt_line_x2
sta :virt_line_x2
tya
adc :exit_offset ; Add some offsets to get the base address in the code field line
RestoreOpcode
lda :lines_left_x2 ; subtract the number of lines we just completed
sec
sbc :draw_count_x2
sta :lines_left_x2
jne :loop
stz LastPatchOffset ; Clear the value once completed
lda :stk_save
tcs
plb
rts
; Based on the current value of StartX in the direct page, patch up the code fields
; to render the correct data. Note that we do *not* do the OpcodeRestore in this
; routine. The reason is that the restore *must* be applied using the (StartX, StartY)
; values from the previous frame, which requires logic that is not relevant to setting
; up the code field.
;
; This function is where the reverse-mapping aspect of the code field is compensated
; for. In the initialize case where X = 0, the exit point is at the *end* of
; the code buffer line
;
; +----+----+ ... +----+----+----+
; | 82 | 80 | | 04 | 02 | 00 |
; +----+----+ ... +----+----+----+
; ^ x=0
;
; As the screen scrolls right-to-left, the exit position moves to earlier memory
; locations until wrapping around from 163 to 0.
;
; The net calculation are
;
; x_exit = (164 - x) % 164
; x_enter = (164 - x - width) % 164
;
; Small routine to put the data in a consistent state. Called before any routines need to draw on
; the code buffer, but before we patch out the instructions.
_ApplyBG0XPosPre
lda StartX ; This is the starting byte offset (0 - 163)
jsr Mod164
sta StartXMod164
rts
_ApplyBG0XPos
:stk_save equ tmp0
:virt_line_x2 equ tmp1
:lines_left_x2 equ tmp2
:draw_count_x2 equ tmp3
:exit_offset equ tmp4
:entry_offset equ tmp5
:exit_bra equ tmp6
:exit_address equ tmp7
:base_address equ tmp8
:opcode equ tmp9
:odd_entry_offset equ tmp10
; If there are saved opcodes that have not been restored, do not run this routine
lda LastPatchOffset
beq :ok
rts
; This code is fairly succinct. See the corresponding code in Vert.s for more detailed comments.
:ok
lda StartYMod208 ; This is the base line of the virtual screen
asl
sta :virt_line_x2 ; Keep track of it
lda ScreenHeight
asl
sta :lines_left_x2
; Calculate the exit and entry offsets into the code fields. This is a bit tricky, because odd-aligned
; rendering causes the left and right edges to move in a staggered fashion.
;
; ... +----+----+----+----+----+- ... -+----+----+----+----+----+
; | 04 | 06 | 08 | 0A | 0C | | 44 | 46 | 48 | 4A |
; ... +----+----+----+----+----+- ... -+----+----+----+----+----+
; | |
; +---- screen width --------------+
; entry | | exit
;
; Here is an example of a screen 64 bytes wide. When everything is aligned to an even offset
; then the entry point is column $08 and the exit point is column $48
;
; If we move the screen forward one byte (which means the pointers move backwards) then the low-byte
; of column $06 will be on the right edge of the screen and the high-byte of column $46 will left-edge
; of the screen. Since the one-byte edges are handled specially, the exit point shifts one column, but
; the entry point does not.
;
; ... +----+----+----+----+----+- ... -+----+----+----+----+----+
; | 04 | 06 | 08 | 0A | 0C | | 44 | 46 | 48 | 4A |
; ... +----+----+----+----+----+- ... -+----+----+----+----+----+
; | | | |
; +--|------ screen width -------|--+
; entry | | exit
;
; When the screen is moved one more byte forward, then the entry point will move to the
; next column.
;
; ... +----+----+----+----+----+- ... -+----+----+----+----+----+
; | 04 | 06 | 08 | 0A | 0C | | 44 | 46 | 48 | 4A |
; ... +----+----+----+----+----+- ... -+----+----+----+----+----+
; | |
; +------ screen width ------------+
; entry | | exit
;
; So, in short, the entry tile position is rounded up from the x-position and the exit
; tile position is rounded down.
;
; Now, the left edge of the screen is pushed last, so we need to exit one instruction *after*
; the location (163 - StartX % 164)
;
; x = 0
;
; | PEA $0000 |
; +-----------+
; | PEA $0000 |
; +-----------+
; | JMP loop | <-- Exit here
; +-----------+
;
; x = 1 and 2
;
; | PEA $0000 |
; +-----------+
; | PEA $0000 | <-- Exit Here
; +-----------+
; | JMP loop |
; +-----------+
lda StartXMod164
; Right now we have the offset of the left-edge visible byte. Move one byte earlier to figure out
; where the exit will be patched in
dec ; (a - 1) % 164
bpl :hop1
lda #163
:hop1
; If the exit byte is odd, then the left edge is even-aligned and we round down and exit at at
; that word.
;
; If the exit byte is even, then the left edge is odd-aligned and we exit at this word.
bit #$0001
beq :odd_exit
; This is the even code path
and #$FFFE
tax
lda CodeFieldEvenBRA,x
sta :exit_bra
lda Col2CodeOffset,x
sta :exit_offset
sta LastPatchOffset ; Cache as a flag for later
bra :do_entry
; This is the odd code path
:odd_exit tax
lda CodeFieldOddBRA,x
sta :exit_bra
lda Col2CodeOffset,x
sta :exit_offset
sta LastPatchOffset ; Cache as a flag for later
; Calculate the entry point into the code field by calculating the right edge
:do_entry lda StartXMod164
clc
adc ScreenWidth ; move to the right edge and back up a byte
dec ; to get the index of the first on-screen byte
cmp #164 ; Keep the value in range
bcc :hop2
sbc #164
:hop2
; Same logic as above. If the right edge is odd, then the full word needs to be drawn and we
; will enter at that index, rounded down.
;
; If the right edge is even, then only the low byte needs to be drawn, which is handled before
; entering the code field. So enter one word before the right edge.
bit #$0001
beq :odd_entry
and #$FFFE
tax
lda Col2CodeOffset,x
sta :entry_offset
lda #$004C ; set the entry_jmp opcode to JMP
sta :opcode
stz :odd_entry_offset ; mark as an even case
bra :prep_complete
:odd_entry
tax
lda Col2CodeOffset,x
sta :entry_offset ; Will be used to load the data
lda Col2CodeOffset-2,x
sta :odd_entry_offset ; will the the actual location to jump to
lda #$00AF ; set the entry_jmp opcode to LDAL
sta :opcode
:prep_complete
; Main loop that
;
; 1. Saves the opcodes in the code field
; 2. Writes the BRA instruction to exit the code field
; 3. Writes the JMP entry point to enter the code field
phb ; Save the existing bank
tsc
sta :stk_save
:loop
ldx :virt_line_x2
ldal BTableLow,x ; Get the address of the first code field line
tay ; Save it to use as the base address
clc
adc :exit_offset ; Add some offsets to get the base address in the code field line
sta :exit_address
sty :base_address
ldal BTableHigh,x
pha
plb
txa
and #$001E
eor #$FFFF
sec
adc #32
min :lines_left_x2
sta :draw_count_x2
; First step is to set the BRA instruction to exit the code field at the proper location. There
; are two sub-steps to do here; we need to save the 16-bit value that exists at the location and
; then overwrite it with the branch instruction.
;
; Special note, the SaveOpcode function stores the opcode *within* the code field as it is
; used in odd-aligned cases to determine how to draw the 8-bit value on the left edge of the
; screen
; y is already set to :base_address
tax ; :draw_count_x2
clc ; advance to the virtual line after the segment we just
adc :virt_line_x2 ; filled in
sta :virt_line_x2
lda :exit_address ; Save from this location (not needed in fast mode)
SaveOpcode ; X = :exit_address on return
txy ; ldy :exit_address -- starting at this address
ldx :draw_count_x2 ; Do this many lines
lda :exit_bra ; Copy this value into all of the lines
SetConst ; All registers are preserved
; Next, patch in the CODE_ENTRY value, which is the low byte of a JMP instruction. This is an
; 8-bit operation and, since the PEA code is bank aligned, we use the entry_offset value directly
sep #$20
lda :entry_offset
ldy :base_address
SetCodeEntry ; All registers are preserved
; Now, patch in the opcode
lda :opcode
SetCodeEntryOpcode ; All registers are preserved
; If this is an odd entry, also set the odd_entry low byte and save the operand high byte
lda :odd_entry_offset
jeq :not_odd
SetOddCodeEntry ; All registers are preserved
SaveHighOperand :exit_address ; Only used once, so "inline" it
:not_odd
rep #$21 ; clear the carry
; Do the end of the loop -- update the virtual line counter and reduce the number
; of lines left to render
lda :lines_left_x2 ; subtract the number of lines we just completed
sec
sbc :draw_count_x2
sta :lines_left_x2
jne :loop
lda :stk_save
tcs
plb
rts
; SaveHighOperand
;
; Save the high byte of the 3-byte code field instruction into the odd handler at the end
; of each line. This is only needed
;
; X = number of lines * 2, 0 to 32
; Y = starting line * $1000
; A = code field location * $1000
SaveHighOperand mac
jmp (dispTbl,x)
dispTbl da bottom
da do01,do02,do03,do04
da do05,do06,do07,do08
da do09,do10,do11,do12
da do13,do14,do15,do16
do15 ldx ]1 ; accumulator is in 8-bit mode, so can't use TAX
bra x15
do14 ldx ]1
bra x14
do13 ldx ]1
bra x13
do12 ldx ]1
bra x12
do11 ldx ]1
bra x11
do10 ldx ]1
bra x10
do09 ldx ]1
bra x09
do08 ldx ]1
bra x08
do07 ldx ]1
bra x07
do06 ldx ]1
bra x06
do05 ldx ]1
bra x05
do04 ldx ]1
bra x04
do03 ldx ]1
bra x03
do02 ldx ]1
bra x02
do01 ldx ]1
bra x01
do16 ldx ]1
x16 lda $F002,x
sta OPCODE_HIGH_SAVE+$F000,y
x15 lda $E002,x
sta OPCODE_HIGH_SAVE+$E000,y
x14 lda $D002,x
sta OPCODE_HIGH_SAVE+$D000,y
x13 lda $C002,x
sta OPCODE_HIGH_SAVE+$C000,y
x12 lda $B002,x
sta OPCODE_HIGH_SAVE+$B000,y
x11 lda $A002,x
sta OPCODE_HIGH_SAVE+$A000,y
x10 lda $9002,x
sta OPCODE_HIGH_SAVE+$9000,y
x09 lda $8002,x
sta OPCODE_HIGH_SAVE+$8000,y
x08 lda $7002,x
sta OPCODE_HIGH_SAVE+$7000,y
x07 lda $6002,x
sta OPCODE_HIGH_SAVE+$6000,y
x06 lda $5002,x
sta OPCODE_HIGH_SAVE+$5000,y
x05 lda $4002,x
sta OPCODE_HIGH_SAVE+$4000,y
x04 lda $3002,x
sta OPCODE_HIGH_SAVE+$3000,y
x03 lda $2002,x
sta OPCODE_HIGH_SAVE+$2000,y
x02 lda $1002,x
sta OPCODE_HIGH_SAVE+$1000,y
x01 lda: $0002,x
sta: OPCODE_HIGH_SAVE+$0000,y
bottom <<<
; SaveOpcode
;
; Save the values to the restore location. This should only be used to patch the
; code field since the save location is fixed.
;
; X = number of lines * 2, 0 to 32
; Y = starting line * $1000
; A = code field location * $1000
SaveOpcode mac
jmp (dispTbl,x)
dispTbl da bottom
da do01,do02,do03,do04
da do05,do06,do07,do08
da do09,do10,do11,do12
da do13,do14,do15,do16
do15 tax
bra x15
do14 tax
bra x14
do13 tax
bra x13
do12 tax
bra x12
do11 tax
bra x11
do10 tax
bra x10
do09 tax
bra x09
do08 tax
bra x08
do07 tax
bra x07
do06 tax
bra x06
do05 tax
bra x05
do04 tax
bra x04
do03 tax
bra x03
do02 tax
bra x02
do01 tax
bra x01
do16 tax
x16 lda $F000,x
sta OPCODE_SAVE+$F000,y
x15 lda $E000,x
sta OPCODE_SAVE+$E000,y
x14 lda $D000,x
sta OPCODE_SAVE+$D000,y
x13 lda $C000,x
sta OPCODE_SAVE+$C000,y
x12 lda $B000,x
sta OPCODE_SAVE+$B000,y
x11 lda $A000,x
sta OPCODE_SAVE+$A000,y
x10 lda $9000,x
sta OPCODE_SAVE+$9000,y
x09 lda $8000,x
sta OPCODE_SAVE+$8000,y
x08 lda $7000,x
sta OPCODE_SAVE+$7000,y
x07 lda $6000,x
sta OPCODE_SAVE+$6000,y
x06 lda $5000,x
sta OPCODE_SAVE+$5000,y
x05 lda $4000,x
sta OPCODE_SAVE+$4000,y
x04 lda $3000,x
sta OPCODE_SAVE+$3000,y
x03 lda $2000,x
sta OPCODE_SAVE+$2000,y
x02 lda $1000,x
sta OPCODE_SAVE+$1000,y
x01 lda: $0000,x
sta: OPCODE_SAVE+$0000,y
bottom
<<<
; RestoreOpcode
;
; Restore the values back to the code field.
;
; X = number of lines * 2, 0 to 32
; Y = starting line * $1000
; A = code field location * $1000
RestoreOpcode mac
jmp (dispTbl,x)
dispTbl da bottom
da do01,do02,do03,do04
da do05,do06,do07,do08
da do09,do10,do11,do12
da do13,do14,do15,do16
do15 tax
bra x15
do14 tax
bra x14
do13 tax
bra x13
do12 tax
bra x12
do11 tax
bra x11
do10 tax
bra x10
do09 tax
bra x09
do08 tax
bra x08
do07 tax
bra x07
do06 tax
bra x06
do05 tax
bra x05
do04 tax
bra x04
do03 tax
bra x03
do02 tax
bra x02
do01 tax
bra x01
do16 tax
x16 lda OPCODE_SAVE+$F000,y
sta $F000,x
x15 lda OPCODE_SAVE+$E000,y
sta $E000,x
x14 lda OPCODE_SAVE+$D000,y
sta $D000,x
x13 lda OPCODE_SAVE+$C000,y
sta $C000,x
x12 lda OPCODE_SAVE+$B000,y
sta $B000,x
x11 lda OPCODE_SAVE+$A000,y
sta $A000,x
x10 lda OPCODE_SAVE+$9000,y
sta $9000,x
x09 lda OPCODE_SAVE+$8000,y
sta $8000,x
x08 lda OPCODE_SAVE+$7000,y
sta $7000,x
x07 lda OPCODE_SAVE+$6000,y
sta $6000,x
x06 lda OPCODE_SAVE+$5000,y
sta $5000,x
x05 lda OPCODE_SAVE+$4000,y
sta $4000,x
x04 lda OPCODE_SAVE+$3000,y
sta $3000,x
x03 lda OPCODE_SAVE+$2000,y
sta $2000,x
x02 lda OPCODE_SAVE+$1000,y
sta $1000,x
x01 lda: OPCODE_SAVE+$0000,y
sta: $0000,x
bottom
<<<
; SetCodeEntry
;
; Patch in the low byte at the CODE_ENTRY. Must be called with 8-bit accumulator
;
; X = number of lines * 2, 0 to 32
; Y = starting line * $1000
; A = address low byte
SetCodeEntry mac
jmp (dispTbl,x)
dispTbl da bottom-00,bottom-03,bottom-06,bottom-09
da bottom-12,bottom-15,bottom-18,bottom-21
da bottom-24,bottom-27,bottom-30,bottom-33
da bottom-36,bottom-39,bottom-42,bottom-45
da bottom-48
sta CODE_ENTRY+$F000,y
sta CODE_ENTRY+$E000,y
sta CODE_ENTRY+$D000,y
sta CODE_ENTRY+$C000,y
sta CODE_ENTRY+$B000,y
sta CODE_ENTRY+$A000,y
sta CODE_ENTRY+$9000,y
sta CODE_ENTRY+$8000,y
sta CODE_ENTRY+$7000,y
sta CODE_ENTRY+$6000,y
sta CODE_ENTRY+$5000,y
sta CODE_ENTRY+$4000,y
sta CODE_ENTRY+$3000,y
sta CODE_ENTRY+$2000,y
sta CODE_ENTRY+$1000,y
sta: CODE_ENTRY+$0000,y
bottom
<<<
; SetOddCodeEntry
;
; Patch in the low byte at the ODD_ENTRY. Must be called with 8-bit accumulator
;
; X = number of lines * 2, 0 to 32
; Y = starting line * $1000
; A = address low byte
SetOddCodeEntry mac
jmp (dispTbl,x)
dispTbl da bottom-00,bottom-03,bottom-06,bottom-09
da bottom-12,bottom-15,bottom-18,bottom-21
da bottom-24,bottom-27,bottom-30,bottom-33
da bottom-36,bottom-39,bottom-42,bottom-45
da bottom-48
sta ODD_ENTRY+$F000,y
sta ODD_ENTRY+$E000,y
sta ODD_ENTRY+$D000,y
sta ODD_ENTRY+$C000,y
sta ODD_ENTRY+$B000,y
sta ODD_ENTRY+$A000,y
sta ODD_ENTRY+$9000,y
sta ODD_ENTRY+$8000,y
sta ODD_ENTRY+$7000,y
sta ODD_ENTRY+$6000,y
sta ODD_ENTRY+$5000,y
sta ODD_ENTRY+$4000,y
sta ODD_ENTRY+$3000,y
sta ODD_ENTRY+$2000,y
sta ODD_ENTRY+$1000,y
sta: ODD_ENTRY+$0000,y
bottom
<<<
; SetCodeEntryOpcode
;
; Patch in the opcode at the CODE_ENTRY_OPCODE. Must be called with 8-bit accumulator
;
; X = number of lines * 2, 0 to 32
; Y = starting line * $1000
; A = opcode value
SetCodeEntryOpcode mac
jmp (dispTbl,x)
dispTbl da bottom-00,bottom-03,bottom-06,bottom-09
da bottom-12,bottom-15,bottom-18,bottom-21
da bottom-24,bottom-27,bottom-30,bottom-33
da bottom-36,bottom-39,bottom-42,bottom-45
da bottom-48
sta CODE_ENTRY_OPCODE+$F000,y
sta CODE_ENTRY_OPCODE+$E000,y
sta CODE_ENTRY_OPCODE+$D000,y
sta CODE_ENTRY_OPCODE+$C000,y
sta CODE_ENTRY_OPCODE+$B000,y
sta CODE_ENTRY_OPCODE+$A000,y
sta CODE_ENTRY_OPCODE+$9000,y
sta CODE_ENTRY_OPCODE+$8000,y
sta CODE_ENTRY_OPCODE+$7000,y
sta CODE_ENTRY_OPCODE+$6000,y
sta CODE_ENTRY_OPCODE+$5000,y
sta CODE_ENTRY_OPCODE+$4000,y
sta CODE_ENTRY_OPCODE+$3000,y
sta CODE_ENTRY_OPCODE+$2000,y
sta CODE_ENTRY_OPCODE+$1000,y
sta: CODE_ENTRY_OPCODE+$0000,y
bottom
<<<