Merge pull request #50 from dougmasten/dev

Optimization to 6809 depacker and added new H6309 version
This commit is contained in:
Emmanuel Marty 2020-10-18 13:54:25 +02:00 committed by GitHub
commit 27b04e8bd4
No known key found for this signature in database
GPG Key ID: 4AEE18F83AFDEB23
6 changed files with 246 additions and 35 deletions

90
asm/6809/unlzsa1-6309.s Normal file
View File

@ -0,0 +1,90 @@
; unlzsa1-6309.s - Hitachi 6309 decompression routine for raw LZSA1 - 92 bytes
; compress with lzsa -f1 -r <original_file> <compressed_file>
;
; in: x = start of compressed data
; y = start of decompression buffer
; out: y = end of decompression buffer + 1
;
; Copyright (C) 2020 Emmanuel Marty, Doug Masten
;
; This software is provided 'as-is', without any express or implied
; warranty. In no event will the authors be held liable for any damages
; arising from the use of this software.
;
; Permission is granted to anyone to use this software for any purpose,
; including commercial applications, and to alter it and redistribute it
; freely, subject to the following restrictions:
;
; 1. The origin of this software must not be misrepresented; you must not
; claim that you wrote the original software. If you use this software
; in a product, an acknowledgment in the product documentation would be
; appreciated but is not required.
; 2. Altered source versions must be plainly marked as such, and must not be
; misrepresented as being the original software.
; 3. This notice may not be removed or altered from any source distribution.
; decompress_lzsa1 - decode a raw LZSA1 stream using 6309 TFM block copies.
;
; Register roles inside the routine:
;   x = read pointer into the compressed data (advanced by every ,x+ load)
;   y = write pointer into the decompression buffer (advanced by TFM)
;   u = source address of the current match (y + negative offset)
;   d = scratch: offset while addressing, then 16-bit byte count
;   w = byte count handed to TFM
;   s = one byte is pushed per token (the token itself) and popped again
;       when the match length is decoded, so the stack is balanced when
;       the routine returns.
;
; The code is laid out so that the match handling comes first and falls
; through into the token handling; execution actually starts at lz1token.
decompress_lzsa1 equ lz1token
lz1bigof lda ,x+ ; O set: load MSB of 16-bit (negative, signed) offset
lz1gotof leau d,y ; put backreference start address in U (dst+offset)
 ldd #$000f ; clear MSB match length and set mask for MMMM
 andb ,s+ ; isolate MMMM (embedded match length) in token, and pop the token
 addb #$03 ; add MIN_MATCH_SIZE
 cmpb #$12 ; MATCH_RUN_LEN?
 bne lz1gotln ; no, we have the full match length, go copy
 addb ,x+ ; add extra match length byte + MIN_MATCH_SIZE + MATCH_RUN_LEN
 bcc lz1gotln ; if no overflow, we have the full length
 bne lz1midln ; overflow with non-zero remainder: remainder is the high byte
; overflow with zero remainder ($12 + $EE): a 16-bit length follows
 ldb ,x+ ; load 16-bit len in D (low part in B, high in A)
 lda ,x+ ; (little endian)
 bne lz1gotln ; check if we hit EOD (16-bit length = 0)
 tstb ; high byte was zero, now test the low byte
 bne lz1gotln ; go copy matched bytes if not
 rts ; done, bail
lz1midln tfr b,a ; copy high part of len into A
 ldb ,x+ ; grab low 8 bits of len in B
lz1gotln tfr d,w ; set W with match length for TFM instruction
 tfm u+,y+ ; copy match bytes
; ---- entry point: decode the next token ----
lz1token ldb ,x+ ; load next token into B: O|LLL|MMMM
 pshs b ; save it (re-read at lz1nolt, popped at lz1gotof)
 andb #$70 ; isolate LLL (embedded literals count) in B
 beq lz1nolt ; skip if no literals
 cmpb #$70 ; LITERALS_RUN_LEN?
 bne lz1declt ; if not, we have the complete count, go unshift
 ldb ,x+ ; load extra literals count byte
 addb #$07 ; add LITERALS_RUN_LEN
 bcc lz1gotla ; if no overflow, we got the complete count, copy
 bne lz1midlt ; overflow with non-zero remainder: remainder is the high byte
; overflow with zero remainder ($07 + $F9): a 16-bit count follows
 ldb ,x+ ; load low 8 bits of little-endian literals count
 lda ,x+ ; load high 8 bits of literal count
 bra lz1gotlt ; we now have the complete count, go copy
lz1midlt tfr b,a ; copy high part of literals count into A
 ldb ,x+ ; load low 8 bits of literals count
 bra lz1gotlt ; we now have the complete count, go copy
lz1declt lsrb ; shift literals count into place (LLL sits in bits 4-6)
 lsrb
 lsrb
 lsrb
lz1gotla clra ; clear A (high part of literals count)
lz1gotlt tfr d,w ; set W with literals count for TFM instruction
 tfm x+,y+ ; copy literal bytes
lz1nolt ldb ,x+ ; load either 8-bit or LSB 16-bit offset (negative, signed)
 lda ,s ; get token again, don't pop it from the stack (sets N from the O bit)
 bmi lz1bigof ; test O bit (small or large offset)
 lda #$ff ; set high 8 bits, extending the 8-bit offset to a negative 16-bit value
 bra lz1gotof

View File

@ -28,10 +28,8 @@ decompress_lzsa1 equ lz1token
lz1bigof lda ,x+ ; O set: load MSB 16-bit (negative, signed) offest lz1bigof lda ,x+ ; O set: load MSB 16-bit (negative, signed) offest
lz1gotof leau d,y ; put backreference start address in U (dst+offset) lz1gotof leau d,y ; put backreference start address in U (dst+offset)
puls b ; restore token ldd #$000f ; clear MSB match length and set mask for MMMM
andb ,s+ ; isolate MMMM (embedded match length) in token
clra ; clear A (high part of match length)
andb #$0F ; isolate MMMM (embedded match length)
addb #$03 ; add MIN_MATCH_SIZE addb #$03 ; add MIN_MATCH_SIZE
cmpb #$12 ; MATCH_RUN_LEN? cmpb #$12 ; MATCH_RUN_LEN?
bne lz1gotln ; no, we have the full match length, go copy bne lz1gotln ; no, we have the full match length, go copy
@ -88,13 +86,13 @@ lz1declt lsrb ; shift literals count into place
lsrb lsrb
lz1gotla clra ; clear A (high part of literals count) lz1gotla clra ; clear A (high part of literals count)
lz1gotlt tfr x,u lz1gotlt leau ,x
tfr d,x ; transfer 16-bit count into X tfr d,x ; transfer 16-bit count into X
lz1cpylt lda ,u+ ; copy literal byte lz1cpylt lda ,u+ ; copy literal byte
sta ,y+ sta ,y+
leax -1,x ; decrement X and update Z flag leax -1,x ; decrement X and update Z flag
bne lz1cpylt ; loop until all literal bytes are copied bne lz1cpylt ; loop until all literal bytes are copied
tfr u,x leax ,u
lz1nolt ldb ,x+ ; load either 8-bit or LSB 16-bit offset (negative, signed) lz1nolt ldb ,x+ ; load either 8-bit or LSB 16-bit offset (negative, signed)
lda ,s ; get token again, don't pop it from the stack lda ,s ; get token again, don't pop it from the stack

View File

@ -34,10 +34,9 @@ lz1gotof nega ; reverse sign of offset in D
sbca #0 sbca #0
leau d,y ; put backreference start address in U (dst+offset) leau d,y ; put backreference start address in U (dst+offset)
puls b ; restore token ldd #$000f ; clear MSB match length and set mask for MMMM
andb ,s+ ; isolate MMMM (embedded match length) in token
clra ; clear A (high part of match length)
andb #$0F ; isolate MMMM (embedded match length)
addb #$03 ; add MIN_MATCH_SIZE addb #$03 ; add MIN_MATCH_SIZE
cmpb #$12 ; MATCH_RUN_LEN? cmpb #$12 ; MATCH_RUN_LEN?
bne lz1gotln ; no, we have the full match length, go copy bne lz1gotln ; no, we have the full match length, go copy
@ -90,13 +89,13 @@ lz1declt lsrb ; shift literals count into place
lsrb lsrb
lz1gotla clra ; clear A (high part of literals count) lz1gotla clra ; clear A (high part of literals count)
lz1gotlt tfr x,u lz1gotlt leau ,x
tfr d,x ; transfer 16-bit count into X tfr d,x ; transfer 16-bit count into X
lz1cpylt lda ,-u ; copy literal byte lz1cpylt lda ,-u ; copy literal byte
sta ,-y sta ,-y
leax -1,x ; decrement X and update Z flag leax -1,x ; decrement X and update Z flag
bne lz1cpylt ; loop until all literal bytes are copied bne lz1cpylt ; loop until all literal bytes are copied
tfr u,x leax ,u
lz1nolt ldb ,s ; get token again, don't pop it from the stack lz1nolt ldb ,s ; get token again, don't pop it from the stack
bmi lz1bigof ; test O bit (small or large offset) bmi lz1bigof ; test O bit (small or large offset)

129
asm/6809/unlzsa2-6309.s Normal file
View File

@ -0,0 +1,129 @@
; unlzsa2-6309.s - Hitachi 6309 decompression routine for raw LZSA2 - 150 bytes
; compress with lzsa -f2 -r <original_file> <compressed_file>
;
; in: x = start of compressed data
; y = start of decompression buffer
; out: y = end of decompression buffer + 1
;
; Copyright (C) 2020 Emmanuel Marty, Doug Masten
;
; This software is provided 'as-is', without any express or implied
; warranty. In no event will the authors be held liable for any damages
; arising from the use of this software.
;
; Permission is granted to anyone to use this software for any purpose,
; including commercial applications, and to alter it and redistribute it
; freely, subject to the following restrictions:
;
; 1. The origin of this software must not be misrepresented; you must not
; claim that you wrote the original software. If you use this software
; in a product, an acknowledgment in the product documentation would be
; appreciated but is not required.
; 2. Altered source versions must be plainly marked as such, and must not be
; misrepresented as being the original software.
; 3. This notice may not be removed or altered from any source distribution.
; decompress_lzsa2 - decode a raw LZSA2 stream using 6309 TFM block copies.
;
; Register roles inside the routine:
;   x = read pointer into the compressed data
;   y = write pointer into the decompression buffer (advanced by TFM)
;   u = address of the current token while literals/offset are decoded,
;       then source address of the match (y + negative offset)
;   d = scratch: offset while decoding, then 16-bit byte count
;   w = byte count handed to TFM
;
; The routine is self-modifying: it stores into lz2nibct, into the
; immediate operand of the ldb at lz2nibl, and into the 16-bit offset
; operand of the leau at lz2moff. It therefore has to run from writable
; memory. The last match offset stays in the leau operand, which is what
; makes the "repeat match" case work without reloading anything.
decompress_lzsa2
 clr lz2nibct ; reset nibble available flag
 bra lz2token ; skip over the inline flag byte and the offset decoders
lz2nibct fcb 0 ; nibble ready flag
; ---- token X bit set: 13-bit, 16-bit or repeat offset (B = token << 1) ----
lz2replg lslb ; push token's Y flag bit into carry
 bcs lz2rep16 ; if token's Y bit is set, rep or 16 bit offset
 sex ; push token's Z flag bit into reg A
 bsr lz2nibl ; get offset nibble in B
 lsla ; push token's Z flag bit into carry
 rolb ; shift Z flag from carry into bit 0 of B
 eorb #$e1 ; set bits 13-15 of offset, reverse bit 8
 tfr b,a ; copy bits 8-15 of offset into A
 suba #$02 ; subtract 512 from offset
 ldb ,x+ ; load low 8 bits of (negative, signed) offset
 bra lz2gotof
lz2rep16 bmi lz2repof ; if token's Z flag bit is set, rep match
 ldd ,x++ ; load high then low 8 bits of offset
lz2gotof std lz2moff+2 ; store match offset into the leau operand below
lz2repof ldd #$0007 ; clear MSB match length and set mask for MMM
 andb ,u ; isolate MMM (embedded match length) in token (U still points at it)
lz2moff leau $aaaa,y ; put backreference start address in U (dst+offset); $aaaa is patched
 addb #$02 ; add MIN_MATCH_SIZE_V2
 cmpb #$09 ; MIN_MATCH_SIZE_V2 + MATCH_RUN_LEN_V2?
 bne lz2gotln ; no, we have the full match length, go copy
 bsr lz2nibl ; get extra match length nibble in B
 addb #$09 ; add MIN_MATCH_SIZE_V2 + MATCH_RUN_LEN_V2
 cmpb #$18 ; MIN_MATCH_SIZE_V2 + MATCH_RUN_LEN_V2 + 15?
 bne lz2gotln ; if not, we have the full match length, go copy
 addb ,x+ ; add extra length byte + MIN_MATCH_SIZE_V2 + MATCH_RUN_LEN_V2 + 15
 bcc lz2gotln ; if no overflow, we have the full length
 beq lz2done ; detect EOD code (sum wrapped to exactly zero)
 ldb ,x+ ; load 16-bit len in D (low part in B, high in A)
 lda ,x+ ; (little endian)
lz2gotln tfr d,w ; set W with match count for TFM instruction
 tfm u+,y+ ; copy match bytes
; ---- decode the next token ----
lz2token tfr x,u ; save token address
 ldb ,x+ ; load next token into B: XYZ|LL|MMM
 andb #$18 ; isolate LL (embedded literals count) in B
 beq lz2nolt ; skip if no literals
 cmpb #$18 ; LITERALS_RUN_LEN_V2?
 bne lz2declt ; if not, we have the complete count, go unshift
 bsr lz2nibl ; get extra literals length nibble in B
 addb #$03 ; add LITERALS_RUN_LEN_V2
 cmpb #$12 ; LITERALS_RUN_LEN_V2 + 15 ?
 bne lz2gotla ; if not, we have the full literals count, go copy
 addb ,x+ ; add extra literals count byte + LITERALS_RUN_LEN + 15
 bcc lz2gotla ; if no overflow, we got the complete count, copy
 ldb ,x+ ; load low 8 bits of little-endian literals count
 lda ,x+ ; load high 8 bits of literal count
 bra lz2gotlt ; we now have the complete count, go copy
lz2declt lsrb ; shift literals count into place (LL sits in bits 3-4)
 lsrb
 lsrb
lz2gotla clra ; clear A (high part of literals count)
lz2gotlt tfr d,w ; set W with literals count for TFM instruction
 tfm x+,y+ ; copy literal bytes
; ---- decode the match offset from the token's X, Y and Z bits ----
lz2nolt ldb ,u ; get token again
 lslb ; push token's X flag bit into carry
 bcs lz2replg ; if token's X bit is set, rep or large offset
 lslb ; push token's Y flag bit into carry
 sex ; push token's Z flag bit into reg A (carry flag is not affected)
 bcs lz2offs9 ; if token's Y bit is set, 9 bits offset
 bsr lz2nibl ; get offset nibble in B
 lsla ; retrieve token's Z flag bit and push into carry
 rolb ; shift Z flag from carry into bit 0 of B
 eorb #$e1 ; set bits 5-7 of offset, reverse bit 0
 sex ; set bits 8-15 of offset to $FF
 bra lz2gotof
lz2offs9 deca ; set bits 9-15 of offset, reverse bit 8
 ldb ,x+ ; load low 8 bits of (negative, signed) offset
 bra lz2gotof
; ---- lz2nibl: return the next 4-bit nibble in B (A, U and Y are untouched) ----
; Nibbles are read two at a time: the high nibble of a freshly loaded byte is
; returned first, and the whole byte is kept in the ldb operand so the low
; nibble can be returned by the following call without reading the stream.
lz2nibl ldb #$aa ; $aa is patched with the last nibble byte read
 com lz2nibct ; toggle the flag: $00 -> $ff (need a new byte), $ff -> $00 (nibble ready)
 bpl lz2gotnb ; flag is now $00: use the low nibble of the stored byte
 ldb ,x+ ; load two nibbles
 stb lz2nibl+1 ; store nibble for next time (low 4 bits)
 lsrb ; shift 4 high bits of nibble down
 lsrb
 lsrb
 lsrb
lz2gotnb andb #$0f ; only keep low 4 bits
lz2done rts ; shared return: end of lz2nibl, and exit of the depacker on EOD

View File

@ -1,4 +1,4 @@
; unlzsa2.s - 6809 decompression routine for raw LZSA2 - 172 bytes ; unlzsa2.s - 6809 decompression routine for raw LZSA2 - 169 bytes
; compress with lzsa -f2 -r <original_file> <compressed_file> ; compress with lzsa -f2 -r <original_file> <compressed_file>
; ;
; in: x = start of compressed data ; in: x = start of compressed data
@ -24,7 +24,7 @@
; 3. This notice may not be removed or altered from any source distribution. ; 3. This notice may not be removed or altered from any source distribution.
decompress_lzsa2 decompress_lzsa2
lsr <lz2nibct,pcr ; reset nibble available flag clr <lz2nibct,pcr ; reset nibble available flag
lz2token ldb ,x+ ; load next token into B: XYZ|LL|MMM lz2token ldb ,x+ ; load next token into B: XYZ|LL|MMM
pshs b ; save it pshs b ; save it
@ -49,15 +49,15 @@ lz2token ldb ,x+ ; load next token into B: XYZ|LL|MMM
lz2declt lsrb ; shift literals count into place lz2declt lsrb ; shift literals count into place
lsrb lsrb
lsrb lsrb
lz2gotla clra ; clear A (high part of literals count) lz2gotla clra ; clear A (high part of literals count)
lz2gotlt tfr x,u
lz2gotlt leau ,x
tfr d,x ; transfer 16-bit count into X tfr d,x ; transfer 16-bit count into X
lz2cpylt lda ,u+ ; copy literal byte lz2cpylt lda ,u+ ; copy literal byte
sta ,y+ sta ,y+
leax -1,x ; decrement X and update Z flag leax -1,x ; decrement X and update Z flag
bne lz2cpylt ; loop until all literal bytes are copied bne lz2cpylt ; loop until all literal bytes are copied
tfr u,x leax ,u
lz2nolt ldb ,s ; get token again, don't pop it from the stack lz2nolt ldb ,s ; get token again, don't pop it from the stack
@ -83,10 +83,9 @@ lz2offs9 deca ; set bits 9-15 of offset, reverse bit 8
lz2nibct fcb $00 ; nibble ready flag lz2nibct fcb $00 ; nibble ready flag
lz2nibl ldb #$aa lz2nibl ldb #$aa
lsr <lz2nibct,pcr ; nibble ready? com <lz2nibct,pcr ; toggle nibble ready flag and check
bcs lz2gotnb bpl lz2gotnb
inc <lz2nibct,pcr ; flag nibble as ready for next time
ldb ,x+ ; load two nibbles ldb ,x+ ; load two nibbles
stb <lz2nibl+1,pcr ; store nibble for next time (low 4 bits) stb <lz2nibl+1,pcr ; store nibble for next time (low 4 bits)
@ -117,10 +116,8 @@ lz2rep16 bmi lz2repof ; if token's Z flag bit is set, rep match
lz2gotof std <lz2repof+2,pcr ; store match offset lz2gotof std <lz2repof+2,pcr ; store match offset
lz2repof leau $aaaa,y ; put backreference start address in U (dst+offset) lz2repof leau $aaaa,y ; put backreference start address in U (dst+offset)
puls b ; restore token ldd #$0007 ; clear MSB match length and set mask for MMM
andb ,s+ ; isolate MMM (embedded match length) in token
clra ; clear A (high part of match length)
andb #$07 ; isolate MMM (embedded match length)
addb #$02 ; add MIN_MATCH_SIZE_V2 addb #$02 ; add MIN_MATCH_SIZE_V2
cmpb #$09 ; MIN_MATCH_SIZE_V2 + MATCH_RUN_LEN_V2? cmpb #$09 ; MIN_MATCH_SIZE_V2 + MATCH_RUN_LEN_V2?
bne lz2gotln ; no, we have the full match length, go copy bne lz2gotln ; no, we have the full match length, go copy

View File

@ -1,4 +1,4 @@
; unlzsa2b.s - 6809 backward decompression routine for raw LZSA2 - 174 bytes ; unlzsa2b.s - 6809 backward decompression routine for raw LZSA2 - 171 bytes
; compress with lzsa -f2 -r -b <original_file> <compressed_file> ; compress with lzsa -f2 -r -b <original_file> <compressed_file>
; ;
; in: x = last byte of compressed data ; in: x = last byte of compressed data
@ -24,7 +24,7 @@
; 3. This notice may not be removed or altered from any source distribution. ; 3. This notice may not be removed or altered from any source distribution.
decompress_lzsa2 decompress_lzsa2
lsr <lz2nibct,pcr ; reset nibble available flag clr <lz2nibct,pcr ; reset nibble available flag
leax 1,x leax 1,x
leay 1,y leay 1,y
@ -41,7 +41,7 @@ lz2token ldb ,-x ; load next token into B: XYZ|LL|MMM
cmpb #$12 ; LITERALS_RUN_LEN_V2 + 15 ? cmpb #$12 ; LITERALS_RUN_LEN_V2 + 15 ?
bne lz2gotla ; if not, we have the full literals count, go copy bne lz2gotla ; if not, we have the full literals count, go copy
addb ,-x ; add extra literals count byte + LITERALS_RUN_LEN + 15 addb ,-x ; add extra literals count byte + LITERALS_RUN_LEN + 15
bcc lz2gotla ; if no overflow, we got the complete count, copy bcc lz2gotla ; if no overflow, we got the complete count, copy
ldd ,--x ; load 16 bit count in D (low part in B, high in A) ldd ,--x ; load 16 bit count in D (low part in B, high in A)
@ -52,13 +52,13 @@ lz2declt lsrb ; shift literals count into place
lsrb lsrb
lz2gotla clra ; clear A (high part of literals count) lz2gotla clra ; clear A (high part of literals count)
lz2gotlt tfr x,u lz2gotlt leau ,x
tfr d,x ; transfer 16-bit count into X tfr d,x ; transfer 16-bit count into X
lz2cpylt lda ,-u ; copy literal byte lz2cpylt lda ,-u ; copy literal byte
sta ,-y sta ,-y
leax -1,x ; decrement X and update Z flag leax -1,x ; decrement X and update Z flag
bne lz2cpylt ; loop until all literal bytes are copied bne lz2cpylt ; loop until all literal bytes are copied
tfr u,x leax ,u
lz2nolt ldb ,s ; get token again, don't pop it from the stack lz2nolt ldb ,s ; get token again, don't pop it from the stack
@ -77,16 +77,15 @@ lz2nolt ldb ,s ; get token again, don't pop it from the stack
sex ; set bits 8-15 of offset to $FF sex ; set bits 8-15 of offset to $FF
bra lz2gotof bra lz2gotof
lz2offs9 deca ; set bits 9-15 of offset, reverse bit 8 lz2offs9 deca ; set bits 9-15 of offset, reverse bit 8
bra lz2lowof bra lz2lowof
lz2nibct fcb $00 ; nibble ready flag lz2nibct fcb $00 ; nibble ready flag
lz2nibl ldb #$aa lz2nibl ldb #$aa
lsr <lz2nibct,pcr ; nibble ready? com <lz2nibct,pcr ; toggle nibble ready flag and check
bcs lz2gotnb bpl lz2gotnb
inc <lz2nibct,pcr ; flag nibble as ready for next time
ldb ,-x ; load two nibbles ldb ,-x ; load two nibbles
stb <lz2nibl+1,pcr ; store nibble for next time (low 4 bits) stb <lz2nibl+1,pcr ; store nibble for next time (low 4 bits)
@ -123,10 +122,9 @@ lz2gotof nega ; reverse sign of offset in D
lz2repof leau $aaaa,y ; put backreference start address in U (dst+offset) lz2repof leau $aaaa,y ; put backreference start address in U (dst+offset)
puls b ; restore token ldd #$0007 ; clear MSB match length and set mask for MMM
andb ,s+ ; isolate MMM (embedded match length) in token
clra ; clear A (high part of match length)
andb #$07 ; isolate MMM (embedded match length)
addb #$02 ; add MIN_MATCH_SIZE_V2 addb #$02 ; add MIN_MATCH_SIZE_V2
cmpb #$09 ; MIN_MATCH_SIZE_V2 + MATCH_RUN_LEN_V2? cmpb #$09 ; MIN_MATCH_SIZE_V2 + MATCH_RUN_LEN_V2?
bne lz2gotln ; no, we have the full match length, go copy bne lz2gotln ; no, we have the full match length, go copy