mirror of
https://github.com/cc65/cc65.git
synced 2025-01-09 11:30:29 +00:00
df92f7585f
git-svn-id: svn://svn.cc65.org/cc65/trunk@1125 b7a2c559-68d2-44c3-8de9-860c34a00d81
677 lines
14 KiB
ArmAsm
677 lines
14 KiB
ArmAsm
;
|
|
; Piotr Fusik, 23.11.2001
|
|
;
|
|
; unsigned __fastcall__ inflatemem (char* dest, const char* source);
|
|
;
|
|
|
|
.export _inflatemem
|
|
|
|
.import incsp2
|
|
.importzp sp, sreg, ptr1, ptr2, ptr3, ptr4, tmp1
|
|
|
|
; --------------------------------------------------------------------------
|
|
;
|
|
; Constants
|
|
;
|
|
|
|
; Maximum length of a Huffman code
|
|
MAX_BITS = 15
|
|
; Index in bitsCount, bitsPointer_l and bitsPointer_h
|
|
; for temporary tree or literal/length tree
|
|
PRIMARY_TREE = 0
|
|
; Index in bitsCount, bitsPointer_l and bitsPointer_h for distance tree
|
|
DISTANCE_TREE = MAX_BITS
|
|
; Size of each of bitsCount, bitsPointer_l and bitsPointer_h
|
|
TREES_SIZE = 2*MAX_BITS
|
|
|
|
; --------------------------------------------------------------------------
|
|
;
|
|
; Page zero
|
|
;
|
|
|
|
; Pointer to compressed data
|
|
inputPointer = ptr1 ; 2 bytes
|
|
; Pointer to uncompressed data
|
|
outputPointer = ptr2 ; 2 bytes
|
|
|
|
; Local variables
|
|
getBit_hold = tmp1 ; 1 byte
|
|
|
|
inflateDynamicBlock_cnt = ptr3 ; 1 byte
|
|
inflateCodes_src = ptr3 ; 2 bytes
|
|
buildHuffmanTree_src = ptr3 ; 2 bytes
|
|
getNextLength_last = ptr3 ; 1 byte
|
|
getNextLength_index = ptr3+1 ; 1 byte
|
|
|
|
buildHuffmanTree_ptr = ptr4 ; 2 bytes
|
|
fetchCode_ptr = ptr4 ; 2 bytes
|
|
getBits_tmp = ptr4 ; 1 byte
|
|
|
|
moveBlock_len = sreg ; 2 bytes
|
|
inflateDynamicBlock_np = sreg ; 1 byte
|
|
inflateDynamicBlock_nd = sreg+1 ; 1 byte
|
|
|
|
; --------------------------------------------------------------------------
|
|
;
|
|
; Code
|
|
;
|
|
|
|
_inflatemem:
|
|
|
|
; inputPointer = source
|
|
sta inputPointer
|
|
stx inputPointer+1
|
|
; outputPointer = dest
|
|
.ifpc02
|
|
lda (sp)
|
|
ldy #1
|
|
.else
|
|
ldy #0
|
|
lda (sp),y
|
|
iny
|
|
.endif
|
|
sta outputPointer
|
|
lda (sp),y
|
|
sta outputPointer+1
|
|
|
|
; ldy #1
|
|
sty getBit_hold
|
|
inflatemem_1:
|
|
; Get a bit of EOF and two bits of block type
|
|
ldx #3
|
|
lda #0
|
|
jsr getBits
|
|
lsr a
|
|
tax
|
|
; X contains block type, C contains EOF flag
|
|
; Save EOF flag
|
|
php
|
|
; Go to the routine decompressing this block
|
|
jsr callExtr
|
|
plp
|
|
bcc inflatemem_1
|
|
; C flag is set!
|
|
|
|
; return outputPointer - dest;
|
|
lda outputPointer
|
|
.ifpc02
|
|
sbc (sp) ; C flag is set
|
|
ldy #1
|
|
.else
|
|
ldy #0
|
|
sbc (sp),y ; C flag is set
|
|
iny
|
|
.endif
|
|
pha
|
|
lda outputPointer+1
|
|
sbc (sp),y
|
|
tax
|
|
pla
|
|
; pop dest
|
|
jmp incsp2
|
|
|
|
; --------------------------------------------------------------------------
|
|
; Go to the routine decompressing block type X
|
|
|
|
callExtr:
|
|
lda extr_h,x
|
|
pha
|
|
lda extr_l,x
|
|
pha
|
|
rts
|
|
|
|
; --------------------------------------------------------------------------
|
|
; Decompress 'stored' data block
|
|
|
|
inflateCopyBlock:
|
|
; Ignore bits until byte boundary
|
|
ldy #1
|
|
sty getBit_hold
|
|
; Get 16-bit length
|
|
ldx #inputPointer
|
|
lda (0,x)
|
|
sta moveBlock_len
|
|
lda (inputPointer),y
|
|
sta moveBlock_len+1
|
|
; Skip length and one's complement of it
|
|
lda #4
|
|
clc
|
|
adc inputPointer
|
|
sta inputPointer
|
|
bcc moveBlock
|
|
inc inputPointer+1
|
|
; jmp moveBlock
|
|
|
|
; --------------------------------------------------------------------------
|
|
; Copy block of length moveBlock_len from (0,x) to output
|
|
|
|
moveBlock:
|
|
ldy moveBlock_len
|
|
beq moveBlock_1
|
|
.ifpc02
|
|
.else
|
|
ldy #0
|
|
.endif
|
|
inc moveBlock_len+1
|
|
moveBlock_1:
|
|
lda (0,x)
|
|
.ifpc02
|
|
sta (outputPointer)
|
|
.else
|
|
sta (outputPointer),y
|
|
.endif
|
|
inc 0,x
|
|
bne moveBlock_2
|
|
inc 1,x
|
|
moveBlock_2:
|
|
inc outputPointer
|
|
bne moveBlock_3
|
|
inc outputPointer+1
|
|
moveBlock_3:
|
|
.ifpc02
|
|
dey
|
|
.else
|
|
dec moveBlock_len
|
|
.endif
|
|
bne moveBlock_1
|
|
dec moveBlock_len+1
|
|
bne moveBlock_1
|
|
rts
|
|
|
|
; --------------------------------------------------------------------------
|
|
; Decompress Huffman-coded data block with default Huffman trees:
|
|
; literalCodeLength: 144 times 8, 112 times 9
|
|
; endCodeLength: 24 times 7, 6 times 8
|
|
; distanceCodeLength: 30 times 5+DISTANCE_TREE, 2 times 8
|
|
; (two 8-bit codes from primary tree are not used)
|
|
|
|
inflateFixedBlock:
|
|
ldx #159
|
|
stx distanceCodeLength+32
|
|
lda #8
|
|
inflateFixedBlock_1:
|
|
sta literalCodeLength-1,x
|
|
sta literalCodeLength+159-1,x
|
|
dex
|
|
bne inflateFixedBlock_1
|
|
ldx #112
|
|
; lda #9
|
|
inflateFixedBlock_2:
|
|
inc literalCodeLength+144-1,x ; sta
|
|
dex
|
|
bne inflateFixedBlock_2
|
|
ldx #24
|
|
; lda #7
|
|
inflateFixedBlock_3:
|
|
dec endCodeLength-1,x ; sta
|
|
dex
|
|
bne inflateFixedBlock_3
|
|
ldx #30
|
|
lda #5+DISTANCE_TREE
|
|
inflateFixedBlock_4:
|
|
sta distanceCodeLength-1,x
|
|
dex
|
|
bne inflateFixedBlock_4
|
|
jmp inflateCodes
|
|
|
|
; --------------------------------------------------------------------------
|
|
; Decompress Huffman-coded data block, reading Huffman trees first
|
|
|
|
inflateDynamicBlock:
|
|
; numberOfPrimaryCodes = 257 + getBits(5)
|
|
ldx #5
|
|
lda #1
|
|
jsr getBits
|
|
sta inflateDynamicBlock_np
|
|
; numberOfDistanceCodes = 1 + getBits(5)
|
|
ldx #5
|
|
lda #1+29+1
|
|
jsr getBits
|
|
sta inflateDynamicBlock_nd
|
|
; numberOfTemporaryCodes = 4 + getBits(4)
|
|
lda #4
|
|
tax
|
|
jsr getBits
|
|
sta inflateDynamicBlock_cnt
|
|
; Get lengths of temporary codes in order stored in tempCodeLengthOrder
|
|
ldy #0
|
|
inflateDynamicBlock_1:
|
|
ldx #3
|
|
lda #0
|
|
jsr getBits ; does not change Y
|
|
inflateDynamicBlock_2:
|
|
ldx tempCodeLengthOrder,y
|
|
sta literalCodeLength,x
|
|
iny
|
|
cpy inflateDynamicBlock_cnt
|
|
bcc inflateDynamicBlock_1
|
|
lda #0
|
|
cpy #19
|
|
bcc inflateDynamicBlock_2
|
|
ror literalCodeLength+19 ; C flag is set, so it will set b7
|
|
; Build tree for temporary codes
|
|
jsr buildHuffmanTree
|
|
|
|
; Use temporary codes to get lengths for literal/length and distance codes
|
|
ldx #0
|
|
ldy #1
|
|
stx getNextLength_last
|
|
inflateDynamicBlock_3:
|
|
jsr getNextLength
|
|
sta literalCodeLength,x
|
|
inx
|
|
bne inflateDynamicBlock_3
|
|
inflateDynamicBlock_4:
|
|
jsr getNextLength
|
|
sta endCodeLength,x
|
|
inx
|
|
cpx inflateDynamicBlock_np
|
|
bcc inflateDynamicBlock_4
|
|
.ifpc02
|
|
bcs inflateDynamicBlock_6 ; branch always
|
|
inflateDynamicBlock_5:
|
|
stz endCodeLength,x
|
|
.else
|
|
lda #0
|
|
bcs inflateDynamicBlock_6 ; branch always
|
|
inflateDynamicBlock_5:
|
|
sta endCodeLength,x
|
|
.endif
|
|
inx
|
|
inflateDynamicBlock_6:
|
|
cpx #1+29
|
|
bcc inflateDynamicBlock_5
|
|
inflateDynamicBlock_7:
|
|
jsr getNextLength
|
|
cmp #0
|
|
beq inflateDynamicBlock_8
|
|
adc #DISTANCE_TREE-1 ; C flag is set
|
|
inflateDynamicBlock_8:
|
|
sta endCodeLength,x
|
|
inx
|
|
cpx inflateDynamicBlock_nd
|
|
bcc inflateDynamicBlock_7
|
|
ror endCodeLength,x ; C flag is set, so it will set b7
|
|
; jmp inflateCodes
|
|
|
|
; --------------------------------------------------------------------------
|
|
; Decompress data block basing on given Huffman trees
|
|
|
|
inflateCodes:
|
|
jsr buildHuffmanTree
|
|
inflateCodes_1:
|
|
jsr fetchPrimaryCode
|
|
bcs inflateCodes_2
|
|
; Literal code
|
|
.ifpc02
|
|
sta (outputPointer)
|
|
.else
|
|
ldy #0
|
|
sta (outputPointer),y
|
|
.endif
|
|
inc outputPointer
|
|
bne inflateCodes_1
|
|
inc outputPointer+1
|
|
bcc inflateCodes_1 ; branch always
|
|
; End of block
|
|
inflateCodes_ret:
|
|
rts
|
|
inflateCodes_2:
|
|
beq inflateCodes_ret
|
|
; Repeat block
|
|
jsr getValue
|
|
sta moveBlock_len
|
|
tya
|
|
jsr getBits
|
|
sta moveBlock_len+1
|
|
ldx #DISTANCE_TREE
|
|
jsr fetchCode
|
|
jsr getValue
|
|
sec
|
|
eor #$ff
|
|
adc outputPointer
|
|
sta inflateCodes_src
|
|
php
|
|
tya
|
|
jsr getBits
|
|
plp
|
|
eor #$ff
|
|
adc outputPointer+1
|
|
sta inflateCodes_src+1
|
|
ldx #inflateCodes_src
|
|
jsr moveBlock
|
|
beq inflateCodes_1 ; branch always
|
|
|
|
; --------------------------------------------------------------------------
|
|
; Build Huffman trees basing on code lengths.
|
|
; Lengths (in bits) are stored in *CodeLength tables.
|
|
; A byte with highest bit set marks end of length table.
|
|
|
|
buildHuffmanTree:
|
|
lda #<literalCodeLength
|
|
sta buildHuffmanTree_src
|
|
lda #>literalCodeLength
|
|
sta buildHuffmanTree_src+1
|
|
; Clear bitsCount and bitsPointer_l
|
|
ldy #2*TREES_SIZE+1
|
|
lda #0
|
|
buildHuffmanTree_1:
|
|
sta bitsCount-1,y
|
|
dey
|
|
bne buildHuffmanTree_1
|
|
beq buildHuffmanTree_3 ; branch always
|
|
; Count number of codes of each length
|
|
buildHuffmanTree_2:
|
|
tax
|
|
inc bitsPointer_l,x
|
|
iny
|
|
bne buildHuffmanTree_3
|
|
inc buildHuffmanTree_src+1
|
|
buildHuffmanTree_3:
|
|
lda (buildHuffmanTree_src),y
|
|
bpl buildHuffmanTree_2
|
|
; Calculate pointer for each length
|
|
ldx #0
|
|
lda #<sortedCodes
|
|
ldy #>sortedCodes
|
|
clc
|
|
buildHuffmanTree_4:
|
|
sta bitsPointer_l,x
|
|
tya
|
|
sta bitsPointer_h,x
|
|
lda bitsPointer_l+1,x
|
|
adc bitsPointer_l,x ; C flag is zero
|
|
bcc buildHuffmanTree_5
|
|
iny
|
|
buildHuffmanTree_5:
|
|
inx
|
|
cpx #TREES_SIZE
|
|
bcc buildHuffmanTree_4
|
|
lda #>literalCodeLength
|
|
sta buildHuffmanTree_src+1
|
|
ldy #0
|
|
bcs buildHuffmanTree_9 ; branch always
|
|
; Put codes into their place in sorted table
|
|
buildHuffmanTree_6:
|
|
beq buildHuffmanTree_7
|
|
tax
|
|
lda bitsPointer_l-1,x
|
|
sta buildHuffmanTree_ptr
|
|
lda bitsPointer_h-1,x
|
|
sta buildHuffmanTree_ptr+1
|
|
tya
|
|
ldy bitsCount-1,x
|
|
inc bitsCount-1,x
|
|
sta (buildHuffmanTree_ptr),y
|
|
tay
|
|
buildHuffmanTree_7:
|
|
iny
|
|
bne buildHuffmanTree_9
|
|
inc buildHuffmanTree_src+1
|
|
ldx #MAX_BITS-1
|
|
buildHuffmanTree_8:
|
|
lda bitsCount,x
|
|
sta literalCount,x
|
|
dex
|
|
bpl buildHuffmanTree_8
|
|
buildHuffmanTree_9:
|
|
lda (buildHuffmanTree_src),y
|
|
bpl buildHuffmanTree_6
|
|
rts
|
|
|
|
; --------------------------------------------------------------------------
|
|
; Get next code length basing on temporary codes
|
|
|
|
getNextLength:
|
|
stx getNextLength_index
|
|
dey
|
|
bne getNextLength_1
|
|
; Fetch a temporary code
|
|
jsr fetchPrimaryCode
|
|
; Temporary code 0..15: put this length
|
|
ldy #1
|
|
cmp #16
|
|
bcc getNextLength_2
|
|
; Temporary code 16: repeat last length 3 + getBits(2) times
|
|
; Temporary code 17: put zero length 3 + getBits(3) times
|
|
; Temporary code 18: put zero length 11 + getBits(7) times
|
|
tay
|
|
ldx tempExtraBits-16,y
|
|
lda tempBaseValue-16,y
|
|
jsr getBits
|
|
cpy #17
|
|
tay
|
|
lda #0
|
|
bcs getNextLength_2
|
|
getNextLength_1:
|
|
lda getNextLength_last
|
|
getNextLength_2:
|
|
sta getNextLength_last
|
|
ldx getNextLength_index
|
|
rts
|
|
|
|
; --------------------------------------------------------------------------
|
|
; Read code basing on primary tree
|
|
|
|
fetchPrimaryCode:
|
|
ldx #PRIMARY_TREE
|
|
; jmp fetchCode
|
|
|
|
; --------------------------------------------------------------------------
|
|
; Read code from input stream basing on tree given in X.
|
|
; Return low byte of code in A.
|
|
; For literal/length tree, C is: 0 if literal code, 1 if end or length code.
|
|
|
|
fetchCode:
|
|
lda #0
|
|
fetchCode_1:
|
|
jsr getBit
|
|
rol a
|
|
cmp bitsCount,x
|
|
bcc fetchCode_2
|
|
sbc bitsCount,x ; C flag is set
|
|
inx
|
|
bcs fetchCode_1 ; branch always
|
|
fetchCode_2:
|
|
cmp literalCount,x
|
|
sta fetchCode_ptr
|
|
ldy bitsPointer_l,x
|
|
lda bitsPointer_h,x
|
|
sta fetchCode_ptr+1
|
|
lda (fetchCode_ptr),y
|
|
rts
|
|
|
|
; --------------------------------------------------------------------------
|
|
; Read low byte of value (length or distance), basing on code A
|
|
|
|
getValue:
|
|
tay
|
|
ldx lengthExtraBits-1,y
|
|
lda lengthBaseValue_l-1,y
|
|
pha
|
|
lda lengthBaseValue_h-1,y
|
|
tay
|
|
pla
|
|
; jmp getBits
|
|
|
|
; --------------------------------------------------------------------------
|
|
; Read X-bit number from input stream and add it to A.
|
|
; In case of carry, Y is incremented.
|
|
; If X > 8, only 8 bits are read.
|
|
; On return X holds number of unread bits: X = (X > 8 ? X - 8 : 0);
|
|
|
|
getBits:
|
|
cpx #0
|
|
beq getBits_ret
|
|
pha
|
|
lda #1
|
|
sta getBits_tmp
|
|
pla
|
|
getBits_1:
|
|
jsr getBit
|
|
bcc getBits_2
|
|
clc
|
|
adc getBits_tmp
|
|
bcc getBits_2
|
|
iny
|
|
getBits_2:
|
|
dex
|
|
beq getBits_ret
|
|
asl getBits_tmp
|
|
bcc getBits_1
|
|
getBits_ret:
|
|
rts
|
|
|
|
; --------------------------------------------------------------------------
|
|
; Read single bit from input stream, return it in C flag
|
|
|
|
getBit:
|
|
lsr getBit_hold
|
|
bne getBit_ret
|
|
pha
|
|
.ifpc02
|
|
lda (inputPointer)
|
|
.else
|
|
tya
|
|
pha
|
|
ldy #0
|
|
lda (inputPointer),y
|
|
.endif
|
|
inc inputPointer
|
|
bne getBit_1
|
|
inc inputPointer+1
|
|
getBit_1:
|
|
ror a ; C flag is set
|
|
sta getBit_hold
|
|
.ifpc02
|
|
.else
|
|
pla
|
|
tay
|
|
.endif
|
|
pla
|
|
getBit_ret:
|
|
rts
|
|
|
|
; --------------------------------------------------------------------------
|
|
;
|
|
; Constant data
|
|
;
|
|
|
|
.rodata
|
|
; --------------------------------------------------------------------------
|
|
; Addresses of functions extracting different blocks
|
|
extr_l:
|
|
.byte <(inflateCopyBlock-1)
|
|
.byte <(inflateFixedBlock-1)
|
|
.byte <(inflateDynamicBlock-1)
|
|
extr_h:
|
|
.byte >(inflateCopyBlock-1)
|
|
.byte >(inflateFixedBlock-1)
|
|
.byte >(inflateDynamicBlock-1)
|
|
|
|
; --------------------------------------------------------------------------
|
|
; Tables for temporary codes
|
|
; Value is BaseValue + getBits(ExtraBits)
|
|
|
|
; Order, in which lengths of temporary codes are stored
|
|
tempCodeLengthOrder:
|
|
.byte 16,17,18,0,8,7,9,6,10,5,11,4,12,3,13,2,14,1,15
|
|
|
|
; Base values
|
|
tempBaseValue:
|
|
.byte 3,3,11
|
|
|
|
; Number of extra bits to read
|
|
tempExtraBits:
|
|
.byte 2,3,7
|
|
|
|
; --------------------------------------------------------------------------
|
|
; Tables for length and distance codes
|
|
; Value is BaseValue + getBits(ExtraBits)
|
|
|
|
; Base values
|
|
lengthBaseValue_l:
|
|
.byte <3,<4,<5,<6,<7,<8,<9,<10
|
|
.byte <11,<13,<15,<17,<19,<23,<27,<31
|
|
.byte <35,<43,<51,<59,<67,<83,<99,<115
|
|
.byte <131,<163,<195,<227,<258
|
|
distanceBaseValue_l:
|
|
.byte <1,<2,<3,<4,<5,<7,<9,<13
|
|
.byte <17,<25,<33,<49,<65,<97,<129,<193
|
|
.byte <257,<385,<513,<769,<1025,<1537,<2049,<3073
|
|
.byte <4097,<6145,<8193,<12289,<16385,<24577
|
|
lengthBaseValue_h:
|
|
.byte >3,>4,>5,>6,>7,>8,>9,>10
|
|
.byte >11,>13,>15,>17,>19,>23,>27,>31
|
|
.byte >35,>43,>51,>59,>67,>83,>99,>115
|
|
.byte >131,>163,>195,>227,>258
|
|
distanceBaseValue_h:
|
|
.byte >1,>2,>3,>4,>5,>7,>9,>13
|
|
.byte >17,>25,>33,>49,>65,>97,>129,>193
|
|
.byte >257,>385,>513,>769,>1025,>1537,>2049,>3073
|
|
.byte >4097,>6145,>8193,>12289,>16385,>24577
|
|
|
|
; Number of extra bits to read
|
|
lengthExtraBits:
|
|
.byte 0,0,0,0,0,0,0,0
|
|
.byte 1,1,1,1,2,2,2,2
|
|
.byte 3,3,3,3,4,4,4,4
|
|
.byte 5,5,5,5,0
|
|
distanceExtraBits:
|
|
.byte 0,0,0,0,1,1,2,2
|
|
.byte 3,3,4,4,5,5,6,6
|
|
.byte 7,7,8,8,9,9,10,10
|
|
.byte 11,11,12,12,13,13
|
|
|
|
; --------------------------------------------------------------------------
|
|
;
|
|
; Uninitialised data
|
|
;
|
|
|
|
.bss
|
|
|
|
; Number of literal codes of each length in primary tree
|
|
; (MAX_BITS bytes, overlap with literalCodeLength)
|
|
literalCount:
|
|
|
|
; --------------------------------------------------------------------------
|
|
; Data for building primary tree
|
|
|
|
; Lengths of literal codes
|
|
literalCodeLength:
|
|
.res 256
|
|
; Length of end code
|
|
endCodeLength:
|
|
.res 1
|
|
; Lengths of length codes
|
|
lengthCodeLength:
|
|
.res 29
|
|
|
|
; --------------------------------------------------------------------------
|
|
; Data for building distance tree
|
|
|
|
; Lengths of distance codes
|
|
distanceCodeLength:
|
|
.res 30
|
|
; For two unused codes in fixed trees and end-of-table flag
|
|
.res 3
|
|
|
|
; --------------------------------------------------------------------------
|
|
; Huffman tree structure
|
|
|
|
; Number of codes of each length
|
|
bitsCount:
|
|
.res TREES_SIZE
|
|
; Pointer to sorted codes of each length
|
|
bitsPointer_l:
|
|
.res TREES_SIZE+1
|
|
bitsPointer_h:
|
|
.res TREES_SIZE
|
|
|
|
; Sorted codes
|
|
sortedCodes:
|
|
.res 256+1+29+30+2
|
|
|
|
|
|
|