mirror of
https://github.com/cc65/cc65.git
synced 2025-02-19 06:30:53 +00:00
The upper 16 bits of the result differ between signed and unsigned multiplication, so while the unsigned routine can be used for 16x16=16 regardless of signedness, this is not true for 16x16=32.
git-svn-id: svn://svn.cc65.org/cc65/trunk@4438 b7a2c559-68d2-44c3-8de9-860c34a00d81
This commit is contained in:
parent
1bec071755
commit
7c804513fa
@ -81,6 +81,7 @@ OBJS = add.o \
|
|||||||
ge.o \
|
ge.o \
|
||||||
gt.o \
|
gt.o \
|
||||||
icmp.o \
|
icmp.o \
|
||||||
|
imul16x16r32.o \
|
||||||
incax1.o \
|
incax1.o \
|
||||||
incax2.o \
|
incax2.o \
|
||||||
incax3.o \
|
incax3.o \
|
||||||
@ -152,7 +153,6 @@ OBJS = add.o \
|
|||||||
makebool.o \
|
makebool.o \
|
||||||
mod.o \
|
mod.o \
|
||||||
mul.o \
|
mul.o \
|
||||||
mul16x16r32.o \
|
|
||||||
mul8.o \
|
mul8.o \
|
||||||
mul8x8r16.o \
|
mul8x8r16.o \
|
||||||
mulax3.o \
|
mulax3.o \
|
||||||
@ -219,6 +219,7 @@ OBJS = add.o \
|
|||||||
ule.o \
|
ule.o \
|
||||||
ult.o \
|
ult.o \
|
||||||
umod.o \
|
umod.o \
|
||||||
|
umul16x16r32.o \
|
||||||
xor.o \
|
xor.o \
|
||||||
zeropage.o
|
zeropage.o
|
||||||
|
|
||||||
|
50
libsrc/runtime/imul16x16r32.s
Normal file
50
libsrc/runtime/imul16x16r32.s
Normal file
@ -0,0 +1,50 @@
|
|||||||
|
;
|
||||||
|
; Ullrich von Bassewitz, 2010-11-03
|
||||||
|
;
|
||||||
|
; CC65 runtime: 16x16 => 32 signed multiplication
|
||||||
|
;
|
||||||
|
|
||||||
|
.export imul16x16r32, _cc65_imul16x16r32
|
||||||
|
.import popax, negax, umul16x16r32m, negeax
|
||||||
|
.importzp ptr1, ptr3, tmp1
|
||||||
|
|
||||||
|
|
||||||
|
;---------------------------------------------------------------------------
|
||||||
|
; 16x16 => 32 signed multiplication routine.
|
||||||
|
;
|
||||||
|
; lhs rhs result result also in
|
||||||
|
; -------------------------------------------------------------
|
||||||
|
; ptr1 ax ax:sreg
|
||||||
|
;
|
||||||
|
; There is probably a faster way to do this.
|
||||||
|
;
|
||||||
|
|
||||||
|
|
||||||
|
_cc65_imul16x16r32:     ; Entry that takes one operand in A/X and fetches the other via popax
|
||||||
|
sta ptr1                ; Incoming A/X becomes the ptr1 operand (low byte)
|
||||||
|
stx ptr1+1              ; ... and high byte
|
||||||
|
jsr popax               ; Imported helper; presumably pops the other operand into A/X - confirm
|
||||||
|
|
||||||
|
imul16x16r32:           ; Signed 16x16 => 32 multiply: operands in ptr1 and A/X; falls through from above
|
||||||
|
stx tmp1                ; Remember the high byte (sign) of the A/X operand
|
||||||
|
cpx #0                  ; stx leaves the flags untouched, so test the sign of X explicitly
|
||||||
|
bpl @L1                 ; Non-negative: use the operand as is
|
||||||
|
jsr negax               ; Imported helper; presumably negates A/X to get the magnitude - confirm
|
||||||
|
@L1: sta ptr3           ; Store the (possibly negated) A/X operand in ptr3
|
||||||
|
stx ptr3+1
|
||||||
|
|
||||||
|
lda ptr1+1              ; High byte of the ptr1 operand ...
|
||||||
|
eor tmp1                ; ... XOR saved high byte of the other: bit 7 set if the signs differ
|
||||||
|
sta tmp1                ; tmp1 bit 7 now holds the sign of the product
|
||||||
|
lda ptr1                ; Load the ptr1 operand into A/X
|
||||||
|
ldx ptr1+1              ; ldx sets N from the high byte, i.e. the operand's sign
|
||||||
|
bpl @L2                 ; Non-negative: ptr1 can stay as it is
|
||||||
|
jsr negax               ; Negative: negate it (see note on negax above)
|
||||||
|
sta ptr1                ; Write the negated value back to ptr1
|
||||||
|
stx ptr1+1
|
||||||
|
@L2: jsr umul16x16r32m  ; Unsigned multiply, entered at the point where ptr1/ptr3 are already set up
|
||||||
|
ldy tmp1                ; Fetch the product sign into Y; A/X are not modified by this load
|
||||||
|
bpl @L3                 ; Signs were equal: the unsigned product is the result
|
||||||
|
jmp negeax              ; Signs differed: tail-jump to negeax (presumably negates the 32-bit result - confirm)
|
||||||
|
@L3: rts
|
||||||
|
|
@ -1,17 +1,16 @@
|
|||||||
;
|
;
|
||||||
; Ullrich von Bassewitz, 2010-11-03
|
; Ullrich von Bassewitz, 2010-11-03
|
||||||
;
|
;
|
||||||
; CC65 runtime: 16x16 => 32 multiplication
|
; CC65 runtime: 16x16 => 32 unsigned multiplication
|
||||||
;
|
;
|
||||||
|
|
||||||
.export umul16x16r32, _cc65_umul16x16r32
|
.export _cc65_umul16x16r32, umul16x16r32, umul16x16r32m
|
||||||
.export mul16x16r32 := umul16x16r32
|
|
||||||
.import popax
|
.import popax
|
||||||
.importzp ptr1, ptr2, ptr3, ptr4, sreg
|
.importzp ptr1, ptr3, sreg
|
||||||
|
|
||||||
|
|
||||||
;---------------------------------------------------------------------------
|
;---------------------------------------------------------------------------
|
||||||
; 16x16 => 32 multiplication routine.
|
; 16x16 => 32 unsigned multiplication routine.
|
||||||
;
|
;
|
||||||
; lhs rhs result result also in
|
; lhs rhs result result also in
|
||||||
; -------------------------------------------------------------
|
; -------------------------------------------------------------
|
||||||
@ -26,6 +25,8 @@ _cc65_umul16x16r32:
|
|||||||
umul16x16r32:
|
umul16x16r32:
|
||||||
sta ptr3
|
sta ptr3
|
||||||
stx ptr3+1
|
stx ptr3+1
|
||||||
|
|
||||||
|
umul16x16r32m:
|
||||||
lda #0
|
lda #0
|
||||||
sta sreg+1
|
sta sreg+1
|
||||||
ldy #16 ; Number of bits
|
ldy #16 ; Number of bits
|
||||||
@ -37,7 +38,7 @@ umul16x16r32:
|
|||||||
clc
|
clc
|
||||||
adc ptr3
|
adc ptr3
|
||||||
pha
|
pha
|
||||||
txa ; hi byte of left op
|
lda ptr3+1
|
||||||
adc sreg+1
|
adc sreg+1
|
||||||
sta sreg+1
|
sta sreg+1
|
||||||
pla
|
pla
|
Loading…
x
Reference in New Issue
Block a user