mirror of
https://github.com/cc65/cc65.git
synced 2024-11-16 02:10:52 +00:00
8a140e6503
cputc: -2 cycles per char, -2 cycles per carriage return cputs: -5 cycles per char, -3 cycles on cputsxy vcprintf: -6 cycles per char
169 lines
3.9 KiB
ArmAsm
169 lines
3.9 KiB
ArmAsm
;
|
|
; int __fastcall__ vcprintf (const char* Format, va_list ap);
|
|
;
|
|
; Ullrich von Bassewitz, 2.12.2000
|
|
;
|
|
|
|
.export _vcprintf
|
|
.import pushax, popax, popptr1
|
|
.import __printf, _cputc
|
|
.importzp sp, ptr1, ptr2, ptr3, tmp1
|
|
|
|
.macpack generic
|
|
.macpack cpu
|
|
|
|
.data
|
|
|
|
; ----------------------------------------------------------------------------
|
|
;
|
|
; Static data for the _vsprintf routine
|
|
;
|
|
|
|
outdesc: ; Static outdesc structure
|
|
.word 0 ; ccount
|
|
.word out ; Output function pointer
|
|
.word 0 ; ptr
|
|
.word 0 ; uns
|
|
|
|
.code
|
|
|
|
; ----------------------------------------------------------------------------
|
|
; Callback routine used for the actual output.
|
|
;
|
|
; static void __cdecl__ out (struct outdesc* d, const char* buf, unsigned count)
|
|
; /* Routine used for writing */
|
|
; {
|
|
; /* Fast screen output */
|
|
; d->ccount += count;
|
|
; while (count) {
|
|
; cputc (*buf);
|
|
; ++buf;
|
|
; --count;
|
|
; }
|
|
; }
|
|
;
|
|
; We're using ptr1 and tmp1, since we know that the cputc routine will not use
|
|
; them (they're also used in cputs, so they must be safe).
|
|
|
|
out: jsr popax ; count
|
|
sta ptr2
|
|
stx ptr2+1
|
|
inx
|
|
stx outdesc+7
|
|
tax
|
|
inx
|
|
stx outdesc+6
|
|
|
|
jsr popptr1 ; buf
|
|
|
|
jsr popax ; d
|
|
sta ptr3
|
|
stx ptr3+1
|
|
|
|
; Sum up the total count of characters
|
|
|
|
ldy #0 ; ccount in struct outdesc
|
|
sty tmp1 ; Initialize tmp1 while we have zero available
|
|
lda (ptr3),y
|
|
add ptr2
|
|
sta (ptr3),y
|
|
iny
|
|
lda (ptr3),y
|
|
adc ptr2+1
|
|
sta (ptr3),y
|
|
|
|
; Loop outputting characters
|
|
|
|
.if (.cpu .bitand CPU_ISET_65SC02)
|
|
|
|
@L1: dec outdesc+6
|
|
beq @L4
|
|
@L2: lda (ptr1) ; (5)
|
|
inc ptr1 ; (10)
|
|
bne @L3 ; (12)
|
|
inc ptr1+1 ; (17)
|
|
@L3: jsr _cputc ; (23)
|
|
bra @L1 ; (26)
|
|
|
|
@L4: dec outdesc+7
|
|
bne @L2
|
|
rts
|
|
|
|
.else
|
|
|
|
@L1: dec outdesc+6
|
|
beq @L4
|
|
@L2: ldy tmp1 ; (3)
|
|
lda (ptr1),y ; (8)
|
|
iny ; (10)
|
|
bne @L3 ; (12)
|
|
inc ptr1+1 ; (17)
|
|
@L3: sty tmp1 ; (20)
|
|
jsr _cputc ; (26)
|
|
jmp @L1 ; (32)
|
|
|
|
@L4: dec outdesc+7
|
|
bne @L2
|
|
rts
|
|
|
|
.endif
|
|
|
|
; ----------------------------------------------------------------------------
|
|
; vcprintf - formatted console i/o
|
|
;
|
|
; int __fastcall__ vcprintf (const char* format, va_list ap)
|
|
; {
|
|
; struct outdesc d;
|
|
;
|
|
; /* Setup descriptor */
|
|
; d.fout = out;
|
|
;
|
|
; /* Do formatting and output */
|
|
; _printf (&d, format, ap);
|
|
;
|
|
; /* Return bytes written */
|
|
; return d.ccount;
|
|
; }
|
|
|
|
_vcprintf:
|
|
sta ptr1 ; Save ap
|
|
stx ptr1+1
|
|
|
|
; Setup the outdesc structure
|
|
|
|
lda #0
|
|
sta outdesc
|
|
sta outdesc+1 ; Clear ccount
|
|
|
|
; Get the format parameter and push it again
|
|
|
|
ldy #1
|
|
lda (sp),y
|
|
tax
|
|
dey
|
|
lda (sp),y
|
|
jsr pushax
|
|
|
|
; Replace the passed format parameter on the stack by &d - this creates
|
|
; exactly the stack frame _printf expects. Parameters will get dropped
|
|
; by _printf.
|
|
|
|
ldy #2 ; Low byte of d
|
|
lda #<outdesc
|
|
sta (sp),y
|
|
iny
|
|
lda #>outdesc
|
|
sta (sp),y
|
|
|
|
; Restore ap and call _printf
|
|
|
|
lda ptr1
|
|
ldx ptr1+1
|
|
jsr __printf
|
|
|
|
; Return the number of bytes written.
|
|
|
|
lda outdesc ; ccount
|
|
ldx outdesc+1
|
|
rts
|