1
0
mirror of https://github.com/cc65/cc65.git synced 2025-01-25 11:30:06 +00:00

Merge pull request #226 from greg-king5/pce-memset

Add a PC-Engine version of memset().
This commit is contained in:
Oliver Schmidt 2015-11-07 11:37:36 +01:00
commit ced08a1f44
3 changed files with 80 additions and 12 deletions

View File

@ -8,9 +8,10 @@
; ;
; void* __fastcall__ memcpy (void* dest, const void* src, size_t size); ; void* __fastcall__ memcpy (void* dest, const void* src, size_t size);
; ;
; NOTE: This function contains entry points for memmove, which will resort ; NOTE: This function contains entry points for memmove(), which resorts to
; to memcpy for an incrementing copy. Don't change this module without looking ; memcpy() for incrementing copies. The PC-Engine memset() uses this memcpy()
; at "pce/memmove.s"! ; to fill memory quickly. Don't change this module without looking at
; "pce/memmove.s" and "pce/memset.s"!
; ;
.export _memcpy .export _memcpy
@ -34,25 +35,25 @@ _memcpy:
jsr memcpy_getparams jsr memcpy_getparams
memcpy_increment: memcpy_increment:
ldy #$73 ; TII ldy #$73 ; TII opcode
memcpy_transfer: memcpy_transfer:
sty transfer+opcode sty transfer + opcode
lda ptr1 lda ptr1
ldx ptr1+1 ldx ptr1+1
sta transfer+source sta transfer + source
stx transfer+source+1 stx transfer + source+1
lda ptr2 lda ptr2
ldx ptr2+1 ldx ptr2+1
sta transfer+destination sta transfer + destination
stx transfer+destination+1 stx transfer + destination+1
lda ptr3 lda ptr3
ldx ptr3+1 ldx ptr3+1
sta transfer+length sta transfer + length
stx transfer+length+1 stx transfer + length+1
jmp transfer jmp transfer

View File

@ -59,5 +59,5 @@ _memmove:
dec ptr2+1 dec ptr2+1
@L2: dec ptr2 @L2: dec ptr2
ldy #$C3 ; TDD ldy #$C3 ; TDD opcode
jmp memcpy_transfer jmp memcpy_transfer

67
libsrc/pce/memset.s Normal file
View File

@ -0,0 +1,67 @@
;
; This file, instead of "common/memset.s", will be assembled for the pce
; target. This version is smaller and faster because it uses a HuC6280
; block-copy instruction.
;
; 1998-05-29, Ullrich von Bassewitz
; 2015-11-06, Greg King
;
; void* __fastcall__ _bzero (void* ptr, size_t n);
; void __fastcall__ bzero (void* ptr, size_t n);
; void* __fastcall__ memset (void* ptr, int c, size_t n);
;
; NOTE: bzero() will return its first argument, as memset() does. It is no
; problem to declare the return value as void, because it can be ignored.
; _bzero() (note the leading underscore) is declared with the proper
; return type because the compiler will replace memset() by _bzero() if
; the fill value is zero; and, the optimizer looks at the return type
; to see if the value in .XA is of any use.
;
; NOTE: This function uses entry points from "pce/memcpy.s"!
;
.export __bzero, _bzero, _memset
.import memcpy_getparams, memcpy_increment
.import pushax, popax
.importzp ptr1, ptr2, ptr3
.macpack longbranch
; ----------------------------------------------------------------------
__bzero:
; ----------------------------------------------------------------------
; void* __fastcall__ _bzero (void* ptr, size_t n);
; void  __fastcall__ bzero  (void* ptr, size_t n);
;
; Entry: .XA = n; ptr is on the C stack.
; Turns the call into memset (ptr, 0, n) by pushing a zero fill value, then
; falls through into _memset.

_bzero: pha                     ; keep the low byte of n
        cla                     ; fill with zeros
        jsr     pushax          ; (high byte isn't important)
        pla                     ; .A = low byte of n again
                                ; NOTE(review): relies on pushax leaving .X
                                ; (high byte of n) intact -- as the original did

; ----------------------------------------------------------------------
; void* __fastcall__ memset (void* ptr, int c, size_t n);
;
; Entry: .XA = n; c and ptr are on the C stack.
; After memcpy_getparams (see "pce/memcpy.s"), this code uses:
;       ptr1 = fill value (only the low byte is used)
;       ptr2 = start of the buffer
;       ptr3 = number of bytes to fill
; The buffer pointer is returned through popax.

_memset:
        jsr     memcpy_getparams

; A size of zero must not touch memory at all.  Without this test, the fill
; byte would be stored one byte past an empty buffer; and, the count would wrap
; from $0000 to $FFFF, making the block transfer overwrite 65535 more bytes.

        lda     ptr3
        ora     ptr3+1
        jeq     popax           ; return ptr. if there is nothing to fill

; The fill byte is put at the beginning of the buffer; then, the buffer is
; copied to a second buffer that starts one byte above the start of the first
; buffer.  Normally, we would use memmove() to avoid trouble; but here, we
; exploit that overlap, by using memcpy().  Therefore, the fill value is copied
; from each byte to the next byte, all the way to the end of the buffer.

        lda     ptr1            ; get fill value
        sta     (ptr2)          ; seed the first byte of the buffer

        lda     ptr3            ; count first byte (ptr3 is non-zero here)
        bne     @L3
        dec     ptr3+1          ; borrow from the high byte
@L3:    dec     a
        sta     ptr3
        ora     ptr3+1
        jeq     popax           ; return ptr. if no more bytes

        lda     ptr2            ; point to first buffer
        ldx     ptr2+1
        sta     ptr1            ; source = start of buffer
        stx     ptr1+1
        inc     ptr2            ; point to second buffer
        bne     @L2
        inc     ptr2+1          ; carry into the high byte
@L2:    jmp     memcpy_increment ; incrementing block transfer of ptr3 bytes
                                ; (presumably it also returns ptr. -- see
                                ; "pce/memcpy.s")