mirror of
https://github.com/cc65/cc65.git
synced 2025-01-25 11:30:06 +00:00
Merge pull request #226 from greg-king5/pce-memset
Add a PC-Engine version of memset().
This commit is contained in:
commit
ced08a1f44
@ -8,9 +8,10 @@
|
|||||||
;
|
;
|
||||||
; void* __fastcall__ memcpy (void* dest, const void* src, size_t size);
|
; void* __fastcall__ memcpy (void* dest, const void* src, size_t size);
|
||||||
;
|
;
|
||||||
; NOTE: This function contains entry points for memmove, which will resort
|
; NOTE: This function contains entry points for memmove(), which resorts to
|
||||||
; to memcpy for an incrementing copy. Don't change this module without looking
|
; memcpy() for incrementing copies. The PC-Engine memset() uses this memcpy()
|
||||||
; at "pce/memmove.s"!
|
; to fill memory quickly. Don't change this module without looking at
|
||||||
|
; "pce/memmove.s" and "pce/memset.s"!
|
||||||
;
|
;
|
||||||
|
|
||||||
.export _memcpy
|
.export _memcpy
|
||||||
@ -34,25 +35,25 @@ _memcpy:
|
|||||||
jsr memcpy_getparams
|
jsr memcpy_getparams
|
||||||
|
|
||||||
memcpy_increment:
|
memcpy_increment:
|
||||||
ldy #$73 ; TII
|
ldy #$73 ; TII opcode
|
||||||
|
|
||||||
memcpy_transfer:
|
memcpy_transfer:
|
||||||
sty transfer+opcode
|
sty transfer + opcode
|
||||||
|
|
||||||
lda ptr1
|
lda ptr1
|
||||||
ldx ptr1+1
|
ldx ptr1+1
|
||||||
sta transfer+source
|
sta transfer + source
|
||||||
stx transfer+source+1
|
stx transfer + source+1
|
||||||
|
|
||||||
lda ptr2
|
lda ptr2
|
||||||
ldx ptr2+1
|
ldx ptr2+1
|
||||||
sta transfer+destination
|
sta transfer + destination
|
||||||
stx transfer+destination+1
|
stx transfer + destination+1
|
||||||
|
|
||||||
lda ptr3
|
lda ptr3
|
||||||
ldx ptr3+1
|
ldx ptr3+1
|
||||||
sta transfer+length
|
sta transfer + length
|
||||||
stx transfer+length+1
|
stx transfer + length+1
|
||||||
|
|
||||||
jmp transfer
|
jmp transfer
|
||||||
|
|
||||||
|
@ -59,5 +59,5 @@ _memmove:
|
|||||||
dec ptr2+1
|
dec ptr2+1
|
||||||
@L2: dec ptr2
|
@L2: dec ptr2
|
||||||
|
|
||||||
ldy #$C3 ; TDD
|
ldy #$C3 ; TDD opcode
|
||||||
jmp memcpy_transfer
|
jmp memcpy_transfer
|
||||||
|
67
libsrc/pce/memset.s
Normal file
67
libsrc/pce/memset.s
Normal file
@ -0,0 +1,67 @@
|
|||||||
|
;
|
||||||
|
; This file, instead of "common/memset.s", will be assembled for the pce
|
||||||
|
; target. This version is smaller and faster because it uses a HuC6280
|
||||||
|
; block-copy instruction.
|
||||||
|
;
|
||||||
|
; 1998-05-29, Ullrich von Bassewitz
|
||||||
|
; 2015-11-06, Greg King
|
||||||
|
;
|
||||||
|
; void* __fastcall__ _bzero (void* ptr, size_t n);
|
||||||
|
; void __fastcall__ bzero (void* ptr, size_t n);
|
||||||
|
; void* __fastcall__ memset (void* ptr, int c, size_t n);
|
||||||
|
;
|
||||||
|
; NOTE: bzero() will return its first argument, as memset() does. It is no
|
||||||
|
; problem to declare the return value as void, because it can be ignored.
|
||||||
|
; _bzero() (note the leading underscore) is declared with the proper
|
||||||
|
; return type because the compiler will replace memset() by _bzero() if
|
||||||
|
; the fill value is zero; and, the optimizer looks at the return type
|
||||||
|
; to see if the value in .XA is of any use.
|
||||||
|
;
|
||||||
|
; NOTE: This function uses entry points from "pce/memcpy.s"!
|
||||||
|
;
|
||||||
|
|
||||||
|
.export __bzero, _bzero, _memset
|
||||||
|
|
||||||
|
.import memcpy_getparams, memcpy_increment
|
||||||
|
.import pushax, popax
|
||||||
|
.importzp ptr1, ptr2, ptr3
|
||||||
|
|
||||||
|
.macpack longbranch
|
||||||
|
|
||||||
|
|
||||||
|
; ----------------------------------------------------------------------
|
||||||
|
__bzero:
|
||||||
|
_bzero: pha
|
||||||
|
cla ; fill with zeros
|
||||||
|
jsr pushax ; (high byte isn't important)
|
||||||
|
pla
|
||||||
|
|
||||||
|
_memset:
|
||||||
|
jsr memcpy_getparams
|
||||||
|
|
||||||
|
; The fill byte is put at the beginning of the buffer; then, the buffer is
|
||||||
|
; copied to a second buffer that starts one byte above the start of the first
|
||||||
|
; buffer. Normally, we would use memmove() to avoid trouble; but here, we
|
||||||
|
; exploit that overlap, by using memcpy(). Therefore, the fill value is copied
|
||||||
|
; from each byte to the next byte, all the way to the end of the buffer.
|
||||||
|
|
||||||
|
lda ptr1 ; get fill value
|
||||||
|
sta (ptr2)
|
||||||
|
|
||||||
|
lda ptr3 ; count first byte
|
||||||
|
bne @L3
|
||||||
|
dec ptr3+1
|
||||||
|
@L3: dec a
|
||||||
|
sta ptr3
|
||||||
|
ora ptr3+1
|
||||||
|
jeq popax ; return ptr. if no more bytes
|
||||||
|
|
||||||
|
lda ptr2 ; point to first buffer
|
||||||
|
ldx ptr2+1
|
||||||
|
sta ptr1
|
||||||
|
stx ptr1+1
|
||||||
|
inc ptr2 ; point to second buffer
|
||||||
|
bne @L2
|
||||||
|
inc ptr2+1
|
||||||
|
|
||||||
|
@L2: jmp memcpy_increment
|
Loading…
x
Reference in New Issue
Block a user