|
|
MiNT 1.12
; Copyright 1992 Eric R. Smith ; Copyright 1993 Atari Corporation ; All rights reserved. ; ; quickmove(char *dst, char *src, long nbytes): ; quickly copy "nbytes" bytes from src to dst. Assumes that both ; src and dst are word aligned. ; ; quickmovb(char *dst, char *src, long nbytes): ; like memcpy, does unaligned too... does not check for overlap (memmove). ; TEXT XDEF _quickmove XDEF _quickmovb ;%ifdef OWN_LIB XDEF _bcopy XDEF __bcopy XDEF _memcpy _bcopy: __bcopy: move.l 8(sp),a0 ; get dst move.l 4(sp),a1 ; get src bra.s _quickmovb1 ;%endif ; for gcc >= 2.5.8 _memcpy: _quickmovb: move.l 4(sp),a0 ; get dst move.l 8(sp),a1 ; get src _quickmovb1: move.w a0,d0 move.w a1,d1 eor.w d1,d0 ; bit 0 == unaligned lsr.w #1,d0 ; ...now in x flag move.l 12(sp),d0 ; get nbytes beq Ldone roxr.w #1,d1 ; bit 0 == both odd, msb == unaligned bmi bytecopy ; unaligned, do the slow thing... bcc.s quickmov1 ; both even, ok subq.l #1,d0 ; both odd, can be fixed move.b (a1)+,(a0)+ bra.s quickmov1 _quickmove: move.l 4(sp),a0 ; get dst move.l 8(sp),a1 ; get src move.l 12(sp),d0 ; get nbytes quickmov1: move.w #$1ff,d1 and.w d0,d1 ; d1 = nbytes % 512 lsr.l #8,d0 ; lsr.l #1,d0 ; d0 = nbytes / 512 ble.s Leftover ; if <= 0, skip movem.l d1-d7/a2-a6,-(sp) ; save regs L1: movem.l (a1)+,d1-d7/a2-a6 ; read 12*4 = 48 bytes movem.l d1-d7/a2-a6,(a0) ; movem.l (a1)+,d1-d7/a2-a6 ; 2nd read movem.l d1-d7/a2-a6,48(a0) ; movem.l (a1)+,d1-d7/a2-a6 ; 3rd read movem.l d1-d7/a2-a6,96(a0) ; movem.l (a1)+,d1-d7/a2-a6 ; 4th read movem.l d1-d7/a2-a6,144(a0) ; movem.l (a1)+,d1-d7/a2-a6 ; 5th movem.l d1-d7/a2-a6,192(a0) ; movem.l (a1)+,d1-d7/a2-a6 ; 6th movem.l d1-d7/a2-a6,240(a0) ; movem.l (a1)+,d1-d7/a2-a6 ; 7th movem.l d1-d7/a2-a6,288(a0) ; movem.l (a1)+,d1-d7/a2-a6 ; 8th movem.l d1-d7/a2-a6,336(a0) ; movem.l (a1)+,d1-d7/a2-a6 ; 9th movem.l d1-d7/a2-a6,384(a0) ; movem.l (a1)+,d1-d7/a2-a6 ; 10th movem.l d1-d7/a2-a6,432(a0) ; At this point, 480 bytes done movem.l (a1)+,d1-d7/a2 ; Only do 32 more bytes movem.l d1-d7/a2,480(a0) ; for a total of 512 lea 512(a0),a0 subq.l #1,d0 bgt.s L1 movem.l (sp)+,d1-d7/a2-a6 ; pop registers Leftover: ; do the remaining bytes moveq.l #3,d0 and.w d1,d0 lsr.w #2,d1 subq.w #1,d1 ; prepare for dbra loop bmi.s L4done lsr.w #1,d1 bcc.s L23 L2l: move.l (a1)+,(a0)+ L23: move.l (a1)+,(a0)+ dbra d1,L2l L4done: subq.w #1,d0 ; prepare for dbra loop bmi.s Ldone L2: move.b (a1)+,(a0)+ dbra d0,L2 Ldone: rts ; return bytecopy: subq.l #1,d0 ; prepare for dbra loop move.l d0,d1 swap d1 L3: move.b (a1)+,(a0)+ dbra d0,L3 dbra d1,L3 rts ; return END
This archive runs on limited infrastructure. Preserving old code on modern bandwidth. Automated agents are requested to crawl responsibly.