Home | History | Annotate | Line # | Download | only in string
bcopy.S revision 1.1.16.2
      1  1.1.16.1  martin /*	$NetBSD: bcopy.S,v 1.1.16.2 2020/04/21 19:37:43 martin Exp $	*/
      2       1.1   scole 
      3       1.1   scole /*-
      4       1.1   scole  * Copyright (c) 2000 Doug Rabson
      5       1.1   scole  * All rights reserved.
      6       1.1   scole  *
      7       1.1   scole  * Redistribution and use in source and binary forms, with or without
      8       1.1   scole  * modification, are permitted provided that the following conditions
      9       1.1   scole  * are met:
     10       1.1   scole  * 1. Redistributions of source code must retain the above copyright
     11       1.1   scole  *    notice, this list of conditions and the following disclaimer.
     12       1.1   scole  * 2. Redistributions in binary form must reproduce the above copyright
     13       1.1   scole  *    notice, this list of conditions and the following disclaimer in the
     14       1.1   scole  *    documentation and/or other materials provided with the distribution.
     15       1.1   scole  *
     16       1.1   scole  * THIS SOFTWARE IS PROVIDED BY THE AUTHOR AND CONTRIBUTORS ``AS IS'' AND
     17       1.1   scole  * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
     18       1.1   scole  * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
     19       1.1   scole  * ARE DISCLAIMED.  IN NO EVENT SHALL THE AUTHOR OR CONTRIBUTORS BE LIABLE
     20       1.1   scole  * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
     21       1.1   scole  * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
     22       1.1   scole  * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
     23       1.1   scole  * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
     24       1.1   scole  * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
     25       1.1   scole  * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
     26       1.1   scole  * SUCH DAMAGE.
     27       1.1   scole  *
     28       1.1   scole  * __FBSDID("$FreeBSD: releng/10.1/lib/libc/ia64/string/bcopy.S 125669 2004-02-10 20:45:28Z cperciva $");
     29       1.1   scole  */
     30       1.1   scole 
     31       1.1   scole #include <machine/asm.h>
     32       1.1   scole 
     33       1.1   scole /*
     34       1.1   scole  * void
     35       1.1   scole  * bcopy(const void *src, void *dst, size_t len);
     36       1.1   scole  */
     37       1.1   scole 
     38       1.1   scole /*
     39       1.1   scole  * Not the fastest bcopy in the world.
     40       1.1   scole  */
     41       1.1   scole ENTRY(bcopy, 3)
     42       1.1   scole 	// Copy len bytes from src to dst.  in0 = src, in1 = dst, in2 = len; r14, r15, p6, p7 are temporaries.
     43       1.1   scole 	cmp.le	p6,p0=in2,r0			// bail if len <= 0 (cmp.le is a signed compare)
     44       1.1   scole (p6)	br.ret.spnt.few rp			// nothing to copy
     45       1.1   scole 	// NOTE(review): a len with the top bit set is negative to cmp.le and returns above -- confirm intended for size_t.
     46       1.1   scole 	sub	r14=in1,in0 ;;			// r14 = dst - src (check for overlap)
     47       1.1   scole 	cmp.ltu	p6,p0=r14,in2			// unsigned dst-src < len: dst starts inside [src, src+len)
     48       1.1   scole (p6)	br.cond.spnt.few 5f			// then copy backwards from the end instead
     49       1.1   scole 	// Forward copy.  Compare the low three address bits of src and dst to choose a loop.
     50       1.1   scole 	extr.u	r14=in0,0,3			// src & 7
     51       1.1   scole 	extr.u	r15=in1,0,3 ;;			// dst & 7
     52       1.1   scole 	cmp.eq	p6,p0=r14,r15			// same alignment?
     53       1.1   scole (p6)	br.cond.spnt.few 2f			// branch if same alignment
     54       1.1   scole 	// Alignments differ (also the tail path from 4:): one byte per iteration; in2 must be non-zero on entry.
     55       1.1   scole 1:	ld1	r14=[in0],1 ;;			// copy bytewise: r14 = *src++
     56       1.1   scole 	st1	[in1]=r14,1			// *dst++ = r14
     57       1.1   scole 	add	in2=-1,in2 ;;			// len--
     58       1.1   scole 	cmp.ne	p6,p0=r0,in2			// bytes left?
     59       1.1   scole (p6)	br.cond.dptk.few 1b			// loop
     60       1.1   scole 	br.ret.sptk.few rp			// done
     61       1.1   scole 	// Same alignment: r14 still holds src & 7 here.
     62       1.1   scole 2:	cmp.eq	p6,p0=r14,r0			// aligned?
     63       1.1   scole (p6)	br.cond.sptk.few 4f			// yes: straight to the word loop
     64       1.1   scole 	// Copy leading bytes until src (and dst, which has the same low bits) is 8-byte aligned or len runs out.
     65       1.1   scole 3:	ld1	r14=[in0],1 ;;			// copy bytewise
     66       1.1   scole 	st1	[in1]=r14,1
     67       1.1   scole 	extr.u	r15=in0,0,3			// src & 7 (in0 was already advanced by the ld1 above)
     68       1.1   scole 	add	in2=-1,in2 ;;			// len--
     69       1.1   scole 	cmp.eq	p6,p0=r0,in2			// done?
     70       1.1   scole 	cmp.eq	p7,p0=r0,r15 ;;			// aligned now?
     71       1.1   scole (p6)	br.ret.spnt.few rp			// return if done
     72       1.1   scole (p7)	br.cond.spnt.few 4f			// go to main copy
     73       1.1   scole 	br.cond.sptk.few 3b			// more bytes to copy
     74       1.1   scole 
     75       1.1   scole 	// At this point, in2 is non-zero and src and dst are both 8-byte aligned
     76       1.1   scole 
     77       1.1   scole 4:	mov	r14=8 ;;			// size of one ld8/st8 transfer
     78       1.1   scole 	cmp.ltu	p6,p0=in2,r14 ;;		// len < 8?
     79       1.1   scole (p6)	br.cond.spnt.few 1b			// byte copy the end (in2 is 1..7 here)
     80       1.1   scole 	ld8	r15=[in0],8 ;;			// copy word
     81       1.1   scole 	st8	[in1]=r15,8
     82       1.1   scole 	add	in2=-8,in2 ;;			// len -= 8
     83       1.1   scole 	cmp.ne	p6,p0=r0,in2			// more to copy?
     84       1.1   scole (p6)	br.cond.spnt.few 4b			// again
     85       1.1   scole 	// NOTE(review): the back-edges to 4: and 6: are hinted .spnt while loop 1: uses .dptk -- hint only; confirm intent.
     86       1.1   scole 	br.ret.sptk.few rp			// return
     87       1.1   scole 
     88       1.1   scole 	// Don't bother optimising overlap case: copy bytewise from the last byte down to the first
     89       1.1   scole 
     90       1.1   scole 5:	add	in0=in0,in2			// src += len
     91       1.1   scole 	add	in1=in1,in2 ;;			// dst += len
     92       1.1   scole 	add	in0=-1,in0			// src now addresses the last source byte
     93       1.1   scole 	add	in1=-1,in1 ;;			// dst now addresses the last destination byte
     94       1.1   scole 
     95       1.1   scole 6:	ld1	r14=[in0],-1 ;;			// r14 = *src--
     96       1.1   scole 	st1	[in1]=r14,-1			// *dst-- = r14
     97       1.1   scole 	add	in2=-1,in2 ;;			// len--
     98       1.1   scole 	cmp.ne	p6,p0=r0,in2			// bytes left?
     99       1.1   scole (p6)	br.cond.spnt.few 6b			// loop
    100       1.1   scole 
    101       1.1   scole 	br.ret.sptk.few rp			// done
    102       1.1   scole END(bcopy)
    103