Home | History | Annotate | Line # | Download | only in string
      1  1.6   mlelstv /*	$NetBSD: memcpy_xscale.S,v 1.6 2023/01/19 18:03:03 mlelstv Exp $	*/
      2  1.1  christos 
      3  1.1  christos /*
      4  1.1  christos  * Copyright 2003 Wasabi Systems, Inc.
      5  1.1  christos  * All rights reserved.
      6  1.1  christos  *
      7  1.1  christos  * Written by Steve C. Woodford for Wasabi Systems, Inc.
      8  1.1  christos  *
      9  1.1  christos  * Redistribution and use in source and binary forms, with or without
     10  1.1  christos  * modification, are permitted provided that the following conditions
     11  1.1  christos  * are met:
     12  1.1  christos  * 1. Redistributions of source code must retain the above copyright
     13  1.1  christos  *    notice, this list of conditions and the following disclaimer.
     14  1.1  christos  * 2. Redistributions in binary form must reproduce the above copyright
     15  1.1  christos  *    notice, this list of conditions and the following disclaimer in the
     16  1.1  christos  *    documentation and/or other materials provided with the distribution.
     17  1.1  christos  * 3. All advertising materials mentioning features or use of this software
     18  1.1  christos  *    must display the following acknowledgement:
     19  1.1  christos  *      This product includes software developed for the NetBSD Project by
     20  1.1  christos  *      Wasabi Systems, Inc.
     21  1.1  christos  * 4. The name of Wasabi Systems, Inc. may not be used to endorse
     22  1.1  christos  *    or promote products derived from this software without specific prior
     23  1.1  christos  *    written permission.
     24  1.1  christos  *
     25  1.1  christos  * THIS SOFTWARE IS PROVIDED BY WASABI SYSTEMS, INC. ``AS IS'' AND
     26  1.1  christos  * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED
     27  1.1  christos  * TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR
     28  1.1  christos  * PURPOSE ARE DISCLAIMED.  IN NO EVENT SHALL WASABI SYSTEMS, INC
     29  1.1  christos  * BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
     30  1.1  christos  * CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
     31  1.1  christos  * SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS
     32  1.1  christos  * INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN
     33  1.1  christos  * CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE)
     34  1.1  christos  * ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE
     35  1.1  christos  * POSSIBILITY OF SUCH DAMAGE.
     36  1.1  christos  */
     37  1.1  christos 
     38  1.1  christos #include <machine/asm.h>
     39  1.1  christos 
     40  1.1  christos /* LINTSTUB: Func: void *memcpy(void *dst, const void *src, size_t len) */
     41  1.1  christos ENTRY(memcpy)
     42  1.1  christos 	pld	[r1]
     43  1.1  christos 	cmp	r2, #0x0c
     44  1.6   mlelstv 	bls	.Lmemcpy_short		/* <= 12 bytes */
     45  1.1  christos 	mov	r3, r0			/* We must not clobber r0 */
     46  1.1  christos 
     47  1.1  christos 	/* Word-align the destination buffer */
     48  1.1  christos 	ands	ip, r3, #0x03		/* Already word aligned? */
     49  1.1  christos 	beq	.Lmemcpy_wordaligned	/* Yup */
     50  1.1  christos 	cmp	ip, #0x02
     51  1.1  christos 	ldrb	ip, [r1], #0x01
     52  1.1  christos 	sub	r2, r2, #0x01
     53  1.1  christos 	strb	ip, [r3], #0x01
     54  1.6   mlelstv 	ldrbls	ip, [r1], #0x01
     55  1.6   mlelstv 	subls	r2, r2, #0x01
     56  1.6   mlelstv 	strbls	ip, [r3], #0x01
     57  1.6   mlelstv 	ldrblo	ip, [r1], #0x01
     58  1.6   mlelstv 	sublo	r2, r2, #0x01
     59  1.6   mlelstv 	strblo	ip, [r3], #0x01
     60  1.1  christos 
     61  1.1  christos 	/* Destination buffer is now word aligned */
     62  1.1  christos .Lmemcpy_wordaligned:
     63  1.1  christos 	ands	ip, r1, #0x03		/* Is src also word-aligned? */
     64  1.1  christos 	bne	.Lmemcpy_bad_align	/* Nope. Things just got bad */
     65  1.1  christos 
     66  1.1  christos 	/* Quad-align the destination buffer */
     67  1.1  christos 	tst	r3, #0x07		/* Already quad aligned? */
     68  1.1  christos 	ldrne	ip, [r1], #0x04
     69  1.3      matt 	push	{r4-r9}		/* Free up some registers */
     70  1.1  christos 	subne	r2, r2, #0x04
     71  1.1  christos 	strne	ip, [r3], #0x04
     72  1.1  christos 
     73  1.1  christos 	/* Destination buffer quad aligned, source is at least word aligned */
     74  1.1  christos 	subs	r2, r2, #0x80
     75  1.6   mlelstv 	blo	.Lmemcpy_w_lessthan128
     76  1.1  christos 
     77  1.1  christos 	/* Copy 128 bytes at a time */
     78  1.1  christos .Lmemcpy_w_loop128:
     79  1.1  christos 	ldr	r4, [r1], #0x04		/* LD:00-03 */
     80  1.1  christos 	ldr	r5, [r1], #0x04		/* LD:04-07 */
     81  1.1  christos 	pld	[r1, #0x18]		/* Prefetch 0x20 */
     82  1.1  christos 	ldr	r6, [r1], #0x04		/* LD:08-0b */
     83  1.1  christos 	ldr	r7, [r1], #0x04		/* LD:0c-0f */
     84  1.1  christos 	ldr	r8, [r1], #0x04		/* LD:10-13 */
     85  1.1  christos 	ldr	r9, [r1], #0x04		/* LD:14-17 */
     86  1.5     joerg 	strd	r4, r5, [r3], #0x08	/* ST:00-07 */
     87  1.1  christos 	ldr	r4, [r1], #0x04		/* LD:18-1b */
     88  1.1  christos 	ldr	r5, [r1], #0x04		/* LD:1c-1f */
     89  1.5     joerg 	strd	r6, r7, [r3], #0x08	/* ST:08-0f */
     90  1.1  christos 	ldr	r6, [r1], #0x04		/* LD:20-23 */
     91  1.1  christos 	ldr	r7, [r1], #0x04		/* LD:24-27 */
     92  1.1  christos 	pld	[r1, #0x18]		/* Prefetch 0x40 */
     93  1.5     joerg 	strd	r8, r9, [r3], #0x08	/* ST:10-17 */
     94  1.1  christos 	ldr	r8, [r1], #0x04		/* LD:28-2b */
     95  1.1  christos 	ldr	r9, [r1], #0x04		/* LD:2c-2f */
     96  1.5     joerg 	strd	r4, r5, [r3], #0x08	/* ST:18-1f */
     97  1.1  christos 	ldr	r4, [r1], #0x04		/* LD:30-33 */
     98  1.1  christos 	ldr	r5, [r1], #0x04		/* LD:34-37 */
     99  1.5     joerg 	strd	r6, r7, [r3], #0x08	/* ST:20-27 */
    100  1.1  christos 	ldr	r6, [r1], #0x04		/* LD:38-3b */
    101  1.1  christos 	ldr	r7, [r1], #0x04		/* LD:3c-3f */
    102  1.5     joerg 	strd	r8, r9, [r3], #0x08	/* ST:28-2f */
    103  1.1  christos 	ldr	r8, [r1], #0x04		/* LD:40-43 */
    104  1.1  christos 	ldr	r9, [r1], #0x04		/* LD:44-47 */
    105  1.1  christos 	pld	[r1, #0x18]		/* Prefetch 0x60 */
    106  1.5     joerg 	strd	r4, r5, [r3], #0x08	/* ST:30-37 */
    107  1.1  christos 	ldr	r4, [r1], #0x04		/* LD:48-4b */
    108  1.1  christos 	ldr	r5, [r1], #0x04		/* LD:4c-4f */
    109  1.5     joerg 	strd	r6, r7, [r3], #0x08	/* ST:38-3f */
    110  1.1  christos 	ldr	r6, [r1], #0x04		/* LD:50-53 */
    111  1.1  christos 	ldr	r7, [r1], #0x04		/* LD:54-57 */
    112  1.5     joerg 	strd	r8, r9, [r3], #0x08	/* ST:40-47 */
    113  1.1  christos 	ldr	r8, [r1], #0x04		/* LD:58-5b */
    114  1.1  christos 	ldr	r9, [r1], #0x04		/* LD:5c-5f */
    115  1.5     joerg 	strd	r4, r5, [r3], #0x08	/* ST:48-4f */
    116  1.1  christos 	ldr	r4, [r1], #0x04		/* LD:60-63 */
    117  1.1  christos 	ldr	r5, [r1], #0x04		/* LD:64-67 */
    118  1.1  christos 	pld	[r1, #0x18]		/* Prefetch 0x80 */
    119  1.5     joerg 	strd	r6, r7, [r3], #0x08	/* ST:50-57 */
    120  1.1  christos 	ldr	r6, [r1], #0x04		/* LD:68-6b */
    121  1.1  christos 	ldr	r7, [r1], #0x04		/* LD:6c-6f */
    122  1.5     joerg 	strd	r8, r9, [r3], #0x08	/* ST:58-5f */
    123  1.1  christos 	ldr	r8, [r1], #0x04		/* LD:70-73 */
    124  1.1  christos 	ldr	r9, [r1], #0x04		/* LD:74-77 */
    125  1.5     joerg 	strd	r4, r5, [r3], #0x08	/* ST:60-67 */
    126  1.1  christos 	ldr	r4, [r1], #0x04		/* LD:78-7b */
    127  1.1  christos 	ldr	r5, [r1], #0x04		/* LD:7c-7f */
    128  1.5     joerg 	strd	r6, r7, [r3], #0x08	/* ST:68-6f */
    129  1.5     joerg 	strd	r8, r9, [r3], #0x08	/* ST:70-77 */
    130  1.1  christos 	subs	r2, r2, #0x80
    131  1.5     joerg 	strd	r4, r5, [r3], #0x08	/* ST:78-7f */
    132  1.6   mlelstv 	bhs	.Lmemcpy_w_loop128
    133  1.1  christos 
    134  1.1  christos .Lmemcpy_w_lessthan128:
    135  1.1  christos 	adds	r2, r2, #0x80		/* Adjust for extra sub */
    136  1.3      matt 	popeq	{r4-r9}
    137  1.3      matt 	RETc(eq)			/* Return now if done */
    138  1.1  christos 	subs	r2, r2, #0x20
    139  1.6   mlelstv 	blo	.Lmemcpy_w_lessthan32
    140  1.1  christos 
    141  1.1  christos 	/* Copy 32 bytes at a time */
    142  1.1  christos .Lmemcpy_w_loop32:
    143  1.1  christos 	ldr	r4, [r1], #0x04
    144  1.1  christos 	ldr	r5, [r1], #0x04
    145  1.1  christos 	pld	[r1, #0x18]
    146  1.1  christos 	ldr	r6, [r1], #0x04
    147  1.1  christos 	ldr	r7, [r1], #0x04
    148  1.1  christos 	ldr	r8, [r1], #0x04
    149  1.1  christos 	ldr	r9, [r1], #0x04
    150  1.5     joerg 	strd	r4, r5, [r3], #0x08
    151  1.1  christos 	ldr	r4, [r1], #0x04
    152  1.1  christos 	ldr	r5, [r1], #0x04
    153  1.5     joerg 	strd	r6, r7, [r3], #0x08
    154  1.5     joerg 	strd	r8, r9, [r3], #0x08
    155  1.1  christos 	subs	r2, r2, #0x20
    156  1.5     joerg 	strd	r4, r5, [r3], #0x08
    157  1.6   mlelstv 	bhs	.Lmemcpy_w_loop32
    158  1.1  christos 
    159  1.1  christos .Lmemcpy_w_lessthan32:
    160  1.1  christos 	adds	r2, r2, #0x20		/* Adjust for extra sub */
    161  1.3      matt 	popeq	{r4-r9}
    162  1.3      matt 	RETc(eq)			/* Return now if done */
    163  1.1  christos 
    164  1.1  christos 	and	r4, r2, #0x18
    165  1.1  christos 	rsbs	r4, r4, #0x18
    166  1.1  christos 	addne	pc, pc, r4, lsl #1
    167  1.1  christos 	nop
    168  1.1  christos 
    169  1.1  christos 	/* At least 24 bytes remaining */
    170  1.1  christos 	ldr	r4, [r1], #0x04
    171  1.1  christos 	ldr	r5, [r1], #0x04
    172  1.1  christos 	sub	r2, r2, #0x08
    173  1.5     joerg 	strd	r4, r5, [r3], #0x08
    174  1.1  christos 
    175  1.1  christos 	/* At least 16 bytes remaining */
    176  1.1  christos 	ldr	r4, [r1], #0x04
    177  1.1  christos 	ldr	r5, [r1], #0x04
    178  1.1  christos 	sub	r2, r2, #0x08
    179  1.5     joerg 	strd	r4, r5, [r3], #0x08
    180  1.1  christos 
    181  1.1  christos 	/* At least 8 bytes remaining */
    182  1.1  christos 	ldr	r4, [r1], #0x04
    183  1.1  christos 	ldr	r5, [r1], #0x04
    184  1.1  christos 	subs	r2, r2, #0x08
    185  1.5     joerg 	strd	r4, r5, [r3], #0x08
    186  1.1  christos 
    187  1.1  christos 	/* Less than 8 bytes remaining */
    188  1.3      matt 	pop	{r4-r9}
    189  1.3      matt 	RETc(eq)			/* Return now if done */
    190  1.1  christos 	subs	r2, r2, #0x04
    191  1.6   mlelstv 	ldrhs	ip, [r1], #0x04
    192  1.6   mlelstv 	strhs	ip, [r3], #0x04
    193  1.3      matt 	RETc(eq)			/* Return now if done */
    194  1.6   mlelstv 	addlo	r2, r2, #0x04
    195  1.1  christos 	ldrb	ip, [r1], #0x01
    196  1.1  christos 	cmp	r2, #0x02
    197  1.6   mlelstv 	ldrbhs	r2, [r1], #0x01
    198  1.1  christos 	strb	ip, [r3], #0x01
    199  1.6   mlelstv 	ldrbhi	ip, [r1]
    200  1.6   mlelstv 	strbhs	r2, [r3], #0x01
    201  1.6   mlelstv 	strbhi	ip, [r3]
    202  1.3      matt 	RET
    203  1.1  christos 
    204  1.1  christos 
    205  1.1  christos /*
    206  1.1  christos  * At this point, it has not been possible to word align both buffers.
    207  1.1  christos  * The destination buffer is word aligned, but the source buffer is not.
    208  1.1  christos  */
    209  1.1  christos .Lmemcpy_bad_align:
    210  1.3      matt 	push	{r4-r7}
    211  1.1  christos 	bic	r1, r1, #0x03
    212  1.1  christos 	cmp	ip, #2
    213  1.1  christos 	ldr	ip, [r1], #0x04
    214  1.6   mlelstv 	bhi	.Lmemcpy_bad3
    215  1.1  christos 	beq	.Lmemcpy_bad2
    216  1.1  christos 	b	.Lmemcpy_bad1
    217  1.1  christos 
    218  1.1  christos .Lmemcpy_bad1_loop16:
    219  1.1  christos #ifdef __ARMEB__
    220  1.1  christos 	mov	r4, ip, lsl #8
    221  1.1  christos #else
    222  1.1  christos 	mov	r4, ip, lsr #8
    223  1.1  christos #endif
    224  1.1  christos 	ldr	r5, [r1], #0x04
    225  1.1  christos 	pld	[r1, #0x018]
    226  1.1  christos 	ldr	r6, [r1], #0x04
    227  1.1  christos 	ldr	r7, [r1], #0x04
    228  1.1  christos 	ldr	ip, [r1], #0x04
    229  1.1  christos #ifdef __ARMEB__
    230  1.1  christos 	orr	r4, r4, r5, lsr #24
    231  1.1  christos 	mov	r5, r5, lsl #8
    232  1.1  christos 	orr	r5, r5, r6, lsr #24
    233  1.1  christos 	mov	r6, r6, lsl #8
    234  1.1  christos 	orr	r6, r6, r7, lsr #24
    235  1.1  christos 	mov	r7, r7, lsl #8
    236  1.1  christos 	orr	r7, r7, ip, lsr #24
    237  1.1  christos #else
    238  1.1  christos 	orr	r4, r4, r5, lsl #24
    239  1.1  christos 	mov	r5, r5, lsr #8
    240  1.1  christos 	orr	r5, r5, r6, lsl #24
    241  1.1  christos 	mov	r6, r6, lsr #8
    242  1.1  christos 	orr	r6, r6, r7, lsl #24
    243  1.1  christos 	mov	r7, r7, lsr #8
    244  1.1  christos 	orr	r7, r7, ip, lsl #24
    245  1.1  christos #endif
    246  1.1  christos 	str	r4, [r3], #0x04
    247  1.1  christos 	str	r5, [r3], #0x04
    248  1.1  christos 	str	r6, [r3], #0x04
    249  1.1  christos 	str	r7, [r3], #0x04
    250  1.2       scw 	sub	r2, r2, #0x10
    251  1.2       scw 
    252  1.1  christos .Lmemcpy_bad1:
    253  1.2       scw 	cmp	r2, #0x20
    254  1.6   mlelstv 	bhs	.Lmemcpy_bad1_loop16
    255  1.2       scw 	cmp	r2, #0x10
    256  1.6   mlelstv 	blo	.Lmemcpy_bad1_loop16_short
    257  1.1  christos 
    258  1.2       scw 	/* copy last 16 bytes (without preload) */
    259  1.2       scw #ifdef __ARMEB__
    260  1.2       scw 	mov	r4, ip, lsl #8
    261  1.2       scw #else
    262  1.2       scw 	mov	r4, ip, lsr #8
    263  1.2       scw #endif
    264  1.2       scw 	ldr	r5, [r1], #0x04
    265  1.2       scw 	ldr	r6, [r1], #0x04
    266  1.2       scw 	ldr	r7, [r1], #0x04
    267  1.2       scw 	ldr	ip, [r1], #0x04
    268  1.2       scw #ifdef __ARMEB__
    269  1.2       scw 	orr	r4, r4, r5, lsr #24
    270  1.2       scw 	mov	r5, r5, lsl #8
    271  1.2       scw 	orr	r5, r5, r6, lsr #24
    272  1.2       scw 	mov	r6, r6, lsl #8
    273  1.2       scw 	orr	r6, r6, r7, lsr #24
    274  1.2       scw 	mov	r7, r7, lsl #8
    275  1.2       scw 	orr	r7, r7, ip, lsr #24
    276  1.2       scw #else
    277  1.2       scw 	orr	r4, r4, r5, lsl #24
    278  1.2       scw 	mov	r5, r5, lsr #8
    279  1.2       scw 	orr	r5, r5, r6, lsl #24
    280  1.2       scw 	mov	r6, r6, lsr #8
    281  1.2       scw 	orr	r6, r6, r7, lsl #24
    282  1.2       scw 	mov	r7, r7, lsr #8
    283  1.2       scw 	orr	r7, r7, ip, lsl #24
    284  1.2       scw #endif
    285  1.2       scw 	str	r4, [r3], #0x04
    286  1.2       scw 	str	r5, [r3], #0x04
    287  1.2       scw 	str	r6, [r3], #0x04
    288  1.2       scw 	str	r7, [r3], #0x04
    289  1.2       scw 	subs	r2, r2, #0x10
    290  1.3      matt 	popeq	{r4-r7}
    291  1.3      matt 	RETc(eq)			/* Return now if done */
    292  1.2       scw 
    293  1.2       scw .Lmemcpy_bad1_loop16_short:
    294  1.1  christos 	subs	r2, r2, #0x04
    295  1.6   mlelstv 	sublo	r1, r1, #0x03
    296  1.6   mlelstv 	blo	.Lmemcpy_bad_done
    297  1.1  christos 
    298  1.1  christos .Lmemcpy_bad1_loop4:
    299  1.1  christos #ifdef __ARMEB__
    300  1.1  christos 	mov	r4, ip, lsl #8
    301  1.1  christos #else
    302  1.1  christos 	mov	r4, ip, lsr #8
    303  1.1  christos #endif
    304  1.1  christos 	ldr	ip, [r1], #0x04
    305  1.1  christos 	subs	r2, r2, #0x04
    306  1.1  christos #ifdef __ARMEB__
    307  1.1  christos 	orr	r4, r4, ip, lsr #24
    308  1.1  christos #else
    309  1.1  christos 	orr	r4, r4, ip, lsl #24
    310  1.1  christos #endif
    311  1.1  christos 	str	r4, [r3], #0x04
    312  1.6   mlelstv 	bhs	.Lmemcpy_bad1_loop4
    313  1.1  christos 	sub	r1, r1, #0x03
    314  1.1  christos 	b	.Lmemcpy_bad_done
    315  1.1  christos 
    316  1.1  christos .Lmemcpy_bad2_loop16:
    317  1.1  christos #ifdef __ARMEB__
    318  1.1  christos 	mov	r4, ip, lsl #16
    319  1.1  christos #else
    320  1.1  christos 	mov	r4, ip, lsr #16
    321  1.1  christos #endif
    322  1.1  christos 	ldr	r5, [r1], #0x04
    323  1.1  christos 	pld	[r1, #0x018]
    324  1.1  christos 	ldr	r6, [r1], #0x04
    325  1.1  christos 	ldr	r7, [r1], #0x04
    326  1.1  christos 	ldr	ip, [r1], #0x04
    327  1.1  christos #ifdef __ARMEB__
    328  1.1  christos 	orr	r4, r4, r5, lsr #16
    329  1.1  christos 	mov	r5, r5, lsl #16
    330  1.1  christos 	orr	r5, r5, r6, lsr #16
    331  1.1  christos 	mov	r6, r6, lsl #16
    332  1.1  christos 	orr	r6, r6, r7, lsr #16
    333  1.1  christos 	mov	r7, r7, lsl #16
    334  1.1  christos 	orr	r7, r7, ip, lsr #16
    335  1.1  christos #else
    336  1.1  christos 	orr	r4, r4, r5, lsl #16
    337  1.1  christos 	mov	r5, r5, lsr #16
    338  1.1  christos 	orr	r5, r5, r6, lsl #16
    339  1.1  christos 	mov	r6, r6, lsr #16
    340  1.1  christos 	orr	r6, r6, r7, lsl #16
    341  1.1  christos 	mov	r7, r7, lsr #16
    342  1.1  christos 	orr	r7, r7, ip, lsl #16
    343  1.1  christos #endif
    344  1.1  christos 	str	r4, [r3], #0x04
    345  1.1  christos 	str	r5, [r3], #0x04
    346  1.1  christos 	str	r6, [r3], #0x04
    347  1.1  christos 	str	r7, [r3], #0x04
    348  1.2       scw 	sub	r2, r2, #0x10
    349  1.2       scw 
    350  1.1  christos .Lmemcpy_bad2:
    351  1.2       scw 	cmp	r2, #0x20
    352  1.6   mlelstv 	bhs	.Lmemcpy_bad2_loop16
    353  1.2       scw 	cmp	r2, #0x10
    354  1.6   mlelstv 	blo	.Lmemcpy_bad2_loop16_short
    355  1.1  christos 
    356  1.2       scw 	/* copy last 16 bytes (without preload) */
    357  1.2       scw #ifdef __ARMEB__
    358  1.2       scw 	mov	r4, ip, lsl #16
    359  1.2       scw #else
    360  1.2       scw 	mov	r4, ip, lsr #16
    361  1.2       scw #endif
    362  1.2       scw 	ldr	r5, [r1], #0x04
    363  1.2       scw 	ldr	r6, [r1], #0x04
    364  1.2       scw 	ldr	r7, [r1], #0x04
    365  1.2       scw 	ldr	ip, [r1], #0x04
    366  1.2       scw #ifdef __ARMEB__
    367  1.2       scw 	orr	r4, r4, r5, lsr #16
    368  1.2       scw 	mov	r5, r5, lsl #16
    369  1.2       scw 	orr	r5, r5, r6, lsr #16
    370  1.2       scw 	mov	r6, r6, lsl #16
    371  1.2       scw 	orr	r6, r6, r7, lsr #16
    372  1.2       scw 	mov	r7, r7, lsl #16
    373  1.2       scw 	orr	r7, r7, ip, lsr #16
    374  1.2       scw #else
    375  1.2       scw 	orr	r4, r4, r5, lsl #16
    376  1.2       scw 	mov	r5, r5, lsr #16
    377  1.2       scw 	orr	r5, r5, r6, lsl #16
    378  1.2       scw 	mov	r6, r6, lsr #16
    379  1.2       scw 	orr	r6, r6, r7, lsl #16
    380  1.2       scw 	mov	r7, r7, lsr #16
    381  1.2       scw 	orr	r7, r7, ip, lsl #16
    382  1.2       scw #endif
    383  1.2       scw 	str	r4, [r3], #0x04
    384  1.2       scw 	str	r5, [r3], #0x04
    385  1.2       scw 	str	r6, [r3], #0x04
    386  1.2       scw 	str	r7, [r3], #0x04
    387  1.2       scw 	subs	r2, r2, #0x10
    388  1.3      matt 	popeq	{r4-r7}
    389  1.3      matt 	RETc(eq)			/* Return now if done */
    390  1.2       scw 
    391  1.2       scw .Lmemcpy_bad2_loop16_short:
    392  1.1  christos 	subs	r2, r2, #0x04
    393  1.6   mlelstv 	sublo	r1, r1, #0x02
    394  1.6   mlelstv 	blo	.Lmemcpy_bad_done
    395  1.1  christos 
    396  1.1  christos .Lmemcpy_bad2_loop4:
    397  1.1  christos #ifdef __ARMEB__
    398  1.1  christos 	mov	r4, ip, lsl #16
    399  1.1  christos #else
    400  1.1  christos 	mov	r4, ip, lsr #16
    401  1.1  christos #endif
    402  1.1  christos 	ldr	ip, [r1], #0x04
    403  1.1  christos 	subs	r2, r2, #0x04
    404  1.1  christos #ifdef __ARMEB__
    405  1.1  christos 	orr	r4, r4, ip, lsr #16
    406  1.1  christos #else
    407  1.1  christos 	orr	r4, r4, ip, lsl #16
    408  1.1  christos #endif
    409  1.1  christos 	str	r4, [r3], #0x04
    410  1.6   mlelstv 	bhs	.Lmemcpy_bad2_loop4
    411  1.1  christos 	sub	r1, r1, #0x02
    412  1.1  christos 	b	.Lmemcpy_bad_done
    413  1.1  christos 
    414  1.1  christos .Lmemcpy_bad3_loop16:
    415  1.1  christos #ifdef __ARMEB__
    416  1.1  christos 	mov	r4, ip, lsl #24
    417  1.1  christos #else
    418  1.1  christos 	mov	r4, ip, lsr #24
    419  1.1  christos #endif
    420  1.1  christos 	ldr	r5, [r1], #0x04
    421  1.1  christos 	pld	[r1, #0x018]
    422  1.1  christos 	ldr	r6, [r1], #0x04
    423  1.1  christos 	ldr	r7, [r1], #0x04
    424  1.1  christos 	ldr	ip, [r1], #0x04
    425  1.1  christos #ifdef __ARMEB__
    426  1.1  christos 	orr	r4, r4, r5, lsr #8
    427  1.1  christos 	mov	r5, r5, lsl #24
    428  1.1  christos 	orr	r5, r5, r6, lsr #8
    429  1.1  christos 	mov	r6, r6, lsl #24
    430  1.1  christos 	orr	r6, r6, r7, lsr #8
    431  1.1  christos 	mov	r7, r7, lsl #24
    432  1.1  christos 	orr	r7, r7, ip, lsr #8
    433  1.1  christos #else
    434  1.1  christos 	orr	r4, r4, r5, lsl #8
    435  1.1  christos 	mov	r5, r5, lsr #24
    436  1.1  christos 	orr	r5, r5, r6, lsl #8
    437  1.1  christos 	mov	r6, r6, lsr #24
    438  1.1  christos 	orr	r6, r6, r7, lsl #8
    439  1.1  christos 	mov	r7, r7, lsr #24
    440  1.1  christos 	orr	r7, r7, ip, lsl #8
    441  1.1  christos #endif
    442  1.1  christos 	str	r4, [r3], #0x04
    443  1.1  christos 	str	r5, [r3], #0x04
    444  1.1  christos 	str	r6, [r3], #0x04
    445  1.1  christos 	str	r7, [r3], #0x04
    446  1.2       scw 	sub	r2, r2, #0x10
    447  1.2       scw 
    448  1.1  christos .Lmemcpy_bad3:
    449  1.2       scw 	cmp	r2, #0x20
    450  1.6   mlelstv 	bhs	.Lmemcpy_bad3_loop16
    451  1.2       scw 	cmp	r2, #0x10
    452  1.6   mlelstv 	blo	.Lmemcpy_bad3_loop16_short
    453  1.1  christos 
    454  1.2       scw 	/* copy last 16 bytes (without preload) */
    455  1.2       scw #ifdef __ARMEB__
    456  1.2       scw 	mov	r4, ip, lsl #24
    457  1.2       scw #else
    458  1.2       scw 	mov	r4, ip, lsr #24
    459  1.2       scw #endif
    460  1.2       scw 	ldr	r5, [r1], #0x04
    461  1.2       scw 	ldr	r6, [r1], #0x04
    462  1.2       scw 	ldr	r7, [r1], #0x04
    463  1.2       scw 	ldr	ip, [r1], #0x04
    464  1.2       scw #ifdef __ARMEB__
    465  1.2       scw 	orr	r4, r4, r5, lsr #8
    466  1.2       scw 	mov	r5, r5, lsl #24
    467  1.2       scw 	orr	r5, r5, r6, lsr #8
    468  1.2       scw 	mov	r6, r6, lsl #24
    469  1.2       scw 	orr	r6, r6, r7, lsr #8
    470  1.2       scw 	mov	r7, r7, lsl #24
    471  1.2       scw 	orr	r7, r7, ip, lsr #8
    472  1.2       scw #else
    473  1.2       scw 	orr	r4, r4, r5, lsl #8
    474  1.2       scw 	mov	r5, r5, lsr #24
    475  1.2       scw 	orr	r5, r5, r6, lsl #8
    476  1.2       scw 	mov	r6, r6, lsr #24
    477  1.2       scw 	orr	r6, r6, r7, lsl #8
    478  1.2       scw 	mov	r7, r7, lsr #24
    479  1.2       scw 	orr	r7, r7, ip, lsl #8
    480  1.2       scw #endif
    481  1.2       scw 	str	r4, [r3], #0x04
    482  1.2       scw 	str	r5, [r3], #0x04
    483  1.2       scw 	str	r6, [r3], #0x04
    484  1.2       scw 	str	r7, [r3], #0x04
    485  1.2       scw 	subs	r2, r2, #0x10
    486  1.3      matt 	popeq	{r4-r7}
    487  1.3      matt 	RETc(eq)			/* Return now if done */
    488  1.2       scw 
    489  1.2       scw .Lmemcpy_bad3_loop16_short:
    490  1.1  christos 	subs	r2, r2, #0x04
    491  1.6   mlelstv 	sublo	r1, r1, #0x01
    492  1.6   mlelstv 	blo	.Lmemcpy_bad_done
    493  1.1  christos 
    494  1.1  christos .Lmemcpy_bad3_loop4:
    495  1.1  christos #ifdef __ARMEB__
    496  1.1  christos 	mov	r4, ip, lsl #24
    497  1.1  christos #else
    498  1.1  christos 	mov	r4, ip, lsr #24
    499  1.1  christos #endif
    500  1.1  christos 	ldr	ip, [r1], #0x04
    501  1.1  christos 	subs	r2, r2, #0x04
    502  1.1  christos #ifdef __ARMEB__
    503  1.1  christos 	orr	r4, r4, ip, lsr #8
    504  1.1  christos #else
    505  1.1  christos 	orr	r4, r4, ip, lsl #8
    506  1.1  christos #endif
    507  1.1  christos 	str	r4, [r3], #0x04
    508  1.6   mlelstv 	bhs	.Lmemcpy_bad3_loop4
    509  1.1  christos 	sub	r1, r1, #0x01
    510  1.1  christos 
    511  1.1  christos .Lmemcpy_bad_done:
    512  1.3      matt 	pop	{r4-r7}
    513  1.1  christos 	adds	r2, r2, #0x04
    514  1.3      matt 	RETc(eq)
    515  1.1  christos 	ldrb	ip, [r1], #0x01
    516  1.1  christos 	cmp	r2, #0x02
    517  1.6   mlelstv 	ldrbhs	r2, [r1], #0x01
    518  1.1  christos 	strb	ip, [r3], #0x01
    519  1.6   mlelstv 	ldrbhi	ip, [r1]
    520  1.6   mlelstv 	strbhs	r2, [r3], #0x01
    521  1.6   mlelstv 	strbhi	ip, [r3]
    522  1.3      matt 	RET
    523  1.1  christos 
    524  1.1  christos 
    525  1.1  christos /*
    526  1.1  christos  * Handle short copies (12 bytes or fewer), possibly misaligned.
    527  1.1  christos  * Some of these are *very* common, thanks to the network stack,
    528  1.1  christos  * and so are handled specially.
    529  1.1  christos  */
    530  1.1  christos .Lmemcpy_short:
    531  1.1  christos #ifndef _STANDALONE
    532  1.1  christos 	add	pc, pc, r2, lsl #2
    533  1.1  christos 	nop
    534  1.3      matt 	RET				/* 0x00 */
    535  1.1  christos 	b	.Lmemcpy_bytewise	/* 0x01 */
    536  1.1  christos 	b	.Lmemcpy_bytewise	/* 0x02 */
    537  1.1  christos 	b	.Lmemcpy_bytewise	/* 0x03 */
    538  1.1  christos 	b	.Lmemcpy_4		/* 0x04 */
    539  1.1  christos 	b	.Lmemcpy_bytewise	/* 0x05 */
    540  1.1  christos 	b	.Lmemcpy_6		/* 0x06 */
    541  1.1  christos 	b	.Lmemcpy_bytewise	/* 0x07 */
    542  1.1  christos 	b	.Lmemcpy_8		/* 0x08 */
    543  1.1  christos 	b	.Lmemcpy_bytewise	/* 0x09 */
    544  1.1  christos 	b	.Lmemcpy_bytewise	/* 0x0a */
    545  1.1  christos 	b	.Lmemcpy_bytewise	/* 0x0b */
    546  1.1  christos 	b	.Lmemcpy_c		/* 0x0c */
    547  1.1  christos #endif
    548  1.1  christos .Lmemcpy_bytewise:
    549  1.1  christos 	mov	r3, r0			/* We must not clobber r0 */
    550  1.1  christos 	ldrb	ip, [r1], #0x01
    551  1.1  christos 1:	subs	r2, r2, #0x01
    552  1.1  christos 	strb	ip, [r3], #0x01
    553  1.3      matt 	ldrbne	ip, [r1], #0x01
    554  1.1  christos 	bne	1b
    555  1.3      matt 	RET
    556  1.1  christos 
    557  1.1  christos #ifndef _STANDALONE
    558  1.1  christos /******************************************************************************
    559  1.1  christos  * Special case for 4 byte copies
    560  1.1  christos  */
    561  1.1  christos #define	LMEMCPY_4_LOG2	6	/* 64 bytes */
    562  1.1  christos #define	LMEMCPY_4_PAD	.align LMEMCPY_4_LOG2
    563  1.1  christos 	LMEMCPY_4_PAD
    564  1.1  christos .Lmemcpy_4:
    565  1.1  christos 	and	r2, r1, #0x03
    566  1.1  christos 	orr	r2, r2, r0, lsl #2
    567  1.1  christos 	ands	r2, r2, #0x0f
    568  1.1  christos 	sub	r3, pc, #0x14
    569  1.1  christos 	addne	pc, r3, r2, lsl #LMEMCPY_4_LOG2
    570  1.1  christos 
    571  1.1  christos /*
    572  1.1  christos  * 0000: dst is 32-bit aligned, src is 32-bit aligned
    573  1.1  christos  */
    574  1.1  christos 	ldr	r2, [r1]
    575  1.1  christos 	str	r2, [r0]
    576  1.3      matt 	RET
    577  1.1  christos 	LMEMCPY_4_PAD
    578  1.1  christos 
    579  1.1  christos /*
    580  1.1  christos  * 0001: dst is 32-bit aligned, src is 8-bit aligned
    581  1.1  christos  */
    582  1.1  christos 	ldr	r3, [r1, #-1]		/* BE:r3 = x012  LE:r3 = 210x */
    583  1.1  christos 	ldr	r2, [r1, #3]		/* BE:r2 = 3xxx  LE:r2 = xxx3 */
    584  1.1  christos #ifdef __ARMEB__
    585  1.1  christos 	mov	r3, r3, lsl #8		/* r3 = 012. */
    586  1.1  christos 	orr	r3, r3, r2, lsr #24	/* r3 = 0123 */
    587  1.1  christos #else
    588  1.1  christos 	mov	r3, r3, lsr #8		/* r3 = .210 */
    589  1.1  christos 	orr	r3, r3, r2, lsl #24	/* r3 = 3210 */
    590  1.1  christos #endif
    591  1.1  christos 	str	r3, [r0]
    592  1.3      matt 	RET
    593  1.1  christos 	LMEMCPY_4_PAD
    594  1.1  christos 
    595  1.1  christos /*
    596  1.1  christos  * 0010: dst is 32-bit aligned, src is 16-bit aligned
    597  1.1  christos  */
    598  1.1  christos #ifdef __ARMEB__
    599  1.1  christos 	ldrh	r3, [r1]
    600  1.1  christos 	ldrh	r2, [r1, #0x02]
    601  1.1  christos #else
    602  1.1  christos 	ldrh	r3, [r1, #0x02]
    603  1.1  christos 	ldrh	r2, [r1]
    604  1.1  christos #endif
    605  1.1  christos 	orr	r3, r2, r3, lsl #16
    606  1.1  christos 	str	r3, [r0]
    607  1.3      matt 	RET
    608  1.1  christos 	LMEMCPY_4_PAD
    609  1.1  christos 
    610  1.1  christos /*
    611  1.1  christos  * 0011: dst is 32-bit aligned, src is 8-bit aligned
    612  1.1  christos  */
    613  1.1  christos 	ldr	r3, [r1, #-3]		/* BE:r3 = xxx0  LE:r3 = 0xxx */
    614  1.1  christos 	ldr	r2, [r1, #1]		/* BE:r2 = 123x  LE:r2 = x321 */
    615  1.1  christos #ifdef __ARMEB__
    616  1.1  christos 	mov	r3, r3, lsl #24		/* r3 = 0... */
    617  1.1  christos 	orr	r3, r3, r2, lsr #8	/* r3 = 0123 */
    618  1.1  christos #else
    619  1.1  christos 	mov	r3, r3, lsr #24		/* r3 = ...0 */
    620  1.1  christos 	orr	r3, r3, r2, lsl #8	/* r3 = 3210 */
    621  1.1  christos #endif
    622  1.1  christos 	str	r3, [r0]
    623  1.3      matt 	RET
    624  1.1  christos 	LMEMCPY_4_PAD
    625  1.1  christos 
    626  1.1  christos /*
    627  1.1  christos  * 0100: dst is 8-bit aligned, src is 32-bit aligned
    628  1.1  christos  */
    629  1.1  christos 	ldr	r2, [r1]
    630  1.1  christos #ifdef __ARMEB__
    631  1.1  christos 	strb	r2, [r0, #0x03]
    632  1.1  christos 	mov	r3, r2, lsr #8
    633  1.1  christos 	mov	r1, r2, lsr #24
    634  1.1  christos 	strb	r1, [r0]
    635  1.1  christos #else
    636  1.1  christos 	strb	r2, [r0]
    637  1.1  christos 	mov	r3, r2, lsr #8
    638  1.1  christos 	mov	r1, r2, lsr #24
    639  1.1  christos 	strb	r1, [r0, #0x03]
    640  1.1  christos #endif
    641  1.1  christos 	strh	r3, [r0, #0x01]
    642  1.3      matt 	RET
    643  1.1  christos 	LMEMCPY_4_PAD
    644  1.1  christos 
    645  1.1  christos /*
    646  1.1  christos  * 0101: dst is 8-bit aligned, src is 8-bit aligned
    647  1.1  christos  */
    648  1.1  christos 	ldrb	r2, [r1]
    649  1.1  christos 	ldrh	r3, [r1, #0x01]
    650  1.1  christos 	ldrb	r1, [r1, #0x03]
    651  1.1  christos 	strb	r2, [r0]
    652  1.1  christos 	strh	r3, [r0, #0x01]
    653  1.1  christos 	strb	r1, [r0, #0x03]
    654  1.3      matt 	RET
    655  1.1  christos 	LMEMCPY_4_PAD
    656  1.1  christos 
    657  1.1  christos /*
    658  1.1  christos  * 0110: dst is 8-bit aligned, src is 16-bit aligned
    659  1.1  christos  */
    660  1.1  christos 	ldrh	r2, [r1]		/* BE:r2 = ..01  LE:r2 = ..10 */
    661  1.1  christos 	ldrh	r3, [r1, #0x02]		/* BE:r3 = ..23  LE:r3 = ..32 */
    662  1.1  christos #ifdef __ARMEB__
    663  1.1  christos 	mov	r1, r2, lsr #8		/* r1 = ...0 */
    664  1.1  christos 	strb	r1, [r0]
    665  1.1  christos 	mov	r2, r2, lsl #8		/* r2 = .01. */
    666  1.1  christos 	orr	r2, r2, r3, lsr #8	/* r2 = .012 */
    667  1.1  christos #else
    668  1.1  christos 	strb	r2, [r0]
    669  1.1  christos 	mov	r2, r2, lsr #8		/* r2 = ...1 */
    670  1.1  christos 	orr	r2, r2, r3, lsl #8	/* r2 = .321 */
    671  1.1  christos 	mov	r3, r3, lsr #8		/* r3 = ...3 */
    672  1.1  christos #endif
    673  1.1  christos 	strh	r2, [r0, #0x01]
    674  1.1  christos 	strb	r3, [r0, #0x03]
    675  1.3      matt 	RET
    676  1.1  christos 	LMEMCPY_4_PAD
    677  1.1  christos 
    678  1.1  christos /*
    679  1.1  christos  * 0111: dst is 8-bit aligned, src is 8-bit aligned
    680  1.1  christos  */
    681  1.1  christos 	ldrb	r2, [r1]
    682  1.1  christos 	ldrh	r3, [r1, #0x01]
    683  1.1  christos 	ldrb	r1, [r1, #0x03]
    684  1.1  christos 	strb	r2, [r0]
    685  1.1  christos 	strh	r3, [r0, #0x01]
    686  1.1  christos 	strb	r1, [r0, #0x03]
    687  1.3      matt 	RET
    688  1.1  christos 	LMEMCPY_4_PAD
    689  1.1  christos 
    690  1.1  christos /*
    691  1.1  christos  * 1000: dst is 16-bit aligned, src is 32-bit aligned
    692  1.1  christos  */
    693  1.1  christos 	ldr	r2, [r1]		/* BE:r2 = 0123  LE:r2 = 3210 */
    694  1.1  christos #ifdef __ARMEB__
    695  1.1  christos 	strh	r2, [r0, #0x02]		/* store bytes 2-3 (low half of r2) */
    696  1.1  christos 	mov	r3, r2, lsr #16		/* r3 = ..01 */
    697  1.1  christos 	strh	r3, [r0]		/* store bytes 0-1 */
    698  1.1  christos #else
    699  1.1  christos 	strh	r2, [r0]		/* store bytes 0-1 (low half of r2) */
    700  1.1  christos 	mov	r3, r2, lsr #16		/* r3 = ..32 */
    701  1.1  christos 	strh	r3, [r0, #0x02]		/* store bytes 2-3 */
    702  1.1  christos #endif
    703  1.3      matt 	RET
    704  1.1  christos 	LMEMCPY_4_PAD
    705  1.1  christos 
    706  1.1  christos /*
    707  1.1  christos  * 1001: dst is 16-bit aligned, src is 8-bit aligned
    708  1.1  christos  */
    709  1.1  christos 	ldr	r2, [r1, #-1]		/* BE:r2 = x012  LE:r2 = 210x (x = byte outside the 4 copied) */
    710  1.1  christos 	ldr	r3, [r1, #3]		/* BE:r3 = 3xxx  LE:r3 = xxx3 */
    711  1.1  christos 	mov	r1, r2, lsr #8		/* BE:r1 = .x01  LE:r1 = .210 */
    712  1.1  christos 	strh	r1, [r0]		/* store bytes 0-1 (low half of r1) */
    713  1.1  christos #ifdef __ARMEB__
    714  1.1  christos 	mov	r2, r2, lsl #8		/* r2 = 012. */
    715  1.1  christos 	orr	r2, r2, r3, lsr #24	/* r2 = 0123 */
    716  1.1  christos #else
    717  1.1  christos 	mov	r2, r2, lsr #24		/* r2 = ...2 */
    718  1.1  christos 	orr	r2, r2, r3, lsl #8	/* r2 = xx32 */
    719  1.1  christos #endif
    720  1.1  christos 	strh	r2, [r0, #0x02]		/* store bytes 2-3 (low half of r2) */
    721  1.3      matt 	RET
    722  1.1  christos 	LMEMCPY_4_PAD
    723  1.1  christos 
    724  1.1  christos /*
    725  1.1  christos  * 1010: dst is 16-bit aligned, src is 16-bit aligned
    726  1.1  christos  */
    727  1.1  christos 	ldrh	r2, [r1]		/* r2 = bytes 0-1 */
    728  1.1  christos 	ldrh	r3, [r1, #0x02]		/* r3 = bytes 2-3 */
    729  1.1  christos 	strh	r2, [r0]		/* store bytes 0-1 */
    730  1.1  christos 	strh	r3, [r0, #0x02]		/* store bytes 2-3 */
    731  1.3      matt 	RET
    732  1.1  christos 	LMEMCPY_4_PAD
    733  1.1  christos 
    734  1.1  christos /*
    735  1.1  christos  * 1011: dst is 16-bit aligned, src is 8-bit aligned
    736  1.1  christos  */
    737  1.1  christos 	ldr	r3, [r1, #1]		/* BE:r3 = 123x  LE:r3 = x321 (x = byte outside the 4 copied) */
    738  1.1  christos 	ldr	r2, [r1, #-3]		/* BE:r2 = xxx0  LE:r2 = 0xxx */
    739  1.1  christos 	mov	r1, r3, lsr #8		/* BE:r1 = .123  LE:r1 = .x32 */
    740  1.1  christos 	strh	r1, [r0, #0x02]		/* store bytes 2-3 (low half of r1) */
    741  1.1  christos #ifdef __ARMEB__
    742  1.1  christos 	mov	r3, r3, lsr #24		/* r3 = ...1 */
    743  1.1  christos 	orr	r3, r3, r2, lsl #8	/* r3 = xx01 */
    744  1.1  christos #else
    745  1.1  christos 	mov	r3, r3, lsl #8		/* r3 = 321. */
    746  1.1  christos 	orr	r3, r3, r2, lsr #24	/* r3 = 3210 */
    747  1.1  christos #endif
    748  1.1  christos 	strh	r3, [r0]		/* store bytes 0-1 (low half of r3) */
    749  1.3      matt 	RET
    750  1.1  christos 	LMEMCPY_4_PAD
    751  1.1  christos 
    752  1.1  christos /*
    753  1.1  christos  * 1100: dst is 8-bit aligned, src is 32-bit aligned
    754  1.1  christos  */
    755  1.1  christos 	ldr	r2, [r1]		/* BE:r2 = 0123  LE:r2 = 3210 */
    756  1.1  christos #ifdef __ARMEB__
    757  1.1  christos 	strb	r2, [r0, #0x03]		/* store byte 3 (low byte of r2) */
    758  1.1  christos 	mov	r3, r2, lsr #8		/* r3 = .012 */
    759  1.1  christos 	mov	r1, r2, lsr #24		/* r1 = ...0 */
    760  1.1  christos 	strh	r3, [r0, #0x01]		/* store bytes 1-2 (low half of r3) */
    761  1.1  christos 	strb	r1, [r0]		/* store byte 0 */
    762  1.1  christos #else
    763  1.1  christos 	strb	r2, [r0]		/* store byte 0 (low byte of r2) */
    764  1.1  christos 	mov	r3, r2, lsr #8		/* r3 = .321 */
    765  1.1  christos 	mov	r1, r2, lsr #24		/* r1 = ...3 */
    766  1.1  christos 	strh	r3, [r0, #0x01]		/* store bytes 1-2 (low half of r3) */
    767  1.1  christos 	strb	r1, [r0, #0x03]		/* store byte 3 */
    768  1.1  christos #endif
    769  1.3      matt 	RET
    770  1.1  christos 	LMEMCPY_4_PAD
    771  1.1  christos 
    772  1.1  christos /*
    773  1.1  christos  * 1101: dst is 8-bit aligned, src is 8-bit aligned
    774  1.1  christos  */
    775  1.1  christos 	ldrb	r2, [r1]		/* r2 = ...0 */
    776  1.1  christos 	ldrh	r3, [r1, #0x01]		/* BE:r3 = ..12  LE:r3 = ..21 */
    777  1.1  christos 	ldrb	r1, [r1, #0x03]		/* r1 = ...3 */
    778  1.1  christos 	strb	r2, [r0]		/* store byte 0 */
    779  1.1  christos 	strh	r3, [r0, #0x01]		/* store bytes 1-2 */
    780  1.1  christos 	strb	r1, [r0, #0x03]		/* store byte 3 */
    781  1.3      matt 	RET
    782  1.1  christos 	LMEMCPY_4_PAD
    783  1.1  christos 
    784  1.1  christos /*
    785  1.1  christos  * 1110: dst is 8-bit aligned, src is 16-bit aligned
    786  1.1  christos  */
    787  1.1  christos #ifdef __ARMEB__
    788  1.1  christos 	ldrh	r3, [r1, #0x02]		/* BE:r3 = ..23  LE:r3 = ..32 */
    789  1.1  christos 	ldrh	r2, [r1]		/* BE:r2 = ..01  LE:r2 = ..10 */
    790  1.1  christos 	strb	r3, [r0, #0x03]		/* store byte 3 (low byte of r3) */
    791  1.1  christos 	mov	r3, r3, lsr #8		/* r3 = ...2 */
    792  1.1  christos 	orr	r3, r3, r2, lsl #8	/* r3 = .012 */
    793  1.1  christos 	strh	r3, [r0, #0x01]		/* store bytes 1-2 (low half of r3) */
    794  1.1  christos 	mov	r2, r2, lsr #8		/* r2 = ...0 */
    795  1.1  christos 	strb	r2, [r0]		/* store byte 0 */
    796  1.1  christos #else
    797  1.1  christos 	ldrh	r2, [r1]		/* BE:r2 = ..01  LE:r2 = ..10 */
    798  1.1  christos 	ldrh	r3, [r1, #0x02]		/* BE:r3 = ..23  LE:r3 = ..32 */
    799  1.1  christos 	strb	r2, [r0]		/* store byte 0 (low byte of r2) */
    800  1.1  christos 	mov	r2, r2, lsr #8		/* r2 = ...1 */
    801  1.1  christos 	orr	r2, r2, r3, lsl #8	/* r2 = .321 */
    802  1.1  christos 	strh	r2, [r0, #0x01]		/* store bytes 1-2 (low half of r2) */
    803  1.1  christos 	mov	r3, r3, lsr #8		/* r3 = ...3 */
    804  1.1  christos 	strb	r3, [r0, #0x03]		/* store byte 3 */
    805  1.1  christos #endif
    806  1.3      matt 	RET
    807  1.1  christos 	LMEMCPY_4_PAD
    808  1.1  christos 
    809  1.1  christos /*
    810  1.1  christos  * 1111: dst is 8-bit aligned, src is 8-bit aligned
    811  1.1  christos  */
    812  1.1  christos 	ldrb	r2, [r1]		/* r2 = ...0 */
    813  1.1  christos 	ldrh	r3, [r1, #0x01]		/* BE:r3 = ..12  LE:r3 = ..21 */
    814  1.1  christos 	ldrb	r1, [r1, #0x03]		/* r1 = ...3 */
    815  1.1  christos 	strb	r2, [r0]		/* store byte 0 */
    816  1.1  christos 	strh	r3, [r0, #0x01]		/* store bytes 1-2 */
    817  1.1  christos 	strb	r1, [r0, #0x03]		/* store byte 3 */
    818  1.3      matt 	RET
    819  1.1  christos 	LMEMCPY_4_PAD
    820  1.1  christos 
    821  1.1  christos 
    822  1.1  christos /******************************************************************************
    823  1.1  christos  * Special case for 6 byte copies
    824  1.1  christos  */
    825  1.1  christos #define	LMEMCPY_6_LOG2	6	/* 64 bytes */
    826  1.1  christos #define	LMEMCPY_6_PAD	.align LMEMCPY_6_LOG2
    827  1.1  christos 	LMEMCPY_6_PAD
    828  1.1  christos .Lmemcpy_6:
    829  1.1  christos 	and	r2, r1, #0x03		/* r2 = src & 3 */
    830  1.1  christos 	orr	r2, r2, r0, lsl #2	/* r2 |= dst << 2 */
    831  1.1  christos 	ands	r2, r2, #0x0f		/* r2 = ((dst & 3) << 2) | (src & 3); Z set when both are 0 */
    832  1.1  christos 	sub	r3, pc, #0x14		/* r3 = .Lmemcpy_6: pc reads as this insn + 8 = label + 0x14 */
    833  1.1  christos 	addne	pc, r3, r2, lsl #LMEMCPY_6_LOG2	/* jump to 64-byte slot r2; index 0 falls through to case 0000 */
    834  1.1  christos 
    835  1.1  christos /*
    836  1.1  christos  * 0000: dst is 32-bit aligned, src is 32-bit aligned
    837  1.1  christos  */
    838  1.1  christos 	ldr	r2, [r1]		/* r2 = bytes 0-3 */
    839  1.1  christos 	ldrh	r3, [r1, #0x04]		/* r3 = bytes 4-5 */
    840  1.1  christos 	str	r2, [r0]		/* store bytes 0-3 */
    841  1.1  christos 	strh	r3, [r0, #0x04]		/* store bytes 4-5 */
    842  1.3      matt 	RET
    843  1.1  christos 	LMEMCPY_6_PAD
    844  1.1  christos 
    845  1.1  christos /*
    846  1.1  christos  * 0001: dst is 32-bit aligned, src is 8-bit aligned
    847  1.1  christos  */
    848  1.1  christos 	ldr	r2, [r1, #-1]		/* BE:r2 = x012  LE:r2 = 210x (x = byte outside the 6 copied) */
    849  1.1  christos 	ldr	r3, [r1, #0x03]		/* BE:r3 = 345x  LE:r3 = x543 */
    850  1.1  christos #ifdef __ARMEB__
    851  1.1  christos 	mov	r2, r2, lsl #8		/* r2 = 012. */
    852  1.1  christos 	orr	r2, r2, r3, lsr #24	/* r2 = 0123 */
    853  1.1  christos #else
    854  1.1  christos 	mov	r2, r2, lsr #8		/* r2 = .210 */
    855  1.1  christos 	orr	r2, r2, r3, lsl #24	/* r2 = 3210 */
    856  1.1  christos #endif
    857  1.1  christos 	mov	r3, r3, lsr #8		/* BE:r3 = .345  LE:r3 = .x54 */
    858  1.1  christos 	str	r2, [r0]		/* store bytes 0-3 */
    859  1.1  christos 	strh	r3, [r0, #0x04]		/* store bytes 4-5 (low half of r3) */
    860  1.3      matt 	RET
    861  1.1  christos 	LMEMCPY_6_PAD
    862  1.1  christos 
    863  1.1  christos /*
    864  1.1  christos  * 0010: dst is 32-bit aligned, src is 16-bit aligned
    865  1.1  christos  */
    866  1.1  christos 	ldr	r3, [r1, #0x02]		/* BE:r3 = 2345  LE:r3 = 5432 */
    867  1.1  christos 	ldrh	r2, [r1]		/* BE:r2 = ..01  LE:r2 = ..10 */
    868  1.1  christos #ifdef __ARMEB__
    869  1.1  christos 	mov	r1, r3, lsr #16		/* r1 = ..23 */
    870  1.1  christos 	orr	r1, r1, r2, lsl #16	/* r1 = 0123 */
    871  1.1  christos 	str	r1, [r0]		/* store bytes 0-3 */
    872  1.1  christos 	strh	r3, [r0, #0x04]		/* store bytes 4-5 (low half of r3) */
    873  1.1  christos #else
    874  1.1  christos 	mov	r1, r3, lsr #16		/* r1 = ..54 */
    875  1.1  christos 	orr	r2, r2, r3, lsl #16	/* r2 = 3210 */
    876  1.1  christos 	str	r2, [r0]		/* store bytes 0-3 */
    877  1.1  christos 	strh	r1, [r0, #0x04]		/* store bytes 4-5 */
    878  1.1  christos #endif
    879  1.3      matt 	RET
    880  1.1  christos 	LMEMCPY_6_PAD
    881  1.1  christos 
    882  1.1  christos /*
    883  1.1  christos  * 0011: dst is 32-bit aligned, src is 8-bit aligned
    884  1.1  christos  */
    885  1.1  christos 	ldr	r2, [r1, #-3]		/* BE:r2 = xxx0  LE:r2 = 0xxx */
    886  1.1  christos 	ldr	r3, [r1, #1]		/* BE:r3 = 1234  LE:r3 = 4321 */
    887  1.1  christos 	ldr	r1, [r1, #5]		/* BE:r1 = 5xxx  LE:r1 = xxx5 */
    888  1.1  christos #ifdef __ARMEB__
    889  1.1  christos 	mov	r2, r2, lsl #24		/* r2 = 0... */
    890  1.1  christos 	orr	r2, r2, r3, lsr #8	/* r2 = 0123 */
    891  1.1  christos 	mov	r3, r3, lsl #8		/* r3 = 234. */
    892  1.1  christos 	orr	r1, r3, r1, lsr #24	/* r1 = 2345 */
    893  1.1  christos #else
    894  1.1  christos 	mov	r2, r2, lsr #24		/* r2 = ...0 */
    895  1.1  christos 	orr	r2, r2, r3, lsl #8	/* r2 = 3210 */
    896  1.1  christos 	mov	r1, r1, lsl #8		/* r1 = xx5. */
    897  1.1  christos 	orr	r1, r1, r3, lsr #24	/* r1 = xx54 */
    898  1.1  christos #endif
    899  1.1  christos 	str	r2, [r0]		/* store bytes 0-3 */
    900  1.1  christos 	strh	r1, [r0, #0x04]		/* store bytes 4-5 (low half of r1) */
    901  1.3      matt 	RET
    902  1.1  christos 	LMEMCPY_6_PAD
    903  1.1  christos 
    904  1.1  christos /*
    905  1.1  christos  * 0100: dst is 8-bit aligned, src is 32-bit aligned
    906  1.1  christos  */
    907  1.1  christos 	ldr	r3, [r1]		/* BE:r3 = 0123  LE:r3 = 3210 */
    908  1.1  christos 	ldrh	r2, [r1, #0x04]		/* BE:r2 = ..45  LE:r2 = ..54 */
    909  1.1  christos 	mov	r1, r3, lsr #8		/* BE:r1 = .012  LE:r1 = .321 */
    910  1.1  christos 	strh	r1, [r0, #0x01]		/* store bytes 1-2 (low half of r1) */
    911  1.1  christos #ifdef __ARMEB__
    912  1.1  christos 	mov	r1, r3, lsr #24		/* r1 = ...0 */
    913  1.1  christos 	strb	r1, [r0]		/* store byte 0 */
    914  1.1  christos 	mov	r3, r3, lsl #8		/* r3 = 123. */
    915  1.1  christos 	orr	r3, r3, r2, lsr #8	/* r3 = 1234 */
    916  1.1  christos #else
    917  1.1  christos 	strb	r3, [r0]		/* store byte 0 (low byte of r3) */
    918  1.1  christos 	mov	r3, r3, lsr #24		/* r3 = ...3 */
    919  1.1  christos 	orr	r3, r3, r2, lsl #8	/* r3 = .543 */
    920  1.1  christos 	mov	r2, r2, lsr #8		/* r2 = ...5 */
    921  1.1  christos #endif
    922  1.1  christos 	strh	r3, [r0, #0x03]		/* store bytes 3-4 (low half of r3) */
    923  1.1  christos 	strb	r2, [r0, #0x05]		/* store byte 5 (low byte of r2) */
    924  1.3      matt 	RET
    925  1.1  christos 	LMEMCPY_6_PAD
    926  1.1  christos 
    927  1.1  christos /*
    928  1.1  christos  * 0101: dst is 8-bit aligned, src is 8-bit aligned
    929  1.1  christos  */
    930  1.1  christos 	ldrb	r2, [r1]		/* r2 = ...0 */
    931  1.1  christos 	ldrh	r3, [r1, #0x01]		/* BE:r3 = ..12  LE:r3 = ..21 */
    932  1.1  christos 	ldrh	ip, [r1, #0x03]		/* BE:ip = ..34  LE:ip = ..43 */
    933  1.1  christos 	ldrb	r1, [r1, #0x05]		/* r1 = ...5 */
    934  1.1  christos 	strb	r2, [r0]		/* store byte 0 */
    935  1.1  christos 	strh	r3, [r0, #0x01]		/* store bytes 1-2 */
    936  1.1  christos 	strh	ip, [r0, #0x03]		/* store bytes 3-4 */
    937  1.1  christos 	strb	r1, [r0, #0x05]		/* store byte 5 */
    938  1.3      matt 	RET
    939  1.1  christos 	LMEMCPY_6_PAD
    940  1.1  christos 
    941  1.1  christos /*
    942  1.1  christos  * 0110: dst is 8-bit aligned, src is 16-bit aligned
    943  1.1  christos  */
    944  1.1  christos 	ldrh	r2, [r1]		/* BE:r2 = ..01  LE:r2 = ..10 */
    945  1.1  christos 	ldr	r1, [r1, #0x02]		/* BE:r1 = 2345  LE:r1 = 5432 */
    946  1.1  christos #ifdef __ARMEB__
    947  1.1  christos 	mov	r3, r2, lsr #8		/* r3 = ...0 */
    948  1.1  christos 	strb	r3, [r0]		/* store byte 0 */
    949  1.1  christos 	strb	r1, [r0, #0x05]		/* store byte 5 (low byte of r1) */
    950  1.1  christos 	mov	r3, r1, lsr #8		/* r3 = .234 */
    951  1.1  christos 	strh	r3, [r0, #0x03]		/* store bytes 3-4 (low half of r3) */
    952  1.1  christos 	mov	r3, r2, lsl #8		/* r3 = .01. */
    953  1.1  christos 	orr	r3, r3, r1, lsr #24	/* r3 = .012 */
    954  1.1  christos 	strh	r3, [r0, #0x01]		/* store bytes 1-2 (low half of r3) */
    955  1.1  christos #else
    956  1.1  christos 	strb	r2, [r0]		/* store byte 0 (low byte of r2) */
    957  1.1  christos 	mov	r3, r1, lsr #24		/* r3 = ...5 */
    958  1.1  christos 	strb	r3, [r0, #0x05]		/* store byte 5 */
    959  1.1  christos 	mov	r3, r1, lsr #8		/* r3 = .543 */
    960  1.1  christos 	strh	r3, [r0, #0x03]		/* store bytes 3-4 (low half of r3) */
    961  1.1  christos 	mov	r3, r2, lsr #8		/* r3 = ...1 */
    962  1.1  christos 	orr	r3, r3, r1, lsl #8	/* r3 = 4321 */
    963  1.1  christos 	strh	r3, [r0, #0x01]		/* store bytes 1-2 (low half of r3) */
    964  1.1  christos #endif
    965  1.3      matt 	RET
    966  1.1  christos 	LMEMCPY_6_PAD
    967  1.1  christos 
    968  1.1  christos /*
    969  1.1  christos  * 0111: dst is 8-bit aligned, src is 8-bit aligned
    970  1.1  christos  */
    971  1.1  christos 	ldrb	r2, [r1]		/* r2 = ...0 */
    972  1.1  christos 	ldrh	r3, [r1, #0x01]		/* BE:r3 = ..12  LE:r3 = ..21 */
    973  1.1  christos 	ldrh	ip, [r1, #0x03]		/* BE:ip = ..34  LE:ip = ..43 */
    974  1.1  christos 	ldrb	r1, [r1, #0x05]		/* r1 = ...5 */
    975  1.1  christos 	strb	r2, [r0]		/* store byte 0 */
    976  1.1  christos 	strh	r3, [r0, #0x01]		/* store bytes 1-2 */
    977  1.1  christos 	strh	ip, [r0, #0x03]		/* store bytes 3-4 */
    978  1.1  christos 	strb	r1, [r0, #0x05]		/* store byte 5 */
    979  1.3      matt 	RET
    980  1.1  christos 	LMEMCPY_6_PAD
    981  1.1  christos 
    982  1.1  christos /*
    983  1.1  christos  * 1000: dst is 16-bit aligned, src is 32-bit aligned
    984  1.1  christos  */
    985  1.1  christos #ifdef __ARMEB__
    986  1.1  christos 	ldr	r2, [r1]		/* r2 = 0123 */
    987  1.1  christos 	ldrh	r3, [r1, #0x04]		/* r3 = ..45 */
    988  1.1  christos 	mov	r1, r2, lsr #16		/* r1 = ..01 */
    989  1.1  christos 	orr	r3, r3, r2, lsl#16	/* r3 = 2345 */
    990  1.1  christos 	strh	r1, [r0]		/* store bytes 0-1 */
    991  1.1  christos 	str	r3, [r0, #0x02]		/* store bytes 2-5 */
    992  1.1  christos #else
    993  1.1  christos 	ldrh	r2, [r1, #0x04]		/* r2 = ..54 */
    994  1.1  christos 	ldr	r3, [r1]		/* r3 = 3210 */
    995  1.1  christos 	mov	r2, r2, lsl #16		/* r2 = 54.. */
    996  1.1  christos 	orr	r2, r2, r3, lsr #16	/* r2 = 5432 */
    997  1.1  christos 	strh	r3, [r0]		/* store bytes 0-1 (low half of r3) */
    998  1.1  christos 	str	r2, [r0, #0x02]		/* store bytes 2-5 */
    999  1.1  christos #endif
   1000  1.3      matt 	RET
   1001  1.1  christos 	LMEMCPY_6_PAD
   1002  1.1  christos 
   1003  1.1  christos /*
   1004  1.1  christos  * 1001: dst is 16-bit aligned, src is 8-bit aligned
   1005  1.1  christos  */
   1006  1.1  christos 	ldr	r3, [r1, #-1]		/* BE:r3 = x012  LE:r3 = 210x (x = byte outside the 6 copied) */
   1007  1.1  christos 	ldr	r2, [r1, #3]		/* BE:r2 = 345x  LE:r2 = x543 */
   1008  1.1  christos 	mov	r1, r3, lsr #8		/* BE:r1 = .x01  LE:r1 = .210 */
   1009  1.1  christos #ifdef __ARMEB__
   1010  1.1  christos 	mov	r2, r2, lsr #8		/* r2 = .345 */
   1011  1.1  christos 	orr	r2, r2, r3, lsl #24	/* r2 = 2345 */
   1012  1.1  christos #else
   1013  1.1  christos 	mov	r2, r2, lsl #8		/* r2 = 543. */
   1014  1.1  christos 	orr	r2, r2, r3, lsr #24	/* r2 = 5432 */
   1015  1.1  christos #endif
   1016  1.1  christos 	strh	r1, [r0]		/* store bytes 0-1 (low half of r1) */
   1017  1.1  christos 	str	r2, [r0, #0x02]		/* store bytes 2-5 */
   1018  1.3      matt 	RET
   1019  1.1  christos 	LMEMCPY_6_PAD
   1020  1.1  christos 
   1021  1.1  christos /*
   1022  1.1  christos  * 1010: dst is 16-bit aligned, src is 16-bit aligned
   1023  1.1  christos  */
   1024  1.1  christos 	ldrh	r2, [r1]		/* r2 = bytes 0-1 */
   1025  1.1  christos 	ldr	r3, [r1, #0x02]		/* r3 = bytes 2-5 */
   1026  1.1  christos 	strh	r2, [r0]		/* store bytes 0-1 */
   1027  1.1  christos 	str	r3, [r0, #0x02]		/* store bytes 2-5 */
   1028  1.3      matt 	RET
   1029  1.1  christos 	LMEMCPY_6_PAD
   1030  1.1  christos 
   1031  1.1  christos /*
   1032  1.1  christos  * 1011: dst is 16-bit aligned, src is 8-bit aligned
   1033  1.1  christos  */
   1034  1.1  christos 	ldrb	r3, [r1]		/* r3 = ...0 */
   1035  1.1  christos 	ldr	r2, [r1, #0x01]		/* BE:r2 = 1234  LE:r2 = 4321 */
   1036  1.1  christos 	ldrb	r1, [r1, #0x05]		/* r1 = ...5 */
   1037  1.1  christos #ifdef __ARMEB__
   1038  1.1  christos 	mov	r3, r3, lsl #8		/* r3 = ..0. */
   1039  1.1  christos 	orr	r3, r3, r2, lsr #24	/* r3 = ..01 */
   1040  1.1  christos 	orr	r1, r1, r2, lsl #8	/* r1 = 2345 */
   1041  1.1  christos #else
   1042  1.1  christos 	orr	r3, r3, r2, lsl #8	/* r3 = 3210 */
   1043  1.1  christos 	mov	r1, r1, lsl #24		/* r1 = 5... */
   1044  1.1  christos 	orr	r1, r1, r2, lsr #8	/* r1 = 5432 */
   1045  1.1  christos #endif
   1046  1.1  christos 	strh	r3, [r0]		/* store bytes 0-1 (low half of r3) */
   1047  1.1  christos 	str	r1, [r0, #0x02]		/* store bytes 2-5 */
   1048  1.3      matt 	RET
   1049  1.1  christos 	LMEMCPY_6_PAD
   1050  1.1  christos 
   1051  1.1  christos /*
   1052  1.1  christos  * 1100: dst is 8-bit aligned, src is 32-bit aligned
   1053  1.1  christos  */
   1054  1.1  christos 	ldr	r2, [r1]		/* BE:r2 = 0123  LE:r2 = 3210 */
   1055  1.1  christos 	ldrh	r1, [r1, #0x04]		/* BE:r1 = ..45  LE:r1 = ..54 */
   1056  1.1  christos #ifdef __ARMEB__
   1057  1.1  christos 	mov	r3, r2, lsr #24		/* r3 = ...0 */
   1058  1.1  christos 	strb	r3, [r0]		/* store byte 0 */
   1059  1.1  christos 	mov	r2, r2, lsl #8		/* r2 = 123. */
   1060  1.1  christos 	orr	r2, r2, r1, lsr #8	/* r2 = 1234 */
   1061  1.1  christos #else
   1062  1.1  christos 	strb	r2, [r0]		/* store byte 0 (low byte of r2) */
   1063  1.1  christos 	mov	r2, r2, lsr #8		/* r2 = .321 */
   1064  1.1  christos 	orr	r2, r2, r1, lsl #24	/* r2 = 4321 */
   1065  1.1  christos 	mov	r1, r1, lsr #8		/* r1 = ...5 */
   1066  1.1  christos #endif
   1067  1.1  christos 	str	r2, [r0, #0x01]		/* store bytes 1-4 */
   1068  1.1  christos 	strb	r1, [r0, #0x05]		/* store byte 5 (low byte of r1) */
   1069  1.3      matt 	RET
   1070  1.1  christos 	LMEMCPY_6_PAD
   1071  1.1  christos 
   1072  1.1  christos /*
   1073  1.1  christos  * 1101: dst is 8-bit aligned, src is 8-bit aligned
   1074  1.1  christos  */
   1075  1.1  christos 	ldrb	r2, [r1]		/* r2 = ...0 */
   1076  1.1  christos 	ldrh	r3, [r1, #0x01]		/* BE:r3 = ..12  LE:r3 = ..21 */
   1077  1.1  christos 	ldrh	ip, [r1, #0x03]		/* BE:ip = ..34  LE:ip = ..43 */
   1078  1.1  christos 	ldrb	r1, [r1, #0x05]		/* r1 = ...5 */
   1079  1.1  christos 	strb	r2, [r0]		/* store byte 0 */
   1080  1.1  christos 	strh	r3, [r0, #0x01]		/* store bytes 1-2 */
   1081  1.1  christos 	strh	ip, [r0, #0x03]		/* store bytes 3-4 */
   1082  1.1  christos 	strb	r1, [r0, #0x05]		/* store byte 5 */
   1083  1.3      matt 	RET
   1084  1.1  christos 	LMEMCPY_6_PAD
   1085  1.1  christos 
   1086  1.1  christos /*
   1087  1.1  christos  * 1110: dst is 8-bit aligned, src is 16-bit aligned
   1088  1.1  christos  */
   1089  1.1  christos 	ldrh	r2, [r1]		/* BE:r2 = ..01  LE:r2 = ..10 */
   1090  1.1  christos 	ldr	r1, [r1, #0x02]		/* BE:r1 = 2345  LE:r1 = 5432 */
   1091  1.1  christos #ifdef __ARMEB__
   1092  1.1  christos 	mov	r3, r2, lsr #8		/* r3 = ...0 */
   1093  1.1  christos 	strb	r3, [r0]		/* store byte 0 */
   1094  1.1  christos 	mov	r2, r2, lsl #24		/* r2 = 1... */
   1095  1.1  christos 	orr	r2, r2, r1, lsr #8	/* r2 = 1234 */
   1096  1.1  christos #else
   1097  1.1  christos 	strb	r2, [r0]		/* store byte 0 (low byte of r2) */
   1098  1.1  christos 	mov	r2, r2, lsr #8		/* r2 = ...1 */
   1099  1.1  christos 	orr	r2, r2, r1, lsl #8	/* r2 = 4321 */
   1100  1.1  christos 	mov	r1, r1, lsr #24		/* r1 = ...5 */
   1101  1.1  christos #endif
   1102  1.1  christos 	str	r2, [r0, #0x01]		/* store bytes 1-4 */
   1103  1.1  christos 	strb	r1, [r0, #0x05]		/* store byte 5 (low byte of r1) */
   1104  1.3      matt 	RET
   1105  1.1  christos 	LMEMCPY_6_PAD
   1106  1.1  christos 
   1107  1.1  christos /*
   1108  1.1  christos  * 1111: dst is 8-bit aligned, src is 8-bit aligned
   1109  1.1  christos  */
   1110  1.1  christos 	ldrb	r2, [r1]		/* r2 = ...0 */
   1111  1.1  christos 	ldr	r3, [r1, #0x01]		/* BE:r3 = 1234  LE:r3 = 4321 */
   1112  1.1  christos 	ldrb	r1, [r1, #0x05]		/* r1 = ...5 */
   1113  1.1  christos 	strb	r2, [r0]		/* store byte 0 */
   1114  1.1  christos 	str	r3, [r0, #0x01]		/* store bytes 1-4 */
   1115  1.1  christos 	strb	r1, [r0, #0x05]		/* store byte 5 */
   1116  1.3      matt 	RET
   1117  1.1  christos 	LMEMCPY_6_PAD
   1118  1.1  christos 
   1119  1.1  christos 
   1120  1.1  christos /******************************************************************************
   1121  1.1  christos  * Special case for 8 byte copies
   1122  1.1  christos  */
   1123  1.1  christos #define	LMEMCPY_8_LOG2	6	/* 64 bytes */
   1124  1.1  christos #define	LMEMCPY_8_PAD	.align LMEMCPY_8_LOG2
   1125  1.1  christos 	LMEMCPY_8_PAD
   1126  1.1  christos .Lmemcpy_8:
   1127  1.1  christos 	and	r2, r1, #0x03		/* r2 = src & 3 */
   1128  1.1  christos 	orr	r2, r2, r0, lsl #2	/* r2 |= dst << 2 */
   1129  1.1  christos 	ands	r2, r2, #0x0f		/* r2 = ((dst & 3) << 2) | (src & 3); Z set when both are 0 */
   1130  1.1  christos 	sub	r3, pc, #0x14		/* r3 = .Lmemcpy_8: pc reads as this insn + 8 = label + 0x14 */
   1131  1.1  christos 	addne	pc, r3, r2, lsl #LMEMCPY_8_LOG2	/* jump to 64-byte slot r2; index 0 falls through to case 0000 */
   1132  1.1  christos 
   1133  1.1  christos /*
   1134  1.1  christos  * 0000: dst is 32-bit aligned, src is 32-bit aligned
   1135  1.1  christos  */
   1136  1.1  christos 	ldr	r2, [r1]		/* r2 = bytes 0-3 */
   1137  1.1  christos 	ldr	r3, [r1, #0x04]		/* r3 = bytes 4-7 */
   1138  1.1  christos 	str	r2, [r0]		/* store bytes 0-3 */
   1139  1.1  christos 	str	r3, [r0, #0x04]		/* store bytes 4-7 */
   1140  1.3      matt 	RET
   1141  1.1  christos 	LMEMCPY_8_PAD
   1142  1.1  christos 
   1143  1.1  christos /*
   1144  1.1  christos  * 0001: dst is 32-bit aligned, src is 8-bit aligned
   1145  1.1  christos  */
   1146  1.1  christos 	ldr	r3, [r1, #-1]		/* BE:r3 = x012  LE:r3 = 210x (x = byte outside the 8 copied) */
   1147  1.1  christos 	ldr	r2, [r1, #0x03]		/* BE:r2 = 3456  LE:r2 = 6543 */
   1148  1.1  christos 	ldrb	r1, [r1, #0x07]		/* r1 = ...7 */
   1149  1.1  christos #ifdef __ARMEB__
   1150  1.1  christos 	mov	r3, r3, lsl #8		/* r3 = 012. */
   1151  1.1  christos 	orr	r3, r3, r2, lsr #24	/* r3 = 0123 */
   1152  1.1  christos 	orr	r2, r1, r2, lsl #8	/* r2 = 4567 */
   1153  1.1  christos #else
   1154  1.1  christos 	mov	r3, r3, lsr #8		/* r3 = .210 */
   1155  1.1  christos 	orr	r3, r3, r2, lsl #24	/* r3 = 3210 */
   1156  1.1  christos 	mov	r1, r1, lsl #24		/* r1 = 7... */
   1157  1.1  christos 	orr	r2, r1, r2, lsr #8	/* r2 = 7654 */
   1158  1.1  christos #endif
   1159  1.1  christos 	str	r3, [r0]		/* store bytes 0-3 */
   1160  1.1  christos 	str	r2, [r0, #0x04]		/* store bytes 4-7 */
   1161  1.3      matt 	RET
   1162  1.1  christos 	LMEMCPY_8_PAD
   1163  1.1  christos 
   1164  1.1  christos /*
   1165  1.1  christos  * 0010: dst is 32-bit aligned, src is 16-bit aligned
   1166  1.1  christos  */
   1167  1.1  christos 	ldrh	r2, [r1]		/* BE:r2 = ..01  LE:r2 = ..10 */
   1168  1.1  christos 	ldr	r3, [r1, #0x02]		/* BE:r3 = 2345  LE:r3 = 5432 */
   1169  1.1  christos 	ldrh	r1, [r1, #0x06]		/* BE:r1 = ..67  LE:r1 = ..76 */
   1170  1.1  christos #ifdef __ARMEB__
   1171  1.1  christos 	mov	r2, r2, lsl #16		/* r2 = 01.. */
   1172  1.1  christos 	orr	r2, r2, r3, lsr #16	/* r2 = 0123 */
   1173  1.1  christos 	orr	r3, r1, r3, lsl #16	/* r3 = 4567 */
   1174  1.1  christos #else
   1175  1.1  christos 	orr	r2, r2, r3, lsl #16	/* r2 = 3210 */
   1176  1.1  christos 	mov	r3, r3, lsr #16		/* r3 = ..54 */
   1177  1.1  christos 	orr	r3, r3, r1, lsl #16	/* r3 = 7654 */
   1178  1.1  christos #endif
   1179  1.1  christos 	str	r2, [r0]		/* store bytes 0-3 */
   1180  1.1  christos 	str	r3, [r0, #0x04]		/* store bytes 4-7 */
   1181  1.3      matt 	RET
   1182  1.1  christos 	LMEMCPY_8_PAD
   1183  1.1  christos 
   1184  1.1  christos /*
   1185  1.1  christos  * 0011: dst is 32-bit aligned, src is 8-bit aligned
   1186  1.1  christos  */
   1187  1.1  christos 	ldrb	r3, [r1]		/* r3 = ...0 */
   1188  1.1  christos 	ldr	r2, [r1, #0x01]		/* BE:r2 = 1234  LE:r2 = 4321 */
   1189  1.1  christos 	ldr	r1, [r1, #0x05]		/* BE:r1 = 567x  LE:r1 = x765 (x = byte outside the 8 copied) */
   1190  1.1  christos #ifdef __ARMEB__
   1191  1.1  christos 	mov	r3, r3, lsl #24		/* r3 = 0... */
   1192  1.1  christos 	orr	r3, r3, r2, lsr #8	/* r3 = 0123 */
   1193  1.1  christos 	mov	r2, r2, lsl #24		/* r2 = 4... */
   1194  1.1  christos 	orr	r2, r2, r1, lsr #8	/* r2 = 4567 */
   1195  1.1  christos #else
   1196  1.1  christos 	orr	r3, r3, r2, lsl #8	/* r3 = 3210 */
   1197  1.1  christos 	mov	r2, r2, lsr #24		/* r2 = ...4 */
   1198  1.1  christos 	orr	r2, r2, r1, lsl #8	/* r2 = 7654 */
   1199  1.1  christos #endif
   1200  1.1  christos 	str	r3, [r0]		/* store bytes 0-3 */
   1201  1.1  christos 	str	r2, [r0, #0x04]		/* store bytes 4-7 */
   1202  1.3      matt 	RET
   1203  1.1  christos 	LMEMCPY_8_PAD
   1204  1.1  christos 
   1205  1.1  christos /*
   1206  1.1  christos  * 0100: dst is 8-bit aligned, src is 32-bit aligned
   1207  1.1  christos  */
   1208  1.1  christos 	ldr	r3, [r1]		/* BE:r3 = 0123  LE:r3 = 3210 */
   1209  1.1  christos 	ldr	r2, [r1, #0x04]		/* BE:r2 = 4567  LE:r2 = 7654 */
   1210  1.1  christos #ifdef __ARMEB__
   1211  1.1  christos 	mov	r1, r3, lsr #24		/* r1 = ...0 */
   1212  1.1  christos 	strb	r1, [r0]		/* store byte 0 */
   1213  1.1  christos 	mov	r1, r3, lsr #8		/* r1 = .012 */
   1214  1.1  christos 	strb	r2, [r0, #0x07]		/* store byte 7 (low byte of r2) */
   1215  1.1  christos 	mov	r3, r3, lsl #24		/* r3 = 3... */
   1216  1.1  christos 	orr	r3, r3, r2, lsr #8	/* r3 = 3456 */
   1217  1.1  christos #else
   1218  1.1  christos 	strb	r3, [r0]		/* store byte 0 (low byte of r3) */
   1219  1.1  christos 	mov	r1, r2, lsr #24		/* r1 = ...7 */
   1220  1.1  christos 	strb	r1, [r0, #0x07]		/* store byte 7 */
   1221  1.1  christos 	mov	r1, r3, lsr #8		/* r1 = .321 */
   1222  1.1  christos 	mov	r3, r3, lsr #24		/* r3 = ...3 */
   1223  1.1  christos 	orr	r3, r3, r2, lsl #8	/* r3 = 6543 */
   1224  1.1  christos #endif
   1225  1.1  christos 	strh	r1, [r0, #0x01]		/* store bytes 1-2 (low half of r1) */
   1226  1.1  christos 	str	r3, [r0, #0x03]		/* store bytes 3-6 */
   1227  1.3      matt 	RET
   1228  1.1  christos 	LMEMCPY_8_PAD
   1229  1.1  christos 
   1230  1.1  christos /*
   1231  1.1  christos  * 0101: dst is 8-bit aligned, src is 8-bit aligned
   1232  1.1  christos  */
   1233  1.1  christos 	ldrb	r2, [r1]		/* r2 = ...0 */
   1234  1.1  christos 	ldrh	r3, [r1, #0x01]		/* BE:r3 = ..12  LE:r3 = ..21 */
   1235  1.1  christos 	ldr	ip, [r1, #0x03]		/* BE:ip = 3456  LE:ip = 6543 */
   1236  1.1  christos 	ldrb	r1, [r1, #0x07]		/* r1 = ...7 */
   1237  1.1  christos 	strb	r2, [r0]		/* store byte 0 */
   1238  1.1  christos 	strh	r3, [r0, #0x01]		/* store bytes 1-2 */
   1239  1.1  christos 	str	ip, [r0, #0x03]		/* store bytes 3-6 */
   1240  1.1  christos 	strb	r1, [r0, #0x07]		/* store byte 7 */
   1241  1.3      matt 	RET
   1242  1.1  christos 	LMEMCPY_8_PAD
   1243  1.1  christos 
   1244  1.1  christos /*
   1245  1.1  christos  * 0110: dst is 8-bit aligned, src is 16-bit aligned
   1246  1.1  christos  */
   1247  1.1  christos 	ldrh	r2, [r1]		/* BE:r2 = ..01  LE:r2 = ..10 */
   1248  1.1  christos 	ldr	r3, [r1, #0x02]		/* BE:r3 = 2345  LE:r3 = 5432 */
   1249  1.1  christos 	ldrh	r1, [r1, #0x06]		/* BE:r1 = ..67  LE:r1 = ..76 */
   1250  1.1  christos #ifdef __ARMEB__
   1251  1.1  christos 	mov	ip, r2, lsr #8		/* ip = ...0 */
   1252  1.1  christos 	strb	ip, [r0]		/* store byte 0 */
   1253  1.1  christos 	mov	ip, r2, lsl #8		/* ip = .01. */
   1254  1.1  christos 	orr	ip, ip, r3, lsr #24	/* ip = .012 */
   1255  1.1  christos 	strb	r1, [r0, #0x07]		/* store byte 7 (low byte of r1) */
   1256  1.1  christos 	mov	r3, r3, lsl #8		/* r3 = 345. */
   1257  1.1  christos 	orr	r3, r3, r1, lsr #8	/* r3 = 3456 */
   1258  1.1  christos #else
   1259  1.1  christos 	strb	r2, [r0]		/* 0 */
   1260  1.1  christos 	mov	ip, r1, lsr #8		/* ip = ...7 */
   1261  1.1  christos 	strb	ip, [r0, #0x07]		/* 7 */
   1262  1.1  christos 	mov	ip, r2, lsr #8		/* ip = ...1 */
   1263  1.1  christos 	orr	ip, ip, r3, lsl #8	/* ip = 4321 */
   1264  1.1  christos 	mov	r3, r3, lsr #8		/* r3 = .543 */
   1265  1.1  christos 	orr	r3, r3, r1, lsl #24	/* r3 = 6543 */
   1266  1.1  christos #endif
   1267  1.1  christos 	strh	ip, [r0, #0x01]		/* store bytes 1-2 (low half of ip) */
   1268  1.1  christos 	str	r3, [r0, #0x03]		/* store bytes 3-6 */
   1269  1.3      matt 	RET
   1270  1.1  christos 	LMEMCPY_8_PAD
   1271  1.1  christos 
   1272  1.1  christos /*
   1273  1.1  christos  * 0111: dst is 8-bit aligned, src is 8-bit aligned
   1274  1.1  christos  */
   1275  1.1  christos 	ldrb	r3, [r1]		/* r3 = ...0 */
   1276  1.1  christos 	ldr	ip, [r1, #0x01]		/* BE:ip = 1234  LE:ip = 4321 */
   1277  1.1  christos 	ldrh	r2, [r1, #0x05]		/* BE:r2 = ..56  LE:r2 = ..65 */
   1278  1.1  christos 	ldrb	r1, [r1, #0x07]		/* r1 = ...7 */
   1279  1.1  christos 	strb	r3, [r0]		/* store byte 0 */
   1280  1.1  christos 	mov	r3, ip, lsr #16		/* BE:r3 = ..12  LE:r3 = ..43 */
   1281  1.1  christos #ifdef __ARMEB__
   1282  1.1  christos 	strh	r3, [r0, #0x01]		/* store bytes 1-2 */
   1283  1.1  christos 	orr	r2, r2, ip, lsl #16	/* r2 = 3456 */
   1284  1.1  christos #else
   1285  1.1  christos 	strh	ip, [r0, #0x01]		/* store bytes 1-2 (low half of ip) */
   1286  1.1  christos 	orr	r2, r3, r2, lsl #16	/* r2 = 6543 */
   1287  1.1  christos #endif
   1288  1.1  christos 	str	r2, [r0, #0x03]		/* store bytes 3-6 */
   1289  1.1  christos 	strb	r1, [r0, #0x07]		/* store byte 7 */
   1290  1.3      matt 	RET
   1291  1.1  christos 	LMEMCPY_8_PAD
   1292  1.1  christos 
   1293  1.1  christos /*
   1294  1.1  christos  * 1000: dst is 16-bit aligned, src is 32-bit aligned
   1295  1.1  christos  */
   1296  1.1  christos 	ldr	r2, [r1]		/* BE:r2 = 0123  LE:r2 = 3210 */
   1297  1.1  christos 	ldr	r3, [r1, #0x04]		/* BE:r3 = 4567  LE:r3 = 7654 */
   1298  1.1  christos 	mov	r1, r2, lsr #16		/* BE:r1 = ..01  LE:r1 = ..32 */
   1299  1.1  christos #ifdef __ARMEB__
   1300  1.1  christos 	strh	r1, [r0]		/* store bytes 0-1 */
   1301  1.1  christos 	mov	r1, r3, lsr #16		/* r1 = ..45 */
   1302  1.1  christos 	orr	r2, r1 ,r2, lsl #16	/* r2 = 2345 */
   1303  1.1  christos #else
   1304  1.1  christos 	strh	r2, [r0]		/* store bytes 0-1 (low half of r2) */
   1305  1.1  christos 	orr	r2, r1, r3, lsl #16	/* r2 = 5432 */
   1306  1.1  christos 	mov	r3, r3, lsr #16		/* r3 = ..76 */
   1307  1.1  christos #endif
   1308  1.1  christos 	str	r2, [r0, #0x02]		/* store bytes 2-5 */
   1309  1.1  christos 	strh	r3, [r0, #0x06]		/* store bytes 6-7 (low half of r3) */
   1310  1.3      matt 	RET
   1311  1.1  christos 	LMEMCPY_8_PAD
   1312  1.1  christos 
   1313  1.1  christos /*
   1314  1.1  christos  * 1001: dst is 16-bit aligned, src is 8-bit aligned
   1315  1.1  christos  */
   1316  1.1  christos 	ldr	r2, [r1, #-1]		/* BE:r2 = x012  LE:r2 = 210x (x = byte outside the 8 copied) */
   1317  1.1  christos 	ldr	r3, [r1, #0x03]		/* BE:r3 = 3456  LE:r3 = 6543 */
   1318  1.1  christos 	ldrb	ip, [r1, #0x07]		/* ip = ...7 */
   1319  1.1  christos 	mov	r1, r2, lsr #8		/* BE:r1 = .x01  LE:r1 = .210 */
   1320  1.1  christos 	strh	r1, [r0]		/* store bytes 0-1 (low half of r1) */
   1321  1.1  christos #ifdef __ARMEB__
   1322  1.1  christos 	mov	r1, r2, lsl #24		/* r1 = 2... */
   1323  1.1  christos 	orr	r1, r1, r3, lsr #8	/* r1 = 2345 */
   1324  1.1  christos 	orr	r3, ip, r3, lsl #8	/* r3 = 4567 */
   1325  1.1  christos #else
   1326  1.1  christos 	mov	r1, r2, lsr #24		/* r1 = ...2 */
   1327  1.1  christos 	orr	r1, r1, r3, lsl #8	/* r1 = 5432 */
   1328  1.1  christos 	mov	r3, r3, lsr #24		/* r3 = ...6 */
   1329  1.1  christos 	orr	r3, r3, ip, lsl #8	/* r3 = ..76 */
   1330  1.1  christos #endif
   1331  1.1  christos 	str	r1, [r0, #0x02]		/* store bytes 2-5 */
   1332  1.1  christos 	strh	r3, [r0, #0x06]		/* store bytes 6-7 (low half of r3) */
   1333  1.3      matt 	RET
   1334  1.1  christos 	LMEMCPY_8_PAD
   1335  1.1  christos 
   1336  1.1  christos /*
   1337  1.1  christos  * 1010: dst is 16-bit aligned, src is 16-bit aligned
   1338  1.1  christos  */
   1339  1.1  christos 	ldrh	r2, [r1]		/* r2 = bytes 0-1 */
   1340  1.1  christos 	ldr	ip, [r1, #0x02]		/* ip = bytes 2-5 */
   1341  1.1  christos 	ldrh	r3, [r1, #0x06]		/* r3 = bytes 6-7 */
   1342  1.1  christos 	strh	r2, [r0]		/* store bytes 0-1 */
   1343  1.1  christos 	str	ip, [r0, #0x02]		/* store bytes 2-5 */
   1344  1.1  christos 	strh	r3, [r0, #0x06]		/* store bytes 6-7 */
   1345  1.3      matt 	RET
   1346  1.1  christos 	LMEMCPY_8_PAD
   1347  1.1  christos 
   1348  1.1  christos /*
   1349  1.1  christos  * 1011: dst is 16-bit aligned, src is 8-bit aligned
   1350  1.1  christos  */
   1351  1.1  christos 	ldr	r3, [r1, #0x05]		/* BE:r3 = 567x  LE:r3 = x765 (x = byte outside the 8 copied) */
   1352  1.1  christos 	ldr	r2, [r1, #0x01]		/* BE:r2 = 1234  LE:r2 = 4321 */
   1353  1.1  christos 	ldrb	ip, [r1]		/* ip = ...0 */
   1354  1.1  christos 	mov	r1, r3, lsr #8		/* BE:r1 = .567  LE:r1 = .x76 */
   1355  1.1  christos 	strh	r1, [r0, #0x06]		/* store bytes 6-7 (low half of r1) */
   1356  1.1  christos #ifdef __ARMEB__
   1357  1.1  christos 	mov	r3, r3, lsr #24		/* r3 = ...5 */
   1358  1.1  christos 	orr	r3, r3, r2, lsl #8	/* r3 = 2345 */
   1359  1.1  christos 	mov	r2, r2, lsr #24		/* r2 = ...1 */
   1360  1.1  christos 	orr	r2, r2, ip, lsl #8	/* r2 = ..01 */
   1361  1.1  christos #else
   1362  1.1  christos 	mov	r3, r3, lsl #24		/* r3 = 5... */
   1363  1.1  christos 	orr	r3, r3, r2, lsr #8	/* r3 = 5432 */
   1364  1.1  christos 	orr	r2, ip, r2, lsl #8	/* r2 = 3210 */
   1365  1.1  christos #endif
   1366  1.1  christos 	str	r3, [r0, #0x02]		/* store bytes 2-5 */
   1367  1.1  christos 	strh	r2, [r0]		/* store bytes 0-1 (low half of r2) */
   1368  1.3      matt 	RET
   1369  1.1  christos 	LMEMCPY_8_PAD
   1370  1.1  christos 
   1371  1.1  christos /*
   1372  1.1  christos  * 1100: dst is 8-bit aligned, src is 32-bit aligned
   1373  1.1  christos  */
   1374  1.1  christos 	ldr	r3, [r1, #0x04]		/* BE:r3 = 4567  LE:r3 = 7654 */
   1375  1.1  christos 	ldr	r2, [r1]		/* BE:r2 = 0123  LE:r2 = 3210 */
   1376  1.1  christos 	mov	r1, r3, lsr #8		/* BE:r1 = .456  LE:r1 = .765 */
   1377  1.1  christos 	strh	r1, [r0, #0x05]		/* store bytes 5-6 (low half of r1) */
   1378  1.1  christos #ifdef __ARMEB__
   1379  1.1  christos 	strb	r3, [r0, #0x07]		/* store byte 7 (low byte of r3) */
   1380  1.1  christos 	mov	r1, r2, lsr #24		/* r1 = ...0 */
   1381  1.1  christos 	strb	r1, [r0]		/* store byte 0 */
   1382  1.1  christos 	mov	r2, r2, lsl #8		/* r2 = 123. */
   1383  1.1  christos 	orr	r2, r2, r3, lsr #24	/* r2 = 1234 */
   1384  1.1  christos 	str	r2, [r0, #0x01]		/* store bytes 1-4 */
   1385  1.1  christos #else
   1386  1.1  christos 	strb	r2, [r0]		/* store byte 0 (low byte of r2) */
   1387  1.1  christos 	mov	r1, r3, lsr #24		/* r1 = ...7 */
   1388  1.1  christos 	strb	r1, [r0, #0x07]		/* store byte 7 */
   1389  1.1  christos 	mov	r2, r2, lsr #8		/* r2 = .321 */
   1390  1.1  christos 	orr	r2, r2, r3, lsl #24	/* r2 = 4321 */
   1391  1.1  christos 	str	r2, [r0, #0x01]		/* store bytes 1-4 */
   1392  1.1  christos #endif
   1393  1.3      matt 	RET
   1394  1.1  christos 	LMEMCPY_8_PAD
   1395  1.1  christos 
   1396  1.1  christos /*
   1397  1.1  christos  * 1101: dst is 8-bit aligned, src is 8-bit aligned
   1398  1.1  christos  */
   1399  1.1  christos 	ldrb	r3, [r1]		/* r3 = ...0 */
   1400  1.1  christos 	ldrh	r2, [r1, #0x01]		/* BE:r2 = ..12  LE:r2 = ..21 */
   1401  1.1  christos 	ldr	ip, [r1, #0x03]		/* BE:ip = 3456  LE:ip = 6543 */
   1402  1.1  christos 	ldrb	r1, [r1, #0x07]		/* r1 = ...7 */
   1403  1.1  christos 	strb	r3, [r0]		/* dst byte 0 */
   1404  1.1  christos 	mov	r3, ip, lsr #16		/* BE:r3 = ..34  LE:r3 = ..65 */
   1405  1.1  christos #ifdef __ARMEB__
   1406  1.1  christos 	strh	ip, [r0, #0x05]		/* low halfword (56): dst bytes 5-6 */
   1407  1.1  christos 	orr	r2, r3, r2, lsl #16	/* r2 = 1234 */
   1408  1.1  christos #else
   1409  1.1  christos 	strh	r3, [r0, #0x05]		/* dst bytes 5-6 */
   1410  1.1  christos 	orr	r2, r2, ip, lsl #16	/* r2 = 4321 */
   1411  1.1  christos #endif
   1412  1.1  christos 	str	r2, [r0, #0x01]		/* dst bytes 1-4 */
   1413  1.1  christos 	strb	r1, [r0, #0x07]		/* dst byte 7 */
   1414  1.3      matt 	RET
   1415  1.1  christos 	LMEMCPY_8_PAD
   1416  1.1  christos 
   1417  1.1  christos /*
   1418  1.1  christos  * 1110: dst is 8-bit aligned, src is 16-bit aligned
   1419  1.1  christos  */
   1420  1.1  christos 	ldrh	r2, [r1]		/* BE:r2 = ..01  LE:r2 = ..10 */
   1421  1.1  christos 	ldr	r3, [r1, #0x02]		/* BE:r3 = 2345  LE:r3 = 5432 */
   1422  1.1  christos 	ldrh	r1, [r1, #0x06]		/* BE:r1 = ..67  LE:r1 = ..76 */
   1423  1.1  christos #ifdef __ARMEB__
   1424  1.1  christos 	mov	ip, r2, lsr #8		/* ip = ...0 */
   1425  1.1  christos 	strb	ip, [r0]		/* dst byte 0 */
   1426  1.1  christos 	mov	ip, r2, lsl #24		/* ip = 1... */
   1427  1.1  christos 	orr	ip, ip, r3, lsr #8	/* ip = 1234 */
   1428  1.1  christos 	strb	r1, [r0, #0x07]		/* low byte only: dst byte 7 */
   1429  1.1  christos 	mov	r1, r1, lsr #8		/* r1 = ...6 */
   1430  1.1  christos 	orr	r1, r1, r3, lsl #8	/* r1 = 3456 */
   1431  1.1  christos #else
   1432  1.1  christos 	strb	r2, [r0]		/* low byte only: dst byte 0 */
   1433  1.1  christos 	mov	ip, r2, lsr #8		/* ip = ...1 */
   1434  1.1  christos 	orr	ip, ip, r3, lsl #8	/* ip = 4321 */
   1435  1.1  christos 	mov	r2, r1, lsr #8		/* r2 = ...7 */
   1436  1.1  christos 	strb	r2, [r0, #0x07]		/* dst byte 7 */
   1437  1.1  christos 	mov	r1, r1, lsl #8		/* r1 = .76. */
   1438  1.1  christos 	orr	r1, r1, r3, lsr #24	/* r1 = .765 */
   1439  1.1  christos #endif
   1440  1.1  christos 	str	ip, [r0, #0x01]		/* dst bytes 1-4 */
   1441  1.1  christos 	strh	r1, [r0, #0x05]		/* low halfword only: dst bytes 5-6 */
   1442  1.3      matt 	RET
   1443  1.1  christos 	LMEMCPY_8_PAD
   1444  1.1  christos 
   1445  1.1  christos /*
   1446  1.1  christos  * 1111: dst is 8-bit aligned, src is 8-bit aligned
   1447  1.1  christos  */
   1448  1.1  christos 	ldrb	r2, [r1]		/* r2 = ...0 */
   1449  1.1  christos 	ldr	ip, [r1, #0x01]		/* BE:ip = 1234  LE:ip = 4321 */
   1450  1.1  christos 	ldrh	r3, [r1, #0x05]		/* BE:r3 = ..56  LE:r3 = ..65 */
   1451  1.1  christos 	ldrb	r1, [r1, #0x07]		/* r1 = ...7 */
   1452  1.1  christos 	strb	r2, [r0]		/* dst byte 0 */
   1453  1.1  christos 	str	ip, [r0, #0x01]		/* dst bytes 1-4, no shifting needed */
   1454  1.1  christos 	strh	r3, [r0, #0x05]		/* dst bytes 5-6 */
   1455  1.1  christos 	strb	r1, [r0, #0x07]		/* dst byte 7 */
   1456  1.3      matt 	RET
   1457  1.1  christos 	LMEMCPY_8_PAD
   1458  1.1  christos 
   1459  1.1  christos /******************************************************************************
   1460  1.1  christos  * Special case for 12 byte copies
   1461  1.1  christos  */
   1462  1.1  christos #define	LMEMCPY_C_LOG2	7	/* 128 bytes per alignment-case slot */
   1463  1.1  christos #define	LMEMCPY_C_PAD	.align LMEMCPY_C_LOG2
   1464  1.1  christos 	LMEMCPY_C_PAD
   1465  1.1  christos .Lmemcpy_c:
   1466  1.1  christos 	and	r2, r1, #0x03		/* r2 = src & 3 */
   1467  1.1  christos 	orr	r2, r2, r0, lsl #2	/* r2 |= dst << 2 */
   1468  1.1  christos 	ands	r2, r2, #0x0f		/* r2 = (dst & 3) << 2 | (src & 3) */
   1469  1.1  christos 	sub	r3, pc, #0x14		/* r3 = .Lmemcpy_c (pc = this insn + 8) */
   1470  1.1  christos 	addne	pc, r3, r2, lsl #LMEMCPY_C_LOG2	/* r2 != 0: jump to slot r2 */
   1471  1.1  christos 
   1472  1.1  christos /*
   1473  1.1  christos  * 0000: dst is 32-bit aligned, src is 32-bit aligned
   1474  1.1  christos  */
   1475  1.1  christos 	ldr	r2, [r1]		/* fall-through entry; r2 = bytes 0-3 */
   1476  1.1  christos 	ldr	r3, [r1, #0x04]		/* r3 = bytes 4-7 */
   1477  1.1  christos 	ldr	r1, [r1, #0x08]		/* r1 = bytes 8-B (src ptr now dead) */
   1478  1.1  christos 	str	r2, [r0]		/* dst bytes 0-3 */
   1479  1.1  christos 	str	r3, [r0, #0x04]		/* dst bytes 4-7 */
   1480  1.1  christos 	str	r1, [r0, #0x08]		/* dst bytes 8-B */
   1481  1.3      matt 	RET
   1482  1.1  christos 	LMEMCPY_C_PAD
   1483  1.1  christos 
   1484  1.1  christos /*
   1485  1.1  christos  * 0001: dst is 32-bit aligned, src is 8-bit aligned
   1486  1.1  christos  */
   1487  1.1  christos 	ldrb	r2, [r1, #0xb]		/* r2 = ...B */
   1488  1.1  christos 	ldr	ip, [r1, #0x07]		/* BE:ip = 789A  LE:ip = A987 */
   1489  1.1  christos 	ldr	r3, [r1, #0x03]		/* BE:r3 = 3456  LE:r3 = 6543 */
   1490  1.1  christos 	ldr	r1, [r1, #-1]		/* BE:r1 = x012  LE:r1 = 210x */
   1491  1.1  christos #ifdef __ARMEB__
   1492  1.1  christos 	orr	r2, r2, ip, lsl #8	/* r2 = 89AB */
   1493  1.1  christos 	str	r2, [r0, #0x08]		/* dst bytes 8-B */
   1494  1.1  christos 	mov	r2, ip, lsr #24		/* r2 = ...7 */
   1495  1.1  christos 	orr	r2, r2, r3, lsl #8	/* r2 = 4567 */
   1496  1.1  christos 	mov	r1, r1, lsl #8		/* r1 = 012. */
   1497  1.1  christos 	orr	r1, r1, r3, lsr #24	/* r1 = 0123 */
   1498  1.1  christos #else
   1499  1.1  christos 	mov	r2, r2, lsl #24		/* r2 = B... */
   1500  1.1  christos 	orr	r2, r2, ip, lsr #8	/* r2 = BA98 */
   1501  1.1  christos 	str	r2, [r0, #0x08]		/* dst bytes 8-B */
   1502  1.1  christos 	mov	r2, ip, lsl #24		/* r2 = 7... */
   1503  1.1  christos 	orr	r2, r2, r3, lsr #8	/* r2 = 7654 */
   1504  1.1  christos 	mov	r1, r1, lsr #8		/* r1 = .210 */
   1505  1.1  christos 	orr	r1, r1, r3, lsl #24	/* r1 = 3210 */
   1506  1.1  christos #endif
   1507  1.1  christos 	str	r2, [r0, #0x04]		/* dst bytes 4-7 */
   1508  1.1  christos 	str	r1, [r0]		/* dst bytes 0-3 */
   1509  1.3      matt 	RET
   1510  1.1  christos 	LMEMCPY_C_PAD
   1511  1.1  christos 
   1512  1.1  christos /*
   1513  1.1  christos  * 0010: dst is 32-bit aligned, src is 16-bit aligned
   1514  1.1  christos  */
   1515  1.1  christos 	ldrh	r2, [r1]		/* BE:r2 = ..01  LE:r2 = ..10 */
   1516  1.1  christos 	ldr	r3, [r1, #0x02]		/* BE:r3 = 2345  LE:r3 = 5432 */
   1517  1.1  christos 	ldr	ip, [r1, #0x06]		/* BE:ip = 6789  LE:ip = 9876 */
   1518  1.1  christos 	ldrh	r1, [r1, #0x0a]		/* BE:r1 = ..AB  LE:r1 = ..BA */
   1519  1.1  christos #ifdef __ARMEB__
   1520  1.1  christos 	mov	r2, r2, lsl #16		/* r2 = 01.. */
   1521  1.1  christos 	orr	r2, r2, r3, lsr #16	/* r2 = 0123 */
   1522  1.1  christos 	str	r2, [r0]		/* dst bytes 0-3 */
   1523  1.1  christos 	mov	r3, r3, lsl #16		/* r3 = 45.. */
   1524  1.1  christos 	orr	r3, r3, ip, lsr #16	/* r3 = 4567 */
   1525  1.1  christos 	orr	r1, r1, ip, lsl #16	/* r1 = 89AB */
   1526  1.1  christos #else
   1527  1.1  christos 	orr	r2, r2, r3, lsl #16	/* r2 = 3210 */
   1528  1.1  christos 	str	r2, [r0]		/* dst bytes 0-3 */
   1529  1.1  christos 	mov	r3, r3, lsr #16		/* r3 = ..54 */
   1530  1.1  christos 	orr	r3, r3, ip, lsl #16	/* r3 = 7654 */
   1531  1.1  christos 	mov	r1, r1, lsl #16		/* r1 = BA.. */
   1532  1.1  christos 	orr	r1, r1, ip, lsr #16	/* r1 = BA98 */
   1533  1.1  christos #endif
   1534  1.1  christos 	str	r3, [r0, #0x04]		/* dst bytes 4-7 */
   1535  1.1  christos 	str	r1, [r0, #0x08]		/* dst bytes 8-B */
   1536  1.3      matt 	RET
   1537  1.1  christos 	LMEMCPY_C_PAD
   1538  1.1  christos 
   1539  1.1  christos /*
   1540  1.1  christos  * 0011: dst is 32-bit aligned, src is 8-bit aligned
   1541  1.1  christos  */
   1542  1.1  christos 	ldrb	r2, [r1]		/* r2 = ...0 */
   1543  1.1  christos 	ldr	r3, [r1, #0x01]		/* BE:r3 = 1234  LE:r3 = 4321 */
   1544  1.1  christos 	ldr	ip, [r1, #0x05]		/* BE:ip = 5678  LE:ip = 8765 */
   1545  1.1  christos 	ldr	r1, [r1, #0x09]		/* BE:r1 = 9ABx  LE:r1 = xBA9 */
   1546  1.1  christos #ifdef __ARMEB__
   1547  1.1  christos 	mov	r2, r2, lsl #24		/* r2 = 0... */
   1548  1.1  christos 	orr	r2, r2, r3, lsr #8	/* r2 = 0123 */
   1549  1.1  christos 	str	r2, [r0]		/* dst bytes 0-3 */
   1550  1.1  christos 	mov	r3, r3, lsl #24		/* r3 = 4... */
   1551  1.1  christos 	orr	r3, r3, ip, lsr #8	/* r3 = 4567 */
   1552  1.1  christos 	mov	r1, r1, lsr #8		/* r1 = .9AB */
   1553  1.1  christos 	orr	r1, r1, ip, lsl #24	/* r1 = 89AB */
   1554  1.1  christos #else
   1555  1.1  christos 	orr	r2, r2, r3, lsl #8	/* r2 = 3210 */
   1556  1.1  christos 	str	r2, [r0]		/* dst bytes 0-3 */
   1557  1.1  christos 	mov	r3, r3, lsr #24		/* r3 = ...4 */
   1558  1.1  christos 	orr	r3, r3, ip, lsl #8	/* r3 = 7654 */
   1559  1.1  christos 	mov	r1, r1, lsl #8		/* r1 = BA9. */
   1560  1.1  christos 	orr	r1, r1, ip, lsr #24	/* r1 = BA98 */
   1561  1.1  christos #endif
   1562  1.1  christos 	str	r3, [r0, #0x04]		/* dst bytes 4-7 */
   1563  1.1  christos 	str	r1, [r0, #0x08]		/* dst bytes 8-B */
   1564  1.3      matt 	RET
   1565  1.1  christos 	LMEMCPY_C_PAD
   1566  1.1  christos 
   1567  1.1  christos /*
   1568  1.1  christos  * 0100: dst is 8-bit aligned (byte 1), src is 32-bit aligned
   1569  1.1  christos  */
   1570  1.1  christos 	ldr	r2, [r1]		/* BE:r2 = 0123  LE:r2 = 3210 */
   1571  1.1  christos 	ldr	r3, [r1, #0x04]		/* BE:r3 = 4567  LE:r3 = 7654 */
   1572  1.1  christos 	ldr	ip, [r1, #0x08]		/* BE:ip = 89AB  LE:ip = BA98 */
   1573  1.1  christos 	mov	r1, r2, lsr #8		/* BE:r1 = .012  LE:r1 = .321 */
   1574  1.1  christos 	strh	r1, [r0, #0x01]		/* low halfword only: dst bytes 1-2 */
   1575  1.1  christos #ifdef __ARMEB__
   1576  1.1  christos 	mov	r1, r2, lsr #24		/* r1 = ...0 */
   1577  1.1  christos 	strb	r1, [r0]		/* dst byte 0 */
   1578  1.1  christos 	mov	r1, r2, lsl #24		/* r1 = 3... */
   1579  1.1  christos 	orr	r2, r1, r3, lsr #8	/* r2 = 3456 */
   1580  1.1  christos 	mov	r1, r3, lsl #24		/* r1 = 7... */
   1581  1.1  christos 	orr	r1, r1, ip, lsr #8	/* r1 = 789A */
   1582  1.1  christos #else
   1583  1.1  christos 	strb	r2, [r0]		/* low byte only: dst byte 0 */
   1584  1.1  christos 	mov	r1, r2, lsr #24		/* r1 = ...3 */
   1585  1.1  christos 	orr	r2, r1, r3, lsl #8	/* r2 = 6543 */
   1586  1.1  christos 	mov	r1, r3, lsr #24		/* r1 = ...7 */
   1587  1.1  christos 	orr	r1, r1, ip, lsl #8	/* r1 = A987 */
   1588  1.1  christos 	mov	ip, ip, lsr #24		/* ip = ...B */
   1589  1.1  christos #endif
   1590  1.1  christos 	str	r2, [r0, #0x03]		/* dst bytes 3-6 */
   1591  1.1  christos 	str	r1, [r0, #0x07]		/* dst bytes 7-A */
   1592  1.1  christos 	strb	ip, [r0, #0x0b]		/* low byte only (BE: ip still 89AB): dst byte B */
   1593  1.3      matt 	RET
   1594  1.1  christos 	LMEMCPY_C_PAD
   1595  1.1  christos 
   1596  1.1  christos /*
   1597  1.1  christos  * 0101: dst is 8-bit aligned (byte 1), src is 8-bit aligned (byte 1)
   1598  1.1  christos  */
   1599  1.1  christos 	ldrb	r2, [r1]		/* r2 = ...0 */
   1600  1.1  christos 	ldrh	r3, [r1, #0x01]		/* BE:r3 = ..12  LE:r3 = ..21 */
   1601  1.1  christos 	ldr	ip, [r1, #0x03]		/* BE:ip = 3456  LE:ip = 6543 */
   1602  1.1  christos 	strb	r2, [r0]		/* dst byte 0; frees r2 for the next load */
   1603  1.1  christos 	ldr	r2, [r1, #0x07]		/* BE:r2 = 789A  LE:r2 = A987 */
   1604  1.1  christos 	ldrb	r1, [r1, #0x0b]		/* r1 = ...B */
   1605  1.1  christos 	strh	r3, [r0, #0x01]		/* dst bytes 1-2 */
   1606  1.1  christos 	str	ip, [r0, #0x03]		/* dst bytes 3-6 */
   1607  1.1  christos 	str	r2, [r0, #0x07]		/* dst bytes 7-A */
   1608  1.1  christos 	strb	r1, [r0, #0x0b]		/* dst byte B */
   1609  1.3      matt 	RET
   1610  1.1  christos 	LMEMCPY_C_PAD
   1611  1.1  christos 
   1612  1.1  christos /*
   1613  1.1  christos  * 0110: dst is 8-bit aligned (byte 1), src is 16-bit aligned
   1614  1.1  christos  */
   1615  1.1  christos 	ldrh	r2, [r1]		/* BE:r2 = ..01  LE:r2 = ..10 */
   1616  1.1  christos 	ldr	r3, [r1, #0x02]		/* BE:r3 = 2345  LE:r3 = 5432 */
   1617  1.1  christos 	ldr	ip, [r1, #0x06]		/* BE:ip = 6789  LE:ip = 9876 */
   1618  1.1  christos 	ldrh	r1, [r1, #0x0a]		/* BE:r1 = ..AB  LE:r1 = ..BA */
   1619  1.1  christos #ifdef __ARMEB__
   1620  1.1  christos 	mov	r2, r2, ror #8		/* r2 = 1..0 */
   1621  1.1  christos 	strb	r2, [r0]		/* low byte only: dst byte 0 */
   1622  1.1  christos 	mov	r2, r2, lsr #16		/* r2 = ..1. */
   1623  1.1  christos 	orr	r2, r2, r3, lsr #24	/* r2 = ..12 */
   1624  1.1  christos 	strh	r2, [r0, #0x01]		/* dst bytes 1-2 */
   1625  1.1  christos 	mov	r2, r3, lsl #8		/* r2 = 345. */
   1626  1.1  christos 	orr	r3, r2, ip, lsr #24	/* r3 = 3456 */
   1627  1.1  christos 	mov	r2, ip, lsl #8		/* r2 = 789. */
   1628  1.1  christos 	orr	r2, r2, r1, lsr #8	/* r2 = 789A */
   1629  1.1  christos #else
   1630  1.1  christos 	strb	r2, [r0]		/* low byte only: dst byte 0 */
   1631  1.1  christos 	mov	r2, r2, lsr #8		/* r2 = ...1 */
   1632  1.1  christos 	orr	r2, r2, r3, lsl #8	/* r2 = 4321 */
   1633  1.1  christos 	strh	r2, [r0, #0x01]		/* low halfword only: dst bytes 1-2 */
   1634  1.1  christos 	mov	r2, r3, lsr #8		/* r2 = .543 */
   1635  1.1  christos 	orr	r3, r2, ip, lsl #24	/* r3 = 6543 */
   1636  1.1  christos 	mov	r2, ip, lsr #8		/* r2 = .987 */
   1637  1.1  christos 	orr	r2, r2, r1, lsl #24	/* r2 = A987 */
   1638  1.1  christos 	mov	r1, r1, lsr #8		/* r1 = ...B */
   1639  1.1  christos #endif
   1640  1.1  christos 	str	r3, [r0, #0x03]		/* dst bytes 3-6 */
   1641  1.1  christos 	str	r2, [r0, #0x07]		/* dst bytes 7-A */
   1642  1.1  christos 	strb	r1, [r0, #0x0b]		/* low byte only (BE: r1 still ..AB): dst byte B */
   1643  1.3      matt 	RET
   1644  1.1  christos 	LMEMCPY_C_PAD
   1645  1.1  christos 
   1646  1.1  christos /*
   1647  1.1  christos  * 0111: dst is 8-bit aligned (byte 1), src is 8-bit aligned (byte 3)
   1648  1.1  christos  */
   1649  1.1  christos 	ldrb	r2, [r1]		/* r2 = ...0 */
   1650  1.1  christos 	ldr	r3, [r1, #0x01]		/* BE:r3 = 1234  LE:r3 = 4321 */
   1651  1.1  christos 	ldr	ip, [r1, #0x05]		/* BE:ip = 5678  LE:ip = 8765 */
   1652  1.1  christos 	ldr	r1, [r1, #0x09]		/* BE:r1 = 9ABx  LE:r1 = xBA9 */
   1653  1.1  christos 	strb	r2, [r0]		/* dst byte 0 */
   1654  1.1  christos #ifdef __ARMEB__
   1655  1.1  christos 	mov	r2, r3, lsr #16		/* r2 = ..12 */
   1656  1.1  christos 	strh	r2, [r0, #0x01]		/* dst bytes 1-2 */
   1657  1.1  christos 	mov	r3, r3, lsl #16		/* r3 = 34.. */
   1658  1.1  christos 	orr	r3, r3, ip, lsr #16	/* r3 = 3456 */
   1659  1.1  christos 	mov	ip, ip, lsl #16		/* ip = 78.. */
   1660  1.1  christos 	orr	ip, ip, r1, lsr #16	/* ip = 789A */
   1661  1.1  christos 	mov	r1, r1, lsr #8		/* r1 = .9AB */
   1662  1.1  christos #else
   1663  1.1  christos 	strh	r3, [r0, #0x01]		/* low halfword only: dst bytes 1-2 */
   1664  1.1  christos 	mov	r3, r3, lsr #16		/* r3 = ..43 */
   1665  1.1  christos 	orr	r3, r3, ip, lsl #16	/* r3 = 6543 */
   1666  1.1  christos 	mov	ip, ip, lsr #16		/* ip = ..87 */
   1667  1.1  christos 	orr	ip, ip, r1, lsl #16	/* ip = A987 */
   1668  1.1  christos 	mov	r1, r1, lsr #16		/* r1 = ..xB */
   1669  1.1  christos #endif
   1670  1.1  christos 	str	r3, [r0, #0x03]		/* dst bytes 3-6 */
   1671  1.1  christos 	str	ip, [r0, #0x07]		/* dst bytes 7-A */
   1672  1.1  christos 	strb	r1, [r0, #0x0b]		/* low byte only: dst byte B */
   1673  1.3      matt 	RET
   1674  1.1  christos 	LMEMCPY_C_PAD
   1675  1.1  christos 
   1676  1.1  christos /*
   1677  1.1  christos  * 1000: dst is 16-bit aligned, src is 32-bit aligned
   1678  1.1  christos  */
   1679  1.1  christos 	ldr	ip, [r1]		/* BE:ip = 0123  LE:ip = 3210 */
   1680  1.1  christos 	ldr	r3, [r1, #0x04]		/* BE:r3 = 4567  LE:r3 = 7654 */
   1681  1.1  christos 	ldr	r2, [r1, #0x08]		/* BE:r2 = 89AB  LE:r2 = BA98 */
   1682  1.1  christos 	mov	r1, ip, lsr #16		/* BE:r1 = ..01  LE:r1 = ..32 */
   1683  1.1  christos #ifdef __ARMEB__
   1684  1.1  christos 	strh	r1, [r0]		/* dst bytes 0-1 */
   1685  1.1  christos 	mov	r1, ip, lsl #16		/* r1 = 23.. */
   1686  1.1  christos 	orr	r1, r1, r3, lsr #16	/* r1 = 2345 */
   1687  1.1  christos 	mov	r3, r3, lsl #16		/* r3 = 67.. */
   1688  1.1  christos 	orr	r3, r3, r2, lsr #16	/* r3 = 6789 */
   1689  1.1  christos #else
   1690  1.1  christos 	strh	ip, [r0]		/* low halfword only: dst bytes 0-1 */
   1691  1.1  christos 	orr	r1, r1, r3, lsl #16	/* r1 = 5432 */
   1692  1.1  christos 	mov	r3, r3, lsr #16		/* r3 = ..76 */
   1693  1.1  christos 	orr	r3, r3, r2, lsl #16	/* r3 = 9876 */
   1694  1.1  christos 	mov	r2, r2, lsr #16		/* r2 = ..BA */
   1695  1.1  christos #endif
   1696  1.1  christos 	str	r1, [r0, #0x02]		/* dst bytes 2-5 */
   1697  1.1  christos 	str	r3, [r0, #0x06]		/* dst bytes 6-9 */
   1698  1.1  christos 	strh	r2, [r0, #0x0a]		/* low halfword only (BE: r2 still 89AB): dst bytes A-B */
   1699  1.3      matt 	RET
   1700  1.1  christos 	LMEMCPY_C_PAD
   1701  1.1  christos 
   1702  1.1  christos /*
   1703  1.1  christos  * 1001: dst is 16-bit aligned, src is 8-bit aligned (byte 1)
   1704  1.1  christos  */
   1705  1.1  christos 	ldr	r2, [r1, #-1]		/* BE:r2 = x012  LE:r2 = 210x */
   1706  1.1  christos 	ldr	r3, [r1, #0x03]		/* BE:r3 = 3456  LE:r3 = 6543 */
   1707  1.1  christos 	mov	ip, r2, lsr #8		/* BE:ip = .x01  LE:ip = .210 */
   1708  1.1  christos 	strh	ip, [r0]		/* low halfword only: dst bytes 0-1 */
   1709  1.1  christos 	ldr	ip, [r1, #0x07]		/* BE:ip = 789A  LE:ip = A987 */
   1710  1.1  christos 	ldrb	r1, [r1, #0x0b]		/* r1 = ...B */
   1711  1.1  christos #ifdef __ARMEB__
   1712  1.1  christos 	mov	r2, r2, lsl #24		/* r2 = 2... */
   1713  1.1  christos 	orr	r2, r2, r3, lsr #8	/* r2 = 2345 */
   1714  1.1  christos 	mov	r3, r3, lsl #24		/* r3 = 6... */
   1715  1.1  christos 	orr	r3, r3, ip, lsr #8	/* r3 = 6789 */
   1716  1.1  christos 	orr	r1, r1, ip, lsl #8	/* r1 = 89AB */
   1717  1.1  christos #else
   1718  1.1  christos 	mov	r2, r2, lsr #24		/* r2 = ...2 */
   1719  1.1  christos 	orr	r2, r2, r3, lsl #8	/* r2 = 5432 */
   1720  1.1  christos 	mov	r3, r3, lsr #24		/* r3 = ...6 */
   1721  1.1  christos 	orr	r3, r3, ip, lsl #8	/* r3 = 9876 */
   1722  1.1  christos 	mov	r1, r1, lsl #8		/* r1 = ..B. */
   1723  1.1  christos 	orr	r1, r1, ip, lsr #24	/* r1 = ..BA */
   1724  1.1  christos #endif
   1725  1.1  christos 	str	r2, [r0, #0x02]		/* dst bytes 2-5 */
   1726  1.1  christos 	str	r3, [r0, #0x06]		/* dst bytes 6-9 */
   1727  1.1  christos 	strh	r1, [r0, #0x0a]		/* low halfword only: dst bytes A-B */
   1728  1.3      matt 	RET
   1729  1.1  christos 	LMEMCPY_C_PAD
   1730  1.1  christos 
   1731  1.1  christos /*
   1732  1.1  christos  * 1010: dst is 16-bit aligned, src is 16-bit aligned
   1733  1.1  christos  */
   1734  1.1  christos 	ldrh	r2, [r1]		/* BE:r2 = ..01  LE:r2 = ..10 */
   1735  1.1  christos 	ldr	r3, [r1, #0x02]		/* BE:r3 = 2345  LE:r3 = 5432 */
   1736  1.1  christos 	ldr	ip, [r1, #0x06]		/* BE:ip = 6789  LE:ip = 9876 */
   1737  1.1  christos 	ldrh	r1, [r1, #0x0a]		/* BE:r1 = ..AB  LE:r1 = ..BA */
   1738  1.1  christos 	strh	r2, [r0]		/* dst bytes 0-1 */
   1739  1.1  christos 	str	r3, [r0, #0x02]		/* dst bytes 2-5, no shifting needed */
   1740  1.1  christos 	str	ip, [r0, #0x06]		/* dst bytes 6-9 */
   1741  1.1  christos 	strh	r1, [r0, #0x0a]		/* dst bytes A-B */
   1742  1.3      matt 	RET
   1743  1.1  christos 	LMEMCPY_C_PAD
   1744  1.1  christos 
   1745  1.1  christos /*
   1746  1.1  christos  * 1011: dst is 16-bit aligned, src is 8-bit aligned (byte 3)
   1747  1.1  christos  */
   1748  1.1  christos 	ldr	r2, [r1, #0x09]		/* BE:r2 = 9ABx  LE:r2 = xBA9 */
   1749  1.1  christos 	ldr	r3, [r1, #0x05]		/* BE:r3 = 5678  LE:r3 = 8765 */
   1750  1.1  christos 	mov	ip, r2, lsr #8		/* BE:ip = .9AB  LE:ip = .xBA */
   1751  1.1  christos 	strh	ip, [r0, #0x0a]		/* low halfword only: dst bytes A-B */
   1752  1.1  christos 	ldr	ip, [r1, #0x01]		/* BE:ip = 1234  LE:ip = 4321 */
   1753  1.1  christos 	ldrb	r1, [r1]		/* r1 = ...0 */
   1754  1.1  christos #ifdef __ARMEB__
   1755  1.1  christos 	mov	r2, r2, lsr #24		/* r2 = ...9 */
   1756  1.1  christos 	orr	r2, r2, r3, lsl #8	/* r2 = 6789 */
   1757  1.1  christos 	mov	r3, r3, lsr #24		/* r3 = ...5 */
   1758  1.1  christos 	orr	r3, r3, ip, lsl #8	/* r3 = 2345 */
   1759  1.1  christos 	mov	r1, r1, lsl #8		/* r1 = ..0. */
   1760  1.1  christos 	orr	r1, r1, ip, lsr #24	/* r1 = ..01 */
   1761  1.1  christos #else
   1762  1.1  christos 	mov	r2, r2, lsl #24		/* r2 = 9... */
   1763  1.1  christos 	orr	r2, r2, r3, lsr #8	/* r2 = 9876 */
   1764  1.1  christos 	mov	r3, r3, lsl #24		/* r3 = 5... */
   1765  1.1  christos 	orr	r3, r3, ip, lsr #8	/* r3 = 5432 */
   1766  1.1  christos 	orr	r1, r1, ip, lsl #8	/* r1 = 3210 */
   1767  1.1  christos #endif
   1768  1.1  christos 	str	r2, [r0, #0x06]		/* dst bytes 6-9 */
   1769  1.1  christos 	str	r3, [r0, #0x02]		/* dst bytes 2-5 */
   1770  1.1  christos 	strh	r1, [r0]		/* low halfword only: dst bytes 0-1 */
   1771  1.3      matt 	RET
   1772  1.1  christos 	LMEMCPY_C_PAD
   1773  1.1  christos 
   1774  1.1  christos /*
   1775  1.1  christos  * 1100: dst is 8-bit aligned (byte 3), src is 32-bit aligned
   1776  1.1  christos  */
   1777  1.1  christos 	ldr	r2, [r1]		/* BE:r2 = 0123  LE:r2 = 3210 */
   1778  1.1  christos 	ldr	ip, [r1, #0x04]		/* BE:ip = 4567  LE:ip = 7654 */
   1779  1.1  christos 	ldr	r1, [r1, #0x08]		/* BE:r1 = 89AB  LE:r1 = BA98 */
   1780  1.1  christos #ifdef __ARMEB__
   1781  1.1  christos 	mov	r3, r2, lsr #24		/* r3 = ...0 */
   1782  1.1  christos 	strb	r3, [r0]		/* dst byte 0 */
   1783  1.1  christos 	mov	r2, r2, lsl #8		/* r2 = 123. */
   1784  1.1  christos 	orr	r2, r2, ip, lsr #24	/* r2 = 1234 */
   1785  1.1  christos 	str	r2, [r0, #0x01]		/* dst bytes 1-4 */
   1786  1.1  christos 	mov	r2, ip, lsl #8		/* r2 = 567. */
   1787  1.1  christos 	orr	r2, r2, r1, lsr #24	/* r2 = 5678 */
   1788  1.1  christos 	str	r2, [r0, #0x05]		/* dst bytes 5-8 */
   1789  1.1  christos 	mov	r2, r1, lsr #8		/* r2 = .89A */
   1790  1.1  christos 	strh	r2, [r0, #0x09]		/* low halfword only: dst bytes 9-A */
   1791  1.1  christos 	strb	r1, [r0, #0x0b]		/* low byte only: dst byte B */
   1792  1.1  christos #else
   1793  1.1  christos 	strb	r2, [r0]		/* low byte only: dst byte 0 */
   1794  1.1  christos 	mov	r3, r2, lsr #8		/* r3 = .321 */
   1795  1.1  christos 	orr	r3, r3, ip, lsl #24	/* r3 = 4321 */
   1796  1.1  christos 	str	r3, [r0, #0x01]		/* dst bytes 1-4 */
   1797  1.1  christos 	mov	r3, ip, lsr #8		/* r3 = .765 */
   1798  1.1  christos 	orr	r3, r3, r1, lsl #24	/* r3 = 8765 */
   1799  1.1  christos 	str	r3, [r0, #0x05]		/* dst bytes 5-8 */
   1800  1.1  christos 	mov	r1, r1, lsr #8		/* r1 = .BA9 */
   1801  1.1  christos 	strh	r1, [r0, #0x09]		/* low halfword only: dst bytes 9-A */
   1802  1.1  christos 	mov	r1, r1, lsr #16		/* r1 = ...B */
   1803  1.1  christos 	strb	r1, [r0, #0x0b]		/* dst byte B */
   1804  1.1  christos #endif
   1805  1.3      matt 	RET
   1806  1.1  christos 	LMEMCPY_C_PAD
   1807  1.1  christos 
   1808  1.1  christos /*
   1809  1.1  christos  * 1101: dst is 8-bit aligned (byte 3), src is 8-bit aligned (byte 1)
   1810  1.1  christos  */
   1811  1.1  christos 	ldrb	r2, [r1, #0x0b]		/* r2 = ...B */
   1812  1.1  christos 	ldr	r3, [r1, #0x07]		/* BE:r3 = 789A  LE:r3 = A987 */
   1813  1.1  christos 	ldr	ip, [r1, #0x03]		/* BE:ip = 3456  LE:ip = 6543 */
   1814  1.1  christos 	ldr	r1, [r1, #-1]		/* BE:r1 = x012  LE:r1 = 210x */
   1815  1.1  christos 	strb	r2, [r0, #0x0b]		/* dst byte B */
   1816  1.1  christos #ifdef __ARMEB__
   1817  1.1  christos 	strh	r3, [r0, #0x09]		/* low halfword (9A): dst bytes 9-A */
   1818  1.1  christos 	mov	r3, r3, lsr #16		/* r3 = ..78 */
   1819  1.1  christos 	orr	r3, r3, ip, lsl #16	/* r3 = 5678 */
   1820  1.1  christos 	mov	ip, ip, lsr #16		/* ip = ..34 */
   1821  1.1  christos 	orr	ip, ip, r1, lsl #16	/* ip = 1234 */
   1822  1.1  christos 	mov	r1, r1, lsr #16		/* r1 = ..x0 */
   1823  1.1  christos #else
   1824  1.1  christos 	mov	r2, r3, lsr #16		/* r2 = ..A9 */
   1825  1.1  christos 	strh	r2, [r0, #0x09]		/* dst bytes 9-A */
   1826  1.1  christos 	mov	r3, r3, lsl #16		/* r3 = 87.. */
   1827  1.1  christos 	orr	r3, r3, ip, lsr #16	/* r3 = 8765 */
   1828  1.1  christos 	mov	ip, ip, lsl #16		/* ip = 43.. */
   1829  1.1  christos 	orr	ip, ip, r1, lsr #16	/* ip = 4321 */
   1830  1.1  christos 	mov	r1, r1, lsr #8		/* r1 = .210 */
   1831  1.1  christos #endif
   1832  1.1  christos 	str	r3, [r0, #0x05]		/* dst bytes 5-8 */
   1833  1.1  christos 	str	ip, [r0, #0x01]		/* dst bytes 1-4 */
   1834  1.1  christos 	strb	r1, [r0]		/* low byte only: dst byte 0 */
   1835  1.3      matt 	RET
   1836  1.1  christos 	LMEMCPY_C_PAD
   1837  1.1  christos 
   1838  1.1  christos /*
   1839  1.1  christos  * 1110: dst is 8-bit aligned (byte 3), src is 16-bit aligned
   1840  1.1  christos  */
   1841  1.1  christos #ifdef __ARMEB__
   1842  1.1  christos 	ldrh	r2, [r1, #0x0a]		/* r2 = ..AB */
   1843  1.1  christos 	ldr	ip, [r1, #0x06]		/* ip = 6789 */
   1844  1.1  christos 	ldr	r3, [r1, #0x02]		/* r3 = 2345 */
   1845  1.1  christos 	ldrh	r1, [r1]		/* r1 = ..01 */
   1846  1.1  christos 	strb	r2, [r0, #0x0b]		/* low byte only: dst byte B */
   1847  1.1  christos 	mov	r2, r2, lsr #8		/* r2 = ...A */
   1848  1.1  christos 	orr	r2, r2, ip, lsl #8	/* r2 = 789A */
   1849  1.1  christos 	mov	ip, ip, lsr #8		/* ip = .678 */
   1850  1.1  christos 	orr	ip, ip, r3, lsl #24	/* ip = 5678 */
   1851  1.1  christos 	mov	r3, r3, lsr #8		/* r3 = .234 */
   1852  1.1  christos 	orr	r3, r3, r1, lsl #24	/* r3 = 1234 */
   1853  1.1  christos 	mov	r1, r1, lsr #8		/* r1 = ...0 */
   1854  1.1  christos 	strb	r1, [r0]		/* dst byte 0 */
   1855  1.1  christos 	str	r3, [r0, #0x01]		/* dst bytes 1-4 */
   1856  1.1  christos 	str	ip, [r0, #0x05]		/* dst bytes 5-8 */
   1857  1.1  christos 	strh	r2, [r0, #0x09]		/* low halfword only: dst bytes 9-A */
   1858  1.1  christos #else
   1859  1.1  christos 	ldrh	r2, [r1]		/* r2 = ..10 */
   1860  1.1  christos 	ldr	r3, [r1, #0x02]		/* r3 = 5432 */
   1861  1.1  christos 	ldr	ip, [r1, #0x06]		/* ip = 9876 */
   1862  1.1  christos 	ldrh	r1, [r1, #0x0a]		/* r1 = ..BA */
   1863  1.1  christos 	strb	r2, [r0]		/* low byte only: dst byte 0 */
   1864  1.1  christos 	mov	r2, r2, lsr #8		/* r2 = ...1 */
   1865  1.1  christos 	orr	r2, r2, r3, lsl #8	/* r2 = 4321 */
   1866  1.1  christos 	mov	r3, r3, lsr #24		/* r3 = ...5 */
   1867  1.1  christos 	orr	r3, r3, ip, lsl #8	/* r3 = 8765 */
   1868  1.1  christos 	mov	ip, ip, lsr #24		/* ip = ...9 */
   1869  1.1  christos 	orr	ip, ip, r1, lsl #8	/* ip = .BA9 */
   1870  1.1  christos 	mov	r1, r1, lsr #8		/* r1 = ...B */
   1871  1.1  christos 	str	r2, [r0, #0x01]		/* dst bytes 1-4 */
   1872  1.1  christos 	str	r3, [r0, #0x05]		/* dst bytes 5-8 */
   1873  1.1  christos 	strh	ip, [r0, #0x09]		/* low halfword only: dst bytes 9-A */
   1874  1.1  christos 	strb	r1, [r0, #0x0b]		/* dst byte B */
   1875  1.1  christos #endif
   1876  1.3      matt 	RET
   1877  1.1  christos 	LMEMCPY_C_PAD
   1878  1.1  christos 
   1879  1.1  christos /*
   1880  1.1  christos  * 1111: dst is 8-bit aligned (byte 3), src is 8-bit aligned (byte 3)
   1881  1.1  christos  */
   1882  1.1  christos 	ldrb	r2, [r1]		/* r2 = ...0 */
   1883  1.1  christos 	ldr	r3, [r1, #0x01]		/* BE:r3 = 1234  LE:r3 = 4321 */
   1884  1.1  christos 	ldr	ip, [r1, #0x05]		/* BE:ip = 5678  LE:ip = 8765 */
   1885  1.1  christos 	strb	r2, [r0]		/* dst byte 0; frees r2 for the next load */
   1886  1.1  christos 	ldrh	r2, [r1, #0x09]		/* BE:r2 = ..9A  LE:r2 = ..A9 */
   1887  1.1  christos 	ldrb	r1, [r1, #0x0b]		/* r1 = ...B */
   1888  1.1  christos 	str	r3, [r0, #0x01]		/* dst bytes 1-4, no shifting needed */
   1889  1.1  christos 	str	ip, [r0, #0x05]		/* dst bytes 5-8 */
   1890  1.1  christos 	strh	r2, [r0, #0x09]		/* dst bytes 9-A */
   1891  1.1  christos 	strb	r1, [r0, #0x0b]		/* dst byte B */
   1892  1.3      matt 	RET
   1893  1.4      matt END(memcpy)
   1894  1.1  christos #endif	/* !_STANDALONE */
   1895