/*	$NetBSD: memcpy.c,v 1.1 2014/09/03 19:34:25 matt Exp $	*/
/*-
 * Copyright (c) 2014 The NetBSD Foundation, Inc.
 * All rights reserved.
 *
 * This code is derived from software contributed to The NetBSD Foundation
 * by Matt Thomas of 3am Software Foundry.
 *
 * Redistribution and use in source and binary forms, with or without
 * modification, are permitted provided that the following conditions
 * are met:
 * 1. Redistributions of source code must retain the above copyright
 *    notice, this list of conditions and the following disclaimer.
 * 2. Redistributions in binary form must reproduce the above copyright
 *    notice, this list of conditions and the following disclaimer in the
 *    documentation and/or other materials provided with the distribution.
 *
 * THIS SOFTWARE IS PROVIDED BY THE NETBSD FOUNDATION, INC. AND CONTRIBUTORS
 * ``AS IS'' AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED
 * TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR
 * PURPOSE ARE DISCLAIMED.  IN NO EVENT SHALL THE FOUNDATION OR CONTRIBUTORS
 * BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
 * CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
 * SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS
 * INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN
 * CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE)
 * ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE
 * POSSIBILITY OF SUCH DAMAGE.
 */

#include <sys/cdefs.h>

/*
 * __RCSID is expected to be supplied by <sys/cdefs.h>; only emit the
 * revision tag when the macro is actually available so the file still
 * builds where it is not.
 */
#ifdef __RCSID
__RCSID("$NetBSD: memcpy.c,v 1.1 2014/09/03 19:34:25 matt Exp $");
#endif

#include <stddef.h>
#include <stdint.h>
#include <string.h>

/*
 * Build one destination word out of two consecutive aligned source words.
 *
 * w1 is the source word at the lower address and w2 the one that follows
 * it.  shift1 is the source misalignment in bits and shift2 is the word
 * width in bits minus shift1.  The direction of the shifts depends on the
 * byte order so that the bytes end up in memory order in the result.
 *
 * Both shift counts must be strictly between 0 and the width of
 * unsigned long; memcpy() below only calls this with a non-zero source
 * misalignment, which guarantees that.
 */
static inline unsigned long
combine_words(unsigned long w1, unsigned long w2, int shift1, int shift2)
{
#if __BYTE_ORDER__ == __ORDER_BIG_ENDIAN__
	return (w1 << shift1) | (w2 >> shift2);
#else
	return (w1 >> shift1) | (w2 << shift2);
#endif
}

/*
 * Copy len bytes from b to a and return a.
 *
 * The copy proceeds in three phases:
 *   1. bytes are copied one at a time until the destination is aligned
 *      to sizeof(long);
 *   2. whole words are stored to the destination, either copied straight
 *      from the source (source also aligned) or assembled from pairs of
 *      aligned source words with combine_words() (source misaligned);
 *   3. the remaining len % sizeof(long) bytes are copied one at a time.
 *
 * In the misaligned case the source is only ever read through aligned
 * word loads, and every word that is loaded contains at least one byte
 * of the source region.
 */
void *
memcpy(void * restrict a, const void * restrict b, size_t len)
{
	const unsigned char *cb = b;
	unsigned char *ca = a;

	if (len == 0)
		return a;

	/*
	 * Make sure the destination is long aligned.
	 */
	while ((uintptr_t)ca & (sizeof(long) - 1)) {
		*ca++ = *cb++;
		if (--len == 0)
			return a;
	}

	unsigned long *la = (unsigned long *)ca;
	/* Misalignment of the source, in bytes, relative to a word boundary. */
	const int offset = (int)((uintptr_t)cb & (sizeof(*la) - 1));
	/* Aligned word that contains the next source byte. */
	const unsigned long *lb = (const unsigned long *)(cb - offset);
	/* One past the last whole destination word to be stored. */
	unsigned long * const ea = la + len / sizeof(*la);

	if (offset == 0) {
		/*
		 * a & b are now both long aligned.
		 * First try to copy 4 longs at a time.  The bound is written
		 * as a difference so no pointer beyond ea is ever formed.
		 */
		for (; ea - la >= 4; la += 4, lb += 4) {
			la[0] = lb[0];
			la[1] = lb[1];
			la[2] = lb[2];
			la[3] = lb[3];
		}
		/*
		 * Now copy one long at a time.  The bound is exclusive:
		 * ea itself is not a whole word to be written.
		 */
		while (la < ea) {
			*la++ = *lb++;
		}
	} else if (la < ea) {
		/*
		 * The source is misaligned and at least one whole word has
		 * to be written.  Every destination word is spliced from two
		 * neighbouring aligned source words.
		 */
		const int shift1 = offset * 8;
		const int shift2 = (int)(sizeof(*la) * 8) - shift1;
		/* w1 always holds lb[-1], the word partially consumed so far. */
		unsigned long w1 = *lb++;

		/*
		 * We try to write 4 words per loop.
		 */
		for (; ea - la >= 4; la += 4, lb += 4) {
			unsigned long w2 = lb[0];

			la[0] = combine_words(w1, w2, shift1, shift2);

			w1 = lb[1];

			la[1] = combine_words(w2, w1, shift1, shift2);

			w2 = lb[2];

			la[2] = combine_words(w1, w2, shift1, shift2);

			w1 = lb[3];

			la[3] = combine_words(w2, w1, shift1, shift2);
		}

		/*
		 * Now copy one long at a time.
		 */
		while (la < ea) {
			unsigned long w2 = *lb++;

			*la++ = combine_words(w1, w2, shift1, shift2);

			w1 = w2;
		}

		/*
		 * Because of the preload, lb is one word ahead of the data
		 * that has actually been written.  Step back so that
		 * lb + offset is the next unconsumed source byte.
		 */
		lb--;
	}

	/*
	 * Copy the trailing bytes that did not fill a whole word.
	 */
	len &= sizeof(*la) - 1;
	if (len) {
		cb = (const unsigned char *)lb + offset;
		ca = (unsigned char *)la;
		while (len-- > 0) {
			*ca++ = *cb++;
		}
	}
	return a;
}