memmove.S revision 1.1 1 1.1 matt /* $NetBSD: memmove.S,v 1.1 2014/09/03 19:34:25 matt Exp $ */
2 1.1 matt
3 1.1 matt /* stropt/memmove.S, pl_string_common, pl_linux 10/11/04 11:45:37
4 1.1 matt * ==========================================================================
5 1.1 matt * Optimized memmove implementation for IBM PowerPC 405/440.
6 1.1 matt *
7 1.1 matt * Copyright (c) 2003, IBM Corporation
8 1.1 matt * All rights reserved.
9 1.1 matt *
10 1.1 matt * Redistribution and use in source and binary forms, with or
11 1.1 matt * without modification, are permitted provided that the following
12 1.1 matt * conditions are met:
13 1.1 matt *
14 1.1 matt * * Redistributions of source code must retain the above
15 1.1 matt * copyright notice, this list of conditions and the following
16 1.1 matt * disclaimer.
17 1.1 matt * * Redistributions in binary form must reproduce the above
18 1.1 matt * copyright notice, this list of conditions and the following
19 1.1 matt * disclaimer in the documentation and/or other materials
20 1.1 matt * provided with the distribution.
21 1.1 matt * * Neither the name of IBM nor the names of its contributors
22 1.1 matt * may be used to endorse or promote products derived from this
23 1.1 matt * software without specific prior written permission.
24 1.1 matt *
25 1.1 matt * THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND
26 1.1 matt * CONTRIBUTORS "AS IS" AND ANY EXPRESS OR IMPLIED WARRANTIES,
27 1.1 matt * INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES OF
28 1.1 matt * MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE
29 1.1 matt * DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER OR CONTRIBUTORS
30 1.1 matt * BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY,
31 1.1 matt * OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO,
32 1.1 matt * PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR
33 1.1 matt * PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY
34 1.1 matt * OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT
35 1.1 matt * (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE
36 1.1 matt * USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
37 1.1 matt *
38 1.1 matt * ==========================================================================
39 1.1 matt *
40 1.1 matt * Function: Move memory area (handles overlapping regions)
41 1.1 matt *
42 1.1 matt * void *memmove(void * dest, const void * src, int n)
43 1.1 matt *
44 1.1 matt * Input: r3 - destination address
45 1.1 matt * r4 - source address
46 1.1 matt * r5 - byte count
47 1.1 matt * Output: r11 - destination address
48 1.1 matt *
49 1.1 matt * ==========================================================================
50 1.1 matt */
51 1.1 matt
#include <machine/asm.h>

/*
 * memmove(dst, src, len), or bcopy(src, dst, len) when built with _BCOPY.
 *
 * Register use inside the routine:
 *	r3	dst cursor		r4	src cursor
 *	r5	byte count		r6/r7	data in flight
 *	r11	original dst (returned)	r13	words still to copy
 *
 * When src >= dst the copy runs from low to high addresses; when
 * src < dst it runs from high to low, so that the start of dst never
 * overwrites a part of src that has not been read yet.  Whole words
 * are moved first (each word is loaded before the previous one is
 * stored), then the remaining len & 3 bytes are moved one at a time.
 *
 * The instruction following a branch or jump is its delay slot and is
 * executed whether or not the branch is taken, so every branch below
 * is followed by an explicit l.nop.
 *
 * NOTE(review): the word loops apply l.lwz/l.sw directly to src/dst and
 * nothing here checks their alignment -- confirm that callers or the
 * alignment trap handler cope with unaligned pointers.
 */
#ifdef _BCOPY
/* bcopy = memcpy/memmove with arguments reversed. */
/* LINTSTUB: Func: void bcopy(void *, void *, size_t) */
ENTRY(bcopy)
	l.or	r6, r3, r0		/* swap src/dst */
	l.or	r3, r4, r0
	l.or	r4, r6, r0
#else
/* LINTSTUB: Func: void *memmove(void *, const void *, size_t) */
ENTRY(memmove)
#endif

	l.or	r11, r3, r0		/* Save dst (return value) */

	/*
	 * Addresses are unsigned quantities, so compare them unsigned.
	 * Go backwards if src < dst: we do not want to overwrite the end
	 * of src with the start of dst.
	 */
	l.sfgeu	r4, r3			/* flag = (src >= dst) */
	l.bnf	.Lreverse		/* src < dst: copy high to low */
	l.nop				/* -- delay slot -- */

	/*
	 * Forward copy.  Both cursors are biased by -4 so that every
	 * access below uses offset 4 and is followed by a +4 update.
	 */
	l.addi	r4, r4, -4
	l.addi	r3, r3, -4

	l.srli	r13, r5, 2		/* How many words in total cnt */
	l.sfeqi	r13, 0
	l.bf	.Llast1			/* Handle byte by byte if < 4 */
	l.nop				/* -- delay slot: no load here -- */

	l.lwz	r7, 4(r4)		/* Preload first word */
	l.addi	r4, r4, 4

	l.j	.Lg1
	l.nop				/* -- delay slot -- */

.Lg0:					/* Main loop */

	l.lwz	r7, 4(r4)		/* Load a new word */
	l.sw	4(r3), r6		/* Store previous word */
	l.addi	r4, r4, 4		/* advance */
	l.addi	r3, r3, 4		/* advance */

.Lg1:

	l.addi	r13, r13, -1		/* Decrement count */
	l.sfeqi	r13, 0			/* just one word left to store? */
	l.bf	.Llast			/* yes, it is pending in r7 */
	l.nop				/* -- delay slot -- */

	l.lwz	r6, 4(r4)		/* Load another word */
	l.sw	4(r3), r7		/* Store previous word */
	l.addi	r4, r4, 4		/* advance to next word */
	l.addi	r3, r3, 4		/* advance to next word */
	l.addi	r13, r13, -1		/* Decrement count */
	l.sfeqi	r13, 0			/* last word? */
	l.bnf	.Lg0			/* no, loop, more words */
	l.nop				/* -- delay slot -- */

	l.or	r7, r6, r0		/* If word count -> 0, then... */

.Llast:

	l.sw	4(r3), r7		/* ... store last word */
	l.addi	r3, r3, 4

.Llast1:				/* Byte-by-byte copy */

	l.andi	r5, r5, 3		/* get remaining byte count */
	l.sfeqi	r5, 0			/* is it 0? */
	l.bf	.Ldone			/* yes, we're done */
	l.nop				/* -- delay slot -- */

	/*
	 * The cursors still trail the next byte by 4 (see the bias
	 * above), so the first byte uses offset 4 ...
	 */
	l.lbz	r6, 4(r4)
	l.sb	4(r3), r6
	l.addi	r4, r4, 4		/* cursor now on the byte just read */
	l.addi	r3, r3, 4		/* cursor now on the byte just written */
	l.addi	r5, r5, -1		/* decrement count */
	l.sfeqi	r5, 0			/* is it 0? */
	l.bf	.Ldone			/* yes, we're done */
	l.nop				/* -- delay slot -- */

.Llast2:

	/* ... and the remaining bytes use offset 1. */
	l.lbz	r6, 1(r4)
	l.sb	1(r3), r6
	l.addi	r4, r4, 1		/* advance to next byte */
	l.addi	r3, r3, 1		/* advance to next byte */
	l.addi	r5, r5, -1		/* decrement count */
	l.sfeqi	r5, 0			/* is it 0? */
	l.bnf	.Llast2			/* no, loop again */
	l.nop				/* -- delay slot -- */
.Ldone:
	l.jr	lr			/* return */
	l.nop				/* -- delay slot -- */

	/*
	 * We're here since src < dest.  Don't want to overwrite end of
	 * src with start of dest, so copy from the end to the beginning.
	 */

.Lreverse:

	l.add	r4, r4, r5		/* Work from end to beginning */
	l.add	r3, r3, r5		/* so add count to string ptrs */
	l.srli	r13, r5, 2		/* Words in total count */
	l.sfeqi	r13, 0
	l.bf	.Lrlast1		/* Handle byte by byte if < 4 */
	l.nop				/* -- delay slot -- */

	l.lwz	r7, -4(r4)		/* Preload first word */
	l.addi	r4, r4, -4		/* update pointer */

	l.j	.Lrg1
	l.nop				/* -- delay slot: keep r7 intact -- */

.Lrg0:					/* Main loop */

	l.lwz	r7, -4(r4)		/* Load a new word */
	l.sw	-4(r3), r6		/* Store previous word */
	l.addi	r4, r4, -4
	l.addi	r3, r3, -4

.Lrg1:

	l.addi	r13, r13, -1		/* decrement count */
	l.sfeqi	r13, 0			/* just one pending word left? */
	l.bf	.Lrlast			/* yes, deal with it */
	l.nop				/* -- delay slot -- */

	l.lwz	r6, -4(r4)		/* Load another word */
	l.sw	-4(r3), r7		/* Store previous word */
	l.addi	r4, r4, -4
	l.addi	r3, r3, -4

	l.addi	r13, r13, -1		/* decrement count */
	l.sfeqi	r13, 0			/* just one pending word left? */
	l.bnf	.Lrg0			/* no, loop again more words */
	l.nop				/* -- delay slot -- */

	l.or	r7, r6, r0		/* If word count -> 0, then... */

.Lrlast:

	l.sw	-4(r3), r7		/* ... store last word */
	l.addi	r3, r3, -4		/* update pointer */

.Lrlast1:				/* Byte-by-byte copy */

	l.andi	r5, r5, 3		/* get remaining byte count */
	l.sfeqi	r5, 0			/* is it 0? */
	l.bf	.Lrdone			/* yes, we're done */
	l.nop				/* -- delay slot -- */

.Lrlast2:

	l.lbz	r6, -1(r4)		/* Handle the rest, byte by */
	l.sb	-1(r3), r6		/* byte */
	l.addi	r4, r4, -1
	l.addi	r3, r3, -1
	l.addi	r5, r5, -1		/* decrement count */
	l.sfeqi	r5, 0			/* is it 0? */
	l.bnf	.Lrlast2		/* no, loop again */
	l.nop				/* -- delay slot -- */
.Lrdone:
	l.jr	lr			/* return */
	l.nop				/* -- delay slot -- */

#ifdef _BCOPY
END(bcopy)
#else
END(memmove)
#endif