atomic.S revision 1.9 1 1.9 ad /* $NetBSD: atomic.S,v 1.9 2008/02/10 13:25:46 ad Exp $ */
2 1.1 ad
3 1.1 ad /*-
4 1.1 ad * Copyright (c) 2007 The NetBSD Foundation, Inc.
5 1.1 ad * All rights reserved.
6 1.1 ad *
7 1.1 ad * This code is derived from software contributed to The NetBSD Foundation
8 1.1 ad * by Jason R. Thorpe, and by Andrew Doran.
9 1.1 ad *
10 1.1 ad * Redistribution and use in source and binary forms, with or without
11 1.1 ad * modification, are permitted provided that the following conditions
12 1.1 ad * are met:
13 1.1 ad * 1. Redistributions of source code must retain the above copyright
14 1.1 ad * notice, this list of conditions and the following disclaimer.
15 1.1 ad * 2. Redistributions in binary form must reproduce the above copyright
16 1.1 ad * notice, this list of conditions and the following disclaimer in the
17 1.1 ad * documentation and/or other materials provided with the distribution.
18 1.1 ad * 3. All advertising materials mentioning features or use of this software
19 1.1 ad * must display the following acknowledgement:
20 1.1 ad * This product includes software developed by the NetBSD
21 1.1 ad * Foundation, Inc. and its contributors.
22 1.1 ad * 4. Neither the name of The NetBSD Foundation nor the names of its
23 1.1 ad * contributors may be used to endorse or promote products derived
24 1.1 ad * from this software without specific prior written permission.
25 1.1 ad *
26 1.1 ad * THIS SOFTWARE IS PROVIDED BY THE NETBSD FOUNDATION, INC. AND CONTRIBUTORS
27 1.1 ad * ``AS IS'' AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED
28 1.1 ad * TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR
29 1.1 ad * PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE FOUNDATION OR CONTRIBUTORS
30 1.1 ad * BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
31 1.1 ad * CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
32 1.1 ad * SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS
33 1.1 ad * INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN
34 1.1 ad * CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE)
35 1.1 ad * ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE
36 1.1 ad * POSSIBILITY OF SUCH DAMAGE.
37 1.1 ad */
38 1.1 ad
39 1.1 ad #include <machine/asm.h>
40 1.1 ad
/*
 * Build-dependent helper macros.
 *
 * LOCK(n)	emits the x86 lock prefix.  In the kernel build the prefix
 *		is additionally tagged with a local label .Lpatch<n>; those
 *		labels are collected in the atomic_lockpatch table further
 *		down in this file.
 * ALIAS(f,t)	publishes f as another name for t: a strong alias in the
 *		kernel build, a weak alias otherwise.
 * END(a)	kernel build only: aligns the text section and drops label a
 *		after a routine.  Expands to nothing otherwise.
 */
#ifndef _KERNEL
#define	LOCK(n)		lock
#define	ALIAS(f, t)	WEAK_ALIAS(f,t)
#define	END(a)		/* nothing */
#else
#define	LOCK(n)		.Lpatch/**/n:	lock
#define	ALIAS(f, t)	STRONG_ALIAS(f,t)
#define	END(a)		_ALIGN_TEXT; LABEL(a)
#endif
50 1.1 ad
51 1.1 ad .text
52 1.1 ad
/*
 * _atomic_add_32
 *
 * Stack arguments: 4(%esp) = address of a 32-bit word,
 *		    8(%esp) = 32-bit value to add.
 * Performs a lock-prefixed add of the value into the word.
 * Clobbers %eax, %edx and the flags.
 */
NENTRY(_atomic_add_32)
	movl	8(%esp), %eax		/* eax = addend */
	movl	4(%esp), %edx		/* edx = target address */
	LOCK(1)
	addl	%eax, (%edx)		/* *target += addend */
	ret
59 1.1 ad
/*
 * _atomic_add_32_nv
 *
 * Stack arguments: 4(%esp) = address of a 32-bit word,
 *		    8(%esp) = 32-bit value to add.
 * Adds the value to the word with a lock-prefixed xadd and returns the
 * resulting (new) value in %eax.
 * Clobbers %ecx, %edx and the flags.
 */
NENTRY(_atomic_add_32_nv)
	movl	8(%esp), %ecx		/* ecx = addend, kept for later */
	movl	%ecx, %eax		/* eax = working copy of addend */
	movl	4(%esp), %edx		/* edx = target address */
	LOCK(2)
	xaddl	%eax, (%edx)		/* eax = old value, *target += addend */
	addl	%ecx, %eax		/* old + addend = value now stored */
	ret
68 1.1 ad
/*
 * _atomic_and_32
 *
 * Stack arguments: 4(%esp) = address of a 32-bit word,
 *		    8(%esp) = 32-bit mask.
 * Performs a lock-prefixed bitwise AND of the mask into the word.
 * Clobbers %eax, %edx and the flags.
 */
NENTRY(_atomic_and_32)
	movl	8(%esp), %eax		/* eax = mask */
	movl	4(%esp), %edx		/* edx = target address */
	LOCK(3)
	andl	%eax, (%edx)		/* *target &= mask */
	ret
75 1.1 ad
/*
 * _atomic_and_32_nv
 *
 * Stack arguments: 4(%esp) = address of a 32-bit word,
 *		    8(%esp) = 32-bit mask.
 * ANDs the mask into the word with a compare-and-exchange retry loop and
 * returns the value that was stored (the new value) in %eax.
 * Clobbers %ecx, %edx and the flags.
 */
NENTRY(_atomic_and_32_nv)
	movl	4(%esp), %edx		/* edx = target address */
	movl	(%edx), %eax		/* eax = first guess at current value */
.Land_32_nv_retry:
	movl	%eax, %ecx
	andl	8(%esp), %ecx		/* ecx = guess & mask */
	LOCK(4)
	cmpxchgl %ecx, (%edx)		/* store ecx if *target still == eax */
	jnz	.Land_32_nv_retry	/* lost the race: eax was reloaded */
	movl	%ecx, %eax		/* return the value just stored */
	ret
87 1.1 ad
/*
 * _atomic_dec_32
 *
 * Stack argument: 4(%esp) = address of a 32-bit word.
 * Decrements the word by one with a lock-prefixed decl.
 * Clobbers %edx and the flags.
 */
NENTRY(_atomic_dec_32)
	movl	4(%esp), %edx		/* edx = target address */
	LOCK(5)
	decl	(%edx)			/* --*target */
	ret
93 1.1 ad
/*
 * _atomic_dec_32_nv
 *
 * Stack argument: 4(%esp) = address of a 32-bit word.
 * Decrements the word by one with a lock-prefixed xadd of -1 and returns
 * the decremented (new) value in %eax.
 * Clobbers %edx and the flags.
 */
NENTRY(_atomic_dec_32_nv)
	movl	$-1, %eax		/* eax = addend of -1 */
	movl	4(%esp), %edx		/* edx = target address */
	LOCK(6)
	xaddl	%eax, (%edx)		/* eax = old value, *target -= 1 */
	decl	%eax			/* old - 1 = value now stored */
	ret
101 1.1 ad
/*
 * _atomic_inc_32
 *
 * Stack argument: 4(%esp) = address of a 32-bit word.
 * Increments the word by one with a lock-prefixed incl.
 * Clobbers %edx and the flags.
 */
NENTRY(_atomic_inc_32)
	movl	4(%esp), %edx		/* edx = target address */
	LOCK(7)
	incl	(%edx)			/* ++*target */
	ret
107 1.1 ad
/*
 * _atomic_inc_32_nv
 *
 * Stack argument: 4(%esp) = address of a 32-bit word.
 * Increments the word by one with a lock-prefixed xadd of 1 and returns
 * the incremented (new) value in %eax.
 * Clobbers %edx and the flags.
 */
NENTRY(_atomic_inc_32_nv)
	movl	$1, %eax		/* eax = addend of 1 */
	movl	4(%esp), %edx		/* edx = target address */
	LOCK(8)
	xaddl	%eax, (%edx)		/* eax = old value, *target += 1 */
	incl	%eax			/* old + 1 = value now stored */
	ret
115 1.1 ad
/*
 * _atomic_or_32
 *
 * Stack arguments: 4(%esp) = address of a 32-bit word,
 *		    8(%esp) = 32-bit mask.
 * Performs a lock-prefixed bitwise OR of the mask into the word.
 * Clobbers %eax, %edx and the flags.
 */
NENTRY(_atomic_or_32)
	movl	8(%esp), %eax		/* eax = mask */
	movl	4(%esp), %edx		/* edx = target address */
	LOCK(9)
	orl	%eax, (%edx)		/* *target |= mask */
	ret
122 1.1 ad
/*
 * _atomic_or_32_nv
 *
 * Stack arguments: 4(%esp) = address of a 32-bit word,
 *		    8(%esp) = 32-bit mask.
 * ORs the mask into the word with a compare-and-exchange retry loop and
 * returns the value that was stored (the new value) in %eax.
 * Clobbers %ecx, %edx and the flags.
 */
NENTRY(_atomic_or_32_nv)
	movl	4(%esp), %edx		/* edx = target address */
	movl	(%edx), %eax		/* eax = first guess at current value */
.Lor_32_nv_retry:
	movl	%eax, %ecx
	orl	8(%esp), %ecx		/* ecx = guess | mask */
	LOCK(10)
	cmpxchgl %ecx, (%edx)		/* store ecx if *target still == eax */
	jnz	.Lor_32_nv_retry	/* lost the race: eax was reloaded */
	movl	%ecx, %eax		/* return the value just stored */
	ret
134 1.1 ad
/*
 * _atomic_swap_32
 *
 * Stack arguments: 4(%esp) = address of a 32-bit word,
 *		    8(%esp) = 32-bit replacement value.
 * Exchanges the word with the replacement and returns the previous
 * contents in %eax.
 *
 * No LOCK() is used here: xchg with a memory operand is locked by the
 * processor implicitly.  This is also why the .Lpatch numbering in this
 * file has no entry 11.
 * Clobbers %edx.
 */
NENTRY(_atomic_swap_32)
	movl	8(%esp), %eax		/* eax = replacement value */
	movl	4(%esp), %edx		/* edx = target address */
	xchgl	%eax, (%edx)		/* eax <-> *target */
	ret
140 1.1 ad
/*
 * _atomic_cas_32
 *
 * Stack arguments:  4(%esp) = address of a 32-bit word,
 *		     8(%esp) = expected value,
 *		    12(%esp) = replacement value.
 * Lock-prefixed compare-and-swap: the replacement is stored only if the
 * word equals the expected value.  The previous contents of the word are
 * returned in %eax in either case.
 * Clobbers %ecx, %edx and the flags.
 */
NENTRY(_atomic_cas_32)
	movl	12(%esp), %ecx		/* ecx = replacement value */
	movl	8(%esp), %eax		/* eax = expected value */
	movl	4(%esp), %edx		/* edx = target address */
	LOCK(12)
	cmpxchgl %ecx, (%edx)
	/* on a match eax is untouched; otherwise it was loaded from *target */
	ret
149 1.1 ad
/*
 * _atomic_cas_32_ni
 *
 * Same stack arguments and return value as _atomic_cas_32, but the
 * cmpxchg is issued WITHOUT a lock prefix.
 * NOTE(review): "ni" presumably stands for "non-interlocked", i.e. safe
 * only against the local CPU - confirm against the callers.
 * Clobbers %ecx, %edx and the flags.
 */
NENTRY(_atomic_cas_32_ni)
	movl	12(%esp), %ecx		/* ecx = replacement value */
	movl	8(%esp), %eax		/* eax = expected value */
	movl	4(%esp), %edx		/* edx = target address */
	cmpxchgl %ecx, (%edx)
	/* on a match eax is untouched; otherwise it was loaded from *target */
	ret
157 1.9 ad
/*
 * _membar_consumer
 *
 * Issues a lock-prefixed add of zero to the dword just below the stack
 * pointer.  The memory contents are unchanged; the locked
 * read-modify-write is used purely for its ordering effect.
 *
 * The instruction sequence is kept exactly as it was because, in the
 * kernel build, the routine is followed by a membar_consumer_end label.
 * NOTE(review): presumably that label lets other code measure or
 * overwrite this routine - check before changing its size.
 * Clobbers the flags.
 */
NENTRY(_membar_consumer)
	LOCK(13)
	addl	$0, -4(%esp)
	ret
END(membar_consumer_end)
163 1.1 ad
/*
 * _membar_producer
 *
 * Performs one plain store (of zero) to the dword just below the stack
 * pointer and returns.  No lock prefix is involved.
 *
 * The instruction sequence is kept exactly as it was because, in the
 * kernel build, the routine is followed by a membar_producer_end label.
 */
NENTRY(_membar_producer)
	/* An ordinary store is sufficient here */
	movl	$0, -4(%esp)
	ret
END(membar_producer_end)
169 1.1 ad
/*
 * _membar_sync
 *
 * Issues a lock-prefixed add of zero to the dword just below the stack
 * pointer.  The memory contents are unchanged; the locked
 * read-modify-write is used purely for its ordering effect.
 *
 * The instruction sequence is kept exactly as it was because, in the
 * kernel build, the routine is followed by a membar_sync_end label.
 * Clobbers the flags.
 */
NENTRY(_membar_sync)
	LOCK(14)
	addl	$0, -4(%esp)
	ret
END(membar_sync_end)
175 1.1 ad
176 1.1 ad #ifdef _KERNEL
/*
 * _atomic_cas_64 (kernel build, version that does not use cmpxchg8b)
 *
 * Stack arguments on entry:
 *	 4(%esp)		address of a 64-bit word
 *	 8(%esp), 12(%esp)	expected value, low then high half
 *	16(%esp), 20(%esp)	replacement value, low then high half
 * Returns the previous contents of the word in %edx:%eax.  The
 * replacement is stored only when both halves match the expected value.
 *
 * The compare and the two stores are protected only by masking
 * interrupts on the executing CPU; no lock prefix is used.
 * NOTE(review): that gives no exclusion against other processors -
 * presumably this version is only reached on CPUs lacking cmpxchg8b;
 * confirm against the code that selects between this routine and
 * _atomic_cas_cx8.
 *
 * The interrupt state of the caller is saved with pushfl and put back
 * with popfl.  Ending with a bare sti (as this routine used to) would
 * switch interrupts on for a caller that had entered with them off.
 *
 * NOTE(review): pushfl/cli/popfl is one byte longer than cli/sti.  If
 * other code copies over this routine using the _atomic_cas_64_end
 * label, re-check its size assumptions.
 *
 * %edi and %ebx are preserved; %ecx is clobbered.
 */
NENTRY(_atomic_cas_64)
	pushl	%edi
	pushl	%ebx
	movl	12(%esp), %edi		/* edi = target address */
	movl	16(%esp), %eax		/* edx:eax = expected value */
	movl	20(%esp), %edx
	movl	24(%esp), %ebx		/* ecx:ebx = replacement value */
	movl	28(%esp), %ecx
	pushfl				/* remember the interrupt flag */
	cli				/* begin uninterruptible section */
	cmpl	0(%edi), %eax
	jne	2f
	cmpl	4(%edi), %edx
	jne	2f
	movl	%ebx, 0(%edi)		/* both halves matched: store */
	movl	%ecx, 4(%edi)
1:
	popfl				/* restore the interrupt flag */
	popl	%ebx
	popl	%edi
	ret
2:
	movl	0(%edi), %eax		/* mismatch: return current contents */
	movl	4(%edi), %edx
	jmp	1b
END(_atomic_cas_64_end)
202 1.6 ad
/*
 * _atomic_cas_cx8 (kernel build)
 *
 * 64-bit compare-and-swap built on a lock-prefixed cmpxchg8b.
 * Stack arguments on entry:
 *	 4(%esp)		address of a 64-bit word
 *	 8(%esp), 12(%esp)	expected value, low then high half
 *	16(%esp), 20(%esp)	replacement value, low then high half
 * Returns the previous contents of the word in %edx:%eax.
 * %edi and %ebx are preserved; %ecx is clobbered.
 *
 * The routine is followed by 32 bytes of 0x90 (the one-byte nop opcode)
 * ahead of its end label.
 * NOTE(review): the padding presumably exists so that the size of this
 * routine relates in a required way to another routine - confirm with
 * the code that consumes _atomic_cas_cx8_end before touching it.
 */
NENTRY(_atomic_cas_cx8)
	pushl	%edi
	pushl	%ebx
	movl	12(%esp), %edi		/* edi = target address */
	movl	16(%esp), %eax		/* edx:eax = expected value */
	movl	20(%esp), %edx
	movl	24(%esp), %ebx		/* ecx:ebx = replacement value */
	movl	28(%esp), %ecx
	LOCK(15)
	cmpxchg8b (%edi)		/* edx:eax = old contents on mismatch */
	popl	%ebx
	popl	%edi
	ret
	.space	32, 0x90
END(_atomic_cas_cx8_end)
218 1.6 ad
/*
 * sse2_lfence (kernel build)
 *
 * Executes a single lfence instruction and returns.  Takes no arguments
 * and touches no registers.  Followed by the sse2_lfence_end label.
 */
NENTRY(sse2_lfence)
	lfence
	ret
END(sse2_lfence_end)
223 1.1 ad
/*
 * sse2_mfence (kernel build)
 *
 * Executes a single mfence instruction and returns.  Takes no arguments
 * and touches no registers.  Followed by the sse2_mfence_end label.
 */
NENTRY(sse2_mfence)
	mfence
	ret
END(sse2_mfence_end)
228 1.1 ad
/*
 * atomic_lockpatch (kernel build)
 *
 * Global, zero-terminated table holding the address of every .Lpatch<n>
 * label, i.e. of every lock prefix emitted through LOCK(n) in this file.
 * There is no entry 11 because no LOCK(11) exists.
 * NOTE(review): presumably consumed by code that rewrites those prefix
 * bytes at run time - the consumer is not visible from this file.
 */
	.globl	atomic_lockpatch
atomic_lockpatch:
	.long	.Lpatch1, .Lpatch2, .Lpatch3, .Lpatch4
	.long	.Lpatch5, .Lpatch6, .Lpatch7, .Lpatch8
	.long	.Lpatch9, .Lpatch10, .Lpatch12, .Lpatch13
	.long	.Lpatch14, .Lpatch15
	.long	0			/* end-of-table marker */
234 1.7 ad #else
/*
 * _atomic_cas_64 (non-kernel build)
 *
 * 64-bit compare-and-swap built on a lock-prefixed cmpxchg8b.
 * Stack arguments on entry:
 *	 4(%esp)		address of a 64-bit word
 *	 8(%esp), 12(%esp)	expected value, low then high half
 *	16(%esp), 20(%esp)	replacement value, low then high half
 * Returns the previous contents of the word in %edx:%eax.
 * %edi and %ebx are preserved; %ecx is clobbered.
 */
NENTRY(_atomic_cas_64)
	pushl	%edi
	pushl	%ebx
	/* two registers were pushed, so the first argument is at 12(%esp) */
	movl	28(%esp), %ecx		/* ecx:ebx = replacement value */
	movl	24(%esp), %ebx
	movl	20(%esp), %edx		/* edx:eax = expected value */
	movl	16(%esp), %eax
	movl	12(%esp), %edi		/* edi = target address */
	lock
	cmpxchg8b (%edi)		/* edx:eax = old contents on mismatch */
	popl	%ebx
	popl	%edi
	ret
248 1.1 ad #endif /* _KERNEL */
249 1.1 ad
/*
 * Public names.
 *
 * ALIAS() is defined near the top of this file: strong aliases in the
 * kernel build, weak aliases otherwise.  Every int/uint, long/ulong and
 * ptr flavour resolves to the corresponding 32-bit implementation.
 */

/* add */
ALIAS(atomic_add_32,_atomic_add_32)
ALIAS(atomic_add_int,_atomic_add_32)
ALIAS(atomic_add_long,_atomic_add_32)
ALIAS(atomic_add_ptr,_atomic_add_32)

/* add, returning the new value */
ALIAS(atomic_add_32_nv,_atomic_add_32_nv)
ALIAS(atomic_add_int_nv,_atomic_add_32_nv)
ALIAS(atomic_add_long_nv,_atomic_add_32_nv)
ALIAS(atomic_add_ptr_nv,_atomic_add_32_nv)

/* and */
ALIAS(atomic_and_32,_atomic_and_32)
ALIAS(atomic_and_uint,_atomic_and_32)
ALIAS(atomic_and_ulong,_atomic_and_32)
ALIAS(atomic_and_ptr,_atomic_and_32)

/* and, returning the new value */
ALIAS(atomic_and_32_nv,_atomic_and_32_nv)
ALIAS(atomic_and_uint_nv,_atomic_and_32_nv)
ALIAS(atomic_and_ulong_nv,_atomic_and_32_nv)
ALIAS(atomic_and_ptr_nv,_atomic_and_32_nv)

/* decrement */
ALIAS(atomic_dec_32,_atomic_dec_32)
ALIAS(atomic_dec_uint,_atomic_dec_32)
ALIAS(atomic_dec_ulong,_atomic_dec_32)
ALIAS(atomic_dec_ptr,_atomic_dec_32)

/* decrement, returning the new value */
ALIAS(atomic_dec_32_nv,_atomic_dec_32_nv)
ALIAS(atomic_dec_uint_nv,_atomic_dec_32_nv)
ALIAS(atomic_dec_ulong_nv,_atomic_dec_32_nv)
ALIAS(atomic_dec_ptr_nv,_atomic_dec_32_nv)

/* increment */
ALIAS(atomic_inc_32,_atomic_inc_32)
ALIAS(atomic_inc_uint,_atomic_inc_32)
ALIAS(atomic_inc_ulong,_atomic_inc_32)
ALIAS(atomic_inc_ptr,_atomic_inc_32)

/* increment, returning the new value */
ALIAS(atomic_inc_32_nv,_atomic_inc_32_nv)
ALIAS(atomic_inc_uint_nv,_atomic_inc_32_nv)
ALIAS(atomic_inc_ulong_nv,_atomic_inc_32_nv)
ALIAS(atomic_inc_ptr_nv,_atomic_inc_32_nv)

/* or */
ALIAS(atomic_or_32,_atomic_or_32)
ALIAS(atomic_or_uint,_atomic_or_32)
ALIAS(atomic_or_ulong,_atomic_or_32)
ALIAS(atomic_or_ptr,_atomic_or_32)

/* or, returning the new value */
ALIAS(atomic_or_32_nv,_atomic_or_32_nv)
ALIAS(atomic_or_uint_nv,_atomic_or_32_nv)
ALIAS(atomic_or_ulong_nv,_atomic_or_32_nv)
ALIAS(atomic_or_ptr_nv,_atomic_or_32_nv)

/* swap */
ALIAS(atomic_swap_32,_atomic_swap_32)
ALIAS(atomic_swap_uint,_atomic_swap_32)
ALIAS(atomic_swap_ulong,_atomic_swap_32)
ALIAS(atomic_swap_ptr,_atomic_swap_32)

/* compare-and-swap */
ALIAS(atomic_cas_32,_atomic_cas_32)
ALIAS(atomic_cas_uint,_atomic_cas_32)
ALIAS(atomic_cas_ulong,_atomic_cas_32)
ALIAS(atomic_cas_ptr,_atomic_cas_32)

/* compare-and-swap without a lock prefix */
ALIAS(atomic_cas_32_ni,_atomic_cas_32_ni)
ALIAS(atomic_cas_uint_ni,_atomic_cas_32_ni)
ALIAS(atomic_cas_ulong_ni,_atomic_cas_32_ni)
ALIAS(atomic_cas_ptr_ni,_atomic_cas_32_ni)

/* 64-bit compare-and-swap; the _ni name maps to the same routine */
ALIAS(atomic_cas_64,_atomic_cas_64)
ALIAS(atomic_cas_64_ni,_atomic_cas_64)

/* memory barriers; enter and exit reuse consumer and producer */
ALIAS(membar_consumer,_membar_consumer)
ALIAS(membar_producer,_membar_producer)
ALIAS(membar_enter,_membar_consumer)
ALIAS(membar_exit,_membar_producer)
ALIAS(membar_sync,_membar_sync)
323 1.5 ad
/*
 * Underscore-prefixed names.
 *
 * These are always strong aliases, in both kernel and non-kernel
 * builds.  Every int/uint, long/ulong and ptr flavour resolves to the
 * corresponding 32-bit implementation.
 */

/* add */
STRONG_ALIAS(_atomic_add_int,_atomic_add_32)
STRONG_ALIAS(_atomic_add_long,_atomic_add_32)
STRONG_ALIAS(_atomic_add_ptr,_atomic_add_32)

/* add, returning the new value */
STRONG_ALIAS(_atomic_add_int_nv,_atomic_add_32_nv)
STRONG_ALIAS(_atomic_add_long_nv,_atomic_add_32_nv)
STRONG_ALIAS(_atomic_add_ptr_nv,_atomic_add_32_nv)

/* and */
STRONG_ALIAS(_atomic_and_uint,_atomic_and_32)
STRONG_ALIAS(_atomic_and_ulong,_atomic_and_32)
STRONG_ALIAS(_atomic_and_ptr,_atomic_and_32)

/* and, returning the new value */
STRONG_ALIAS(_atomic_and_uint_nv,_atomic_and_32_nv)
STRONG_ALIAS(_atomic_and_ulong_nv,_atomic_and_32_nv)
STRONG_ALIAS(_atomic_and_ptr_nv,_atomic_and_32_nv)

/* decrement */
STRONG_ALIAS(_atomic_dec_uint,_atomic_dec_32)
STRONG_ALIAS(_atomic_dec_ulong,_atomic_dec_32)
STRONG_ALIAS(_atomic_dec_ptr,_atomic_dec_32)

/* decrement, returning the new value */
STRONG_ALIAS(_atomic_dec_uint_nv,_atomic_dec_32_nv)
STRONG_ALIAS(_atomic_dec_ulong_nv,_atomic_dec_32_nv)
STRONG_ALIAS(_atomic_dec_ptr_nv,_atomic_dec_32_nv)

/* increment */
STRONG_ALIAS(_atomic_inc_uint,_atomic_inc_32)
STRONG_ALIAS(_atomic_inc_ulong,_atomic_inc_32)
STRONG_ALIAS(_atomic_inc_ptr,_atomic_inc_32)

/* increment, returning the new value */
STRONG_ALIAS(_atomic_inc_uint_nv,_atomic_inc_32_nv)
STRONG_ALIAS(_atomic_inc_ulong_nv,_atomic_inc_32_nv)
STRONG_ALIAS(_atomic_inc_ptr_nv,_atomic_inc_32_nv)

/* or */
STRONG_ALIAS(_atomic_or_uint,_atomic_or_32)
STRONG_ALIAS(_atomic_or_ulong,_atomic_or_32)
STRONG_ALIAS(_atomic_or_ptr,_atomic_or_32)

/* or, returning the new value */
STRONG_ALIAS(_atomic_or_uint_nv,_atomic_or_32_nv)
STRONG_ALIAS(_atomic_or_ulong_nv,_atomic_or_32_nv)
STRONG_ALIAS(_atomic_or_ptr_nv,_atomic_or_32_nv)

/* swap */
STRONG_ALIAS(_atomic_swap_uint,_atomic_swap_32)
STRONG_ALIAS(_atomic_swap_ulong,_atomic_swap_32)
STRONG_ALIAS(_atomic_swap_ptr,_atomic_swap_32)

/* compare-and-swap */
STRONG_ALIAS(_atomic_cas_uint,_atomic_cas_32)
STRONG_ALIAS(_atomic_cas_ulong,_atomic_cas_32)
STRONG_ALIAS(_atomic_cas_ptr,_atomic_cas_32)

/* compare-and-swap without a lock prefix */
STRONG_ALIAS(_atomic_cas_uint_ni,_atomic_cas_32_ni)
STRONG_ALIAS(_atomic_cas_ulong_ni,_atomic_cas_32_ni)
STRONG_ALIAS(_atomic_cas_ptr_ni,_atomic_cas_32_ni)

/* memory barriers; enter and exit reuse consumer and producer */
STRONG_ALIAS(_membar_enter,_membar_consumer)
STRONG_ALIAS(_membar_exit,_membar_producer)
378