atomic.S revision 1.33 1 1.33 riastrad /* $NetBSD: atomic.S,v 1.33 2022/04/09 12:07:29 riastradh Exp $ */
2 1.1 ad
3 1.1 ad /*-
4 1.1 ad * Copyright (c) 2007 The NetBSD Foundation, Inc.
5 1.1 ad * All rights reserved.
6 1.1 ad *
7 1.1 ad * This code is derived from software contributed to The NetBSD Foundation
8 1.1 ad * by Jason R. Thorpe, and by Andrew Doran.
9 1.1 ad *
10 1.1 ad * Redistribution and use in source and binary forms, with or without
11 1.1 ad * modification, are permitted provided that the following conditions
12 1.1 ad * are met:
13 1.1 ad * 1. Redistributions of source code must retain the above copyright
14 1.1 ad * notice, this list of conditions and the following disclaimer.
15 1.1 ad * 2. Redistributions in binary form must reproduce the above copyright
16 1.1 ad * notice, this list of conditions and the following disclaimer in the
17 1.1 ad * documentation and/or other materials provided with the distribution.
18 1.30 riastrad *
19 1.1 ad * THIS SOFTWARE IS PROVIDED BY THE NETBSD FOUNDATION, INC. AND CONTRIBUTORS
20 1.1 ad * ``AS IS'' AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED
21 1.1 ad * TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR
22 1.1 ad * PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE FOUNDATION OR CONTRIBUTORS
23 1.1 ad * BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
24 1.1 ad * CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
25 1.1 ad * SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS
26 1.1 ad * INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN
27 1.1 ad * CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE)
28 1.1 ad * ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE
29 1.1 ad * POSSIBILITY OF SUCH DAMAGE.
30 1.1 ad */
31 1.1 ad
32 1.16 pooka #include <sys/param.h>
33 1.1 ad #include <machine/asm.h>
34 1.21 christos /*
35 1.21 christos * __HAVE_ constants should not be in <machine/types.h>
36 1.21 christos * because we can't use them from assembly. OTOH we
37 1.21 christos * only need __HAVE_ATOMIC64_OPS here, and we don't.
38 1.21 christos */
39 1.18 pooka #ifdef _KERNEL
40 1.18 pooka #define ALIAS(f, t) STRONG_ALIAS(f,t) /* kernel build: ALIAS() emits a strong alias */
41 1.18 pooka #else
42 1.18 pooka #define ALIAS(f, t) WEAK_ALIAS(f,t) /* non-kernel build: ALIAS() emits a weak alias */
43 1.18 pooka #endif
44 1.18 pooka
45 1.15 pooka #ifdef _HARDKERNEL
46 1.23 bouyer #include "opt_xen.h"
47 1.25 maxv #include <machine/frameasm.h> /* NOTE(review): presumably where HOTPATCH() and HP_NAME_* come from -- confirm */
48 1.28 maxv #define LOCK HOTPATCH(HP_NAME_NOLOCK, 1); lock /* lock prefix preceded by a HOTPATCH() record of size 1 */
49 1.28 maxv #define HOTPATCH_SSE2_MFENCE HOTPATCH(HP_NAME_SSE2_MFENCE, 7); /* HOTPATCH() record of size 7; used in _membar_sync */
50 1.29 maxv #define HOTPATCH_CAS_64 HOTPATCH(HP_NAME_CAS_64, 49); /* HOTPATCH() record of size 49; used in _atomic_cas_64 */
51 1.1 ad #else
52 1.28 maxv #define LOCK lock /* plain lock prefix, no HOTPATCH() record */
53 1.28 maxv #define HOTPATCH_SSE2_MFENCE /* nothing */
54 1.29 maxv #define HOTPATCH_CAS_64 /* nothing */
55 1.1 ad #endif
56 1.1 ad
57 1.1 ad .text
58 1.1 ad
59 1.13 chs ENTRY(_atomic_add_32) /* atomically add arg 2 to the 32-bit word at arg 1; the sum is not returned */
60 1.1 ad movl 4(%esp), %edx /* %edx = arg 1: address of the target word */
61 1.1 ad movl 8(%esp), %eax /* %eax = arg 2: addend */
62 1.27 maxv LOCK /* lock prefix for the addl on the next line */
63 1.1 ad addl %eax, (%edx) /* locked read-modify-write of the target */
64 1.1 ad ret
65 1.22 uebayasi END(_atomic_add_32)
66 1.1 ad
67 1.13 chs ENTRY(_atomic_add_32_nv) /* atomically add arg 2 to the word at arg 1; returns the new value in %eax */
68 1.1 ad movl 4(%esp), %edx /* %edx = arg 1: address of the target word */
69 1.1 ad movl 8(%esp), %eax /* %eax = arg 2: addend */
70 1.1 ad movl %eax, %ecx /* keep a copy of the addend; xaddl overwrites %eax */
71 1.27 maxv LOCK
72 1.1 ad xaddl %eax, (%edx) /* memory += %eax; %eax = previous memory value */
73 1.1 ad addl %ecx, %eax /* previous value + addend = value now stored */
74 1.1 ad ret
75 1.22 uebayasi END(_atomic_add_32_nv)
76 1.1 ad
77 1.13 chs ENTRY(_atomic_and_32) /* atomically AND arg 2 into the 32-bit word at arg 1; the result is not returned */
78 1.1 ad movl 4(%esp), %edx /* %edx = arg 1: address of the target word */
79 1.1 ad movl 8(%esp), %eax /* %eax = arg 2: mask */
80 1.27 maxv LOCK /* lock prefix for the andl on the next line */
81 1.1 ad andl %eax, (%edx) /* locked read-modify-write of the target */
82 1.1 ad ret
83 1.22 uebayasi END(_atomic_and_32)
84 1.1 ad
85 1.13 chs ENTRY(_atomic_and_32_nv) /* atomically AND arg 2 into the word at arg 1; returns the new value in %eax */
86 1.1 ad movl 4(%esp), %edx /* %edx = arg 1: address of the target word */
87 1.1 ad movl (%edx), %eax /* %eax = first guess at the current value */
88 1.14 ad 0: /* retry point: %eax holds the value expected to be in memory */
89 1.1 ad movl %eax, %ecx
90 1.1 ad andl 8(%esp), %ecx /* %ecx = expected value AND arg 2 = value to store */
91 1.27 maxv LOCK
92 1.1 ad cmpxchgl %ecx, (%edx) /* store %ecx if memory == %eax, else load memory into %eax */
93 1.14 ad jnz 1f /* ZF clear: the word changed since it was read */
94 1.1 ad movl %ecx, %eax /* success: return the value just stored */
95 1.1 ad ret
96 1.14 ad 1: /* NOTE(review): forward branch plus backward jmp instead of jnz 0b, presumably for branch prediction -- confirm */
97 1.14 ad jmp 0b /* retry with the value cmpxchgl left in %eax */
98 1.22 uebayasi END(_atomic_and_32_nv)
99 1.1 ad
100 1.13 chs ENTRY(_atomic_dec_32) /* atomically decrement the 32-bit word at arg 1; the result is not returned */
101 1.1 ad movl 4(%esp), %edx /* %edx = arg 1: address of the target word */
102 1.27 maxv LOCK /* lock prefix for the decl on the next line */
103 1.1 ad decl (%edx) /* locked read-modify-write of the target */
104 1.1 ad ret
105 1.22 uebayasi END(_atomic_dec_32)
106 1.1 ad
107 1.13 chs ENTRY(_atomic_dec_32_nv) /* atomically decrement the word at arg 1; returns the new value in %eax */
108 1.1 ad movl 4(%esp), %edx /* %edx = arg 1: address of the target word */
109 1.1 ad movl $-1, %eax /* decrement is done as an exchange-and-add of -1 */
110 1.27 maxv LOCK
111 1.1 ad xaddl %eax, (%edx) /* memory += -1; %eax = previous memory value */
112 1.1 ad decl %eax /* previous value - 1 = value now stored */
113 1.1 ad ret
114 1.22 uebayasi END(_atomic_dec_32_nv)
115 1.1 ad
116 1.13 chs ENTRY(_atomic_inc_32) /* atomically increment the 32-bit word at arg 1; the result is not returned */
117 1.1 ad movl 4(%esp), %edx /* %edx = arg 1: address of the target word */
118 1.27 maxv LOCK /* lock prefix for the incl on the next line */
119 1.1 ad incl (%edx) /* locked read-modify-write of the target */
120 1.1 ad ret
121 1.22 uebayasi END(_atomic_inc_32)
122 1.1 ad
123 1.13 chs ENTRY(_atomic_inc_32_nv) /* atomically increment the word at arg 1; returns the new value in %eax */
124 1.1 ad movl 4(%esp), %edx /* %edx = arg 1: address of the target word */
125 1.1 ad movl $1, %eax /* increment is done as an exchange-and-add of 1 */
126 1.27 maxv LOCK
127 1.1 ad xaddl %eax, (%edx) /* memory += 1; %eax = previous memory value */
128 1.1 ad incl %eax /* previous value + 1 = value now stored */
129 1.1 ad ret
130 1.22 uebayasi END(_atomic_inc_32_nv)
131 1.1 ad
132 1.13 chs ENTRY(_atomic_or_32) /* atomically OR arg 2 into the 32-bit word at arg 1; the result is not returned */
133 1.1 ad movl 4(%esp), %edx /* %edx = arg 1: address of the target word */
134 1.1 ad movl 8(%esp), %eax /* %eax = arg 2: bits to set */
135 1.27 maxv LOCK /* lock prefix for the orl on the next line */
136 1.1 ad orl %eax, (%edx) /* locked read-modify-write of the target */
137 1.1 ad ret
138 1.22 uebayasi END(_atomic_or_32)
139 1.1 ad
140 1.13 chs ENTRY(_atomic_or_32_nv) /* atomically OR arg 2 into the word at arg 1; returns the new value in %eax */
141 1.1 ad movl 4(%esp), %edx /* %edx = arg 1: address of the target word */
142 1.1 ad movl (%edx), %eax /* %eax = first guess at the current value */
143 1.14 ad 0: /* retry point: %eax holds the value expected to be in memory */
144 1.1 ad movl %eax, %ecx
145 1.1 ad orl 8(%esp), %ecx /* %ecx = expected value OR arg 2 = value to store */
146 1.27 maxv LOCK
147 1.1 ad cmpxchgl %ecx, (%edx) /* store %ecx if memory == %eax, else load memory into %eax */
148 1.14 ad jnz 1f /* ZF clear: the word changed since it was read */
149 1.1 ad movl %ecx, %eax /* success: return the value just stored */
150 1.1 ad ret
151 1.14 ad 1: /* NOTE(review): forward branch plus backward jmp instead of jnz 0b, presumably for branch prediction -- confirm */
152 1.14 ad jmp 0b /* retry with the value cmpxchgl left in %eax */
153 1.22 uebayasi END(_atomic_or_32_nv)
154 1.1 ad
155 1.13 chs ENTRY(_atomic_swap_32) /* atomically store arg 2 into the word at arg 1; returns the previous value in %eax */
156 1.1 ad movl 4(%esp), %edx /* %edx = arg 1: address of the target word */
157 1.1 ad movl 8(%esp), %eax /* %eax = arg 2: value to store */
158 1.1 ad xchgl %eax, (%edx) /* no LOCK written: xchg with a memory operand is locked by the CPU itself */
159 1.1 ad ret
160 1.22 uebayasi END(_atomic_swap_32)
161 1.1 ad
162 1.13 chs ENTRY(_atomic_cas_32) /* compare-and-swap: if the word at arg 1 equals arg 2, store arg 3; returns the previous value */
163 1.1 ad movl 4(%esp), %edx /* %edx = arg 1: address of the target word */
164 1.1 ad movl 8(%esp), %eax /* %eax = arg 2: expected value */
165 1.1 ad movl 12(%esp), %ecx /* %ecx = arg 3: replacement value */
166 1.27 maxv LOCK
167 1.1 ad cmpxchgl %ecx, (%edx) /* on mismatch memory is left alone and loaded into %eax */
168 1.1 ad /* %eax now contains the old value */
169 1.1 ad ret
170 1.22 uebayasi END(_atomic_cas_32)
171 1.1 ad
172 1.13 chs ENTRY(_atomic_cas_32_ni) /* same sequence as _atomic_cas_32 but with no lock prefix on the cmpxchgl */
173 1.9 ad movl 4(%esp), %edx /* %edx = arg 1: address of the target word */
174 1.9 ad movl 8(%esp), %eax /* %eax = arg 2: expected value */
175 1.9 ad movl 12(%esp), %ecx /* %ecx = arg 3: replacement value */
176 1.9 ad cmpxchgl %ecx, (%edx) /* unlocked; NOTE(review): "_ni" presumably means non-interlocked -- confirm */
177 1.9 ad /* %eax now contains the old value */
178 1.9 ad ret
179 1.22 uebayasi END(_atomic_cas_32_ni)
180 1.9 ad
181 1.13 chs ENTRY(_membar_consumer) /* load-before-anything barrier; executes no instruction other than ret */
182 1.31 riastrad /*
183 1.31 riastrad * Every load from normal memory is a load-acquire on x86, so
184 1.31 riastrad * there is never any need for explicit barriers to order
185 1.31 riastrad * load-before-anything.
186 1.31 riastrad */
187 1.1 ad ret
188 1.22 uebayasi END(_membar_consumer)
189 1.1 ad
190 1.13 chs ENTRY(_membar_producer) /* anything-before-store barrier; executes no instruction other than ret */
191 1.32 riastrad /*
192 1.32 riastrad * Every store to normal memory is a store-release on x86, so
193 1.32 riastrad * there is never any need for explicit barriers to order
194 1.32 riastrad * anything-before-store.
195 1.32 riastrad */
196 1.1 ad ret
197 1.22 uebayasi END(_membar_producer)
198 1.1 ad
199 1.13 chs ENTRY(_membar_sync) /* full barrier: the only barrier here that orders store-before-load */
200 1.33 riastrad /*
201 1.33 riastrad * MFENCE, or a serializing instruction like a locked addl,
202 1.33 riastrad * is necessary to order store-before-load. Every other
203 1.33 riastrad * ordering -- load-before-anything, anything-before-store --
204 1.33 riastrad * is already guaranteed without explicit barriers.
205 1.33 riastrad */
206 1.28 maxv HOTPATCH_SSE2_MFENCE /* expands to nothing unless _HARDKERNEL is defined */
207 1.28 maxv /* 7 bytes of instructions */
208 1.27 maxv LOCK
209 1.1 ad addl $0, -4(%esp) /* adds zero to the word just below %esp: memory is unchanged, the locked access is the barrier */
210 1.1 ad ret
211 1.22 uebayasi END(_membar_sync)
212 1.1 ad
213 1.21 christos #if defined(__HAVE_ATOMIC64_OPS) || defined(_KERNEL)
214 1.24 bouyer #ifdef XENPV
215 1.23 bouyer STRONG_ALIAS(_atomic_cas_64,_atomic_cas_cx8) /* XENPV: always use the cmpxchg8b routine */
216 1.23 bouyer #else
217 1.21 christos ENTRY(_atomic_cas_64) /* 64-bit compare-and-swap without cmpxchg8b; previous value returned in %edx:%eax */
218 1.29 maxv HOTPATCH_CAS_64 /* the sequence below must keep its size; the fix only reorders instructions */
219 1.29 maxv /* 49 bytes of instructions */
220 1.6 ad pushl %edi /* save the registers overwritten below */
221 1.6 ad pushl %ebx
222 1.6 ad movl 12(%esp), %edi /* arg 1 (two pushes + return address = 12): address of the 64-bit target */
223 1.6 ad movl 16(%esp), %eax /* %edx:%eax = expected value (low word, then high word) */
224 1.6 ad movl 20(%esp), %edx
225 1.6 ad movl 24(%esp), %ebx /* %ecx:%ebx = replacement value (low word, then high word) */
226 1.6 ad movl 28(%esp), %ecx
227 1.15 pooka #ifdef _HARDKERNEL
228 1.14 ad pushf /* pushed only after the argument loads: pushing it first shifts every offset above by 4 */
229 1.6 ad cli /* no lock prefix is used; the compare and store rely on interrupts being off */
230 1.29 maxv #endif
231 1.6 ad cmpl 0(%edi), %eax /* low words differ? */
232 1.6 ad jne 2f
233 1.6 ad cmpl 4(%edi), %edx /* high words differ? */
234 1.6 ad jne 2f
235 1.6 ad movl %ebx, 0(%edi) /* match: store the replacement value */
236 1.6 ad movl %ecx, 4(%edi)
237 1.6 ad 1:
238 1.21 christos #ifdef _HARDKERNEL
239 1.14 ad popf /* flags were pushed last, so they are popped first */
240 1.29 maxv #endif
241 1.6 ad popl %ebx
242 1.6 ad popl %edi
243 1.6 ad ret
244 1.6 ad 2:
245 1.6 ad movl 0(%edi), %eax /* mismatch: return the value found in memory */
246 1.6 ad movl 4(%edi), %edx
247 1.6 ad jmp 1b
248 1.22 uebayasi END(_atomic_cas_64)
249 1.29 maxv #endif /* !XENPV */
250 1.6 ad
251 1.13 chs ENTRY(_atomic_cas_cx8) /* 64-bit compare-and-swap using lock cmpxchg8b; previous value returned in %edx:%eax */
252 1.29 maxv /* 49 bytes of instructions */
253 1.6 ad pushl %edi /* save the registers overwritten below */
254 1.6 ad pushl %ebx
255 1.6 ad movl 12(%esp), %edi /* arg 1 (two pushes + return address = 12): address of the 64-bit target */
256 1.6 ad movl 16(%esp), %eax /* %edx:%eax = expected value (low word, then high word) */
257 1.6 ad movl 20(%esp), %edx
258 1.6 ad movl 24(%esp), %ebx /* %ecx:%ebx = replacement value (low word, then high word) */
259 1.6 ad movl 28(%esp), %ecx
260 1.27 maxv LOCK
261 1.6 ad cmpxchg8b (%edi) /* if memory == %edx:%eax store %ecx:%ebx, else load memory into %edx:%eax */
262 1.6 ad popl %ebx
263 1.6 ad popl %edi
264 1.6 ad ret
265 1.21 christos #ifdef _HARDKERNEL
266 1.29 maxv .space 20, 0xCC /* 20 bytes of 0xCC padding after the ret */
267 1.17 enami #endif
268 1.22 uebayasi END(_atomic_cas_cx8)
269 1.29 maxv LABEL(_atomic_cas_cx8_end) /* marks the end of the routine, padding included */
270 1.21 christos #endif /* __HAVE_ATOMIC64_OPS || _KERNEL */
271 1.6 ad
272 1.1 ad ALIAS(atomic_add_32,_atomic_add_32) /* public names; strong or weak per the ALIAS() definition at the top of the file */
273 1.4 ad ALIAS(atomic_add_int,_atomic_add_32) /* the int, long and ptr variants all share the 32-bit implementation */
274 1.4 ad ALIAS(atomic_add_long,_atomic_add_32)
275 1.1 ad ALIAS(atomic_add_ptr,_atomic_add_32)
276 1.1 ad
277 1.1 ad ALIAS(atomic_add_32_nv,_atomic_add_32_nv)
278 1.4 ad ALIAS(atomic_add_int_nv,_atomic_add_32_nv)
279 1.4 ad ALIAS(atomic_add_long_nv,_atomic_add_32_nv)
280 1.1 ad ALIAS(atomic_add_ptr_nv,_atomic_add_32_nv)
281 1.1 ad
282 1.1 ad ALIAS(atomic_and_32,_atomic_and_32)
283 1.1 ad ALIAS(atomic_and_uint,_atomic_and_32)
284 1.1 ad ALIAS(atomic_and_ulong,_atomic_and_32)
285 1.1 ad ALIAS(atomic_and_ptr,_atomic_and_32)
286 1.1 ad
287 1.1 ad ALIAS(atomic_and_32_nv,_atomic_and_32_nv)
288 1.1 ad ALIAS(atomic_and_uint_nv,_atomic_and_32_nv)
289 1.1 ad ALIAS(atomic_and_ulong_nv,_atomic_and_32_nv)
290 1.1 ad ALIAS(atomic_and_ptr_nv,_atomic_and_32_nv)
291 1.1 ad
292 1.1 ad ALIAS(atomic_dec_32,_atomic_dec_32)
293 1.1 ad ALIAS(atomic_dec_uint,_atomic_dec_32)
294 1.1 ad ALIAS(atomic_dec_ulong,_atomic_dec_32)
295 1.1 ad ALIAS(atomic_dec_ptr,_atomic_dec_32)
296 1.1 ad
297 1.1 ad ALIAS(atomic_dec_32_nv,_atomic_dec_32_nv)
298 1.1 ad ALIAS(atomic_dec_uint_nv,_atomic_dec_32_nv)
299 1.1 ad ALIAS(atomic_dec_ulong_nv,_atomic_dec_32_nv)
300 1.1 ad ALIAS(atomic_dec_ptr_nv,_atomic_dec_32_nv)
301 1.1 ad
302 1.1 ad ALIAS(atomic_inc_32,_atomic_inc_32)
303 1.1 ad ALIAS(atomic_inc_uint,_atomic_inc_32)
304 1.1 ad ALIAS(atomic_inc_ulong,_atomic_inc_32)
305 1.1 ad ALIAS(atomic_inc_ptr,_atomic_inc_32)
306 1.1 ad
307 1.1 ad ALIAS(atomic_inc_32_nv,_atomic_inc_32_nv)
308 1.1 ad ALIAS(atomic_inc_uint_nv,_atomic_inc_32_nv)
309 1.1 ad ALIAS(atomic_inc_ulong_nv,_atomic_inc_32_nv)
310 1.1 ad ALIAS(atomic_inc_ptr_nv,_atomic_inc_32_nv)
311 1.1 ad
312 1.1 ad ALIAS(atomic_or_32,_atomic_or_32)
313 1.1 ad ALIAS(atomic_or_uint,_atomic_or_32)
314 1.1 ad ALIAS(atomic_or_ulong,_atomic_or_32)
315 1.1 ad ALIAS(atomic_or_ptr,_atomic_or_32)
316 1.1 ad
317 1.1 ad ALIAS(atomic_or_32_nv,_atomic_or_32_nv)
318 1.1 ad ALIAS(atomic_or_uint_nv,_atomic_or_32_nv)
319 1.1 ad ALIAS(atomic_or_ulong_nv,_atomic_or_32_nv)
320 1.1 ad ALIAS(atomic_or_ptr_nv,_atomic_or_32_nv)
321 1.1 ad
322 1.1 ad ALIAS(atomic_swap_32,_atomic_swap_32)
323 1.1 ad ALIAS(atomic_swap_uint,_atomic_swap_32)
324 1.1 ad ALIAS(atomic_swap_ulong,_atomic_swap_32)
325 1.1 ad ALIAS(atomic_swap_ptr,_atomic_swap_32)
326 1.1 ad
327 1.1 ad ALIAS(atomic_cas_32,_atomic_cas_32)
328 1.1 ad ALIAS(atomic_cas_uint,_atomic_cas_32)
329 1.1 ad ALIAS(atomic_cas_ulong,_atomic_cas_32)
330 1.1 ad ALIAS(atomic_cas_ptr,_atomic_cas_32)
331 1.1 ad
332 1.9 ad ALIAS(atomic_cas_32_ni,_atomic_cas_32_ni)
333 1.9 ad ALIAS(atomic_cas_uint_ni,_atomic_cas_32_ni)
334 1.9 ad ALIAS(atomic_cas_ulong_ni,_atomic_cas_32_ni)
335 1.9 ad ALIAS(atomic_cas_ptr_ni,_atomic_cas_32_ni)
336 1.9 ad
337 1.21 christos #if defined(__HAVE_ATOMIC64_OPS) || defined(_KERNEL)
338 1.6 ad ALIAS(atomic_cas_64,_atomic_cas_64) /* 64-bit names exist only under the same condition as the 64-bit code */
339 1.9 ad ALIAS(atomic_cas_64_ni,_atomic_cas_64) /* the _ni name shares _atomic_cas_64; there is no separate 64-bit _ni routine */
340 1.20 martin ALIAS(__sync_val_compare_and_swap_8,_atomic_cas_64)
341 1.21 christos #endif /* __HAVE_ATOMIC64_OPS || _KERNEL */
342 1.6 ad
343 1.1 ad ALIAS(membar_consumer,_membar_consumer) /* public barrier names; strong or weak per ALIAS() */
344 1.1 ad ALIAS(membar_producer,_membar_producer)
345 1.8 ad ALIAS(membar_enter,_membar_sync) /* must order earlier stores before later loads; _membar_consumer is a bare ret and cannot */
346 1.8 ad ALIAS(membar_exit,_membar_producer) /* anything-before-store ordering, which _membar_producer's comment says needs no instruction */
347 1.1 ad ALIAS(membar_sync,_membar_sync)
348 1.5 ad
349 1.5 ad STRONG_ALIAS(_atomic_add_int,_atomic_add_32) /* underscore-prefixed int/long/ptr names: always strong aliases, independent of _KERNEL */
350 1.5 ad STRONG_ALIAS(_atomic_add_long,_atomic_add_32)
351 1.5 ad STRONG_ALIAS(_atomic_add_ptr,_atomic_add_32)
352 1.5 ad
353 1.5 ad STRONG_ALIAS(_atomic_add_int_nv,_atomic_add_32_nv)
354 1.5 ad STRONG_ALIAS(_atomic_add_long_nv,_atomic_add_32_nv)
355 1.5 ad STRONG_ALIAS(_atomic_add_ptr_nv,_atomic_add_32_nv)
356 1.5 ad
357 1.5 ad STRONG_ALIAS(_atomic_and_uint,_atomic_and_32)
358 1.5 ad STRONG_ALIAS(_atomic_and_ulong,_atomic_and_32)
359 1.5 ad STRONG_ALIAS(_atomic_and_ptr,_atomic_and_32)
360 1.5 ad
361 1.5 ad STRONG_ALIAS(_atomic_and_uint_nv,_atomic_and_32_nv)
362 1.5 ad STRONG_ALIAS(_atomic_and_ulong_nv,_atomic_and_32_nv)
363 1.5 ad STRONG_ALIAS(_atomic_and_ptr_nv,_atomic_and_32_nv)
364 1.5 ad
365 1.5 ad STRONG_ALIAS(_atomic_dec_uint,_atomic_dec_32)
366 1.5 ad STRONG_ALIAS(_atomic_dec_ulong,_atomic_dec_32)
367 1.5 ad STRONG_ALIAS(_atomic_dec_ptr,_atomic_dec_32)
368 1.5 ad
369 1.5 ad STRONG_ALIAS(_atomic_dec_uint_nv,_atomic_dec_32_nv)
370 1.5 ad STRONG_ALIAS(_atomic_dec_ulong_nv,_atomic_dec_32_nv)
371 1.5 ad STRONG_ALIAS(_atomic_dec_ptr_nv,_atomic_dec_32_nv)
372 1.5 ad
373 1.5 ad STRONG_ALIAS(_atomic_inc_uint,_atomic_inc_32)
374 1.5 ad STRONG_ALIAS(_atomic_inc_ulong,_atomic_inc_32)
375 1.5 ad STRONG_ALIAS(_atomic_inc_ptr,_atomic_inc_32)
376 1.5 ad
377 1.5 ad STRONG_ALIAS(_atomic_inc_uint_nv,_atomic_inc_32_nv)
378 1.5 ad STRONG_ALIAS(_atomic_inc_ulong_nv,_atomic_inc_32_nv)
379 1.5 ad STRONG_ALIAS(_atomic_inc_ptr_nv,_atomic_inc_32_nv)
380 1.5 ad
381 1.5 ad STRONG_ALIAS(_atomic_or_uint,_atomic_or_32)
382 1.5 ad STRONG_ALIAS(_atomic_or_ulong,_atomic_or_32)
383 1.5 ad STRONG_ALIAS(_atomic_or_ptr,_atomic_or_32)
384 1.5 ad
385 1.5 ad STRONG_ALIAS(_atomic_or_uint_nv,_atomic_or_32_nv)
386 1.5 ad STRONG_ALIAS(_atomic_or_ulong_nv,_atomic_or_32_nv)
387 1.5 ad STRONG_ALIAS(_atomic_or_ptr_nv,_atomic_or_32_nv)
388 1.5 ad
389 1.5 ad STRONG_ALIAS(_atomic_swap_uint,_atomic_swap_32)
390 1.5 ad STRONG_ALIAS(_atomic_swap_ulong,_atomic_swap_32)
391 1.5 ad STRONG_ALIAS(_atomic_swap_ptr,_atomic_swap_32)
392 1.5 ad
393 1.5 ad STRONG_ALIAS(_atomic_cas_uint,_atomic_cas_32)
394 1.5 ad STRONG_ALIAS(_atomic_cas_ulong,_atomic_cas_32)
395 1.5 ad STRONG_ALIAS(_atomic_cas_ptr,_atomic_cas_32)
396 1.8 ad
397 1.9 ad STRONG_ALIAS(_atomic_cas_uint_ni,_atomic_cas_32_ni)
398 1.9 ad STRONG_ALIAS(_atomic_cas_ulong_ni,_atomic_cas_32_ni)
399 1.9 ad STRONG_ALIAS(_atomic_cas_ptr_ni,_atomic_cas_32_ni)
400 1.9 ad
401 1.8 ad STRONG_ALIAS(_membar_enter,_membar_sync) /* must order earlier stores before later loads; _membar_consumer is a bare ret and cannot */
402 1.8 ad STRONG_ALIAS(_membar_exit,_membar_producer) /* anything-before-store ordering, which _membar_producer's comment says needs no instruction */
403 1.28 maxv
404 1.28 maxv #ifdef _HARDKERNEL
405 1.28 maxv .section .rodata /* assembled into read-only data rather than .text */
406 1.28 maxv
407 1.28 maxv LABEL(sse2_mfence) /* NOTE(review): presumably the bytes patched over the HOTPATCH_SSE2_MFENCE site in _membar_sync -- confirm */
408 1.28 maxv mfence
409 1.28 maxv ret
410 1.28 maxv nop; nop; nop; /* pad: mfence + ret + three nops gives the 7 bytes declared by HOTPATCH_SSE2_MFENCE */
411 1.28 maxv LABEL(sse2_mfence_end)
412 1.28 maxv #endif /* _HARDKERNEL */
413