Home | History | Annotate | Line # | Download | only in atomic
atomic.S revision 1.3
      1  1.3  ad /*	$NetBSD: atomic.S,v 1.3 2007/11/28 18:02:29 ad Exp $	*/
      2  1.1  ad 
      3  1.1  ad /*-
      4  1.1  ad  * Copyright (c) 2007 The NetBSD Foundation, Inc.
      5  1.1  ad  * All rights reserved.
      6  1.1  ad  *
      7  1.1  ad  * This code is derived from software contributed to The NetBSD Foundation
      8  1.1  ad  * by Jason R. Thorpe, and by Andrew Doran.
      9  1.1  ad  *
     10  1.1  ad  * Redistribution and use in source and binary forms, with or without
     11  1.1  ad  * modification, are permitted provided that the following conditions
     12  1.1  ad  * are met:
     13  1.1  ad  * 1. Redistributions of source code must retain the above copyright
     14  1.1  ad  *    notice, this list of conditions and the following disclaimer.
     15  1.1  ad  * 2. Redistributions in binary form must reproduce the above copyright
     16  1.1  ad  *    notice, this list of conditions and the following disclaimer in the
     17  1.1  ad  *    documentation and/or other materials provided with the distribution.
     18  1.1  ad  * 3. All advertising materials mentioning features or use of this software
     19  1.1  ad  *    must display the following acknowledgement:
     20  1.1  ad  *	This product includes software developed by the NetBSD
     21  1.1  ad  *	Foundation, Inc. and its contributors.
     22  1.1  ad  * 4. Neither the name of The NetBSD Foundation nor the names of its
     23  1.1  ad  *    contributors may be used to endorse or promote products derived
     24  1.1  ad  *    from this software without specific prior written permission.
     25  1.1  ad  *
     26  1.1  ad  * THIS SOFTWARE IS PROVIDED BY THE NETBSD FOUNDATION, INC. AND CONTRIBUTORS
     27  1.1  ad  * ``AS IS'' AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED
     28  1.1  ad  * TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR
     29  1.1  ad  * PURPOSE ARE DISCLAIMED.  IN NO EVENT SHALL THE FOUNDATION OR CONTRIBUTORS
     30  1.1  ad  * BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
     31  1.1  ad  * CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
     32  1.1  ad  * SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS
     33  1.1  ad  * INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN
     34  1.1  ad  * CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE)
     35  1.1  ad  * ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE
     36  1.1  ad  * POSSIBILITY OF SUCH DAMAGE.
     37  1.1  ad  */
     38  1.1  ad 
     39  1.1  ad #include <machine/asm.h>
     40  1.1  ad 
     41  1.1  ad #ifdef _KERNEL
     42  1.1  ad #define	LOCK(n)		.Lpatch/**/n:	lock
     43  1.1  ad #define	ALIAS(f, t)	STRONG_ALIAS(f,t)
     44  1.2  ad #define	END(a)		_ALIGN_TEXT; LABEL(a)
     45  1.1  ad #else
     46  1.1  ad #define	LOCK(n)		lock
     47  1.1  ad #define	ALIAS(f, t)	WEAK_ALIAS(f,t)
     48  1.2  ad #define	END(a)		/* nothing */
     49  1.1  ad #endif
     50  1.1  ad 
     51  1.1  ad 	.text
     52  1.1  ad 
     53  1.1  ad /* 32-bit */
     54  1.1  ad 
     55  1.1  ad NENTRY(_atomic_add_32)
     56  1.1  ad 	LOCK(1)
     57  1.1  ad 	addl	%esi, (%rdi)
     58  1.1  ad 	ret
     59  1.1  ad 
     60  1.1  ad NENTRY(_atomic_add_32_nv)
     61  1.1  ad 	movl	%esi, %eax
     62  1.1  ad 	LOCK(2)
     63  1.1  ad 	xaddl	%eax, (%rdi)
     64  1.1  ad 	addl	%esi, %eax
     65  1.1  ad 	ret
     66  1.1  ad 
     67  1.1  ad NENTRY(_atomic_and_32)
     68  1.1  ad 	LOCK(3)
     69  1.1  ad 	andl	%esi, (%rdi)
     70  1.1  ad 	ret
     71  1.1  ad 
     72  1.1  ad NENTRY(_atomic_and_32_nv)
     73  1.1  ad 	movl	(%rdi), %eax
     74  1.1  ad 1:
     75  1.1  ad 	movl	%eax, %ecx
     76  1.1  ad 	andl	%esi, %ecx
     77  1.1  ad 	LOCK(4)
     78  1.1  ad 	cmpxchgl %ecx, (%rdi)
     79  1.1  ad 	jnz	1b
     80  1.1  ad 	movl	%ecx, %eax
     81  1.1  ad 	ret
     82  1.1  ad 
     83  1.1  ad NENTRY(_atomic_dec_32)
     84  1.1  ad 	LOCK(5)
     85  1.1  ad 	decl	(%rdi)
     86  1.1  ad 	ret
     87  1.1  ad 
     88  1.1  ad NENTRY(_atomic_dec_32_nv)
     89  1.1  ad 	movl	$-1, %eax
     90  1.1  ad 	LOCK(6)
     91  1.1  ad 	xaddl	%eax, (%rdi)
     92  1.1  ad 	decl	%eax
     93  1.1  ad 	ret
     94  1.1  ad 
     95  1.1  ad NENTRY(_atomic_inc_32)
     96  1.1  ad 	LOCK(7)
     97  1.1  ad 	incl	(%rdi)
     98  1.1  ad 	ret
     99  1.1  ad 
    100  1.1  ad NENTRY(_atomic_inc_32_nv)
    101  1.1  ad 	movl	$1, %eax
    102  1.1  ad 	LOCK(8)
    103  1.1  ad 	xaddl	%eax, (%rdi)
    104  1.1  ad 	incl	%eax
    105  1.1  ad 	ret
    106  1.1  ad 
    107  1.1  ad NENTRY(_atomic_or_32)
    108  1.1  ad 	LOCK(9)
    109  1.1  ad 	orl	%esi, (%rdi)
    110  1.1  ad 	ret
    111  1.1  ad 
    112  1.1  ad NENTRY(_atomic_or_32_nv)
    113  1.1  ad 	movl	(%rdi), %eax
    114  1.1  ad 1:
    115  1.1  ad 	movl	%eax, %ecx
    116  1.1  ad 	orl	%esi, %ecx
    117  1.1  ad 	LOCK(10)
    118  1.1  ad 	cmpxchgl %ecx, (%rdi)
    119  1.1  ad 	jnz	1b
    120  1.1  ad 	movl	%ecx, %eax
    121  1.1  ad 	ret
    122  1.1  ad 
    123  1.1  ad NENTRY(_atomic_swap_32)
    124  1.1  ad 	xchgl	%esi, (%rdi)
    125  1.1  ad 	ret
    126  1.1  ad 
    127  1.1  ad NENTRY(_atomic_cas_32)
    128  1.1  ad 	movl	%esi, %eax
    129  1.1  ad 	LOCK(12)
    130  1.1  ad 	cmpxchgl %edx, (%rdi)
    131  1.1  ad 	/* %eax now contains the old value */
    132  1.1  ad 	ret
    133  1.1  ad 
    134  1.1  ad /* 64-bit */
    135  1.1  ad 
    136  1.1  ad NENTRY(_atomic_add_64)
    137  1.1  ad 	LOCK(13)
    138  1.1  ad 	addq	%rsi, (%rdi)
    139  1.1  ad 	ret
    140  1.1  ad 
    141  1.1  ad NENTRY(_atomic_add_64_nv)
    142  1.1  ad 	movq	%rsi, %rax
    143  1.1  ad 	LOCK(14)
    144  1.1  ad 	xaddq	%rax, (%rdi)
    145  1.1  ad 	addq	%rsi, %rax
    146  1.1  ad 	ret
    147  1.1  ad 
    148  1.1  ad NENTRY(_atomic_and_64)
    149  1.1  ad 	LOCK(15)
    150  1.1  ad 	andq	%rsi, (%rdi)
    151  1.1  ad 	ret
    152  1.1  ad 
    153  1.1  ad NENTRY(_atomic_and_64_nv)
    154  1.1  ad 	movq	(%rdi), %rax
    155  1.1  ad 1:
    156  1.1  ad 	movq	%rax, %rcx
    157  1.1  ad 	andq	%rsi, %rcx
    158  1.1  ad 	LOCK(16)
    159  1.1  ad 	cmpxchgq %rcx, (%rdi)
    160  1.1  ad 	jnz	1b
    161  1.1  ad 	movq	%rcx, %rax
    162  1.1  ad 	ret
    163  1.1  ad 
    164  1.1  ad NENTRY(_atomic_dec_64)
    165  1.1  ad 	LOCK(17)
    166  1.1  ad 	decq	(%rdi)
    167  1.1  ad 	ret
    168  1.1  ad 
    169  1.1  ad NENTRY(_atomic_dec_64_nv)
    170  1.1  ad 	movq	$-1, %rax
    171  1.1  ad 	LOCK(18)
    172  1.1  ad 	xaddq	%rax, (%rdi)
    173  1.1  ad 	decq	%rax
    174  1.1  ad 	ret
    175  1.1  ad 
    176  1.1  ad NENTRY(_atomic_inc_64)
    177  1.1  ad 	LOCK(19)
    178  1.1  ad 	incq	(%rdi)
    179  1.1  ad 	ret
    180  1.1  ad 
    181  1.1  ad NENTRY(_atomic_inc_64_nv)
    182  1.1  ad 	movq	$1, %rax
    183  1.1  ad 	LOCK(20)
    184  1.1  ad 	xaddq	%rax, (%rdi)
    185  1.1  ad 	incq	%rax
    186  1.1  ad 	ret
    187  1.1  ad 
    188  1.1  ad NENTRY(_atomic_or_64)
    189  1.1  ad 	LOCK(21)
    190  1.1  ad 	orq	%rsi, (%rdi)
    191  1.1  ad 	ret
    192  1.1  ad 
    193  1.1  ad NENTRY(_atomic_or_64_nv)
    194  1.1  ad 	movq	(%rdi), %rax
    195  1.1  ad 1:
    196  1.1  ad 	movq	%rax, %rcx
    197  1.1  ad 	orq	%rsi, %rcx
    198  1.1  ad 	LOCK(22)
    199  1.1  ad 	cmpxchgq %rcx, (%rdi)
    200  1.1  ad 	jnz	1b
    201  1.1  ad 	movq	%rcx, %rax
    202  1.1  ad 	ret
    203  1.1  ad 
    204  1.1  ad NENTRY(_atomic_swap_64)
    205  1.1  ad 	xchgq	%rsi, (%rdi)
    206  1.1  ad 	ret
    207  1.1  ad 
    208  1.1  ad NENTRY(_atomic_cas_64)
    209  1.1  ad 	movq	%rsi, %rax
    210  1.1  ad 	LOCK(24)
    211  1.1  ad 	cmpxchgl %edx, (%rdi)
    212  1.1  ad 	/* %eax now contains the old value */
    213  1.1  ad 	ret
    214  1.1  ad 
    215  1.1  ad /* memory barriers */
    216  1.1  ad 
    217  1.1  ad NENTRY(_membar_consumer)
    218  1.1  ad 	LOCK(25)
    219  1.1  ad 	addq	$0, -8(%rsp)
    220  1.1  ad 	ret
    221  1.2  ad END(membar_consumer_end)
    222  1.1  ad 
    223  1.1  ad NENTRY(_membar_producer)
    224  1.1  ad 	/* A store is enough */
    225  1.1  ad 	movq	$0, -8(%rsp)
    226  1.1  ad 	ret
    227  1.2  ad END(membar_producer_end)
    228  1.1  ad 
    229  1.1  ad NENTRY(_membar_enter)
    230  1.1  ad 	/* A store is enough */
    231  1.1  ad 	movq	$0, -8(%rsp)
    232  1.1  ad 	ret
    233  1.2  ad END(membar_enter_end)
    234  1.1  ad 
    235  1.1  ad NENTRY(_membar_exit)
    236  1.1  ad 	/* A store is enough */
    237  1.1  ad 	movq	$0, -8(%rsp)
    238  1.1  ad 	ret
    239  1.2  ad END(membar_exit_end)
    240  1.1  ad 
    241  1.1  ad NENTRY(_membar_sync)
    242  1.1  ad 	LOCK(26)
    243  1.1  ad 	addq	$0, -8(%rsp)
    244  1.1  ad 	ret
    245  1.2  ad END(membar_sync_end)
    246  1.1  ad 
    247  1.1  ad #ifdef _KERNEL
    248  1.1  ad NENTRY(sse2_lfence)
    249  1.1  ad 	lfence
    250  1.1  ad 	ret
    251  1.2  ad END(sse2_lfence_end)
    252  1.1  ad 
    253  1.1  ad NENTRY(sse2_mfence)
    254  1.1  ad 	mfence
    255  1.1  ad 	ret
    256  1.2  ad END(sse2_mfence_end)
    257  1.1  ad 
    258  1.1  ad atomic_lockpatch:
    259  1.1  ad 	.globl	atomic_lockpatch
    260  1.2  ad 	.quad	.Lpatch1, .Lpatch2, .Lpatch3, .Lpatch4, .Lpatch5
    261  1.2  ad 	.quad	.Lpatch6, .Lpatch7, .Lpatch8, .Lpatch9, .Lpatch10
    262  1.3  ad 	.quad	.Lpatch12, .Lpatch13, .Lpatch14, .Lpatch15
    263  1.2  ad 	.quad	.Lpatch16, .Lpatch17, .Lpatch18, .Lpatch19, .Lpatch20
    264  1.3  ad 	.quad	.Lpatch21, .Lpatch22, .Lpatch24, .Lpatch25
    265  1.2  ad 	.quad	.Lpatch26, 0
    266  1.1  ad #endif	/* _KERNEL */
    267  1.1  ad 
    268  1.1  ad ALIAS(atomic_add_32,_atomic_add_32)
    269  1.1  ad ALIAS(atomic_add_64,_atomic_add_64)
    270  1.1  ad ALIAS(atomic_add_uint,_atomic_add_32)
    271  1.1  ad ALIAS(atomic_add_ulong,_atomic_add_64)
    272  1.1  ad ALIAS(atomic_add_ptr,_atomic_add_64)
    273  1.1  ad 
    274  1.1  ad ALIAS(atomic_add_32_nv,_atomic_add_32_nv)
    275  1.1  ad ALIAS(atomic_add_64_nv,_atomic_add_64_nv)
    276  1.1  ad ALIAS(atomic_add_uint_nv,_atomic_add_32_nv)
    277  1.1  ad ALIAS(atomic_add_ulong_nv,_atomic_add_64_nv)
    278  1.1  ad ALIAS(atomic_add_ptr_nv,_atomic_add_64_nv)
    279  1.1  ad 
    280  1.1  ad ALIAS(atomic_and_32,_atomic_and_32)
    281  1.1  ad ALIAS(atomic_and_64,_atomic_and_64)
    282  1.1  ad ALIAS(atomic_and_uint,_atomic_and_32)
    283  1.1  ad ALIAS(atomic_and_ulong,_atomic_and_64)
    284  1.1  ad ALIAS(atomic_and_ptr,_atomic_and_64)
    285  1.1  ad 
    286  1.1  ad ALIAS(atomic_and_32_nv,_atomic_and_32_nv)
    287  1.1  ad ALIAS(atomic_and_64_nv,_atomic_and_64_nv)
    288  1.1  ad ALIAS(atomic_and_uint_nv,_atomic_and_32_nv)
    289  1.1  ad ALIAS(atomic_and_ulong_nv,_atomic_and_64_nv)
    290  1.1  ad ALIAS(atomic_and_ptr_nv,_atomic_and_64_nv)
    291  1.1  ad 
    292  1.1  ad ALIAS(atomic_dec_32,_atomic_dec_32)
    293  1.1  ad ALIAS(atomic_dec_64,_atomic_dec_64)
    294  1.1  ad ALIAS(atomic_dec_uint,_atomic_dec_32)
    295  1.1  ad ALIAS(atomic_dec_ulong,_atomic_dec_64)
    296  1.1  ad ALIAS(atomic_dec_ptr,_atomic_dec_64)
    297  1.1  ad 
    298  1.1  ad ALIAS(atomic_dec_32_nv,_atomic_dec_32_nv)
    299  1.1  ad ALIAS(atomic_dec_64_nv,_atomic_dec_64_nv)
    300  1.1  ad ALIAS(atomic_dec_uint_nv,_atomic_dec_32_nv)
    301  1.1  ad ALIAS(atomic_dec_ulong_nv,_atomic_dec_64_nv)
    302  1.1  ad ALIAS(atomic_dec_ptr_nv,_atomic_dec_64_nv)
    303  1.1  ad 
    304  1.1  ad ALIAS(atomic_inc_32,_atomic_inc_32)
    305  1.1  ad ALIAS(atomic_inc_64,_atomic_inc_64)
    306  1.1  ad ALIAS(atomic_inc_uint,_atomic_inc_32)
    307  1.1  ad ALIAS(atomic_inc_ulong,_atomic_inc_64)
    308  1.1  ad ALIAS(atomic_inc_ptr,_atomic_inc_64)
    309  1.1  ad 
    310  1.1  ad ALIAS(atomic_inc_32_nv,_atomic_inc_32_nv)
    311  1.1  ad ALIAS(atomic_inc_64_nv,_atomic_inc_64_nv)
    312  1.1  ad ALIAS(atomic_inc_uint_nv,_atomic_inc_32_nv)
    313  1.1  ad ALIAS(atomic_inc_ulong_nv,_atomic_inc_64_nv)
    314  1.1  ad ALIAS(atomic_inc_ptr_nv,_atomic_inc_64_nv)
    315  1.1  ad 
    316  1.1  ad ALIAS(atomic_or_32,_atomic_or_32)
    317  1.1  ad ALIAS(atomic_or_uint,_atomic_or_32)
    318  1.1  ad ALIAS(atomic_or_ulong,_atomic_or_64)
    319  1.1  ad ALIAS(atomic_or_ptr,_atomic_or_64)
    320  1.1  ad 
    321  1.1  ad ALIAS(atomic_or_32_nv,_atomic_or_32_nv)
    322  1.1  ad ALIAS(atomic_or_64_nv,_atomic_or_64_nv)
    323  1.1  ad ALIAS(atomic_or_uint_nv,_atomic_or_32_nv)
    324  1.1  ad ALIAS(atomic_or_ulong_nv,_atomic_or_64_nv)
    325  1.1  ad ALIAS(atomic_or_ptr_nv,_atomic_or_64_nv)
    326  1.1  ad 
    327  1.1  ad ALIAS(atomic_swap_32,_atomic_swap_32)
    328  1.1  ad ALIAS(atomic_swap_64,_atomic_swap_64)
    329  1.1  ad ALIAS(atomic_swap_uint,_atomic_swap_32)
    330  1.1  ad ALIAS(atomic_swap_ulong,_atomic_swap_64)
    331  1.1  ad ALIAS(atomic_swap_ptr,_atomic_swap_64)
    332  1.1  ad 
    333  1.1  ad ALIAS(atomic_cas_32,_atomic_cas_32)
    334  1.1  ad ALIAS(atomic_cas_64,_atomic_cas_64)
    335  1.1  ad ALIAS(atomic_cas_uint,_atomic_cas_32)
    336  1.1  ad ALIAS(atomic_cas_ulong,_atomic_cas_64)
    337  1.1  ad ALIAS(atomic_cas_ptr,_atomic_cas_64)
    338  1.1  ad 
    339  1.1  ad ALIAS(membar_consumer,_membar_consumer)
    340  1.1  ad ALIAS(membar_producer,_membar_producer)
    341  1.1  ad ALIAS(membar_enter,_membar_enter)
    342  1.1  ad ALIAS(membar_exit,_membar_exit)
    343  1.1  ad ALIAS(membar_sync,_membar_sync)
    344