Home | History | Annotate | Line # | Download | only in atomic
atomic.S revision 1.2
      1  1.2  ad /*	$NetBSD: atomic.S,v 1.2 2007/11/28 15:24:38 ad Exp $	*/
      2  1.1  ad 
      3  1.1  ad /*-
      4  1.1  ad  * Copyright (c) 2007 The NetBSD Foundation, Inc.
      5  1.1  ad  * All rights reserved.
      6  1.1  ad  *
      7  1.1  ad  * This code is derived from software contributed to The NetBSD Foundation
      8  1.1  ad  * by Jason R. Thorpe, and by Andrew Doran.
      9  1.1  ad  *
     10  1.1  ad  * Redistribution and use in source and binary forms, with or without
     11  1.1  ad  * modification, are permitted provided that the following conditions
     12  1.1  ad  * are met:
     13  1.1  ad  * 1. Redistributions of source code must retain the above copyright
     14  1.1  ad  *    notice, this list of conditions and the following disclaimer.
     15  1.1  ad  * 2. Redistributions in binary form must reproduce the above copyright
     16  1.1  ad  *    notice, this list of conditions and the following disclaimer in the
     17  1.1  ad  *    documentation and/or other materials provided with the distribution.
     18  1.1  ad  * 3. All advertising materials mentioning features or use of this software
     19  1.1  ad  *    must display the following acknowledgement:
     20  1.1  ad  *	This product includes software developed by the NetBSD
     21  1.1  ad  *	Foundation, Inc. and its contributors.
     22  1.1  ad  * 4. Neither the name of The NetBSD Foundation nor the names of its
     23  1.1  ad  *    contributors may be used to endorse or promote products derived
     24  1.1  ad  *    from this software without specific prior written permission.
     25  1.1  ad  *
     26  1.1  ad  * THIS SOFTWARE IS PROVIDED BY THE NETBSD FOUNDATION, INC. AND CONTRIBUTORS
     27  1.1  ad  * ``AS IS'' AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED
     28  1.1  ad  * TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR
     29  1.1  ad  * PURPOSE ARE DISCLAIMED.  IN NO EVENT SHALL THE FOUNDATION OR CONTRIBUTORS
     30  1.1  ad  * BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
     31  1.1  ad  * CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
     32  1.1  ad  * SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS
     33  1.1  ad  * INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN
     34  1.1  ad  * CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE)
     35  1.1  ad  * ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE
     36  1.1  ad  * POSSIBILITY OF SUCH DAMAGE.
     37  1.1  ad  */
     38  1.1  ad 
     39  1.1  ad #include <machine/asm.h>
     40  1.1  ad 
     41  1.1  ad #ifdef _KERNEL
     42  1.1  ad #define	LOCK(n)		.Lpatch/**/n:	lock
     43  1.1  ad #define	ALIAS(f, t)	STRONG_ALIAS(f,t)
     44  1.2  ad #define	END(a)		_ALIGN_TEXT; LABEL(a)
     45  1.1  ad #else
     46  1.1  ad #define	LOCK(n)		lock
     47  1.1  ad #define	ALIAS(f, t)	WEAK_ALIAS(f,t)
     48  1.2  ad #define	END(a)		/* nothing */
     49  1.1  ad #endif
     50  1.1  ad 
     51  1.1  ad 	.text
     52  1.1  ad 
     53  1.1  ad /* 32-bit */
     54  1.1  ad 
     55  1.1  ad NENTRY(_atomic_add_32)
     56  1.1  ad 	LOCK(1)
     57  1.1  ad 	addl	%esi, (%rdi)
     58  1.1  ad 	ret
     59  1.1  ad 
     60  1.1  ad NENTRY(_atomic_add_32_nv)
     61  1.1  ad 	movl	%esi, %eax
     62  1.1  ad 	LOCK(2)
     63  1.1  ad 	xaddl	%eax, (%rdi)
     64  1.1  ad 	addl	%esi, %eax
     65  1.1  ad 	ret
     66  1.1  ad 
     67  1.1  ad NENTRY(_atomic_and_32)
     68  1.1  ad 	LOCK(3)
     69  1.1  ad 	andl	%esi, (%rdi)
     70  1.1  ad 	ret
     71  1.1  ad 
     72  1.1  ad NENTRY(_atomic_and_32_nv)
     73  1.1  ad 	movl	(%rdi), %eax
     74  1.1  ad 1:
     75  1.1  ad 	movl	%eax, %ecx
     76  1.1  ad 	andl	%esi, %ecx
     77  1.1  ad 	LOCK(4)
     78  1.1  ad 	cmpxchgl %ecx, (%rdi)
     79  1.1  ad 	jnz	1b
     80  1.1  ad 	movl	%ecx, %eax
     81  1.1  ad 	ret
     82  1.1  ad 
     83  1.1  ad NENTRY(_atomic_dec_32)
     84  1.1  ad 	LOCK(5)
     85  1.1  ad 	decl	(%rdi)
     86  1.1  ad 	ret
     87  1.1  ad 
     88  1.1  ad NENTRY(_atomic_dec_32_nv)
     89  1.1  ad 	movl	$-1, %eax
     90  1.1  ad 	LOCK(6)
     91  1.1  ad 	xaddl	%eax, (%rdi)
     92  1.1  ad 	decl	%eax
     93  1.1  ad 	ret
     94  1.1  ad 
     95  1.1  ad NENTRY(_atomic_inc_32)
     96  1.1  ad 	LOCK(7)
     97  1.1  ad 	incl	(%rdi)
     98  1.1  ad 	ret
     99  1.1  ad 
    100  1.1  ad NENTRY(_atomic_inc_32_nv)
    101  1.1  ad 	movl	$1, %eax
    102  1.1  ad 	LOCK(8)
    103  1.1  ad 	xaddl	%eax, (%rdi)
    104  1.1  ad 	incl	%eax
    105  1.1  ad 	ret
    106  1.1  ad 
    107  1.1  ad NENTRY(_atomic_or_32)
    108  1.1  ad 	LOCK(9)
    109  1.1  ad 	orl	%esi, (%rdi)
    110  1.1  ad 	ret
    111  1.1  ad 
    112  1.1  ad NENTRY(_atomic_or_32_nv)
    113  1.1  ad 	movl	(%rdi), %eax
    114  1.1  ad 1:
    115  1.1  ad 	movl	%eax, %ecx
    116  1.1  ad 	orl	%esi, %ecx
    117  1.1  ad 	LOCK(10)
    118  1.1  ad 	cmpxchgl %ecx, (%rdi)
    119  1.1  ad 	jnz	1b
    120  1.1  ad 	movl	%ecx, %eax
    121  1.1  ad 	ret
    122  1.1  ad 
    123  1.1  ad NENTRY(_atomic_swap_32)
    124  1.1  ad 	LOCK(11)
    125  1.1  ad 	xchgl	%esi, (%rdi)
    126  1.1  ad 	ret
    127  1.1  ad 
    128  1.1  ad NENTRY(_atomic_cas_32)
    129  1.1  ad 	movl	%esi, %eax
    130  1.1  ad 	LOCK(12)
    131  1.1  ad 	cmpxchgl %edx, (%rdi)
    132  1.1  ad 	/* %eax now contains the old value */
    133  1.1  ad 	ret
    134  1.1  ad 
    135  1.1  ad /* 64-bit */
    136  1.1  ad 
    137  1.1  ad NENTRY(_atomic_add_64)
    138  1.1  ad 	LOCK(13)
    139  1.1  ad 	addq	%rsi, (%rdi)
    140  1.1  ad 	ret
    141  1.1  ad 
    142  1.1  ad NENTRY(_atomic_add_64_nv)
    143  1.1  ad 	movq	%rsi, %rax
    144  1.1  ad 	LOCK(14)
    145  1.1  ad 	xaddq	%rax, (%rdi)
    146  1.1  ad 	addq	%rsi, %rax
    147  1.1  ad 	ret
    148  1.1  ad 
    149  1.1  ad NENTRY(_atomic_and_64)
    150  1.1  ad 	LOCK(15)
    151  1.1  ad 	andq	%rsi, (%rdi)
    152  1.1  ad 	ret
    153  1.1  ad 
    154  1.1  ad NENTRY(_atomic_and_64_nv)
    155  1.1  ad 	movq	(%rdi), %rax
    156  1.1  ad 1:
    157  1.1  ad 	movq	%rax, %rcx
    158  1.1  ad 	andq	%rsi, %rcx
    159  1.1  ad 	LOCK(16)
    160  1.1  ad 	cmpxchgq %rcx, (%rdi)
    161  1.1  ad 	jnz	1b
    162  1.1  ad 	movq	%rcx, %rax
    163  1.1  ad 	ret
    164  1.1  ad 
    165  1.1  ad NENTRY(_atomic_dec_64)
    166  1.1  ad 	LOCK(17)
    167  1.1  ad 	decq	(%rdi)
    168  1.1  ad 	ret
    169  1.1  ad 
    170  1.1  ad NENTRY(_atomic_dec_64_nv)
    171  1.1  ad 	movq	$-1, %rax
    172  1.1  ad 	LOCK(18)
    173  1.1  ad 	xaddq	%rax, (%rdi)
    174  1.1  ad 	decq	%rax
    175  1.1  ad 	ret
    176  1.1  ad 
    177  1.1  ad NENTRY(_atomic_inc_64)
    178  1.1  ad 	LOCK(19)
    179  1.1  ad 	incq	(%rdi)
    180  1.1  ad 	ret
    181  1.1  ad 
    182  1.1  ad NENTRY(_atomic_inc_64_nv)
    183  1.1  ad 	movq	$1, %rax
    184  1.1  ad 	LOCK(20)
    185  1.1  ad 	xaddq	%rax, (%rdi)
    186  1.1  ad 	incq	%rax
    187  1.1  ad 	ret
    188  1.1  ad 
    189  1.1  ad NENTRY(_atomic_or_64)
    190  1.1  ad 	LOCK(21)
    191  1.1  ad 	orq	%rsi, (%rdi)
    192  1.1  ad 	ret
    193  1.1  ad 
    194  1.1  ad NENTRY(_atomic_or_64_nv)
    195  1.1  ad 	movq	(%rdi), %rax
    196  1.1  ad 1:
    197  1.1  ad 	movq	%rax, %rcx
    198  1.1  ad 	orq	%rsi, %rcx
    199  1.1  ad 	LOCK(22)
    200  1.1  ad 	cmpxchgq %rcx, (%rdi)
    201  1.1  ad 	jnz	1b
    202  1.1  ad 	movq	%rcx, %rax
    203  1.1  ad 	ret
    204  1.1  ad 
    205  1.1  ad NENTRY(_atomic_swap_64)
    206  1.1  ad 	LOCK(23)
    207  1.1  ad 	xchgq	%rsi, (%rdi)
    208  1.1  ad 	ret
    209  1.1  ad 
    210  1.1  ad NENTRY(_atomic_cas_64)
    211  1.1  ad 	movq	%rsi, %rax
    212  1.1  ad 	LOCK(24)
    213  1.1  ad 	cmpxchgl %edx, (%rdi)
    214  1.1  ad 	/* %eax now contains the old value */
    215  1.1  ad 	ret
    216  1.1  ad 
    217  1.1  ad /* memory barriers */
    218  1.1  ad 
    219  1.1  ad NENTRY(_membar_consumer)
    220  1.1  ad 	LOCK(25)
    221  1.1  ad 	addq	$0, -8(%rsp)
    222  1.1  ad 	ret
    223  1.2  ad END(membar_consumer_end)
    224  1.1  ad 
    225  1.1  ad NENTRY(_membar_producer)
    226  1.1  ad 	/* A store is enough */
    227  1.1  ad 	movq	$0, -8(%rsp)
    228  1.1  ad 	ret
    229  1.2  ad END(membar_producer_end)
    230  1.1  ad 
    231  1.1  ad NENTRY(_membar_enter)
    232  1.1  ad 	/* A store is enough */
    233  1.1  ad 	movq	$0, -8(%rsp)
    234  1.1  ad 	ret
    235  1.2  ad END(membar_enter_end)
    236  1.1  ad 
    237  1.1  ad NENTRY(_membar_exit)
    238  1.1  ad 	/* A store is enough */
    239  1.1  ad 	movq	$0, -8(%rsp)
    240  1.1  ad 	ret
    241  1.2  ad END(membar_exit_end)
    242  1.1  ad 
    243  1.1  ad NENTRY(_membar_sync)
    244  1.1  ad 	LOCK(26)
    245  1.1  ad 	addq	$0, -8(%rsp)
    246  1.1  ad 	ret
    247  1.2  ad END(membar_sync_end)
    248  1.1  ad 
    249  1.1  ad #ifdef _KERNEL
    250  1.1  ad NENTRY(sse2_lfence)
    251  1.1  ad 	lfence
    252  1.1  ad 	ret
    253  1.2  ad END(sse2_lfence_end)
    254  1.1  ad 
    255  1.1  ad NENTRY(sse2_mfence)
    256  1.1  ad 	mfence
    257  1.1  ad 	ret
    258  1.2  ad END(sse2_mfence_end)
    259  1.1  ad 
    260  1.1  ad atomic_lockpatch:
    261  1.1  ad 	.globl	atomic_lockpatch
    262  1.2  ad 	.quad	.Lpatch1, .Lpatch2, .Lpatch3, .Lpatch4, .Lpatch5
    263  1.2  ad 	.quad	.Lpatch6, .Lpatch7, .Lpatch8, .Lpatch9, .Lpatch10
    264  1.2  ad 	.quad	.Lpatch11, .Lpatch12, .Lpatch13, .Lpatch14, .Lpatch15
    265  1.2  ad 	.quad	.Lpatch16, .Lpatch17, .Lpatch18, .Lpatch19, .Lpatch20
    266  1.2  ad 	.quad	.Lpatch21, .Lpatch22, .Lpatch23, .Lpatch24, .Lpatch25
    267  1.2  ad 	.quad	.Lpatch26, 0
    268  1.1  ad #endif	/* _KERNEL */
    269  1.1  ad 
    270  1.1  ad ALIAS(atomic_add_32,_atomic_add_32)
    271  1.1  ad ALIAS(atomic_add_64,_atomic_add_64)
    272  1.1  ad ALIAS(atomic_add_uint,_atomic_add_32)
    273  1.1  ad ALIAS(atomic_add_ulong,_atomic_add_64)
    274  1.1  ad ALIAS(atomic_add_ptr,_atomic_add_64)
    275  1.1  ad 
    276  1.1  ad ALIAS(atomic_add_32_nv,_atomic_add_32_nv)
    277  1.1  ad ALIAS(atomic_add_64_nv,_atomic_add_64_nv)
    278  1.1  ad ALIAS(atomic_add_uint_nv,_atomic_add_32_nv)
    279  1.1  ad ALIAS(atomic_add_ulong_nv,_atomic_add_64_nv)
    280  1.1  ad ALIAS(atomic_add_ptr_nv,_atomic_add_64_nv)
    281  1.1  ad 
    282  1.1  ad ALIAS(atomic_and_32,_atomic_and_32)
    283  1.1  ad ALIAS(atomic_and_64,_atomic_and_64)
    284  1.1  ad ALIAS(atomic_and_uint,_atomic_and_32)
    285  1.1  ad ALIAS(atomic_and_ulong,_atomic_and_64)
    286  1.1  ad ALIAS(atomic_and_ptr,_atomic_and_64)
    287  1.1  ad 
    288  1.1  ad ALIAS(atomic_and_32_nv,_atomic_and_32_nv)
    289  1.1  ad ALIAS(atomic_and_64_nv,_atomic_and_64_nv)
    290  1.1  ad ALIAS(atomic_and_uint_nv,_atomic_and_32_nv)
    291  1.1  ad ALIAS(atomic_and_ulong_nv,_atomic_and_64_nv)
    292  1.1  ad ALIAS(atomic_and_ptr_nv,_atomic_and_64_nv)
    293  1.1  ad 
    294  1.1  ad ALIAS(atomic_dec_32,_atomic_dec_32)
    295  1.1  ad ALIAS(atomic_dec_64,_atomic_dec_64)
    296  1.1  ad ALIAS(atomic_dec_uint,_atomic_dec_32)
    297  1.1  ad ALIAS(atomic_dec_ulong,_atomic_dec_64)
    298  1.1  ad ALIAS(atomic_dec_ptr,_atomic_dec_64)
    299  1.1  ad 
    300  1.1  ad ALIAS(atomic_dec_32_nv,_atomic_dec_32_nv)
    301  1.1  ad ALIAS(atomic_dec_64_nv,_atomic_dec_64_nv)
    302  1.1  ad ALIAS(atomic_dec_uint_nv,_atomic_dec_32_nv)
    303  1.1  ad ALIAS(atomic_dec_ulong_nv,_atomic_dec_64_nv)
    304  1.1  ad ALIAS(atomic_dec_ptr_nv,_atomic_dec_64_nv)
    305  1.1  ad 
    306  1.1  ad ALIAS(atomic_inc_32,_atomic_inc_32)
    307  1.1  ad ALIAS(atomic_inc_64,_atomic_inc_64)
    308  1.1  ad ALIAS(atomic_inc_uint,_atomic_inc_32)
    309  1.1  ad ALIAS(atomic_inc_ulong,_atomic_inc_64)
    310  1.1  ad ALIAS(atomic_inc_ptr,_atomic_inc_64)
    311  1.1  ad 
    312  1.1  ad ALIAS(atomic_inc_32_nv,_atomic_inc_32_nv)
    313  1.1  ad ALIAS(atomic_inc_64_nv,_atomic_inc_64_nv)
    314  1.1  ad ALIAS(atomic_inc_uint_nv,_atomic_inc_32_nv)
    315  1.1  ad ALIAS(atomic_inc_ulong_nv,_atomic_inc_64_nv)
    316  1.1  ad ALIAS(atomic_inc_ptr_nv,_atomic_inc_64_nv)
    317  1.1  ad 
    318  1.1  ad ALIAS(atomic_or_32,_atomic_or_32)
    319  1.1  ad ALIAS(atomic_or_uint,_atomic_or_32)
    320  1.1  ad ALIAS(atomic_or_ulong,_atomic_or_64)
    321  1.1  ad ALIAS(atomic_or_ptr,_atomic_or_64)
    322  1.1  ad 
    323  1.1  ad ALIAS(atomic_or_32_nv,_atomic_or_32_nv)
    324  1.1  ad ALIAS(atomic_or_64_nv,_atomic_or_64_nv)
    325  1.1  ad ALIAS(atomic_or_uint_nv,_atomic_or_32_nv)
    326  1.1  ad ALIAS(atomic_or_ulong_nv,_atomic_or_64_nv)
    327  1.1  ad ALIAS(atomic_or_ptr_nv,_atomic_or_64_nv)
    328  1.1  ad 
    329  1.1  ad ALIAS(atomic_swap_32,_atomic_swap_32)
    330  1.1  ad ALIAS(atomic_swap_64,_atomic_swap_64)
    331  1.1  ad ALIAS(atomic_swap_uint,_atomic_swap_32)
    332  1.1  ad ALIAS(atomic_swap_ulong,_atomic_swap_64)
    333  1.1  ad ALIAS(atomic_swap_ptr,_atomic_swap_64)
    334  1.1  ad 
    335  1.1  ad ALIAS(atomic_cas_32,_atomic_cas_32)
    336  1.1  ad ALIAS(atomic_cas_64,_atomic_cas_64)
    337  1.1  ad ALIAS(atomic_cas_uint,_atomic_cas_32)
    338  1.1  ad ALIAS(atomic_cas_ulong,_atomic_cas_64)
    339  1.1  ad ALIAS(atomic_cas_ptr,_atomic_cas_64)
    340  1.1  ad 
    341  1.1  ad ALIAS(membar_consumer,_membar_consumer)
    342  1.1  ad ALIAS(membar_producer,_membar_producer)
    343  1.1  ad ALIAS(membar_enter,_membar_enter)
    344  1.1  ad ALIAS(membar_exit,_membar_exit)
    345  1.1  ad ALIAS(membar_sync,_membar_sync)
    346