Home | History | Annotate | Line # | Download | only in atomic
atomic.S revision 1.9
      1  1.9  ad /*	$NetBSD: atomic.S,v 1.9 2008/02/10 13:25:46 ad Exp $	*/
      2  1.1  ad 
      3  1.1  ad /*-
      4  1.1  ad  * Copyright (c) 2007 The NetBSD Foundation, Inc.
      5  1.1  ad  * All rights reserved.
      6  1.1  ad  *
      7  1.1  ad  * This code is derived from software contributed to The NetBSD Foundation
      8  1.1  ad  * by Jason R. Thorpe, and by Andrew Doran.
      9  1.1  ad  *
     10  1.1  ad  * Redistribution and use in source and binary forms, with or without
     11  1.1  ad  * modification, are permitted provided that the following conditions
     12  1.1  ad  * are met:
     13  1.1  ad  * 1. Redistributions of source code must retain the above copyright
     14  1.1  ad  *    notice, this list of conditions and the following disclaimer.
     15  1.1  ad  * 2. Redistributions in binary form must reproduce the above copyright
     16  1.1  ad  *    notice, this list of conditions and the following disclaimer in the
     17  1.1  ad  *    documentation and/or other materials provided with the distribution.
     18  1.1  ad  * 3. All advertising materials mentioning features or use of this software
     19  1.1  ad  *    must display the following acknowledgement:
     20  1.1  ad  *	This product includes software developed by the NetBSD
     21  1.1  ad  *	Foundation, Inc. and its contributors.
     22  1.1  ad  * 4. Neither the name of The NetBSD Foundation nor the names of its
     23  1.1  ad  *    contributors may be used to endorse or promote products derived
     24  1.1  ad  *    from this software without specific prior written permission.
     25  1.1  ad  *
     26  1.1  ad  * THIS SOFTWARE IS PROVIDED BY THE NETBSD FOUNDATION, INC. AND CONTRIBUTORS
     27  1.1  ad  * ``AS IS'' AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED
     28  1.1  ad  * TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR
     29  1.1  ad  * PURPOSE ARE DISCLAIMED.  IN NO EVENT SHALL THE FOUNDATION OR CONTRIBUTORS
     30  1.1  ad  * BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
     31  1.1  ad  * CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
     32  1.1  ad  * SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS
     33  1.1  ad  * INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN
     34  1.1  ad  * CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE)
     35  1.1  ad  * ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE
     36  1.1  ad  * POSSIBILITY OF SUCH DAMAGE.
     37  1.1  ad  */
     38  1.1  ad 
     39  1.1  ad #include <machine/asm.h>
     40  1.1  ad 
     /*
      * Build-dependent helper macros.
      *
      * LOCK(n)     - emits the x86 `lock` prefix for the instruction that
      *               follows it.  In the _KERNEL build the prefix is preceded
      *               by a local label .Lpatch<n> (the empty comment in the
      *               macro body is used to paste n onto the label name, which
      *               relies on traditional preprocessor behaviour).  Those
      *               labels are collected in the atomic_lockpatch table
      *               later in this file.
      * ALIAS(f, t) - STRONG_ALIAS in the kernel, WEAK_ALIAS otherwise.
      * END(a)      - kernel only: text alignment padding followed by label a,
      *               placed after a function body.  Expands to nothing in the
      *               non-kernel build.
      *
      * STRONG_ALIAS, WEAK_ALIAS, _ALIGN_TEXT and LABEL are not defined in this
      * file - presumably they come from <machine/asm.h>.
      */
     41  1.1  ad #ifdef _KERNEL
     42  1.1  ad #define	LOCK(n)		.Lpatch/**/n:	lock
     43  1.1  ad #define	ALIAS(f, t)	STRONG_ALIAS(f,t)
     44  1.2  ad #define	END(a)		_ALIGN_TEXT; LABEL(a)
     45  1.1  ad #else
     46  1.1  ad #define	LOCK(n)		lock
     47  1.1  ad #define	ALIAS(f, t)	WEAK_ALIAS(f,t)
     48  1.2  ad #define	END(a)		/* nothing */
     49  1.1  ad #endif
     50  1.1  ad 
     51  1.1  ad 	.text
     52  1.1  ad 
     /*
      * _atomic_add_32: add the second stack argument to the 32-bit word
      * addressed by the first stack argument, as one locked instruction.
      * No result is computed, %eax simply still holds the addend on return.
      */
     53  1.1  ad NENTRY(_atomic_add_32)
     54  1.1  ad 	movl	4(%esp), %edx	/* %edx = address of the target word */
     55  1.1  ad 	movl	8(%esp), %eax	/* %eax = value to add */
     56  1.1  ad 	LOCK(1)
     57  1.1  ad 	addl	%eax, (%edx)	/* locked read-modify-write of the target */
     58  1.1  ad 	ret
     59  1.1  ad 
     /*
      * _atomic_add_32_nv: same addition as _atomic_add_32, but returns the
      * new value of the word in %eax.
      */
     60  1.1  ad NENTRY(_atomic_add_32_nv)
     61  1.1  ad 	movl	4(%esp), %edx	/* %edx = address of the target word */
     62  1.1  ad 	movl	8(%esp), %eax	/* %eax = value to add */
     63  1.1  ad 	movl	%eax, %ecx	/* keep a copy, xaddl overwrites %eax */
     64  1.1  ad 	LOCK(2)
     65  1.1  ad 	xaddl	%eax, (%edx)	/* target += %eax, %eax = previous target value */
     66  1.1  ad 	addl	%ecx, %eax	/* previous value + addend = new value */
     67  1.1  ad 	ret
     68  1.1  ad 
     /*
      * _atomic_and_32: bitwise-AND the second stack argument into the 32-bit
      * word addressed by the first stack argument, as one locked instruction.
      * No result is computed.
      */
     69  1.1  ad NENTRY(_atomic_and_32)
     70  1.1  ad 	movl	4(%esp), %edx	/* %edx = address of the target word */
     71  1.1  ad 	movl	8(%esp), %eax	/* %eax = mask */
     72  1.1  ad 	LOCK(3)
     73  1.1  ad 	andl	%eax, (%edx)	/* locked read-modify-write of the target */
     74  1.1  ad 	ret
     75  1.1  ad 
     /*
      * _atomic_and_32_nv: bitwise-AND the second stack argument into the
      * 32-bit word addressed by the first stack argument and return the new
      * value in %eax.  Implemented as a compare-and-exchange retry loop
      * because the result of the AND has to be returned.
      */
     76  1.1  ad NENTRY(_atomic_and_32_nv)
     77  1.1  ad 	movl	4(%esp), %edx	/* %edx = address of the target word */
     78  1.1  ad 	movl	(%edx), %eax	/* %eax = first snapshot of the target */
     79  1.1  ad 1:
     80  1.1  ad 	movl	%eax, %ecx
     81  1.1  ad 	andl	8(%esp), %ecx	/* %ecx = snapshot AND mask = candidate new value */
     82  1.1  ad 	LOCK(4)
     83  1.1  ad 	cmpxchgl %ecx, (%edx)	/* store %ecx only if target still equals %eax */
     84  1.1  ad 	jnz	1b		/* mismatch: %eax was reloaded from the target, retry */
     85  1.1  ad 	movl	%ecx, %eax	/* return the value that was stored */
     86  1.1  ad 	ret
     87  1.1  ad 
     /*
      * _atomic_dec_32: decrement the 32-bit word addressed by the first stack
      * argument with one locked instruction.  No result is computed.
      */
     88  1.1  ad NENTRY(_atomic_dec_32)
     89  1.1  ad 	movl	4(%esp), %edx	/* %edx = address of the target word */
     90  1.1  ad 	LOCK(5)
     91  1.1  ad 	decl	(%edx)
     92  1.1  ad 	ret
     93  1.1  ad 
     /*
      * _atomic_dec_32_nv: decrement the 32-bit word addressed by the first
      * stack argument and return the new value in %eax.
      */
     94  1.1  ad NENTRY(_atomic_dec_32_nv)
     95  1.1  ad 	movl	4(%esp), %edx	/* %edx = address of the target word */
     96  1.1  ad 	movl	$-1, %eax	/* addend of -1 */
     97  1.1  ad 	LOCK(6)
     98  1.1  ad 	xaddl	%eax, (%edx)	/* target -= 1, %eax = previous target value */
     99  1.1  ad 	decl	%eax		/* previous value - 1 = new value */
    100  1.1  ad 	ret
    101  1.1  ad 
    /*
     * _atomic_inc_32: increment the 32-bit word addressed by the first stack
     * argument with one locked instruction.  No result is computed.
     */
    102  1.1  ad NENTRY(_atomic_inc_32)
    103  1.1  ad 	movl	4(%esp), %edx	/* %edx = address of the target word */
    104  1.1  ad 	LOCK(7)
    105  1.1  ad 	incl	(%edx)
    106  1.1  ad 	ret
    107  1.1  ad 
    /*
     * _atomic_inc_32_nv: increment the 32-bit word addressed by the first
     * stack argument and return the new value in %eax.
     */
    108  1.1  ad NENTRY(_atomic_inc_32_nv)
    109  1.1  ad 	movl	4(%esp), %edx	/* %edx = address of the target word */
    110  1.1  ad 	movl	$1, %eax	/* addend of 1 */
    111  1.1  ad 	LOCK(8)
    112  1.1  ad 	xaddl	%eax, (%edx)	/* target += 1, %eax = previous target value */
    113  1.1  ad 	incl	%eax		/* previous value + 1 = new value */
    114  1.1  ad 	ret
    115  1.1  ad 
    /*
     * _atomic_or_32: bitwise-OR the second stack argument into the 32-bit
     * word addressed by the first stack argument, as one locked instruction.
     * No result is computed.
     */
    116  1.1  ad NENTRY(_atomic_or_32)
    117  1.1  ad 	movl	4(%esp), %edx	/* %edx = address of the target word */
    118  1.1  ad 	movl	8(%esp), %eax	/* %eax = bits to set */
    119  1.1  ad 	LOCK(9)
    120  1.1  ad 	orl	%eax, (%edx)	/* locked read-modify-write of the target */
    121  1.1  ad 	ret
    122  1.1  ad 
    /*
     * _atomic_or_32_nv: bitwise-OR the second stack argument into the 32-bit
     * word addressed by the first stack argument and return the new value in
     * %eax.  Same compare-and-exchange retry loop as _atomic_and_32_nv.
     */
    123  1.1  ad NENTRY(_atomic_or_32_nv)
    124  1.1  ad 	movl	4(%esp), %edx	/* %edx = address of the target word */
    125  1.1  ad 	movl	(%edx), %eax	/* %eax = first snapshot of the target */
    126  1.1  ad 1:
    127  1.1  ad 	movl	%eax, %ecx
    128  1.1  ad 	orl	8(%esp), %ecx	/* %ecx = snapshot OR bits = candidate new value */
    129  1.1  ad 	LOCK(10)
    130  1.1  ad 	cmpxchgl %ecx, (%edx)	/* store %ecx only if target still equals %eax */
    131  1.1  ad 	jnz	1b		/* mismatch: %eax was reloaded from the target, retry */
    132  1.1  ad 	movl	%ecx, %eax	/* return the value that was stored */
    133  1.1  ad 	ret
    134  1.1  ad 
    /*
     * _atomic_swap_32: store the second stack argument into the 32-bit word
     * addressed by the first stack argument and return the previous contents
     * in %eax.
     *
     * There is no LOCK() here: xchg with a memory operand is always locked by
     * the processor, so no explicit prefix (and no patch label) is used.
     */
    135  1.1  ad NENTRY(_atomic_swap_32)
    136  1.1  ad 	movl	4(%esp), %edx	/* %edx = address of the target word */
    137  1.1  ad 	movl	8(%esp), %eax	/* %eax = value to store */
    138  1.1  ad 	xchgl	%eax, (%edx)	/* %eax = previous target value */
    139  1.1  ad 	ret
    140  1.1  ad 
    /*
     * _atomic_cas_32: locked 32-bit compare-and-swap.
     *
     * Stack arguments: 1 = address of the target word, 2 = expected value,
     * 3 = replacement value.  The replacement is stored only when the target
     * equals the expected value.  Returns in %eax the value the target held
     * before the operation, so the caller detects success by comparing the
     * return value with the expected value.
     */
    141  1.1  ad NENTRY(_atomic_cas_32)
    142  1.1  ad 	movl	4(%esp), %edx	/* %edx = address of the target word */
    143  1.1  ad 	movl	8(%esp), %eax	/* %eax = expected value */
    144  1.1  ad 	movl	12(%esp), %ecx	/* %ecx = replacement value */
    145  1.1  ad 	LOCK(12)
    146  1.1  ad 	cmpxchgl %ecx, (%edx)
    147  1.1  ad 	/* %eax now contains the old value */
    148  1.1  ad 	ret
    149  1.1  ad 
    /*
     * _atomic_cas_32_ni: 32-bit compare-and-swap with the same arguments and
     * return value as _atomic_cas_32, but issued without the lock prefix.
     * NOTE(review): the _ni suffix presumably means "not interlocked", i.e.
     * not atomic with respect to other processors - confirm with callers.
     */
    150  1.9  ad NENTRY(_atomic_cas_32_ni)
    151  1.9  ad 	movl	4(%esp), %edx	/* %edx = address of the target word */
    152  1.9  ad 	movl	8(%esp), %eax	/* %eax = expected value */
    153  1.9  ad 	movl	12(%esp), %ecx	/* %ecx = replacement value */
    154  1.9  ad 	cmpxchgl %ecx, (%edx)	/* deliberately unprefixed */
    155  1.9  ad 	/* %eax now contains the old value */
    156  1.9  ad 	ret
    157  1.9  ad 
    /*
     * _membar_consumer: memory barrier implemented as a locked add of zero to
     * the dword just below the stack pointer.  The memory contents are left
     * unchanged, the locked read-modify-write is what provides the ordering.
     *
     * In the kernel build END() places the label membar_consumer_end after
     * the body.  NOTE(review): presumably this lets the body be replaced at
     * run time (see sse2_lfence in this file) - confirm against the patch code.
     */
    158  1.1  ad NENTRY(_membar_consumer)
    159  1.1  ad 	LOCK(13)
    160  1.1  ad 	addl	$0, -4(%esp)
    161  1.1  ad 	ret
    162  1.2  ad END(membar_consumer_end)
    163  1.1  ad 
    /*
     * _membar_producer: store barrier implemented as a plain (unlocked) store
     * of zero to the dword just below the stack pointer.
     * NOTE(review): the slot at -4(%esp) is presumably treated as dead
     * scratch space - confirm nothing relies on its contents.
     *
     * In the kernel build END() places the label membar_producer_end after
     * the body.
     */
    164  1.1  ad NENTRY(_membar_producer)
    165  1.1  ad 	/* A store is enough */
    166  1.1  ad 	movl	$0, -4(%esp)
    167  1.1  ad 	ret
    168  1.2  ad END(membar_producer_end)
    169  1.1  ad 
    /*
     * _membar_sync: full memory barrier.  Same instruction sequence as
     * _membar_consumer: a locked add of zero to the dword just below the
     * stack pointer, which leaves memory unchanged.
     *
     * In the kernel build END() places the label membar_sync_end after the
     * body.  NOTE(review): presumably this lets the body be replaced at run
     * time (see sse2_mfence in this file) - confirm against the patch code.
     */
    170  1.1  ad NENTRY(_membar_sync)
    171  1.1  ad 	LOCK(14)
    172  1.1  ad 	addl	$0, -4(%esp)
    173  1.1  ad 	ret
    174  1.2  ad END(membar_sync_end)
    175  1.1  ad 
    176  1.1  ad #ifdef _KERNEL
    177  1.6  ad NENTRY(_atomic_cas_64)
    178  1.6  ad 	cli
    179  1.6  ad 	pushl	%edi
    180  1.6  ad 	pushl	%ebx
    181  1.6  ad 	movl	12(%esp), %edi
    182  1.6  ad 	movl	16(%esp), %eax
    183  1.6  ad 	movl	20(%esp), %edx
    184  1.6  ad 	movl	24(%esp), %ebx
    185  1.6  ad 	movl	28(%esp), %ecx
    186  1.6  ad 	cmpl	0(%edi), %eax
    187  1.6  ad 	jne	2f
    188  1.6  ad 	cmpl	4(%edi), %edx
    189  1.6  ad 	jne	2f
    190  1.6  ad 	movl	%ebx, 0(%edi)
    191  1.6  ad 	movl	%ecx, 4(%edi)
    192  1.6  ad 1:
    193  1.6  ad 	popl	%ebx
    194  1.6  ad 	popl	%edi
    195  1.6  ad 	sti
    196  1.6  ad 	ret
    197  1.6  ad 2:
    198  1.6  ad 	movl	0(%edi), %eax
    199  1.6  ad 	movl	4(%edi), %edx
    200  1.6  ad 	jmp	1b
    201  1.6  ad END(_atomic_cas_64_end)
    202  1.6  ad 
    /*
     * _atomic_cas_cx8 (kernel build): 64-bit compare-and-swap using a locked
     * cmpxchg8b.
     *
     * Stack arguments: 1 = address of the 64-bit target, 2/3 = low/high half
     * of the expected value, 4/5 = low/high half of the replacement value.
     * Returns in %edx:%eax the value the target held before the operation.
     *
     * The body is followed by 32 bytes of 0x90 (the nop opcode) and, through
     * END(), by the label _atomic_cas_cx8_end.  NOTE(review): presumably the
     * padding sizes this body so that it can be copied over _atomic_cas_64
     * at run time - confirm against the patch code.
     */
    203  1.6  ad NENTRY(_atomic_cas_cx8)
    204  1.6  ad 	pushl	%edi
    205  1.6  ad 	pushl	%ebx
    206  1.6  ad 	movl	12(%esp), %edi	/* %edi = address of the target */
    207  1.6  ad 	movl	16(%esp), %eax	/* %edx:%eax = expected value */
    208  1.6  ad 	movl	20(%esp), %edx
    209  1.6  ad 	movl	24(%esp), %ebx	/* %ecx:%ebx = replacement value */
    210  1.6  ad 	movl	28(%esp), %ecx
    211  1.6  ad 	LOCK(15)
    212  1.6  ad 	cmpxchg8b (%edi)	/* on mismatch %edx:%eax is loaded from the target */
    213  1.6  ad 	popl	%ebx
    214  1.6  ad 	popl	%edi
    215  1.6  ad 	ret
    216  1.7  ad 	.space	32, 0x90
    217  1.6  ad END(_atomic_cas_cx8_end)
    218  1.6  ad 
    /*
     * sse2_lfence (kernel build): executes a single lfence instruction and
     * returns.  END() places the label sse2_lfence_end after the body.
     * NOTE(review): presumably an alternative barrier body for CPUs with
     * SSE2 - confirm how it is selected.
     */
    219  1.1  ad NENTRY(sse2_lfence)
    220  1.1  ad 	lfence
    221  1.1  ad 	ret
    222  1.2  ad END(sse2_lfence_end)
    223  1.1  ad 
    /*
     * sse2_mfence (kernel build): executes a single mfence instruction and
     * returns.  END() places the label sse2_mfence_end after the body.
     * NOTE(review): presumably an alternative barrier body for CPUs with
     * SSE2 - confirm how it is selected.
     */
    224  1.1  ad NENTRY(sse2_mfence)
    225  1.1  ad 	mfence
    226  1.1  ad 	ret
    227  1.2  ad END(sse2_mfence_end)
    228  1.1  ad 
    /*
     * atomic_lockpatch (kernel build): global, zero-terminated table holding
     * the addresses of the .Lpatch<n> labels, i.e. of every lock prefix
     * emitted through LOCK(n) above.  There is no .Lpatch11 because
     * _atomic_swap_32 does not use LOCK().  The table is emitted in the
     * current section, no section directive follows the .text at the top of
     * this file.
     * NOTE(review): presumably consumed by code that rewrites the lock
     * prefixes at run time - confirm against the patch code.
     */
    229  1.1  ad atomic_lockpatch:
    230  1.1  ad 	.globl	atomic_lockpatch
    231  1.1  ad 	.long	.Lpatch1, .Lpatch2, .Lpatch3, .Lpatch4, .Lpatch5
    232  1.1  ad 	.long	.Lpatch6, .Lpatch7, .Lpatch8, .Lpatch9, .Lpatch10
    233  1.6  ad 	.long	.Lpatch12, .Lpatch13, .Lpatch14, .Lpatch15, 0
    234  1.7  ad #else
    /*
     * _atomic_cas_64 (non-kernel build): 64-bit compare-and-swap using a
     * locked cmpxchg8b.  The lock prefix is written directly rather than via
     * LOCK(), so no patch label is involved.
     *
     * Stack arguments: 1 = address of the 64-bit target, 2/3 = low/high half
     * of the expected value, 4/5 = low/high half of the replacement value.
     * Returns in %edx:%eax the value the target held before the operation.
     */
    235  1.7  ad NENTRY(_atomic_cas_64)
    236  1.7  ad 	pushl	%edi
    237  1.7  ad 	pushl	%ebx
    238  1.7  ad 	movl	12(%esp), %edi	/* %edi = address of the target */
    239  1.7  ad 	movl	16(%esp), %eax	/* %edx:%eax = expected value */
    240  1.7  ad 	movl	20(%esp), %edx
    241  1.7  ad 	movl	24(%esp), %ebx	/* %ecx:%ebx = replacement value */
    242  1.7  ad 	movl	28(%esp), %ecx
    243  1.7  ad 	lock
    244  1.7  ad 	cmpxchg8b (%edi)	/* on mismatch %edx:%eax is loaded from the target */
    245  1.7  ad 	popl	%ebx
    246  1.7  ad 	popl	%edi
    247  1.7  ad 	ret
    248  1.1  ad #endif	/* _KERNEL */
    249  1.1  ad 
    /*
     * Public names.  ALIAS() is a strong alias in the kernel build and a weak
     * alias otherwise (see the macro definitions at the top of this file).
     *
     * The int/uint, long/ulong and ptr variants all resolve to the 32-bit
     * implementations.  atomic_cas_64_ni resolves to the same routine as
     * atomic_cas_64.  membar_enter shares _membar_consumer (locked add) and
     * membar_exit shares _membar_producer (plain store).
     */
    250  1.1  ad ALIAS(atomic_add_32,_atomic_add_32)
    251  1.4  ad ALIAS(atomic_add_int,_atomic_add_32)
    252  1.4  ad ALIAS(atomic_add_long,_atomic_add_32)
    253  1.1  ad ALIAS(atomic_add_ptr,_atomic_add_32)
    254  1.1  ad 
    255  1.1  ad ALIAS(atomic_add_32_nv,_atomic_add_32_nv)
    256  1.4  ad ALIAS(atomic_add_int_nv,_atomic_add_32_nv)
    257  1.4  ad ALIAS(atomic_add_long_nv,_atomic_add_32_nv)
    258  1.1  ad ALIAS(atomic_add_ptr_nv,_atomic_add_32_nv)
    259  1.1  ad 
    260  1.1  ad ALIAS(atomic_and_32,_atomic_and_32)
    261  1.1  ad ALIAS(atomic_and_uint,_atomic_and_32)
    262  1.1  ad ALIAS(atomic_and_ulong,_atomic_and_32)
    263  1.1  ad ALIAS(atomic_and_ptr,_atomic_and_32)
    264  1.1  ad 
    265  1.1  ad ALIAS(atomic_and_32_nv,_atomic_and_32_nv)
    266  1.1  ad ALIAS(atomic_and_uint_nv,_atomic_and_32_nv)
    267  1.1  ad ALIAS(atomic_and_ulong_nv,_atomic_and_32_nv)
    268  1.1  ad ALIAS(atomic_and_ptr_nv,_atomic_and_32_nv)
    269  1.1  ad 
    270  1.1  ad ALIAS(atomic_dec_32,_atomic_dec_32)
    271  1.1  ad ALIAS(atomic_dec_uint,_atomic_dec_32)
    272  1.1  ad ALIAS(atomic_dec_ulong,_atomic_dec_32)
    273  1.1  ad ALIAS(atomic_dec_ptr,_atomic_dec_32)
    274  1.1  ad 
    275  1.1  ad ALIAS(atomic_dec_32_nv,_atomic_dec_32_nv)
    276  1.1  ad ALIAS(atomic_dec_uint_nv,_atomic_dec_32_nv)
    277  1.1  ad ALIAS(atomic_dec_ulong_nv,_atomic_dec_32_nv)
    278  1.1  ad ALIAS(atomic_dec_ptr_nv,_atomic_dec_32_nv)
    279  1.1  ad 
    280  1.1  ad ALIAS(atomic_inc_32,_atomic_inc_32)
    281  1.1  ad ALIAS(atomic_inc_uint,_atomic_inc_32)
    282  1.1  ad ALIAS(atomic_inc_ulong,_atomic_inc_32)
    283  1.1  ad ALIAS(atomic_inc_ptr,_atomic_inc_32)
    284  1.1  ad 
    285  1.1  ad ALIAS(atomic_inc_32_nv,_atomic_inc_32_nv)
    286  1.1  ad ALIAS(atomic_inc_uint_nv,_atomic_inc_32_nv)
    287  1.1  ad ALIAS(atomic_inc_ulong_nv,_atomic_inc_32_nv)
    288  1.1  ad ALIAS(atomic_inc_ptr_nv,_atomic_inc_32_nv)
    289  1.1  ad 
    290  1.1  ad ALIAS(atomic_or_32,_atomic_or_32)
    291  1.1  ad ALIAS(atomic_or_uint,_atomic_or_32)
    292  1.1  ad ALIAS(atomic_or_ulong,_atomic_or_32)
    293  1.1  ad ALIAS(atomic_or_ptr,_atomic_or_32)
    294  1.1  ad 
    295  1.1  ad ALIAS(atomic_or_32_nv,_atomic_or_32_nv)
    296  1.1  ad ALIAS(atomic_or_uint_nv,_atomic_or_32_nv)
    297  1.1  ad ALIAS(atomic_or_ulong_nv,_atomic_or_32_nv)
    298  1.1  ad ALIAS(atomic_or_ptr_nv,_atomic_or_32_nv)
    299  1.1  ad 
    300  1.1  ad ALIAS(atomic_swap_32,_atomic_swap_32)
    301  1.1  ad ALIAS(atomic_swap_uint,_atomic_swap_32)
    302  1.1  ad ALIAS(atomic_swap_ulong,_atomic_swap_32)
    303  1.1  ad ALIAS(atomic_swap_ptr,_atomic_swap_32)
    304  1.1  ad 
    305  1.1  ad ALIAS(atomic_cas_32,_atomic_cas_32)
    306  1.1  ad ALIAS(atomic_cas_uint,_atomic_cas_32)
    307  1.1  ad ALIAS(atomic_cas_ulong,_atomic_cas_32)
    308  1.1  ad ALIAS(atomic_cas_ptr,_atomic_cas_32)
    309  1.1  ad 
    310  1.9  ad ALIAS(atomic_cas_32_ni,_atomic_cas_32_ni)
    311  1.9  ad ALIAS(atomic_cas_uint_ni,_atomic_cas_32_ni)
    312  1.9  ad ALIAS(atomic_cas_ulong_ni,_atomic_cas_32_ni)
    313  1.9  ad ALIAS(atomic_cas_ptr_ni,_atomic_cas_32_ni)
    314  1.9  ad 
    315  1.6  ad ALIAS(atomic_cas_64,_atomic_cas_64)
    316  1.9  ad ALIAS(atomic_cas_64_ni,_atomic_cas_64)
    317  1.6  ad 
    318  1.1  ad ALIAS(membar_consumer,_membar_consumer)
    319  1.1  ad ALIAS(membar_producer,_membar_producer)
    320  1.8  ad ALIAS(membar_enter,_membar_consumer)
    321  1.8  ad ALIAS(membar_exit,_membar_producer)
    322  1.1  ad ALIAS(membar_sync,_membar_sync)
    323  1.5  ad 
    /*
     * Underscore-prefixed names for the int/uint, long/ulong and ptr
     * variants.  These are always strong aliases, in both the kernel and the
     * non-kernel build, and all resolve to the 32-bit implementations above.
     * _membar_enter and _membar_exit resolve to _membar_consumer and
     * _membar_producer respectively.
     */
    324  1.5  ad STRONG_ALIAS(_atomic_add_int,_atomic_add_32)
    325  1.5  ad STRONG_ALIAS(_atomic_add_long,_atomic_add_32)
    326  1.5  ad STRONG_ALIAS(_atomic_add_ptr,_atomic_add_32)
    327  1.5  ad 
    328  1.5  ad STRONG_ALIAS(_atomic_add_int_nv,_atomic_add_32_nv)
    329  1.5  ad STRONG_ALIAS(_atomic_add_long_nv,_atomic_add_32_nv)
    330  1.5  ad STRONG_ALIAS(_atomic_add_ptr_nv,_atomic_add_32_nv)
    331  1.5  ad 
    332  1.5  ad STRONG_ALIAS(_atomic_and_uint,_atomic_and_32)
    333  1.5  ad STRONG_ALIAS(_atomic_and_ulong,_atomic_and_32)
    334  1.5  ad STRONG_ALIAS(_atomic_and_ptr,_atomic_and_32)
    335  1.5  ad 
    336  1.5  ad STRONG_ALIAS(_atomic_and_uint_nv,_atomic_and_32_nv)
    337  1.5  ad STRONG_ALIAS(_atomic_and_ulong_nv,_atomic_and_32_nv)
    338  1.5  ad STRONG_ALIAS(_atomic_and_ptr_nv,_atomic_and_32_nv)
    339  1.5  ad 
    340  1.5  ad STRONG_ALIAS(_atomic_dec_uint,_atomic_dec_32)
    341  1.5  ad STRONG_ALIAS(_atomic_dec_ulong,_atomic_dec_32)
    342  1.5  ad STRONG_ALIAS(_atomic_dec_ptr,_atomic_dec_32)
    343  1.5  ad 
    344  1.5  ad STRONG_ALIAS(_atomic_dec_uint_nv,_atomic_dec_32_nv)
    345  1.5  ad STRONG_ALIAS(_atomic_dec_ulong_nv,_atomic_dec_32_nv)
    346  1.5  ad STRONG_ALIAS(_atomic_dec_ptr_nv,_atomic_dec_32_nv)
    347  1.5  ad 
    348  1.5  ad STRONG_ALIAS(_atomic_inc_uint,_atomic_inc_32)
    349  1.5  ad STRONG_ALIAS(_atomic_inc_ulong,_atomic_inc_32)
    350  1.5  ad STRONG_ALIAS(_atomic_inc_ptr,_atomic_inc_32)
    351  1.5  ad 
    352  1.5  ad STRONG_ALIAS(_atomic_inc_uint_nv,_atomic_inc_32_nv)
    353  1.5  ad STRONG_ALIAS(_atomic_inc_ulong_nv,_atomic_inc_32_nv)
    354  1.5  ad STRONG_ALIAS(_atomic_inc_ptr_nv,_atomic_inc_32_nv)
    355  1.5  ad 
    356  1.5  ad STRONG_ALIAS(_atomic_or_uint,_atomic_or_32)
    357  1.5  ad STRONG_ALIAS(_atomic_or_ulong,_atomic_or_32)
    358  1.5  ad STRONG_ALIAS(_atomic_or_ptr,_atomic_or_32)
    359  1.5  ad 
    360  1.5  ad STRONG_ALIAS(_atomic_or_uint_nv,_atomic_or_32_nv)
    361  1.5  ad STRONG_ALIAS(_atomic_or_ulong_nv,_atomic_or_32_nv)
    362  1.5  ad STRONG_ALIAS(_atomic_or_ptr_nv,_atomic_or_32_nv)
    363  1.5  ad 
    364  1.5  ad STRONG_ALIAS(_atomic_swap_uint,_atomic_swap_32)
    365  1.5  ad STRONG_ALIAS(_atomic_swap_ulong,_atomic_swap_32)
    366  1.5  ad STRONG_ALIAS(_atomic_swap_ptr,_atomic_swap_32)
    367  1.5  ad 
    368  1.5  ad STRONG_ALIAS(_atomic_cas_uint,_atomic_cas_32)
    369  1.5  ad STRONG_ALIAS(_atomic_cas_ulong,_atomic_cas_32)
    370  1.5  ad STRONG_ALIAS(_atomic_cas_ptr,_atomic_cas_32)
    371  1.8  ad 
    372  1.9  ad STRONG_ALIAS(_atomic_cas_uint_ni,_atomic_cas_32_ni)
    373  1.9  ad STRONG_ALIAS(_atomic_cas_ulong_ni,_atomic_cas_32_ni)
    374  1.9  ad STRONG_ALIAS(_atomic_cas_ptr_ni,_atomic_cas_32_ni)
    375  1.9  ad 
    376  1.8  ad STRONG_ALIAS(_membar_enter,_membar_consumer)
    377  1.8  ad STRONG_ALIAS(_membar_exit,_membar_producer)
    378