Home | History | Annotate | Line # | Download | only in atomic
atomic.S revision 1.18
      1  1.18  pooka /*	$NetBSD: atomic.S,v 1.18 2009/11/26 07:40:34 pooka Exp $	*/
      2   1.1     ad 
      3   1.1     ad /*-
      4   1.1     ad  * Copyright (c) 2007 The NetBSD Foundation, Inc.
      5   1.1     ad  * All rights reserved.
      6   1.1     ad  *
      7   1.1     ad  * This code is derived from software contributed to The NetBSD Foundation
      8   1.1     ad  * by Jason R. Thorpe, and by Andrew Doran.
      9   1.1     ad  *
     10   1.1     ad  * Redistribution and use in source and binary forms, with or without
     11   1.1     ad  * modification, are permitted provided that the following conditions
     12   1.1     ad  * are met:
     13   1.1     ad  * 1. Redistributions of source code must retain the above copyright
     14   1.1     ad  *    notice, this list of conditions and the following disclaimer.
     15   1.1     ad  * 2. Redistributions in binary form must reproduce the above copyright
     16   1.1     ad  *    notice, this list of conditions and the following disclaimer in the
     17   1.1     ad  *    documentation and/or other materials provided with the distribution.
     18   1.1     ad  *
     19   1.1     ad  * THIS SOFTWARE IS PROVIDED BY THE NETBSD FOUNDATION, INC. AND CONTRIBUTORS
     20   1.1     ad  * ``AS IS'' AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED
     21   1.1     ad  * TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR
     22   1.1     ad  * PURPOSE ARE DISCLAIMED.  IN NO EVENT SHALL THE FOUNDATION OR CONTRIBUTORS
     23   1.1     ad  * BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
     24   1.1     ad  * CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
     25   1.1     ad  * SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS
     26   1.1     ad  * INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN
     27   1.1     ad  * CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE)
     28   1.1     ad  * ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE
     29   1.1     ad  * POSSIBILITY OF SUCH DAMAGE.
     30   1.1     ad  */
     31   1.1     ad 
     32  1.16  pooka #include <sys/param.h>
     33   1.1     ad #include <machine/asm.h>
     34   1.1     ad 
     35  1.18  pooka #ifdef _KERNEL	/* kernel build: ALIAS() produces strong aliases */
     36  1.18  pooka #define	ALIAS(f, t)	STRONG_ALIAS(f,t)
     37  1.18  pooka #else	/* any other build: ALIAS() produces weak aliases */
     38  1.18  pooka #define	ALIAS(f, t)	WEAK_ALIAS(f,t)
     39  1.18  pooka #endif	/* _KERNEL */
     40  1.18  pooka 
     41  1.15  pooka #ifdef _HARDKERNEL	/* tag each lock prefix with a .Lpatch<n> label (listed in atomic_lockpatch) and emit aligned end labels */
     42   1.1     ad #define	LOCK(n)		.Lpatch/**/n:	lock
     43  1.12   yamt #define	ENDLABEL(a)	_ALIGN_TEXT; LABEL(a)
     44   1.1     ad #else	/* plain lock prefix; ENDLABEL() expands to nothing */
     45   1.1     ad #define	LOCK(n)		lock
     46  1.12   yamt #define	ENDLABEL(a)	/* nothing */
     47   1.1     ad #endif	/* _HARDKERNEL */
     48   1.1     ad 
     49   1.1     ad 	.text
     50   1.1     ad 
     51  1.13    chs ENTRY(_atomic_add_32)	/* lock-prefixed add of the 2nd stack argument into the 32-bit word addressed by the 1st */
     52   1.1     ad 	movl	4(%esp), %edx	/* %edx = target address (slot just above the return address) */
     53   1.1     ad 	movl	8(%esp), %eax	/* %eax = addend */
     54   1.1     ad 	LOCK(1)
     55   1.1     ad 	addl	%eax, (%edx)	/* *target += addend */
     56   1.1     ad 	ret
     57   1.1     ad 
     58  1.13    chs ENTRY(_atomic_add_32_nv)	/* lock-prefixed xadd; leaves the new value (old + addend) in %eax */
     59   1.1     ad 	movl	4(%esp), %edx	/* %edx = target address */
     60   1.1     ad 	movl	8(%esp), %eax	/* %eax = addend */
     61   1.1     ad 	movl	%eax, %ecx	/* keep a copy: xadd overwrites %eax with the old value */
     62   1.1     ad 	LOCK(2)
     63   1.1     ad 	xaddl	%eax, (%edx)	/* %eax = old *target; *target = old + addend */
     64   1.1     ad 	addl	%ecx, %eax	/* old + addend = the value just stored */
     65   1.1     ad 	ret
     66   1.1     ad 
     67  1.13    chs ENTRY(_atomic_and_32)	/* lock-prefixed AND of the 2nd stack argument into the 32-bit word addressed by the 1st */
     68   1.1     ad 	movl	4(%esp), %edx	/* %edx = target address */
     69   1.1     ad 	movl	8(%esp), %eax	/* %eax = mask */
     70   1.1     ad 	LOCK(3)
     71   1.1     ad 	andl	%eax, (%edx)	/* *target &= mask */
     72   1.1     ad 	ret
     73   1.1     ad 
     74  1.13    chs ENTRY(_atomic_and_32_nv)	/* AND the 2nd stack argument into *target with a cmpxchg retry loop; leaves the new value in %eax */
     75   1.1     ad 	movl	4(%esp), %edx	/* %edx = target address */
     76   1.1     ad 	movl	(%edx), %eax	/* %eax = first guess at the current value */
     77  1.14     ad 0:	/* retry point: %eax holds the value expected in *target */
     78   1.1     ad 	movl	%eax, %ecx
     79   1.1     ad 	andl	8(%esp), %ecx	/* %ecx = expected & mask = value to store */
     80   1.1     ad 	LOCK(4)
     81   1.1     ad 	cmpxchgl %ecx, (%edx)	/* if *target == %eax store %ecx, else %eax = current *target */
     82  1.14     ad 	jnz	1f	/* ZF clear: the compare failed, go around again */
     83   1.1     ad 	movl	%ecx, %eax	/* success: return the value that was stored */
     84   1.1     ad 	ret
     85  1.14     ad 1:
     86  1.14     ad 	jmp	0b	/* %eax was refreshed by cmpxchg; recompute and retry */
     87   1.1     ad 
     88  1.13    chs ENTRY(_atomic_dec_32)	/* lock-prefixed decrement of the 32-bit word addressed by the 1st stack argument */
     89   1.1     ad 	movl	4(%esp), %edx	/* %edx = target address */
     90   1.1     ad 	LOCK(5)
     91   1.1     ad 	decl	(%edx)	/* *target -= 1 */
     92   1.1     ad 	ret
     93   1.1     ad 
     94  1.13    chs ENTRY(_atomic_dec_32_nv)	/* lock-prefixed xadd of -1; leaves the new value (old - 1) in %eax */
     95   1.1     ad 	movl	4(%esp), %edx	/* %edx = target address */
     96   1.1     ad 	movl	$-1, %eax	/* addend of -1 turns xadd into a decrement */
     97   1.1     ad 	LOCK(6)
     98   1.1     ad 	xaddl	%eax, (%edx)	/* %eax = old *target; *target = old - 1 */
     99   1.1     ad 	decl	%eax	/* old - 1 = the value just stored */
    100   1.1     ad 	ret
    101   1.1     ad 
    102  1.13    chs ENTRY(_atomic_inc_32)	/* lock-prefixed increment of the 32-bit word addressed by the 1st stack argument */
    103   1.1     ad 	movl	4(%esp), %edx	/* %edx = target address */
    104   1.1     ad 	LOCK(7)
    105   1.1     ad 	incl	(%edx)	/* *target += 1 */
    106   1.1     ad 	ret
    107   1.1     ad 
    108  1.13    chs ENTRY(_atomic_inc_32_nv)	/* lock-prefixed xadd of 1; leaves the new value (old + 1) in %eax */
    109   1.1     ad 	movl	4(%esp), %edx	/* %edx = target address */
    110   1.1     ad 	movl	$1, %eax	/* addend of 1 turns xadd into an increment */
    111   1.1     ad 	LOCK(8)
    112   1.1     ad 	xaddl	%eax, (%edx)	/* %eax = old *target; *target = old + 1 */
    113   1.1     ad 	incl	%eax	/* old + 1 = the value just stored */
    114   1.1     ad 	ret
    115   1.1     ad 
    116  1.13    chs ENTRY(_atomic_or_32)	/* lock-prefixed OR of the 2nd stack argument into the 32-bit word addressed by the 1st */
    117   1.1     ad 	movl	4(%esp), %edx	/* %edx = target address */
    118   1.1     ad 	movl	8(%esp), %eax	/* %eax = bits to set */
    119   1.1     ad 	LOCK(9)
    120   1.1     ad 	orl	%eax, (%edx)	/* *target |= bits */
    121   1.1     ad 	ret
    122   1.1     ad 
    123  1.13    chs ENTRY(_atomic_or_32_nv)	/* OR the 2nd stack argument into *target with a cmpxchg retry loop; leaves the new value in %eax */
    124   1.1     ad 	movl	4(%esp), %edx	/* %edx = target address */
    125   1.1     ad 	movl	(%edx), %eax	/* %eax = first guess at the current value */
    126  1.14     ad 0:	/* retry point: %eax holds the value expected in *target */
    127   1.1     ad 	movl	%eax, %ecx
    128   1.1     ad 	orl	8(%esp), %ecx	/* %ecx = expected | bits = value to store */
    129   1.1     ad 	LOCK(10)
    130   1.1     ad 	cmpxchgl %ecx, (%edx)	/* if *target == %eax store %ecx, else %eax = current *target */
    131  1.14     ad 	jnz	1f	/* ZF clear: the compare failed, go around again */
    132   1.1     ad 	movl	%ecx, %eax	/* success: return the value that was stored */
    133   1.1     ad 	ret
    134  1.14     ad 1:
    135  1.14     ad 	jmp	0b	/* %eax was refreshed by cmpxchg; recompute and retry */
    136   1.1     ad 
    137  1.13    chs ENTRY(_atomic_swap_32)	/* exchange the 2nd stack argument with the 32-bit word addressed by the 1st; old value is left in %eax */
    138   1.1     ad 	movl	4(%esp), %edx	/* %edx = target address */
    139   1.1     ad 	movl	8(%esp), %eax	/* %eax = value to store */
    140   1.1     ad 	xchgl	%eax, (%edx)	/* no LOCK() needed: xchg with a memory operand is locked implicitly by the CPU */
    141   1.1     ad 	ret
    142   1.1     ad 
    143  1.13    chs ENTRY(_atomic_cas_32)	/* lock-prefixed 32-bit compare-and-swap; stack arguments are target address, expected value, new value */
    144   1.1     ad 	movl	4(%esp), %edx	/* %edx = target address */
    145   1.1     ad 	movl	8(%esp), %eax	/* %eax = expected value (cmpxchg compares against %eax) */
    146   1.1     ad 	movl	12(%esp), %ecx	/* %ecx = new value */
    147   1.1     ad 	LOCK(12)
    148   1.1     ad 	cmpxchgl %ecx, (%edx)	/* if *target == %eax store %ecx, else load *target into %eax */
    149   1.1     ad 	/* %eax now contains the old value */
    150   1.1     ad 	ret
    151   1.1     ad 
    152  1.13    chs ENTRY(_atomic_cas_32_ni)	/* 32-bit compare-and-swap issued without a lock prefix; same arguments and result as _atomic_cas_32 */
    153   1.9     ad 	movl	4(%esp), %edx	/* %edx = target address */
    154   1.9     ad 	movl	8(%esp), %eax	/* %eax = expected value */
    155   1.9     ad 	movl	12(%esp), %ecx	/* %ecx = new value */
    156   1.9     ad 	cmpxchgl %ecx, (%edx)	/* deliberately no LOCK() in front of this cmpxchg */
    157   1.9     ad 	/* %eax now contains the old value */
    158   1.9     ad 	ret
    159   1.9     ad 
    160  1.13    chs ENTRY(_membar_consumer)	/* memory barrier implemented as a lock-prefixed no-op add on the stack */
    161   1.1     ad 	LOCK(13)
    162   1.1     ad 	addl	$0, -4(%esp)	/* adds 0 to the word just below %esp: value unchanged, only the locked access matters */
    163   1.1     ad 	ret
    164  1.11   yamt ENDLABEL(membar_consumer_end)	/* end marker; expands to nothing unless _HARDKERNEL is defined */
    165   1.1     ad 
    166  1.13    chs ENTRY(_membar_producer)	/* store barrier implemented as a plain (unlocked) dummy store */
    167   1.1     ad 	/* A store is enough */
    168   1.1     ad 	movl	$0, -4(%esp)	/* writes 0 to the word just below %esp */
    169   1.1     ad 	ret
    170  1.11   yamt ENDLABEL(membar_producer_end)	/* end marker; expands to nothing unless _HARDKERNEL is defined */
    171   1.1     ad 
    172  1.13    chs ENTRY(_membar_sync)	/* memory barrier; same instruction sequence as _membar_consumer */
    173   1.1     ad 	LOCK(14)
    174   1.1     ad 	addl	$0, -4(%esp)	/* lock-prefixed add of 0 to the word just below %esp */
    175   1.1     ad 	ret
    176  1.11   yamt ENDLABEL(membar_sync_end)	/* end marker; expands to nothing unless _HARDKERNEL is defined */
    177   1.1     ad 
    178  1.15  pooka #ifdef _HARDKERNEL
    179  1.13    chs ENTRY(_atomic_cas_64)
    180  1.14     ad 	pushf
    181   1.6     ad 	cli
    182   1.6     ad 	pushl	%edi
    183   1.6     ad 	pushl	%ebx
    184   1.6     ad 	movl	12(%esp), %edi
    185   1.6     ad 	movl	16(%esp), %eax
    186   1.6     ad 	movl	20(%esp), %edx
    187   1.6     ad 	movl	24(%esp), %ebx
    188   1.6     ad 	movl	28(%esp), %ecx
    189   1.6     ad 	cmpl	0(%edi), %eax
    190   1.6     ad 	jne	2f
    191   1.6     ad 	cmpl	4(%edi), %edx
    192   1.6     ad 	jne	2f
    193   1.6     ad 	movl	%ebx, 0(%edi)
    194   1.6     ad 	movl	%ecx, 4(%edi)
    195   1.6     ad 1:
    196   1.6     ad 	popl	%ebx
    197   1.6     ad 	popl	%edi
    198  1.14     ad 	popf
    199   1.6     ad 	ret
    200   1.6     ad 2:
    201   1.6     ad 	movl	0(%edi), %eax
    202   1.6     ad 	movl	4(%edi), %edx
    203   1.6     ad 	jmp	1b
    204  1.11   yamt ENDLABEL(_atomic_cas_64_end)
    205   1.6     ad 
    206  1.13    chs ENTRY(_atomic_cas_cx8)	/* 64-bit compare-and-swap using lock cmpxchg8b; prior value is left in %edx:%eax */
    207   1.6     ad 	pushl	%edi
    208   1.6     ad 	pushl	%ebx
    209   1.6     ad 	movl	12(%esp), %edi	/* two pushes + return address: 1st argument (target address) is at 12(%esp) */
    210   1.6     ad 	movl	16(%esp), %eax	/* %edx:%eax = expected value */
    211   1.6     ad 	movl	20(%esp), %edx
    212   1.6     ad 	movl	24(%esp), %ebx	/* %ecx:%ebx = new value */
    213   1.6     ad 	movl	28(%esp), %ecx
    214   1.6     ad 	LOCK(15)
    215   1.6     ad 	cmpxchg8b (%edi)	/* if *target == %edx:%eax store %ecx:%ebx, else load *target into %edx:%eax */
    216   1.6     ad 	popl	%ebx
    217   1.6     ad 	popl	%edi
    218   1.6     ad 	ret
    219  1.17  enami #ifdef GPROF	/* NOTE(review): padding presumably sized so this routine matches _atomic_cas_64 in length -- confirm */
    220  1.17  enami 	.space	16, 0x90	/* 16 bytes of 0x90 (nop) */
    221  1.17  enami #else
    222   1.7     ad 	.space	32, 0x90	/* 32 bytes of 0x90 (nop) */
    223  1.17  enami #endif	/* GPROF */
    224  1.11   yamt ENDLABEL(_atomic_cas_cx8_end)	/* aligned end marker for this routine */
    225   1.6     ad 
    226  1.13    chs ENTRY(sse2_lfence)	/* barrier routine consisting of a single lfence instruction */
    227   1.1     ad 	lfence
    228   1.1     ad 	ret
    229  1.11   yamt ENDLABEL(sse2_lfence_end)	/* aligned end marker for this routine */
    230   1.1     ad 
    231  1.13    chs ENTRY(sse2_mfence)	/* barrier routine consisting of a single mfence instruction */
    232   1.1     ad 	mfence
    233   1.1     ad 	ret
    234  1.11   yamt ENDLABEL(sse2_mfence_end)	/* aligned end marker for this routine */
    235   1.1     ad 
    236   1.1     ad atomic_lockpatch:	/* exported, zero-terminated table of the addresses of the LOCK(n) prefixes in this file */
    237   1.1     ad 	.globl	atomic_lockpatch
    238   1.1     ad 	.long	.Lpatch1, .Lpatch2, .Lpatch3, .Lpatch4, .Lpatch5
    239   1.1     ad 	.long	.Lpatch6, .Lpatch7, .Lpatch8, .Lpatch9, .Lpatch10
    240   1.6     ad 	.long	.Lpatch12, .Lpatch13, .Lpatch14, .Lpatch15, 0	/* no .Lpatch11: this file has no LOCK(11); trailing 0 ends the list */
    241   1.7     ad #else
    242  1.13    chs ENTRY(_atomic_cas_64)	/* non-_HARDKERNEL 64-bit compare-and-swap: always lock cmpxchg8b; prior value is left in %edx:%eax */
    243   1.7     ad 	pushl	%edi
    244   1.7     ad 	pushl	%ebx
    245   1.7     ad 	movl	12(%esp), %edi	/* two pushes + return address: 1st argument (target address) is at 12(%esp) */
    246   1.7     ad 	movl	16(%esp), %eax	/* %edx:%eax = expected value */
    247   1.7     ad 	movl	20(%esp), %edx
    248   1.7     ad 	movl	24(%esp), %ebx	/* %ecx:%ebx = new value */
    249   1.7     ad 	movl	28(%esp), %ecx
    250   1.7     ad 	lock
    251   1.7     ad 	cmpxchg8b (%edi)	/* if *target == %edx:%eax store %ecx:%ebx, else load *target into %edx:%eax */
    252   1.7     ad 	popl	%ebx
    253   1.7     ad 	popl	%edi
    254   1.7     ad 	ret
    255  1.15  pooka #endif	/* _HARDKERNEL */
    256   1.1     ad 
    257   1.1     ad ALIAS(atomic_add_32,_atomic_add_32)	/* public names: strong aliases under _KERNEL, weak otherwise (see the ALIAS definition) */
    258   1.4     ad ALIAS(atomic_add_int,_atomic_add_32)	/* the int, long and ptr variants all resolve to the 32-bit routine */
    259   1.4     ad ALIAS(atomic_add_long,_atomic_add_32)
    260   1.1     ad ALIAS(atomic_add_ptr,_atomic_add_32)
    261   1.1     ad 
    262   1.1     ad ALIAS(atomic_add_32_nv,_atomic_add_32_nv)
    263   1.4     ad ALIAS(atomic_add_int_nv,_atomic_add_32_nv)
    264   1.4     ad ALIAS(atomic_add_long_nv,_atomic_add_32_nv)
    265   1.1     ad ALIAS(atomic_add_ptr_nv,_atomic_add_32_nv)
    266   1.1     ad 
    267   1.1     ad ALIAS(atomic_and_32,_atomic_and_32)
    268   1.1     ad ALIAS(atomic_and_uint,_atomic_and_32)
    269   1.1     ad ALIAS(atomic_and_ulong,_atomic_and_32)
    270   1.1     ad ALIAS(atomic_and_ptr,_atomic_and_32)
    271   1.1     ad 
    272   1.1     ad ALIAS(atomic_and_32_nv,_atomic_and_32_nv)
    273   1.1     ad ALIAS(atomic_and_uint_nv,_atomic_and_32_nv)
    274   1.1     ad ALIAS(atomic_and_ulong_nv,_atomic_and_32_nv)
    275   1.1     ad ALIAS(atomic_and_ptr_nv,_atomic_and_32_nv)
    276   1.1     ad 
    277   1.1     ad ALIAS(atomic_dec_32,_atomic_dec_32)
    278   1.1     ad ALIAS(atomic_dec_uint,_atomic_dec_32)
    279   1.1     ad ALIAS(atomic_dec_ulong,_atomic_dec_32)
    280   1.1     ad ALIAS(atomic_dec_ptr,_atomic_dec_32)
    281   1.1     ad 
    282   1.1     ad ALIAS(atomic_dec_32_nv,_atomic_dec_32_nv)
    283   1.1     ad ALIAS(atomic_dec_uint_nv,_atomic_dec_32_nv)
    284   1.1     ad ALIAS(atomic_dec_ulong_nv,_atomic_dec_32_nv)
    285   1.1     ad ALIAS(atomic_dec_ptr_nv,_atomic_dec_32_nv)
    286   1.1     ad 
    287   1.1     ad ALIAS(atomic_inc_32,_atomic_inc_32)
    288   1.1     ad ALIAS(atomic_inc_uint,_atomic_inc_32)
    289   1.1     ad ALIAS(atomic_inc_ulong,_atomic_inc_32)
    290   1.1     ad ALIAS(atomic_inc_ptr,_atomic_inc_32)
    291   1.1     ad 
    292   1.1     ad ALIAS(atomic_inc_32_nv,_atomic_inc_32_nv)
    293   1.1     ad ALIAS(atomic_inc_uint_nv,_atomic_inc_32_nv)
    294   1.1     ad ALIAS(atomic_inc_ulong_nv,_atomic_inc_32_nv)
    295   1.1     ad ALIAS(atomic_inc_ptr_nv,_atomic_inc_32_nv)
    296   1.1     ad 
    297   1.1     ad ALIAS(atomic_or_32,_atomic_or_32)
    298   1.1     ad ALIAS(atomic_or_uint,_atomic_or_32)
    299   1.1     ad ALIAS(atomic_or_ulong,_atomic_or_32)
    300   1.1     ad ALIAS(atomic_or_ptr,_atomic_or_32)
    301   1.1     ad 
    302   1.1     ad ALIAS(atomic_or_32_nv,_atomic_or_32_nv)
    303   1.1     ad ALIAS(atomic_or_uint_nv,_atomic_or_32_nv)
    304   1.1     ad ALIAS(atomic_or_ulong_nv,_atomic_or_32_nv)
    305   1.1     ad ALIAS(atomic_or_ptr_nv,_atomic_or_32_nv)
    306   1.1     ad 
    307   1.1     ad ALIAS(atomic_swap_32,_atomic_swap_32)
    308   1.1     ad ALIAS(atomic_swap_uint,_atomic_swap_32)
    309   1.1     ad ALIAS(atomic_swap_ulong,_atomic_swap_32)
    310   1.1     ad ALIAS(atomic_swap_ptr,_atomic_swap_32)
    311   1.1     ad 
    312   1.1     ad ALIAS(atomic_cas_32,_atomic_cas_32)
    313   1.1     ad ALIAS(atomic_cas_uint,_atomic_cas_32)
    314   1.1     ad ALIAS(atomic_cas_ulong,_atomic_cas_32)
    315   1.1     ad ALIAS(atomic_cas_ptr,_atomic_cas_32)
    316   1.1     ad 
    317   1.9     ad ALIAS(atomic_cas_32_ni,_atomic_cas_32_ni)
    318   1.9     ad ALIAS(atomic_cas_uint_ni,_atomic_cas_32_ni)
    319   1.9     ad ALIAS(atomic_cas_ulong_ni,_atomic_cas_32_ni)
    320   1.9     ad ALIAS(atomic_cas_ptr_ni,_atomic_cas_32_ni)
    321   1.9     ad 
    322   1.6     ad ALIAS(atomic_cas_64,_atomic_cas_64)
    323   1.9     ad ALIAS(atomic_cas_64_ni,_atomic_cas_64)	/* the 64-bit _ni name maps to the regular _atomic_cas_64; there is no separate 64-bit _ni routine here */
    324   1.6     ad 
    325   1.1     ad ALIAS(membar_consumer,_membar_consumer)
    326   1.1     ad ALIAS(membar_producer,_membar_producer)
    327   1.8     ad ALIAS(membar_enter,_membar_consumer)	/* membar_enter shares the _membar_consumer code */
    328   1.8     ad ALIAS(membar_exit,_membar_producer)	/* membar_exit shares the _membar_producer code */
    329   1.1     ad ALIAS(membar_sync,_membar_sync)
    330   1.5     ad 
    331   1.5     ad STRONG_ALIAS(_atomic_add_int,_atomic_add_32)	/* underscore-prefixed type-specific names: always strong aliases, in every build */
    332   1.5     ad STRONG_ALIAS(_atomic_add_long,_atomic_add_32)
    333   1.5     ad STRONG_ALIAS(_atomic_add_ptr,_atomic_add_32)
    334   1.5     ad 
    335   1.5     ad STRONG_ALIAS(_atomic_add_int_nv,_atomic_add_32_nv)
    336   1.5     ad STRONG_ALIAS(_atomic_add_long_nv,_atomic_add_32_nv)
    337   1.5     ad STRONG_ALIAS(_atomic_add_ptr_nv,_atomic_add_32_nv)
    338   1.5     ad 
    339   1.5     ad STRONG_ALIAS(_atomic_and_uint,_atomic_and_32)
    340   1.5     ad STRONG_ALIAS(_atomic_and_ulong,_atomic_and_32)
    341   1.5     ad STRONG_ALIAS(_atomic_and_ptr,_atomic_and_32)
    342   1.5     ad 
    343   1.5     ad STRONG_ALIAS(_atomic_and_uint_nv,_atomic_and_32_nv)
    344   1.5     ad STRONG_ALIAS(_atomic_and_ulong_nv,_atomic_and_32_nv)
    345   1.5     ad STRONG_ALIAS(_atomic_and_ptr_nv,_atomic_and_32_nv)
    346   1.5     ad 
    347   1.5     ad STRONG_ALIAS(_atomic_dec_uint,_atomic_dec_32)
    348   1.5     ad STRONG_ALIAS(_atomic_dec_ulong,_atomic_dec_32)
    349   1.5     ad STRONG_ALIAS(_atomic_dec_ptr,_atomic_dec_32)
    350   1.5     ad 
    351   1.5     ad STRONG_ALIAS(_atomic_dec_uint_nv,_atomic_dec_32_nv)
    352   1.5     ad STRONG_ALIAS(_atomic_dec_ulong_nv,_atomic_dec_32_nv)
    353   1.5     ad STRONG_ALIAS(_atomic_dec_ptr_nv,_atomic_dec_32_nv)
    354   1.5     ad 
    355   1.5     ad STRONG_ALIAS(_atomic_inc_uint,_atomic_inc_32)
    356   1.5     ad STRONG_ALIAS(_atomic_inc_ulong,_atomic_inc_32)
    357   1.5     ad STRONG_ALIAS(_atomic_inc_ptr,_atomic_inc_32)
    358   1.5     ad 
    359   1.5     ad STRONG_ALIAS(_atomic_inc_uint_nv,_atomic_inc_32_nv)
    360   1.5     ad STRONG_ALIAS(_atomic_inc_ulong_nv,_atomic_inc_32_nv)
    361   1.5     ad STRONG_ALIAS(_atomic_inc_ptr_nv,_atomic_inc_32_nv)
    362   1.5     ad 
    363   1.5     ad STRONG_ALIAS(_atomic_or_uint,_atomic_or_32)
    364   1.5     ad STRONG_ALIAS(_atomic_or_ulong,_atomic_or_32)
    365   1.5     ad STRONG_ALIAS(_atomic_or_ptr,_atomic_or_32)
    366   1.5     ad 
    367   1.5     ad STRONG_ALIAS(_atomic_or_uint_nv,_atomic_or_32_nv)
    368   1.5     ad STRONG_ALIAS(_atomic_or_ulong_nv,_atomic_or_32_nv)
    369   1.5     ad STRONG_ALIAS(_atomic_or_ptr_nv,_atomic_or_32_nv)
    370   1.5     ad 
    371   1.5     ad STRONG_ALIAS(_atomic_swap_uint,_atomic_swap_32)
    372   1.5     ad STRONG_ALIAS(_atomic_swap_ulong,_atomic_swap_32)
    373   1.5     ad STRONG_ALIAS(_atomic_swap_ptr,_atomic_swap_32)
    374   1.5     ad 
    375   1.5     ad STRONG_ALIAS(_atomic_cas_uint,_atomic_cas_32)
    376   1.5     ad STRONG_ALIAS(_atomic_cas_ulong,_atomic_cas_32)
    377   1.5     ad STRONG_ALIAS(_atomic_cas_ptr,_atomic_cas_32)
    378   1.8     ad 
    379   1.9     ad STRONG_ALIAS(_atomic_cas_uint_ni,_atomic_cas_32_ni)
    380   1.9     ad STRONG_ALIAS(_atomic_cas_ulong_ni,_atomic_cas_32_ni)
    381   1.9     ad STRONG_ALIAS(_atomic_cas_ptr_ni,_atomic_cas_32_ni)
    382   1.9     ad 
    383   1.8     ad STRONG_ALIAS(_membar_enter,_membar_consumer)	/* same pairing as the public membar_enter alias */
    384   1.8     ad STRONG_ALIAS(_membar_exit,_membar_producer)	/* same pairing as the public membar_exit alias */
    385