Home | History | Annotate | Line # | Download | only in atomic
atomic.S revision 1.16.2.1
      1  1.16.2.1    jym /*	$NetBSD: atomic.S,v 1.16.2.1 2009/05/13 17:23:11 jym Exp $	*/
      2       1.1     ad 
      3       1.1     ad /*-
      4       1.1     ad  * Copyright (c) 2007 The NetBSD Foundation, Inc.
      5       1.1     ad  * All rights reserved.
      6       1.1     ad  *
      7       1.1     ad  * This code is derived from software contributed to The NetBSD Foundation
      8       1.1     ad  * by Jason R. Thorpe, and by Andrew Doran.
      9       1.1     ad  *
     10       1.1     ad  * Redistribution and use in source and binary forms, with or without
     11       1.1     ad  * modification, are permitted provided that the following conditions
     12       1.1     ad  * are met:
     13       1.1     ad  * 1. Redistributions of source code must retain the above copyright
     14       1.1     ad  *    notice, this list of conditions and the following disclaimer.
     15       1.1     ad  * 2. Redistributions in binary form must reproduce the above copyright
     16       1.1     ad  *    notice, this list of conditions and the following disclaimer in the
     17       1.1     ad  *    documentation and/or other materials provided with the distribution.
     18       1.1     ad  *
     19       1.1     ad  * THIS SOFTWARE IS PROVIDED BY THE NETBSD FOUNDATION, INC. AND CONTRIBUTORS
     20       1.1     ad  * ``AS IS'' AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED
     21       1.1     ad  * TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR
     22       1.1     ad  * PURPOSE ARE DISCLAIMED.  IN NO EVENT SHALL THE FOUNDATION OR CONTRIBUTORS
     23       1.1     ad  * BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
     24       1.1     ad  * CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
     25       1.1     ad  * SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS
     26       1.1     ad  * INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN
     27       1.1     ad  * CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE)
     28       1.1     ad  * ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE
     29       1.1     ad  * POSSIBILITY OF SUCH DAMAGE.
     30       1.1     ad  */
     31       1.1     ad 
     32      1.16  pooka #include <sys/param.h>
     33       1.1     ad #include <machine/asm.h>
     34       1.1     ad 
      35      1.15  pooka #ifdef _HARDKERNEL
                          /*
                           * Kernel build:
                           *   LOCK(n)     - defines the local label .Lpatch<n> directly in front
                           *                 of the lock prefix; the labels are collected in the
                           *                 atomic_lockpatch table further down in this file.
                           *   ALIAS(f,t)  - exports f as a strong alias of t.
                           *   ENDLABEL(a) - aligns the text section and defines label a, marking
                           *                 the end of the preceding routine.
                           */
      36       1.1     ad #define	LOCK(n)		.Lpatch/**/n:	lock
      37       1.1     ad #define	ALIAS(f, t)	STRONG_ALIAS(f,t)
      38      1.12   yamt #define	ENDLABEL(a)	_ALIGN_TEXT; LABEL(a)
      39       1.1     ad #else
                          /*
                           * Any other build: LOCK(n) is a bare lock prefix without a label,
                           * public names are weak aliases, and ENDLABEL expands to nothing.
                           */
      40       1.1     ad #define	LOCK(n)		lock
      41       1.1     ad #define	ALIAS(f, t)	WEAK_ALIAS(f,t)
      42      1.12   yamt #define	ENDLABEL(a)	/* nothing */
      43       1.1     ad #endif
     44       1.1     ad 
     45       1.1     ad 	.text
     46       1.1     ad 
      47      1.13    chs ENTRY(_atomic_add_32)
                          /*
                           * Add the 32-bit value found at 8(%esp) to the word whose address
                           * is at 4(%esp), using a single lock-prefixed addl.
                           */
      48       1.1     ad 	movl	4(%esp), %edx
      49       1.1     ad 	movl	8(%esp), %eax
      50       1.1     ad 	LOCK(1)
      51       1.1     ad 	addl	%eax, (%edx)
      52       1.1     ad 	ret
     53       1.1     ad 
      54      1.13    chs ENTRY(_atomic_add_32_nv)
                          /*
                           * Add the value at 8(%esp) to the word whose address is at 4(%esp)
                           * and leave the resulting (new) value in %eax.
                           */
      55       1.1     ad 	movl	4(%esp), %edx
      56       1.1     ad 	movl	8(%esp), %eax
      57       1.1     ad 	movl	%eax, %ecx		/* keep a copy of the addend */
      58       1.1     ad 	LOCK(2)
      59       1.1     ad 	xaddl	%eax, (%edx)		/* %eax = previous contents */
      60       1.1     ad 	addl	%ecx, %eax		/* previous + addend = value stored */
      61       1.1     ad 	ret
     62       1.1     ad 
      63      1.13    chs ENTRY(_atomic_and_32)
                          /*
                           * AND the mask found at 8(%esp) into the word whose address is at
                           * 4(%esp), using a single lock-prefixed andl.
                           */
      64       1.1     ad 	movl	4(%esp), %edx
      65       1.1     ad 	movl	8(%esp), %eax
      66       1.1     ad 	LOCK(3)
      67       1.1     ad 	andl	%eax, (%edx)
      68       1.1     ad 	ret
     69       1.1     ad 
      70      1.13    chs ENTRY(_atomic_and_32_nv)
                          /*
                           * AND the mask at 8(%esp) into the word whose address is at 4(%esp)
                           * and leave the new value in %eax.  Implemented as a compare-and-swap
                           * retry loop:
                           *   %eax = value last observed in memory
                           *   %ecx = %eax & mask, the value we try to store
                           */
      71       1.1     ad 	movl	4(%esp), %edx
      72       1.1     ad 	movl	(%edx), %eax
      73      1.14     ad 0:
      74       1.1     ad 	movl	%eax, %ecx
      75       1.1     ad 	andl	8(%esp), %ecx
      76       1.1     ad 	LOCK(4)
      77       1.1     ad 	cmpxchgl %ecx, (%edx)		/* on mismatch %eax is reloaded from memory */
      78      1.14     ad 	jnz	1f			/* memory changed under us: retry */
      79       1.1     ad 	movl	%ecx, %eax		/* success: result is the value stored */
      80       1.1     ad 	ret
      81      1.14     ad 1:
      82      1.14     ad 	jmp	0b
     83       1.1     ad 
      84      1.13    chs ENTRY(_atomic_dec_32)
                          /*
                           * Decrement the 32-bit word whose address is at 4(%esp) with a
                           * lock-prefixed decl.
                           */
      85       1.1     ad 	movl	4(%esp), %edx
      86       1.1     ad 	LOCK(5)
      87       1.1     ad 	decl	(%edx)
      88       1.1     ad 	ret
     89       1.1     ad 
      90      1.13    chs ENTRY(_atomic_dec_32_nv)
                          /*
                           * Decrement the 32-bit word whose address is at 4(%esp) and leave
                           * the new value in %eax.
                           */
      91       1.1     ad 	movl	4(%esp), %edx
      92       1.1     ad 	movl	$-1, %eax
      93       1.1     ad 	LOCK(6)
      94       1.1     ad 	xaddl	%eax, (%edx)		/* %eax = previous contents */
      95       1.1     ad 	decl	%eax			/* previous - 1 = value stored */
      96       1.1     ad 	ret
     97       1.1     ad 
      98      1.13    chs ENTRY(_atomic_inc_32)
                          /*
                           * Increment the 32-bit word whose address is at 4(%esp) with a
                           * lock-prefixed incl.
                           */
      99       1.1     ad 	movl	4(%esp), %edx
     100       1.1     ad 	LOCK(7)
     101       1.1     ad 	incl	(%edx)
     102       1.1     ad 	ret
    103       1.1     ad 
     104      1.13    chs ENTRY(_atomic_inc_32_nv)
                          /*
                           * Increment the 32-bit word whose address is at 4(%esp) and leave
                           * the new value in %eax.
                           */
     105       1.1     ad 	movl	4(%esp), %edx
     106       1.1     ad 	movl	$1, %eax
     107       1.1     ad 	LOCK(8)
     108       1.1     ad 	xaddl	%eax, (%edx)		/* %eax = previous contents */
     109       1.1     ad 	incl	%eax			/* previous + 1 = value stored */
     110       1.1     ad 	ret
    111       1.1     ad 
     112      1.13    chs ENTRY(_atomic_or_32)
                          /*
                           * OR the bits found at 8(%esp) into the word whose address is at
                           * 4(%esp), using a single lock-prefixed orl.
                           */
     113       1.1     ad 	movl	4(%esp), %edx
     114       1.1     ad 	movl	8(%esp), %eax
     115       1.1     ad 	LOCK(9)
     116       1.1     ad 	orl	%eax, (%edx)
     117       1.1     ad 	ret
    118       1.1     ad 
     119      1.13    chs ENTRY(_atomic_or_32_nv)
                          /*
                           * OR the bits at 8(%esp) into the word whose address is at 4(%esp)
                           * and leave the new value in %eax.  Implemented as a compare-and-swap
                           * retry loop:
                           *   %eax = value last observed in memory
                           *   %ecx = %eax | bits, the value we try to store
                           */
     120       1.1     ad 	movl	4(%esp), %edx
     121       1.1     ad 	movl	(%edx), %eax
     122      1.14     ad 0:
     123       1.1     ad 	movl	%eax, %ecx
     124       1.1     ad 	orl	8(%esp), %ecx
     125       1.1     ad 	LOCK(10)
     126       1.1     ad 	cmpxchgl %ecx, (%edx)		/* on mismatch %eax is reloaded from memory */
     127      1.14     ad 	jnz	1f			/* memory changed under us: retry */
     128       1.1     ad 	movl	%ecx, %eax		/* success: result is the value stored */
     129       1.1     ad 	ret
     130      1.14     ad 1:
     131      1.14     ad 	jmp	0b
    132       1.1     ad 
     133      1.13    chs ENTRY(_atomic_swap_32)
                          /*
                           * Exchange the value at 8(%esp) with the word whose address is at
                           * 4(%esp); the previous contents end up in %eax.
                           *
                           * No LOCK() is used here: xchg with a memory operand is locked by
                           * the processor implicitly.  Consequently there is no .Lpatch11
                           * entry in atomic_lockpatch.
                           */
     134       1.1     ad 	movl	4(%esp), %edx
     135       1.1     ad 	movl	8(%esp), %eax
     136       1.1     ad 	xchgl	%eax, (%edx)
     137       1.1     ad 	ret
    138       1.1     ad 
     139      1.13    chs ENTRY(_atomic_cas_32)
                          /*
                           * 32-bit compare-and-swap.
                           *   4(%esp)  = address of the target word
                           *   8(%esp)  = expected value  (loaded into %eax)
                           *   12(%esp) = replacement value (loaded into %ecx)
                           * The lock-prefixed cmpxchgl stores %ecx only if the target equals
                           * %eax; otherwise it loads the target's current contents into %eax.
                           */
     140       1.1     ad 	movl	4(%esp), %edx
     141       1.1     ad 	movl	8(%esp), %eax
     142       1.1     ad 	movl	12(%esp), %ecx
     143       1.1     ad 	LOCK(12)
     144       1.1     ad 	cmpxchgl %ecx, (%edx)
     145       1.1     ad 	/* %eax now contains the old value */
     146       1.1     ad 	ret
    147       1.1     ad 
     148      1.13    chs ENTRY(_atomic_cas_32_ni)
                          /*
                           * Same argument layout and instruction sequence as _atomic_cas_32,
                           * but the cmpxchgl carries no lock prefix.
                           * NOTE(review): "_ni" presumably stands for "non-interlocked",
                           * i.e. atomic only with respect to the executing CPU - confirm
                           * against the callers.
                           */
     149       1.9     ad 	movl	4(%esp), %edx
     150       1.9     ad 	movl	8(%esp), %eax
     151       1.9     ad 	movl	12(%esp), %ecx
     152       1.9     ad 	cmpxchgl %ecx, (%edx)
     153       1.9     ad 	/* %eax now contains the old value */
     154       1.9     ad 	ret
    155       1.9     ad 
     156      1.13    chs ENTRY(_membar_consumer)
                          /*
                           * Barrier built from a lock-prefixed read-modify-write: adding zero
                           * to the word just below the stack pointer leaves memory unchanged,
                           * so the instruction is executed purely for its ordering effect.
                           */
     157       1.1     ad 	LOCK(13)
     158       1.1     ad 	addl	$0, -4(%esp)
     159       1.1     ad 	ret
     160      1.11   yamt ENDLABEL(membar_consumer_end)
    161       1.1     ad 
     162      1.13    chs ENTRY(_membar_producer)
                          /*
                           * Barrier implemented as a plain (unlocked) store of zero to the
                           * word just below the stack pointer.
                           */
     163       1.1     ad 	/* A store is enough */
     164       1.1     ad 	movl	$0, -4(%esp)
     165       1.1     ad 	ret
     166      1.11   yamt ENDLABEL(membar_producer_end)
    167       1.1     ad 
     168      1.13    chs ENTRY(_membar_sync)
                          /*
                           * Barrier using the same sequence as _membar_consumer: a
                           * lock-prefixed add of zero to the word just below the stack
                           * pointer, which modifies nothing and is used for its ordering
                           * effect only.
                           */
     169       1.1     ad 	LOCK(14)
     170       1.1     ad 	addl	$0, -4(%esp)
     171       1.1     ad 	ret
     172      1.11   yamt ENDLABEL(membar_sync_end)
    173       1.1     ad 
    174      1.15  pooka #ifdef _HARDKERNEL
    175      1.13    chs ENTRY(_atomic_cas_64)
    176      1.14     ad 	pushf
    177       1.6     ad 	cli
    178       1.6     ad 	pushl	%edi
    179       1.6     ad 	pushl	%ebx
    180       1.6     ad 	movl	12(%esp), %edi
    181       1.6     ad 	movl	16(%esp), %eax
    182       1.6     ad 	movl	20(%esp), %edx
    183       1.6     ad 	movl	24(%esp), %ebx
    184       1.6     ad 	movl	28(%esp), %ecx
    185       1.6     ad 	cmpl	0(%edi), %eax
    186       1.6     ad 	jne	2f
    187       1.6     ad 	cmpl	4(%edi), %edx
    188       1.6     ad 	jne	2f
    189       1.6     ad 	movl	%ebx, 0(%edi)
    190       1.6     ad 	movl	%ecx, 4(%edi)
    191       1.6     ad 1:
    192       1.6     ad 	popl	%ebx
    193       1.6     ad 	popl	%edi
    194      1.14     ad 	popf
    195       1.6     ad 	ret
    196       1.6     ad 2:
    197       1.6     ad 	movl	0(%edi), %eax
    198       1.6     ad 	movl	4(%edi), %edx
    199       1.6     ad 	jmp	1b
    200      1.11   yamt ENDLABEL(_atomic_cas_64_end)
    201       1.6     ad 
     202      1.13    chs ENTRY(_atomic_cas_cx8)
                          /*
                           * 64-bit compare-and-swap using lock cmpxchg8b.
                           * After the two pushl instructions the arguments are at:
                           *   12(%esp) address of target        -> %edi
                           *   16/20(%esp) expected low/high     -> %eax / %edx
                           *   24/28(%esp) new value low/high    -> %ebx / %ecx
                           * cmpxchg8b stores %ecx:%ebx if the target equals %edx:%eax,
                           * otherwise it loads the target into %edx:%eax.
                           */
     203       1.6     ad 	pushl	%edi
     204       1.6     ad 	pushl	%ebx
     205       1.6     ad 	movl	12(%esp), %edi
     206       1.6     ad 	movl	16(%esp), %eax
     207       1.6     ad 	movl	20(%esp), %edx
     208       1.6     ad 	movl	24(%esp), %ebx
     209       1.6     ad 	movl	28(%esp), %ecx
     210       1.6     ad 	LOCK(15)
     211       1.6     ad 	cmpxchg8b (%edi)
     212       1.6     ad 	popl	%ebx
     213       1.6     ad 	popl	%edi
     214       1.6     ad 	ret
                          	/*
                          	 * Pad with 0x90 (nop) bytes up to the end label: 16 bytes when
                          	 * GPROF is defined, 32 otherwise.
                          	 * NOTE(review): presumably this keeps the routine the same size
                          	 * as the kernel _atomic_cas_64 so one can be copied over the
                          	 * other - confirm against the code that uses the end labels.
                          	 */
     215  1.16.2.1    jym #ifdef GPROF
     216  1.16.2.1    jym 	.space	16, 0x90
     217  1.16.2.1    jym #else
     218       1.7     ad 	.space	32, 0x90
     219  1.16.2.1    jym #endif
     220      1.11   yamt ENDLABEL(_atomic_cas_cx8_end)
    221       1.6     ad 
     222      1.13    chs ENTRY(sse2_lfence)
                          /* Execute a single lfence instruction and return. */
     223       1.1     ad 	lfence
     224       1.1     ad 	ret
     225      1.11   yamt ENDLABEL(sse2_lfence_end)
    226       1.1     ad 
     227      1.13    chs ENTRY(sse2_mfence)
                          /* Execute a single mfence instruction and return. */
     228       1.1     ad 	mfence
     229       1.1     ad 	ret
     230      1.11   yamt ENDLABEL(sse2_mfence_end)
    231       1.1     ad 
     232       1.1     ad atomic_lockpatch:
                          	/*
                          	 * Zero-terminated table of the addresses of the .Lpatch<n> labels
                          	 * that the kernel LOCK(n) macro places in front of each lock
                          	 * prefix in this file.  There is no .Lpatch11: _atomic_swap_32
                          	 * uses xchgl without LOCK().
                          	 * NOTE(review): presumably consumed by code that rewrites the
                          	 * lock prefixes at run time - confirm against the user of this
                          	 * symbol.
                          	 */
     233       1.1     ad 	.globl	atomic_lockpatch
     234       1.1     ad 	.long	.Lpatch1, .Lpatch2, .Lpatch3, .Lpatch4, .Lpatch5
     235       1.1     ad 	.long	.Lpatch6, .Lpatch7, .Lpatch8, .Lpatch9, .Lpatch10
     236       1.6     ad 	.long	.Lpatch12, .Lpatch13, .Lpatch14, .Lpatch15, 0
    237       1.7     ad #else
     238      1.13    chs ENTRY(_atomic_cas_64)
                          /*
                           * Non-kernel 64-bit compare-and-swap: always lock cmpxchg8b.
                           * After the two pushl instructions the arguments are at:
                           *   12(%esp) address of target        -> %edi
                           *   16/20(%esp) expected low/high     -> %eax / %edx
                           *   24/28(%esp) new value low/high    -> %ebx / %ecx
                           * On return %edx:%eax holds the value observed in memory.
                           */
     239       1.7     ad 	pushl	%edi
     240       1.7     ad 	pushl	%ebx
     241       1.7     ad 	movl	12(%esp), %edi
     242       1.7     ad 	movl	16(%esp), %eax
     243       1.7     ad 	movl	20(%esp), %edx
     244       1.7     ad 	movl	24(%esp), %ebx
     245       1.7     ad 	movl	28(%esp), %ecx
     246       1.7     ad 	lock
     247       1.7     ad 	cmpxchg8b (%edi)
     248       1.7     ad 	popl	%ebx
     249       1.7     ad 	popl	%edi
     250       1.7     ad 	ret
    251      1.15  pooka #endif	/* _HARDKERNEL */
     252       1.1     ad 
                          /*
                           * Public entry points.  ALIAS() is a strong alias in the kernel
                           * build and a weak alias otherwise (see its definition at the top
                           * of the file).  The int/uint, long/ulong and ptr flavours all
                           * resolve to the corresponding 32-bit routine.  membar_enter shares
                           * _membar_consumer and membar_exit shares _membar_producer.
                           */
     253       1.1     ad ALIAS(atomic_add_32,_atomic_add_32)
     254       1.4     ad ALIAS(atomic_add_int,_atomic_add_32)
     255       1.4     ad ALIAS(atomic_add_long,_atomic_add_32)
     256       1.1     ad ALIAS(atomic_add_ptr,_atomic_add_32)
     257       1.1     ad 
     258       1.1     ad ALIAS(atomic_add_32_nv,_atomic_add_32_nv)
     259       1.4     ad ALIAS(atomic_add_int_nv,_atomic_add_32_nv)
     260       1.4     ad ALIAS(atomic_add_long_nv,_atomic_add_32_nv)
     261       1.1     ad ALIAS(atomic_add_ptr_nv,_atomic_add_32_nv)
     262       1.1     ad 
     263       1.1     ad ALIAS(atomic_and_32,_atomic_and_32)
     264       1.1     ad ALIAS(atomic_and_uint,_atomic_and_32)
     265       1.1     ad ALIAS(atomic_and_ulong,_atomic_and_32)
     266       1.1     ad ALIAS(atomic_and_ptr,_atomic_and_32)
     267       1.1     ad 
     268       1.1     ad ALIAS(atomic_and_32_nv,_atomic_and_32_nv)
     269       1.1     ad ALIAS(atomic_and_uint_nv,_atomic_and_32_nv)
     270       1.1     ad ALIAS(atomic_and_ulong_nv,_atomic_and_32_nv)
     271       1.1     ad ALIAS(atomic_and_ptr_nv,_atomic_and_32_nv)
     272       1.1     ad 
     273       1.1     ad ALIAS(atomic_dec_32,_atomic_dec_32)
     274       1.1     ad ALIAS(atomic_dec_uint,_atomic_dec_32)
     275       1.1     ad ALIAS(atomic_dec_ulong,_atomic_dec_32)
     276       1.1     ad ALIAS(atomic_dec_ptr,_atomic_dec_32)
     277       1.1     ad 
     278       1.1     ad ALIAS(atomic_dec_32_nv,_atomic_dec_32_nv)
     279       1.1     ad ALIAS(atomic_dec_uint_nv,_atomic_dec_32_nv)
     280       1.1     ad ALIAS(atomic_dec_ulong_nv,_atomic_dec_32_nv)
     281       1.1     ad ALIAS(atomic_dec_ptr_nv,_atomic_dec_32_nv)
     282       1.1     ad 
     283       1.1     ad ALIAS(atomic_inc_32,_atomic_inc_32)
     284       1.1     ad ALIAS(atomic_inc_uint,_atomic_inc_32)
     285       1.1     ad ALIAS(atomic_inc_ulong,_atomic_inc_32)
     286       1.1     ad ALIAS(atomic_inc_ptr,_atomic_inc_32)
     287       1.1     ad 
     288       1.1     ad ALIAS(atomic_inc_32_nv,_atomic_inc_32_nv)
     289       1.1     ad ALIAS(atomic_inc_uint_nv,_atomic_inc_32_nv)
     290       1.1     ad ALIAS(atomic_inc_ulong_nv,_atomic_inc_32_nv)
     291       1.1     ad ALIAS(atomic_inc_ptr_nv,_atomic_inc_32_nv)
     292       1.1     ad 
     293       1.1     ad ALIAS(atomic_or_32,_atomic_or_32)
     294       1.1     ad ALIAS(atomic_or_uint,_atomic_or_32)
     295       1.1     ad ALIAS(atomic_or_ulong,_atomic_or_32)
     296       1.1     ad ALIAS(atomic_or_ptr,_atomic_or_32)
     297       1.1     ad 
     298       1.1     ad ALIAS(atomic_or_32_nv,_atomic_or_32_nv)
     299       1.1     ad ALIAS(atomic_or_uint_nv,_atomic_or_32_nv)
     300       1.1     ad ALIAS(atomic_or_ulong_nv,_atomic_or_32_nv)
     301       1.1     ad ALIAS(atomic_or_ptr_nv,_atomic_or_32_nv)
     302       1.1     ad 
     303       1.1     ad ALIAS(atomic_swap_32,_atomic_swap_32)
     304       1.1     ad ALIAS(atomic_swap_uint,_atomic_swap_32)
     305       1.1     ad ALIAS(atomic_swap_ulong,_atomic_swap_32)
     306       1.1     ad ALIAS(atomic_swap_ptr,_atomic_swap_32)
     307       1.1     ad 
     308       1.1     ad ALIAS(atomic_cas_32,_atomic_cas_32)
     309       1.1     ad ALIAS(atomic_cas_uint,_atomic_cas_32)
     310       1.1     ad ALIAS(atomic_cas_ulong,_atomic_cas_32)
     311       1.1     ad ALIAS(atomic_cas_ptr,_atomic_cas_32)
     312       1.1     ad 
     313       1.9     ad ALIAS(atomic_cas_32_ni,_atomic_cas_32_ni)
     314       1.9     ad ALIAS(atomic_cas_uint_ni,_atomic_cas_32_ni)
     315       1.9     ad ALIAS(atomic_cas_ulong_ni,_atomic_cas_32_ni)
     316       1.9     ad ALIAS(atomic_cas_ptr_ni,_atomic_cas_32_ni)
     317       1.9     ad 
     318       1.6     ad ALIAS(atomic_cas_64,_atomic_cas_64)
     319       1.9     ad ALIAS(atomic_cas_64_ni,_atomic_cas_64)
     320       1.6     ad 
     321       1.1     ad ALIAS(membar_consumer,_membar_consumer)
     322       1.1     ad ALIAS(membar_producer,_membar_producer)
     323       1.8     ad ALIAS(membar_enter,_membar_consumer)
     324       1.8     ad ALIAS(membar_exit,_membar_producer)
     325       1.1     ad ALIAS(membar_sync,_membar_sync)
     326       1.5     ad 
                          /*
                           * Underscore-prefixed names for the int/uint, long/ulong and ptr
                           * flavours.  These are always strong aliases of the 32-bit
                           * routines, regardless of how ALIAS() is defined for this build.
                           */
     327       1.5     ad STRONG_ALIAS(_atomic_add_int,_atomic_add_32)
     328       1.5     ad STRONG_ALIAS(_atomic_add_long,_atomic_add_32)
     329       1.5     ad STRONG_ALIAS(_atomic_add_ptr,_atomic_add_32)
     330       1.5     ad 
     331       1.5     ad STRONG_ALIAS(_atomic_add_int_nv,_atomic_add_32_nv)
     332       1.5     ad STRONG_ALIAS(_atomic_add_long_nv,_atomic_add_32_nv)
     333       1.5     ad STRONG_ALIAS(_atomic_add_ptr_nv,_atomic_add_32_nv)
     334       1.5     ad 
     335       1.5     ad STRONG_ALIAS(_atomic_and_uint,_atomic_and_32)
     336       1.5     ad STRONG_ALIAS(_atomic_and_ulong,_atomic_and_32)
     337       1.5     ad STRONG_ALIAS(_atomic_and_ptr,_atomic_and_32)
     338       1.5     ad 
     339       1.5     ad STRONG_ALIAS(_atomic_and_uint_nv,_atomic_and_32_nv)
     340       1.5     ad STRONG_ALIAS(_atomic_and_ulong_nv,_atomic_and_32_nv)
     341       1.5     ad STRONG_ALIAS(_atomic_and_ptr_nv,_atomic_and_32_nv)
     342       1.5     ad 
     343       1.5     ad STRONG_ALIAS(_atomic_dec_uint,_atomic_dec_32)
     344       1.5     ad STRONG_ALIAS(_atomic_dec_ulong,_atomic_dec_32)
     345       1.5     ad STRONG_ALIAS(_atomic_dec_ptr,_atomic_dec_32)
     346       1.5     ad 
     347       1.5     ad STRONG_ALIAS(_atomic_dec_uint_nv,_atomic_dec_32_nv)
     348       1.5     ad STRONG_ALIAS(_atomic_dec_ulong_nv,_atomic_dec_32_nv)
     349       1.5     ad STRONG_ALIAS(_atomic_dec_ptr_nv,_atomic_dec_32_nv)
     350       1.5     ad 
     351       1.5     ad STRONG_ALIAS(_atomic_inc_uint,_atomic_inc_32)
     352       1.5     ad STRONG_ALIAS(_atomic_inc_ulong,_atomic_inc_32)
     353       1.5     ad STRONG_ALIAS(_atomic_inc_ptr,_atomic_inc_32)
     354       1.5     ad 
     355       1.5     ad STRONG_ALIAS(_atomic_inc_uint_nv,_atomic_inc_32_nv)
     356       1.5     ad STRONG_ALIAS(_atomic_inc_ulong_nv,_atomic_inc_32_nv)
     357       1.5     ad STRONG_ALIAS(_atomic_inc_ptr_nv,_atomic_inc_32_nv)
     358       1.5     ad 
     359       1.5     ad STRONG_ALIAS(_atomic_or_uint,_atomic_or_32)
     360       1.5     ad STRONG_ALIAS(_atomic_or_ulong,_atomic_or_32)
     361       1.5     ad STRONG_ALIAS(_atomic_or_ptr,_atomic_or_32)
     362       1.5     ad 
     363       1.5     ad STRONG_ALIAS(_atomic_or_uint_nv,_atomic_or_32_nv)
     364       1.5     ad STRONG_ALIAS(_atomic_or_ulong_nv,_atomic_or_32_nv)
     365       1.5     ad STRONG_ALIAS(_atomic_or_ptr_nv,_atomic_or_32_nv)
     366       1.5     ad 
     367       1.5     ad STRONG_ALIAS(_atomic_swap_uint,_atomic_swap_32)
     368       1.5     ad STRONG_ALIAS(_atomic_swap_ulong,_atomic_swap_32)
     369       1.5     ad STRONG_ALIAS(_atomic_swap_ptr,_atomic_swap_32)
     370       1.5     ad 
     371       1.5     ad STRONG_ALIAS(_atomic_cas_uint,_atomic_cas_32)
     372       1.5     ad STRONG_ALIAS(_atomic_cas_ulong,_atomic_cas_32)
     373       1.5     ad STRONG_ALIAS(_atomic_cas_ptr,_atomic_cas_32)
     374       1.8     ad 
     375       1.9     ad STRONG_ALIAS(_atomic_cas_uint_ni,_atomic_cas_32_ni)
     376       1.9     ad STRONG_ALIAS(_atomic_cas_ulong_ni,_atomic_cas_32_ni)
     377       1.9     ad STRONG_ALIAS(_atomic_cas_ptr_ni,_atomic_cas_32_ni)
     378       1.9     ad 
     379       1.8     ad STRONG_ALIAS(_membar_enter,_membar_consumer)
     380       1.8     ad STRONG_ALIAS(_membar_exit,_membar_producer)
    381