Home | History | Annotate | Line # | Download | only in atomic
atomic.S revision 1.9.4.1
      1  1.9.4.1  yamt /*	$NetBSD: atomic.S,v 1.9.4.1 2008/05/18 12:28:45 yamt Exp $	*/
      2      1.1    ad 
      3      1.1    ad /*-
      4      1.1    ad  * Copyright (c) 2007 The NetBSD Foundation, Inc.
      5      1.1    ad  * All rights reserved.
      6      1.1    ad  *
      7      1.1    ad  * This code is derived from software contributed to The NetBSD Foundation
      8      1.1    ad  * by Jason R. Thorpe, and by Andrew Doran.
      9      1.1    ad  *
     10      1.1    ad  * Redistribution and use in source and binary forms, with or without
     11      1.1    ad  * modification, are permitted provided that the following conditions
     12      1.1    ad  * are met:
     13      1.1    ad  * 1. Redistributions of source code must retain the above copyright
     14      1.1    ad  *    notice, this list of conditions and the following disclaimer.
     15      1.1    ad  * 2. Redistributions in binary form must reproduce the above copyright
     16      1.1    ad  *    notice, this list of conditions and the following disclaimer in the
     17      1.1    ad  *    documentation and/or other materials provided with the distribution.
     18      1.1    ad  *
     19      1.1    ad  * THIS SOFTWARE IS PROVIDED BY THE NETBSD FOUNDATION, INC. AND CONTRIBUTORS
     20      1.1    ad  * ``AS IS'' AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED
     21      1.1    ad  * TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR
     22      1.1    ad  * PURPOSE ARE DISCLAIMED.  IN NO EVENT SHALL THE FOUNDATION OR CONTRIBUTORS
     23      1.1    ad  * BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
     24      1.1    ad  * CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
     25      1.1    ad  * SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS
     26      1.1    ad  * INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN
     27      1.1    ad  * CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE)
     28      1.1    ad  * ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE
     29      1.1    ad  * POSSIBILITY OF SUCH DAMAGE.
     30      1.1    ad  */
     31      1.1    ad 
     32      1.1    ad #include <machine/asm.h>
     33      1.1    ad /* LOCK(n) emits a lock prefix, labelled .Lpatch<n> in the kernel build; ALIAS is STRONG_ALIAS in the kernel and WEAK_ALIAS otherwise; ENDLABEL emits an aligned label in the kernel and nothing otherwise. */
     34      1.1    ad #ifdef _KERNEL
     35      1.1    ad #define	LOCK(n)		.Lpatch/**/n:	lock
     36      1.1    ad #define	ALIAS(f, t)	STRONG_ALIAS(f,t)
     37  1.9.4.1  yamt #define	ENDLABEL(a)	_ALIGN_TEXT; LABEL(a)
     38      1.1    ad #else
     39      1.1    ad #define	LOCK(n)		lock
     40      1.1    ad #define	ALIAS(f, t)	WEAK_ALIAS(f,t)
     41  1.9.4.1  yamt #define	ENDLABEL(a)	/* nothing */
     42      1.1    ad #endif
     43      1.1    ad 
     44      1.1    ad 	.text
     45      1.1    ad /* _atomic_add_32: add the second stack argument to the 32-bit word addressed by the first, under a lock prefix. */
     46      1.1    ad NENTRY(_atomic_add_32)
     47      1.1    ad 	movl	4(%esp), %edx	/* %edx = address of the target word */
     48      1.1    ad 	movl	8(%esp), %eax	/* %eax = addend */
     49      1.1    ad 	LOCK(1)	/* lock prefix applies to the addl below */
     50      1.1    ad 	addl	%eax, (%edx)	/* *target += addend */
     51      1.1    ad 	ret
     52      1.1    ad /* _atomic_add_32_nv: as _atomic_add_32, but leaves the post-add value of the word in %eax. */
     53      1.1    ad NENTRY(_atomic_add_32_nv)
     54      1.1    ad 	movl	4(%esp), %edx	/* %edx = address of the target word */
     55      1.1    ad 	movl	8(%esp), %eax	/* %eax = addend */
     56      1.1    ad 	movl	%eax, %ecx	/* keep a copy: xaddl overwrites %eax */
     57      1.1    ad 	LOCK(2)	/* lock prefix applies to the xaddl below */
     58      1.1    ad 	xaddl	%eax, (%edx)	/* *target += addend; %eax = previous *target */
     59      1.1    ad 	addl	%ecx, %eax	/* previous value + addend = value that was stored */
     60      1.1    ad 	ret
     61      1.1    ad /* _atomic_and_32: AND the second stack argument into the 32-bit word addressed by the first, under a lock prefix. */
     62      1.1    ad NENTRY(_atomic_and_32)
     63      1.1    ad 	movl	4(%esp), %edx	/* %edx = address of the target word */
     64      1.1    ad 	movl	8(%esp), %eax	/* %eax = mask */
     65      1.1    ad 	LOCK(3)	/* lock prefix applies to the andl below */
     66      1.1    ad 	andl	%eax, (%edx)	/* *target &= mask */
     67      1.1    ad 	ret
     68      1.1    ad /* _atomic_and_32_nv: AND the second stack argument into the addressed word with a cmpxchg retry loop; %eax holds the stored result on return. */
     69      1.1    ad NENTRY(_atomic_and_32_nv)
     70      1.1    ad 	movl	4(%esp), %edx	/* %edx = address of the target word */
     71      1.1    ad 	movl	(%edx), %eax	/* %eax = initial snapshot of the word */
     72      1.1    ad 1:	/* retry point: %eax = value the word is expected to hold */
     73      1.1    ad 	movl	%eax, %ecx
     74      1.1    ad 	andl	8(%esp), %ecx	/* %ecx = snapshot & mask */
     75      1.1    ad 	LOCK(4)	/* lock prefix applies to the cmpxchgl below */
     76      1.1    ad 	cmpxchgl %ecx, (%edx)	/* store %ecx if word == %eax, else reload %eax from the word */
     77      1.1    ad 	jnz	1b	/* ZF clear: the word changed since the snapshot, try again */
     78      1.1    ad 	movl	%ecx, %eax	/* result = value just stored */
     79      1.1    ad 	ret
     80      1.1    ad /* _atomic_dec_32: decrement the 32-bit word addressed by the first stack argument, under a lock prefix. */
     81      1.1    ad NENTRY(_atomic_dec_32)
     82      1.1    ad 	movl	4(%esp), %edx	/* %edx = address of the target word */
     83      1.1    ad 	LOCK(5)	/* lock prefix applies to the decl below */
     84      1.1    ad 	decl	(%edx)	/* *target -= 1 */
     85      1.1    ad 	ret
     86      1.1    ad /* _atomic_dec_32_nv: decrement the addressed word and leave the decremented value in %eax. */
     87      1.1    ad NENTRY(_atomic_dec_32_nv)
     88      1.1    ad 	movl	4(%esp), %edx	/* %edx = address of the target word */
     89      1.1    ad 	movl	$-1, %eax	/* addend of -1 for xaddl */
     90      1.1    ad 	LOCK(6)	/* lock prefix applies to the xaddl below */
     91      1.1    ad 	xaddl	%eax, (%edx)	/* *target += -1; %eax = previous *target */
     92      1.1    ad 	decl	%eax	/* previous value - 1 = value that was stored */
     93      1.1    ad 	ret
     94      1.1    ad /* _atomic_inc_32: increment the 32-bit word addressed by the first stack argument, under a lock prefix. */
     95      1.1    ad NENTRY(_atomic_inc_32)
     96      1.1    ad 	movl	4(%esp), %edx	/* %edx = address of the target word */
     97      1.1    ad 	LOCK(7)	/* lock prefix applies to the incl below */
     98      1.1    ad 	incl	(%edx)	/* *target += 1 */
     99      1.1    ad 	ret
    100      1.1    ad /* _atomic_inc_32_nv: increment the addressed word and leave the incremented value in %eax. */
    101      1.1    ad NENTRY(_atomic_inc_32_nv)
    102      1.1    ad 	movl	4(%esp), %edx	/* %edx = address of the target word */
    103      1.1    ad 	movl	$1, %eax	/* addend of 1 for xaddl */
    104      1.1    ad 	LOCK(8)	/* lock prefix applies to the xaddl below */
    105      1.1    ad 	xaddl	%eax, (%edx)	/* *target += 1; %eax = previous *target */
    106      1.1    ad 	incl	%eax	/* previous value + 1 = value that was stored */
    107      1.1    ad 	ret
    108      1.1    ad /* _atomic_or_32: OR the second stack argument into the 32-bit word addressed by the first, under a lock prefix. */
    109      1.1    ad NENTRY(_atomic_or_32)
    110      1.1    ad 	movl	4(%esp), %edx	/* %edx = address of the target word */
    111      1.1    ad 	movl	8(%esp), %eax	/* %eax = bits to set */
    112      1.1    ad 	LOCK(9)	/* lock prefix applies to the orl below */
    113      1.1    ad 	orl	%eax, (%edx)	/* *target |= bits */
    114      1.1    ad 	ret
    115      1.1    ad /* _atomic_or_32_nv: OR the second stack argument into the addressed word with a cmpxchg retry loop; %eax holds the stored result on return. */
    116      1.1    ad NENTRY(_atomic_or_32_nv)
    117      1.1    ad 	movl	4(%esp), %edx	/* %edx = address of the target word */
    118      1.1    ad 	movl	(%edx), %eax	/* %eax = initial snapshot of the word */
    119      1.1    ad 1:	/* retry point: %eax = value the word is expected to hold */
    120      1.1    ad 	movl	%eax, %ecx
    121      1.1    ad 	orl	8(%esp), %ecx	/* %ecx = snapshot | bits */
    122      1.1    ad 	LOCK(10)	/* lock prefix applies to the cmpxchgl below */
    123      1.1    ad 	cmpxchgl %ecx, (%edx)	/* store %ecx if word == %eax, else reload %eax from the word */
    124      1.1    ad 	jnz	1b	/* ZF clear: the word changed since the snapshot, try again */
    125      1.1    ad 	movl	%ecx, %eax	/* result = value just stored */
    126      1.1    ad 	ret
    127      1.1    ad /* _atomic_swap_32: exchange the second stack argument with the addressed 32-bit word; the previous contents are left in %eax. */
    128      1.1    ad NENTRY(_atomic_swap_32)
    129      1.1    ad 	movl	4(%esp), %edx	/* %edx = address of the target word */
    130      1.1    ad 	movl	8(%esp), %eax	/* %eax = value to store */
    131      1.1    ad 	xchgl	%eax, (%edx)	/* no LOCK() macro here: xchg with a memory operand is locked by the processor itself, so there is no patch label for it */
    132      1.1    ad 	ret
    133      1.1    ad /* _atomic_cas_32: compare the addressed word with the second stack argument and, if equal, store the third; lock-prefixed. */
    134      1.1    ad NENTRY(_atomic_cas_32)
    135      1.1    ad 	movl	4(%esp), %edx	/* %edx = address of the target word */
    136      1.1    ad 	movl	8(%esp), %eax	/* %eax = expected value (cmpxchg compares against %eax) */
    137      1.1    ad 	movl	12(%esp), %ecx	/* %ecx = replacement value */
    138      1.1    ad 	LOCK(12)	/* lock prefix applies to the cmpxchgl below */
    139      1.1    ad 	cmpxchgl %ecx, (%edx)	/* on mismatch the word is left alone and loaded into %eax */
    140      1.1    ad 	/* %eax now contains the old value */
    141      1.1    ad 	ret
    142      1.9    ad /* _atomic_cas_32_ni: same sequence as _atomic_cas_32 but without a lock prefix (the "_ni" suffix presumably means non-interlocked -- confirm). */
    143      1.9    ad NENTRY(_atomic_cas_32_ni)
    144      1.9    ad 	movl	4(%esp), %edx	/* %edx = address of the target word */
    145      1.9    ad 	movl	8(%esp), %eax	/* %eax = expected value */
    146      1.9    ad 	movl	12(%esp), %ecx	/* %ecx = replacement value */
    147      1.9    ad 	cmpxchgl %ecx, (%edx)	/* unlocked compare-and-exchange */
    148      1.9    ad 	/* %eax now contains the old value */
    149      1.9    ad 	ret
    150      1.9    ad /* _membar_consumer: performs a lock-prefixed add of zero to the word just below the stack pointer; the word's value is unchanged. */
    151      1.1    ad NENTRY(_membar_consumer)
    152      1.1    ad 	LOCK(13)	/* lock prefix applies to the addl below */
    153      1.1    ad 	addl	$0, -4(%esp)	/* locked read-modify-write used purely for its ordering effect */
    154      1.1    ad 	ret
    155  1.9.4.1  yamt ENDLABEL(membar_consumer_end)	/* kernel build only: aligned label marking the end of the routine */
    156      1.1    ad /* _membar_producer: performs a plain (unlocked) store to the word just below the stack pointer. */
    157      1.1    ad NENTRY(_membar_producer)
    158      1.1    ad 	/* A store is enough */
    159      1.1    ad 	movl	$0, -4(%esp)	/* unlike the other membar routines this overwrites the word with zero */
    160      1.1    ad 	ret
    161  1.9.4.1  yamt ENDLABEL(membar_producer_end)	/* kernel build only: aligned label marking the end of the routine */
    162      1.1    ad /* _membar_sync: same instruction sequence as _membar_consumer, with its own lock label (14). */
    163      1.1    ad NENTRY(_membar_sync)
    164      1.1    ad 	LOCK(14)	/* lock prefix applies to the addl below */
    165      1.1    ad 	addl	$0, -4(%esp)	/* locked add of zero: value unchanged, used for its ordering effect */
    166      1.1    ad 	ret
    167  1.9.4.1  yamt ENDLABEL(membar_sync_end)	/* kernel build only: aligned label marking the end of the routine */
    168      1.1    ad 
    169      1.1    ad #ifdef _KERNEL
    170      1.6    ad NENTRY(_atomic_cas_64)	/* kernel build: 64-bit compare-and-swap done with plain loads and stores between cli and sti; the old value is left in %edx:%eax */
    171      1.6    ad 	cli	/* interrupts off for the compare/store sequence; NOTE(review): no lock prefix is used, so this presumably targets processors without cmpxchg8b -- confirm */
    172      1.6    ad 	pushl	%edi	/* %edi and %ebx are restored before returning */
    173      1.6    ad 	pushl	%ebx
    174      1.6    ad 	movl	12(%esp), %edi	/* two pushes + return address: first argument (target address) is at 12(%esp) */
    175      1.6    ad 	movl	16(%esp), %eax	/* %eax = expected value, low half */
    176      1.6    ad 	movl	20(%esp), %edx	/* %edx = expected value, high half */
    177      1.6    ad 	movl	24(%esp), %ebx	/* %ebx = new value, low half */
    178      1.6    ad 	movl	28(%esp), %ecx	/* %ecx = new value, high half */
    179      1.6    ad 	cmpl	0(%edi), %eax	/* low halves differ -> no store */
    180      1.6    ad 	jne	2f
    181      1.6    ad 	cmpl	4(%edi), %edx	/* high halves differ -> no store */
    182      1.6    ad 	jne	2f
    183      1.6    ad 	movl	%ebx, 0(%edi)	/* match: store the new value; %edx:%eax already equal the old value */
    184      1.6    ad 	movl	%ecx, 4(%edi)
    185      1.6    ad 1:	/* common exit */
    186      1.6    ad 	popl	%ebx
    187      1.6    ad 	popl	%edi
    188      1.6    ad 	sti	/* NOTE(review): enables interrupts unconditionally, even if they were already disabled on entry; pushfl/cli ... popfl would preserve the entry state, but changes code size and stack offsets -- confirm against callers and any user of _atomic_cas_64_end */
    189      1.6    ad 	ret
    190      1.6    ad 2:	/* mismatch: report the current contents of the target */
    191      1.6    ad 	movl	0(%edi), %eax
    192      1.6    ad 	movl	4(%edi), %edx
    193      1.6    ad 	jmp	1b
    194  1.9.4.1  yamt ENDLABEL(_atomic_cas_64_end)	/* aligned label marking the end of the routine */
    195      1.6    ad /* _atomic_cas_cx8: 64-bit compare-and-swap using lock cmpxchg8b; takes the same stack arguments as the kernel _atomic_cas_64 and leaves the old value in %edx:%eax. */
    196      1.6    ad NENTRY(_atomic_cas_cx8)
    197      1.6    ad 	pushl	%edi	/* %edi and %ebx are restored before returning */
    198      1.6    ad 	pushl	%ebx
    199      1.6    ad 	movl	12(%esp), %edi	/* %edi = address of the 64-bit target */
    200      1.6    ad 	movl	16(%esp), %eax	/* %edx:%eax = expected value */
    201      1.6    ad 	movl	20(%esp), %edx
    202      1.6    ad 	movl	24(%esp), %ebx	/* %ecx:%ebx = new value */
    203      1.6    ad 	movl	28(%esp), %ecx
    204      1.6    ad 	LOCK(15)	/* lock prefix applies to the cmpxchg8b below */
    205      1.6    ad 	cmpxchg8b (%edi)	/* store %ecx:%ebx if target == %edx:%eax, else load target into %edx:%eax */
    206      1.6    ad 	popl	%ebx
    207      1.6    ad 	popl	%edi
    208      1.6    ad 	ret
    209      1.7    ad 	.space	32, 0x90	/* 32 bytes of 0x90 (the one-byte nop opcode) after the ret; presumably size padding for code that copies this routine -- confirm */
    210  1.9.4.1  yamt ENDLABEL(_atomic_cas_cx8_end)	/* aligned label marking the end of the routine, padding included */
    211      1.6    ad /* sse2_lfence: kernel-only routine consisting of a single lfence instruction. */
    212      1.1    ad NENTRY(sse2_lfence)
    213      1.1    ad 	lfence	/* load fence */
    214      1.1    ad 	ret
    215  1.9.4.1  yamt ENDLABEL(sse2_lfence_end)	/* aligned label marking the end of the routine */
    216      1.1    ad /* sse2_mfence: kernel-only routine consisting of a single mfence instruction. */
    217      1.1    ad NENTRY(sse2_mfence)
    218      1.1    ad 	mfence	/* full load/store fence */
    219      1.1    ad 	ret
    220  1.9.4.1  yamt ENDLABEL(sse2_mfence_end)	/* aligned label marking the end of the routine */
    221      1.1    ad /* atomic_lockpatch: global, zero-terminated table holding the address of every lock prefix emitted by LOCK() in this file. */
    222      1.1    ad atomic_lockpatch:
    223      1.1    ad 	.globl	atomic_lockpatch
    224      1.1    ad 	.long	.Lpatch1, .Lpatch2, .Lpatch3, .Lpatch4, .Lpatch5
    225      1.1    ad 	.long	.Lpatch6, .Lpatch7, .Lpatch8, .Lpatch9, .Lpatch10	/* there is no .Lpatch11: no LOCK(11) appears in this file */
    226      1.6    ad 	.long	.Lpatch12, .Lpatch13, .Lpatch14, .Lpatch15, 0	/* trailing 0 terminates the list */
    227      1.7    ad #else
    228      1.7    ad NENTRY(_atomic_cas_64)	/* non-kernel build: 64-bit compare-and-swap using lock cmpxchg8b; the old value is left in %edx:%eax */
    229      1.7    ad 	pushl	%edi	/* %edi and %ebx are restored before returning */
    230      1.7    ad 	pushl	%ebx
    231      1.7    ad 	movl	12(%esp), %edi	/* %edi = address of the 64-bit target */
    232      1.7    ad 	movl	16(%esp), %eax	/* %edx:%eax = expected value */
    233      1.7    ad 	movl	20(%esp), %edx
    234      1.7    ad 	movl	24(%esp), %ebx	/* %ecx:%ebx = new value */
    235      1.7    ad 	movl	28(%esp), %ecx
    236      1.7    ad 	lock	/* literal prefix rather than LOCK(): no patch label is emitted for it */
    237      1.7    ad 	cmpxchg8b (%edi)	/* store %ecx:%ebx if target == %edx:%eax, else load target into %edx:%eax */
    238      1.7    ad 	popl	%ebx
    239      1.7    ad 	popl	%edi
    240      1.7    ad 	ret
    241      1.1    ad #endif	/* _KERNEL */
    242      1.1    ad /* Public names: each symbol below is an ALIAS (strong in the kernel build, weak otherwise) of an underscore-prefixed routine above; the int/uint, long/ulong and ptr variants all map to the 32-bit routine. */
    243      1.1    ad ALIAS(atomic_add_32,_atomic_add_32)
    244      1.4    ad ALIAS(atomic_add_int,_atomic_add_32)
    245      1.4    ad ALIAS(atomic_add_long,_atomic_add_32)
    246      1.1    ad ALIAS(atomic_add_ptr,_atomic_add_32)
    247      1.1    ad 
    248      1.1    ad ALIAS(atomic_add_32_nv,_atomic_add_32_nv)
    249      1.4    ad ALIAS(atomic_add_int_nv,_atomic_add_32_nv)
    250      1.4    ad ALIAS(atomic_add_long_nv,_atomic_add_32_nv)
    251      1.1    ad ALIAS(atomic_add_ptr_nv,_atomic_add_32_nv)
    252      1.1    ad 
    253      1.1    ad ALIAS(atomic_and_32,_atomic_and_32)
    254      1.1    ad ALIAS(atomic_and_uint,_atomic_and_32)
    255      1.1    ad ALIAS(atomic_and_ulong,_atomic_and_32)
    256      1.1    ad ALIAS(atomic_and_ptr,_atomic_and_32)
    257      1.1    ad 
    258      1.1    ad ALIAS(atomic_and_32_nv,_atomic_and_32_nv)
    259      1.1    ad ALIAS(atomic_and_uint_nv,_atomic_and_32_nv)
    260      1.1    ad ALIAS(atomic_and_ulong_nv,_atomic_and_32_nv)
    261      1.1    ad ALIAS(atomic_and_ptr_nv,_atomic_and_32_nv)
    262      1.1    ad 
    263      1.1    ad ALIAS(atomic_dec_32,_atomic_dec_32)
    264      1.1    ad ALIAS(atomic_dec_uint,_atomic_dec_32)
    265      1.1    ad ALIAS(atomic_dec_ulong,_atomic_dec_32)
    266      1.1    ad ALIAS(atomic_dec_ptr,_atomic_dec_32)
    267      1.1    ad 
    268      1.1    ad ALIAS(atomic_dec_32_nv,_atomic_dec_32_nv)
    269      1.1    ad ALIAS(atomic_dec_uint_nv,_atomic_dec_32_nv)
    270      1.1    ad ALIAS(atomic_dec_ulong_nv,_atomic_dec_32_nv)
    271      1.1    ad ALIAS(atomic_dec_ptr_nv,_atomic_dec_32_nv)
    272      1.1    ad 
    273      1.1    ad ALIAS(atomic_inc_32,_atomic_inc_32)
    274      1.1    ad ALIAS(atomic_inc_uint,_atomic_inc_32)
    275      1.1    ad ALIAS(atomic_inc_ulong,_atomic_inc_32)
    276      1.1    ad ALIAS(atomic_inc_ptr,_atomic_inc_32)
    277      1.1    ad 
    278      1.1    ad ALIAS(atomic_inc_32_nv,_atomic_inc_32_nv)
    279      1.1    ad ALIAS(atomic_inc_uint_nv,_atomic_inc_32_nv)
    280      1.1    ad ALIAS(atomic_inc_ulong_nv,_atomic_inc_32_nv)
    281      1.1    ad ALIAS(atomic_inc_ptr_nv,_atomic_inc_32_nv)
    282      1.1    ad 
    283      1.1    ad ALIAS(atomic_or_32,_atomic_or_32)
    284      1.1    ad ALIAS(atomic_or_uint,_atomic_or_32)
    285      1.1    ad ALIAS(atomic_or_ulong,_atomic_or_32)
    286      1.1    ad ALIAS(atomic_or_ptr,_atomic_or_32)
    287      1.1    ad 
    288      1.1    ad ALIAS(atomic_or_32_nv,_atomic_or_32_nv)
    289      1.1    ad ALIAS(atomic_or_uint_nv,_atomic_or_32_nv)
    290      1.1    ad ALIAS(atomic_or_ulong_nv,_atomic_or_32_nv)
    291      1.1    ad ALIAS(atomic_or_ptr_nv,_atomic_or_32_nv)
    292      1.1    ad 
    293      1.1    ad ALIAS(atomic_swap_32,_atomic_swap_32)
    294      1.1    ad ALIAS(atomic_swap_uint,_atomic_swap_32)
    295      1.1    ad ALIAS(atomic_swap_ulong,_atomic_swap_32)
    296      1.1    ad ALIAS(atomic_swap_ptr,_atomic_swap_32)
    297      1.1    ad 
    298      1.1    ad ALIAS(atomic_cas_32,_atomic_cas_32)
    299      1.1    ad ALIAS(atomic_cas_uint,_atomic_cas_32)
    300      1.1    ad ALIAS(atomic_cas_ulong,_atomic_cas_32)
    301      1.1    ad ALIAS(atomic_cas_ptr,_atomic_cas_32)
    302      1.1    ad 
    303      1.9    ad ALIAS(atomic_cas_32_ni,_atomic_cas_32_ni)
    304      1.9    ad ALIAS(atomic_cas_uint_ni,_atomic_cas_32_ni)
    305      1.9    ad ALIAS(atomic_cas_ulong_ni,_atomic_cas_32_ni)
    306      1.9    ad ALIAS(atomic_cas_ptr_ni,_atomic_cas_32_ni)
    307      1.9    ad 
    308      1.6    ad ALIAS(atomic_cas_64,_atomic_cas_64)
    309      1.9    ad ALIAS(atomic_cas_64_ni,_atomic_cas_64)	/* the 64-bit _ni name shares the regular _atomic_cas_64 routine; there is no separate _atomic_cas_64_ni */
    310      1.6    ad 
    311      1.1    ad ALIAS(membar_consumer,_membar_consumer)
    312      1.1    ad ALIAS(membar_producer,_membar_producer)
    313      1.8    ad ALIAS(membar_enter,_membar_consumer)	/* membar_enter shares the _membar_consumer code */
    314      1.8    ad ALIAS(membar_exit,_membar_producer)	/* membar_exit shares the _membar_producer code */
    315      1.1    ad ALIAS(membar_sync,_membar_sync)
    316      1.5    ad /* Underscore-prefixed type variants: always strong aliases (in both kernel and non-kernel builds) of the 32-bit routines. */
    317      1.5    ad STRONG_ALIAS(_atomic_add_int,_atomic_add_32)
    318      1.5    ad STRONG_ALIAS(_atomic_add_long,_atomic_add_32)
    319      1.5    ad STRONG_ALIAS(_atomic_add_ptr,_atomic_add_32)
    320      1.5    ad 
    321      1.5    ad STRONG_ALIAS(_atomic_add_int_nv,_atomic_add_32_nv)
    322      1.5    ad STRONG_ALIAS(_atomic_add_long_nv,_atomic_add_32_nv)
    323      1.5    ad STRONG_ALIAS(_atomic_add_ptr_nv,_atomic_add_32_nv)
    324      1.5    ad 
    325      1.5    ad STRONG_ALIAS(_atomic_and_uint,_atomic_and_32)
    326      1.5    ad STRONG_ALIAS(_atomic_and_ulong,_atomic_and_32)
    327      1.5    ad STRONG_ALIAS(_atomic_and_ptr,_atomic_and_32)
    328      1.5    ad 
    329      1.5    ad STRONG_ALIAS(_atomic_and_uint_nv,_atomic_and_32_nv)
    330      1.5    ad STRONG_ALIAS(_atomic_and_ulong_nv,_atomic_and_32_nv)
    331      1.5    ad STRONG_ALIAS(_atomic_and_ptr_nv,_atomic_and_32_nv)
    332      1.5    ad 
    333      1.5    ad STRONG_ALIAS(_atomic_dec_uint,_atomic_dec_32)
    334      1.5    ad STRONG_ALIAS(_atomic_dec_ulong,_atomic_dec_32)
    335      1.5    ad STRONG_ALIAS(_atomic_dec_ptr,_atomic_dec_32)
    336      1.5    ad 
    337      1.5    ad STRONG_ALIAS(_atomic_dec_uint_nv,_atomic_dec_32_nv)
    338      1.5    ad STRONG_ALIAS(_atomic_dec_ulong_nv,_atomic_dec_32_nv)
    339      1.5    ad STRONG_ALIAS(_atomic_dec_ptr_nv,_atomic_dec_32_nv)
    340      1.5    ad 
    341      1.5    ad STRONG_ALIAS(_atomic_inc_uint,_atomic_inc_32)
    342      1.5    ad STRONG_ALIAS(_atomic_inc_ulong,_atomic_inc_32)
    343      1.5    ad STRONG_ALIAS(_atomic_inc_ptr,_atomic_inc_32)
    344      1.5    ad 
    345      1.5    ad STRONG_ALIAS(_atomic_inc_uint_nv,_atomic_inc_32_nv)
    346      1.5    ad STRONG_ALIAS(_atomic_inc_ulong_nv,_atomic_inc_32_nv)
    347      1.5    ad STRONG_ALIAS(_atomic_inc_ptr_nv,_atomic_inc_32_nv)
    348      1.5    ad 
    349      1.5    ad STRONG_ALIAS(_atomic_or_uint,_atomic_or_32)
    350      1.5    ad STRONG_ALIAS(_atomic_or_ulong,_atomic_or_32)
    351      1.5    ad STRONG_ALIAS(_atomic_or_ptr,_atomic_or_32)
    352      1.5    ad 
    353      1.5    ad STRONG_ALIAS(_atomic_or_uint_nv,_atomic_or_32_nv)
    354      1.5    ad STRONG_ALIAS(_atomic_or_ulong_nv,_atomic_or_32_nv)
    355      1.5    ad STRONG_ALIAS(_atomic_or_ptr_nv,_atomic_or_32_nv)
    356      1.5    ad 
    357      1.5    ad STRONG_ALIAS(_atomic_swap_uint,_atomic_swap_32)
    358      1.5    ad STRONG_ALIAS(_atomic_swap_ulong,_atomic_swap_32)
    359      1.5    ad STRONG_ALIAS(_atomic_swap_ptr,_atomic_swap_32)
    360      1.5    ad 
    361      1.5    ad STRONG_ALIAS(_atomic_cas_uint,_atomic_cas_32)
    362      1.5    ad STRONG_ALIAS(_atomic_cas_ulong,_atomic_cas_32)
    363      1.5    ad STRONG_ALIAS(_atomic_cas_ptr,_atomic_cas_32)
    364      1.8    ad 
    365      1.9    ad STRONG_ALIAS(_atomic_cas_uint_ni,_atomic_cas_32_ni)
    366      1.9    ad STRONG_ALIAS(_atomic_cas_ulong_ni,_atomic_cas_32_ni)
    367      1.9    ad STRONG_ALIAS(_atomic_cas_ptr_ni,_atomic_cas_32_ni)
    368      1.9    ad 
    369      1.8    ad STRONG_ALIAS(_membar_enter,_membar_consumer)	/* _membar_enter shares the _membar_consumer code */
    370      1.8    ad STRONG_ALIAS(_membar_exit,_membar_producer)	/* _membar_exit shares the _membar_producer code */
    371