Home | History | Annotate | Line # | Download | only in include
lock.h revision 1.13
      1  1.13        ad /*	$NetBSD: lock.h,v 1.13 2007/02/09 21:55:14 ad Exp $	*/
      2   1.1      fvdl 
      3   1.1      fvdl /*-
      4  1.12        ad  * Copyright (c) 2000, 2006 The NetBSD Foundation, Inc.
      5   1.1      fvdl  * All rights reserved.
      6   1.1      fvdl  *
      7   1.1      fvdl  * This code is derived from software contributed to The NetBSD Foundation
      8  1.12        ad  * by Jason R. Thorpe and Andrew Doran.
      9   1.1      fvdl  *
     10   1.1      fvdl  * Redistribution and use in source and binary forms, with or without
     11   1.1      fvdl  * modification, are permitted provided that the following conditions
     12   1.1      fvdl  * are met:
     13   1.1      fvdl  * 1. Redistributions of source code must retain the above copyright
     14   1.1      fvdl  *    notice, this list of conditions and the following disclaimer.
     15   1.1      fvdl  * 2. Redistributions in binary form must reproduce the above copyright
     16   1.1      fvdl  *    notice, this list of conditions and the following disclaimer in the
     17   1.1      fvdl  *    documentation and/or other materials provided with the distribution.
     18   1.1      fvdl  * 3. All advertising materials mentioning features or use of this software
     19   1.1      fvdl  *    must display the following acknowledgement:
     20   1.1      fvdl  *	This product includes software developed by the NetBSD
     21   1.1      fvdl  *	Foundation, Inc. and its contributors.
     22   1.1      fvdl  * 4. Neither the name of The NetBSD Foundation nor the names of its
     23   1.1      fvdl  *    contributors may be used to endorse or promote products derived
     24   1.1      fvdl  *    from this software without specific prior written permission.
     25   1.1      fvdl  *
     26   1.1      fvdl  * THIS SOFTWARE IS PROVIDED BY THE NETBSD FOUNDATION, INC. AND CONTRIBUTORS
     27   1.1      fvdl  * ``AS IS'' AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED
     28   1.1      fvdl  * TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR
     29   1.1      fvdl  * PURPOSE ARE DISCLAIMED.  IN NO EVENT SHALL THE FOUNDATION OR CONTRIBUTORS
     30   1.1      fvdl  * BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
     31   1.1      fvdl  * CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
     32   1.1      fvdl  * SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS
     33   1.1      fvdl  * INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN
     34   1.1      fvdl  * CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE)
     35   1.1      fvdl  * ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE
     36   1.1      fvdl  * POSSIBILITY OF SUCH DAMAGE.
     37   1.1      fvdl  */
     38   1.1      fvdl 
     39   1.1      fvdl /*
     40   1.1      fvdl  * Machine-dependent spin lock operations.
     41   1.1      fvdl  */
     42   1.1      fvdl 
     43   1.9      yamt #ifndef _X86_LOCK_H_
     44   1.9      yamt #define	_X86_LOCK_H_
     45   1.1      fvdl 
     46   1.1      fvdl #if defined(_KERNEL_OPT)
     47   1.1      fvdl #include "opt_lockdebug.h"
     48   1.1      fvdl #endif
     49   1.1      fvdl 
     50   1.2      fvdl #include <machine/cpufunc.h>
     51   1.1      fvdl 
     52   1.1      fvdl #ifdef LOCKDEBUG
     53   1.1      fvdl 
     54   1.5  junyoung extern void __cpu_simple_lock_init(__cpu_simple_lock_t *);
     55   1.5  junyoung extern void __cpu_simple_lock(__cpu_simple_lock_t *);
     56   1.5  junyoung extern int __cpu_simple_lock_try(__cpu_simple_lock_t *);
     57   1.5  junyoung extern void __cpu_simple_unlock(__cpu_simple_lock_t *);
     58   1.1      fvdl 
     59   1.1      fvdl #else
     60   1.1      fvdl 
     61   1.1      fvdl #include <machine/atomic.h>
     62   1.1      fvdl 
     63  1.11     perry static __inline void __cpu_simple_lock_init(__cpu_simple_lock_t *)
     64   1.1      fvdl 	__attribute__((__unused__));
     65  1.11     perry static __inline void __cpu_simple_lock(__cpu_simple_lock_t *)
     66   1.1      fvdl 	__attribute__((__unused__));
     67  1.11     perry static __inline int __cpu_simple_lock_try(__cpu_simple_lock_t *)
     68   1.1      fvdl 	__attribute__((__unused__));
     69  1.11     perry static __inline void __cpu_simple_unlock(__cpu_simple_lock_t *)
     70   1.1      fvdl 	__attribute__((__unused__));
     71   1.1      fvdl 
     72  1.11     perry static __inline void
     73   1.1      fvdl __cpu_simple_lock_init(__cpu_simple_lock_t *lockp)
     74   1.1      fvdl {
     75   1.1      fvdl 
     76   1.1      fvdl 	*lockp = __SIMPLELOCK_UNLOCKED;
     77   1.7      yamt 	__insn_barrier();
     78   1.1      fvdl }
     79   1.1      fvdl 
     80  1.11     perry static __inline void
     81   1.1      fvdl __cpu_simple_lock(__cpu_simple_lock_t *lockp)
     82   1.1      fvdl {
     83   1.1      fvdl 
     84  1.13        ad 	while (x86_atomic_testset_b(lockp, __SIMPLELOCK_LOCKED)
     85   1.6      yamt 	    != __SIMPLELOCK_UNLOCKED) {
     86   1.6      yamt 		do {
     87   1.6      yamt 			x86_pause();
     88   1.6      yamt 		} while (*lockp == __SIMPLELOCK_LOCKED);
     89   1.6      yamt 	}
     90   1.7      yamt 	__insn_barrier();
     91   1.1      fvdl }
     92   1.1      fvdl 
     93  1.11     perry static __inline int
     94   1.1      fvdl __cpu_simple_lock_try(__cpu_simple_lock_t *lockp)
     95   1.1      fvdl {
     96  1.13        ad 	int r = (x86_atomic_testset_b(lockp, __SIMPLELOCK_LOCKED)
     97   1.1      fvdl 	    == __SIMPLELOCK_UNLOCKED);
     98   1.1      fvdl 
     99   1.7      yamt 	__insn_barrier();
    100   1.1      fvdl 
    101   1.1      fvdl 	return (r);
    102   1.1      fvdl }
    103   1.1      fvdl 
    104  1.12        ad /*
    105  1.12        ad  * Note on x86 memory ordering
    106  1.12        ad  *
    107  1.12        ad  * When releasing a lock we must ensure that no stores or loads from within
    108  1.12        ad  * the critical section are re-ordered by the CPU to occur outside of it:
    109  1.12        ad  * they must have completed and be visible to other processors once the lock
    110  1.12        ad  * has been released.
    111  1.12        ad  *
    112  1.12        ad  * NetBSD usually runs with the kernel mapped (via MTRR) in a WB (write
    113  1.12        ad  * back) memory region.  In that case, memory ordering on x86 platforms
    114  1.12        ad  * looks like this:
    115  1.12        ad  *
    116  1.12        ad  * i386		All loads/stores occur in instruction sequence.
    117  1.12        ad  *
    118  1.12        ad  * i486		All loads/stores occur in instruction sequence.  In
    119  1.12        ad  * Pentium	exceptional circumstances, loads can be re-ordered around
    120  1.12        ad  *		stores, but for the purposes of releasing a lock it does
    121  1.12        ad  *		not matter.  Stores may not be immediately visible to other
    122  1.12        ad  *		processors as they can be buffered.  However, since the
    123  1.12        ad  *		stores are buffered in order the lock release will always be
    124  1.12        ad  *		the last operation in the critical section that becomes
    125  1.12        ad  *		visible to other CPUs.
    126  1.12        ad  *
    127  1.12        ad  * Pentium Pro	The "Intel 64 and IA-32 Architectures Software Developer's
    128  1.12        ad  * onwards	Manual" volume 3A (order number 248966) says that (1) "Reads
    129  1.12        ad  *		can be carried out speculatively and in any order" and (2)
    130  1.12        ad  *		"Reads can pass buffered stores, but the processor is
    131  1.12        ad  *		self-consistent.".  This would be a problem for the below,
    132  1.12        ad  *		and would mandate a locked instruction cycle or load fence
    133  1.12        ad  *		before releasing the simple lock.
    134  1.12        ad  *
    135  1.12        ad  *		The "Intel Pentium 4 Processor Optimization" guide (order
    136  1.12        ad  *		number 253668-022US) says: "Loads can be moved before stores
    137  1.12        ad  *		that occurred earlier in the program if they are not
    138  1.12        ad  *		predicted to load from the same linear address.".  This is
    139  1.12        ad  *		not a problem since the only loads that can be re-ordered
    140  1.12        ad  *		take place once the lock has been released via a store.
    141  1.12        ad  *
    142  1.12        ad  *		The above two documents seem to contradict each other,
    143  1.12        ad  *		however with the exception of early steppings of the Pentium
    144  1.12        ad  *		Pro, the second document is closer to the truth: a store
    145  1.12        ad  *		will always act as a load fence for all loads that precede
    146  1.12        ad  *		the store in instruction order.
    147  1.12        ad  *
    148  1.12        ad  *		Again, note that stores can be buffered and will not always
    149  1.12        ad  *		become immediately visible to other CPUs: they are however
    150  1.12        ad  *		buffered in order.
    151  1.12        ad  *
    152  1.12        ad  * AMD64	Stores occur in order and are buffered.  Loads can be
    153  1.12        ad  *		reordered, however stores act as load fences, meaning that
    154  1.12        ad  *		loads can not be reordered around stores.
    155  1.12        ad  */
    156  1.11     perry static __inline void
    157   1.1      fvdl __cpu_simple_unlock(__cpu_simple_lock_t *lockp)
    158   1.1      fvdl {
    159   1.1      fvdl 
    160   1.7      yamt 	__insn_barrier();
    161   1.1      fvdl 	*lockp = __SIMPLELOCK_UNLOCKED;
    162   1.1      fvdl }
    163   1.1      fvdl 
    164   1.1      fvdl #endif /* !LOCKDEBUG */
    165   1.4      yamt 
    166  1.13        ad #define	SPINLOCK_SPIN_HOOK	/* nothing */
    167  1.13        ad #define	SPINLOCK_BACKOFF_HOOK	x86_pause()
    168  1.13        ad 
    169   1.4      yamt #ifdef _KERNEL
    170  1.13        ad void	mb_read(void);
    171  1.13        ad void	mb_write(void);
    172  1.13        ad void	mb_memory(void);
    173  1.13        ad #else	/* _KERNEL */
    174  1.13        ad static inline void
    175  1.13        ad mb_read(void)
    176  1.13        ad {
    177  1.13        ad 	x86_lfence();
    178  1.13        ad }
    179  1.13        ad 
    180  1.13        ad static inline void
    181  1.13        ad mb_write(void)
    182  1.13        ad {
    183  1.13        ad 	__insn_barrier();
    184  1.13        ad }
    185  1.13        ad 
    186  1.13        ad static inline void
    187  1.13        ad mb_memory(void)
    188  1.13        ad {
    189  1.13        ad 	x86_mfence();
    190  1.13        ad }
    191  1.13        ad #endif	/* _KERNEL */
    192   1.1      fvdl 
    193   1.9      yamt #endif /* _X86_LOCK_H_ */
    194