1 1.29 riastrad /* $NetBSD: lock.h,v 1.29 2022/02/12 17:17:54 riastradh Exp $ */ 2 1.1 fvdl 3 1.1 fvdl /*- 4 1.12 ad * Copyright (c) 2000, 2006 The NetBSD Foundation, Inc. 5 1.1 fvdl * All rights reserved. 6 1.1 fvdl * 7 1.1 fvdl * This code is derived from software contributed to The NetBSD Foundation 8 1.12 ad * by Jason R. Thorpe and Andrew Doran. 9 1.1 fvdl * 10 1.1 fvdl * Redistribution and use in source and binary forms, with or without 11 1.1 fvdl * modification, are permitted provided that the following conditions 12 1.1 fvdl * are met: 13 1.1 fvdl * 1. Redistributions of source code must retain the above copyright 14 1.1 fvdl * notice, this list of conditions and the following disclaimer. 15 1.1 fvdl * 2. Redistributions in binary form must reproduce the above copyright 16 1.1 fvdl * notice, this list of conditions and the following disclaimer in the 17 1.1 fvdl * documentation and/or other materials provided with the distribution. 18 1.1 fvdl * 19 1.1 fvdl * THIS SOFTWARE IS PROVIDED BY THE NETBSD FOUNDATION, INC. AND CONTRIBUTORS 20 1.1 fvdl * ``AS IS'' AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED 21 1.1 fvdl * TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR 22 1.1 fvdl * PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE FOUNDATION OR CONTRIBUTORS 23 1.1 fvdl * BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR 24 1.1 fvdl * CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF 25 1.1 fvdl * SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS 26 1.1 fvdl * INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN 27 1.1 fvdl * CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) 28 1.1 fvdl * ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE 29 1.1 fvdl * POSSIBILITY OF SUCH DAMAGE. 30 1.1 fvdl */ 31 1.1 fvdl 32 1.1 fvdl /* 33 1.1 fvdl * Machine-dependent spin lock operations. 34 1.1 fvdl */ 35 1.1 fvdl 36 1.9 yamt #ifndef _X86_LOCK_H_ 37 1.9 yamt #define _X86_LOCK_H_ 38 1.1 fvdl 39 1.25 pooka #include <sys/param.h> 40 1.25 pooka 41 1.15 skrll static __inline int 42 1.28 christos __SIMPLELOCK_LOCKED_P(const __cpu_simple_lock_t *__ptr) 43 1.15 skrll { 44 1.15 skrll return *__ptr == __SIMPLELOCK_LOCKED; 45 1.15 skrll } 46 1.15 skrll 47 1.15 skrll static __inline int 48 1.28 christos __SIMPLELOCK_UNLOCKED_P(const __cpu_simple_lock_t *__ptr) 49 1.15 skrll { 50 1.15 skrll return *__ptr == __SIMPLELOCK_UNLOCKED; 51 1.15 skrll } 52 1.15 skrll 53 1.16 skrll static __inline void 54 1.16 skrll __cpu_simple_lock_set(__cpu_simple_lock_t *__ptr) 55 1.16 skrll { 56 1.16 skrll 57 1.16 skrll *__ptr = __SIMPLELOCK_LOCKED; 58 1.16 skrll } 59 1.16 skrll 60 1.16 skrll static __inline void 61 1.16 skrll __cpu_simple_lock_clear(__cpu_simple_lock_t *__ptr) 62 1.16 skrll { 63 1.16 skrll 64 1.16 skrll *__ptr = __SIMPLELOCK_UNLOCKED; 65 1.16 skrll } 66 1.16 skrll 67 1.25 pooka #ifdef _HARDKERNEL 68 1.27 christos # include <machine/cpufunc.h> 69 1.27 christos # define SPINLOCK_SPIN_HOOK /* nothing */ 70 1.27 christos # ifdef SPINLOCK_BACKOFF_HOOK 71 1.27 christos # undef SPINLOCK_BACKOFF_HOOK 72 1.27 christos # endif 73 1.27 christos # define SPINLOCK_BACKOFF_HOOK x86_pause() 74 1.27 christos # define SPINLOCK_INLINE 75 1.27 christos #else /* !_HARDKERNEL */ 76 1.27 christos # define SPINLOCK_BODY 77 1.27 christos # define SPINLOCK_INLINE static __inline __unused 78 1.27 christos #endif /* _HARDKERNEL */ 79 1.27 christos 80 1.27 christos SPINLOCK_INLINE void __cpu_simple_lock_init(__cpu_simple_lock_t *); 81 1.27 christos SPINLOCK_INLINE void __cpu_simple_lock(__cpu_simple_lock_t *); 82 1.27 christos SPINLOCK_INLINE int __cpu_simple_lock_try(__cpu_simple_lock_t *); 83 1.27 christos SPINLOCK_INLINE void __cpu_simple_unlock(__cpu_simple_lock_t *); 84 1.20 ad 85 1.27 christos #ifdef SPINLOCK_BODY 86 1.27 christos SPINLOCK_INLINE void 87 1.1 fvdl __cpu_simple_lock_init(__cpu_simple_lock_t *lockp) 88 1.1 fvdl { 89 1.1 fvdl 90 1.1 fvdl *lockp = __SIMPLELOCK_UNLOCKED; 91 1.1 fvdl } 92 1.1 fvdl 93 1.27 christos SPINLOCK_INLINE int 94 1.20 ad __cpu_simple_lock_try(__cpu_simple_lock_t *lockp) 95 1.1 fvdl { 96 1.20 ad uint8_t val; 97 1.1 fvdl 98 1.20 ad val = __SIMPLELOCK_LOCKED; 99 1.20 ad __asm volatile ("xchgb %0,(%2)" : 100 1.26 apb "=qQ" (val) 101 1.20 ad :"0" (val), "r" (lockp)); 102 1.7 yamt __insn_barrier(); 103 1.20 ad return val == __SIMPLELOCK_UNLOCKED; 104 1.1 fvdl } 105 1.1 fvdl 106 1.27 christos SPINLOCK_INLINE void 107 1.20 ad __cpu_simple_lock(__cpu_simple_lock_t *lockp) 108 1.1 fvdl { 109 1.1 fvdl 110 1.20 ad while (!__cpu_simple_lock_try(lockp)) 111 1.20 ad /* nothing */; 112 1.7 yamt __insn_barrier(); 113 1.1 fvdl } 114 1.1 fvdl 115 1.12 ad /* 116 1.12 ad * Note on x86 memory ordering 117 1.12 ad * 118 1.12 ad * When releasing a lock we must ensure that no stores or loads from within 119 1.12 ad * the critical section are re-ordered by the CPU to occur outside of it: 120 1.12 ad * they must have completed and be visible to other processors once the lock 121 1.12 ad * has been released. 122 1.12 ad * 123 1.12 ad * NetBSD usually runs with the kernel mapped (via MTRR) in a WB (write 124 1.12 ad * back) memory region. In that case, memory ordering on x86 platforms 125 1.12 ad * looks like this: 126 1.12 ad * 127 1.12 ad * i386 All loads/stores occur in instruction sequence. 128 1.12 ad * 129 1.12 ad * i486 All loads/stores occur in instruction sequence. In 130 1.12 ad * Pentium exceptional circumstances, loads can be re-ordered around 131 1.12 ad * stores, but for the purposes of releasing a lock it does 132 1.12 ad * not matter. Stores may not be immediately visible to other 133 1.12 ad * processors as they can be buffered. However, since the 134 1.12 ad * stores are buffered in order the lock release will always be 135 1.12 ad * the last operation in the critical section that becomes 136 1.12 ad * visible to other CPUs. 137 1.12 ad * 138 1.12 ad * Pentium Pro The "Intel 64 and IA-32 Architectures Software Developer's 139 1.12 ad * onwards Manual" volume 3A (order number 248966) says that (1) "Reads 140 1.12 ad * can be carried out speculatively and in any order" and (2) 141 1.12 ad * "Reads can pass buffered stores, but the processor is 142 1.12 ad * self-consistent.". This would be a problem for the below, 143 1.12 ad * and would mandate a locked instruction cycle or load fence 144 1.12 ad * before releasing the simple lock. 145 1.12 ad * 146 1.12 ad * The "Intel Pentium 4 Processor Optimization" guide (order 147 1.12 ad * number 253668-022US) says: "Loads can be moved before stores 148 1.12 ad * that occurred earlier in the program if they are not 149 1.12 ad * predicted to load from the same linear address.". This is 150 1.12 ad * not a problem since the only loads that can be re-ordered 151 1.12 ad * take place once the lock has been released via a store. 152 1.12 ad * 153 1.12 ad * The above two documents seem to contradict each other, 154 1.12 ad * however with the exception of early steppings of the Pentium 155 1.12 ad * Pro, the second document is closer to the truth: a store 156 1.12 ad * will always act as a load fence for all loads that precede 157 1.12 ad * the store in instruction order. 158 1.12 ad * 159 1.12 ad * Again, note that stores can be buffered and will not always 160 1.12 ad * become immediately visible to other CPUs: they are however 161 1.12 ad * buffered in order. 162 1.12 ad * 163 1.12 ad * AMD64 Stores occur in order and are buffered. Loads can be 164 1.12 ad * reordered, however stores act as load fences, meaning that 165 1.12 ad * loads can not be reordered around stores. 166 1.12 ad */ 167 1.27 christos SPINLOCK_INLINE void 168 1.1 fvdl __cpu_simple_unlock(__cpu_simple_lock_t *lockp) 169 1.1 fvdl { 170 1.1 fvdl 171 1.7 yamt __insn_barrier(); 172 1.1 fvdl *lockp = __SIMPLELOCK_UNLOCKED; 173 1.1 fvdl } 174 1.1 fvdl 175 1.27 christos #endif /* SPINLOCK_BODY */ 176 1.1 fvdl 177 1.9 yamt #endif /* _X86_LOCK_H_ */ 178