lock_stubs.S revision 1.18
11.18Sad/* $NetBSD: lock_stubs.S,v 1.18 2008/05/06 23:03:03 ad Exp $ */ 21.2Sad 31.2Sad/*- 41.13Sad * Copyright (c) 2006, 2007, 2008 The NetBSD Foundation, Inc. 51.2Sad * All rights reserved. 61.2Sad * 71.2Sad * This code is derived from software contributed to The NetBSD Foundation 81.2Sad * by Andrew Doran. 91.2Sad * 101.2Sad * Redistribution and use in source and binary forms, with or without 111.2Sad * modification, are permitted provided that the following conditions 121.2Sad * are met: 131.2Sad * 1. Redistributions of source code must retain the above copyright 141.2Sad * notice, this list of conditions and the following disclaimer. 151.2Sad * 2. Redistributions in binary form must reproduce the above copyright 161.2Sad * notice, this list of conditions and the following disclaimer in the 171.2Sad * documentation and/or other materials provided with the distribution. 181.2Sad * 191.2Sad * THIS SOFTWARE IS PROVIDED BY THE NETBSD FOUNDATION, INC. AND CONTRIBUTORS 201.2Sad * ``AS IS'' AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED 211.2Sad * TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR 221.2Sad * PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE FOUNDATION OR CONTRIBUTORS 231.2Sad * BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR 241.2Sad * CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF 251.2Sad * SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS 261.2Sad * INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN 271.2Sad * CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) 281.2Sad * ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE 291.2Sad * POSSIBILITY OF SUCH DAMAGE. 301.2Sad */ 311.2Sad 321.2Sad/* 331.2Sad * AMD64 lock stubs. Calling convention: 341.2Sad * 351.2Sad * %rdi arg 1 361.2Sad * %rsi arg 2 371.2Sad * %rdx arg 3 381.2Sad * %rax return value 391.2Sad */ 401.2Sad 411.2Sad#include "opt_multiprocessor.h" 421.2Sad#include "opt_lockdebug.h" 431.2Sad 441.2Sad#include <machine/asm.h> 451.8Sbouyer#include <machine/frameasm.h> 461.2Sad 471.2Sad#include "assym.h" 481.2Sad 491.2Sad#if defined(DIAGNOSTIC) || defined(MULTIPROCESSOR) || defined(LOCKDEBUG) 501.2Sad#define FULL 511.2Sad#endif 521.2Sad 531.16Syamt#define ENDLABEL(name,a) .align a; LABEL(name) 541.11Sad#define LOCK(num) .Lpatch/**/num: lock 551.2Sad 561.2Sad#ifndef LOCKDEBUG 571.2Sad 581.2Sad/* 591.2Sad * void mutex_enter(kmutex_t *mtx); 601.2Sad * 611.2Sad * Acquire a mutex and post a load fence. 621.2Sad */ 631.2Sad .align 64 641.2Sad 651.11SadNENTRY(mutex_enter) 661.2Sad movq CPUVAR(CURLWP), %rcx 671.2Sad xorq %rax, %rax 681.11Sad LOCK(1) 691.2Sad cmpxchgq %rcx, MTX_OWNER(%rdi) 701.14Sad jnz 1f 711.2Sad ret 721.14Sad1: 731.14Sad jmp _C_LABEL(mutex_vector_enter) 741.2Sad 751.2Sad/* 761.2Sad * void mutex_exit(kmutex_t *mtx); 771.2Sad * 781.2Sad * Release a mutex and post a load fence. 791.2Sad * 801.2Sad * See comments in mutex_vector_enter() about doing this operation unlocked 811.2Sad * on multiprocessor systems, and comments in arch/x86/include/lock.h about 821.2Sad * memory ordering on Intel x86 systems. 831.2Sad */ 841.11SadNENTRY(mutex_exit) 851.2Sad movq CPUVAR(CURLWP), %rax 861.2Sad xorq %rdx, %rdx 871.2Sad cmpxchgq %rdx, MTX_OWNER(%rdi) 881.14Sad jnz 1f 891.2Sad ret 901.14Sad1: 911.14Sad jmp _C_LABEL(mutex_vector_exit) 921.2Sad 931.2Sad/* 941.2Sad * void mutex_spin_enter(kmutex_t *mtx); 951.2Sad * 961.2Sad * Acquire a spin mutex and post a load fence. 971.2Sad */ 981.4SadNENTRY(mutex_spin_enter) 991.2Sad#if defined(FULL) 1001.2Sad movl $0x0100, %eax /* new + expected value */ 1011.2Sad#endif 1021.14Sad movl CPUVAR(ILEVEL), %esi 1031.2Sad movzbl MTX_IPL(%rdi), %ecx /* new SPL */ 1041.2Sad cmpl %ecx, %esi /* higher? */ 1051.2Sad cmovgl %esi, %ecx 1061.14Sad movl %ecx, CPUVAR(ILEVEL) /* splraiseipl() */ 1071.14Sad subl $1, CPUVAR(MTX_COUNT) /* decl doesnt set CF */ 1081.14Sad cmovncl CPUVAR(MTX_OLDSPL), %esi 1091.14Sad movl %esi, CPUVAR(MTX_OLDSPL) 1101.2Sad#if defined(FULL) 1111.11Sad LOCK(11) 1121.2Sad cmpxchgb %ah, MTX_LOCK(%rdi) /* lock */ 1131.14Sad jnz 1f 1141.2Sad#endif 1151.2Sad ret 1161.14Sad1: 1171.14Sad jmp _C_LABEL(mutex_spin_retry) /* failed; hard case */ 1181.2Sad 1191.2Sad/* 1201.2Sad * void mutex_spin_exit(kmutex_t *mtx); 1211.2Sad * 1221.2Sad * Release a spin mutex and post a load fence. 1231.2Sad */ 1241.4SadNENTRY(mutex_spin_exit) 1251.2Sad#ifdef DIAGNOSTIC 1261.2Sad 1271.2Sad movl $0x0001, %eax /* new + expected value */ 1281.4Sad movq CPUVAR(SELF), %r8 1291.2Sad cmpxchgb %ah, MTX_LOCK(%rdi) /* unlock */ 1301.2Sad jnz,pn _C_LABEL(mutex_vector_exit) /* hard case if problems */ 1311.4Sad movl CPU_INFO_MTX_OLDSPL(%r8), %edi 1321.4Sad incl CPU_INFO_MTX_COUNT(%r8) 1331.2Sad jnz 1f 1341.4Sad cmpl CPU_INFO_ILEVEL(%r8), %edi 1351.2Sad jae 1f 1361.4Sad movl CPU_INFO_IUNMASK(%r8,%rdi,4), %esi 1371.12Sdsl CLI(ax) 1381.4Sad testl CPU_INFO_IPENDING(%r8), %esi 1391.2Sad jnz _C_LABEL(Xspllower) 1401.4Sad movl %edi, CPU_INFO_ILEVEL(%r8) 1411.12Sdsl STI(ax) 1421.2Sad1: rep /* double byte ret as branch */ 1431.2Sad ret /* target: see AMD docs */ 1441.2Sad 1451.2Sad#else /* DIAGNOSTIC */ 1461.2Sad 1471.4Sad movq CPUVAR(SELF), %rsi 1481.2Sad#ifdef MULTIPROCESSOR 1491.2Sad movb $0x00, MTX_LOCK(%rdi) 1501.2Sad#endif 1511.4Sad movl CPU_INFO_MTX_OLDSPL(%rsi), %ecx 1521.4Sad incl CPU_INFO_MTX_COUNT(%rsi) 1531.4Sad movl CPU_INFO_ILEVEL(%rsi),%edx 1541.2Sad cmovnzl %edx,%ecx 1551.2Sad cmpl %edx,%ecx /* new level is lower? */ 1561.2Sad pushq %rbx 1571.2Sad jae,pn 2f 1581.2Sad1: 1591.4Sad movl CPU_INFO_IPENDING(%rsi),%eax 1601.4Sad testl %eax,CPU_INFO_IUNMASK(%rsi,%rcx,4)/* deferred interrupts? */ 1611.2Sad movl %eax,%ebx 1621.2Sad jnz,pn 3f 1631.4Sad cmpxchg8b CPU_INFO_ISTATE(%rsi) /* swap in new ilevel */ 1641.3Syamt jnz,pn 1b 1651.2Sad2: 1661.2Sad popq %rbx 1671.2Sad ret 1681.2Sad3: 1691.2Sad popq %rbx 1701.2Sad movl %ecx, %edi 1711.2Sad jmp _C_LABEL(Xspllower) 1721.2Sad 1731.2Sad#endif /* DIAGNOSTIC */ 1741.2Sad 1751.2Sad/* 1761.2Sad * void rw_enter(krwlock_t *rwl, krw_t op); 1771.2Sad * 1781.2Sad * Acquire one hold on a RW lock. 1791.2Sad */ 1801.11SadNENTRY(rw_enter) 1811.2Sad cmpl $RW_READER, %esi 1821.2Sad jne 2f 1831.2Sad 1841.2Sad /* 1851.2Sad * Reader: this is the most common case. 1861.2Sad */ 1871.2Sad1: movq RW_OWNER(%rdi), %rax 1881.2Sad testb $(RW_WRITE_LOCKED|RW_WRITE_WANTED), %al 1891.2Sad leaq RW_READ_INCR(%rax), %rdx 1901.14Sad jnz 3f 1911.11Sad LOCK(2) 1921.2Sad cmpxchgq %rdx, RW_OWNER(%rdi) 1931.2Sad jnz,pn 1b 1941.2Sad ret 1951.2Sad 1961.2Sad /* 1971.2Sad * Writer: if the compare-and-set fails, don't bother retrying. 1981.2Sad */ 1991.2Sad2: movq CPUVAR(CURLWP), %rcx 2001.2Sad xorq %rax, %rax 2011.2Sad orq $RW_WRITE_LOCKED, %rcx 2021.11Sad LOCK(3) 2031.2Sad cmpxchgq %rcx, RW_OWNER(%rdi) 2041.14Sad jnz 3f 2051.2Sad ret 2061.14Sad3: 2071.14Sad jmp _C_LABEL(rw_vector_enter) 2081.2Sad 2091.2Sad/* 2101.2Sad * void rw_exit(krwlock_t *rwl); 2111.2Sad * 2121.2Sad * Release one hold on a RW lock. 2131.2Sad */ 2141.11SadNENTRY(rw_exit) 2151.2Sad movq RW_OWNER(%rdi), %rax 2161.2Sad testb $RW_WRITE_LOCKED, %al 2171.2Sad jnz 2f 2181.2Sad 2191.2Sad /* 2201.2Sad * Reader 2211.2Sad */ 2221.2Sad1: testb $RW_HAS_WAITERS, %al 2231.14Sad jnz 3f 2241.2Sad cmpq $RW_READ_INCR, %rax 2251.2Sad leaq -RW_READ_INCR(%rax), %rdx 2261.14Sad jb 3f 2271.11Sad LOCK(4) 2281.2Sad cmpxchgq %rdx, RW_OWNER(%rdi) 2291.2Sad jnz,pn 1b 2301.2Sad ret 2311.2Sad 2321.2Sad /* 2331.2Sad * Writer 2341.2Sad */ 2351.2Sad2: leaq -RW_WRITE_LOCKED(%rax), %rdx 2361.2Sad subq CPUVAR(CURLWP), %rdx 2371.14Sad jnz 3f 2381.11Sad LOCK(5) 2391.2Sad cmpxchgq %rdx, RW_OWNER(%rdi) 2401.2Sad jnz 3f 2411.2Sad ret 2421.2Sad 2431.2Sad3: jmp _C_LABEL(rw_vector_exit) 2441.2Sad 2451.13Sad/* 2461.13Sad * int rw_tryenter(krwlock_t *rwl, krw_t op); 2471.13Sad * 2481.13Sad * Try to acquire one hold on a RW lock. 2491.13Sad */ 2501.13SadNENTRY(rw_tryenter) 2511.13Sad cmpl $RW_READER, %esi 2521.13Sad jne 2f 2531.13Sad 2541.13Sad /* 2551.13Sad * Reader: this is the most common case. 2561.13Sad */ 2571.17Sad movq RW_OWNER(%rdi), %rax 2581.17Sad1: 2591.13Sad testb $(RW_WRITE_LOCKED|RW_WRITE_WANTED), %al 2601.13Sad leaq RW_READ_INCR(%rax), %rdx 2611.13Sad jnz 3f 2621.13Sad LOCK(8) 2631.13Sad cmpxchgq %rdx, RW_OWNER(%rdi) 2641.17Sad jnz 1b 2651.17Sad movl %edi, %eax /* nonzero */ 2661.13Sad ret 2671.13Sad 2681.13Sad /* 2691.13Sad * Writer: if the compare-and-set fails, don't bother retrying. 2701.13Sad */ 2711.13Sad2: movq CPUVAR(CURLWP), %rcx 2721.13Sad xorq %rax, %rax 2731.13Sad orq $RW_WRITE_LOCKED, %rcx 2741.13Sad LOCK(9) 2751.13Sad cmpxchgq %rcx, RW_OWNER(%rdi) 2761.18Sad movl $0, %eax 2771.13Sad setz %al 2781.13Sad ret 2791.13Sad 2801.13Sad3: xorl %eax, %eax 2811.13Sad ret 2821.13Sad 2831.2Sad#endif /* LOCKDEBUG */ 2841.2Sad 2851.2Sad/* 2861.11Sad * Spinlocks. 2871.2Sad */ 2881.11SadNENTRY(__cpu_simple_lock_init) 2891.11Sad movb $0, (%rdi) 2901.2Sad ret 2911.2Sad 2921.11SadNENTRY(__cpu_simple_lock) 2931.11Sad movl $0x0100, %eax 2941.11Sad1: 2951.11Sad LOCK(6) 2961.11Sad cmpxchgb %ah, (%rdi) 2971.11Sad jnz 2f 2981.2Sad ret 2991.11Sad2: 3001.11Sad movl $0x0100, %eax 3011.11Sad pause 3021.11Sad nop 3031.7Sad nop 3041.11Sad cmpb $0, (%rdi) 3051.11Sad je 1b 3061.11Sad jmp 2b 3071.11Sad 3081.11SadNENTRY(__cpu_simple_unlock) 3091.11Sad movb $0, (%rdi) 3101.2Sad ret 3111.7Sad 3121.11SadNENTRY(__cpu_simple_lock_try) 3131.11Sad movl $0x0100, %eax 3141.11Sad LOCK(7) 3151.11Sad cmpxchgb %ah, (%rdi) 3161.11Sad movl $0, %eax 3171.11Sad setz %al 3181.2Sad ret 3191.2Sad 3201.2Sad/* 3211.7Sad * Patchpoints to replace with NOP when ncpu == 1. 3221.7Sad */ 3231.7Sad#ifndef LOCKDEBUG 3241.7SadLABEL(x86_lockpatch) 3251.11Sad .quad .Lpatch1, .Lpatch2, .Lpatch3, .Lpatch4 3261.13Sad .quad .Lpatch5, .Lpatch6, .Lpatch7, .Lpatch8 3271.13Sad .quad .Lpatch9 3281.7Sad#ifdef FULL 3291.11Sad .quad .Lpatch11 3301.7Sad#endif 3311.7Sad .quad 0 3321.7Sad#endif 333