Home | History | Annotate | Line # | Download | only in i386
linux_machdep.c revision 1.161
      1  1.161  christos /*	$NetBSD: linux_machdep.c,v 1.161 2015/12/08 21:27:50 christos Exp $	*/
      2    1.1      fvdl 
      3   1.45      fvdl /*-
      4  1.143        ad  * Copyright (c) 1995, 2000, 2008, 2009 The NetBSD Foundation, Inc.
      5    1.1      fvdl  * All rights reserved.
      6    1.1      fvdl  *
      7   1.45      fvdl  * This code is derived from software contributed to The NetBSD Foundation
      8  1.143        ad  * by Frank van der Linden, and by Andrew Doran.
      9   1.45      fvdl  *
     10    1.1      fvdl  * Redistribution and use in source and binary forms, with or without
     11    1.1      fvdl  * modification, are permitted provided that the following conditions
     12    1.1      fvdl  * are met:
     13    1.1      fvdl  * 1. Redistributions of source code must retain the above copyright
     14    1.1      fvdl  *    notice, this list of conditions and the following disclaimer.
     15    1.1      fvdl  * 2. Redistributions in binary form must reproduce the above copyright
     16    1.1      fvdl  *    notice, this list of conditions and the following disclaimer in the
     17    1.1      fvdl  *    documentation and/or other materials provided with the distribution.
     18    1.1      fvdl  *
     19   1.45      fvdl  * THIS SOFTWARE IS PROVIDED BY THE NETBSD FOUNDATION, INC. AND CONTRIBUTORS
     20   1.45      fvdl  * ``AS IS'' AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED
     21   1.45      fvdl  * TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR
     22   1.45      fvdl  * PURPOSE ARE DISCLAIMED.  IN NO EVENT SHALL THE FOUNDATION OR CONTRIBUTORS
     23   1.45      fvdl  * BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
     24   1.45      fvdl  * CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
     25   1.45      fvdl  * SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS
     26   1.45      fvdl  * INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN
     27   1.45      fvdl  * CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE)
     28   1.45      fvdl  * ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE
     29   1.45      fvdl  * POSSIBILITY OF SUCH DAMAGE.
     30    1.1      fvdl  */
     31   1.68     lukem 
     32   1.68     lukem #include <sys/cdefs.h>
     33  1.161  christos __KERNEL_RCSID(0, "$NetBSD: linux_machdep.c,v 1.161 2015/12/08 21:27:50 christos Exp $");
     34   1.35   thorpej 
     35   1.63       mrg #if defined(_KERNEL_OPT)
     36   1.35   thorpej #include "opt_vm86.h"
     37   1.36   thorpej #include "opt_user_ldt.h"
     38   1.51  jdolecek #endif
     39    1.1      fvdl 
     40    1.1      fvdl #include <sys/param.h>
     41    1.1      fvdl #include <sys/systm.h>
     42    1.1      fvdl #include <sys/signalvar.h>
     43    1.1      fvdl #include <sys/kernel.h>
     44    1.1      fvdl #include <sys/proc.h>
     45    1.1      fvdl #include <sys/buf.h>
     46    1.1      fvdl #include <sys/reboot.h>
     47    1.1      fvdl #include <sys/conf.h>
     48   1.31   thorpej #include <sys/exec.h>
     49    1.1      fvdl #include <sys/file.h>
     50    1.1      fvdl #include <sys/callout.h>
     51    1.1      fvdl #include <sys/mbuf.h>
     52    1.1      fvdl #include <sys/msgbuf.h>
     53    1.1      fvdl #include <sys/mount.h>
     54    1.1      fvdl #include <sys/vnode.h>
     55    1.1      fvdl #include <sys/device.h>
     56    1.1      fvdl #include <sys/syscallargs.h>
     57   1.13      fvdl #include <sys/filedesc.h>
     58   1.39   mycroft #include <sys/exec_elf.h>
     59   1.52      fvdl #include <sys/disklabel.h>
     60   1.62      manu #include <sys/ioctl.h>
     61  1.110  christos #include <sys/wait.h>
     62  1.113      elad #include <sys/kauth.h>
     63  1.143        ad #include <sys/kmem.h>
     64  1.113      elad 
     65   1.52      fvdl #include <miscfs/specfs/specdev.h>
     66    1.7   mycroft 
     67   1.44  christos #include <compat/linux/common/linux_types.h>
     68   1.44  christos #include <compat/linux/common/linux_signal.h>
     69   1.44  christos #include <compat/linux/common/linux_util.h>
     70   1.44  christos #include <compat/linux/common/linux_ioctl.h>
     71   1.52      fvdl #include <compat/linux/common/linux_hdio.h>
     72   1.44  christos #include <compat/linux/common/linux_exec.h>
     73   1.44  christos #include <compat/linux/common/linux_machdep.h>
     74   1.98  jdolecek #include <compat/linux/common/linux_errno.h>
     75   1.44  christos 
     76    1.1      fvdl #include <compat/linux/linux_syscallargs.h>
     77    1.1      fvdl 
     78  1.130        ad #include <sys/cpu.h>
     79    1.1      fvdl #include <machine/cpufunc.h>
     80    1.1      fvdl #include <machine/psl.h>
     81    1.1      fvdl #include <machine/reg.h>
     82    1.7   mycroft #include <machine/segments.h>
     83    1.1      fvdl #include <machine/specialreg.h>
     84    1.7   mycroft #include <machine/sysarch.h>
     85   1.26   mycroft #include <machine/vm86.h>
     86   1.34   mycroft #include <machine/vmparam.h>
     87    1.1      fvdl 
     88  1.158       dsl #include <x86/fpu.h>
     89  1.158       dsl 
     90    1.1      fvdl /*
     91   1.50     veego  * To see whether wscons is configured (for virtual console ioctl calls).
     92   1.13      fvdl  */
     93   1.63       mrg #if defined(_KERNEL_OPT)
     94   1.41  drochner #include "wsdisplay.h"
     95   1.51  jdolecek #endif
     96   1.41  drochner #if (NWSDISPLAY > 0)
     97   1.52      fvdl #include <dev/wscons/wsconsio.h>
     98   1.41  drochner #include <dev/wscons/wsdisplay_usl_io.h>
     99   1.63       mrg #if defined(_KERNEL_OPT)
    100   1.41  drochner #include "opt_xserver.h"
    101   1.51  jdolecek #endif
    102   1.41  drochner #endif
    103   1.41  drochner 
    104   1.72  christos #ifdef DEBUG_LINUX
    105   1.72  christos #define DPRINTF(a) uprintf a
    106   1.72  christos #else
    107   1.72  christos #define DPRINTF(a)
    108   1.72  christos #endif
    109   1.72  christos 
    110  1.131       dsl static struct biosdisk_info *fd2biosinfo(struct proc *, struct file *);
    111  1.103   thorpej extern struct disklist *x86_alldisks;
    112  1.131       dsl static void linux_save_ucontext(struct lwp *, struct trapframe *,
    113  1.131       dsl     const sigset_t *, struct sigaltstack *, struct linux_ucontext *);
    114  1.131       dsl static void linux_save_sigcontext(struct lwp *, struct trapframe *,
    115  1.131       dsl     const sigset_t *, struct linux_sigcontext *);
    116  1.131       dsl static int linux_restore_sigcontext(struct lwp *,
    117  1.131       dsl     struct linux_sigcontext *, register_t *);
    118  1.131       dsl static void linux_rt_sendsig(const ksiginfo_t *, const sigset_t *);
    119  1.131       dsl static void linux_old_sendsig(const ksiginfo_t *, const sigset_t *);
    120   1.52      fvdl 
    121   1.83  christos extern char linux_sigcode[], linux_rt_sigcode[];
    122  1.149       chs 
    123   1.13      fvdl /*
    124    1.1      fvdl  * Deal with some i386-specific things in the Linux emulation code.
    125    1.1      fvdl  */
    126   1.37   mycroft 
    127   1.37   mycroft void
    128  1.149       chs linux_setregs(struct lwp *l, struct exec_package *epp, vaddr_t stack)
    129   1.37   mycroft {
    130   1.73  christos 	struct trapframe *tf;
    131   1.73  christos 
    132   1.73  christos #ifdef USER_LDT
    133   1.85   thorpej 	pmap_ldt_cleanup(l);
    134   1.73  christos #endif
    135   1.37   mycroft 
    136  1.157       dsl 	fpu_save_area_clear(l, __Linux_NPXCW__);
    137   1.73  christos 
    138   1.85   thorpej 	tf = l->l_md.md_regs;
    139  1.149       chs 	tf->tf_gs = 0;
    140   1.73  christos 	tf->tf_fs = GSEL(GUDATA_SEL, SEL_UPL);
    141   1.73  christos 	tf->tf_es = GSEL(GUDATA_SEL, SEL_UPL);
    142   1.73  christos 	tf->tf_ds = GSEL(GUDATA_SEL, SEL_UPL);
    143   1.73  christos 	tf->tf_edi = 0;
    144   1.73  christos 	tf->tf_esi = 0;
    145   1.73  christos 	tf->tf_ebp = 0;
    146  1.150     joerg 	tf->tf_ebx = l->l_proc->p_psstrp;
    147   1.73  christos 	tf->tf_edx = 0;
    148   1.73  christos 	tf->tf_ecx = 0;
    149   1.73  christos 	tf->tf_eax = 0;
    150   1.73  christos 	tf->tf_eip = epp->ep_entry;
    151   1.95       chs 	tf->tf_cs = GSEL(GUCODEBIG_SEL, SEL_UPL);
    152   1.73  christos 	tf->tf_eflags = PSL_USERSET;
    153   1.73  christos 	tf->tf_esp = stack;
    154   1.73  christos 	tf->tf_ss = GSEL(GUDATA_SEL, SEL_UPL);
    155   1.37   mycroft }
    156    1.1      fvdl 
    157    1.1      fvdl /*
    158    1.1      fvdl  * Send an interrupt to process.
    159    1.1      fvdl  *
    160    1.1      fvdl  * Stack is set up to allow sigcode stored
    161    1.1      fvdl  * in u. to call routine, followed by kcall
    162    1.1      fvdl  * to sigreturn routine below.  After sigreturn
    163    1.1      fvdl  * resets the signal mask, the stack, and the
    164    1.1      fvdl  * frame pointer, it returns to the user
    165    1.1      fvdl  * specified pc, psl.
    166    1.1      fvdl  */
    167    1.1      fvdl 
    168    1.1      fvdl void
    169   1.99  christos linux_sendsig(const ksiginfo_t *ksi, const sigset_t *mask)
    170    1.1      fvdl {
    171   1.96  christos 	if (SIGACTION(curproc, ksi->ksi_signo).sa_flags & SA_SIGINFO)
    172   1.97  christos 		linux_rt_sendsig(ksi, mask);
    173   1.83  christos 	else
    174   1.97  christos 		linux_old_sendsig(ksi, mask);
    175   1.83  christos }
    176   1.83  christos 
    177   1.83  christos 
    178   1.83  christos static void
    179  1.132       dsl linux_save_ucontext(struct lwp *l, struct trapframe *tf, const sigset_t *mask, struct sigaltstack *sas, struct linux_ucontext *uc)
    180   1.90  christos {
    181   1.90  christos 	uc->uc_flags = 0;
    182   1.90  christos 	uc->uc_link = NULL;
    183   1.90  christos 	native_to_linux_sigaltstack(&uc->uc_stack, sas);
    184   1.90  christos 	linux_save_sigcontext(l, tf, mask, &uc->uc_mcontext);
    185   1.90  christos 	native_to_linux_sigset(&uc->uc_sigmask, mask);
    186   1.90  christos 	(void)memset(&uc->uc_fpregs_mem, 0, sizeof(uc->uc_fpregs_mem));
    187   1.90  christos }
    188   1.90  christos 
    189   1.90  christos static void
    190  1.146     rmind linux_save_sigcontext(struct lwp *l, struct trapframe *tf,
    191  1.146     rmind     const sigset_t *mask, struct linux_sigcontext *sc)
    192   1.83  christos {
    193  1.146     rmind 	struct pcb *pcb = lwp_getpcb(l);
    194  1.146     rmind 
    195   1.83  christos 	/* Save register context. */
    196   1.83  christos #ifdef VM86
    197   1.83  christos 	if (tf->tf_eflags & PSL_VM) {
    198   1.83  christos 		sc->sc_gs = tf->tf_vm86_gs;
    199   1.83  christos 		sc->sc_fs = tf->tf_vm86_fs;
    200   1.83  christos 		sc->sc_es = tf->tf_vm86_es;
    201   1.83  christos 		sc->sc_ds = tf->tf_vm86_ds;
    202   1.85   thorpej 		sc->sc_eflags = get_vflags(l);
    203   1.83  christos 	} else
    204   1.83  christos #endif
    205   1.83  christos 	{
    206   1.83  christos 		sc->sc_gs = tf->tf_gs;
    207  1.106     perry 		sc->sc_fs = tf->tf_fs;
    208   1.83  christos 		sc->sc_es = tf->tf_es;
    209   1.83  christos 		sc->sc_ds = tf->tf_ds;
    210   1.83  christos 		sc->sc_eflags = tf->tf_eflags;
    211   1.83  christos 	}
    212   1.83  christos 	sc->sc_edi = tf->tf_edi;
    213   1.83  christos 	sc->sc_esi = tf->tf_esi;
    214   1.83  christos 	sc->sc_esp = tf->tf_esp;
    215   1.83  christos 	sc->sc_ebp = tf->tf_ebp;
    216   1.83  christos 	sc->sc_ebx = tf->tf_ebx;
    217   1.83  christos 	sc->sc_edx = tf->tf_edx;
    218   1.83  christos 	sc->sc_ecx = tf->tf_ecx;
    219   1.83  christos 	sc->sc_eax = tf->tf_eax;
    220   1.83  christos 	sc->sc_eip = tf->tf_eip;
    221   1.83  christos 	sc->sc_cs = tf->tf_cs;
    222   1.83  christos 	sc->sc_esp_at_signal = tf->tf_esp;
    223   1.83  christos 	sc->sc_ss = tf->tf_ss;
    224   1.83  christos 	sc->sc_err = tf->tf_err;
    225   1.83  christos 	sc->sc_trapno = tf->tf_trapno;
    226  1.146     rmind 	sc->sc_cr2 = pcb->pcb_cr2;
    227   1.83  christos 	sc->sc_387 = NULL;
    228   1.83  christos 
    229   1.83  christos 	/* Save signal stack. */
    230   1.83  christos 	/* Linux doesn't save the onstack flag in sigframe */
    231   1.83  christos 
    232   1.83  christos 	/* Save signal mask. */
    233   1.83  christos 	native_to_linux_old_sigset(&sc->sc_mask, mask);
    234   1.83  christos }
    235   1.83  christos 
    236   1.83  christos static void
    237   1.99  christos linux_rt_sendsig(const ksiginfo_t *ksi, const sigset_t *mask)
    238   1.83  christos {
    239   1.85   thorpej 	struct lwp *l = curlwp;
    240   1.85   thorpej 	struct proc *p = l->l_proc;
    241   1.48  augustss 	struct trapframe *tf;
    242   1.83  christos 	struct linux_rt_sigframe *fp, frame;
    243  1.122        ad 	int onstack, error;
    244   1.98  jdolecek 	int sig = ksi->ksi_signo;
    245   1.78   thorpej 	sig_t catcher = SIGACTION(p, sig).sa_handler;
    246  1.122        ad 	struct sigaltstack *sas = &l->l_sigstk;
    247    1.1      fvdl 
    248   1.85   thorpej 	tf = l->l_md.md_regs;
    249   1.66  jdolecek 	/* Do we need to jump onto the signal stack? */
    250   1.82  christos 	onstack = (sas->ss_flags & (SS_DISABLE | SS_ONSTACK)) == 0 &&
    251   1.66  jdolecek 	    (SIGACTION(p, sig).sa_flags & SA_ONSTACK) != 0;
    252   1.66  jdolecek 
    253   1.83  christos 
    254   1.42   mycroft 	/* Allocate space for the signal handler context. */
    255   1.66  jdolecek 	if (onstack)
    256  1.123  christos 		fp = (struct linux_rt_sigframe *)((char *)sas->ss_sp +
    257   1.83  christos 		    sas->ss_size);
    258   1.66  jdolecek 	else
    259   1.83  christos 		fp = (struct linux_rt_sigframe *)tf->tf_esp;
    260   1.42   mycroft 	fp--;
    261    1.1      fvdl 
    262   1.92  christos 	DPRINTF(("rt: onstack = %d, fp = %p sig = %d eip = 0x%x cr2 = 0x%x\n",
    263  1.146     rmind 	    onstack, fp, sig, tf->tf_eip,
    264  1.146     rmind 	    ((struct pcb *)lwp_getpcb(l))->pcb_cr2));
    265   1.83  christos 
    266   1.42   mycroft 	/* Build stack frame for signal trampoline. */
    267    1.7   mycroft 	frame.sf_handler = catcher;
    268   1.74  christos 	frame.sf_sig = native_to_linux_signo[sig];
    269   1.82  christos 	frame.sf_sip = &fp->sf_si;
    270   1.90  christos 	frame.sf_ucp = &fp->sf_uc;
    271   1.83  christos 
    272   1.82  christos 	/*
    273   1.97  christos 	 * XXX: the following code assumes that the constants for
    274   1.97  christos 	 * siginfo are the same between linux and NetBSD.
    275   1.82  christos 	 */
    276  1.151  christos 	native_to_linux_siginfo(&frame.sf_si, &ksi->ksi_info);
    277    1.1      fvdl 
    278   1.42   mycroft 	/* Save register context. */
    279   1.90  christos 	linux_save_ucontext(l, tf, mask, sas, &frame.sf_uc);
    280  1.122        ad 	sendsig_reset(l, sig);
    281   1.83  christos 
    282  1.135        ad 	mutex_exit(p->p_lock);
    283  1.122        ad 	error = copyout(&frame, fp, sizeof(frame));
    284  1.135        ad 	mutex_enter(p->p_lock);
    285  1.122        ad 
    286  1.122        ad 	if (error != 0) {
    287   1.83  christos 		/*
    288   1.83  christos 		 * Process has trashed its stack; give it an illegal
    289   1.83  christos 		 * instruction to halt it in its tracks.
    290   1.83  christos 		 */
    291   1.85   thorpej 		sigexit(l, SIGILL);
    292   1.83  christos 		/* NOTREACHED */
    293    1.4   mycroft 	}
    294    1.1      fvdl 
    295   1.83  christos 	/*
    296   1.83  christos 	 * Build context to run handler in.
    297   1.83  christos 	 */
    298   1.83  christos 	tf->tf_fs = GSEL(GUDATA_SEL, SEL_UPL);
    299   1.83  christos 	tf->tf_es = GSEL(GUDATA_SEL, SEL_UPL);
    300   1.83  christos 	tf->tf_ds = GSEL(GUDATA_SEL, SEL_UPL);
    301  1.106     perry 	tf->tf_eip = ((int)p->p_sigctx.ps_sigcode) +
    302   1.83  christos 	    (linux_rt_sigcode - linux_sigcode);
    303   1.83  christos 	tf->tf_cs = GSEL(GUCODE_SEL, SEL_UPL);
    304  1.138  christos 	tf->tf_eflags &= ~PSL_CLEARSIG;
    305   1.83  christos 	tf->tf_esp = (int)fp;
    306   1.83  christos 	tf->tf_ss = GSEL(GUDATA_SEL, SEL_UPL);
    307   1.83  christos 
    308   1.83  christos 	/* Remember that we're now on the signal stack. */
    309   1.83  christos 	if (onstack)
    310   1.83  christos 		sas->ss_flags |= SS_ONSTACK;
    311   1.83  christos }
    312   1.83  christos 
    313   1.83  christos static void
    314   1.99  christos linux_old_sendsig(const ksiginfo_t *ksi, const sigset_t *mask)
    315   1.83  christos {
    316   1.85   thorpej 	struct lwp *l = curlwp;
    317   1.85   thorpej 	struct proc *p = l->l_proc;
    318   1.83  christos 	struct trapframe *tf;
    319   1.83  christos 	struct linux_sigframe *fp, frame;
    320  1.122        ad 	int onstack, error;
    321   1.97  christos 	int sig = ksi->ksi_signo;
    322   1.83  christos 	sig_t catcher = SIGACTION(p, sig).sa_handler;
    323  1.122        ad 	struct sigaltstack *sas = &l->l_sigstk;
    324   1.83  christos 
    325   1.85   thorpej 	tf = l->l_md.md_regs;
    326   1.83  christos 
    327   1.83  christos 	/* Do we need to jump onto the signal stack? */
    328   1.83  christos 	onstack = (sas->ss_flags & (SS_DISABLE | SS_ONSTACK)) == 0 &&
    329   1.83  christos 	    (SIGACTION(p, sig).sa_flags & SA_ONSTACK) != 0;
    330   1.83  christos 
    331   1.83  christos 	/* Allocate space for the signal handler context. */
    332   1.83  christos 	if (onstack)
    333  1.123  christos 		fp = (struct linux_sigframe *) ((char *)sas->ss_sp +
    334   1.83  christos 		    sas->ss_size);
    335   1.83  christos 	else
    336   1.83  christos 		fp = (struct linux_sigframe *)tf->tf_esp;
    337   1.83  christos 	fp--;
    338   1.83  christos 
    339   1.92  christos 	DPRINTF(("old: onstack = %d, fp = %p sig = %d eip = 0x%x cr2 = 0x%x\n",
    340  1.146     rmind 	    onstack, fp, sig, tf->tf_eip,
    341  1.146     rmind 	    ((struct pcb *)lwp_getpcb(l))->pcb_cr2));
    342   1.83  christos 
    343   1.83  christos 	/* Build stack frame for signal trampoline. */
    344   1.83  christos 	frame.sf_handler = catcher;
    345   1.83  christos 	frame.sf_sig = native_to_linux_signo[sig];
    346   1.42   mycroft 
    347   1.90  christos 	linux_save_sigcontext(l, tf, mask, &frame.sf_sc);
    348  1.122        ad 	sendsig_reset(l, sig);
    349  1.122        ad 
    350  1.135        ad 	mutex_exit(p->p_lock);
    351  1.122        ad 	error = copyout(&frame, fp, sizeof(frame));
    352  1.135        ad 	mutex_enter(p->p_lock);
    353   1.42   mycroft 
    354  1.122        ad 	if (error != 0) {
    355    1.1      fvdl 		/*
    356    1.1      fvdl 		 * Process has trashed its stack; give it an illegal
    357    1.1      fvdl 		 * instruction to halt it in its tracks.
    358    1.1      fvdl 		 */
    359   1.85   thorpej 		sigexit(l, SIGILL);
    360    1.1      fvdl 		/* NOTREACHED */
    361    1.1      fvdl 	}
    362    1.1      fvdl 
    363    1.1      fvdl 	/*
    364    1.1      fvdl 	 * Build context to run handler in.
    365    1.1      fvdl 	 */
    366   1.75  christos 	tf->tf_fs = GSEL(GUDATA_SEL, SEL_UPL);
    367   1.26   mycroft 	tf->tf_es = GSEL(GUDATA_SEL, SEL_UPL);
    368   1.26   mycroft 	tf->tf_ds = GSEL(GUDATA_SEL, SEL_UPL);
    369   1.56  jdolecek 	tf->tf_eip = (int)p->p_sigctx.ps_sigcode;
    370   1.95       chs 	tf->tf_cs = GSEL(GUCODEBIG_SEL, SEL_UPL);
    371  1.138  christos 	tf->tf_eflags &= ~PSL_CLEARSIG;
    372   1.26   mycroft 	tf->tf_esp = (int)fp;
    373   1.23   mycroft 	tf->tf_ss = GSEL(GUDATA_SEL, SEL_UPL);
    374   1.42   mycroft 
    375   1.42   mycroft 	/* Remember that we're now on the signal stack. */
    376   1.66  jdolecek 	if (onstack)
    377   1.82  christos 		sas->ss_flags |= SS_ONSTACK;
    378    1.1      fvdl }
    379    1.1      fvdl 
    380    1.1      fvdl /*
    381    1.1      fvdl  * System call to cleanup state after a signal
    382    1.1      fvdl  * has been taken.  Reset signal mask and
    383    1.1      fvdl  * stack state from context left by sendsig (above).
    384    1.1      fvdl  * Return to previous pc and psl as specified by
    385    1.1      fvdl  * context left by sendsig. Check carefully to
    386    1.1      fvdl  * make sure that the user has not modified the
    387    1.1      fvdl  * psl to gain improper privileges or to cause
    388    1.1      fvdl  * a machine fault.
    389    1.1      fvdl  */
    390   1.43       erh int
    391  1.133       dsl linux_sys_rt_sigreturn(struct lwp *l, const struct linux_sys_rt_sigreturn_args *uap, register_t *retval)
    392   1.43       erh {
    393  1.133       dsl 	/* {
    394   1.90  christos 		syscallarg(struct linux_ucontext *) ucp;
    395  1.133       dsl 	} */
    396   1.90  christos 	struct linux_ucontext context, *ucp = SCARG(uap, ucp);
    397   1.90  christos 	int error;
    398   1.90  christos 
    399   1.90  christos 	/*
    400   1.90  christos 	 * The trampoline code hands us the context.
    401   1.90  christos 	 * It is unsafe to keep track of it ourselves, in the event that a
    402   1.90  christos 	 * program jumps out of a signal handler.
    403   1.90  christos 	 */
    404   1.90  christos 	if ((error = copyin(ucp, &context, sizeof(*ucp))) != 0)
    405   1.90  christos 		return error;
    406   1.90  christos 
    407   1.90  christos 	/* XXX XAX we can do better here by using more of the ucontext */
    408   1.90  christos 	return linux_restore_sigcontext(l, &context.uc_mcontext, retval);
    409   1.43       erh }
    410   1.43       erh 
    411    1.1      fvdl int
    412  1.133       dsl linux_sys_sigreturn(struct lwp *l, const struct linux_sys_sigreturn_args *uap, register_t *retval)
    413   1.19   thorpej {
    414  1.133       dsl 	/* {
    415    1.1      fvdl 		syscallarg(struct linux_sigcontext *) scp;
    416  1.133       dsl 	} */
    417   1.90  christos 	struct linux_sigcontext context, *scp = SCARG(uap, scp);
    418   1.90  christos 	int error;
    419    1.1      fvdl 
    420    1.1      fvdl 	/*
    421    1.1      fvdl 	 * The trampoline code hands us the context.
    422    1.1      fvdl 	 * It is unsafe to keep track of it ourselves, in the event that a
    423    1.1      fvdl 	 * program jumps out of a signal handler.
    424    1.1      fvdl 	 */
    425  1.123  christos 	if ((error = copyin((void *)scp, &context, sizeof(*scp))) != 0)
    426   1.90  christos 		return error;
    427   1.90  christos 	return linux_restore_sigcontext(l, &context, retval);
    428   1.90  christos }
    429    1.1      fvdl 
    430   1.90  christos static int
    431  1.116  christos linux_restore_sigcontext(struct lwp *l, struct linux_sigcontext *scp,
    432  1.119  christos     register_t *retval)
    433   1.90  christos {
    434   1.90  christos 	struct proc *p = l->l_proc;
    435  1.122        ad 	struct sigaltstack *sas = &l->l_sigstk;
    436   1.90  christos 	struct trapframe *tf;
    437   1.90  christos 	sigset_t mask;
    438   1.90  christos 	ssize_t ss_gap;
    439  1.149       chs 
    440   1.42   mycroft 	/* Restore register context. */
    441   1.85   thorpej 	tf = l->l_md.md_regs;
    442  1.149       chs 	DPRINTF(("sigreturn enter esp=0x%x eip=0x%x\n", tf->tf_esp, tf->tf_eip));
    443   1.83  christos 
    444    1.4   mycroft #ifdef VM86
    445   1.90  christos 	if (scp->sc_eflags & PSL_VM) {
    446  1.131       dsl 		void syscall_vm86(struct trapframe *);
    447   1.83  christos 
    448   1.90  christos 		tf->tf_vm86_gs = scp->sc_gs;
    449   1.90  christos 		tf->tf_vm86_fs = scp->sc_fs;
    450   1.90  christos 		tf->tf_vm86_es = scp->sc_es;
    451   1.90  christos 		tf->tf_vm86_ds = scp->sc_ds;
    452   1.90  christos 		set_vflags(l, scp->sc_eflags);
    453   1.83  christos 		p->p_md.md_syscall = syscall_vm86;
    454    1.4   mycroft 	} else
    455    1.4   mycroft #endif
    456    1.4   mycroft 	{
    457   1.26   mycroft 		/*
    458   1.26   mycroft 		 * Check for security violations.  If we're returning to
    459   1.26   mycroft 		 * protected mode, the CPU will validate the segment registers
    460   1.26   mycroft 		 * automatically and generate a trap on violations.  We handle
    461   1.26   mycroft 		 * the trap, rather than doing all of the checking here.
    462   1.26   mycroft 		 */
    463   1.90  christos 		if (((scp->sc_eflags ^ tf->tf_eflags) & PSL_USERSTATIC) != 0 ||
    464   1.90  christos 		    !USERMODE(scp->sc_cs, scp->sc_eflags))
    465   1.83  christos 			return EINVAL;
    466   1.26   mycroft 
    467   1.90  christos 		tf->tf_gs = scp->sc_gs;
    468   1.90  christos 		tf->tf_fs = scp->sc_fs;
    469   1.90  christos 		tf->tf_es = scp->sc_es;
    470   1.90  christos 		tf->tf_ds = scp->sc_ds;
    471   1.83  christos #ifdef VM86
    472   1.83  christos 		if (tf->tf_eflags & PSL_VM)
    473   1.83  christos 			(*p->p_emul->e_syscall_intern)(p);
    474   1.83  christos #endif
    475   1.90  christos 		tf->tf_eflags = scp->sc_eflags;
    476    1.4   mycroft 	}
    477   1.90  christos 	tf->tf_edi = scp->sc_edi;
    478   1.90  christos 	tf->tf_esi = scp->sc_esi;
    479   1.90  christos 	tf->tf_ebp = scp->sc_ebp;
    480   1.90  christos 	tf->tf_ebx = scp->sc_ebx;
    481   1.90  christos 	tf->tf_edx = scp->sc_edx;
    482   1.90  christos 	tf->tf_ecx = scp->sc_ecx;
    483   1.90  christos 	tf->tf_eax = scp->sc_eax;
    484   1.90  christos 	tf->tf_eip = scp->sc_eip;
    485   1.90  christos 	tf->tf_cs = scp->sc_cs;
    486   1.90  christos 	tf->tf_esp = scp->sc_esp_at_signal;
    487   1.90  christos 	tf->tf_ss = scp->sc_ss;
    488   1.26   mycroft 
    489   1.42   mycroft 	/* Restore signal stack. */
    490   1.66  jdolecek 	/*
    491   1.66  jdolecek 	 * Linux really does it this way; it doesn't have space in sigframe
    492   1.66  jdolecek 	 * to save the onstack flag.
    493   1.66  jdolecek 	 */
    494  1.135        ad 	mutex_enter(p->p_lock);
    495  1.123  christos 	ss_gap = (ssize_t)((char *)scp->sc_esp_at_signal - (char *)sas->ss_sp);
    496   1.82  christos 	if (ss_gap >= 0 && ss_gap < sas->ss_size)
    497   1.82  christos 		sas->ss_flags |= SS_ONSTACK;
    498   1.66  jdolecek 	else
    499   1.82  christos 		sas->ss_flags &= ~SS_ONSTACK;
    500   1.42   mycroft 
    501   1.42   mycroft 	/* Restore signal mask. */
    502   1.90  christos 	linux_old_to_native_sigset(&mask, &scp->sc_mask);
    503  1.122        ad 	(void) sigprocmask1(l, SIG_SETMASK, &mask, 0);
    504  1.135        ad 	mutex_exit(p->p_lock);
    505  1.122        ad 
    506  1.149       chs 	DPRINTF(("sigreturn exit esp=0x%x eip=0x%x\n", tf->tf_esp, tf->tf_eip));
    507   1.83  christos 	return EJUSTRETURN;
    508    1.6   mycroft }
    509    1.6   mycroft 
    510    1.7   mycroft #ifdef USER_LDT
    511    1.7   mycroft 
    512  1.128       dsl static int
    513  1.133       dsl linux_read_ldt(struct lwp *l, const struct linux_sys_modify_ldt_args *uap,
    514  1.128       dsl     register_t *retval)
    515    1.7   mycroft {
    516  1.124        ad 	struct x86_get_ldt_args gl;
    517    1.7   mycroft 	int error;
    518  1.128       dsl 	union descriptor *ldt_buf;
    519  1.143        ad 	size_t sz;
    520  1.128       dsl 
    521  1.128       dsl 	/*
    522  1.128       dsl 	 * I've checked the linux code - this function is asymetric with
    523  1.128       dsl 	 * linux_write_ldt, and returns raw ldt entries.
    524  1.128       dsl 	 * NB, the code I saw zerod the spare parts of the user buffer.
    525  1.128       dsl 	 */
    526    1.7   mycroft 
    527   1.72  christos 	DPRINTF(("linux_read_ldt!"));
    528  1.128       dsl 
    529  1.143        ad 	sz = 8192 * sizeof(*ldt_buf);
    530  1.143        ad 	ldt_buf = kmem_zalloc(sz, KM_SLEEP);
    531    1.7   mycroft 	gl.start = 0;
    532  1.128       dsl 	gl.desc = NULL;
    533    1.7   mycroft 	gl.num = SCARG(uap, bytecount) / sizeof(union descriptor);
    534  1.128       dsl 	error = x86_get_ldt1(l, &gl, ldt_buf);
    535  1.128       dsl 	/* NB gl.num might have changed */
    536  1.128       dsl 	if (error == 0) {
    537  1.128       dsl 		*retval = gl.num * sizeof *ldt;
    538  1.128       dsl 		error = copyout(ldt_buf, SCARG(uap, ptr),
    539  1.128       dsl 		    gl.num * sizeof *ldt_buf);
    540  1.128       dsl 	}
    541  1.143        ad 	kmem_free(ldt_buf, sz);
    542    1.7   mycroft 
    543  1.128       dsl 	return error;
    544    1.7   mycroft }
    545    1.7   mycroft 
    546    1.7   mycroft struct linux_ldt_info {
    547    1.7   mycroft 	u_int entry_number;
    548    1.7   mycroft 	u_long base_addr;
    549    1.7   mycroft 	u_int limit;
    550    1.7   mycroft 	u_int seg_32bit:1;
    551    1.7   mycroft 	u_int contents:2;
    552    1.7   mycroft 	u_int read_exec_only:1;
    553    1.7   mycroft 	u_int limit_in_pages:1;
    554    1.7   mycroft 	u_int seg_not_present:1;
    555   1.72  christos 	u_int useable:1;
    556    1.7   mycroft };
    557    1.7   mycroft 
    558  1.128       dsl static int
    559  1.133       dsl linux_write_ldt(struct lwp *l, const struct linux_sys_modify_ldt_args *uap,
    560  1.128       dsl     int oldmode)
    561    1.7   mycroft {
    562    1.7   mycroft 	struct linux_ldt_info ldt_info;
    563  1.128       dsl 	union descriptor d;
    564  1.124        ad 	struct x86_set_ldt_args sl;
    565    1.7   mycroft 	int error;
    566    1.7   mycroft 
    567   1.72  christos 	DPRINTF(("linux_write_ldt %d\n", oldmode));
    568    1.7   mycroft 	if (SCARG(uap, bytecount) != sizeof(ldt_info))
    569    1.7   mycroft 		return (EINVAL);
    570   1.29  christos 	if ((error = copyin(SCARG(uap, ptr), &ldt_info, sizeof(ldt_info))) != 0)
    571    1.7   mycroft 		return error;
    572   1.72  christos 	if (ldt_info.entry_number >= 8192)
    573    1.7   mycroft 		return (EINVAL);
    574   1.72  christos 	if (ldt_info.contents == 3) {
    575   1.72  christos 		if (oldmode)
    576   1.72  christos 			return (EINVAL);
    577   1.72  christos 		if (ldt_info.seg_not_present)
    578   1.72  christos 			return (EINVAL);
    579   1.72  christos 	}
    580    1.7   mycroft 
    581   1.72  christos 	if (ldt_info.base_addr == 0 && ldt_info.limit == 0 &&
    582   1.72  christos 	    (oldmode || (ldt_info.contents == 0 &&
    583   1.72  christos 	    ldt_info.read_exec_only == 1 && ldt_info.seg_32bit == 0 &&
    584   1.72  christos 	    ldt_info.limit_in_pages == 0 && ldt_info.seg_not_present == 1 &&
    585   1.72  christos 	    ldt_info.useable == 0))) {
    586   1.70  christos 		/* this means you should zero the ldt */
    587  1.128       dsl 		(void)memset(&d, 0, sizeof(d));
    588   1.70  christos 	} else {
    589  1.128       dsl 		d.sd.sd_lobase = ldt_info.base_addr & 0xffffff;
    590  1.128       dsl 		d.sd.sd_hibase = (ldt_info.base_addr >> 24) & 0xff;
    591  1.128       dsl 		d.sd.sd_lolimit = ldt_info.limit & 0xffff;
    592  1.128       dsl 		d.sd.sd_hilimit = (ldt_info.limit >> 16) & 0xf;
    593  1.128       dsl 		d.sd.sd_type = 16 | (ldt_info.contents << 2) |
    594   1.70  christos 		    (!ldt_info.read_exec_only << 1);
    595  1.128       dsl 		d.sd.sd_dpl = SEL_UPL;
    596  1.128       dsl 		d.sd.sd_p = !ldt_info.seg_not_present;
    597  1.128       dsl 		d.sd.sd_def32 = ldt_info.seg_32bit;
    598  1.128       dsl 		d.sd.sd_gran = ldt_info.limit_in_pages;
    599   1.72  christos 		if (!oldmode)
    600  1.128       dsl 			d.sd.sd_xx = ldt_info.useable;
    601   1.73  christos 		else
    602  1.128       dsl 			d.sd.sd_xx = 0;
    603   1.70  christos 	}
    604    1.7   mycroft 	sl.start = ldt_info.entry_number;
    605  1.147   mbalmer 	sl.desc = NULL;
    606    1.7   mycroft 	sl.num = 1;
    607    1.7   mycroft 
    608   1.72  christos 	DPRINTF(("linux_write_ldt: idx=%d, base=0x%lx, limit=0x%x\n",
    609   1.72  christos 	    ldt_info.entry_number, ldt_info.base_addr, ldt_info.limit));
    610    1.7   mycroft 
    611  1.128       dsl 	return x86_set_ldt1(l, &sl, &d);
    612    1.7   mycroft }
    613    1.7   mycroft 
    614    1.7   mycroft #endif /* USER_LDT */
    615    1.7   mycroft 
    616    1.6   mycroft int
    617  1.133       dsl linux_sys_modify_ldt(struct lwp *l, const struct linux_sys_modify_ldt_args *uap, register_t *retval)
    618   1.19   thorpej {
    619  1.133       dsl 	/* {
    620    1.6   mycroft 		syscallarg(int) func;
    621    1.6   mycroft 		syscallarg(void *) ptr;
    622    1.6   mycroft 		syscallarg(size_t) bytecount;
    623  1.133       dsl 	} */
    624    1.6   mycroft 
    625    1.6   mycroft 	switch (SCARG(uap, func)) {
    626    1.7   mycroft #ifdef USER_LDT
    627    1.6   mycroft 	case 0:
    628  1.133       dsl 		return linux_read_ldt(l, (const void *)uap, retval);
    629    1.6   mycroft 	case 1:
    630  1.133       dsl 		return linux_write_ldt(l, (const void *)uap, 1);
    631   1.72  christos 	case 2:
    632   1.72  christos #ifdef notyet
    633  1.148       wiz 		return linux_read_default_ldt(l, (const void *)uap, retval);
    634   1.72  christos #else
    635   1.72  christos 		return (ENOSYS);
    636   1.72  christos #endif
    637   1.72  christos 	case 0x11:
    638  1.133       dsl 		return linux_write_ldt(l, (const void *)uap, 0);
    639    1.7   mycroft #endif /* USER_LDT */
    640    1.7   mycroft 
    641    1.6   mycroft 	default:
    642    1.6   mycroft 		return (ENOSYS);
    643    1.6   mycroft 	}
    644   1.13      fvdl }
    645   1.13      fvdl 
    646   1.13      fvdl /*
    647   1.13      fvdl  * XXX Pathetic hack to make svgalib work. This will fake the major
    648   1.13      fvdl  * device number of an opened VT so that svgalib likes it. grmbl.
    649   1.13      fvdl  * Should probably do it 'wrong the right way' and use a mapping
    650   1.13      fvdl  * array for all major device numbers, and map linux_mknod too.
    651   1.13      fvdl  */
    652   1.13      fvdl dev_t
    653  1.132       dsl linux_fakedev(dev_t dev, int raw)
    654   1.13      fvdl {
    655  1.104  christos 	extern const struct cdevsw ptc_cdevsw, pts_cdevsw;
    656  1.104  christos 	const struct cdevsw *cd = cdevsw_lookup(dev);
    657  1.104  christos 
    658   1.69  christos 	if (raw) {
    659   1.41  drochner #if (NWSDISPLAY > 0)
    660   1.79   gehenna 		extern const struct cdevsw wsdisplay_cdevsw;
    661  1.104  christos 		if (cd == &wsdisplay_cdevsw)
    662   1.69  christos 			return makedev(LINUX_CONS_MAJOR, (minor(dev) + 1));
    663   1.41  drochner #endif
    664   1.69  christos 	}
    665   1.77  jdolecek 
    666  1.104  christos 	if (cd == &ptc_cdevsw)
    667  1.104  christos 		return makedev(LINUX_PTC_MAJOR, minor(dev));
    668  1.104  christos 	if (cd == &pts_cdevsw)
    669  1.104  christos 		return makedev(LINUX_PTS_MAJOR, minor(dev));
    670  1.104  christos 
    671   1.77  jdolecek 	return dev;
    672   1.13      fvdl }
    673   1.13      fvdl 
    674   1.49     jhawk #if (NWSDISPLAY > 0)
    675   1.41  drochner /*
    676   1.41  drochner  * That's not complete, but enough to get an X server running.
    677   1.41  drochner  */
    678   1.41  drochner #define NR_KEYS 128
    679   1.61  jdolecek static const u_short plain_map[NR_KEYS] = {
    680   1.41  drochner 	0x0200,	0x001b,	0x0031,	0x0032,	0x0033,	0x0034,	0x0035,	0x0036,
    681   1.41  drochner 	0x0037,	0x0038,	0x0039,	0x0030,	0x002d,	0x003d,	0x007f,	0x0009,
    682   1.41  drochner 	0x0b71,	0x0b77,	0x0b65,	0x0b72,	0x0b74,	0x0b79,	0x0b75,	0x0b69,
    683   1.41  drochner 	0x0b6f,	0x0b70,	0x005b,	0x005d,	0x0201,	0x0702,	0x0b61,	0x0b73,
    684   1.41  drochner 	0x0b64,	0x0b66,	0x0b67,	0x0b68,	0x0b6a,	0x0b6b,	0x0b6c,	0x003b,
    685   1.41  drochner 	0x0027,	0x0060,	0x0700,	0x005c,	0x0b7a,	0x0b78,	0x0b63,	0x0b76,
    686   1.41  drochner 	0x0b62,	0x0b6e,	0x0b6d,	0x002c,	0x002e,	0x002f,	0x0700,	0x030c,
    687   1.41  drochner 	0x0703,	0x0020,	0x0207,	0x0100,	0x0101,	0x0102,	0x0103,	0x0104,
    688   1.41  drochner 	0x0105,	0x0106,	0x0107,	0x0108,	0x0109,	0x0208,	0x0209,	0x0307,
    689   1.41  drochner 	0x0308,	0x0309,	0x030b,	0x0304,	0x0305,	0x0306,	0x030a,	0x0301,
    690   1.41  drochner 	0x0302,	0x0303,	0x0300,	0x0310,	0x0206,	0x0200,	0x003c,	0x010a,
    691   1.41  drochner 	0x010b,	0x0200,	0x0200,	0x0200,	0x0200,	0x0200,	0x0200,	0x0200,
    692   1.41  drochner 	0x030e,	0x0702,	0x030d,	0x001c,	0x0701,	0x0205,	0x0114,	0x0603,
    693   1.41  drochner 	0x0118,	0x0601,	0x0602,	0x0117,	0x0600,	0x0119,	0x0115,	0x0116,
    694   1.41  drochner 	0x011a,	0x010c,	0x010d,	0x011b,	0x011c,	0x0110,	0x0311,	0x011d,
    695   1.41  drochner 	0x0200,	0x0200,	0x0200,	0x0200,	0x0200,	0x0200,	0x0200,	0x0200,
    696   1.41  drochner }, shift_map[NR_KEYS] = {
    697   1.41  drochner 	0x0200,	0x001b,	0x0021,	0x0040,	0x0023,	0x0024,	0x0025,	0x005e,
    698   1.41  drochner 	0x0026,	0x002a,	0x0028,	0x0029,	0x005f,	0x002b,	0x007f,	0x0009,
    699   1.41  drochner 	0x0b51,	0x0b57,	0x0b45,	0x0b52,	0x0b54,	0x0b59,	0x0b55,	0x0b49,
    700   1.41  drochner 	0x0b4f,	0x0b50,	0x007b,	0x007d,	0x0201,	0x0702,	0x0b41,	0x0b53,
    701   1.41  drochner 	0x0b44,	0x0b46,	0x0b47,	0x0b48,	0x0b4a,	0x0b4b,	0x0b4c,	0x003a,
    702   1.41  drochner 	0x0022,	0x007e,	0x0700,	0x007c,	0x0b5a,	0x0b58,	0x0b43,	0x0b56,
    703   1.41  drochner 	0x0b42,	0x0b4e,	0x0b4d,	0x003c,	0x003e,	0x003f,	0x0700,	0x030c,
    704   1.41  drochner 	0x0703,	0x0020,	0x0207,	0x010a,	0x010b,	0x010c,	0x010d,	0x010e,
    705   1.41  drochner 	0x010f,	0x0110,	0x0111,	0x0112,	0x0113,	0x0213,	0x0203,	0x0307,
    706   1.41  drochner 	0x0308,	0x0309,	0x030b,	0x0304,	0x0305,	0x0306,	0x030a,	0x0301,
    707   1.41  drochner 	0x0302,	0x0303,	0x0300,	0x0310,	0x0206,	0x0200,	0x003e,	0x010a,
    708   1.41  drochner 	0x010b,	0x0200,	0x0200,	0x0200,	0x0200,	0x0200,	0x0200,	0x0200,
    709   1.41  drochner 	0x030e,	0x0702,	0x030d,	0x0200,	0x0701,	0x0205,	0x0114,	0x0603,
    710   1.41  drochner 	0x020b,	0x0601,	0x0602,	0x0117,	0x0600,	0x020a,	0x0115,	0x0116,
    711   1.41  drochner 	0x011a,	0x010c,	0x010d,	0x011b,	0x011c,	0x0110,	0x0311,	0x011d,
    712   1.41  drochner 	0x0200,	0x0200,	0x0200,	0x0200,	0x0200,	0x0200,	0x0200,	0x0200,
    713   1.41  drochner }, altgr_map[NR_KEYS] = {
    714   1.41  drochner 	0x0200,	0x0200,	0x0200,	0x0040,	0x0200,	0x0024,	0x0200,	0x0200,
    715   1.41  drochner 	0x007b,	0x005b,	0x005d,	0x007d,	0x005c,	0x0200,	0x0200,	0x0200,
    716   1.41  drochner 	0x0b71,	0x0b77,	0x0918,	0x0b72,	0x0b74,	0x0b79,	0x0b75,	0x0b69,
    717   1.41  drochner 	0x0b6f,	0x0b70,	0x0200,	0x007e,	0x0201,	0x0702,	0x0914,	0x0b73,
    718   1.41  drochner 	0x0917,	0x0919,	0x0b67,	0x0b68,	0x0b6a,	0x0b6b,	0x0b6c,	0x0200,
    719   1.41  drochner 	0x0200,	0x0200,	0x0700,	0x0200,	0x0b7a,	0x0b78,	0x0916,	0x0b76,
    720   1.41  drochner 	0x0915,	0x0b6e,	0x0b6d,	0x0200,	0x0200,	0x0200,	0x0700,	0x030c,
    721   1.41  drochner 	0x0703,	0x0200,	0x0207,	0x050c,	0x050d,	0x050e,	0x050f,	0x0510,
    722   1.41  drochner 	0x0511,	0x0512,	0x0513,	0x0514,	0x0515,	0x0208,	0x0202,	0x0911,
    723   1.41  drochner 	0x0912,	0x0913,	0x030b,	0x090e,	0x090f,	0x0910,	0x030a,	0x090b,
    724   1.41  drochner 	0x090c,	0x090d,	0x090a,	0x0310,	0x0206,	0x0200,	0x007c,	0x0516,
    725   1.41  drochner 	0x0517,	0x0200,	0x0200,	0x0200,	0x0200,	0x0200,	0x0200,	0x0200,
    726   1.41  drochner 	0x030e,	0x0702,	0x030d,	0x0200,	0x0701,	0x0205,	0x0114,	0x0603,
    727   1.41  drochner 	0x0118,	0x0601,	0x0602,	0x0117,	0x0600,	0x0119,	0x0115,	0x0116,
    728   1.41  drochner 	0x011a,	0x010c,	0x010d,	0x011b,	0x011c,	0x0110,	0x0311,	0x011d,
    729   1.41  drochner 	0x0200,	0x0200,	0x0200,	0x0200,	0x0200,	0x0200,	0x0200,	0x0200,
    730   1.41  drochner }, ctrl_map[NR_KEYS] = {
    731   1.41  drochner 	0x0200,	0x0200,	0x0200,	0x0000,	0x001b,	0x001c,	0x001d,	0x001e,
    732   1.41  drochner 	0x001f,	0x007f,	0x0200,	0x0200,	0x001f,	0x0200,	0x0008,	0x0200,
    733   1.41  drochner 	0x0011,	0x0017,	0x0005,	0x0012,	0x0014,	0x0019,	0x0015,	0x0009,
    734   1.41  drochner 	0x000f,	0x0010,	0x001b,	0x001d,	0x0201,	0x0702,	0x0001,	0x0013,
    735   1.41  drochner 	0x0004,	0x0006,	0x0007,	0x0008,	0x000a,	0x000b,	0x000c,	0x0200,
    736   1.41  drochner 	0x0007,	0x0000,	0x0700,	0x001c,	0x001a,	0x0018,	0x0003,	0x0016,
    737   1.41  drochner 	0x0002,	0x000e,	0x000d,	0x0200,	0x020e,	0x007f,	0x0700,	0x030c,
    738   1.41  drochner 	0x0703,	0x0000,	0x0207,	0x0100,	0x0101,	0x0102,	0x0103,	0x0104,
    739   1.41  drochner 	0x0105,	0x0106,	0x0107,	0x0108,	0x0109,	0x0208,	0x0204,	0x0307,
    740   1.41  drochner 	0x0308,	0x0309,	0x030b,	0x0304,	0x0305,	0x0306,	0x030a,	0x0301,
    741   1.41  drochner 	0x0302,	0x0303,	0x0300,	0x0310,	0x0206,	0x0200,	0x0200,	0x010a,
    742   1.41  drochner 	0x010b,	0x0200,	0x0200,	0x0200,	0x0200,	0x0200,	0x0200,	0x0200,
    743   1.41  drochner 	0x030e,	0x0702,	0x030d,	0x001c,	0x0701,	0x0205,	0x0114,	0x0603,
    744   1.41  drochner 	0x0118,	0x0601,	0x0602,	0x0117,	0x0600,	0x0119,	0x0115,	0x0116,
    745   1.41  drochner 	0x011a,	0x010c,	0x010d,	0x011b,	0x011c,	0x0110,	0x0311,	0x011d,
    746   1.41  drochner 	0x0200,	0x0200,	0x0200,	0x0200,	0x0200,	0x0200,	0x0200,	0x0200,
    747   1.41  drochner };
    748   1.41  drochner 
    749   1.61  jdolecek const u_short * const linux_keytabs[] = {
    750   1.41  drochner 	plain_map, shift_map, altgr_map, altgr_map, ctrl_map
    751   1.41  drochner };
    752   1.41  drochner #endif
    753   1.41  drochner 
    754   1.52      fvdl static struct biosdisk_info *
    755  1.119  christos fd2biosinfo(struct proc *p, struct file *fp)
    756   1.52      fvdl {
    757   1.52      fvdl 	struct vnode *vp;
    758   1.52      fvdl 	const char *blkname;
    759   1.52      fvdl 	char diskname[16];
    760   1.52      fvdl 	int i;
    761   1.52      fvdl 	struct nativedisk_info *nip;
    762  1.103   thorpej 	struct disklist *dl = x86_alldisks;
    763   1.52      fvdl 
    764   1.52      fvdl 	if (fp->f_type != DTYPE_VNODE)
    765   1.52      fvdl 		return NULL;
    766   1.52      fvdl 	vp = (struct vnode *)fp->f_data;
    767   1.52      fvdl 
    768   1.52      fvdl 	if (vp->v_type != VBLK)
    769   1.52      fvdl 		return NULL;
    770   1.52      fvdl 
    771   1.79   gehenna 	blkname = devsw_blk2name(major(vp->v_rdev));
    772  1.142  christos 	snprintf(diskname, sizeof diskname, "%s%llu", blkname,
    773  1.142  christos 	    (unsigned long long)DISKUNIT(vp->v_rdev));
    774   1.52      fvdl 
    775   1.52      fvdl 	for (i = 0; i < dl->dl_nnativedisks; i++) {
    776   1.52      fvdl 		nip = &dl->dl_nativedisks[i];
    777   1.52      fvdl 		if (strcmp(diskname, nip->ni_devname))
    778   1.52      fvdl 			continue;
    779   1.52      fvdl 		if (nip->ni_nmatches != 0)
    780   1.52      fvdl 			return &dl->dl_biosdisks[nip->ni_biosmatches[0]];
    781   1.52      fvdl 	}
    782   1.52      fvdl 
    783   1.52      fvdl 	return NULL;
    784   1.52      fvdl }
    785   1.52      fvdl 
    786   1.52      fvdl 
    787   1.13      fvdl /*
    788   1.13      fvdl  * We come here in a last attempt to satisfy a Linux ioctl() call
    789   1.13      fvdl  */
    790   1.13      fvdl int
    791  1.133       dsl linux_machdepioctl(struct lwp *l, const struct linux_sys_ioctl_args *uap, register_t *retval)
    792   1.19   thorpej {
    793  1.133       dsl 	/* {
    794   1.13      fvdl 		syscallarg(int) fd;
    795   1.13      fvdl 		syscallarg(u_long) com;
    796  1.123  christos 		syscallarg(void *) data;
    797  1.133       dsl 	} */
    798   1.29  christos 	struct sys_ioctl_args bia;
    799   1.15      fvdl 	u_long com;
    800   1.52      fvdl 	int error, error1;
    801   1.50     veego #if (NWSDISPLAY > 0)
    802   1.13      fvdl 	struct vt_mode lvt;
    803   1.41  drochner 	struct kbentry kbe;
    804   1.41  drochner #endif
    805   1.52      fvdl 	struct linux_hd_geometry hdg;
    806   1.52      fvdl 	struct linux_hd_big_geometry hdg_big;
    807   1.52      fvdl 	struct biosdisk_info *bip;
    808  1.134        ad 	file_t *fp;
    809   1.52      fvdl 	int fd;
    810  1.161  christos 	struct disklabel label;
    811   1.52      fvdl 	struct partinfo partp;
    812  1.134        ad 	int (*ioctlf)(struct file *, u_long, void *);
    813   1.52      fvdl 	u_long start, biostotal, realtotal;
    814   1.52      fvdl 	u_char heads, sectors;
    815   1.52      fvdl 	u_int cylinders;
    816   1.55      fvdl 	struct ioctl_pt pt;
    817   1.13      fvdl 
    818   1.52      fvdl 	fd = SCARG(uap, fd);
    819   1.52      fvdl 	SCARG(&bia, fd) = fd;
    820   1.13      fvdl 	SCARG(&bia, data) = SCARG(uap, data);
    821   1.13      fvdl 	com = SCARG(uap, com);
    822   1.13      fvdl 
    823  1.134        ad 	if ((fp = fd_getfile(fd)) == NULL)
    824   1.53   thorpej 		return (EBADF);
    825   1.52      fvdl 
    826   1.13      fvdl 	switch (com) {
    827   1.50     veego #if (NWSDISPLAY > 0)
    828   1.13      fvdl 	case LINUX_KDGKBMODE:
    829   1.21      fvdl 		com = KDGKBMODE;
    830   1.21      fvdl 		break;
    831   1.13      fvdl 	case LINUX_KDSKBMODE:
    832   1.13      fvdl 		com = KDSKBMODE;
    833   1.13      fvdl 		if ((unsigned)SCARG(uap, data) == LINUX_K_MEDIUMRAW)
    834  1.123  christos 			SCARG(&bia, data) = (void *)K_RAW;
    835   1.13      fvdl 		break;
    836   1.59      fvdl 	case LINUX_KIOCSOUND:
    837   1.59      fvdl 		SCARG(&bia, data) =
    838  1.123  christos 		    (void *)(((unsigned long)SCARG(&bia, data)) & 0xffff);
    839   1.59      fvdl 		/* fall through */
    840   1.13      fvdl 	case LINUX_KDMKTONE:
    841   1.13      fvdl 		com = KDMKTONE;
    842   1.13      fvdl 		break;
    843   1.13      fvdl 	case LINUX_KDSETMODE:
    844   1.13      fvdl 		com = KDSETMODE;
    845   1.58      fvdl 		break;
    846   1.58      fvdl 	case LINUX_KDGETMODE:
    847   1.58      fvdl 		/* KD_* values are equal to the wscons numbers */
    848   1.58      fvdl 		com = WSDISPLAYIO_GMODE;
    849   1.13      fvdl 		break;
    850   1.13      fvdl 	case LINUX_KDENABIO:
    851   1.13      fvdl 		com = KDENABIO;
    852   1.13      fvdl 		break;
    853   1.13      fvdl 	case LINUX_KDDISABIO:
    854   1.13      fvdl 		com = KDDISABIO;
    855   1.13      fvdl 		break;
    856   1.13      fvdl 	case LINUX_KDGETLED:
    857   1.13      fvdl 		com = KDGETLED;
    858   1.13      fvdl 		break;
    859   1.13      fvdl 	case LINUX_KDSETLED:
    860   1.13      fvdl 		com = KDSETLED;
    861   1.13      fvdl 		break;
    862   1.13      fvdl 	case LINUX_VT_OPENQRY:
    863   1.13      fvdl 		com = VT_OPENQRY;
    864   1.13      fvdl 		break;
    865   1.13      fvdl 	case LINUX_VT_GETMODE:
    866  1.134        ad 		error = fp->f_ops->fo_ioctl(fp, VT_GETMODE, &lvt);
    867  1.129       dsl 		if (error != 0)
    868   1.86      yamt 			goto out;
    869   1.74  christos 		lvt.relsig = native_to_linux_signo[lvt.relsig];
    870   1.74  christos 		lvt.acqsig = native_to_linux_signo[lvt.acqsig];
    871   1.74  christos 		lvt.frsig = native_to_linux_signo[lvt.frsig];
    872  1.129       dsl 		error = copyout(&lvt, SCARG(uap, data), sizeof (lvt));
    873   1.86      yamt 		goto out;
    874   1.13      fvdl 	case LINUX_VT_SETMODE:
    875  1.129       dsl 		error = copyin(SCARG(uap, data), &lvt, sizeof (lvt));
    876  1.129       dsl 		if (error != 0)
    877   1.86      yamt 			goto out;
    878   1.74  christos 		lvt.relsig = linux_to_native_signo[lvt.relsig];
    879   1.74  christos 		lvt.acqsig = linux_to_native_signo[lvt.acqsig];
    880   1.74  christos 		lvt.frsig = linux_to_native_signo[lvt.frsig];
    881  1.134        ad 		error = fp->f_ops->fo_ioctl(fp, VT_SETMODE, &lvt);
    882  1.129       dsl 		goto out;
    883   1.52      fvdl 	case LINUX_VT_DISALLOCATE:
    884   1.52      fvdl 		/* XXX should use WSDISPLAYIO_DELSCREEN */
    885   1.86      yamt 		error = 0;
    886   1.86      yamt 		goto out;
    887   1.13      fvdl 	case LINUX_VT_RELDISP:
    888   1.13      fvdl 		com = VT_RELDISP;
    889   1.13      fvdl 		break;
    890   1.13      fvdl 	case LINUX_VT_ACTIVATE:
    891   1.13      fvdl 		com = VT_ACTIVATE;
    892   1.13      fvdl 		break;
    893   1.13      fvdl 	case LINUX_VT_WAITACTIVE:
    894   1.13      fvdl 		com = VT_WAITACTIVE;
    895   1.13      fvdl 		break;
    896   1.41  drochner 	case LINUX_VT_GETSTATE:
    897   1.41  drochner 		com = VT_GETSTATE;
    898   1.41  drochner 		break;
    899   1.41  drochner 	case LINUX_KDGKBTYPE:
    900   1.91  jdolecek 	    {
    901   1.91  jdolecek 		static const u_int8_t kb101 = KB_101;
    902   1.91  jdolecek 
    903   1.41  drochner 		/* This is what Linux does. */
    904   1.91  jdolecek 		error = copyout(&kb101, SCARG(uap, data), 1);
    905   1.86      yamt 		goto out;
    906   1.91  jdolecek 	    }
    907   1.41  drochner 	case LINUX_KDGKBENT:
    908   1.41  drochner 		/*
    909   1.41  drochner 		 * The Linux KDGKBENT ioctl is different from the
    910   1.41  drochner 		 * SYSV original. So we handle it in machdep code.
    911   1.41  drochner 		 * XXX We should use keyboard mapping information
    912   1.41  drochner 		 * from wsdisplay, but this would be expensive.
    913   1.41  drochner 		 */
    914   1.41  drochner 		if ((error = copyin(SCARG(uap, data), &kbe,
    915   1.41  drochner 				    sizeof(struct kbentry))))
    916   1.86      yamt 			goto out;
    917   1.41  drochner 		if (kbe.kb_table >= sizeof(linux_keytabs) / sizeof(u_short *)
    918   1.86      yamt 		    || kbe.kb_index >= NR_KEYS) {
    919   1.86      yamt 			error = EINVAL;
    920   1.86      yamt 			goto out;
    921   1.86      yamt 		}
    922   1.41  drochner 		kbe.kb_value = linux_keytabs[kbe.kb_table][kbe.kb_index];
    923   1.86      yamt 		error = copyout(&kbe, SCARG(uap, data),
    924   1.86      yamt 				sizeof(struct kbentry));
    925   1.86      yamt 		goto out;
    926   1.54      fvdl #endif
    927   1.52      fvdl 	case LINUX_HDIO_GETGEO:
    928   1.52      fvdl 	case LINUX_HDIO_GETGEO_BIG:
    929   1.52      fvdl 		/*
    930   1.52      fvdl 		 * Try to mimic Linux behaviour: return the BIOS geometry
    931   1.52      fvdl 		 * if possible (extending its # of cylinders if it's beyond
    932   1.52      fvdl 		 * the 1023 limit), fall back to the MI geometry (i.e.
    933   1.52      fvdl 		 * the real geometry) if not found, by returning an
    934   1.52      fvdl 		 * error. See common/linux_hdio.c
    935   1.52      fvdl 		 */
    936  1.134        ad 		bip = fd2biosinfo(curproc, fp);
    937   1.52      fvdl 		ioctlf = fp->f_ops->fo_ioctl;
    938  1.161  christos 		error = ioctlf(fp, DIOCGDINFO, (void *)&label);
    939  1.160  christos 		error1 = ioctlf(fp, DIOCGPARTINFO, (void *)&partp);
    940   1.86      yamt 		if (error != 0 && error1 != 0) {
    941   1.86      yamt 			error = error1;
    942   1.86      yamt 			goto out;
    943   1.86      yamt 		}
    944  1.161  christos 		start = error1 != 0 ? partp.pi_offset : 0;
    945   1.52      fvdl 		if (bip != NULL && bip->bi_head != 0 && bip->bi_sec != 0
    946   1.52      fvdl 		    && bip->bi_cyl != 0) {
    947   1.52      fvdl 			heads = bip->bi_head;
    948   1.52      fvdl 			sectors = bip->bi_sec;
    949   1.52      fvdl 			cylinders = bip->bi_cyl;
    950   1.52      fvdl 			biostotal = heads * sectors * cylinders;
    951  1.161  christos 			realtotal = label.d_ntracks * label.d_nsectors *
    952  1.161  christos 			    label.d_ncylinders;
    953   1.52      fvdl 			if (realtotal > biostotal)
    954   1.52      fvdl 				cylinders = realtotal / (heads * sectors);
    955   1.52      fvdl 		} else {
    956  1.161  christos 			heads = label.d_ntracks;
    957  1.161  christos 			cylinders = label.d_ncylinders;
    958  1.161  christos 			sectors = label.d_nsectors;
    959   1.52      fvdl 		}
    960   1.52      fvdl 		if (com == LINUX_HDIO_GETGEO) {
    961   1.52      fvdl 			hdg.start = start;
    962   1.52      fvdl 			hdg.heads = heads;
    963   1.52      fvdl 			hdg.cylinders = cylinders;
    964   1.52      fvdl 			hdg.sectors = sectors;
    965   1.86      yamt 			error = copyout(&hdg, SCARG(uap, data), sizeof hdg);
    966   1.86      yamt 			goto out;
    967   1.52      fvdl 		} else {
    968   1.52      fvdl 			hdg_big.start = start;
    969   1.52      fvdl 			hdg_big.heads = heads;
    970   1.52      fvdl 			hdg_big.cylinders = cylinders;
    971   1.52      fvdl 			hdg_big.sectors = sectors;
    972   1.86      yamt 			error = copyout(&hdg_big, SCARG(uap, data),
    973   1.52      fvdl 			    sizeof hdg_big);
    974   1.86      yamt 			goto out;
    975   1.52      fvdl 		}
    976   1.52      fvdl 
    977   1.13      fvdl 	default:
    978   1.54      fvdl 		/*
    979   1.55      fvdl 		 * Unknown to us. If it's on a device, just pass it through
    980   1.55      fvdl 		 * using PTIOCLINUX, the device itself might be able to
    981   1.55      fvdl 		 * make some sense of it.
    982   1.57      fvdl 		 * XXX hack: if the function returns EJUSTRETURN,
    983   1.57      fvdl 		 * it has stuffed a sysctl return value in pt.data.
    984   1.54      fvdl 		 */
    985   1.55      fvdl 		ioctlf = fp->f_ops->fo_ioctl;
    986   1.55      fvdl 		pt.com = SCARG(uap, com);
    987   1.55      fvdl 		pt.data = SCARG(uap, data);
    988  1.134        ad 		error = ioctlf(fp, PTIOCLINUX, &pt);
    989   1.57      fvdl 		if (error == EJUSTRETURN) {
    990   1.57      fvdl 			retval[0] = (register_t)pt.data;
    991   1.57      fvdl 			error = 0;
    992   1.57      fvdl 		}
    993   1.55      fvdl 
    994  1.115  christos 		if (error == ENOTTY) {
    995   1.72  christos 			DPRINTF(("linux_machdepioctl: invalid ioctl %08lx\n",
    996   1.72  christos 			    com));
    997  1.115  christos 		}
    998   1.86      yamt 		goto out;
    999   1.13      fvdl 	}
   1000   1.13      fvdl 	SCARG(&bia, com) = com;
   1001   1.86      yamt 	error = sys_ioctl(curlwp, &bia, retval);
   1002   1.86      yamt out:
   1003  1.134        ad 	fd_putfile(fd);
   1004   1.86      yamt 	return error;
   1005   1.13      fvdl }
   1006   1.13      fvdl 
   1007   1.13      fvdl /*
   1008   1.13      fvdl  * Set I/O permissions for a process. Just set the maximum level
   1009   1.13      fvdl  * right away (ignoring the argument), otherwise we would have
   1010   1.13      fvdl  * to rely on I/O permission maps, which are not implemented.
   1011   1.13      fvdl  */
   1012   1.13      fvdl int
   1013  1.133       dsl linux_sys_iopl(struct lwp *l, const struct linux_sys_iopl_args *uap, register_t *retval)
   1014   1.19   thorpej {
   1015  1.133       dsl 	/* {
   1016   1.13      fvdl 		syscallarg(int) level;
   1017  1.133       dsl 	} */
   1018   1.85   thorpej 	struct trapframe *fp = l->l_md.md_regs;
   1019   1.13      fvdl 
   1020  1.120      elad 	if (kauth_authorize_machdep(l->l_cred, KAUTH_MACHDEP_IOPL,
   1021  1.120      elad 	    NULL, NULL, NULL, NULL) != 0)
   1022   1.13      fvdl 		return EPERM;
   1023   1.13      fvdl 	fp->tf_eflags |= PSL_IOPL;
   1024   1.13      fvdl 	*retval = 0;
   1025   1.13      fvdl 	return 0;
   1026   1.13      fvdl }
   1027   1.13      fvdl 
   1028   1.13      fvdl /*
   1029   1.13      fvdl  * See above. If a root process tries to set access to an I/O port,
   1030   1.13      fvdl  * just let it have the whole range.
   1031   1.13      fvdl  */
   1032   1.13      fvdl int
   1033  1.133       dsl linux_sys_ioperm(struct lwp *l, const struct linux_sys_ioperm_args *uap, register_t *retval)
   1034   1.19   thorpej {
   1035  1.133       dsl 	/* {
   1036   1.13      fvdl 		syscallarg(unsigned int) lo;
   1037   1.13      fvdl 		syscallarg(unsigned int) hi;
   1038   1.13      fvdl 		syscallarg(int) val;
   1039  1.133       dsl 	} */
   1040   1.85   thorpej 	struct trapframe *fp = l->l_md.md_regs;
   1041   1.13      fvdl 
   1042  1.120      elad 	if (kauth_authorize_machdep(l->l_cred, SCARG(uap, val) ?
   1043  1.120      elad 	    KAUTH_MACHDEP_IOPERM_SET : KAUTH_MACHDEP_IOPERM_GET, NULL, NULL,
   1044  1.120      elad 	    NULL, NULL) != 0)
   1045   1.13      fvdl 		return EPERM;
   1046   1.13      fvdl 	if (SCARG(uap, val))
   1047   1.13      fvdl 		fp->tf_eflags |= PSL_IOPL;
   1048   1.13      fvdl 	*retval = 0;
   1049   1.92  christos 	return 0;
   1050   1.92  christos }
   1051  1.107      fvdl 
   1052  1.107      fvdl int
   1053  1.119  christos linux_usertrap(struct lwp *l, vaddr_t trapaddr,
   1054  1.119  christos     void *arg)
   1055  1.107      fvdl {
   1056  1.107      fvdl 	return 0;
   1057  1.107      fvdl }
   1058  1.125  christos 
   1059  1.125  christos const char *
   1060  1.125  christos linux_get_uname_arch(void)
   1061  1.125  christos {
   1062  1.125  christos 	static char uname_arch[5] = "i386";
   1063  1.125  christos 
   1064  1.125  christos 	if (uname_arch[1] == '3')
   1065  1.125  christos 		uname_arch[1] += cpu_class;
   1066  1.125  christos 	return uname_arch;
   1067  1.125  christos }
   1068