Home | History | Annotate | Line # | Download | only in i386
linux_machdep.c revision 1.157
      1  1.157       dsl /*	$NetBSD: linux_machdep.c,v 1.157 2014/02/15 10:11:15 dsl Exp $	*/
      2    1.1      fvdl 
      3   1.45      fvdl /*-
      4  1.143        ad  * Copyright (c) 1995, 2000, 2008, 2009 The NetBSD Foundation, Inc.
      5    1.1      fvdl  * All rights reserved.
      6    1.1      fvdl  *
      7   1.45      fvdl  * This code is derived from software contributed to The NetBSD Foundation
      8  1.143        ad  * by Frank van der Linden, and by Andrew Doran.
      9   1.45      fvdl  *
     10    1.1      fvdl  * Redistribution and use in source and binary forms, with or without
     11    1.1      fvdl  * modification, are permitted provided that the following conditions
     12    1.1      fvdl  * are met:
     13    1.1      fvdl  * 1. Redistributions of source code must retain the above copyright
     14    1.1      fvdl  *    notice, this list of conditions and the following disclaimer.
     15    1.1      fvdl  * 2. Redistributions in binary form must reproduce the above copyright
     16    1.1      fvdl  *    notice, this list of conditions and the following disclaimer in the
     17    1.1      fvdl  *    documentation and/or other materials provided with the distribution.
     18    1.1      fvdl  *
     19   1.45      fvdl  * THIS SOFTWARE IS PROVIDED BY THE NETBSD FOUNDATION, INC. AND CONTRIBUTORS
     20   1.45      fvdl  * ``AS IS'' AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED
     21   1.45      fvdl  * TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR
     22   1.45      fvdl  * PURPOSE ARE DISCLAIMED.  IN NO EVENT SHALL THE FOUNDATION OR CONTRIBUTORS
     23   1.45      fvdl  * BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
     24   1.45      fvdl  * CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
     25   1.45      fvdl  * SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS
     26   1.45      fvdl  * INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN
     27   1.45      fvdl  * CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE)
     28   1.45      fvdl  * ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE
     29   1.45      fvdl  * POSSIBILITY OF SUCH DAMAGE.
     30    1.1      fvdl  */
     31   1.68     lukem 
     32   1.68     lukem #include <sys/cdefs.h>
     33  1.157       dsl __KERNEL_RCSID(0, "$NetBSD: linux_machdep.c,v 1.157 2014/02/15 10:11:15 dsl Exp $");
     34   1.35   thorpej 
     35   1.63       mrg #if defined(_KERNEL_OPT)
     36   1.35   thorpej #include "opt_vm86.h"
     37   1.36   thorpej #include "opt_user_ldt.h"
     38   1.51  jdolecek #endif
     39    1.1      fvdl 
     40    1.1      fvdl #include <sys/param.h>
     41    1.1      fvdl #include <sys/systm.h>
     42    1.1      fvdl #include <sys/signalvar.h>
     43    1.1      fvdl #include <sys/kernel.h>
     44    1.1      fvdl #include <sys/proc.h>
     45    1.1      fvdl #include <sys/buf.h>
     46    1.1      fvdl #include <sys/reboot.h>
     47    1.1      fvdl #include <sys/conf.h>
     48   1.31   thorpej #include <sys/exec.h>
     49    1.1      fvdl #include <sys/file.h>
     50    1.1      fvdl #include <sys/callout.h>
     51    1.1      fvdl #include <sys/malloc.h>
     52    1.1      fvdl #include <sys/mbuf.h>
     53    1.1      fvdl #include <sys/msgbuf.h>
     54    1.1      fvdl #include <sys/mount.h>
     55    1.1      fvdl #include <sys/vnode.h>
     56    1.1      fvdl #include <sys/device.h>
     57    1.1      fvdl #include <sys/syscallargs.h>
     58   1.13      fvdl #include <sys/filedesc.h>
     59   1.39   mycroft #include <sys/exec_elf.h>
     60   1.52      fvdl #include <sys/disklabel.h>
     61   1.62      manu #include <sys/ioctl.h>
     62  1.110  christos #include <sys/wait.h>
     63  1.113      elad #include <sys/kauth.h>
     64  1.143        ad #include <sys/kmem.h>
     65  1.113      elad 
     66   1.52      fvdl #include <miscfs/specfs/specdev.h>
     67    1.7   mycroft 
     68   1.44  christos #include <compat/linux/common/linux_types.h>
     69   1.44  christos #include <compat/linux/common/linux_signal.h>
     70   1.44  christos #include <compat/linux/common/linux_util.h>
     71   1.44  christos #include <compat/linux/common/linux_ioctl.h>
     72   1.52      fvdl #include <compat/linux/common/linux_hdio.h>
     73   1.44  christos #include <compat/linux/common/linux_exec.h>
     74   1.44  christos #include <compat/linux/common/linux_machdep.h>
     75   1.98  jdolecek #include <compat/linux/common/linux_errno.h>
     76   1.44  christos 
     77    1.1      fvdl #include <compat/linux/linux_syscallargs.h>
     78    1.1      fvdl 
     79  1.130        ad #include <sys/cpu.h>
     80    1.1      fvdl #include <machine/cpufunc.h>
     81    1.1      fvdl #include <machine/psl.h>
     82    1.1      fvdl #include <machine/reg.h>
     83    1.7   mycroft #include <machine/segments.h>
     84    1.1      fvdl #include <machine/specialreg.h>
     85    1.7   mycroft #include <machine/sysarch.h>
     86   1.26   mycroft #include <machine/vm86.h>
     87   1.34   mycroft #include <machine/vmparam.h>
     88    1.1      fvdl 
     89    1.1      fvdl /*
     90   1.50     veego  * To see whether wscons is configured (for virtual console ioctl calls).
     91   1.13      fvdl  */
     92   1.63       mrg #if defined(_KERNEL_OPT)
     93   1.41  drochner #include "wsdisplay.h"
     94   1.51  jdolecek #endif
     95   1.41  drochner #if (NWSDISPLAY > 0)
     96   1.52      fvdl #include <dev/wscons/wsconsio.h>
     97   1.41  drochner #include <dev/wscons/wsdisplay_usl_io.h>
     98   1.63       mrg #if defined(_KERNEL_OPT)
     99   1.41  drochner #include "opt_xserver.h"
    100   1.51  jdolecek #endif
    101   1.41  drochner #endif
    102   1.41  drochner 
    103   1.72  christos #ifdef DEBUG_LINUX
    104   1.72  christos #define DPRINTF(a) uprintf a
    105   1.72  christos #else
    106   1.72  christos #define DPRINTF(a)
    107   1.72  christos #endif
    108   1.72  christos 
    109  1.131       dsl static struct biosdisk_info *fd2biosinfo(struct proc *, struct file *);
    110  1.103   thorpej extern struct disklist *x86_alldisks;
    111  1.131       dsl static void linux_save_ucontext(struct lwp *, struct trapframe *,
    112  1.131       dsl     const sigset_t *, struct sigaltstack *, struct linux_ucontext *);
    113  1.131       dsl static void linux_save_sigcontext(struct lwp *, struct trapframe *,
    114  1.131       dsl     const sigset_t *, struct linux_sigcontext *);
    115  1.131       dsl static int linux_restore_sigcontext(struct lwp *,
    116  1.131       dsl     struct linux_sigcontext *, register_t *);
    117  1.131       dsl static void linux_rt_sendsig(const ksiginfo_t *, const sigset_t *);
    118  1.131       dsl static void linux_old_sendsig(const ksiginfo_t *, const sigset_t *);
    119   1.52      fvdl 
    120   1.83  christos extern char linux_sigcode[], linux_rt_sigcode[];
    121  1.149       chs 
    122   1.13      fvdl /*
    123    1.1      fvdl  * Deal with some i386-specific things in the Linux emulation code.
    124    1.1      fvdl  */
    125   1.37   mycroft 
    126   1.37   mycroft void
    127  1.149       chs linux_setregs(struct lwp *l, struct exec_package *epp, vaddr_t stack)
    128   1.37   mycroft {
    129   1.73  christos 	struct trapframe *tf;
    130   1.73  christos 
    131   1.73  christos #ifdef USER_LDT
    132   1.85   thorpej 	pmap_ldt_cleanup(l);
    133   1.73  christos #endif
    134   1.37   mycroft 
    135  1.157       dsl 	fpu_save_area_clear(l, __Linux_NPXCW__);
    136   1.73  christos 
    137   1.85   thorpej 	tf = l->l_md.md_regs;
    138  1.149       chs 	tf->tf_gs = 0;
    139   1.73  christos 	tf->tf_fs = GSEL(GUDATA_SEL, SEL_UPL);
    140   1.73  christos 	tf->tf_es = GSEL(GUDATA_SEL, SEL_UPL);
    141   1.73  christos 	tf->tf_ds = GSEL(GUDATA_SEL, SEL_UPL);
    142   1.73  christos 	tf->tf_edi = 0;
    143   1.73  christos 	tf->tf_esi = 0;
    144   1.73  christos 	tf->tf_ebp = 0;
    145  1.150     joerg 	tf->tf_ebx = l->l_proc->p_psstrp;
    146   1.73  christos 	tf->tf_edx = 0;
    147   1.73  christos 	tf->tf_ecx = 0;
    148   1.73  christos 	tf->tf_eax = 0;
    149   1.73  christos 	tf->tf_eip = epp->ep_entry;
    150   1.95       chs 	tf->tf_cs = GSEL(GUCODEBIG_SEL, SEL_UPL);
    151   1.73  christos 	tf->tf_eflags = PSL_USERSET;
    152   1.73  christos 	tf->tf_esp = stack;
    153   1.73  christos 	tf->tf_ss = GSEL(GUDATA_SEL, SEL_UPL);
    154   1.37   mycroft }
    155    1.1      fvdl 
    156    1.1      fvdl /*
    157    1.1      fvdl  * Send an interrupt to process.
    158    1.1      fvdl  *
    159    1.1      fvdl  * Stack is set up to allow sigcode stored
    160    1.1      fvdl  * in u. to call routine, followed by kcall
    161    1.1      fvdl  * to sigreturn routine below.  After sigreturn
    162    1.1      fvdl  * resets the signal mask, the stack, and the
    163    1.1      fvdl  * frame pointer, it returns to the user
    164    1.1      fvdl  * specified pc, psl.
    165    1.1      fvdl  */
    166    1.1      fvdl 
    167    1.1      fvdl void
    168   1.99  christos linux_sendsig(const ksiginfo_t *ksi, const sigset_t *mask)
    169    1.1      fvdl {
    170   1.96  christos 	if (SIGACTION(curproc, ksi->ksi_signo).sa_flags & SA_SIGINFO)
    171   1.97  christos 		linux_rt_sendsig(ksi, mask);
    172   1.83  christos 	else
    173   1.97  christos 		linux_old_sendsig(ksi, mask);
    174   1.83  christos }
    175   1.83  christos 
    176   1.83  christos 
    177   1.83  christos static void
    178  1.132       dsl linux_save_ucontext(struct lwp *l, struct trapframe *tf, const sigset_t *mask, struct sigaltstack *sas, struct linux_ucontext *uc)
    179   1.90  christos {
    180   1.90  christos 	uc->uc_flags = 0;
    181   1.90  christos 	uc->uc_link = NULL;
    182   1.90  christos 	native_to_linux_sigaltstack(&uc->uc_stack, sas);
    183   1.90  christos 	linux_save_sigcontext(l, tf, mask, &uc->uc_mcontext);
    184   1.90  christos 	native_to_linux_sigset(&uc->uc_sigmask, mask);
    185   1.90  christos 	(void)memset(&uc->uc_fpregs_mem, 0, sizeof(uc->uc_fpregs_mem));
    186   1.90  christos }
    187   1.90  christos 
    188   1.90  christos static void
    189  1.146     rmind linux_save_sigcontext(struct lwp *l, struct trapframe *tf,
    190  1.146     rmind     const sigset_t *mask, struct linux_sigcontext *sc)
    191   1.83  christos {
    192  1.146     rmind 	struct pcb *pcb = lwp_getpcb(l);
    193  1.146     rmind 
    194   1.83  christos 	/* Save register context. */
    195   1.83  christos #ifdef VM86
    196   1.83  christos 	if (tf->tf_eflags & PSL_VM) {
    197   1.83  christos 		sc->sc_gs = tf->tf_vm86_gs;
    198   1.83  christos 		sc->sc_fs = tf->tf_vm86_fs;
    199   1.83  christos 		sc->sc_es = tf->tf_vm86_es;
    200   1.83  christos 		sc->sc_ds = tf->tf_vm86_ds;
    201   1.85   thorpej 		sc->sc_eflags = get_vflags(l);
    202   1.83  christos 	} else
    203   1.83  christos #endif
    204   1.83  christos 	{
    205   1.83  christos 		sc->sc_gs = tf->tf_gs;
    206  1.106     perry 		sc->sc_fs = tf->tf_fs;
    207   1.83  christos 		sc->sc_es = tf->tf_es;
    208   1.83  christos 		sc->sc_ds = tf->tf_ds;
    209   1.83  christos 		sc->sc_eflags = tf->tf_eflags;
    210   1.83  christos 	}
    211   1.83  christos 	sc->sc_edi = tf->tf_edi;
    212   1.83  christos 	sc->sc_esi = tf->tf_esi;
    213   1.83  christos 	sc->sc_esp = tf->tf_esp;
    214   1.83  christos 	sc->sc_ebp = tf->tf_ebp;
    215   1.83  christos 	sc->sc_ebx = tf->tf_ebx;
    216   1.83  christos 	sc->sc_edx = tf->tf_edx;
    217   1.83  christos 	sc->sc_ecx = tf->tf_ecx;
    218   1.83  christos 	sc->sc_eax = tf->tf_eax;
    219   1.83  christos 	sc->sc_eip = tf->tf_eip;
    220   1.83  christos 	sc->sc_cs = tf->tf_cs;
    221   1.83  christos 	sc->sc_esp_at_signal = tf->tf_esp;
    222   1.83  christos 	sc->sc_ss = tf->tf_ss;
    223   1.83  christos 	sc->sc_err = tf->tf_err;
    224   1.83  christos 	sc->sc_trapno = tf->tf_trapno;
    225  1.146     rmind 	sc->sc_cr2 = pcb->pcb_cr2;
    226   1.83  christos 	sc->sc_387 = NULL;
    227   1.83  christos 
    228   1.83  christos 	/* Save signal stack. */
    229   1.83  christos 	/* Linux doesn't save the onstack flag in sigframe */
    230   1.83  christos 
    231   1.83  christos 	/* Save signal mask. */
    232   1.83  christos 	native_to_linux_old_sigset(&sc->sc_mask, mask);
    233   1.83  christos }
    234   1.83  christos 
    235   1.83  christos static void
    236   1.99  christos linux_rt_sendsig(const ksiginfo_t *ksi, const sigset_t *mask)
    237   1.83  christos {
    238   1.85   thorpej 	struct lwp *l = curlwp;
    239   1.85   thorpej 	struct proc *p = l->l_proc;
    240   1.48  augustss 	struct trapframe *tf;
    241   1.83  christos 	struct linux_rt_sigframe *fp, frame;
    242  1.122        ad 	int onstack, error;
    243   1.98  jdolecek 	int sig = ksi->ksi_signo;
    244   1.78   thorpej 	sig_t catcher = SIGACTION(p, sig).sa_handler;
    245  1.122        ad 	struct sigaltstack *sas = &l->l_sigstk;
    246    1.1      fvdl 
    247   1.85   thorpej 	tf = l->l_md.md_regs;
    248   1.66  jdolecek 	/* Do we need to jump onto the signal stack? */
    249   1.82  christos 	onstack = (sas->ss_flags & (SS_DISABLE | SS_ONSTACK)) == 0 &&
    250   1.66  jdolecek 	    (SIGACTION(p, sig).sa_flags & SA_ONSTACK) != 0;
    251   1.66  jdolecek 
    252   1.83  christos 
    253   1.42   mycroft 	/* Allocate space for the signal handler context. */
    254   1.66  jdolecek 	if (onstack)
    255  1.123  christos 		fp = (struct linux_rt_sigframe *)((char *)sas->ss_sp +
    256   1.83  christos 		    sas->ss_size);
    257   1.66  jdolecek 	else
    258   1.83  christos 		fp = (struct linux_rt_sigframe *)tf->tf_esp;
    259   1.42   mycroft 	fp--;
    260    1.1      fvdl 
    261   1.92  christos 	DPRINTF(("rt: onstack = %d, fp = %p sig = %d eip = 0x%x cr2 = 0x%x\n",
    262  1.146     rmind 	    onstack, fp, sig, tf->tf_eip,
    263  1.146     rmind 	    ((struct pcb *)lwp_getpcb(l))->pcb_cr2));
    264   1.83  christos 
    265   1.42   mycroft 	/* Build stack frame for signal trampoline. */
    266    1.7   mycroft 	frame.sf_handler = catcher;
    267   1.74  christos 	frame.sf_sig = native_to_linux_signo[sig];
    268   1.82  christos 	frame.sf_sip = &fp->sf_si;
    269   1.90  christos 	frame.sf_ucp = &fp->sf_uc;
    270   1.83  christos 
    271   1.82  christos 	/*
    272   1.97  christos 	 * XXX: the following code assumes that the constants for
    273   1.97  christos 	 * siginfo are the same between linux and NetBSD.
    274   1.82  christos 	 */
    275  1.151  christos 	native_to_linux_siginfo(&frame.sf_si, &ksi->ksi_info);
    276    1.1      fvdl 
    277   1.42   mycroft 	/* Save register context. */
    278   1.90  christos 	linux_save_ucontext(l, tf, mask, sas, &frame.sf_uc);
    279  1.122        ad 	sendsig_reset(l, sig);
    280   1.83  christos 
    281  1.135        ad 	mutex_exit(p->p_lock);
    282  1.122        ad 	error = copyout(&frame, fp, sizeof(frame));
    283  1.135        ad 	mutex_enter(p->p_lock);
    284  1.122        ad 
    285  1.122        ad 	if (error != 0) {
    286   1.83  christos 		/*
    287   1.83  christos 		 * Process has trashed its stack; give it an illegal
    288   1.83  christos 		 * instruction to halt it in its tracks.
    289   1.83  christos 		 */
    290   1.85   thorpej 		sigexit(l, SIGILL);
    291   1.83  christos 		/* NOTREACHED */
    292    1.4   mycroft 	}
    293    1.1      fvdl 
    294   1.83  christos 	/*
    295   1.83  christos 	 * Build context to run handler in.
    296   1.83  christos 	 */
    297   1.83  christos 	tf->tf_fs = GSEL(GUDATA_SEL, SEL_UPL);
    298   1.83  christos 	tf->tf_es = GSEL(GUDATA_SEL, SEL_UPL);
    299   1.83  christos 	tf->tf_ds = GSEL(GUDATA_SEL, SEL_UPL);
    300  1.106     perry 	tf->tf_eip = ((int)p->p_sigctx.ps_sigcode) +
    301   1.83  christos 	    (linux_rt_sigcode - linux_sigcode);
    302   1.83  christos 	tf->tf_cs = GSEL(GUCODE_SEL, SEL_UPL);
    303  1.138  christos 	tf->tf_eflags &= ~PSL_CLEARSIG;
    304   1.83  christos 	tf->tf_esp = (int)fp;
    305   1.83  christos 	tf->tf_ss = GSEL(GUDATA_SEL, SEL_UPL);
    306   1.83  christos 
    307   1.83  christos 	/* Remember that we're now on the signal stack. */
    308   1.83  christos 	if (onstack)
    309   1.83  christos 		sas->ss_flags |= SS_ONSTACK;
    310   1.83  christos }
    311   1.83  christos 
    312   1.83  christos static void
    313   1.99  christos linux_old_sendsig(const ksiginfo_t *ksi, const sigset_t *mask)
    314   1.83  christos {
    315   1.85   thorpej 	struct lwp *l = curlwp;
    316   1.85   thorpej 	struct proc *p = l->l_proc;
    317   1.83  christos 	struct trapframe *tf;
    318   1.83  christos 	struct linux_sigframe *fp, frame;
    319  1.122        ad 	int onstack, error;
    320   1.97  christos 	int sig = ksi->ksi_signo;
    321   1.83  christos 	sig_t catcher = SIGACTION(p, sig).sa_handler;
    322  1.122        ad 	struct sigaltstack *sas = &l->l_sigstk;
    323   1.83  christos 
    324   1.85   thorpej 	tf = l->l_md.md_regs;
    325   1.83  christos 
    326   1.83  christos 	/* Do we need to jump onto the signal stack? */
    327   1.83  christos 	onstack = (sas->ss_flags & (SS_DISABLE | SS_ONSTACK)) == 0 &&
    328   1.83  christos 	    (SIGACTION(p, sig).sa_flags & SA_ONSTACK) != 0;
    329   1.83  christos 
    330   1.83  christos 	/* Allocate space for the signal handler context. */
    331   1.83  christos 	if (onstack)
    332  1.123  christos 		fp = (struct linux_sigframe *) ((char *)sas->ss_sp +
    333   1.83  christos 		    sas->ss_size);
    334   1.83  christos 	else
    335   1.83  christos 		fp = (struct linux_sigframe *)tf->tf_esp;
    336   1.83  christos 	fp--;
    337   1.83  christos 
    338   1.92  christos 	DPRINTF(("old: onstack = %d, fp = %p sig = %d eip = 0x%x cr2 = 0x%x\n",
    339  1.146     rmind 	    onstack, fp, sig, tf->tf_eip,
    340  1.146     rmind 	    ((struct pcb *)lwp_getpcb(l))->pcb_cr2));
    341   1.83  christos 
    342   1.83  christos 	/* Build stack frame for signal trampoline. */
    343   1.83  christos 	frame.sf_handler = catcher;
    344   1.83  christos 	frame.sf_sig = native_to_linux_signo[sig];
    345   1.42   mycroft 
    346   1.90  christos 	linux_save_sigcontext(l, tf, mask, &frame.sf_sc);
    347  1.122        ad 	sendsig_reset(l, sig);
    348  1.122        ad 
    349  1.135        ad 	mutex_exit(p->p_lock);
    350  1.122        ad 	error = copyout(&frame, fp, sizeof(frame));
    351  1.135        ad 	mutex_enter(p->p_lock);
    352   1.42   mycroft 
    353  1.122        ad 	if (error != 0) {
    354    1.1      fvdl 		/*
    355    1.1      fvdl 		 * Process has trashed its stack; give it an illegal
    356    1.1      fvdl 		 * instruction to halt it in its tracks.
    357    1.1      fvdl 		 */
    358   1.85   thorpej 		sigexit(l, SIGILL);
    359    1.1      fvdl 		/* NOTREACHED */
    360    1.1      fvdl 	}
    361    1.1      fvdl 
    362    1.1      fvdl 	/*
    363    1.1      fvdl 	 * Build context to run handler in.
    364    1.1      fvdl 	 */
    365   1.75  christos 	tf->tf_fs = GSEL(GUDATA_SEL, SEL_UPL);
    366   1.26   mycroft 	tf->tf_es = GSEL(GUDATA_SEL, SEL_UPL);
    367   1.26   mycroft 	tf->tf_ds = GSEL(GUDATA_SEL, SEL_UPL);
    368   1.56  jdolecek 	tf->tf_eip = (int)p->p_sigctx.ps_sigcode;
    369   1.95       chs 	tf->tf_cs = GSEL(GUCODEBIG_SEL, SEL_UPL);
    370  1.138  christos 	tf->tf_eflags &= ~PSL_CLEARSIG;
    371   1.26   mycroft 	tf->tf_esp = (int)fp;
    372   1.23   mycroft 	tf->tf_ss = GSEL(GUDATA_SEL, SEL_UPL);
    373   1.42   mycroft 
    374   1.42   mycroft 	/* Remember that we're now on the signal stack. */
    375   1.66  jdolecek 	if (onstack)
    376   1.82  christos 		sas->ss_flags |= SS_ONSTACK;
    377    1.1      fvdl }
    378    1.1      fvdl 
    379    1.1      fvdl /*
    380    1.1      fvdl  * System call to cleanup state after a signal
    381    1.1      fvdl  * has been taken.  Reset signal mask and
    382    1.1      fvdl  * stack state from context left by sendsig (above).
    383    1.1      fvdl  * Return to previous pc and psl as specified by
    384    1.1      fvdl  * context left by sendsig. Check carefully to
    385    1.1      fvdl  * make sure that the user has not modified the
    386    1.1      fvdl  * psl to gain improper privileges or to cause
    387    1.1      fvdl  * a machine fault.
    388    1.1      fvdl  */
    389   1.43       erh int
    390  1.133       dsl linux_sys_rt_sigreturn(struct lwp *l, const struct linux_sys_rt_sigreturn_args *uap, register_t *retval)
    391   1.43       erh {
    392  1.133       dsl 	/* {
    393   1.90  christos 		syscallarg(struct linux_ucontext *) ucp;
    394  1.133       dsl 	} */
    395   1.90  christos 	struct linux_ucontext context, *ucp = SCARG(uap, ucp);
    396   1.90  christos 	int error;
    397   1.90  christos 
    398   1.90  christos 	/*
    399   1.90  christos 	 * The trampoline code hands us the context.
    400   1.90  christos 	 * It is unsafe to keep track of it ourselves, in the event that a
    401   1.90  christos 	 * program jumps out of a signal handler.
    402   1.90  christos 	 */
    403   1.90  christos 	if ((error = copyin(ucp, &context, sizeof(*ucp))) != 0)
    404   1.90  christos 		return error;
    405   1.90  christos 
    406   1.90  christos 	/* XXX XAX we can do better here by using more of the ucontext */
    407   1.90  christos 	return linux_restore_sigcontext(l, &context.uc_mcontext, retval);
    408   1.43       erh }
    409   1.43       erh 
    410    1.1      fvdl int
    411  1.133       dsl linux_sys_sigreturn(struct lwp *l, const struct linux_sys_sigreturn_args *uap, register_t *retval)
    412   1.19   thorpej {
    413  1.133       dsl 	/* {
    414    1.1      fvdl 		syscallarg(struct linux_sigcontext *) scp;
    415  1.133       dsl 	} */
    416   1.90  christos 	struct linux_sigcontext context, *scp = SCARG(uap, scp);
    417   1.90  christos 	int error;
    418    1.1      fvdl 
    419    1.1      fvdl 	/*
    420    1.1      fvdl 	 * The trampoline code hands us the context.
    421    1.1      fvdl 	 * It is unsafe to keep track of it ourselves, in the event that a
    422    1.1      fvdl 	 * program jumps out of a signal handler.
    423    1.1      fvdl 	 */
    424  1.123  christos 	if ((error = copyin((void *)scp, &context, sizeof(*scp))) != 0)
    425   1.90  christos 		return error;
    426   1.90  christos 	return linux_restore_sigcontext(l, &context, retval);
    427   1.90  christos }
    428    1.1      fvdl 
    429   1.90  christos static int
    430  1.116  christos linux_restore_sigcontext(struct lwp *l, struct linux_sigcontext *scp,
    431  1.119  christos     register_t *retval)
    432   1.90  christos {
    433   1.90  christos 	struct proc *p = l->l_proc;
    434  1.122        ad 	struct sigaltstack *sas = &l->l_sigstk;
    435   1.90  christos 	struct trapframe *tf;
    436   1.90  christos 	sigset_t mask;
    437   1.90  christos 	ssize_t ss_gap;
    438  1.149       chs 
    439   1.42   mycroft 	/* Restore register context. */
    440   1.85   thorpej 	tf = l->l_md.md_regs;
    441  1.149       chs 	DPRINTF(("sigreturn enter esp=0x%x eip=0x%x\n", tf->tf_esp, tf->tf_eip));
    442   1.83  christos 
    443    1.4   mycroft #ifdef VM86
    444   1.90  christos 	if (scp->sc_eflags & PSL_VM) {
    445  1.131       dsl 		void syscall_vm86(struct trapframe *);
    446   1.83  christos 
    447   1.90  christos 		tf->tf_vm86_gs = scp->sc_gs;
    448   1.90  christos 		tf->tf_vm86_fs = scp->sc_fs;
    449   1.90  christos 		tf->tf_vm86_es = scp->sc_es;
    450   1.90  christos 		tf->tf_vm86_ds = scp->sc_ds;
    451   1.90  christos 		set_vflags(l, scp->sc_eflags);
    452   1.83  christos 		p->p_md.md_syscall = syscall_vm86;
    453    1.4   mycroft 	} else
    454    1.4   mycroft #endif
    455    1.4   mycroft 	{
    456   1.26   mycroft 		/*
    457   1.26   mycroft 		 * Check for security violations.  If we're returning to
    458   1.26   mycroft 		 * protected mode, the CPU will validate the segment registers
    459   1.26   mycroft 		 * automatically and generate a trap on violations.  We handle
    460   1.26   mycroft 		 * the trap, rather than doing all of the checking here.
    461   1.26   mycroft 		 */
    462   1.90  christos 		if (((scp->sc_eflags ^ tf->tf_eflags) & PSL_USERSTATIC) != 0 ||
    463   1.90  christos 		    !USERMODE(scp->sc_cs, scp->sc_eflags))
    464   1.83  christos 			return EINVAL;
    465   1.26   mycroft 
    466   1.90  christos 		tf->tf_gs = scp->sc_gs;
    467   1.90  christos 		tf->tf_fs = scp->sc_fs;
    468   1.90  christos 		tf->tf_es = scp->sc_es;
    469   1.90  christos 		tf->tf_ds = scp->sc_ds;
    470   1.83  christos #ifdef VM86
    471   1.83  christos 		if (tf->tf_eflags & PSL_VM)
    472   1.83  christos 			(*p->p_emul->e_syscall_intern)(p);
    473   1.83  christos #endif
    474   1.90  christos 		tf->tf_eflags = scp->sc_eflags;
    475    1.4   mycroft 	}
    476   1.90  christos 	tf->tf_edi = scp->sc_edi;
    477   1.90  christos 	tf->tf_esi = scp->sc_esi;
    478   1.90  christos 	tf->tf_ebp = scp->sc_ebp;
    479   1.90  christos 	tf->tf_ebx = scp->sc_ebx;
    480   1.90  christos 	tf->tf_edx = scp->sc_edx;
    481   1.90  christos 	tf->tf_ecx = scp->sc_ecx;
    482   1.90  christos 	tf->tf_eax = scp->sc_eax;
    483   1.90  christos 	tf->tf_eip = scp->sc_eip;
    484   1.90  christos 	tf->tf_cs = scp->sc_cs;
    485   1.90  christos 	tf->tf_esp = scp->sc_esp_at_signal;
    486   1.90  christos 	tf->tf_ss = scp->sc_ss;
    487   1.26   mycroft 
    488   1.42   mycroft 	/* Restore signal stack. */
    489   1.66  jdolecek 	/*
    490   1.66  jdolecek 	 * Linux really does it this way; it doesn't have space in sigframe
    491   1.66  jdolecek 	 * to save the onstack flag.
    492   1.66  jdolecek 	 */
    493  1.135        ad 	mutex_enter(p->p_lock);
    494  1.123  christos 	ss_gap = (ssize_t)((char *)scp->sc_esp_at_signal - (char *)sas->ss_sp);
    495   1.82  christos 	if (ss_gap >= 0 && ss_gap < sas->ss_size)
    496   1.82  christos 		sas->ss_flags |= SS_ONSTACK;
    497   1.66  jdolecek 	else
    498   1.82  christos 		sas->ss_flags &= ~SS_ONSTACK;
    499   1.42   mycroft 
    500   1.42   mycroft 	/* Restore signal mask. */
    501   1.90  christos 	linux_old_to_native_sigset(&mask, &scp->sc_mask);
    502  1.122        ad 	(void) sigprocmask1(l, SIG_SETMASK, &mask, 0);
    503  1.135        ad 	mutex_exit(p->p_lock);
    504  1.122        ad 
    505  1.149       chs 	DPRINTF(("sigreturn exit esp=0x%x eip=0x%x\n", tf->tf_esp, tf->tf_eip));
    506   1.83  christos 	return EJUSTRETURN;
    507    1.6   mycroft }
    508    1.6   mycroft 
    509    1.7   mycroft #ifdef USER_LDT
    510    1.7   mycroft 
    511  1.128       dsl static int
    512  1.133       dsl linux_read_ldt(struct lwp *l, const struct linux_sys_modify_ldt_args *uap,
    513  1.128       dsl     register_t *retval)
    514    1.7   mycroft {
    515  1.124        ad 	struct x86_get_ldt_args gl;
    516    1.7   mycroft 	int error;
    517  1.128       dsl 	union descriptor *ldt_buf;
    518  1.143        ad 	size_t sz;
    519  1.128       dsl 
    520  1.128       dsl 	/*
    521  1.128       dsl 	 * I've checked the linux code - this function is asymetric with
    522  1.128       dsl 	 * linux_write_ldt, and returns raw ldt entries.
    523  1.128       dsl 	 * NB, the code I saw zerod the spare parts of the user buffer.
    524  1.128       dsl 	 */
    525    1.7   mycroft 
    526   1.72  christos 	DPRINTF(("linux_read_ldt!"));
    527  1.128       dsl 
    528  1.143        ad 	sz = 8192 * sizeof(*ldt_buf);
    529  1.143        ad 	ldt_buf = kmem_zalloc(sz, KM_SLEEP);
    530    1.7   mycroft 	gl.start = 0;
    531  1.128       dsl 	gl.desc = NULL;
    532    1.7   mycroft 	gl.num = SCARG(uap, bytecount) / sizeof(union descriptor);
    533  1.128       dsl 	error = x86_get_ldt1(l, &gl, ldt_buf);
    534  1.128       dsl 	/* NB gl.num might have changed */
    535  1.128       dsl 	if (error == 0) {
    536  1.128       dsl 		*retval = gl.num * sizeof *ldt;
    537  1.128       dsl 		error = copyout(ldt_buf, SCARG(uap, ptr),
    538  1.128       dsl 		    gl.num * sizeof *ldt_buf);
    539  1.128       dsl 	}
    540  1.143        ad 	kmem_free(ldt_buf, sz);
    541    1.7   mycroft 
    542  1.128       dsl 	return error;
    543    1.7   mycroft }
    544    1.7   mycroft 
    545    1.7   mycroft struct linux_ldt_info {
    546    1.7   mycroft 	u_int entry_number;
    547    1.7   mycroft 	u_long base_addr;
    548    1.7   mycroft 	u_int limit;
    549    1.7   mycroft 	u_int seg_32bit:1;
    550    1.7   mycroft 	u_int contents:2;
    551    1.7   mycroft 	u_int read_exec_only:1;
    552    1.7   mycroft 	u_int limit_in_pages:1;
    553    1.7   mycroft 	u_int seg_not_present:1;
    554   1.72  christos 	u_int useable:1;
    555    1.7   mycroft };
    556    1.7   mycroft 
    557  1.128       dsl static int
    558  1.133       dsl linux_write_ldt(struct lwp *l, const struct linux_sys_modify_ldt_args *uap,
    559  1.128       dsl     int oldmode)
    560    1.7   mycroft {
    561    1.7   mycroft 	struct linux_ldt_info ldt_info;
    562  1.128       dsl 	union descriptor d;
    563  1.124        ad 	struct x86_set_ldt_args sl;
    564    1.7   mycroft 	int error;
    565    1.7   mycroft 
    566   1.72  christos 	DPRINTF(("linux_write_ldt %d\n", oldmode));
    567    1.7   mycroft 	if (SCARG(uap, bytecount) != sizeof(ldt_info))
    568    1.7   mycroft 		return (EINVAL);
    569   1.29  christos 	if ((error = copyin(SCARG(uap, ptr), &ldt_info, sizeof(ldt_info))) != 0)
    570    1.7   mycroft 		return error;
    571   1.72  christos 	if (ldt_info.entry_number >= 8192)
    572    1.7   mycroft 		return (EINVAL);
    573   1.72  christos 	if (ldt_info.contents == 3) {
    574   1.72  christos 		if (oldmode)
    575   1.72  christos 			return (EINVAL);
    576   1.72  christos 		if (ldt_info.seg_not_present)
    577   1.72  christos 			return (EINVAL);
    578   1.72  christos 	}
    579    1.7   mycroft 
    580   1.72  christos 	if (ldt_info.base_addr == 0 && ldt_info.limit == 0 &&
    581   1.72  christos 	    (oldmode || (ldt_info.contents == 0 &&
    582   1.72  christos 	    ldt_info.read_exec_only == 1 && ldt_info.seg_32bit == 0 &&
    583   1.72  christos 	    ldt_info.limit_in_pages == 0 && ldt_info.seg_not_present == 1 &&
    584   1.72  christos 	    ldt_info.useable == 0))) {
    585   1.70  christos 		/* this means you should zero the ldt */
    586  1.128       dsl 		(void)memset(&d, 0, sizeof(d));
    587   1.70  christos 	} else {
    588  1.128       dsl 		d.sd.sd_lobase = ldt_info.base_addr & 0xffffff;
    589  1.128       dsl 		d.sd.sd_hibase = (ldt_info.base_addr >> 24) & 0xff;
    590  1.128       dsl 		d.sd.sd_lolimit = ldt_info.limit & 0xffff;
    591  1.128       dsl 		d.sd.sd_hilimit = (ldt_info.limit >> 16) & 0xf;
    592  1.128       dsl 		d.sd.sd_type = 16 | (ldt_info.contents << 2) |
    593   1.70  christos 		    (!ldt_info.read_exec_only << 1);
    594  1.128       dsl 		d.sd.sd_dpl = SEL_UPL;
    595  1.128       dsl 		d.sd.sd_p = !ldt_info.seg_not_present;
    596  1.128       dsl 		d.sd.sd_def32 = ldt_info.seg_32bit;
    597  1.128       dsl 		d.sd.sd_gran = ldt_info.limit_in_pages;
    598   1.72  christos 		if (!oldmode)
    599  1.128       dsl 			d.sd.sd_xx = ldt_info.useable;
    600   1.73  christos 		else
    601  1.128       dsl 			d.sd.sd_xx = 0;
    602   1.70  christos 	}
    603    1.7   mycroft 	sl.start = ldt_info.entry_number;
    604  1.147   mbalmer 	sl.desc = NULL;
    605    1.7   mycroft 	sl.num = 1;
    606    1.7   mycroft 
    607   1.72  christos 	DPRINTF(("linux_write_ldt: idx=%d, base=0x%lx, limit=0x%x\n",
    608   1.72  christos 	    ldt_info.entry_number, ldt_info.base_addr, ldt_info.limit));
    609    1.7   mycroft 
    610  1.128       dsl 	return x86_set_ldt1(l, &sl, &d);
    611    1.7   mycroft }
    612    1.7   mycroft 
    613    1.7   mycroft #endif /* USER_LDT */
    614    1.7   mycroft 
    615    1.6   mycroft int
    616  1.133       dsl linux_sys_modify_ldt(struct lwp *l, const struct linux_sys_modify_ldt_args *uap, register_t *retval)
    617   1.19   thorpej {
    618  1.133       dsl 	/* {
    619    1.6   mycroft 		syscallarg(int) func;
    620    1.6   mycroft 		syscallarg(void *) ptr;
    621    1.6   mycroft 		syscallarg(size_t) bytecount;
    622  1.133       dsl 	} */
    623    1.6   mycroft 
    624    1.6   mycroft 	switch (SCARG(uap, func)) {
    625    1.7   mycroft #ifdef USER_LDT
    626    1.6   mycroft 	case 0:
    627  1.133       dsl 		return linux_read_ldt(l, (const void *)uap, retval);
    628    1.6   mycroft 	case 1:
    629  1.133       dsl 		return linux_write_ldt(l, (const void *)uap, 1);
    630   1.72  christos 	case 2:
    631   1.72  christos #ifdef notyet
    632  1.148       wiz 		return linux_read_default_ldt(l, (const void *)uap, retval);
    633   1.72  christos #else
    634   1.72  christos 		return (ENOSYS);
    635   1.72  christos #endif
    636   1.72  christos 	case 0x11:
    637  1.133       dsl 		return linux_write_ldt(l, (const void *)uap, 0);
    638    1.7   mycroft #endif /* USER_LDT */
    639    1.7   mycroft 
    640    1.6   mycroft 	default:
    641    1.6   mycroft 		return (ENOSYS);
    642    1.6   mycroft 	}
    643   1.13      fvdl }
    644   1.13      fvdl 
    645   1.13      fvdl /*
    646   1.13      fvdl  * XXX Pathetic hack to make svgalib work. This will fake the major
    647   1.13      fvdl  * device number of an opened VT so that svgalib likes it. grmbl.
    648   1.13      fvdl  * Should probably do it 'wrong the right way' and use a mapping
    649   1.13      fvdl  * array for all major device numbers, and map linux_mknod too.
    650   1.13      fvdl  */
    651   1.13      fvdl dev_t
    652  1.132       dsl linux_fakedev(dev_t dev, int raw)
    653   1.13      fvdl {
    654  1.104  christos 	extern const struct cdevsw ptc_cdevsw, pts_cdevsw;
    655  1.104  christos 	const struct cdevsw *cd = cdevsw_lookup(dev);
    656  1.104  christos 
    657   1.69  christos 	if (raw) {
    658   1.41  drochner #if (NWSDISPLAY > 0)
    659   1.79   gehenna 		extern const struct cdevsw wsdisplay_cdevsw;
    660  1.104  christos 		if (cd == &wsdisplay_cdevsw)
    661   1.69  christos 			return makedev(LINUX_CONS_MAJOR, (minor(dev) + 1));
    662   1.41  drochner #endif
    663   1.69  christos 	}
    664   1.77  jdolecek 
    665  1.104  christos 	if (cd == &ptc_cdevsw)
    666  1.104  christos 		return makedev(LINUX_PTC_MAJOR, minor(dev));
    667  1.104  christos 	if (cd == &pts_cdevsw)
    668  1.104  christos 		return makedev(LINUX_PTS_MAJOR, minor(dev));
    669  1.104  christos 
    670   1.77  jdolecek 	return dev;
    671   1.13      fvdl }
    672   1.13      fvdl 
    673   1.49     jhawk #if (NWSDISPLAY > 0)
    674   1.41  drochner /*
    675   1.41  drochner  * That's not complete, but enough to get an X server running.
    676   1.41  drochner  */
    677   1.41  drochner #define NR_KEYS 128
    678   1.61  jdolecek static const u_short plain_map[NR_KEYS] = {
    679   1.41  drochner 	0x0200,	0x001b,	0x0031,	0x0032,	0x0033,	0x0034,	0x0035,	0x0036,
    680   1.41  drochner 	0x0037,	0x0038,	0x0039,	0x0030,	0x002d,	0x003d,	0x007f,	0x0009,
    681   1.41  drochner 	0x0b71,	0x0b77,	0x0b65,	0x0b72,	0x0b74,	0x0b79,	0x0b75,	0x0b69,
    682   1.41  drochner 	0x0b6f,	0x0b70,	0x005b,	0x005d,	0x0201,	0x0702,	0x0b61,	0x0b73,
    683   1.41  drochner 	0x0b64,	0x0b66,	0x0b67,	0x0b68,	0x0b6a,	0x0b6b,	0x0b6c,	0x003b,
    684   1.41  drochner 	0x0027,	0x0060,	0x0700,	0x005c,	0x0b7a,	0x0b78,	0x0b63,	0x0b76,
    685   1.41  drochner 	0x0b62,	0x0b6e,	0x0b6d,	0x002c,	0x002e,	0x002f,	0x0700,	0x030c,
    686   1.41  drochner 	0x0703,	0x0020,	0x0207,	0x0100,	0x0101,	0x0102,	0x0103,	0x0104,
    687   1.41  drochner 	0x0105,	0x0106,	0x0107,	0x0108,	0x0109,	0x0208,	0x0209,	0x0307,
    688   1.41  drochner 	0x0308,	0x0309,	0x030b,	0x0304,	0x0305,	0x0306,	0x030a,	0x0301,
    689   1.41  drochner 	0x0302,	0x0303,	0x0300,	0x0310,	0x0206,	0x0200,	0x003c,	0x010a,
    690   1.41  drochner 	0x010b,	0x0200,	0x0200,	0x0200,	0x0200,	0x0200,	0x0200,	0x0200,
    691   1.41  drochner 	0x030e,	0x0702,	0x030d,	0x001c,	0x0701,	0x0205,	0x0114,	0x0603,
    692   1.41  drochner 	0x0118,	0x0601,	0x0602,	0x0117,	0x0600,	0x0119,	0x0115,	0x0116,
    693   1.41  drochner 	0x011a,	0x010c,	0x010d,	0x011b,	0x011c,	0x0110,	0x0311,	0x011d,
    694   1.41  drochner 	0x0200,	0x0200,	0x0200,	0x0200,	0x0200,	0x0200,	0x0200,	0x0200,
    695   1.41  drochner }, shift_map[NR_KEYS] = {
    696   1.41  drochner 	0x0200,	0x001b,	0x0021,	0x0040,	0x0023,	0x0024,	0x0025,	0x005e,
    697   1.41  drochner 	0x0026,	0x002a,	0x0028,	0x0029,	0x005f,	0x002b,	0x007f,	0x0009,
    698   1.41  drochner 	0x0b51,	0x0b57,	0x0b45,	0x0b52,	0x0b54,	0x0b59,	0x0b55,	0x0b49,
    699   1.41  drochner 	0x0b4f,	0x0b50,	0x007b,	0x007d,	0x0201,	0x0702,	0x0b41,	0x0b53,
    700   1.41  drochner 	0x0b44,	0x0b46,	0x0b47,	0x0b48,	0x0b4a,	0x0b4b,	0x0b4c,	0x003a,
    701   1.41  drochner 	0x0022,	0x007e,	0x0700,	0x007c,	0x0b5a,	0x0b58,	0x0b43,	0x0b56,
    702   1.41  drochner 	0x0b42,	0x0b4e,	0x0b4d,	0x003c,	0x003e,	0x003f,	0x0700,	0x030c,
    703   1.41  drochner 	0x0703,	0x0020,	0x0207,	0x010a,	0x010b,	0x010c,	0x010d,	0x010e,
    704   1.41  drochner 	0x010f,	0x0110,	0x0111,	0x0112,	0x0113,	0x0213,	0x0203,	0x0307,
    705   1.41  drochner 	0x0308,	0x0309,	0x030b,	0x0304,	0x0305,	0x0306,	0x030a,	0x0301,
    706   1.41  drochner 	0x0302,	0x0303,	0x0300,	0x0310,	0x0206,	0x0200,	0x003e,	0x010a,
    707   1.41  drochner 	0x010b,	0x0200,	0x0200,	0x0200,	0x0200,	0x0200,	0x0200,	0x0200,
    708   1.41  drochner 	0x030e,	0x0702,	0x030d,	0x0200,	0x0701,	0x0205,	0x0114,	0x0603,
    709   1.41  drochner 	0x020b,	0x0601,	0x0602,	0x0117,	0x0600,	0x020a,	0x0115,	0x0116,
    710   1.41  drochner 	0x011a,	0x010c,	0x010d,	0x011b,	0x011c,	0x0110,	0x0311,	0x011d,
    711   1.41  drochner 	0x0200,	0x0200,	0x0200,	0x0200,	0x0200,	0x0200,	0x0200,	0x0200,
    712   1.41  drochner }, altgr_map[NR_KEYS] = {
    713   1.41  drochner 	0x0200,	0x0200,	0x0200,	0x0040,	0x0200,	0x0024,	0x0200,	0x0200,
    714   1.41  drochner 	0x007b,	0x005b,	0x005d,	0x007d,	0x005c,	0x0200,	0x0200,	0x0200,
    715   1.41  drochner 	0x0b71,	0x0b77,	0x0918,	0x0b72,	0x0b74,	0x0b79,	0x0b75,	0x0b69,
    716   1.41  drochner 	0x0b6f,	0x0b70,	0x0200,	0x007e,	0x0201,	0x0702,	0x0914,	0x0b73,
    717   1.41  drochner 	0x0917,	0x0919,	0x0b67,	0x0b68,	0x0b6a,	0x0b6b,	0x0b6c,	0x0200,
    718   1.41  drochner 	0x0200,	0x0200,	0x0700,	0x0200,	0x0b7a,	0x0b78,	0x0916,	0x0b76,
    719   1.41  drochner 	0x0915,	0x0b6e,	0x0b6d,	0x0200,	0x0200,	0x0200,	0x0700,	0x030c,
    720   1.41  drochner 	0x0703,	0x0200,	0x0207,	0x050c,	0x050d,	0x050e,	0x050f,	0x0510,
    721   1.41  drochner 	0x0511,	0x0512,	0x0513,	0x0514,	0x0515,	0x0208,	0x0202,	0x0911,
    722   1.41  drochner 	0x0912,	0x0913,	0x030b,	0x090e,	0x090f,	0x0910,	0x030a,	0x090b,
    723   1.41  drochner 	0x090c,	0x090d,	0x090a,	0x0310,	0x0206,	0x0200,	0x007c,	0x0516,
    724   1.41  drochner 	0x0517,	0x0200,	0x0200,	0x0200,	0x0200,	0x0200,	0x0200,	0x0200,
    725   1.41  drochner 	0x030e,	0x0702,	0x030d,	0x0200,	0x0701,	0x0205,	0x0114,	0x0603,
    726   1.41  drochner 	0x0118,	0x0601,	0x0602,	0x0117,	0x0600,	0x0119,	0x0115,	0x0116,
    727   1.41  drochner 	0x011a,	0x010c,	0x010d,	0x011b,	0x011c,	0x0110,	0x0311,	0x011d,
    728   1.41  drochner 	0x0200,	0x0200,	0x0200,	0x0200,	0x0200,	0x0200,	0x0200,	0x0200,
    729   1.41  drochner }, ctrl_map[NR_KEYS] = {
    730   1.41  drochner 	0x0200,	0x0200,	0x0200,	0x0000,	0x001b,	0x001c,	0x001d,	0x001e,
    731   1.41  drochner 	0x001f,	0x007f,	0x0200,	0x0200,	0x001f,	0x0200,	0x0008,	0x0200,
    732   1.41  drochner 	0x0011,	0x0017,	0x0005,	0x0012,	0x0014,	0x0019,	0x0015,	0x0009,
    733   1.41  drochner 	0x000f,	0x0010,	0x001b,	0x001d,	0x0201,	0x0702,	0x0001,	0x0013,
    734   1.41  drochner 	0x0004,	0x0006,	0x0007,	0x0008,	0x000a,	0x000b,	0x000c,	0x0200,
    735   1.41  drochner 	0x0007,	0x0000,	0x0700,	0x001c,	0x001a,	0x0018,	0x0003,	0x0016,
    736   1.41  drochner 	0x0002,	0x000e,	0x000d,	0x0200,	0x020e,	0x007f,	0x0700,	0x030c,
    737   1.41  drochner 	0x0703,	0x0000,	0x0207,	0x0100,	0x0101,	0x0102,	0x0103,	0x0104,
    738   1.41  drochner 	0x0105,	0x0106,	0x0107,	0x0108,	0x0109,	0x0208,	0x0204,	0x0307,
    739   1.41  drochner 	0x0308,	0x0309,	0x030b,	0x0304,	0x0305,	0x0306,	0x030a,	0x0301,
    740   1.41  drochner 	0x0302,	0x0303,	0x0300,	0x0310,	0x0206,	0x0200,	0x0200,	0x010a,
    741   1.41  drochner 	0x010b,	0x0200,	0x0200,	0x0200,	0x0200,	0x0200,	0x0200,	0x0200,
    742   1.41  drochner 	0x030e,	0x0702,	0x030d,	0x001c,	0x0701,	0x0205,	0x0114,	0x0603,
    743   1.41  drochner 	0x0118,	0x0601,	0x0602,	0x0117,	0x0600,	0x0119,	0x0115,	0x0116,
    744   1.41  drochner 	0x011a,	0x010c,	0x010d,	0x011b,	0x011c,	0x0110,	0x0311,	0x011d,
    745   1.41  drochner 	0x0200,	0x0200,	0x0200,	0x0200,	0x0200,	0x0200,	0x0200,	0x0200,
    746   1.41  drochner };
    747   1.41  drochner 
    748   1.61  jdolecek const u_short * const linux_keytabs[] = {
    749   1.41  drochner 	plain_map, shift_map, altgr_map, altgr_map, ctrl_map
    750   1.41  drochner };
    751   1.41  drochner #endif
    752   1.41  drochner 
    753   1.52      fvdl static struct biosdisk_info *
    754  1.119  christos fd2biosinfo(struct proc *p, struct file *fp)
    755   1.52      fvdl {
    756   1.52      fvdl 	struct vnode *vp;
    757   1.52      fvdl 	const char *blkname;
    758   1.52      fvdl 	char diskname[16];
    759   1.52      fvdl 	int i;
    760   1.52      fvdl 	struct nativedisk_info *nip;
    761  1.103   thorpej 	struct disklist *dl = x86_alldisks;
    762   1.52      fvdl 
    763   1.52      fvdl 	if (fp->f_type != DTYPE_VNODE)
    764   1.52      fvdl 		return NULL;
    765   1.52      fvdl 	vp = (struct vnode *)fp->f_data;
    766   1.52      fvdl 
    767   1.52      fvdl 	if (vp->v_type != VBLK)
    768   1.52      fvdl 		return NULL;
    769   1.52      fvdl 
    770   1.79   gehenna 	blkname = devsw_blk2name(major(vp->v_rdev));
    771  1.142  christos 	snprintf(diskname, sizeof diskname, "%s%llu", blkname,
    772  1.142  christos 	    (unsigned long long)DISKUNIT(vp->v_rdev));
    773   1.52      fvdl 
    774   1.52      fvdl 	for (i = 0; i < dl->dl_nnativedisks; i++) {
    775   1.52      fvdl 		nip = &dl->dl_nativedisks[i];
    776   1.52      fvdl 		if (strcmp(diskname, nip->ni_devname))
    777   1.52      fvdl 			continue;
    778   1.52      fvdl 		if (nip->ni_nmatches != 0)
    779   1.52      fvdl 			return &dl->dl_biosdisks[nip->ni_biosmatches[0]];
    780   1.52      fvdl 	}
    781   1.52      fvdl 
    782   1.52      fvdl 	return NULL;
    783   1.52      fvdl }
    784   1.52      fvdl 
    785   1.52      fvdl 
    786   1.13      fvdl /*
    787   1.13      fvdl  * We come here in a last attempt to satisfy a Linux ioctl() call
    788   1.13      fvdl  */
    789   1.13      fvdl int
    790  1.133       dsl linux_machdepioctl(struct lwp *l, const struct linux_sys_ioctl_args *uap, register_t *retval)
    791   1.19   thorpej {
    792  1.133       dsl 	/* {
    793   1.13      fvdl 		syscallarg(int) fd;
    794   1.13      fvdl 		syscallarg(u_long) com;
    795  1.123  christos 		syscallarg(void *) data;
    796  1.133       dsl 	} */
    797   1.29  christos 	struct sys_ioctl_args bia;
    798   1.15      fvdl 	u_long com;
    799   1.52      fvdl 	int error, error1;
    800   1.50     veego #if (NWSDISPLAY > 0)
    801   1.13      fvdl 	struct vt_mode lvt;
    802   1.41  drochner 	struct kbentry kbe;
    803   1.41  drochner #endif
    804   1.52      fvdl 	struct linux_hd_geometry hdg;
    805   1.52      fvdl 	struct linux_hd_big_geometry hdg_big;
    806   1.52      fvdl 	struct biosdisk_info *bip;
    807  1.134        ad 	file_t *fp;
    808   1.52      fvdl 	int fd;
    809   1.52      fvdl 	struct disklabel label, *labp;
    810   1.52      fvdl 	struct partinfo partp;
    811  1.134        ad 	int (*ioctlf)(struct file *, u_long, void *);
    812   1.52      fvdl 	u_long start, biostotal, realtotal;
    813   1.52      fvdl 	u_char heads, sectors;
    814   1.52      fvdl 	u_int cylinders;
    815   1.55      fvdl 	struct ioctl_pt pt;
    816   1.13      fvdl 
    817   1.52      fvdl 	fd = SCARG(uap, fd);
    818   1.52      fvdl 	SCARG(&bia, fd) = fd;
    819   1.13      fvdl 	SCARG(&bia, data) = SCARG(uap, data);
    820   1.13      fvdl 	com = SCARG(uap, com);
    821   1.13      fvdl 
    822  1.134        ad 	if ((fp = fd_getfile(fd)) == NULL)
    823   1.53   thorpej 		return (EBADF);
    824   1.52      fvdl 
    825   1.13      fvdl 	switch (com) {
    826   1.50     veego #if (NWSDISPLAY > 0)
    827   1.13      fvdl 	case LINUX_KDGKBMODE:
    828   1.21      fvdl 		com = KDGKBMODE;
    829   1.21      fvdl 		break;
    830   1.13      fvdl 	case LINUX_KDSKBMODE:
    831   1.13      fvdl 		com = KDSKBMODE;
    832   1.13      fvdl 		if ((unsigned)SCARG(uap, data) == LINUX_K_MEDIUMRAW)
    833  1.123  christos 			SCARG(&bia, data) = (void *)K_RAW;
    834   1.13      fvdl 		break;
    835   1.59      fvdl 	case LINUX_KIOCSOUND:
    836   1.59      fvdl 		SCARG(&bia, data) =
    837  1.123  christos 		    (void *)(((unsigned long)SCARG(&bia, data)) & 0xffff);
    838   1.59      fvdl 		/* fall through */
    839   1.13      fvdl 	case LINUX_KDMKTONE:
    840   1.13      fvdl 		com = KDMKTONE;
    841   1.13      fvdl 		break;
    842   1.13      fvdl 	case LINUX_KDSETMODE:
    843   1.13      fvdl 		com = KDSETMODE;
    844   1.58      fvdl 		break;
    845   1.58      fvdl 	case LINUX_KDGETMODE:
    846   1.58      fvdl 		/* KD_* values are equal to the wscons numbers */
    847   1.58      fvdl 		com = WSDISPLAYIO_GMODE;
    848   1.13      fvdl 		break;
    849   1.13      fvdl 	case LINUX_KDENABIO:
    850   1.13      fvdl 		com = KDENABIO;
    851   1.13      fvdl 		break;
    852   1.13      fvdl 	case LINUX_KDDISABIO:
    853   1.13      fvdl 		com = KDDISABIO;
    854   1.13      fvdl 		break;
    855   1.13      fvdl 	case LINUX_KDGETLED:
    856   1.13      fvdl 		com = KDGETLED;
    857   1.13      fvdl 		break;
    858   1.13      fvdl 	case LINUX_KDSETLED:
    859   1.13      fvdl 		com = KDSETLED;
    860   1.13      fvdl 		break;
    861   1.13      fvdl 	case LINUX_VT_OPENQRY:
    862   1.13      fvdl 		com = VT_OPENQRY;
    863   1.13      fvdl 		break;
    864   1.13      fvdl 	case LINUX_VT_GETMODE:
    865  1.134        ad 		error = fp->f_ops->fo_ioctl(fp, VT_GETMODE, &lvt);
    866  1.129       dsl 		if (error != 0)
    867   1.86      yamt 			goto out;
    868   1.74  christos 		lvt.relsig = native_to_linux_signo[lvt.relsig];
    869   1.74  christos 		lvt.acqsig = native_to_linux_signo[lvt.acqsig];
    870   1.74  christos 		lvt.frsig = native_to_linux_signo[lvt.frsig];
    871  1.129       dsl 		error = copyout(&lvt, SCARG(uap, data), sizeof (lvt));
    872   1.86      yamt 		goto out;
    873   1.13      fvdl 	case LINUX_VT_SETMODE:
    874  1.129       dsl 		error = copyin(SCARG(uap, data), &lvt, sizeof (lvt));
    875  1.129       dsl 		if (error != 0)
    876   1.86      yamt 			goto out;
    877   1.74  christos 		lvt.relsig = linux_to_native_signo[lvt.relsig];
    878   1.74  christos 		lvt.acqsig = linux_to_native_signo[lvt.acqsig];
    879   1.74  christos 		lvt.frsig = linux_to_native_signo[lvt.frsig];
    880  1.134        ad 		error = fp->f_ops->fo_ioctl(fp, VT_SETMODE, &lvt);
    881  1.129       dsl 		goto out;
    882   1.52      fvdl 	case LINUX_VT_DISALLOCATE:
    883   1.52      fvdl 		/* XXX should use WSDISPLAYIO_DELSCREEN */
    884   1.86      yamt 		error = 0;
    885   1.86      yamt 		goto out;
    886   1.13      fvdl 	case LINUX_VT_RELDISP:
    887   1.13      fvdl 		com = VT_RELDISP;
    888   1.13      fvdl 		break;
    889   1.13      fvdl 	case LINUX_VT_ACTIVATE:
    890   1.13      fvdl 		com = VT_ACTIVATE;
    891   1.13      fvdl 		break;
    892   1.13      fvdl 	case LINUX_VT_WAITACTIVE:
    893   1.13      fvdl 		com = VT_WAITACTIVE;
    894   1.13      fvdl 		break;
    895   1.41  drochner 	case LINUX_VT_GETSTATE:
    896   1.41  drochner 		com = VT_GETSTATE;
    897   1.41  drochner 		break;
    898   1.41  drochner 	case LINUX_KDGKBTYPE:
    899   1.91  jdolecek 	    {
    900   1.91  jdolecek 		static const u_int8_t kb101 = KB_101;
    901   1.91  jdolecek 
    902   1.41  drochner 		/* This is what Linux does. */
    903   1.91  jdolecek 		error = copyout(&kb101, SCARG(uap, data), 1);
    904   1.86      yamt 		goto out;
    905   1.91  jdolecek 	    }
    906   1.41  drochner 	case LINUX_KDGKBENT:
    907   1.41  drochner 		/*
    908   1.41  drochner 		 * The Linux KDGKBENT ioctl is different from the
    909   1.41  drochner 		 * SYSV original. So we handle it in machdep code.
    910   1.41  drochner 		 * XXX We should use keyboard mapping information
    911   1.41  drochner 		 * from wsdisplay, but this would be expensive.
    912   1.41  drochner 		 */
    913   1.41  drochner 		if ((error = copyin(SCARG(uap, data), &kbe,
    914   1.41  drochner 				    sizeof(struct kbentry))))
    915   1.86      yamt 			goto out;
    916   1.41  drochner 		if (kbe.kb_table >= sizeof(linux_keytabs) / sizeof(u_short *)
    917   1.86      yamt 		    || kbe.kb_index >= NR_KEYS) {
    918   1.86      yamt 			error = EINVAL;
    919   1.86      yamt 			goto out;
    920   1.86      yamt 		}
    921   1.41  drochner 		kbe.kb_value = linux_keytabs[kbe.kb_table][kbe.kb_index];
    922   1.86      yamt 		error = copyout(&kbe, SCARG(uap, data),
    923   1.86      yamt 				sizeof(struct kbentry));
    924   1.86      yamt 		goto out;
    925   1.54      fvdl #endif
    926   1.52      fvdl 	case LINUX_HDIO_GETGEO:
    927   1.52      fvdl 	case LINUX_HDIO_GETGEO_BIG:
    928   1.52      fvdl 		/*
    929   1.52      fvdl 		 * Try to mimic Linux behaviour: return the BIOS geometry
    930   1.52      fvdl 		 * if possible (extending its # of cylinders if it's beyond
    931   1.52      fvdl 		 * the 1023 limit), fall back to the MI geometry (i.e.
    932   1.52      fvdl 		 * the real geometry) if not found, by returning an
    933   1.52      fvdl 		 * error. See common/linux_hdio.c
    934   1.52      fvdl 		 */
    935  1.134        ad 		bip = fd2biosinfo(curproc, fp);
    936   1.52      fvdl 		ioctlf = fp->f_ops->fo_ioctl;
    937  1.134        ad 		error = ioctlf(fp, DIOCGDEFLABEL, (void *)&label);
    938  1.134        ad 		error1 = ioctlf(fp, DIOCGPART, (void *)&partp);
    939   1.86      yamt 		if (error != 0 && error1 != 0) {
    940   1.86      yamt 			error = error1;
    941   1.86      yamt 			goto out;
    942   1.86      yamt 		}
    943   1.52      fvdl 		labp = error != 0 ? &label : partp.disklab;
    944   1.52      fvdl 		start = error1 != 0 ? partp.part->p_offset : 0;
    945   1.52      fvdl 		if (bip != NULL && bip->bi_head != 0 && bip->bi_sec != 0
    946   1.52      fvdl 		    && bip->bi_cyl != 0) {
    947   1.52      fvdl 			heads = bip->bi_head;
    948   1.52      fvdl 			sectors = bip->bi_sec;
    949   1.52      fvdl 			cylinders = bip->bi_cyl;
    950   1.52      fvdl 			biostotal = heads * sectors * cylinders;
    951   1.52      fvdl 			realtotal = labp->d_ntracks * labp->d_nsectors *
    952   1.52      fvdl 			    labp->d_ncylinders;
    953   1.52      fvdl 			if (realtotal > biostotal)
    954   1.52      fvdl 				cylinders = realtotal / (heads * sectors);
    955   1.52      fvdl 		} else {
    956   1.52      fvdl 			heads = labp->d_ntracks;
    957   1.52      fvdl 			cylinders = labp->d_ncylinders;
    958   1.52      fvdl 			sectors = labp->d_nsectors;
    959   1.52      fvdl 		}
    960   1.52      fvdl 		if (com == LINUX_HDIO_GETGEO) {
    961   1.52      fvdl 			hdg.start = start;
    962   1.52      fvdl 			hdg.heads = heads;
    963   1.52      fvdl 			hdg.cylinders = cylinders;
    964   1.52      fvdl 			hdg.sectors = sectors;
    965   1.86      yamt 			error = copyout(&hdg, SCARG(uap, data), sizeof hdg);
    966   1.86      yamt 			goto out;
    967   1.52      fvdl 		} else {
    968   1.52      fvdl 			hdg_big.start = start;
    969   1.52      fvdl 			hdg_big.heads = heads;
    970   1.52      fvdl 			hdg_big.cylinders = cylinders;
    971   1.52      fvdl 			hdg_big.sectors = sectors;
    972   1.86      yamt 			error = copyout(&hdg_big, SCARG(uap, data),
    973   1.52      fvdl 			    sizeof hdg_big);
    974   1.86      yamt 			goto out;
    975   1.52      fvdl 		}
    976   1.52      fvdl 
    977   1.13      fvdl 	default:
    978   1.54      fvdl 		/*
    979   1.55      fvdl 		 * Unknown to us. If it's on a device, just pass it through
    980   1.55      fvdl 		 * using PTIOCLINUX, the device itself might be able to
    981   1.55      fvdl 		 * make some sense of it.
    982   1.57      fvdl 		 * XXX hack: if the function returns EJUSTRETURN,
    983   1.57      fvdl 		 * it has stuffed a sysctl return value in pt.data.
    984   1.54      fvdl 		 */
    985   1.55      fvdl 		ioctlf = fp->f_ops->fo_ioctl;
    986   1.55      fvdl 		pt.com = SCARG(uap, com);
    987   1.55      fvdl 		pt.data = SCARG(uap, data);
    988  1.134        ad 		error = ioctlf(fp, PTIOCLINUX, &pt);
    989   1.57      fvdl 		if (error == EJUSTRETURN) {
    990   1.57      fvdl 			retval[0] = (register_t)pt.data;
    991   1.57      fvdl 			error = 0;
    992   1.57      fvdl 		}
    993   1.55      fvdl 
    994  1.115  christos 		if (error == ENOTTY) {
    995   1.72  christos 			DPRINTF(("linux_machdepioctl: invalid ioctl %08lx\n",
    996   1.72  christos 			    com));
    997  1.115  christos 		}
    998   1.86      yamt 		goto out;
    999   1.13      fvdl 	}
   1000   1.13      fvdl 	SCARG(&bia, com) = com;
   1001   1.86      yamt 	error = sys_ioctl(curlwp, &bia, retval);
   1002   1.86      yamt out:
   1003  1.134        ad 	fd_putfile(fd);
   1004   1.86      yamt 	return error;
   1005   1.13      fvdl }
   1006   1.13      fvdl 
   1007   1.13      fvdl /*
   1008   1.13      fvdl  * Set I/O permissions for a process. Just set the maximum level
   1009   1.13      fvdl  * right away (ignoring the argument), otherwise we would have
   1010   1.13      fvdl  * to rely on I/O permission maps, which are not implemented.
   1011   1.13      fvdl  */
   1012   1.13      fvdl int
   1013  1.133       dsl linux_sys_iopl(struct lwp *l, const struct linux_sys_iopl_args *uap, register_t *retval)
   1014   1.19   thorpej {
   1015  1.133       dsl 	/* {
   1016   1.13      fvdl 		syscallarg(int) level;
   1017  1.133       dsl 	} */
   1018   1.85   thorpej 	struct trapframe *fp = l->l_md.md_regs;
   1019   1.13      fvdl 
   1020  1.120      elad 	if (kauth_authorize_machdep(l->l_cred, KAUTH_MACHDEP_IOPL,
   1021  1.120      elad 	    NULL, NULL, NULL, NULL) != 0)
   1022   1.13      fvdl 		return EPERM;
   1023   1.13      fvdl 	fp->tf_eflags |= PSL_IOPL;
   1024   1.13      fvdl 	*retval = 0;
   1025   1.13      fvdl 	return 0;
   1026   1.13      fvdl }
   1027   1.13      fvdl 
   1028   1.13      fvdl /*
   1029   1.13      fvdl  * See above. If a root process tries to set access to an I/O port,
   1030   1.13      fvdl  * just let it have the whole range.
   1031   1.13      fvdl  */
   1032   1.13      fvdl int
   1033  1.133       dsl linux_sys_ioperm(struct lwp *l, const struct linux_sys_ioperm_args *uap, register_t *retval)
   1034   1.19   thorpej {
   1035  1.133       dsl 	/* {
   1036   1.13      fvdl 		syscallarg(unsigned int) lo;
   1037   1.13      fvdl 		syscallarg(unsigned int) hi;
   1038   1.13      fvdl 		syscallarg(int) val;
   1039  1.133       dsl 	} */
   1040   1.85   thorpej 	struct trapframe *fp = l->l_md.md_regs;
   1041   1.13      fvdl 
   1042  1.120      elad 	if (kauth_authorize_machdep(l->l_cred, SCARG(uap, val) ?
   1043  1.120      elad 	    KAUTH_MACHDEP_IOPERM_SET : KAUTH_MACHDEP_IOPERM_GET, NULL, NULL,
   1044  1.120      elad 	    NULL, NULL) != 0)
   1045   1.13      fvdl 		return EPERM;
   1046   1.13      fvdl 	if (SCARG(uap, val))
   1047   1.13      fvdl 		fp->tf_eflags |= PSL_IOPL;
   1048   1.13      fvdl 	*retval = 0;
   1049   1.92  christos 	return 0;
   1050   1.92  christos }
   1051  1.107      fvdl 
   1052  1.107      fvdl int
   1053  1.119  christos linux_usertrap(struct lwp *l, vaddr_t trapaddr,
   1054  1.119  christos     void *arg)
   1055  1.107      fvdl {
   1056  1.107      fvdl 	return 0;
   1057  1.107      fvdl }
   1058  1.125  christos 
   1059  1.125  christos const char *
   1060  1.125  christos linux_get_uname_arch(void)
   1061  1.125  christos {
   1062  1.125  christos 	static char uname_arch[5] = "i386";
   1063  1.125  christos 
   1064  1.125  christos 	if (uname_arch[1] == '3')
   1065  1.125  christos 		uname_arch[1] += cpu_class;
   1066  1.125  christos 	return uname_arch;
   1067  1.125  christos }
   1068