Home | History | Annotate | Line # | Download | only in i386
linux_machdep.c revision 1.168
      1  1.168  riastrad /*	$NetBSD: linux_machdep.c,v 1.168 2021/09/07 11:43:04 riastradh Exp $	*/
      2    1.1      fvdl 
      3   1.45      fvdl /*-
      4  1.143        ad  * Copyright (c) 1995, 2000, 2008, 2009 The NetBSD Foundation, Inc.
      5    1.1      fvdl  * All rights reserved.
      6    1.1      fvdl  *
      7   1.45      fvdl  * This code is derived from software contributed to The NetBSD Foundation
      8  1.143        ad  * by Frank van der Linden, and by Andrew Doran.
      9   1.45      fvdl  *
     10    1.1      fvdl  * Redistribution and use in source and binary forms, with or without
     11    1.1      fvdl  * modification, are permitted provided that the following conditions
     12    1.1      fvdl  * are met:
     13    1.1      fvdl  * 1. Redistributions of source code must retain the above copyright
     14    1.1      fvdl  *    notice, this list of conditions and the following disclaimer.
     15    1.1      fvdl  * 2. Redistributions in binary form must reproduce the above copyright
     16    1.1      fvdl  *    notice, this list of conditions and the following disclaimer in the
     17    1.1      fvdl  *    documentation and/or other materials provided with the distribution.
     18    1.1      fvdl  *
     19   1.45      fvdl  * THIS SOFTWARE IS PROVIDED BY THE NETBSD FOUNDATION, INC. AND CONTRIBUTORS
     20   1.45      fvdl  * ``AS IS'' AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED
     21   1.45      fvdl  * TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR
     22   1.45      fvdl  * PURPOSE ARE DISCLAIMED.  IN NO EVENT SHALL THE FOUNDATION OR CONTRIBUTORS
     23   1.45      fvdl  * BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
     24   1.45      fvdl  * CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
     25   1.45      fvdl  * SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS
     26   1.45      fvdl  * INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN
     27   1.45      fvdl  * CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE)
     28   1.45      fvdl  * ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE
     29   1.45      fvdl  * POSSIBILITY OF SUCH DAMAGE.
     30    1.1      fvdl  */
     31   1.68     lukem 
     32   1.68     lukem #include <sys/cdefs.h>
     33  1.168  riastrad __KERNEL_RCSID(0, "$NetBSD: linux_machdep.c,v 1.168 2021/09/07 11:43:04 riastradh Exp $");
     34   1.35   thorpej 
     35   1.63       mrg #if defined(_KERNEL_OPT)
     36   1.36   thorpej #include "opt_user_ldt.h"
     37   1.51  jdolecek #endif
     38    1.1      fvdl 
     39    1.1      fvdl #include <sys/param.h>
     40    1.1      fvdl #include <sys/systm.h>
     41    1.1      fvdl #include <sys/signalvar.h>
     42    1.1      fvdl #include <sys/kernel.h>
     43    1.1      fvdl #include <sys/proc.h>
     44    1.1      fvdl #include <sys/buf.h>
     45    1.1      fvdl #include <sys/reboot.h>
     46    1.1      fvdl #include <sys/conf.h>
     47   1.31   thorpej #include <sys/exec.h>
     48    1.1      fvdl #include <sys/file.h>
     49    1.1      fvdl #include <sys/callout.h>
     50    1.1      fvdl #include <sys/mbuf.h>
     51    1.1      fvdl #include <sys/msgbuf.h>
     52    1.1      fvdl #include <sys/mount.h>
     53    1.1      fvdl #include <sys/vnode.h>
     54    1.1      fvdl #include <sys/device.h>
     55    1.1      fvdl #include <sys/syscallargs.h>
     56   1.13      fvdl #include <sys/filedesc.h>
     57   1.39   mycroft #include <sys/exec_elf.h>
     58   1.52      fvdl #include <sys/disklabel.h>
     59   1.62      manu #include <sys/ioctl.h>
     60  1.110  christos #include <sys/wait.h>
     61  1.113      elad #include <sys/kauth.h>
     62  1.143        ad #include <sys/kmem.h>
     63  1.113      elad 
     64   1.52      fvdl #include <miscfs/specfs/specdev.h>
     65    1.7   mycroft 
     66   1.44  christos #include <compat/linux/common/linux_types.h>
     67   1.44  christos #include <compat/linux/common/linux_signal.h>
     68   1.44  christos #include <compat/linux/common/linux_util.h>
     69   1.44  christos #include <compat/linux/common/linux_ioctl.h>
     70   1.52      fvdl #include <compat/linux/common/linux_hdio.h>
     71   1.44  christos #include <compat/linux/common/linux_exec.h>
     72   1.44  christos #include <compat/linux/common/linux_machdep.h>
     73   1.98  jdolecek #include <compat/linux/common/linux_errno.h>
     74   1.44  christos 
     75    1.1      fvdl #include <compat/linux/linux_syscallargs.h>
     76    1.1      fvdl 
     77  1.130        ad #include <sys/cpu.h>
     78    1.1      fvdl #include <machine/cpufunc.h>
     79    1.1      fvdl #include <machine/psl.h>
     80    1.1      fvdl #include <machine/reg.h>
     81    1.7   mycroft #include <machine/segments.h>
     82    1.1      fvdl #include <machine/specialreg.h>
     83    1.7   mycroft #include <machine/sysarch.h>
     84   1.34   mycroft #include <machine/vmparam.h>
     85    1.1      fvdl 
     86  1.158       dsl #include <x86/fpu.h>
     87  1.158       dsl 
     88    1.1      fvdl /*
     89   1.50     veego  * To see whether wscons is configured (for virtual console ioctl calls).
     90   1.13      fvdl  */
     91   1.63       mrg #if defined(_KERNEL_OPT)
     92   1.41  drochner #include "wsdisplay.h"
     93   1.51  jdolecek #endif
     94   1.41  drochner #if (NWSDISPLAY > 0)
     95   1.52      fvdl #include <dev/wscons/wsconsio.h>
     96   1.41  drochner #include <dev/wscons/wsdisplay_usl_io.h>
     97   1.63       mrg #if defined(_KERNEL_OPT)
     98   1.41  drochner #include "opt_xserver.h"
     99   1.51  jdolecek #endif
    100   1.41  drochner #endif
    101   1.41  drochner 
    102   1.72  christos #ifdef DEBUG_LINUX
    103   1.72  christos #define DPRINTF(a) uprintf a
    104   1.72  christos #else
    105   1.72  christos #define DPRINTF(a)
    106   1.72  christos #endif
    107   1.72  christos 
    108  1.162      maxv extern struct disklist *x86_alldisks;
    109  1.162      maxv 
    110  1.131       dsl static struct biosdisk_info *fd2biosinfo(struct proc *, struct file *);
    111  1.131       dsl static void linux_save_ucontext(struct lwp *, struct trapframe *,
    112  1.131       dsl     const sigset_t *, struct sigaltstack *, struct linux_ucontext *);
    113  1.131       dsl static void linux_save_sigcontext(struct lwp *, struct trapframe *,
    114  1.131       dsl     const sigset_t *, struct linux_sigcontext *);
    115  1.131       dsl static int linux_restore_sigcontext(struct lwp *,
    116  1.131       dsl     struct linux_sigcontext *, register_t *);
    117  1.131       dsl static void linux_rt_sendsig(const ksiginfo_t *, const sigset_t *);
    118  1.131       dsl static void linux_old_sendsig(const ksiginfo_t *, const sigset_t *);
    119   1.52      fvdl 
    120   1.83  christos extern char linux_sigcode[], linux_rt_sigcode[];
    121  1.149       chs 
    122   1.13      fvdl /*
    123    1.1      fvdl  * Deal with some i386-specific things in the Linux emulation code.
    124    1.1      fvdl  */
    125   1.37   mycroft 
    126   1.37   mycroft void
    127  1.149       chs linux_setregs(struct lwp *l, struct exec_package *epp, vaddr_t stack)
    128   1.37   mycroft {
    129   1.73  christos 	struct trapframe *tf;
    130   1.73  christos 
    131   1.73  christos #ifdef USER_LDT
    132   1.85   thorpej 	pmap_ldt_cleanup(l);
    133   1.73  christos #endif
    134   1.37   mycroft 
    135  1.166      maxv 	fpu_clear(l, __Linux_NPXCW__);
    136   1.73  christos 
    137   1.85   thorpej 	tf = l->l_md.md_regs;
    138  1.149       chs 	tf->tf_gs = 0;
    139   1.73  christos 	tf->tf_fs = GSEL(GUDATA_SEL, SEL_UPL);
    140   1.73  christos 	tf->tf_es = GSEL(GUDATA_SEL, SEL_UPL);
    141   1.73  christos 	tf->tf_ds = GSEL(GUDATA_SEL, SEL_UPL);
    142   1.73  christos 	tf->tf_edi = 0;
    143   1.73  christos 	tf->tf_esi = 0;
    144   1.73  christos 	tf->tf_ebp = 0;
    145  1.150     joerg 	tf->tf_ebx = l->l_proc->p_psstrp;
    146   1.73  christos 	tf->tf_edx = 0;
    147   1.73  christos 	tf->tf_ecx = 0;
    148   1.73  christos 	tf->tf_eax = 0;
    149   1.73  christos 	tf->tf_eip = epp->ep_entry;
    150   1.95       chs 	tf->tf_cs = GSEL(GUCODEBIG_SEL, SEL_UPL);
    151   1.73  christos 	tf->tf_eflags = PSL_USERSET;
    152   1.73  christos 	tf->tf_esp = stack;
    153   1.73  christos 	tf->tf_ss = GSEL(GUDATA_SEL, SEL_UPL);
    154   1.37   mycroft }
    155    1.1      fvdl 
    156    1.1      fvdl /*
    157    1.1      fvdl  * Send an interrupt to process.
    158    1.1      fvdl  *
    159    1.1      fvdl  * Stack is set up to allow sigcode stored
    160    1.1      fvdl  * in u. to call routine, followed by kcall
    161    1.1      fvdl  * to sigreturn routine below.  After sigreturn
    162    1.1      fvdl  * resets the signal mask, the stack, and the
    163    1.1      fvdl  * frame pointer, it returns to the user
    164    1.1      fvdl  * specified pc, psl.
    165    1.1      fvdl  */
    166    1.1      fvdl 
    167    1.1      fvdl void
    168   1.99  christos linux_sendsig(const ksiginfo_t *ksi, const sigset_t *mask)
    169    1.1      fvdl {
    170   1.96  christos 	if (SIGACTION(curproc, ksi->ksi_signo).sa_flags & SA_SIGINFO)
    171   1.97  christos 		linux_rt_sendsig(ksi, mask);
    172   1.83  christos 	else
    173   1.97  christos 		linux_old_sendsig(ksi, mask);
    174   1.83  christos }
    175   1.83  christos 
    176   1.83  christos 
    177   1.83  christos static void
    178  1.132       dsl linux_save_ucontext(struct lwp *l, struct trapframe *tf, const sigset_t *mask, struct sigaltstack *sas, struct linux_ucontext *uc)
    179   1.90  christos {
    180   1.90  christos 	uc->uc_flags = 0;
    181   1.90  christos 	uc->uc_link = NULL;
    182   1.90  christos 	native_to_linux_sigaltstack(&uc->uc_stack, sas);
    183   1.90  christos 	linux_save_sigcontext(l, tf, mask, &uc->uc_mcontext);
    184   1.90  christos 	native_to_linux_sigset(&uc->uc_sigmask, mask);
    185   1.90  christos 	(void)memset(&uc->uc_fpregs_mem, 0, sizeof(uc->uc_fpregs_mem));
    186   1.90  christos }
    187   1.90  christos 
    188   1.90  christos static void
    189  1.146     rmind linux_save_sigcontext(struct lwp *l, struct trapframe *tf,
    190  1.146     rmind     const sigset_t *mask, struct linux_sigcontext *sc)
    191   1.83  christos {
    192  1.146     rmind 	struct pcb *pcb = lwp_getpcb(l);
    193  1.146     rmind 
    194   1.83  christos 	/* Save register context. */
    195  1.164      maxv 	sc->sc_gs = tf->tf_gs;
    196  1.164      maxv 	sc->sc_fs = tf->tf_fs;
    197  1.164      maxv 	sc->sc_es = tf->tf_es;
    198  1.164      maxv 	sc->sc_ds = tf->tf_ds;
    199  1.164      maxv 	sc->sc_eflags = tf->tf_eflags;
    200  1.164      maxv 
    201   1.83  christos 	sc->sc_edi = tf->tf_edi;
    202   1.83  christos 	sc->sc_esi = tf->tf_esi;
    203   1.83  christos 	sc->sc_esp = tf->tf_esp;
    204   1.83  christos 	sc->sc_ebp = tf->tf_ebp;
    205   1.83  christos 	sc->sc_ebx = tf->tf_ebx;
    206   1.83  christos 	sc->sc_edx = tf->tf_edx;
    207   1.83  christos 	sc->sc_ecx = tf->tf_ecx;
    208   1.83  christos 	sc->sc_eax = tf->tf_eax;
    209   1.83  christos 	sc->sc_eip = tf->tf_eip;
    210   1.83  christos 	sc->sc_cs = tf->tf_cs;
    211   1.83  christos 	sc->sc_esp_at_signal = tf->tf_esp;
    212   1.83  christos 	sc->sc_ss = tf->tf_ss;
    213   1.83  christos 	sc->sc_err = tf->tf_err;
    214   1.83  christos 	sc->sc_trapno = tf->tf_trapno;
    215  1.146     rmind 	sc->sc_cr2 = pcb->pcb_cr2;
    216   1.83  christos 	sc->sc_387 = NULL;
    217   1.83  christos 
    218   1.83  christos 	/* Save signal stack. */
    219   1.83  christos 	/* Linux doesn't save the onstack flag in sigframe */
    220   1.83  christos 
    221   1.83  christos 	/* Save signal mask. */
    222   1.83  christos 	native_to_linux_old_sigset(&sc->sc_mask, mask);
    223   1.83  christos }
    224   1.83  christos 
    225   1.83  christos static void
    226   1.99  christos linux_rt_sendsig(const ksiginfo_t *ksi, const sigset_t *mask)
    227   1.83  christos {
    228   1.85   thorpej 	struct lwp *l = curlwp;
    229   1.85   thorpej 	struct proc *p = l->l_proc;
    230   1.48  augustss 	struct trapframe *tf;
    231   1.83  christos 	struct linux_rt_sigframe *fp, frame;
    232  1.122        ad 	int onstack, error;
    233   1.98  jdolecek 	int sig = ksi->ksi_signo;
    234   1.78   thorpej 	sig_t catcher = SIGACTION(p, sig).sa_handler;
    235  1.122        ad 	struct sigaltstack *sas = &l->l_sigstk;
    236    1.1      fvdl 
    237   1.85   thorpej 	tf = l->l_md.md_regs;
    238   1.66  jdolecek 	/* Do we need to jump onto the signal stack? */
    239   1.82  christos 	onstack = (sas->ss_flags & (SS_DISABLE | SS_ONSTACK)) == 0 &&
    240   1.66  jdolecek 	    (SIGACTION(p, sig).sa_flags & SA_ONSTACK) != 0;
    241   1.66  jdolecek 
    242   1.83  christos 
    243   1.42   mycroft 	/* Allocate space for the signal handler context. */
    244   1.66  jdolecek 	if (onstack)
    245  1.123  christos 		fp = (struct linux_rt_sigframe *)((char *)sas->ss_sp +
    246   1.83  christos 		    sas->ss_size);
    247   1.66  jdolecek 	else
    248   1.83  christos 		fp = (struct linux_rt_sigframe *)tf->tf_esp;
    249   1.42   mycroft 	fp--;
    250    1.1      fvdl 
    251   1.92  christos 	DPRINTF(("rt: onstack = %d, fp = %p sig = %d eip = 0x%x cr2 = 0x%x\n",
    252  1.146     rmind 	    onstack, fp, sig, tf->tf_eip,
    253  1.146     rmind 	    ((struct pcb *)lwp_getpcb(l))->pcb_cr2));
    254   1.83  christos 
    255  1.168  riastrad 	memset(&frame, 0, sizeof(frame));
    256  1.168  riastrad 
    257   1.42   mycroft 	/* Build stack frame for signal trampoline. */
    258    1.7   mycroft 	frame.sf_handler = catcher;
    259   1.74  christos 	frame.sf_sig = native_to_linux_signo[sig];
    260   1.82  christos 	frame.sf_sip = &fp->sf_si;
    261   1.90  christos 	frame.sf_ucp = &fp->sf_uc;
    262   1.83  christos 
    263   1.82  christos 	/*
    264   1.97  christos 	 * XXX: the following code assumes that the constants for
    265   1.97  christos 	 * siginfo are the same between linux and NetBSD.
    266   1.82  christos 	 */
    267  1.151  christos 	native_to_linux_siginfo(&frame.sf_si, &ksi->ksi_info);
    268    1.1      fvdl 
    269   1.42   mycroft 	/* Save register context. */
    270   1.90  christos 	linux_save_ucontext(l, tf, mask, sas, &frame.sf_uc);
    271  1.122        ad 	sendsig_reset(l, sig);
    272   1.83  christos 
    273  1.135        ad 	mutex_exit(p->p_lock);
    274  1.122        ad 	error = copyout(&frame, fp, sizeof(frame));
    275  1.135        ad 	mutex_enter(p->p_lock);
    276  1.122        ad 
    277  1.122        ad 	if (error != 0) {
    278   1.83  christos 		/*
    279   1.83  christos 		 * Process has trashed its stack; give it an illegal
    280   1.83  christos 		 * instruction to halt it in its tracks.
    281   1.83  christos 		 */
    282   1.85   thorpej 		sigexit(l, SIGILL);
    283   1.83  christos 		/* NOTREACHED */
    284    1.4   mycroft 	}
    285    1.1      fvdl 
    286   1.83  christos 	/*
    287   1.83  christos 	 * Build context to run handler in.
    288   1.83  christos 	 */
    289   1.83  christos 	tf->tf_fs = GSEL(GUDATA_SEL, SEL_UPL);
    290   1.83  christos 	tf->tf_es = GSEL(GUDATA_SEL, SEL_UPL);
    291   1.83  christos 	tf->tf_ds = GSEL(GUDATA_SEL, SEL_UPL);
    292  1.106     perry 	tf->tf_eip = ((int)p->p_sigctx.ps_sigcode) +
    293   1.83  christos 	    (linux_rt_sigcode - linux_sigcode);
    294   1.83  christos 	tf->tf_cs = GSEL(GUCODE_SEL, SEL_UPL);
    295  1.138  christos 	tf->tf_eflags &= ~PSL_CLEARSIG;
    296   1.83  christos 	tf->tf_esp = (int)fp;
    297   1.83  christos 	tf->tf_ss = GSEL(GUDATA_SEL, SEL_UPL);
    298   1.83  christos 
    299   1.83  christos 	/* Remember that we're now on the signal stack. */
    300   1.83  christos 	if (onstack)
    301   1.83  christos 		sas->ss_flags |= SS_ONSTACK;
    302   1.83  christos }
    303   1.83  christos 
    304   1.83  christos static void
    305   1.99  christos linux_old_sendsig(const ksiginfo_t *ksi, const sigset_t *mask)
    306   1.83  christos {
    307   1.85   thorpej 	struct lwp *l = curlwp;
    308   1.85   thorpej 	struct proc *p = l->l_proc;
    309   1.83  christos 	struct trapframe *tf;
    310   1.83  christos 	struct linux_sigframe *fp, frame;
    311  1.122        ad 	int onstack, error;
    312   1.97  christos 	int sig = ksi->ksi_signo;
    313   1.83  christos 	sig_t catcher = SIGACTION(p, sig).sa_handler;
    314  1.122        ad 	struct sigaltstack *sas = &l->l_sigstk;
    315   1.83  christos 
    316   1.85   thorpej 	tf = l->l_md.md_regs;
    317   1.83  christos 
    318   1.83  christos 	/* Do we need to jump onto the signal stack? */
    319   1.83  christos 	onstack = (sas->ss_flags & (SS_DISABLE | SS_ONSTACK)) == 0 &&
    320   1.83  christos 	    (SIGACTION(p, sig).sa_flags & SA_ONSTACK) != 0;
    321   1.83  christos 
    322   1.83  christos 	/* Allocate space for the signal handler context. */
    323   1.83  christos 	if (onstack)
    324  1.123  christos 		fp = (struct linux_sigframe *) ((char *)sas->ss_sp +
    325   1.83  christos 		    sas->ss_size);
    326   1.83  christos 	else
    327   1.83  christos 		fp = (struct linux_sigframe *)tf->tf_esp;
    328   1.83  christos 	fp--;
    329   1.83  christos 
    330   1.92  christos 	DPRINTF(("old: onstack = %d, fp = %p sig = %d eip = 0x%x cr2 = 0x%x\n",
    331  1.146     rmind 	    onstack, fp, sig, tf->tf_eip,
    332  1.146     rmind 	    ((struct pcb *)lwp_getpcb(l))->pcb_cr2));
    333   1.83  christos 
    334  1.168  riastrad 	memset(&frame, 0, sizeof(frame));
    335  1.168  riastrad 
    336   1.83  christos 	/* Build stack frame for signal trampoline. */
    337   1.83  christos 	frame.sf_handler = catcher;
    338   1.83  christos 	frame.sf_sig = native_to_linux_signo[sig];
    339   1.42   mycroft 
    340   1.90  christos 	linux_save_sigcontext(l, tf, mask, &frame.sf_sc);
    341  1.122        ad 	sendsig_reset(l, sig);
    342  1.122        ad 
    343  1.135        ad 	mutex_exit(p->p_lock);
    344  1.122        ad 	error = copyout(&frame, fp, sizeof(frame));
    345  1.135        ad 	mutex_enter(p->p_lock);
    346   1.42   mycroft 
    347  1.122        ad 	if (error != 0) {
    348    1.1      fvdl 		/*
    349    1.1      fvdl 		 * Process has trashed its stack; give it an illegal
    350    1.1      fvdl 		 * instruction to halt it in its tracks.
    351    1.1      fvdl 		 */
    352   1.85   thorpej 		sigexit(l, SIGILL);
    353    1.1      fvdl 		/* NOTREACHED */
    354    1.1      fvdl 	}
    355    1.1      fvdl 
    356    1.1      fvdl 	/*
    357    1.1      fvdl 	 * Build context to run handler in.
    358    1.1      fvdl 	 */
    359   1.75  christos 	tf->tf_fs = GSEL(GUDATA_SEL, SEL_UPL);
    360   1.26   mycroft 	tf->tf_es = GSEL(GUDATA_SEL, SEL_UPL);
    361   1.26   mycroft 	tf->tf_ds = GSEL(GUDATA_SEL, SEL_UPL);
    362   1.56  jdolecek 	tf->tf_eip = (int)p->p_sigctx.ps_sigcode;
    363   1.95       chs 	tf->tf_cs = GSEL(GUCODEBIG_SEL, SEL_UPL);
    364  1.138  christos 	tf->tf_eflags &= ~PSL_CLEARSIG;
    365   1.26   mycroft 	tf->tf_esp = (int)fp;
    366   1.23   mycroft 	tf->tf_ss = GSEL(GUDATA_SEL, SEL_UPL);
    367   1.42   mycroft 
    368   1.42   mycroft 	/* Remember that we're now on the signal stack. */
    369   1.66  jdolecek 	if (onstack)
    370   1.82  christos 		sas->ss_flags |= SS_ONSTACK;
    371    1.1      fvdl }
    372    1.1      fvdl 
    373    1.1      fvdl /*
    374    1.1      fvdl  * System call to cleanup state after a signal
    375    1.1      fvdl  * has been taken.  Reset signal mask and
    376    1.1      fvdl  * stack state from context left by sendsig (above).
    377    1.1      fvdl  * Return to previous pc and psl as specified by
    378    1.1      fvdl  * context left by sendsig. Check carefully to
    379    1.1      fvdl  * make sure that the user has not modified the
    380    1.1      fvdl  * psl to gain improper privileges or to cause
    381    1.1      fvdl  * a machine fault.
    382    1.1      fvdl  */
    383   1.43       erh int
    384  1.133       dsl linux_sys_rt_sigreturn(struct lwp *l, const struct linux_sys_rt_sigreturn_args *uap, register_t *retval)
    385   1.43       erh {
    386  1.133       dsl 	/* {
    387   1.90  christos 		syscallarg(struct linux_ucontext *) ucp;
    388  1.133       dsl 	} */
    389   1.90  christos 	struct linux_ucontext context, *ucp = SCARG(uap, ucp);
    390   1.90  christos 	int error;
    391   1.90  christos 
    392   1.90  christos 	/*
    393   1.90  christos 	 * The trampoline code hands us the context.
    394   1.90  christos 	 * It is unsafe to keep track of it ourselves, in the event that a
    395   1.90  christos 	 * program jumps out of a signal handler.
    396   1.90  christos 	 */
    397   1.90  christos 	if ((error = copyin(ucp, &context, sizeof(*ucp))) != 0)
    398   1.90  christos 		return error;
    399   1.90  christos 
    400   1.90  christos 	/* XXX XAX we can do better here by using more of the ucontext */
    401   1.90  christos 	return linux_restore_sigcontext(l, &context.uc_mcontext, retval);
    402   1.43       erh }
    403   1.43       erh 
    404    1.1      fvdl int
    405  1.133       dsl linux_sys_sigreturn(struct lwp *l, const struct linux_sys_sigreturn_args *uap, register_t *retval)
    406   1.19   thorpej {
    407  1.133       dsl 	/* {
    408    1.1      fvdl 		syscallarg(struct linux_sigcontext *) scp;
    409  1.133       dsl 	} */
    410   1.90  christos 	struct linux_sigcontext context, *scp = SCARG(uap, scp);
    411   1.90  christos 	int error;
    412    1.1      fvdl 
    413    1.1      fvdl 	/*
    414    1.1      fvdl 	 * The trampoline code hands us the context.
    415    1.1      fvdl 	 * It is unsafe to keep track of it ourselves, in the event that a
    416    1.1      fvdl 	 * program jumps out of a signal handler.
    417    1.1      fvdl 	 */
    418  1.123  christos 	if ((error = copyin((void *)scp, &context, sizeof(*scp))) != 0)
    419   1.90  christos 		return error;
    420   1.90  christos 	return linux_restore_sigcontext(l, &context, retval);
    421   1.90  christos }
    422    1.1      fvdl 
    423   1.90  christos static int
    424  1.116  christos linux_restore_sigcontext(struct lwp *l, struct linux_sigcontext *scp,
    425  1.119  christos     register_t *retval)
    426   1.90  christos {
    427   1.90  christos 	struct proc *p = l->l_proc;
    428  1.122        ad 	struct sigaltstack *sas = &l->l_sigstk;
    429   1.90  christos 	struct trapframe *tf;
    430   1.90  christos 	sigset_t mask;
    431   1.90  christos 	ssize_t ss_gap;
    432  1.149       chs 
    433   1.42   mycroft 	/* Restore register context. */
    434   1.85   thorpej 	tf = l->l_md.md_regs;
    435  1.149       chs 	DPRINTF(("sigreturn enter esp=0x%x eip=0x%x\n", tf->tf_esp, tf->tf_eip));
    436   1.83  christos 
    437  1.164      maxv 	/*
    438  1.164      maxv 	 * Check for security violations.  If we're returning to
    439  1.164      maxv 	 * protected mode, the CPU will validate the segment registers
    440  1.164      maxv 	 * automatically and generate a trap on violations.  We handle
    441  1.164      maxv 	 * the trap, rather than doing all of the checking here.
    442  1.164      maxv 	 */
    443  1.164      maxv 	if (((scp->sc_eflags ^ tf->tf_eflags) & PSL_USERSTATIC) != 0 ||
    444  1.165      maxv 	    !USERMODE(scp->sc_cs))
    445  1.164      maxv 		return EINVAL;
    446  1.164      maxv 
    447  1.164      maxv 	tf->tf_gs = scp->sc_gs;
    448  1.164      maxv 	tf->tf_fs = scp->sc_fs;
    449  1.164      maxv 	tf->tf_es = scp->sc_es;
    450  1.164      maxv 	tf->tf_ds = scp->sc_ds;
    451  1.164      maxv 	tf->tf_eflags = scp->sc_eflags;
    452  1.164      maxv 
    453   1.90  christos 	tf->tf_edi = scp->sc_edi;
    454   1.90  christos 	tf->tf_esi = scp->sc_esi;
    455   1.90  christos 	tf->tf_ebp = scp->sc_ebp;
    456   1.90  christos 	tf->tf_ebx = scp->sc_ebx;
    457   1.90  christos 	tf->tf_edx = scp->sc_edx;
    458   1.90  christos 	tf->tf_ecx = scp->sc_ecx;
    459   1.90  christos 	tf->tf_eax = scp->sc_eax;
    460   1.90  christos 	tf->tf_eip = scp->sc_eip;
    461   1.90  christos 	tf->tf_cs = scp->sc_cs;
    462   1.90  christos 	tf->tf_esp = scp->sc_esp_at_signal;
    463   1.90  christos 	tf->tf_ss = scp->sc_ss;
    464   1.26   mycroft 
    465   1.42   mycroft 	/* Restore signal stack. */
    466   1.66  jdolecek 	/*
    467   1.66  jdolecek 	 * Linux really does it this way; it doesn't have space in sigframe
    468   1.66  jdolecek 	 * to save the onstack flag.
    469   1.66  jdolecek 	 */
    470  1.135        ad 	mutex_enter(p->p_lock);
    471  1.123  christos 	ss_gap = (ssize_t)((char *)scp->sc_esp_at_signal - (char *)sas->ss_sp);
    472   1.82  christos 	if (ss_gap >= 0 && ss_gap < sas->ss_size)
    473   1.82  christos 		sas->ss_flags |= SS_ONSTACK;
    474   1.66  jdolecek 	else
    475   1.82  christos 		sas->ss_flags &= ~SS_ONSTACK;
    476   1.42   mycroft 
    477   1.42   mycroft 	/* Restore signal mask. */
    478   1.90  christos 	linux_old_to_native_sigset(&mask, &scp->sc_mask);
    479  1.122        ad 	(void) sigprocmask1(l, SIG_SETMASK, &mask, 0);
    480  1.135        ad 	mutex_exit(p->p_lock);
    481  1.122        ad 
    482  1.149       chs 	DPRINTF(("sigreturn exit esp=0x%x eip=0x%x\n", tf->tf_esp, tf->tf_eip));
    483   1.83  christos 	return EJUSTRETURN;
    484    1.6   mycroft }
    485    1.6   mycroft 
    486    1.7   mycroft #ifdef USER_LDT
    487    1.7   mycroft 
    488  1.128       dsl static int
    489  1.133       dsl linux_read_ldt(struct lwp *l, const struct linux_sys_modify_ldt_args *uap,
    490  1.128       dsl     register_t *retval)
    491    1.7   mycroft {
    492  1.124        ad 	struct x86_get_ldt_args gl;
    493    1.7   mycroft 	int error;
    494  1.128       dsl 	union descriptor *ldt_buf;
    495  1.143        ad 	size_t sz;
    496  1.128       dsl 
    497  1.128       dsl 	/*
    498  1.167    andvar 	 * I've checked the linux code - this function is asymmetric with
    499  1.128       dsl 	 * linux_write_ldt, and returns raw ldt entries.
    500  1.128       dsl 	 * NB, the code I saw zerod the spare parts of the user buffer.
    501  1.128       dsl 	 */
    502    1.7   mycroft 
    503   1.72  christos 	DPRINTF(("linux_read_ldt!"));
    504  1.128       dsl 
    505  1.143        ad 	sz = 8192 * sizeof(*ldt_buf);
    506  1.143        ad 	ldt_buf = kmem_zalloc(sz, KM_SLEEP);
    507    1.7   mycroft 	gl.start = 0;
    508  1.128       dsl 	gl.desc = NULL;
    509    1.7   mycroft 	gl.num = SCARG(uap, bytecount) / sizeof(union descriptor);
    510  1.128       dsl 	error = x86_get_ldt1(l, &gl, ldt_buf);
    511  1.128       dsl 	/* NB gl.num might have changed */
    512  1.128       dsl 	if (error == 0) {
    513  1.163      maxv 		*retval = gl.num * sizeof(*ldtstore);
    514  1.128       dsl 		error = copyout(ldt_buf, SCARG(uap, ptr),
    515  1.128       dsl 		    gl.num * sizeof *ldt_buf);
    516  1.128       dsl 	}
    517  1.143        ad 	kmem_free(ldt_buf, sz);
    518    1.7   mycroft 
    519  1.128       dsl 	return error;
    520    1.7   mycroft }
    521    1.7   mycroft 
    522    1.7   mycroft struct linux_ldt_info {
    523    1.7   mycroft 	u_int entry_number;
    524    1.7   mycroft 	u_long base_addr;
    525    1.7   mycroft 	u_int limit;
    526    1.7   mycroft 	u_int seg_32bit:1;
    527    1.7   mycroft 	u_int contents:2;
    528    1.7   mycroft 	u_int read_exec_only:1;
    529    1.7   mycroft 	u_int limit_in_pages:1;
    530    1.7   mycroft 	u_int seg_not_present:1;
    531   1.72  christos 	u_int useable:1;
    532    1.7   mycroft };
    533    1.7   mycroft 
    534  1.128       dsl static int
    535  1.133       dsl linux_write_ldt(struct lwp *l, const struct linux_sys_modify_ldt_args *uap,
    536  1.128       dsl     int oldmode)
    537    1.7   mycroft {
    538    1.7   mycroft 	struct linux_ldt_info ldt_info;
    539  1.128       dsl 	union descriptor d;
    540  1.124        ad 	struct x86_set_ldt_args sl;
    541    1.7   mycroft 	int error;
    542    1.7   mycroft 
    543   1.72  christos 	DPRINTF(("linux_write_ldt %d\n", oldmode));
    544    1.7   mycroft 	if (SCARG(uap, bytecount) != sizeof(ldt_info))
    545    1.7   mycroft 		return (EINVAL);
    546   1.29  christos 	if ((error = copyin(SCARG(uap, ptr), &ldt_info, sizeof(ldt_info))) != 0)
    547    1.7   mycroft 		return error;
    548   1.72  christos 	if (ldt_info.entry_number >= 8192)
    549    1.7   mycroft 		return (EINVAL);
    550   1.72  christos 	if (ldt_info.contents == 3) {
    551   1.72  christos 		if (oldmode)
    552   1.72  christos 			return (EINVAL);
    553   1.72  christos 		if (ldt_info.seg_not_present)
    554   1.72  christos 			return (EINVAL);
    555   1.72  christos 	}
    556    1.7   mycroft 
    557   1.72  christos 	if (ldt_info.base_addr == 0 && ldt_info.limit == 0 &&
    558   1.72  christos 	    (oldmode || (ldt_info.contents == 0 &&
    559   1.72  christos 	    ldt_info.read_exec_only == 1 && ldt_info.seg_32bit == 0 &&
    560   1.72  christos 	    ldt_info.limit_in_pages == 0 && ldt_info.seg_not_present == 1 &&
    561   1.72  christos 	    ldt_info.useable == 0))) {
    562   1.70  christos 		/* this means you should zero the ldt */
    563  1.128       dsl 		(void)memset(&d, 0, sizeof(d));
    564   1.70  christos 	} else {
    565  1.128       dsl 		d.sd.sd_lobase = ldt_info.base_addr & 0xffffff;
    566  1.128       dsl 		d.sd.sd_hibase = (ldt_info.base_addr >> 24) & 0xff;
    567  1.128       dsl 		d.sd.sd_lolimit = ldt_info.limit & 0xffff;
    568  1.128       dsl 		d.sd.sd_hilimit = (ldt_info.limit >> 16) & 0xf;
    569  1.128       dsl 		d.sd.sd_type = 16 | (ldt_info.contents << 2) |
    570   1.70  christos 		    (!ldt_info.read_exec_only << 1);
    571  1.128       dsl 		d.sd.sd_dpl = SEL_UPL;
    572  1.128       dsl 		d.sd.sd_p = !ldt_info.seg_not_present;
    573  1.128       dsl 		d.sd.sd_def32 = ldt_info.seg_32bit;
    574  1.128       dsl 		d.sd.sd_gran = ldt_info.limit_in_pages;
    575   1.72  christos 		if (!oldmode)
    576  1.128       dsl 			d.sd.sd_xx = ldt_info.useable;
    577   1.73  christos 		else
    578  1.128       dsl 			d.sd.sd_xx = 0;
    579   1.70  christos 	}
    580    1.7   mycroft 	sl.start = ldt_info.entry_number;
    581  1.147   mbalmer 	sl.desc = NULL;
    582    1.7   mycroft 	sl.num = 1;
    583    1.7   mycroft 
    584   1.72  christos 	DPRINTF(("linux_write_ldt: idx=%d, base=0x%lx, limit=0x%x\n",
    585   1.72  christos 	    ldt_info.entry_number, ldt_info.base_addr, ldt_info.limit));
    586    1.7   mycroft 
    587  1.128       dsl 	return x86_set_ldt1(l, &sl, &d);
    588    1.7   mycroft }
    589    1.7   mycroft 
    590    1.7   mycroft #endif /* USER_LDT */
    591    1.7   mycroft 
    592    1.6   mycroft int
    593  1.133       dsl linux_sys_modify_ldt(struct lwp *l, const struct linux_sys_modify_ldt_args *uap, register_t *retval)
    594   1.19   thorpej {
    595  1.133       dsl 	/* {
    596    1.6   mycroft 		syscallarg(int) func;
    597    1.6   mycroft 		syscallarg(void *) ptr;
    598    1.6   mycroft 		syscallarg(size_t) bytecount;
    599  1.133       dsl 	} */
    600    1.6   mycroft 
    601    1.6   mycroft 	switch (SCARG(uap, func)) {
    602    1.7   mycroft #ifdef USER_LDT
    603    1.6   mycroft 	case 0:
    604  1.133       dsl 		return linux_read_ldt(l, (const void *)uap, retval);
    605    1.6   mycroft 	case 1:
    606  1.133       dsl 		return linux_write_ldt(l, (const void *)uap, 1);
    607   1.72  christos 	case 2:
    608   1.72  christos #ifdef notyet
    609  1.148       wiz 		return linux_read_default_ldt(l, (const void *)uap, retval);
    610   1.72  christos #else
    611   1.72  christos 		return (ENOSYS);
    612   1.72  christos #endif
    613   1.72  christos 	case 0x11:
    614  1.133       dsl 		return linux_write_ldt(l, (const void *)uap, 0);
    615    1.7   mycroft #endif /* USER_LDT */
    616    1.7   mycroft 
    617    1.6   mycroft 	default:
    618    1.6   mycroft 		return (ENOSYS);
    619    1.6   mycroft 	}
    620   1.13      fvdl }
    621   1.13      fvdl 
    622   1.13      fvdl /*
    623   1.13      fvdl  * XXX Pathetic hack to make svgalib work. This will fake the major
    624   1.13      fvdl  * device number of an opened VT so that svgalib likes it. grmbl.
    625   1.13      fvdl  * Should probably do it 'wrong the right way' and use a mapping
    626   1.13      fvdl  * array for all major device numbers, and map linux_mknod too.
    627   1.13      fvdl  */
    628   1.13      fvdl dev_t
    629  1.132       dsl linux_fakedev(dev_t dev, int raw)
    630   1.13      fvdl {
    631  1.104  christos 	extern const struct cdevsw ptc_cdevsw, pts_cdevsw;
    632  1.104  christos 	const struct cdevsw *cd = cdevsw_lookup(dev);
    633  1.104  christos 
    634   1.69  christos 	if (raw) {
    635   1.41  drochner #if (NWSDISPLAY > 0)
    636   1.79   gehenna 		extern const struct cdevsw wsdisplay_cdevsw;
    637  1.104  christos 		if (cd == &wsdisplay_cdevsw)
    638   1.69  christos 			return makedev(LINUX_CONS_MAJOR, (minor(dev) + 1));
    639   1.41  drochner #endif
    640   1.69  christos 	}
    641   1.77  jdolecek 
    642  1.104  christos 	if (cd == &ptc_cdevsw)
    643  1.104  christos 		return makedev(LINUX_PTC_MAJOR, minor(dev));
    644  1.104  christos 	if (cd == &pts_cdevsw)
    645  1.104  christos 		return makedev(LINUX_PTS_MAJOR, minor(dev));
    646  1.104  christos 
    647   1.77  jdolecek 	return dev;
    648   1.13      fvdl }
    649   1.13      fvdl 
    650   1.49     jhawk #if (NWSDISPLAY > 0)
    651   1.41  drochner /*
    652   1.41  drochner  * That's not complete, but enough to get an X server running.
    653   1.41  drochner  */
    654   1.41  drochner #define NR_KEYS 128
    655   1.61  jdolecek static const u_short plain_map[NR_KEYS] = {
    656   1.41  drochner 	0x0200,	0x001b,	0x0031,	0x0032,	0x0033,	0x0034,	0x0035,	0x0036,
    657   1.41  drochner 	0x0037,	0x0038,	0x0039,	0x0030,	0x002d,	0x003d,	0x007f,	0x0009,
    658   1.41  drochner 	0x0b71,	0x0b77,	0x0b65,	0x0b72,	0x0b74,	0x0b79,	0x0b75,	0x0b69,
    659   1.41  drochner 	0x0b6f,	0x0b70,	0x005b,	0x005d,	0x0201,	0x0702,	0x0b61,	0x0b73,
    660   1.41  drochner 	0x0b64,	0x0b66,	0x0b67,	0x0b68,	0x0b6a,	0x0b6b,	0x0b6c,	0x003b,
    661   1.41  drochner 	0x0027,	0x0060,	0x0700,	0x005c,	0x0b7a,	0x0b78,	0x0b63,	0x0b76,
    662   1.41  drochner 	0x0b62,	0x0b6e,	0x0b6d,	0x002c,	0x002e,	0x002f,	0x0700,	0x030c,
    663   1.41  drochner 	0x0703,	0x0020,	0x0207,	0x0100,	0x0101,	0x0102,	0x0103,	0x0104,
    664   1.41  drochner 	0x0105,	0x0106,	0x0107,	0x0108,	0x0109,	0x0208,	0x0209,	0x0307,
    665   1.41  drochner 	0x0308,	0x0309,	0x030b,	0x0304,	0x0305,	0x0306,	0x030a,	0x0301,
    666   1.41  drochner 	0x0302,	0x0303,	0x0300,	0x0310,	0x0206,	0x0200,	0x003c,	0x010a,
    667   1.41  drochner 	0x010b,	0x0200,	0x0200,	0x0200,	0x0200,	0x0200,	0x0200,	0x0200,
    668   1.41  drochner 	0x030e,	0x0702,	0x030d,	0x001c,	0x0701,	0x0205,	0x0114,	0x0603,
    669   1.41  drochner 	0x0118,	0x0601,	0x0602,	0x0117,	0x0600,	0x0119,	0x0115,	0x0116,
    670   1.41  drochner 	0x011a,	0x010c,	0x010d,	0x011b,	0x011c,	0x0110,	0x0311,	0x011d,
    671   1.41  drochner 	0x0200,	0x0200,	0x0200,	0x0200,	0x0200,	0x0200,	0x0200,	0x0200,
    672   1.41  drochner }, shift_map[NR_KEYS] = {
    673   1.41  drochner 	0x0200,	0x001b,	0x0021,	0x0040,	0x0023,	0x0024,	0x0025,	0x005e,
    674   1.41  drochner 	0x0026,	0x002a,	0x0028,	0x0029,	0x005f,	0x002b,	0x007f,	0x0009,
    675   1.41  drochner 	0x0b51,	0x0b57,	0x0b45,	0x0b52,	0x0b54,	0x0b59,	0x0b55,	0x0b49,
    676   1.41  drochner 	0x0b4f,	0x0b50,	0x007b,	0x007d,	0x0201,	0x0702,	0x0b41,	0x0b53,
    677   1.41  drochner 	0x0b44,	0x0b46,	0x0b47,	0x0b48,	0x0b4a,	0x0b4b,	0x0b4c,	0x003a,
    678   1.41  drochner 	0x0022,	0x007e,	0x0700,	0x007c,	0x0b5a,	0x0b58,	0x0b43,	0x0b56,
    679   1.41  drochner 	0x0b42,	0x0b4e,	0x0b4d,	0x003c,	0x003e,	0x003f,	0x0700,	0x030c,
    680   1.41  drochner 	0x0703,	0x0020,	0x0207,	0x010a,	0x010b,	0x010c,	0x010d,	0x010e,
    681   1.41  drochner 	0x010f,	0x0110,	0x0111,	0x0112,	0x0113,	0x0213,	0x0203,	0x0307,
    682   1.41  drochner 	0x0308,	0x0309,	0x030b,	0x0304,	0x0305,	0x0306,	0x030a,	0x0301,
    683   1.41  drochner 	0x0302,	0x0303,	0x0300,	0x0310,	0x0206,	0x0200,	0x003e,	0x010a,
    684   1.41  drochner 	0x010b,	0x0200,	0x0200,	0x0200,	0x0200,	0x0200,	0x0200,	0x0200,
    685   1.41  drochner 	0x030e,	0x0702,	0x030d,	0x0200,	0x0701,	0x0205,	0x0114,	0x0603,
    686   1.41  drochner 	0x020b,	0x0601,	0x0602,	0x0117,	0x0600,	0x020a,	0x0115,	0x0116,
    687   1.41  drochner 	0x011a,	0x010c,	0x010d,	0x011b,	0x011c,	0x0110,	0x0311,	0x011d,
    688   1.41  drochner 	0x0200,	0x0200,	0x0200,	0x0200,	0x0200,	0x0200,	0x0200,	0x0200,
    689   1.41  drochner }, altgr_map[NR_KEYS] = {
    690   1.41  drochner 	0x0200,	0x0200,	0x0200,	0x0040,	0x0200,	0x0024,	0x0200,	0x0200,
    691   1.41  drochner 	0x007b,	0x005b,	0x005d,	0x007d,	0x005c,	0x0200,	0x0200,	0x0200,
    692   1.41  drochner 	0x0b71,	0x0b77,	0x0918,	0x0b72,	0x0b74,	0x0b79,	0x0b75,	0x0b69,
    693   1.41  drochner 	0x0b6f,	0x0b70,	0x0200,	0x007e,	0x0201,	0x0702,	0x0914,	0x0b73,
    694   1.41  drochner 	0x0917,	0x0919,	0x0b67,	0x0b68,	0x0b6a,	0x0b6b,	0x0b6c,	0x0200,
    695   1.41  drochner 	0x0200,	0x0200,	0x0700,	0x0200,	0x0b7a,	0x0b78,	0x0916,	0x0b76,
    696   1.41  drochner 	0x0915,	0x0b6e,	0x0b6d,	0x0200,	0x0200,	0x0200,	0x0700,	0x030c,
    697   1.41  drochner 	0x0703,	0x0200,	0x0207,	0x050c,	0x050d,	0x050e,	0x050f,	0x0510,
    698   1.41  drochner 	0x0511,	0x0512,	0x0513,	0x0514,	0x0515,	0x0208,	0x0202,	0x0911,
    699   1.41  drochner 	0x0912,	0x0913,	0x030b,	0x090e,	0x090f,	0x0910,	0x030a,	0x090b,
    700   1.41  drochner 	0x090c,	0x090d,	0x090a,	0x0310,	0x0206,	0x0200,	0x007c,	0x0516,
    701   1.41  drochner 	0x0517,	0x0200,	0x0200,	0x0200,	0x0200,	0x0200,	0x0200,	0x0200,
    702   1.41  drochner 	0x030e,	0x0702,	0x030d,	0x0200,	0x0701,	0x0205,	0x0114,	0x0603,
    703   1.41  drochner 	0x0118,	0x0601,	0x0602,	0x0117,	0x0600,	0x0119,	0x0115,	0x0116,
    704   1.41  drochner 	0x011a,	0x010c,	0x010d,	0x011b,	0x011c,	0x0110,	0x0311,	0x011d,
    705   1.41  drochner 	0x0200,	0x0200,	0x0200,	0x0200,	0x0200,	0x0200,	0x0200,	0x0200,
    706   1.41  drochner }, ctrl_map[NR_KEYS] = {
    707   1.41  drochner 	0x0200,	0x0200,	0x0200,	0x0000,	0x001b,	0x001c,	0x001d,	0x001e,
    708   1.41  drochner 	0x001f,	0x007f,	0x0200,	0x0200,	0x001f,	0x0200,	0x0008,	0x0200,
    709   1.41  drochner 	0x0011,	0x0017,	0x0005,	0x0012,	0x0014,	0x0019,	0x0015,	0x0009,
    710   1.41  drochner 	0x000f,	0x0010,	0x001b,	0x001d,	0x0201,	0x0702,	0x0001,	0x0013,
    711   1.41  drochner 	0x0004,	0x0006,	0x0007,	0x0008,	0x000a,	0x000b,	0x000c,	0x0200,
    712   1.41  drochner 	0x0007,	0x0000,	0x0700,	0x001c,	0x001a,	0x0018,	0x0003,	0x0016,
    713   1.41  drochner 	0x0002,	0x000e,	0x000d,	0x0200,	0x020e,	0x007f,	0x0700,	0x030c,
    714   1.41  drochner 	0x0703,	0x0000,	0x0207,	0x0100,	0x0101,	0x0102,	0x0103,	0x0104,
    715   1.41  drochner 	0x0105,	0x0106,	0x0107,	0x0108,	0x0109,	0x0208,	0x0204,	0x0307,
    716   1.41  drochner 	0x0308,	0x0309,	0x030b,	0x0304,	0x0305,	0x0306,	0x030a,	0x0301,
    717   1.41  drochner 	0x0302,	0x0303,	0x0300,	0x0310,	0x0206,	0x0200,	0x0200,	0x010a,
    718   1.41  drochner 	0x010b,	0x0200,	0x0200,	0x0200,	0x0200,	0x0200,	0x0200,	0x0200,
    719   1.41  drochner 	0x030e,	0x0702,	0x030d,	0x001c,	0x0701,	0x0205,	0x0114,	0x0603,
    720   1.41  drochner 	0x0118,	0x0601,	0x0602,	0x0117,	0x0600,	0x0119,	0x0115,	0x0116,
    721   1.41  drochner 	0x011a,	0x010c,	0x010d,	0x011b,	0x011c,	0x0110,	0x0311,	0x011d,
    722   1.41  drochner 	0x0200,	0x0200,	0x0200,	0x0200,	0x0200,	0x0200,	0x0200,	0x0200,
    723   1.41  drochner };
    724   1.41  drochner 
    725   1.61  jdolecek const u_short * const linux_keytabs[] = {
    726   1.41  drochner 	plain_map, shift_map, altgr_map, altgr_map, ctrl_map
    727   1.41  drochner };
    728   1.41  drochner #endif
    729   1.41  drochner 
    730   1.52      fvdl static struct biosdisk_info *
    731  1.119  christos fd2biosinfo(struct proc *p, struct file *fp)
    732   1.52      fvdl {
    733   1.52      fvdl 	struct vnode *vp;
    734   1.52      fvdl 	const char *blkname;
    735   1.52      fvdl 	char diskname[16];
    736   1.52      fvdl 	int i;
    737   1.52      fvdl 	struct nativedisk_info *nip;
    738  1.103   thorpej 	struct disklist *dl = x86_alldisks;
    739   1.52      fvdl 
    740  1.162      maxv 	if (dl == NULL)
    741  1.162      maxv 		return NULL;
    742   1.52      fvdl 	if (fp->f_type != DTYPE_VNODE)
    743   1.52      fvdl 		return NULL;
    744   1.52      fvdl 	vp = (struct vnode *)fp->f_data;
    745   1.52      fvdl 
    746   1.52      fvdl 	if (vp->v_type != VBLK)
    747   1.52      fvdl 		return NULL;
    748   1.52      fvdl 
    749   1.79   gehenna 	blkname = devsw_blk2name(major(vp->v_rdev));
    750  1.142  christos 	snprintf(diskname, sizeof diskname, "%s%llu", blkname,
    751  1.142  christos 	    (unsigned long long)DISKUNIT(vp->v_rdev));
    752   1.52      fvdl 
    753   1.52      fvdl 	for (i = 0; i < dl->dl_nnativedisks; i++) {
    754   1.52      fvdl 		nip = &dl->dl_nativedisks[i];
    755   1.52      fvdl 		if (strcmp(diskname, nip->ni_devname))
    756   1.52      fvdl 			continue;
    757   1.52      fvdl 		if (nip->ni_nmatches != 0)
    758   1.52      fvdl 			return &dl->dl_biosdisks[nip->ni_biosmatches[0]];
    759   1.52      fvdl 	}
    760   1.52      fvdl 
    761   1.52      fvdl 	return NULL;
    762   1.52      fvdl }
    763   1.52      fvdl 
    764   1.52      fvdl 
    765   1.13      fvdl /*
    766   1.13      fvdl  * We come here in a last attempt to satisfy a Linux ioctl() call
    767   1.13      fvdl  */
    768   1.13      fvdl int
    769  1.133       dsl linux_machdepioctl(struct lwp *l, const struct linux_sys_ioctl_args *uap, register_t *retval)
    770   1.19   thorpej {
    771  1.133       dsl 	/* {
    772   1.13      fvdl 		syscallarg(int) fd;
    773   1.13      fvdl 		syscallarg(u_long) com;
    774  1.123  christos 		syscallarg(void *) data;
    775  1.133       dsl 	} */
    776   1.29  christos 	struct sys_ioctl_args bia;
    777   1.15      fvdl 	u_long com;
    778   1.52      fvdl 	int error, error1;
    779   1.50     veego #if (NWSDISPLAY > 0)
    780   1.13      fvdl 	struct vt_mode lvt;
    781   1.41  drochner 	struct kbentry kbe;
    782   1.41  drochner #endif
    783   1.52      fvdl 	struct linux_hd_geometry hdg;
    784   1.52      fvdl 	struct linux_hd_big_geometry hdg_big;
    785   1.52      fvdl 	struct biosdisk_info *bip;
    786  1.134        ad 	file_t *fp;
    787   1.52      fvdl 	int fd;
    788  1.161  christos 	struct disklabel label;
    789   1.52      fvdl 	struct partinfo partp;
    790  1.134        ad 	int (*ioctlf)(struct file *, u_long, void *);
    791   1.52      fvdl 	u_long start, biostotal, realtotal;
    792   1.52      fvdl 	u_char heads, sectors;
    793   1.52      fvdl 	u_int cylinders;
    794   1.55      fvdl 	struct ioctl_pt pt;
    795   1.13      fvdl 
    796   1.52      fvdl 	fd = SCARG(uap, fd);
    797   1.52      fvdl 	SCARG(&bia, fd) = fd;
    798   1.13      fvdl 	SCARG(&bia, data) = SCARG(uap, data);
    799   1.13      fvdl 	com = SCARG(uap, com);
    800   1.13      fvdl 
    801  1.134        ad 	if ((fp = fd_getfile(fd)) == NULL)
    802   1.53   thorpej 		return (EBADF);
    803   1.52      fvdl 
    804   1.13      fvdl 	switch (com) {
    805   1.50     veego #if (NWSDISPLAY > 0)
    806   1.13      fvdl 	case LINUX_KDGKBMODE:
    807   1.21      fvdl 		com = KDGKBMODE;
    808   1.21      fvdl 		break;
    809   1.13      fvdl 	case LINUX_KDSKBMODE:
    810   1.13      fvdl 		com = KDSKBMODE;
    811   1.13      fvdl 		if ((unsigned)SCARG(uap, data) == LINUX_K_MEDIUMRAW)
    812  1.123  christos 			SCARG(&bia, data) = (void *)K_RAW;
    813   1.13      fvdl 		break;
    814   1.59      fvdl 	case LINUX_KIOCSOUND:
    815   1.59      fvdl 		SCARG(&bia, data) =
    816  1.123  christos 		    (void *)(((unsigned long)SCARG(&bia, data)) & 0xffff);
    817   1.59      fvdl 		/* fall through */
    818   1.13      fvdl 	case LINUX_KDMKTONE:
    819   1.13      fvdl 		com = KDMKTONE;
    820   1.13      fvdl 		break;
    821   1.13      fvdl 	case LINUX_KDSETMODE:
    822   1.13      fvdl 		com = KDSETMODE;
    823   1.58      fvdl 		break;
    824   1.58      fvdl 	case LINUX_KDGETMODE:
    825   1.58      fvdl 		/* KD_* values are equal to the wscons numbers */
    826   1.58      fvdl 		com = WSDISPLAYIO_GMODE;
    827   1.13      fvdl 		break;
    828   1.13      fvdl 	case LINUX_KDENABIO:
    829   1.13      fvdl 		com = KDENABIO;
    830   1.13      fvdl 		break;
    831   1.13      fvdl 	case LINUX_KDDISABIO:
    832   1.13      fvdl 		com = KDDISABIO;
    833   1.13      fvdl 		break;
    834   1.13      fvdl 	case LINUX_KDGETLED:
    835   1.13      fvdl 		com = KDGETLED;
    836   1.13      fvdl 		break;
    837   1.13      fvdl 	case LINUX_KDSETLED:
    838   1.13      fvdl 		com = KDSETLED;
    839   1.13      fvdl 		break;
    840   1.13      fvdl 	case LINUX_VT_OPENQRY:
    841   1.13      fvdl 		com = VT_OPENQRY;
    842   1.13      fvdl 		break;
    843   1.13      fvdl 	case LINUX_VT_GETMODE:
    844  1.168  riastrad 		memset(&lvt, 0, sizeof(lvt));
    845  1.134        ad 		error = fp->f_ops->fo_ioctl(fp, VT_GETMODE, &lvt);
    846  1.129       dsl 		if (error != 0)
    847   1.86      yamt 			goto out;
    848   1.74  christos 		lvt.relsig = native_to_linux_signo[lvt.relsig];
    849   1.74  christos 		lvt.acqsig = native_to_linux_signo[lvt.acqsig];
    850   1.74  christos 		lvt.frsig = native_to_linux_signo[lvt.frsig];
    851  1.129       dsl 		error = copyout(&lvt, SCARG(uap, data), sizeof (lvt));
    852   1.86      yamt 		goto out;
    853   1.13      fvdl 	case LINUX_VT_SETMODE:
    854  1.129       dsl 		error = copyin(SCARG(uap, data), &lvt, sizeof (lvt));
    855  1.129       dsl 		if (error != 0)
    856   1.86      yamt 			goto out;
    857   1.74  christos 		lvt.relsig = linux_to_native_signo[lvt.relsig];
    858   1.74  christos 		lvt.acqsig = linux_to_native_signo[lvt.acqsig];
    859   1.74  christos 		lvt.frsig = linux_to_native_signo[lvt.frsig];
    860  1.134        ad 		error = fp->f_ops->fo_ioctl(fp, VT_SETMODE, &lvt);
    861  1.129       dsl 		goto out;
    862   1.52      fvdl 	case LINUX_VT_DISALLOCATE:
    863   1.52      fvdl 		/* XXX should use WSDISPLAYIO_DELSCREEN */
    864   1.86      yamt 		error = 0;
    865   1.86      yamt 		goto out;
    866   1.13      fvdl 	case LINUX_VT_RELDISP:
    867   1.13      fvdl 		com = VT_RELDISP;
    868   1.13      fvdl 		break;
    869   1.13      fvdl 	case LINUX_VT_ACTIVATE:
    870   1.13      fvdl 		com = VT_ACTIVATE;
    871   1.13      fvdl 		break;
    872   1.13      fvdl 	case LINUX_VT_WAITACTIVE:
    873   1.13      fvdl 		com = VT_WAITACTIVE;
    874   1.13      fvdl 		break;
    875   1.41  drochner 	case LINUX_VT_GETSTATE:
    876   1.41  drochner 		com = VT_GETSTATE;
    877   1.41  drochner 		break;
    878   1.41  drochner 	case LINUX_KDGKBTYPE:
    879   1.91  jdolecek 	    {
    880   1.91  jdolecek 		static const u_int8_t kb101 = KB_101;
    881   1.91  jdolecek 
    882   1.41  drochner 		/* This is what Linux does. */
    883   1.91  jdolecek 		error = copyout(&kb101, SCARG(uap, data), 1);
    884   1.86      yamt 		goto out;
    885   1.91  jdolecek 	    }
    886   1.41  drochner 	case LINUX_KDGKBENT:
    887   1.41  drochner 		/*
    888   1.41  drochner 		 * The Linux KDGKBENT ioctl is different from the
    889   1.41  drochner 		 * SYSV original. So we handle it in machdep code.
    890   1.41  drochner 		 * XXX We should use keyboard mapping information
    891   1.41  drochner 		 * from wsdisplay, but this would be expensive.
    892   1.41  drochner 		 */
    893   1.41  drochner 		if ((error = copyin(SCARG(uap, data), &kbe,
    894   1.41  drochner 				    sizeof(struct kbentry))))
    895   1.86      yamt 			goto out;
    896   1.41  drochner 		if (kbe.kb_table >= sizeof(linux_keytabs) / sizeof(u_short *)
    897   1.86      yamt 		    || kbe.kb_index >= NR_KEYS) {
    898   1.86      yamt 			error = EINVAL;
    899   1.86      yamt 			goto out;
    900   1.86      yamt 		}
    901   1.41  drochner 		kbe.kb_value = linux_keytabs[kbe.kb_table][kbe.kb_index];
    902   1.86      yamt 		error = copyout(&kbe, SCARG(uap, data),
    903   1.86      yamt 				sizeof(struct kbentry));
    904   1.86      yamt 		goto out;
    905   1.54      fvdl #endif
    906   1.52      fvdl 	case LINUX_HDIO_GETGEO:
    907   1.52      fvdl 	case LINUX_HDIO_GETGEO_BIG:
    908   1.52      fvdl 		/*
    909   1.52      fvdl 		 * Try to mimic Linux behaviour: return the BIOS geometry
    910   1.52      fvdl 		 * if possible (extending its # of cylinders if it's beyond
    911   1.52      fvdl 		 * the 1023 limit), fall back to the MI geometry (i.e.
    912   1.52      fvdl 		 * the real geometry) if not found, by returning an
    913   1.52      fvdl 		 * error. See common/linux_hdio.c
    914   1.52      fvdl 		 */
    915  1.134        ad 		bip = fd2biosinfo(curproc, fp);
    916   1.52      fvdl 		ioctlf = fp->f_ops->fo_ioctl;
    917  1.161  christos 		error = ioctlf(fp, DIOCGDINFO, (void *)&label);
    918  1.160  christos 		error1 = ioctlf(fp, DIOCGPARTINFO, (void *)&partp);
    919   1.86      yamt 		if (error != 0 && error1 != 0) {
    920   1.86      yamt 			error = error1;
    921   1.86      yamt 			goto out;
    922   1.86      yamt 		}
    923  1.161  christos 		start = error1 != 0 ? partp.pi_offset : 0;
    924   1.52      fvdl 		if (bip != NULL && bip->bi_head != 0 && bip->bi_sec != 0
    925   1.52      fvdl 		    && bip->bi_cyl != 0) {
    926   1.52      fvdl 			heads = bip->bi_head;
    927   1.52      fvdl 			sectors = bip->bi_sec;
    928   1.52      fvdl 			cylinders = bip->bi_cyl;
    929   1.52      fvdl 			biostotal = heads * sectors * cylinders;
    930  1.161  christos 			realtotal = label.d_ntracks * label.d_nsectors *
    931  1.161  christos 			    label.d_ncylinders;
    932   1.52      fvdl 			if (realtotal > biostotal)
    933   1.52      fvdl 				cylinders = realtotal / (heads * sectors);
    934   1.52      fvdl 		} else {
    935  1.161  christos 			heads = label.d_ntracks;
    936  1.161  christos 			cylinders = label.d_ncylinders;
    937  1.161  christos 			sectors = label.d_nsectors;
    938   1.52      fvdl 		}
    939   1.52      fvdl 		if (com == LINUX_HDIO_GETGEO) {
    940  1.168  riastrad 			memset(&hdg, 0, sizeof(hdg));
    941   1.52      fvdl 			hdg.start = start;
    942   1.52      fvdl 			hdg.heads = heads;
    943   1.52      fvdl 			hdg.cylinders = cylinders;
    944   1.52      fvdl 			hdg.sectors = sectors;
    945   1.86      yamt 			error = copyout(&hdg, SCARG(uap, data), sizeof hdg);
    946   1.86      yamt 			goto out;
    947   1.52      fvdl 		} else {
    948  1.168  riastrad 			memset(&hdg_big, 0, sizeof(hdg_big));
    949   1.52      fvdl 			hdg_big.start = start;
    950   1.52      fvdl 			hdg_big.heads = heads;
    951   1.52      fvdl 			hdg_big.cylinders = cylinders;
    952   1.52      fvdl 			hdg_big.sectors = sectors;
    953   1.86      yamt 			error = copyout(&hdg_big, SCARG(uap, data),
    954   1.52      fvdl 			    sizeof hdg_big);
    955   1.86      yamt 			goto out;
    956   1.52      fvdl 		}
    957   1.52      fvdl 
    958   1.13      fvdl 	default:
    959   1.54      fvdl 		/*
    960   1.55      fvdl 		 * Unknown to us. If it's on a device, just pass it through
    961   1.55      fvdl 		 * using PTIOCLINUX, the device itself might be able to
    962   1.55      fvdl 		 * make some sense of it.
    963   1.57      fvdl 		 * XXX hack: if the function returns EJUSTRETURN,
    964   1.57      fvdl 		 * it has stuffed a sysctl return value in pt.data.
    965   1.54      fvdl 		 */
    966   1.55      fvdl 		ioctlf = fp->f_ops->fo_ioctl;
    967   1.55      fvdl 		pt.com = SCARG(uap, com);
    968   1.55      fvdl 		pt.data = SCARG(uap, data);
    969  1.134        ad 		error = ioctlf(fp, PTIOCLINUX, &pt);
    970   1.57      fvdl 		if (error == EJUSTRETURN) {
    971   1.57      fvdl 			retval[0] = (register_t)pt.data;
    972   1.57      fvdl 			error = 0;
    973   1.57      fvdl 		}
    974   1.55      fvdl 
    975  1.115  christos 		if (error == ENOTTY) {
    976   1.72  christos 			DPRINTF(("linux_machdepioctl: invalid ioctl %08lx\n",
    977   1.72  christos 			    com));
    978  1.115  christos 		}
    979   1.86      yamt 		goto out;
    980   1.13      fvdl 	}
    981   1.13      fvdl 	SCARG(&bia, com) = com;
    982   1.86      yamt 	error = sys_ioctl(curlwp, &bia, retval);
    983   1.86      yamt out:
    984  1.134        ad 	fd_putfile(fd);
    985   1.86      yamt 	return error;
    986   1.13      fvdl }
    987   1.13      fvdl 
    988   1.13      fvdl /*
    989   1.13      fvdl  * Set I/O permissions for a process. Just set the maximum level
    990   1.13      fvdl  * right away (ignoring the argument), otherwise we would have
    991   1.13      fvdl  * to rely on I/O permission maps, which are not implemented.
    992   1.13      fvdl  */
    993   1.13      fvdl int
    994  1.133       dsl linux_sys_iopl(struct lwp *l, const struct linux_sys_iopl_args *uap, register_t *retval)
    995   1.19   thorpej {
    996  1.133       dsl 	/* {
    997   1.13      fvdl 		syscallarg(int) level;
    998  1.133       dsl 	} */
    999   1.85   thorpej 	struct trapframe *fp = l->l_md.md_regs;
   1000   1.13      fvdl 
   1001  1.120      elad 	if (kauth_authorize_machdep(l->l_cred, KAUTH_MACHDEP_IOPL,
   1002  1.120      elad 	    NULL, NULL, NULL, NULL) != 0)
   1003   1.13      fvdl 		return EPERM;
   1004   1.13      fvdl 	fp->tf_eflags |= PSL_IOPL;
   1005   1.13      fvdl 	*retval = 0;
   1006   1.13      fvdl 	return 0;
   1007   1.13      fvdl }
   1008   1.13      fvdl 
   1009   1.13      fvdl /*
   1010   1.13      fvdl  * See above. If a root process tries to set access to an I/O port,
   1011   1.13      fvdl  * just let it have the whole range.
   1012   1.13      fvdl  */
   1013   1.13      fvdl int
   1014  1.133       dsl linux_sys_ioperm(struct lwp *l, const struct linux_sys_ioperm_args *uap, register_t *retval)
   1015   1.19   thorpej {
   1016  1.133       dsl 	/* {
   1017   1.13      fvdl 		syscallarg(unsigned int) lo;
   1018   1.13      fvdl 		syscallarg(unsigned int) hi;
   1019   1.13      fvdl 		syscallarg(int) val;
   1020  1.133       dsl 	} */
   1021   1.85   thorpej 	struct trapframe *fp = l->l_md.md_regs;
   1022   1.13      fvdl 
   1023  1.120      elad 	if (kauth_authorize_machdep(l->l_cred, SCARG(uap, val) ?
   1024  1.120      elad 	    KAUTH_MACHDEP_IOPERM_SET : KAUTH_MACHDEP_IOPERM_GET, NULL, NULL,
   1025  1.120      elad 	    NULL, NULL) != 0)
   1026   1.13      fvdl 		return EPERM;
   1027   1.13      fvdl 	if (SCARG(uap, val))
   1028   1.13      fvdl 		fp->tf_eflags |= PSL_IOPL;
   1029   1.13      fvdl 	*retval = 0;
   1030   1.92  christos 	return 0;
   1031   1.92  christos }
   1032  1.107      fvdl 
   1033  1.107      fvdl int
   1034  1.119  christos linux_usertrap(struct lwp *l, vaddr_t trapaddr,
   1035  1.119  christos     void *arg)
   1036  1.107      fvdl {
   1037  1.107      fvdl 	return 0;
   1038  1.107      fvdl }
   1039  1.125  christos 
   1040  1.125  christos const char *
   1041  1.125  christos linux_get_uname_arch(void)
   1042  1.125  christos {
   1043  1.125  christos 	static char uname_arch[5] = "i386";
   1044  1.125  christos 
   1045  1.125  christos 	if (uname_arch[1] == '3')
   1046  1.125  christos 		uname_arch[1] += cpu_class;
   1047  1.125  christos 	return uname_arch;
   1048  1.125  christos }
   1049