Home | History | Annotate | Line # | Download | only in x86
sys_machdep.c revision 1.9
      1  1.9  yamt /*	$NetBSD: sys_machdep.c,v 1.9 2008/01/04 15:55:31 yamt Exp $	*/
      2  1.1    ad 
      3  1.1    ad /*-
      4  1.1    ad  * Copyright (c) 1998, 2007 The NetBSD Foundation, Inc.
      5  1.1    ad  * All rights reserved.
      6  1.1    ad  *
      7  1.1    ad  * This code is derived from software contributed to The NetBSD Foundation
      8  1.1    ad  * by Charles M. Hannum, and by Andrew Doran.
      9  1.1    ad  *
     10  1.1    ad  * Redistribution and use in source and binary forms, with or without
     11  1.1    ad  * modification, are permitted provided that the following conditions
     12  1.1    ad  * are met:
     13  1.1    ad  * 1. Redistributions of source code must retain the above copyright
     14  1.1    ad  *    notice, this list of conditions and the following disclaimer.
     15  1.1    ad  * 2. Redistributions in binary form must reproduce the above copyright
     16  1.1    ad  *    notice, this list of conditions and the following disclaimer in the
     17  1.1    ad  *    documentation and/or other materials provided with the distribution.
     18  1.1    ad  * 3. All advertising materials mentioning features or use of this software
     19  1.1    ad  *    must display the following acknowledgement:
     20  1.1    ad  *        This product includes software developed by the NetBSD
     21  1.1    ad  *        Foundation, Inc. and its contributors.
     22  1.1    ad  * 4. Neither the name of The NetBSD Foundation nor the names of its
     23  1.1    ad  *    contributors may be used to endorse or promote products derived
     24  1.1    ad  *    from this software without specific prior written permission.
     25  1.1    ad  *
     26  1.1    ad  * THIS SOFTWARE IS PROVIDED BY THE NETBSD FOUNDATION, INC. AND CONTRIBUTORS
     27  1.1    ad  * ``AS IS'' AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED
     28  1.1    ad  * TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR
     29  1.1    ad  * PURPOSE ARE DISCLAIMED.  IN NO EVENT SHALL THE FOUNDATION OR CONTRIBUTORS
     30  1.1    ad  * BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
     31  1.1    ad  * CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
     32  1.1    ad  * SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS
     33  1.1    ad  * INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN
     34  1.1    ad  * CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE)
     35  1.1    ad  * ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE
     36  1.1    ad  * POSSIBILITY OF SUCH DAMAGE.
     37  1.1    ad  */
     38  1.1    ad 
     39  1.1    ad #include <sys/cdefs.h>
     40  1.9  yamt __KERNEL_RCSID(0, "$NetBSD: sys_machdep.c,v 1.9 2008/01/04 15:55:31 yamt Exp $");
     41  1.1    ad 
     42  1.1    ad #include "opt_compat_netbsd.h"
     43  1.1    ad #include "opt_mtrr.h"
     44  1.1    ad #include "opt_perfctrs.h"
     45  1.1    ad #include "opt_user_ldt.h"
     46  1.1    ad #include "opt_vm86.h"
     47  1.1    ad #include "opt_xen.h"
     48  1.1    ad 
     49  1.1    ad #include <sys/param.h>
     50  1.1    ad #include <sys/systm.h>
     51  1.1    ad #include <sys/ioctl.h>
     52  1.1    ad #include <sys/file.h>
     53  1.1    ad #include <sys/time.h>
     54  1.1    ad #include <sys/proc.h>
     55  1.1    ad #include <sys/user.h>
     56  1.1    ad #include <sys/uio.h>
     57  1.1    ad #include <sys/kernel.h>
     58  1.1    ad #include <sys/buf.h>
     59  1.1    ad #include <sys/signal.h>
     60  1.1    ad #include <sys/malloc.h>
     61  1.9  yamt #include <sys/kmem.h>
     62  1.1    ad #include <sys/kauth.h>
     63  1.1    ad 
     64  1.1    ad #include <sys/mount.h>
     65  1.1    ad #include <sys/syscallargs.h>
     66  1.1    ad 
     67  1.1    ad #include <uvm/uvm_extern.h>
     68  1.1    ad 
     69  1.1    ad #include <machine/cpu.h>
     70  1.1    ad #include <machine/cpufunc.h>
     71  1.1    ad #include <machine/gdt.h>
     72  1.1    ad #include <machine/psl.h>
     73  1.1    ad #include <machine/reg.h>
     74  1.1    ad #include <machine/sysarch.h>
     75  1.1    ad #include <machine/mtrr.h>
     76  1.1    ad 
     77  1.1    ad #ifdef __x86_64__
     78  1.1    ad /* Need to be checked. */
     79  1.1    ad #undef	USER_LDT
     80  1.1    ad #undef	PERFCTRS
     81  1.1    ad #undef	VM86
     82  1.1    ad #undef	IOPERM
     83  1.1    ad #else
     84  1.9  yamt #if defined(XEN)
     85  1.9  yamt #undef	IOPERM
     86  1.9  yamt #else /* defined(XEN) */
     87  1.1    ad #define	IOPERM
     88  1.9  yamt #endif /* defined(XEN) */
     89  1.1    ad #endif
     90  1.1    ad 
     91  1.1    ad #ifdef VM86
     92  1.1    ad #include <machine/vm86.h>
     93  1.1    ad #endif
     94  1.1    ad 
     95  1.1    ad #ifdef PERFCTRS
     96  1.1    ad #include <machine/pmc.h>
     97  1.1    ad #endif
     98  1.1    ad 
     99  1.3    ad /* XXX needs changes from vmlocking branch */
    100  1.3    ad #define	mutex_enter(x)	/* nothing */
    101  1.3    ad #define	mutex_exit(x)	/* nothing */
    102  1.3    ad 
    103  1.1    ad extern struct vm_map *kernel_map;
    104  1.1    ad 
    105  1.1    ad int x86_get_ioperm(struct lwp *, void *, register_t *);
    106  1.1    ad int x86_set_ioperm(struct lwp *, void *, register_t *);
    107  1.1    ad int x86_get_mtrr(struct lwp *, void *, register_t *);
    108  1.1    ad int x86_set_mtrr(struct lwp *, void *, register_t *);
    109  1.5    ad int x86_set_sdbase(void *arg, char which);
    110  1.5    ad int x86_get_sdbase(void *arg, char which);
    111  1.1    ad 
#ifdef LDT_DEBUG
static void x86_print_ldt(int, const struct segment_descriptor *);

/*
 * Debug aid, only built with LDT_DEBUG: print every field of one segment
 * descriptor on a single line, tagged with the caller-supplied index.
 */
static void
x86_print_ldt(int idx, const struct segment_descriptor *desc)
{
	printf("[%d] lolimit=0x%x, lobase=0x%x, type=%u, dpl=%u, p=%u, "
	    "hilimit=0x%x, xx=%x, def32=%u, gran=%u, hibase=0x%x\n",
	    idx,
	    desc->sd_lolimit, desc->sd_lobase,
	    desc->sd_type, desc->sd_dpl, desc->sd_p,
	    desc->sd_hilimit, desc->sd_xx,
	    desc->sd_def32, desc->sd_gran, desc->sd_hibase);
}
#endif
    124  1.1    ad 
/*
 * Report how many descriptors the LDT of l's process holds: the pmap's
 * pm_ldt_len when PMF_USER_LDT is set on it, NLDT otherwise.
 * Kernels built without USER_LDT always return -1.
 */
int
x86_get_ldt_len(struct lwp *l)
{
#ifndef USER_LDT
	return -1;
#else
	pmap_t pm = l->l_proc->p_vmspace->vm_map.pmap;
	int len;

	mutex_enter(&pm->pm_lock);
	len = (pm->pm_flags & PMF_USER_LDT) ? pm->pm_ldt_len : NLDT;
	mutex_exit(&pm->pm_lock);

	return len;
#endif
}
    145  1.2   dsl 
    146  1.2   dsl 
    147  1.2   dsl int
    148  1.1    ad x86_get_ldt(struct lwp *l, void *args, register_t *retval)
    149  1.1    ad {
    150  1.2   dsl #ifndef USER_LDT
    151  1.2   dsl 	return EINVAL;
    152  1.2   dsl #else
    153  1.2   dsl 	struct x86_get_ldt_args ua;
    154  1.2   dsl 	union descriptor *cp;
    155  1.2   dsl 	int error;
    156  1.2   dsl 
    157  1.2   dsl 	if ((error = copyin(args, &ua, sizeof(ua))) != 0)
    158  1.2   dsl 		return error;
    159  1.2   dsl 
    160  1.2   dsl 	if (ua.num < 0 || ua.num > 8192)
    161  1.2   dsl 		return EINVAL;
    162  1.2   dsl 
    163  1.2   dsl 	cp = malloc(ua.num * sizeof(union descriptor), M_TEMP, M_WAITOK);
    164  1.2   dsl 	if (cp == NULL)
    165  1.2   dsl 		return ENOMEM;
    166  1.2   dsl 
    167  1.2   dsl 	error = x86_get_ldt1(l, &ua, cp);
    168  1.2   dsl 	*retval = ua.num;
    169  1.2   dsl 	if (error == 0)
    170  1.2   dsl 		error = copyout(cp, ua.desc, ua.num * sizeof(*cp));
    171  1.2   dsl 
    172  1.2   dsl 	free(cp, M_TEMP);
    173  1.2   dsl 	return error;
    174  1.2   dsl #endif
    175  1.2   dsl }
    176  1.2   dsl 
/*
 * Kernel-side worker for x86_get_ldt().
 *
 * After a kauth check, copies up to ua->num descriptors starting at index
 * ua->start from the process's LDT (its private one when PMF_USER_LDT is
 * set, otherwise the global `ldt') into cp.  ua->num is rewritten with the
 * number of descriptors actually copied.  Returns 0 or an errno value;
 * EINVAL when built without USER_LDT.
 */
int
x86_get_ldt1(struct lwp *l, struct x86_get_ldt_args *ua, union descriptor *cp)
{
#ifndef USER_LDT
	return EINVAL;
#else
	pmap_t pm = l->l_proc->p_vmspace->vm_map.pmap;
	union descriptor *src;
	int rv, limit, count;

	rv = kauth_authorize_machdep(l->l_cred, KAUTH_MACHDEP_LDT_GET,
	    NULL, NULL, NULL, NULL);
	if (rv != 0)
		return rv;

#ifdef	LDT_DEBUG
	printf("x86_get_ldt: start=%d num=%d descs=%p\n", ua->start,
	    ua->num, ua->desc);
#endif

	/*
	 * Both values are range-checked individually first, so the sum
	 * below cannot overflow.
	 */
	if (ua->start < 0 || ua->start > 8192)
		return EINVAL;
	if (ua->num < 0 || ua->num > 8192)
		return EINVAL;
	if (ua->start + ua->num > 8192)
		return EINVAL;

	mutex_enter(&pm->pm_lock);

	if (pm->pm_flags & PMF_USER_LDT) {
		limit = pm->pm_ldt_len;
		src = pm->pm_ldt;
	} else {
		limit = NLDT;
		src = ldt;
	}

	if (ua->start > limit) {
		mutex_exit(&pm->pm_lock);
		return EINVAL;
	}

	/* Clamp the request to what the table actually holds. */
	src += ua->start;
	count = min(ua->num, limit - ua->start);
	ua->num = count;
#ifdef LDT_DEBUG
	{
		int k;

		for (k = 0; k < count; k++)
			x86_print_ldt(k, &src[k].sd);
	}
#endif

	memcpy(cp, src, count * sizeof(union descriptor));
	mutex_exit(&pm->pm_lock);

	return 0;
#endif
}
    235  1.2   dsl 
    236  1.2   dsl int
    237  1.2   dsl x86_set_ldt(struct lwp *l, void *args, register_t *retval)
    238  1.2   dsl {
    239  1.2   dsl #ifndef USER_LDT
    240  1.2   dsl 	return EINVAL;
    241  1.2   dsl #else
    242  1.2   dsl 	struct x86_set_ldt_args ua;
    243  1.2   dsl 	union descriptor *descv;
    244  1.2   dsl 	int error;
    245  1.2   dsl 
    246  1.2   dsl 	if ((error = copyin(args, &ua, sizeof(ua))) != 0)
    247  1.2   dsl 		return (error);
    248  1.2   dsl 
    249  1.2   dsl 	if (ua.num < 0 || ua.num > 8192)
    250  1.2   dsl 		return EINVAL;
    251  1.2   dsl 
    252  1.2   dsl 	descv = malloc(sizeof (*descv) * ua.num, M_TEMP, M_NOWAIT);
    253  1.2   dsl 	if (descv == NULL)
    254  1.2   dsl 		return ENOMEM;
    255  1.2   dsl 
    256  1.2   dsl 	error = copyin(ua.desc, descv, sizeof (*descv) * ua.num);
    257  1.1    ad 	if (error == 0)
    258  1.2   dsl 		error = x86_set_ldt1(l, &ua, descv);
    259  1.2   dsl 	*retval = ua.start;
    260  1.1    ad 
    261  1.2   dsl 	free(descv, M_TEMP);
    262  1.2   dsl 	return error;
    263  1.1    ad #endif
    264  1.1    ad }
    265  1.1    ad 
/*
 * Kernel-side worker for x86_set_ldt().
 *
 * After a kauth check, validates the ua->num descriptors in descv and
 * stores them into the process's LDT at indices ua->start onwards.  If the
 * process has no private LDT yet, or the current one is too short, a new
 * table is allocated (doubling from the current length, or from 512
 * entries), the old contents are copied over, and the pmap/pcb are switched
 * to the new table.
 *
 * descv may be modified: SDT_SYSNULL entries get their present bit cleared.
 *
 * Returns 0 on success, EACCES if a descriptor fails validation, ENOMEM if
 * the new table cannot be allocated, EINVAL for an out-of-range request or
 * when built without USER_LDT, or the kauth error.
 */
int
x86_set_ldt1(struct lwp *l, struct x86_set_ldt_args *ua,
    union descriptor *descv)
{
#ifndef USER_LDT
	return EINVAL;
#else
	int error, i, n, sel, free_sel;
	struct proc *p = l->l_proc;
	struct pcb *pcb = &l->l_addr->u_pcb;
	pmap_t pmap = p->p_vmspace->vm_map.pmap;
	size_t old_len, new_len, ldt_len, free_len;
	union descriptor *old_ldt, *new_ldt, *free_ldt;

	error = kauth_authorize_machdep(l->l_cred, KAUTH_MACHDEP_LDT_SET,
	    NULL, NULL, NULL, NULL);
	if (error)
		return (error);

	/*
	 * start and num are each bounded before being added, so the sum
	 * cannot overflow.
	 */
	if (ua->start < 0 || ua->num < 0 || ua->start > 8192 || ua->num > 8192 ||
	    ua->start + ua->num > 8192)
		return (EINVAL);

	/* Check descriptors for access violations. */
	for (i = 0; i < ua->num; i++) {
		union descriptor *desc = &descv[i];

		switch (desc->sd.sd_type) {
		case SDT_SYSNULL:
			desc->sd.sd_p = 0;
			break;
		case SDT_SYS286CGT:
		case SDT_SYS386CGT:
			/*
			 * Only allow call gates targeting a segment
			 * in the LDT or a user segment in the fixed
			 * part of the gdt.  Segments in the LDT are
			 * constrained (below) to be user segments.
			 */
			if (desc->gd.gd_p != 0 &&
			    !ISLDT(desc->gd.gd_selector) &&
			    ((IDXSEL(desc->gd.gd_selector) >= NGDT) ||
			     (gdt[IDXSEL(desc->gd.gd_selector)].sd.sd_dpl !=
				 SEL_UPL))) {
				return EACCES;
			}
			break;
		case SDT_MEMEC:
		case SDT_MEMEAC:
		case SDT_MEMERC:
		case SDT_MEMERAC:
			/* Must be "present" if executable and conforming. */
			if (desc->sd.sd_p == 0)
				return EACCES;
			break;
		case SDT_MEMRO:
		case SDT_MEMROA:
		case SDT_MEMRW:
		case SDT_MEMRWA:
		case SDT_MEMROD:
		case SDT_MEMRODA:
		case SDT_MEMRWD:
		case SDT_MEMRWDA:
		case SDT_MEME:
		case SDT_MEMEA:
		case SDT_MEMER:
		case SDT_MEMERA:
			break;
		default:
			/*
			 * Make sure that unknown descriptor types are
			 * not marked present.
			 */
			if (desc->sd.sd_p != 0)
				return EACCES;
			break;
		}

		if (desc->sd.sd_p != 0) {
			/* Only user (ring-3) descriptors may be present. */
			if (desc->sd.sd_dpl != SEL_UPL)
				return EACCES;
		}
	}

	/* allocate user ldt */
	free_sel = -1;
	new_ldt = NULL;
	new_len = 0;
	free_ldt = NULL;
	free_len = 0;
	mutex_enter(&pmap->pm_lock);
	if (pmap->pm_ldt == 0 || (ua->start + ua->num) > pmap->pm_ldt_len) {
		if (pmap->pm_flags & PMF_USER_LDT)
			ldt_len = pmap->pm_ldt_len;
		else
			ldt_len = 512;
		while ((ua->start + ua->num) > ldt_len)
			ldt_len *= 2;
		new_len = ldt_len * sizeof(union descriptor);

		mutex_exit(&pmap->pm_lock);
		new_ldt = (union descriptor *)uvm_km_alloc(kernel_map,
		    new_len, 0, UVM_KMF_WIRED);
		if (new_ldt == NULL) {
			/*
			 * Nothing has been changed yet and the lock is not
			 * held, so it is safe to bail out directly.
			 */
			return ENOMEM;
		}
		memset(new_ldt, 0, new_len);
		sel = ldt_alloc(new_ldt, new_len);
		mutex_enter(&pmap->pm_lock);

		if (pmap->pm_ldt != NULL && ldt_len <= pmap->pm_ldt_len) {
			/*
			 * Another thread (re)allocated the LDT to
			 * sufficient size while we were blocked in
			 * uvm_km_alloc. Oh well. The new entries
			 * will quite probably not be right, but
			 * hey.. not our problem if user applications
			 * have race conditions like that.
			 *
			 * Our freshly allocated table is discarded below;
			 * release the selector that refers to it as well,
			 * otherwise the slot leaks and keeps pointing at
			 * freed memory.
			 */
			free_sel = sel;
			goto copy;
		}

		old_ldt = pmap->pm_ldt;
		free_ldt = old_ldt;
		free_len = pmap->pm_ldt_len * sizeof(union descriptor);

		if (old_ldt != NULL) {
			old_len = pmap->pm_ldt_len * sizeof(union descriptor);
		} else {
			/* No private table yet: seed from the global ldt. */
			old_len = NLDT * sizeof(union descriptor);
			old_ldt = ldt;
		}

		memcpy(new_ldt, old_ldt, old_len);
		memset((char *)new_ldt + old_len, 0, new_len - old_len);

		pmap->pm_ldt = new_ldt;
		pmap->pm_ldt_len = ldt_len;

		if (pmap->pm_flags & PMF_USER_LDT)
			free_sel = pmap->pm_ldt_sel;
		else {
			pmap->pm_flags |= PMF_USER_LDT;
			free_sel = -1;
		}
		pmap->pm_ldt_sel = sel;
		pcb->pcb_ldt_sel = pmap->pm_ldt_sel;
		if (pcb == curpcb)
			lldt(pcb->pcb_ldt_sel);
		/* Ownership moved to the pmap; do not free it below. */
		new_ldt = NULL;
	}
copy:
	/* Now actually replace the descriptors. */
	for (i = 0, n = ua->start; i < ua->num; i++, n++)
		pmap->pm_ldt[n] = descv[i];

	mutex_exit(&pmap->pm_lock);

	/*
	 * Release the unused selector before the memory it may describe,
	 * then whichever tables are no longer referenced.
	 */
	if (free_sel != -1)
		ldt_free(free_sel);
	if (new_ldt != NULL)
		uvm_km_free(kernel_map, (vaddr_t)new_ldt, new_len,
		    UVM_KMF_WIRED);
	if (free_ldt != NULL)
		uvm_km_free(kernel_map, (vaddr_t)free_ldt, free_len,
		    UVM_KMF_WIRED);

	return (error);
#endif
}
    434  1.1    ad 
    435  1.1    ad int
    436  1.1    ad x86_iopl(struct lwp *l, void *args, register_t *retval)
    437  1.1    ad {
    438  1.1    ad 	int error;
    439  1.1    ad 	struct x86_iopl_args ua;
    440  1.1    ad #ifdef XEN
    441  1.9  yamt 	int iopl;
    442  1.1    ad #else
    443  1.1    ad 	struct trapframe *tf = l->l_md.md_regs;
    444  1.1    ad #endif
    445  1.1    ad 
    446  1.1    ad 	error = kauth_authorize_machdep(l->l_cred, KAUTH_MACHDEP_IOPL,
    447  1.1    ad 	    NULL, NULL, NULL, NULL);
    448  1.1    ad 	if (error)
    449  1.1    ad 		return (error);
    450  1.1    ad 
    451  1.1    ad 	if ((error = copyin(args, &ua, sizeof(ua))) != 0)
    452  1.1    ad 		return error;
    453  1.1    ad 
    454  1.1    ad #ifdef XEN
    455  1.9  yamt 	if (ua.iopl)
    456  1.9  yamt 		iopl = SEL_UPL;
    457  1.9  yamt 	else
    458  1.9  yamt 		iopl = SEL_KPL;
    459  1.1    ad 	/* Force the change at ring 0. */
    460  1.1    ad #ifdef XEN3
    461  1.1    ad 	{
    462  1.1    ad 		struct physdev_op physop;
    463  1.1    ad 		physop.cmd = PHYSDEVOP_SET_IOPL;
    464  1.9  yamt 		physop.u.set_iopl.iopl = iopl;
    465  1.1    ad 		HYPERVISOR_physdev_op(&physop);
    466  1.1    ad 	}
    467  1.1    ad #else /* XEN3 */
    468  1.1    ad 	{
    469  1.1    ad 		dom0_op_t op;
    470  1.1    ad 		op.cmd = DOM0_IOPL;
    471  1.1    ad 		op.u.iopl.domain = DOMID_SELF;
    472  1.9  yamt 		op.u.iopl.iopl = iopl;
    473  1.1    ad 		HYPERVISOR_dom0_op(&op);
    474  1.1    ad 	}
    475  1.1    ad #endif /* XEN3 */
    476  1.1    ad #elif defined(__x86_64__)
    477  1.1    ad 	if (ua.iopl)
    478  1.1    ad 		tf->tf_rflags |= PSL_IOPL;
    479  1.1    ad 	else
    480  1.1    ad 		tf->tf_rflags &= ~PSL_IOPL;
    481  1.1    ad #else
    482  1.1    ad 	if (ua.iopl)
    483  1.1    ad 		tf->tf_eflags |= PSL_IOPL;
    484  1.1    ad 	else
    485  1.1    ad 		tf->tf_eflags &= ~PSL_IOPL;
    486  1.1    ad #endif
    487  1.1    ad 
    488  1.1    ad 	return 0;
    489  1.1    ad }
    490  1.1    ad 
    491  1.1    ad int
    492  1.1    ad x86_get_ioperm(struct lwp *l, void *args, register_t *retval)
    493  1.1    ad {
    494  1.1    ad #ifdef IOPERM
    495  1.1    ad 	int error;
    496  1.1    ad 	struct pcb *pcb = &l->l_addr->u_pcb;
    497  1.1    ad 	struct x86_get_ioperm_args ua;
    498  1.9  yamt 	void *dummymap = NULL;
    499  1.9  yamt 	void *iomap;
    500  1.1    ad 
    501  1.1    ad 	error = kauth_authorize_machdep(l->l_cred, KAUTH_MACHDEP_IOPERM_GET,
    502  1.1    ad 	    NULL, NULL, NULL, NULL);
    503  1.1    ad 	if (error)
    504  1.1    ad 		return (error);
    505  1.1    ad 
    506  1.1    ad 	if ((error = copyin(args, &ua, sizeof(ua))) != 0)
    507  1.1    ad 		return (error);
    508  1.1    ad 
    509  1.9  yamt 	iomap = pcb->pcb_iomap;
    510  1.9  yamt 	if (iomap == NULL) {
    511  1.9  yamt 		iomap = dummymap = kmem_alloc(IOMAPSIZE, KM_SLEEP);
    512  1.9  yamt 		memset(dummymap, 0xff, IOMAPSIZE);
    513  1.9  yamt 	}
    514  1.9  yamt 	error = copyout(iomap, ua.iomap, IOMAPSIZE);
    515  1.9  yamt 	if (dummymap != NULL) {
    516  1.9  yamt 		kmem_free(dummymap, IOMAPSIZE);
    517  1.9  yamt 	}
    518  1.9  yamt 	return error;
    519  1.1    ad #else
    520  1.1    ad 	return EINVAL;
    521  1.1    ad #endif
    522  1.1    ad }
    523  1.1    ad 
    524  1.1    ad int
    525  1.1    ad x86_set_ioperm(struct lwp *l, void *args, register_t *retval)
    526  1.1    ad {
    527  1.1    ad #ifdef IOPERM
    528  1.9  yamt 	struct cpu_info *ci;
    529  1.1    ad 	int error;
    530  1.1    ad 	struct pcb *pcb = &l->l_addr->u_pcb;
    531  1.1    ad 	struct x86_set_ioperm_args ua;
    532  1.9  yamt 	void *new;
    533  1.9  yamt 	void *old;
    534  1.1    ad 
    535  1.1    ad   	error = kauth_authorize_machdep(l->l_cred, KAUTH_MACHDEP_IOPERM_SET,
    536  1.1    ad 	    NULL, NULL, NULL, NULL);
    537  1.1    ad 	if (error)
    538  1.1    ad 		return (error);
    539  1.1    ad 
    540  1.1    ad 	if ((error = copyin(args, &ua, sizeof(ua))) != 0)
    541  1.1    ad 		return (error);
    542  1.1    ad 
    543  1.9  yamt 	new = kmem_alloc(IOMAPSIZE, KM_SLEEP);
    544  1.9  yamt 	error = copyin(ua.iomap, new, IOMAPSIZE);
    545  1.9  yamt 	if (error) {
    546  1.9  yamt 		kmem_free(new, IOMAPSIZE);
    547  1.9  yamt 		return error;
    548  1.9  yamt 	}
    549  1.9  yamt 	old = pcb->pcb_iomap;
    550  1.9  yamt 	pcb->pcb_iomap = new;
    551  1.9  yamt 	if (old != NULL) {
    552  1.9  yamt 		kmem_free(old, IOMAPSIZE);
    553  1.9  yamt 	}
    554  1.9  yamt 
    555  1.9  yamt 	crit_enter();
    556  1.9  yamt 	ci = curcpu();
    557  1.9  yamt 	memcpy(ci->ci_iomap, pcb->pcb_iomap, sizeof(ci->ci_iomap));
    558  1.9  yamt 	ci->ci_tss.tss_iobase =
    559  1.9  yamt 	    ((uintptr_t)ci->ci_iomap - (uintptr_t)&ci->ci_tss) << 16;
    560  1.9  yamt 	crit_exit();
    561  1.9  yamt 
    562  1.9  yamt 	return error;
    563  1.1    ad #else
    564  1.1    ad 	return EINVAL;
    565  1.1    ad #endif
    566  1.1    ad }
    567  1.1    ad 
    568  1.1    ad int
    569  1.1    ad x86_get_mtrr(struct lwp *l, void *args, register_t *retval)
    570  1.1    ad {
    571  1.1    ad #ifdef MTRR
    572  1.1    ad 	struct x86_get_mtrr_args ua;
    573  1.1    ad 	int error, n;
    574  1.1    ad 
    575  1.1    ad 	if (mtrr_funcs == NULL)
    576  1.1    ad 		return ENOSYS;
    577  1.1    ad 
    578  1.1    ad  	error = kauth_authorize_machdep(l->l_cred, KAUTH_MACHDEP_MTRR_GET,
    579  1.1    ad 	    NULL, NULL, NULL, NULL);
    580  1.1    ad 	if (error)
    581  1.1    ad 		return (error);
    582  1.1    ad 
    583  1.1    ad 	error = copyin(args, &ua, sizeof ua);
    584  1.1    ad 	if (error != 0)
    585  1.1    ad 		return error;
    586  1.1    ad 
    587  1.1    ad 	error = copyin(ua.n, &n, sizeof n);
    588  1.1    ad 	if (error != 0)
    589  1.1    ad 		return error;
    590  1.1    ad 
    591  1.1    ad 	error = mtrr_get(ua.mtrrp, &n, l->l_proc, MTRR_GETSET_USER);
    592  1.1    ad 
    593  1.1    ad 	copyout(&n, ua.n, sizeof (int));
    594  1.1    ad 
    595  1.1    ad 	return error;
    596  1.1    ad #else
    597  1.1    ad 	return EINVAL;
    598  1.1    ad #endif
    599  1.1    ad }
    600  1.1    ad 
    601  1.1    ad int
    602  1.1    ad x86_set_mtrr(struct lwp *l, void *args, register_t *retval)
    603  1.1    ad {
    604  1.1    ad #ifdef MTRR
    605  1.1    ad 	int error, n;
    606  1.1    ad 	struct x86_set_mtrr_args ua;
    607  1.1    ad 
    608  1.1    ad 	if (mtrr_funcs == NULL)
    609  1.1    ad 		return ENOSYS;
    610  1.1    ad 
    611  1.1    ad  	error = kauth_authorize_machdep(l->l_cred, KAUTH_MACHDEP_MTRR_SET,
    612  1.1    ad 	    NULL, NULL, NULL, NULL);
    613  1.1    ad 	if (error)
    614  1.1    ad 		return (error);
    615  1.1    ad 
    616  1.1    ad 	error = copyin(args, &ua, sizeof ua);
    617  1.1    ad 	if (error != 0)
    618  1.1    ad 		return error;
    619  1.1    ad 
    620  1.1    ad 	error = copyin(ua.n, &n, sizeof n);
    621  1.1    ad 	if (error != 0)
    622  1.1    ad 		return error;
    623  1.1    ad 
    624  1.1    ad 	error = mtrr_set(ua.mtrrp, &n, l->l_proc, MTRR_GETSET_USER);
    625  1.1    ad 	if (n != 0)
    626  1.1    ad 		mtrr_commit();
    627  1.1    ad 
    628  1.1    ad 	copyout(&n, ua.n, sizeof n);
    629  1.1    ad 
    630  1.1    ad 	return error;
    631  1.1    ad #else
    632  1.1    ad 	return EINVAL;
    633  1.1    ad #endif
    634  1.1    ad }
    635  1.1    ad 
/*
 * Set the base address of the current lwp's %fs or %gs user segment.
 *
 * arg is a user pointer to the new base (a vaddr_t).  `which' selects the
 * segment: 'f' updates pcb_fsd and the GUFS_SEL GDT slot, any other value
 * updates pcb_gsd and the GUGS_SEL GDT slot.  Returns 0 or the copyin
 * error; EINVAL when not built for i386.
 */
int
x86_set_sdbase(void *arg, char which)
{
#ifndef i386
	return EINVAL;
#else
	struct segment_descriptor sd;
	void *pcb_slot, *gdt_slot;
	vaddr_t base;
	int error;

	error = copyin(arg, &base, sizeof(base));
	if (error != 0)
		return error;

	/* Read/write, accessed, ring-3, present, 32-bit, page-granular. */
	sd.sd_type = SDT_MEMRWA;
	sd.sd_dpl = SEL_UPL;
	sd.sd_p = 1;
	sd.sd_xx = 0;
	sd.sd_def32 = 1;
	sd.sd_gran = 1;
	/* Maximum limit. */
	sd.sd_lolimit = 0xffff;
	sd.sd_hilimit = 0xf;
	/* The base is split into a 24-bit low part and an 8-bit high part. */
	sd.sd_lobase = base & 0xffffff;
	sd.sd_hibase = (base >> 24) & 0xff;

	crit_enter();
	if (which == 'f') {
		pcb_slot = &curpcb->pcb_fsd;
		gdt_slot = &curcpu()->ci_gdt[GUFS_SEL];
	} else /* which == 'g' */ {
		pcb_slot = &curpcb->pcb_gsd;
		gdt_slot = &curcpu()->ci_gdt[GUGS_SEL];
	}
	memcpy(pcb_slot, &sd, sizeof(sd));
	memcpy(gdt_slot, &sd, sizeof(sd));
	crit_exit();

	return 0;
#endif
}
    674  1.5    ad 
/*
 * Report the base address of the current lwp's %fs or %gs user segment.
 *
 * arg is a user pointer that receives the base (a vaddr_t).  `which' must
 * be 'f' (read pcb_fsd) or 'g' (read pcb_gsd); anything else panics.
 * Returns the copyout() result; EINVAL when not built for i386.
 */
int
x86_get_sdbase(void *arg, char which)
{
#ifdef i386
	struct segment_descriptor *sd;
	vaddr_t base;

	switch (which) {
	case 'f':
		sd = (struct segment_descriptor *)&curpcb->pcb_fsd;
		break;
	case 'g':
		sd = (struct segment_descriptor *)&curpcb->pcb_gsd;
		break;
	default:
		panic("x86_get_sdbase");
	}

	/*
	 * Widen before shifting: sd_hibase is a narrow bit-field that
	 * promotes to int, so shifting it by 24 directly would overflow
	 * for bases at or above 0x80000000.
	 */
	base = ((vaddr_t)sd->sd_hibase << 24) | (vaddr_t)sd->sd_lobase;

	/* Write to the user's buffer, not to our own parameter slot. */
	return copyout(&base, arg, sizeof(base));
#else
	return EINVAL;
#endif
}
    699  1.5    ad 
    700  1.5    ad int
    701  1.8   dsl sys_sysarch(struct lwp *l, const struct sys_sysarch_args *uap, register_t *retval)
    702  1.1    ad {
    703  1.8   dsl 	/* {
    704  1.1    ad 		syscallarg(int) op;
    705  1.1    ad 		syscallarg(void *) parms;
    706  1.8   dsl 	} */
    707  1.1    ad 	int error = 0;
    708  1.1    ad 
    709  1.1    ad 	switch(SCARG(uap, op)) {
    710  1.1    ad 	case X86_IOPL:
    711  1.1    ad 		error = x86_iopl(l, SCARG(uap, parms), retval);
    712  1.1    ad 		break;
    713  1.1    ad 
    714  1.1    ad 	case X86_GET_LDT:
    715  1.1    ad 		error = x86_get_ldt(l, SCARG(uap, parms), retval);
    716  1.1    ad 		break;
    717  1.1    ad 
    718  1.1    ad 	case X86_SET_LDT:
    719  1.1    ad 		error = x86_set_ldt(l, SCARG(uap, parms), retval);
    720  1.1    ad 		break;
    721  1.1    ad 
    722  1.1    ad 	case X86_GET_IOPERM:
    723  1.1    ad 		error = x86_get_ioperm(l, SCARG(uap, parms), retval);
    724  1.1    ad 		break;
    725  1.1    ad 
    726  1.1    ad 	case X86_SET_IOPERM:
    727  1.1    ad 		error = x86_set_ioperm(l, SCARG(uap, parms), retval);
    728  1.1    ad 		break;
    729  1.1    ad 
    730  1.1    ad 	case X86_GET_MTRR:
    731  1.1    ad 		error = x86_get_mtrr(l, SCARG(uap, parms), retval);
    732  1.1    ad 		break;
    733  1.1    ad 	case X86_SET_MTRR:
    734  1.1    ad 		error = x86_set_mtrr(l, SCARG(uap, parms), retval);
    735  1.1    ad 		break;
    736  1.1    ad 
    737  1.1    ad #ifdef VM86
    738  1.1    ad 	case X86_VM86:
    739  1.1    ad 		error = x86_vm86(l, SCARG(uap, parms), retval);
    740  1.1    ad 		break;
    741  1.1    ad #ifdef COMPAT_16
    742  1.1    ad 	case X86_OLD_VM86:
    743  1.1    ad 		error = compat_16_x86_vm86(l, SCARG(uap, parms), retval);
    744  1.1    ad 		break;
    745  1.1    ad #endif
    746  1.1    ad #endif
    747  1.1    ad 
    748  1.1    ad #ifdef PERFCTRS
    749  1.1    ad 	case X86_PMC_INFO:
    750  1.1    ad 		error = pmc_info(l, SCARG(uap, parms), retval);
    751  1.1    ad 		break;
    752  1.1    ad 
    753  1.1    ad 	case X86_PMC_STARTSTOP:
    754  1.1    ad 		error = pmc_startstop(l, SCARG(uap, parms), retval);
    755  1.1    ad 		break;
    756  1.1    ad 
    757  1.1    ad 	case X86_PMC_READ:
    758  1.1    ad 		error = pmc_read(l, SCARG(uap, parms), retval);
    759  1.1    ad 		break;
    760  1.1    ad #endif
    761  1.1    ad 
    762  1.5    ad 	case X86_SET_FSBASE:
    763  1.5    ad 		error = x86_set_sdbase(SCARG(uap, parms), 'f');
    764  1.5    ad 		break;
    765  1.5    ad 
    766  1.5    ad 	case X86_SET_GSBASE:
    767  1.5    ad 		error = x86_set_sdbase(SCARG(uap, parms), 'g');
    768  1.5    ad 		break;
    769  1.5    ad 
    770  1.5    ad 	case X86_GET_FSBASE:
    771  1.5    ad 		error = x86_get_sdbase(SCARG(uap, parms), 'f');
    772  1.5    ad 		break;
    773  1.5    ad 
    774  1.5    ad 	case X86_GET_GSBASE:
    775  1.5    ad 		error = x86_get_sdbase(SCARG(uap, parms), 'g');
    776  1.5    ad 		break;
    777  1.5    ad 
    778  1.1    ad 	default:
    779  1.1    ad 		error = EINVAL;
    780  1.1    ad 		break;
    781  1.1    ad 	}
    782  1.1    ad 	return (error);
    783  1.1    ad }
    784