Home | History | Annotate | Line # | Download | only in x86
nvmm_x86.c revision 1.18
      1 /*	$NetBSD: nvmm_x86.c,v 1.18 2020/09/05 07:45:44 maxv Exp $	*/
      2 
      3 /*
      4  * Copyright (c) 2018-2020 Maxime Villard, m00nbsd.net
      5  * All rights reserved.
      6  *
      7  * This code is part of the NVMM hypervisor.
      8  *
      9  * Redistribution and use in source and binary forms, with or without
     10  * modification, are permitted provided that the following conditions
     11  * are met:
     12  * 1. Redistributions of source code must retain the above copyright
     13  *    notice, this list of conditions and the following disclaimer.
     14  * 2. Redistributions in binary form must reproduce the above copyright
     15  *    notice, this list of conditions and the following disclaimer in the
     16  *    documentation and/or other materials provided with the distribution.
     17  *
     18  * THIS SOFTWARE IS PROVIDED BY THE AUTHOR ``AS IS'' AND ANY EXPRESS OR
     19  * IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES
     20  * OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE DISCLAIMED.
     21  * IN NO EVENT SHALL THE AUTHOR BE LIABLE FOR ANY DIRECT, INDIRECT,
     22  * INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING,
     23  * BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES;
     24  * LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED
     25  * AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY,
     26  * OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
     27  * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
     28  * SUCH DAMAGE.
     29  */
     30 
     31 #include <sys/cdefs.h>
     32 __KERNEL_RCSID(0, "$NetBSD: nvmm_x86.c,v 1.18 2020/09/05 07:45:44 maxv Exp $");
     33 
     34 #include <sys/param.h>
     35 #include <sys/systm.h>
     36 #include <sys/kernel.h>
     37 #include <sys/cpu.h>
     38 
     39 #include <uvm/uvm.h>
     40 #include <uvm/uvm_page.h>
     41 
     42 #include <x86/cputypes.h>
     43 #include <x86/specialreg.h>
     44 #include <x86/pmap.h>
     45 
     46 #include <dev/nvmm/nvmm.h>
     47 #include <dev/nvmm/nvmm_internal.h>
     48 #include <dev/nvmm/x86/nvmm_x86.h>
     49 
     50 /*
     51  * Code shared between x86-SVM and x86-VMX.
     52  */
     53 
     54 const struct nvmm_x64_state nvmm_x86_reset_state = {
     55 	.segs = {
     56 		[NVMM_X64_SEG_ES] = {
     57 			.selector = 0x0000,
     58 			.base = 0x00000000,
     59 			.limit = 0xFFFF,
     60 			.attrib = {
     61 				.type = 3,
     62 				.s = 1,
     63 				.p = 1,
     64 			}
     65 		},
     66 		[NVMM_X64_SEG_CS] = {
     67 			.selector = 0xF000,
     68 			.base = 0xFFFF0000,
     69 			.limit = 0xFFFF,
     70 			.attrib = {
     71 				.type = 3,
     72 				.s = 1,
     73 				.p = 1,
     74 			}
     75 		},
     76 		[NVMM_X64_SEG_SS] = {
     77 			.selector = 0x0000,
     78 			.base = 0x00000000,
     79 			.limit = 0xFFFF,
     80 			.attrib = {
     81 				.type = 3,
     82 				.s = 1,
     83 				.p = 1,
     84 			}
     85 		},
     86 		[NVMM_X64_SEG_DS] = {
     87 			.selector = 0x0000,
     88 			.base = 0x00000000,
     89 			.limit = 0xFFFF,
     90 			.attrib = {
     91 				.type = 3,
     92 				.s = 1,
     93 				.p = 1,
     94 			}
     95 		},
     96 		[NVMM_X64_SEG_FS] = {
     97 			.selector = 0x0000,
     98 			.base = 0x00000000,
     99 			.limit = 0xFFFF,
    100 			.attrib = {
    101 				.type = 3,
    102 				.s = 1,
    103 				.p = 1,
    104 			}
    105 		},
    106 		[NVMM_X64_SEG_GS] = {
    107 			.selector = 0x0000,
    108 			.base = 0x00000000,
    109 			.limit = 0xFFFF,
    110 			.attrib = {
    111 				.type = 3,
    112 				.s = 1,
    113 				.p = 1,
    114 			}
    115 		},
    116 		[NVMM_X64_SEG_GDT] = {
    117 			.selector = 0x0000,
    118 			.base = 0x00000000,
    119 			.limit = 0xFFFF,
    120 			.attrib = {
    121 				.type = 2,
    122 				.s = 1,
    123 				.p = 1,
    124 			}
    125 		},
    126 		[NVMM_X64_SEG_IDT] = {
    127 			.selector = 0x0000,
    128 			.base = 0x00000000,
    129 			.limit = 0xFFFF,
    130 			.attrib = {
    131 				.type = 2,
    132 				.s = 1,
    133 				.p = 1,
    134 			}
    135 		},
    136 		[NVMM_X64_SEG_LDT] = {
    137 			.selector = 0x0000,
    138 			.base = 0x00000000,
    139 			.limit = 0xFFFF,
    140 			.attrib = {
    141 				.type = SDT_SYSLDT,
    142 				.s = 0,
    143 				.p = 1,
    144 			}
    145 		},
    146 		[NVMM_X64_SEG_TR] = {
    147 			.selector = 0x0000,
    148 			.base = 0x00000000,
    149 			.limit = 0xFFFF,
    150 			.attrib = {
    151 				.type = SDT_SYS286BSY,
    152 				.s = 0,
    153 				.p = 1,
    154 			}
    155 		},
    156 	},
    157 
    158 	.gprs = {
    159 		[NVMM_X64_GPR_RAX] = 0x00000000,
    160 		[NVMM_X64_GPR_RCX] = 0x00000000,
    161 		[NVMM_X64_GPR_RDX] = 0x00000600,
    162 		[NVMM_X64_GPR_RBX] = 0x00000000,
    163 		[NVMM_X64_GPR_RSP] = 0x00000000,
    164 		[NVMM_X64_GPR_RBP] = 0x00000000,
    165 		[NVMM_X64_GPR_RSI] = 0x00000000,
    166 		[NVMM_X64_GPR_RDI] = 0x00000000,
    167 		[NVMM_X64_GPR_R8] = 0x00000000,
    168 		[NVMM_X64_GPR_R9] = 0x00000000,
    169 		[NVMM_X64_GPR_R10] = 0x00000000,
    170 		[NVMM_X64_GPR_R11] = 0x00000000,
    171 		[NVMM_X64_GPR_R12] = 0x00000000,
    172 		[NVMM_X64_GPR_R13] = 0x00000000,
    173 		[NVMM_X64_GPR_R14] = 0x00000000,
    174 		[NVMM_X64_GPR_R15] = 0x00000000,
    175 		[NVMM_X64_GPR_RIP] = 0x0000FFF0,
    176 		[NVMM_X64_GPR_RFLAGS] = 0x00000002,
    177 	},
    178 
    179 	.crs = {
    180 		[NVMM_X64_CR_CR0] = 0x60000010,
    181 		[NVMM_X64_CR_CR2] = 0x00000000,
    182 		[NVMM_X64_CR_CR3] = 0x00000000,
    183 		[NVMM_X64_CR_CR4] = 0x00000000,
    184 		[NVMM_X64_CR_CR8] = 0x00000000,
    185 		[NVMM_X64_CR_XCR0] = 0x00000001,
    186 	},
    187 
    188 	.drs = {
    189 		[NVMM_X64_DR_DR0] = 0x00000000,
    190 		[NVMM_X64_DR_DR1] = 0x00000000,
    191 		[NVMM_X64_DR_DR2] = 0x00000000,
    192 		[NVMM_X64_DR_DR3] = 0x00000000,
    193 		[NVMM_X64_DR_DR6] = 0xFFFF0FF0,
    194 		[NVMM_X64_DR_DR7] = 0x00000400,
    195 	},
    196 
    197 	.msrs = {
    198 		[NVMM_X64_MSR_EFER] = 0x00000000,
    199 		[NVMM_X64_MSR_STAR] = 0x00000000,
    200 		[NVMM_X64_MSR_LSTAR] = 0x00000000,
    201 		[NVMM_X64_MSR_CSTAR] = 0x00000000,
    202 		[NVMM_X64_MSR_SFMASK] = 0x00000000,
    203 		[NVMM_X64_MSR_KERNELGSBASE] = 0x00000000,
    204 		[NVMM_X64_MSR_SYSENTER_CS] = 0x00000000,
    205 		[NVMM_X64_MSR_SYSENTER_ESP] = 0x00000000,
    206 		[NVMM_X64_MSR_SYSENTER_EIP] = 0x00000000,
    207 		[NVMM_X64_MSR_PAT] =
    208 		    PATENTRY(0, PAT_WB) | PATENTRY(1, PAT_WT) |
    209 		    PATENTRY(2, PAT_UCMINUS) | PATENTRY(3, PAT_UC) |
    210 		    PATENTRY(4, PAT_WB) | PATENTRY(5, PAT_WT) |
    211 		    PATENTRY(6, PAT_UCMINUS) | PATENTRY(7, PAT_UC),
    212 		[NVMM_X64_MSR_TSC] = 0,
    213 	},
    214 
    215 	.intr = {
    216 		.int_shadow = 0,
    217 		.int_window_exiting = 0,
    218 		.nmi_window_exiting = 0,
    219 		.evt_pending = 0,
    220 	},
    221 
    222 	.fpu = {
    223 		.fx_cw = 0x0040,
    224 		.fx_sw = 0x0000,
    225 		.fx_tw = 0x55,
    226 		.fx_zero = 0x55,
    227 		.fx_mxcsr = 0x1F80,
    228 	}
    229 };
    230 
    231 const struct nvmm_x86_cpuid_mask nvmm_cpuid_00000001 = {
    232 	.eax = ~0,
    233 	.ebx = ~0,
    234 	.ecx =
    235 	    CPUID2_SSE3 |
    236 	    CPUID2_PCLMULQDQ |
    237 	    /* CPUID2_DTES64 excluded */
    238 	    /* CPUID2_MONITOR excluded */
    239 	    /* CPUID2_DS_CPL excluded */
    240 	    /* CPUID2_VMX excluded */
    241 	    /* CPUID2_SMX excluded */
    242 	    /* CPUID2_EST excluded */
    243 	    /* CPUID2_TM2 excluded */
    244 	    CPUID2_SSSE3 |
    245 	    /* CPUID2_CNXTID excluded */
    246 	    /* CPUID2_SDBG excluded */
    247 	    CPUID2_FMA |
    248 	    CPUID2_CX16 |
    249 	    /* CPUID2_XTPR excluded */
    250 	    /* CPUID2_PDCM excluded */
    251 	    /* CPUID2_PCID excluded, but re-included in VMX */
    252 	    /* CPUID2_DCA excluded */
    253 	    CPUID2_SSE41 |
    254 	    CPUID2_SSE42 |
    255 	    /* CPUID2_X2APIC excluded */
    256 	    CPUID2_MOVBE |
    257 	    CPUID2_POPCNT |
    258 	    /* CPUID2_DEADLINE excluded */
    259 	    CPUID2_AESNI |
    260 	    CPUID2_XSAVE |
    261 	    CPUID2_OSXSAVE |
    262 	    /* CPUID2_AVX excluded */
    263 	    CPUID2_F16C |
    264 	    CPUID2_RDRAND,
    265 	    /* CPUID2_RAZ excluded */
    266 	.edx =
    267 	    CPUID_FPU |
    268 	    CPUID_VME |
    269 	    CPUID_DE |
    270 	    CPUID_PSE |
    271 	    CPUID_TSC |
    272 	    CPUID_MSR |
    273 	    CPUID_PAE |
    274 	    /* CPUID_MCE excluded */
    275 	    CPUID_CX8 |
    276 	    CPUID_APIC |
    277 	    CPUID_SEP |
    278 	    /* CPUID_MTRR excluded */
    279 	    CPUID_PGE |
    280 	    /* CPUID_MCA excluded */
    281 	    CPUID_CMOV |
    282 	    CPUID_PAT |
    283 	    CPUID_PSE36 |
    284 	    /* CPUID_PSN excluded */
    285 	    CPUID_CLFSH |
    286 	    /* CPUID_DS excluded */
    287 	    /* CPUID_ACPI excluded */
    288 	    CPUID_MMX |
    289 	    CPUID_FXSR |
    290 	    CPUID_SSE |
    291 	    CPUID_SSE2 |
    292 	    CPUID_SS |
    293 	    CPUID_HTT |
    294 	    /* CPUID_TM excluded */
    295 	    CPUID_PBE
    296 };
    297 
    298 const struct nvmm_x86_cpuid_mask nvmm_cpuid_00000007 = {
    299 	.eax = ~0,
    300 	.ebx =
    301 	    CPUID_SEF_FSGSBASE |
    302 	    /* CPUID_SEF_TSC_ADJUST excluded */
    303 	    /* CPUID_SEF_SGX excluded */
    304 	    CPUID_SEF_BMI1 |
    305 	    /* CPUID_SEF_HLE excluded */
    306 	    /* CPUID_SEF_AVX2 excluded */
    307 	    CPUID_SEF_FDPEXONLY |
    308 	    CPUID_SEF_SMEP |
    309 	    CPUID_SEF_BMI2 |
    310 	    CPUID_SEF_ERMS |
    311 	    /* CPUID_SEF_INVPCID excluded, but re-included in VMX */
    312 	    /* CPUID_SEF_RTM excluded */
    313 	    /* CPUID_SEF_QM excluded */
    314 	    CPUID_SEF_FPUCSDS |
    315 	    /* CPUID_SEF_MPX excluded */
    316 	    CPUID_SEF_PQE |
    317 	    /* CPUID_SEF_AVX512F excluded */
    318 	    /* CPUID_SEF_AVX512DQ excluded */
    319 	    CPUID_SEF_RDSEED |
    320 	    CPUID_SEF_ADX |
    321 	    CPUID_SEF_SMAP |
    322 	    /* CPUID_SEF_AVX512_IFMA excluded */
    323 	    CPUID_SEF_CLFLUSHOPT |
    324 	    CPUID_SEF_CLWB,
    325 	    /* CPUID_SEF_PT excluded */
    326 	    /* CPUID_SEF_AVX512PF excluded */
    327 	    /* CPUID_SEF_AVX512ER excluded */
    328 	    /* CPUID_SEF_AVX512CD excluded */
    329 	    /* CPUID_SEF_SHA excluded */
    330 	    /* CPUID_SEF_AVX512BW excluded */
    331 	    /* CPUID_SEF_AVX512VL excluded */
    332 	.ecx =
    333 	    CPUID_SEF_PREFETCHWT1 |
    334 	    /* CPUID_SEF_AVX512_VBMI excluded */
    335 	    CPUID_SEF_UMIP |
    336 	    /* CPUID_SEF_PKU excluded */
    337 	    /* CPUID_SEF_OSPKE excluded */
    338 	    /* CPUID_SEF_WAITPKG excluded */
    339 	    /* CPUID_SEF_AVX512_VBMI2 excluded */
    340 	    /* CPUID_SEF_CET_SS excluded */
    341 	    CPUID_SEF_GFNI |
    342 	    CPUID_SEF_VAES |
    343 	    CPUID_SEF_VPCLMULQDQ |
    344 	    /* CPUID_SEF_AVX512_VNNI excluded */
    345 	    /* CPUID_SEF_AVX512_BITALG excluded */
    346 	    /* CPUID_SEF_AVX512_VPOPCNTDQ excluded */
    347 	    /* CPUID_SEF_MAWAU excluded */
    348 	    /* CPUID_SEF_RDPID excluded */
    349 	    CPUID_SEF_CLDEMOTE |
    350 	    CPUID_SEF_MOVDIRI |
    351 	    CPUID_SEF_MOVDIR64B,
    352 	    /* CPUID_SEF_SGXLC excluded */
    353 	    /* CPUID_SEF_PKS excluded */
    354 	.edx =
    355 	    /* CPUID_SEF_AVX512_4VNNIW excluded */
    356 	    /* CPUID_SEF_AVX512_4FMAPS excluded */
    357 	    CPUID_SEF_FSREP_MOV |
    358 	    /* CPUID_SEF_AVX512_VP2INTERSECT excluded */
    359 	    /* CPUID_SEF_SRBDS_CTRL excluded */
    360 	    CPUID_SEF_MD_CLEAR |
    361 	    /* CPUID_SEF_TSX_FORCE_ABORT excluded */
    362 	    CPUID_SEF_SERIALIZE |
    363 	    /* CPUID_SEF_HYBRID excluded */
    364 	    /* CPUID_SEF_TSXLDTRK excluded */
    365 	    /* CPUID_SEF_CET_IBT excluded */
    366 	    /* CPUID_SEF_IBRS excluded */
    367 	    /* CPUID_SEF_STIBP excluded */
    368 	    /* CPUID_SEF_L1D_FLUSH excluded */
    369 	    CPUID_SEF_ARCH_CAP
    370 	    /* CPUID_SEF_CORE_CAP excluded */
    371 	    /* CPUID_SEF_SSBD excluded */
    372 };
    373 
    374 const struct nvmm_x86_cpuid_mask nvmm_cpuid_80000001 = {
    375 	.eax = ~0,
    376 	.ebx = ~0,
    377 	.ecx =
    378 	    CPUID_LAHF |
    379 	    CPUID_CMPLEGACY |
    380 	    /* CPUID_SVM excluded */
    381 	    /* CPUID_EAPIC excluded */
    382 	    CPUID_ALTMOVCR0 |
    383 	    CPUID_ABM |
    384 	    CPUID_SSE4A |
    385 	    CPUID_MISALIGNSSE |
    386 	    CPUID_3DNOWPF |
    387 	    /* CPUID_OSVW excluded */
    388 	    /* CPUID_IBS excluded */
    389 	    CPUID_XOP |
    390 	    /* CPUID_SKINIT excluded */
    391 	    /* CPUID_WDT excluded */
    392 	    /* CPUID_LWP excluded */
    393 	    CPUID_FMA4 |
    394 	    CPUID_TCE |
    395 	    /* CPUID_NODEID excluded */
    396 	    CPUID_TBM |
    397 	    CPUID_TOPOEXT,
    398 	    /* CPUID_PCEC excluded */
    399 	    /* CPUID_PCENB excluded */
    400 	    /* CPUID_SPM excluded */
    401 	    /* CPUID_DBE excluded */
    402 	    /* CPUID_PTSC excluded */
    403 	    /* CPUID_L2IPERFC excluded */
    404 	    /* CPUID_MWAITX excluded */
    405 	.edx =
    406 	    CPUID_SYSCALL |
    407 	    CPUID_MPC |
    408 	    CPUID_XD |
    409 	    CPUID_MMXX |
    410 	    CPUID_MMX |
    411 	    CPUID_FXSR |
    412 	    CPUID_FFXSR |
    413 	    CPUID_PAGE1GB |
    414 	    /* CPUID_RDTSCP excluded */
    415 	    CPUID_EM64T |
    416 	    CPUID_3DNOW2 |
    417 	    CPUID_3DNOW
    418 };
    419 
    420 const struct nvmm_x86_cpuid_mask nvmm_cpuid_80000007 = {
    421 	.eax = 0,
    422 	.ebx = 0,
    423 	.ecx = 0,
    424 	.edx = CPUID_APM_ITSC
    425 };
    426 
    427 const struct nvmm_x86_cpuid_mask nvmm_cpuid_80000008 = {
    428 	.eax = ~0,
    429 	.ebx =
    430 	    CPUID_CAPEX_CLZERO |
    431 	    /* CPUID_CAPEX_IRPERF excluded */
    432 	    CPUID_CAPEX_XSAVEERPTR |
    433 	    /* CPUID_CAPEX_RDPRU excluded */
    434 	    /* CPUID_CAPEX_MCOMMIT excluded */
    435 	    CPUID_CAPEX_WBNOINVD,
    436 	.ecx = ~0, /* TODO? */
    437 	.edx = 0
    438 };
    439 
    440 bool
    441 nvmm_x86_pat_validate(uint64_t val)
    442 {
    443 	uint8_t *pat = (uint8_t *)&val;
    444 	size_t i;
    445 
    446 	for (i = 0; i < 8; i++) {
    447 		if (__predict_false(pat[i] & ~__BITS(2,0)))
    448 			return false;
    449 		if (__predict_false(pat[i] == 2 || pat[i] == 3))
    450 			return false;
    451 	}
    452 
    453 	return true;
    454 }
    455