cpu.h revision 1.45 1 /* $NetBSD: cpu.h,v 1.45 2011/12/30 17:57:49 cherry Exp $ */
2
3 /*-
4 * Copyright (c) 1990 The Regents of the University of California.
5 * All rights reserved.
6 *
7 * This code is derived from software contributed to Berkeley by
8 * William Jolitz.
9 *
10 * Redistribution and use in source and binary forms, with or without
11 * modification, are permitted provided that the following conditions
12 * are met:
13 * 1. Redistributions of source code must retain the above copyright
14 * notice, this list of conditions and the following disclaimer.
15 * 2. Redistributions in binary form must reproduce the above copyright
16 * notice, this list of conditions and the following disclaimer in the
17 * documentation and/or other materials provided with the distribution.
18 * 3. Neither the name of the University nor the names of its contributors
19 * may be used to endorse or promote products derived from this software
20 * without specific prior written permission.
21 *
22 * THIS SOFTWARE IS PROVIDED BY THE REGENTS AND CONTRIBUTORS ``AS IS'' AND
23 * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
24 * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
25 * ARE DISCLAIMED. IN NO EVENT SHALL THE REGENTS OR CONTRIBUTORS BE LIABLE
26 * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
27 * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
28 * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
29 * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
30 * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
31 * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
32 * SUCH DAMAGE.
33 *
34 * @(#)cpu.h 5.4 (Berkeley) 5/9/91
35 */
36
37 #ifndef _X86_CPU_H_
38 #define _X86_CPU_H_
39
40 #if defined(_KERNEL) || defined(_STANDALONE)
41 #include <sys/types.h>
42 #else
43 #include <stdbool.h>
44 #endif /* _KERNEL || _STANDALONE */
45
46 #if defined(_KERNEL) || defined(_KMEMUSER)
47 #if defined(_KERNEL_OPT)
48 #include "opt_xen.h"
49 #ifdef i386
50 #include "opt_user_ldt.h"
51 #include "opt_vm86.h"
52 #endif
53 #endif
54
55 /*
56 * Definitions unique to x86 cpu support.
57 */
58 #include <machine/frame.h>
59 #include <machine/pte.h>
60 #include <machine/segments.h>
61 #include <machine/tss.h>
62 #include <machine/intrdefs.h>
63
64 #include <x86/cacheinfo.h>
65
66 #include <sys/cpu_data.h>
67 #include <sys/evcnt.h>
68 #include <sys/device_if.h> /* for device_t */
69
70 #ifdef XEN
71 #include <xen/xen-public/xen.h>
72 #include <xen/xen-public/event_channel.h>
73 #endif /* XEN */
74
75 struct intrsource;
76 struct pmap;
77 struct device;
78
79 #ifdef __x86_64__
80 #define i386tss x86_64_tss
81 #endif
82
83 #define NIOPORTS 1024 /* # of ports we allow to be mapped */
84 #define IOMAPSIZE (NIOPORTS / 8) /* I/O bitmap size in bytes */
85
86 /*
87 * a bunch of this belongs in cpuvar.h; move it later..
88 */
89
90 struct cpu_info {
91 struct cpu_data ci_data; /* MI per-cpu data */
92 device_t ci_dev; /* pointer to our device */
93 struct cpu_info *ci_self; /* self-pointer */
94 volatile struct vcpu_info *ci_vcpu; /* for XEN */
95 void *ci_tlog_base; /* Trap log base */
96 int32_t ci_tlog_offset; /* Trap log current offset */
97
98 /*
99 * Will be accessed by other CPUs.
100 */
101 struct cpu_info *ci_next; /* next cpu */
102 struct lwp *ci_curlwp; /* current owner of the processor */
103 struct lwp *ci_fpcurlwp; /* current owner of the FPU */
104 int ci_fpsaving; /* save in progress */
105 int ci_fpused; /* XEN: FPU was used by curlwp */
106 cpuid_t ci_cpuid; /* our CPU ID */
107 int ci_cpumask; /* (1 << CPU ID) */
108 uint32_t ci_acpiid; /* our ACPI/MADT ID */
109 uint32_t ci_initapicid; /* our intitial APIC ID */
110
111 /*
112 * Private members.
113 */
114 struct evcnt ci_tlb_evcnt; /* tlb shootdown counter */
115 struct pmap *ci_pmap; /* current pmap */
116 int ci_need_tlbwait; /* need to wait for TLB invalidations */
117 int ci_want_pmapload; /* pmap_load() is needed */
118 volatile int ci_tlbstate; /* one of TLBSTATE_ states. see below */
119 #define TLBSTATE_VALID 0 /* all user tlbs are valid */
120 #define TLBSTATE_LAZY 1 /* tlbs are valid but won't be kept uptodate */
121 #define TLBSTATE_STALE 2 /* we might have stale user tlbs */
122 int ci_curldt; /* current LDT descriptor */
123 int ci_nintrhand; /* number of H/W interrupt handlers */
124 uint64_t ci_scratch;
125 uintptr_t ci_pmap_data[128 / sizeof(uintptr_t)];
126
127 #ifdef XEN
128 struct iplsource *ci_isources[NIPL];
129 u_long ci_evtmask[NR_EVENT_CHANNELS]; /* events allowed on this CPU */
130 #else
131 struct intrsource *ci_isources[MAX_INTR_SOURCES];
132 #endif
133 volatile int ci_mtx_count; /* Negative count of spin mutexes */
134 volatile int ci_mtx_oldspl; /* Old SPL at this ci_idepth */
135
136 /* The following must be aligned for cmpxchg8b. */
137 struct {
138 uint32_t ipending;
139 int ilevel;
140 } ci_istate __aligned(8);
141 #define ci_ipending ci_istate.ipending
142 #define ci_ilevel ci_istate.ilevel
143
144 int ci_idepth;
145 void * ci_intrstack;
146 uint32_t ci_imask[NIPL];
147 uint32_t ci_iunmask[NIPL];
148
149 uint32_t ci_flags; /* flags; see below */
150 uint32_t ci_ipis; /* interprocessor interrupts pending */
151 uint32_t sc_apic_version; /* local APIC version */
152
153 uint32_t ci_signature; /* X86 cpuid type */
154 uint32_t ci_vendor[4]; /* vendor string */
155 uint32_t ci_cpu_serial[3]; /* PIII serial number */
156 volatile uint32_t ci_lapic_counter;
157
158 uint32_t ci_feat_val[5]; /* X86 CPUID feature bits
159 * [0] basic features %edx
160 * [1] basic features %ecx
161 * [2] extended features %edx
162 * [3] extended features %ecx
163 * [4] VIA padlock features
164 */
165
166 const struct cpu_functions *ci_func; /* start/stop functions */
167 struct trapframe *ci_ddb_regs;
168
169 u_int ci_cflush_lsize; /* CFLUSH insn line size */
170 struct x86_cache_info ci_cinfo[CAI_COUNT];
171
172 union descriptor *ci_gdt;
173
174 #ifdef i386
175 struct i386tss ci_doubleflt_tss;
176 struct i386tss ci_ddbipi_tss;
177 #endif
178
179 #ifdef PAE
180 uint32_t ci_pae_l3_pdirpa; /* PA of L3 PD */
181 pd_entry_t * ci_pae_l3_pdir; /* VA pointer to L3 PD */
182 #endif
183
184 #if defined(XEN) && (defined(PAE) || defined(__x86_64__))
185 /* Currently active user PGD (can't use rcr3() with Xen) */
186 pd_entry_t * ci_kpm_pdir; /* per-cpu PMD (va) */
187 paddr_t ci_kpm_pdirpa; /* per-cpu PMD (pa) */
188 #if defined(__x86_64__)
189 paddr_t ci_xen_current_user_pgd;
190 #endif /* __x86_64__ */
191 #endif /* XEN et.al */
192
193
194 char *ci_doubleflt_stack;
195 char *ci_ddbipi_stack;
196
197 #ifndef XEN
198 struct evcnt ci_ipi_events[X86_NIPI];
199 #else /* XEN */
200 struct evcnt ci_ipi_events[XEN_NIPIS];
201 evtchn_port_t ci_ipi_evtchn;
202 #endif /* XEN */
203
204 device_t ci_frequency; /* Frequency scaling technology */
205 device_t ci_padlock; /* VIA PadLock private storage */
206 device_t ci_temperature; /* Intel coretemp(4) or equivalent */
207 device_t ci_vm; /* Virtual machine guest driver */
208
209 struct i386tss ci_tss; /* Per-cpu TSS; shared among LWPs */
210 char ci_iomap[IOMAPSIZE]; /* I/O Bitmap */
211 int ci_tss_sel; /* TSS selector of this cpu */
212
213 /*
214 * The following two are actually region_descriptors,
215 * but that would pollute the namespace.
216 */
217 uintptr_t ci_suspend_gdt;
218 uint16_t ci_suspend_gdt_padding;
219 uintptr_t ci_suspend_idt;
220 uint16_t ci_suspend_idt_padding;
221
222 uint16_t ci_suspend_tr;
223 uint16_t ci_suspend_ldt;
224 uintptr_t ci_suspend_fs;
225 uintptr_t ci_suspend_gs;
226 uintptr_t ci_suspend_kgs;
227 uintptr_t ci_suspend_efer;
228 uintptr_t ci_suspend_reg[12];
229 uintptr_t ci_suspend_cr0;
230 uintptr_t ci_suspend_cr2;
231 uintptr_t ci_suspend_cr3;
232 uintptr_t ci_suspend_cr4;
233 uintptr_t ci_suspend_cr8;
234
235 /* The following must be in a single cache line. */
236 int ci_want_resched __aligned(64);
237 int ci_padout __aligned(64);
238 };
239
240 /*
241 * Macros to handle (some) trapframe registers for common x86 code.
242 */
243 #ifdef __x86_64__
244 #define X86_TF_RAX(tf) tf->tf_rax
245 #define X86_TF_RDX(tf) tf->tf_rdx
246 #define X86_TF_RSP(tf) tf->tf_rsp
247 #define X86_TF_RIP(tf) tf->tf_rip
248 #define X86_TF_RFLAGS(tf) tf->tf_rflags
249 #else
250 #define X86_TF_RAX(tf) tf->tf_eax
251 #define X86_TF_RDX(tf) tf->tf_edx
252 #define X86_TF_RSP(tf) tf->tf_esp
253 #define X86_TF_RIP(tf) tf->tf_eip
254 #define X86_TF_RFLAGS(tf) tf->tf_eflags
255 #endif
256
257 /*
258 * Processor flag notes: The "primary" CPU has certain MI-defined
259 * roles (mostly relating to hardclock handling); we distinguish
260 * betwen the processor which booted us, and the processor currently
261 * holding the "primary" role just to give us the flexibility later to
262 * change primaries should we be sufficiently twisted.
263 */
264
265 #define CPUF_BSP 0x0001 /* CPU is the original BSP */
266 #define CPUF_AP 0x0002 /* CPU is an AP */
267 #define CPUF_SP 0x0004 /* CPU is only processor */
268 #define CPUF_PRIMARY 0x0008 /* CPU is active primary processor */
269
270 #define CPUF_SYNCTSC 0x0800 /* Synchronize TSC */
271 #define CPUF_PRESENT 0x1000 /* CPU is present */
272 #define CPUF_RUNNING 0x2000 /* CPU is running */
273 #define CPUF_PAUSE 0x4000 /* CPU is paused in DDB */
274 #define CPUF_GO 0x8000 /* CPU should start running */
275
276 #endif /* _KERNEL || __KMEMUSER */
277
278 #ifdef _KERNEL
279 /*
280 * We statically allocate the CPU info for the primary CPU (or,
281 * the only CPU on uniprocessors), and the primary CPU is the
282 * first CPU on the CPU info list.
283 */
284 extern struct cpu_info cpu_info_primary;
285 extern struct cpu_info *cpu_info_list;
286
287 #define CPU_INFO_ITERATOR int
288 #define CPU_INFO_FOREACH(cii, ci) cii = 0, ci = cpu_info_list; \
289 ci != NULL; ci = ci->ci_next
290
291 #define CPU_STARTUP(_ci, _target) ((_ci)->ci_func->start(_ci, _target))
292 #define CPU_STOP(_ci) ((_ci)->ci_func->stop(_ci))
293 #define CPU_START_CLEANUP(_ci) ((_ci)->ci_func->cleanup(_ci))
294
295 #if !defined(__GNUC__) || defined(_MODULE)
296 /* For non-GCC and modules */
297 struct cpu_info *x86_curcpu(void);
298 void cpu_set_curpri(int);
299 # ifdef __GNUC__
300 lwp_t *x86_curlwp(void) __attribute__ ((const));
301 # else
302 lwp_t *x86_curlwp(void);
303 # endif
304 #endif
305
306 #define cpu_number() (cpu_index(curcpu()))
307
308 #define CPU_IS_PRIMARY(ci) ((ci)->ci_flags & CPUF_PRIMARY)
309
310 #define X86_AST_GENERIC 0x01
311 #define X86_AST_PREEMPT 0x02
312
313 #define aston(l, why) ((l)->l_md.md_astpending |= (why))
314 #define cpu_did_resched(l) ((l)->l_md.md_astpending &= ~X86_AST_PREEMPT)
315
316 void cpu_boot_secondary_processors(void);
317 void cpu_init_idle_lwps(void);
318 void cpu_init_msrs(struct cpu_info *, bool);
319 void cpu_load_pmap(struct pmap *);
320 void cpu_broadcast_halt(void);
321 void cpu_kick(struct cpu_info *);
322
323 extern uint32_t cpus_attached;
324
325 #define curcpu() x86_curcpu()
326 #define curlwp x86_curlwp()
327 #define curpcb ((struct pcb *)lwp_getpcb(curlwp))
328
329 /*
330 * Arguments to hardclock, softclock and statclock
331 * encapsulate the previous machine state in an opaque
332 * clockframe; for now, use generic intrframe.
333 */
334 struct clockframe {
335 struct intrframe cf_if;
336 };
337
338 /*
339 * Give a profiling tick to the current process when the user profiling
340 * buffer pages are invalid. On the i386, request an ast to send us
341 * through trap(), marking the proc as needing a profiling tick.
342 */
343 extern void cpu_need_proftick(struct lwp *l);
344
345 /*
346 * Notify the LWP l that it has a signal pending, process as soon as
347 * possible.
348 */
349 extern void cpu_signotify(struct lwp *);
350
351 /*
352 * We need a machine-independent name for this.
353 */
354 extern void (*delay_func)(unsigned int);
355 struct timeval;
356
357 #define DELAY(x) (*delay_func)(x)
358 #define delay(x) (*delay_func)(x)
359
360 extern int biosbasemem;
361 extern int biosextmem;
362 extern int cpu;
363 extern int cpuid_level;
364 extern int cpu_class;
365 extern char cpu_brand_string[];
366 extern int use_pae;
367
368 extern int i386_use_fxsave;
369 extern int i386_has_sse;
370 extern int i386_has_sse2;
371
372 extern void (*x86_cpu_idle)(void);
373 #define cpu_idle() (*x86_cpu_idle)()
374
375 /* machdep.c */
376 void dumpconf(void);
377 void cpu_reset(void);
378 void i386_proc0_tss_ldt_init(void);
379 void dumpconf(void);
380 void cpu_reset(void);
381 void x86_64_proc0_tss_ldt_init(void);
382 void x86_64_init_pcb_tss_ldt(struct cpu_info *);
383
384 /* longrun.c */
385 u_int tmx86_get_longrun_mode(void);
386 void tmx86_get_longrun_status(u_int *, u_int *, u_int *);
387 void tmx86_init_longrun(void);
388
389 /* identcpu.c */
390 void cpu_probe(struct cpu_info *);
391 void cpu_identify(struct cpu_info *);
392
393 /* cpu_topology.c */
394 void x86_cpu_topology(struct cpu_info *);
395
396 /* vm_machdep.c */
397 void cpu_proc_fork(struct proc *, struct proc *);
398
399 /* locore.s */
400 struct region_descriptor;
401 void lgdt(struct region_descriptor *);
402 #ifdef XEN
403 void lgdt_finish(void);
404 void i386_switch_context(lwp_t *);
405 #endif
406
407 struct pcb;
408 void savectx(struct pcb *);
409 void lwp_trampoline(void);
410 void child_trampoline(void);
411 #ifdef XEN
412 void startrtclock(void);
413 void xen_delay(unsigned int);
414 void xen_initclocks(void);
415 void xen_suspendclocks(void);
416 void xen_resumeclocks(void);
417 #else
418 /* clock.c */
419 void initrtclock(u_long);
420 void startrtclock(void);
421 void i8254_delay(unsigned int);
422 void i8254_microtime(struct timeval *);
423 void i8254_initclocks(void);
424 #endif
425
426 /* cpu.c */
427
428 void cpu_probe_features(struct cpu_info *);
429
430 /* npx.c */
431 void npxsave_lwp(struct lwp *, bool);
432 void npxsave_cpu(bool);
433
434 /* vm_machdep.c */
435 paddr_t kvtop(void *);
436
437 #ifdef USER_LDT
438 /* sys_machdep.h */
439 int x86_get_ldt(struct lwp *, void *, register_t *);
440 int x86_set_ldt(struct lwp *, void *, register_t *);
441 #endif
442
443 /* isa_machdep.c */
444 void isa_defaultirq(void);
445 int isa_nmi(void);
446
447 #ifdef VM86
448 /* vm86.c */
449 void vm86_gpfault(struct lwp *, int);
450 #endif /* VM86 */
451
452 /* consinit.c */
453 void kgdb_port_init(void);
454
455 /* bus_machdep.c */
456 void x86_bus_space_init(void);
457 void x86_bus_space_mallocok(void);
458
459 #endif /* _KERNEL */
460
461 #if defined(_KERNEL) || defined(_KMEMUSER)
462 #include <machine/psl.h> /* Must be after struct cpu_info declaration */
463 #endif /* _KERNEL || __KMEMUSER */
464
465 /*
466 * CTL_MACHDEP definitions.
467 */
468 #define CPU_CONSDEV 1 /* dev_t: console terminal device */
469 #define CPU_BIOSBASEMEM 2 /* int: bios-reported base mem (K) */
470 #define CPU_BIOSEXTMEM 3 /* int: bios-reported ext. mem (K) */
471 /* CPU_NKPDE 4 obsolete: int: number of kernel PDEs */
472 #define CPU_BOOTED_KERNEL 5 /* string: booted kernel name */
473 #define CPU_DISKINFO 6 /* struct disklist *:
474 * disk geometry information */
475 #define CPU_FPU_PRESENT 7 /* int: FPU is present */
476 #define CPU_OSFXSR 8 /* int: OS uses FXSAVE/FXRSTOR */
477 #define CPU_SSE 9 /* int: OS/CPU supports SSE */
478 #define CPU_SSE2 10 /* int: OS/CPU supports SSE2 */
479 #define CPU_TMLR_MODE 11 /* int: longrun mode
480 * 0: minimum frequency
481 * 1: economy
482 * 2: performance
483 * 3: maximum frequency
484 */
485 #define CPU_TMLR_FREQUENCY 12 /* int: current frequency */
486 #define CPU_TMLR_VOLTAGE 13 /* int: curret voltage */
487 #define CPU_TMLR_PERCENTAGE 14 /* int: current clock percentage */
488 #define CPU_MAXID 15 /* number of valid machdep ids */
489
490 /*
491 * Structure for CPU_DISKINFO sysctl call.
492 * XXX this should be somewhere else.
493 */
494 #define MAX_BIOSDISKS 16
495
496 struct disklist {
497 int dl_nbiosdisks; /* number of bios disks */
498 struct biosdisk_info {
499 int bi_dev; /* BIOS device # (0x80 ..) */
500 int bi_cyl; /* cylinders on disk */
501 int bi_head; /* heads per track */
502 int bi_sec; /* sectors per track */
503 uint64_t bi_lbasecs; /* total sec. (iff ext13) */
504 #define BIFLAG_INVALID 0x01
505 #define BIFLAG_EXTINT13 0x02
506 int bi_flags;
507 } dl_biosdisks[MAX_BIOSDISKS];
508
509 int dl_nnativedisks; /* number of native disks */
510 struct nativedisk_info {
511 char ni_devname[16]; /* native device name */
512 int ni_nmatches; /* # of matches w/ BIOS */
513 int ni_biosmatches[MAX_BIOSDISKS]; /* indices in dl_biosdisks */
514 } dl_nativedisks[1]; /* actually longer */
515 };
516 #endif /* !_X86_CPU_H_ */
517