tprof_x86.c revision 1.12 1 1.12 msaitoh /* $NetBSD: tprof_x86.c,v 1.12 2022/06/13 09:28:58 msaitoh Exp $ */
2 1.1 maxv
3 1.1 maxv /*
4 1.8 maxv * Copyright (c) 2018-2019 The NetBSD Foundation, Inc.
5 1.1 maxv * All rights reserved.
6 1.1 maxv *
7 1.1 maxv * This code is derived from software contributed to The NetBSD Foundation
8 1.1 maxv * by Maxime Villard.
9 1.1 maxv *
10 1.1 maxv * Redistribution and use in source and binary forms, with or without
11 1.1 maxv * modification, are permitted provided that the following conditions
12 1.1 maxv * are met:
13 1.1 maxv * 1. Redistributions of source code must retain the above copyright
14 1.1 maxv * notice, this list of conditions and the following disclaimer.
15 1.1 maxv * 2. Redistributions in binary form must reproduce the above copyright
16 1.1 maxv * notice, this list of conditions and the following disclaimer in the
17 1.1 maxv * documentation and/or other materials provided with the distribution.
18 1.1 maxv *
19 1.1 maxv * THIS SOFTWARE IS PROVIDED BY THE NETBSD FOUNDATION, INC. AND CONTRIBUTORS
20 1.1 maxv * ``AS IS'' AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED
21 1.1 maxv * TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR
22 1.1 maxv * PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE FOUNDATION OR CONTRIBUTORS
23 1.1 maxv * BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
24 1.1 maxv * CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
25 1.1 maxv * SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS
26 1.1 maxv * INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN
27 1.1 maxv * CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE)
28 1.1 maxv * ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE
29 1.1 maxv * POSSIBILITY OF SUCH DAMAGE.
30 1.1 maxv */
31 1.1 maxv
32 1.1 maxv #include <sys/cdefs.h>
33 1.1 maxv #include <stdio.h>
34 1.1 maxv #include <stdlib.h>
35 1.1 maxv #include <stdbool.h>
36 1.1 maxv #include <string.h>
37 1.1 maxv #include <unistd.h>
38 1.1 maxv #include <err.h>
39 1.1 maxv #include <machine/specialreg.h>
40 1.1 maxv #include <dev/tprof/tprof_ioctl.h>
41 1.1 maxv #include "../tprof.h"
42 1.1 maxv
43 1.1 maxv int tprof_event_init(uint32_t);
44 1.1 maxv void tprof_event_list(void);
45 1.1 maxv void tprof_event_lookup(const char *, struct tprof_param *);
46 1.1 maxv
47 1.1 maxv struct name_to_event {
48 1.1 maxv const char *name;
49 1.1 maxv uint64_t event;
50 1.1 maxv uint64_t unit;
51 1.1 maxv bool enabled;
52 1.1 maxv };
53 1.1 maxv
54 1.1 maxv struct event_table {
55 1.1 maxv const char *tablename;
56 1.1 maxv struct name_to_event *names;
57 1.1 maxv size_t nevents;
58 1.1 maxv struct event_table *next;
59 1.1 maxv };
60 1.1 maxv
61 1.1 maxv static struct event_table *cpuevents = NULL;
62 1.1 maxv
63 1.1 maxv static void x86_cpuid(unsigned int *eax, unsigned int *ebx,
64 1.1 maxv unsigned int *ecx, unsigned int *edx)
65 1.1 maxv {
66 1.1 maxv asm volatile("cpuid"
67 1.1 maxv : "=a" (*eax),
68 1.1 maxv "=b" (*ebx),
69 1.1 maxv "=c" (*ecx),
70 1.1 maxv "=d" (*edx)
71 1.1 maxv : "0" (*eax), "2" (*ecx));
72 1.1 maxv }
73 1.1 maxv
74 1.1 maxv /* -------------------------------------------------------------------------- */
75 1.1 maxv
76 1.1 maxv /*
77 1.1 maxv * Intel Architectural Version 1.
78 1.1 maxv */
79 1.1 maxv static struct name_to_event intel_arch1_names[] = {
80 1.1 maxv /* Event Name - Event Select - UMask */
81 1.1 maxv { "unhalted-core-cycles", 0x3C, 0x00, true },
82 1.1 maxv { "instruction-retired", 0xC0, 0x00, true },
83 1.1 maxv { "unhalted-reference-cycles", 0x3C, 0x01, true },
84 1.1 maxv { "llc-reference", 0x2E, 0x4F, true },
85 1.1 maxv { "llc-misses", 0x2E, 0x41, true },
86 1.1 maxv { "branch-instruction-retired", 0xC4, 0x00, true },
87 1.1 maxv { "branch-misses-retired", 0xC5, 0x00, true },
88 1.11 msaitoh { "topdown-slots", 0xA4, 0x01, true },
89 1.1 maxv };
90 1.1 maxv
91 1.1 maxv static struct event_table intel_arch1 = {
92 1.1 maxv .tablename = "Intel Architectural Version 1",
93 1.1 maxv .names = intel_arch1_names,
94 1.1 maxv .nevents = sizeof(intel_arch1_names) /
95 1.1 maxv sizeof(struct name_to_event),
96 1.1 maxv .next = NULL
97 1.1 maxv };
98 1.1 maxv
99 1.1 maxv static struct event_table *
100 1.1 maxv init_intel_arch1(void)
101 1.1 maxv {
102 1.12 msaitoh unsigned int eax, ebx, ecx, edx, vectorlen;
103 1.1 maxv struct event_table *table;
104 1.1 maxv size_t i;
105 1.1 maxv
106 1.1 maxv eax = 0x0A;
107 1.1 maxv ebx = 0;
108 1.1 maxv ecx = 0;
109 1.1 maxv edx = 0;
110 1.1 maxv x86_cpuid(&eax, &ebx, &ecx, &edx);
111 1.1 maxv
112 1.12 msaitoh vectorlen = __SHIFTOUT(eax, CPUID_PERF_BVECLEN);
113 1.12 msaitoh
114 1.1 maxv table = &intel_arch1;
115 1.1 maxv for (i = 0; i < table->nevents; i++) {
116 1.12 msaitoh /*
117 1.12 msaitoh * Disable the unsupported events from:
118 1.12 msaitoh * a) the bit vector length in EAX.
119 1.12 msaitoh * b) the disable bit in EBX.
120 1.12 msaitoh */
121 1.12 msaitoh if (i >= vectorlen)
122 1.12 msaitoh table->names[i].enabled = false;
123 1.1 maxv if ((ebx & (i << 1)) != 0)
124 1.1 maxv table->names[i].enabled = false;
125 1.1 maxv }
126 1.1 maxv
127 1.1 maxv return table;
128 1.1 maxv }
129 1.1 maxv
130 1.1 maxv /*
131 1.5 knakahar * Intel Silvermont/Airmont.
132 1.5 knakahar */
133 1.5 knakahar static struct name_to_event intel_silvermont_airmont_names[] = {
134 1.5 knakahar { "REHABQ.LD_BLOCK_ST_FORWARD", 0x03, 0x01, true },
135 1.5 knakahar { "REHABQ.LD_BLOCK_STD_NOTREADY", 0x03, 0x02, true },
136 1.5 knakahar { "REHABQ.ST_SPLITS", 0x03, 0x04, true },
137 1.5 knakahar { "REHABQ.LD_SPLITS", 0x03, 0x08, true },
138 1.5 knakahar { "REHABQ.LOCK", 0x03, 0x10, true },
139 1.5 knakahar { "REHABQ.STA_FULL", 0x03, 0x20, true },
140 1.5 knakahar { "REHABQ.ANY_LD", 0x03, 0x40, true },
141 1.5 knakahar { "REHABQ.ANY_ST", 0x03, 0x80, true },
142 1.5 knakahar { "MEM_UOPS_RETIRED.L1_MISS_LOADS", 0x04, 0x01, true },
143 1.5 knakahar { "MEM_UOPS_RETIRED.L2_HIT_LOADS", 0x04, 0x02, true },
144 1.5 knakahar { "MEM_UOPS_RETIRED.L2_MISS_LOADS", 0x04, 0x04, true },
145 1.5 knakahar { "MEM_UOPS_RETIRED.DTLB_MISS_LOADS", 0x04, 0x08, true },
146 1.5 knakahar { "MEM_UOPS_RETIRED.UTLB_MISS", 0x04, 0x10, true },
147 1.5 knakahar { "MEM_UOPS_RETIRED.HITM", 0x04, 0x20, true },
148 1.5 knakahar { "MEM_UOPS_RETIRED.ALL_LOADS", 0x04, 0x40, true },
149 1.5 knakahar { "MEM_UOP_RETIRED.ALL_STORES", 0x04, 0x80, true },
150 1.5 knakahar { "PAGE_WALKS.D_SIDE_CYCLES", 0x05, 0x01, true },
151 1.5 knakahar { "PAGE_WALKS.I_SIDE_CYCLES", 0x05, 0x02, true },
152 1.5 knakahar { "PAGE_WALKS.WALKS", 0x05, 0x03, true },
153 1.5 knakahar { "LONGEST_LAT_CACHE.MISS", 0x2E, 0x41, true },
154 1.5 knakahar { "LONGEST_LAT_CACHE.REFERENCE", 0x2E, 0x4F, true },
155 1.5 knakahar { "L2_REJECT_XQ.ALL", 0x30, 0x00, true },
156 1.5 knakahar { "CORE_REJECT_L2Q.ALL", 0x31, 0x00, true },
157 1.5 knakahar { "CPU_CLK_UNHALTED.CORE_P", 0x3C, 0x00, true },
158 1.5 knakahar { "CPU_CLK_UNHALTED.REF_P", 0x3C, 0x01, true },
159 1.5 knakahar { "ICACHE.HIT", 0x80, 0x01, true },
160 1.5 knakahar { "ICACHE.MISSES", 0x80, 0x02, true },
161 1.5 knakahar { "ICACHE.ACCESSES", 0x80, 0x03, true },
162 1.5 knakahar { "OFFCORE_RESPONSE_0", 0xB7, 0x01, true },
163 1.5 knakahar { "OFFCORE_RESPONSE_1", 0xB7, 0x02, true },
164 1.5 knakahar { "INST_RETIRED.ANY_P", 0xC0, 0x00, true },
165 1.5 knakahar { "UOPS_RETIRED.MS", 0xC2, 0x01, true },
166 1.5 knakahar { "UOPS_RETIRED.ALL", 0xC2, 0x10, true },
167 1.5 knakahar { "MACHINE_CLEARS.SMC", 0xC3, 0x01, true },
168 1.5 knakahar { "MACHINE_CLEARS.MEMORY_ORDERING", 0xC3, 0x02, true },
169 1.5 knakahar { "MACHINE_CLEARS.FP_ASSIST", 0xC3, 0x04, true },
170 1.5 knakahar { "MACHINE_CLEARS.ALL", 0xC3, 0x08, true },
171 1.5 knakahar { "BR_INST_RETIRED.ALL_BRANCHES", 0xC4, 0x00, true },
172 1.5 knakahar { "BR_INST_RETIRED.JCC", 0xC4, 0x7E, true },
173 1.5 knakahar { "BR_INST_RETIRED.FAR_BRANCH", 0xC4, 0xBF, true },
174 1.5 knakahar { "BR_INST_RETIRED.NON_RETURN_IND", 0xC4, 0xEB, true },
175 1.5 knakahar { "BR_INST_RETIRED.RETURN", 0xC4, 0xF7, true },
176 1.5 knakahar { "BR_INST_RETIRED.CALL", 0xC4, 0xF9, true },
177 1.5 knakahar { "BR_INST_RETIRED.IND_CALL", 0xC4, 0xFB, true },
178 1.5 knakahar { "BR_INST_RETIRED.REL_CALL", 0xC4, 0xFD, true },
179 1.5 knakahar { "BR_INST_RETIRED.TAKEN_JCC", 0xC4, 0xFE, true },
180 1.5 knakahar { "BR_MISP_RETIRED.ALL_BRANCHES", 0xC5, 0x00, true },
181 1.5 knakahar { "BR_MISP_RETIRED.JCC", 0xC5, 0x7E, true },
182 1.5 knakahar { "BR_MISP_RETIRED.FAR", 0xC5, 0xBF, true },
183 1.5 knakahar { "BR_MISP_RETIRED.NON_RETURN_IND", 0xC5, 0xEB, true },
184 1.5 knakahar { "BR_MISP_RETIRED.RETURN", 0xC5, 0xF7, true },
185 1.5 knakahar { "BR_MISP_RETIRED.CALL", 0xC5, 0xF9, true },
186 1.5 knakahar { "BR_MISP_RETIRED.IND_CALL", 0xC5, 0xFB, true },
187 1.5 knakahar { "BR_MISP_RETIRED.REL_CALL", 0xC5, 0xFD, true },
188 1.5 knakahar { "BR_MISP_RETIRED.TAKEN_JCC", 0xC5, 0xFE, true },
189 1.5 knakahar { "NO_ALLOC_CYCLES.ROB_FULL", 0xCA, 0x01, true },
190 1.5 knakahar { "NO_ALLOC_CYCLES.RAT_STALL", 0xCA, 0x20, true },
191 1.5 knakahar { "NO_ALLOC_CYCLES.ALL", 0xCA, 0x3F, true },
192 1.5 knakahar { "NO_ALLOC_CYCLES.NOT_DELIVERED", 0xCA, 0x50, true },
193 1.5 knakahar { "RS_FULL_STALL.MEC", 0xCB, 0x01, true },
194 1.5 knakahar { "RS_FULL_STALL.ALL", 0xCB, 0x1F, true },
195 1.5 knakahar { "CYCLES_DIV_BUSY.ANY", 0xCD, 0x01, true },
196 1.5 knakahar { "BACLEARS.ALL", 0xE6, 0x01, true },
197 1.5 knakahar { "BACLEARS.RETURN", 0xE6, 0x08, true },
198 1.5 knakahar { "BACLEARS.COND", 0xE6, 0x10, true },
199 1.5 knakahar { "MS_DECODED.MS_ENTRY", 0xE7, 0x01, true },
200 1.5 knakahar };
201 1.5 knakahar
202 1.5 knakahar static struct event_table intel_silvermont_airmont = {
203 1.5 knakahar .tablename = "Intel Silvermont/Airmont",
204 1.5 knakahar .names = intel_silvermont_airmont_names,
205 1.5 knakahar .nevents = sizeof(intel_silvermont_airmont_names) /
206 1.5 knakahar sizeof(struct name_to_event),
207 1.5 knakahar .next = NULL
208 1.5 knakahar };
209 1.5 knakahar
210 1.5 knakahar static struct event_table *
211 1.5 knakahar init_intel_silvermont_airmont(void)
212 1.5 knakahar {
213 1.5 knakahar
214 1.5 knakahar return &intel_silvermont_airmont;
215 1.5 knakahar }
216 1.5 knakahar
217 1.5 knakahar /*
218 1.6 knakahar * Intel Goldmont
219 1.6 knakahar */
220 1.6 knakahar static struct name_to_event intel_goldmont_names[] = {
221 1.6 knakahar { "LD_BLOCKS.ALL_BLOCK", 0x03, 0x10, true },
222 1.6 knakahar { "LD_BLOCKS.UTLB_MISS", 0x03, 0x08, true },
223 1.6 knakahar { "LD_BLOCKS.STORE_FORWARD", 0x03, 0x02, true },
224 1.6 knakahar { "LD_BLOCKS.DATA_UNKNOWN", 0x03, 0x01, true },
225 1.6 knakahar { "LD_BLOCKS.4K_ALIAS", 0x03, 0x04, true },
226 1.6 knakahar { "PAGE_WALKS.D_SIDE_CYCLES", 0x05, 0x01, true },
227 1.6 knakahar { "PAGE_WALKS.I_SIDE_CYCLES", 0x05, 0x02, true },
228 1.6 knakahar { "PAGE_WALKS.CYCLES", 0x05, 0x03, true },
229 1.6 knakahar { "UOPS_ISSUED.ANY", 0x0E, 0x00, true },
230 1.6 knakahar { "MISALIGN_MEM_REF.LOAD_PAGE_SPLIT", 0x13, 0x02, true },
231 1.6 knakahar { "MISALIGN_MEM_REF.STORE_PAGE_SPLIT", 0x13, 0x04, true },
232 1.6 knakahar { "LONGEST_LAT_CACHE.REFERENCE", 0x2E, 0x4F, true },
233 1.6 knakahar { "LONGEST_LAT_CACHE.MISS", 0x2E, 0x41, true },
234 1.6 knakahar { "L2_REJECT_XQ.ALL", 0x30, 0x00, true },
235 1.6 knakahar { "CORE_REJECT_L2Q.ALL", 0x31, 0x00, true },
236 1.6 knakahar { "CPU_CLK_UNHALTED.CORE_P", 0x3C, 0x00, true },
237 1.6 knakahar { "CPU_CLK_UNHALTED.REF", 0x3C, 0x01, true },
238 1.6 knakahar { "DL1.DIRTY_EVICTION", 0x51, 0x01, true },
239 1.6 knakahar { "ICACHE.HIT", 0x80, 0x01, true },
240 1.6 knakahar { "ICACHE.MISSES", 0x80, 0x02, true },
241 1.6 knakahar { "ICACHE.ACCESSES", 0x80, 0x03, true },
242 1.6 knakahar { "ITLB.MISS", 0x81, 0x04, true },
243 1.6 knakahar { "FETCH_STALL.ALL", 0x86, 0x00, true },
244 1.6 knakahar { "FETCH_STALL.ITLB_FILL_PENDING_CYCLES", 0x86, 0x01, true },
245 1.6 knakahar { "FETCH_STALL.ICACHE_FILL_PENDING_CYCLES", 0x86, 0x02, true },
246 1.6 knakahar { "UOPS_NOT_DELIVERED.ANY", 0x9C, 0x00, true },
247 1.6 knakahar { "OFFCORE_RESPONSE.0", 0xB7, 0x01, true },
248 1.6 knakahar { "OFFCORE_RESPONSE.1", 0xB7, 0x02, true },
249 1.6 knakahar { "INST_RETIRED.ANY_P", 0xC0, 0x00, true },
250 1.6 knakahar { "UOPS_RETIRED.ANY", 0xC2, 0x00, true },
251 1.6 knakahar { "UOPS_RETIRED.MS", 0xC2, 0x01, true },
252 1.6 knakahar { "UOPS_RETIRED.FPDIV", 0xC2, 0x08, true },
253 1.6 knakahar { "UOPS_RETIRED.IDIV", 0xC2, 0x10, true },
254 1.6 knakahar { "MACHINE_CLEARS.SMC", 0xC3, 0x01, true },
255 1.6 knakahar { "MACHINE_CLEARS.MEMORY_ORDERING", 0xC3, 0x02, true },
256 1.6 knakahar { "MACHINE_CLEARS.FP_ASSIST", 0xC3, 0x04, true },
257 1.6 knakahar { "MACHINE_CLEARS.DISAMBIGUATION", 0xC3, 0x08, true },
258 1.6 knakahar { "MACHINE_CLEARS.ALL", 0xC3, 0x00, true },
259 1.6 knakahar { "BR_INST_RETIRED.ALL_BRANCHES", 0xC4, 0x00, true },
260 1.6 knakahar { "BR_INST_RETIRED.JCC", 0xC4, 0x7E, true },
261 1.6 knakahar { "BR_INST_RETIRED.ALL_TAKEN_BRANCHES", 0xC4, 0x80, true },
262 1.6 knakahar { "BR_INST_RETIRED.TAKEN_JCC", 0xC4, 0xFE, true },
263 1.6 knakahar { "BR_INST_RETIRED.CALL", 0xC4, 0xF9, true },
264 1.6 knakahar { "BR_INST_RETIRED.REL_CALL", 0xC4, 0xFD, true },
265 1.6 knakahar { "BR_INST_RETIRED.IND_CALL", 0xC4, 0xFB, true },
266 1.6 knakahar { "BR_INST_RETIRED.RETURN", 0xC4, 0xF7, true },
267 1.6 knakahar { "BR_INST_RETIRED.NON_RETURN_IND", 0xC4, 0xEB, true },
268 1.6 knakahar { "BR_INST_RETIRED.FAR_BRANCH", 0xC4, 0xBF, true },
269 1.6 knakahar { "BR_MISP_RETIRED.ALL_BRANCHES", 0xC5, 0x00, true },
270 1.6 knakahar { "BR_MISP_RETIRED.JCC", 0xC5, 0x7E, true },
271 1.6 knakahar { "BR_MISP_RETIRED.TAKEN_JCC", 0xC5, 0xFE, true },
272 1.6 knakahar { "BR_MISP_RETIRED.IND_CALL", 0xC5, 0xFB, true },
273 1.6 knakahar { "BR_MISP_RETIRED.RETURN", 0xC5, 0xF7, true },
274 1.6 knakahar { "BR_MISP_RETIRED.NON_RETURN_IND", 0xC5, 0xEB, true },
275 1.6 knakahar { "ISSUE_SLOTS_NOT_CONSUMED.RESOURCE_FULL", 0xCA, 0x01, true },
276 1.6 knakahar { "ISSUE_SLOTS_NOT_CONSUMED.RECOVERY", 0xCA, 0x02, true },
277 1.6 knakahar { "ISSUE_SLOTS_NOT_CONSUMED.ANY", 0xCA, 0x00, true },
278 1.6 knakahar { "HW_INTERRUPTS.RECEIVED", 0xCB, 0x01, true },
279 1.6 knakahar { "HW_INTERRUPTS.MASKED", 0xCB, 0x02, true },
280 1.6 knakahar { "HW_INTERRUPTS.PENDING_AND_MASKED", 0xCB, 0x04, true },
281 1.6 knakahar { "CYCLES_DIV_BUSY.ALL", 0xCD, 0x00, true },
282 1.6 knakahar { "CYCLES_DIV_BUSY.IDIV", 0xCD, 0x01, true },
283 1.6 knakahar { "CYCLES_DIV_BUSY.FPDIV", 0xCD, 0x02, true },
284 1.6 knakahar { "MEM_UOPS_RETIRED.ALL_LOADS", 0xD0, 0x81, true },
285 1.6 knakahar { "MEM_UOPS_RETIRED.ALL_STORES", 0xD0, 0x82, true },
286 1.6 knakahar { "MEM_UOPS_RETIRED.ALL", 0xD0, 0x83, true },
287 1.6 knakahar { "MEM_UOPS_RETIRED.DTLB_MISS_LOADS", 0xD0, 0x11, true },
288 1.6 knakahar { "MEM_UOPS_RETIRED.DTLB_MISS_STORES", 0xD0, 0x12, true },
289 1.6 knakahar { "MEM_UOPS_RETIRED.DTLB_MISS", 0xD0, 0x13, true },
290 1.6 knakahar { "MEM_UOPS_RETIRED.LOCK_LOADS", 0xD0, 0x21, true },
291 1.6 knakahar { "MEM_UOPS_RETIRED.SPLIT_LOADS", 0xD0, 0x41, true },
292 1.6 knakahar { "MEM_UOPS_RETIRED.SPLIT_STORES", 0xD0, 0x42, true },
293 1.6 knakahar { "MEM_UOPS_RETIRED.SPLIT", 0xD0, 0x43, true },
294 1.6 knakahar { "MEM_LOAD_UOPS_RETIRED.L1_HIT", 0xD1, 0x01, true },
295 1.6 knakahar { "MEM_LOAD_UOPS_RETIRED.L1_MISS", 0xD1, 0x08, true },
296 1.6 knakahar { "MEM_LOAD_UOPS_RETIRED.L2_HIT", 0xD1, 0x02, true },
297 1.6 knakahar { "MEM_LOAD_UOPS_RETIRED.L2_MISS", 0xD1, 0x10, true },
298 1.6 knakahar { "MEM_LOAD_UOPS_RETIRED.HITM", 0xD1, 0x20, true },
299 1.6 knakahar { "MEM_LOAD_UOPS_RETIRED.WCB_HIT", 0xD1, 0x40, true },
300 1.6 knakahar { "MEM_LOAD_UOPS_RETIRED.DRAM_HIT", 0xD1, 0x80, true },
301 1.6 knakahar { "BACLEARS.ALL", 0xE6, 0x01, true },
302 1.6 knakahar { "BACLEARS.RETURN", 0xE6, 0x08, true },
303 1.6 knakahar { "BACLEAR.CONDS", 0xE6, 0x10, true },
304 1.6 knakahar { "MS_DECODED.MS_ENTRY", 0xE7, 0x01, true },
305 1.6 knakahar { "DECODED_RESTRICTION.PREDECODE_WRONG", 0xE9, 0x01, true },
306 1.6 knakahar };
307 1.6 knakahar
308 1.6 knakahar static struct event_table intel_goldmont = {
309 1.6 knakahar .tablename = "Intel Goldmont",
310 1.6 knakahar .names = intel_goldmont_names,
311 1.6 knakahar .nevents = sizeof(intel_goldmont_names) /
312 1.6 knakahar sizeof(struct name_to_event),
313 1.6 knakahar .next = NULL
314 1.6 knakahar };
315 1.6 knakahar
316 1.6 knakahar static struct event_table *
317 1.6 knakahar init_intel_goldmont(void)
318 1.6 knakahar {
319 1.6 knakahar
320 1.6 knakahar return &intel_goldmont;
321 1.6 knakahar }
322 1.6 knakahar
323 1.6 knakahar /*
324 1.7 knakahar * Intel Goldmont Plus (Additions from Goldmont)
325 1.7 knakahar */
326 1.7 knakahar static struct name_to_event intel_goldmontplus_names[] = {
327 1.7 knakahar { "INST_RETIRED.ANY", 0x00, 0x01, true },
328 1.7 knakahar { "DTLB_LOAD_MISSES.WALK_COMPLETED_4K", 0x08, 0x02, true },
329 1.7 knakahar { "DTLB_LOAD_MISSES.WALK_COMPLETED_2M_4M", 0x08, 0x04, true },
330 1.7 knakahar { "DTLB_LOAD_MISSES.WALK_COMPLETED_1GB", 0x08, 0x08, true },
331 1.7 knakahar { "DTLB_LOAD_MISSES.WALK_PENDING", 0x08, 0x10, true },
332 1.7 knakahar { "DTLB_STORE_MISSES.WALK_COMPLETED_4K", 0x49, 0x02, true },
333 1.7 knakahar { "DTLB_STORE_MISSES.WALK_COMPLETED_2M_4M", 0x49, 0x04, true },
334 1.7 knakahar { "DTLB_STORE_MISSES.WALK_COMPLETED_1GB", 0x49, 0x08, true },
335 1.7 knakahar { "DTLB_STORE_MISSES.WALK_PENDING", 0x49, 0x10, true },
336 1.7 knakahar { "EPT.WALK_PENDING", 0x4F, 0x10, true },
337 1.7 knakahar { "ITLB_MISSES.WALK_COMPLETED_4K", 0x85, 0x08, true },
338 1.7 knakahar { "ITLB_MISSES.WALK_COMPLETED_2M_4M", 0x85, 0x04, true },
339 1.7 knakahar { "ITLB_MISSES.WALK_COMPLETED_1GB", 0x85, 0x08, true },
340 1.7 knakahar { "ITLB_MISSES.WALK_PENDING", 0x85, 0x10, true },
341 1.7 knakahar { "TLB_FLUSHES.STLB_ANY", 0xBD, 0x20, true },
342 1.7 knakahar { "MACHINE_CLEARS.PAGE_FAULT", 0xC3, 0x20, true },
343 1.7 knakahar };
344 1.7 knakahar
345 1.7 knakahar static struct event_table intel_goldmontplus = {
346 1.7 knakahar .tablename = "Intel Goldmont Plus",
347 1.7 knakahar .names = intel_goldmontplus_names,
348 1.7 knakahar .nevents = sizeof(intel_goldmontplus_names) /
349 1.7 knakahar sizeof(struct name_to_event),
350 1.7 knakahar .next = NULL
351 1.7 knakahar };
352 1.7 knakahar
353 1.7 knakahar static struct event_table *
354 1.7 knakahar init_intel_goldmontplus(void)
355 1.7 knakahar {
356 1.7 knakahar
357 1.7 knakahar intel_goldmont.next = &intel_goldmontplus;
358 1.7 knakahar
359 1.7 knakahar return &intel_goldmont;
360 1.7 knakahar }
361 1.7 knakahar
362 1.7 knakahar /*
363 1.4 maxv * Intel Skylake/Kabylake.
364 1.4 maxv *
365 1.4 maxv * The events that are not listed, because they are of little interest or
366 1.4 maxv * require extra configuration:
367 1.4 maxv * TX_*
368 1.4 maxv * FRONTEND_RETIRED.*
369 1.4 maxv * FP_ARITH_INST_RETIRED.*
370 1.4 maxv * HLE_RETIRED.*
371 1.4 maxv * RTM_RETIRED.*
372 1.4 maxv * MEM_TRANS_RETIRED.*
373 1.4 maxv * UOPS_DISPATCHED_PORT.*
374 1.1 maxv */
375 1.1 maxv static struct name_to_event intel_skylake_kabylake_names[] = {
376 1.1 maxv /* Event Name - Event Select - UMask */
377 1.4 maxv { "LD_BLOCKS.STORE_FORWARD", 0x03, 0x02, true },
378 1.4 maxv { "LD_BLOCKS.NO_SR", 0x03, 0x08, true },
379 1.4 maxv { "LD_BLOCKS_PARTIAL.ADDRESS_ALIAS", 0x07, 0x01, true },
380 1.4 maxv { "DTLB_LOAD_MISSES.MISS_CAUSES_A_WALK", 0x08, 0x01, true },
381 1.4 maxv { "DTLB_LOAD_MISSES.WALK_COMPLETED_4K", 0x08, 0x02, true },
382 1.4 maxv { "DTLB_LOAD_MISSES.WALK_COMPLETED_2M_4M", 0x08, 0x04, true },
383 1.4 maxv { "DTLB_LOAD_MISSES.WALK_COMPLETED_1G", 0x08, 0x08, true },
384 1.4 maxv { "DTLB_LOAD_MISSES.WALK_COMPLETED", 0x08, 0x0E, true },
385 1.4 maxv { "DTLB_LOAD_MISSES.WALK_PENDING", 0x08, 0x10, true },
386 1.4 maxv { "DTLB_LOAD_MISSES.STLB_HIT", 0x08, 0x20, true },
387 1.4 maxv { "INT_MISC.RECOVERY_CYCLES", 0x0D, 0x01, true },
388 1.4 maxv { "INT_MISC.CLEAR_RESTEER_CYCLES", 0x0D, 0x80, true },
389 1.4 maxv { "UOPS_ISSUED.ANY", 0x0E, 0x01, true },
390 1.4 maxv { "UOPS_ISSUED.VECTOR_WIDTH_MISMATCH", 0x0E, 0x02, true },
391 1.4 maxv { "UOPS_ISSUED.SLOW_LEA", 0x0E, 0x20, true },
392 1.4 maxv { "L2_RQSTS.DEMAND_DATA_RD_MISS", 0x24, 0x21, true },
393 1.4 maxv { "L2_RQSTS.RFO_MISS", 0x24, 0x22, true },
394 1.4 maxv { "L2_RQSTS.CODE_RD_MISS", 0x24, 0x24, true },
395 1.4 maxv { "L2_RQSTS.ALL_DEMAND_MISS", 0x24, 0x27, true },
396 1.4 maxv { "L2_RQSTS.PF_MISS", 0x24, 0x38, true },
397 1.4 maxv { "L2_RQSTS.MISS", 0x24, 0x3F, true },
398 1.4 maxv { "L2_RQSTS.DEMAND_DATA_RD_HIT", 0x24, 0x41, true },
399 1.4 maxv { "L2_RQSTS.RFO_HIT", 0x24, 0x42, true },
400 1.4 maxv { "L2_RQSTS.CODE_RD_HIT", 0x24, 0x44, true },
401 1.4 maxv { "L2_RQSTS.PF_HIT", 0x24, 0xD8, true },
402 1.4 maxv { "L2_RQSTS.ALL_DEMAND_DATA_RD", 0x24, 0xE1, true },
403 1.4 maxv { "L2_RQSTS.ALL_RFO", 0x24, 0xE2, true },
404 1.4 maxv { "L2_RQSTS.ALL_CODE_RD", 0x24, 0xE4, true },
405 1.4 maxv { "L2_RQSTS.ALL_DEMAND_REFERENCES", 0x24, 0xE7, true },
406 1.4 maxv { "L2_RQSTS.ALL_PF", 0x24, 0xF8, true },
407 1.4 maxv { "L2_RQSTS.REFERENCES", 0x24, 0xFF, true },
408 1.4 maxv { "SW_PREFETCH_ACCESS.NTA", 0x32, 0x01, true },
409 1.4 maxv { "SW_PREFETCH_ACCESS.T0", 0x32, 0x02, true },
410 1.4 maxv { "SW_PREFETCH_ACCESS.T1_T2", 0x32, 0x04, true },
411 1.4 maxv { "SW_PREFETCH_ACCESS.PREFETCHW", 0x32, 0x08, true },
412 1.4 maxv { "CPU_CLK_THREAD_UNHALTED.ONE_THREAD_ACTIVE", 0x3C, 0x02, true },
413 1.4 maxv { "CPU_CLK_UNHALTED.ONE_THREAD_ACTIVE", 0x3C, 0x02, true },
414 1.4 maxv { "L1D_PEND_MISS.PENDING", 0x48, 0x01, true },
415 1.4 maxv { "L1D_PEND_MISS.FB_FULL", 0x48, 0x02, true },
416 1.4 maxv { "DTLB_STORE_MISSES.MISS_CAUSES_A_WALK", 0x49, 0x01, true },
417 1.4 maxv { "DTLB_STORE_MISSES.WALK_COMPLETED_4K", 0x49, 0x02, true },
418 1.4 maxv { "DTLB_STORE_MISSES.WALK_COMPLETED_2M_4M", 0x49, 0x04, true },
419 1.4 maxv { "DTLB_STORE_MISSES.WALK_COMPLETED_1G", 0x49, 0x08, true },
420 1.4 maxv { "DTLB_STORE_MISSES.WALK_COMPLETED", 0x49, 0x0E, true },
421 1.4 maxv { "DTLB_STORE_MISSES.WALK_PENDING", 0x49, 0x10, true },
422 1.4 maxv { "DTLB_STORE_MISSES.STLB_HIT", 0x49, 0x20, true },
423 1.4 maxv { "LOAD_HIT_PRE.SW_PF", 0x4C, 0x01, true },
424 1.4 maxv { "EPT.WALK_PENDING", 0x4F, 0x10, true },
425 1.4 maxv { "L1D.REPLACEMENT", 0x51, 0x01, true },
426 1.4 maxv { "RS_EVENTS.EMPTY_CYCLES", 0x5E, 0x01, true },
427 1.4 maxv { "OFFCORE_REQUESTS_OUTSTANDING.DEMAND_DATA_RD", 0x60, 0x01, true },
428 1.4 maxv { "OFFCORE_REQUESTS_OUTSTANDING.DEMAND_CODE_RD", 0x60, 0x02, true },
429 1.4 maxv { "OFFCORE_REQUESTS_OUTSTANDING.DEMAND_RFO", 0x60, 0x04, true },
430 1.4 maxv { "OFFCORE_REQUESTS_OUTSTANDING.ALL_DATA_RD", 0x60, 0x08, true },
431 1.4 maxv { "OFFCORE_REQUESTS_OUTSTANDING.L3_MISS_DEMAND_DATA_RD", 0x60, 0x10, true },
432 1.4 maxv { "IDQ.MITE_UOPS", 0x79, 0x04, true },
433 1.4 maxv { "IDQ.DSB_UOPS", 0x79, 0x08, true },
434 1.4 maxv { "IDQ.MS_MITE_UOPS", 0x79, 0x20, true },
435 1.4 maxv { "IDQ.MS_UOPS", 0x79, 0x30, true },
436 1.4 maxv { "ICACHE_16B.IFDATA_STALL", 0x80, 0x04, true },
437 1.4 maxv { "ICACHE_64B.IFTAG_HIT", 0x83, 0x01, true },
438 1.4 maxv { "ICACHE_64B.IFTAG_MISS", 0x83, 0x02, true },
439 1.4 maxv { "ICACHE_64B.IFTAG_STALL", 0x83, 0x04, true },
440 1.4 maxv { "ITLB_MISSES.MISS_CAUSES_A_WALK", 0x85, 0x01, true },
441 1.4 maxv { "ITLB_MISSES.WALK_COMPLETED_4K", 0x85, 0x02, true },
442 1.4 maxv { "ITLB_MISSES.WALK_COMPLETED_2M_4M", 0x85, 0x04, true },
443 1.4 maxv { "ITLB_MISSES.WALK_COMPLETED_1G", 0x85, 0x08, true },
444 1.4 maxv { "ITLB_MISSES.WALK_COMPLETED", 0x85, 0x0E, true },
445 1.4 maxv { "ITLB_MISSES.WALK_PENDING", 0x85, 0x10, true },
446 1.4 maxv { "ITLB_MISSES.STLB_HIT", 0x85, 0x20, true },
447 1.4 maxv { "ILD_STALL.LCP", 0x87, 0x01, true },
448 1.4 maxv { "IDQ_UOPS_NOT_DELIVERED.CORE", 0x9C, 0x01, true },
449 1.4 maxv { "RESOURCE_STALLS.ANY", 0xA2, 0x01, true },
450 1.4 maxv { "RESOURCE_STALLS.SB", 0xA2, 0x08, true },
451 1.4 maxv { "EXE_ACTIVITY.EXE_BOUND_0_PORTS", 0xA6, 0x01, true },
452 1.4 maxv { "EXE_ACTIVITY.1_PORTS_UTIL", 0xA6, 0x02, true },
453 1.4 maxv { "EXE_ACTIVITY.2_PORTS_UTIL", 0xA6, 0x04, true },
454 1.4 maxv { "EXE_ACTIVITY.3_PORTS_UTIL", 0xA6, 0x08, true },
455 1.4 maxv { "EXE_ACTIVITY.4_PORTS_UTIL", 0xA6, 0x10, true },
456 1.4 maxv { "EXE_ACTIVITY.BOUND_ON_STORES", 0xA6, 0x40, true },
457 1.4 maxv { "LSD.UOPS", 0xA8, 0x01, true },
458 1.4 maxv { "DSB2MITE_SWITCHES.PENALTY_CYCLES", 0xAB, 0x02, true },
459 1.4 maxv { "ITLB.ITLB_FLUSH", 0xAE, 0x01, true },
460 1.4 maxv { "OFFCORE_REQUESTS.DEMAND_DATA_RD", 0xB0, 0x01, true },
461 1.4 maxv { "OFFCORE_REQUESTS.DEMAND_CODE_RD", 0xB0, 0x02, true },
462 1.4 maxv { "OFFCORE_REQUESTS.DEMAND_RFO", 0xB0, 0x04, true },
463 1.4 maxv { "OFFCORE_REQUESTS.ALL_DATA_RD", 0xB0, 0x08, true },
464 1.4 maxv { "OFFCORE_REQUESTS.L3_MISS_DEMAND_DATA_RD", 0xB0, 0x10, true },
465 1.4 maxv { "OFFCORE_REQUESTS.ALL_REQUESTS", 0xB0, 0x80, true },
466 1.4 maxv { "UOPS_EXECUTED.THREAD", 0xB1, 0x01, true },
467 1.4 maxv { "UOPS_EXECUTED.CORE", 0xB1, 0x02, true },
468 1.4 maxv { "UOPS_EXECUTED.X87", 0xB1, 0x10, true },
469 1.4 maxv { "OFFCORE_REQUESTS_BUFFER.SQ_FULL", 0xB2, 0x01, true },
470 1.4 maxv { "TLB_FLUSH.DTLB_THREAD", 0xBD, 0x01, true },
471 1.4 maxv { "TLB_FLUSH.STLB_ANY", 0xBD, 0x20, true },
472 1.4 maxv { "INST_RETIRED.PREC_DIST", 0xC0, 0x01, true },
473 1.4 maxv { "OTHER_ASSISTS.ANY", 0xC1, 0x3F, true },
474 1.4 maxv { "UOPS_RETIRED.RETIRE_SLOTS", 0xC2, 0x02, true },
475 1.4 maxv { "MACHINE_CLEARS.MEMORY_ORDERING", 0xC3, 0x02, true },
476 1.4 maxv { "MACHINE_CLEARS.SMC", 0xC3, 0x04, true },
477 1.4 maxv { "BR_INST_RETIRED.CONDITIONAL", 0xC4, 0x01, true },
478 1.4 maxv { "BR_INST_RETIRED.NEAR_CALL", 0xC4, 0x02, true },
479 1.4 maxv { "BR_INST_RETIRED.NEAR_RETURN", 0xC4, 0x08, true },
480 1.4 maxv { "BR_INST_RETIRED.NOT_TAKEN", 0xC4, 0x10, true },
481 1.4 maxv { "BR_INST_RETIRED.NEAR_TAKEN", 0xC4, 0x20, true },
482 1.4 maxv { "BR_INST_RETIRED.FAR_BRANCH", 0xC4, 0x40, true },
483 1.4 maxv { "BR_MISP_RETIRED.CONDITIONAL", 0xC5, 0x01, true },
484 1.4 maxv { "BR_MISP_RETIRED.NEAR_CALL", 0xC5, 0x02, true },
485 1.4 maxv { "BR_MISP_RETIRED.NEAR_TAKEN", 0xC5, 0x20, true },
486 1.4 maxv { "HW_INTERRUPTS.RECEIVED", 0xCB, 0x01, true },
487 1.4 maxv { "MEM_INST_RETIRED.STLB_MISS_LOADS", 0xD0, 0x11, true },
488 1.4 maxv { "MEM_INST_RETIRED.STLB_MISS_STORES", 0xD0, 0x12, true },
489 1.4 maxv { "MEM_INST_RETIRED.LOCK_LOADS", 0xD0, 0x21, true },
490 1.4 maxv { "MEM_INST_RETIRED.SPLIT_LOADS", 0xD0, 0x41, true },
491 1.4 maxv { "MEM_INST_RETIRED.SPLIT_STORES", 0xD0, 0x42, true },
492 1.4 maxv { "MEM_INST_RETIRED.ALL_LOADS", 0xD0, 0x81, true },
493 1.4 maxv { "MEM_INST_RETIRED.ALL_STORES", 0xD0, 0x82, true },
494 1.4 maxv { "MEM_LOAD_RETIRED.L1_HIT", 0xD1, 0x01, true },
495 1.4 maxv { "MEM_LOAD_RETIRED.L2_HIT", 0xD1, 0x02, true },
496 1.4 maxv { "MEM_LOAD_RETIRED.L3_HIT", 0xD1, 0x04, true },
497 1.4 maxv { "MEM_LOAD_RETIRED.L1_MISS", 0xD1, 0x08, true },
498 1.4 maxv { "MEM_LOAD_RETIRED.L2_MISS", 0xD1, 0x10, true },
499 1.4 maxv { "MEM_LOAD_RETIRED.L3_MISS", 0xD1, 0x20, true },
500 1.4 maxv { "MEM_LOAD_RETIRED.FB_HIT", 0xD1, 0x40, true },
501 1.4 maxv { "MEM_LOAD_L3_HIT_RETIRED.XSNP_MISS", 0xD2, 0x01, true },
502 1.4 maxv { "MEM_LOAD_L3_HIT_RETIRED.XSNP_HIT", 0xD2, 0x02, true },
503 1.4 maxv { "MEM_LOAD_L3_HIT_RETIRED.XSNP_HITM", 0xD2, 0x04, true },
504 1.4 maxv { "MEM_LOAD_L3_HIT_RETIRED.XSNP_NONE", 0xD2, 0x08, true },
505 1.4 maxv { "MEM_LOAD_MISC_RETIRED.UC", 0xD4, 0x04, true },
506 1.4 maxv { "BACLEARS.ANY", 0xE6, 0x01, true },
507 1.4 maxv { "L2_TRANS.L2_WB", 0xF0, 0x40, true },
508 1.4 maxv { "L2_LINES_IN.ALL", 0xF1, 0x1F, true },
509 1.4 maxv { "L2_LINES_OUT.SILENT", 0xF2, 0x01, true },
510 1.4 maxv { "L2_LINES_OUT.NON_SILENT", 0xF2, 0x02, true },
511 1.4 maxv { "L2_LINES_OUT.USELESS_HWPF", 0xF2, 0x04, true },
512 1.4 maxv { "SQ_MISC.SPLIT_LOCK", 0xF4, 0x10, true },
513 1.1 maxv };
514 1.1 maxv
515 1.1 maxv static struct event_table intel_skylake_kabylake = {
516 1.1 maxv .tablename = "Intel Skylake/Kabylake",
517 1.1 maxv .names = intel_skylake_kabylake_names,
518 1.1 maxv .nevents = sizeof(intel_skylake_kabylake_names) /
519 1.1 maxv sizeof(struct name_to_event),
520 1.1 maxv .next = NULL
521 1.1 maxv };
522 1.1 maxv
523 1.1 maxv static struct event_table *
524 1.1 maxv init_intel_skylake_kabylake(void)
525 1.1 maxv {
526 1.1 maxv return &intel_skylake_kabylake;
527 1.1 maxv }
528 1.1 maxv
529 1.1 maxv static struct event_table *
530 1.1 maxv init_intel_generic(void)
531 1.1 maxv {
532 1.1 maxv unsigned int eax, ebx, ecx, edx;
533 1.1 maxv struct event_table *table;
534 1.1 maxv
535 1.1 maxv /*
536 1.1 maxv * The kernel made sure the Architectural Version 1 PMCs were
537 1.1 maxv * present.
538 1.1 maxv */
539 1.1 maxv table = init_intel_arch1();
540 1.1 maxv
541 1.1 maxv /*
542 1.1 maxv * Now query the additional (non-architectural) events. They
543 1.1 maxv * depend on the CPU model.
544 1.1 maxv */
545 1.1 maxv eax = 0x01;
546 1.1 maxv ebx = 0;
547 1.1 maxv ecx = 0;
548 1.1 maxv edx = 0;
549 1.1 maxv x86_cpuid(&eax, &ebx, &ecx, &edx);
550 1.1 maxv
551 1.3 maxv if (CPUID_TO_FAMILY(eax) == 6) {
552 1.3 maxv switch (CPUID_TO_MODEL(eax)) {
553 1.5 knakahar case 0x37: /* Silvermont (Bay Trail) */
554 1.5 knakahar case 0x4A: /* Silvermont (Tangier) */
555 1.5 knakahar case 0x4C: /* Airmont (Braswell, Cherry Trail) */
556 1.5 knakahar case 0x4D: /* Silvermont (Avoton, Rangeley) */
557 1.5 knakahar case 0x5A: /* Silvermont (Anniedale) */
558 1.5 knakahar case 0x5D: /* Silvermont (SoFIA) */
559 1.5 knakahar table->next = init_intel_silvermont_airmont();
560 1.5 knakahar break;
561 1.6 knakahar case 0x5C: /* Goldmont (Apollo Lake) */
562 1.10 knakahar case 0x5F: /* Goldmont (Denverton) */
563 1.6 knakahar table->next = init_intel_goldmont();
564 1.6 knakahar break;
565 1.7 knakahar case 0x7A: /* Goldmont Plus (Gemini Lake) */
566 1.7 knakahar table->next = init_intel_goldmontplus();
567 1.7 knakahar break;
568 1.3 maxv case 0x4E: /* Skylake */
569 1.3 maxv case 0x5E: /* Skylake */
570 1.3 maxv case 0x8E: /* Kabylake */
571 1.3 maxv case 0x9E: /* Kabylake */
572 1.3 maxv table->next = init_intel_skylake_kabylake();
573 1.3 maxv break;
574 1.3 maxv }
575 1.1 maxv }
576 1.1 maxv
577 1.1 maxv return table;
578 1.1 maxv }
579 1.1 maxv
580 1.1 maxv /* -------------------------------------------------------------------------- */
581 1.1 maxv
582 1.1 maxv /*
583 1.1 maxv * AMD Family 10h
584 1.1 maxv */
585 1.1 maxv static struct name_to_event amd_f10h_names[] = {
586 1.2 maxv { "seg-load-all", 0x20, 0x7f, true },
587 1.2 maxv { "seg-load-es", 0x20, 0x01, true },
588 1.2 maxv { "seg-load-cs", 0x20, 0x02, true },
589 1.2 maxv { "seg-load-ss", 0x20, 0x04, true },
590 1.2 maxv { "seg-load-ds", 0x20, 0x08, true },
591 1.2 maxv { "seg-load-fs", 0x20, 0x10, true },
592 1.2 maxv { "seg-load-gs", 0x20, 0x20, true },
593 1.2 maxv { "seg-load-hs", 0x20, 0x40, true },
594 1.2 maxv { "l1cache-access", 0x40, 0x00, true },
595 1.2 maxv { "l1cache-miss", 0x41, 0x00, true },
596 1.2 maxv { "l1cache-refill", 0x42, 0x1f, true },
597 1.2 maxv { "l1cache-refill-invalid", 0x42, 0x01, true },
598 1.2 maxv { "l1cache-refill-shared", 0x42, 0x02, true },
599 1.2 maxv { "l1cache-refill-exclusive", 0x42, 0x04, true },
600 1.2 maxv { "l1cache-refill-owner", 0x42, 0x08, true },
601 1.2 maxv { "l1cache-refill-modified", 0x42, 0x10, true },
602 1.2 maxv { "l1cache-load", 0x43, 0x1f, true },
603 1.2 maxv { "l1cache-load-invalid", 0x43, 0x01, true },
604 1.2 maxv { "l1cache-load-shared", 0x43, 0x02, true },
605 1.2 maxv { "l1cache-load-exclusive", 0x43, 0x04, true },
606 1.2 maxv { "l1cache-load-owner", 0x43, 0x08, true },
607 1.2 maxv { "l1cache-load-modified", 0x43, 0x10, true },
608 1.2 maxv { "l1cache-writeback", 0x44, 0x1f, true },
609 1.2 maxv { "l1cache-writeback-invalid", 0x44, 0x01, true },
610 1.2 maxv { "l1cache-writeback-shared", 0x44, 0x02, true },
611 1.2 maxv { "l1cache-writeback-exclusive",0x44, 0x04, true },
612 1.2 maxv { "l1cache-writeback-owner", 0x44, 0x08, true },
613 1.2 maxv { "l1cache-writeback-modified", 0x44, 0x10, true },
614 1.2 maxv { "l1DTLB-hit-all", 0x4D, 0x07, true },
615 1.2 maxv { "l1DTLB-hit-4Kpage", 0x4D, 0x01, true },
616 1.2 maxv { "l1DTLB-hit-2Mpage", 0x4D, 0x02, true },
617 1.2 maxv { "l1DTLB-hit-1Gpage", 0x4D, 0x04, true },
618 1.2 maxv { "l1DTLB-miss-all", 0x45, 0x07, true },
619 1.2 maxv { "l1DTLB-miss-4Kpage", 0x45, 0x01, true },
620 1.2 maxv { "l1DTLB-miss-2Mpage", 0x45, 0x02, true },
621 1.2 maxv { "l1DTLB-miss-1Gpage", 0x45, 0x04, true },
622 1.2 maxv { "l2DTLB-miss-all", 0x46, 0x03, true },
623 1.2 maxv { "l2DTLB-miss-4Kpage", 0x46, 0x01, true },
624 1.2 maxv { "l2DTLB-miss-2Mpage", 0x46, 0x02, true },
625 1.1 maxv /* l2DTLB-miss-1Gpage: reserved on some revisions, so disabled */
626 1.2 maxv { "l1ITLB-miss", 0x84, 0x00, true },
627 1.2 maxv { "l2ITLB-miss-all", 0x85, 0x03, true },
628 1.2 maxv { "l2ITLB-miss-4Kpage", 0x85, 0x01, true },
629 1.2 maxv { "l2ITLB-miss-2Mpage", 0x85, 0x02, true },
630 1.2 maxv { "mem-misalign-ref", 0x47, 0x00, true },
631 1.2 maxv { "ins-fetch", 0x80, 0x00, true },
632 1.2 maxv { "ins-fetch-miss", 0x81, 0x00, true },
633 1.2 maxv { "ins-refill-l2", 0x82, 0x00, true },
634 1.2 maxv { "ins-refill-sys", 0x83, 0x00, true },
635 1.2 maxv { "ins-fetch-stall", 0x87, 0x00, true },
636 1.2 maxv { "ins-retired", 0xC0, 0x00, true },
637 1.2 maxv { "ins-empty", 0xD0, 0x00, true },
638 1.2 maxv { "ops-retired", 0xC1, 0x00, true },
639 1.2 maxv { "branch-retired", 0xC2, 0x00, true },
640 1.2 maxv { "branch-miss-retired", 0xC3, 0x00, true },
641 1.2 maxv { "branch-taken-retired", 0xC4, 0x00, true },
642 1.2 maxv { "branch-taken-miss-retired", 0xC5, 0x00, true },
643 1.2 maxv { "branch-far-retired", 0xC6, 0x00, true },
644 1.2 maxv { "branch-resync-retired", 0xC7, 0x00, true },
645 1.2 maxv { "branch-near-retired", 0xC8, 0x00, true },
646 1.2 maxv { "branch-near-miss-retired", 0xC9, 0x00, true },
647 1.2 maxv { "branch-indirect-miss-retired", 0xCA, 0x00, true },
648 1.2 maxv { "int-hw", 0xCF, 0x00, true },
649 1.2 maxv { "int-cycles-masked", 0xCD, 0x00, true },
650 1.2 maxv { "int-cycles-masked-pending", 0xCE, 0x00, true },
651 1.2 maxv { "fpu-exceptions", 0xDB, 0x00, true },
652 1.2 maxv { "break-match0", 0xDC, 0x00, true },
653 1.2 maxv { "break-match1", 0xDD, 0x00, true },
654 1.2 maxv { "break-match2", 0xDE, 0x00, true },
655 1.2 maxv { "break-match3", 0xDF, 0x00, true },
656 1.1 maxv };
657 1.1 maxv
658 1.1 maxv static struct event_table amd_f10h = {
659 1.1 maxv .tablename = "AMD Family 10h",
660 1.1 maxv .names = amd_f10h_names,
661 1.1 maxv .nevents = sizeof(amd_f10h_names) /
662 1.1 maxv sizeof(struct name_to_event),
663 1.1 maxv .next = NULL
664 1.1 maxv };
665 1.1 maxv
666 1.8 maxv /*
667 1.9 jmcneill * AMD Family 15h
668 1.9 jmcneill */
669 1.9 jmcneill static struct name_to_event amd_f15h_names[] = {
670 1.9 jmcneill { "FpPipeAssignment", 0x000, 0x77, true },
671 1.9 jmcneill { "FpSchedulerEmpty", 0x001, 0x00, true },
672 1.9 jmcneill { "FpRetSseAvxOps", 0x003, 0xff, true },
673 1.9 jmcneill { "FpNumMovElim", 0x004, 0x0f, true },
674 1.9 jmcneill { "FpRetiredSerOps", 0x005, 0x0f, true },
675 1.9 jmcneill { "LsSegRegLoads", 0x020, 0x7f, true },
676 1.9 jmcneill { "LsPipeRestartSelfMod", 0x021, 0x00, true },
677 1.9 jmcneill { "LsPipeRestartVarious", 0x022, 0x1f, true },
678 1.9 jmcneill { "LsLoadQueueStoreQFull", 0x023, 0x03, true },
679 1.9 jmcneill { "LsLockedOps", 0x024, 0x00, true },
680 1.9 jmcneill { "LsRetClflushInstr", 0x026, 0x00, true },
681 1.9 jmcneill { "LsRetCpuidInstr", 0x027, 0x00, true },
682 1.9 jmcneill { "LsDispatch", 0x029, 0x07, true },
683 1.9 jmcneill { "LsCanStoreToLoadFwOps", 0x02a, 0x03, true },
684 1.9 jmcneill { "LsSmisReceived", 0x02b, 0x00, true },
685 1.9 jmcneill { "LsExecClflushInstr", 0x030, 0x00, true },
686 1.9 jmcneill { "LsMisalignStore", 0x032, 0x00, true },
687 1.9 jmcneill { "LsFpLoadBufStall", 0x034, 0x00, true },
688 1.9 jmcneill { "LsStlf", 0x035, 0x00, true },
689 1.9 jmcneill { "DcCacheAccess", 0x040, 0x00, true },
690 1.9 jmcneill { "DcCacheMiss", 0x041, 0x00, true },
691 1.9 jmcneill { "DcCacheFillL2Sys", 0x042, 0x1f, true },
692 1.9 jmcneill { "DcCacheFillSys", 0x043, 0x00, true },
693 1.9 jmcneill { "DcUnifiedTlbHit", 0x045, 0x77, true },
694 1.9 jmcneill { "DcUnifiedTlbMiss", 0x046, 0x77, true },
695 1.9 jmcneill { "DcMisalignAccess", 0x047, 0x00, true },
696 1.9 jmcneill { "DcPrefetchInstrDisp", 0x04b, 0x07, true },
697 1.9 jmcneill { "DcIneffSwPrefetch", 0x052, 0x09, true },
698 1.9 jmcneill { "CuCmdVictimBuf", 0x060, 0x98, true },
699 1.9 jmcneill { "CuCmdMaskedOps", 0x061, 0x65, true },
700 1.9 jmcneill { "CuCmdReadBlkOps", 0x062, 0x77, true },
701 1.9 jmcneill { "CuCmdChgDirtyOps", 0x063, 0x08, true },
702 1.9 jmcneill { "CuDramSysReq", 0x064, 0x00, true },
703 1.9 jmcneill { "CuMemReqByType", 0x065, 0x83, true },
704 1.9 jmcneill { "CuDataCachePrefetch", 0x067, 0x03, true },
705 1.9 jmcneill { "CuMabReq", 0x068, 0xff, true },
706 1.9 jmcneill { "CuMabWaitCyc", 0x069, 0xff, true },
707 1.9 jmcneill { "CuSysRespCacheFill", 0x06c, 0x3f, true },
708 1.9 jmcneill { "CuOctwordsWritten", 0x06d, 0x01, true },
709 1.9 jmcneill { "CuCacheXInv", 0x075, 0x0f, true },
710 1.9 jmcneill { "CuCpuClkNotHalted", 0x076, 0x00, true },
711 1.9 jmcneill { "CuL2Req", 0x07d, 0x5f, true },
712 1.9 jmcneill { "CuL2Miss", 0x07e, 0x17, true },
713 1.9 jmcneill { "CuL2FillWb", 0x07f, 0x07, true },
714 1.9 jmcneill { "CuPageSplintering", 0x165, 0x07, true },
715 1.9 jmcneill { "CuL2PrefetchTrigEv", 0x16c, 0x03, true },
716 1.9 jmcneill { "CuXabAllocStall", 0x177, 0x03, true },
717 1.9 jmcneill { "CuFreeXabEntries", 0x17f, 0x01, true },
718 1.9 jmcneill { "IcCacheFetch", 0x080, 0x00, true },
719 1.9 jmcneill { "IcCacheMiss", 0x081, 0x00, true },
720 1.9 jmcneill { "IcCacheFillL2", 0x082, 0x00, true },
721 1.9 jmcneill { "IcCacheFillSys", 0x083, 0x00, true },
722 1.9 jmcneill { "IcL1TlbMissL2Hit", 0x084, 0x00, true },
723 1.9 jmcneill { "IcL1TlbMissL2Miss", 0x085, 0x07, true },
724 1.9 jmcneill { "IcPipeRestartInstrStrProbe", 0x086, 0x00, true },
725 1.9 jmcneill { "IcFetchStall", 0x087, 0x00, true },
726 1.9 jmcneill { "IcRetStackHits", 0x088, 0x00, true },
727 1.9 jmcneill { "IcRetStackOver", 0x089, 0x00, true },
728 1.9 jmcneill { "IcCacheVictims", 0x08b, 0x00, true },
729 1.9 jmcneill { "IcCacheLinesInv", 0x08c, 0x0f, true },
730 1.9 jmcneill { "IcTlbReload", 0x099, 0x00, true },
731 1.9 jmcneill { "IcTlbReloadAbort", 0x09a, 0x00, true },
732 1.9 jmcneill { "IcUopsDispatched", 0x186, 0x01, true },
733 1.9 jmcneill { "ExRetInstr", 0x0c0, 0x00, true },
734 1.9 jmcneill { "ExRetCops", 0x0c1, 0x00, true },
735 1.9 jmcneill { "ExRetBrn", 0x0c2, 0x00, true },
736 1.9 jmcneill { "ExRetBrnMisp", 0x0c3, 0x00, true },
737 1.9 jmcneill { "ExRetBrnTkn", 0x0c4, 0x00, true },
738 1.9 jmcneill { "ExRetBrnTknMisp", 0x0c5, 0x00, true },
739 1.9 jmcneill { "ExRetBrnFar", 0x0c6, 0x00, true },
740 1.9 jmcneill { "ExRetBrnResync", 0x0c7, 0x00, true },
741 1.9 jmcneill { "ExRetNearRet", 0x0c8, 0x00, true },
742 1.9 jmcneill { "ExRetNearRetMispred", 0x0c9, 0x00, true },
743 1.9 jmcneill { "ExRetBrnIndMisp", 0x0ca, 0x00, true },
744 1.9 jmcneill { "ExRetMmxFpInstr@X87", 0x0cb, 0x01, true },
745 1.9 jmcneill { "ExRetMmxFpInstr@Mmx", 0x0cb, 0x02, true },
746 1.9 jmcneill { "ExRetMmxFpInstr@Sse", 0x0cb, 0x04, true },
747 1.9 jmcneill { "ExIntMaskedCyc", 0x0cd, 0x00, true },
748 1.9 jmcneill { "ExIntMaskedCycIntPend", 0x0ce, 0x00, true },
749 1.9 jmcneill { "ExIntTaken", 0x0cf, 0x00, true },
750 1.9 jmcneill { "ExDecEmpty", 0x0d0, 0x00, true },
751 1.9 jmcneill { "ExDispStall", 0x0d1, 0x00, true },
752 1.9 jmcneill { "ExUseqStallSer", 0x0d2, 0x00, true },
753 1.9 jmcneill { "ExDispStallInstrRetQFull", 0x0d5, 0x00, true },
754 1.9 jmcneill { "ExDispStallIntSchedQFull", 0x0d6, 0x00, true },
755 1.9 jmcneill { "ExDispStallFpSchedQFull", 0x0d7, 0x00, true },
756 1.9 jmcneill { "ExDispStallLdqFull", 0x0d8, 0x00, true },
757 1.9 jmcneill { "ExUseqStallAllQuiet", 0x0d9, 0x00, true },
758 1.9 jmcneill { "ExFpuEx", 0x0db, 0x1f, true },
759 1.9 jmcneill { "ExBpDr0", 0x0dc, 0x8f, true },
760 1.9 jmcneill { "ExBpDr1", 0x0dd, 0x8f, true },
761 1.9 jmcneill { "ExBpDr2", 0x0de, 0x8f, true },
762 1.9 jmcneill { "ExBpDr3", 0x0df, 0x8f, true },
763 1.9 jmcneill { "ExRetx87FpOps", 0x1c0, 0x07, true },
764 1.9 jmcneill { "ExTaggedIbsOps", 0x1cf, 0x07, true },
765 1.9 jmcneill { "ExRetFusBrInstr", 0x1d0, 0x00, true },
766 1.9 jmcneill { "ExDispStallStqFull", 0x1d8, 0x00, true },
767 1.9 jmcneill { "ExCycNoDispIntPrfTok", 0x1dd, 0x00, true },
768 1.9 jmcneill { "ExCycNoDispfpPrfTok", 0x1de, 0x00, true },
769 1.9 jmcneill { "ExFpDispContention", 0x1df, 0x0f, true },
770 1.9 jmcneill };
771 1.9 jmcneill
772 1.9 jmcneill static struct event_table amd_f15h = {
773 1.9 jmcneill .tablename = "AMD Family 15h",
774 1.9 jmcneill .names = amd_f15h_names,
775 1.9 jmcneill .nevents = sizeof(amd_f15h_names) /
776 1.9 jmcneill sizeof(struct name_to_event),
777 1.9 jmcneill .next = NULL
778 1.9 jmcneill };
779 1.9 jmcneill
780 1.9 jmcneill /*
781 1.8 maxv * AMD Family 17h
782 1.8 maxv */
783 1.8 maxv static struct name_to_event amd_f17h_names[] = {
784 1.8 maxv { "FpRetx87FpOps", 0x02, __BITS(2,0), true },
785 1.8 maxv { "FpRetSseAvxOps", 0x03, __BITS(7,0), true },
786 1.8 maxv { "FpRetiredSerOps", 0x05, __BITS(3,0), true },
787 1.8 maxv { "LsL1DTlbMiss", 0x45, __BITS(7,0), true },
788 1.8 maxv { "LsTableWalker", 0x46, __BITS(3,0), true },
789 1.8 maxv { "LsMisalAccesses", 0x47, 0x00, true },
790 1.8 maxv { "LsInefSwPref", 0x52, __BITS(1,0), true },
791 1.8 maxv { "LsNotHaltedCyc", 0x76, 0x00, true },
792 1.8 maxv { "IcFw32", 0x80, 0x00, true },
793 1.8 maxv { "IcFw32Miss", 0x81, 0x00, true },
794 1.8 maxv { "IcCacheFillL2", 0x82, 0x00, true },
795 1.8 maxv { "IcCacheFillSys", 0x83, 0x00, true },
796 1.8 maxv { "IcFetchStall", 0x87, __BITS(2,0), true },
797 1.8 maxv { "IcCacheInval", 0x8C, __BITS(1,0), true },
798 1.8 maxv { "BpL1TlbMissL2Hit", 0x84, 0x00, true },
799 1.8 maxv { "BpL1TlbMissL2Miss", 0x85, 0x00, true },
800 1.8 maxv { "BpSnpReSync", 0x86, 0x00, true },
801 1.8 maxv { "BpL1BTBCorrect", 0x8A, 0x00, true },
802 1.8 maxv { "BpL2BTBCorrect", 0x8B, 0x00, true },
803 1.8 maxv { "BpTlbRel", 0x99, 0x00, true },
804 1.8 maxv { "ExRetInstr", 0xC0, 0x00, true },
805 1.8 maxv { "ExRetCops", 0xC1, 0x00, true },
806 1.8 maxv { "ExRetBrn", 0xC2, 0x00, true },
807 1.8 maxv { "ExRetBrnMisp", 0xC3, 0x00, true },
808 1.8 maxv { "ExRetBrnTkn", 0xC4, 0x00, true },
809 1.8 maxv { "ExRetBrnTknMisp", 0xC5, 0x00, true },
810 1.8 maxv { "ExRetBrnFar", 0xC6, 0x00, true },
811 1.8 maxv { "ExRetBrnResync", 0xC7, 0x00, true },
812 1.8 maxv { "ExRetBrnIndMisp", 0xCA, 0x00, true },
813 1.8 maxv { "ExRetNearRet", 0xC8, 0x00, true },
814 1.8 maxv { "ExRetNearRetMispred", 0xC9, 0x00, true },
815 1.8 maxv { "ExRetMmxFpInstr@X87", 0xCB, __BIT(0), true },
816 1.8 maxv { "ExRetMmxFpInstr@Mmx", 0xCB, __BIT(1), true },
817 1.8 maxv { "ExRetMmxFpInstr@Sse", 0xCB, __BIT(2), true },
818 1.8 maxv { "ExRetCond", 0xD1, 0x00, true },
819 1.8 maxv { "ExRetCondMisp", 0xD2, 0x00, true },
820 1.8 maxv { "ExDivBusy", 0xD3, 0x00, true },
821 1.8 maxv { "ExDivCount", 0xD4, 0x00, true },
822 1.8 maxv };
823 1.8 maxv
824 1.8 maxv static struct event_table amd_f17h = {
825 1.8 maxv .tablename = "AMD Family 17h",
826 1.8 maxv .names = amd_f17h_names,
827 1.8 maxv .nevents = sizeof(amd_f17h_names) /
828 1.8 maxv sizeof(struct name_to_event),
829 1.8 maxv .next = NULL
830 1.8 maxv };
831 1.1 maxv
832 1.1 maxv static struct event_table *
833 1.1 maxv init_amd_generic(void)
834 1.1 maxv {
835 1.1 maxv unsigned int eax, ebx, ecx, edx;
836 1.1 maxv
837 1.1 maxv eax = 0x01;
838 1.1 maxv ebx = 0;
839 1.1 maxv ecx = 0;
840 1.1 maxv edx = 0;
841 1.1 maxv x86_cpuid(&eax, &ebx, &ecx, &edx);
842 1.1 maxv
843 1.1 maxv switch (CPUID_TO_FAMILY(eax)) {
844 1.1 maxv case 0x10:
845 1.8 maxv return &amd_f10h;
846 1.9 jmcneill case 0x15:
847 1.9 jmcneill return &amd_f15h;
848 1.8 maxv case 0x17:
849 1.8 maxv return &amd_f17h;
850 1.1 maxv }
851 1.1 maxv
852 1.1 maxv return NULL;
853 1.1 maxv }
854 1.1 maxv
855 1.1 maxv /* -------------------------------------------------------------------------- */
856 1.1 maxv
857 1.1 maxv int
858 1.1 maxv tprof_event_init(uint32_t ident)
859 1.1 maxv {
860 1.1 maxv switch (ident) {
861 1.1 maxv case TPROF_IDENT_NONE:
862 1.1 maxv return -1;
863 1.1 maxv case TPROF_IDENT_INTEL_GENERIC:
864 1.1 maxv cpuevents = init_intel_generic();
865 1.1 maxv break;
866 1.1 maxv case TPROF_IDENT_AMD_GENERIC:
867 1.1 maxv cpuevents = init_amd_generic();
868 1.1 maxv break;
869 1.1 maxv }
870 1.1 maxv return (cpuevents == NULL) ? -1 : 0;
871 1.1 maxv }
872 1.1 maxv
873 1.1 maxv static void
874 1.1 maxv recursive_event_list(struct event_table *table)
875 1.1 maxv {
876 1.1 maxv size_t i;
877 1.1 maxv
878 1.1 maxv printf("%s:\n", table->tablename);
879 1.1 maxv for (i = 0; i < table->nevents; i++) {
880 1.1 maxv if (!table->names[i].enabled)
881 1.1 maxv continue;
882 1.1 maxv printf("\t%s\n", table->names[i].name);
883 1.1 maxv }
884 1.1 maxv
885 1.1 maxv if (table->next != NULL) {
886 1.1 maxv recursive_event_list(table->next);
887 1.1 maxv }
888 1.1 maxv }
889 1.1 maxv
890 1.1 maxv void
891 1.1 maxv tprof_event_list(void)
892 1.1 maxv {
893 1.1 maxv recursive_event_list(cpuevents);
894 1.1 maxv }
895 1.1 maxv
896 1.1 maxv static void
897 1.1 maxv recursive_event_lookup(struct event_table *table, const char *name,
898 1.1 maxv struct tprof_param *param)
899 1.1 maxv {
900 1.1 maxv size_t i;
901 1.1 maxv
902 1.1 maxv for (i = 0; i < table->nevents; i++) {
903 1.1 maxv if (!table->names[i].enabled)
904 1.1 maxv continue;
905 1.1 maxv if (!strcmp(table->names[i].name, name)) {
906 1.1 maxv param->p_event = table->names[i].event;
907 1.1 maxv param->p_unit = table->names[i].unit;
908 1.1 maxv return;
909 1.1 maxv }
910 1.1 maxv }
911 1.1 maxv
912 1.1 maxv if (table->next != NULL) {
913 1.1 maxv recursive_event_lookup(table->next, name, param);
914 1.1 maxv } else {
915 1.1 maxv errx(EXIT_FAILURE, "event '%s' unknown", name);
916 1.1 maxv }
917 1.1 maxv }
918 1.1 maxv
919 1.1 maxv void
920 1.1 maxv tprof_event_lookup(const char *name, struct tprof_param *param)
921 1.1 maxv {
922 1.1 maxv recursive_event_lookup(cpuevents, name, param);
923 1.1 maxv }
924