tprof_armv8.c revision 1.4.2.2 1 1.4.2.2 pgoyette /* $NetBSD: tprof_armv8.c,v 1.4.2.2 2018/07/28 04:37:57 pgoyette Exp $ */
2 1.4.2.2 pgoyette
3 1.4.2.2 pgoyette /*-
4 1.4.2.2 pgoyette * Copyright (c) 2018 Jared McNeill <jmcneill (at) invisible.ca>
5 1.4.2.2 pgoyette * All rights reserved.
6 1.4.2.2 pgoyette *
7 1.4.2.2 pgoyette * Redistribution and use in source and binary forms, with or without
8 1.4.2.2 pgoyette * modification, are permitted provided that the following conditions
9 1.4.2.2 pgoyette * are met:
10 1.4.2.2 pgoyette * 1. Redistributions of source code must retain the above copyright
11 1.4.2.2 pgoyette * notice, this list of conditions and the following disclaimer.
12 1.4.2.2 pgoyette * 2. Redistributions in binary form must reproduce the above copyright
13 1.4.2.2 pgoyette * notice, this list of conditions and the following disclaimer in the
14 1.4.2.2 pgoyette * documentation and/or other materials provided with the distribution.
15 1.4.2.2 pgoyette *
16 1.4.2.2 pgoyette * THIS SOFTWARE IS PROVIDED BY THE AUTHOR ``AS IS'' AND ANY EXPRESS OR
17 1.4.2.2 pgoyette * IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES
18 1.4.2.2 pgoyette * OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE DISCLAIMED.
19 1.4.2.2 pgoyette * IN NO EVENT SHALL THE AUTHOR BE LIABLE FOR ANY DIRECT, INDIRECT,
20 1.4.2.2 pgoyette * INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING,
21 1.4.2.2 pgoyette * BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES;
22 1.4.2.2 pgoyette * LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED
23 1.4.2.2 pgoyette * AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY,
24 1.4.2.2 pgoyette * OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
25 1.4.2.2 pgoyette * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
26 1.4.2.2 pgoyette * SUCH DAMAGE.
27 1.4.2.2 pgoyette */
28 1.4.2.2 pgoyette
29 1.4.2.2 pgoyette #include <sys/cdefs.h>
30 1.4.2.2 pgoyette __KERNEL_RCSID(0, "$NetBSD: tprof_armv8.c,v 1.4.2.2 2018/07/28 04:37:57 pgoyette Exp $");
31 1.4.2.2 pgoyette
32 1.4.2.2 pgoyette #include <sys/param.h>
33 1.4.2.2 pgoyette #include <sys/bus.h>
34 1.4.2.2 pgoyette #include <sys/cpu.h>
35 1.4.2.2 pgoyette #include <sys/xcall.h>
36 1.4.2.2 pgoyette
37 1.4.2.2 pgoyette #include <dev/tprof/tprof.h>
38 1.4.2.2 pgoyette
39 1.4.2.2 pgoyette #include <arm/armreg.h>
40 1.4.2.2 pgoyette #include <arm/locore.h>
41 1.4.2.2 pgoyette
42 1.4.2.2 pgoyette #include <dev/tprof/tprof_armv8.h>
43 1.4.2.2 pgoyette
44 1.4.2.2 pgoyette static tprof_param_t armv8_pmu_param;
45 1.4.2.2 pgoyette static const u_int armv8_pmu_counter = 1;
46 1.4.2.2 pgoyette static uint32_t counter_val;
47 1.4.2.2 pgoyette static uint32_t counter_reset_val;
48 1.4.2.2 pgoyette
49 1.4.2.2 pgoyette static bool
50 1.4.2.2 pgoyette armv8_pmu_event_implemented(uint16_t event)
51 1.4.2.2 pgoyette {
52 1.4.2.2 pgoyette uint64_t eid[2];
53 1.4.2.2 pgoyette
54 1.4.2.2 pgoyette if (event >= 64)
55 1.4.2.2 pgoyette return false;
56 1.4.2.2 pgoyette
57 1.4.2.2 pgoyette eid[0] = reg_pmceid0_el0_read();
58 1.4.2.2 pgoyette eid[1] = reg_pmceid1_el0_read();
59 1.4.2.2 pgoyette
60 1.4.2.2 pgoyette const u_int idx = event / 32;
61 1.4.2.2 pgoyette const u_int bit = event % 32;
62 1.4.2.2 pgoyette
63 1.4.2.2 pgoyette if (eid[idx] & __BIT(bit))
64 1.4.2.2 pgoyette return true;
65 1.4.2.2 pgoyette
66 1.4.2.2 pgoyette return false;
67 1.4.2.2 pgoyette }
68 1.4.2.2 pgoyette
69 1.4.2.2 pgoyette static void
70 1.4.2.2 pgoyette armv8_pmu_set_pmevtyper(u_int counter, uint64_t val)
71 1.4.2.2 pgoyette {
72 1.4.2.2 pgoyette reg_pmselr_el0_write(counter);
73 1.4.2.2 pgoyette arm_isb();
74 1.4.2.2 pgoyette reg_pmxevtyper_el0_write(val);
75 1.4.2.2 pgoyette }
76 1.4.2.2 pgoyette
77 1.4.2.2 pgoyette static void
78 1.4.2.2 pgoyette armv8_pmu_set_pmevcntr(u_int counter, uint32_t val)
79 1.4.2.2 pgoyette {
80 1.4.2.2 pgoyette reg_pmselr_el0_write(counter);
81 1.4.2.2 pgoyette arm_isb();
82 1.4.2.2 pgoyette reg_pmxevcntr_el0_write(val);
83 1.4.2.2 pgoyette }
84 1.4.2.2 pgoyette
85 1.4.2.2 pgoyette static void
86 1.4.2.2 pgoyette armv8_pmu_start_cpu(void *arg1, void *arg2)
87 1.4.2.2 pgoyette {
88 1.4.2.2 pgoyette const uint32_t counter_mask = __BIT(armv8_pmu_counter);
89 1.4.2.2 pgoyette uint64_t pmcr, pmevtyper;
90 1.4.2.2 pgoyette
91 1.4.2.2 pgoyette /* Enable performance monitor */
92 1.4.2.2 pgoyette pmcr = reg_pmcr_el0_read();
93 1.4.2.2 pgoyette pmcr |= PMCR_E;
94 1.4.2.2 pgoyette reg_pmcr_el0_write(pmcr);
95 1.4.2.2 pgoyette
96 1.4.2.2 pgoyette /* Disable event counter */
97 1.4.2.2 pgoyette reg_pmcntenclr_el0_write(counter_mask);
98 1.4.2.2 pgoyette
99 1.4.2.2 pgoyette /* Configure event counter */
100 1.4.2.2 pgoyette pmevtyper = __SHIFTIN(armv8_pmu_param.p_event, PMEVTYPER_EVTCOUNT);
101 1.4.2.2 pgoyette if (!ISSET(armv8_pmu_param.p_flags, TPROF_PARAM_USER))
102 1.4.2.2 pgoyette pmevtyper |= PMEVTYPER_U;
103 1.4.2.2 pgoyette if (!ISSET(armv8_pmu_param.p_flags, TPROF_PARAM_KERN))
104 1.4.2.2 pgoyette pmevtyper |= PMEVTYPER_P;
105 1.4.2.2 pgoyette
106 1.4.2.2 pgoyette armv8_pmu_set_pmevtyper(armv8_pmu_counter, pmevtyper);
107 1.4.2.2 pgoyette
108 1.4.2.2 pgoyette /* Enable overflow interrupts */
109 1.4.2.2 pgoyette reg_pmintenset_el1_write(counter_mask);
110 1.4.2.2 pgoyette
111 1.4.2.2 pgoyette /* Clear overflow flag */
112 1.4.2.2 pgoyette reg_pmovsclr_el0_write(counter_mask);
113 1.4.2.2 pgoyette
114 1.4.2.2 pgoyette /* Initialize event counter value */
115 1.4.2.2 pgoyette armv8_pmu_set_pmevcntr(armv8_pmu_counter, counter_reset_val);
116 1.4.2.2 pgoyette
117 1.4.2.2 pgoyette /* Enable event counter */
118 1.4.2.2 pgoyette reg_pmcntenset_el0_write(counter_mask);
119 1.4.2.2 pgoyette }
120 1.4.2.2 pgoyette
121 1.4.2.2 pgoyette static void
122 1.4.2.2 pgoyette armv8_pmu_stop_cpu(void *arg1, void *arg2)
123 1.4.2.2 pgoyette {
124 1.4.2.2 pgoyette const uint32_t counter_mask = __BIT(armv8_pmu_counter);
125 1.4.2.2 pgoyette uint32_t pmcr;
126 1.4.2.2 pgoyette
127 1.4.2.2 pgoyette /* Disable overflow interrupts */
128 1.4.2.2 pgoyette reg_pmintenclr_el1_write(counter_mask);
129 1.4.2.2 pgoyette
130 1.4.2.2 pgoyette /* Disable event counter */
131 1.4.2.2 pgoyette reg_pmcntenclr_el0_write(counter_mask);
132 1.4.2.2 pgoyette
133 1.4.2.2 pgoyette /* Disable performance monitor */
134 1.4.2.2 pgoyette pmcr = reg_pmcr_el0_read();
135 1.4.2.2 pgoyette pmcr &= ~PMCR_E;
136 1.4.2.2 pgoyette reg_pmcr_el0_write(pmcr);
137 1.4.2.2 pgoyette }
138 1.4.2.2 pgoyette
139 1.4.2.2 pgoyette static uint64_t
140 1.4.2.2 pgoyette armv8_pmu_estimate_freq(void)
141 1.4.2.2 pgoyette {
142 1.4.2.2 pgoyette uint64_t cpufreq = curcpu()->ci_data.cpu_cc_freq;
143 1.4.2.2 pgoyette uint64_t freq = 10000;
144 1.4.2.2 pgoyette uint32_t pmcr;
145 1.4.2.2 pgoyette
146 1.4.2.2 pgoyette counter_val = cpufreq / freq;
147 1.4.2.2 pgoyette if (counter_val == 0)
148 1.4.2.2 pgoyette counter_val = 4000000000ULL / freq;
149 1.4.2.2 pgoyette
150 1.4.2.2 pgoyette pmcr = reg_pmcr_el0_read();
151 1.4.2.2 pgoyette if (pmcr & PMCR_D)
152 1.4.2.2 pgoyette counter_val /= 64;
153 1.4.2.2 pgoyette
154 1.4.2.2 pgoyette return freq;
155 1.4.2.2 pgoyette }
156 1.4.2.2 pgoyette
157 1.4.2.2 pgoyette static uint32_t
158 1.4.2.2 pgoyette armv8_pmu_ident(void)
159 1.4.2.2 pgoyette {
160 1.4.2.2 pgoyette return TPROF_IDENT_ARMV8_GENERIC;
161 1.4.2.2 pgoyette }
162 1.4.2.2 pgoyette
163 1.4.2.2 pgoyette static int
164 1.4.2.2 pgoyette armv8_pmu_start(const tprof_param_t *param)
165 1.4.2.2 pgoyette {
166 1.4.2.2 pgoyette uint64_t xc;
167 1.4.2.2 pgoyette
168 1.4.2.2 pgoyette if (!armv8_pmu_event_implemented(param->p_event)) {
169 1.4.2.2 pgoyette printf("%s: event %#" PRIx64 " not implemented on this CPU\n",
170 1.4.2.2 pgoyette __func__, param->p_event);
171 1.4.2.2 pgoyette return EINVAL;
172 1.4.2.2 pgoyette }
173 1.4.2.2 pgoyette
174 1.4.2.2 pgoyette counter_reset_val = -counter_val + 1;
175 1.4.2.2 pgoyette
176 1.4.2.2 pgoyette armv8_pmu_param = *param;
177 1.4.2.2 pgoyette xc = xc_broadcast(0, armv8_pmu_start_cpu, NULL, NULL);
178 1.4.2.2 pgoyette xc_wait(xc);
179 1.4.2.2 pgoyette
180 1.4.2.2 pgoyette return 0;
181 1.4.2.2 pgoyette }
182 1.4.2.2 pgoyette
183 1.4.2.2 pgoyette static void
184 1.4.2.2 pgoyette armv8_pmu_stop(const tprof_param_t *param)
185 1.4.2.2 pgoyette {
186 1.4.2.2 pgoyette uint64_t xc;
187 1.4.2.2 pgoyette
188 1.4.2.2 pgoyette xc = xc_broadcast(0, armv8_pmu_stop_cpu, NULL, NULL);
189 1.4.2.2 pgoyette xc_wait(xc);
190 1.4.2.2 pgoyette }
191 1.4.2.2 pgoyette
192 1.4.2.2 pgoyette static const tprof_backend_ops_t tprof_armv8_pmu_ops = {
193 1.4.2.2 pgoyette .tbo_estimate_freq = armv8_pmu_estimate_freq,
194 1.4.2.2 pgoyette .tbo_ident = armv8_pmu_ident,
195 1.4.2.2 pgoyette .tbo_start = armv8_pmu_start,
196 1.4.2.2 pgoyette .tbo_stop = armv8_pmu_stop,
197 1.4.2.2 pgoyette };
198 1.4.2.2 pgoyette
199 1.4.2.2 pgoyette int
200 1.4.2.2 pgoyette armv8_pmu_intr(void *priv)
201 1.4.2.2 pgoyette {
202 1.4.2.2 pgoyette const struct trapframe * const tf = priv;
203 1.4.2.2 pgoyette const uint32_t counter_mask = __BIT(armv8_pmu_counter);
204 1.4.2.2 pgoyette tprof_frame_info_t tfi;
205 1.4.2.2 pgoyette
206 1.4.2.2 pgoyette const uint32_t pmovs = reg_pmovsset_el0_read();
207 1.4.2.2 pgoyette if ((pmovs & counter_mask) != 0) {
208 1.4.2.2 pgoyette tfi.tfi_pc = tf->tf_pc;
209 1.4.2.2 pgoyette tfi.tfi_inkernel = tfi.tfi_pc >= VM_MIN_KERNEL_ADDRESS &&
210 1.4.2.2 pgoyette tfi.tfi_pc < VM_MAX_KERNEL_ADDRESS;
211 1.4.2.2 pgoyette tprof_sample(NULL, &tfi);
212 1.4.2.2 pgoyette
213 1.4.2.2 pgoyette armv8_pmu_set_pmevcntr(armv8_pmu_counter, counter_reset_val);
214 1.4.2.2 pgoyette }
215 1.4.2.2 pgoyette reg_pmovsclr_el0_write(pmovs);
216 1.4.2.2 pgoyette
217 1.4.2.2 pgoyette return 1;
218 1.4.2.2 pgoyette }
219 1.4.2.2 pgoyette
220 1.4.2.2 pgoyette int
221 1.4.2.2 pgoyette armv8_pmu_init(void)
222 1.4.2.2 pgoyette {
223 1.4.2.2 pgoyette /* Disable EL0 access to performance monitors */
224 1.4.2.2 pgoyette reg_pmuserenr_el0_write(0);
225 1.4.2.2 pgoyette
226 1.4.2.2 pgoyette /* Disable interrupts */
227 1.4.2.2 pgoyette reg_pmintenclr_el1_write(~0U);
228 1.4.2.2 pgoyette
229 1.4.2.2 pgoyette /* Disable counters */
230 1.4.2.2 pgoyette reg_pmcntenclr_el0_write(~0U);
231 1.4.2.2 pgoyette
232 1.4.2.2 pgoyette /* Disable performance monitor */
233 1.4.2.2 pgoyette reg_pmcr_el0_write(0);
234 1.4.2.2 pgoyette
235 1.4.2.2 pgoyette return tprof_backend_register("tprof_armv8", &tprof_armv8_pmu_ops,
236 1.4.2.2 pgoyette TPROF_BACKEND_VERSION);
237 1.4.2.2 pgoyette }
238