fpu.c revision 1.20 1 1.20 skrll /* $NetBSD: fpu.c,v 1.20 2010/03/16 16:20:19 skrll Exp $ */
2 1.1 fredette
3 1.1 fredette /*
4 1.1 fredette * Copyright (c) 2002 The NetBSD Foundation, Inc.
5 1.1 fredette * All rights reserved.
6 1.1 fredette *
7 1.1 fredette * This code is derived from software contributed to The NetBSD Foundation
8 1.1 fredette * by Matthew Fredette.
9 1.1 fredette *
10 1.1 fredette * Redistribution and use in source and binary forms, with or without
11 1.1 fredette * modification, are permitted provided that the following conditions
12 1.1 fredette * are met:
13 1.1 fredette * 1. Redistributions of source code must retain the above copyright
14 1.1 fredette * notice, this list of conditions and the following disclaimer.
15 1.1 fredette * 2. Redistributions in binary form must reproduce the above copyright
16 1.1 fredette * notice, this list of conditions and the following disclaimer in the
17 1.1 fredette * documentation and/or other materials provided with the distribution.
18 1.1 fredette *
19 1.1 fredette * THIS SOFTWARE IS PROVIDED BY THE NETBSD FOUNDATION, INC. AND CONTRIBUTORS
20 1.1 fredette * ``AS IS'' AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED
21 1.1 fredette * TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR
22 1.1 fredette * PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE FOUNDATION OR CONTRIBUTORS
23 1.1 fredette * BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
24 1.1 fredette * CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
25 1.1 fredette * SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS
26 1.1 fredette * INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN
27 1.1 fredette * CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE)
28 1.1 fredette * ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE
29 1.1 fredette * POSSIBILITY OF SUCH DAMAGE.
30 1.1 fredette */
31 1.1 fredette
32 1.1 fredette /*
33 1.1 fredette * FPU handling for NetBSD/hppa.
34 1.1 fredette */
35 1.1 fredette
36 1.1 fredette #include <sys/cdefs.h>
37 1.20 skrll __KERNEL_RCSID(0, "$NetBSD: fpu.c,v 1.20 2010/03/16 16:20:19 skrll Exp $");
38 1.1 fredette
39 1.16 skrll #include <sys/param.h>
40 1.1 fredette #include <sys/systm.h>
41 1.1 fredette #include <sys/proc.h>
42 1.1 fredette #include <sys/signalvar.h>
43 1.1 fredette
44 1.17 skrll #include <uvm/uvm_extern.h>
45 1.17 skrll
46 1.1 fredette #include <machine/cpufunc.h>
47 1.1 fredette #include <machine/frame.h>
48 1.1 fredette #include <machine/reg.h>
49 1.17 skrll #include <machine/pmap.h>
50 1.1 fredette
51 1.1 fredette #include <hppa/hppa/machdep.h>
52 1.1 fredette
53 1.1 fredette #include "../spmath/float.h"
54 1.1 fredette #include "../spmath/fpudispatch.h"
55 1.1 fredette
/*
 * Complete instruction words.  OPCODE_NOP is what gets patched over the
 * two locore.S instructions when a hardware FPU is found, and
 * OPCODE_COPR_0_0 is the instruction handed to the emulator to obtain
 * the FPU version.
 */
#define	OPCODE_NOP		0x08000240
#define	OPCODE_COPR_0_0		0x30000000

/*
 * Bit masks for fields in coprocessor load/store opcodes.  The two
 * single-bit completer masks are combined below into the values that
 * the load/store emulation switches on.
 *
 * NOTE(review): OPCODE_CMPLT_MB and OPCODE_CMPLT_MA may be swapped; the
 * architecture manual appears to encode "modify before" with both bits
 * set and "modify after" with only the M bit set.  Confirm before
 * relying on these two names.
 */
#define	OPCODE_CMPLT_S		0x00002000
#define	OPCODE_CMPLT_M		0x00000020
#define	OPCODE_CMPLT_SM		(OPCODE_CMPLT_S | OPCODE_CMPLT_M)
#define	OPCODE_CMPLT_MB		OPCODE_CMPLT_M
#define	OPCODE_CMPLT_MA		OPCODE_CMPLT_SM
#define	OPCODE_CMPLT		OPCODE_CMPLT_SM	/* mask of all completer bits */
#define	OPCODE_DOUBLE		0x08000000	/* doubleword access */
#define	OPCODE_STORE		0x00000200	/* store rather than load */
#define	OPCODE_INDEXED		0x00001000
70 1.1 fredette
71 1.1 fredette /* This is nonzero iff we're using a hardware FPU. */
72 1.1 fredette int fpu_present;
73 1.1 fredette
74 1.1 fredette /* If we have any FPU, this is its version. */
75 1.1 fredette u_int fpu_version;
76 1.1 fredette
77 1.1 fredette /* The number of times we have had to switch the FPU context. */
78 1.1 fredette u_int fpu_csw;
79 1.1 fredette
80 1.1 fredette /* The U-space physical address of the proc in the FPU, or zero. */
81 1.1 fredette paddr_t fpu_cur_uspace;
82 1.1 fredette
83 1.1 fredette /* In locore.S, this swaps states in and out of the FPU. */
84 1.20 skrll void hppa_fpu_swapout(struct pcb *);
85 1.20 skrll void hppa_fpu_swap(struct fpreg *, struct fpreg *);
86 1.1 fredette
87 1.1 fredette #ifdef FPEMUL
88 1.1 fredette /*
89 1.1 fredette * Given a trapframe and a general register number, the
90 1.1 fredette * FRAME_REG macro returns a pointer to that general
91 1.1 fredette * register. The _frame_reg_positions array is a lookup
92 1.1 fredette * table, since the general registers aren't in order
93 1.1 fredette * in a trapframe.
94 1.1 fredette *
95 1.1 fredette * NB: this more or less assumes that all members of
96 1.1 fredette * struct trapframe are u_ints.
97 1.1 fredette */
98 1.1 fredette #define FRAME_REG(f, reg, r0) \
99 1.1 fredette ((reg) == 0 ? (&r0) : ((&(f)->tf_t1) + _frame_reg_positions[reg]))
100 1.1 fredette #define _FRAME_POSITION(f) \
101 1.1 fredette ((&((struct trapframe *) 0)->f) - (&((struct trapframe *) 0)->tf_t1))
102 1.1 fredette const int _frame_reg_positions[32] = {
103 1.1 fredette -1, /* r0 */
104 1.1 fredette _FRAME_POSITION(tf_r1),
105 1.1 fredette _FRAME_POSITION(tf_rp), /* r2 */
106 1.1 fredette _FRAME_POSITION(tf_r3),
107 1.1 fredette _FRAME_POSITION(tf_r4),
108 1.1 fredette _FRAME_POSITION(tf_r5),
109 1.1 fredette _FRAME_POSITION(tf_r6),
110 1.1 fredette _FRAME_POSITION(tf_r7),
111 1.1 fredette _FRAME_POSITION(tf_r8),
112 1.1 fredette _FRAME_POSITION(tf_r9),
113 1.1 fredette _FRAME_POSITION(tf_r10),
114 1.1 fredette _FRAME_POSITION(tf_r11),
115 1.1 fredette _FRAME_POSITION(tf_r12),
116 1.1 fredette _FRAME_POSITION(tf_r13),
117 1.1 fredette _FRAME_POSITION(tf_r14),
118 1.1 fredette _FRAME_POSITION(tf_r15),
119 1.1 fredette _FRAME_POSITION(tf_r16),
120 1.1 fredette _FRAME_POSITION(tf_r17),
121 1.1 fredette _FRAME_POSITION(tf_r18),
122 1.1 fredette _FRAME_POSITION(tf_t4), /* r19 */
123 1.1 fredette _FRAME_POSITION(tf_t3), /* r20 */
124 1.1 fredette _FRAME_POSITION(tf_t2), /* r21 */
125 1.1 fredette _FRAME_POSITION(tf_t1), /* r22 */
126 1.1 fredette _FRAME_POSITION(tf_arg3), /* r23 */
127 1.1 fredette _FRAME_POSITION(tf_arg2), /* r24 */
128 1.1 fredette _FRAME_POSITION(tf_arg1), /* r25 */
129 1.1 fredette _FRAME_POSITION(tf_arg0), /* r26 */
130 1.1 fredette _FRAME_POSITION(tf_dp), /* r27 */
131 1.1 fredette _FRAME_POSITION(tf_ret0), /* r28 */
132 1.1 fredette _FRAME_POSITION(tf_ret1), /* r29 */
133 1.1 fredette _FRAME_POSITION(tf_sp), /* r30 */
134 1.1 fredette _FRAME_POSITION(tf_r31),
135 1.1 fredette };
136 1.1 fredette #endif /* FPEMUL */
137 1.1 fredette
138 1.1 fredette /*
139 1.1 fredette * Bootstraps the FPU.
140 1.1 fredette */
141 1.1 fredette void
142 1.1 fredette hppa_fpu_bootstrap(u_int ccr_enable)
143 1.1 fredette {
144 1.18 skrll uint32_t junk[2];
145 1.18 skrll uint32_t vers[2];
146 1.1 fredette extern u_int hppa_fpu_nop0;
147 1.1 fredette extern u_int hppa_fpu_nop1;
148 1.1 fredette
149 1.1 fredette /* See if we have a present and functioning hardware FPU. */
150 1.1 fredette fpu_present = (ccr_enable & HPPA_FPUS) == HPPA_FPUS;
151 1.1 fredette
152 1.1 fredette /* Initialize the FPU and get its version. */
153 1.1 fredette if (fpu_present) {
154 1.1 fredette
155 1.1 fredette /*
156 1.1 fredette * To somewhat optimize the emulation
157 1.1 fredette * assist trap handling and context
158 1.1 fredette * switching (to save them from having
159 1.1 fredette * to always load and check fpu_present),
160 1.1 fredette * there are two instructions in locore.S
161 1.1 fredette * that are replaced with nops when
162 1.1 fredette * there is a hardware FPU.
163 1.1 fredette */
164 1.1 fredette hppa_fpu_nop0 = OPCODE_NOP;
165 1.1 fredette hppa_fpu_nop1 = OPCODE_NOP;
166 1.1 fredette fcacheall();
167 1.1 fredette
168 1.1 fredette /*
169 1.1 fredette * We track what process has the FPU,
170 1.1 fredette * and how many times we have to swap
171 1.1 fredette * in and out.
172 1.1 fredette */
173 1.1 fredette
174 1.1 fredette /*
175 1.1 fredette * The PA-RISC 1.1 Architecture manual is
176 1.1 fredette * pretty clear that the copr,0,0 must be
177 1.1 fredette * wrapped in double word stores of fr0,
178 1.1 fredette * otherwise its operation is undefined.
179 1.1 fredette */
180 1.12 perry __asm volatile(
181 1.1 fredette " ldo %0, %%r22 \n"
182 1.1 fredette " fstds %%fr0, 0(%%r22) \n"
183 1.1 fredette " ldo %1, %%r22 \n"
184 1.1 fredette " copr,0,0 \n"
185 1.1 fredette " fstds %%fr0, 0(%%r22) \n"
186 1.10 chs : "=m" (junk), "=m" (vers) : : "r22");
187 1.1 fredette
188 1.1 fredette /*
189 1.1 fredette * Now mark that no process has the FPU,
190 1.1 fredette * and disable it, so the first time it
191 1.1 fredette * gets used the process' state gets
192 1.1 fredette * swapped in.
193 1.1 fredette */
194 1.1 fredette fpu_csw = 0;
195 1.1 fredette fpu_cur_uspace = 0;
196 1.1 fredette mtctl(ccr_enable & (CCR_MASK ^ HPPA_FPUS), CR_CCR);
197 1.1 fredette }
198 1.1 fredette #ifdef FPEMUL
199 1.1 fredette else
200 1.1 fredette /*
201 1.1 fredette * XXX This is a hack - to avoid
202 1.1 fredette * having to set up the emulator so
203 1.1 fredette * it can work for one instruction for
204 1.1 fredette * proc0, we dispatch the copr,0,0 opcode
205 1.1 fredette * into the emulator directly.
206 1.1 fredette */
207 1.10 chs decode_0c(OPCODE_COPR_0_0, 0, 0, vers);
208 1.1 fredette #endif /* FPEMUL */
209 1.10 chs fpu_version = vers[0];
210 1.1 fredette }
211 1.1 fredette
212 1.1 fredette /*
213 1.2 chs * If the given LWP has its state in the FPU,
214 1.2 chs * flush that state out into the LWP's PCB.
215 1.1 fredette */
216 1.1 fredette void
217 1.2 chs hppa_fpu_flush(struct lwp *l)
218 1.1 fredette {
219 1.2 chs struct trapframe *tf = l->l_md.md_regs;
220 1.19 rmind struct pcb *pcb = lwp_getpcb(l);
221 1.1 fredette
222 1.1 fredette /*
223 1.2 chs * If we have a hardware FPU, and this process'
224 1.2 chs * state is currently in it, swap it out.
225 1.2 chs */
226 1.2 chs
227 1.6 chs if (!fpu_present || fpu_cur_uspace == 0 ||
228 1.6 chs fpu_cur_uspace != tf->tf_cr30) {
229 1.6 chs return;
230 1.6 chs }
231 1.6 chs
232 1.20 skrll hppa_fpu_swapout(pcb);
233 1.6 chs fpu_cur_uspace = 0;
234 1.1 fredette }
235 1.1 fredette
236 1.1 fredette #ifdef FPEMUL
237 1.1 fredette
238 1.1 fredette /*
239 1.1 fredette * This emulates a coprocessor load/store instruction.
240 1.1 fredette */
241 1.4 chs static int hppa_fpu_ls(struct trapframe *, struct lwp *);
242 1.1 fredette static int
243 1.2 chs hppa_fpu_ls(struct trapframe *frame, struct lwp *l)
244 1.1 fredette {
245 1.19 rmind struct pcb *pcb = lwp_getpcb(l);
246 1.1 fredette u_int inst, inst_b, inst_x, inst_s, inst_t;
247 1.1 fredette int log2size;
248 1.1 fredette u_int *base;
249 1.1 fredette u_int offset, index, im5;
250 1.1 fredette void *fpreg;
251 1.1 fredette u_int r0 = 0;
252 1.6 chs int error;
253 1.6 chs
254 1.1 fredette /*
255 1.1 fredette * Get the instruction that we're emulating,
256 1.1 fredette * and break it down. Using HP bit notation,
257 1.1 fredette * b is a five-bit field starting at bit 10,
258 1.1 fredette * x is a five-bit field starting at bit 15,
259 1.1 fredette * s is a two-bit field starting at bit 17,
260 1.7 chs * and t is a five-bit field starting at bit 31.
261 1.1 fredette */
262 1.1 fredette inst = frame->tf_iir;
263 1.12 perry __asm volatile(
264 1.1 fredette " extru %4, 10, 5, %1 \n"
265 1.1 fredette " extru %4, 15, 5, %2 \n"
266 1.1 fredette " extru %4, 17, 2, %3 \n"
267 1.1 fredette " extru %4, 31, 5, %4 \n"
268 1.1 fredette : "=r" (inst_b), "=r" (inst_x), "=r" (inst_s), "=r" (inst_t)
269 1.1 fredette : "r" (inst));
270 1.1 fredette
271 1.1 fredette /*
272 1.1 fredette * The space must be the user's space, else we
273 1.1 fredette * segfault.
274 1.1 fredette */
275 1.19 rmind if (inst_s != pcb->pcb_space)
276 1.1 fredette return (EFAULT);
277 1.1 fredette
278 1.1 fredette /* See whether or not this is a doubleword load/store. */
279 1.1 fredette log2size = (inst & OPCODE_DOUBLE) ? 3 : 2;
280 1.1 fredette
281 1.1 fredette /* Get the floating point register. */
282 1.19 rmind fpreg = ((char *)pcb->pcb_fpregs) + (inst_t << log2size);
283 1.1 fredette
284 1.1 fredette /* Get the base register. */
285 1.1 fredette base = FRAME_REG(frame, inst_b, r0);
286 1.1 fredette
287 1.1 fredette /* Dispatch on whether or not this is an indexed load/store. */
288 1.1 fredette if (inst & OPCODE_INDEXED) {
289 1.1 fredette
290 1.1 fredette /* Get the index register value. */
291 1.1 fredette index = *FRAME_REG(frame, inst_x, r0);
292 1.1 fredette
293 1.1 fredette /* Dispatch on the completer. */
294 1.1 fredette switch (inst & OPCODE_CMPLT) {
295 1.1 fredette case OPCODE_CMPLT_S:
296 1.1 fredette offset = *base + (index << log2size);
297 1.1 fredette break;
298 1.1 fredette case OPCODE_CMPLT_M:
299 1.1 fredette offset = *base;
300 1.1 fredette *base = *base + index;
301 1.1 fredette break;
302 1.1 fredette case OPCODE_CMPLT_SM:
303 1.1 fredette offset = *base;
304 1.1 fredette *base = *base + (index << log2size);
305 1.1 fredette break;
306 1.1 fredette default:
307 1.1 fredette offset = *base + index;
308 1.1 fredette break;
309 1.1 fredette }
310 1.1 fredette } else {
311 1.1 fredette
312 1.1 fredette /* Do a low_sign_ext(x, 5). */
313 1.1 fredette im5 = inst_x >> 1;
314 1.1 fredette if (inst_x & 1)
315 1.1 fredette im5 |= 0xfffffff0;
316 1.1 fredette
317 1.1 fredette /* Dispatch on the completer. */
318 1.1 fredette switch (inst & OPCODE_CMPLT) {
319 1.1 fredette case OPCODE_CMPLT_MB:
320 1.1 fredette offset = *base + im5;
321 1.1 fredette *base = *base + im5;
322 1.1 fredette break;
323 1.1 fredette case OPCODE_CMPLT_MA:
324 1.1 fredette offset = *base;
325 1.1 fredette *base = *base + im5;
326 1.1 fredette break;
327 1.1 fredette default:
328 1.1 fredette offset = *base + im5;
329 1.1 fredette break;
330 1.1 fredette }
331 1.1 fredette }
332 1.1 fredette
333 1.1 fredette /*
334 1.1 fredette * The offset we calculated must be the same as the
335 1.1 fredette * offset in the IOR.
336 1.1 fredette */
337 1.1 fredette KASSERT(offset == frame->tf_ior);
338 1.1 fredette
339 1.1 fredette /* Perform the load or store. */
340 1.6 chs error = (inst & OPCODE_STORE) ?
341 1.1 fredette copyout(fpreg, (void *) offset, 1 << log2size) :
342 1.1 fredette copyin((const void *) offset, fpreg, 1 << log2size);
343 1.6 chs return error;
344 1.1 fredette }
345 1.1 fredette
346 1.1 fredette /*
347 1.1 fredette * This is called to emulate an instruction.
348 1.1 fredette */
349 1.1 fredette void
350 1.7 chs hppa_fpu_emulate(struct trapframe *frame, struct lwp *l, u_int inst)
351 1.1 fredette {
352 1.19 rmind struct pcb *pcb = lwp_getpcb(l);
353 1.7 chs u_int opcode, class, sub;
354 1.1 fredette u_int *fpregs;
355 1.1 fredette int exception;
356 1.8 chs ksiginfo_t ksi;
357 1.1 fredette
358 1.1 fredette /*
359 1.1 fredette * If the process' state is in any hardware FPU,
360 1.1 fredette * flush it out - we need to operate on it.
361 1.1 fredette */
362 1.2 chs hppa_fpu_flush(l);
363 1.1 fredette
364 1.1 fredette /*
365 1.1 fredette * Get the instruction that we're emulating,
366 1.1 fredette * and break it down. Using HP bit notation,
367 1.1 fredette * the class is a two-bit field starting at
368 1.1 fredette * bit 22, the opcode is a 6-bit field starting
369 1.1 fredette * at bit 5, and sub for a class 1 instruction
370 1.1 fredette * is a two bit field starting at bit 16, else
371 1.1 fredette * it is a three bit field starting at bit 18.
372 1.1 fredette */
373 1.7 chs #if 0
374 1.12 perry __asm volatile(
375 1.1 fredette " extru %3, 22, 2, %1 \n"
376 1.1 fredette " extru %3, 5, 6, %0 \n"
377 1.1 fredette " extru %3, 18, 3, %2 \n"
378 1.1 fredette " comib,<> 1, %1, 0 \n"
379 1.1 fredette " extru %3, 16, 2, %2 \n"
380 1.1 fredette : "=r" (opcode), "=r" (class), "=r" (sub)
381 1.1 fredette : "r" (inst));
382 1.7 chs #else
383 1.7 chs opcode = (inst >> (31 - 5)) & 0x3f;
384 1.7 chs class = (inst >> (31 - 22)) & 0x3;
385 1.7 chs if (class == 1) {
386 1.7 chs sub = (inst >> (31 - 16)) & 3;
387 1.7 chs } else {
388 1.7 chs sub = (inst >> (31 - 18)) & 7;
389 1.7 chs }
390 1.7 chs #endif
391 1.1 fredette
392 1.2 chs /* Get this LWP's FPU registers. */
393 1.19 rmind fpregs = (u_int *)pcb->pcb_fpregs;
394 1.1 fredette
395 1.1 fredette /* Dispatch on the opcode. */
396 1.1 fredette switch (opcode) {
397 1.1 fredette case 0x09:
398 1.1 fredette case 0x0b:
399 1.8 chs if (hppa_fpu_ls(frame, l) != 0) {
400 1.8 chs KSI_INIT_TRAP(&ksi);
401 1.8 chs ksi.ksi_signo = SIGSEGV;
402 1.8 chs ksi.ksi_code = SEGV_MAPERR;
403 1.8 chs ksi.ksi_trap = T_DTLBMISS;
404 1.8 chs ksi.ksi_addr = (void *)frame->tf_iioq_head;
405 1.8 chs trapsignal(l, &ksi);
406 1.8 chs }
407 1.1 fredette return;
408 1.1 fredette case 0x0c:
409 1.1 fredette exception = decode_0c(inst, class, sub, fpregs);
410 1.1 fredette break;
411 1.1 fredette case 0x0e:
412 1.1 fredette exception = decode_0e(inst, class, sub, fpregs);
413 1.1 fredette break;
414 1.1 fredette case 0x06:
415 1.1 fredette exception = decode_06(inst, fpregs);
416 1.1 fredette break;
417 1.1 fredette case 0x26:
418 1.1 fredette exception = decode_26(inst, fpregs);
419 1.1 fredette break;
420 1.1 fredette default:
421 1.1 fredette exception = UNIMPLEMENTEDEXCEPTION;
422 1.1 fredette break;
423 1.1 fredette }
424 1.1 fredette
425 1.8 chs if (exception) {
426 1.8 chs KSI_INIT_TRAP(&ksi);
427 1.8 chs if (exception & UNIMPLEMENTEDEXCEPTION) {
428 1.8 chs ksi.ksi_signo = SIGILL;
429 1.8 chs ksi.ksi_code = ILL_COPROC;
430 1.8 chs } else {
431 1.8 chs ksi.ksi_signo = SIGFPE;
432 1.8 chs if (exception & INVALIDEXCEPTION) {
433 1.8 chs ksi.ksi_code = FPE_FLTINV;
434 1.8 chs } else if (exception & DIVISIONBYZEROEXCEPTION) {
435 1.8 chs ksi.ksi_code = FPE_FLTDIV;
436 1.8 chs } else if (exception & OVERFLOWEXCEPTION) {
437 1.8 chs ksi.ksi_code = FPE_FLTOVF;
438 1.8 chs } else if (exception & UNDERFLOWEXCEPTION) {
439 1.8 chs ksi.ksi_code = FPE_FLTUND;
440 1.8 chs } else if (exception & INEXACTEXCEPTION) {
441 1.8 chs ksi.ksi_code = FPE_FLTRES;
442 1.8 chs }
443 1.8 chs }
444 1.8 chs ksi.ksi_trap = T_EMULATION;
445 1.8 chs ksi.ksi_addr = (void *)frame->tf_iioq_head;
446 1.8 chs trapsignal(l, &ksi);
447 1.8 chs }
448 1.1 fredette }
449 1.1 fredette
450 1.1 fredette #endif /* FPEMUL */
451