Home | History | Annotate | Line # | Download | only in fpu
fpu_emu.c revision 1.35
      1 /*	$NetBSD: fpu_emu.c,v 1.35 2022/07/26 16:08:33 rin Exp $ */
      2 
      3 /*
      4  * Copyright 2001 Wasabi Systems, Inc.
      5  * All rights reserved.
      6  *
      7  * Written by Eduardo Horvath and Simon Burge for Wasabi Systems, Inc.
      8  *
      9  * Redistribution and use in source and binary forms, with or without
     10  * modification, are permitted provided that the following conditions
     11  * are met:
     12  * 1. Redistributions of source code must retain the above copyright
     13  *    notice, this list of conditions and the following disclaimer.
     14  * 2. Redistributions in binary form must reproduce the above copyright
     15  *    notice, this list of conditions and the following disclaimer in the
     16  *    documentation and/or other materials provided with the distribution.
     17  * 3. All advertising materials mentioning features or use of this software
     18  *    must display the following acknowledgement:
     19  *      This product includes software developed for the NetBSD Project by
     20  *      Wasabi Systems, Inc.
     21  * 4. The name of Wasabi Systems, Inc. may not be used to endorse
     22  *    or promote products derived from this software without specific prior
     23  *    written permission.
     24  *
     25  * THIS SOFTWARE IS PROVIDED BY WASABI SYSTEMS, INC. ``AS IS'' AND
     26  * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED
     27  * TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR
     28  * PURPOSE ARE DISCLAIMED.  IN NO EVENT SHALL WASABI SYSTEMS, INC
     29  * BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
     30  * CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
     31  * SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS
     32  * INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN
     33  * CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE)
     34  * ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE
     35  * POSSIBILITY OF SUCH DAMAGE.
     36  */
     37 
     38 /*
     39  * Copyright (c) 1992, 1993
     40  *	The Regents of the University of California.  All rights reserved.
     41  *
     42  * This software was developed by the Computer Systems Engineering group
     43  * at Lawrence Berkeley Laboratory under DARPA contract BG 91-66 and
     44  * contributed to Berkeley.
     45  *
     46  * All advertising materials mentioning features or use of this software
     47  * must display the following acknowledgement:
     48  *	This product includes software developed by the University of
     49  *	California, Lawrence Berkeley Laboratory.
     50  *
     51  * Redistribution and use in source and binary forms, with or without
     52  * modification, are permitted provided that the following conditions
     53  * are met:
     54  * 1. Redistributions of source code must retain the above copyright
     55  *    notice, this list of conditions and the following disclaimer.
     56  * 2. Redistributions in binary form must reproduce the above copyright
     57  *    notice, this list of conditions and the following disclaimer in the
     58  *    documentation and/or other materials provided with the distribution.
     59  * 3. Neither the name of the University nor the names of its contributors
     60  *    may be used to endorse or promote products derived from this software
     61  *    without specific prior written permission.
     62  *
     63  * THIS SOFTWARE IS PROVIDED BY THE REGENTS AND CONTRIBUTORS ``AS IS'' AND
     64  * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
     65  * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
     66  * ARE DISCLAIMED.  IN NO EVENT SHALL THE REGENTS OR CONTRIBUTORS BE LIABLE
     67  * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
     68  * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
     69  * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
     70  * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
     71  * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
     72  * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
     73  * SUCH DAMAGE.
     74  *
     75  *	@(#)fpu.c	8.1 (Berkeley) 6/11/93
     76  */
     77 
     78 #include <sys/cdefs.h>
     79 __KERNEL_RCSID(0, "$NetBSD: fpu_emu.c,v 1.35 2022/07/26 16:08:33 rin Exp $");
     80 
     81 #ifdef _KERNEL_OPT
     82 #include "opt_ddb.h"
     83 #endif
     84 
     85 #include <sys/param.h>
     86 #include <sys/systm.h>
     87 #include <sys/evcnt.h>
     88 #include <sys/proc.h>
     89 #include <sys/siginfo.h>
     90 #include <sys/signal.h>
     91 #include <sys/signalvar.h>
     92 #include <sys/syslog.h>
     93 
     94 #include <powerpc/instr.h>
     95 #include <powerpc/psl.h>
     96 
     97 #include <machine/fpu.h>
     98 #include <machine/reg.h>
     99 #include <machine/trap.h>
    100 
    101 #include <powerpc/fpu/fpu_emu.h>
    102 #include <powerpc/fpu/fpu_extern.h>
    103 
    104 #define	FPU_EMU_EVCNT_DECL(name)					\
    105 static struct evcnt fpu_emu_ev_##name =					\
    106     EVCNT_INITIALIZER(EVCNT_TYPE_TRAP, NULL, "fpemu", #name);		\
    107 EVCNT_ATTACH_STATIC(fpu_emu_ev_##name)
    108 
    109 #define	FPU_EMU_EVCNT_INCR(name)					\
    110     fpu_emu_ev_##name.ev_count++
    111 
    112 FPU_EMU_EVCNT_DECL(stfiwx);
    113 FPU_EMU_EVCNT_DECL(fpstore);
    114 FPU_EMU_EVCNT_DECL(fpload);
    115 FPU_EMU_EVCNT_DECL(fcmpu);
    116 FPU_EMU_EVCNT_DECL(frsp);
    117 FPU_EMU_EVCNT_DECL(fctiw);
    118 FPU_EMU_EVCNT_DECL(fcmpo);
    119 FPU_EMU_EVCNT_DECL(mtfsb1);
    120 FPU_EMU_EVCNT_DECL(fnegabs);
    121 FPU_EMU_EVCNT_DECL(mcrfs);
    122 FPU_EMU_EVCNT_DECL(mtfsb0);
    123 FPU_EMU_EVCNT_DECL(fmr);
    124 FPU_EMU_EVCNT_DECL(mtfsfi);
    125 FPU_EMU_EVCNT_DECL(fnabs);
    126 FPU_EMU_EVCNT_DECL(fabs);
    127 FPU_EMU_EVCNT_DECL(mffs);
    128 FPU_EMU_EVCNT_DECL(mtfsf);
    129 FPU_EMU_EVCNT_DECL(fctid);
    130 FPU_EMU_EVCNT_DECL(fcfid);
    131 FPU_EMU_EVCNT_DECL(fdiv);
    132 FPU_EMU_EVCNT_DECL(fsub);
    133 FPU_EMU_EVCNT_DECL(fadd);
    134 FPU_EMU_EVCNT_DECL(fsqrt);
    135 FPU_EMU_EVCNT_DECL(fsel);
    136 FPU_EMU_EVCNT_DECL(fpres);
    137 FPU_EMU_EVCNT_DECL(fmul);
    138 FPU_EMU_EVCNT_DECL(frsqrte);
    139 FPU_EMU_EVCNT_DECL(fmulsub);
    140 FPU_EMU_EVCNT_DECL(fmuladd);
    141 FPU_EMU_EVCNT_DECL(fnmsub);
    142 FPU_EMU_EVCNT_DECL(fnmadd);
    143 
    144 /* FPSR exception masks */
    145 #define FPSR_EX_MSK	(FPSCR_VX|FPSCR_OX|FPSCR_UX|FPSCR_ZX|		\
    146 			FPSCR_XX|FPSCR_VXSNAN|FPSCR_VXISI|FPSCR_VXIDI|	\
    147 			FPSCR_VXZDZ|FPSCR_VXIMZ|FPSCR_VXVC|FPSCR_VXSOFT|\
    148 			FPSCR_VXSQRT|FPSCR_VXCVI)
    149 #define	FPSR_EX		(FPSCR_VE|FPSCR_OE|FPSCR_UE|FPSCR_ZE|FPSCR_XE)
    150 #define	FPSR_INV	(FPSCR_VXSNAN|FPSCR_VXISI|FPSCR_VXIDI|		\
    151 			FPSCR_VXZDZ|FPSCR_VXIMZ|FPSCR_VXVC|FPSCR_VXSOFT|\
    152 			FPSCR_VXSQRT|FPSCR_VXCVI)
    153 
    154 
    155 int fpe_debug = 0;
    156 
    157 #ifdef DDB
    158 extern vaddr_t opc_disasm(vaddr_t loc, int opcode);
    159 #endif
    160 
    161 #ifdef DEBUG
    162 /*
    163  * Dump a `fpn' structure.
    164  */
    165 void
    166 fpu_dumpfpn(struct fpn *fp)
    167 {
    168 	static const char *class[] = {
    169 		"SNAN", "QNAN", "ZERO", "NUM", "INF"
    170 	};
    171 
    172 	KASSERT(fp != NULL);
    173 
    174 	printf("%s %c.%x %x %x %xE%d\n", class[fp->fp_class + 2],
    175 		fp->fp_sign ? '-' : ' ',
    176 		fp->fp_mant[0],	fp->fp_mant[1],
    177 		fp->fp_mant[2], fp->fp_mant[3],
    178 		fp->fp_exp);
    179 }
    180 #endif
    181 
    182 /*
    183  * fpu_execute returns the following error numbers (0 = no error):
    184  */
    185 #define	FPE		1	/* take a floating point exception */
    186 #define	NOTFPU		2	/* not an FPU instruction */
    187 #define	FAULT		3
    188 
    189 
    190 /*
    191  * Emulate a floating-point instruction.
    192  * Return zero for success, else signal number.
    193  * (Typically: zero, SIGFPE, SIGILL, SIGSEGV)
    194  */
    195 bool
    196 fpu_emulate(struct trapframe *tf, struct fpreg *fpf, ksiginfo_t *ksi)
    197 {
    198 	struct pcb *pcb;
    199 	union instr insn;
    200 	struct fpemu fe;
    201 
    202 	KSI_INIT_TRAP(ksi);
    203 	ksi->ksi_signo = 0;
    204 	ksi->ksi_addr = (void *)tf->tf_srr0;
    205 
    206 	/* initialize insn.is_datasize to tell it is *not* initialized */
    207 	fe.fe_fpstate = fpf;
    208 	fe.fe_cx = 0;
    209 
    210 	/* always set this (to avoid a warning) */
    211 
    212 	if (copyin((void *) (tf->tf_srr0), &insn.i_int, sizeof (insn.i_int))) {
    213 #ifdef DEBUG
    214 		printf("fpu_emulate: fault reading opcode\n");
    215 #endif
    216 		ksi->ksi_signo = SIGSEGV;
    217 		ksi->ksi_trap = EXC_ISI;
    218 		ksi->ksi_code = SEGV_MAPERR;
    219 		return true;
    220 	}
    221 
    222 	DPRINTF(FPE_EX, ("fpu_emulate: emulating insn %x at %p\n",
    223 	    insn.i_int, (void *)tf->tf_srr0));
    224 
    225 	if ((insn.i_any.i_opcd == OPC_TWI) ||
    226 	    ((insn.i_any.i_opcd == OPC_integer_31) &&
    227 	    (insn.i_x.i_xo == OPC31_TW))) {
    228 		/* Check for the two trap insns. */
    229 		DPRINTF(FPE_EX, ("fpu_emulate: SIGTRAP\n"));
    230 		ksi->ksi_signo = SIGTRAP;
    231 		ksi->ksi_trap = EXC_PGM;
    232 		ksi->ksi_code = TRAP_BRKPT;
    233 		return true;
    234 	}
    235 	switch (fpu_execute(tf, &fe, &insn)) {
    236 	case 0:
    237 success:
    238 		DPRINTF(FPE_EX, ("fpu_emulate: success\n"));
    239 		tf->tf_srr0 += 4;
    240 		return true;
    241 
    242 	case FPE:
    243 		pcb = lwp_getpcb(curlwp);
    244 		if ((pcb->pcb_flags & PSL_FE_PREC) == 0)
    245 			goto success;
    246 		DPRINTF(FPE_EX, ("fpu_emulate: SIGFPE\n"));
    247 		ksi->ksi_signo = SIGFPE;
    248 		ksi->ksi_trap = EXC_PGM;
    249 		ksi->ksi_code = fpu_get_fault_code();
    250 		return true;
    251 
    252 	case FAULT:
    253 		DPRINTF(FPE_EX, ("fpu_emulate: SIGSEGV\n"));
    254 		ksi->ksi_signo = SIGSEGV;
    255 		ksi->ksi_trap = EXC_DSI;
    256 		ksi->ksi_code = SEGV_MAPERR;
    257 		ksi->ksi_addr = (void *)fe.fe_addr;
    258 		return true;
    259 
    260 	case NOTFPU:
    261 	default:
    262 		DPRINTF(FPE_EX, ("fpu_emulate: SIGILL\n"));
    263 #if defined(DDB) && defined(DEBUG)
    264 		if (fpe_debug & FPE_EX) {
    265 			printf("fpu_emulate:  illegal insn %x at %p:",
    266 			insn.i_int, (void *) (tf->tf_srr0));
    267 			opc_disasm((vaddr_t)(tf->tf_srr0), insn.i_int);
    268 		}
    269 #endif
    270 		return false;
    271 	}
    272 }
    273 
    274 /*
    275  * Execute an FPU instruction (one that runs entirely in the FPU; not
    276  * FBfcc or STF, for instance).  On return, fe->fe_fs->fs_fsr will be
    277  * modified to reflect the setting the hardware would have left.
    278  *
    279  * Note that we do not catch all illegal opcodes, so you can, for instance,
    280  * multiply two integers this way.
    281  */
    282 int
    283 fpu_execute(struct trapframe *tf, struct fpemu *fe, union instr *insn)
    284 {
    285 	struct fpn *fp;
    286 	union instr instr = *insn;
    287 	int *a;
    288 	vaddr_t addr;
    289 	int ra, rb, rc, rt, type, mask, fsr, cx, bf, setcr;
    290 	unsigned int cond;
    291 	struct fpreg *fs;
    292 	int mtfsf = 0;
    293 
    294 	/* Setup work. */
    295 	fp = NULL;
    296 	fs = fe->fe_fpstate;
    297 	fe->fe_fpscr = ((int *)&fs->fpscr)[1];
    298 
    299 	/*
    300 	 * On PowerPC all floating point values are stored in registers
    301 	 * as doubles, even when used for single precision operations.
    302 	 */
    303 	type = FTYPE_DBL;
    304 	cond = instr.i_any.i_rc;
    305 	setcr = 0;
    306 	bf = 0;	/* XXX gcc */
    307 
    308 #if defined(DDB) && defined(DEBUG)
    309 	if (fpe_debug & FPE_EX) {
    310 		vaddr_t loc = tf->tf_srr0;
    311 
    312 		printf("Trying to emulate: %p ", (void *)loc);
    313 		opc_disasm(loc, instr.i_int);
    314 	}
    315 #endif
    316 
    317 	/*
    318 	 * `Decode' and execute instruction.
    319 	 */
    320 
    321 	if ((instr.i_any.i_opcd >= OPC_LFS && instr.i_any.i_opcd <= OPC_STFDU) ||
    322 	    instr.i_any.i_opcd == OPC_integer_31) {
    323 		/*
    324 		 * Handle load/store insns:
    325 		 *
    326 		 * Convert to/from single if needed, calculate addr,
    327 		 * and update index reg if needed.
    328 		 */
    329 		uint64_t buf;
    330 		size_t size = sizeof(float);
    331 		int store, update;
    332 
    333 		cond = 0; /* ld/st never set condition codes */
    334 
    335 
    336 		if (instr.i_any.i_opcd == OPC_integer_31) {
    337 			if (instr.i_x.i_xo == OPC31_STFIWX) {
    338 				FPU_EMU_EVCNT_INCR(stfiwx);
    339 
    340 				/* Store as integer */
    341 				ra = instr.i_x.i_ra;
    342 				rb = instr.i_x.i_rb;
    343 				DPRINTF(FPE_INSN, ("reg %d has %lx reg %d has %lx\n",
    344 					ra, tf->tf_fixreg[ra], rb, tf->tf_fixreg[rb]));
    345 
    346 				addr = tf->tf_fixreg[rb];
    347 				if (ra != 0)
    348 					addr += tf->tf_fixreg[ra];
    349 				rt = instr.i_x.i_rt;
    350 				a = (int *)&fs->fpreg[rt];
    351 				DPRINTF(FPE_INSN,
    352 					("fpu_execute: Store INT %x at %p\n",
    353 						a[1], (void *)addr));
    354 				if (copyout(&a[1], (void *)addr, sizeof(int))) {
    355 					fe->fe_addr = addr;
    356 					return (FAULT);
    357 				}
    358 				return (0);
    359 			}
    360 
    361 			if ((instr.i_x.i_xo & OPC31_FPMASK) != OPC31_FPOP)
    362 				/* Not an indexed FP load/store op */
    363 				return (NOTFPU);
    364 
    365 			store = (instr.i_x.i_xo & 0x80);
    366 			if (instr.i_x.i_xo & 0x40)
    367 				size = sizeof(double);
    368 			else
    369 				type = FTYPE_SNG;
    370 			update = (instr.i_x.i_xo & 0x20);
    371 
    372 			/* calculate EA of load/store */
    373 			ra = instr.i_x.i_ra;
    374 			rb = instr.i_x.i_rb;
    375 			DPRINTF(FPE_INSN, ("reg %d has %lx reg %d has %lx\n",
    376 				ra, tf->tf_fixreg[ra], rb, tf->tf_fixreg[rb]));
    377 			addr = tf->tf_fixreg[rb];
    378 			if (ra != 0)
    379 				addr += tf->tf_fixreg[ra];
    380 			rt = instr.i_x.i_rt;
    381 		} else {
    382 			store = instr.i_d.i_opcd & 0x4;
    383 			if (instr.i_d.i_opcd & 0x2)
    384 				size = sizeof(double);
    385 			else
    386 				type = FTYPE_SNG;
    387 			update = instr.i_d.i_opcd & 0x1;
    388 
    389 			/* calculate EA of load/store */
    390 			ra = instr.i_d.i_ra;
    391 			addr = instr.i_d.i_d;
    392 			DPRINTF(FPE_INSN, ("reg %d has %lx displ %lx\n",
    393 				ra, tf->tf_fixreg[ra], addr));
    394 			if (ra != 0)
    395 				addr += tf->tf_fixreg[ra];
    396 			rt = instr.i_d.i_rt;
    397 		}
    398 
    399 		if (update && ra == 0)
    400 			return (NOTFPU);
    401 
    402 		if (store) {
    403 			/* Store */
    404 			FPU_EMU_EVCNT_INCR(fpstore);
    405 			if (type != FTYPE_DBL) {
    406 				DPRINTF(FPE_INSN,
    407 					("fpu_execute: Store SNG at %p\n",
    408 						(void *)addr));
    409 				fpu_explode(fe, fp = &fe->fe_f1, FTYPE_DBL, rt);
    410 				fpu_implode(fe, fp, type, (void *)&buf);
    411 				if (copyout(&buf, (void *)addr, size)) {
    412 					fe->fe_addr = addr;
    413 					return (FAULT);
    414 				}
    415 			} else {
    416 				DPRINTF(FPE_INSN,
    417 					("fpu_execute: Store DBL at %p\n",
    418 						(void *)addr));
    419 				if (copyout(&fs->fpreg[rt], (void *)addr, size)) {
    420 					fe->fe_addr = addr;
    421 					return (FAULT);
    422 				}
    423 			}
    424 		} else {
    425 			/* Load */
    426 			FPU_EMU_EVCNT_INCR(fpload);
    427 			DPRINTF(FPE_INSN, ("fpu_execute: Load from %p\n",
    428 				(void *)addr));
    429 			if (copyin((const void *)addr, &fs->fpreg[rt], size)) {
    430 				fe->fe_addr = addr;
    431 				return (FAULT);
    432 			}
    433 			if (type != FTYPE_DBL) {
    434 				fpu_explode(fe, fp = &fe->fe_f1, type, rt);
    435 				fpu_implode(fe, fp, FTYPE_DBL,
    436 					(u_int *)&fs->fpreg[rt]);
    437 			}
    438 		}
    439 		if (update)
    440 			tf->tf_fixreg[ra] = addr;
    441 		/* Complete. */
    442 		return (0);
    443 #ifdef notyet
    444 	} else if (instr.i_any.i_opcd == OPC_load_st_62) {
    445 		/* These are 64-bit extenstions */
    446 		return (NOTFPU);
    447 #endif
    448 	} else if (instr.i_any.i_opcd == OPC_sp_fp_59 ||
    449 		instr.i_any.i_opcd == OPC_dp_fp_63) {
    450 
    451 
    452 		if (instr.i_any.i_opcd == OPC_dp_fp_63 &&
    453 		    !(instr.i_a.i_xo & OPC63M_MASK)) {
    454 			/* Format X */
    455 			rt = instr.i_x.i_rt;
    456 			ra = instr.i_x.i_ra;
    457 			rb = instr.i_x.i_rb;
    458 
    459 
    460 			/* One of the special opcodes.... */
    461 			switch (instr.i_x.i_xo) {
    462 			case	OPC63_FCMPU:
    463 				FPU_EMU_EVCNT_INCR(fcmpu);
    464 				DPRINTF(FPE_INSN, ("fpu_execute: FCMPU\n"));
    465 				rt >>= 2;
    466 				fpu_explode(fe, &fe->fe_f1, type, ra);
    467 				fpu_explode(fe, &fe->fe_f2, type, rb);
    468 				fpu_compare(fe, 0);
    469 				/* Make sure we do the condition regs. */
    470 				cond = 0;
    471 				/* N.B.: i_rs is already left shifted by two. */
    472 				bf = instr.i_x.i_rs & 0xfc;
    473 				setcr = 1;
    474 				break;
    475 
    476 			case	OPC63_FRSP:
    477 				/*
    478 				 * Convert to single:
    479 				 *
    480 				 * PowerPC uses this to round a double
    481 				 * precision value to single precision,
    482 				 * but values in registers are always
    483 				 * stored in double precision format.
    484 				 */
    485 				FPU_EMU_EVCNT_INCR(frsp);
    486 				DPRINTF(FPE_INSN, ("fpu_execute: FRSP\n"));
    487 				fpu_explode(fe, fp = &fe->fe_f1, FTYPE_DBL, rb);
    488 				fpu_implode(fe, fp, FTYPE_SNG,
    489 					(u_int *)&fs->fpreg[rt]);
    490 				fpu_explode(fe, fp = &fe->fe_f1, FTYPE_SNG, rt);
    491 				type = FTYPE_DBL;
    492 				break;
    493 			case	OPC63_FCTIW:
    494 			case	OPC63_FCTIWZ:
    495 				FPU_EMU_EVCNT_INCR(fctiw);
    496 				DPRINTF(FPE_INSN, ("fpu_execute: FCTIW\n"));
    497 				fpu_explode(fe, fp = &fe->fe_f1, type, rb);
    498 				type = FTYPE_INT;
    499 				break;
    500 			case	OPC63_FCMPO:
    501 				FPU_EMU_EVCNT_INCR(fcmpo);
    502 				DPRINTF(FPE_INSN, ("fpu_execute: FCMPO\n"));
    503 				rt >>= 2;
    504 				fpu_explode(fe, &fe->fe_f1, type, ra);
    505 				fpu_explode(fe, &fe->fe_f2, type, rb);
    506 				fpu_compare(fe, 1);
    507 				/* Make sure we do the condition regs. */
    508 				cond = 0;
    509 				/* N.B.: i_rs is already left shifted by two. */
    510 				bf = instr.i_x.i_rs & 0xfc;
    511 				setcr = 1;
    512 				break;
    513 			case	OPC63_MTFSB1:
    514 				FPU_EMU_EVCNT_INCR(mtfsb1);
    515 				DPRINTF(FPE_INSN, ("fpu_execute: MTFSB1\n"));
    516 				fe->fe_fpscr |=
    517 					(~(FPSCR_VX|FPSR_EX) & (1<<(31-rt)));
    518 				break;
    519 			case	OPC63_FNEG:
    520 				FPU_EMU_EVCNT_INCR(fnegabs);
    521 				DPRINTF(FPE_INSN, ("fpu_execute: FNEGABS\n"));
    522 				memcpy(&fs->fpreg[rt], &fs->fpreg[rb],
    523 					sizeof(double));
    524 				a = (int *)&fs->fpreg[rt];
    525 				*a ^= (1 << 31);
    526 				break;
    527 			case	OPC63_MCRFS:
    528 				FPU_EMU_EVCNT_INCR(mcrfs);
    529 				DPRINTF(FPE_INSN, ("fpu_execute: MCRFS\n"));
    530 				cond = 0;
    531 				rt &= 0x1c;
    532 				ra &= 0x1c;
    533 				/* Extract the bits we want */
    534 				mask = (fe->fe_fpscr >> (28 - ra)) & 0xf;
    535 				/* Clear the bits we copied. */
    536 				fe->fe_cx =
    537 					(FPSR_EX_MSK | (0xf << (28 - ra)));
    538 				fe->fe_fpscr &= fe->fe_cx;
    539 				/* Now shove them in the right part of cr */
    540 				tf->tf_cr &= ~(0xf << (28 - rt));
    541 				tf->tf_cr |= (mask << (28 - rt));
    542 				break;
    543 			case	OPC63_MTFSB0:
    544 				FPU_EMU_EVCNT_INCR(mtfsb0);
    545 				DPRINTF(FPE_INSN, ("fpu_execute: MTFSB0\n"));
    546 				fe->fe_fpscr &=
    547 					((FPSCR_VX|FPSR_EX) & ~(1<<(31-rt)));
    548 				break;
    549 			case	OPC63_FMR:
    550 				FPU_EMU_EVCNT_INCR(fmr);
    551 				DPRINTF(FPE_INSN, ("fpu_execute: FMR\n"));
    552 				memcpy(&fs->fpreg[rt], &fs->fpreg[rb],
    553 					sizeof(double));
    554 				break;
    555 			case	OPC63_MTFSFI:
    556 				mtfsf = 1;
    557 				FPU_EMU_EVCNT_INCR(mtfsfi);
    558 				DPRINTF(FPE_INSN, ("fpu_execute: MTFSFI\n"));
    559 				rb >>= 1;
    560 				rt &= 0x1c; /* Already left-shifted 4 */
    561 				fe->fe_cx = rb << (28 - rt);
    562 				mask = 0xf<<(28 - rt);
    563 				fe->fe_fpscr = (fe->fe_fpscr & ~mask) |
    564 					fe->fe_cx;
    565 /* XXX weird stuff about OX, FX, FEX, and VX should be handled */
    566 				break;
    567 			case	OPC63_FNABS:
    568 				FPU_EMU_EVCNT_INCR(fnabs);
    569 				DPRINTF(FPE_INSN, ("fpu_execute: FABS\n"));
    570 				memcpy(&fs->fpreg[rt], &fs->fpreg[rb],
    571 					sizeof(double));
    572 				a = (int *)&fs->fpreg[rt];
    573 				*a |= (1 << 31);
    574 				break;
    575 			case	OPC63_FABS:
    576 				FPU_EMU_EVCNT_INCR(fabs);
    577 				DPRINTF(FPE_INSN, ("fpu_execute: FABS\n"));
    578 				memcpy(&fs->fpreg[rt], &fs->fpreg[rb],
    579 					sizeof(double));
    580 				a = (int *)&fs->fpreg[rt];
    581 				*a &= ~(1 << 31);
    582 				break;
    583 			case	OPC63_MFFS:
    584 				FPU_EMU_EVCNT_INCR(mffs);
    585 				DPRINTF(FPE_INSN, ("fpu_execute: MFFS\n"));
    586 				/* XXX FEX is not sticky */
    587 				fs->fpscr &= ~FPSCR_FEX;
    588 				memcpy(&fs->fpreg[rt], &fs->fpscr,
    589 					sizeof(fs->fpscr));
    590 				break;
    591 			case	OPC63_MTFSF:
    592 				mtfsf = 1;
    593 				FPU_EMU_EVCNT_INCR(mtfsf);
    594 				DPRINTF(FPE_INSN, ("fpu_execute: MTFSF\n"));
    595 				if ((rt = instr.i_xfl.i_flm) == -1)
    596 					mask = -1;
    597 				else {
    598 					mask = 0;
    599 					/* Convert 1 bit -> 4 bits */
    600 					for (ra = 0; ra < 8; ra ++)
    601 						if (rt & (1<<ra))
    602 							mask |= (0xf<<(4*ra));
    603 				}
    604 				a = (int *)&fs->fpreg[rb];
    605 				fe->fe_cx = mask & a[1];
    606 				fe->fe_fpscr = (fe->fe_fpscr&~mask) |
    607 					(fe->fe_cx);
    608 				/*
    609 				 * XXX
    610 				 * Forbidden to set FEX and VX, also for
    611 				 * mcrfs, mtfsfi, and mtfsb[01].
    612 				 *
    613 				 * XXX
    614 				 * Handle invalid operation differently,
    615 				 * depending on VE.
    616 				 */
    617 /* XXX weird stuff about OX, FX, FEX, and VX should be handled */
    618 				break;
    619 			case	OPC63_FCTID:
    620 			case	OPC63_FCTIDZ:
    621 				FPU_EMU_EVCNT_INCR(fctid);
    622 				DPRINTF(FPE_INSN, ("fpu_execute: FCTID\n"));
    623 				fpu_explode(fe, fp = &fe->fe_f1, type, rb);
    624 				type = FTYPE_LNG;
    625 				break;
    626 			case	OPC63_FCFID:
    627 				FPU_EMU_EVCNT_INCR(fcfid);
    628 				DPRINTF(FPE_INSN, ("fpu_execute: FCFID\n"));
    629 				type = FTYPE_LNG;
    630 				fpu_explode(fe, fp = &fe->fe_f1, type, rb);
    631 				type = FTYPE_DBL;
    632 				break;
    633 			default:
    634 				return (NOTFPU);
    635 				break;
    636 			}
    637 		} else {
    638 			/* Format A */
    639 			rt = instr.i_a.i_frt;
    640 			ra = instr.i_a.i_fra;
    641 			rb = instr.i_a.i_frb;
    642 			rc = instr.i_a.i_frc;
    643 
    644 			/*
    645 			 * All arithmetic operations work on registers, which
    646 			 * are stored as doubles.
    647 			 */
    648 			type = FTYPE_DBL;
    649 			switch ((unsigned int)instr.i_a.i_xo) {
    650 			case	OPC59_FDIVS:
    651 				FPU_EMU_EVCNT_INCR(fdiv);
    652 				DPRINTF(FPE_INSN, ("fpu_execute: FDIV\n"));
    653 				fpu_explode(fe, &fe->fe_f1, type, ra);
    654 				fpu_explode(fe, &fe->fe_f2, type, rb);
    655 				fp = fpu_div(fe);
    656 				break;
    657 			case	OPC59_FSUBS:
    658 				FPU_EMU_EVCNT_INCR(fsub);
    659 				DPRINTF(FPE_INSN, ("fpu_execute: FSUB\n"));
    660 				fpu_explode(fe, &fe->fe_f1, type, ra);
    661 				fpu_explode(fe, &fe->fe_f2, type, rb);
    662 				fp = fpu_sub(fe);
    663 				break;
    664 			case	OPC59_FADDS:
    665 				FPU_EMU_EVCNT_INCR(fadd);
    666 				DPRINTF(FPE_INSN, ("fpu_execute: FADD\n"));
    667 				fpu_explode(fe, &fe->fe_f1, type, ra);
    668 				fpu_explode(fe, &fe->fe_f2, type, rb);
    669 				fp = fpu_add(fe);
    670 				break;
    671 			case	OPC59_FSQRTS:
    672 				FPU_EMU_EVCNT_INCR(fsqrt);
    673 				DPRINTF(FPE_INSN, ("fpu_execute: FSQRT\n"));
    674 				fpu_explode(fe, &fe->fe_f1, type, rb);
    675 				fp = fpu_sqrt(fe);
    676 				break;
    677 			case	OPC63M_FSEL:
    678 				FPU_EMU_EVCNT_INCR(fsel);
    679 				DPRINTF(FPE_INSN, ("fpu_execute: FSEL\n"));
    680 				a = (int *)&fe->fe_fpstate->fpreg[ra];
    681 				if ((*a & 0x80000000) && (*a & 0x7fffffff))
    682 					/* fra < 0 */
    683 					rc = rb;
    684 				DPRINTF(FPE_INSN, ("f%d => f%d\n", rc, rt));
    685 				memcpy(&fs->fpreg[rt], &fs->fpreg[rc],
    686 					sizeof(double));
    687 				break;
    688 			case	OPC59_FRES:
    689 				FPU_EMU_EVCNT_INCR(fpres);
    690 				DPRINTF(FPE_INSN, ("fpu_execute: FPRES\n"));
    691 				fpu_explode(fe, &fe->fe_f1, type, rb);
    692 				fp = fpu_sqrt(fe);
    693 				/* now we've gotta overwrite the dest reg */
    694 				*((int *)&fe->fe_fpstate->fpreg[rt]) = 1;
    695 				fpu_explode(fe, &fe->fe_f1, FTYPE_INT, rt);
    696 				fpu_div(fe);
    697 				break;
    698 			case	OPC59_FMULS:
    699 				FPU_EMU_EVCNT_INCR(fmul);
    700 				DPRINTF(FPE_INSN, ("fpu_execute: FMUL\n"));
    701 				fpu_explode(fe, &fe->fe_f1, type, ra);
    702 				fpu_explode(fe, &fe->fe_f2, type, rc);
    703 				fp = fpu_mul(fe);
    704 				break;
    705 			case	OPC63M_FRSQRTE:
    706 				/* Reciprocal sqrt() estimate */
    707 				FPU_EMU_EVCNT_INCR(frsqrte);
    708 				DPRINTF(FPE_INSN, ("fpu_execute: FRSQRTE\n"));
    709 				fpu_explode(fe, &fe->fe_f1, type, rb);
    710 				fp = fpu_sqrt(fe);
    711 				fe->fe_f2 = *fp;
    712 				/* now we've gotta overwrite the dest reg */
    713 				*((int *)&fe->fe_fpstate->fpreg[rt]) = 1;
    714 				fpu_explode(fe, &fe->fe_f1, FTYPE_INT, rt);
    715 				fpu_div(fe);
    716 				break;
    717 			case	OPC59_FMSUBS:
    718 				FPU_EMU_EVCNT_INCR(fmulsub);
    719 				DPRINTF(FPE_INSN, ("fpu_execute: FMULSUB\n"));
    720 				fpu_explode(fe, &fe->fe_f1, type, ra);
    721 				fpu_explode(fe, &fe->fe_f2, type, rc);
    722 				fp = fpu_mul(fe);
    723 				fe->fe_f1 = *fp;
    724 				fpu_explode(fe, &fe->fe_f2, type, rb);
    725 				fp = fpu_sub(fe);
    726 				break;
    727 			case	OPC59_FMADDS:
    728 				FPU_EMU_EVCNT_INCR(fmuladd);
    729 				DPRINTF(FPE_INSN, ("fpu_execute: FMULADD\n"));
    730 				fpu_explode(fe, &fe->fe_f1, type, ra);
    731 				fpu_explode(fe, &fe->fe_f2, type, rc);
    732 				fp = fpu_mul(fe);
    733 				fe->fe_f1 = *fp;
    734 				fpu_explode(fe, &fe->fe_f2, type, rb);
    735 				fp = fpu_add(fe);
    736 				break;
    737 			case	OPC59_FNMSUBS:
    738 				FPU_EMU_EVCNT_INCR(fnmsub);
    739 				DPRINTF(FPE_INSN, ("fpu_execute: FNMSUB\n"));
    740 				fpu_explode(fe, &fe->fe_f1, type, ra);
    741 				fpu_explode(fe, &fe->fe_f2, type, rc);
    742 				fp = fpu_mul(fe);
    743 				fe->fe_f1 = *fp;
    744 				fpu_explode(fe, &fe->fe_f2, type, rb);
    745 				fp = fpu_sub(fe);
    746 				/* Negate */
    747 				fp->fp_sign ^= 1;
    748 				break;
    749 			case	OPC59_FNMADDS:
    750 				FPU_EMU_EVCNT_INCR(fnmadd);
    751 				DPRINTF(FPE_INSN, ("fpu_execute: FNMADD\n"));
    752 				fpu_explode(fe, &fe->fe_f1, type, ra);
    753 				fpu_explode(fe, &fe->fe_f2, type, rc);
    754 				fp = fpu_mul(fe);
    755 				fe->fe_f1 = *fp;
    756 				fpu_explode(fe, &fe->fe_f2, type, rb);
    757 				fp = fpu_add(fe);
    758 				/* Negate */
    759 				fp->fp_sign ^= 1;
    760 				break;
    761 			default:
    762 				return (NOTFPU);
    763 				break;
    764 			}
    765 
    766 			/* If the instruction was single precision, round */
    767 			if (!(instr.i_any.i_opcd & 0x4)) {
    768 				fpu_implode(fe, fp, FTYPE_SNG,
    769 					(u_int *)&fs->fpreg[rt]);
    770 				fpu_explode(fe, fp = &fe->fe_f1, FTYPE_SNG, rt);
    771 			}
    772 		}
    773 	} else {
    774 		return (NOTFPU);
    775 	}
    776 
    777 	/*
    778 	 * ALU operation is complete.  Collapse the result and then check
    779 	 * for exceptions.  If we got any, and they are enabled, do not
    780 	 * alter the destination register, just stop with an exception.
    781 	 * Otherwise set new current exceptions and accrue.
    782 	 */
    783 	if (fp)
    784 		fpu_implode(fe, fp, type, (u_int *)&fs->fpreg[rt]);
    785 	cx = fe->fe_cx;
    786 	fsr = fe->fe_fpscr & ~(FPSCR_FEX|FPSCR_VX);
    787 	if (cx != 0) {
    788 		if (cx & FPSR_INV)
    789 			cx |= FPSCR_VX;
    790 		mask = fsr & FPSR_EX;
    791 		mask <<= (25-3);
    792 		if (cx & mask)
    793 			fsr |= FPSCR_FEX;
    794 		if (cx & FPSCR_FPRF) {
    795 			/* Need to replace CC */
    796 			fsr &= ~FPSCR_FPRF;
    797 		}
    798 		fsr |= cx;
    799 		DPRINTF(FPE_INSN, ("fpu_execute: cx %x, fsr %x\n", cx, fsr));
    800 	}
    801 	if (fsr & FPSR_INV)
    802 		fsr |= FPSCR_VX;
    803 	if (mtfsf == 0 && ((fsr ^ fe->fe_fpscr) & FPSR_EX_MSK))
    804 		fsr |= FPSCR_FX;
    805 
    806 	if (cond) {
    807 		cond = fsr & 0xf0000000;
    808 		/* Isolate condition codes */
    809 		cond >>= 28;
    810 		/* Move fpu condition codes to cr[1] */
    811 		tf->tf_cr &= ~(0x0f000000);
    812 		tf->tf_cr |= (cond<<24);
    813 		DPRINTF(FPE_INSN, ("fpu_execute: cr[1] <= %x\n", cond));
    814 	}
    815 
    816 	if (setcr) {
    817 		cond = fsr & FPSCR_FPCC;
    818 		/* Isolate condition codes */
    819 		cond <<= 16;
    820 		/* Move fpu condition codes to cr[bf/4] */
    821 		tf->tf_cr &= ~(0xf0000000>>bf);
    822 		tf->tf_cr |= (cond>>bf);
    823 		DPRINTF(FPE_INSN, ("fpu_execute: cr[%d] (cr=%x) <= %x\n", bf/4, tf->tf_cr, cond));
    824 	}
    825 
    826 	((int *)&fs->fpscr)[1] = fsr;
    827 	if (fsr & FPSCR_FEX)
    828 		return(FPE);
    829 	return (0);	/* success */
    830 }
    831