Home | History | Annotate | Line # | Download | only in fpe
fpu_fscale.c revision 1.15.12.1
      1  1.15.12.1     tls /*	$NetBSD: fpu_fscale.c,v 1.15.12.1 2013/06/23 06:20:08 tls Exp $	*/
      2        1.1  briggs 
      3        1.1  briggs /*
      4        1.1  briggs  * Copyright (c) 1995 Ken Nakata
      5        1.1  briggs  * All rights reserved.
      6        1.1  briggs  *
      7        1.1  briggs  * Redistribution and use in source and binary forms, with or without
      8        1.1  briggs  * modification, are permitted provided that the following conditions
      9        1.1  briggs  * are met:
     10        1.1  briggs  * 1. Redistributions of source code must retain the above copyright
     11        1.1  briggs  *    notice, this list of conditions and the following disclaimer.
     12        1.1  briggs  * 2. Redistributions in binary form must reproduce the above copyright
     13        1.1  briggs  *    notice, this list of conditions and the following disclaimer in the
     14        1.1  briggs  *    documentation and/or other materials provided with the distribution.
     15        1.1  briggs  * 3. The name of the author may not be used to endorse or promote products
     16        1.1  briggs  *    derived from this software without specific prior written permission.
     17        1.1  briggs  * 4. All advertising materials mentioning features or use of this software
     18        1.1  briggs  *    must display the following acknowledgement:
     19        1.1  briggs  *      This product includes software developed by Gordon Ross
     20        1.1  briggs  *
     21        1.1  briggs  * THIS SOFTWARE IS PROVIDED BY THE AUTHOR ``AS IS'' AND ANY EXPRESS OR
     22        1.1  briggs  * IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES
     23        1.1  briggs  * OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE DISCLAIMED.
     24        1.1  briggs  * IN NO EVENT SHALL THE AUTHOR BE LIABLE FOR ANY DIRECT, INDIRECT,
     25        1.1  briggs  * INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT
     26        1.1  briggs  * NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE,
     27        1.1  briggs  * DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY
     28        1.1  briggs  * THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT
     29        1.1  briggs  * (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF
     30        1.1  briggs  * THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
     31        1.1  briggs  */
     32        1.1  briggs 
     33        1.1  briggs /*
     34        1.1  briggs  * FSCALE - separated from the other type0 arithmetic instructions
     35        1.1  briggs  * for performance reason; maybe unnecessary, but FSCALE assumes
     36        1.1  briggs  * the source operand be an integer.  It performs type conversion
     37        1.1  briggs  * only if the source operand is *not* an integer.
     38        1.1  briggs  */
     39       1.11   lukem 
     40       1.11   lukem #include <sys/cdefs.h>
     41  1.15.12.1     tls __KERNEL_RCSID(0, "$NetBSD: fpu_fscale.c,v 1.15.12.1 2013/06/23 06:20:08 tls Exp $");
     42        1.1  briggs 
     43        1.1  briggs #include <sys/types.h>
     44        1.1  briggs #include <sys/signal.h>
     45        1.3  briggs #include <sys/systm.h>
     46        1.1  briggs #include <machine/frame.h>
     47        1.1  briggs 
     48        1.1  briggs #include "fpu_emulate.h"
     49        1.1  briggs 
     50        1.1  briggs int
     51       1.13     dsl fpu_emul_fscale(struct fpemu *fe, struct instruction *insn)
     52        1.1  briggs {
     53       1.14   isaki 	struct frame *frame;
     54  1.15.12.1     tls 	uint32_t *fpregs;
     55       1.14   isaki 	int word1, sig;
     56       1.14   isaki 	int regnum, format;
     57       1.14   isaki 	int scale, sign, exp;
     58  1.15.12.1     tls 	uint32_t m0, m1;
     59  1.15.12.1     tls 	uint32_t buf[3], fpsr;
     60       1.10  briggs #if DEBUG_FPE
     61       1.14   isaki 	int flags;
     62       1.14   isaki 	char regname;
     63       1.10  briggs #endif
     64        1.1  briggs 
     65       1.14   isaki 	scale = sig = 0;
     66       1.14   isaki 	frame = fe->fe_frame;
     67       1.14   isaki 	fpregs = &(fe->fe_fpframe->fpf_regs[0]);
     68       1.14   isaki 	/* clear all exceptions and conditions */
     69       1.14   isaki 	fpsr = fe->fe_fpsr & ~FPSR_EXCP & ~FPSR_CCB;
     70       1.10  briggs #if DEBUG_FPE
     71       1.14   isaki 	printf("fpu_emul_fscale: FPSR = %08x, FPCR = %08x\n", fpsr, fe->fe_fpcr);
     72       1.10  briggs #endif
     73        1.1  briggs 
     74       1.14   isaki 	word1 = insn->is_word1;
     75       1.14   isaki 	format = (word1 >> 10) & 7;
     76       1.14   isaki 	regnum = (word1 >> 7) & 7;
     77        1.1  briggs 
     78       1.14   isaki 	fe->fe_fpcr &= FPCR_ROUND;
     79       1.14   isaki 	fe->fe_fpcr |= FPCR_ZERO;
     80        1.1  briggs 
     81       1.14   isaki 	/* get the source operand */
     82       1.14   isaki 	if ((word1 & 0x4000) == 0) {
     83       1.10  briggs #if DEBUG_FPE
     84       1.14   isaki 		printf("fpu_emul_fscale: FP%d op FP%d => FP%d\n",
     85       1.15   isaki 		    format, regnum, regnum);
     86       1.14   isaki 		/* the operand is an FP reg */
     87       1.14   isaki 		printf("fpu_emul_scale: src opr FP%d=%08x%08x%08x\n",
     88       1.15   isaki 		    format, fpregs[format*3], fpregs[format*3+1],
     89       1.15   isaki 		    fpregs[format*3+2]);
     90       1.10  briggs #endif
     91       1.14   isaki 		fpu_explode(fe, &fe->fe_f2, FTYPE_EXT, &fpregs[format * 3]);
     92       1.14   isaki 		fpu_implode(fe, &fe->fe_f2, FTYPE_LNG, buf);
     93       1.14   isaki 		scale = buf[0];
     94        1.1  briggs 	} else {
     95       1.14   isaki 		/* the operand is in memory */
     96       1.14   isaki 		if (format == FTYPE_DBL) {
     97       1.14   isaki 			insn->is_datasize = 8;
     98       1.14   isaki 		} else if (format == FTYPE_SNG || format == FTYPE_LNG) {
     99       1.14   isaki 			insn->is_datasize = 4;
    100       1.14   isaki 		} else if (format == FTYPE_WRD) {
    101       1.14   isaki 			insn->is_datasize = 2;
    102       1.14   isaki 		} else if (format == FTYPE_BYT) {
    103       1.14   isaki 			insn->is_datasize = 1;
    104       1.14   isaki 		} else if (format == FTYPE_EXT) {
    105       1.14   isaki 			insn->is_datasize = 12;
    106       1.14   isaki 		} else {
    107       1.14   isaki 			/* invalid or unsupported operand format */
    108       1.14   isaki 			sig = SIGFPE;
    109       1.14   isaki 			return sig;
    110       1.14   isaki 		}
    111        1.1  briggs 
    112       1.14   isaki 		/* Get effective address. (modreg=opcode&077) */
    113       1.14   isaki 		sig = fpu_decode_ea(frame, insn, &insn->is_ea, insn->is_opcode);
    114       1.14   isaki 		if (sig) {
    115       1.10  briggs #if DEBUG_FPE
    116       1.14   isaki 			printf("fpu_emul_fscale: error in decode_ea\n");
    117       1.10  briggs #endif
    118       1.14   isaki 			return sig;
    119       1.14   isaki 		}
    120        1.1  briggs 
    121       1.10  briggs #if DEBUG_FPE
    122       1.14   isaki 		printf("fpu_emul_fscale: addr mode = ");
    123       1.14   isaki 		flags = insn->is_ea.ea_flags;
    124       1.14   isaki 		regname = (insn->is_ea.ea_regnum & 8) ? 'a' : 'd';
    125       1.14   isaki 
    126       1.14   isaki 		if (flags & EA_DIRECT) {
    127       1.14   isaki 			printf("%c%d\n", regname, insn->is_ea.ea_regnum & 7);
    128       1.14   isaki 		} else if (flags & EA_PREDECR) {
    129       1.14   isaki 			printf("%c%d@-\n", regname, insn->is_ea.ea_regnum & 7);
    130       1.14   isaki 		} else if (flags & EA_POSTINCR) {
    131       1.14   isaki 			printf("%c%d@+\n", regname, insn->is_ea.ea_regnum & 7);
    132       1.14   isaki 		} else if (flags & EA_OFFSET) {
    133       1.14   isaki 			printf("%c%d@(%d)\n",
    134       1.15   isaki 			    regname, insn->is_ea.ea_regnum & 7,
    135       1.15   isaki 			    insn->is_ea.ea_offset);
    136       1.14   isaki 		} else if (flags & EA_INDEXED) {
    137       1.14   isaki 			printf("%c%d@(...)\n",
    138       1.15   isaki 			    regname, insn->is_ea.ea_regnum & 7);
    139       1.14   isaki 		} else if (flags & EA_ABS) {
    140       1.14   isaki 			printf("0x%08x\n", insn->is_ea.ea_absaddr);
    141       1.14   isaki 		} else if (flags & EA_PC_REL) {
    142       1.14   isaki 			printf("pc@(%d)\n", insn->is_ea.ea_offset);
    143       1.14   isaki 		} else if (flags & EA_IMMED) {
    144       1.14   isaki 			printf("#0x%08x%08x%08x\n",
    145       1.15   isaki 			    insn->is_ea.ea_immed[0],
    146       1.15   isaki 			    insn->is_ea.ea_immed[1],
    147       1.15   isaki 			    insn->is_ea.ea_immed[2]);
    148       1.14   isaki 		} else {
    149       1.14   isaki 			printf("%c%d@\n", regname, insn->is_ea.ea_regnum & 7);
    150       1.14   isaki 		}
    151       1.10  briggs #endif
    152       1.14   isaki 		fpu_load_ea(frame, insn, &insn->is_ea, (char*)buf);
    153        1.1  briggs 
    154       1.10  briggs #if DEBUG_FPE
    155       1.14   isaki 		printf("fpu_emul_fscale: src = %08x%08x%08x, siz = %d\n",
    156       1.15   isaki 		    buf[0], buf[1], buf[2], insn->is_datasize);
    157       1.10  briggs #endif
    158       1.14   isaki 		if (format == FTYPE_LNG) {
    159       1.14   isaki 			/* nothing */
    160       1.14   isaki 			scale = buf[0];
    161       1.14   isaki 		} else if (format == FTYPE_WRD) {
    162       1.14   isaki 			/* sign-extend */
    163       1.14   isaki 			scale = buf[0] & 0xffff;
    164       1.14   isaki 			if (scale & 0x8000) {
    165       1.14   isaki 				scale |= 0xffff0000;
    166        1.1  briggs 			}
    167       1.14   isaki 		} else if (format == FTYPE_BYT) {
    168       1.14   isaki 			/* sign-extend */
    169       1.14   isaki 			scale = buf[0] & 0xff;
    170       1.14   isaki 			if (scale & 0x80) {
    171       1.14   isaki 				scale |= 0xffffff00;
    172        1.1  briggs 			}
    173       1.14   isaki 		} else if (format == FTYPE_DBL || format == FTYPE_SNG ||
    174       1.14   isaki 		           format == FTYPE_EXT) {
    175       1.14   isaki 			fpu_explode(fe, &fe->fe_f2, format, buf);
    176       1.14   isaki 			fpu_implode(fe, &fe->fe_f2, FTYPE_LNG, buf);
    177       1.14   isaki 			scale = buf[0];
    178        1.1  briggs 		}
    179       1.14   isaki 		/* make it look like we've got an FP oprand */
    180       1.14   isaki 		fe->fe_f2.fp_class = (buf[0] == 0) ? FPC_ZERO : FPC_NUM;
    181       1.14   isaki 	}
    182       1.14   isaki 
    183       1.14   isaki 	/* assume there's no exception */
    184       1.14   isaki 	sig = 0;
    185       1.14   isaki 
    186       1.14   isaki 	/*
    187       1.14   isaki 	 * it's barbaric but we're going to operate directly on
    188       1.14   isaki 	 * the dst operand's bit pattern
    189       1.14   isaki 	 */
    190       1.14   isaki 	sign = fpregs[regnum * 3] & 0x80000000;
    191       1.14   isaki 	exp = (fpregs[regnum * 3] & 0x7fff0000) >> 16;
    192       1.14   isaki 	m0 = fpregs[regnum * 3 + 1];
    193       1.14   isaki 	m1 = fpregs[regnum * 3 + 2];
    194       1.14   isaki 
    195       1.14   isaki 	switch (fe->fe_f2.fp_class) {
    196       1.14   isaki 	case FPC_SNAN:
    197       1.14   isaki 		fpsr |= FPSR_SNAN;
    198       1.14   isaki 	case FPC_QNAN:
    199       1.14   isaki 		/* dst = NaN */
    200       1.14   isaki 		exp = 0x7fff;
    201       1.14   isaki 		m0 = m1 = 0xffffffff;
    202       1.14   isaki 		break;
    203       1.14   isaki 	case FPC_ZERO:
    204       1.14   isaki 	case FPC_NUM:
    205       1.14   isaki 		if ((0 < exp && exp < 0x7fff) ||
    206       1.14   isaki 		    (exp == 0 && (m0 | m1) != 0)) {
    207       1.14   isaki 			/* normal or denormal */
    208       1.14   isaki 			exp += scale;
    209       1.14   isaki 			if (exp < 0) {
    210       1.14   isaki 				/* underflow */
    211  1.15.12.1     tls 				uint32_t grs;	/* guard, round and sticky */
    212       1.14   isaki 
    213       1.14   isaki 				exp = 0;
    214       1.14   isaki 				grs = m1 << (32 + exp);
    215       1.14   isaki 				m1 = m0 << (32 + exp) | m1 >> -exp;
    216       1.14   isaki 				m0 >>= -exp;
    217       1.14   isaki 				if (grs != 0) {
    218       1.14   isaki 					fpsr |= FPSR_INEX2;
    219       1.14   isaki 
    220       1.14   isaki 					switch (fe->fe_fpcr & 0x30) {
    221       1.14   isaki 					case FPCR_MINF:
    222       1.14   isaki 						if (sign != 0) {
    223       1.14   isaki 							if (++m1 == 0 &&
    224       1.14   isaki 							    ++m0 == 0) {
    225       1.14   isaki 								m0 = 0x80000000;
    226       1.14   isaki 								exp++;
    227       1.14   isaki 							}
    228       1.14   isaki 						}
    229       1.14   isaki 						break;
    230       1.14   isaki 					case FPCR_NEAR:
    231       1.14   isaki 						if (grs == 0x80000000) {
    232       1.14   isaki 							/* tie */
    233       1.14   isaki 							if ((m1 & 1) &&
    234       1.14   isaki 							    ++m1 == 0 &&
    235       1.14   isaki 							    ++m0 == 0) {
    236       1.14   isaki 								m0 = 0x80000000;
    237       1.14   isaki 								exp++;
    238       1.14   isaki 							}
    239       1.14   isaki 						} else if (grs & 0x80000000) {
    240       1.14   isaki 							if (++m1 == 0 &&
    241       1.14   isaki 							    ++m0 == 0) {
    242       1.14   isaki 								m0 = 0x80000000;
    243       1.14   isaki 								exp++;
    244       1.14   isaki 							}
    245       1.14   isaki 						}
    246       1.14   isaki 						break;
    247       1.14   isaki 					case FPCR_PINF:
    248       1.14   isaki 						if (sign == 0) {
    249       1.14   isaki 							if (++m1 == 0 &&
    250       1.14   isaki 							    ++m0 == 0) {
    251       1.14   isaki 								m0 = 0x80000000;
    252       1.14   isaki 								exp++;
    253       1.14   isaki 							}
    254       1.14   isaki 						}
    255       1.14   isaki 						break;
    256       1.14   isaki 					case FPCR_ZERO:
    257       1.14   isaki 						break;
    258       1.14   isaki 					}
    259       1.14   isaki 				}
    260       1.14   isaki 				if (exp == 0 && (m0 & 0x80000000) == 0) {
    261       1.14   isaki 					fpsr |= FPSR_UNFL;
    262       1.14   isaki 					if ((m0 | m1) == 0) {
    263       1.14   isaki 						fpsr |= FPSR_ZERO;
    264       1.14   isaki 					}
    265       1.14   isaki 				}
    266       1.14   isaki 			} else if (exp >= 0x7fff) {
    267       1.14   isaki 				/* overflow --> result = Inf */
    268       1.14   isaki 				/*
    269       1.14   isaki 				 * but first, try to normalize in case it's an
    270       1.14   isaki 				 * unnormalized
    271       1.14   isaki 				 */
    272       1.14   isaki 				while ((m0 & 0x80000000) == 0) {
    273       1.14   isaki 					exp--;
    274       1.14   isaki 					m0 = (m0 << 1) | (m1 >> 31);
    275       1.14   isaki 					m1 = m1 << 1;
    276       1.14   isaki 				}
    277       1.14   isaki 				/* if it's still too large, then return Inf */
    278       1.14   isaki 				if (exp >= 0x7fff) {
    279       1.14   isaki 					exp = 0x7fff;
    280       1.14   isaki 					m0 = m1 = 0;
    281       1.14   isaki 					fpsr |= FPSR_OVFL | FPSR_INF;
    282       1.14   isaki 				}
    283       1.14   isaki 			} else if ((m0 & 0x80000000) == 0) {
    284       1.14   isaki 				/*
    285       1.14   isaki 				 * it's a denormal; we try to normalize but
    286       1.14   isaki 				 * result may and may not be a normal.
    287       1.14   isaki 				 */
    288       1.14   isaki 				while (exp > 0 && (m0 & 0x80000000) == 0) {
    289       1.14   isaki 					exp--;
    290       1.14   isaki 					m0 = (m0 << 1) | (m1 >> 31);
    291       1.14   isaki 					m1 = m1 << 1;
    292       1.14   isaki 				}
    293       1.14   isaki 				if ((m0 & 0x80000000) == 0) {
    294       1.14   isaki 					fpsr |= FPSR_UNFL;
    295       1.14   isaki 				}
    296       1.14   isaki 			} /* exp in range and mantissa normalized */
    297       1.14   isaki 		} else if (exp == 0 && m0 == 0 && m1 == 0) {
    298       1.14   isaki 			/* dst is Zero */
    299        1.1  briggs 			fpsr |= FPSR_ZERO;
    300       1.14   isaki 		} /* else we know exp == 0x7fff */
    301       1.14   isaki 		else if ((m0 | m1) == 0) {
    302       1.14   isaki 			fpsr |= FPSR_INF;
    303       1.14   isaki 		} else if ((m0 & 0x40000000) == 0) {
    304       1.14   isaki 			/* a signaling NaN */
    305       1.14   isaki 			fpsr |= FPSR_NAN | FPSR_SNAN;
    306       1.14   isaki 		} else {
    307       1.14   isaki 			/* a quiet NaN */
    308       1.14   isaki 			fpsr |= FPSR_NAN;
    309        1.1  briggs 		}
    310       1.14   isaki 		break;
    311       1.14   isaki 	case FPC_INF:
    312       1.14   isaki 		/* dst = NaN */
    313       1.14   isaki 		exp = 0x7fff;
    314       1.14   isaki 		m0 = m1 = 0xffffffff;
    315       1.14   isaki 		fpsr |= FPSR_OPERR | FPSR_NAN;
    316       1.14   isaki 		break;
    317       1.14   isaki 	default:
    318        1.1  briggs #ifdef DEBUG
    319       1.14   isaki 		panic("fpu_emul_fscale: invalid fp class");
    320        1.1  briggs #endif
    321       1.14   isaki 		break;
    322       1.14   isaki 	}
    323        1.1  briggs 
    324       1.14   isaki 	/* store the result */
    325       1.14   isaki 	fpregs[regnum * 3] = sign | (exp << 16);
    326       1.14   isaki 	fpregs[regnum * 3 + 1] = m0;
    327       1.14   isaki 	fpregs[regnum * 3 + 2] = m1;
    328       1.14   isaki 
    329       1.14   isaki 	if (sign) {
    330       1.14   isaki 		fpsr |= FPSR_NEG;
    331       1.14   isaki 	}
    332        1.1  briggs 
    333       1.14   isaki 	/* update fpsr according to the result of operation */
    334       1.14   isaki 	fe->fe_fpframe->fpf_fpsr = fe->fe_fpsr = fpsr;
    335        1.1  briggs 
    336       1.10  briggs #if DEBUG_FPE
    337       1.14   isaki 	printf("fpu_emul_fscale: FPSR = %08x, FPCR = %08x\n",
    338       1.15   isaki 	    fe->fe_fpsr, fe->fe_fpcr);
    339       1.10  briggs #endif
    340        1.1  briggs 
    341       1.14   isaki 	return (fpsr & fe->fe_fpcr & FPSR_EXCP) ? SIGFPE : sig;
    342        1.1  briggs }
    343