Home | History | Annotate | Line # | Download | only in fpe
      1  1.17   isaki /*	$NetBSD: fpu_fscale.c,v 1.17 2025/01/06 07:34:24 isaki Exp $	*/
      2   1.1  briggs 
      3   1.1  briggs /*
      4   1.1  briggs  * Copyright (c) 1995 Ken Nakata
      5   1.1  briggs  * All rights reserved.
      6   1.1  briggs  *
      7   1.1  briggs  * Redistribution and use in source and binary forms, with or without
      8   1.1  briggs  * modification, are permitted provided that the following conditions
      9   1.1  briggs  * are met:
     10   1.1  briggs  * 1. Redistributions of source code must retain the above copyright
     11   1.1  briggs  *    notice, this list of conditions and the following disclaimer.
     12   1.1  briggs  * 2. Redistributions in binary form must reproduce the above copyright
     13   1.1  briggs  *    notice, this list of conditions and the following disclaimer in the
     14   1.1  briggs  *    documentation and/or other materials provided with the distribution.
     15   1.1  briggs  * 3. The name of the author may not be used to endorse or promote products
     16   1.1  briggs  *    derived from this software without specific prior written permission.
     17   1.1  briggs  * 4. All advertising materials mentioning features or use of this software
     18   1.1  briggs  *    must display the following acknowledgement:
     19   1.1  briggs  *      This product includes software developed by Gordon Ross
     20   1.1  briggs  *
     21   1.1  briggs  * THIS SOFTWARE IS PROVIDED BY THE AUTHOR ``AS IS'' AND ANY EXPRESS OR
     22   1.1  briggs  * IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES
     23   1.1  briggs  * OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE DISCLAIMED.
     24   1.1  briggs  * IN NO EVENT SHALL THE AUTHOR BE LIABLE FOR ANY DIRECT, INDIRECT,
     25   1.1  briggs  * INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT
     26   1.1  briggs  * NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE,
     27   1.1  briggs  * DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY
     28   1.1  briggs  * THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT
     29   1.1  briggs  * (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF
     30   1.1  briggs  * THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
     31   1.1  briggs  */
     32   1.1  briggs 
     33   1.1  briggs /*
     34   1.1  briggs  * FSCALE - separated from the other type0 arithmetic instructions
     35   1.1  briggs  * for performance reason; maybe unnecessary, but FSCALE assumes
     36   1.1  briggs  * the source operand be an integer.  It performs type conversion
     37   1.1  briggs  * only if the source operand is *not* an integer.
     38   1.1  briggs  */
     39  1.11   lukem 
     40  1.11   lukem #include <sys/cdefs.h>
     41  1.17   isaki __KERNEL_RCSID(0, "$NetBSD: fpu_fscale.c,v 1.17 2025/01/06 07:34:24 isaki Exp $");
     42   1.1  briggs 
     43   1.1  briggs #include <sys/types.h>
     44   1.1  briggs #include <sys/signal.h>
     45   1.3  briggs #include <sys/systm.h>
     46   1.1  briggs #include <machine/frame.h>
     47   1.1  briggs 
     48   1.1  briggs #include "fpu_emulate.h"
     49   1.1  briggs 
     50   1.1  briggs int
     51  1.13     dsl fpu_emul_fscale(struct fpemu *fe, struct instruction *insn)
     52   1.1  briggs {
     53  1.14   isaki 	struct frame *frame;
     54  1.16   isaki 	uint32_t *fpregs;
     55  1.14   isaki 	int word1, sig;
     56  1.14   isaki 	int regnum, format;
     57  1.17   isaki 	int modreg;
     58  1.14   isaki 	int scale, sign, exp;
     59  1.16   isaki 	uint32_t m0, m1;
     60  1.16   isaki 	uint32_t buf[3], fpsr;
     61  1.10  briggs #if DEBUG_FPE
     62  1.14   isaki 	int flags;
     63  1.14   isaki 	char regname;
     64  1.10  briggs #endif
     65   1.1  briggs 
     66  1.14   isaki 	scale = sig = 0;
     67  1.14   isaki 	frame = fe->fe_frame;
     68  1.14   isaki 	fpregs = &(fe->fe_fpframe->fpf_regs[0]);
     69  1.14   isaki 	/* clear all exceptions and conditions */
     70  1.14   isaki 	fpsr = fe->fe_fpsr & ~FPSR_EXCP & ~FPSR_CCB;
     71  1.10  briggs #if DEBUG_FPE
     72  1.14   isaki 	printf("fpu_emul_fscale: FPSR = %08x, FPCR = %08x\n", fpsr, fe->fe_fpcr);
     73  1.10  briggs #endif
     74   1.1  briggs 
     75  1.14   isaki 	word1 = insn->is_word1;
     76  1.14   isaki 	format = (word1 >> 10) & 7;
     77  1.14   isaki 	regnum = (word1 >> 7) & 7;
     78   1.1  briggs 
     79  1.14   isaki 	fe->fe_fpcr &= FPCR_ROUND;
     80  1.14   isaki 	fe->fe_fpcr |= FPCR_ZERO;
     81   1.1  briggs 
     82  1.14   isaki 	/* get the source operand */
     83  1.14   isaki 	if ((word1 & 0x4000) == 0) {
     84  1.10  briggs #if DEBUG_FPE
     85  1.14   isaki 		printf("fpu_emul_fscale: FP%d op FP%d => FP%d\n",
     86  1.15   isaki 		    format, regnum, regnum);
     87  1.14   isaki 		/* the operand is an FP reg */
     88  1.14   isaki 		printf("fpu_emul_scale: src opr FP%d=%08x%08x%08x\n",
     89  1.15   isaki 		    format, fpregs[format*3], fpregs[format*3+1],
     90  1.15   isaki 		    fpregs[format*3+2]);
     91  1.10  briggs #endif
     92  1.14   isaki 		fpu_explode(fe, &fe->fe_f2, FTYPE_EXT, &fpregs[format * 3]);
     93  1.14   isaki 		fpu_implode(fe, &fe->fe_f2, FTYPE_LNG, buf);
     94  1.14   isaki 		scale = buf[0];
     95   1.1  briggs 	} else {
     96  1.14   isaki 		/* the operand is in memory */
     97  1.14   isaki 		if (format == FTYPE_DBL) {
     98  1.14   isaki 			insn->is_datasize = 8;
     99  1.14   isaki 		} else if (format == FTYPE_SNG || format == FTYPE_LNG) {
    100  1.14   isaki 			insn->is_datasize = 4;
    101  1.14   isaki 		} else if (format == FTYPE_WRD) {
    102  1.14   isaki 			insn->is_datasize = 2;
    103  1.14   isaki 		} else if (format == FTYPE_BYT) {
    104  1.14   isaki 			insn->is_datasize = 1;
    105  1.14   isaki 		} else if (format == FTYPE_EXT) {
    106  1.14   isaki 			insn->is_datasize = 12;
    107  1.14   isaki 		} else {
    108  1.14   isaki 			/* invalid or unsupported operand format */
    109  1.14   isaki 			sig = SIGFPE;
    110  1.14   isaki 			return sig;
    111  1.14   isaki 		}
    112   1.1  briggs 
    113  1.17   isaki 		/* Check an illegal mod/reg. */
    114  1.17   isaki 		modreg = insn->is_opcode & 077;
    115  1.17   isaki 		if ((modreg >> 3) == 1/*An*/ || modreg >= 075) {
    116  1.17   isaki 			return SIGILL;
    117  1.17   isaki 		}
    118  1.17   isaki 
    119  1.14   isaki 		/* Get effective address. (modreg=opcode&077) */
    120  1.14   isaki 		sig = fpu_decode_ea(frame, insn, &insn->is_ea, insn->is_opcode);
    121  1.14   isaki 		if (sig) {
    122  1.10  briggs #if DEBUG_FPE
    123  1.14   isaki 			printf("fpu_emul_fscale: error in decode_ea\n");
    124  1.10  briggs #endif
    125  1.14   isaki 			return sig;
    126  1.14   isaki 		}
    127   1.1  briggs 
    128  1.17   isaki 		if (insn->is_ea.ea_flags == EA_DIRECT &&
    129  1.17   isaki 		    insn->is_datasize > 4) {
    130  1.17   isaki #if DEBUG_FPE
    131  1.17   isaki 			printf("%s: attempted to fetch dbl/ext from reg\n",
    132  1.17   isaki 			    __func__);
    133  1.17   isaki #endif
    134  1.17   isaki 			return SIGILL;
    135  1.17   isaki 		}
    136  1.17   isaki 
    137  1.10  briggs #if DEBUG_FPE
    138  1.14   isaki 		printf("fpu_emul_fscale: addr mode = ");
    139  1.14   isaki 		flags = insn->is_ea.ea_flags;
    140  1.14   isaki 		regname = (insn->is_ea.ea_regnum & 8) ? 'a' : 'd';
    141  1.14   isaki 
    142  1.14   isaki 		if (flags & EA_DIRECT) {
    143  1.14   isaki 			printf("%c%d\n", regname, insn->is_ea.ea_regnum & 7);
    144  1.14   isaki 		} else if (flags & EA_PREDECR) {
    145  1.14   isaki 			printf("%c%d@-\n", regname, insn->is_ea.ea_regnum & 7);
    146  1.14   isaki 		} else if (flags & EA_POSTINCR) {
    147  1.14   isaki 			printf("%c%d@+\n", regname, insn->is_ea.ea_regnum & 7);
    148  1.14   isaki 		} else if (flags & EA_OFFSET) {
    149  1.14   isaki 			printf("%c%d@(%d)\n",
    150  1.15   isaki 			    regname, insn->is_ea.ea_regnum & 7,
    151  1.15   isaki 			    insn->is_ea.ea_offset);
    152  1.14   isaki 		} else if (flags & EA_INDEXED) {
    153  1.14   isaki 			printf("%c%d@(...)\n",
    154  1.15   isaki 			    regname, insn->is_ea.ea_regnum & 7);
    155  1.14   isaki 		} else if (flags & EA_ABS) {
    156  1.14   isaki 			printf("0x%08x\n", insn->is_ea.ea_absaddr);
    157  1.14   isaki 		} else if (flags & EA_PC_REL) {
    158  1.14   isaki 			printf("pc@(%d)\n", insn->is_ea.ea_offset);
    159  1.14   isaki 		} else if (flags & EA_IMMED) {
    160  1.14   isaki 			printf("#0x%08x%08x%08x\n",
    161  1.15   isaki 			    insn->is_ea.ea_immed[0],
    162  1.15   isaki 			    insn->is_ea.ea_immed[1],
    163  1.15   isaki 			    insn->is_ea.ea_immed[2]);
    164  1.14   isaki 		} else {
    165  1.14   isaki 			printf("%c%d@\n", regname, insn->is_ea.ea_regnum & 7);
    166  1.14   isaki 		}
    167  1.10  briggs #endif
    168  1.14   isaki 		fpu_load_ea(frame, insn, &insn->is_ea, (char*)buf);
    169   1.1  briggs 
    170  1.10  briggs #if DEBUG_FPE
    171  1.14   isaki 		printf("fpu_emul_fscale: src = %08x%08x%08x, siz = %d\n",
    172  1.15   isaki 		    buf[0], buf[1], buf[2], insn->is_datasize);
    173  1.10  briggs #endif
    174  1.14   isaki 		if (format == FTYPE_LNG) {
    175  1.14   isaki 			/* nothing */
    176  1.14   isaki 			scale = buf[0];
    177  1.14   isaki 		} else if (format == FTYPE_WRD) {
    178  1.14   isaki 			/* sign-extend */
    179  1.14   isaki 			scale = buf[0] & 0xffff;
    180  1.14   isaki 			if (scale & 0x8000) {
    181  1.14   isaki 				scale |= 0xffff0000;
    182   1.1  briggs 			}
    183  1.14   isaki 		} else if (format == FTYPE_BYT) {
    184  1.14   isaki 			/* sign-extend */
    185  1.14   isaki 			scale = buf[0] & 0xff;
    186  1.14   isaki 			if (scale & 0x80) {
    187  1.14   isaki 				scale |= 0xffffff00;
    188   1.1  briggs 			}
    189  1.14   isaki 		} else if (format == FTYPE_DBL || format == FTYPE_SNG ||
    190  1.14   isaki 		           format == FTYPE_EXT) {
    191  1.14   isaki 			fpu_explode(fe, &fe->fe_f2, format, buf);
    192  1.14   isaki 			fpu_implode(fe, &fe->fe_f2, FTYPE_LNG, buf);
    193  1.14   isaki 			scale = buf[0];
    194   1.1  briggs 		}
    195  1.14   isaki 		/* make it look like we've got an FP oprand */
    196  1.14   isaki 		fe->fe_f2.fp_class = (buf[0] == 0) ? FPC_ZERO : FPC_NUM;
    197  1.14   isaki 	}
    198  1.14   isaki 
    199  1.14   isaki 	/* assume there's no exception */
    200  1.14   isaki 	sig = 0;
    201  1.14   isaki 
    202  1.14   isaki 	/*
    203  1.14   isaki 	 * it's barbaric but we're going to operate directly on
    204  1.14   isaki 	 * the dst operand's bit pattern
    205  1.14   isaki 	 */
    206  1.14   isaki 	sign = fpregs[regnum * 3] & 0x80000000;
    207  1.14   isaki 	exp = (fpregs[regnum * 3] & 0x7fff0000) >> 16;
    208  1.14   isaki 	m0 = fpregs[regnum * 3 + 1];
    209  1.14   isaki 	m1 = fpregs[regnum * 3 + 2];
    210  1.14   isaki 
    211  1.14   isaki 	switch (fe->fe_f2.fp_class) {
    212  1.14   isaki 	case FPC_SNAN:
    213  1.14   isaki 		fpsr |= FPSR_SNAN;
    214  1.14   isaki 	case FPC_QNAN:
    215  1.14   isaki 		/* dst = NaN */
    216  1.14   isaki 		exp = 0x7fff;
    217  1.14   isaki 		m0 = m1 = 0xffffffff;
    218  1.14   isaki 		break;
    219  1.14   isaki 	case FPC_ZERO:
    220  1.14   isaki 	case FPC_NUM:
    221  1.14   isaki 		if ((0 < exp && exp < 0x7fff) ||
    222  1.14   isaki 		    (exp == 0 && (m0 | m1) != 0)) {
    223  1.14   isaki 			/* normal or denormal */
    224  1.14   isaki 			exp += scale;
    225  1.14   isaki 			if (exp < 0) {
    226  1.14   isaki 				/* underflow */
    227  1.16   isaki 				uint32_t grs;	/* guard, round and sticky */
    228  1.14   isaki 
    229  1.14   isaki 				exp = 0;
    230  1.14   isaki 				grs = m1 << (32 + exp);
    231  1.14   isaki 				m1 = m0 << (32 + exp) | m1 >> -exp;
    232  1.14   isaki 				m0 >>= -exp;
    233  1.14   isaki 				if (grs != 0) {
    234  1.14   isaki 					fpsr |= FPSR_INEX2;
    235  1.14   isaki 
    236  1.14   isaki 					switch (fe->fe_fpcr & 0x30) {
    237  1.14   isaki 					case FPCR_MINF:
    238  1.14   isaki 						if (sign != 0) {
    239  1.14   isaki 							if (++m1 == 0 &&
    240  1.14   isaki 							    ++m0 == 0) {
    241  1.14   isaki 								m0 = 0x80000000;
    242  1.14   isaki 								exp++;
    243  1.14   isaki 							}
    244  1.14   isaki 						}
    245  1.14   isaki 						break;
    246  1.14   isaki 					case FPCR_NEAR:
    247  1.14   isaki 						if (grs == 0x80000000) {
    248  1.14   isaki 							/* tie */
    249  1.14   isaki 							if ((m1 & 1) &&
    250  1.14   isaki 							    ++m1 == 0 &&
    251  1.14   isaki 							    ++m0 == 0) {
    252  1.14   isaki 								m0 = 0x80000000;
    253  1.14   isaki 								exp++;
    254  1.14   isaki 							}
    255  1.14   isaki 						} else if (grs & 0x80000000) {
    256  1.14   isaki 							if (++m1 == 0 &&
    257  1.14   isaki 							    ++m0 == 0) {
    258  1.14   isaki 								m0 = 0x80000000;
    259  1.14   isaki 								exp++;
    260  1.14   isaki 							}
    261  1.14   isaki 						}
    262  1.14   isaki 						break;
    263  1.14   isaki 					case FPCR_PINF:
    264  1.14   isaki 						if (sign == 0) {
    265  1.14   isaki 							if (++m1 == 0 &&
    266  1.14   isaki 							    ++m0 == 0) {
    267  1.14   isaki 								m0 = 0x80000000;
    268  1.14   isaki 								exp++;
    269  1.14   isaki 							}
    270  1.14   isaki 						}
    271  1.14   isaki 						break;
    272  1.14   isaki 					case FPCR_ZERO:
    273  1.14   isaki 						break;
    274  1.14   isaki 					}
    275  1.14   isaki 				}
    276  1.14   isaki 				if (exp == 0 && (m0 & 0x80000000) == 0) {
    277  1.14   isaki 					fpsr |= FPSR_UNFL;
    278  1.14   isaki 					if ((m0 | m1) == 0) {
    279  1.14   isaki 						fpsr |= FPSR_ZERO;
    280  1.14   isaki 					}
    281  1.14   isaki 				}
    282  1.14   isaki 			} else if (exp >= 0x7fff) {
    283  1.14   isaki 				/* overflow --> result = Inf */
    284  1.14   isaki 				/*
    285  1.14   isaki 				 * but first, try to normalize in case it's an
    286  1.14   isaki 				 * unnormalized
    287  1.14   isaki 				 */
    288  1.14   isaki 				while ((m0 & 0x80000000) == 0) {
    289  1.14   isaki 					exp--;
    290  1.14   isaki 					m0 = (m0 << 1) | (m1 >> 31);
    291  1.14   isaki 					m1 = m1 << 1;
    292  1.14   isaki 				}
    293  1.14   isaki 				/* if it's still too large, then return Inf */
    294  1.14   isaki 				if (exp >= 0x7fff) {
    295  1.14   isaki 					exp = 0x7fff;
    296  1.14   isaki 					m0 = m1 = 0;
    297  1.14   isaki 					fpsr |= FPSR_OVFL | FPSR_INF;
    298  1.14   isaki 				}
    299  1.14   isaki 			} else if ((m0 & 0x80000000) == 0) {
    300  1.14   isaki 				/*
    301  1.14   isaki 				 * it's a denormal; we try to normalize but
    302  1.14   isaki 				 * result may and may not be a normal.
    303  1.14   isaki 				 */
    304  1.14   isaki 				while (exp > 0 && (m0 & 0x80000000) == 0) {
    305  1.14   isaki 					exp--;
    306  1.14   isaki 					m0 = (m0 << 1) | (m1 >> 31);
    307  1.14   isaki 					m1 = m1 << 1;
    308  1.14   isaki 				}
    309  1.14   isaki 				if ((m0 & 0x80000000) == 0) {
    310  1.14   isaki 					fpsr |= FPSR_UNFL;
    311  1.14   isaki 				}
    312  1.14   isaki 			} /* exp in range and mantissa normalized */
    313  1.14   isaki 		} else if (exp == 0 && m0 == 0 && m1 == 0) {
    314  1.14   isaki 			/* dst is Zero */
    315   1.1  briggs 			fpsr |= FPSR_ZERO;
    316  1.14   isaki 		} /* else we know exp == 0x7fff */
    317  1.14   isaki 		else if ((m0 | m1) == 0) {
    318  1.14   isaki 			fpsr |= FPSR_INF;
    319  1.14   isaki 		} else if ((m0 & 0x40000000) == 0) {
    320  1.14   isaki 			/* a signaling NaN */
    321  1.14   isaki 			fpsr |= FPSR_NAN | FPSR_SNAN;
    322  1.14   isaki 		} else {
    323  1.14   isaki 			/* a quiet NaN */
    324  1.14   isaki 			fpsr |= FPSR_NAN;
    325   1.1  briggs 		}
    326  1.14   isaki 		break;
    327  1.14   isaki 	case FPC_INF:
    328  1.14   isaki 		/* dst = NaN */
    329  1.14   isaki 		exp = 0x7fff;
    330  1.14   isaki 		m0 = m1 = 0xffffffff;
    331  1.14   isaki 		fpsr |= FPSR_OPERR | FPSR_NAN;
    332  1.14   isaki 		break;
    333  1.14   isaki 	default:
    334   1.1  briggs #ifdef DEBUG
    335  1.14   isaki 		panic("fpu_emul_fscale: invalid fp class");
    336   1.1  briggs #endif
    337  1.14   isaki 		break;
    338  1.14   isaki 	}
    339   1.1  briggs 
    340  1.14   isaki 	/* store the result */
    341  1.14   isaki 	fpregs[regnum * 3] = sign | (exp << 16);
    342  1.14   isaki 	fpregs[regnum * 3 + 1] = m0;
    343  1.14   isaki 	fpregs[regnum * 3 + 2] = m1;
    344  1.14   isaki 
    345  1.14   isaki 	if (sign) {
    346  1.14   isaki 		fpsr |= FPSR_NEG;
    347  1.14   isaki 	}
    348   1.1  briggs 
    349  1.14   isaki 	/* update fpsr according to the result of operation */
    350  1.14   isaki 	fe->fe_fpframe->fpf_fpsr = fe->fe_fpsr = fpsr;
    351   1.1  briggs 
    352  1.10  briggs #if DEBUG_FPE
    353  1.14   isaki 	printf("fpu_emul_fscale: FPSR = %08x, FPCR = %08x\n",
    354  1.15   isaki 	    fe->fe_fpsr, fe->fe_fpcr);
    355  1.10  briggs #endif
    356   1.1  briggs 
    357  1.14   isaki 	return (fpsr & fe->fe_fpcr & FPSR_EXCP) ? SIGFPE : sig;
    358   1.1  briggs }
    359