Home | History | Annotate | Line # | Download | only in spmath
sfmpy.c revision 1.3.26.1
      1  1.3.26.1      yamt /*	$NetBSD: sfmpy.c,v 1.3.26.1 2007/02/27 16:51:28 yamt Exp $	*/
      2       1.1  fredette 
      3       1.1  fredette /*	$OpenBSD: sfmpy.c,v 1.4 2001/03/29 03:58:19 mickey Exp $	*/
      4       1.1  fredette 
      5       1.1  fredette /*
      6       1.1  fredette  * Copyright 1996 1995 by Open Software Foundation, Inc.
      7       1.1  fredette  *              All Rights Reserved
      8       1.1  fredette  *
      9       1.1  fredette  * Permission to use, copy, modify, and distribute this software and
     10       1.1  fredette  * its documentation for any purpose and without fee is hereby granted,
     11       1.1  fredette  * provided that the above copyright notice appears in all copies and
     12       1.1  fredette  * that both the copyright notice and this permission notice appear in
     13       1.1  fredette  * supporting documentation.
     14       1.1  fredette  *
     15       1.1  fredette  * OSF DISCLAIMS ALL WARRANTIES WITH REGARD TO THIS SOFTWARE
     16       1.1  fredette  * INCLUDING ALL IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS
     17       1.1  fredette  * FOR A PARTICULAR PURPOSE.
     18       1.1  fredette  *
     19       1.1  fredette  * IN NO EVENT SHALL OSF BE LIABLE FOR ANY SPECIAL, INDIRECT, OR
     20       1.1  fredette  * CONSEQUENTIAL DAMAGES OR ANY DAMAGES WHATSOEVER RESULTING FROM
     21       1.1  fredette  * LOSS OF USE, DATA OR PROFITS, WHETHER IN ACTION OF CONTRACT,
     22       1.1  fredette  * NEGLIGENCE, OR OTHER TORTIOUS ACTION, ARISING OUT OF OR IN CONNECTION
     23       1.1  fredette  * WITH THE USE OR PERFORMANCE OF THIS SOFTWARE.
     24       1.1  fredette  *
     25       1.1  fredette  */
     26       1.1  fredette /*
     27       1.1  fredette  * pmk1.1
     28       1.1  fredette  */
     29       1.1  fredette /*
     30       1.1  fredette  * (c) Copyright 1986 HEWLETT-PACKARD COMPANY
     31       1.1  fredette  *
     32       1.1  fredette  * To anyone who acknowledges that this file is provided "AS IS"
     33       1.1  fredette  * without any express or implied warranty:
     34       1.1  fredette  *     permission to use, copy, modify, and distribute this file
     35       1.1  fredette  * for any purpose is hereby granted without fee, provided that
     36       1.1  fredette  * the above copyright notice and this notice appears in all
     37       1.1  fredette  * copies, and that the name of Hewlett-Packard Company not be
     38       1.1  fredette  * used in advertising or publicity pertaining to distribution
     39       1.1  fredette  * of the software without specific, written prior permission.
     40       1.1  fredette  * Hewlett-Packard Company makes no representations about the
     41       1.1  fredette  * suitability of this software for any purpose.
     42       1.1  fredette  */
     43       1.2     lukem 
     44       1.2     lukem #include <sys/cdefs.h>
     45  1.3.26.1      yamt __KERNEL_RCSID(0, "$NetBSD: sfmpy.c,v 1.3.26.1 2007/02/27 16:51:28 yamt Exp $");
     46       1.1  fredette 
     47       1.1  fredette #include "../spmath/float.h"
     48       1.1  fredette #include "../spmath/sgl_float.h"
     49       1.1  fredette 
      50       1.1  fredette /*
      51       1.1  fredette  *  Single Precision Floating-point Multiply
                              *
                              *  Multiplies the single-precision value read from *srcptr1 by the
                              *  one read from *srcptr2 and stores the product through dstptr.
                              *
                              *  Parameters:
                              *	srcptr1, srcptr2  operands; each is read once into a local copy.
                              *	dstptr            receives the result (see the return values for
                              *	                  the cases in which it is left unwritten).
                              *	status            not referenced by name in this body.
                              *	                  NOTE(review): presumably consumed by the
                              *	                  flag/trap/rounding macros (Set_*flag,
                              *	                  Is_*trap_enabled, Rounding_mode) -- confirm
                              *	                  against float.h.
                              *
                              *  Returns:
                              *	NOEXCEPTION        result stored, no enabled trap was raised.
                              *	INVALIDEXCEPTION   invalid operation (infinity times zero, or a
                              *	                   signaling NaN operand) with the invalid trap
                              *	                   enabled; *dstptr is NOT written.
                              *	OVERFLOWEXCEPTION or UNDERFLOWEXCEPTION, each optionally ORed
                              *	                   with INEXACTEXCEPTION: the corresponding trap
                              *	                   is enabled; *dstptr holds the result with its
                              *	                   exponent set by Sgl_setwrapped_exponent.
                              *	INEXACTEXCEPTION   result stored, it is inexact and the inexact
                              *	                   trap is enabled.
      52       1.1  fredette  */
      53       1.1  fredette int
      54       1.1  fredette sgl_fmpy(srcptr1,srcptr2,dstptr,status)
      55       1.1  fredette 
      56       1.1  fredette sgl_floating_point *srcptr1, *srcptr2, *dstptr;
      57       1.1  fredette unsigned int *status;
      58       1.1  fredette {
                             	/*
                             	 * opnd1/opnd2: working copies of the operands,
                             	 * opnd3: product accumulator, result: value being assembled.
                             	 */
      59       1.1  fredette 	register unsigned int opnd1, opnd2, opnd3, result;
      60       1.1  fredette 	register int dest_exponent, count;
      61  1.3.26.1      yamt 	register int inexact = false, guardbit = false, stickybit = false;
      62       1.1  fredette 	int is_tiny;
      63       1.1  fredette 
      64       1.1  fredette 	opnd1 = *srcptr1;
      65       1.1  fredette 	opnd2 = *srcptr2;
      66       1.1  fredette 	/*
      67       1.1  fredette 	 * set sign bit of result
                             	 * (negative when exactly one operand has its sign bit set; the
                             	 * rest of result starts out as zero)
      68       1.1  fredette 	 */
      69       1.1  fredette 	if (Sgl_sign(opnd1) ^ Sgl_sign(opnd2)) Sgl_setnegativezero(result);
      70       1.1  fredette 	else Sgl_setzero(result);
      71       1.1  fredette 	/*
      72       1.1  fredette 	 * check first operand for NaN's or infinity
      73       1.1  fredette 	 */
      74       1.1  fredette 	if (Sgl_isinfinity_exponent(opnd1)) {
      75       1.1  fredette 		if (Sgl_iszero_mantissa(opnd1)) {
                             			/*
                             			 * opnd1 is an infinity.  When opnd2 is a NaN nothing
                             			 * is done here; control falls through to the
                             			 * second-operand check below, which handles the NaN.
                             			 */
      76       1.1  fredette 			if (Sgl_isnotnan(opnd2)) {
      77       1.1  fredette 				if (Sgl_iszero_exponentmantissa(opnd2)) {
      78       1.1  fredette 					/*
      79       1.1  fredette 					 * invalid since operands are infinity
      80       1.1  fredette 					 * and zero
      81       1.1  fredette 					 */
      82       1.1  fredette 					if (Is_invalidtrap_enabled())
      83       1.1  fredette 						return(INVALIDEXCEPTION);
      84       1.1  fredette 					Set_invalidflag();
      85       1.1  fredette 					Sgl_makequietnan(result);
      86       1.1  fredette 					*dstptr = result;
      87       1.1  fredette 					return(NOEXCEPTION);
      88       1.1  fredette 				}
      89       1.1  fredette 				/*
      90       1.1  fredette 				 * return infinity
                             				 * (result already carries the product's sign)
      91       1.1  fredette 				 */
      92       1.1  fredette 				Sgl_setinfinity_exponentmantissa(result);
      93       1.1  fredette 				*dstptr = result;
      94       1.1  fredette 				return(NOEXCEPTION);
      95       1.1  fredette 			}
      96       1.1  fredette 		}
      97       1.1  fredette 		else {
      98       1.1  fredette 			/*
      99       1.1  fredette 			 * is NaN; signaling or quiet?
     100       1.1  fredette 			 */
     101       1.1  fredette 			if (Sgl_isone_signaling(opnd1)) {
     102       1.1  fredette 				/* trap if INVALIDTRAP enabled */
     103       1.1  fredette 				if (Is_invalidtrap_enabled())
     104       1.1  fredette 					return(INVALIDEXCEPTION);
     105       1.1  fredette 				/* make NaN quiet */
     106       1.1  fredette 				Set_invalidflag();
     107       1.1  fredette 				Sgl_set_quiet(opnd1);
     108       1.1  fredette 			}
     109       1.1  fredette 			/*
     110       1.1  fredette 			 * is second operand a signaling NaN?
                             			 * (only reached when opnd1 is a quiet NaN; the
                             			 * quieted opnd2 is then returned instead of opnd1)
     111       1.1  fredette 			 */
     112       1.1  fredette 			else if (Sgl_is_signalingnan(opnd2)) {
     113       1.1  fredette 				/* trap if INVALIDTRAP enabled */
     114       1.1  fredette 				if (Is_invalidtrap_enabled())
     115       1.1  fredette 					return(INVALIDEXCEPTION);
     116       1.1  fredette 				/* make NaN quiet */
     117       1.1  fredette 				Set_invalidflag();
     118       1.1  fredette 				Sgl_set_quiet(opnd2);
     119       1.1  fredette 				*dstptr = opnd2;
     120       1.1  fredette 				return(NOEXCEPTION);
     121       1.1  fredette 			}
     122       1.1  fredette 			/*
     123       1.1  fredette 			 * return quiet NaN
     124       1.1  fredette 			 */
     125       1.1  fredette 			*dstptr = opnd1;
     126       1.1  fredette 			return(NOEXCEPTION);
     127       1.1  fredette 		}
     128       1.1  fredette 	}
     129       1.1  fredette 	/*
     130       1.1  fredette 	 * check second operand for NaN's or infinity
     131       1.1  fredette 	 */
     132       1.1  fredette 	if (Sgl_isinfinity_exponent(opnd2)) {
     133       1.1  fredette 		if (Sgl_iszero_mantissa(opnd2)) {
     134       1.1  fredette 			if (Sgl_iszero_exponentmantissa(opnd1)) {
     135       1.1  fredette 				/* invalid since operands are zero & infinity */
     136       1.1  fredette 				if (Is_invalidtrap_enabled())
     137       1.1  fredette 					return(INVALIDEXCEPTION);
     138       1.1  fredette 				Set_invalidflag();
     139       1.1  fredette 				Sgl_makequietnan(opnd2);
     140       1.1  fredette 				*dstptr = opnd2;
     141       1.1  fredette 				return(NOEXCEPTION);
     142       1.1  fredette 			}
     143       1.1  fredette 			/*
     144       1.1  fredette 			 * return infinity
     145       1.1  fredette 			 */
     146       1.1  fredette 			Sgl_setinfinity_exponentmantissa(result);
     147       1.1  fredette 			*dstptr = result;
     148       1.1  fredette 			return(NOEXCEPTION);
     149       1.1  fredette 		}
     150       1.1  fredette 		/*
     151       1.1  fredette 		 * is NaN; signaling or quiet?
     152       1.1  fredette 		 */
     153       1.1  fredette 		if (Sgl_isone_signaling(opnd2)) {
     154       1.1  fredette 			/* trap if INVALIDTRAP enabled */
     155       1.1  fredette 			if (Is_invalidtrap_enabled()) return(INVALIDEXCEPTION);
     156       1.1  fredette 
     157       1.1  fredette 			/* make NaN quiet */
     158       1.1  fredette 			Set_invalidflag();
     159       1.1  fredette 			Sgl_set_quiet(opnd2);
     160       1.1  fredette 		}
     161       1.1  fredette 		/*
     162       1.1  fredette 		 * return quiet NaN
     163       1.1  fredette 		 */
     164       1.1  fredette 		*dstptr = opnd2;
     165       1.1  fredette 		return(NOEXCEPTION);
     166       1.1  fredette 	}
     167       1.1  fredette 	/*
     168       1.1  fredette 	 * Generate exponent
                             	 * (sum of the two exponent fields with one bias removed; may
                             	 * be adjusted further by the normalization steps below)
     169       1.1  fredette 	 */
     170       1.1  fredette 	dest_exponent = Sgl_exponent(opnd1) + Sgl_exponent(opnd2) - SGL_BIAS;
     171       1.1  fredette 
     172       1.1  fredette 	/*
     173       1.1  fredette 	 * Generate mantissa
     174       1.1  fredette 	 */
     175       1.1  fredette 	if (Sgl_isnotzero_exponent(opnd1)) {
     176       1.1  fredette 		/* set hidden bit */
     177       1.1  fredette 		Sgl_clear_signexponent_set_hidden(opnd1);
     178       1.1  fredette 	}
     179       1.1  fredette 	else {
     180       1.1  fredette 		/* check for zero */
     181       1.1  fredette 		if (Sgl_iszero_mantissa(opnd1)) {
                             			/* zero operand: product is a zero with the computed sign */
     182       1.1  fredette 			Sgl_setzero_exponentmantissa(result);
     183       1.1  fredette 			*dstptr = result;
     184       1.1  fredette 			return(NOEXCEPTION);
     185       1.1  fredette 		}
     186       1.1  fredette 		/* is denormalized, adjust exponent */
                             		/*
                             		 * NOTE(review): Sgl_normalize is defined elsewhere; it
                             		 * presumably shifts opnd1 left until the hidden bit is set
                             		 * and lowers dest_exponent to match -- confirm in
                             		 * sgl_float.h.
                             		 */
     187       1.1  fredette 		Sgl_clear_signexponent(opnd1);
     188       1.1  fredette 		Sgl_leftshiftby1(opnd1);
     189       1.1  fredette 		Sgl_normalize(opnd1,dest_exponent);
     190       1.1  fredette 	}
     191       1.1  fredette 	/* opnd2 needs to have hidden bit set with msb in hidden bit */
     192       1.1  fredette 	if (Sgl_isnotzero_exponent(opnd2)) {
     193       1.1  fredette 		Sgl_clear_signexponent_set_hidden(opnd2);
     194       1.1  fredette 	}
     195       1.1  fredette 	else {
     196       1.1  fredette 		/* check for zero */
     197       1.1  fredette 		if (Sgl_iszero_mantissa(opnd2)) {
     198       1.1  fredette 			Sgl_setzero_exponentmantissa(result);
     199       1.1  fredette 			*dstptr = result;
     200       1.1  fredette 			return(NOEXCEPTION);
     201       1.1  fredette 		}
     202       1.1  fredette 		/* is denormalized; want to normalize */
     203       1.1  fredette 		Sgl_clear_signexponent(opnd2);
     204       1.1  fredette 		Sgl_leftshiftby1(opnd2);
     205       1.1  fredette 		Sgl_normalize(opnd2,dest_exponent);
     206       1.1  fredette 	}
     207       1.1  fredette 
     208       1.1  fredette 	/* Multiply two source mantissas together */
     209       1.1  fredette 
     210       1.1  fredette 	Sgl_leftshiftby4(opnd2);     /* make room for guard bits */
     211       1.1  fredette 	Sgl_setzero(opnd3);
     212       1.1  fredette 	/*
     213       1.1  fredette 	 * Four bits at a time are inspected in each loop, and a
     214       1.1  fredette 	 * simple shift and add multiply algorithm is used.
                             	 *
                             	 * Each pass first records in stickybit whatever Slow4 reports
                             	 * for opnd3 before opnd3 is shifted right by four, then adds
                             	 * opnd2 scaled by 8, 4, 2 and 1 according to four bits of
                             	 * opnd1, and finally shifts opnd1 right by four for the next
                             	 * pass.
                             	 * NOTE(review): Sbit28..Sbit31 appear to test the four
                             	 * least-significant bits of opnd1 (bit 31 being the LSB in
                             	 * this numbering) -- confirm against the macro definitions.
     215       1.1  fredette 	 */
     216       1.1  fredette 	for (count=1;count<SGL_P;count+=4) {
     217       1.1  fredette 		stickybit |= Slow4(opnd3);
     218       1.1  fredette 		Sgl_rightshiftby4(opnd3);
     219       1.1  fredette 		if (Sbit28(opnd1)) Sall(opnd3) += (Sall(opnd2) << 3);
     220       1.1  fredette 		if (Sbit29(opnd1)) Sall(opnd3) += (Sall(opnd2) << 2);
     221       1.1  fredette 		if (Sbit30(opnd1)) Sall(opnd3) += (Sall(opnd2) << 1);
     222       1.1  fredette 		if (Sbit31(opnd1)) Sall(opnd3) += Sall(opnd2);
     223       1.1  fredette 		Sgl_rightshiftby4(opnd1);
     224       1.1  fredette 	}
     225       1.1  fredette 	/* make sure result is left-justified */
     226       1.1  fredette 	if (Sgl_iszero_sign(opnd3)) {
     227       1.1  fredette 		Sgl_leftshiftby1(opnd3);
     228       1.1  fredette 	}
     229       1.1  fredette 	else {
     230       1.1  fredette 		/* result mantissa >= 2. */
     231       1.1  fredette 		dest_exponent++;
     232       1.1  fredette 	}
     233       1.1  fredette 	/* check for denormalized result */
                             	/* keep shifting left, lowering the exponent, until the top bit is set */
     234       1.1  fredette 	while (Sgl_iszero_sign(opnd3)) {
     235       1.1  fredette 		Sgl_leftshiftby1(opnd3);
     236       1.1  fredette 		dest_exponent--;
     237       1.1  fredette 	}
     238       1.1  fredette 	/*
     239       1.1  fredette 	 * check for guard, sticky and inexact bits
                             	 * (taken from the left-justified product before it is shifted
                             	 * right by eight below; the result is inexact if either is set)
     240       1.1  fredette 	 */
     241       1.1  fredette 	stickybit |= Sgl_all(opnd3) << (SGL_BITLENGTH - SGL_EXP_LENGTH + 1);
     242       1.1  fredette 	guardbit = Sbit24(opnd3);
     243       1.1  fredette 	inexact = guardbit | stickybit;
     244       1.1  fredette 
     245       1.1  fredette 	/* re-align mantissa */
     246       1.1  fredette 	Sgl_rightshiftby8(opnd3);
     247       1.1  fredette 
     248       1.1  fredette 	/*
     249       1.1  fredette 	 * round result
                             	 *
                             	 * Rounding happens here only when the exponent is positive or
                             	 * the underflow trap is enabled.  Otherwise (dest_exponent <= 0
                             	 * with the trap disabled) the underflow path below rounds after
                             	 * denormalizing.  The switch has no case for any other rounding
                             	 * mode, so in that situation opnd3 is left unincremented.
     250       1.1  fredette 	 */
     251       1.1  fredette 	if (inexact && (dest_exponent>0 || Is_underflowtrap_enabled())) {
     252       1.1  fredette 		Sgl_clear_signexponent(opnd3);
     253       1.1  fredette 		switch (Rounding_mode()) {
     254       1.1  fredette 			case ROUNDPLUS:
     255       1.1  fredette 				if (Sgl_iszero_sign(result))
     256       1.1  fredette 					Sgl_increment(opnd3);
     257       1.1  fredette 				break;
     258       1.1  fredette 			case ROUNDMINUS:
     259       1.1  fredette 				if (Sgl_isone_sign(result))
     260       1.1  fredette 					Sgl_increment(opnd3);
     261       1.1  fredette 				break;
     262       1.1  fredette 			case ROUNDNEAREST:
     263       1.1  fredette 				if (guardbit &&
     264       1.1  fredette 				    (stickybit || Sgl_isone_lowmantissa(opnd3)))
     265       1.1  fredette 					Sgl_increment(opnd3);
     266       1.1  fredette 				break;
     267       1.1  fredette 		}
                             		/*
                             		 * The hidden bit was cleared before the increment, so
                             		 * finding it set now means the increment carried out of
                             		 * the mantissa: bump the exponent.
                             		 */
     268       1.1  fredette 		if (Sgl_isone_hidden(opnd3)) dest_exponent++;
     269       1.1  fredette 	}
     270       1.1  fredette 	Sgl_set_mantissa(result,opnd3);
     271       1.1  fredette 
     272       1.1  fredette 	/*
     273       1.1  fredette 	 * Test for overflow
     274       1.1  fredette 	 */
     275       1.1  fredette 	if (dest_exponent >= SGL_INFINITY_EXPONENT) {
     276       1.1  fredette 		/* trap if OVERFLOWTRAP enabled */
     277       1.1  fredette 		if (Is_overflowtrap_enabled()) {
     278       1.1  fredette 			/*
     279       1.1  fredette 			 * Adjust bias of result
     280       1.1  fredette 			 */
     281       1.1  fredette 			Sgl_setwrapped_exponent(result,dest_exponent,ovfl);
     282       1.1  fredette 			*dstptr = result;
     283       1.1  fredette 			if (inexact) {
     284       1.1  fredette 			    if (Is_inexacttrap_enabled())
     285       1.1  fredette 				return(OVERFLOWEXCEPTION | INEXACTEXCEPTION);
     286       1.1  fredette 			    else Set_inexactflag();
     287       1.1  fredette 			}
     288       1.1  fredette 			return(OVERFLOWEXCEPTION);
     289       1.1  fredette 		}
                             		/* untrapped overflow is always reported as inexact below */
     290  1.3.26.1      yamt 		inexact = true;
     291       1.1  fredette 		Set_overflowflag();
     292       1.1  fredette 		/* set result to infinity or largest number */
     293       1.1  fredette 		Sgl_setoverflow(result);
     294       1.1  fredette 	}
     295       1.1  fredette 	/*
     296       1.1  fredette 	 * Test for underflow
     297       1.1  fredette 	 */
     298       1.1  fredette 	else if (dest_exponent <= 0) {
     299       1.1  fredette 		/* trap if UNDERFLOWTRAP enabled */
     300       1.1  fredette 		if (Is_underflowtrap_enabled()) {
     301       1.1  fredette 			/*
     302       1.1  fredette 			 * Adjust bias of result
     303       1.1  fredette 			 */
     304       1.1  fredette 			Sgl_setwrapped_exponent(result,dest_exponent,unfl);
     305       1.1  fredette 			*dstptr = result;
     306       1.1  fredette 			if (inexact) {
     307       1.1  fredette 			    if (Is_inexacttrap_enabled())
     308       1.1  fredette 				return(UNDERFLOWEXCEPTION | INEXACTEXCEPTION);
     309       1.1  fredette 			    else Set_inexactflag();
     310       1.1  fredette 			}
     311       1.1  fredette 			return(UNDERFLOWEXCEPTION);
     312       1.1  fredette 		}
     313       1.1  fredette 
     314       1.1  fredette 		/* Determine if should set underflow flag */
                             		/*
                             		 * The result is assumed tiny unless, with dest_exponent
                             		 * exactly 0, the rounding increment for the current mode
                             		 * would set the bit tested by Sgl_isone_hiddenoverflow.
                             		 * Each case does a trial increment and then undoes it with
                             		 * Sgl_decrement, so opnd3 is unchanged afterwards.
                             		 */
     315  1.3.26.1      yamt 		is_tiny = true;
     316       1.1  fredette 		if (dest_exponent == 0 && inexact) {
     317       1.1  fredette 			switch (Rounding_mode()) {
     318       1.1  fredette 			case ROUNDPLUS:
     319       1.1  fredette 				if (Sgl_iszero_sign(result)) {
     320       1.1  fredette 					Sgl_increment(opnd3);
     321       1.1  fredette 					if (Sgl_isone_hiddenoverflow(opnd3))
     322  1.3.26.1      yamt 						is_tiny = false;
     323       1.1  fredette 					Sgl_decrement(opnd3);
     324       1.1  fredette 				}
     325       1.1  fredette 				break;
     326       1.1  fredette 			case ROUNDMINUS:
     327       1.1  fredette 				if (Sgl_isone_sign(result)) {
     328       1.1  fredette 					Sgl_increment(opnd3);
     329       1.1  fredette 					if (Sgl_isone_hiddenoverflow(opnd3))
     330  1.3.26.1      yamt 						is_tiny = false;
     331       1.1  fredette 					Sgl_decrement(opnd3);
     332       1.1  fredette 				}
     333       1.1  fredette 				break;
     334       1.1  fredette 			case ROUNDNEAREST:
     335       1.1  fredette 				if (guardbit && (stickybit ||
     336       1.1  fredette 				    Sgl_isone_lowmantissa(opnd3))) {
     337       1.1  fredette 					Sgl_increment(opnd3);
     338       1.1  fredette 					if (Sgl_isone_hiddenoverflow(opnd3))
     339  1.3.26.1      yamt 						is_tiny = false;
     340       1.1  fredette 					Sgl_decrement(opnd3);
     341       1.1  fredette 				}
     342       1.1  fredette 				break;
     343       1.1  fredette 			}
     344       1.1  fredette 		}
     345       1.1  fredette 
     346       1.1  fredette 		/*
     347       1.1  fredette 		 * denormalize result or set to signed zero
                             		 *
                             		 * stickybit is first overwritten with the inexact status
                             		 * computed so far, so that bits already lost stay accounted
                             		 * for.
                             		 * NOTE(review): Sgl_denormalize is defined elsewhere and
                             		 * presumably updates opnd3, guardbit, stickybit and inexact
                             		 * in place -- confirm in sgl_float.h.
     348       1.1  fredette 		 */
     349       1.1  fredette 		stickybit = inexact;
     350       1.1  fredette 		Sgl_denormalize(opnd3,dest_exponent,guardbit,stickybit,inexact);
     351       1.1  fredette 
     352       1.1  fredette 		/* return zero or smallest number */
     353       1.1  fredette 		if (inexact) {
     354       1.1  fredette 			switch (Rounding_mode()) {
     355       1.1  fredette 			case ROUNDPLUS:
     356       1.1  fredette 				if (Sgl_iszero_sign(result))
     357       1.1  fredette 					Sgl_increment(opnd3);
     358       1.1  fredette 				break;
     359       1.1  fredette 			case ROUNDMINUS:
     360       1.1  fredette 				if (Sgl_isone_sign(result))
     361       1.1  fredette 					Sgl_increment(opnd3);
     362       1.1  fredette 				break;
     363       1.1  fredette 			case ROUNDNEAREST:
     364       1.1  fredette 				if (guardbit && (stickybit ||
     365       1.1  fredette 				    Sgl_isone_lowmantissa(opnd3)))
     366       1.1  fredette 					Sgl_increment(opnd3);
     367       1.1  fredette 				break;
     368       1.1  fredette 			}
                             		/*
                             		 * Despite its indentation the next statement is still
                             		 * inside the "if (inexact)" block: the underflow flag is
                             		 * raised only when the result is both inexact and tiny.
                             		 */
     369       1.1  fredette 		if (is_tiny) Set_underflowflag();
     370       1.1  fredette 		}
     371       1.1  fredette 		Sgl_set_exponentmantissa(result,opnd3);
     372       1.1  fredette 	}
                             	/* normal range: just install the exponent next to the mantissa set above */
     373       1.1  fredette 	else Sgl_set_exponent(result,dest_exponent);
     374       1.1  fredette 	*dstptr = result;
     375       1.1  fredette 
     376       1.1  fredette 	/* check for inexact */
                             	/* the result has already been stored when the inexact trap is reported */
     377       1.1  fredette 	if (inexact) {
     378       1.1  fredette 		if (Is_inexacttrap_enabled()) return(INEXACTEXCEPTION);
     379       1.1  fredette 		else Set_inexactflag();
     380       1.1  fredette 	}
     381       1.1  fredette 	return(NOEXCEPTION);
     382       1.1  fredette }
    383