Home | History | Annotate | Line # | Download | only in i387
fenv.c revision 1.10
      1  1.10    andvar /* $NetBSD: fenv.c,v 1.10 2021/09/03 21:54:59 andvar Exp $ */
      2   1.1     joerg 
      3   1.1     joerg /*-
      4   1.1     joerg  * Copyright (c) 2004-2005 David Schultz <das (at) FreeBSD.ORG>
      5   1.1     joerg  * All rights reserved.
      6   1.1     joerg  *
      7   1.1     joerg  * Redistribution and use in source and binary forms, with or without
      8   1.1     joerg  * modification, are permitted provided that the following conditions
      9   1.1     joerg  * are met:
     10   1.1     joerg  * 1. Redistributions of source code must retain the above copyright
     11   1.1     joerg  *    notice, this list of conditions and the following disclaimer.
     12   1.1     joerg  * 2. Redistributions in binary form must reproduce the above copyright
     13   1.1     joerg  *    notice, this list of conditions and the following disclaimer in the
     14   1.1     joerg  *    documentation and/or other materials provided with the distribution.
     15   1.1     joerg  *
     16   1.1     joerg  * THIS SOFTWARE IS PROVIDED BY THE AUTHOR AND CONTRIBUTORS ``AS IS'' AND
     17   1.1     joerg  * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
     18   1.1     joerg  * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
     19   1.1     joerg  * ARE DISCLAIMED.  IN NO EVENT SHALL THE AUTHOR OR CONTRIBUTORS BE LIABLE
     20   1.1     joerg  * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
     21   1.1     joerg  * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
     22   1.1     joerg  * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
     23   1.1     joerg  * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
     24   1.1     joerg  * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
     25   1.1     joerg  * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
     26   1.1     joerg  * SUCH DAMAGE.
     27   1.1     joerg  */
     28   1.1     joerg 
     29   1.1     joerg #include <sys/cdefs.h>
     30  1.10    andvar __RCSID("$NetBSD: fenv.c,v 1.10 2021/09/03 21:54:59 andvar Exp $");
     31   1.8       chs 
     32   1.8       chs #include "namespace.h"
     33   1.1     joerg 
     34   1.1     joerg #include <sys/param.h>
     35   1.1     joerg #include <sys/sysctl.h>
     36   1.1     joerg #include <assert.h>
     37   1.1     joerg #include <fenv.h>
     38   1.1     joerg #include <stddef.h>
     39   1.1     joerg #include <string.h>
     40   1.1     joerg 
/*
 * When the toolchain provides __weak_alias, pair every public <fenv.h>
 * entry point defined in this file with its underscore-prefixed name.
 * NOTE(review): presumably "namespace.h" renames the definitions below to
 * the underscore-prefixed symbols and these aliases re-export the public
 * names weakly -- confirm against namespace.h.
 */
#ifdef __weak_alias
__weak_alias(feclearexcept,_feclearexcept)
__weak_alias(fedisableexcept,_fedisableexcept)
__weak_alias(feenableexcept,_feenableexcept)
__weak_alias(fegetenv,_fegetenv)
__weak_alias(fegetexcept,_fegetexcept)
__weak_alias(fegetexceptflag,_fegetexceptflag)
__weak_alias(fegetround,_fegetround)
__weak_alias(feholdexcept,_feholdexcept)
__weak_alias(feraiseexcept,_feraiseexcept)
__weak_alias(fesetenv,_fesetenv)
__weak_alias(fesetexceptflag,_fesetexceptflag)
__weak_alias(fesetround,_fesetround)
__weak_alias(fetestexcept,_fetestexcept)
__weak_alias(feupdateenv,_feupdateenv)
#endif
     57   1.8       chs 
/*
 * Thin wrappers around the x87 and SSE control/status instructions.
 * Each macro expands to a single volatile inline-assembly statement.
 *
 * The "store" macros (__fnstcw, __fnstsw, __fnstenv, __stmxcsr) take a
 * POINTER to the destination object.  The "load" macros (__fldcw,
 * __fldenv, __ldmxcsr) take the object itself; it is used as a memory
 * operand, so it must be an lvalue.
 */

/* Load x87 Control Word */
#define	__fldcw(__cw)		__asm__ __volatile__	\
	("fldcw %0" : : "m" (__cw))

/* No-Wait Store Control Word */
#define	__fnstcw(__cw)		__asm__ __volatile__	\
	("fnstcw %0" : "=m" (*(__cw)))

/* No-Wait Store Status Word (destination may be %ax or memory) */
#define	__fnstsw(__sw)		__asm__ __volatile__	\
	("fnstsw %0" : "=am" (*(__sw)))

/* No-Wait Clear Exception Flags */
#define	__fnclex()		__asm__ __volatile__	\
	("fnclex")

/* Load x87 Environment */
#define	__fldenv(__env)		__asm__ __volatile__	\
	("fldenv %0" : : "m" (__env))

/* No-Wait Store x87 environment */
#define	__fnstenv(__env)	__asm__ __volatile__	\
	("fnstenv %0" : "=m" (*(__env)))

/*
 * Check for and handle pending unmasked x87 FPU exceptions.
 * The instruction has no operand, so the macro takes no argument.
 */
#define	__fwait()		__asm__	__volatile__	\
	("fwait")

/* Load the MXCSR register */
#define	__ldmxcsr(__mxcsr)	__asm__ __volatile__	\
	("ldmxcsr %0" : : "m" (__mxcsr))

/* Store the MXCSR register state */
#define	__stmxcsr(__mxcsr)	__asm__ __volatile__	\
	("stmxcsr %0" : "=m" (*(__mxcsr)))
     93   1.1     joerg 
     94   1.1     joerg /*
     95   1.1     joerg  * The following constant represents the default floating-point environment
     96   1.1     joerg  * (that is, the one installed at program startup) and has type pointer to
     97   1.1     joerg  * const-qualified fenv_t.
     98   1.1     joerg  *
     99   1.1     joerg  * It can be used as an argument to the functions within the <fenv.h> header
    100   1.1     joerg  * that manage the floating-point environment, namely fesetenv() and
    101   1.1     joerg  * feupdateenv().
    102   1.1     joerg  *
    103   1.1     joerg  * x87 fpu registers are 16bit wide. The upper bits, 31-16, are marked as
    104   1.1     joerg  * RESERVED. We provide a partial floating-point environment, where we
    105   1.1     joerg  * define only the lower bits. The reserved bits are extracted and set by the
    106   1.1     joerg  * consumers of FE_DFL_ENV, during runtime.
    107   1.1     joerg  */
    108   1.1     joerg fenv_t __fe_dfl_env = {
    109   1.9  christos 	.x87 = {
    110   1.9  christos 		.control = __NetBSD_NPXCW__,    /* Control word register */
    111   1.9  christos 		.unused1 = 0,			/* Unused */
    112   1.9  christos 		.status = 0,  		     	/* Status word register */
    113   1.9  christos 		.unused2 = 0,			/* Unused */
    114   1.9  christos 		.tag = 0xffff,          	/* Tag word register */
    115   1.9  christos 		.unused3 = 0,			/* Unused */
    116   1.9  christos 		.others = {
    117   1.9  christos 			0, 0, 0, 0x0000ffff,
    118   1.1     joerg 		}
    119   1.1     joerg 	},
    120   1.9  christos 	.mxcsr = __INITIAL_MXCSR__		/* MXCSR register */
    121   1.1     joerg };
    122   1.1     joerg 
    123   1.1     joerg /*
    124   1.1     joerg  * Test for SSE support on this processor.
    125   1.1     joerg  *
    126   1.1     joerg  * We need to use ldmxcsr/stmxcsr to get correct results if any part
    127   1.1     joerg  * of the program was compiled to use SSE floating-point, but we can't
    128   1.1     joerg  * use SSE on older processors.
    129   1.1     joerg  *
    130   1.1     joerg  * In order to do so, we need to query the processor capabilities via the CPUID
    131   1.1     joerg  * instruction. We can make it even simpler though, by querying the machdep.sse
    132   1.1     joerg  * sysctl.
    133   1.1     joerg  */
    134   1.1     joerg static int __HAS_SSE = 0;
    135   1.1     joerg 
    136   1.6     joerg static void __init_libm(void) __attribute__ ((constructor, used));
    137   1.1     joerg 
    138   1.6     joerg static void __init_libm(void)
    139   1.1     joerg {
    140   1.3      taca 	size_t oldlen = sizeof(__HAS_SSE);
    141   1.1     joerg 	int rv;
    142   1.6     joerg 	uint16_t control;
    143   1.1     joerg 
    144   1.1     joerg 	rv = sysctlbyname("machdep.sse", &__HAS_SSE, &oldlen, NULL, 0);
    145   1.1     joerg 	if (rv == -1)
    146   1.1     joerg 		__HAS_SSE = 0;
    147   1.6     joerg 
    148   1.6     joerg 	__fnstcw(&control);
    149   1.6     joerg 	__fe_dfl_env.x87.control = control;
    150   1.1     joerg }
    151   1.1     joerg 
    152   1.1     joerg /*
    153   1.1     joerg  * The feclearexcept() function clears the supported floating-point exceptions
    154   1.1     joerg  * represented by `excepts'.
    155   1.1     joerg  */
    156   1.1     joerg int
    157   1.1     joerg feclearexcept(int excepts)
    158   1.1     joerg {
    159   1.1     joerg 	fenv_t env;
    160   1.1     joerg 	uint32_t mxcsr;
    161   1.1     joerg 	int ex;
    162   1.1     joerg 
    163   1.1     joerg 	_DIAGASSERT((excepts & ~FE_ALL_EXCEPT) == 0);
    164   1.1     joerg 
    165   1.1     joerg 	ex = excepts & FE_ALL_EXCEPT;
    166   1.1     joerg 
    167   1.1     joerg 	/* It's ~3x faster to call fnclex, than store/load fp env */
    168   1.1     joerg 	if (ex == FE_ALL_EXCEPT) {
    169   1.1     joerg 		__fnclex();
    170   1.1     joerg 	} else {
    171   1.1     joerg 		__fnstenv(&env);
    172   1.1     joerg 		env.x87.status &= ~ex;
    173   1.1     joerg 		__fldenv(env);
    174   1.1     joerg 	}
    175   1.1     joerg 
    176   1.1     joerg 	if (__HAS_SSE) {
    177   1.1     joerg 		__stmxcsr(&mxcsr);
    178   1.1     joerg 		mxcsr &= ~ex;
    179   1.1     joerg 		__ldmxcsr(mxcsr);
    180   1.1     joerg 	}
    181   1.1     joerg 
    182   1.1     joerg 	/* Success */
    183   1.1     joerg 	return (0);
    184   1.1     joerg }
    185   1.1     joerg 
    186   1.1     joerg /*
    187   1.1     joerg  * The fegetexceptflag() function stores an implementation-defined
    188   1.1     joerg  * representation of the states of the floating-point status flags indicated by
    189   1.1     joerg  * the argument excepts in the object pointed to by the argument flagp.
    190   1.1     joerg  */
    191   1.1     joerg int
    192   1.1     joerg fegetexceptflag(fexcept_t *flagp, int excepts)
    193   1.1     joerg {
    194   1.1     joerg 	uint32_t mxcsr;
    195   1.1     joerg 	uint16_t status;
    196   1.1     joerg 	int ex;
    197   1.1     joerg 
    198   1.1     joerg 	_DIAGASSERT(flagp != NULL);
    199   1.1     joerg 	_DIAGASSERT((excepts & ~FE_ALL_EXCEPT) == 0);
    200   1.1     joerg 
    201   1.1     joerg 	ex = excepts & FE_ALL_EXCEPT;
    202   1.1     joerg 
    203   1.1     joerg 	__fnstsw(&status);
    204   1.1     joerg 	if (__HAS_SSE)
    205   1.1     joerg 		__stmxcsr(&mxcsr);
    206   1.1     joerg 	else
    207   1.1     joerg 		mxcsr = 0;
    208   1.1     joerg 
    209   1.1     joerg 	*flagp = (mxcsr | status) & ex;
    210   1.1     joerg 
    211   1.1     joerg 	/* Success */
    212   1.1     joerg 	return (0);
    213   1.1     joerg }
    214   1.1     joerg 
/*
 * feraiseexcept(): raise the floating-point exceptions named by `excepts'.
 *
 * Although the standard permits raising an exception by executing an
 * instruction that triggers it, this implementation writes the flags
 * straight into the status registers through fesetexceptflag() and then
 * issues fwait so that any exception that is now pending and unmasked is
 * delivered.
 *
 * Masking of `excepts' for the register update is left to
 * fesetexceptflag().  Always returns 0.
 */
int
feraiseexcept(int excepts)
{
	fexcept_t flags = excepts & FE_ALL_EXCEPT;

	_DIAGASSERT((excepts & ~FE_ALL_EXCEPT) == 0);

	fesetexceptflag(&flags, excepts);
	__fwait();

	return (0);
}
    239   1.1     joerg 
    240   1.1     joerg /*
    241   1.1     joerg  * This function sets the floating-point status flags indicated by the argument
    242   1.1     joerg  * `excepts' to the states stored in the object pointed to by `flagp'. It does
    243   1.1     joerg  * NOT raise any floating-point exceptions, but only sets the state of the flags.
    244   1.1     joerg  */
    245   1.1     joerg int
    246   1.1     joerg fesetexceptflag(const fexcept_t *flagp, int excepts)
    247   1.1     joerg {
    248   1.1     joerg 	fenv_t env;
    249   1.1     joerg 	uint32_t mxcsr;
    250   1.1     joerg 	int ex;
    251   1.1     joerg 
    252   1.1     joerg 	_DIAGASSERT(flagp != NULL);
    253   1.1     joerg 	_DIAGASSERT((excepts & ~FE_ALL_EXCEPT) == 0);
    254   1.1     joerg 
    255   1.1     joerg 	ex = excepts & FE_ALL_EXCEPT;
    256   1.1     joerg 
    257   1.1     joerg 	__fnstenv(&env);
    258   1.1     joerg 	env.x87.status &= ~ex;
    259   1.1     joerg 	env.x87.status |= *flagp & ex;
    260   1.1     joerg 	__fldenv(env);
    261   1.1     joerg 
    262   1.1     joerg 	if (__HAS_SSE) {
    263   1.1     joerg 		__stmxcsr(&mxcsr);
    264   1.1     joerg 		mxcsr &= ~ex;
    265   1.1     joerg 		mxcsr |= *flagp & ex;
    266   1.1     joerg 		__ldmxcsr(mxcsr);
    267   1.1     joerg 	}
    268   1.1     joerg 
    269   1.1     joerg 	/* Success */
    270   1.1     joerg 	return (0);
    271   1.1     joerg }
    272   1.1     joerg 
    273   1.1     joerg /*
    274   1.1     joerg  * The fetestexcept() function determines which of a specified subset of the
    275   1.1     joerg  * floating-point exception flags are currently set. The `excepts' argument
    276   1.1     joerg  * specifies the floating-point status flags to be queried.
    277   1.1     joerg  */
    278   1.1     joerg int
    279   1.1     joerg fetestexcept(int excepts)
    280   1.1     joerg {
    281   1.1     joerg 	uint32_t mxcsr;
    282   1.1     joerg 	uint16_t status;
    283   1.1     joerg 	int ex;
    284   1.1     joerg 
    285   1.1     joerg 	_DIAGASSERT((excepts & ~FE_ALL_EXCEPT) == 0);
    286   1.1     joerg 
    287   1.1     joerg 	ex = excepts & FE_ALL_EXCEPT;
    288   1.1     joerg 
    289   1.1     joerg 	__fnstsw(&status);
    290   1.1     joerg 	if (__HAS_SSE)
    291   1.1     joerg 		__stmxcsr(&mxcsr);
    292   1.1     joerg 	else
    293   1.1     joerg 		mxcsr = 0;
    294   1.1     joerg 
    295   1.1     joerg 	return ((status | mxcsr) & ex);
    296   1.1     joerg }
    297   1.1     joerg 
    298   1.1     joerg int
    299   1.1     joerg fegetround(void)
    300   1.1     joerg {
    301   1.1     joerg 	uint16_t control;
    302   1.1     joerg 
    303   1.1     joerg 	/*
    304   1.1     joerg 	 * We assume that the x87 and the SSE unit agree on the
    305   1.1     joerg 	 * rounding mode.  Reading the control word on the x87 turns
    306   1.1     joerg 	 * out to be about 5 times faster than reading it on the SSE
    307   1.1     joerg 	 * unit on an Opteron 244.
    308   1.1     joerg 	 */
    309   1.1     joerg 	__fnstcw(&control);
    310   1.1     joerg 
    311   1.1     joerg 	return (control & __X87_ROUND_MASK);
    312   1.1     joerg }
    313   1.1     joerg 
    314   1.1     joerg /*
    315   1.1     joerg  * The fesetround() function shall establish the rounding direction represented
    316   1.1     joerg  * by its argument round. If the argument is not equal to the value of a
    317   1.1     joerg  * rounding direction macro, the rounding direction is not changed.
    318   1.1     joerg  */
    319   1.1     joerg int
    320   1.1     joerg fesetround(int round)
    321   1.1     joerg {
    322   1.1     joerg 	uint32_t mxcsr;
    323   1.1     joerg 	uint16_t control;
    324   1.1     joerg 
    325   1.1     joerg 	if (round & ~__X87_ROUND_MASK) {
    326   1.1     joerg 		/* Failure */
    327   1.1     joerg 		return (-1);
    328   1.1     joerg 	}
    329   1.1     joerg 
    330   1.1     joerg 	__fnstcw(&control);
    331   1.1     joerg 	control &= ~__X87_ROUND_MASK;
    332   1.1     joerg 	control |= round;
    333   1.1     joerg 	__fldcw(control);
    334   1.1     joerg 
    335   1.1     joerg 	if (__HAS_SSE) {
    336   1.1     joerg 		__stmxcsr(&mxcsr);
    337   1.1     joerg 		mxcsr &= ~(__X87_ROUND_MASK << __SSE_ROUND_SHIFT);
    338   1.1     joerg 		mxcsr |= round << __SSE_ROUND_SHIFT;
    339   1.1     joerg 		__ldmxcsr(mxcsr);
    340   1.1     joerg 	}
    341   1.1     joerg 
    342   1.1     joerg 	/* Success */
    343   1.1     joerg 	return (0);
    344   1.1     joerg }
    345   1.1     joerg 
    346   1.1     joerg /*
    347   1.1     joerg  * The fegetenv() function attempts to store the current floating-point
    348   1.1     joerg  * environment in the object pointed to by envp.
    349   1.1     joerg  */
    350   1.1     joerg int
    351   1.1     joerg fegetenv(fenv_t *envp)
    352   1.1     joerg {
    353   1.1     joerg 	uint32_t mxcsr;
    354   1.1     joerg 
    355   1.1     joerg 	_DIAGASSERT(flagp != NULL);
    356   1.1     joerg 
    357   1.1     joerg 	/*
    358   1.1     joerg 	 * fnstenv masks all exceptions, so we need to restore the old control
    359   1.1     joerg 	 * word to avoid this side effect.
    360   1.1     joerg 	 */
    361   1.1     joerg 	__fnstenv(envp);
    362   1.1     joerg 	__fldcw(envp->x87.control);
    363   1.1     joerg 	if (__HAS_SSE) {
    364   1.1     joerg 		__stmxcsr(&mxcsr);
    365   1.1     joerg 		envp->mxcsr = mxcsr;
    366   1.1     joerg 	}
    367   1.1     joerg 
    368   1.1     joerg 	/* Success */
    369   1.1     joerg 	return (0);
    370   1.1     joerg }
    371   1.1     joerg 
    372   1.1     joerg /*
    373   1.1     joerg  * The feholdexcept() function saves the current floating-point environment in
    374   1.1     joerg  * the object pointed to by envp, clears the floating-point status flags, and
    375   1.1     joerg  * then installs a non-stop (continue on floating-point exceptions) mode, if
    376   1.1     joerg  * available, for all floating-point exceptions.
    377   1.1     joerg  */
    378   1.1     joerg int
    379   1.1     joerg feholdexcept(fenv_t *envp)
    380   1.1     joerg {
    381   1.1     joerg 	uint32_t mxcsr;
    382   1.1     joerg 
    383   1.1     joerg 	_DIAGASSERT(envp != NULL);
    384   1.1     joerg 
    385   1.1     joerg 	__fnstenv(envp);
    386   1.1     joerg 	__fnclex();
    387   1.1     joerg 	if (__HAS_SSE) {
    388   1.1     joerg 		__stmxcsr(&mxcsr);
    389   1.1     joerg 		envp->mxcsr = mxcsr;
    390   1.1     joerg 		mxcsr &= ~FE_ALL_EXCEPT;
    391   1.1     joerg 		mxcsr |= FE_ALL_EXCEPT << __SSE_EMASK_SHIFT;
    392   1.1     joerg 		__ldmxcsr(mxcsr);
    393   1.1     joerg 	}
    394   1.1     joerg 
    395   1.1     joerg 	/* Success */
    396   1.1     joerg 	return (0);
    397   1.1     joerg }
    398   1.1     joerg 
    399   1.1     joerg /*
    400   1.1     joerg  * The fesetenv() function attempts to establish the floating-point environment
    401   1.1     joerg  * represented by the object pointed to by envp. The argument `envp' points
    402   1.1     joerg  * to an object set by a call to fegetenv() or feholdexcept(), or equal a
    403   1.1     joerg  * floating-point environment macro. The fesetenv() function does not raise
    404   1.1     joerg  * floating-point exceptions, but only installs the state of the floating-point
    405   1.1     joerg  * status flags represented through its argument.
    406   1.1     joerg  */
    407   1.1     joerg int
    408   1.1     joerg fesetenv(const fenv_t *envp)
    409   1.1     joerg {
    410   1.1     joerg 	fenv_t env;
    411   1.1     joerg 
    412   1.1     joerg 	_DIAGASSERT(envp != NULL);
    413   1.1     joerg 
    414   1.1     joerg 	/* Store the x87 floating-point environment */
    415   1.1     joerg 	memset(&env, 0, sizeof(env));
    416   1.1     joerg 	__fnstenv(&env);
    417   1.1     joerg 
    418   1.1     joerg 	__fe_dfl_env.x87.unused1 = env.x87.unused1;
    419   1.1     joerg 	__fe_dfl_env.x87.unused2 = env.x87.unused2;
    420   1.1     joerg 	__fe_dfl_env.x87.unused3 = env.x87.unused3;
    421   1.7  christos 	memcpy(__fe_dfl_env.x87.others, env.x87.others,
    422   1.7  christos 	    sizeof(__fe_dfl_env.x87.others));
    423   1.1     joerg 
    424   1.1     joerg 	__fldenv(envp->x87);
    425   1.1     joerg 	if (__HAS_SSE)
    426   1.1     joerg 		__ldmxcsr(envp->mxcsr);
    427   1.1     joerg 
    428   1.1     joerg 	/* Success */
    429   1.1     joerg 	return (0);
    430   1.1     joerg }
    431   1.1     joerg 
    432   1.1     joerg /*
    433   1.1     joerg  * The feupdateenv() function saves the currently raised floating-point
    434   1.1     joerg  * exceptions in its automatic storage, installs the floating-point environment
    435   1.1     joerg  * represented by the object pointed to by `envp', and then raises the saved
    436   1.1     joerg  * floating-point exceptions. The argument `envp' shall point to an object set
    437   1.1     joerg  * by a call to feholdexcept() or fegetenv(), or equal a floating-point
    438   1.1     joerg  * environment macro.
    439   1.1     joerg  */
    440   1.1     joerg int
    441   1.1     joerg feupdateenv(const fenv_t *envp)
    442   1.1     joerg {
    443   1.1     joerg 	fenv_t env;
    444   1.1     joerg 	uint32_t mxcsr;
    445   1.1     joerg 	uint16_t status;
    446   1.1     joerg 
    447   1.1     joerg 	_DIAGASSERT(envp != NULL);
    448   1.1     joerg 
    449   1.1     joerg 	/* Store the x87 floating-point environment */
    450   1.1     joerg 	memset(&env, 0, sizeof(env));
    451   1.1     joerg 	__fnstenv(&env);
    452   1.1     joerg 
    453   1.1     joerg 	__fe_dfl_env.x87.unused1 = env.x87.unused1;
    454   1.1     joerg 	__fe_dfl_env.x87.unused2 = env.x87.unused2;
    455   1.1     joerg 	__fe_dfl_env.x87.unused3 = env.x87.unused3;
    456   1.7  christos 	memcpy(__fe_dfl_env.x87.others, env.x87.others,
    457   1.7  christos 	    sizeof(__fe_dfl_env.x87.others));
    458   1.1     joerg 
    459   1.1     joerg 	__fnstsw(&status);
    460   1.1     joerg 	if (__HAS_SSE)
    461   1.1     joerg 		__stmxcsr(&mxcsr);
    462   1.1     joerg 	else
    463   1.1     joerg 		mxcsr = 0;
    464   1.1     joerg 	fesetenv(envp);
    465   1.1     joerg 	feraiseexcept((mxcsr | status) & FE_ALL_EXCEPT);
    466   1.1     joerg 
    467   1.1     joerg 	/* Success */
    468   1.1     joerg 	return (0);
    469   1.1     joerg }
    470   1.1     joerg 
    471   1.1     joerg /*
    472  1.10    andvar  * The following functions are extensions to the standard
    473   1.1     joerg  */
    474   1.1     joerg int
    475   1.1     joerg feenableexcept(int mask)
    476   1.1     joerg {
    477   1.1     joerg 	uint32_t mxcsr, omask;
    478   1.1     joerg 	uint16_t control;
    479   1.1     joerg 
    480   1.1     joerg 	mask &= FE_ALL_EXCEPT;
    481   1.1     joerg 	__fnstcw(&control);
    482   1.1     joerg 	if (__HAS_SSE)
    483   1.1     joerg 		__stmxcsr(&mxcsr);
    484   1.1     joerg 	else
    485   1.1     joerg 		mxcsr = 0;
    486   1.1     joerg 
    487   1.1     joerg 	omask = (control | mxcsr >> __SSE_EMASK_SHIFT) & FE_ALL_EXCEPT;
    488   1.1     joerg 	control &= ~mask;
    489   1.1     joerg 	__fldcw(control);
    490   1.1     joerg 	if (__HAS_SSE) {
    491   1.1     joerg 		mxcsr &= ~(mask << __SSE_EMASK_SHIFT);
    492   1.1     joerg 		__ldmxcsr(mxcsr);
    493   1.1     joerg 	}
    494   1.1     joerg 
    495   1.4  riastrad 	return (FE_ALL_EXCEPT & ~omask);
    496   1.1     joerg }
    497   1.1     joerg 
    498   1.1     joerg int
    499   1.1     joerg fedisableexcept(int mask)
    500   1.1     joerg {
    501   1.1     joerg 	uint32_t mxcsr, omask;
    502   1.1     joerg 	uint16_t control;
    503   1.1     joerg 
    504   1.1     joerg 	mask &= FE_ALL_EXCEPT;
    505   1.1     joerg 	__fnstcw(&control);
    506   1.1     joerg 	if (__HAS_SSE)
    507   1.1     joerg 		__stmxcsr(&mxcsr);
    508   1.1     joerg 	else
    509   1.1     joerg 		mxcsr = 0;
    510   1.1     joerg 
    511   1.1     joerg 	omask = (control | mxcsr >> __SSE_EMASK_SHIFT) & FE_ALL_EXCEPT;
    512   1.1     joerg 	control |= mask;
    513   1.1     joerg 	__fldcw(control);
    514   1.1     joerg 	if (__HAS_SSE) {
    515   1.1     joerg 		mxcsr |= mask << __SSE_EMASK_SHIFT;
    516   1.1     joerg 		__ldmxcsr(mxcsr);
    517   1.1     joerg 	}
    518   1.1     joerg 
    519   1.4  riastrad 	return (FE_ALL_EXCEPT & ~omask);
    520   1.1     joerg }
    521   1.1     joerg 
/*
 * fegetexcept(): return the set of exceptions that are currently unmasked.
 *
 * Only the x87 control word is read; the SSE unit is assumed to carry the
 * same exception masks.
 */
int
fegetexcept(void)
{
	uint16_t cw;

	__fnstcw(&cw);

	/* Mask bits are "1 = masked", so invert to get the enabled set. */
	return (~cw & FE_ALL_EXCEPT);
}
    535