Home | History | Annotate | Line # | Download | only in i387
fenv.c revision 1.8
      1  1.8       chs /* $NetBSD: fenv.c,v 1.8 2017/03/22 23:11:08 chs Exp $ */
      2  1.1     joerg 
      3  1.1     joerg /*-
      4  1.1     joerg  * Copyright (c) 2004-2005 David Schultz <das (at) FreeBSD.ORG>
      5  1.1     joerg  * All rights reserved.
      6  1.1     joerg  *
      7  1.1     joerg  * Redistribution and use in source and binary forms, with or without
      8  1.1     joerg  * modification, are permitted provided that the following conditions
      9  1.1     joerg  * are met:
     10  1.1     joerg  * 1. Redistributions of source code must retain the above copyright
     11  1.1     joerg  *    notice, this list of conditions and the following disclaimer.
     12  1.1     joerg  * 2. Redistributions in binary form must reproduce the above copyright
     13  1.1     joerg  *    notice, this list of conditions and the following disclaimer in the
     14  1.1     joerg  *    documentation and/or other materials provided with the distribution.
     15  1.1     joerg  *
     16  1.1     joerg  * THIS SOFTWARE IS PROVIDED BY THE AUTHOR AND CONTRIBUTORS ``AS IS'' AND
     17  1.1     joerg  * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
     18  1.1     joerg  * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
     19  1.1     joerg  * ARE DISCLAIMED.  IN NO EVENT SHALL THE AUTHOR OR CONTRIBUTORS BE LIABLE
     20  1.1     joerg  * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
     21  1.1     joerg  * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
     22  1.1     joerg  * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
     23  1.1     joerg  * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
     24  1.1     joerg  * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
     25  1.1     joerg  * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
     26  1.1     joerg  * SUCH DAMAGE.
     27  1.1     joerg  */
     28  1.1     joerg 
     29  1.1     joerg #include <sys/cdefs.h>
     30  1.8       chs __RCSID("$NetBSD: fenv.c,v 1.8 2017/03/22 23:11:08 chs Exp $");
     31  1.8       chs 
     32  1.8       chs #include "namespace.h"
     33  1.1     joerg 
     34  1.1     joerg #include <sys/param.h>
     35  1.1     joerg #include <sys/sysctl.h>
     36  1.1     joerg #include <assert.h>
     37  1.1     joerg #include <fenv.h>
     38  1.1     joerg #include <stddef.h>
     39  1.1     joerg #include <string.h>
     40  1.1     joerg 
     41  1.8       chs #ifdef __weak_alias
     42  1.8       chs __weak_alias(feclearexcept,_feclearexcept)
     43  1.8       chs __weak_alias(fedisableexcept,_fedisableexcept)
     44  1.8       chs __weak_alias(feenableexcept,_feenableexcept)
     45  1.8       chs __weak_alias(fegetenv,_fegetenv)
     46  1.8       chs __weak_alias(fegetexcept,_fegetexcept)
     47  1.8       chs __weak_alias(fegetexceptflag,_fegetexceptflag)
     48  1.8       chs __weak_alias(fegetround,_fegetround)
     49  1.8       chs __weak_alias(feholdexcept,_feholdexcept)
     50  1.8       chs __weak_alias(feraiseexcept,_feraiseexcept)
     51  1.8       chs __weak_alias(fesetenv,_fesetenv)
     52  1.8       chs __weak_alias(fesetexceptflag,_fesetexceptflag)
     53  1.8       chs __weak_alias(fesetround,_fesetround)
     54  1.8       chs __weak_alias(fetestexcept,_fetestexcept)
     55  1.8       chs __weak_alias(feupdateenv,_feupdateenv)
     56  1.8       chs #endif
     57  1.8       chs 
/* fldcw: load the x87 control word from the memory operand __word. */
#define	__fldcw(__word)							\
	__asm__ __volatile__ ("fldcw %0" : : "m" (__word))
     61  1.1     joerg 
/* fnstcw: store the x87 control word (no-wait form) into *__dst. */
#define	__fnstcw(__dst)							\
	__asm__ __volatile__ ("fnstcw %0" : "=m" (*(__dst)))
     65  1.1     joerg 
/*
 * fnstsw: store the x87 status word (no-wait form) into *__dst.
 * The "=am" constraint lets the compiler pick either %ax or memory.
 */
#define	__fnstsw(__dst)							\
	__asm__ __volatile__ ("fnstsw %0" : "=am" (*(__dst)))
     69  1.1     joerg 
/* fnclex: clear the x87 exception flags (no-wait form). */
#define	__fnclex()							\
	__asm__ __volatile__ ("fnclex")
     73  1.1     joerg 
/* fldenv: load the x87 environment from the memory object __image. */
#define	__fldenv(__image)						\
	__asm__ __volatile__ ("fldenv %0" : : "m" (__image))
     77  1.1     joerg 
/* fnstenv: store the x87 environment (no-wait form) into *__image. */
#define	__fnstenv(__image)						\
	__asm__ __volatile__ ("fnstenv %0" : "=m" (*(__image)))
     81  1.1     joerg 
/*
 * fwait: check for and handle pending unmasked x87 FPU exceptions.
 *
 * The macro takes no arguments: the instruction has no operand, and the
 * only caller in this file invokes it as __fwait().
 */
#define	__fwait()		__asm__	__volatile__	\
	("fwait")
     85  1.1     joerg 
/* ldmxcsr: load the SSE MXCSR register from the memory operand __val. */
#define	__ldmxcsr(__val)						\
	__asm__ __volatile__ ("ldmxcsr %0" : : "m" (__val))
     89  1.1     joerg 
/* stmxcsr: store the SSE MXCSR register into *__dst. */
#define	__stmxcsr(__dst)						\
	__asm__ __volatile__ ("stmxcsr %0" : "=m" (*(__dst)))
     93  1.1     joerg 
     94  1.1     joerg /*
     95  1.1     joerg  * The following constant represents the default floating-point environment
     96  1.1     joerg  * (that is, the one installed at program startup) and has type pointer to
     97  1.1     joerg  * const-qualified fenv_t.
     98  1.1     joerg  *
     99  1.1     joerg  * It can be used as an argument to the functions within the <fenv.h> header
    100  1.1     joerg  * that manage the floating-point environment, namely fesetenv() and
    101  1.1     joerg  * feupdateenv().
    102  1.1     joerg  *
    103  1.1     joerg  * x87 fpu registers are 16bit wide. The upper bits, 31-16, are marked as
    104  1.1     joerg  * RESERVED. We provide a partial floating-point environment, where we
    105  1.1     joerg  * define only the lower bits. The reserved bits are extracted and set by the
    106  1.1     joerg  * consumers of FE_DFL_ENV, during runtime.
    107  1.1     joerg  */
    108  1.1     joerg fenv_t __fe_dfl_env = {
    109  1.1     joerg 	{
    110  1.1     joerg 		__NetBSD_NPXCW__,       /* Control word register */
    111  1.1     joerg 		0x0,			/* Unused */
    112  1.1     joerg 		0x0000,                 /* Status word register */
    113  1.1     joerg 		0x0,			/* Unused */
    114  1.1     joerg 		0x0000ffff,             /* Tag word register */
    115  1.1     joerg 		0x0,			/* Unused */
    116  1.1     joerg 		{
    117  1.1     joerg 			0x0000, 0x0000,
    118  1.1     joerg 			0x0000, 0xffff
    119  1.1     joerg 		}
    120  1.1     joerg 	},
    121  1.1     joerg 	__INITIAL_MXCSR__		/* MXCSR register */
    122  1.1     joerg };
    123  1.1     joerg 
    124  1.1     joerg /*
    125  1.1     joerg  * Test for SSE support on this processor.
    126  1.1     joerg  *
    127  1.1     joerg  * We need to use ldmxcsr/stmxcsr to get correct results if any part
    128  1.1     joerg  * of the program was compiled to use SSE floating-point, but we can't
    129  1.1     joerg  * use SSE on older processors.
    130  1.1     joerg  *
    131  1.1     joerg  * In order to do so, we need to query the processor capabilities via the CPUID
    132  1.1     joerg  * instruction. We can make it even simpler though, by querying the machdep.sse
    133  1.1     joerg  * sysctl.
    134  1.1     joerg  */
    135  1.1     joerg static int __HAS_SSE = 0;
    136  1.1     joerg 
    137  1.6     joerg static void __init_libm(void) __attribute__ ((constructor, used));
    138  1.1     joerg 
    139  1.6     joerg static void __init_libm(void)
    140  1.1     joerg {
    141  1.3      taca 	size_t oldlen = sizeof(__HAS_SSE);
    142  1.1     joerg 	int rv;
    143  1.6     joerg 	uint16_t control;
    144  1.1     joerg 
    145  1.1     joerg 	rv = sysctlbyname("machdep.sse", &__HAS_SSE, &oldlen, NULL, 0);
    146  1.1     joerg 	if (rv == -1)
    147  1.1     joerg 		__HAS_SSE = 0;
    148  1.6     joerg 
    149  1.6     joerg 	__fnstcw(&control);
    150  1.6     joerg 	__fe_dfl_env.x87.control = control;
    151  1.1     joerg }
    152  1.1     joerg 
    153  1.1     joerg /*
    154  1.1     joerg  * The feclearexcept() function clears the supported floating-point exceptions
    155  1.1     joerg  * represented by `excepts'.
    156  1.1     joerg  */
    157  1.1     joerg int
    158  1.1     joerg feclearexcept(int excepts)
    159  1.1     joerg {
    160  1.1     joerg 	fenv_t env;
    161  1.1     joerg 	uint32_t mxcsr;
    162  1.1     joerg 	int ex;
    163  1.1     joerg 
    164  1.1     joerg 	_DIAGASSERT((excepts & ~FE_ALL_EXCEPT) == 0);
    165  1.1     joerg 
    166  1.1     joerg 	ex = excepts & FE_ALL_EXCEPT;
    167  1.1     joerg 
    168  1.1     joerg 	/* It's ~3x faster to call fnclex, than store/load fp env */
    169  1.1     joerg 	if (ex == FE_ALL_EXCEPT) {
    170  1.1     joerg 		__fnclex();
    171  1.1     joerg 	} else {
    172  1.1     joerg 		__fnstenv(&env);
    173  1.1     joerg 		env.x87.status &= ~ex;
    174  1.1     joerg 		__fldenv(env);
    175  1.1     joerg 	}
    176  1.1     joerg 
    177  1.1     joerg 	if (__HAS_SSE) {
    178  1.1     joerg 		__stmxcsr(&mxcsr);
    179  1.1     joerg 		mxcsr &= ~ex;
    180  1.1     joerg 		__ldmxcsr(mxcsr);
    181  1.1     joerg 	}
    182  1.1     joerg 
    183  1.1     joerg 	/* Success */
    184  1.1     joerg 	return (0);
    185  1.1     joerg }
    186  1.1     joerg 
    187  1.1     joerg /*
    188  1.1     joerg  * The fegetexceptflag() function stores an implementation-defined
    189  1.1     joerg  * representation of the states of the floating-point status flags indicated by
    190  1.1     joerg  * the argument excepts in the object pointed to by the argument flagp.
    191  1.1     joerg  */
    192  1.1     joerg int
    193  1.1     joerg fegetexceptflag(fexcept_t *flagp, int excepts)
    194  1.1     joerg {
    195  1.1     joerg 	uint32_t mxcsr;
    196  1.1     joerg 	uint16_t status;
    197  1.1     joerg 	int ex;
    198  1.1     joerg 
    199  1.1     joerg 	_DIAGASSERT(flagp != NULL);
    200  1.1     joerg 	_DIAGASSERT((excepts & ~FE_ALL_EXCEPT) == 0);
    201  1.1     joerg 
    202  1.1     joerg 	ex = excepts & FE_ALL_EXCEPT;
    203  1.1     joerg 
    204  1.1     joerg 	__fnstsw(&status);
    205  1.1     joerg 	if (__HAS_SSE)
    206  1.1     joerg 		__stmxcsr(&mxcsr);
    207  1.1     joerg 	else
    208  1.1     joerg 		mxcsr = 0;
    209  1.1     joerg 
    210  1.1     joerg 	*flagp = (mxcsr | status) & ex;
    211  1.1     joerg 
    212  1.1     joerg 	/* Success */
    213  1.1     joerg 	return (0);
    214  1.1     joerg }
    215  1.1     joerg 
/*
 * feraiseexcept(): raise the supported floating-point exceptions selected
 * by `excepts'.
 *
 * The standard would let us execute an instruction that produces the
 * exception as a side effect; instead the flags are written directly via
 * fesetexceptflag() (which also validates the input), and a following
 * fwait checks for any pending unmasked x87 exception.
 *
 * Always returns 0.
 */
int
feraiseexcept(int excepts)
{
	fexcept_t flags;

	_DIAGASSERT((excepts & ~FE_ALL_EXCEPT) == 0);

	flags = excepts & FE_ALL_EXCEPT;
	(void)fesetexceptflag(&flags, excepts);
	__fwait();

	return (0);
}
    240  1.1     joerg 
    241  1.1     joerg /*
    242  1.1     joerg  * This function sets the floating-point status flags indicated by the argument
    243  1.1     joerg  * `excepts' to the states stored in the object pointed to by `flagp'. It does
    244  1.1     joerg  * NOT raise any floating-point exceptions, but only sets the state of the flags.
    245  1.1     joerg  */
    246  1.1     joerg int
    247  1.1     joerg fesetexceptflag(const fexcept_t *flagp, int excepts)
    248  1.1     joerg {
    249  1.1     joerg 	fenv_t env;
    250  1.1     joerg 	uint32_t mxcsr;
    251  1.1     joerg 	int ex;
    252  1.1     joerg 
    253  1.1     joerg 	_DIAGASSERT(flagp != NULL);
    254  1.1     joerg 	_DIAGASSERT((excepts & ~FE_ALL_EXCEPT) == 0);
    255  1.1     joerg 
    256  1.1     joerg 	ex = excepts & FE_ALL_EXCEPT;
    257  1.1     joerg 
    258  1.1     joerg 	__fnstenv(&env);
    259  1.1     joerg 	env.x87.status &= ~ex;
    260  1.1     joerg 	env.x87.status |= *flagp & ex;
    261  1.1     joerg 	__fldenv(env);
    262  1.1     joerg 
    263  1.1     joerg 	if (__HAS_SSE) {
    264  1.1     joerg 		__stmxcsr(&mxcsr);
    265  1.1     joerg 		mxcsr &= ~ex;
    266  1.1     joerg 		mxcsr |= *flagp & ex;
    267  1.1     joerg 		__ldmxcsr(mxcsr);
    268  1.1     joerg 	}
    269  1.1     joerg 
    270  1.1     joerg 	/* Success */
    271  1.1     joerg 	return (0);
    272  1.1     joerg }
    273  1.1     joerg 
    274  1.1     joerg /*
    275  1.1     joerg  * The fetestexcept() function determines which of a specified subset of the
    276  1.1     joerg  * floating-point exception flags are currently set. The `excepts' argument
    277  1.1     joerg  * specifies the floating-point status flags to be queried.
    278  1.1     joerg  */
    279  1.1     joerg int
    280  1.1     joerg fetestexcept(int excepts)
    281  1.1     joerg {
    282  1.1     joerg 	uint32_t mxcsr;
    283  1.1     joerg 	uint16_t status;
    284  1.1     joerg 	int ex;
    285  1.1     joerg 
    286  1.1     joerg 	_DIAGASSERT((excepts & ~FE_ALL_EXCEPT) == 0);
    287  1.1     joerg 
    288  1.1     joerg 	ex = excepts & FE_ALL_EXCEPT;
    289  1.1     joerg 
    290  1.1     joerg 	__fnstsw(&status);
    291  1.1     joerg 	if (__HAS_SSE)
    292  1.1     joerg 		__stmxcsr(&mxcsr);
    293  1.1     joerg 	else
    294  1.1     joerg 		mxcsr = 0;
    295  1.1     joerg 
    296  1.1     joerg 	return ((status | mxcsr) & ex);
    297  1.1     joerg }
    298  1.1     joerg 
    299  1.1     joerg int
    300  1.1     joerg fegetround(void)
    301  1.1     joerg {
    302  1.1     joerg 	uint16_t control;
    303  1.1     joerg 
    304  1.1     joerg 	/*
    305  1.1     joerg 	 * We assume that the x87 and the SSE unit agree on the
    306  1.1     joerg 	 * rounding mode.  Reading the control word on the x87 turns
    307  1.1     joerg 	 * out to be about 5 times faster than reading it on the SSE
    308  1.1     joerg 	 * unit on an Opteron 244.
    309  1.1     joerg 	 */
    310  1.1     joerg 	__fnstcw(&control);
    311  1.1     joerg 
    312  1.1     joerg 	return (control & __X87_ROUND_MASK);
    313  1.1     joerg }
    314  1.1     joerg 
    315  1.1     joerg /*
    316  1.1     joerg  * The fesetround() function shall establish the rounding direction represented
    317  1.1     joerg  * by its argument round. If the argument is not equal to the value of a
    318  1.1     joerg  * rounding direction macro, the rounding direction is not changed.
    319  1.1     joerg  */
    320  1.1     joerg int
    321  1.1     joerg fesetround(int round)
    322  1.1     joerg {
    323  1.1     joerg 	uint32_t mxcsr;
    324  1.1     joerg 	uint16_t control;
    325  1.1     joerg 
    326  1.1     joerg 	if (round & ~__X87_ROUND_MASK) {
    327  1.1     joerg 		/* Failure */
    328  1.1     joerg 		return (-1);
    329  1.1     joerg 	}
    330  1.1     joerg 
    331  1.1     joerg 	__fnstcw(&control);
    332  1.1     joerg 	control &= ~__X87_ROUND_MASK;
    333  1.1     joerg 	control |= round;
    334  1.1     joerg 	__fldcw(control);
    335  1.1     joerg 
    336  1.1     joerg 	if (__HAS_SSE) {
    337  1.1     joerg 		__stmxcsr(&mxcsr);
    338  1.1     joerg 		mxcsr &= ~(__X87_ROUND_MASK << __SSE_ROUND_SHIFT);
    339  1.1     joerg 		mxcsr |= round << __SSE_ROUND_SHIFT;
    340  1.1     joerg 		__ldmxcsr(mxcsr);
    341  1.1     joerg 	}
    342  1.1     joerg 
    343  1.1     joerg 	/* Success */
    344  1.1     joerg 	return (0);
    345  1.1     joerg }
    346  1.1     joerg 
    347  1.1     joerg /*
    348  1.1     joerg  * The fegetenv() function attempts to store the current floating-point
    349  1.1     joerg  * environment in the object pointed to by envp.
    350  1.1     joerg  */
    351  1.1     joerg int
    352  1.1     joerg fegetenv(fenv_t *envp)
    353  1.1     joerg {
    354  1.1     joerg 	uint32_t mxcsr;
    355  1.1     joerg 
    356  1.1     joerg 	_DIAGASSERT(flagp != NULL);
    357  1.1     joerg 
    358  1.1     joerg 	/*
    359  1.1     joerg 	 * fnstenv masks all exceptions, so we need to restore the old control
    360  1.1     joerg 	 * word to avoid this side effect.
    361  1.1     joerg 	 */
    362  1.1     joerg 	__fnstenv(envp);
    363  1.1     joerg 	__fldcw(envp->x87.control);
    364  1.1     joerg 	if (__HAS_SSE) {
    365  1.1     joerg 		__stmxcsr(&mxcsr);
    366  1.1     joerg 		envp->mxcsr = mxcsr;
    367  1.1     joerg 	}
    368  1.1     joerg 
    369  1.1     joerg 	/* Success */
    370  1.1     joerg 	return (0);
    371  1.1     joerg }
    372  1.1     joerg 
    373  1.1     joerg /*
    374  1.1     joerg  * The feholdexcept() function saves the current floating-point environment in
    375  1.1     joerg  * the object pointed to by envp, clears the floating-point status flags, and
    376  1.1     joerg  * then installs a non-stop (continue on floating-point exceptions) mode, if
    377  1.1     joerg  * available, for all floating-point exceptions.
    378  1.1     joerg  */
    379  1.1     joerg int
    380  1.1     joerg feholdexcept(fenv_t *envp)
    381  1.1     joerg {
    382  1.1     joerg 	uint32_t mxcsr;
    383  1.1     joerg 
    384  1.1     joerg 	_DIAGASSERT(envp != NULL);
    385  1.1     joerg 
    386  1.1     joerg 	__fnstenv(envp);
    387  1.1     joerg 	__fnclex();
    388  1.1     joerg 	if (__HAS_SSE) {
    389  1.1     joerg 		__stmxcsr(&mxcsr);
    390  1.1     joerg 		envp->mxcsr = mxcsr;
    391  1.1     joerg 		mxcsr &= ~FE_ALL_EXCEPT;
    392  1.1     joerg 		mxcsr |= FE_ALL_EXCEPT << __SSE_EMASK_SHIFT;
    393  1.1     joerg 		__ldmxcsr(mxcsr);
    394  1.1     joerg 	}
    395  1.1     joerg 
    396  1.1     joerg 	/* Success */
    397  1.1     joerg 	return (0);
    398  1.1     joerg }
    399  1.1     joerg 
    400  1.1     joerg /*
    401  1.1     joerg  * The fesetenv() function attempts to establish the floating-point environment
    402  1.1     joerg  * represented by the object pointed to by envp. The argument `envp' points
    403  1.1     joerg  * to an object set by a call to fegetenv() or feholdexcept(), or equal a
    404  1.1     joerg  * floating-point environment macro. The fesetenv() function does not raise
    405  1.1     joerg  * floating-point exceptions, but only installs the state of the floating-point
    406  1.1     joerg  * status flags represented through its argument.
    407  1.1     joerg  */
    408  1.1     joerg int
    409  1.1     joerg fesetenv(const fenv_t *envp)
    410  1.1     joerg {
    411  1.1     joerg 	fenv_t env;
    412  1.1     joerg 
    413  1.1     joerg 	_DIAGASSERT(envp != NULL);
    414  1.1     joerg 
    415  1.1     joerg 	/* Store the x87 floating-point environment */
    416  1.1     joerg 	memset(&env, 0, sizeof(env));
    417  1.1     joerg 	__fnstenv(&env);
    418  1.1     joerg 
    419  1.1     joerg 	__fe_dfl_env.x87.unused1 = env.x87.unused1;
    420  1.1     joerg 	__fe_dfl_env.x87.unused2 = env.x87.unused2;
    421  1.1     joerg 	__fe_dfl_env.x87.unused3 = env.x87.unused3;
    422  1.7  christos 	memcpy(__fe_dfl_env.x87.others, env.x87.others,
    423  1.7  christos 	    sizeof(__fe_dfl_env.x87.others));
    424  1.1     joerg 
    425  1.1     joerg 	__fldenv(envp->x87);
    426  1.1     joerg 	if (__HAS_SSE)
    427  1.1     joerg 		__ldmxcsr(envp->mxcsr);
    428  1.1     joerg 
    429  1.1     joerg 	/* Success */
    430  1.1     joerg 	return (0);
    431  1.1     joerg }
    432  1.1     joerg 
    433  1.1     joerg /*
    434  1.1     joerg  * The feupdateenv() function saves the currently raised floating-point
    435  1.1     joerg  * exceptions in its automatic storage, installs the floating-point environment
    436  1.1     joerg  * represented by the object pointed to by `envp', and then raises the saved
    437  1.1     joerg  * floating-point exceptions. The argument `envp' shall point to an object set
    438  1.1     joerg  * by a call to feholdexcept() or fegetenv(), or equal a floating-point
    439  1.1     joerg  * environment macro.
    440  1.1     joerg  */
    441  1.1     joerg int
    442  1.1     joerg feupdateenv(const fenv_t *envp)
    443  1.1     joerg {
    444  1.1     joerg 	fenv_t env;
    445  1.1     joerg 	uint32_t mxcsr;
    446  1.1     joerg 	uint16_t status;
    447  1.1     joerg 
    448  1.1     joerg 	_DIAGASSERT(envp != NULL);
    449  1.1     joerg 
    450  1.1     joerg 	/* Store the x87 floating-point environment */
    451  1.1     joerg 	memset(&env, 0, sizeof(env));
    452  1.1     joerg 	__fnstenv(&env);
    453  1.1     joerg 
    454  1.1     joerg 	__fe_dfl_env.x87.unused1 = env.x87.unused1;
    455  1.1     joerg 	__fe_dfl_env.x87.unused2 = env.x87.unused2;
    456  1.1     joerg 	__fe_dfl_env.x87.unused3 = env.x87.unused3;
    457  1.7  christos 	memcpy(__fe_dfl_env.x87.others, env.x87.others,
    458  1.7  christos 	    sizeof(__fe_dfl_env.x87.others));
    459  1.1     joerg 
    460  1.1     joerg 	__fnstsw(&status);
    461  1.1     joerg 	if (__HAS_SSE)
    462  1.1     joerg 		__stmxcsr(&mxcsr);
    463  1.1     joerg 	else
    464  1.1     joerg 		mxcsr = 0;
    465  1.1     joerg 	fesetenv(envp);
    466  1.1     joerg 	feraiseexcept((mxcsr | status) & FE_ALL_EXCEPT);
    467  1.1     joerg 
    468  1.1     joerg 	/* Success */
    469  1.1     joerg 	return (0);
    470  1.1     joerg }
    471  1.1     joerg 
/*
 * The following functions are extensions to the standard.
 */
    475  1.1     joerg int
    476  1.1     joerg feenableexcept(int mask)
    477  1.1     joerg {
    478  1.1     joerg 	uint32_t mxcsr, omask;
    479  1.1     joerg 	uint16_t control;
    480  1.1     joerg 
    481  1.1     joerg 	mask &= FE_ALL_EXCEPT;
    482  1.1     joerg 	__fnstcw(&control);
    483  1.1     joerg 	if (__HAS_SSE)
    484  1.1     joerg 		__stmxcsr(&mxcsr);
    485  1.1     joerg 	else
    486  1.1     joerg 		mxcsr = 0;
    487  1.1     joerg 
    488  1.1     joerg 	omask = (control | mxcsr >> __SSE_EMASK_SHIFT) & FE_ALL_EXCEPT;
    489  1.1     joerg 	control &= ~mask;
    490  1.1     joerg 	__fldcw(control);
    491  1.1     joerg 	if (__HAS_SSE) {
    492  1.1     joerg 		mxcsr &= ~(mask << __SSE_EMASK_SHIFT);
    493  1.1     joerg 		__ldmxcsr(mxcsr);
    494  1.1     joerg 	}
    495  1.1     joerg 
    496  1.4  riastrad 	return (FE_ALL_EXCEPT & ~omask);
    497  1.1     joerg }
    498  1.1     joerg 
    499  1.1     joerg int
    500  1.1     joerg fedisableexcept(int mask)
    501  1.1     joerg {
    502  1.1     joerg 	uint32_t mxcsr, omask;
    503  1.1     joerg 	uint16_t control;
    504  1.1     joerg 
    505  1.1     joerg 	mask &= FE_ALL_EXCEPT;
    506  1.1     joerg 	__fnstcw(&control);
    507  1.1     joerg 	if (__HAS_SSE)
    508  1.1     joerg 		__stmxcsr(&mxcsr);
    509  1.1     joerg 	else
    510  1.1     joerg 		mxcsr = 0;
    511  1.1     joerg 
    512  1.1     joerg 	omask = (control | mxcsr >> __SSE_EMASK_SHIFT) & FE_ALL_EXCEPT;
    513  1.1     joerg 	control |= mask;
    514  1.1     joerg 	__fldcw(control);
    515  1.1     joerg 	if (__HAS_SSE) {
    516  1.1     joerg 		mxcsr |= mask << __SSE_EMASK_SHIFT;
    517  1.1     joerg 		__ldmxcsr(mxcsr);
    518  1.1     joerg 	}
    519  1.1     joerg 
    520  1.4  riastrad 	return (FE_ALL_EXCEPT & ~omask);
    521  1.1     joerg }
    522  1.1     joerg 
/*
 * fegetexcept(): return the set of exceptions whose mask bit is clear in
 * the x87 control word, i.e. the ones currently enabled.
 */
int
fegetexcept(void)
{
	uint16_t cw;

	/*
	 * Only the x87 control word is read; the SSE unit is assumed to
	 * carry the same masks.
	 */
	__fnstcw(&cw);

	return (~cw & FE_ALL_EXCEPT);
}
    536