amd64/include/fpu.h

1.10  christos /*	$NetBSD: fpu.h,v 1.10 2013/12/01 01:05:16 christos Exp $	*/
 1.1      fvdl
 1.1      fvdl #ifndef	_AMD64_FPU_H_
 1.1      fvdl #define	_AMD64_FPU_H_
 1.1      fvdl
 1.1      fvdl /*
 1.1      fvdl  * NetBSD/amd64 only uses the extended save/restore format used
 1.1      fvdl  * by fxsave/fxrstor, to always deal with the SSE registers,
 1.1      fvdl  * which are part of the ABI to pass floating point values.
 1.7       dsl  *
 1.7       dsl  * The memory used for the 'fxsave' instruction must be 16 byte aligned,
 1.7       dsl  * but the definition here isn't aligned to avoid padding elsewhere.
 1.1      fvdl  */
 1.1      fvdl
 1.1      fvdl struct fxsave64 {	/* fxsave memory image; each field comment starts with its byte offset */
 1.6       dsl 	uint16_t  fx_fcw;           /* 0: FPU control word */
 1.6       dsl 	uint16_t  fx_fsw;           /* 2: FPU status word */
 1.6       dsl 	uint8_t   fx_ftw;           /* 4: Abridged FPU tag word */
 1.6       dsl 	uint8_t   fx_reserved1;     /* 5: reserved */
 1.6       dsl 	uint16_t  fx_fop;           /* 6: Low 11 bits are FPU opcode */
 1.6       dsl 	uint64_t  fx_rip;           /* 8: Address of faulting instruction */
 1.6       dsl 	uint64_t  fx_rdp;           /* 16: Data address associated with fault */
 1.6       dsl 	uint32_t  fx_mxcsr;         /* 24: SIMD control & status */
 1.6       dsl 	uint32_t  fx_mxcsr_mask;    /* 28: mask of valid fx_mxcsr bits */
 1.6       dsl 	uint64_t  fx_st[8][2];      /* 32: 8 normal FP regs (80 bit), 16 bytes reserved for each */
 1.6       dsl 	uint64_t  fx_xmm[16][2];    /* 160: 16 SSE2 registers, 16 bytes each */
 1.6       dsl 	uint8_t   fx_reserved2[48]; /* 416: reserved */
 1.6       dsl 	uint8_t   fx_available[48]; /* 464: could be used by kernel */
 1.6       dsl };
 1.6       dsl
 1.6       dsl __CTASSERT(sizeof (struct fxsave64) == 512);	/* the fields above must add up to exactly 512 bytes */
 1.1      fvdl
 1.1      fvdl struct savefpu {	/* saved FPU state: currently just the fxsave image */
 1.1      fvdl 	struct fxsave64 fp_fxsave;	/* save area laid out as struct fxsave64 */
 1.7       dsl };
 1.7       dsl
 1.7       dsl struct savefpu_i387 {	/* status and tag values kept from the last exception */
 1.5    cegger 	uint16_t fp_ex_sw;		/* saved status word from last exception */
 1.5    cegger 	uint16_t fp_ex_tw;		/* saved tag word from last exception */
 1.7       dsl };
 1.1      fvdl
 1.1      fvdl /*
 1.1      fvdl  * The i387 defaults to Intel extended precision mode and round to nearest,
 1.1      fvdl  * with all exceptions masked.
 1.1      fvdl  */
 1.1      fvdl #define	__INITIAL_NPXCW__	0x037f
 1.1      fvdl #define __INITIAL_MXCSR__ 	0x1f80	/* bits 7-12 (exception masks) set, all other bits clear */
 1.1      fvdl #define __INITIAL_MXCSR_MASK__	0xffbf	/* low 16 bits set except bit 6 */
 1.1      fvdl
 1.9     joerg /* Modern NetBSD uses the default control word. */
 1.9     joerg #define	__NetBSD_NPXCW__	0x037f
 1.9     joerg /* NetBSD before 6.99.26 forced IEEE double precision. */
 1.9     joerg #define	__NetBSD_COMPAT_NPXCW__	0x127f
 1.1      fvdl /* Linux just uses the default control word. */
 1.1      fvdl #define	__Linux_NPXCW__		0x037f
 1.1      fvdl
 1.1      fvdl /*
 1.1      fvdl  * The standard control word from finit is 0x37F, giving:
 1.1      fvdl  *	round to nearest
 1.1      fvdl  *	64-bit precision
 1.1      fvdl  *	all exceptions masked.
 1.1      fvdl  *
 1.1      fvdl  * __NetBSD_COMPAT_NPXCW__ (0x127f) instead selects:
 1.1      fvdl  *	affine mode (if we decide to support 287's)
 1.1      fvdl  *	round to nearest
 1.1      fvdl  *	53-bit precision
 1.1      fvdl  *	all exceptions masked.
 1.1      fvdl  *
 1.1      fvdl  * 64-bit precision often gives bad results with high level languages
 1.1      fvdl  * because it makes the results of calculations depend on whether
 1.1      fvdl  * intermediate values are stored in memory or in FPU registers.
 1.1      fvdl  */
 1.1      fvdl
 1.1      fvdl #ifdef _KERNEL
 1.1      fvdl /*
 1.1      fvdl  * XXX NOTE(review): only trapframe and cpu_info are forward-declared here; struct lwp and bool are presumably supplied by the includer - confirm.
 1.1      fvdl  */
 1.1      fvdl struct trapframe;
 1.1      fvdl struct cpu_info;
 1.1      fvdl
 1.1      fvdl void fpuinit(struct cpu_info *);
1.10  christos void fpudrop(void);
1.10  christos void fpusave(struct lwp *);
1.10  christos void fpudiscard(struct lwp *);
 1.1      fvdl void fputrap(struct trapframe *);
1.10  christos void fpusave_lwp(struct lwp *, bool);
1.10  christos void fpusave_cpu(bool);
 1.1      fvdl
 1.1      fvdl #endif /* _KERNEL */
 
 1.1      fvdl
 1.1      fvdl #endif /* _AMD64_FPU_H_ */