| /* $OpenBSD: fpu.h,v 1.16 2018/10/07 22:43:06 guenther Exp $ */ |
| /* $NetBSD: fpu.h,v 1.1 2003/04/26 18:39:40 fvdl Exp $ */ |
| |
| #ifndef _MACHINE_FPU_H_ |
| #define _MACHINE_FPU_H_ |
| |
| #include <sys/types.h> |
| |
/*
 * If the CPU supports xsave/xrstor then we use them so that we can provide
 * AVX support.  Otherwise we require fxsave/fxrstor, as the SSE registers
 * are part of the ABI for passing floating point values.
 * While fxsave/fxrstor only require 16-byte alignment for the save area,
 * xsave/xrstor require the save area to have 64-byte alignment.
 */
| |
/*
 * Memory image used with fxsave/fxrstor.
 *
 * As declared, the members add up to 512 bytes: 32 bytes of control and
 * status fields, 128 bytes for the x87 registers, 256 bytes for the SSE
 * registers and 96 trailing bytes that this header does not name.
 * The per-field notes follow the FXSAVE area layout in the Intel/AMD
 * architecture manuals.
 */
struct fxsave64 {
	u_int16_t	fx_fcw;			/* x87 control word */
	u_int16_t	fx_fsw;			/* x87 status word */
	u_int8_t	fx_ftw;			/* x87 tag word (one byte) */
	u_int8_t	fx_unused1;		/* padding */
	u_int16_t	fx_fop;			/* x87 opcode */
	u_int64_t	fx_rip;			/* x87 instruction pointer */
	u_int64_t	fx_rdp;			/* x87 data pointer */
	u_int32_t	fx_mxcsr;		/* SSE control/status */
	u_int32_t	fx_mxcsr_mask;		/* valid bits of fx_mxcsr */
	u_int64_t	fx_st[8][2];		/* 8 normal FP regs, 16 bytes each */
	u_int64_t	fx_xmm[16][2];		/* 16 SSE2 registers, 16 bytes each */
	u_int8_t	fx_unused3[96];		/* tail padding up to 512 bytes */
} __packed;
| |
/*
 * Header that follows the 512-byte fxsave region inside an xsave area.
 *
 * The architecture fixes this header at exactly 64 bytes (bytes 512-575 of
 * the area), so the members must add up to 64:
 *	8 (xstate_bv) + 8 (xstate_xcomp_bv) + 8 (xstate_rsrv0) + 40 (xstate_rsrv)
 * If the header is any shorter, every member placed after it in
 * struct savefpu ends up at the wrong offset relative to what the
 * processor reads and writes.
 */
struct xstate_hdr {
	uint64_t	xstate_bv;		/* XSTATE_BV: components present */
	uint64_t	xstate_xcomp_bv;	/* XCOMP_BV: compaction bitmap */
	uint8_t		xstate_rsrv0[8];	/* reserved */
	uint8_t		xstate_rsrv[40];	/* reserved */
} __packed;
| |
| struct savefpu { |
| struct fxsave64 fp_fxsave; /* see above */ |
| struct xstate_hdr fp_xstate; |
| u_int64_t fp_ymm[16][2]; |
| u_int16_t fp_ex_sw; /* saved status from last exception */ |
| u_int16_t fp_ex_tw; /* saved tag from last exception */ |
| }; |
| |
/*
 * Initial x87 control word: the i387 default of Intel extended precision,
 * round to nearest, and every exception masked.
 */
#define	__INITIAL_NPXCW__	0x037f

/*
 * Initial MXCSR value: bits 7 through 12 set and nothing else.
 * Per the MXCSR layout in the architecture manuals those are the six SSE
 * exception mask bits.
 */
#define	__INITIAL_MXCSR__	0x1f80

/*
 * Initial MXCSR mask: all of the low 16 bits except bit 6.
 */
#define	__INITIAL_MXCSR_MASK__	0xffbf
| |
| #ifdef _KERNEL |
| /* |
| * XXX |
| */ |
/* Forward declarations so this header need not pull in the full definitions. */
struct cpu_info;
struct trapframe;

/*
 * Globals defined elsewhere in the kernel.
 * NOTE(review): judging by the names these hold the save-area length in
 * use, the usable MXCSR bits and the xsave component mask -- confirm at
 * their definitions.
 */
extern uint64_t	xsave_mask;
extern uint32_t	fpu_mxcsr_mask;
extern size_t	fpu_save_len;

/* FPU management entry points; all are implemented outside this header. */
void	fpu_kernel_enter(void);
void	fpu_kernel_exit(void);
void	fpuinit(struct cpu_info *);
void	fpusave(struct savefpu *);
void	fpusavereset(struct savefpu *);
int	fputrap(int _type);
| |
/*
 * Helpers implemented elsewhere; both return int.
 * NOTE(review): the "_user" suffix suggests the return value reports a
 * fault on user-supplied state -- confirm at the definitions.
 */
int	xrstor_user(struct savefpu *_addr, uint64_t _mask);
int	xsetbv_user(uint32_t _reg, uint64_t _mask);

/*
 * Calls xrstor_user() on proc0's saved FPU area with the current
 * xsave_mask, and evaluates to that call's return value.
 */
#define	fpureset()							\
	xrstor_user(&proc0.p_addr->u_pcb.pcb_savefpu, xsave_mask)
| |
/*
 * One-instruction wrappers.
 *
 * fninit() and fwait() take no operands.  fxsave(), ldmxcsr() and fldcw()
 * take a pointer and dereference it to form the instruction's memory
 * operand (an output for fxsave, an input for the other two).  The
 * argument is parenthesized before the dereference so that pointer
 * expressions such as `p + 1' name the intended object instead of
 * expanding to `*p + 1'.
 */
#define	fninit()		__asm("fninit")
#define	fwait()			__asm("fwait")
/* should be fxsave64, but where we use this it doesn't matter */
#define	fxsave(addr)		__asm("fxsave %0" : "=m" (*(addr)))
#define	ldmxcsr(addr)		__asm("ldmxcsr %0" : : "m" (*(addr)))
#define	fldcw(addr)		__asm("fldcw %0" : : "m" (*(addr)))
| |
/*
 * Execute the xsave instruction with *addr as its memory operand.
 *
 * addr: save area that the instruction stores into.
 * mask: 64-bit mask handed to the instruction; its low half goes in via
 *       the "a" register constraint and its high half via "d".
 *
 * The "memory" clobber stops the compiler from caching memory contents
 * across the instruction.
 */
static inline void
xsave(struct savefpu *addr, uint64_t mask)
{
	uint32_t hi = mask >> 32;
	uint32_t lo = mask;

	/* should be xsave64, but where we use this it doesn't matter */
	__asm volatile("xsave %0"
	    : "=m" (*addr)
	    : "a" (lo), "d" (hi)
	    : "memory");
}
| |
| #endif |
| |
| #endif /* _MACHINE_FPU_H_ */ |