Use assembler mnemonics for the XSAVE-family instructions on amd64.

sys/amd64/amd64/fpu.c:
  - xrstor() and xsave() now emit the "xrstor"/"xsave" mnemonics with *addr
    as a memory operand, replacing hand-encoded .byte sequences that took
    the address in %rdi.  The mask is still passed split across %eax (low
    32 bits) and %edx (high 32 bits).
  - The file-local xsetbv() inline and its prototype in the non-inline-asm
    branch are removed; the code that programs XCR0 calls load_xcr()
    instead.

sys/amd64/include/cpufunc.h:
  - Adds rxcr(reg), which executes xgetbv with reg in %ecx and returns the
    64-bit value assembled from %edx:%eax.
  - Adds load_xcr(reg, val), which splits val into low/high 32-bit halves
    and executes xsetbv with reg in %ecx.

--- //depot/vendor/freebsd/src/sys/amd64/amd64/fpu.c	2012-05-17 17:35:15.000000000 0000
+++ //depot/projects/smpng/sys/amd64/amd64/fpu.c	2012-07-04 13:15:40.000000000 0000
@@ -85,9 +85,7 @@
 
 	low = mask;
 	hi = mask >> 32;
-	/* xrstor (%rdi) */
-	__asm __volatile(".byte	0x0f,0xae,0x2f" : :
-	    "a" (low), "d" (hi), "D" (addr));
+	__asm __volatile("xrstor %0" : : "m" (*addr), "a" (low), "d" (hi));
 }
 
 static __inline void
@@ -97,22 +95,10 @@
 
 	low = mask;
 	hi = mask >> 32;
-	/* xsave (%rdi) */
-	__asm __volatile(".byte	0x0f,0xae,0x27" : :
-	    "a" (low), "d" (hi), "D" (addr) : "memory");
+	__asm __volatile("xsave %0" : "=m" (*addr) : "a" (low), "d" (hi) :
+	    "memory");
 }
 
-static __inline void
-xsetbv(uint32_t reg, uint64_t val)
-{
-	uint32_t low, hi;
-
-	low = val;
-	hi = val >> 32;
-	__asm __volatile(".byte	0x0f,0x01,0xd1" : :
-	    "c" (reg), "a" (low), "d" (hi));
-}
-
 #else	/* !(__GNUCLIKE_ASM && !lint) */
 
 void	fldcw(u_short cw);
@@ -127,7 +113,6 @@
 void	stop_emulating(void);
 void	xrstor(char *addr, uint64_t mask);
 void	xsave(char *addr, uint64_t mask);
-void	xsetbv(uint32_t reg, uint64_t val);
 
 #endif	/* __GNUCLIKE_ASM && !lint */
 
@@ -238,7 +223,7 @@
 
 	if (use_xsave) {
 		load_cr4(rcr4() | CR4_XSAVE);
-		xsetbv(XCR0, xsave_mask);
+		load_xcr(XCR0, xsave_mask);
 	}
 
 	/*
--- //depot/vendor/freebsd/src/sys/amd64/include/cpufunc.h	2012-02-27 17:30:15.000000000 0000
+++ //depot/projects/smpng/sys/amd64/include/cpufunc.h	2012-07-04 13:15:40.000000000 0000
@@ -409,6 +411,25 @@
 	return (data);
 }
 
+static __inline u_long
+rxcr(u_int reg)
+{
+	u_int low, high;
+
+	__asm __volatile("xgetbv" : "=a" (low), "=d" (high) : "c" (reg));
+	return (low | ((uint64_t)high << 32));
+}
+
+static __inline void
+load_xcr(u_int reg, u_long val)
+{
+	u_int low, hi;
+
+	low = val;
+	hi = val >> 32;
+	__asm __volatile("xsetbv" : : "c" (reg), "a" (low), "d" (hi));
+}
+
 /*
  * Global TLB flush (except for thise for pages marked PG_G)
  */