2015-04-22 15:53:34 +07:00
|
|
|
/*
|
|
|
|
* x86 FPU boot time init code
|
|
|
|
*/
|
2015-04-24 07:54:44 +07:00
|
|
|
#include <asm/fpu/internal.h>
|
2015-04-22 15:53:34 +07:00
|
|
|
#include <asm/tlbflush.h>
|
|
|
|
|
2015-04-22 18:44:25 +07:00
|
|
|
/*
|
|
|
|
* Boot time CPU/FPU FDIV bug detection code:
|
|
|
|
*/
|
|
|
|
|
|
|
|
static double __initdata x = 4195835.0;
|
|
|
|
static double __initdata y = 3145727.0;
|
|
|
|
|
|
|
|
/*
|
|
|
|
* This used to check for exceptions..
|
|
|
|
* However, it turns out that to support that,
|
|
|
|
* the XMM trap handlers basically had to
|
|
|
|
* be buggy. So let's have a correct XMM trap
|
|
|
|
* handler, and forget about printing out
|
|
|
|
* some status at boot.
|
|
|
|
*
|
|
|
|
* We should really only care about bugs here
|
|
|
|
* anyway. Not features.
|
|
|
|
*/
|
|
|
|
static void __init check_fpu(void)
|
|
|
|
{
|
|
|
|
s32 fdiv_bug;
|
|
|
|
|
|
|
|
kernel_fpu_begin();
|
|
|
|
|
|
|
|
/*
|
|
|
|
* trap_init() enabled FXSR and company _before_ testing for FP
|
|
|
|
* problems here.
|
|
|
|
*
|
|
|
|
* Test for the divl bug: http://en.wikipedia.org/wiki/Fdiv_bug
|
|
|
|
*/
|
|
|
|
__asm__("fninit\n\t"
|
|
|
|
"fldl %1\n\t"
|
|
|
|
"fdivl %2\n\t"
|
|
|
|
"fmull %2\n\t"
|
|
|
|
"fldl %1\n\t"
|
|
|
|
"fsubp %%st,%%st(1)\n\t"
|
|
|
|
"fistpl %0\n\t"
|
|
|
|
"fwait\n\t"
|
|
|
|
"fninit"
|
|
|
|
: "=m" (*&fdiv_bug)
|
|
|
|
: "m" (*&x), "m" (*&y));
|
|
|
|
|
|
|
|
kernel_fpu_end();
|
|
|
|
|
|
|
|
if (fdiv_bug) {
|
|
|
|
set_cpu_bug(&boot_cpu_data, X86_BUG_FDIV);
|
|
|
|
pr_warn("Hmm, FPU with FDIV bug\n");
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
void fpu__init_check_bugs(void)
|
|
|
|
{
|
|
|
|
/*
|
|
|
|
* kernel_fpu_begin/end() in check_fpu() relies on the patched
|
|
|
|
* alternative instructions.
|
|
|
|
*/
|
|
|
|
if (cpu_has_fpu)
|
|
|
|
check_fpu();
|
|
|
|
}
|
|
|
|
|
|
|
|
/*
|
|
|
|
* Boot time FPU feature detection code:
|
|
|
|
*/
|
2015-04-22 15:53:34 +07:00
|
|
|
unsigned int mxcsr_feature_mask __read_mostly = 0xffffffffu;
|
2015-04-24 15:49:11 +07:00
|
|
|
|
2015-04-22 15:53:34 +07:00
|
|
|
unsigned int xstate_size;
|
|
|
|
EXPORT_SYMBOL_GPL(xstate_size);
|
|
|
|
|
|
|
|
static void mxcsr_feature_mask_init(void)
|
|
|
|
{
|
2015-04-24 15:49:11 +07:00
|
|
|
unsigned int mask = 0;
|
2015-04-22 15:53:34 +07:00
|
|
|
|
|
|
|
if (cpu_has_fxsr) {
|
2015-04-24 15:49:11 +07:00
|
|
|
struct i387_fxsave_struct fx_tmp __aligned(32) = { };
|
|
|
|
|
|
|
|
asm volatile("fxsave %0" : "+m" (fx_tmp));
|
|
|
|
|
|
|
|
mask = fx_tmp.mxcsr_mask;
|
|
|
|
|
|
|
|
/*
|
|
|
|
* If zero then use the default features mask,
|
|
|
|
* which has all features set, except the
|
|
|
|
* denormals-are-zero feature bit:
|
|
|
|
*/
|
2015-04-22 15:53:34 +07:00
|
|
|
if (mask == 0)
|
|
|
|
mask = 0x0000ffbf;
|
|
|
|
}
|
|
|
|
mxcsr_feature_mask &= mask;
|
|
|
|
}
|
|
|
|
|
|
|
|
static void fpstate_xstate_init_size(void)
|
|
|
|
{
|
|
|
|
/*
|
|
|
|
* Note that xstate_size might be overwriten later during
|
|
|
|
* xsave_init().
|
|
|
|
*/
|
|
|
|
|
|
|
|
if (!cpu_has_fpu) {
|
|
|
|
/*
|
|
|
|
* Disable xsave as we do not support it if i387
|
|
|
|
* emulation is enabled.
|
|
|
|
*/
|
|
|
|
setup_clear_cpu_cap(X86_FEATURE_XSAVE);
|
|
|
|
setup_clear_cpu_cap(X86_FEATURE_XSAVEOPT);
|
|
|
|
xstate_size = sizeof(struct i387_soft_struct);
|
2015-04-25 09:29:26 +07:00
|
|
|
} else {
|
|
|
|
if (cpu_has_fxsr)
|
|
|
|
xstate_size = sizeof(struct i387_fxsave_struct);
|
|
|
|
else
|
|
|
|
xstate_size = sizeof(struct i387_fsave_struct);
|
2015-04-22 15:53:34 +07:00
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
/*
|
|
|
|
* Called on the boot CPU at bootup to set up the initial FPU state that
|
|
|
|
* is later cloned into all processes.
|
|
|
|
*
|
|
|
|
* Also called on secondary CPUs to set up the FPU state of their
|
|
|
|
* idle threads.
|
|
|
|
*/
|
|
|
|
void fpu__cpu_init(void)
|
|
|
|
{
|
|
|
|
unsigned long cr0;
|
|
|
|
unsigned long cr4_mask = 0;
|
|
|
|
|
|
|
|
#ifndef CONFIG_MATH_EMULATION
|
|
|
|
if (!cpu_has_fpu) {
|
|
|
|
pr_emerg("No FPU found and no math emulation present\n");
|
|
|
|
pr_emerg("Giving up\n");
|
|
|
|
for (;;)
|
|
|
|
asm volatile("hlt");
|
|
|
|
}
|
|
|
|
#endif
|
|
|
|
if (cpu_has_fxsr)
|
|
|
|
cr4_mask |= X86_CR4_OSFXSR;
|
|
|
|
if (cpu_has_xmm)
|
|
|
|
cr4_mask |= X86_CR4_OSXMMEXCPT;
|
|
|
|
if (cr4_mask)
|
|
|
|
cr4_set_bits(cr4_mask);
|
|
|
|
|
|
|
|
cr0 = read_cr0();
|
|
|
|
cr0 &= ~(X86_CR0_TS|X86_CR0_EM); /* clear TS and EM */
|
|
|
|
if (!cpu_has_fpu)
|
|
|
|
cr0 |= X86_CR0_EM;
|
|
|
|
write_cr0(cr0);
|
|
|
|
|
|
|
|
|
|
|
|
mxcsr_feature_mask_init();
|
|
|
|
xsave_init();
|
|
|
|
eager_fpu_init();
|
|
|
|
}
|
2015-04-22 16:36:14 +07:00
|
|
|
|
|
|
|
static int __init no_387(char *s)
|
|
|
|
{
|
|
|
|
setup_clear_cpu_cap(X86_FEATURE_FPU);
|
|
|
|
return 1;
|
|
|
|
}
|
|
|
|
|
|
|
|
__setup("no387", no_387);
|
|
|
|
|
|
|
|
/*
|
|
|
|
* Set the X86_FEATURE_FPU CPU-capability bit based on
|
|
|
|
* trying to execute an actual sequence of FPU instructions:
|
|
|
|
*/
|
|
|
|
void fpu__detect(struct cpuinfo_x86 *c)
|
|
|
|
{
|
|
|
|
unsigned long cr0;
|
|
|
|
u16 fsw, fcw;
|
|
|
|
|
|
|
|
fsw = fcw = 0xffff;
|
|
|
|
|
|
|
|
cr0 = read_cr0();
|
|
|
|
cr0 &= ~(X86_CR0_TS | X86_CR0_EM);
|
|
|
|
write_cr0(cr0);
|
|
|
|
|
|
|
|
asm volatile("fninit ; fnstsw %0 ; fnstcw %1"
|
|
|
|
: "+m" (fsw), "+m" (fcw));
|
|
|
|
|
|
|
|
if (fsw == 0 && (fcw & 0x103f) == 0x003f)
|
|
|
|
set_cpu_cap(c, X86_FEATURE_FPU);
|
|
|
|
else
|
|
|
|
clear_cpu_cap(c, X86_FEATURE_FPU);
|
|
|
|
|
2015-04-25 09:29:26 +07:00
|
|
|
/* The final cr0 value is set later, in fpu_init() */
|
|
|
|
|
|
|
|
fpstate_xstate_init_size();
|
2015-04-22 16:36:14 +07:00
|
|
|
}
|