mirror of
https://github.com/AuxXxilium/linux_dsm_epyc7002.git
synced 2024-12-01 13:46:42 +07:00
464d1a78fb
Convert the PDA code to use %fs rather than %gs as the segment for per-processor data. This is because some processors show a small but measurable performance gain for reloading a NULL segment selector (as %fs generally is in user-space) versus a non-NULL one (as %gs generally is). On modern processors the difference is very small, perhaps undetectable. Some old AMD "K6 3D+" processors are noticeably slower when %fs is used rather than %gs; I have no idea why this might be, but I think they're sufficiently rare that it doesn't matter much. This patch also fixes the math emulator, which had not been adjusted to match the changed struct pt_regs. [frederik.deweerdt@gmail.com: fixit with gdb] [mingo@elte.hu: Fix KVM too] Signed-off-by: Jeremy Fitzhardinge <jeremy@xensource.com> Signed-off-by: Andi Kleen <ak@suse.de> Cc: Ian Campbell <Ian.Campbell@XenSource.com> Acked-by: Ingo Molnar <mingo@elte.hu> Acked-by: Zachary Amsden <zach@vmware.com> Cc: Eric Dumazet <dada1@cosmosbay.com> Signed-off-by: Frederik Deweerdt <frederik.deweerdt@gmail.com> Signed-off-by: Andrew Morton <akpm@osdl.org>
115 lines
3.5 KiB
C
115 lines
3.5 KiB
C
/*
 * Generate definitions needed by assembly language modules.
 * This code generates raw asm output which is post-processed
 * to extract and format the required data.
 */
|
|
|
|
#include <linux/crypto.h>
|
|
#include <linux/sched.h>
|
|
#include <linux/signal.h>
|
|
#include <linux/personality.h>
|
|
#include <linux/suspend.h>
|
|
#include <asm/ucontext.h>
|
|
#include "sigframe.h"
|
|
#include <asm/fixmap.h>
|
|
#include <asm/processor.h>
|
|
#include <asm/thread_info.h>
|
|
#include <asm/elf.h>
|
|
#include <asm/pda.h>
|
|
|
|
/*
 * DEFINE(name, value) - emit one "->" marker line into the asm output.
 *
 * The emitted text is a newline, "->", the stringified symbol name, the
 * operand %0 (bound to `value` through an "i" input constraint), and the
 * stringified `value` expression as written by the caller.
 *
 * The macro deliberately carries no trailing semicolon; the caller
 * terminates the statement.
 */
#define DEFINE(name, value) \
	asm volatile("\n->" #name " %0 " #value : : "i" (value))
|
|
|
|
/*
 * BLANK() - emit a bare "->" marker line (no symbol name, no operand)
 * into the asm output.
 */
#define BLANK() \
	asm volatile("\n->" : : )
|
|
|
|
/*
 * OFFSET(sym, str, mem) - emit, under the symbol name `sym`, the byte
 * offset of member `mem` within `struct str`.
 *
 * This is a thin wrapper that forwards to DEFINE() with
 * offsetof(struct str, mem) as the value.
 *
 * The expansion intentionally does NOT end in a semicolon: the caller
 * writes `OFFSET(...);`. A semicolon inside the macro would turn every
 * use into two statements (the real one plus an empty one), which breaks
 * un-braced `if (...) OFFSET(...); else ...` constructs.
 */
#define OFFSET(sym, str, mem) \
	DEFINE(sym, offsetof(struct str, mem))
|
|
|
|
void foo(void)
|
|
{
|
|
OFFSET(SIGCONTEXT_eax, sigcontext, eax);
|
|
OFFSET(SIGCONTEXT_ebx, sigcontext, ebx);
|
|
OFFSET(SIGCONTEXT_ecx, sigcontext, ecx);
|
|
OFFSET(SIGCONTEXT_edx, sigcontext, edx);
|
|
OFFSET(SIGCONTEXT_esi, sigcontext, esi);
|
|
OFFSET(SIGCONTEXT_edi, sigcontext, edi);
|
|
OFFSET(SIGCONTEXT_ebp, sigcontext, ebp);
|
|
OFFSET(SIGCONTEXT_esp, sigcontext, esp);
|
|
OFFSET(SIGCONTEXT_eip, sigcontext, eip);
|
|
BLANK();
|
|
|
|
OFFSET(CPUINFO_x86, cpuinfo_x86, x86);
|
|
OFFSET(CPUINFO_x86_vendor, cpuinfo_x86, x86_vendor);
|
|
OFFSET(CPUINFO_x86_model, cpuinfo_x86, x86_model);
|
|
OFFSET(CPUINFO_x86_mask, cpuinfo_x86, x86_mask);
|
|
OFFSET(CPUINFO_hard_math, cpuinfo_x86, hard_math);
|
|
OFFSET(CPUINFO_cpuid_level, cpuinfo_x86, cpuid_level);
|
|
OFFSET(CPUINFO_x86_capability, cpuinfo_x86, x86_capability);
|
|
OFFSET(CPUINFO_x86_vendor_id, cpuinfo_x86, x86_vendor_id);
|
|
BLANK();
|
|
|
|
OFFSET(TI_task, thread_info, task);
|
|
OFFSET(TI_exec_domain, thread_info, exec_domain);
|
|
OFFSET(TI_flags, thread_info, flags);
|
|
OFFSET(TI_status, thread_info, status);
|
|
OFFSET(TI_preempt_count, thread_info, preempt_count);
|
|
OFFSET(TI_addr_limit, thread_info, addr_limit);
|
|
OFFSET(TI_restart_block, thread_info, restart_block);
|
|
OFFSET(TI_sysenter_return, thread_info, sysenter_return);
|
|
BLANK();
|
|
|
|
OFFSET(GDS_size, Xgt_desc_struct, size);
|
|
OFFSET(GDS_address, Xgt_desc_struct, address);
|
|
OFFSET(GDS_pad, Xgt_desc_struct, pad);
|
|
BLANK();
|
|
|
|
OFFSET(PT_EBX, pt_regs, ebx);
|
|
OFFSET(PT_ECX, pt_regs, ecx);
|
|
OFFSET(PT_EDX, pt_regs, edx);
|
|
OFFSET(PT_ESI, pt_regs, esi);
|
|
OFFSET(PT_EDI, pt_regs, edi);
|
|
OFFSET(PT_EBP, pt_regs, ebp);
|
|
OFFSET(PT_EAX, pt_regs, eax);
|
|
OFFSET(PT_DS, pt_regs, xds);
|
|
OFFSET(PT_ES, pt_regs, xes);
|
|
OFFSET(PT_FS, pt_regs, xfs);
|
|
OFFSET(PT_ORIG_EAX, pt_regs, orig_eax);
|
|
OFFSET(PT_EIP, pt_regs, eip);
|
|
OFFSET(PT_CS, pt_regs, xcs);
|
|
OFFSET(PT_EFLAGS, pt_regs, eflags);
|
|
OFFSET(PT_OLDESP, pt_regs, esp);
|
|
OFFSET(PT_OLDSS, pt_regs, xss);
|
|
BLANK();
|
|
|
|
OFFSET(EXEC_DOMAIN_handler, exec_domain, handler);
|
|
OFFSET(RT_SIGFRAME_sigcontext, rt_sigframe, uc.uc_mcontext);
|
|
BLANK();
|
|
|
|
OFFSET(pbe_address, pbe, address);
|
|
OFFSET(pbe_orig_address, pbe, orig_address);
|
|
OFFSET(pbe_next, pbe, next);
|
|
|
|
/* Offset from the sysenter stack to tss.esp0 */
|
|
DEFINE(TSS_sysenter_esp0, offsetof(struct tss_struct, esp0) -
|
|
sizeof(struct tss_struct));
|
|
|
|
DEFINE(PAGE_SIZE_asm, PAGE_SIZE);
|
|
DEFINE(VDSO_PRELINK, VDSO_PRELINK);
|
|
|
|
OFFSET(crypto_tfm_ctx_offset, crypto_tfm, __crt_ctx);
|
|
|
|
BLANK();
|
|
OFFSET(PDA_cpu, i386_pda, cpu_number);
|
|
OFFSET(PDA_pcurrent, i386_pda, pcurrent);
|
|
|
|
#ifdef CONFIG_PARAVIRT
|
|
BLANK();
|
|
OFFSET(PARAVIRT_enabled, paravirt_ops, paravirt_enabled);
|
|
OFFSET(PARAVIRT_irq_disable, paravirt_ops, irq_disable);
|
|
OFFSET(PARAVIRT_irq_enable, paravirt_ops, irq_enable);
|
|
OFFSET(PARAVIRT_irq_enable_sysexit, paravirt_ops, irq_enable_sysexit);
|
|
OFFSET(PARAVIRT_iret, paravirt_ops, iret);
|
|
OFFSET(PARAVIRT_read_cr0, paravirt_ops, read_cr0);
|
|
#endif
|
|
}
|