2019-05-29 00:10:25 +07:00
|
|
|
/* SPDX-License-Identifier: GPL-2.0-only */
|
2008-10-23 12:26:29 +07:00
|
|
|
#ifndef _ASM_X86_APIC_H
|
|
|
|
#define _ASM_X86_APIC_H
|
2008-01-30 19:30:15 +07:00
|
|
|
|
2009-02-17 19:52:29 +07:00
|
|
|
#include <linux/cpumask.h>
|
x86: APIC: remove apic_write_around(); use alternatives
Use alternatives to select the workaround for the 11AP Pentium erratum
for the affected steppings on the fly rather than build time. Remove the
X86_GOOD_APIC configuration option and replace all the calls to
apic_write_around() with plain apic_write(), protecting accesses to the
ESR as appropriate due to the 3AP Pentium erratum. Remove
apic_read_around() and all its invocations altogether as not needed.
Remove apic_write_atomic() and all its implementing backends. The use of
ASM_OUTPUT2() is not strictly needed for input constraints, but I have
used it for readability's sake.
I had the feeling no one else was brave enough to do it, so I went ahead
and here it is. Verified by checking the generated assembly and tested
with both a 32-bit and a 64-bit configuration, also with the 11AP
"feature" forced on and verified with gdb on /proc/kcore to work as
expected (as an 11AP machines are quite hard to get hands on these days).
Some script complained about the use of "volatile", but apic_write() needs
it for the same reason and is effectively a replacement for writel(), so I
have disregarded it.
I am not sure what the policy wrt defconfig files is, they are generated
and there is risk of a conflict resulting from an unrelated change, so I
have left changes to them out. The option will get removed from them at
the next run.
Some testing with machines other than mine will be needed to avoid some
stupid mistake, but despite its volume, the change is not really that
intrusive, so I am fairly confident that because it works for me, it will
everywhere.
Signed-off-by: Maciej W. Rozycki <macro@linux-mips.org>
Signed-off-by: Ingo Molnar <mingo@elte.hu>
2008-07-17 01:15:30 +07:00
|
|
|
|
|
|
|
#include <asm/alternative.h>
|
2009-02-17 19:52:29 +07:00
|
|
|
#include <asm/cpufeature.h>
|
|
|
|
#include <asm/apicdef.h>
|
2011-07-27 06:09:06 +07:00
|
|
|
#include <linux/atomic.h>
|
2009-02-17 19:52:29 +07:00
|
|
|
#include <asm/fixmap.h>
|
|
|
|
#include <asm/mpspec.h>
|
2008-07-11 01:16:52 +07:00
|
|
|
#include <asm/msr.h>
|
2018-07-29 18:06:04 +07:00
|
|
|
#include <asm/hardirq.h>
|
2008-01-30 19:30:15 +07:00
|
|
|
|
|
|
|
#define ARCH_APICTIMER_STOPS_ON_C3 1
|
|
|
|
|
|
|
|
/*
|
|
|
|
* Debugging macros
|
|
|
|
*/
|
|
|
|
#define APIC_QUIET 0
|
|
|
|
#define APIC_VERBOSE 1
|
|
|
|
#define APIC_DEBUG 2
|
|
|
|
|
2015-12-14 17:19:12 +07:00
|
|
|
/* Macros for apic_extnmi which controls external NMI masking */
|
|
|
|
#define APIC_EXTNMI_BSP 0 /* Default */
|
|
|
|
#define APIC_EXTNMI_ALL 1
|
|
|
|
#define APIC_EXTNMI_NONE 2
|
|
|
|
|
2008-01-30 19:30:15 +07:00
|
|
|
/*
|
|
|
|
* Define the default level of output to be very little
|
|
|
|
* This can be turned up by using apic=verbose for more
|
|
|
|
* information and apic=debug for _lots_ of information.
|
|
|
|
* apic_verbosity is defined in apic.c
|
|
|
|
*/
|
|
|
|
/*
 * Conditional printk(): the message is emitted only when its level @v does
 * not exceed the current apic_verbosity.  @s is the format string and any
 * further arguments are forwarded to printk() unchanged.
 */
#define apic_printk(v, s, a...)				\
do {							\
	if (apic_verbosity >= (v))			\
		printk(s, ##a);				\
} while (0)
|
|
|
|
|
|
|
|
|
2009-02-11 17:27:39 +07:00
|
|
|
/*
 * generic_apic_probe() is an external function only when both
 * CONFIG_X86_LOCAL_APIC and CONFIG_X86_32 are set; every other
 * configuration gets an empty inline stub.
 */
#if !defined(CONFIG_X86_LOCAL_APIC) || !defined(CONFIG_X86_32)
static inline void generic_apic_probe(void) { }
#else
extern void generic_apic_probe(void);
#endif
|
2008-01-30 19:30:15 +07:00
|
|
|
|
|
|
|
#ifdef CONFIG_X86_LOCAL_APIC
|
|
|
|
|
x86/apic: Silence -Wtype-limits compiler warnings
There are many compiler warnings like this,
In file included from ./arch/x86/include/asm/smp.h:13,
from ./arch/x86/include/asm/mmzone_64.h:11,
from ./arch/x86/include/asm/mmzone.h:5,
from ./include/linux/mmzone.h:969,
from ./include/linux/gfp.h:6,
from ./include/linux/mm.h:10,
from arch/x86/kernel/apic/io_apic.c:34:
arch/x86/kernel/apic/io_apic.c: In function 'check_timer':
./arch/x86/include/asm/apic.h:37:11: warning: comparison of unsigned
expression >= 0 is always true [-Wtype-limits]
if ((v) <= apic_verbosity) \
^~
arch/x86/kernel/apic/io_apic.c:2160:2: note: in expansion of macro
'apic_printk'
apic_printk(APIC_QUIET, KERN_INFO "..TIMER: vector=0x%02X "
^~~~~~~~~~~
./arch/x86/include/asm/apic.h:37:11: warning: comparison of unsigned
expression >= 0 is always true [-Wtype-limits]
if ((v) <= apic_verbosity) \
^~
arch/x86/kernel/apic/io_apic.c:2207:4: note: in expansion of macro
'apic_printk'
apic_printk(APIC_QUIET, KERN_ERR "..MP-BIOS bug: "
^~~~~~~~~~~
APIC_QUIET is 0, so silence them by making apic_verbosity type int.
Signed-off-by: Qian Cai <cai@lca.pw>
Signed-off-by: Thomas Gleixner <tglx@linutronix.de>
Link: https://lkml.kernel.org/r/1562621805-24789-1-git-send-email-cai@lca.pw
2019-07-09 04:36:45 +07:00
|
|
|
extern int apic_verbosity;
|
2008-01-30 19:30:15 +07:00
|
|
|
extern int local_apic_timer_c2_ok;
|
|
|
|
|
2008-06-21 06:11:20 +07:00
|
|
|
extern int disable_apic;
|
2019-05-09 12:54:16 +07:00
|
|
|
extern unsigned int lapic_timer_period;
|
2009-01-28 23:16:25 +07:00
|
|
|
|
2017-09-13 16:12:49 +07:00
|
|
|
/*
 * Identifiers for the interrupt mode recorded in apic_intr_mode.
 *
 * The enum is defined before the variable is declared: ISO C does not allow
 * "enum tag" to be used as a type before the enumerator list has been seen,
 * so the reverse order only builds as a compiler extension.
 */
enum apic_intr_mode_id {
	APIC_PIC,
	APIC_VIRTUAL_WIRE,
	APIC_VIRTUAL_WIRE_NO_CONFIG,
	APIC_SYMMETRIC_IO,
	APIC_SYMMETRIC_IO_NO_ROUTING
};

extern enum apic_intr_mode_id apic_intr_mode;
|
|
|
|
|
2009-01-28 23:16:25 +07:00
|
|
|
/*
 * __inquire_remote_apic() is declared extern when CONFIG_SMP is set;
 * otherwise it collapses to an empty inline stub.
 */
#ifndef CONFIG_SMP
static inline void __inquire_remote_apic(int apicid) { }
#else /* CONFIG_SMP */
extern void __inquire_remote_apic(int apicid);
#endif /* CONFIG_SMP */
|
|
|
|
|
|
|
|
static inline void default_inquire_remote_apic(int apicid)
|
|
|
|
{
|
|
|
|
if (apic_verbosity >= APIC_DEBUG)
|
|
|
|
__inquire_remote_apic(apicid);
|
|
|
|
}
|
|
|
|
|
2009-09-15 14:12:30 +07:00
|
|
|
/*
|
|
|
|
* With 82489DX we can't rely on apic feature bit
|
|
|
|
* retrieved via cpuid but still have to deal with
|
|
|
|
* such an apic chip so we assume that SMP configuration
|
|
|
|
* is found from MP table (64bit case uses ACPI mostly
|
|
|
|
* which set smp presence flag as well so we are safe
|
|
|
|
* to use this helper too).
|
|
|
|
*/
|
|
|
|
static inline bool apic_from_smp_config(void)
|
|
|
|
{
|
|
|
|
return smp_found_config && !disable_apic;
|
|
|
|
}
|
|
|
|
|
2008-01-30 19:30:15 +07:00
|
|
|
/*
|
|
|
|
* Basic functions accessing APICs.
|
|
|
|
*/
|
|
|
|
#ifdef CONFIG_PARAVIRT
|
|
|
|
#include <asm/paravirt.h>
|
2007-10-11 16:20:03 +07:00
|
|
|
#endif
|
2008-01-30 19:30:15 +07:00
|
|
|
|
2008-07-23 18:43:14 +07:00
|
|
|
extern int setup_profiling_timer(unsigned int);
|
2008-03-20 14:41:16 +07:00
|
|
|
|
2008-07-11 01:16:49 +07:00
|
|
|
/*
 * Store @v into the memory-mapped local APIC register located @reg bytes
 * above APIC_BASE.  The store goes through alternative_io(): a plain "movl"
 * by default, with "xchgl" as the alternative selected by X86_BUG_11AP.
 */
static inline void native_apic_mem_write(u32 reg, u32 v)
{
	volatile u32 *reg_ptr = (volatile u32 *)(APIC_BASE + reg);

	alternative_io("movl %0, %P1", "xchgl %0, %P1", X86_BUG_11AP,
		       ASM_OUTPUT2("=r" (v), "=m" (*reg_ptr)),
		       ASM_OUTPUT2("0" (v), "m" (*reg_ptr)));
}
|
|
|
|
|
2008-07-11 01:16:49 +07:00
|
|
|
/*
 * Load the memory-mapped local APIC register located @reg bytes above
 * APIC_BASE, using a volatile access.
 */
static inline u32 native_apic_mem_read(u32 reg)
{
	volatile u32 *reg_ptr = (volatile u32 *)(APIC_BASE + reg);

	return *reg_ptr;
}
|
|
|
|
|
2009-02-17 14:02:14 +07:00
|
|
|
extern void native_apic_wait_icr_idle(void);
|
|
|
|
extern u32 native_safe_apic_wait_icr_idle(void);
|
|
|
|
extern void native_apic_icr_write(u32 low, u32 id);
|
|
|
|
extern u64 native_apic_icr_read(void);
|
|
|
|
|
2015-01-16 04:22:09 +07:00
|
|
|
static inline bool apic_is_x2apic_enabled(void)
|
|
|
|
{
|
|
|
|
u64 msr;
|
|
|
|
|
|
|
|
if (rdmsrl_safe(MSR_IA32_APICBASE, &msr))
|
|
|
|
return false;
|
|
|
|
return msr & X2APIC_ENABLE;
|
|
|
|
}
|
|
|
|
|
2015-09-28 17:26:31 +07:00
|
|
|
extern void enable_IR_x2apic(void);
|
|
|
|
|
|
|
|
extern int get_physical_broadcast(void);
|
|
|
|
|
|
|
|
extern int lapic_get_maxlvt(void);
|
|
|
|
extern void clear_local_APIC(void);
|
|
|
|
extern void disconnect_bsp_APIC(int virt_wire_setup);
|
|
|
|
extern void disable_local_APIC(void);
|
2019-07-24 22:25:52 +07:00
|
|
|
extern void apic_soft_disable(void);
|
2015-09-28 17:26:31 +07:00
|
|
|
extern void lapic_shutdown(void);
|
|
|
|
extern void sync_Arb_IDs(void);
|
2017-11-28 21:53:50 +07:00
|
|
|
extern void init_bsp_APIC(void);
|
2017-09-13 16:12:45 +07:00
|
|
|
extern void apic_intr_mode_init(void);
|
2015-09-28 17:26:31 +07:00
|
|
|
extern void init_apic_mappings(void);
|
|
|
|
void register_lapic_address(unsigned long address);
|
|
|
|
extern void setup_boot_APIC_clock(void);
|
|
|
|
extern void setup_secondary_APIC_clock(void);
|
2016-07-14 22:22:55 +07:00
|
|
|
extern void lapic_update_tsc_freq(void);
|
2015-09-28 17:26:31 +07:00
|
|
|
|
|
|
|
/*
 * apic_force_enable() is an external function unless CONFIG_X86_64 is set,
 * in which case it is stubbed out here and always returns -1.
 */
#ifndef CONFIG_X86_64
extern int apic_force_enable(unsigned long addr);
#else
static inline int apic_force_enable(unsigned long addr)
{
	return -1;
}
#endif
|
|
|
|
|
|
|
|
extern void apic_ap_setup(void);
|
|
|
|
|
|
|
|
/*
|
|
|
|
* On 32bit this is mach-xxx local
|
|
|
|
*/
|
|
|
|
#ifndef CONFIG_X86_64
/* Inline stub used when CONFIG_X86_64 is not set: always reports 0. */
static inline int apic_is_clustered_box(void) { return 0; }
#else
extern int apic_is_clustered_box(void);
#endif
|
|
|
|
|
|
|
|
extern int setup_APIC_eilvt(u8 lvt_off, u8 vector, u8 msg_type, u8 mask);
|
2017-09-14 04:29:38 +07:00
|
|
|
extern void lapic_assign_system_vectors(void);
|
|
|
|
extern void lapic_assign_legacy_vector(unsigned int isairq, bool replace);
|
|
|
|
extern void lapic_online(void);
|
|
|
|
extern void lapic_offline(void);
|
2019-06-28 14:23:07 +07:00
|
|
|
extern bool apic_needs_pit(void);
|
2015-09-28 17:26:31 +07:00
|
|
|
|
2019-07-23 01:47:23 +07:00
|
|
|
extern void apic_send_IPI_allbutself(unsigned int vector);
|
|
|
|
|
2015-09-28 17:26:31 +07:00
|
|
|
#else /* !CONFIG_X86_LOCAL_APIC */
|
|
|
|
/*
 * Stand-ins used when CONFIG_X86_LOCAL_APIC is not set: constant and alias
 * macros first, then the inline stubs.
 */
#define local_apic_timer_c2_ok		1
# define setup_boot_APIC_clock		x86_init_noop
# define setup_secondary_APIC_clock	x86_init_noop

/* Empty no-op stubs. */
static inline void lapic_shutdown(void) { }
static inline void init_apic_mappings(void) { }
static inline void disable_local_APIC(void) { }
static inline void lapic_update_tsc_freq(void) { }
static inline void init_bsp_APIC(void) { }
static inline void apic_intr_mode_init(void) { }
static inline void lapic_assign_system_vectors(void) { }
static inline void lapic_assign_legacy_vector(unsigned int i, bool r) { }

/* This stub always returns true. */
static inline bool apic_needs_pit(void)
{
	return true;
}
|
2015-09-28 17:26:31 +07:00
|
|
|
#endif /* !CONFIG_X86_LOCAL_APIC */
|
|
|
|
|
2009-04-03 16:15:50 +07:00
|
|
|
#ifdef CONFIG_X86_X2APIC
|
2009-03-18 01:16:54 +07:00
|
|
|
/*
|
|
|
|
* Make previous memory operations globally visible before
|
|
|
|
* sending the IPI through x2apic wrmsr. We need a serializing instruction or
|
|
|
|
* mfence for this.
|
|
|
|
*/
|
|
|
|
static inline void x2apic_wrmsr_fence(void)
|
|
|
|
{
|
|
|
|
asm volatile("mfence" : : : "memory");
|
|
|
|
}
|
|
|
|
|
2008-07-11 01:16:52 +07:00
|
|
|
/*
 * Write @v to the MSR at APIC_BASE_MSR + (@reg >> 4), with the high half of
 * the MSR set to 0.  Writes to APIC_DFR, APIC_ID, APIC_LDR and APIC_LVR are
 * silently dropped.
 */
static inline void native_apic_msr_write(u32 reg, u32 v)
{
	if (reg != APIC_DFR && reg != APIC_ID &&
	    reg != APIC_LDR && reg != APIC_LVR)
		wrmsr(APIC_BASE_MSR + (reg >> 4), v, 0);
}
|
|
|
|
|
2012-05-16 23:03:58 +07:00
|
|
|
/*
 * Write APIC_EOI_ACK to the MSR that corresponds to APIC_EOI.
 * Both @reg and @v are ignored; the target MSR and value are fixed.
 */
static inline void native_apic_msr_eoi_write(u32 reg, u32 v)
{
	const u32 eoi_msr = APIC_BASE_MSR + (APIC_EOI >> 4);

	__wrmsr(eoi_msr, APIC_EOI_ACK, 0);
}
|
|
|
|
|
2008-07-11 01:16:52 +07:00
|
|
|
/*
 * Read the MSR at APIC_BASE_MSR + (@reg >> 4) and return its low 32 bits.
 * APIC_DFR is never read from an MSR; (u32)-1 is returned for it instead.
 */
static inline u32 native_apic_msr_read(u32 reg)
{
	u64 val;

	if (reg == APIC_DFR)
		return (u32)-1;

	rdmsrl(APIC_BASE_MSR + (reg >> 4), val);

	return (u32)val;
}
|
|
|
|
|
2009-02-17 14:02:14 +07:00
|
|
|
/* No need to wait for ICR idle in x2apic mode, so this is a no-op. */
static inline void native_x2apic_wait_icr_idle(void) { }
|
|
|
|
|
|
|
|
/*
 * No need to wait for ICR idle in x2apic mode: returns 0 immediately.
 */
static inline u32 native_safe_x2apic_wait_icr_idle(void)
{
	return 0;
}
|
|
|
|
|
|
|
|
/*
 * Write the ICR as one 64-bit MSR value: @id goes in the upper 32 bits and
 * @low in the lower 32 bits.
 */
static inline void native_x2apic_icr_write(u32 low, u32 id)
{
	u64 icr = ((__u64) id) << 32 | low;

	wrmsrl(APIC_BASE_MSR + (APIC_ICR >> 4), icr);
}
|
|
|
|
|
|
|
|
static inline u64 native_x2apic_icr_read(void)
|
|
|
|
{
|
|
|
|
unsigned long val;
|
|
|
|
|
|
|
|
rdmsrl(APIC_BASE_MSR + (APIC_ICR >> 4), val);
|
|
|
|
return val;
|
|
|
|
}
|
|
|
|
|
2015-01-16 04:22:11 +07:00
|
|
|
extern int x2apic_mode;
|
2009-04-21 03:02:27 +07:00
|
|
|
extern int x2apic_phys;
|
2015-01-16 04:22:17 +07:00
|
|
|
extern void __init check_x2apic(void);
|
2015-01-16 04:22:26 +07:00
|
|
|
extern void x2apic_setup(void);
|
2008-09-04 06:58:31 +07:00
|
|
|
static inline int x2apic_enabled(void)
|
|
|
|
{
|
2016-03-29 22:41:57 +07:00
|
|
|
return boot_cpu_has(X86_FEATURE_X2APIC) && apic_is_x2apic_enabled();
|
2008-09-04 06:58:31 +07:00
|
|
|
}
|
2009-04-21 03:02:27 +07:00
|
|
|
|
2016-03-29 22:41:57 +07:00
|
|
|
#define x2apic_supported() (boot_cpu_has(X86_FEATURE_X2APIC))
|
2015-09-28 17:26:31 +07:00
|
|
|
#else /* !CONFIG_X86_X2APIC */
|
2015-01-16 04:22:19 +07:00
|
|
|
/*
 * Stand-ins used when CONFIG_X86_X2APIC is not set: x2apic is reported as
 * neither supported nor enabled, and the setup hooks are empty.
 */
#define x2apic_mode		(0)
#define	x2apic_supported()	(0)

static inline int x2apic_enabled(void)
{
	return 0;
}

static inline void check_x2apic(void) { }
static inline void x2apic_setup(void) { }
|
2015-09-28 17:26:31 +07:00
|
|
|
#endif /* !CONFIG_X86_X2APIC */
|
2008-01-30 19:30:15 +07:00
|
|
|
|
2017-06-20 06:37:44 +07:00
|
|
|
struct irq_data;
|
|
|
|
|
2009-02-17 19:52:29 +07:00
|
|
|
/*
|
|
|
|
* Copyright 2004 James Cleverdon, IBM.
|
|
|
|
*
|
|
|
|
* Generic APIC sub-arch data struct.
|
|
|
|
*
|
|
|
|
* Hacked for x86-64 by James Cleverdon from i386 architecture code by
|
|
|
|
* Martin Bligh, Andi Kleen, James Bottomley, John Stultz, and
|
|
|
|
* James Cleverdon.
|
|
|
|
*/
|
2009-02-17 22:28:46 +07:00
|
|
|
struct apic {
|
2017-09-14 04:29:23 +07:00
|
|
|
/* Hotpath functions first */
|
|
|
|
void (*eoi_write)(u32 reg, u32 v);
|
|
|
|
void (*native_eoi_write)(u32 reg, u32 v);
|
|
|
|
void (*write)(u32 reg, u32 v);
|
|
|
|
u32 (*read)(u32 reg);
|
|
|
|
|
|
|
|
/* IPI related functions */
|
|
|
|
void (*wait_icr_idle)(void);
|
|
|
|
u32 (*safe_wait_icr_idle)(void);
|
|
|
|
|
|
|
|
void (*send_IPI)(int cpu, int vector);
|
|
|
|
void (*send_IPI_mask)(const struct cpumask *mask, int vector);
|
|
|
|
void (*send_IPI_mask_allbutself)(const struct cpumask *msk, int vec);
|
|
|
|
void (*send_IPI_allbutself)(int vector);
|
|
|
|
void (*send_IPI_all)(int vector);
|
|
|
|
void (*send_IPI_self)(int vector);
|
|
|
|
|
|
|
|
/* dest_logical is used by the IPI functions */
|
|
|
|
u32 dest_logical;
|
|
|
|
u32 disable_esr;
|
|
|
|
u32 irq_delivery_mode;
|
|
|
|
u32 irq_dest_mode;
|
|
|
|
|
2017-09-14 04:29:37 +07:00
|
|
|
u32 (*calc_dest_apicid)(unsigned int cpu);
|
2017-09-14 04:29:23 +07:00
|
|
|
|
|
|
|
/* ICR related functions */
|
|
|
|
u64 (*icr_read)(void);
|
|
|
|
void (*icr_write)(u32 low, u32 high);
|
|
|
|
|
|
|
|
/* Probe, setup and smpboot functions */
|
|
|
|
int (*probe)(void);
|
|
|
|
int (*acpi_madt_oem_check)(char *oem_id, char *oem_table_id);
|
2018-04-10 08:16:06 +07:00
|
|
|
int (*apic_id_valid)(u32 apicid);
|
2017-09-14 04:29:23 +07:00
|
|
|
int (*apic_id_registered)(void);
|
|
|
|
|
|
|
|
bool (*check_apicid_used)(physid_mask_t *map, int apicid);
|
|
|
|
void (*init_apic_ldr)(void);
|
|
|
|
void (*ioapic_phys_id_map)(physid_mask_t *phys_map, physid_mask_t *retmap);
|
|
|
|
void (*setup_apic_routing)(void);
|
|
|
|
int (*cpu_present_to_apicid)(int mps_cpu);
|
|
|
|
void (*apicid_to_cpu_present)(int phys_apicid, physid_mask_t *retmap);
|
|
|
|
int (*check_phys_apicid_present)(int phys_apicid);
|
|
|
|
int (*phys_pkg_id)(int cpuid_apic, int index_msb);
|
|
|
|
|
|
|
|
u32 (*get_apic_id)(unsigned long x);
|
|
|
|
u32 (*set_apic_id)(unsigned int id);
|
2009-02-17 19:52:29 +07:00
|
|
|
|
|
|
|
/* wakeup_secondary_cpu */
|
2017-09-14 04:29:23 +07:00
|
|
|
int (*wakeup_secondary_cpu)(int apicid, unsigned long start_eip);
|
2009-02-17 19:52:29 +07:00
|
|
|
|
2017-09-14 04:29:23 +07:00
|
|
|
void (*inquire_remote_apic)(int apicid);
|
2011-01-23 20:37:33 +07:00
|
|
|
|
|
|
|
#ifdef CONFIG_X86_32
|
|
|
|
/*
|
|
|
|
* Called very early during boot from get_smp_config(). It should
|
|
|
|
* return the logical apicid. x86_[bios]_cpu_to_apicid is
|
|
|
|
* initialized before this function is called.
|
|
|
|
*
|
|
|
|
* If logical apicid can't be determined that early, the function
|
|
|
|
* may return BAD_APICID. Logical apicid will be configured after
|
|
|
|
* init_apic_ldr() while bringing up CPUs. Note that NUMA affinity
|
|
|
|
* won't be applied properly during early boot in this case.
|
|
|
|
*/
|
|
|
|
int (*x86_32_early_logical_apicid)(int cpu);
|
|
|
|
#endif
|
2017-09-14 04:29:23 +07:00
|
|
|
char *name;
|
2009-02-17 19:52:29 +07:00
|
|
|
};
|
|
|
|
|
2009-02-26 18:47:40 +07:00
|
|
|
/*
|
|
|
|
* Pointer to the local APIC driver in use on this system (there's
|
|
|
|
* always just one such driver in use - the kernel decides via an
|
|
|
|
* early probing process which one it picks - and then sticks to it):
|
|
|
|
*/
|
2009-02-17 22:28:46 +07:00
|
|
|
extern struct apic *apic;
|
2009-02-26 18:47:40 +07:00
|
|
|
|
2011-05-21 07:51:17 +07:00
|
|
|
/*
|
|
|
|
* APIC drivers are probed based on how they are listed in the .apicdrivers
|
|
|
|
* section. So the order is important and enforced by the ordering
|
|
|
|
* of different apic driver files in the Makefile.
|
|
|
|
*
|
|
|
|
* For the files having two apic drivers, we use apic_drivers()
|
|
|
|
* to enforce the order within them.
|
|
|
|
*/
|
|
|
|
/*
 * Register a single APIC driver: emits a static pointer to @sym, aligned to
 * pointer size, into the .apicdrivers section.
 */
#define apic_driver(sym)						\
	static const struct apic *__apicdrivers_##sym			\
		__used __aligned(sizeof(struct apic *))			\
		__section(.apicdrivers) = { &sym }
|
|
|
|
|
|
|
|
/*
 * Register two APIC drivers from one file: emits a two-element static array
 * { &sym1, &sym2 } into the .apicdrivers section, so @sym1 is listed ahead
 * of @sym2.
 */
#define apic_drivers(sym1, sym2)					\
	static struct apic *__apicdrivers_##sym1##sym2[2]		\
		__used __aligned(sizeof(struct apic *))			\
		__section(.apicdrivers) = { &sym1, &sym2 }
|
|
|
|
|
|
|
|
extern struct apic *__apicdrivers[], *__apicdrivers_end[];
|
|
|
|
|
2009-02-26 18:47:40 +07:00
|
|
|
/*
|
|
|
|
* APIC functionality to boot other CPUs - only used on SMP:
|
|
|
|
*/
|
|
|
|
#ifdef CONFIG_SMP
|
2009-02-26 11:50:49 +07:00
|
|
|
extern int wakeup_secondary_cpu_via_nmi(int apicid, unsigned long start_eip);
|
2017-09-14 04:29:53 +07:00
|
|
|
extern int lapic_can_unplug_cpu(void);
|
2009-02-26 18:47:40 +07:00
|
|
|
#endif
|
2009-02-17 19:52:29 +07:00
|
|
|
|
2010-03-17 17:37:00 +07:00
|
|
|
#ifdef CONFIG_X86_LOCAL_APIC
|
2011-12-13 09:51:53 +07:00
|
|
|
|
2009-02-17 19:52:29 +07:00
|
|
|
/* Read APIC register @reg through the active driver's ->read() callback. */
static inline u32 apic_read(u32 reg)
{
	u32 val = apic->read(reg);

	return val;
}
|
|
|
|
|
|
|
|
/* Write @val to APIC register @reg through the driver's ->write() callback. */
static inline void apic_write(u32 reg, u32 val)
{
	(*apic->write)(reg, val);
}
|
|
|
|
|
2012-05-16 23:03:52 +07:00
|
|
|
static inline void apic_eoi(void)
|
|
|
|
{
|
|
|
|
apic->eoi_write(APIC_EOI, APIC_EOI_ACK);
|
|
|
|
}
|
|
|
|
|
2009-02-17 19:52:29 +07:00
|
|
|
static inline u64 apic_icr_read(void)
|
|
|
|
{
|
|
|
|
return apic->icr_read();
|
|
|
|
}
|
|
|
|
|
|
|
|
/* Pass @low and @high to the driver's ->icr_write() callback. */
static inline void apic_icr_write(u32 low, u32 high)
{
	(*apic->icr_write)(low, high);
}
|
|
|
|
|
|
|
|
static inline void apic_wait_icr_idle(void)
|
|
|
|
{
|
|
|
|
apic->wait_icr_idle();
|
|
|
|
}
|
|
|
|
|
|
|
|
static inline u32 safe_apic_wait_icr_idle(void)
|
|
|
|
{
|
|
|
|
return apic->safe_wait_icr_idle();
|
|
|
|
}
|
|
|
|
|
2012-07-15 19:56:46 +07:00
|
|
|
extern void __init apic_set_eoi_write(void (*eoi_write)(u32 reg, u32 v));
|
|
|
|
|
2010-03-17 17:37:00 +07:00
|
|
|
#else /* CONFIG_X86_LOCAL_APIC */
|
|
|
|
|
|
|
|
static inline u32 apic_read(u32 reg) { return 0; }
|
|
|
|
static inline void apic_write(u32 reg, u32 val) { }
|
2012-05-16 23:03:52 +07:00
|
|
|
static inline void apic_eoi(void) { }
|
2010-03-17 17:37:00 +07:00
|
|
|
static inline u64 apic_icr_read(void) { return 0; }
|
|
|
|
static inline void apic_icr_write(u32 low, u32 high) { }
|
|
|
|
static inline void apic_wait_icr_idle(void) { }
|
|
|
|
static inline u32 safe_apic_wait_icr_idle(void) { return 0; }
|
2012-07-15 19:56:46 +07:00
|
|
|
static inline void apic_set_eoi_write(void (*eoi_write)(u32 reg, u32 v)) {}
|
2010-03-17 17:37:00 +07:00
|
|
|
|
|
|
|
#endif /* CONFIG_X86_LOCAL_APIC */
|
2009-02-17 19:52:29 +07:00
|
|
|
|
2018-06-04 22:33:55 +07:00
|
|
|
extern void apic_ack_irq(struct irq_data *data);
|
|
|
|
|
2009-02-17 19:52:29 +07:00
|
|
|
/* Acknowledge an APIC interrupt; this is a plain wrapper around apic_eoi(). */
static inline void ack_APIC_irq(void)
{
	apic_eoi();
}
|
|
|
|
|
|
|
|
static inline unsigned default_get_apic_id(unsigned long x)
|
|
|
|
{
|
|
|
|
unsigned int ver = GET_APIC_VERSION(apic_read(APIC_LVR));
|
|
|
|
|
2009-06-08 20:55:09 +07:00
|
|
|
if (APIC_XAPIC(ver) || boot_cpu_has(X86_FEATURE_EXTD_APICID))
|
2009-02-17 19:52:29 +07:00
|
|
|
return (x >> 24) & 0xFF;
|
|
|
|
else
|
|
|
|
return (x >> 24) & 0x0F;
|
|
|
|
}
|
|
|
|
|
|
|
|
/*
|
2014-07-31 13:53:27 +07:00
|
|
|
* Warm reset vector position:
|
2009-02-17 19:52:29 +07:00
|
|
|
*/
|
2014-07-31 13:53:27 +07:00
|
|
|
#define TRAMPOLINE_PHYS_LOW 0x467
|
|
|
|
#define TRAMPOLINE_PHYS_HIGH 0x469
|
2009-02-17 19:52:29 +07:00
|
|
|
|
2011-09-28 22:44:54 +07:00
|
|
|
extern void generic_bigsmp_probe(void);
|
2009-02-17 19:52:29 +07:00
|
|
|
|
|
|
|
#ifdef CONFIG_X86_LOCAL_APIC
|
|
|
|
|
|
|
|
#include <asm/smp.h>
|
|
|
|
|
|
|
|
#define APIC_DFR_VALUE (APIC_DFR_FLAT)
|
|
|
|
|
x86: Add read_mostly declaration/definition to variables from smp.h
Add "read-mostly" qualifier to the following variables in
smp.h:
- cpu_sibling_map
- cpu_core_map
- cpu_llc_shared_map
- cpu_llc_id
- cpu_number
- x86_cpu_to_apicid
- x86_bios_cpu_apicid
- x86_cpu_to_logical_apicid
As long as all the variables above are only written during the
initialization, this change is meant to prevent the false
sharing. More specifically, on vSMP Foundation platform
x86_cpu_to_apicid shared the same internode_cache_line with
frequently written lapic_events.
From the analysis of the first 33 per_cpu variables out of 219
(memories they describe, to be more specific) the 8 have read_mostly
nature (tlb_vector_offset, cpu_loops_per_jiffy, xen_debug_irq, etc.)
and 25 are frequently written (irq_stack_union, gdt_page,
exception_stacks, idt_desc, etc.).
Assuming that the spread of the rest of the per_cpu variables is
similar, identifying the read mostly memories will make more sense
in terms of long-term code maintenance comparing to identifying
frequently written memories.
Signed-off-by: Vlad Zolotarov <vlad@scalemp.com>
Acked-by: Shai Fultheim <shai@scalemp.com>
Cc: Shai Fultheim (Shai@ScaleMP.com) <Shai@scalemp.com>
Cc: ido@wizery.com
Cc: Linus Torvalds <torvalds@linux-foundation.org>
Cc: Andrew Morton <akpm@linux-foundation.org>
Cc: Peter Zijlstra <a.p.zijlstra@chello.nl>
Link: http://lkml.kernel.org/r/1719258.EYKzE4Zbq5@vlad
Signed-off-by: Ingo Molnar <mingo@kernel.org>
2012-06-11 16:56:52 +07:00
|
|
|
DECLARE_EARLY_PER_CPU_READ_MOSTLY(u16, x86_bios_cpu_apicid);
|
2009-02-17 19:52:29 +07:00
|
|
|
|
2017-09-14 04:29:22 +07:00
|
|
|
extern struct apic apic_noop;
|
2009-02-17 19:52:29 +07:00
|
|
|
|
|
|
|
static inline unsigned int read_apic_id(void)
|
|
|
|
{
|
2017-09-14 04:29:22 +07:00
|
|
|
unsigned int reg = apic_read(APIC_ID);
|
2009-02-17 19:52:29 +07:00
|
|
|
|
|
|
|
return apic->get_apic_id(reg);
|
|
|
|
}
|
|
|
|
|
2018-04-10 08:16:06 +07:00
|
|
|
extern int default_apic_id_valid(u32 apicid);
|
2014-06-09 15:19:32 +07:00
|
|
|
extern int default_acpi_madt_oem_check(char *, char *);
|
2009-02-17 19:52:29 +07:00
|
|
|
extern void default_setup_apic_routing(void);
|
2017-09-14 04:29:37 +07:00
|
|
|
|
|
|
|
extern u32 apic_default_calc_apicid(unsigned int cpu);
|
|
|
|
extern u32 apic_flat_calc_apicid(unsigned int cpu);
|
|
|
|
|
2017-09-14 04:29:22 +07:00
|
|
|
extern bool default_check_apicid_used(physid_mask_t *map, int apicid);
|
|
|
|
extern void default_ioapic_phys_id_map(physid_mask_t *phys_map, physid_mask_t *retmap);
|
2009-02-17 19:52:29 +07:00
|
|
|
extern int default_cpu_present_to_apicid(int mps_cpu);
|
2009-08-31 20:18:40 +07:00
|
|
|
extern int default_check_phys_apicid_present(int phys_apicid);
|
2009-02-17 19:52:29 +07:00
|
|
|
|
|
|
|
#endif /* CONFIG_X86_LOCAL_APIC */
|
2017-09-14 04:29:22 +07:00
|
|
|
|
2018-05-29 22:50:22 +07:00
|
|
|
/*
 * With CONFIG_SMP these are external functions.  Without it,
 * apic_id_is_primary_thread() always returns false and apic_smt_update()
 * is an empty stub.
 */
#ifndef CONFIG_SMP
static inline bool apic_id_is_primary_thread(unsigned int id)
{
	return false;
}

static inline void apic_smt_update(void) { }
#else
bool apic_id_is_primary_thread(unsigned int id);
void apic_smt_update(void);
#endif
|
|
|
|
|
x86, trace: Introduce entering/exiting_irq()
When implementing tracepoints in interrupt handers, if the tracepoints are
simply added in the performance sensitive path of interrupt handers,
it may cause potential performance problem due to the time penalty.
To solve the problem, an idea is to prepare non-trace/trace irq handers and
switch their IDTs at the enabling/disabling time.
So, let's introduce entering_irq()/exiting_irq() for pre/post-
processing of each irq handler.
A way to use them is as follows.
Non-trace irq handler:
smp_irq_handler()
{
entering_irq(); /* pre-processing of this handler */
__smp_irq_handler(); /*
* common logic between non-trace and trace handlers
* in a vector.
*/
exiting_irq(); /* post-processing of this handler */
}
Trace irq_handler:
smp_trace_irq_handler()
{
entering_irq(); /* pre-processing of this handler */
trace_irq_entry(); /* tracepoint for irq entry */
__smp_irq_handler(); /*
* common logic between non-trace and trace handlers
* in a vector.
*/
trace_irq_exit(); /* tracepoint for irq exit */
exiting_irq(); /* post-processing of this handler */
}
If tracepoints can place outside entering_irq()/exiting_irq() as follows,
it looks cleaner.
smp_trace_irq_handler()
{
trace_irq_entry();
smp_irq_handler();
trace_irq_exit();
}
But it doesn't work.
The problem is with irq_enter/exit() being called. They must be called before
trace_irq_enter/exit(), because of the rcu_irq_enter() must be called before
any tracepoints are used, as tracepoints use rcu to synchronize.
As a possible alternative, we may be able to call irq_enter() first as follows
if irq_enter() can nest.
smp_trace_irq_hander()
{
irq_entry();
trace_irq_entry();
smp_irq_handler();
trace_irq_exit();
irq_exit();
}
But it doesn't work, either.
If irq_enter() is nested, it may have a time penalty because it has to check if it
was already called or not. The time penalty is not desired in performance sensitive
paths even if it is tiny.
Signed-off-by: Seiji Aguchi <seiji.aguchi@hds.com>
Link: http://lkml.kernel.org/r/51C3238D.9040706@hds.com
Signed-off-by: H. Peter Anvin <hpa@linux.intel.com>
Cc: Steven Rostedt <rostedt@goodmis.org>
2013-06-20 22:45:17 +07:00
|
|
|
extern void irq_enter(void);
|
|
|
|
extern void irq_exit(void);
|
|
|
|
|
|
|
|
/*
 * Pre-processing run at the start of an interrupt handler: calls
 * irq_enter() first and then kvm_set_cpu_l1tf_flush_l1d().
 * NOTE(review): the second call presumably flags an L1D flush for the
 * L1TF mitigation on the KVM side - confirm against its definition.
 */
static inline void entering_irq(void)
|
|
|
|
{
|
|
|
|
irq_enter();
|
2018-07-29 18:06:04 +07:00
|
|
|
kvm_set_cpu_l1tf_flush_l1d();
|
x86, trace: Introduce entering/exiting_irq()
When implementing tracepoints in interrupt handers, if the tracepoints are
simply added in the performance sensitive path of interrupt handers,
it may cause potential performance problem due to the time penalty.
To solve the problem, an idea is to prepare non-trace/trace irq handers and
switch their IDTs at the enabling/disabling time.
So, let's introduce entering_irq()/exiting_irq() for pre/post-
processing of each irq handler.
A way to use them is as follows.
Non-trace irq handler:
smp_irq_handler()
{
entering_irq(); /* pre-processing of this handler */
__smp_irq_handler(); /*
* common logic between non-trace and trace handlers
* in a vector.
*/
exiting_irq(); /* post-processing of this handler */
}
Trace irq_handler:
smp_trace_irq_handler()
{
entering_irq(); /* pre-processing of this handler */
trace_irq_entry(); /* tracepoint for irq entry */
__smp_irq_handler(); /*
* common logic between non-trace and trace handlers
* in a vector.
*/
trace_irq_exit(); /* tracepoint for irq exit */
exiting_irq(); /* post-processing of this handler */
}
If tracepoints can place outside entering_irq()/exiting_irq() as follows,
it looks cleaner.
smp_trace_irq_handler()
{
trace_irq_entry();
smp_irq_handler();
trace_irq_exit();
}
But it doesn't work.
The problem is with irq_enter/exit() being called. They must be called before
trace_irq_enter/exit(), because of the rcu_irq_enter() must be called before
any tracepoints are used, as tracepoints use rcu to synchronize.
As a possible alternative, we may be able to call irq_enter() first as follows
if irq_enter() can nest.
smp_trace_irq_hander()
{
irq_entry();
trace_irq_entry();
smp_irq_handler();
trace_irq_exit();
irq_exit();
}
But it doesn't work, either.
If irq_enter() is nested, it may have a time penalty because it has to check if it
was already called or not. The time penalty is not desired in performance sensitive
paths even if it is tiny.
Signed-off-by: Seiji Aguchi <seiji.aguchi@hds.com>
Link: http://lkml.kernel.org/r/51C3238D.9040706@hds.com
Signed-off-by: H. Peter Anvin <hpa@linux.intel.com>
Cc: Steven Rostedt <rostedt@goodmis.org>
2013-06-20 22:45:17 +07:00
|
|
|
}
|
|
|
|
|
|
|
|
/*
 * Handler pre-processing plus acknowledge: runs entering_irq() and then
 * calls ack_APIC_irq(), so the acknowledge is issued only after the
 * entry bookkeeping done by entering_irq() has completed.
 */
static inline void entering_ack_irq(void)
|
|
|
|
{
|
|
|
|
entering_irq();
|
2016-03-15 08:20:54 +07:00
|
|
|
ack_APIC_irq();
|
x86, trace: Introduce entering/exiting_irq()
When implementing tracepoints in interrupt handers, if the tracepoints are
simply added in the performance sensitive path of interrupt handers,
it may cause potential performance problem due to the time penalty.
To solve the problem, an idea is to prepare non-trace/trace irq handers and
switch their IDTs at the enabling/disabling time.
So, let's introduce entering_irq()/exiting_irq() for pre/post-
processing of each irq handler.
A way to use them is as follows.
Non-trace irq handler:
smp_irq_handler()
{
entering_irq(); /* pre-processing of this handler */
__smp_irq_handler(); /*
* common logic between non-trace and trace handlers
* in a vector.
*/
exiting_irq(); /* post-processing of this handler */
}
Trace irq_handler:
smp_trace_irq_handler()
{
entering_irq(); /* pre-processing of this handler */
trace_irq_entry(); /* tracepoint for irq entry */
__smp_irq_handler(); /*
* common logic between non-trace and trace handlers
* in a vector.
*/
trace_irq_exit(); /* tracepoint for irq exit */
exiting_irq(); /* post-processing of this handler */
}
If tracepoints can place outside entering_irq()/exiting_irq() as follows,
it looks cleaner.
smp_trace_irq_handler()
{
trace_irq_entry();
smp_irq_handler();
trace_irq_exit();
}
But it doesn't work.
The problem is with irq_enter/exit() being called. They must be called before
trace_irq_enter/exit(), because of the rcu_irq_enter() must be called before
any tracepoints are used, as tracepoints use rcu to synchronize.
As a possible alternative, we may be able to call irq_enter() first as follows
if irq_enter() can nest.
smp_trace_irq_hander()
{
irq_entry();
trace_irq_entry();
smp_irq_handler();
trace_irq_exit();
irq_exit();
}
But it doesn't work, either.
If irq_enter() is nested, it may have a time penalty because it has to check if it
was already called or not. The time penalty is not desired in performance sensitive
paths even if it is tiny.
Signed-off-by: Seiji Aguchi <seiji.aguchi@hds.com>
Link: http://lkml.kernel.org/r/51C3238D.9040706@hds.com
Signed-off-by: H. Peter Anvin <hpa@linux.intel.com>
Cc: Steven Rostedt <rostedt@goodmis.org>
2013-06-20 22:45:17 +07:00
|
|
|
}
|
|
|
|
|
2015-05-15 20:50:45 +07:00
|
|
|
/*
 * Entry sequence that calls, in order, irq_enter(), ack_APIC_irq() and
 * kvm_set_cpu_l1tf_flush_l1d(). Unlike entering_ack_irq(), which goes
 * through entering_irq(), the acknowledge here is issued before the
 * kvm_set_cpu_l1tf_flush_l1d() call.
 * NOTE(review): judging by the name this is meant for IPI handlers -
 * confirm against the callers.
 */
static inline void ipi_entering_ack_irq(void)
|
|
|
|
{
|
|
|
|
irq_enter();
|
2016-09-18 18:34:51 +07:00
|
|
|
ack_APIC_irq();
|
2018-07-29 18:06:04 +07:00
|
|
|
kvm_set_cpu_l1tf_flush_l1d();
|
2015-05-15 20:50:45 +07:00
|
|
|
}
|
|
|
|
|
x86, trace: Introduce entering/exiting_irq()
When implementing tracepoints in interrupt handlers, if the tracepoints are
simply added in the performance sensitive path of interrupt handlers,
it may cause a potential performance problem due to the time penalty.
To solve the problem, an idea is to prepare non-trace/trace irq handlers and
switch their IDTs at the enabling/disabling time.
So, let's introduce entering_irq()/exiting_irq() for pre/post-
processing of each irq handler.
A way to use them is as follows.
Non-trace irq handler:
smp_irq_handler()
{
entering_irq(); /* pre-processing of this handler */
__smp_irq_handler(); /*
* common logic between non-trace and trace handlers
* in a vector.
*/
exiting_irq(); /* post-processing of this handler */
}
Trace irq_handler:
smp_trace_irq_handler()
{
entering_irq(); /* pre-processing of this handler */
trace_irq_entry(); /* tracepoint for irq entry */
__smp_irq_handler(); /*
* common logic between non-trace and trace handlers
* in a vector.
*/
trace_irq_exit(); /* tracepoint for irq exit */
exiting_irq(); /* post-processing of this handler */
}
If the tracepoints could be placed outside entering_irq()/exiting_irq() as follows,
it would look cleaner.
smp_trace_irq_handler()
{
trace_irq_entry();
smp_irq_handler();
trace_irq_exit();
}
But it doesn't work.
The problem is with irq_enter/exit() being called. They must be called before
trace_irq_entry/exit(), because rcu_irq_enter() must be called before
any tracepoints are used, as tracepoints use RCU to synchronize.
As a possible alternative, we may be able to call irq_enter() first as follows
if irq_enter() can nest.
smp_trace_irq_handler()
{
irq_enter();
trace_irq_entry();
smp_irq_handler();
trace_irq_exit();
irq_exit();
}
But it doesn't work, either.
If irq_enter() is nested, it may have a time penalty because it has to check if it
was already called or not. The time penalty is not desired in performance sensitive
paths even if it is tiny.
Signed-off-by: Seiji Aguchi <seiji.aguchi@hds.com>
Link: http://lkml.kernel.org/r/51C3238D.9040706@hds.com
Signed-off-by: H. Peter Anvin <hpa@linux.intel.com>
Cc: Steven Rostedt <rostedt@goodmis.org>
2013-06-20 22:45:17 +07:00
|
|
|
/*
 * Post-processing run at the end of an interrupt handler; the
 * counterpart of entering_irq(). It only calls irq_exit().
 */
static inline void exiting_irq(void)
|
|
|
|
{
|
|
|
|
irq_exit();
|
|
|
|
}
|
|
|
|
|
|
|
|
/*
 * Exit sequence with acknowledge: calls ack_APIC_irq() first and only
 * then irq_exit(), so the acknowledge is issued before the exit
 * processing runs.
 */
static inline void exiting_ack_irq(void)
|
|
|
|
{
|
|
|
|
ack_APIC_irq();
|
2016-09-18 18:34:51 +07:00
|
|
|
irq_exit();
|
x86, trace: Introduce entering/exiting_irq()
When implementing tracepoints in interrupt handers, if the tracepoints are
simply added in the performance sensitive path of interrupt handers,
it may cause potential performance problem due to the time penalty.
To solve the problem, an idea is to prepare non-trace/trace irq handers and
switch their IDTs at the enabling/disabling time.
So, let's introduce entering_irq()/exiting_irq() for pre/post-
processing of each irq handler.
A way to use them is as follows.
Non-trace irq handler:
smp_irq_handler()
{
entering_irq(); /* pre-processing of this handler */
__smp_irq_handler(); /*
* common logic between non-trace and trace handlers
* in a vector.
*/
exiting_irq(); /* post-processing of this handler */
}
Trace irq_handler:
smp_trace_irq_handler()
{
entering_irq(); /* pre-processing of this handler */
trace_irq_entry(); /* tracepoint for irq entry */
__smp_irq_handler(); /*
* common logic between non-trace and trace handlers
* in a vector.
*/
trace_irq_exit(); /* tracepoint for irq exit */
exiting_irq(); /* post-processing of this handler */
}
If tracepoints can place outside entering_irq()/exiting_irq() as follows,
it looks cleaner.
smp_trace_irq_handler()
{
trace_irq_entry();
smp_irq_handler();
trace_irq_exit();
}
But it doesn't work.
The problem is with irq_enter/exit() being called. They must be called before
trace_irq_enter/exit(), because of the rcu_irq_enter() must be called before
any tracepoints are used, as tracepoints use rcu to synchronize.
As a possible alternative, we may be able to call irq_enter() first as follows
if irq_enter() can nest.
smp_trace_irq_hander()
{
irq_entry();
trace_irq_entry();
smp_irq_handler();
trace_irq_exit();
irq_exit();
}
But it doesn't work, either.
If irq_enter() is nested, it may have a time penalty because it has to check if it
was already called or not. The time penalty is not desired in performance sensitive
paths even if it is tiny.
Signed-off-by: Seiji Aguchi <seiji.aguchi@hds.com>
Link: http://lkml.kernel.org/r/51C3238D.9040706@hds.com
Signed-off-by: H. Peter Anvin <hpa@linux.intel.com>
Cc: Steven Rostedt <rostedt@goodmis.org>
2013-06-20 22:45:17 +07:00
|
|
|
}
|
2009-02-17 19:52:29 +07:00
|
|
|
|
2013-08-20 14:01:07 +07:00
|
|
|
extern void ioapic_zap_locks(void);
|
|
|
|
|
2008-10-23 12:26:29 +07:00
|
|
|
#endif /* _ASM_X86_APIC_H */
|