mirror of
https://github.com/AuxXxilium/linux_dsm_epyc7002.git
synced 2024-12-28 11:18:45 +07:00
25d8d4eeca
- Add support for (optionally) using queued spinlocks & rwlocks. - Support for a new faster system call ABI using the scv instruction on Power9 or later. - Drop support for the PROT_SAO mmap/mprotect flag as it will be unsupported on Power10 and future processors, leaving us with no way to implement the functionality it requests. This risks breaking userspace, though we believe it is unused in practice. - A bug fix for, and then the removal of, our custom stack expansion checking. We now allow stack expansion up to the rlimit, like other architectures. - Remove the remnants of our (previously disabled) topology update code, which tried to react to NUMA layout changes on virtualised systems, but was prone to crashes and other problems. - Add PMU support for Power10 CPUs. - A change to our signal trampoline so that we don't unbalance the link stack (branch return predictor) in the signal delivery path. - Lots of other cleanups, refactorings, smaller features and so on as usual. Thanks to: Abhishek Goel, Alastair D'Silva, Alexander A. Klimov, Alexey Kardashevskiy, Alistair Popple, Andrew Donnellan, Aneesh Kumar K.V, Anju T Sudhakar, Anton Blanchard, Arnd Bergmann, Athira Rajeev, Balamuruhan S, Bharata B Rao, Bill Wendling, Bin Meng, Cédric Le Goater, Chris Packham, Christophe Leroy, Christoph Hellwig, Daniel Axtens, Dan Williams, David Lamparter, Desnes A. Nunes do Rosario, Erhard F., Finn Thain, Frederic Barrat, Ganesh Goudar, Gautham R. Shenoy, Geoff Levand, Greg Kurz, Gustavo A. R. Silva, Hari Bathini, Harish, Imre Kaloz, Joel Stanley, Joe Perches, John Crispin, Jordan Niethe, Kajol Jain, Kamalesh Babulal, Kees Cook, Laurent Dufour, Leonardo Bras, Li RongQing, Madhavan Srinivasan, Mahesh Salgaonkar, Mark Cave-Ayland, Michal Suchanek, Milton Miller, Mimi Zohar, Murilo Opsfelder Araujo, Nathan Chancellor, Nathan Lynch, Naveen N. 
Rao, Nayna Jain, Nicholas Piggin, Oliver O'Halloran, Palmer Dabbelt, Pedro Miraglia Franco de Carvalho, Philippe Bergheaud, Pingfan Liu, Pratik Rajesh Sampat, Qian Cai, Qinglang Miao, Randy Dunlap, Ravi Bangoria, Sachin Sant, Sam Bobroff, Sandipan Das, Santosh Sivaraj, Satheesh Rajendran, Shirisha Ganta, Sourabh Jain, Srikar Dronamraju, Stan Johnson, Stephen Rothwell, Thadeu Lima de Souza Cascardo, Thiago Jung Bauermann, Tom Lane, Vaibhav Jain, Vladis Dronov, Wei Yongjun, Wen Xiong, YueHaibing. -----BEGIN PGP SIGNATURE----- iQJHBAABCAAxFiEEJFGtCPCthwEv2Y/bUevqPMjhpYAFAl8tOxATHG1wZUBlbGxl cm1hbi5pZC5hdQAKCRBR6+o8yOGlgDQfEAClXHWf6hnxB84bEu39D51NkVotL1IG BRWFvyix+xHuUkHIouBPAAMl6ngY5X6wkYd+Z+CY9zHNtdSDoVlJE30YXdMQA/dE L/rYxR1884yGR/uU/3wusboO68ReXwcKQPmKOymUfh0zH7ujyJsSWLpXFK1YDC5d 2TVVTi0Q+P5ucMHDh0L+AHirIxZvtZSp43+J7xLtywsj+XAxJWCTGo5WCJbdgbCA Qbv3aOkVyUa3EgsbdM/STPpv82ebqT+PHxeSIO4Jw6ZODtKRH0R5YsWCApuY9eZ+ ebY9RLmgv9ZAhJqB2fv9A5NDcMoGpZNmjM7HrWpXwULKQpkBGHCzJ9FcSdHVMOx8 nbVMFjt4uzLwV1w8lFYslQ2tNH/uH2o9BlryV1RLpiiKokDAJO/NOsWN9y0u/I4J EmAM5DSX2LgVvvas96IlGK8KX4xkOkf8FLX/H5UDvvAfloH8J4CZXk/CWCab/nqY KEHPnMmYvQZ1w9SzyZg9sO/1p6Bl1Gmm75Jv2F1lBiRW/42VcGBI/qLsJ4lC59Fc KbwufYNYYG38wbxDLW1HAPJhRonxIcaZj3EEqk7aTiLZ55nNbu8e2k32CpNXTGqt npOhzJHimcq7L6+878ZW+xpbZwogIEUdRSsmwb6aT8za3ShnYwSA2Q3LYxh9xyGH j3GifvPq6Efp3Q== =QMY1 -----END PGP SIGNATURE----- Merge tag 'powerpc-5.9-1' of git://git.kernel.org/pub/scm/linux/kernel/git/powerpc/linux Pull powerpc updates from Michael Ellerman: - Add support for (optionally) using queued spinlocks & rwlocks. - Support for a new faster system call ABI using the scv instruction on Power9 or later. - Drop support for the PROT_SAO mmap/mprotect flag as it will be unsupported on Power10 and future processors, leaving us with no way to implement the functionality it requests. This risks breaking userspace, though we believe it is unused in practice. - A bug fix for, and then the removal of, our custom stack expansion checking. 
We now allow stack expansion up to the rlimit, like other architectures. - Remove the remnants of our (previously disabled) topology update code, which tried to react to NUMA layout changes on virtualised systems, but was prone to crashes and other problems. - Add PMU support for Power10 CPUs. - A change to our signal trampoline so that we don't unbalance the link stack (branch return predictor) in the signal delivery path. - Lots of other cleanups, refactorings, smaller features and so on as usual. Thanks to: Abhishek Goel, Alastair D'Silva, Alexander A. Klimov, Alexey Kardashevskiy, Alistair Popple, Andrew Donnellan, Aneesh Kumar K.V, Anju T Sudhakar, Anton Blanchard, Arnd Bergmann, Athira Rajeev, Balamuruhan S, Bharata B Rao, Bill Wendling, Bin Meng, Cédric Le Goater, Chris Packham, Christophe Leroy, Christoph Hellwig, Daniel Axtens, Dan Williams, David Lamparter, Desnes A. Nunes do Rosario, Erhard F., Finn Thain, Frederic Barrat, Ganesh Goudar, Gautham R. Shenoy, Geoff Levand, Greg Kurz, Gustavo A. R. Silva, Hari Bathini, Harish, Imre Kaloz, Joel Stanley, Joe Perches, John Crispin, Jordan Niethe, Kajol Jain, Kamalesh Babulal, Kees Cook, Laurent Dufour, Leonardo Bras, Li RongQing, Madhavan Srinivasan, Mahesh Salgaonkar, Mark Cave-Ayland, Michal Suchanek, Milton Miller, Mimi Zohar, Murilo Opsfelder Araujo, Nathan Chancellor, Nathan Lynch, Naveen N. Rao, Nayna Jain, Nicholas Piggin, Oliver O'Halloran, Palmer Dabbelt, Pedro Miraglia Franco de Carvalho, Philippe Bergheaud, Pingfan Liu, Pratik Rajesh Sampat, Qian Cai, Qinglang Miao, Randy Dunlap, Ravi Bangoria, Sachin Sant, Sam Bobroff, Sandipan Das, Santosh Sivaraj, Satheesh Rajendran, Shirisha Ganta, Sourabh Jain, Srikar Dronamraju, Stan Johnson, Stephen Rothwell, Thadeu Lima de Souza Cascardo, Thiago Jung Bauermann, Tom Lane, Vaibhav Jain, Vladis Dronov, Wei Yongjun, Wen Xiong, YueHaibing. 
* tag 'powerpc-5.9-1' of git://git.kernel.org/pub/scm/linux/kernel/git/powerpc/linux: (337 commits) selftests/powerpc: Fix pkey syscall redefinitions powerpc: Fix circular dependency between percpu.h and mmu.h powerpc/powernv/sriov: Fix use of uninitialised variable selftests/powerpc: Skip vmx/vsx/tar/etc tests on older CPUs powerpc/40x: Fix assembler warning about r0 powerpc/papr_scm: Add support for fetching nvdimm 'fuel-gauge' metric powerpc/papr_scm: Fetch nvdimm performance stats from PHYP cpuidle: pseries: Fixup exit latency for CEDE(0) cpuidle: pseries: Add function to parse extended CEDE records cpuidle: pseries: Set the latency-hint before entering CEDE selftests/powerpc: Fix online CPU selection powerpc/perf: Consolidate perf_callchain_user_[64|32]() powerpc/pseries/hotplug-cpu: Remove double free in error path powerpc/pseries/mobility: Add pr_debug() for device tree changes powerpc/pseries/mobility: Set pr_fmt() powerpc/cacheinfo: Warn if cache object chain becomes unordered powerpc/cacheinfo: Improve diagnostics about malformed cache lists powerpc/cacheinfo: Use name@unit instead of full DT path in debug messages powerpc/cacheinfo: Set pr_fmt() powerpc: fix function annotations to avoid section mismatch warnings with gcc-10 ...
296 lines
8.6 KiB
C
296 lines
8.6 KiB
C
/* SPDX-License-Identifier: GPL-2.0-or-later */
|
|
/*
 * This control block defines the PACA, which holds the processor
 * specific data for each logical processor on the system.
 * There are some pointers defined that are utilized by PLIC.
 *
 * C 2001 PPC 64 Team, IBM Corp
 */
|
|
#ifndef _ASM_POWERPC_PACA_H
|
|
#define _ASM_POWERPC_PACA_H
|
|
#ifdef __KERNEL__
|
|
|
|
#ifdef CONFIG_PPC64
|
|
|
|
#include <linux/string.h>
|
|
#include <asm/types.h>
|
|
#include <asm/lppaca.h>
|
|
#include <asm/mmu.h>
|
|
#include <asm/page.h>
|
|
#ifdef CONFIG_PPC_BOOK3E
|
|
#include <asm/exception-64e.h>
|
|
#else
|
|
#include <asm/exception-64s.h>
|
|
#endif
|
|
#ifdef CONFIG_KVM_BOOK3S_64_HANDLER
|
|
#include <asm/kvm_book3s_asm.h>
|
|
#endif
|
|
#include <asm/accounting.h>
|
|
#include <asm/hmi.h>
|
|
#include <asm/cpuidle.h>
|
|
#include <asm/atomic.h>
|
|
|
|
#include <asm-generic/mmiowb_types.h>
|
|
|
|
/*
 * local_paca is declared as a register variable tied to r13 through the
 * asm("r13") specifier.  The get_paca() macros in this header expand to it.
 */
register struct paca_struct *local_paca asm("r13");
|
|
|
|
/*
 * get_paca() - evaluate to the local_paca pointer.
 *
 * Two variants are provided; which one is used depends on
 * CONFIG_DEBUG_PREEMPT and CONFIG_SMP both being defined.
 */
#if defined(CONFIG_DEBUG_PREEMPT) && defined(CONFIG_SMP)
extern unsigned int debug_smp_processor_id(void); /* from linux/smp.h */
/*
 * Add standard checks that preemption cannot occur when using get_paca():
 * otherwise the paca_struct it points to may be the wrong one just after.
 *
 * The comma expression calls debug_smp_processor_id(), discards its
 * return value, and then evaluates to local_paca.
 */
#define get_paca()	((void) debug_smp_processor_id(), local_paca)
#else
/* No debug check in this configuration: plain access to local_paca. */
#define get_paca()	local_paca
#endif
|
|
|
|
#ifdef CONFIG_PPC_PSERIES
|
|
/*
 * Expands to the lppaca_ptr field of the PACA returned by get_paca().
 * Only defined when CONFIG_PPC_PSERIES is set, matching the guard around
 * the lppaca_ptr field in struct paca_struct.
 */
#define get_lppaca() (get_paca()->lppaca_ptr)
|
|
#endif
|
|
|
|
/*
 * Expands to the slb_shadow_ptr field of the PACA returned by get_paca().
 *
 * NOTE(review): this macro is defined unconditionally, but slb_shadow_ptr
 * is only a member of struct paca_struct under CONFIG_PPC_BOOK3S_64, so any
 * use in another configuration would not compile.
 */
#define get_slb_shadow() (get_paca()->slb_shadow_ptr)
|
|
|
|
struct task_struct;
|
|
struct rtas_args;
|
|
|
|
/*
|
|
* Defines the layout of the paca.
|
|
*
|
|
* This structure is not directly accessed by firmware or the service
|
|
* processor.
|
|
*/
|
|
struct paca_struct {
|
|
#ifdef CONFIG_PPC_PSERIES
|
|
/*
|
|
* Because hw_cpu_id, unlike other paca fields, is accessed
|
|
* routinely from other CPUs (from the IRQ code), we stick to
|
|
* read-only (after boot) fields in the first cacheline to
|
|
* avoid cacheline bouncing.
|
|
*/
|
|
|
|
struct lppaca *lppaca_ptr; /* Pointer to LpPaca for PLIC */
|
|
#endif /* CONFIG_PPC_PSERIES */
|
|
|
|
/*
|
|
* MAGIC: the spinlock functions in arch/powerpc/lib/locks.c
|
|
* load lock_token and paca_index with a single lwz
|
|
* instruction. They must travel together and be properly
|
|
* aligned.
|
|
*/
|
|
#ifdef __BIG_ENDIAN__
|
|
u16 lock_token; /* Constant 0x8000, used in locks */
|
|
u16 paca_index; /* Logical processor number */
|
|
#else
|
|
u16 paca_index; /* Logical processor number */
|
|
u16 lock_token; /* Constant 0x8000, used in locks */
|
|
#endif
|
|
|
|
u64 kernel_toc; /* Kernel TOC address */
|
|
u64 kernelbase; /* Base address of kernel */
|
|
u64 kernel_msr; /* MSR while running in kernel */
|
|
void *emergency_sp; /* pointer to emergency stack */
|
|
u64 data_offset; /* per cpu data offset */
|
|
s16 hw_cpu_id; /* Physical processor number */
|
|
u8 cpu_start; /* At startup, processor spins until */
|
|
/* this becomes non-zero. */
|
|
u8 kexec_state; /* set when kexec down has irqs off */
|
|
#ifdef CONFIG_PPC_BOOK3S_64
|
|
struct slb_shadow *slb_shadow_ptr;
|
|
struct dtl_entry *dispatch_log;
|
|
struct dtl_entry *dispatch_log_end;
|
|
#endif
|
|
u64 dscr_default; /* per-CPU default DSCR */
|
|
|
|
#ifdef CONFIG_PPC_BOOK3S_64
|
|
/*
|
|
* Now, starting in cacheline 2, the exception save areas
|
|
*/
|
|
/* used for most interrupts/exceptions */
|
|
u64 exgen[EX_SIZE] __attribute__((aligned(0x80)));
|
|
u64 exslb[EX_SIZE]; /* used for SLB/segment table misses
|
|
* on the linear mapping */
|
|
/* SLB related definitions */
|
|
u16 vmalloc_sllp;
|
|
u8 slb_cache_ptr;
|
|
u8 stab_rr; /* stab/slb round-robin counter */
|
|
#ifdef CONFIG_DEBUG_VM
|
|
u8 in_kernel_slb_handler;
|
|
#endif
|
|
u32 slb_used_bitmap; /* Bitmaps for first 32 SLB entries. */
|
|
u32 slb_kern_bitmap;
|
|
u32 slb_cache[SLB_CACHE_ENTRIES];
|
|
#endif /* CONFIG_PPC_BOOK3S_64 */
|
|
|
|
#ifdef CONFIG_PPC_BOOK3E
|
|
u64 exgen[8] __aligned(0x40);
|
|
/* Keep pgd in the same cacheline as the start of extlb */
|
|
pgd_t *pgd __aligned(0x40); /* Current PGD */
|
|
pgd_t *kernel_pgd; /* Kernel PGD */
|
|
|
|
/* Shared by all threads of a core -- points to tcd of first thread */
|
|
struct tlb_core_data *tcd_ptr;
|
|
|
|
/*
|
|
* We can have up to 3 levels of reentrancy in the TLB miss handler,
|
|
* in each of four exception levels (normal, crit, mcheck, debug).
|
|
*/
|
|
u64 extlb[12][EX_TLB_SIZE / sizeof(u64)];
|
|
u64 exmc[8]; /* used for machine checks */
|
|
u64 excrit[8]; /* used for crit interrupts */
|
|
u64 exdbg[8]; /* used for debug interrupts */
|
|
|
|
/* Kernel stack pointers for use by special exceptions */
|
|
void *mc_kstack;
|
|
void *crit_kstack;
|
|
void *dbg_kstack;
|
|
|
|
struct tlb_core_data tcd;
|
|
#endif /* CONFIG_PPC_BOOK3E */
|
|
|
|
#ifdef CONFIG_PPC_BOOK3S
|
|
mm_context_id_t mm_ctx_id;
|
|
#ifdef CONFIG_PPC_MM_SLICES
|
|
unsigned char mm_ctx_low_slices_psize[BITS_PER_LONG / BITS_PER_BYTE];
|
|
unsigned char mm_ctx_high_slices_psize[SLICE_ARRAY_SIZE];
|
|
unsigned long mm_ctx_slb_addr_limit;
|
|
#else
|
|
u16 mm_ctx_user_psize;
|
|
u16 mm_ctx_sllp;
|
|
#endif
|
|
#endif
|
|
|
|
/*
|
|
* then miscellaneous read-write fields
|
|
*/
|
|
struct task_struct *__current; /* Pointer to current */
|
|
u64 kstack; /* Saved Kernel stack addr */
|
|
u64 saved_r1; /* r1 save for RTAS calls or PM or EE=0 */
|
|
u64 saved_msr; /* MSR saved here by enter_rtas */
|
|
#ifdef CONFIG_PPC_BOOK3E
|
|
u16 trap_save; /* Used when bad stack is encountered */
|
|
#endif
|
|
u8 irq_soft_mask; /* mask for irq soft masking */
|
|
u8 irq_happened; /* irq happened while soft-disabled */
|
|
u8 irq_work_pending; /* IRQ_WORK interrupt while soft-disable */
|
|
#ifdef CONFIG_KVM_BOOK3S_HV_POSSIBLE
|
|
u8 pmcregs_in_use; /* pseries puts this in lppaca */
|
|
#endif
|
|
u64 sprg_vdso; /* Saved user-visible sprg */
|
|
#ifdef CONFIG_PPC_TRANSACTIONAL_MEM
|
|
u64 tm_scratch; /* TM scratch area for reclaim */
|
|
#endif
|
|
|
|
#ifdef CONFIG_PPC_POWERNV
|
|
/* PowerNV idle fields */
|
|
/* PNV_CORE_IDLE_* bits, all siblings work on thread 0 paca */
|
|
unsigned long idle_state;
|
|
union {
|
|
/* P7/P8 specific fields */
|
|
struct {
|
|
/* PNV_THREAD_RUNNING/NAP/SLEEP */
|
|
u8 thread_idle_state;
|
|
/* Mask to denote subcore sibling threads */
|
|
u8 subcore_sibling_mask;
|
|
};
|
|
|
|
/* P9 specific fields */
|
|
struct {
|
|
#ifdef CONFIG_KVM_BOOK3S_HV_POSSIBLE
|
|
/* The PSSCR value that the kernel requested before going to stop */
|
|
u64 requested_psscr;
|
|
/* Flag to request this thread not to stop */
|
|
atomic_t dont_stop;
|
|
#endif
|
|
};
|
|
};
|
|
#endif
|
|
|
|
#ifdef CONFIG_PPC_BOOK3S_64
|
|
/* Non-maskable exceptions that are not performance critical */
|
|
u64 exnmi[EX_SIZE]; /* used for system reset (nmi) */
|
|
u64 exmc[EX_SIZE]; /* used for machine checks */
|
|
#endif
|
|
#ifdef CONFIG_PPC_BOOK3S_64
|
|
/* Exclusive stacks for system reset and machine check exception. */
|
|
void *nmi_emergency_sp;
|
|
void *mc_emergency_sp;
|
|
|
|
u16 in_nmi; /* In nmi handler */
|
|
|
|
/*
|
|
* Flag to check whether we are in machine check early handler
|
|
* and already using emergency stack.
|
|
*/
|
|
u16 in_mce;
|
|
u8 hmi_event_available; /* HMI event is available */
|
|
u8 hmi_p9_special_emu; /* HMI P9 special emulation */
|
|
u32 hmi_irqs; /* HMI irq stat */
|
|
#endif
|
|
u8 ftrace_enabled; /* Hard disable ftrace */
|
|
|
|
/* Stuff for accurate time accounting */
|
|
struct cpu_accounting_data accounting;
|
|
u64 dtl_ridx; /* read index in dispatch log */
|
|
struct dtl_entry *dtl_curr; /* pointer corresponding to dtl_ridx */
|
|
|
|
#ifdef CONFIG_KVM_BOOK3S_HANDLER
|
|
#ifdef CONFIG_KVM_BOOK3S_PR_POSSIBLE
|
|
/* We use this to store guest state in */
|
|
struct kvmppc_book3s_shadow_vcpu shadow_vcpu;
|
|
#endif
|
|
struct kvmppc_host_state kvm_hstate;
|
|
#ifdef CONFIG_KVM_BOOK3S_HV_POSSIBLE
|
|
/*
|
|
* Bitmap for sibling subcore status. See kvm/book3s_hv_ras.c for
|
|
* more details
|
|
*/
|
|
struct sibling_subcore_state *sibling_subcore_state;
|
|
#endif
|
|
#endif
|
|
#ifdef CONFIG_PPC_BOOK3S_64
|
|
/*
|
|
* rfi fallback flush must be in its own cacheline to prevent
|
|
* other paca data leaking into the L1d
|
|
*/
|
|
u64 exrfi[EX_SIZE] __aligned(0x80);
|
|
void *rfi_flush_fallback_area;
|
|
u64 l1d_flush_size;
|
|
#endif
|
|
#ifdef CONFIG_PPC_PSERIES
|
|
struct rtas_args *rtas_args_reentrant;
|
|
u8 *mce_data_buf; /* buffer to hold per cpu rtas errlog */
|
|
#endif /* CONFIG_PPC_PSERIES */
|
|
|
|
#ifdef CONFIG_PPC_BOOK3S_64
|
|
/* Capture SLB related old contents in MCE handler. */
|
|
struct slb_entry *mce_faulty_slbs;
|
|
u16 slb_save_cache_ptr;
|
|
#endif /* CONFIG_PPC_BOOK3S_64 */
|
|
#ifdef CONFIG_STACKPROTECTOR
|
|
unsigned long canary;
|
|
#endif
|
|
#ifdef CONFIG_MMIOWB
|
|
struct mmiowb_state mmiowb_state;
|
|
#endif
|
|
} ____cacheline_aligned;
|
|
|
|
/*
 * PACA management interface (CONFIG_PPC64 builds).  Only the declarations
 * live in this header; the definitions are elsewhere.
 */

/*
 * Forward declaration so that the prototype below refers to the file-scope
 * struct mm_struct even when no earlier include has declared the tag;
 * otherwise the tag would be introduced with prototype scope only.
 */
struct mm_struct;

extern void copy_mm_to_paca(struct mm_struct *mm);
/* NOTE(review): presumably one entry per CPU -- confirm against the allocator. */
extern struct paca_struct **paca_ptrs;
extern void initialise_paca(struct paca_struct *new_paca, int cpu);
extern void setup_paca(struct paca_struct *new_paca);
extern void allocate_paca_ptrs(void);
extern void allocate_paca(int cpu);
extern void free_unused_pacas(void);
|
|
|
|
#else /* CONFIG_PPC64 */
|
|
|
|
/*
 * !CONFIG_PPC64 counterparts of the PACA allocation functions: struct
 * paca_struct is not defined in this configuration, so these are empty
 * inline stubs that do nothing.
 */
static inline void allocate_paca_ptrs(void) { }
static inline void allocate_paca(int cpu) { }
static inline void free_unused_pacas(void) { }
|
|
|
|
#endif /* CONFIG_PPC64 */
|
|
|
|
#endif /* __KERNEL__ */
|
|
#endif /* _ASM_POWERPC_PACA_H */
|