mirror of
https://github.com/AuxXxilium/linux_dsm_epyc7002.git
synced 2024-12-12 01:06:48 +07:00
94e2b96ece
Enabling the SUE bit for core can can result in rare cache errors which are difficult to track down, so do not enable it. This can cause a minor performance loss in some tests. Signed-off-by: Jayachandran C <jchandra@broadcom.com> Cc: linux-mips@linux-mips.org Patchwork: https://patchwork.linux-mips.org/patch/8894/ Signed-off-by: Ralf Baechle <ralf@linux-mips.org>
301 lines
7.6 KiB
ArmAsm
301 lines
7.6 KiB
ArmAsm
/*
|
|
* Copyright 2003-2013 Broadcom Corporation.
|
|
* All Rights Reserved.
|
|
*
|
|
* This software is available to you under a choice of one of two
|
|
* licenses. You may choose to be licensed under the terms of the GNU
|
|
* General Public License (GPL) Version 2, available from the file
|
|
* COPYING in the main directory of this source tree, or the Broadcom
|
|
* license below:
|
|
*
|
|
* Redistribution and use in source and binary forms, with or without
|
|
* modification, are permitted provided that the following conditions
|
|
* are met:
|
|
*
|
|
* 1. Redistributions of source code must retain the above copyright
|
|
* notice, this list of conditions and the following disclaimer.
|
|
* 2. Redistributions in binary form must reproduce the above copyright
|
|
* notice, this list of conditions and the following disclaimer in
|
|
* the documentation and/or other materials provided with the
|
|
* distribution.
|
|
*
|
|
* THIS SOFTWARE IS PROVIDED BY BROADCOM ``AS IS'' AND ANY EXPRESS OR
|
|
* IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED
|
|
* WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
|
|
* ARE DISCLAIMED. IN NO EVENT SHALL BROADCOM OR CONTRIBUTORS BE LIABLE
|
|
* FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
|
|
* CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
|
|
* SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR
|
|
* BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY,
|
|
* WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE
|
|
* OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN
|
|
* IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
|
|
*/
|
|
|
|
|
|
#include <asm/asm.h>
|
|
#include <asm/asm-offsets.h>
|
|
#include <asm/cpu.h>
|
|
#include <asm/cacheops.h>
|
|
#include <asm/regdef.h>
|
|
#include <asm/mipsregs.h>
|
|
#include <asm/stackframe.h>
|
|
#include <asm/asmmacro.h>
|
|
#include <asm/addrspace.h>
|
|
|
|
#include <asm/netlogic/common.h>
|
|
|
|
#include <asm/netlogic/xlp-hal/iomap.h>
|
|
#include <asm/netlogic/xlp-hal/xlp.h>
|
|
#include <asm/netlogic/xlp-hal/sys.h>
|
|
#include <asm/netlogic/xlp-hal/cpucontrol.h>
|
|
|
|
#define CP0_EBASE $15
|
|
#define SYS_CPU_COHERENT_BASE CKSEG1ADDR(XLP_DEFAULT_IO_BASE) + \
|
|
XLP_IO_SYS_OFFSET(0) + XLP_IO_PCI_HDRSZ + \
|
|
SYS_CPU_NONCOHERENT_MODE * 4
|
|
|
|
/* Enable XLP features and workarounds in the LSU */
|
|
.macro xlp_config_lsu
|
|
li t0, LSU_DEFEATURE
|
|
mfcr t1, t0
|
|
|
|
lui t2, 0x4080 /* Enable Unaligned Access, L2HPE */
|
|
or t1, t1, t2
|
|
mtcr t1, t0
|
|
|
|
li t0, ICU_DEFEATURE
|
|
mfcr t1, t0
|
|
ori t1, 0x1000 /* Enable Icache partitioning */
|
|
mtcr t1, t0
|
|
|
|
li t0, SCHED_DEFEATURE
|
|
lui t1, 0x0100 /* Disable BRU accepting ALU ops */
|
|
mtcr t1, t0
|
|
.endm
|
|
|
|
/*
|
|
* Allow access to physical mem >64G by enabling ELPA in PAGEGRAIN
|
|
* register. This is needed before going to C code since the SP can
|
|
* in this region. Called from all HW threads.
|
|
*/
|
|
.macro xlp_early_mmu_init
|
|
mfc0 t0, CP0_PAGEMASK, 1
|
|
li t1, (1 << 29) /* ELPA bit */
|
|
or t0, t1
|
|
mtc0 t0, CP0_PAGEMASK, 1
|
|
.endm
|
|
|
|
/*
|
|
* L1D cache has to be flushed before enabling threads in XLP.
|
|
* On XLP8xx/XLP3xx, we do a low level flush using processor control
|
|
* registers. On XLPII CPUs, usual cache instructions work.
|
|
*/
|
|
.macro xlp_flush_l1_dcache
|
|
mfc0 t0, CP0_EBASE, 0
|
|
andi t0, t0, PRID_IMP_MASK
|
|
slt t1, t0, 0x1200
|
|
beqz t1, 15f
|
|
nop
|
|
|
|
/* XLP8xx low level cache flush */
|
|
li t0, LSU_DEBUG_DATA0
|
|
li t1, LSU_DEBUG_ADDR
|
|
li t2, 0 /* index */
|
|
li t3, 0x1000 /* loop count */
|
|
11:
|
|
sll v0, t2, 5
|
|
mtcr zero, t0
|
|
ori v1, v0, 0x3 /* way0 | write_enable | write_active */
|
|
mtcr v1, t1
|
|
12:
|
|
mfcr v1, t1
|
|
andi v1, 0x1 /* wait for write_active == 0 */
|
|
bnez v1, 12b
|
|
nop
|
|
mtcr zero, t0
|
|
ori v1, v0, 0x7 /* way1 | write_enable | write_active */
|
|
mtcr v1, t1
|
|
13:
|
|
mfcr v1, t1
|
|
andi v1, 0x1 /* wait for write_active == 0 */
|
|
bnez v1, 13b
|
|
nop
|
|
addi t2, 1
|
|
bne t3, t2, 11b
|
|
nop
|
|
b 17f
|
|
nop
|
|
|
|
/* XLPII CPUs, Invalidate all 64k of L1 D-cache */
|
|
15:
|
|
li t0, 0x80000000
|
|
li t1, 0x80010000
|
|
16: cache Index_Writeback_Inv_D, 0(t0)
|
|
addiu t0, t0, 32
|
|
bne t0, t1, 16b
|
|
nop
|
|
17:
|
|
.endm
|
|
|
|
/*
|
|
* nlm_reset_entry will be copied to the reset entry point for
|
|
* XLR and XLP. The XLP cores start here when they are woken up. This
|
|
* is also the NMI entry point.
|
|
*
|
|
* We use scratch reg 6/7 to save k0/k1 and check for NMI first.
|
|
*
|
|
* The data corresponding to reset/NMI is stored at RESET_DATA_PHYS
|
|
* location, this will have the thread mask (used when core is woken up)
|
|
* and the current NMI handler in case we reached here for an NMI.
|
|
*
|
|
* When a core or thread is newly woken up, it marks itself ready and
|
|
* loops in a 'wait'. When the CPU really needs waking up, we send an NMI
|
|
* IPI to it, with the NMI handler set to prom_boot_secondary_cpus
|
|
*/
|
|
.set noreorder
|
|
.set noat
|
|
.set arch=xlr /* for mfcr/mtcr, XLR is sufficient */
|
|
|
|
FEXPORT(nlm_reset_entry)
|
|
dmtc0 k0, $22, 6
|
|
dmtc0 k1, $22, 7
|
|
mfc0 k0, CP0_STATUS
|
|
li k1, 0x80000
|
|
and k1, k0, k1
|
|
beqz k1, 1f /* go to real reset entry */
|
|
nop
|
|
li k1, CKSEG1ADDR(RESET_DATA_PHYS) /* NMI */
|
|
ld k0, BOOT_NMI_HANDLER(k1)
|
|
jr k0
|
|
nop
|
|
|
|
1: /* Entry point on core wakeup */
|
|
mfc0 t0, CP0_EBASE, 0 /* processor ID */
|
|
andi t0, PRID_IMP_MASK
|
|
li t1, 0x1500 /* XLP 9xx */
|
|
beq t0, t1, 2f /* does not need to set coherent */
|
|
nop
|
|
|
|
li t1, 0x1300 /* XLP 5xx */
|
|
beq t0, t1, 2f /* does not need to set coherent */
|
|
nop
|
|
|
|
/* set bit in SYS coherent register for the core */
|
|
mfc0 t0, CP0_EBASE, 1
|
|
mfc0 t1, CP0_EBASE, 1
|
|
srl t1, 5
|
|
andi t1, 0x3 /* t1 <- node */
|
|
li t2, 0x40000
|
|
mul t3, t2, t1 /* t3 = node * 0x40000 */
|
|
srl t0, t0, 2
|
|
and t0, t0, 0x7 /* t0 <- core */
|
|
li t1, 0x1
|
|
sll t0, t1, t0
|
|
nor t0, t0, zero /* t0 <- ~(1 << core) */
|
|
li t2, SYS_CPU_COHERENT_BASE
|
|
add t2, t2, t3 /* t2 <- SYS offset for node */
|
|
lw t1, 0(t2)
|
|
and t1, t1, t0
|
|
sw t1, 0(t2)
|
|
|
|
/* read back to ensure complete */
|
|
lw t1, 0(t2)
|
|
sync
|
|
|
|
2:
|
|
/* Configure LSU on Non-0 Cores. */
|
|
xlp_config_lsu
|
|
/* FALL THROUGH */
|
|
|
|
/*
|
|
* Wake up sibling threads from the initial thread in a core.
|
|
*/
|
|
EXPORT(nlm_boot_siblings)
|
|
/* core L1D flush before enable threads */
|
|
xlp_flush_l1_dcache
|
|
/* save ra and sp, will be used later (only for boot cpu) */
|
|
dmtc0 ra, $22, 6
|
|
dmtc0 sp, $22, 7
|
|
/* Enable hw threads by writing to MAP_THREADMODE of the core */
|
|
li t0, CKSEG1ADDR(RESET_DATA_PHYS)
|
|
lw t1, BOOT_THREAD_MODE(t0) /* t1 <- thread mode */
|
|
li t0, ((CPU_BLOCKID_MAP << 8) | MAP_THREADMODE)
|
|
mfcr t2, t0
|
|
or t2, t2, t1
|
|
mtcr t2, t0
|
|
|
|
/*
|
|
* The new hardware thread starts at the next instruction
|
|
* For all the cases other than core 0 thread 0, we will
|
|
* jump to the secondary wait function.
|
|
|
|
* NOTE: All GPR contents are lost after the mtcr above!
|
|
*/
|
|
mfc0 v0, CP0_EBASE, 1
|
|
andi v0, 0x3ff /* v0 <- node/core */
|
|
|
|
/*
|
|
* Errata: to avoid potential live lock, setup IFU_BRUB_RESERVE
|
|
* when running 4 threads per core
|
|
*/
|
|
andi v1, v0, 0x3 /* v1 <- thread id */
|
|
bnez v1, 2f
|
|
nop
|
|
|
|
/* thread 0 of each core. */
|
|
li t0, CKSEG1ADDR(RESET_DATA_PHYS)
|
|
lw t1, BOOT_THREAD_MODE(t0) /* t1 <- thread mode */
|
|
subu t1, 0x3 /* 4-thread per core mode? */
|
|
bnez t1, 2f
|
|
nop
|
|
|
|
li t0, IFU_BRUB_RESERVE
|
|
li t1, 0x55
|
|
mtcr t1, t0
|
|
_ehb
|
|
2:
|
|
beqz v0, 4f /* boot cpu (cpuid == 0)? */
|
|
nop
|
|
|
|
/* setup status reg */
|
|
move t1, zero
|
|
#ifdef CONFIG_64BIT
|
|
ori t1, ST0_KX
|
|
#endif
|
|
mtc0 t1, CP0_STATUS
|
|
|
|
xlp_early_mmu_init
|
|
|
|
/* mark CPU ready */
|
|
li t3, CKSEG1ADDR(RESET_DATA_PHYS)
|
|
ADDIU t1, t3, BOOT_CPU_READY
|
|
sll v1, v0, 2
|
|
PTR_ADDU t1, v1
|
|
li t2, 1
|
|
sw t2, 0(t1)
|
|
/* Wait until NMI hits */
|
|
3: wait
|
|
b 3b
|
|
nop
|
|
|
|
/*
|
|
* For the boot CPU, we have to restore ra and sp and return, rest
|
|
* of the registers will be restored by the caller
|
|
*/
|
|
4:
|
|
dmfc0 ra, $22, 6
|
|
dmfc0 sp, $22, 7
|
|
jr ra
|
|
nop
|
|
EXPORT(nlm_reset_entry_end)
|
|
|
|
LEAF(nlm_init_boot_cpu)
|
|
#ifdef CONFIG_CPU_XLP
|
|
xlp_config_lsu
|
|
xlp_early_mmu_init
|
|
#endif
|
|
jr ra
|
|
nop
|
|
END(nlm_init_boot_cpu)
|