mirror of
https://github.com/AuxXxilium/linux_dsm_epyc7002.git
synced 2025-01-22 23:59:26 +07:00
6b4feaea25
It is allowed to enable/disable clocks from interrupts, so common Exynos ARM clock management code for CPUfreq should use 'irqsave' version of spin_lock calls to avoid potential deadlock caused by spin_lock recursion. The same spin_lock is used by gate/mux clocks during enable/disable calls. This deadlock, can be reproduced by enabling CPUfreq (ondemand or userspace) and decoding video with s5p-mfc driver. Relevant stack trace: [ 5928.061534] BUG: spinlock recursion on CPU#0, bash/1252 [ 5928.061609] lock: 0xee80454c, .magic: dead4ead, .owner: bash/1252, .owner_cpu: 0 [ 5928.068586] CPU: 0 PID: 1252 Comm: bash Tainted: G W 4.4.0-rc4-00001-g447a7fd #678 [ 5928.077260] Hardware name: SAMSUNG EXYNOS (Flattened Device Tree) [ 5928.083359] [<c00153dc>] (unwind_backtrace) from [<c00121b4>] (show_stack+0x10/0x14) [ 5928.091072] [<c00121b4>] (show_stack) from [<c0213e28>] (dump_stack+0x68/0xb8) [ 5928.098275] [<c0213e28>] (dump_stack) from [<c005c1ec>] (do_raw_spin_lock+0x184/0x1ac) [ 5928.106177] [<c005c1ec>] (do_raw_spin_lock) from [<c05cfa98>] (_raw_spin_lock_irqsave+0x20/0x28) [ 5928.114943] [<c05cfa98>] (_raw_spin_lock_irqsave) from [<c0468698>] (clk_gate_endisable+0x24/0x98) [ 5928.123882] [<c0468698>] (clk_gate_endisable) from [<c0464d40>] (clk_core_disable+0x60/0x84) [ 5928.132299] [<c0464d40>] (clk_core_disable) from [<c0465e00>] (clk_disable+0x24/0x30) [ 5928.140117] [<c0465e00>] (clk_disable) from [<c03f3b80>] (s5p_mfc_handle_frame+0x254/0x860) [ 5928.148445] [<c03f3b80>] (s5p_mfc_handle_frame) from [<c03f4b34>] (s5p_mfc_irq+0x890/0xa24) [ 5928.156778] [<c03f4b34>] (s5p_mfc_irq) from [<c00627bc>] (handle_irq_event_percpu+0x50/0x14c) [ 5928.165283] [<c00627bc>] (handle_irq_event_percpu) from [<c00628f0>] (handle_irq_event+0x38/0x5c) [ 5928.174143] [<c00628f0>] (handle_irq_event) from [<c0065864>] (handle_fasteoi_irq+0xdc/0x1a4) [ 5928.182645] [<c0065864>] (handle_fasteoi_irq) from [<c0062090>] (generic_handle_irq+0x18/0x28) [ 5928.191236] [<c0062090>] (generic_handle_irq) from [<c00621a4>] (__handle_domain_irq+0x6c/0xdc) [ 5928.199917] [<c00621a4>] (__handle_domain_irq) from [<c0009470>] (gic_handle_irq+0x4c/0x98) [ 5928.208249] [<c0009470>] (gic_handle_irq) from [<c0012c54>] (__irq_svc+0x54/0x90) [ 5928.215709] Exception stack(0xeddb5cb8 to 0xeddb5d00) [ 5928.220745] 5ca0: ee80454c faddfadc [ 5928.228906] 5cc0: 00000000 01000001 ee831ce0 f8114200 ee807c00 01130520 00000403 eddb5d84 [ 5928.237063] 5ce0: ee807c48 2faf0800 ee807c0c eddb5d08 c046b618 c046b634 20000053 ffffffff [ 5928.245225] [<c0012c54>] (__irq_svc) from [<c046b634>] (exynos_cpuclk_notifier_cb+0x170/0x270) [ 5928.253823] [<c046b634>] (exynos_cpuclk_notifier_cb) from [<c003cb58>] (notifier_call_chain+0x44/0x84) [ 5928.263106] [<c003cb58>] (notifier_call_chain) from [<c003ccd4>] (__srcu_notifier_call_chain+0x6c/0x9c) [ 5928.272480] [<c003ccd4>] (__srcu_notifier_call_chain) from [<c003cd1c>] (srcu_notifier_call_chain+0x18/0x20) [ 5928.282288] [<c003cd1c>] (srcu_notifier_call_chain) from [<c0464ed0>] (__clk_notify+0x6c/0x74) [ 5928.290881] [<c0464ed0>] (__clk_notify) from [<c0465388>] (clk_propagate_rate_change+0xa0/0xac) [ 5928.299561] [<c0465388>] (clk_propagate_rate_change) from [<c0465378>] (clk_propagate_rate_change+0x90/0xac) [ 5928.309370] [<c0465378>] (clk_propagate_rate_change) from [<c04666fc>] (clk_core_set_rate_nolock+0x64/0xa8) [ 5928.319091] [<c04666fc>] (clk_core_set_rate_nolock) from [<c0466760>] (clk_set_rate+0x20/0x30) [ 5928.327686] [<c0466760>] (clk_set_rate) from [<c0428c70>] (set_target+0xe8/0x23c) [ 5928.335152] [<c0428c70>] (set_target) from [<c04244d0>] (__cpufreq_driver_target+0x184/0x29c) [ 5928.343655] [<c04244d0>] (__cpufreq_driver_target) from [<c0427128>] (cpufreq_set+0x44/0x64) [ 5928.352074] [<c0427128>] (cpufreq_set) from [<c0423948>] (store_scaling_setspeed+0x5c/0x74) [ 5928.360407] [<c0423948>] (store_scaling_setspeed) from [<c04238d0>] (store+0x7c/0x98) [ 5928.368221] [<c04238d0>] (store) from [<c0132540>] (sysfs_kf_write+0x44/0x48) [ 5928.375338] [<c0132540>] (sysfs_kf_write) from [<c0131b9c>] (kernfs_fop_write+0xb8/0x1bc) [ 5928.383496] [<c0131b9c>] (kernfs_fop_write) from [<c00d71f8>] (__vfs_write+0x2c/0xd4) [ 5928.391308] [<c00d71f8>] (__vfs_write) from [<c00d7de8>] (vfs_write+0xa0/0x144) [ 5928.398598] [<c00d7de8>] (vfs_write) from [<c00d8048>] (SyS_write+0x44/0x84) [ 5928.405631] [<c00d8048>] (SyS_write) from [<c000f540>] (ret_fast_syscall+0x0/0x3c) CC: stable@vger.kernel.org # v4.2+ Signed-off-by: Marek Szyprowski <m.szyprowski@samsung.com> Signed-off-by: Sylwester Nawrocki <s.nawrocki@samsung.com>
355 lines
11 KiB
C
355 lines
11 KiB
C
/*
|
|
* Copyright (c) 2014 Samsung Electronics Co., Ltd.
|
|
* Author: Thomas Abraham <thomas.ab@samsung.com>
|
|
*
|
|
* Copyright (c) 2015 Samsung Electronics Co., Ltd.
|
|
* Bartlomiej Zolnierkiewicz <b.zolnierkie@samsung.com>
|
|
*
|
|
* This program is free software; you can redistribute it and/or modify
|
|
* it under the terms of the GNU General Public License version 2 as
|
|
* published by the Free Software Foundation.
|
|
*
|
|
* This file contains the utility function to register CPU clock for Samsung
|
|
* Exynos platforms. A CPU clock is defined as a clock supplied to a CPU or a
|
|
* group of CPUs. The CPU clock is typically derived from a hierarchy of clock
|
|
* blocks which includes mux and divider blocks. There are a number of other
|
|
* auxiliary clocks supplied to the CPU domain such as the debug blocks and AXI
|
|
* clock for CPU domain. The rates of these auxiliary clocks are related to the
|
|
* CPU clock rate and this relation is usually specified in the hardware manual
|
|
* of the SoC or supplied after the SoC characterization.
|
|
*
|
|
* The below implementation of the CPU clock allows the rate changes of the CPU
|
|
* clock and the corresponding rate changes of the auxillary clocks of the CPU
|
|
* domain. The platform clock driver provides a clock register configuration
|
|
* for each configurable rate which is then used to program the clock hardware
|
|
* registers to acheive a fast co-oridinated rate change for all the CPU domain
|
|
* clocks.
|
|
*
|
|
* On a rate change request for the CPU clock, the rate change is propagated
|
|
* upto the PLL supplying the clock to the CPU domain clock blocks. While the
|
|
* CPU domain PLL is reconfigured, the CPU domain clocks are driven using an
|
|
* alternate clock source. If required, the alternate clock source is divided
|
|
* down in order to keep the output clock rate within the previous OPP limits.
|
|
*/
|
|
|
|
#include <linux/errno.h>
|
|
#include <linux/slab.h>
|
|
#include <linux/clk.h>
|
|
#include <linux/clk-provider.h>
|
|
#include "clk-cpu.h"
|
|
|
|
#define E4210_SRC_CPU 0x0
|
|
#define E4210_STAT_CPU 0x200
|
|
#define E4210_DIV_CPU0 0x300
|
|
#define E4210_DIV_CPU1 0x304
|
|
#define E4210_DIV_STAT_CPU0 0x400
|
|
#define E4210_DIV_STAT_CPU1 0x404
|
|
|
|
#define E4210_DIV0_RATIO0_MASK 0x7
|
|
#define E4210_DIV1_HPM_MASK (0x7 << 4)
|
|
#define E4210_DIV1_COPY_MASK (0x7 << 0)
|
|
#define E4210_MUX_HPM_MASK (1 << 20)
|
|
#define E4210_DIV0_ATB_SHIFT 16
|
|
#define E4210_DIV0_ATB_MASK (DIV_MASK << E4210_DIV0_ATB_SHIFT)
|
|
|
|
#define MAX_DIV 8
|
|
#define DIV_MASK 7
|
|
#define DIV_MASK_ALL 0xffffffff
|
|
#define MUX_MASK 7
|
|
|
|
/*
|
|
* Helper function to wait until divider(s) have stabilized after the divider
|
|
* value has changed.
|
|
*/
|
|
static void wait_until_divider_stable(void __iomem *div_reg, unsigned long mask)
|
|
{
|
|
unsigned long timeout = jiffies + msecs_to_jiffies(10);
|
|
|
|
do {
|
|
if (!(readl(div_reg) & mask))
|
|
return;
|
|
} while (time_before(jiffies, timeout));
|
|
|
|
if (!(readl(div_reg) & mask))
|
|
return;
|
|
|
|
pr_err("%s: timeout in divider stablization\n", __func__);
|
|
}
|
|
|
|
/*
|
|
* Helper function to wait until mux has stabilized after the mux selection
|
|
* value was changed.
|
|
*/
|
|
static void wait_until_mux_stable(void __iomem *mux_reg, u32 mux_pos,
|
|
unsigned long mux_value)
|
|
{
|
|
unsigned long timeout = jiffies + msecs_to_jiffies(10);
|
|
|
|
do {
|
|
if (((readl(mux_reg) >> mux_pos) & MUX_MASK) == mux_value)
|
|
return;
|
|
} while (time_before(jiffies, timeout));
|
|
|
|
if (((readl(mux_reg) >> mux_pos) & MUX_MASK) == mux_value)
|
|
return;
|
|
|
|
pr_err("%s: re-parenting mux timed-out\n", __func__);
|
|
}
|
|
|
|
/* common round rate callback useable for all types of CPU clocks */
|
|
static long exynos_cpuclk_round_rate(struct clk_hw *hw,
|
|
unsigned long drate, unsigned long *prate)
|
|
{
|
|
struct clk_hw *parent = clk_hw_get_parent(hw);
|
|
*prate = clk_hw_round_rate(parent, drate);
|
|
return *prate;
|
|
}
|
|
|
|
/* common recalc rate callback useable for all types of CPU clocks */
|
|
static unsigned long exynos_cpuclk_recalc_rate(struct clk_hw *hw,
|
|
unsigned long parent_rate)
|
|
{
|
|
/*
|
|
* The CPU clock output (armclk) rate is the same as its parent
|
|
* rate. Although there exist certain dividers inside the CPU
|
|
* clock block that could be used to divide the parent clock,
|
|
* the driver does not make use of them currently, except during
|
|
* frequency transitions.
|
|
*/
|
|
return parent_rate;
|
|
}
|
|
|
|
static const struct clk_ops exynos_cpuclk_clk_ops = {
|
|
.recalc_rate = exynos_cpuclk_recalc_rate,
|
|
.round_rate = exynos_cpuclk_round_rate,
|
|
};
|
|
|
|
/*
|
|
* Helper function to set the 'safe' dividers for the CPU clock. The parameters
|
|
* div and mask contain the divider value and the register bit mask of the
|
|
* dividers to be programmed.
|
|
*/
|
|
static void exynos_set_safe_div(void __iomem *base, unsigned long div,
|
|
unsigned long mask)
|
|
{
|
|
unsigned long div0;
|
|
|
|
div0 = readl(base + E4210_DIV_CPU0);
|
|
div0 = (div0 & ~mask) | (div & mask);
|
|
writel(div0, base + E4210_DIV_CPU0);
|
|
wait_until_divider_stable(base + E4210_DIV_STAT_CPU0, mask);
|
|
}
|
|
|
|
/* handler for pre-rate change notification from parent clock */
|
|
static int exynos_cpuclk_pre_rate_change(struct clk_notifier_data *ndata,
|
|
struct exynos_cpuclk *cpuclk, void __iomem *base)
|
|
{
|
|
const struct exynos_cpuclk_cfg_data *cfg_data = cpuclk->cfg;
|
|
unsigned long alt_prate = clk_get_rate(cpuclk->alt_parent);
|
|
unsigned long alt_div = 0, alt_div_mask = DIV_MASK;
|
|
unsigned long div0, div1 = 0, mux_reg;
|
|
unsigned long flags;
|
|
|
|
/* find out the divider values to use for clock data */
|
|
while ((cfg_data->prate * 1000) != ndata->new_rate) {
|
|
if (cfg_data->prate == 0)
|
|
return -EINVAL;
|
|
cfg_data++;
|
|
}
|
|
|
|
spin_lock_irqsave(cpuclk->lock, flags);
|
|
|
|
/*
|
|
* For the selected PLL clock frequency, get the pre-defined divider
|
|
* values. If the clock for sclk_hpm is not sourced from apll, then
|
|
* the values for DIV_COPY and DIV_HPM dividers need not be set.
|
|
*/
|
|
div0 = cfg_data->div0;
|
|
if (cpuclk->flags & CLK_CPU_HAS_DIV1) {
|
|
div1 = cfg_data->div1;
|
|
if (readl(base + E4210_SRC_CPU) & E4210_MUX_HPM_MASK)
|
|
div1 = readl(base + E4210_DIV_CPU1) &
|
|
(E4210_DIV1_HPM_MASK | E4210_DIV1_COPY_MASK);
|
|
}
|
|
|
|
/*
|
|
* If the old parent clock speed is less than the clock speed of
|
|
* the alternate parent, then it should be ensured that at no point
|
|
* the armclk speed is more than the old_prate until the dividers are
|
|
* set. Also workaround the issue of the dividers being set to lower
|
|
* values before the parent clock speed is set to new lower speed
|
|
* (this can result in too high speed of armclk output clocks).
|
|
*/
|
|
if (alt_prate > ndata->old_rate || ndata->old_rate > ndata->new_rate) {
|
|
unsigned long tmp_rate = min(ndata->old_rate, ndata->new_rate);
|
|
|
|
alt_div = DIV_ROUND_UP(alt_prate, tmp_rate) - 1;
|
|
WARN_ON(alt_div >= MAX_DIV);
|
|
|
|
if (cpuclk->flags & CLK_CPU_NEEDS_DEBUG_ALT_DIV) {
|
|
/*
|
|
* In Exynos4210, ATB clock parent is also mout_core. So
|
|
* ATB clock also needs to be mantained at safe speed.
|
|
*/
|
|
alt_div |= E4210_DIV0_ATB_MASK;
|
|
alt_div_mask |= E4210_DIV0_ATB_MASK;
|
|
}
|
|
exynos_set_safe_div(base, alt_div, alt_div_mask);
|
|
div0 |= alt_div;
|
|
}
|
|
|
|
/* select sclk_mpll as the alternate parent */
|
|
mux_reg = readl(base + E4210_SRC_CPU);
|
|
writel(mux_reg | (1 << 16), base + E4210_SRC_CPU);
|
|
wait_until_mux_stable(base + E4210_STAT_CPU, 16, 2);
|
|
|
|
/* alternate parent is active now. set the dividers */
|
|
writel(div0, base + E4210_DIV_CPU0);
|
|
wait_until_divider_stable(base + E4210_DIV_STAT_CPU0, DIV_MASK_ALL);
|
|
|
|
if (cpuclk->flags & CLK_CPU_HAS_DIV1) {
|
|
writel(div1, base + E4210_DIV_CPU1);
|
|
wait_until_divider_stable(base + E4210_DIV_STAT_CPU1,
|
|
DIV_MASK_ALL);
|
|
}
|
|
|
|
spin_unlock_irqrestore(cpuclk->lock, flags);
|
|
return 0;
|
|
}
|
|
|
|
/* handler for post-rate change notification from parent clock */
|
|
static int exynos_cpuclk_post_rate_change(struct clk_notifier_data *ndata,
|
|
struct exynos_cpuclk *cpuclk, void __iomem *base)
|
|
{
|
|
const struct exynos_cpuclk_cfg_data *cfg_data = cpuclk->cfg;
|
|
unsigned long div = 0, div_mask = DIV_MASK;
|
|
unsigned long mux_reg;
|
|
unsigned long flags;
|
|
|
|
/* find out the divider values to use for clock data */
|
|
if (cpuclk->flags & CLK_CPU_NEEDS_DEBUG_ALT_DIV) {
|
|
while ((cfg_data->prate * 1000) != ndata->new_rate) {
|
|
if (cfg_data->prate == 0)
|
|
return -EINVAL;
|
|
cfg_data++;
|
|
}
|
|
}
|
|
|
|
spin_lock_irqsave(cpuclk->lock, flags);
|
|
|
|
/* select mout_apll as the alternate parent */
|
|
mux_reg = readl(base + E4210_SRC_CPU);
|
|
writel(mux_reg & ~(1 << 16), base + E4210_SRC_CPU);
|
|
wait_until_mux_stable(base + E4210_STAT_CPU, 16, 1);
|
|
|
|
if (cpuclk->flags & CLK_CPU_NEEDS_DEBUG_ALT_DIV) {
|
|
div |= (cfg_data->div0 & E4210_DIV0_ATB_MASK);
|
|
div_mask |= E4210_DIV0_ATB_MASK;
|
|
}
|
|
|
|
exynos_set_safe_div(base, div, div_mask);
|
|
spin_unlock_irqrestore(cpuclk->lock, flags);
|
|
return 0;
|
|
}
|
|
|
|
/*
|
|
* This notifier function is called for the pre-rate and post-rate change
|
|
* notifications of the parent clock of cpuclk.
|
|
*/
|
|
static int exynos_cpuclk_notifier_cb(struct notifier_block *nb,
|
|
unsigned long event, void *data)
|
|
{
|
|
struct clk_notifier_data *ndata = data;
|
|
struct exynos_cpuclk *cpuclk;
|
|
void __iomem *base;
|
|
int err = 0;
|
|
|
|
cpuclk = container_of(nb, struct exynos_cpuclk, clk_nb);
|
|
base = cpuclk->ctrl_base;
|
|
|
|
if (event == PRE_RATE_CHANGE)
|
|
err = exynos_cpuclk_pre_rate_change(ndata, cpuclk, base);
|
|
else if (event == POST_RATE_CHANGE)
|
|
err = exynos_cpuclk_post_rate_change(ndata, cpuclk, base);
|
|
|
|
return notifier_from_errno(err);
|
|
}
|
|
|
|
/* helper function to register a CPU clock */
|
|
int __init exynos_register_cpu_clock(struct samsung_clk_provider *ctx,
|
|
unsigned int lookup_id, const char *name, const char *parent,
|
|
const char *alt_parent, unsigned long offset,
|
|
const struct exynos_cpuclk_cfg_data *cfg,
|
|
unsigned long num_cfgs, unsigned long flags)
|
|
{
|
|
struct exynos_cpuclk *cpuclk;
|
|
struct clk_init_data init;
|
|
struct clk *clk;
|
|
int ret = 0;
|
|
|
|
cpuclk = kzalloc(sizeof(*cpuclk), GFP_KERNEL);
|
|
if (!cpuclk)
|
|
return -ENOMEM;
|
|
|
|
init.name = name;
|
|
init.flags = CLK_SET_RATE_PARENT;
|
|
init.parent_names = &parent;
|
|
init.num_parents = 1;
|
|
init.ops = &exynos_cpuclk_clk_ops;
|
|
|
|
cpuclk->hw.init = &init;
|
|
cpuclk->ctrl_base = ctx->reg_base + offset;
|
|
cpuclk->lock = &ctx->lock;
|
|
cpuclk->flags = flags;
|
|
cpuclk->clk_nb.notifier_call = exynos_cpuclk_notifier_cb;
|
|
|
|
cpuclk->alt_parent = __clk_lookup(alt_parent);
|
|
if (!cpuclk->alt_parent) {
|
|
pr_err("%s: could not lookup alternate parent %s\n",
|
|
__func__, alt_parent);
|
|
ret = -EINVAL;
|
|
goto free_cpuclk;
|
|
}
|
|
|
|
clk = __clk_lookup(parent);
|
|
if (!clk) {
|
|
pr_err("%s: could not lookup parent clock %s\n",
|
|
__func__, parent);
|
|
ret = -EINVAL;
|
|
goto free_cpuclk;
|
|
}
|
|
|
|
ret = clk_notifier_register(clk, &cpuclk->clk_nb);
|
|
if (ret) {
|
|
pr_err("%s: failed to register clock notifier for %s\n",
|
|
__func__, name);
|
|
goto free_cpuclk;
|
|
}
|
|
|
|
cpuclk->cfg = kmemdup(cfg, sizeof(*cfg) * num_cfgs, GFP_KERNEL);
|
|
if (!cpuclk->cfg) {
|
|
pr_err("%s: could not allocate memory for cpuclk data\n",
|
|
__func__);
|
|
ret = -ENOMEM;
|
|
goto unregister_clk_nb;
|
|
}
|
|
|
|
clk = clk_register(NULL, &cpuclk->hw);
|
|
if (IS_ERR(clk)) {
|
|
pr_err("%s: could not register cpuclk %s\n", __func__, name);
|
|
ret = PTR_ERR(clk);
|
|
goto free_cpuclk_data;
|
|
}
|
|
|
|
samsung_clk_add_lookup(ctx, clk, lookup_id);
|
|
return 0;
|
|
|
|
free_cpuclk_data:
|
|
kfree(cpuclk->cfg);
|
|
unregister_clk_nb:
|
|
clk_notifier_unregister(__clk_lookup(parent), &cpuclk->clk_nb);
|
|
free_cpuclk:
|
|
kfree(cpuclk);
|
|
return ret;
|
|
}
|