2019-02-20 00:45:26 +07:00
|
|
|
/* SPDX-License-Identifier: ISC */
|
2013-06-13 00:52:10 +07:00
|
|
|
/*
|
|
|
|
* Copyright (c) 2005-2011 Atheros Communications Inc.
|
2017-12-22 23:31:13 +07:00
|
|
|
* Copyright (c) 2011-2017 Qualcomm Atheros, Inc.
|
2013-06-13 00:52:10 +07:00
|
|
|
*/
|
|
|
|
|
|
|
|
#ifndef _PCI_H_
|
|
|
|
#define _PCI_H_
|
|
|
|
|
|
|
|
#include <linux/interrupt.h>
|
ath10k: pci: use mutex for diagnostic window CE polling
The DIAG copy engine is only used via polling, but it holds a spinlock
with softirqs disabled. Each iteration of our read/write loops can
theoretically take 20ms (two 10ms timeout loops), and this loop can be
run an unbounded number of times while holding the spinlock -- dependent
on the request size given by the caller.
As of commit 39501ea64116 ("ath10k: download firmware via diag Copy
Engine for QCA6174 and QCA9377."), we transfer large chunks of firmware
memory using this mechanism. With large enough firmware segments, this
becomes an exceedingly long period for disabling soft IRQs. For example,
with a 500KiB firmware segment, in testing QCA6174A, I see 200 loop
iterations of about 50-100us each, which can total about 10-20ms.
In reality, we don't really need to block softirqs for this duration.
The DIAG CE is only used in polling mode, and we only need to hold
ce_lock to make sure any CE bookkeeping is done without screwing up
another CE. Otherwise, we only need to ensure exclusion between
ath10k_pci_diag_{read,write}_mem() contexts.
This patch moves to use fine-grained locking for the shared ce_lock,
while adding a new mutex just to ensure mutual exclusion of diag
read/write operations.
Tested on QCA6174A, firmware version WLAN.RM.4.4.1-00132-QCARMSWPZ-1.
Fixes: 39501ea64116 ("ath10k: download firmware via diag Copy Engine for QCA6174 and QCA9377.")
Signed-off-by: Brian Norris <briannorris@chromium.org>
Signed-off-by: Kalle Valo <kvalo@codeaurora.org>
2019-02-08 19:55:38 +07:00
|
|
|
#include <linux/mutex.h>
|
2013-06-13 00:52:10 +07:00
|
|
|
|
|
|
|
#include "hw.h"
|
|
|
|
#include "ce.h"
|
ath10k: add basic skeleton to support ahb
qca4019 uses ahb instead of pci where it slightly differs in device
enumeration, clock control, reset control, etc. Good thing is that
ahb also uses copy engine for the data transaction. So, the most of
the stuff implemented in pci.c/ce.c are reusable in ahb case too.
Device enumeration in ahb case comes through platform driver/device
model. All resource details like irq, memory map, clocks, etc for
qca4019 can be fetched from of_node of platform device.
Simply flow would look like,
device tree => platform device (kernel) => platform driver (ath10k)
Device tree entry will have all qca4019 resource details and the same
info will be passed to kernel. Kernel will prepare new platform device
for that entry and expose DT info to of_node in platform device.
Later, ath10k would register platform driver with unique compatible name
and then kernels binds to corresponding compatible entry & calls ath10k
ahb probe functions. From there onwards, ath10k will take control of it
and move forward.
New bool flag CONFIG_ATH10K_AHB is added in Kconfig to conditionally
enable ahb support in ath10k. On enabling this flag, ath10k_pci.ko
will have ahb support. This patch adds only basic skeleton and few
macros to support ahb in the context of qca4019.
Signed-off-by: Raja Mani <rmani@qti.qualcomm.com>
Signed-off-by: Kalle Valo <kvalo@qca.qualcomm.com>
2016-01-27 16:54:25 +07:00
|
|
|
#include "ahb.h"
|
2013-06-13 00:52:10 +07:00
|
|
|
|
|
|
|
/*
|
|
|
|
* maximum number of bytes that can be
|
|
|
|
* handled atomically by DiagRead/DiagWrite
|
|
|
|
*/
|
|
|
|
#define DIAG_TRANSFER_LIMIT 2048
|
|
|
|
|
|
|
|
struct bmi_xfer {
|
2014-07-14 20:25:25 +07:00
|
|
|
bool tx_done;
|
|
|
|
bool rx_done;
|
2013-06-13 00:52:10 +07:00
|
|
|
bool wait_for_resp;
|
|
|
|
u32 resp_len;
|
|
|
|
};
|
|
|
|
|
|
|
|
/*
|
|
|
|
* PCI-specific Target state
|
|
|
|
*
|
|
|
|
* NOTE: Structure is shared between Host software and Target firmware!
|
|
|
|
*
|
|
|
|
* Much of this may be of interest to the Host so
|
|
|
|
* HOST_INTEREST->hi_interconnect_state points here
|
|
|
|
* (and all members are 32-bit quantities in order to
|
|
|
|
* facilitate Host access). In particular, Host software is
|
|
|
|
* required to initialize pipe_cfg_addr and svc_to_pipe_map.
|
|
|
|
*/
|
|
|
|
struct pcie_state {
|
|
|
|
/* Pipe configuration Target address */
|
|
|
|
/* NB: ce_pipe_config[CE_COUNT] */
|
|
|
|
u32 pipe_cfg_addr;
|
|
|
|
|
|
|
|
/* Service to pipe map Target address */
|
|
|
|
/* NB: service_to_pipe[PIPE_TO_CE_MAP_CN] */
|
|
|
|
u32 svc_to_pipe_map;
|
|
|
|
|
|
|
|
/* number of MSI interrupts requested */
|
|
|
|
u32 msi_requested;
|
|
|
|
|
|
|
|
/* number of MSI interrupts granted */
|
|
|
|
u32 msi_granted;
|
|
|
|
|
|
|
|
/* Message Signalled Interrupt address */
|
|
|
|
u32 msi_addr;
|
|
|
|
|
|
|
|
/* Base data */
|
|
|
|
u32 msi_data;
|
|
|
|
|
|
|
|
/*
|
|
|
|
* Data for firmware interrupt;
|
|
|
|
* MSI data for other interrupts are
|
|
|
|
* in various SoC registers
|
|
|
|
*/
|
|
|
|
u32 msi_fw_intr_data;
|
|
|
|
|
|
|
|
/* PCIE_PWR_METHOD_* */
|
|
|
|
u32 power_mgmt_method;
|
|
|
|
|
|
|
|
/* PCIE_CONFIG_FLAG_* */
|
|
|
|
u32 config_flags;
|
|
|
|
};
|
|
|
|
|
|
|
|
/* PCIE_CONFIG_FLAG definitions */
|
|
|
|
#define PCIE_CONFIG_FLAG_ENABLE_L1 0x0000001
|
|
|
|
|
|
|
|
/* Per-pipe state. */
|
2013-08-27 18:08:01 +07:00
|
|
|
struct ath10k_pci_pipe {
|
2013-06-13 00:52:10 +07:00
|
|
|
/* Handle of underlying Copy Engine */
|
2013-08-27 18:08:02 +07:00
|
|
|
struct ath10k_ce_pipe *ce_hdl;
|
2013-06-13 00:52:10 +07:00
|
|
|
|
|
|
|
/* Our pipe number; facilitiates use of pipe_info ptrs. */
|
|
|
|
u8 pipe_num;
|
|
|
|
|
|
|
|
/* Convenience back pointer to hif_ce_state. */
|
|
|
|
struct ath10k *hif_ce_state;
|
|
|
|
|
|
|
|
size_t buf_sz;
|
|
|
|
|
|
|
|
/* protects compl_free and num_send_allowed */
|
|
|
|
spinlock_t pipe_lock;
|
|
|
|
};
|
|
|
|
|
2014-12-02 15:55:54 +07:00
|
|
|
struct ath10k_pci_supp_chip {
|
|
|
|
u32 dev_id;
|
|
|
|
u32 rev_id;
|
|
|
|
};
|
|
|
|
|
2016-04-07 13:40:58 +07:00
|
|
|
enum ath10k_pci_irq_mode {
|
|
|
|
ATH10K_PCI_IRQ_AUTO = 0,
|
|
|
|
ATH10K_PCI_IRQ_LEGACY = 1,
|
|
|
|
ATH10K_PCI_IRQ_MSI = 2,
|
|
|
|
};
|
|
|
|
|
2013-06-13 00:52:10 +07:00
|
|
|
struct ath10k_pci {
|
|
|
|
struct pci_dev *pdev;
|
|
|
|
struct device *dev;
|
|
|
|
struct ath10k *ar;
|
|
|
|
void __iomem *mem;
|
2015-06-15 18:46:42 +07:00
|
|
|
size_t mem_len;
|
2013-06-13 00:52:10 +07:00
|
|
|
|
2016-04-07 13:40:58 +07:00
|
|
|
/* Operating interrupt mode */
|
|
|
|
enum ath10k_pci_irq_mode oper_irq_mode;
|
2013-06-13 00:52:10 +07:00
|
|
|
|
2013-08-27 18:08:01 +07:00
|
|
|
struct ath10k_pci_pipe pipe_info[CE_COUNT_MAX];
|
2013-06-13 00:52:10 +07:00
|
|
|
|
|
|
|
/* Copy Engine used for Diagnostic Accesses */
|
2013-08-27 18:08:02 +07:00
|
|
|
struct ath10k_ce_pipe *ce_diag;
|
ath10k: pci: use mutex for diagnostic window CE polling
The DIAG copy engine is only used via polling, but it holds a spinlock
with softirqs disabled. Each iteration of our read/write loops can
theoretically take 20ms (two 10ms timeout loops), and this loop can be
run an unbounded number of times while holding the spinlock -- dependent
on the request size given by the caller.
As of commit 39501ea64116 ("ath10k: download firmware via diag Copy
Engine for QCA6174 and QCA9377."), we transfer large chunks of firmware
memory using this mechanism. With large enough firmware segments, this
becomes an exceedingly long period for disabling soft IRQs. For example,
with a 500KiB firmware segment, in testing QCA6174A, I see 200 loop
iterations of about 50-100us each, which can total about 10-20ms.
In reality, we don't really need to block softirqs for this duration.
The DIAG CE is only used in polling mode, and we only need to hold
ce_lock to make sure any CE bookkeeping is done without screwing up
another CE. Otherwise, we only need to ensure exclusion between
ath10k_pci_diag_{read,write}_mem() contexts.
This patch moves to use fine-grained locking for the shared ce_lock,
while adding a new mutex just to ensure mutual exclusion of diag
read/write operations.
Tested on QCA6174A, firmware version WLAN.RM.4.4.1-00132-QCARMSWPZ-1.
Fixes: 39501ea64116 ("ath10k: download firmware via diag Copy Engine for QCA6174 and QCA9377.")
Signed-off-by: Brian Norris <briannorris@chromium.org>
Signed-off-by: Kalle Valo <kvalo@codeaurora.org>
2019-02-08 19:55:38 +07:00
|
|
|
/* For protecting ce_diag */
|
|
|
|
struct mutex ce_diag_mutex;
|
2013-06-13 00:52:10 +07:00
|
|
|
|
ath10k: perform crash dump collection in workqueue
Commit 25733c4e67df ("ath10k: pci: use mutex for diagnostic window CE
polling") introduced a regression where we try to sleep (grab a mutex)
in an atomic context:
[ 233.602619] BUG: sleeping function called from invalid context at kernel/locking/mutex.c:254
[ 233.602626] in_atomic(): 1, irqs_disabled(): 0, pid: 0, name: swapper/0
[ 233.602636] CPU: 0 PID: 0 Comm: swapper/0 Tainted: G W 5.1.0-rc2 #4
[ 233.602642] Hardware name: Google Scarlet (DT)
[ 233.602647] Call trace:
[ 233.602663] dump_backtrace+0x0/0x11c
[ 233.602672] show_stack+0x20/0x28
[ 233.602681] dump_stack+0x98/0xbc
[ 233.602690] ___might_sleep+0x154/0x16c
[ 233.602696] __might_sleep+0x78/0x88
[ 233.602704] mutex_lock+0x2c/0x5c
[ 233.602717] ath10k_pci_diag_read_mem+0x68/0x21c [ath10k_pci]
[ 233.602725] ath10k_pci_diag_read32+0x48/0x74 [ath10k_pci]
[ 233.602733] ath10k_pci_dump_registers+0x5c/0x16c [ath10k_pci]
[ 233.602741] ath10k_pci_fw_crashed_dump+0xb8/0x548 [ath10k_pci]
[ 233.602749] ath10k_pci_napi_poll+0x60/0x128 [ath10k_pci]
[ 233.602757] net_rx_action+0x140/0x388
[ 233.602766] __do_softirq+0x1b0/0x35c
[...]
ath10k_pci_fw_crashed_dump() is called from NAPI contexts, and firmware
memory dumps are retrieved using the diag memory interface.
A simple reproduction case is to run this on QCA6174A /
WLAN.RM.4.4.1-00132-QCARMSWP-1, which happens to be a way to b0rk the
firmware:
dd if=/sys/kernel/debug/ieee80211/phy0/ath10k/mem_value bs=4K count=1
of=/dev/null
(NB: simulated firmware crashes, via debugfs, don't trigger firmware
dumps.)
The fix is to move the crash-dump into a workqueue context, and avoid
relying on 'data_lock' for most mutual exclusion. We only keep using it
here for protecting 'fw_crash_counter', while the rest of the coredump
buffers are protected by a new 'dump_mutex'.
I've tested the above with simulated firmware crashes (debugfs 'reset'
file), real firmware crashes (the 'dd' command above), and a variety of
reboot and suspend/resume configurations on QCA6174A.
Reported here:
http://lkml.kernel.org/linux-wireless/20190325202706.GA68720@google.com
Fixes: 25733c4e67df ("ath10k: pci: use mutex for diagnostic window CE polling")
Signed-off-by: Brian Norris <briannorris@chromium.org>
Signed-off-by: Kalle Valo <kvalo@codeaurora.org>
2019-03-27 03:57:28 +07:00
|
|
|
struct work_struct dump_work;
|
|
|
|
|
2017-06-28 11:48:26 +07:00
|
|
|
struct ath10k_ce ce;
|
2014-08-22 19:33:14 +07:00
|
|
|
struct timer_list rx_post_retry;
|
2015-05-18 16:38:16 +07:00
|
|
|
|
|
|
|
/* Due to HW quirks it is recommended to disable ASPM during device
|
|
|
|
* bootup. To do that the original PCI-E Link Control is stored before
|
|
|
|
* device bootup is executed and re-programmed later.
|
|
|
|
*/
|
|
|
|
u16 link_ctl;
|
2015-05-18 16:38:18 +07:00
|
|
|
|
|
|
|
/* Protects ps_awake and ps_wake_refcount */
|
|
|
|
spinlock_t ps_lock;
|
|
|
|
|
|
|
|
/* The device has a special powersave-oriented register. When device is
|
|
|
|
* considered asleep it drains less power and driver is forbidden from
|
|
|
|
* accessing most MMIO registers. If host were to access them without
|
|
|
|
* waking up the device might scribble over host memory or return
|
|
|
|
* 0xdeadbeef readouts.
|
|
|
|
*/
|
|
|
|
unsigned long ps_wake_refcount;
|
|
|
|
|
|
|
|
/* Waking up takes some time (up to 2ms in some cases) so it can be bad
|
|
|
|
* for latency. To mitigate this the device isn't immediately allowed
|
|
|
|
* to sleep after all references are undone - instead there's a grace
|
|
|
|
* period after which the powersave register is updated unless some
|
|
|
|
* activity to/from device happened in the meantime.
|
|
|
|
*
|
|
|
|
* Also see comments on ATH10K_PCI_SLEEP_GRACE_PERIOD_MSEC.
|
|
|
|
*/
|
|
|
|
struct timer_list ps_timer;
|
|
|
|
|
|
|
|
/* MMIO registers are used to communicate with the device. With
|
|
|
|
* intensive traffic accessing powersave register would be a bit
|
|
|
|
* wasteful overhead and would needlessly stall CPU. It is far more
|
|
|
|
* efficient to rely on a variable in RAM and update it only upon
|
|
|
|
* powersave register state changes.
|
|
|
|
*/
|
|
|
|
bool ps_awake;
|
2015-10-16 19:54:51 +07:00
|
|
|
|
|
|
|
/* pci power save, disable for QCA988X and QCA99X0.
|
|
|
|
* Writing 'false' to this variable avoids frequent locking
|
|
|
|
* on MMIO read/write.
|
|
|
|
*/
|
|
|
|
bool pci_ps;
|
2016-01-27 16:54:23 +07:00
|
|
|
|
2016-05-24 03:12:43 +07:00
|
|
|
/* Chip specific pci reset routine used to do a safe reset */
|
|
|
|
int (*pci_soft_reset)(struct ath10k *ar);
|
|
|
|
|
|
|
|
/* Chip specific pci full reset function */
|
|
|
|
int (*pci_hard_reset)(struct ath10k *ar);
|
|
|
|
|
2017-02-01 01:36:51 +07:00
|
|
|
/* chip specific methods for converting target CPU virtual address
|
|
|
|
* space to CE address space
|
|
|
|
*/
|
|
|
|
u32 (*targ_cpu_to_ce_addr)(struct ath10k *ar, u32 addr);
|
|
|
|
|
2016-01-27 16:54:27 +07:00
|
|
|
/* Keep this entry in the last, memory for struct ath10k_ahb is
|
|
|
|
* allocated (ahb support enabled case) in the continuation of
|
|
|
|
* this struct.
|
|
|
|
*/
|
|
|
|
struct ath10k_ahb ahb[0];
|
2013-06-13 00:52:10 +07:00
|
|
|
};
|
|
|
|
|
|
|
|
static inline struct ath10k_pci *ath10k_pci_priv(struct ath10k *ar)
|
|
|
|
{
|
2014-08-07 16:03:27 +07:00
|
|
|
return (struct ath10k_pci *)ar->drv_priv;
|
2013-06-13 00:52:10 +07:00
|
|
|
}
|
|
|
|
|
2014-08-22 19:33:14 +07:00
|
|
|
#define ATH10K_PCI_RX_POST_RETRY_MS 50
|
2013-06-13 00:52:10 +07:00
|
|
|
#define ATH_PCI_RESET_WAIT_MAX 10 /* ms */
|
2015-10-06 19:19:28 +07:00
|
|
|
#define PCIE_WAKE_TIMEOUT 30000 /* 30ms */
|
|
|
|
#define PCIE_WAKE_LATE_US 10000 /* 10ms */
|
2013-06-13 00:52:10 +07:00
|
|
|
|
|
|
|
#define BAR_NUM 0
|
|
|
|
|
|
|
|
#define CDC_WAR_MAGIC_STR 0xceef0000
|
|
|
|
#define CDC_WAR_DATA_CE 4
|
|
|
|
|
|
|
|
/* Wait up to this many Ms for a Diagnostic Access CE operation to complete */
|
2018-09-04 17:00:25 +07:00
|
|
|
#define DIAG_ACCESS_CE_TIMEOUT_US 10000 /* 10 ms */
|
|
|
|
#define DIAG_ACCESS_CE_WAIT_US 50
|
2013-06-13 00:52:10 +07:00
|
|
|
|
2015-05-18 16:38:18 +07:00
|
|
|
void ath10k_pci_write32(struct ath10k *ar, u32 offset, u32 value);
|
|
|
|
void ath10k_pci_soc_write32(struct ath10k *ar, u32 addr, u32 val);
|
|
|
|
void ath10k_pci_reg_write32(struct ath10k *ar, u32 addr, u32 val);
|
2013-10-16 20:46:11 +07:00
|
|
|
|
2015-05-18 16:38:18 +07:00
|
|
|
u32 ath10k_pci_read32(struct ath10k *ar, u32 offset);
|
|
|
|
u32 ath10k_pci_soc_read32(struct ath10k *ar, u32 addr);
|
|
|
|
u32 ath10k_pci_reg_read32(struct ath10k *ar, u32 addr);
|
2013-10-16 20:46:11 +07:00
|
|
|
|
2016-01-27 16:54:22 +07:00
|
|
|
int ath10k_pci_hif_tx_sg(struct ath10k *ar, u8 pipe_id,
|
|
|
|
struct ath10k_hif_sg_item *items, int n_items);
|
|
|
|
int ath10k_pci_hif_diag_read(struct ath10k *ar, u32 address, void *buf,
|
|
|
|
size_t buf_len);
|
|
|
|
int ath10k_pci_diag_write_mem(struct ath10k *ar, u32 address,
|
|
|
|
const void *data, int nbytes);
|
|
|
|
int ath10k_pci_hif_exchange_bmi_msg(struct ath10k *ar, void *req, u32 req_len,
|
|
|
|
void *resp, u32 *resp_len);
|
|
|
|
int ath10k_pci_hif_map_service_to_pipe(struct ath10k *ar, u16 service_id,
|
|
|
|
u8 *ul_pipe, u8 *dl_pipe);
|
|
|
|
void ath10k_pci_hif_get_default_pipe(struct ath10k *ar, u8 *ul_pipe,
|
|
|
|
u8 *dl_pipe);
|
|
|
|
void ath10k_pci_hif_send_complete_check(struct ath10k *ar, u8 pipe,
|
|
|
|
int force);
|
|
|
|
u16 ath10k_pci_hif_get_free_queue_number(struct ath10k *ar, u8 pipe);
|
|
|
|
void ath10k_pci_hif_power_down(struct ath10k *ar);
|
|
|
|
int ath10k_pci_alloc_pipes(struct ath10k *ar);
|
|
|
|
void ath10k_pci_free_pipes(struct ath10k *ar);
|
|
|
|
void ath10k_pci_free_pipes(struct ath10k *ar);
|
2017-10-24 16:29:54 +07:00
|
|
|
void ath10k_pci_rx_replenish_retry(struct timer_list *t);
|
2016-01-27 16:54:22 +07:00
|
|
|
void ath10k_pci_ce_deinit(struct ath10k *ar);
|
2016-09-02 23:46:09 +07:00
|
|
|
void ath10k_pci_init_napi(struct ath10k *ar);
|
2016-01-27 16:54:22 +07:00
|
|
|
int ath10k_pci_init_pipes(struct ath10k *ar);
|
|
|
|
int ath10k_pci_init_config(struct ath10k *ar);
|
|
|
|
void ath10k_pci_rx_post(struct ath10k *ar);
|
|
|
|
void ath10k_pci_flush(struct ath10k *ar);
|
|
|
|
void ath10k_pci_enable_legacy_irq(struct ath10k *ar);
|
|
|
|
bool ath10k_pci_irq_pending(struct ath10k *ar);
|
|
|
|
void ath10k_pci_disable_and_clear_legacy_irq(struct ath10k *ar);
|
2016-09-02 23:46:09 +07:00
|
|
|
void ath10k_pci_irq_msi_fw_mask(struct ath10k *ar);
|
2016-01-27 16:54:22 +07:00
|
|
|
int ath10k_pci_wait_for_target_init(struct ath10k *ar);
|
2016-01-27 16:54:24 +07:00
|
|
|
int ath10k_pci_setup_resource(struct ath10k *ar);
|
|
|
|
void ath10k_pci_release_resource(struct ath10k *ar);
|
2016-01-27 16:54:22 +07:00
|
|
|
|
2015-05-18 16:38:18 +07:00
|
|
|
/* QCA6174 is known to have Tx/Rx issues when SOC_WAKE register is poked too
|
|
|
|
* frequently. To avoid this put SoC to sleep after a very conservative grace
|
|
|
|
* period. Adjust with great care.
|
|
|
|
*/
|
|
|
|
#define ATH10K_PCI_SLEEP_GRACE_PERIOD_MSEC 60
|
2013-06-13 00:52:10 +07:00
|
|
|
|
|
|
|
#endif /* _PCI_H_ */
|