2019-02-16 05:39:15 +07:00
|
|
|
// SPDX-License-Identifier: GPL-2.0
|
|
|
|
|
|
|
|
/*
|
|
|
|
* Copyright 2016-2019 HabanaLabs, Ltd.
|
|
|
|
* All Rights Reserved.
|
|
|
|
*/
|
|
|
|
|
|
|
|
#include <uapi/misc/habanalabs.h>
|
|
|
|
#include "habanalabs.h"
|
|
|
|
|
|
|
|
#include <linux/fs.h>
|
|
|
|
#include <linux/uaccess.h>
|
|
|
|
#include <linux/slab.h>
|
|
|
|
|
habanalabs: add new IOCTL for debug, tracing and profiling
Habanalabs ASICs use the ARM coresight infrastructure to support debug,
tracing and profiling of neural networks topologies.
Because the coresight is configured using register writes and reads, and
some of the registers hold sensitive information (e.g. the address in
the device's DRAM where the trace data is written to), the user must go
through the kernel driver to configure this mechanism.
This patch implements the common code of the IOCTL and calls the
ASIC-specific function for the actual H/W configuration.
The IOCTL supports configuration of seven coresight components:
ETR, ETF, STM, FUNNEL, BMON, SPMU and TIMESTAMP
The user specifies which component he wishes to configure and provides a
pointer to a structure (located in its process space) that contains the
relevant configuration.
The common code copies the relevant data from the user-space to kernel
space and then calls the ASIC-specific function to do the H/W
configuration.
After the configuration is done, which is usually composed
of several IOCTL calls depending on what the user wanted to trace, the
user can start executing the topology. The trace data will be written to
the user's area in the device's DRAM.
After the tracing operation is complete, and user will call the IOCTL
again to disable the tracing operation. The user also need to read
values from registers for some of the components (e.g. the size of the
trace data in the device's DRAM). In that case, the user will provide a
pointer to an "output" structure in user-space, which the IOCTL code will
fill according the to selected component.
Signed-off-by: Omer Shpigelman <oshpigelman@habana.ai>
Signed-off-by: Oded Gabbay <oded.gabbay@gmail.com>
2019-04-02 02:31:22 +07:00
|
|
|
static u32 hl_debug_struct_size[HL_DEBUG_OP_TIMESTAMP + 1] = {
|
|
|
|
[HL_DEBUG_OP_ETR] = sizeof(struct hl_debug_params_etr),
|
|
|
|
[HL_DEBUG_OP_ETF] = sizeof(struct hl_debug_params_etf),
|
|
|
|
[HL_DEBUG_OP_STM] = sizeof(struct hl_debug_params_stm),
|
|
|
|
[HL_DEBUG_OP_FUNNEL] = 0,
|
|
|
|
[HL_DEBUG_OP_BMON] = sizeof(struct hl_debug_params_bmon),
|
|
|
|
[HL_DEBUG_OP_SPMU] = sizeof(struct hl_debug_params_spmu),
|
|
|
|
[HL_DEBUG_OP_TIMESTAMP] = 0
|
|
|
|
|
|
|
|
};
|
|
|
|
|
2019-03-24 15:15:44 +07:00
|
|
|
static int device_status_info(struct hl_device *hdev, struct hl_info_args *args)
|
|
|
|
{
|
|
|
|
struct hl_info_device_status dev_stat = {0};
|
|
|
|
u32 size = args->return_size;
|
|
|
|
void __user *out = (void __user *) (uintptr_t) args->return_pointer;
|
|
|
|
|
|
|
|
if ((!size) || (!out))
|
|
|
|
return -EINVAL;
|
|
|
|
|
|
|
|
dev_stat.status = hl_device_status(hdev);
|
|
|
|
|
|
|
|
return copy_to_user(out, &dev_stat,
|
|
|
|
min((size_t)size, sizeof(dev_stat))) ? -EFAULT : 0;
|
|
|
|
}
|
|
|
|
|
2019-02-16 05:39:23 +07:00
|
|
|
static int hw_ip_info(struct hl_device *hdev, struct hl_info_args *args)
|
|
|
|
{
|
|
|
|
struct hl_info_hw_ip_info hw_ip = {0};
|
|
|
|
u32 size = args->return_size;
|
|
|
|
void __user *out = (void __user *) (uintptr_t) args->return_pointer;
|
|
|
|
struct asic_fixed_properties *prop = &hdev->asic_prop;
|
|
|
|
u64 sram_kmd_size, dram_kmd_size;
|
|
|
|
|
|
|
|
if ((!size) || (!out))
|
|
|
|
return -EINVAL;
|
|
|
|
|
|
|
|
sram_kmd_size = (prop->sram_user_base_address -
|
|
|
|
prop->sram_base_address);
|
|
|
|
dram_kmd_size = (prop->dram_user_base_address -
|
|
|
|
prop->dram_base_address);
|
|
|
|
|
|
|
|
hw_ip.device_id = hdev->asic_funcs->get_pci_id(hdev);
|
|
|
|
hw_ip.sram_base_address = prop->sram_user_base_address;
|
|
|
|
hw_ip.dram_base_address = prop->dram_user_base_address;
|
|
|
|
hw_ip.tpc_enabled_mask = prop->tpc_enabled_mask;
|
|
|
|
hw_ip.sram_size = prop->sram_size - sram_kmd_size;
|
|
|
|
hw_ip.dram_size = prop->dram_size - dram_kmd_size;
|
2019-11-16 17:29:50 +07:00
|
|
|
if (hw_ip.dram_size > PAGE_SIZE)
|
2019-02-16 05:39:23 +07:00
|
|
|
hw_ip.dram_enabled = 1;
|
|
|
|
hw_ip.num_of_events = prop->num_of_events;
|
2019-10-16 15:53:52 +07:00
|
|
|
|
|
|
|
memcpy(hw_ip.armcp_version, prop->armcp_info.armcp_version,
|
|
|
|
min(VERSION_MAX_LEN, HL_INFO_VERSION_MAX_LEN));
|
|
|
|
|
|
|
|
memcpy(hw_ip.card_name, prop->armcp_info.card_name,
|
|
|
|
min(CARD_NAME_MAX_LEN, HL_INFO_CARD_NAME_MAX_LEN));
|
|
|
|
|
2019-08-08 21:05:45 +07:00
|
|
|
hw_ip.armcp_cpld_version = le32_to_cpu(prop->armcp_info.cpld_version);
|
2019-02-16 05:39:23 +07:00
|
|
|
hw_ip.psoc_pci_pll_nr = prop->psoc_pci_pll_nr;
|
|
|
|
hw_ip.psoc_pci_pll_nf = prop->psoc_pci_pll_nf;
|
|
|
|
hw_ip.psoc_pci_pll_od = prop->psoc_pci_pll_od;
|
|
|
|
hw_ip.psoc_pci_pll_div_factor = prop->psoc_pci_pll_div_factor;
|
|
|
|
|
|
|
|
return copy_to_user(out, &hw_ip,
|
|
|
|
min((size_t)size, sizeof(hw_ip))) ? -EFAULT : 0;
|
|
|
|
}
|
|
|
|
|
2019-08-29 01:51:52 +07:00
|
|
|
static int hw_events_info(struct hl_device *hdev, bool aggregate,
|
|
|
|
struct hl_info_args *args)
|
2019-02-16 05:39:23 +07:00
|
|
|
{
|
|
|
|
u32 size, max_size = args->return_size;
|
|
|
|
void __user *out = (void __user *) (uintptr_t) args->return_pointer;
|
|
|
|
void *arr;
|
|
|
|
|
|
|
|
if ((!max_size) || (!out))
|
|
|
|
return -EINVAL;
|
|
|
|
|
2019-08-29 01:51:52 +07:00
|
|
|
arr = hdev->asic_funcs->get_events_stat(hdev, aggregate, &size);
|
2019-02-16 05:39:23 +07:00
|
|
|
|
|
|
|
return copy_to_user(out, arr, min(max_size, size)) ? -EFAULT : 0;
|
|
|
|
}
|
|
|
|
|
2019-07-30 15:48:02 +07:00
|
|
|
static int dram_usage_info(struct hl_fpriv *hpriv, struct hl_info_args *args)
|
2019-02-16 05:39:23 +07:00
|
|
|
{
|
2019-07-30 15:48:02 +07:00
|
|
|
struct hl_device *hdev = hpriv->hdev;
|
2019-02-16 05:39:23 +07:00
|
|
|
struct hl_info_dram_usage dram_usage = {0};
|
|
|
|
u32 max_size = args->return_size;
|
|
|
|
void __user *out = (void __user *) (uintptr_t) args->return_pointer;
|
|
|
|
struct asic_fixed_properties *prop = &hdev->asic_prop;
|
|
|
|
u64 dram_kmd_size;
|
|
|
|
|
|
|
|
if ((!max_size) || (!out))
|
|
|
|
return -EINVAL;
|
|
|
|
|
|
|
|
dram_kmd_size = (prop->dram_user_base_address -
|
|
|
|
prop->dram_base_address);
|
|
|
|
dram_usage.dram_free_mem = (prop->dram_size - dram_kmd_size) -
|
|
|
|
atomic64_read(&hdev->dram_used_mem);
|
2019-07-30 15:48:02 +07:00
|
|
|
if (hpriv->ctx)
|
|
|
|
dram_usage.ctx_dram_mem =
|
|
|
|
atomic64_read(&hpriv->ctx->dram_phys_mem);
|
2019-02-16 05:39:23 +07:00
|
|
|
|
|
|
|
return copy_to_user(out, &dram_usage,
|
|
|
|
min((size_t) max_size, sizeof(dram_usage))) ? -EFAULT : 0;
|
|
|
|
}
|
|
|
|
|
|
|
|
static int hw_idle(struct hl_device *hdev, struct hl_info_args *args)
|
|
|
|
{
|
|
|
|
struct hl_info_hw_idle hw_idle = {0};
|
|
|
|
u32 max_size = args->return_size;
|
|
|
|
void __user *out = (void __user *) (uintptr_t) args->return_pointer;
|
|
|
|
|
|
|
|
if ((!max_size) || (!out))
|
|
|
|
return -EINVAL;
|
|
|
|
|
2019-07-01 20:59:45 +07:00
|
|
|
hw_idle.is_idle = hdev->asic_funcs->is_device_idle(hdev,
|
|
|
|
&hw_idle.busy_engines_mask, NULL);
|
2019-02-16 05:39:23 +07:00
|
|
|
|
|
|
|
return copy_to_user(out, &hw_idle,
|
|
|
|
min((size_t) max_size, sizeof(hw_idle))) ? -EFAULT : 0;
|
|
|
|
}
|
|
|
|
|
habanalabs: add new IOCTL for debug, tracing and profiling
Habanalabs ASICs use the ARM coresight infrastructure to support debug,
tracing and profiling of neural networks topologies.
Because the coresight is configured using register writes and reads, and
some of the registers hold sensitive information (e.g. the address in
the device's DRAM where the trace data is written to), the user must go
through the kernel driver to configure this mechanism.
This patch implements the common code of the IOCTL and calls the
ASIC-specific function for the actual H/W configuration.
The IOCTL supports configuration of seven coresight components:
ETR, ETF, STM, FUNNEL, BMON, SPMU and TIMESTAMP
The user specifies which component he wishes to configure and provides a
pointer to a structure (located in its process space) that contains the
relevant configuration.
The common code copies the relevant data from the user-space to kernel
space and then calls the ASIC-specific function to do the H/W
configuration.
After the configuration is done, which is usually composed
of several IOCTL calls depending on what the user wanted to trace, the
user can start executing the topology. The trace data will be written to
the user's area in the device's DRAM.
After the tracing operation is complete, and user will call the IOCTL
again to disable the tracing operation. The user also need to read
values from registers for some of the components (e.g. the size of the
trace data in the device's DRAM). In that case, the user will provide a
pointer to an "output" structure in user-space, which the IOCTL code will
fill according the to selected component.
Signed-off-by: Omer Shpigelman <oshpigelman@habana.ai>
Signed-off-by: Oded Gabbay <oded.gabbay@gmail.com>
2019-04-02 02:31:22 +07:00
|
|
|
static int debug_coresight(struct hl_device *hdev, struct hl_debug_args *args)
|
|
|
|
{
|
|
|
|
struct hl_debug_params *params;
|
|
|
|
void *input = NULL, *output = NULL;
|
|
|
|
int rc;
|
|
|
|
|
|
|
|
params = kzalloc(sizeof(*params), GFP_KERNEL);
|
|
|
|
if (!params)
|
|
|
|
return -ENOMEM;
|
|
|
|
|
|
|
|
params->reg_idx = args->reg_idx;
|
|
|
|
params->enable = args->enable;
|
|
|
|
params->op = args->op;
|
|
|
|
|
|
|
|
if (args->input_ptr && args->input_size) {
|
2019-08-06 14:37:59 +07:00
|
|
|
input = kzalloc(hl_debug_struct_size[args->op], GFP_KERNEL);
|
|
|
|
if (!input) {
|
|
|
|
rc = -ENOMEM;
|
|
|
|
goto out;
|
|
|
|
}
|
|
|
|
|
|
|
|
if (copy_from_user(input, u64_to_user_ptr(args->input_ptr),
|
|
|
|
args->input_size)) {
|
|
|
|
rc = -EFAULT;
|
|
|
|
dev_err(hdev->dev, "failed to copy input debug data\n");
|
habanalabs: add new IOCTL for debug, tracing and profiling
Habanalabs ASICs use the ARM coresight infrastructure to support debug,
tracing and profiling of neural networks topologies.
Because the coresight is configured using register writes and reads, and
some of the registers hold sensitive information (e.g. the address in
the device's DRAM where the trace data is written to), the user must go
through the kernel driver to configure this mechanism.
This patch implements the common code of the IOCTL and calls the
ASIC-specific function for the actual H/W configuration.
The IOCTL supports configuration of seven coresight components:
ETR, ETF, STM, FUNNEL, BMON, SPMU and TIMESTAMP
The user specifies which component he wishes to configure and provides a
pointer to a structure (located in its process space) that contains the
relevant configuration.
The common code copies the relevant data from the user-space to kernel
space and then calls the ASIC-specific function to do the H/W
configuration.
After the configuration is done, which is usually composed
of several IOCTL calls depending on what the user wanted to trace, the
user can start executing the topology. The trace data will be written to
the user's area in the device's DRAM.
After the tracing operation is complete, and user will call the IOCTL
again to disable the tracing operation. The user also need to read
values from registers for some of the components (e.g. the size of the
trace data in the device's DRAM). In that case, the user will provide a
pointer to an "output" structure in user-space, which the IOCTL code will
fill according the to selected component.
Signed-off-by: Omer Shpigelman <oshpigelman@habana.ai>
Signed-off-by: Oded Gabbay <oded.gabbay@gmail.com>
2019-04-02 02:31:22 +07:00
|
|
|
goto out;
|
|
|
|
}
|
|
|
|
|
|
|
|
params->input = input;
|
|
|
|
}
|
|
|
|
|
|
|
|
if (args->output_ptr && args->output_size) {
|
|
|
|
output = kzalloc(args->output_size, GFP_KERNEL);
|
|
|
|
if (!output) {
|
|
|
|
rc = -ENOMEM;
|
|
|
|
goto out;
|
|
|
|
}
|
|
|
|
|
|
|
|
params->output = output;
|
|
|
|
params->output_size = args->output_size;
|
|
|
|
}
|
|
|
|
|
|
|
|
rc = hdev->asic_funcs->debug_coresight(hdev, params);
|
|
|
|
if (rc) {
|
|
|
|
dev_err(hdev->dev,
|
|
|
|
"debug coresight operation failed %d\n", rc);
|
|
|
|
goto out;
|
|
|
|
}
|
|
|
|
|
2019-11-16 17:29:50 +07:00
|
|
|
if (output && copy_to_user((void __user *) (uintptr_t) args->output_ptr,
|
|
|
|
output, args->output_size)) {
|
|
|
|
dev_err(hdev->dev, "copy to user failed in debug ioctl\n");
|
|
|
|
rc = -EFAULT;
|
|
|
|
goto out;
|
habanalabs: add new IOCTL for debug, tracing and profiling
Habanalabs ASICs use the ARM coresight infrastructure to support debug,
tracing and profiling of neural networks topologies.
Because the coresight is configured using register writes and reads, and
some of the registers hold sensitive information (e.g. the address in
the device's DRAM where the trace data is written to), the user must go
through the kernel driver to configure this mechanism.
This patch implements the common code of the IOCTL and calls the
ASIC-specific function for the actual H/W configuration.
The IOCTL supports configuration of seven coresight components:
ETR, ETF, STM, FUNNEL, BMON, SPMU and TIMESTAMP
The user specifies which component he wishes to configure and provides a
pointer to a structure (located in its process space) that contains the
relevant configuration.
The common code copies the relevant data from the user-space to kernel
space and then calls the ASIC-specific function to do the H/W
configuration.
After the configuration is done, which is usually composed
of several IOCTL calls depending on what the user wanted to trace, the
user can start executing the topology. The trace data will be written to
the user's area in the device's DRAM.
After the tracing operation is complete, and user will call the IOCTL
again to disable the tracing operation. The user also need to read
values from registers for some of the components (e.g. the size of the
trace data in the device's DRAM). In that case, the user will provide a
pointer to an "output" structure in user-space, which the IOCTL code will
fill according the to selected component.
Signed-off-by: Omer Shpigelman <oshpigelman@habana.ai>
Signed-off-by: Oded Gabbay <oded.gabbay@gmail.com>
2019-04-02 02:31:22 +07:00
|
|
|
}
|
|
|
|
|
2019-11-16 17:29:50 +07:00
|
|
|
|
habanalabs: add new IOCTL for debug, tracing and profiling
Habanalabs ASICs use the ARM coresight infrastructure to support debug,
tracing and profiling of neural networks topologies.
Because the coresight is configured using register writes and reads, and
some of the registers hold sensitive information (e.g. the address in
the device's DRAM where the trace data is written to), the user must go
through the kernel driver to configure this mechanism.
This patch implements the common code of the IOCTL and calls the
ASIC-specific function for the actual H/W configuration.
The IOCTL supports configuration of seven coresight components:
ETR, ETF, STM, FUNNEL, BMON, SPMU and TIMESTAMP
The user specifies which component he wishes to configure and provides a
pointer to a structure (located in its process space) that contains the
relevant configuration.
The common code copies the relevant data from the user-space to kernel
space and then calls the ASIC-specific function to do the H/W
configuration.
After the configuration is done, which is usually composed
of several IOCTL calls depending on what the user wanted to trace, the
user can start executing the topology. The trace data will be written to
the user's area in the device's DRAM.
After the tracing operation is complete, and user will call the IOCTL
again to disable the tracing operation. The user also need to read
values from registers for some of the components (e.g. the size of the
trace data in the device's DRAM). In that case, the user will provide a
pointer to an "output" structure in user-space, which the IOCTL code will
fill according the to selected component.
Signed-off-by: Omer Shpigelman <oshpigelman@habana.ai>
Signed-off-by: Oded Gabbay <oded.gabbay@gmail.com>
2019-04-02 02:31:22 +07:00
|
|
|
out:
|
|
|
|
kfree(params);
|
|
|
|
kfree(output);
|
|
|
|
kfree(input);
|
|
|
|
|
|
|
|
return rc;
|
|
|
|
}
|
|
|
|
|
2019-08-28 21:32:04 +07:00
|
|
|
static int device_utilization(struct hl_device *hdev, struct hl_info_args *args)
|
|
|
|
{
|
|
|
|
struct hl_info_device_utilization device_util = {0};
|
|
|
|
u32 max_size = args->return_size;
|
|
|
|
void __user *out = (void __user *) (uintptr_t) args->return_pointer;
|
|
|
|
|
|
|
|
if ((!max_size) || (!out))
|
|
|
|
return -EINVAL;
|
|
|
|
|
|
|
|
if ((args->period_ms < 100) || (args->period_ms > 1000) ||
|
|
|
|
(args->period_ms % 100)) {
|
|
|
|
dev_err(hdev->dev,
|
|
|
|
"period %u must be between 100 - 1000 and must be divisible by 100\n",
|
|
|
|
args->period_ms);
|
|
|
|
return -EINVAL;
|
|
|
|
}
|
|
|
|
|
|
|
|
device_util.utilization = hl_device_utilization(hdev, args->period_ms);
|
|
|
|
|
|
|
|
return copy_to_user(out, &device_util,
|
|
|
|
min((size_t) max_size, sizeof(device_util))) ? -EFAULT : 0;
|
|
|
|
}
|
|
|
|
|
2019-10-10 19:48:59 +07:00
|
|
|
static int get_clk_rate(struct hl_device *hdev, struct hl_info_args *args)
|
|
|
|
{
|
|
|
|
struct hl_info_clk_rate clk_rate = {0};
|
|
|
|
u32 max_size = args->return_size;
|
|
|
|
void __user *out = (void __user *) (uintptr_t) args->return_pointer;
|
|
|
|
int rc;
|
|
|
|
|
|
|
|
if ((!max_size) || (!out))
|
|
|
|
return -EINVAL;
|
|
|
|
|
|
|
|
rc = hdev->asic_funcs->get_clk_rate(hdev, &clk_rate.cur_clk_rate_mhz,
|
|
|
|
&clk_rate.max_clk_rate_mhz);
|
|
|
|
if (rc)
|
|
|
|
return rc;
|
|
|
|
|
|
|
|
return copy_to_user(out, &clk_rate,
|
|
|
|
min((size_t) max_size, sizeof(clk_rate))) ? -EFAULT : 0;
|
|
|
|
}
|
|
|
|
|
2019-11-03 21:26:44 +07:00
|
|
|
static int get_reset_count(struct hl_device *hdev, struct hl_info_args *args)
|
|
|
|
{
|
|
|
|
struct hl_info_reset_count reset_count = {0};
|
|
|
|
u32 max_size = args->return_size;
|
|
|
|
void __user *out = (void __user *) (uintptr_t) args->return_pointer;
|
|
|
|
|
|
|
|
if ((!max_size) || (!out))
|
|
|
|
return -EINVAL;
|
|
|
|
|
|
|
|
reset_count.hard_reset_cnt = hdev->hard_reset_cnt;
|
|
|
|
reset_count.soft_reset_cnt = hdev->soft_reset_cnt;
|
|
|
|
|
|
|
|
return copy_to_user(out, &reset_count,
|
|
|
|
min((size_t) max_size, sizeof(reset_count))) ? -EFAULT : 0;
|
|
|
|
}
|
|
|
|
|
2019-07-30 13:10:50 +07:00
|
|
|
static int _hl_info_ioctl(struct hl_fpriv *hpriv, void *data,
|
|
|
|
struct device *dev)
|
2019-02-16 05:39:23 +07:00
|
|
|
{
|
|
|
|
struct hl_info_args *args = data;
|
|
|
|
struct hl_device *hdev = hpriv->hdev;
|
|
|
|
int rc;
|
|
|
|
|
2019-08-08 19:30:22 +07:00
|
|
|
/*
|
|
|
|
* Information is returned for the following opcodes even if the device
|
|
|
|
* is disabled or in reset.
|
|
|
|
*/
|
|
|
|
switch (args->op) {
|
|
|
|
case HL_INFO_HW_IP_INFO:
|
|
|
|
return hw_ip_info(hdev, args);
|
|
|
|
|
|
|
|
case HL_INFO_DEVICE_STATUS:
|
2019-03-24 15:15:44 +07:00
|
|
|
return device_status_info(hdev, args);
|
|
|
|
|
2019-11-03 21:26:44 +07:00
|
|
|
case HL_INFO_RESET_COUNT:
|
|
|
|
return get_reset_count(hdev, args);
|
|
|
|
|
2019-08-08 19:30:22 +07:00
|
|
|
default:
|
|
|
|
break;
|
|
|
|
}
|
|
|
|
|
2019-02-16 05:39:23 +07:00
|
|
|
if (hl_device_disabled_or_in_reset(hdev)) {
|
2019-07-30 13:10:50 +07:00
|
|
|
dev_warn_ratelimited(dev,
|
2019-04-06 19:41:35 +07:00
|
|
|
"Device is %s. Can't execute INFO IOCTL\n",
|
|
|
|
atomic_read(&hdev->in_reset) ? "in_reset" : "disabled");
|
2019-02-16 05:39:23 +07:00
|
|
|
return -EBUSY;
|
|
|
|
}
|
|
|
|
|
|
|
|
switch (args->op) {
|
|
|
|
case HL_INFO_HW_EVENTS:
|
2019-08-29 01:51:52 +07:00
|
|
|
rc = hw_events_info(hdev, false, args);
|
2019-02-16 05:39:23 +07:00
|
|
|
break;
|
|
|
|
|
|
|
|
case HL_INFO_DRAM_USAGE:
|
2019-07-30 15:48:02 +07:00
|
|
|
rc = dram_usage_info(hpriv, args);
|
2019-02-16 05:39:23 +07:00
|
|
|
break;
|
|
|
|
|
|
|
|
case HL_INFO_HW_IDLE:
|
|
|
|
rc = hw_idle(hdev, args);
|
|
|
|
break;
|
|
|
|
|
2019-08-28 21:32:04 +07:00
|
|
|
case HL_INFO_DEVICE_UTILIZATION:
|
|
|
|
rc = device_utilization(hdev, args);
|
|
|
|
break;
|
|
|
|
|
2019-08-29 01:51:52 +07:00
|
|
|
case HL_INFO_HW_EVENTS_AGGREGATE:
|
|
|
|
rc = hw_events_info(hdev, true, args);
|
|
|
|
break;
|
|
|
|
|
2019-10-10 19:48:59 +07:00
|
|
|
case HL_INFO_CLK_RATE:
|
|
|
|
rc = get_clk_rate(hdev, args);
|
|
|
|
break;
|
|
|
|
|
2019-02-16 05:39:23 +07:00
|
|
|
default:
|
2019-07-30 13:10:50 +07:00
|
|
|
dev_err(dev, "Invalid request %d\n", args->op);
|
2019-02-16 05:39:23 +07:00
|
|
|
rc = -ENOTTY;
|
|
|
|
break;
|
|
|
|
}
|
|
|
|
|
|
|
|
return rc;
|
|
|
|
}
|
|
|
|
|
2019-07-30 13:10:50 +07:00
|
|
|
static int hl_info_ioctl(struct hl_fpriv *hpriv, void *data)
|
|
|
|
{
|
|
|
|
return _hl_info_ioctl(hpriv, data, hpriv->hdev->dev);
|
|
|
|
}
|
|
|
|
|
|
|
|
static int hl_info_ioctl_control(struct hl_fpriv *hpriv, void *data)
|
|
|
|
{
|
|
|
|
return _hl_info_ioctl(hpriv, data, hpriv->hdev->dev_ctrl);
|
|
|
|
}
|
|
|
|
|
habanalabs: add new IOCTL for debug, tracing and profiling
Habanalabs ASICs use the ARM coresight infrastructure to support debug,
tracing and profiling of neural networks topologies.
Because the coresight is configured using register writes and reads, and
some of the registers hold sensitive information (e.g. the address in
the device's DRAM where the trace data is written to), the user must go
through the kernel driver to configure this mechanism.
This patch implements the common code of the IOCTL and calls the
ASIC-specific function for the actual H/W configuration.
The IOCTL supports configuration of seven coresight components:
ETR, ETF, STM, FUNNEL, BMON, SPMU and TIMESTAMP
The user specifies which component he wishes to configure and provides a
pointer to a structure (located in its process space) that contains the
relevant configuration.
The common code copies the relevant data from the user-space to kernel
space and then calls the ASIC-specific function to do the H/W
configuration.
After the configuration is done, which is usually composed
of several IOCTL calls depending on what the user wanted to trace, the
user can start executing the topology. The trace data will be written to
the user's area in the device's DRAM.
After the tracing operation is complete, and user will call the IOCTL
again to disable the tracing operation. The user also need to read
values from registers for some of the components (e.g. the size of the
trace data in the device's DRAM). In that case, the user will provide a
pointer to an "output" structure in user-space, which the IOCTL code will
fill according the to selected component.
Signed-off-by: Omer Shpigelman <oshpigelman@habana.ai>
Signed-off-by: Oded Gabbay <oded.gabbay@gmail.com>
2019-04-02 02:31:22 +07:00
|
|
|
static int hl_debug_ioctl(struct hl_fpriv *hpriv, void *data)
|
|
|
|
{
|
|
|
|
struct hl_debug_args *args = data;
|
|
|
|
struct hl_device *hdev = hpriv->hdev;
|
|
|
|
int rc = 0;
|
|
|
|
|
|
|
|
if (hl_device_disabled_or_in_reset(hdev)) {
|
|
|
|
dev_warn_ratelimited(hdev->dev,
|
|
|
|
"Device is %s. Can't execute DEBUG IOCTL\n",
|
|
|
|
atomic_read(&hdev->in_reset) ? "in_reset" : "disabled");
|
|
|
|
return -EBUSY;
|
|
|
|
}
|
|
|
|
|
|
|
|
switch (args->op) {
|
|
|
|
case HL_DEBUG_OP_ETR:
|
|
|
|
case HL_DEBUG_OP_ETF:
|
|
|
|
case HL_DEBUG_OP_STM:
|
|
|
|
case HL_DEBUG_OP_FUNNEL:
|
|
|
|
case HL_DEBUG_OP_BMON:
|
|
|
|
case HL_DEBUG_OP_SPMU:
|
|
|
|
case HL_DEBUG_OP_TIMESTAMP:
|
2019-05-04 21:36:06 +07:00
|
|
|
if (!hdev->in_debug) {
|
2019-06-06 13:28:45 +07:00
|
|
|
dev_err_ratelimited(hdev->dev,
|
2019-05-04 21:36:06 +07:00
|
|
|
"Rejecting debug configuration request because device not in debug mode\n");
|
|
|
|
return -EFAULT;
|
|
|
|
}
|
habanalabs: add new IOCTL for debug, tracing and profiling
Habanalabs ASICs use the ARM coresight infrastructure to support debug,
tracing and profiling of neural networks topologies.
Because the coresight is configured using register writes and reads, and
some of the registers hold sensitive information (e.g. the address in
the device's DRAM where the trace data is written to), the user must go
through the kernel driver to configure this mechanism.
This patch implements the common code of the IOCTL and calls the
ASIC-specific function for the actual H/W configuration.
The IOCTL supports configuration of seven coresight components:
ETR, ETF, STM, FUNNEL, BMON, SPMU and TIMESTAMP
The user specifies which component he wishes to configure and provides a
pointer to a structure (located in its process space) that contains the
relevant configuration.
The common code copies the relevant data from the user-space to kernel
space and then calls the ASIC-specific function to do the H/W
configuration.
After the configuration is done, which is usually composed
of several IOCTL calls depending on what the user wanted to trace, the
user can start executing the topology. The trace data will be written to
the user's area in the device's DRAM.
After the tracing operation is complete, and user will call the IOCTL
again to disable the tracing operation. The user also need to read
values from registers for some of the components (e.g. the size of the
trace data in the device's DRAM). In that case, the user will provide a
pointer to an "output" structure in user-space, which the IOCTL code will
fill according the to selected component.
Signed-off-by: Omer Shpigelman <oshpigelman@habana.ai>
Signed-off-by: Oded Gabbay <oded.gabbay@gmail.com>
2019-04-02 02:31:22 +07:00
|
|
|
args->input_size =
|
|
|
|
min(args->input_size, hl_debug_struct_size[args->op]);
|
|
|
|
rc = debug_coresight(hdev, args);
|
|
|
|
break;
|
2019-05-04 21:36:06 +07:00
|
|
|
case HL_DEBUG_OP_SET_MODE:
|
|
|
|
rc = hl_device_set_debug_mode(hdev, (bool) args->enable);
|
|
|
|
break;
|
habanalabs: add new IOCTL for debug, tracing and profiling
Habanalabs ASICs use the ARM coresight infrastructure to support debug,
tracing and profiling of neural networks topologies.
Because the coresight is configured using register writes and reads, and
some of the registers hold sensitive information (e.g. the address in
the device's DRAM where the trace data is written to), the user must go
through the kernel driver to configure this mechanism.
This patch implements the common code of the IOCTL and calls the
ASIC-specific function for the actual H/W configuration.
The IOCTL supports configuration of seven coresight components:
ETR, ETF, STM, FUNNEL, BMON, SPMU and TIMESTAMP
The user specifies which component he wishes to configure and provides a
pointer to a structure (located in its process space) that contains the
relevant configuration.
The common code copies the relevant data from the user-space to kernel
space and then calls the ASIC-specific function to do the H/W
configuration.
After the configuration is done, which is usually composed
of several IOCTL calls depending on what the user wanted to trace, the
user can start executing the topology. The trace data will be written to
the user's area in the device's DRAM.
After the tracing operation is complete, and user will call the IOCTL
again to disable the tracing operation. The user also need to read
values from registers for some of the components (e.g. the size of the
trace data in the device's DRAM). In that case, the user will provide a
pointer to an "output" structure in user-space, which the IOCTL code will
fill according the to selected component.
Signed-off-by: Omer Shpigelman <oshpigelman@habana.ai>
Signed-off-by: Oded Gabbay <oded.gabbay@gmail.com>
2019-04-02 02:31:22 +07:00
|
|
|
default:
|
|
|
|
dev_err(hdev->dev, "Invalid request %d\n", args->op);
|
|
|
|
rc = -ENOTTY;
|
|
|
|
break;
|
|
|
|
}
|
|
|
|
|
|
|
|
return rc;
|
|
|
|
}
|
|
|
|
|
2019-02-16 05:39:15 +07:00
|
|
|
#define HL_IOCTL_DEF(ioctl, _func) \
|
|
|
|
[_IOC_NR(ioctl)] = {.cmd = ioctl, .func = _func}
|
|
|
|
|
|
|
|
static const struct hl_ioctl_desc hl_ioctls[] = {
|
2019-02-16 05:39:23 +07:00
|
|
|
HL_IOCTL_DEF(HL_IOCTL_INFO, hl_info_ioctl),
|
2019-02-16 05:39:21 +07:00
|
|
|
HL_IOCTL_DEF(HL_IOCTL_CB, hl_cb_ioctl),
|
|
|
|
HL_IOCTL_DEF(HL_IOCTL_CS, hl_cs_ioctl),
|
2019-02-16 05:39:22 +07:00
|
|
|
HL_IOCTL_DEF(HL_IOCTL_WAIT_CS, hl_cs_wait_ioctl),
|
habanalabs: add new IOCTL for debug, tracing and profiling
Habanalabs ASICs use the ARM coresight infrastructure to support debug,
tracing and profiling of neural networks topologies.
Because the coresight is configured using register writes and reads, and
some of the registers hold sensitive information (e.g. the address in
the device's DRAM where the trace data is written to), the user must go
through the kernel driver to configure this mechanism.
This patch implements the common code of the IOCTL and calls the
ASIC-specific function for the actual H/W configuration.
The IOCTL supports configuration of seven coresight components:
ETR, ETF, STM, FUNNEL, BMON, SPMU and TIMESTAMP
The user specifies which component he wishes to configure and provides a
pointer to a structure (located in its process space) that contains the
relevant configuration.
The common code copies the relevant data from the user-space to kernel
space and then calls the ASIC-specific function to do the H/W
configuration.
After the configuration is done, which is usually composed
of several IOCTL calls depending on what the user wanted to trace, the
user can start executing the topology. The trace data will be written to
the user's area in the device's DRAM.
After the tracing operation is complete, and user will call the IOCTL
again to disable the tracing operation. The user also need to read
values from registers for some of the components (e.g. the size of the
trace data in the device's DRAM). In that case, the user will provide a
pointer to an "output" structure in user-space, which the IOCTL code will
fill according the to selected component.
Signed-off-by: Omer Shpigelman <oshpigelman@habana.ai>
Signed-off-by: Oded Gabbay <oded.gabbay@gmail.com>
2019-04-02 02:31:22 +07:00
|
|
|
HL_IOCTL_DEF(HL_IOCTL_MEMORY, hl_mem_ioctl),
|
|
|
|
HL_IOCTL_DEF(HL_IOCTL_DEBUG, hl_debug_ioctl)
|
2019-02-16 05:39:15 +07:00
|
|
|
};
|
|
|
|
|
2019-07-30 13:10:50 +07:00
|
|
|
static const struct hl_ioctl_desc hl_ioctls_control[] = {
|
|
|
|
HL_IOCTL_DEF(HL_IOCTL_INFO, hl_info_ioctl_control)
|
|
|
|
};
|
2019-02-16 05:39:15 +07:00
|
|
|
|
2019-07-30 13:10:50 +07:00
|
|
|
static long _hl_ioctl(struct file *filep, unsigned int cmd, unsigned long arg,
|
|
|
|
const struct hl_ioctl_desc *ioctl, struct device *dev)
|
2019-02-16 05:39:15 +07:00
|
|
|
{
|
|
|
|
struct hl_fpriv *hpriv = filep->private_data;
|
|
|
|
struct hl_device *hdev = hpriv->hdev;
|
|
|
|
unsigned int nr = _IOC_NR(cmd);
|
|
|
|
char stack_kdata[128] = {0};
|
|
|
|
char *kdata = NULL;
|
|
|
|
unsigned int usize, asize;
|
2019-07-30 13:10:50 +07:00
|
|
|
hl_ioctl_t *func;
|
|
|
|
u32 hl_size;
|
2019-02-16 05:39:15 +07:00
|
|
|
int retcode;
|
|
|
|
|
2019-02-16 05:39:20 +07:00
|
|
|
if (hdev->hard_reset_pending) {
|
2019-07-30 13:10:50 +07:00
|
|
|
dev_crit_ratelimited(hdev->dev_ctrl,
|
2019-02-16 05:39:20 +07:00
|
|
|
"Device HARD reset pending! Please close FD\n");
|
|
|
|
return -ENODEV;
|
|
|
|
}
|
|
|
|
|
2019-02-16 05:39:15 +07:00
|
|
|
/* Do not trust userspace, use our own definition */
|
|
|
|
func = ioctl->func;
|
|
|
|
|
|
|
|
if (unlikely(!func)) {
|
2019-07-30 13:10:50 +07:00
|
|
|
dev_dbg(dev, "no function\n");
|
2019-02-16 05:39:15 +07:00
|
|
|
retcode = -ENOTTY;
|
|
|
|
goto out_err;
|
|
|
|
}
|
|
|
|
|
2019-07-30 13:10:50 +07:00
|
|
|
hl_size = _IOC_SIZE(ioctl->cmd);
|
|
|
|
usize = asize = _IOC_SIZE(cmd);
|
|
|
|
if (hl_size > asize)
|
|
|
|
asize = hl_size;
|
|
|
|
|
|
|
|
cmd = ioctl->cmd;
|
|
|
|
|
2019-02-16 05:39:15 +07:00
|
|
|
if (cmd & (IOC_IN | IOC_OUT)) {
|
|
|
|
if (asize <= sizeof(stack_kdata)) {
|
|
|
|
kdata = stack_kdata;
|
|
|
|
} else {
|
|
|
|
kdata = kzalloc(asize, GFP_KERNEL);
|
|
|
|
if (!kdata) {
|
|
|
|
retcode = -ENOMEM;
|
|
|
|
goto out_err;
|
|
|
|
}
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
if (cmd & IOC_IN) {
|
|
|
|
if (copy_from_user(kdata, (void __user *)arg, usize)) {
|
|
|
|
retcode = -EFAULT;
|
|
|
|
goto out_err;
|
|
|
|
}
|
|
|
|
} else if (cmd & IOC_OUT) {
|
|
|
|
memset(kdata, 0, usize);
|
|
|
|
}
|
|
|
|
|
|
|
|
retcode = func(hpriv, kdata);
|
|
|
|
|
2019-11-16 17:29:50 +07:00
|
|
|
if ((cmd & IOC_OUT) && copy_to_user((void __user *)arg, kdata, usize))
|
|
|
|
retcode = -EFAULT;
|
2019-02-16 05:39:15 +07:00
|
|
|
|
|
|
|
out_err:
|
|
|
|
if (retcode)
|
2019-07-30 13:10:50 +07:00
|
|
|
dev_dbg(dev, "error in ioctl: pid=%d, cmd=0x%02x, nr=0x%02x\n",
|
2019-02-16 05:39:15 +07:00
|
|
|
task_pid_nr(current), cmd, nr);
|
|
|
|
|
|
|
|
if (kdata != stack_kdata)
|
|
|
|
kfree(kdata);
|
|
|
|
|
|
|
|
return retcode;
|
|
|
|
}
|
2019-07-30 13:10:50 +07:00
|
|
|
|
|
|
|
long hl_ioctl(struct file *filep, unsigned int cmd, unsigned long arg)
|
|
|
|
{
|
|
|
|
struct hl_fpriv *hpriv = filep->private_data;
|
|
|
|
struct hl_device *hdev = hpriv->hdev;
|
|
|
|
const struct hl_ioctl_desc *ioctl = NULL;
|
|
|
|
unsigned int nr = _IOC_NR(cmd);
|
|
|
|
|
|
|
|
if ((nr >= HL_COMMAND_START) && (nr < HL_COMMAND_END)) {
|
|
|
|
ioctl = &hl_ioctls[nr];
|
|
|
|
} else {
|
|
|
|
dev_err(hdev->dev, "invalid ioctl: pid=%d, nr=0x%02x\n",
|
|
|
|
task_pid_nr(current), nr);
|
|
|
|
return -ENOTTY;
|
|
|
|
}
|
|
|
|
|
|
|
|
return _hl_ioctl(filep, cmd, arg, ioctl, hdev->dev);
|
|
|
|
}
|
|
|
|
|
|
|
|
long hl_ioctl_control(struct file *filep, unsigned int cmd, unsigned long arg)
|
|
|
|
{
|
|
|
|
struct hl_fpriv *hpriv = filep->private_data;
|
|
|
|
struct hl_device *hdev = hpriv->hdev;
|
|
|
|
const struct hl_ioctl_desc *ioctl = NULL;
|
|
|
|
unsigned int nr = _IOC_NR(cmd);
|
|
|
|
|
|
|
|
if (nr == _IOC_NR(HL_IOCTL_INFO)) {
|
|
|
|
ioctl = &hl_ioctls_control[nr];
|
|
|
|
} else {
|
|
|
|
dev_err(hdev->dev_ctrl, "invalid ioctl: pid=%d, nr=0x%02x\n",
|
|
|
|
task_pid_nr(current), nr);
|
|
|
|
return -ENOTTY;
|
|
|
|
}
|
|
|
|
|
|
|
|
return _hl_ioctl(filep, cmd, arg, ioctl, hdev->dev_ctrl);
|
|
|
|
}
|