mirror of
https://github.com/torvalds/linux.git
synced 2024-11-24 21:21:41 +00:00
perf: Add driver for Arm NI-700 interconnect PMU
The Arm NI-700 Network-on-Chip Interconnect has a relatively straightforward design with a hierarchy of voltage, power, and clock domains, where each clock domain then contains a number of interface units and a PMU which can monitor events thereon. As such, it begets a relatively straightforward driver to interface those PMUs with perf. Even more so than with arm-cmn, users will require detailed knowledge of the wider system topology in order to meaningfully analyse anything, since the interconnect itself cannot know what lies beyond the boundary of each inscrutably-numbered interface. Given that, for now they are also expected to refer to the NI-700 documentation for the relevant event IDs to provide as well. An identifier is implemented so we can come back and add jevents if anyone really wants to. Signed-off-by: Robin Murphy <robin.murphy@arm.com> Link: https://lore.kernel.org/r/9933058d0ab8138c78a61cd6852ea5d5ff48e393.1725470837.git.robin.murphy@arm.com Signed-off-by: Will Deacon <will@kernel.org>
This commit is contained in:
parent
abbe74dd10
commit
4d5a7680f2
17
Documentation/admin-guide/perf/arm-ni.rst
Normal file
17
Documentation/admin-guide/perf/arm-ni.rst
Normal file
@ -0,0 +1,17 @@
|
||||
====================================
|
||||
Arm Network-on Chip Interconnect PMU
|
||||
====================================
|
||||
|
||||
NI-700 and friends implement a distinct PMU for each clock domain within the
|
||||
interconnect. Correspondingly, the driver exposes multiple PMU devices named
|
||||
arm_ni_<x>_cd_<y>, where <x> is an (arbitrary) instance identifier and <y> is
|
||||
the clock domain ID within that particular instance. If multiple NI instances
|
||||
exist within a system, the PMU devices can be correlated with the underlying
|
||||
hardware instance via sysfs parentage.
|
||||
|
||||
Each PMU exposes base event aliases for the interface types present in its clock
|
||||
domain. These require qualifying with the "eventid" and "nodeid" parameters
|
||||
to specify the event code to count and the interface at which to count it
|
||||
(per the configured hardware ID as reflected in the xxNI_NODE_INFO register).
|
||||
The exception is the "cycles" alias for the PMU cycle counter, which is encoded
|
||||
with the PMU node type and needs no further qualification.
|
@ -16,6 +16,7 @@ Performance monitor support
|
||||
starfive_starlink_pmu
|
||||
arm-ccn
|
||||
arm-cmn
|
||||
arm-ni
|
||||
xgene-pmu
|
||||
arm_dsu_pmu
|
||||
thunderx2-pmu
|
||||
|
@ -48,6 +48,13 @@ config ARM_CMN
|
||||
Support for PMU events monitoring on the Arm CMN-600 Coherent Mesh
|
||||
Network interconnect.
|
||||
|
||||
config ARM_NI
|
||||
tristate "Arm NI-700 PMU support"
|
||||
depends on ARM64 || COMPILE_TEST
|
||||
help
|
||||
Support for PMU events monitoring on the Arm NI-700 Network-on-Chip
|
||||
interconnect and family.
|
||||
|
||||
config ARM_PMU
|
||||
depends on ARM || ARM64
|
||||
bool "ARM PMU framework"
|
||||
|
@ -3,6 +3,7 @@ obj-$(CONFIG_ARM_CCI_PMU) += arm-cci.o
|
||||
obj-$(CONFIG_ARM_CCN) += arm-ccn.o
|
||||
obj-$(CONFIG_ARM_CMN) += arm-cmn.o
|
||||
obj-$(CONFIG_ARM_DSU_PMU) += arm_dsu_pmu.o
|
||||
obj-$(CONFIG_ARM_NI) += arm-ni.o
|
||||
obj-$(CONFIG_ARM_PMU) += arm_pmu.o arm_pmu_platform.o
|
||||
obj-$(CONFIG_ARM_PMU_ACPI) += arm_pmu_acpi.o
|
||||
obj-$(CONFIG_ARM_PMUV3) += arm_pmuv3.o
|
||||
|
781
drivers/perf/arm-ni.c
Normal file
781
drivers/perf/arm-ni.c
Normal file
@ -0,0 +1,781 @@
|
||||
// SPDX-License-Identifier: GPL-2.0
|
||||
// Copyright (C) 2022-2024 Arm Limited
|
||||
// NI-700 Network-on-Chip PMU driver
|
||||
|
||||
#include <linux/acpi.h>
|
||||
#include <linux/bitfield.h>
|
||||
#include <linux/interrupt.h>
|
||||
#include <linux/io.h>
|
||||
#include <linux/io-64-nonatomic-lo-hi.h>
|
||||
#include <linux/kernel.h>
|
||||
#include <linux/module.h>
|
||||
#include <linux/of.h>
|
||||
#include <linux/perf_event.h>
|
||||
#include <linux/platform_device.h>
|
||||
#include <linux/slab.h>
|
||||
|
||||
/* Common registers */
|
||||
#define NI_NODE_TYPE 0x000
|
||||
#define NI_NODE_TYPE_NODE_ID GENMASK(31, 16)
|
||||
#define NI_NODE_TYPE_NODE_TYPE GENMASK(15, 0)
|
||||
|
||||
#define NI_CHILD_NODE_INFO 0x004
|
||||
#define NI_CHILD_PTR(n) (0x008 + (n) * 4)
|
||||
|
||||
#define NI700_PMUSELA 0x00c
|
||||
|
||||
/* Config node */
|
||||
#define NI_PERIPHERAL_ID0 0xfe0
|
||||
#define NI_PIDR0_PART_7_0 GENMASK(7, 0)
|
||||
#define NI_PERIPHERAL_ID1 0xfe4
|
||||
#define NI_PIDR1_PART_11_8 GENMASK(3, 0)
|
||||
#define NI_PERIPHERAL_ID2 0xfe8
|
||||
#define NI_PIDR2_VERSION GENMASK(7, 4)
|
||||
|
||||
/* PMU node */
|
||||
#define NI_PMEVCNTR(n) (0x008 + (n) * 8)
|
||||
#define NI_PMCCNTR_L 0x0f8
|
||||
#define NI_PMCCNTR_U 0x0fc
|
||||
#define NI_PMEVTYPER(n) (0x400 + (n) * 4)
|
||||
#define NI_PMEVTYPER_NODE_TYPE GENMASK(12, 9)
|
||||
#define NI_PMEVTYPER_NODE_ID GENMASK(8, 0)
|
||||
#define NI_PMCNTENSET 0xc00
|
||||
#define NI_PMCNTENCLR 0xc20
|
||||
#define NI_PMINTENSET 0xc40
|
||||
#define NI_PMINTENCLR 0xc60
|
||||
#define NI_PMOVSCLR 0xc80
|
||||
#define NI_PMOVSSET 0xcc0
|
||||
#define NI_PMCFGR 0xe00
|
||||
#define NI_PMCR 0xe04
|
||||
#define NI_PMCR_RESET_CCNT BIT(2)
|
||||
#define NI_PMCR_RESET_EVCNT BIT(1)
|
||||
#define NI_PMCR_ENABLE BIT(0)
|
||||
|
||||
#define NI_NUM_COUNTERS 8
|
||||
#define NI_CCNT_IDX 31
|
||||
|
||||
/* Event attributes */
|
||||
#define NI_CONFIG_TYPE GENMASK_ULL(15, 0)
|
||||
#define NI_CONFIG_NODEID GENMASK_ULL(31, 16)
|
||||
#define NI_CONFIG_EVENTID GENMASK_ULL(47, 32)
|
||||
|
||||
#define NI_EVENT_TYPE(event) FIELD_GET(NI_CONFIG_TYPE, (event)->attr.config)
|
||||
#define NI_EVENT_NODEID(event) FIELD_GET(NI_CONFIG_NODEID, (event)->attr.config)
|
||||
#define NI_EVENT_EVENTID(event) FIELD_GET(NI_CONFIG_EVENTID, (event)->attr.config)
|
||||
|
||||
enum ni_part {
|
||||
PART_NI_700 = 0x43b,
|
||||
PART_NI_710AE = 0x43d,
|
||||
};
|
||||
|
||||
enum ni_node_type {
|
||||
NI_GLOBAL,
|
||||
NI_VOLTAGE,
|
||||
NI_POWER,
|
||||
NI_CLOCK,
|
||||
NI_ASNI,
|
||||
NI_AMNI,
|
||||
NI_PMU,
|
||||
NI_HSNI,
|
||||
NI_HMNI,
|
||||
NI_PMNI,
|
||||
};
|
||||
|
||||
struct arm_ni_node {
|
||||
void __iomem *base;
|
||||
enum ni_node_type type;
|
||||
u16 id;
|
||||
u32 num_components;
|
||||
};
|
||||
|
||||
struct arm_ni_unit {
|
||||
void __iomem *pmusela;
|
||||
enum ni_node_type type;
|
||||
u16 id;
|
||||
bool ns;
|
||||
union {
|
||||
__le64 pmusel;
|
||||
u8 event[8];
|
||||
};
|
||||
};
|
||||
|
||||
struct arm_ni_cd {
|
||||
void __iomem *pmu_base;
|
||||
u16 id;
|
||||
int num_units;
|
||||
int irq;
|
||||
int cpu;
|
||||
struct hlist_node cpuhp_node;
|
||||
struct pmu pmu;
|
||||
struct arm_ni_unit *units;
|
||||
struct perf_event *evcnt[NI_NUM_COUNTERS];
|
||||
struct perf_event *ccnt;
|
||||
};
|
||||
|
||||
struct arm_ni {
|
||||
struct device *dev;
|
||||
void __iomem *base;
|
||||
enum ni_part part;
|
||||
int id;
|
||||
int num_cds;
|
||||
struct arm_ni_cd cds[] __counted_by(num_cds);
|
||||
};
|
||||
|
||||
#define cd_to_ni(cd) container_of((cd), struct arm_ni, cds[(cd)->id])
|
||||
#define pmu_to_cd(p) container_of((p), struct arm_ni_cd, pmu)
|
||||
|
||||
#define cd_for_each_unit(cd, u) \
|
||||
for (struct arm_ni_unit *u = cd->units; u < cd->units + cd->num_units; u++)
|
||||
|
||||
static int arm_ni_hp_state;
|
||||
|
||||
struct arm_ni_event_attr {
|
||||
struct device_attribute attr;
|
||||
enum ni_node_type type;
|
||||
};
|
||||
|
||||
#define NI_EVENT_ATTR(_name, _type) \
|
||||
(&((struct arm_ni_event_attr[]) {{ \
|
||||
.attr = __ATTR(_name, 0444, arm_ni_event_show, NULL), \
|
||||
.type = _type, \
|
||||
}})[0].attr.attr)
|
||||
|
||||
static ssize_t arm_ni_event_show(struct device *dev,
|
||||
struct device_attribute *attr, char *buf)
|
||||
{
|
||||
struct arm_ni_event_attr *eattr = container_of(attr, typeof(*eattr), attr);
|
||||
|
||||
if (eattr->type == NI_PMU)
|
||||
return sysfs_emit(buf, "type=0x%x\n", eattr->type);
|
||||
|
||||
return sysfs_emit(buf, "type=0x%x,eventid=?,nodeid=?\n", eattr->type);
|
||||
}
|
||||
|
||||
static umode_t arm_ni_event_attr_is_visible(struct kobject *kobj,
|
||||
struct attribute *attr, int unused)
|
||||
{
|
||||
struct device *dev = kobj_to_dev(kobj);
|
||||
struct arm_ni_cd *cd = pmu_to_cd(dev_get_drvdata(dev));
|
||||
struct arm_ni_event_attr *eattr;
|
||||
|
||||
eattr = container_of(attr, typeof(*eattr), attr.attr);
|
||||
|
||||
cd_for_each_unit(cd, unit) {
|
||||
if (unit->type == eattr->type && unit->ns)
|
||||
return attr->mode;
|
||||
}
|
||||
|
||||
return 0;
|
||||
}
|
||||
|
||||
static struct attribute *arm_ni_event_attrs[] = {
|
||||
NI_EVENT_ATTR(asni, NI_ASNI),
|
||||
NI_EVENT_ATTR(amni, NI_AMNI),
|
||||
NI_EVENT_ATTR(cycles, NI_PMU),
|
||||
NI_EVENT_ATTR(hsni, NI_HSNI),
|
||||
NI_EVENT_ATTR(hmni, NI_HMNI),
|
||||
NI_EVENT_ATTR(pmni, NI_PMNI),
|
||||
NULL
|
||||
};
|
||||
|
||||
static const struct attribute_group arm_ni_event_attrs_group = {
|
||||
.name = "events",
|
||||
.attrs = arm_ni_event_attrs,
|
||||
.is_visible = arm_ni_event_attr_is_visible,
|
||||
};
|
||||
|
||||
struct arm_ni_format_attr {
|
||||
struct device_attribute attr;
|
||||
u64 field;
|
||||
};
|
||||
|
||||
#define NI_FORMAT_ATTR(_name, _fld) \
|
||||
(&((struct arm_ni_format_attr[]) {{ \
|
||||
.attr = __ATTR(_name, 0444, arm_ni_format_show, NULL), \
|
||||
.field = _fld, \
|
||||
}})[0].attr.attr)
|
||||
|
||||
static ssize_t arm_ni_format_show(struct device *dev,
|
||||
struct device_attribute *attr, char *buf)
|
||||
{
|
||||
struct arm_ni_format_attr *fmt = container_of(attr, typeof(*fmt), attr);
|
||||
|
||||
return sysfs_emit(buf, "config:%*pbl\n", 64, &fmt->field);
|
||||
}
|
||||
|
||||
static struct attribute *arm_ni_format_attrs[] = {
|
||||
NI_FORMAT_ATTR(type, NI_CONFIG_TYPE),
|
||||
NI_FORMAT_ATTR(nodeid, NI_CONFIG_NODEID),
|
||||
NI_FORMAT_ATTR(eventid, NI_CONFIG_EVENTID),
|
||||
NULL
|
||||
};
|
||||
|
||||
static const struct attribute_group arm_ni_format_attrs_group = {
|
||||
.name = "format",
|
||||
.attrs = arm_ni_format_attrs,
|
||||
};
|
||||
|
||||
static ssize_t arm_ni_cpumask_show(struct device *dev,
|
||||
struct device_attribute *attr, char *buf)
|
||||
{
|
||||
struct arm_ni_cd *cd = pmu_to_cd(dev_get_drvdata(dev));
|
||||
|
||||
return cpumap_print_to_pagebuf(true, buf, cpumask_of(cd->cpu));
|
||||
}
|
||||
|
||||
static struct device_attribute arm_ni_cpumask_attr =
|
||||
__ATTR(cpumask, 0444, arm_ni_cpumask_show, NULL);
|
||||
|
||||
static ssize_t arm_ni_identifier_show(struct device *dev,
|
||||
struct device_attribute *attr, char *buf)
|
||||
{
|
||||
struct arm_ni *ni = cd_to_ni(pmu_to_cd(dev_get_drvdata(dev)));
|
||||
u32 reg = readl_relaxed(ni->base + NI_PERIPHERAL_ID2);
|
||||
int version = FIELD_GET(NI_PIDR2_VERSION, reg);
|
||||
|
||||
return sysfs_emit(buf, "%03x%02x\n", ni->part, version);
|
||||
}
|
||||
|
||||
static struct device_attribute arm_ni_identifier_attr =
|
||||
__ATTR(identifier, 0444, arm_ni_identifier_show, NULL);
|
||||
|
||||
static struct attribute *arm_ni_other_attrs[] = {
|
||||
&arm_ni_cpumask_attr.attr,
|
||||
&arm_ni_identifier_attr.attr,
|
||||
NULL
|
||||
};
|
||||
|
||||
static const struct attribute_group arm_ni_other_attr_group = {
|
||||
.attrs = arm_ni_other_attrs,
|
||||
NULL
|
||||
};
|
||||
|
||||
static const struct attribute_group *arm_ni_attr_groups[] = {
|
||||
&arm_ni_event_attrs_group,
|
||||
&arm_ni_format_attrs_group,
|
||||
&arm_ni_other_attr_group,
|
||||
NULL
|
||||
};
|
||||
|
||||
static void arm_ni_pmu_enable(struct pmu *pmu)
|
||||
{
|
||||
writel_relaxed(NI_PMCR_ENABLE, pmu_to_cd(pmu)->pmu_base + NI_PMCR);
|
||||
}
|
||||
|
||||
static void arm_ni_pmu_disable(struct pmu *pmu)
|
||||
{
|
||||
writel_relaxed(0, pmu_to_cd(pmu)->pmu_base + NI_PMCR);
|
||||
}
|
||||
|
||||
struct arm_ni_val {
|
||||
unsigned int evcnt;
|
||||
unsigned int ccnt;
|
||||
};
|
||||
|
||||
static bool arm_ni_val_count_event(struct perf_event *evt, struct arm_ni_val *val)
|
||||
{
|
||||
if (is_software_event(evt))
|
||||
return true;
|
||||
|
||||
if (NI_EVENT_TYPE(evt) == NI_PMU) {
|
||||
val->ccnt++;
|
||||
return val->ccnt <= 1;
|
||||
}
|
||||
|
||||
val->evcnt++;
|
||||
return val->evcnt <= NI_NUM_COUNTERS;
|
||||
}
|
||||
|
||||
static int arm_ni_validate_group(struct perf_event *event)
|
||||
{
|
||||
struct perf_event *sibling, *leader = event->group_leader;
|
||||
struct arm_ni_val val = { 0 };
|
||||
|
||||
if (leader == event)
|
||||
return 0;
|
||||
|
||||
arm_ni_val_count_event(event, &val);
|
||||
if (!arm_ni_val_count_event(leader, &val))
|
||||
return -EINVAL;
|
||||
|
||||
for_each_sibling_event(sibling, leader) {
|
||||
if (!arm_ni_val_count_event(sibling, &val))
|
||||
return -EINVAL;
|
||||
}
|
||||
return 0;
|
||||
}
|
||||
|
||||
static int arm_ni_event_init(struct perf_event *event)
|
||||
{
|
||||
struct arm_ni_cd *cd = pmu_to_cd(event->pmu);
|
||||
|
||||
if (event->attr.type != event->pmu->type)
|
||||
return -ENOENT;
|
||||
|
||||
if (is_sampling_event(event))
|
||||
return -EINVAL;
|
||||
|
||||
event->cpu = cd->cpu;
|
||||
if (NI_EVENT_TYPE(event) == NI_PMU)
|
||||
return arm_ni_validate_group(event);
|
||||
|
||||
cd_for_each_unit(cd, unit) {
|
||||
if (unit->type == NI_EVENT_TYPE(event) &&
|
||||
unit->id == NI_EVENT_NODEID(event) && unit->ns) {
|
||||
event->hw.config_base = (unsigned long)unit;
|
||||
return arm_ni_validate_group(event);
|
||||
}
|
||||
}
|
||||
return -EINVAL;
|
||||
}
|
||||
|
||||
static u64 arm_ni_read_ccnt(struct arm_ni_cd *cd)
|
||||
{
|
||||
u64 l, u_old, u_new;
|
||||
int retries = 3; /* 1st time unlucky, 2nd improbable, 3rd just broken */
|
||||
|
||||
u_new = readl_relaxed(cd->pmu_base + NI_PMCCNTR_U);
|
||||
do {
|
||||
u_old = u_new;
|
||||
l = readl_relaxed(cd->pmu_base + NI_PMCCNTR_L);
|
||||
u_new = readl_relaxed(cd->pmu_base + NI_PMCCNTR_U);
|
||||
} while (u_new != u_old && --retries);
|
||||
WARN_ON(!retries);
|
||||
|
||||
return (u_new << 32) | l;
|
||||
}
|
||||
|
||||
static void arm_ni_event_read(struct perf_event *event)
|
||||
{
|
||||
struct arm_ni_cd *cd = pmu_to_cd(event->pmu);
|
||||
struct hw_perf_event *hw = &event->hw;
|
||||
u64 count, prev;
|
||||
bool ccnt = hw->idx == NI_CCNT_IDX;
|
||||
|
||||
do {
|
||||
prev = local64_read(&hw->prev_count);
|
||||
if (ccnt)
|
||||
count = arm_ni_read_ccnt(cd);
|
||||
else
|
||||
count = readl_relaxed(cd->pmu_base + NI_PMEVCNTR(hw->idx));
|
||||
} while (local64_cmpxchg(&hw->prev_count, prev, count) != prev);
|
||||
|
||||
count -= prev;
|
||||
if (!ccnt)
|
||||
count = (u32)count;
|
||||
local64_add(count, &event->count);
|
||||
}
|
||||
|
||||
static void arm_ni_event_start(struct perf_event *event, int flags)
|
||||
{
|
||||
struct arm_ni_cd *cd = pmu_to_cd(event->pmu);
|
||||
|
||||
writel_relaxed(1U << event->hw.idx, cd->pmu_base + NI_PMCNTENSET);
|
||||
}
|
||||
|
||||
static void arm_ni_event_stop(struct perf_event *event, int flags)
|
||||
{
|
||||
struct arm_ni_cd *cd = pmu_to_cd(event->pmu);
|
||||
|
||||
writel_relaxed(1U << event->hw.idx, cd->pmu_base + NI_PMCNTENCLR);
|
||||
if (flags & PERF_EF_UPDATE)
|
||||
arm_ni_event_read(event);
|
||||
}
|
||||
|
||||
static void arm_ni_init_ccnt(struct arm_ni_cd *cd)
|
||||
{
|
||||
local64_set(&cd->ccnt->hw.prev_count, S64_MIN);
|
||||
lo_hi_writeq_relaxed(S64_MIN, cd->pmu_base + NI_PMCCNTR_L);
|
||||
}
|
||||
|
||||
static void arm_ni_init_evcnt(struct arm_ni_cd *cd, int idx)
|
||||
{
|
||||
local64_set(&cd->evcnt[idx]->hw.prev_count, S32_MIN);
|
||||
writel_relaxed(S32_MIN, cd->pmu_base + NI_PMEVCNTR(idx));
|
||||
}
|
||||
|
||||
static int arm_ni_event_add(struct perf_event *event, int flags)
|
||||
{
|
||||
struct arm_ni_cd *cd = pmu_to_cd(event->pmu);
|
||||
struct hw_perf_event *hw = &event->hw;
|
||||
struct arm_ni_unit *unit;
|
||||
enum ni_node_type type = NI_EVENT_TYPE(event);
|
||||
u32 reg;
|
||||
|
||||
if (type == NI_PMU) {
|
||||
if (cd->ccnt)
|
||||
return -ENOSPC;
|
||||
hw->idx = NI_CCNT_IDX;
|
||||
cd->ccnt = event;
|
||||
arm_ni_init_ccnt(cd);
|
||||
} else {
|
||||
hw->idx = 0;
|
||||
while (cd->evcnt[hw->idx]) {
|
||||
if (++hw->idx == NI_NUM_COUNTERS)
|
||||
return -ENOSPC;
|
||||
}
|
||||
cd->evcnt[hw->idx] = event;
|
||||
unit = (void *)hw->config_base;
|
||||
unit->event[hw->idx] = NI_EVENT_EVENTID(event);
|
||||
arm_ni_init_evcnt(cd, hw->idx);
|
||||
lo_hi_writeq_relaxed(le64_to_cpu(unit->pmusel), unit->pmusela);
|
||||
|
||||
reg = FIELD_PREP(NI_PMEVTYPER_NODE_TYPE, type) |
|
||||
FIELD_PREP(NI_PMEVTYPER_NODE_ID, NI_EVENT_NODEID(event));
|
||||
writel_relaxed(reg, cd->pmu_base + NI_PMEVTYPER(hw->idx));
|
||||
}
|
||||
if (flags & PERF_EF_START)
|
||||
arm_ni_event_start(event, 0);
|
||||
return 0;
|
||||
}
|
||||
|
||||
static void arm_ni_event_del(struct perf_event *event, int flags)
|
||||
{
|
||||
struct arm_ni_cd *cd = pmu_to_cd(event->pmu);
|
||||
struct hw_perf_event *hw = &event->hw;
|
||||
|
||||
arm_ni_event_stop(event, PERF_EF_UPDATE);
|
||||
|
||||
if (hw->idx == NI_CCNT_IDX)
|
||||
cd->ccnt = NULL;
|
||||
else
|
||||
cd->evcnt[hw->idx] = NULL;
|
||||
}
|
||||
|
||||
static irqreturn_t arm_ni_handle_irq(int irq, void *dev_id)
|
||||
{
|
||||
struct arm_ni_cd *cd = dev_id;
|
||||
irqreturn_t ret = IRQ_NONE;
|
||||
u32 reg = readl_relaxed(cd->pmu_base + NI_PMOVSCLR);
|
||||
|
||||
if (reg & (1U << NI_CCNT_IDX)) {
|
||||
ret = IRQ_HANDLED;
|
||||
if (!(WARN_ON(!cd->ccnt))) {
|
||||
arm_ni_event_read(cd->ccnt);
|
||||
arm_ni_init_ccnt(cd);
|
||||
}
|
||||
}
|
||||
for (int i = 0; i < NI_NUM_COUNTERS; i++) {
|
||||
if (!(reg & (1U << i)))
|
||||
continue;
|
||||
ret = IRQ_HANDLED;
|
||||
if (!(WARN_ON(!cd->evcnt[i]))) {
|
||||
arm_ni_event_read(cd->evcnt[i]);
|
||||
arm_ni_init_evcnt(cd, i);
|
||||
}
|
||||
}
|
||||
writel_relaxed(reg, cd->pmu_base + NI_PMOVSCLR);
|
||||
return ret;
|
||||
}
|
||||
|
||||
static int arm_ni_init_cd(struct arm_ni *ni, struct arm_ni_node *node, u64 res_start)
|
||||
{
|
||||
struct arm_ni_cd *cd = ni->cds + node->id;
|
||||
const char *name;
|
||||
int err;
|
||||
|
||||
cd->id = node->id;
|
||||
cd->num_units = node->num_components;
|
||||
cd->units = devm_kcalloc(ni->dev, cd->num_units, sizeof(*(cd->units)), GFP_KERNEL);
|
||||
if (!cd->units)
|
||||
return -ENOMEM;
|
||||
|
||||
for (int i = 0; i < cd->num_units; i++) {
|
||||
u32 reg = readl_relaxed(node->base + NI_CHILD_PTR(i));
|
||||
void __iomem *unit_base = ni->base + reg;
|
||||
struct arm_ni_unit *unit = cd->units + i;
|
||||
|
||||
reg = readl_relaxed(unit_base + NI_NODE_TYPE);
|
||||
unit->type = FIELD_GET(NI_NODE_TYPE_NODE_TYPE, reg);
|
||||
unit->id = FIELD_GET(NI_NODE_TYPE_NODE_ID, reg);
|
||||
|
||||
switch (unit->type) {
|
||||
case NI_PMU:
|
||||
reg = readl_relaxed(unit_base + NI_PMCFGR);
|
||||
if (!reg) {
|
||||
dev_info(ni->dev, "No access to PMU %d\n", cd->id);
|
||||
devm_kfree(ni->dev, cd->units);
|
||||
return 0;
|
||||
}
|
||||
unit->ns = true;
|
||||
cd->pmu_base = unit_base;
|
||||
break;
|
||||
case NI_ASNI:
|
||||
case NI_AMNI:
|
||||
case NI_HSNI:
|
||||
case NI_HMNI:
|
||||
case NI_PMNI:
|
||||
unit->pmusela = unit_base + NI700_PMUSELA;
|
||||
writel_relaxed(1, unit->pmusela);
|
||||
if (readl_relaxed(unit->pmusela) != 1)
|
||||
dev_info(ni->dev, "No access to node 0x%04x%04x\n", unit->id, unit->type);
|
||||
else
|
||||
unit->ns = true;
|
||||
break;
|
||||
default:
|
||||
/*
|
||||
* e.g. FMU - thankfully bits 3:2 of FMU_ERR_FR0 are RES0 so
|
||||
* can't alias any of the leaf node types we're looking for.
|
||||
*/
|
||||
dev_dbg(ni->dev, "Mystery node 0x%04x%04x\n", unit->id, unit->type);
|
||||
break;
|
||||
}
|
||||
}
|
||||
|
||||
res_start += cd->pmu_base - ni->base;
|
||||
if (!devm_request_mem_region(ni->dev, res_start, SZ_4K, dev_name(ni->dev))) {
|
||||
dev_err(ni->dev, "Failed to request PMU region 0x%llx\n", res_start);
|
||||
return -EBUSY;
|
||||
}
|
||||
|
||||
writel_relaxed(NI_PMCR_RESET_CCNT | NI_PMCR_RESET_EVCNT,
|
||||
cd->pmu_base + NI_PMCR);
|
||||
writel_relaxed(U32_MAX, cd->pmu_base + NI_PMCNTENCLR);
|
||||
writel_relaxed(U32_MAX, cd->pmu_base + NI_PMOVSCLR);
|
||||
writel_relaxed(U32_MAX, cd->pmu_base + NI_PMINTENSET);
|
||||
|
||||
cd->irq = platform_get_irq(to_platform_device(ni->dev), cd->id);
|
||||
if (cd->irq < 0)
|
||||
return cd->irq;
|
||||
|
||||
err = devm_request_irq(ni->dev, cd->irq, arm_ni_handle_irq,
|
||||
IRQF_NOBALANCING | IRQF_NO_THREAD,
|
||||
dev_name(ni->dev), cd);
|
||||
if (err)
|
||||
return err;
|
||||
|
||||
cd->cpu = cpumask_local_spread(0, dev_to_node(ni->dev));
|
||||
cd->pmu = (struct pmu) {
|
||||
.module = THIS_MODULE,
|
||||
.parent = ni->dev,
|
||||
.attr_groups = arm_ni_attr_groups,
|
||||
.capabilities = PERF_PMU_CAP_NO_EXCLUDE,
|
||||
.task_ctx_nr = perf_invalid_context,
|
||||
.pmu_enable = arm_ni_pmu_enable,
|
||||
.pmu_disable = arm_ni_pmu_disable,
|
||||
.event_init = arm_ni_event_init,
|
||||
.add = arm_ni_event_add,
|
||||
.del = arm_ni_event_del,
|
||||
.start = arm_ni_event_start,
|
||||
.stop = arm_ni_event_stop,
|
||||
.read = arm_ni_event_read,
|
||||
};
|
||||
|
||||
name = devm_kasprintf(ni->dev, GFP_KERNEL, "arm_ni_%d_cd_%d", ni->id, cd->id);
|
||||
if (!name)
|
||||
return -ENOMEM;
|
||||
|
||||
err = cpuhp_state_add_instance_nocalls(arm_ni_hp_state, &cd->cpuhp_node);
|
||||
if (err)
|
||||
return err;
|
||||
|
||||
err = perf_pmu_register(&cd->pmu, name, -1);
|
||||
if (err)
|
||||
cpuhp_state_remove_instance_nocalls(arm_ni_hp_state, &cd->cpuhp_node);
|
||||
|
||||
return err;
|
||||
}
|
||||
|
||||
static void arm_ni_probe_domain(void __iomem *base, struct arm_ni_node *node)
|
||||
{
|
||||
u32 reg = readl_relaxed(base + NI_NODE_TYPE);
|
||||
|
||||
node->base = base;
|
||||
node->type = FIELD_GET(NI_NODE_TYPE_NODE_TYPE, reg);
|
||||
node->id = FIELD_GET(NI_NODE_TYPE_NODE_ID, reg);
|
||||
node->num_components = readl_relaxed(base + NI_CHILD_NODE_INFO);
|
||||
}
|
||||
|
||||
static int arm_ni_probe(struct platform_device *pdev)
|
||||
{
|
||||
struct arm_ni_node cfg, vd, pd, cd;
|
||||
struct arm_ni *ni;
|
||||
struct resource *res;
|
||||
void __iomem *base;
|
||||
static atomic_t id;
|
||||
int num_cds;
|
||||
u32 reg, part;
|
||||
|
||||
/*
|
||||
* We want to map the whole configuration space for ease of discovery,
|
||||
* but the PMU pages are the only ones for which we can honestly claim
|
||||
* exclusive ownership, so we'll request them explicitly once found.
|
||||
*/
|
||||
res = platform_get_resource(pdev, IORESOURCE_MEM, 0);
|
||||
base = devm_ioremap(&pdev->dev, res->start, resource_size(res));
|
||||
if (IS_ERR(base))
|
||||
return PTR_ERR(base);
|
||||
|
||||
arm_ni_probe_domain(base, &cfg);
|
||||
if (cfg.type != NI_GLOBAL)
|
||||
return -ENODEV;
|
||||
|
||||
reg = readl_relaxed(cfg.base + NI_PERIPHERAL_ID0);
|
||||
part = FIELD_GET(NI_PIDR0_PART_7_0, reg);
|
||||
reg = readl_relaxed(cfg.base + NI_PERIPHERAL_ID1);
|
||||
part |= FIELD_GET(NI_PIDR1_PART_11_8, reg) << 8;
|
||||
|
||||
switch (part) {
|
||||
case PART_NI_700:
|
||||
case PART_NI_710AE:
|
||||
break;
|
||||
default:
|
||||
dev_WARN(&pdev->dev, "Unknown part number: 0x%03x, this may go badly\n", part);
|
||||
break;
|
||||
}
|
||||
|
||||
num_cds = 0;
|
||||
for (int v = 0; v < cfg.num_components; v++) {
|
||||
reg = readl_relaxed(cfg.base + NI_CHILD_PTR(v));
|
||||
arm_ni_probe_domain(base + reg, &vd);
|
||||
for (int p = 0; p < vd.num_components; p++) {
|
||||
reg = readl_relaxed(vd.base + NI_CHILD_PTR(p));
|
||||
arm_ni_probe_domain(base + reg, &pd);
|
||||
num_cds += pd.num_components;
|
||||
}
|
||||
}
|
||||
|
||||
ni = devm_kzalloc(&pdev->dev, struct_size(ni, cds, num_cds), GFP_KERNEL);
|
||||
if (!ni)
|
||||
return -ENOMEM;
|
||||
|
||||
ni->dev = &pdev->dev;
|
||||
ni->base = base;
|
||||
ni->num_cds = num_cds;
|
||||
ni->part = part;
|
||||
ni->id = atomic_fetch_inc(&id);
|
||||
|
||||
for (int v = 0; v < cfg.num_components; v++) {
|
||||
reg = readl_relaxed(cfg.base + NI_CHILD_PTR(v));
|
||||
arm_ni_probe_domain(base + reg, &vd);
|
||||
for (int p = 0; p < vd.num_components; p++) {
|
||||
reg = readl_relaxed(vd.base + NI_CHILD_PTR(p));
|
||||
arm_ni_probe_domain(base + reg, &pd);
|
||||
for (int c = 0; c < pd.num_components; c++) {
|
||||
int ret;
|
||||
|
||||
reg = readl_relaxed(pd.base + NI_CHILD_PTR(c));
|
||||
arm_ni_probe_domain(base + reg, &cd);
|
||||
ret = arm_ni_init_cd(ni, &cd, res->start);
|
||||
if (ret)
|
||||
return ret;
|
||||
}
|
||||
}
|
||||
}
|
||||
|
||||
return 0;
|
||||
}
|
||||
|
||||
static void arm_ni_remove(struct platform_device *pdev)
|
||||
{
|
||||
struct arm_ni *ni = platform_get_drvdata(pdev);
|
||||
|
||||
for (int i = 0; i < ni->num_cds; i++) {
|
||||
struct arm_ni_cd *cd = ni->cds + i;
|
||||
|
||||
if (!cd->pmu_base)
|
||||
continue;
|
||||
|
||||
writel_relaxed(0, cd->pmu_base + NI_PMCR);
|
||||
writel_relaxed(U32_MAX, cd->pmu_base + NI_PMINTENCLR);
|
||||
perf_pmu_unregister(&cd->pmu);
|
||||
cpuhp_state_remove_instance_nocalls(arm_ni_hp_state, &cd->cpuhp_node);
|
||||
}
|
||||
}
|
||||
|
||||
#ifdef CONFIG_OF
|
||||
static const struct of_device_id arm_ni_of_match[] = {
|
||||
{ .compatible = "arm,ni-700" },
|
||||
{}
|
||||
};
|
||||
MODULE_DEVICE_TABLE(of, arm_ni_of_match);
|
||||
#endif
|
||||
|
||||
#ifdef CONFIG_ACPI
|
||||
static const struct acpi_device_id arm_ni_acpi_match[] = {
|
||||
{ "ARMHCB70" },
|
||||
{}
|
||||
};
|
||||
MODULE_DEVICE_TABLE(acpi, arm_ni_acpi_match);
|
||||
#endif
|
||||
|
||||
static struct platform_driver arm_ni_driver = {
|
||||
.driver = {
|
||||
.name = "arm-ni",
|
||||
.of_match_table = of_match_ptr(arm_ni_of_match),
|
||||
.acpi_match_table = ACPI_PTR(arm_ni_acpi_match),
|
||||
},
|
||||
.probe = arm_ni_probe,
|
||||
.remove = arm_ni_remove,
|
||||
};
|
||||
|
||||
static void arm_ni_pmu_migrate(struct arm_ni_cd *cd, unsigned int cpu)
|
||||
{
|
||||
perf_pmu_migrate_context(&cd->pmu, cd->cpu, cpu);
|
||||
irq_set_affinity(cd->irq, cpumask_of(cpu));
|
||||
cd->cpu = cpu;
|
||||
}
|
||||
|
||||
static int arm_ni_pmu_online_cpu(unsigned int cpu, struct hlist_node *cpuhp_node)
|
||||
{
|
||||
struct arm_ni_cd *cd;
|
||||
int node;
|
||||
|
||||
cd = hlist_entry_safe(cpuhp_node, struct arm_ni_cd, cpuhp_node);
|
||||
node = dev_to_node(cd_to_ni(cd)->dev);
|
||||
if (cpu_to_node(cd->cpu) != node && cpu_to_node(cpu) == node)
|
||||
arm_ni_pmu_migrate(cd, cpu);
|
||||
return 0;
|
||||
}
|
||||
|
||||
static int arm_ni_pmu_offline_cpu(unsigned int cpu, struct hlist_node *cpuhp_node)
|
||||
{
|
||||
struct arm_ni_cd *cd;
|
||||
unsigned int target;
|
||||
int node;
|
||||
|
||||
cd = hlist_entry_safe(cpuhp_node, struct arm_ni_cd, cpuhp_node);
|
||||
if (cpu != cd->cpu)
|
||||
return 0;
|
||||
|
||||
node = dev_to_node(cd_to_ni(cd)->dev);
|
||||
target = cpumask_any_and_but(cpumask_of_node(node), cpu_online_mask, cpu);
|
||||
if (target >= nr_cpu_ids)
|
||||
target = cpumask_any_but(cpu_online_mask, cpu);
|
||||
|
||||
if (target < nr_cpu_ids)
|
||||
arm_ni_pmu_migrate(cd, target);
|
||||
return 0;
|
||||
}
|
||||
|
||||
static int __init arm_ni_init(void)
|
||||
{
|
||||
int ret;
|
||||
|
||||
ret = cpuhp_setup_state_multi(CPUHP_AP_ONLINE_DYN,
|
||||
"perf/arm/ni:online",
|
||||
arm_ni_pmu_online_cpu,
|
||||
arm_ni_pmu_offline_cpu);
|
||||
if (ret < 0)
|
||||
return ret;
|
||||
|
||||
arm_ni_hp_state = ret;
|
||||
|
||||
ret = platform_driver_register(&arm_ni_driver);
|
||||
if (ret)
|
||||
cpuhp_remove_multi_state(arm_ni_hp_state);
|
||||
return ret;
|
||||
}
|
||||
|
||||
static void __exit arm_ni_exit(void)
|
||||
{
|
||||
platform_driver_unregister(&arm_ni_driver);
|
||||
cpuhp_remove_multi_state(arm_ni_hp_state);
|
||||
}
|
||||
|
||||
module_init(arm_ni_init);
|
||||
module_exit(arm_ni_exit);
|
||||
|
||||
MODULE_AUTHOR("Robin Murphy <robin.murphy@arm.com>");
|
||||
MODULE_DESCRIPTION("Arm NI-700 PMU driver");
|
||||
MODULE_LICENSE("GPL v2");
|
Loading…
Reference in New Issue
Block a user