Re: [PATCH v8 8/9] drivers: perf: hisi: Miscellaneous node (MN) event counting in perf

From: Zhangshaokun
Date: Wed Jun 14 2017 - 04:57:39 EST


Hi Mark,

On 2017/6/9 21:26, Mark Rutland wrote:
> On Mon, May 22, 2017 at 08:48:37PM +0800, Shaokun Zhang wrote:
>> 1. Add support to count MN hardware events.
>> 2. MN events are listed in sysfs at /sys/devices/hisi_mn_2/events/
>> The events can be selected as shown in perf list
>> e.g.: For MN_READ_REQUEST event for Super CPU cluster 2 the
>> event format is -e "hisi_mn_2/read_req/"
>> 3. MN PMU does not support counter overflow IRQ in HiP05/06/07, so
>> use hrtimer to poll and avoid counter overflow.
>> 4. The driver supports DT and ACPI mode.
>>
>> Signed-off-by: Shaokun Zhang <zhangshaokun@xxxxxxxxxxxxx>
>> Signed-off-by: Anurup M <anurup.m@xxxxxxxxxx>
>> ---
>> drivers/perf/hisilicon/Makefile | 2 +-
>> drivers/perf/hisilicon/hisi_uncore_mn.c | 468 ++++++++++++++++++++++++++++++++
>> 2 files changed, 469 insertions(+), 1 deletion(-)
>> create mode 100644 drivers/perf/hisilicon/hisi_uncore_mn.c
>
> Largely this looks similar to the L3C patch, and most of the same
> comments apply.
>
> Could you please try to rework this according to those comments which
> apply here too?
>

OK, I will rework the MN module according to those comments as well.

thanks
Shaokun

> Thanks,
> Mark.
>
>>
>> diff --git a/drivers/perf/hisilicon/Makefile b/drivers/perf/hisilicon/Makefile
>> index 0887b56..26b2507 100644
>> --- a/drivers/perf/hisilicon/Makefile
>> +++ b/drivers/perf/hisilicon/Makefile
>> @@ -1 +1 @@
>> -obj-$(CONFIG_HISI_PMU) += djtag.o hisi_uncore_pmu.o hisi_uncore_l3c.o
>> +obj-$(CONFIG_HISI_PMU) += djtag.o hisi_uncore_pmu.o hisi_uncore_l3c.o hisi_uncore_mn.o
>> diff --git a/drivers/perf/hisilicon/hisi_uncore_mn.c b/drivers/perf/hisilicon/hisi_uncore_mn.c
>> new file mode 100644
>> index 0000000..89e28ae
>> --- /dev/null
>> +++ b/drivers/perf/hisilicon/hisi_uncore_mn.c
>> @@ -0,0 +1,468 @@
>> +/*
>> + * HiSilicon SoC MN Hardware event counters support
>> + *
>> + * Copyright (C) 2017 Hisilicon Limited
>> + * Author: Shaokun Zhang <zhangshaokun@xxxxxxxxxxxxx>
>> + *
>> + * This code is based on the uncore PMUs like arm-cci and arm-ccn.
>> + *
>> + * This program is free software; you can redistribute it and/or modify
>> + * it under the terms of the GNU General Public License version 2 as
>> + * published by the Free Software Foundation.
>> + *
>> + * This program is distributed in the hope that it will be useful,
>> + * but WITHOUT ANY WARRANTY; without even the implied warranty of
>> + * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
>> + * GNU General Public License for more details.
>> + *
>> + * You should have received a copy of the GNU General Public License
>> + * along with this program. If not, see <http://www.gnu.org/licenses/>.
>> + */
>> +#include <linux/acpi.h>
>> +#include <linux/bitmap.h>
>> +#include <linux/module.h>
>> +#include <linux/of.h>
>> +#include <linux/of_device.h>
>> +#include <linux/perf_event.h>
>> +#include "hisi_uncore_pmu.h"
>> +
>> +/*
>> + * ARMv8 HiSilicon MN event types.
>> + */
>> +enum hisi_mn_pmu_event_types {
>> + HISI_HWEVENT_MN_EO_BARR_REQ = 0x0,
>> + HISI_HWEVENT_MN_EC_BARR_REQ = 0x01,
>> + HISI_HWEVENT_MN_DVM_OP_REQ = 0x02,
>> + HISI_HWEVENT_MN_DVM_SYNC_REQ = 0x03,
>> + HISI_HWEVENT_MN_READ_REQ = 0x04,
>> + HISI_HWEVENT_MN_WRITE_REQ = 0x05,
>> + HISI_HWEVENT_MN_EVENT_MAX = 0x08,
>> +};
>> +
>> +/*
>> + * ARMv8 HiSilicon Hardware counter Index.
>> + */
>> +enum hisi_mn_pmu_counters {
>> + HISI_IDX_MN_COUNTER0 = 0x0,
>> + HISI_IDX_MN_COUNTER_MAX = 0x4,
>> +};
>> +
>> +#define MN1_EVTYPE_REG_OFF 0x48
>> +#define MN1_EVCTRL_REG_OFF 0x40
>> +#define MN1_CNT0_REG_OFF 0x30
>> +#define MN1_EVENT_EN 0x01
>> +#define MN1_BANK_SELECT 0x01
>> +
>> +#define GET_MODULE_ID(hwmod_data) hwmod_data->module_id
>> +
>> +/*
>> + * Default timer frequency to poll and avoid counter overflow.
>> + * CPU speed = 2.4GHz and the number of CPU cores in a SCCL is 16.
>> + * A single MN event on a CPU core consumes 200 cycles.
>> + * So overflow time = (2^31 * 200) / (16 * 2.4G) which is about 21 seconds
>> + * So to be on the safe side we use a timer interval of 8sec
>> + */
>> +#define MN1_HRTIMER_INTERVAL (8LL * MSEC_PER_SEC)
>> +
>> +struct hisi_mn_data {
>> + struct hisi_djtag_client *client;
>> + u32 module_id;
>> +};
>> +
>> +static inline int hisi_mn_pmu_counter_valid(int idx)
>> +{
>> + return (idx >= HISI_IDX_MN_COUNTER0 && idx < HISI_IDX_MN_COUNTER_MAX);
>> +}
>> +
>> +/* Select the counter register offset from the index */
>> +static inline u32 get_counter_reg_off(int cntr_idx)
>> +{
>> + return (MN1_CNT0_REG_OFF + (cntr_idx * 4));
>> +}
>> +
>> +static u64 hisi_mn_pmu_read_counter(struct hisi_pmu *mn_pmu, int cntr_idx)
>> +{
>> + struct hisi_mn_data *mn_data = mn_pmu->hwmod_data;
>> + struct hisi_djtag_client *client = mn_data->client;
>> + u32 module_id = GET_MODULE_ID(mn_data);
>> + u32 reg_off, value;
>> +
>> + reg_off = get_counter_reg_off(cntr_idx);
>> + hisi_djtag_readreg(module_id, MN1_BANK_SELECT, reg_off,
>> + client, &value);
>> +
>> + return value;
>> +}
>> +
>> +static void hisi_mn_pmu_set_evtype(struct hisi_pmu *mn_pmu, int idx, u32 val)
>> +{
>> + struct hisi_mn_data *mn_data = mn_pmu->hwmod_data;
>> + struct hisi_djtag_client *client = mn_data->client;
>> + u32 module_id = GET_MODULE_ID(mn_data);
>> + u32 event_value, value = 0;
>> +
>> + event_value = (val - HISI_HWEVENT_MN_EO_BARR_REQ);
>> +
>> + /*
>> + * Write the event code in event select register.
>> + * Each byte in the 32-bit event select register is used
>> + * to configure the event code. Each byte corresponds to
>> + * one counter register.
>> + */
>> + val = event_value << (8 * idx);
>> +
>> + hisi_djtag_readreg(module_id, MN1_BANK_SELECT, MN1_EVTYPE_REG_OFF,
>> + client, &value);
>> + value &= ~(0xff << (8 * idx));
>> + value |= val;
>> + hisi_djtag_writereg(module_id, MN1_BANK_SELECT, MN1_EVTYPE_REG_OFF,
>> + value, client);
>> +}
>> +
>> +static void hisi_mn_pmu_clear_evtype(struct hisi_pmu *mn_pmu, int idx)
>> +{
>> + struct hisi_mn_data *mn_data = mn_pmu->hwmod_data;
>> + struct hisi_djtag_client *client = mn_data->client;
>> + u32 module_id = GET_MODULE_ID(mn_data);
>> + u32 value;
>> +
>> + if (!hisi_mn_pmu_counter_valid(idx)) {
>> + dev_err(mn_pmu->dev, "Unsupported event index:%d!\n", idx);
>> + return;
>> + }
>> +
>> + /*
>> + * Clear the event code in the event select register by writing 0xff.
>> + * Each byte in the 32-bit event select register is used to configure
>> + * the event code. Each byte corresponds to one counter register.
>> + */
>> + hisi_djtag_readreg(module_id, MN1_BANK_SELECT, MN1_EVTYPE_REG_OFF,
>> + client, &value);
>> + value &= ~(0xff << (8 * idx));
>> + value |= (0xff << (8 * idx));
>> + hisi_djtag_writereg(module_id, MN1_BANK_SELECT, MN1_EVTYPE_REG_OFF,
>> + value, client);
>> +}
>> +
>> +static void hisi_mn_pmu_write_counter(struct hisi_pmu *mn_pmu,
>> + struct hw_perf_event *hwc, u32 value)
>> +{
>> + struct hisi_mn_data *mn_data = mn_pmu->hwmod_data;
>> + struct hisi_djtag_client *client = mn_data->client;
>> + u32 module_id = GET_MODULE_ID(mn_data);
>> + u32 reg_off;
>> + int idx = GET_CNTR_IDX(hwc);
>> +
>> + reg_off = get_counter_reg_off(idx);
>> + hisi_djtag_writereg(module_id, MN1_BANK_SELECT, reg_off, value, client);
>> +}
>> +
>> +static void hisi_mn_pmu_start_counters(struct hisi_pmu *mn_pmu)
>> +{
>> + struct hisi_mn_data *mn_data = mn_pmu->hwmod_data;
>> + struct hisi_djtag_client *client = mn_data->client;
>> + unsigned long *used_mask = mn_pmu->pmu_events.used_mask;
>> + u32 module_id = GET_MODULE_ID(mn_data);
>> + u32 num_counters = mn_pmu->num_counters;
>> + u32 value;
>> + int enabled = bitmap_weight(used_mask, num_counters);
>> +
>> + if (!enabled)
>> + return;
>> +
>> + /* Set the event_bus_en bit in MN_EVENT_CTRL to start counting */
>> + hisi_djtag_readreg(module_id, MN1_BANK_SELECT, MN1_EVCTRL_REG_OFF,
>> + client, &value);
>> + value |= MN1_EVENT_EN;
>> + hisi_djtag_writereg(module_id, MN1_BANK_SELECT, MN1_EVCTRL_REG_OFF,
>> + value, client);
>> +}
>> +
>> +static void hisi_mn_pmu_stop_counters(struct hisi_pmu *mn_pmu)
>> +{
>> + struct hisi_mn_data *mn_data = mn_pmu->hwmod_data;
>> + struct hisi_djtag_client *client = mn_data->client;
>> + u32 module_id = GET_MODULE_ID(mn_data);
>> + u32 value;
>> +
>> + /*
>> + * Clear the event_bus_en bit in MN_EVENT_CTRL
>> + */
>> + hisi_djtag_readreg(module_id, MN1_BANK_SELECT, MN1_EVCTRL_REG_OFF,
>> + client, &value);
>> + value &= ~(MN1_EVENT_EN);
>> + hisi_djtag_writereg(module_id, MN1_BANK_SELECT, MN1_EVCTRL_REG_OFF,
>> + value, client);
>> +}
>> +
>> +static void hisi_mn_pmu_clear_event_idx(struct hisi_pmu *mn_pmu, int idx)
>> +{
>> + if (!hisi_mn_pmu_counter_valid(idx)) {
>> + dev_err(mn_pmu->dev, "Unsupported event index:%d!\n", idx);
>> + return;
>> + }
>> + clear_bit(idx, mn_pmu->pmu_events.used_mask);
>> +}
>> +
>> +static int hisi_mn_pmu_get_event_idx(struct perf_event *event)
>> +{
>> + struct hisi_pmu *mn_pmu = to_hisi_pmu(event->pmu);
>> + unsigned long *used_mask = mn_pmu->pmu_events.used_mask;
>> + u32 num_counters = mn_pmu->num_counters;
>> + int event_idx;
>> +
>> + event_idx = find_first_zero_bit(used_mask, num_counters);
>> + if (event_idx == num_counters)
>> + return -EAGAIN;
>> +
>> + set_bit(event_idx, used_mask);
>> +
>> + return event_idx;
>> +}
>> +
>> +static const struct of_device_id hisi_mn_pmu_of_match[] = {
>> + { .compatible = "hisilicon,hip05-pmu-mn-v1", },
>> + { .compatible = "hisilicon,hip06-pmu-mn-v1", },
>> + { .compatible = "hisilicon,hip07-pmu-mn-v2", },
>> + {},
>> +};
>> +MODULE_DEVICE_TABLE(of, hisi_mn_pmu_of_match);
>> +
>> +static const struct acpi_device_id hisi_mn_pmu_acpi_match[] = {
>> + { "HISI0221", },
>> + { "HISI0222", },
>> + {},
>> +};
>> +MODULE_DEVICE_TABLE(acpi, hisi_mn_pmu_acpi_match);
>> +
>> +static struct attribute *hisi_mn_pmu_format_attr[] = {
>> + HISI_PMU_FORMAT_ATTR(event, "config:0-7"),
>> + NULL,
>> +};
>> +
>> +static const struct attribute_group hisi_mn_pmu_format_group = {
>> + .name = "format",
>> + .attrs = hisi_mn_pmu_format_attr,
>> +};
>> +
>> +static struct attribute *hisi_mn_pmu_events_attr[] = {
>> + HISI_PMU_EVENT_ATTR_STR(eo_barrier_req, "event=0x0"),
>> + HISI_PMU_EVENT_ATTR_STR(ec_barrier_req, "event=0x01"),
>> + HISI_PMU_EVENT_ATTR_STR(dvm_op_req, "event=0x02"),
>> + HISI_PMU_EVENT_ATTR_STR(dvm_sync_req, "event=0x03"),
>> + HISI_PMU_EVENT_ATTR_STR(read_req, "event=0x04"),
>> + HISI_PMU_EVENT_ATTR_STR(write_req, "event=0x05"),
>> + NULL,
>> +};
>> +
>> +static const struct attribute_group hisi_mn_pmu_events_group = {
>> + .name = "events",
>> + .attrs = hisi_mn_pmu_events_attr,
>> +};
>> +
>> +static struct attribute *hisi_mn_pmu_attrs[] = {
>> + NULL,
>> +};
>> +
>> +static const struct attribute_group hisi_mn_pmu_attr_group = {
>> + .attrs = hisi_mn_pmu_attrs,
>> +};
>> +
>> +static DEVICE_ATTR(cpumask, 0444, hisi_cpumask_sysfs_show, NULL);
>> +
>> +static struct attribute *hisi_mn_pmu_cpumask_attrs[] = {
>> + &dev_attr_cpumask.attr,
>> + NULL,
>> +};
>> +
>> +static const struct attribute_group hisi_mn_pmu_cpumask_attr_group = {
>> + .attrs = hisi_mn_pmu_cpumask_attrs,
>> +};
>> +
>> +static const struct attribute_group *hisi_mn_pmu_pmu_attr_groups[] = {
>> + &hisi_mn_pmu_attr_group,
>> + &hisi_mn_pmu_format_group,
>> + &hisi_mn_pmu_events_group,
>> + &hisi_mn_pmu_cpumask_attr_group,
>> + NULL,
>> +};
>> +
>> +static struct hisi_uncore_ops hisi_uncore_mn_ops = {
>> + .set_evtype = hisi_mn_pmu_set_evtype,
>> + .clear_evtype = hisi_mn_pmu_clear_evtype,
>> + .set_event_period = hisi_uncore_pmu_set_event_period,
>> + .get_event_idx = hisi_mn_pmu_get_event_idx,
>> + .clear_event_idx = hisi_mn_pmu_clear_event_idx,
>> + .event_update = hisi_uncore_pmu_event_update,
>> + .start_counters = hisi_mn_pmu_start_counters,
>> + .stop_counters = hisi_mn_pmu_stop_counters,
>> + .write_counter = hisi_mn_pmu_write_counter,
>> + .read_counter = hisi_mn_pmu_read_counter,
>> +};
>> +
>> +/* Use hrtimer when no IRQ, to poll for avoiding counter overflow */
>> +static void hisi_mn_pmu_hrtimer_init(struct hisi_pmu *mn_pmu)
>> +{
>> + INIT_LIST_HEAD(&mn_pmu->active_list);
>> + mn_pmu->ops->start_hrtimer = hisi_hrtimer_start;
>> + mn_pmu->ops->stop_hrtimer = hisi_hrtimer_stop;
>> + hisi_hrtimer_init(mn_pmu, MN1_HRTIMER_INTERVAL);
>> +}
>> +
>> +static void hisi_mn_pmu_init_data(struct hisi_pmu *mn_pmu,
>> + struct hisi_djtag_client *client)
>> +{
>> + struct device *dev = &client->dev;
>> +
>> + mn_pmu->num_events = HISI_HWEVENT_MN_EVENT_MAX;
>> + mn_pmu->num_counters = HISI_IDX_MN_COUNTER_MAX;
>> + mn_pmu->counter_bits = 32;
>> + mn_pmu->num_active = 0;
>> + mn_pmu->scl_id = hisi_djtag_get_sclid(client);
>> +
>> + mn_pmu->name = kasprintf(GFP_KERNEL, "hisi_mn_pmu_%d", mn_pmu->scl_id);
>> + mn_pmu->ops = &hisi_uncore_mn_ops;
>> + mn_pmu->dev = dev;
>> +
>> + /* Pick one core to use for cpumask attributes */
>> + cpumask_set_cpu(smp_processor_id(), &mn_pmu->cpus);
>> +
>> + /*
>> + * Use poll method to avoid counter overflow as overflow IRQ
>> + * is not supported in v1, v2 hardware.
>> + */
>> + hisi_mn_pmu_hrtimer_init(mn_pmu);
>> +}
>> +
>> +static int hisi_mn_pmu_dev_probe(struct hisi_pmu *mn_pmu,
>> + struct hisi_djtag_client *client)
>> +{
>> + struct hisi_mn_data *mn_data;
>> + struct device *dev = &client->dev;
>> + int ret;
>> +
>> + mn_data = devm_kzalloc(dev, sizeof(*mn_data), GFP_KERNEL);
>> + if (!mn_data)
>> + return -ENOMEM;
>> +
>> + /* Set the djtag Identifier */
>> + mn_data->client = client;
>> + mn_pmu->hwmod_data = mn_data;
>> +
>> + if (dev->of_node) {
>> + const struct of_device_id *of_id;
>> +
>> + of_id = of_match_device(hisi_mn_pmu_of_match, dev);
>> + if (!of_id) {
>> + dev_err(dev, "DT: Match device fail!\n");
>> + return -EINVAL;
>> + }
>> + } else if (ACPI_COMPANION(dev)) {
>> + const struct acpi_device_id *acpi_id;
>> +
>> + acpi_id = acpi_match_device(hisi_mn_pmu_acpi_match, dev);
>> + if (!acpi_id) {
>> + dev_err(dev, "ACPI: Match device fail!\n");
>> + return -EINVAL;
>> + }
>> + } else
>> + return -EINVAL;
>> +
>> + ret = device_property_read_u32(dev, "hisilicon,module-id",
>> + &mn_data->module_id);
>> + if (ret < 0) {
>> + dev_err(dev, "DT: Could not read module-id!\n");
>> + return -EINVAL;
>> + }
>> +
>> + hisi_mn_pmu_init_data(mn_pmu, client);
>> +
>> + return 0;
>> +}
>> +
>> +static int hisi_mn_pmu_probe(struct hisi_djtag_client *client)
>> +{
>> + struct hisi_pmu *mn_pmu;
>> + struct device *dev = &client->dev;
>> + int ret;
>> +
>> + mn_pmu = hisi_pmu_alloc(dev, HISI_IDX_MN_COUNTER_MAX);
>> + if (!mn_pmu)
>> + return -ENOMEM;
>> +
>> + ret = hisi_mn_pmu_dev_probe(mn_pmu, client);
>> + if (ret)
>> + return ret;
>> +
>> + mn_pmu->pmu = (struct pmu) {
>> + .name = mn_pmu->name,
>> + .task_ctx_nr = perf_invalid_context,
>> + .event_init = hisi_uncore_pmu_event_init,
>> + .pmu_enable = hisi_uncore_pmu_enable,
>> + .pmu_disable = hisi_uncore_pmu_disable,
>> + .add = hisi_uncore_pmu_add,
>> + .del = hisi_uncore_pmu_del,
>> + .start = hisi_uncore_pmu_start,
>> + .stop = hisi_uncore_pmu_stop,
>> + .read = hisi_uncore_pmu_read,
>> + .attr_groups = hisi_mn_pmu_pmu_attr_groups,
>> + };
>> +
>> + ret = hisi_uncore_pmu_setup(mn_pmu, mn_pmu->name);
>> + if (ret) {
>> + dev_err(dev, "hisi_uncore_pmu_init FAILED!!\n");
>> + kfree(mn_pmu->name);
>> + return ret;
>> + }
>> +
>> + /* Set the drv data to MN pmu */
>> + dev_set_drvdata(dev, mn_pmu);
>> +
>> + return 0;
>> +}
>> +
>> +static int hisi_mn_pmu_remove(struct hisi_djtag_client *client)
>> +{
>> + struct hisi_pmu *mn_pmu;
>> + struct device *dev = &client->dev;
>> +
>> + mn_pmu = dev_get_drvdata(dev);
>> + perf_pmu_unregister(&mn_pmu->pmu);
>> + kfree(mn_pmu->name);
>> +
>> + return 0;
>> +}
>> +
>> +static struct hisi_djtag_driver hisi_mn_pmu_driver = {
>> + .driver = {
>> + .name = "hisi-mn-pmu",
>> + .of_match_table = hisi_mn_pmu_of_match,
>> + .acpi_match_table = ACPI_PTR(hisi_mn_pmu_acpi_match),
>> + },
>> + .probe = hisi_mn_pmu_probe,
>> + .remove = hisi_mn_pmu_remove,
>> +};
>> +
>> +static int __init hisi_mn_pmu_init(void)
>> +{
>> + int ret;
>> +
>> + ret = hisi_djtag_register_driver(THIS_MODULE, &hisi_mn_pmu_driver);
>> + if (ret < 0) {
>> + pr_err("hisi pmu MN init failed, ret=%d\n", ret);
>> + return ret;
>> + }
>> +
>> + return 0;
>> +}
>> +module_init(hisi_mn_pmu_init);
>> +
>> +static void __exit hisi_mn_pmu_exit(void)
>> +{
>> + hisi_djtag_unregister_driver(&hisi_mn_pmu_driver);
>> +}
>> +module_exit(hisi_mn_pmu_exit);
>> +
>> +MODULE_DESCRIPTION("HiSilicon SoC HIP0x MN PMU driver");
>> +MODULE_LICENSE("GPL v2");
>> +MODULE_AUTHOR("Shaokun Zhang");
>> --
>> 1.9.1
>>
>
> .
>