1. Hip05/06/07 uncore PMU to support different hardware event counters. 2. Hisilicon PMU shall use the DJTAG hardware interface to access hardware event counters and configuration register. 3. Routines to initialize and setup PMU. 4. Routines to enable/disable/add/del/start/stop hardware event counting. 5. Add support to count L3 cache hardware events.
Signed-off-by: Anurup M <anuru...@huawei.com> Signed-off-by: Shaokun Zhang <zhangshao...@hisilicon.com> Signed-off-by: John Garry <john.ga...@huawei.com> --- drivers/perf/hisilicon/Makefile | 2 +- drivers/perf/hisilicon/hisi_uncore_l3c.c | 572 +++++++++++++++++++++++++++++++ drivers/perf/hisilicon/hisi_uncore_pmu.c | 325 ++++++++++++++++++ drivers/perf/hisilicon/hisi_uncore_pmu.h | 107 ++++++ 4 files changed, 1005 insertions(+), 1 deletion(-) create mode 100644 drivers/perf/hisilicon/hisi_uncore_l3c.c create mode 100644 drivers/perf/hisilicon/hisi_uncore_pmu.c create mode 100644 drivers/perf/hisilicon/hisi_uncore_pmu.h diff --git a/drivers/perf/hisilicon/Makefile b/drivers/perf/hisilicon/Makefile index be8f093..0887b56 100644 --- a/drivers/perf/hisilicon/Makefile +++ b/drivers/perf/hisilicon/Makefile @@ -1 +1 @@ -obj-$(CONFIG_HISI_PMU) += djtag.o +obj-$(CONFIG_HISI_PMU) += djtag.o hisi_uncore_pmu.o hisi_uncore_l3c.o diff --git a/drivers/perf/hisilicon/hisi_uncore_l3c.c b/drivers/perf/hisilicon/hisi_uncore_l3c.c new file mode 100644 index 0000000..a59700f --- /dev/null +++ b/drivers/perf/hisilicon/hisi_uncore_l3c.c @@ -0,0 +1,572 @@ +/* + * HiSilicon SoC L3C Hardware event counters support + * + * Copyright (C) 2016 Huawei Technologies Limited + * Author: Anurup M <anuru...@huawei.com> + * + * This code is based on the uncore PMU's like arm-cci and + * arm-ccn. + * + * This program is free software; you can redistribute it and/or modify + * it under the terms of the GNU General Public License version 2 as + * published by the Free Software Foundation. + * + * This program is distributed in the hope that it will be useful, + * but WITHOUT ANY WARRANTY; without even the implied warranty of + * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the + * GNU General Public License for more details. + * + * You should have received a copy of the GNU General Public License + * along with this program. If not, see <http://www.gnu.org/licenses/>. + */ +#include <linux/bitmap.h> +#include <linux/module.h> +#include <linux/of.h> +#include <linux/of_device.h> +#include <linux/perf_event.h> +#include "hisi_uncore_pmu.h" + +/* + * ARMv8 HiSilicon L3C event types. + */ +enum armv8_hisi_l3c_event_types { + HISI_HWEVENT_L3C_READ_ALLOCATE = 0x0, + HISI_HWEVENT_L3C_WRITE_ALLOCATE = 0x01, + HISI_HWEVENT_L3C_READ_NOALLOCATE = 0x02, + HISI_HWEVENT_L3C_WRITE_NOALLOCATE = 0x03, + HISI_HWEVENT_L3C_READ_HIT = 0x04, + HISI_HWEVENT_L3C_WRITE_HIT = 0x05, + HISI_HWEVENT_L3C_EVENT_MAX = 0x15, +}; + +/* + * ARMv8 HiSilicon Hardware counter Index. + */ +enum armv8_hisi_l3c_counters { + HISI_IDX_L3C_COUNTER0 = 0x0, + HISI_IDX_L3C_COUNTER_MAX = 0x8, +}; + +#define HISI_MAX_CFG_L3C_CNTR 0x08 +#define L3C_EVTYPE_REG_OFF 0x140 +#define L3C_EVCTRL_REG_OFF 0x04 +#define L3C_CNT0_REG_OFF 0x170 +#define L3C_EVENT_EN 0x1000000 + +#define GET_MODULE_ID(hwmod_data) hwmod_data->l3c_hwcfg.module_id +#define GET_BANK_SEL(hwmod_data) hwmod_data->l3c_hwcfg.module_id + +struct hisi_l3c_hwcfg { + u32 module_id; + u32 bank_select; + u32 bank_id; +}; + +struct hisi_l3c_data { + struct hisi_djtag_client *client; + DECLARE_BITMAP(event_used_mask, + HISI_MAX_CFG_L3C_CNTR); + struct hisi_l3c_hwcfg l3c_hwcfg; +}; + +struct hisi_l3c_hw_diff { + u32 (*get_bank_id)(u32 module_id, u32 bank_select); +}; + +/* hip05/06 chips L3C bank identifier */ +static u32 l3c_bankid_map_v1[MAX_BANKS] = { + 0x02, 0x01, 0x04, 0x08, +}; + +/* hip07 chip L3C bank identifier */ +static u32 l3c_bankid_map_v2[MAX_BANKS] = { + 0x01, 0x02, 0x03, 0x04, +}; + +/* Return the L3C bank index to use in PMU name */ +static u32 get_l3c_bank_v1(u32 module_id, u32 bank_select) +{ + u32 i; + + /* + * For v1 chip (hip05/06) the index of bank_select + * in the bankid_map gives the bank index. + */ + for (i = 0 ; i < MAX_BANKS; i++) + if (l3c_bankid_map_v1[i] == bank_select) + break; + + return i; +} + +/* Return the L3C bank index to use in PMU name */ +static u32 get_l3c_bank_v2(u32 module_id, u32 bank_select) +{ + u32 i; + + /* + * For v2 chip (hip07) each bank has different + * module ID. So index of module ID in the + * bankid_map gives the bank index. + */ + for (i = 0 ; i < MAX_BANKS; i++) + if (l3c_bankid_map_v2[i] == module_id) + break; + + return i; +} + +static inline int hisi_l3c_counter_valid(int idx) +{ + return (idx >= HISI_IDX_L3C_COUNTER0 && + idx < HISI_IDX_L3C_COUNTER_MAX); +} + +/* Select the counter register offset from the index */ +static inline u32 get_counter_reg_off(int cntr_idx) +{ + return (L3C_CNT0_REG_OFF + (cntr_idx * 4)); +} + +static u32 hisi_l3c_read_counter(struct hisi_l3c_data *l3c_data, + int cntr_idx) +{ + struct hisi_djtag_client *client = l3c_data->client; + u32 module_id = GET_MODULE_ID(l3c_data); + u32 bank_sel = GET_BANK_SEL(l3c_data); + u32 reg_off, value; + + reg_off = get_counter_reg_off(cntr_idx); + + hisi_djtag_readreg(module_id, bank_sel, reg_off, client, &value); + + return value; +} + +static u64 hisi_l3c_event_update(struct perf_event *event, + struct hw_perf_event *hwc, int idx) +{ + struct hisi_pmu *l3c_pmu = to_hisi_pmu(event->pmu); + struct hisi_l3c_data *l3c_data = l3c_pmu->hwmod_data; + u64 delta, prev_raw_count, new_raw_count = 0; + + if (!hisi_l3c_counter_valid(idx)) { + dev_err(l3c_pmu->dev, "Unsupported event index:%d!\n", idx); + return 0; + } + + do { + /* Get count from the L3C bank / submodule */ + new_raw_count += hisi_l3c_read_counter(l3c_data, idx); + prev_raw_count = local64_read(&hwc->prev_count); + + /* + * compute the delta + */ + delta = (new_raw_count - prev_raw_count) & HISI_MAX_PERIOD; + + local64_add(delta, &event->count); + } while (local64_cmpxchg( + &hwc->prev_count, prev_raw_count, new_raw_count) != + prev_raw_count); + + return new_raw_count; +} + +static void hisi_l3c_set_evtype(struct hisi_pmu *l3c_pmu, int idx, u32 val) +{ + struct hisi_l3c_data *l3c_data = l3c_pmu->hwmod_data; + struct hisi_djtag_client *client = l3c_data->client; + u32 module_id = GET_MODULE_ID(l3c_data); + u32 bank_sel = GET_BANK_SEL(l3c_data); + u32 reg_off = L3C_EVTYPE_REG_OFF; + u32 event_value, value = 0; + + event_value = (val - + HISI_HWEVENT_L3C_READ_ALLOCATE); + + /* + * Select the appropriate Event select register(L3C_EVENT_TYPEx). + * There are 2 Event Select registers for the 8 hardware counters. + * For the first 4 hardware counters, the L3C_EVTYPE_REG_OFF is chosen. + * For the next 4 hardware counters, the second register is chosen. + */ + if (idx > 3) + reg_off += 4; + + /* + * Value to write to event select register + * Each byte in the 32 bit select register is used to + * configure the event code. Each byte correspond to a + * counter register to use. + */ + val = event_value << (8 * idx); + + /* + * Set the event in L3C_EVENT_TYPEx Register + * for all L3C banks + */ + hisi_djtag_readreg(module_id, bank_sel, reg_off, + client, &value); + value &= ~(0xff << (8 * idx)); + value |= val; + hisi_djtag_writereg(module_id, bank_sel, reg_off, + value, client); +} + +static void hisi_l3c_clear_evtype(struct hisi_pmu *l3c_pmu, int idx) +{ + struct hisi_l3c_data *l3c_data = l3c_pmu->hwmod_data; + struct hisi_djtag_client *client = l3c_data->client; + u32 module_id = GET_MODULE_ID(l3c_data); + u32 bank_sel = GET_BANK_SEL(l3c_data); + u32 reg_off = L3C_EVTYPE_REG_OFF; + u32 value; + + if (!hisi_l3c_counter_valid(idx)) { + dev_err(l3c_pmu->dev, + "Unsupported event index:%d!\n", idx); + return; + } + + /* + * Clear Counting in L3C event config register. + * Select the appropriate Event select register(L3C_EVENT_TYPEx). + * There are 2 Event Select registers for the 8 hardware counters. + * For the first 4 hardware counters, the L3C_EVTYPE_REG_OFF is chosen. + * For the next 4 hardware counters, the second register is chosen. + */ + if (idx > 3) + reg_off += 4; + + /* + * Clear the event in L3C_EVENT_TYPEx Register + */ + hisi_djtag_readreg(module_id, bank_sel, reg_off, + client, &value); + value &= ~(0xff << (8 * idx)); + value |= (0xff << (8 * idx)); + hisi_djtag_writereg(module_id, bank_sel, reg_off, + value, client); +} + +static u32 hisi_l3c_write_counter(struct hisi_pmu *l3c_pmu, + struct hw_perf_event *hwc, u32 value) +{ + struct hisi_l3c_data *l3c_data = l3c_pmu->hwmod_data; + struct hisi_djtag_client *client = l3c_data->client; + u32 module_id = GET_MODULE_ID(l3c_data); + u32 bank_sel = GET_BANK_SEL(l3c_data); + u32 reg_off; + int idx = GET_CNTR_IDX(hwc); + int ret; + + if (!hisi_l3c_counter_valid(idx)) { + dev_err(l3c_pmu->dev, + "Unsupported event index:%d!\n", idx); + return -EINVAL; + } + + reg_off = get_counter_reg_off(idx); + + ret = hisi_djtag_writereg(module_id, bank_sel, reg_off, + value, client); + if (!ret) + ret = value; + + return ret; +} + +static void hisi_l3c_start_counters(struct hisi_pmu *l3c_pmu) +{ + struct hisi_l3c_data *l3c_data = l3c_pmu->hwmod_data; + struct hisi_djtag_client *client = l3c_data->client; + u32 module_id = GET_MODULE_ID(l3c_data); + u32 bank_sel = GET_BANK_SEL(l3c_data); + u32 reg_off = L3C_EVCTRL_REG_OFF; + u32 eventen = L3C_EVENT_EN; + u32 value; + + int enabled = bitmap_weight(l3c_data->event_used_mask, + l3c_pmu->num_counters); + if (!enabled) + return; + + /* + * Set the event_bus_en bit in L3C AUCNTRL to start counting + * for the L3C bank + */ + hisi_djtag_readreg(module_id, bank_sel, reg_off, + client, &value); + value |= eventen; + hisi_djtag_writereg(module_id, bank_sel, reg_off, + value, client); +} + +static void hisi_l3c_stop_counters(struct hisi_pmu *l3c_pmu) +{ + struct hisi_l3c_data *l3c_data = l3c_pmu->hwmod_data; + struct hisi_djtag_client *client = l3c_data->client; + u32 module_id = GET_MODULE_ID(l3c_data); + u32 bank_sel = GET_BANK_SEL(l3c_data); + u32 reg_off = L3C_EVCTRL_REG_OFF; + u32 eventen = L3C_EVENT_EN; + u32 value; + + /* + * Clear the event_bus_en bit in L3C AUCNTRL + */ + hisi_djtag_readreg(module_id, bank_sel, reg_off, + client, &value); + value &= ~(eventen); + hisi_djtag_writereg(module_id, bank_sel, reg_off, + value, client); +} + +static void hisi_l3c_clear_event_idx(struct hisi_pmu *l3c_pmu, int idx) +{ + struct hisi_l3c_data *l3c_data = l3c_pmu->hwmod_data; + void *bitmap_addr; + + if (!hisi_l3c_counter_valid(idx)) { + dev_err(l3c_pmu->dev, + "Unsupported event index:%d!\n", idx); + return; + } + + bitmap_addr = l3c_data->event_used_mask; + + __clear_bit(idx, bitmap_addr); +} + +static int hisi_l3c_get_event_idx(struct hisi_pmu *l3c_pmu) +{ + struct hisi_l3c_data *l3c_data = l3c_pmu->hwmod_data; + int event_idx; + + event_idx = + find_first_zero_bit( + l3c_data->event_used_mask, + l3c_pmu->num_counters); + + if (event_idx == l3c_pmu->num_counters) + return -EAGAIN; + + __set_bit(event_idx, l3c_data->event_used_mask); + + return event_idx; +} + +/* Handle differences in L3C hw in v1/v2 chips */ +static const struct hisi_l3c_hw_diff l3c_hw_v1 = { + .get_bank_id = get_l3c_bank_v1, +}; + +/* Handle differences in L3C hw in v1/v2 chips */ +static const struct hisi_l3c_hw_diff l3c_hw_v2 = { + .get_bank_id = get_l3c_bank_v2, +}; + +static const struct of_device_id l3c_of_match[] = { + { .compatible = "hisilicon,hisi-pmu-l3c-v1", &l3c_hw_v1}, + { .compatible = "hisilicon,hisi-pmu-l3c-v2", &l3c_hw_v2}, + {}, +}; +MODULE_DEVICE_TABLE(of, l3c_of_match); + +static int init_hisi_l3c_hwcfg_fdt(struct device *dev, + struct hisi_l3c_data *l3c_data) +{ + struct hisi_l3c_hwcfg *l3c_hwcfg = &l3c_data->l3c_hwcfg; + struct device_node *node = dev->of_node; + const struct of_device_id *of_id; + int ret; + + ret = of_property_read_u32_index(node, "module-id", 0, + &l3c_hwcfg->module_id); + if (ret < 0) { + dev_err(dev, "DT: Couldnot read module-id!\n"); + return -EINVAL; + } + + ret = of_property_read_u32_index(node, "module-id", 1, + &l3c_hwcfg->bank_select); + if (ret < 0) { + dev_err(dev, "DT: Couldnot read bank-select!\n"); + return -EINVAL; + } + + of_id = of_match_device(l3c_of_match, dev); + if (of_id) { + const struct hisi_l3c_hw_diff *l3c_hw = of_id->data; + u32 bank_id; + + /* Get the L3C bank index to set the pmu name */ + bank_id = l3c_hw->get_bank_id(l3c_hwcfg->module_id, + l3c_hwcfg->bank_select); + if (bank_id == MAX_BANKS) { + dev_err(dev, "DT: Invalid bank-select!\n"); + return -EINVAL; + } + l3c_hwcfg->bank_id = bank_id; + } + + return 0; +} + +static int init_hisi_l3c_data(struct hisi_pmu *l3c_pmu, + struct hisi_djtag_client *client) +{ + struct hisi_l3c_data *l3c_data = NULL; + struct device *dev = &client->dev; + int ret; + + l3c_data = devm_kzalloc(dev, sizeof(*l3c_data), GFP_KERNEL); + if (!l3c_data) + return -ENOMEM; + + /* Set the djtag Identifier */ + l3c_data->client = client; + + l3c_pmu->hw_events.events = devm_kcalloc(dev, + l3c_pmu->num_counters, + sizeof(*l3c_pmu->hw_events.events), + GFP_KERNEL); + if (!l3c_pmu->hw_events.events) + return -ENOMEM; + + raw_spin_lock_init(&l3c_pmu->hw_events.pmu_lock); + + l3c_pmu->hwmod_data = l3c_data; + + if (dev->of_node) { + ret = init_hisi_l3c_hwcfg_fdt(dev, l3c_data); + if (ret) + return ret; + } + + return 0; +} + +static struct hisi_uncore_ops hisi_uncore_l3c_ops = { + .set_evtype = hisi_l3c_set_evtype, + .clear_evtype = hisi_l3c_clear_evtype, + .set_event_period = hisi_pmu_set_event_period, + .get_event_idx = hisi_l3c_get_event_idx, + .clear_event_idx = hisi_l3c_clear_event_idx, + .event_update = hisi_l3c_event_update, + .start_counters = hisi_l3c_start_counters, + .stop_counters = hisi_l3c_stop_counters, + .write_counter = hisi_l3c_write_counter, +}; + +static int hisi_l3c_pmu_init(struct hisi_pmu *l3c_pmu, + struct hisi_djtag_client *client) +{ + struct device *dev = &client->dev; + struct hisi_l3c_data *l3c_data = l3c_pmu->hwmod_data; + struct hisi_l3c_hwcfg *l3c_hwcfg = &l3c_data->l3c_hwcfg; + + l3c_pmu->num_events = HISI_HWEVENT_L3C_EVENT_MAX; + l3c_pmu->num_counters = HISI_IDX_L3C_COUNTER_MAX; + l3c_pmu->scl_id = hisi_djtag_get_sclid(client); + + l3c_pmu->name = kasprintf(GFP_KERNEL, "hisi_l3c%u_%u", + l3c_hwcfg->bank_id, l3c_pmu->scl_id); + l3c_pmu->ops = &hisi_uncore_l3c_ops; + l3c_pmu->dev = dev; + + /* Pick one core to use for cpumask attributes */ + cpumask_set_cpu(smp_processor_id(), &l3c_pmu->cpu); + + return 0; +} + +static int hisi_pmu_l3c_dev_probe(struct hisi_djtag_client *client) +{ + struct hisi_pmu *l3c_pmu = NULL; + struct device *dev = &client->dev; + int ret; + + l3c_pmu = hisi_pmu_alloc(dev); + if (!l3c_pmu) + return -ENOMEM; + + ret = init_hisi_l3c_data(l3c_pmu, client); + if (ret) + return ret; + + ret = hisi_l3c_pmu_init(l3c_pmu, client); + if (ret) + return ret; + + l3c_pmu->pmu = (struct pmu) { + .name = l3c_pmu->name, + .task_ctx_nr = perf_invalid_context, + .event_init = hisi_uncore_pmu_event_init, + .pmu_enable = hisi_uncore_pmu_enable, + .pmu_disable = hisi_uncore_pmu_disable, + .add = hisi_uncore_pmu_add, + .del = hisi_uncore_pmu_del, + .start = hisi_uncore_pmu_start, + .stop = hisi_uncore_pmu_stop, + .read = hisi_uncore_pmu_read, + }; + + ret = hisi_uncore_pmu_setup(l3c_pmu, l3c_pmu->name); + if (ret) { + dev_err(dev, "hisi_uncore_pmu_init FAILED!!\n"); + return ret; + } + + /* Set the drv data to L3C pmu */ + dev_set_drvdata(dev, l3c_pmu); + + return 0; +} + +static int hisi_pmu_l3c_dev_remove(struct hisi_djtag_client *client) +{ + struct hisi_pmu *l3c_pmu = NULL; + struct device *dev = &client->dev; + + l3c_pmu = dev_get_drvdata(dev); + + perf_pmu_unregister(&l3c_pmu->pmu); + + return 0; +} + +static struct hisi_djtag_driver hisi_pmu_l3c_driver = { + .driver = { + .name = "hisi-pmu-l3c", + .of_match_table = l3c_of_match, + }, + .probe = hisi_pmu_l3c_dev_probe, + .remove = hisi_pmu_l3c_dev_remove, +}; + +static int __init hisi_pmu_l3c_init(void) +{ + int rc; + + rc = hisi_djtag_register_driver(THIS_MODULE, &hisi_pmu_l3c_driver); + if (rc < 0) { + pr_err("hisi pmu L3C init failed, rc=%d\n", rc); + return rc; + } + + return 0; +} +module_init(hisi_pmu_l3c_init); + +static void __exit hisi_pmu_l3c_exit(void) +{ + hisi_djtag_unregister_driver(&hisi_pmu_l3c_driver); + +} +module_exit(hisi_pmu_l3c_exit); + +MODULE_DESCRIPTION("HiSilicon SoC HIP0x L3C PMU driver"); +MODULE_LICENSE("GPL v2"); +MODULE_AUTHOR("Anurup M"); diff --git a/drivers/perf/hisilicon/hisi_uncore_pmu.c b/drivers/perf/hisilicon/hisi_uncore_pmu.c new file mode 100644 index 0000000..950e38d --- /dev/null +++ b/drivers/perf/hisilicon/hisi_uncore_pmu.c @@ -0,0 +1,325 @@ +/* + * HiSilicon SoC Hardware event counters support + * + * Copyright (C) 2016 Huawei Technologies Limited + * Author: Anurup M <anuru...@huawei.com> + * + * This code is based on the uncore PMU's like arm-cci and + * arm-ccn. + * + * This program is free software; you can redistribute it and/or modify + * it under the terms of the GNU General Public License version 2 as + * published by the Free Software Foundation. + * + * This program is distributed in the hope that it will be useful, + * but WITHOUT ANY WARRANTY; without even the implied warranty of + * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the + * GNU General Public License for more details. + * + * You should have received a copy of the GNU General Public License + * along with this program. If not, see <http://www.gnu.org/licenses/>. + */ +#include <linux/bitmap.h> +#include <linux/kernel.h> +#include <linux/module.h> +#include <linux/of.h> +#include <linux/perf_event.h> +#include "hisi_uncore_pmu.h" + +/* djtag read interface - Call djtag driver to access SoC registers */ +int hisi_djtag_readreg(int module_id, int bank, u32 offset, + struct hisi_djtag_client *client, u32 *pvalue) +{ + int ret; + u32 chain_id = 0; + + while (bank != 1) { + bank = (bank >> 0x1); + chain_id++; + } + + ret = hisi_djtag_readl(client, offset, module_id, + chain_id, pvalue); + if (ret) + dev_err(&client->dev, "read failed, ret=%d!\n", ret); + + return ret; +} + +/* djtag write interface - Call djtag driver to access SoC registers */ +int hisi_djtag_writereg(int module_id, int bank, + u32 offset, u32 value, + struct hisi_djtag_client *client) +{ + int ret; + + ret = hisi_djtag_writel(client, offset, module_id, + HISI_DJTAG_MOD_MASK, value); + if (ret) + dev_err(&client->dev, "write failed, ret=%d!\n", ret); + + return ret; +} + +static int pmu_map_event(struct perf_event *event) +{ + return (int)(event->attr.config & HISI_EVTYPE_EVENT); +} + +static int hisi_hw_perf_event_init(struct perf_event *event) +{ + struct hw_perf_event *hwc = &event->hw; + struct hisi_pmu *hisi_pmu = to_hisi_pmu(event->pmu); + struct device *dev = hisi_pmu->dev; + int mapping; + + mapping = pmu_map_event(event); + if (mapping < 0) { + dev_err(dev, "event %x:%llx not supported\n", event->attr.type, + event->attr.config); + return mapping; + } + + /* + * We don't assign an index until we actually place the event onto + * hardware. Use -1 to signify that we haven't decided where to put it + * yet. + */ + hwc->idx = -1; + hwc->config = 0; + hwc->event_base = 0; + + /* For HiSilicon SoC update config_base based on event encoding */ + hwc->config_base = event->attr.config; + + return 0; +} + +int hisi_uncore_pmu_event_init(struct perf_event *event) +{ + int err; + struct hisi_pmu *hisi_pmu; + + if (event->attr.type != event->pmu->type) + return -ENOENT; + + /* + * We do not support sampling as the counters are all + * shared by all CPU cores in a CPU die(SCCL). Also we + * do not support attach to a task(per-process mode) + */ + if (is_sampling_event(event) || event->attach_state & PERF_ATTACH_TASK) + return -EOPNOTSUPP; + + /* counters do not have these bits */ + if (event->attr.exclude_user || + event->attr.exclude_kernel || + event->attr.exclude_host || + event->attr.exclude_guest || + event->attr.exclude_hv || + event->attr.exclude_idle) + return -EINVAL; + + if (event->cpu < 0) + return -EINVAL; + + hisi_pmu = to_hisi_pmu(event->pmu); + event->cpu = cpumask_first(&hisi_pmu->cpu); + + err = hisi_hw_perf_event_init(event); + + return err; +} + +/* + * Enable counter and set the counter to count + * the event that we're interested in. + */ +void hisi_uncore_pmu_enable_event(struct perf_event *event) +{ + struct hw_perf_event *hwc = &event->hw; + struct hisi_pmu *hisi_pmu = to_hisi_pmu(event->pmu); + + /* + * Set event in Event select registers. + */ + if (hisi_pmu->ops->set_evtype) + hisi_pmu->ops->set_evtype(hisi_pmu, GET_CNTR_IDX(hwc), + hwc->config_base); + + /* Enable the hardware event counting */ + if (hisi_pmu->ops->enable_counter) + hisi_pmu->ops->enable_counter(hisi_pmu, GET_CNTR_IDX(hwc)); +} + +/* + * Disable counting and clear the event. + */ +void hisi_uncore_pmu_disable_event(struct perf_event *event) +{ + struct hw_perf_event *hwc = &event->hw; + struct hisi_pmu *hisi_pmu = to_hisi_pmu(event->pmu); + + /* Disable the hardware event counting */ + if (hisi_pmu->ops->disable_counter) + hisi_pmu->ops->disable_counter(hisi_pmu, GET_CNTR_IDX(hwc)); + + /* + * Clear event in Event select registers. + */ + if (hisi_pmu->ops->clear_evtype) + hisi_pmu->ops->clear_evtype(hisi_pmu, GET_CNTR_IDX(hwc)); +} + +void hisi_pmu_set_event_period(struct perf_event *event) +{ + struct hw_perf_event *hwc = &event->hw; + struct hisi_pmu *hisi_pmu = to_hisi_pmu(event->pmu); + + /* + * The Hisilicon PMU counters have a period of 2^32. To account for the + * possiblity of extreme interrupt latency we program for a period of + * half that. Hopefully we can handle the interrupt before another 2^31 + * events occur and the counter overtakes its previous value. + */ + u64 val = 1ULL << 31; + + local64_set(&hwc->prev_count, val); + + /* Write to the hardware event counter */ + hisi_pmu->ops->write_counter(hisi_pmu, hwc, val); +} + +void hisi_uncore_pmu_start(struct perf_event *event, + int pmu_flags) +{ + struct hw_perf_event *hwc = &event->hw; + struct hisi_pmu *hisi_pmu = to_hisi_pmu(event->pmu); + struct hisi_pmu_hw_events *hw_events; + unsigned long flags; + + hw_events = &hisi_pmu->hw_events; + + if (WARN_ON_ONCE(!(hwc->state & PERF_HES_STOPPED))) + return; + + WARN_ON_ONCE(!(hwc->state & PERF_HES_UPTODATE)); + hwc->state = 0; + + if (hisi_pmu->ops->set_event_period) + hisi_pmu->ops->set_event_period(event); + + if (flags & PERF_EF_RELOAD) { + u64 prev_raw_count = local64_read(&hwc->prev_count); + + hisi_pmu->ops->write_counter(hisi_pmu, hwc, + (u32)prev_raw_count); + } + + hisi_uncore_pmu_enable_event(event); + perf_event_update_userpage(event); +} + +void hisi_uncore_pmu_stop(struct perf_event *event, + int flags) +{ + struct hw_perf_event *hwc = &event->hw; + struct hisi_pmu *hisi_pmu = to_hisi_pmu(event->pmu); + + hisi_uncore_pmu_disable_event(event); + WARN_ON_ONCE(hwc->state & PERF_HES_STOPPED); + hwc->state |= PERF_HES_STOPPED; + + if (hwc->state & PERF_HES_UPTODATE) + return; + + /* Read hardware counter and update the Perf counter statistics */ + hisi_pmu->ops->event_update(event, hwc, GET_CNTR_IDX(hwc)); + hwc->state |= PERF_HES_UPTODATE; +} + +int hisi_uncore_pmu_add(struct perf_event *event, int flags) +{ + struct hw_perf_event *hwc = &event->hw; + struct hisi_pmu *hisi_pmu = to_hisi_pmu(event->pmu); + struct hisi_pmu_hw_events *hw_events; + int idx; + + hw_events = &hisi_pmu->hw_events; + + hwc->state = PERF_HES_STOPPED | PERF_HES_UPTODATE; + + /* Get an available counter index for counting. */ + idx = hisi_pmu->ops->get_event_idx(hisi_pmu); + if (idx < 0) + return -EAGAIN; + + event->hw.idx = idx; + hw_events->events[idx] = event; + + if (flags & PERF_EF_START) + hisi_uncore_pmu_start(event, PERF_EF_RELOAD); + + /* Propagate our changes to the userspace mapping. */ + perf_event_update_userpage(event); + + return 0; +} + +void hisi_uncore_pmu_del(struct perf_event *event, int flags) +{ + struct hw_perf_event *hwc = &event->hw; + struct hisi_pmu *hisi_pmu = to_hisi_pmu(event->pmu); + struct hisi_pmu_hw_events *hw_events; + + hw_events = &hisi_pmu->hw_events; + + hisi_uncore_pmu_stop(event, PERF_EF_UPDATE); + + hisi_pmu->ops->clear_event_idx(hisi_pmu, GET_CNTR_IDX(hwc)); + perf_event_update_userpage(event); + hw_events->events[GET_CNTR_IDX(hwc)] = NULL; +} + +struct hisi_pmu *hisi_pmu_alloc(struct device *dev) +{ + struct hisi_pmu *hisi_pmu; + + hisi_pmu = devm_kzalloc(dev, sizeof(*hisi_pmu), GFP_KERNEL); + if (!hisi_pmu) + return ERR_PTR(-ENOMEM); + + return hisi_pmu; +} + +void hisi_uncore_pmu_read(struct perf_event *event) +{ + struct hw_perf_event *hwc = &event->hw; + struct hisi_pmu *hisi_pmu = to_hisi_pmu(event->pmu); + + /* Read hardware counter and update the Perf counter statistics */ + hisi_pmu->ops->event_update(event, hwc, GET_CNTR_IDX(hwc)); +} + +void hisi_uncore_pmu_enable(struct pmu *pmu) +{ + struct hisi_pmu *hisi_pmu = to_hisi_pmu(pmu); + + if (hisi_pmu->ops->start_counters) + hisi_pmu->ops->start_counters(hisi_pmu); +} + +void hisi_uncore_pmu_disable(struct pmu *pmu) +{ + struct hisi_pmu *hisi_pmu = to_hisi_pmu(pmu); + + if (hisi_pmu->ops->stop_counters) + hisi_pmu->ops->start_counters(hisi_pmu); +} + +int hisi_uncore_pmu_setup(struct hisi_pmu *hisi_pmu, + const char *pmu_name) +{ + /* Register the events with perf */ + return perf_pmu_register(&hisi_pmu->pmu, pmu_name, -1); +} diff --git a/drivers/perf/hisilicon/hisi_uncore_pmu.h b/drivers/perf/hisilicon/hisi_uncore_pmu.h new file mode 100644 index 0000000..28b7565 --- /dev/null +++ b/drivers/perf/hisilicon/hisi_uncore_pmu.h @@ -0,0 +1,107 @@ +/* + * HiSilicon SoC Hardware event counters support + * + * Copyright (C) 2016 Huawei Technologies Limited + * Author: Anurup M <anuru...@huawei.com> + * + * This code is based on the uncore PMU's like arm-cci and + * arm-ccn. + * + * This program is free software; you can redistribute it and/or modify + * it under the terms of the GNU General Public License version 2 as + * published by the Free Software Foundation. + * + * This program is distributed in the hope that it will be useful, + * but WITHOUT ANY WARRANTY; without even the implied warranty of + * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the + * GNU General Public License for more details. + * + * You should have received a copy of the GNU General Public License + * along with this program. If not, see <http://www.gnu.org/licenses/>. + */ +#ifndef __HISI_UNCORE_PMU_H__ +#define __HISI_UNCORE_PMU_H__ + +#include <linux/init.h> +#include <linux/interrupt.h> +#include <linux/kernel.h> +#include <linux/platform_device.h> +#include <linux/slab.h> +#include <linux/types.h> +#include <asm/local64.h> +#include "djtag.h" + +#undef pr_fmt +#define pr_fmt(fmt) "hisi_pmu: " fmt + +#define HISI_DJTAG_MOD_MASK (0xFFFF) +#define HISI_CNTR_SCCL_MASK (0xF00) + +#define HISI_EVTYPE_EVENT 0xfff +#define HISI_MAX_PERIOD ((1LLU << 32) - 1) + +#define MAX_BANKS 8 +#define MAX_COUNTERS 30 +#define MAX_UNITS 8 + +#define GET_CNTR_IDX(hwc) (hwc->idx) +#define to_hisi_pmu(c) (container_of(c, struct hisi_pmu, pmu)) + + +struct hisi_pmu; + +struct hisi_uncore_ops { + void (*set_evtype)(struct hisi_pmu *, int, u32); + void (*clear_evtype)(struct hisi_pmu *, int); + void (*set_event_period)(struct perf_event *); + int (*get_event_idx)(struct hisi_pmu *); + void (*clear_event_idx)(struct hisi_pmu *, int); + u64 (*event_update)(struct perf_event *, + struct hw_perf_event *, int); + u32 (*read_counter)(struct hisi_pmu *, int, int); + u32 (*write_counter)(struct hisi_pmu *, + struct hw_perf_event *, u32); + void (*enable_counter)(struct hisi_pmu *, int); + void (*disable_counter)(struct hisi_pmu *, int); + void (*start_counters)(struct hisi_pmu *); + void (*stop_counters)(struct hisi_pmu *); +}; + +struct hisi_pmu_hw_events { + struct perf_event **events; + raw_spinlock_t pmu_lock; +}; + +/* Generic pmu struct for different pmu types */ +struct hisi_pmu { + const char *name; + struct hisi_pmu_hw_events hw_events; + struct hisi_uncore_ops *ops; + struct device *dev; + void *hwmod_data; /* Hardware module specific data */ + cpumask_t cpu; + struct pmu pmu; + u32 scl_id; + int num_counters; + int num_events; +}; + +void hisi_uncore_pmu_read(struct perf_event *event); +void hisi_uncore_pmu_del(struct perf_event *event, int flags); +int hisi_uncore_pmu_add(struct perf_event *event, int flags); +void hisi_uncore_pmu_start(struct perf_event *event, int flags); +void hisi_uncore_pmu_stop(struct perf_event *event, int flags); +void hisi_pmu_set_event_period(struct perf_event *event); +void hisi_uncore_pmu_enable_event(struct perf_event *event); +int hisi_uncore_pmu_setup(struct hisi_pmu *hisi_pmu, const char *pmu_name); +void hisi_uncore_pmu_enable(struct pmu *pmu); +void hisi_uncore_pmu_disable(struct pmu *pmu); +int hisi_uncore_pmu_event_init(struct perf_event *event); +int hisi_djtag_readreg(int module_id, int bank, u32 offset, + struct hisi_djtag_client *client, + u32 *value); +int hisi_djtag_writereg(int module_id, int bank, + u32 offset, u32 value, + struct hisi_djtag_client *client); +struct hisi_pmu *hisi_pmu_alloc(struct device *dev); +#endif /* __HISI_UNCORE_PMU_H__ */ -- 2.1.4