162306a36Sopenharmony_ci// SPDX-License-Identifier: GPL-2.0
262306a36Sopenharmony_ci/* Copyright(c) 2020 Intel Corporation. All rights rsvd. */
362306a36Sopenharmony_ci
462306a36Sopenharmony_ci#include <linux/sched/task.h>
562306a36Sopenharmony_ci#include <linux/io-64-nonatomic-lo-hi.h>
662306a36Sopenharmony_ci#include "idxd.h"
762306a36Sopenharmony_ci#include "perfmon.h"
862306a36Sopenharmony_ci
962306a36Sopenharmony_cistatic ssize_t cpumask_show(struct device *dev, struct device_attribute *attr,
1062306a36Sopenharmony_ci			    char *buf);
1162306a36Sopenharmony_ci
1262306a36Sopenharmony_cistatic cpumask_t		perfmon_dsa_cpu_mask;
1362306a36Sopenharmony_cistatic bool			cpuhp_set_up;
1462306a36Sopenharmony_cistatic enum cpuhp_state		cpuhp_slot;
1562306a36Sopenharmony_ci
1662306a36Sopenharmony_ci/*
1762306a36Sopenharmony_ci * perf userspace reads this attribute to determine which cpus to open
1862306a36Sopenharmony_ci * counters on.  It's connected to perfmon_dsa_cpu_mask, which is
1962306a36Sopenharmony_ci * maintained by the cpu hotplug handlers.
2062306a36Sopenharmony_ci */
2162306a36Sopenharmony_cistatic DEVICE_ATTR_RO(cpumask);
2262306a36Sopenharmony_ci
2362306a36Sopenharmony_cistatic struct attribute *perfmon_cpumask_attrs[] = {
2462306a36Sopenharmony_ci	&dev_attr_cpumask.attr,
2562306a36Sopenharmony_ci	NULL,
2662306a36Sopenharmony_ci};
2762306a36Sopenharmony_ci
2862306a36Sopenharmony_cistatic struct attribute_group cpumask_attr_group = {
2962306a36Sopenharmony_ci	.attrs = perfmon_cpumask_attrs,
3062306a36Sopenharmony_ci};
3162306a36Sopenharmony_ci
3262306a36Sopenharmony_ci/*
3362306a36Sopenharmony_ci * These attributes specify the bits in the config word that the perf
3462306a36Sopenharmony_ci * syscall uses to pass the event ids and categories to perfmon.
3562306a36Sopenharmony_ci */
3662306a36Sopenharmony_ciDEFINE_PERFMON_FORMAT_ATTR(event_category, "config:0-3");
3762306a36Sopenharmony_ciDEFINE_PERFMON_FORMAT_ATTR(event, "config:4-31");
3862306a36Sopenharmony_ci
3962306a36Sopenharmony_ci/*
4062306a36Sopenharmony_ci * These attributes specify the bits in the config1 word that the perf
4162306a36Sopenharmony_ci * syscall uses to pass filter data to perfmon.
4262306a36Sopenharmony_ci */
4362306a36Sopenharmony_ciDEFINE_PERFMON_FORMAT_ATTR(filter_wq, "config1:0-31");
4462306a36Sopenharmony_ciDEFINE_PERFMON_FORMAT_ATTR(filter_tc, "config1:32-39");
4562306a36Sopenharmony_ciDEFINE_PERFMON_FORMAT_ATTR(filter_pgsz, "config1:40-43");
4662306a36Sopenharmony_ciDEFINE_PERFMON_FORMAT_ATTR(filter_sz, "config1:44-51");
4762306a36Sopenharmony_ciDEFINE_PERFMON_FORMAT_ATTR(filter_eng, "config1:52-59");
4862306a36Sopenharmony_ci
4962306a36Sopenharmony_ci#define PERFMON_FILTERS_START	2
5062306a36Sopenharmony_ci#define PERFMON_FILTERS_MAX	5
5162306a36Sopenharmony_ci
5262306a36Sopenharmony_cistatic struct attribute *perfmon_format_attrs[] = {
5362306a36Sopenharmony_ci	&format_attr_idxd_event_category.attr,
5462306a36Sopenharmony_ci	&format_attr_idxd_event.attr,
5562306a36Sopenharmony_ci	&format_attr_idxd_filter_wq.attr,
5662306a36Sopenharmony_ci	&format_attr_idxd_filter_tc.attr,
5762306a36Sopenharmony_ci	&format_attr_idxd_filter_pgsz.attr,
5862306a36Sopenharmony_ci	&format_attr_idxd_filter_sz.attr,
5962306a36Sopenharmony_ci	&format_attr_idxd_filter_eng.attr,
6062306a36Sopenharmony_ci	NULL,
6162306a36Sopenharmony_ci};
6262306a36Sopenharmony_ci
6362306a36Sopenharmony_cistatic struct attribute_group perfmon_format_attr_group = {
6462306a36Sopenharmony_ci	.name = "format",
6562306a36Sopenharmony_ci	.attrs = perfmon_format_attrs,
6662306a36Sopenharmony_ci};
6762306a36Sopenharmony_ci
6862306a36Sopenharmony_cistatic const struct attribute_group *perfmon_attr_groups[] = {
6962306a36Sopenharmony_ci	&perfmon_format_attr_group,
7062306a36Sopenharmony_ci	&cpumask_attr_group,
7162306a36Sopenharmony_ci	NULL,
7262306a36Sopenharmony_ci};
7362306a36Sopenharmony_ci
7462306a36Sopenharmony_cistatic ssize_t cpumask_show(struct device *dev, struct device_attribute *attr,
7562306a36Sopenharmony_ci			    char *buf)
7662306a36Sopenharmony_ci{
7762306a36Sopenharmony_ci	return cpumap_print_to_pagebuf(true, buf, &perfmon_dsa_cpu_mask);
7862306a36Sopenharmony_ci}
7962306a36Sopenharmony_ci
8062306a36Sopenharmony_cistatic bool is_idxd_event(struct idxd_pmu *idxd_pmu, struct perf_event *event)
8162306a36Sopenharmony_ci{
8262306a36Sopenharmony_ci	return &idxd_pmu->pmu == event->pmu;
8362306a36Sopenharmony_ci}
8462306a36Sopenharmony_ci
8562306a36Sopenharmony_cistatic int perfmon_collect_events(struct idxd_pmu *idxd_pmu,
8662306a36Sopenharmony_ci				  struct perf_event *leader,
8762306a36Sopenharmony_ci				  bool do_grp)
8862306a36Sopenharmony_ci{
8962306a36Sopenharmony_ci	struct perf_event *event;
9062306a36Sopenharmony_ci	int n, max_count;
9162306a36Sopenharmony_ci
9262306a36Sopenharmony_ci	max_count = idxd_pmu->n_counters;
9362306a36Sopenharmony_ci	n = idxd_pmu->n_events;
9462306a36Sopenharmony_ci
9562306a36Sopenharmony_ci	if (n >= max_count)
9662306a36Sopenharmony_ci		return -EINVAL;
9762306a36Sopenharmony_ci
9862306a36Sopenharmony_ci	if (is_idxd_event(idxd_pmu, leader)) {
9962306a36Sopenharmony_ci		idxd_pmu->event_list[n] = leader;
10062306a36Sopenharmony_ci		idxd_pmu->event_list[n]->hw.idx = n;
10162306a36Sopenharmony_ci		n++;
10262306a36Sopenharmony_ci	}
10362306a36Sopenharmony_ci
10462306a36Sopenharmony_ci	if (!do_grp)
10562306a36Sopenharmony_ci		return n;
10662306a36Sopenharmony_ci
10762306a36Sopenharmony_ci	for_each_sibling_event(event, leader) {
10862306a36Sopenharmony_ci		if (!is_idxd_event(idxd_pmu, event) ||
10962306a36Sopenharmony_ci		    event->state <= PERF_EVENT_STATE_OFF)
11062306a36Sopenharmony_ci			continue;
11162306a36Sopenharmony_ci
11262306a36Sopenharmony_ci		if (n >= max_count)
11362306a36Sopenharmony_ci			return -EINVAL;
11462306a36Sopenharmony_ci
11562306a36Sopenharmony_ci		idxd_pmu->event_list[n] = event;
11662306a36Sopenharmony_ci		idxd_pmu->event_list[n]->hw.idx = n;
11762306a36Sopenharmony_ci		n++;
11862306a36Sopenharmony_ci	}
11962306a36Sopenharmony_ci
12062306a36Sopenharmony_ci	return n;
12162306a36Sopenharmony_ci}
12262306a36Sopenharmony_ci
12362306a36Sopenharmony_cistatic void perfmon_assign_hw_event(struct idxd_pmu *idxd_pmu,
12462306a36Sopenharmony_ci				    struct perf_event *event, int idx)
12562306a36Sopenharmony_ci{
12662306a36Sopenharmony_ci	struct idxd_device *idxd = idxd_pmu->idxd;
12762306a36Sopenharmony_ci	struct hw_perf_event *hwc = &event->hw;
12862306a36Sopenharmony_ci
12962306a36Sopenharmony_ci	hwc->idx = idx;
13062306a36Sopenharmony_ci	hwc->config_base = ioread64(CNTRCFG_REG(idxd, idx));
13162306a36Sopenharmony_ci	hwc->event_base = ioread64(CNTRCFG_REG(idxd, idx));
13262306a36Sopenharmony_ci}
13362306a36Sopenharmony_ci
13462306a36Sopenharmony_cistatic int perfmon_assign_event(struct idxd_pmu *idxd_pmu,
13562306a36Sopenharmony_ci				struct perf_event *event)
13662306a36Sopenharmony_ci{
13762306a36Sopenharmony_ci	int i;
13862306a36Sopenharmony_ci
13962306a36Sopenharmony_ci	for (i = 0; i < IDXD_PMU_EVENT_MAX; i++)
14062306a36Sopenharmony_ci		if (!test_and_set_bit(i, idxd_pmu->used_mask))
14162306a36Sopenharmony_ci			return i;
14262306a36Sopenharmony_ci
14362306a36Sopenharmony_ci	return -EINVAL;
14462306a36Sopenharmony_ci}
14562306a36Sopenharmony_ci
14662306a36Sopenharmony_ci/*
14762306a36Sopenharmony_ci * Check whether there are enough counters to satisfy that all the
14862306a36Sopenharmony_ci * events in the group can actually be scheduled at the same time.
14962306a36Sopenharmony_ci *
15062306a36Sopenharmony_ci * To do this, create a fake idxd_pmu object so the event collection
15162306a36Sopenharmony_ci * and assignment functions can be used without affecting the internal
15262306a36Sopenharmony_ci * state of the real idxd_pmu object.
15362306a36Sopenharmony_ci */
15462306a36Sopenharmony_cistatic int perfmon_validate_group(struct idxd_pmu *pmu,
15562306a36Sopenharmony_ci				  struct perf_event *event)
15662306a36Sopenharmony_ci{
15762306a36Sopenharmony_ci	struct perf_event *leader = event->group_leader;
15862306a36Sopenharmony_ci	struct idxd_pmu *fake_pmu;
15962306a36Sopenharmony_ci	int i, ret = 0, n, idx;
16062306a36Sopenharmony_ci
16162306a36Sopenharmony_ci	fake_pmu = kzalloc(sizeof(*fake_pmu), GFP_KERNEL);
16262306a36Sopenharmony_ci	if (!fake_pmu)
16362306a36Sopenharmony_ci		return -ENOMEM;
16462306a36Sopenharmony_ci
16562306a36Sopenharmony_ci	fake_pmu->pmu.name = pmu->pmu.name;
16662306a36Sopenharmony_ci	fake_pmu->n_counters = pmu->n_counters;
16762306a36Sopenharmony_ci
16862306a36Sopenharmony_ci	n = perfmon_collect_events(fake_pmu, leader, true);
16962306a36Sopenharmony_ci	if (n < 0) {
17062306a36Sopenharmony_ci		ret = n;
17162306a36Sopenharmony_ci		goto out;
17262306a36Sopenharmony_ci	}
17362306a36Sopenharmony_ci
17462306a36Sopenharmony_ci	fake_pmu->n_events = n;
17562306a36Sopenharmony_ci	n = perfmon_collect_events(fake_pmu, event, false);
17662306a36Sopenharmony_ci	if (n < 0) {
17762306a36Sopenharmony_ci		ret = n;
17862306a36Sopenharmony_ci		goto out;
17962306a36Sopenharmony_ci	}
18062306a36Sopenharmony_ci
18162306a36Sopenharmony_ci	fake_pmu->n_events = n;
18262306a36Sopenharmony_ci
18362306a36Sopenharmony_ci	for (i = 0; i < n; i++) {
18462306a36Sopenharmony_ci		event = fake_pmu->event_list[i];
18562306a36Sopenharmony_ci
18662306a36Sopenharmony_ci		idx = perfmon_assign_event(fake_pmu, event);
18762306a36Sopenharmony_ci		if (idx < 0) {
18862306a36Sopenharmony_ci			ret = idx;
18962306a36Sopenharmony_ci			goto out;
19062306a36Sopenharmony_ci		}
19162306a36Sopenharmony_ci	}
19262306a36Sopenharmony_ciout:
19362306a36Sopenharmony_ci	kfree(fake_pmu);
19462306a36Sopenharmony_ci
19562306a36Sopenharmony_ci	return ret;
19662306a36Sopenharmony_ci}
19762306a36Sopenharmony_ci
19862306a36Sopenharmony_cistatic int perfmon_pmu_event_init(struct perf_event *event)
19962306a36Sopenharmony_ci{
20062306a36Sopenharmony_ci	struct idxd_device *idxd;
20162306a36Sopenharmony_ci	int ret = 0;
20262306a36Sopenharmony_ci
20362306a36Sopenharmony_ci	idxd = event_to_idxd(event);
20462306a36Sopenharmony_ci	event->hw.idx = -1;
20562306a36Sopenharmony_ci
20662306a36Sopenharmony_ci	if (event->attr.type != event->pmu->type)
20762306a36Sopenharmony_ci		return -ENOENT;
20862306a36Sopenharmony_ci
20962306a36Sopenharmony_ci	/* sampling not supported */
21062306a36Sopenharmony_ci	if (event->attr.sample_period)
21162306a36Sopenharmony_ci		return -EINVAL;
21262306a36Sopenharmony_ci
21362306a36Sopenharmony_ci	if (event->cpu < 0)
21462306a36Sopenharmony_ci		return -EINVAL;
21562306a36Sopenharmony_ci
21662306a36Sopenharmony_ci	if (event->pmu != &idxd->idxd_pmu->pmu)
21762306a36Sopenharmony_ci		return -EINVAL;
21862306a36Sopenharmony_ci
21962306a36Sopenharmony_ci	event->hw.event_base = ioread64(PERFMON_TABLE_OFFSET(idxd));
22062306a36Sopenharmony_ci	event->cpu = idxd->idxd_pmu->cpu;
22162306a36Sopenharmony_ci	event->hw.config = event->attr.config;
22262306a36Sopenharmony_ci
22362306a36Sopenharmony_ci	if (event->group_leader != event)
22462306a36Sopenharmony_ci		 /* non-group events have themselves as leader */
22562306a36Sopenharmony_ci		ret = perfmon_validate_group(idxd->idxd_pmu, event);
22662306a36Sopenharmony_ci
22762306a36Sopenharmony_ci	return ret;
22862306a36Sopenharmony_ci}
22962306a36Sopenharmony_ci
23062306a36Sopenharmony_cistatic inline u64 perfmon_pmu_read_counter(struct perf_event *event)
23162306a36Sopenharmony_ci{
23262306a36Sopenharmony_ci	struct hw_perf_event *hwc = &event->hw;
23362306a36Sopenharmony_ci	struct idxd_device *idxd;
23462306a36Sopenharmony_ci	int cntr = hwc->idx;
23562306a36Sopenharmony_ci
23662306a36Sopenharmony_ci	idxd = event_to_idxd(event);
23762306a36Sopenharmony_ci
23862306a36Sopenharmony_ci	return ioread64(CNTRDATA_REG(idxd, cntr));
23962306a36Sopenharmony_ci}
24062306a36Sopenharmony_ci
24162306a36Sopenharmony_cistatic void perfmon_pmu_event_update(struct perf_event *event)
24262306a36Sopenharmony_ci{
24362306a36Sopenharmony_ci	struct idxd_device *idxd = event_to_idxd(event);
24462306a36Sopenharmony_ci	u64 prev_raw_count, new_raw_count, delta, p, n;
24562306a36Sopenharmony_ci	int shift = 64 - idxd->idxd_pmu->counter_width;
24662306a36Sopenharmony_ci	struct hw_perf_event *hwc = &event->hw;
24762306a36Sopenharmony_ci
24862306a36Sopenharmony_ci	prev_raw_count = local64_read(&hwc->prev_count);
24962306a36Sopenharmony_ci	do {
25062306a36Sopenharmony_ci		new_raw_count = perfmon_pmu_read_counter(event);
25162306a36Sopenharmony_ci	} while (!local64_try_cmpxchg(&hwc->prev_count,
25262306a36Sopenharmony_ci				      &prev_raw_count, new_raw_count));
25362306a36Sopenharmony_ci	n = (new_raw_count << shift);
25462306a36Sopenharmony_ci	p = (prev_raw_count << shift);
25562306a36Sopenharmony_ci
25662306a36Sopenharmony_ci	delta = ((n - p) >> shift);
25762306a36Sopenharmony_ci
25862306a36Sopenharmony_ci	local64_add(delta, &event->count);
25962306a36Sopenharmony_ci}
26062306a36Sopenharmony_ci
26162306a36Sopenharmony_civoid perfmon_counter_overflow(struct idxd_device *idxd)
26262306a36Sopenharmony_ci{
26362306a36Sopenharmony_ci	int i, n_counters, max_loop = OVERFLOW_SIZE;
26462306a36Sopenharmony_ci	struct perf_event *event;
26562306a36Sopenharmony_ci	unsigned long ovfstatus;
26662306a36Sopenharmony_ci
26762306a36Sopenharmony_ci	n_counters = min(idxd->idxd_pmu->n_counters, OVERFLOW_SIZE);
26862306a36Sopenharmony_ci
26962306a36Sopenharmony_ci	ovfstatus = ioread32(OVFSTATUS_REG(idxd));
27062306a36Sopenharmony_ci
27162306a36Sopenharmony_ci	/*
27262306a36Sopenharmony_ci	 * While updating overflowed counters, other counters behind
27362306a36Sopenharmony_ci	 * them could overflow and be missed in a given pass.
27462306a36Sopenharmony_ci	 * Normally this could happen at most n_counters times, but in
27562306a36Sopenharmony_ci	 * theory a tiny counter width could result in continual
27662306a36Sopenharmony_ci	 * overflows and endless looping.  max_loop provides a
27762306a36Sopenharmony_ci	 * failsafe in that highly unlikely case.
27862306a36Sopenharmony_ci	 */
27962306a36Sopenharmony_ci	while (ovfstatus && max_loop--) {
28062306a36Sopenharmony_ci		/* Figure out which counter(s) overflowed */
28162306a36Sopenharmony_ci		for_each_set_bit(i, &ovfstatus, n_counters) {
28262306a36Sopenharmony_ci			unsigned long ovfstatus_clear = 0;
28362306a36Sopenharmony_ci
28462306a36Sopenharmony_ci			/* Update event->count for overflowed counter */
28562306a36Sopenharmony_ci			event = idxd->idxd_pmu->event_list[i];
28662306a36Sopenharmony_ci			perfmon_pmu_event_update(event);
28762306a36Sopenharmony_ci			/* Writing 1 to OVFSTATUS bit clears it */
28862306a36Sopenharmony_ci			set_bit(i, &ovfstatus_clear);
28962306a36Sopenharmony_ci			iowrite32(ovfstatus_clear, OVFSTATUS_REG(idxd));
29062306a36Sopenharmony_ci		}
29162306a36Sopenharmony_ci
29262306a36Sopenharmony_ci		ovfstatus = ioread32(OVFSTATUS_REG(idxd));
29362306a36Sopenharmony_ci	}
29462306a36Sopenharmony_ci
29562306a36Sopenharmony_ci	/*
29662306a36Sopenharmony_ci	 * Should never happen.  If so, it means a counter(s) looped
29762306a36Sopenharmony_ci	 * around twice while this handler was running.
29862306a36Sopenharmony_ci	 */
29962306a36Sopenharmony_ci	WARN_ON_ONCE(ovfstatus);
30062306a36Sopenharmony_ci}
30162306a36Sopenharmony_ci
30262306a36Sopenharmony_cistatic inline void perfmon_reset_config(struct idxd_device *idxd)
30362306a36Sopenharmony_ci{
30462306a36Sopenharmony_ci	iowrite32(CONFIG_RESET, PERFRST_REG(idxd));
30562306a36Sopenharmony_ci	iowrite32(0, OVFSTATUS_REG(idxd));
30662306a36Sopenharmony_ci	iowrite32(0, PERFFRZ_REG(idxd));
30762306a36Sopenharmony_ci}
30862306a36Sopenharmony_ci
30962306a36Sopenharmony_cistatic inline void perfmon_reset_counters(struct idxd_device *idxd)
31062306a36Sopenharmony_ci{
31162306a36Sopenharmony_ci	iowrite32(CNTR_RESET, PERFRST_REG(idxd));
31262306a36Sopenharmony_ci}
31362306a36Sopenharmony_ci
31462306a36Sopenharmony_cistatic inline void perfmon_reset(struct idxd_device *idxd)
31562306a36Sopenharmony_ci{
31662306a36Sopenharmony_ci	perfmon_reset_config(idxd);
31762306a36Sopenharmony_ci	perfmon_reset_counters(idxd);
31862306a36Sopenharmony_ci}
31962306a36Sopenharmony_ci
32062306a36Sopenharmony_cistatic void perfmon_pmu_event_start(struct perf_event *event, int mode)
32162306a36Sopenharmony_ci{
32262306a36Sopenharmony_ci	u32 flt_wq, flt_tc, flt_pg_sz, flt_xfer_sz, flt_eng = 0;
32362306a36Sopenharmony_ci	u64 cntr_cfg, cntrdata, event_enc, event_cat = 0;
32462306a36Sopenharmony_ci	struct hw_perf_event *hwc = &event->hw;
32562306a36Sopenharmony_ci	union filter_cfg flt_cfg;
32662306a36Sopenharmony_ci	union event_cfg event_cfg;
32762306a36Sopenharmony_ci	struct idxd_device *idxd;
32862306a36Sopenharmony_ci	int cntr;
32962306a36Sopenharmony_ci
33062306a36Sopenharmony_ci	idxd = event_to_idxd(event);
33162306a36Sopenharmony_ci
33262306a36Sopenharmony_ci	event->hw.idx = hwc->idx;
33362306a36Sopenharmony_ci	cntr = hwc->idx;
33462306a36Sopenharmony_ci
33562306a36Sopenharmony_ci	/* Obtain event category and event value from user space */
33662306a36Sopenharmony_ci	event_cfg.val = event->attr.config;
33762306a36Sopenharmony_ci	flt_cfg.val = event->attr.config1;
33862306a36Sopenharmony_ci	event_cat = event_cfg.event_cat;
33962306a36Sopenharmony_ci	event_enc = event_cfg.event_enc;
34062306a36Sopenharmony_ci
34162306a36Sopenharmony_ci	/* Obtain filter configuration from user space */
34262306a36Sopenharmony_ci	flt_wq = flt_cfg.wq;
34362306a36Sopenharmony_ci	flt_tc = flt_cfg.tc;
34462306a36Sopenharmony_ci	flt_pg_sz = flt_cfg.pg_sz;
34562306a36Sopenharmony_ci	flt_xfer_sz = flt_cfg.xfer_sz;
34662306a36Sopenharmony_ci	flt_eng = flt_cfg.eng;
34762306a36Sopenharmony_ci
34862306a36Sopenharmony_ci	if (flt_wq && test_bit(FLT_WQ, &idxd->idxd_pmu->supported_filters))
34962306a36Sopenharmony_ci		iowrite32(flt_wq, FLTCFG_REG(idxd, cntr, FLT_WQ));
35062306a36Sopenharmony_ci	if (flt_tc && test_bit(FLT_TC, &idxd->idxd_pmu->supported_filters))
35162306a36Sopenharmony_ci		iowrite32(flt_tc, FLTCFG_REG(idxd, cntr, FLT_TC));
35262306a36Sopenharmony_ci	if (flt_pg_sz && test_bit(FLT_PG_SZ, &idxd->idxd_pmu->supported_filters))
35362306a36Sopenharmony_ci		iowrite32(flt_pg_sz, FLTCFG_REG(idxd, cntr, FLT_PG_SZ));
35462306a36Sopenharmony_ci	if (flt_xfer_sz && test_bit(FLT_XFER_SZ, &idxd->idxd_pmu->supported_filters))
35562306a36Sopenharmony_ci		iowrite32(flt_xfer_sz, FLTCFG_REG(idxd, cntr, FLT_XFER_SZ));
35662306a36Sopenharmony_ci	if (flt_eng && test_bit(FLT_ENG, &idxd->idxd_pmu->supported_filters))
35762306a36Sopenharmony_ci		iowrite32(flt_eng, FLTCFG_REG(idxd, cntr, FLT_ENG));
35862306a36Sopenharmony_ci
35962306a36Sopenharmony_ci	/* Read the start value */
36062306a36Sopenharmony_ci	cntrdata = ioread64(CNTRDATA_REG(idxd, cntr));
36162306a36Sopenharmony_ci	local64_set(&event->hw.prev_count, cntrdata);
36262306a36Sopenharmony_ci
36362306a36Sopenharmony_ci	/* Set counter to event/category */
36462306a36Sopenharmony_ci	cntr_cfg = event_cat << CNTRCFG_CATEGORY_SHIFT;
36562306a36Sopenharmony_ci	cntr_cfg |= event_enc << CNTRCFG_EVENT_SHIFT;
36662306a36Sopenharmony_ci	/* Set interrupt on overflow and counter enable bits */
36762306a36Sopenharmony_ci	cntr_cfg |= (CNTRCFG_IRQ_OVERFLOW | CNTRCFG_ENABLE);
36862306a36Sopenharmony_ci
36962306a36Sopenharmony_ci	iowrite64(cntr_cfg, CNTRCFG_REG(idxd, cntr));
37062306a36Sopenharmony_ci}
37162306a36Sopenharmony_ci
37262306a36Sopenharmony_cistatic void perfmon_pmu_event_stop(struct perf_event *event, int mode)
37362306a36Sopenharmony_ci{
37462306a36Sopenharmony_ci	struct hw_perf_event *hwc = &event->hw;
37562306a36Sopenharmony_ci	struct idxd_device *idxd;
37662306a36Sopenharmony_ci	int i, cntr = hwc->idx;
37762306a36Sopenharmony_ci	u64 cntr_cfg;
37862306a36Sopenharmony_ci
37962306a36Sopenharmony_ci	idxd = event_to_idxd(event);
38062306a36Sopenharmony_ci
38162306a36Sopenharmony_ci	/* remove this event from event list */
38262306a36Sopenharmony_ci	for (i = 0; i < idxd->idxd_pmu->n_events; i++) {
38362306a36Sopenharmony_ci		if (event != idxd->idxd_pmu->event_list[i])
38462306a36Sopenharmony_ci			continue;
38562306a36Sopenharmony_ci
38662306a36Sopenharmony_ci		for (++i; i < idxd->idxd_pmu->n_events; i++)
38762306a36Sopenharmony_ci			idxd->idxd_pmu->event_list[i - 1] = idxd->idxd_pmu->event_list[i];
38862306a36Sopenharmony_ci		--idxd->idxd_pmu->n_events;
38962306a36Sopenharmony_ci		break;
39062306a36Sopenharmony_ci	}
39162306a36Sopenharmony_ci
39262306a36Sopenharmony_ci	cntr_cfg = ioread64(CNTRCFG_REG(idxd, cntr));
39362306a36Sopenharmony_ci	cntr_cfg &= ~CNTRCFG_ENABLE;
39462306a36Sopenharmony_ci	iowrite64(cntr_cfg, CNTRCFG_REG(idxd, cntr));
39562306a36Sopenharmony_ci
39662306a36Sopenharmony_ci	if (mode == PERF_EF_UPDATE)
39762306a36Sopenharmony_ci		perfmon_pmu_event_update(event);
39862306a36Sopenharmony_ci
39962306a36Sopenharmony_ci	event->hw.idx = -1;
40062306a36Sopenharmony_ci	clear_bit(cntr, idxd->idxd_pmu->used_mask);
40162306a36Sopenharmony_ci}
40262306a36Sopenharmony_ci
40362306a36Sopenharmony_cistatic void perfmon_pmu_event_del(struct perf_event *event, int mode)
40462306a36Sopenharmony_ci{
40562306a36Sopenharmony_ci	perfmon_pmu_event_stop(event, PERF_EF_UPDATE);
40662306a36Sopenharmony_ci}
40762306a36Sopenharmony_ci
40862306a36Sopenharmony_cistatic int perfmon_pmu_event_add(struct perf_event *event, int flags)
40962306a36Sopenharmony_ci{
41062306a36Sopenharmony_ci	struct idxd_device *idxd = event_to_idxd(event);
41162306a36Sopenharmony_ci	struct idxd_pmu *idxd_pmu = idxd->idxd_pmu;
41262306a36Sopenharmony_ci	struct hw_perf_event *hwc = &event->hw;
41362306a36Sopenharmony_ci	int idx, n;
41462306a36Sopenharmony_ci
41562306a36Sopenharmony_ci	n = perfmon_collect_events(idxd_pmu, event, false);
41662306a36Sopenharmony_ci	if (n < 0)
41762306a36Sopenharmony_ci		return n;
41862306a36Sopenharmony_ci
41962306a36Sopenharmony_ci	hwc->state = PERF_HES_UPTODATE | PERF_HES_STOPPED;
42062306a36Sopenharmony_ci	if (!(flags & PERF_EF_START))
42162306a36Sopenharmony_ci		hwc->state |= PERF_HES_ARCH;
42262306a36Sopenharmony_ci
42362306a36Sopenharmony_ci	idx = perfmon_assign_event(idxd_pmu, event);
42462306a36Sopenharmony_ci	if (idx < 0)
42562306a36Sopenharmony_ci		return idx;
42662306a36Sopenharmony_ci
42762306a36Sopenharmony_ci	perfmon_assign_hw_event(idxd_pmu, event, idx);
42862306a36Sopenharmony_ci
42962306a36Sopenharmony_ci	if (flags & PERF_EF_START)
43062306a36Sopenharmony_ci		perfmon_pmu_event_start(event, 0);
43162306a36Sopenharmony_ci
43262306a36Sopenharmony_ci	idxd_pmu->n_events = n;
43362306a36Sopenharmony_ci
43462306a36Sopenharmony_ci	return 0;
43562306a36Sopenharmony_ci}
43662306a36Sopenharmony_ci
43762306a36Sopenharmony_cistatic void enable_perfmon_pmu(struct idxd_device *idxd)
43862306a36Sopenharmony_ci{
43962306a36Sopenharmony_ci	iowrite32(COUNTER_UNFREEZE, PERFFRZ_REG(idxd));
44062306a36Sopenharmony_ci}
44162306a36Sopenharmony_ci
44262306a36Sopenharmony_cistatic void disable_perfmon_pmu(struct idxd_device *idxd)
44362306a36Sopenharmony_ci{
44462306a36Sopenharmony_ci	iowrite32(COUNTER_FREEZE, PERFFRZ_REG(idxd));
44562306a36Sopenharmony_ci}
44662306a36Sopenharmony_ci
44762306a36Sopenharmony_cistatic void perfmon_pmu_enable(struct pmu *pmu)
44862306a36Sopenharmony_ci{
44962306a36Sopenharmony_ci	struct idxd_device *idxd = pmu_to_idxd(pmu);
45062306a36Sopenharmony_ci
45162306a36Sopenharmony_ci	enable_perfmon_pmu(idxd);
45262306a36Sopenharmony_ci}
45362306a36Sopenharmony_ci
45462306a36Sopenharmony_cistatic void perfmon_pmu_disable(struct pmu *pmu)
45562306a36Sopenharmony_ci{
45662306a36Sopenharmony_ci	struct idxd_device *idxd = pmu_to_idxd(pmu);
45762306a36Sopenharmony_ci
45862306a36Sopenharmony_ci	disable_perfmon_pmu(idxd);
45962306a36Sopenharmony_ci}
46062306a36Sopenharmony_ci
46162306a36Sopenharmony_cistatic void skip_filter(int i)
46262306a36Sopenharmony_ci{
46362306a36Sopenharmony_ci	int j;
46462306a36Sopenharmony_ci
46562306a36Sopenharmony_ci	for (j = i; j < PERFMON_FILTERS_MAX; j++)
46662306a36Sopenharmony_ci		perfmon_format_attrs[PERFMON_FILTERS_START + j] =
46762306a36Sopenharmony_ci			perfmon_format_attrs[PERFMON_FILTERS_START + j + 1];
46862306a36Sopenharmony_ci}
46962306a36Sopenharmony_ci
47062306a36Sopenharmony_cistatic void idxd_pmu_init(struct idxd_pmu *idxd_pmu)
47162306a36Sopenharmony_ci{
47262306a36Sopenharmony_ci	int i;
47362306a36Sopenharmony_ci
47462306a36Sopenharmony_ci	for (i = 0 ; i < PERFMON_FILTERS_MAX; i++) {
47562306a36Sopenharmony_ci		if (!test_bit(i, &idxd_pmu->supported_filters))
47662306a36Sopenharmony_ci			skip_filter(i);
47762306a36Sopenharmony_ci	}
47862306a36Sopenharmony_ci
47962306a36Sopenharmony_ci	idxd_pmu->pmu.name		= idxd_pmu->name;
48062306a36Sopenharmony_ci	idxd_pmu->pmu.attr_groups	= perfmon_attr_groups;
48162306a36Sopenharmony_ci	idxd_pmu->pmu.task_ctx_nr	= perf_invalid_context;
48262306a36Sopenharmony_ci	idxd_pmu->pmu.event_init	= perfmon_pmu_event_init;
48362306a36Sopenharmony_ci	idxd_pmu->pmu.pmu_enable	= perfmon_pmu_enable,
48462306a36Sopenharmony_ci	idxd_pmu->pmu.pmu_disable	= perfmon_pmu_disable,
48562306a36Sopenharmony_ci	idxd_pmu->pmu.add		= perfmon_pmu_event_add;
48662306a36Sopenharmony_ci	idxd_pmu->pmu.del		= perfmon_pmu_event_del;
48762306a36Sopenharmony_ci	idxd_pmu->pmu.start		= perfmon_pmu_event_start;
48862306a36Sopenharmony_ci	idxd_pmu->pmu.stop		= perfmon_pmu_event_stop;
48962306a36Sopenharmony_ci	idxd_pmu->pmu.read		= perfmon_pmu_event_update;
49062306a36Sopenharmony_ci	idxd_pmu->pmu.capabilities	= PERF_PMU_CAP_NO_EXCLUDE;
49162306a36Sopenharmony_ci	idxd_pmu->pmu.module		= THIS_MODULE;
49262306a36Sopenharmony_ci}
49362306a36Sopenharmony_ci
49462306a36Sopenharmony_civoid perfmon_pmu_remove(struct idxd_device *idxd)
49562306a36Sopenharmony_ci{
49662306a36Sopenharmony_ci	if (!idxd->idxd_pmu)
49762306a36Sopenharmony_ci		return;
49862306a36Sopenharmony_ci
49962306a36Sopenharmony_ci	cpuhp_state_remove_instance(cpuhp_slot, &idxd->idxd_pmu->cpuhp_node);
50062306a36Sopenharmony_ci	perf_pmu_unregister(&idxd->idxd_pmu->pmu);
50162306a36Sopenharmony_ci	kfree(idxd->idxd_pmu);
50262306a36Sopenharmony_ci	idxd->idxd_pmu = NULL;
50362306a36Sopenharmony_ci}
50462306a36Sopenharmony_ci
50562306a36Sopenharmony_cistatic int perf_event_cpu_online(unsigned int cpu, struct hlist_node *node)
50662306a36Sopenharmony_ci{
50762306a36Sopenharmony_ci	struct idxd_pmu *idxd_pmu;
50862306a36Sopenharmony_ci
50962306a36Sopenharmony_ci	idxd_pmu = hlist_entry_safe(node, typeof(*idxd_pmu), cpuhp_node);
51062306a36Sopenharmony_ci
51162306a36Sopenharmony_ci	/* select the first online CPU as the designated reader */
51262306a36Sopenharmony_ci	if (cpumask_empty(&perfmon_dsa_cpu_mask)) {
51362306a36Sopenharmony_ci		cpumask_set_cpu(cpu, &perfmon_dsa_cpu_mask);
51462306a36Sopenharmony_ci		idxd_pmu->cpu = cpu;
51562306a36Sopenharmony_ci	}
51662306a36Sopenharmony_ci
51762306a36Sopenharmony_ci	return 0;
51862306a36Sopenharmony_ci}
51962306a36Sopenharmony_ci
52062306a36Sopenharmony_cistatic int perf_event_cpu_offline(unsigned int cpu, struct hlist_node *node)
52162306a36Sopenharmony_ci{
52262306a36Sopenharmony_ci	struct idxd_pmu *idxd_pmu;
52362306a36Sopenharmony_ci	unsigned int target;
52462306a36Sopenharmony_ci
52562306a36Sopenharmony_ci	idxd_pmu = hlist_entry_safe(node, typeof(*idxd_pmu), cpuhp_node);
52662306a36Sopenharmony_ci
52762306a36Sopenharmony_ci	if (!cpumask_test_and_clear_cpu(cpu, &perfmon_dsa_cpu_mask))
52862306a36Sopenharmony_ci		return 0;
52962306a36Sopenharmony_ci
53062306a36Sopenharmony_ci	target = cpumask_any_but(cpu_online_mask, cpu);
53162306a36Sopenharmony_ci
53262306a36Sopenharmony_ci	/* migrate events if there is a valid target */
53362306a36Sopenharmony_ci	if (target < nr_cpu_ids)
53462306a36Sopenharmony_ci		cpumask_set_cpu(target, &perfmon_dsa_cpu_mask);
53562306a36Sopenharmony_ci	else
53662306a36Sopenharmony_ci		target = -1;
53762306a36Sopenharmony_ci
53862306a36Sopenharmony_ci	perf_pmu_migrate_context(&idxd_pmu->pmu, cpu, target);
53962306a36Sopenharmony_ci
54062306a36Sopenharmony_ci	return 0;
54162306a36Sopenharmony_ci}
54262306a36Sopenharmony_ci
54362306a36Sopenharmony_ciint perfmon_pmu_init(struct idxd_device *idxd)
54462306a36Sopenharmony_ci{
54562306a36Sopenharmony_ci	union idxd_perfcap perfcap;
54662306a36Sopenharmony_ci	struct idxd_pmu *idxd_pmu;
54762306a36Sopenharmony_ci	int rc = -ENODEV;
54862306a36Sopenharmony_ci
54962306a36Sopenharmony_ci	/*
55062306a36Sopenharmony_ci	 * perfmon module initialization failed, nothing to do
55162306a36Sopenharmony_ci	 */
55262306a36Sopenharmony_ci	if (!cpuhp_set_up)
55362306a36Sopenharmony_ci		return -ENODEV;
55462306a36Sopenharmony_ci
55562306a36Sopenharmony_ci	/*
55662306a36Sopenharmony_ci	 * If perfmon_offset or num_counters is 0, it means perfmon is
55762306a36Sopenharmony_ci	 * not supported on this hardware.
55862306a36Sopenharmony_ci	 */
55962306a36Sopenharmony_ci	if (idxd->perfmon_offset == 0)
56062306a36Sopenharmony_ci		return -ENODEV;
56162306a36Sopenharmony_ci
56262306a36Sopenharmony_ci	idxd_pmu = kzalloc(sizeof(*idxd_pmu), GFP_KERNEL);
56362306a36Sopenharmony_ci	if (!idxd_pmu)
56462306a36Sopenharmony_ci		return -ENOMEM;
56562306a36Sopenharmony_ci
56662306a36Sopenharmony_ci	idxd_pmu->idxd = idxd;
56762306a36Sopenharmony_ci	idxd->idxd_pmu = idxd_pmu;
56862306a36Sopenharmony_ci
56962306a36Sopenharmony_ci	if (idxd->data->type == IDXD_TYPE_DSA) {
57062306a36Sopenharmony_ci		rc = sprintf(idxd_pmu->name, "dsa%d", idxd->id);
57162306a36Sopenharmony_ci		if (rc < 0)
57262306a36Sopenharmony_ci			goto free;
57362306a36Sopenharmony_ci	} else if (idxd->data->type == IDXD_TYPE_IAX) {
57462306a36Sopenharmony_ci		rc = sprintf(idxd_pmu->name, "iax%d", idxd->id);
57562306a36Sopenharmony_ci		if (rc < 0)
57662306a36Sopenharmony_ci			goto free;
57762306a36Sopenharmony_ci	} else {
57862306a36Sopenharmony_ci		goto free;
57962306a36Sopenharmony_ci	}
58062306a36Sopenharmony_ci
58162306a36Sopenharmony_ci	perfmon_reset(idxd);
58262306a36Sopenharmony_ci
58362306a36Sopenharmony_ci	perfcap.bits = ioread64(PERFCAP_REG(idxd));
58462306a36Sopenharmony_ci
58562306a36Sopenharmony_ci	/*
58662306a36Sopenharmony_ci	 * If total perf counter is 0, stop further registration.
58762306a36Sopenharmony_ci	 * This is necessary in order to support driver running on
58862306a36Sopenharmony_ci	 * guest which does not have pmon support.
58962306a36Sopenharmony_ci	 */
59062306a36Sopenharmony_ci	if (perfcap.num_perf_counter == 0)
59162306a36Sopenharmony_ci		goto free;
59262306a36Sopenharmony_ci
59362306a36Sopenharmony_ci	/* A counter width of 0 means it can't count */
59462306a36Sopenharmony_ci	if (perfcap.counter_width == 0)
59562306a36Sopenharmony_ci		goto free;
59662306a36Sopenharmony_ci
59762306a36Sopenharmony_ci	/* Overflow interrupt and counter freeze support must be available */
59862306a36Sopenharmony_ci	if (!perfcap.overflow_interrupt || !perfcap.counter_freeze)
59962306a36Sopenharmony_ci		goto free;
60062306a36Sopenharmony_ci
60162306a36Sopenharmony_ci	/* Number of event categories cannot be 0 */
60262306a36Sopenharmony_ci	if (perfcap.num_event_category == 0)
60362306a36Sopenharmony_ci		goto free;
60462306a36Sopenharmony_ci
60562306a36Sopenharmony_ci	/*
60662306a36Sopenharmony_ci	 * We don't support per-counter capabilities for now.
60762306a36Sopenharmony_ci	 */
60862306a36Sopenharmony_ci	if (perfcap.cap_per_counter)
60962306a36Sopenharmony_ci		goto free;
61062306a36Sopenharmony_ci
61162306a36Sopenharmony_ci	idxd_pmu->n_event_categories = perfcap.num_event_category;
61262306a36Sopenharmony_ci	idxd_pmu->supported_event_categories = perfcap.global_event_category;
61362306a36Sopenharmony_ci	idxd_pmu->per_counter_caps_supported = perfcap.cap_per_counter;
61462306a36Sopenharmony_ci
61562306a36Sopenharmony_ci	/* check filter capability.  If 0, then filters are not supported */
61662306a36Sopenharmony_ci	idxd_pmu->supported_filters = perfcap.filter;
61762306a36Sopenharmony_ci	if (perfcap.filter)
61862306a36Sopenharmony_ci		idxd_pmu->n_filters = hweight8(perfcap.filter);
61962306a36Sopenharmony_ci
62062306a36Sopenharmony_ci	/* Store the total number of counters categories, and counter width */
62162306a36Sopenharmony_ci	idxd_pmu->n_counters = perfcap.num_perf_counter;
62262306a36Sopenharmony_ci	idxd_pmu->counter_width = perfcap.counter_width;
62362306a36Sopenharmony_ci
62462306a36Sopenharmony_ci	idxd_pmu_init(idxd_pmu);
62562306a36Sopenharmony_ci
62662306a36Sopenharmony_ci	rc = perf_pmu_register(&idxd_pmu->pmu, idxd_pmu->name, -1);
62762306a36Sopenharmony_ci	if (rc)
62862306a36Sopenharmony_ci		goto free;
62962306a36Sopenharmony_ci
63062306a36Sopenharmony_ci	rc = cpuhp_state_add_instance(cpuhp_slot, &idxd_pmu->cpuhp_node);
63162306a36Sopenharmony_ci	if (rc) {
63262306a36Sopenharmony_ci		perf_pmu_unregister(&idxd->idxd_pmu->pmu);
63362306a36Sopenharmony_ci		goto free;
63462306a36Sopenharmony_ci	}
63562306a36Sopenharmony_ciout:
63662306a36Sopenharmony_ci	return rc;
63762306a36Sopenharmony_cifree:
63862306a36Sopenharmony_ci	kfree(idxd_pmu);
63962306a36Sopenharmony_ci	idxd->idxd_pmu = NULL;
64062306a36Sopenharmony_ci
64162306a36Sopenharmony_ci	goto out;
64262306a36Sopenharmony_ci}
64362306a36Sopenharmony_ci
64462306a36Sopenharmony_civoid __init perfmon_init(void)
64562306a36Sopenharmony_ci{
64662306a36Sopenharmony_ci	int rc = cpuhp_setup_state_multi(CPUHP_AP_ONLINE_DYN,
64762306a36Sopenharmony_ci					 "driver/dma/idxd/perf:online",
64862306a36Sopenharmony_ci					 perf_event_cpu_online,
64962306a36Sopenharmony_ci					 perf_event_cpu_offline);
65062306a36Sopenharmony_ci	if (WARN_ON(rc < 0))
65162306a36Sopenharmony_ci		return;
65262306a36Sopenharmony_ci
65362306a36Sopenharmony_ci	cpuhp_slot = rc;
65462306a36Sopenharmony_ci	cpuhp_set_up = true;
65562306a36Sopenharmony_ci}
65662306a36Sopenharmony_ci
65762306a36Sopenharmony_civoid __exit perfmon_exit(void)
65862306a36Sopenharmony_ci{
65962306a36Sopenharmony_ci	if (cpuhp_set_up)
66062306a36Sopenharmony_ci		cpuhp_remove_multi_state(cpuhp_slot);
66162306a36Sopenharmony_ci}
662