// SPDX-License-Identifier: GPL-2.0
/*
 * Copyright (C) 2018 Broadcom
 */
562306a36Sopenharmony_ci
/**
 * DOC: VC4 V3D performance monitor module
 *
 * The V3D block provides 16 hardware counters which can count various events.
 */
1162306a36Sopenharmony_ci
1262306a36Sopenharmony_ci#include "vc4_drv.h"
1362306a36Sopenharmony_ci#include "vc4_regs.h"
1462306a36Sopenharmony_ci
/*
 * Bounds handed to idr_alloc() when an ID is assigned to a newly created
 * perfmon. VC4_PERFMONID_MIN is also used as the base of each file's
 * perfmon IDR.
 * NOTE(review): idr_alloc() is called with VC4_PERFMONID_MAX as its upper
 * bound; confirm how U32_MAX is interpreted by that parameter.
 */
#define VC4_PERFMONID_MIN	1
#define VC4_PERFMONID_MAX	U32_MAX
1762306a36Sopenharmony_ci
1862306a36Sopenharmony_civoid vc4_perfmon_get(struct vc4_perfmon *perfmon)
1962306a36Sopenharmony_ci{
2062306a36Sopenharmony_ci	struct vc4_dev *vc4;
2162306a36Sopenharmony_ci
2262306a36Sopenharmony_ci	if (!perfmon)
2362306a36Sopenharmony_ci		return;
2462306a36Sopenharmony_ci
2562306a36Sopenharmony_ci	vc4 = perfmon->dev;
2662306a36Sopenharmony_ci	if (WARN_ON_ONCE(vc4->is_vc5))
2762306a36Sopenharmony_ci		return;
2862306a36Sopenharmony_ci
2962306a36Sopenharmony_ci	refcount_inc(&perfmon->refcnt);
3062306a36Sopenharmony_ci}
3162306a36Sopenharmony_ci
3262306a36Sopenharmony_civoid vc4_perfmon_put(struct vc4_perfmon *perfmon)
3362306a36Sopenharmony_ci{
3462306a36Sopenharmony_ci	struct vc4_dev *vc4;
3562306a36Sopenharmony_ci
3662306a36Sopenharmony_ci	if (!perfmon)
3762306a36Sopenharmony_ci		return;
3862306a36Sopenharmony_ci
3962306a36Sopenharmony_ci	vc4 = perfmon->dev;
4062306a36Sopenharmony_ci	if (WARN_ON_ONCE(vc4->is_vc5))
4162306a36Sopenharmony_ci		return;
4262306a36Sopenharmony_ci
4362306a36Sopenharmony_ci	if (refcount_dec_and_test(&perfmon->refcnt))
4462306a36Sopenharmony_ci		kfree(perfmon);
4562306a36Sopenharmony_ci}
4662306a36Sopenharmony_ci
4762306a36Sopenharmony_civoid vc4_perfmon_start(struct vc4_dev *vc4, struct vc4_perfmon *perfmon)
4862306a36Sopenharmony_ci{
4962306a36Sopenharmony_ci	unsigned int i;
5062306a36Sopenharmony_ci	u32 mask;
5162306a36Sopenharmony_ci
5262306a36Sopenharmony_ci	if (WARN_ON_ONCE(vc4->is_vc5))
5362306a36Sopenharmony_ci		return;
5462306a36Sopenharmony_ci
5562306a36Sopenharmony_ci	if (WARN_ON_ONCE(!perfmon || vc4->active_perfmon))
5662306a36Sopenharmony_ci		return;
5762306a36Sopenharmony_ci
5862306a36Sopenharmony_ci	for (i = 0; i < perfmon->ncounters; i++)
5962306a36Sopenharmony_ci		V3D_WRITE(V3D_PCTRS(i), perfmon->events[i]);
6062306a36Sopenharmony_ci
6162306a36Sopenharmony_ci	mask = GENMASK(perfmon->ncounters - 1, 0);
6262306a36Sopenharmony_ci	V3D_WRITE(V3D_PCTRC, mask);
6362306a36Sopenharmony_ci	V3D_WRITE(V3D_PCTRE, V3D_PCTRE_EN | mask);
6462306a36Sopenharmony_ci	vc4->active_perfmon = perfmon;
6562306a36Sopenharmony_ci}
6662306a36Sopenharmony_ci
6762306a36Sopenharmony_civoid vc4_perfmon_stop(struct vc4_dev *vc4, struct vc4_perfmon *perfmon,
6862306a36Sopenharmony_ci		      bool capture)
6962306a36Sopenharmony_ci{
7062306a36Sopenharmony_ci	unsigned int i;
7162306a36Sopenharmony_ci
7262306a36Sopenharmony_ci	if (WARN_ON_ONCE(vc4->is_vc5))
7362306a36Sopenharmony_ci		return;
7462306a36Sopenharmony_ci
7562306a36Sopenharmony_ci	if (WARN_ON_ONCE(!vc4->active_perfmon ||
7662306a36Sopenharmony_ci			 perfmon != vc4->active_perfmon))
7762306a36Sopenharmony_ci		return;
7862306a36Sopenharmony_ci
7962306a36Sopenharmony_ci	if (capture) {
8062306a36Sopenharmony_ci		for (i = 0; i < perfmon->ncounters; i++)
8162306a36Sopenharmony_ci			perfmon->counters[i] += V3D_READ(V3D_PCTR(i));
8262306a36Sopenharmony_ci	}
8362306a36Sopenharmony_ci
8462306a36Sopenharmony_ci	V3D_WRITE(V3D_PCTRE, 0);
8562306a36Sopenharmony_ci	vc4->active_perfmon = NULL;
8662306a36Sopenharmony_ci}
8762306a36Sopenharmony_ci
8862306a36Sopenharmony_cistruct vc4_perfmon *vc4_perfmon_find(struct vc4_file *vc4file, int id)
8962306a36Sopenharmony_ci{
9062306a36Sopenharmony_ci	struct vc4_dev *vc4 = vc4file->dev;
9162306a36Sopenharmony_ci	struct vc4_perfmon *perfmon;
9262306a36Sopenharmony_ci
9362306a36Sopenharmony_ci	if (WARN_ON_ONCE(vc4->is_vc5))
9462306a36Sopenharmony_ci		return NULL;
9562306a36Sopenharmony_ci
9662306a36Sopenharmony_ci	mutex_lock(&vc4file->perfmon.lock);
9762306a36Sopenharmony_ci	perfmon = idr_find(&vc4file->perfmon.idr, id);
9862306a36Sopenharmony_ci	vc4_perfmon_get(perfmon);
9962306a36Sopenharmony_ci	mutex_unlock(&vc4file->perfmon.lock);
10062306a36Sopenharmony_ci
10162306a36Sopenharmony_ci	return perfmon;
10262306a36Sopenharmony_ci}
10362306a36Sopenharmony_ci
10462306a36Sopenharmony_civoid vc4_perfmon_open_file(struct vc4_file *vc4file)
10562306a36Sopenharmony_ci{
10662306a36Sopenharmony_ci	struct vc4_dev *vc4 = vc4file->dev;
10762306a36Sopenharmony_ci
10862306a36Sopenharmony_ci	if (WARN_ON_ONCE(vc4->is_vc5))
10962306a36Sopenharmony_ci		return;
11062306a36Sopenharmony_ci
11162306a36Sopenharmony_ci	mutex_init(&vc4file->perfmon.lock);
11262306a36Sopenharmony_ci	idr_init_base(&vc4file->perfmon.idr, VC4_PERFMONID_MIN);
11362306a36Sopenharmony_ci	vc4file->dev = vc4;
11462306a36Sopenharmony_ci}
11562306a36Sopenharmony_ci
11662306a36Sopenharmony_cistatic int vc4_perfmon_idr_del(int id, void *elem, void *data)
11762306a36Sopenharmony_ci{
11862306a36Sopenharmony_ci	struct vc4_perfmon *perfmon = elem;
11962306a36Sopenharmony_ci
12062306a36Sopenharmony_ci	vc4_perfmon_put(perfmon);
12162306a36Sopenharmony_ci
12262306a36Sopenharmony_ci	return 0;
12362306a36Sopenharmony_ci}
12462306a36Sopenharmony_ci
12562306a36Sopenharmony_civoid vc4_perfmon_close_file(struct vc4_file *vc4file)
12662306a36Sopenharmony_ci{
12762306a36Sopenharmony_ci	struct vc4_dev *vc4 = vc4file->dev;
12862306a36Sopenharmony_ci
12962306a36Sopenharmony_ci	if (WARN_ON_ONCE(vc4->is_vc5))
13062306a36Sopenharmony_ci		return;
13162306a36Sopenharmony_ci
13262306a36Sopenharmony_ci	mutex_lock(&vc4file->perfmon.lock);
13362306a36Sopenharmony_ci	idr_for_each(&vc4file->perfmon.idr, vc4_perfmon_idr_del, NULL);
13462306a36Sopenharmony_ci	idr_destroy(&vc4file->perfmon.idr);
13562306a36Sopenharmony_ci	mutex_unlock(&vc4file->perfmon.lock);
13662306a36Sopenharmony_ci	mutex_destroy(&vc4file->perfmon.lock);
13762306a36Sopenharmony_ci}
13862306a36Sopenharmony_ci
13962306a36Sopenharmony_ciint vc4_perfmon_create_ioctl(struct drm_device *dev, void *data,
14062306a36Sopenharmony_ci			     struct drm_file *file_priv)
14162306a36Sopenharmony_ci{
14262306a36Sopenharmony_ci	struct vc4_dev *vc4 = to_vc4_dev(dev);
14362306a36Sopenharmony_ci	struct vc4_file *vc4file = file_priv->driver_priv;
14462306a36Sopenharmony_ci	struct drm_vc4_perfmon_create *req = data;
14562306a36Sopenharmony_ci	struct vc4_perfmon *perfmon;
14662306a36Sopenharmony_ci	unsigned int i;
14762306a36Sopenharmony_ci	int ret;
14862306a36Sopenharmony_ci
14962306a36Sopenharmony_ci	if (WARN_ON_ONCE(vc4->is_vc5))
15062306a36Sopenharmony_ci		return -ENODEV;
15162306a36Sopenharmony_ci
15262306a36Sopenharmony_ci	if (!vc4->v3d) {
15362306a36Sopenharmony_ci		DRM_DEBUG("Creating perfmon no VC4 V3D probed\n");
15462306a36Sopenharmony_ci		return -ENODEV;
15562306a36Sopenharmony_ci	}
15662306a36Sopenharmony_ci
15762306a36Sopenharmony_ci	/* Number of monitored counters cannot exceed HW limits. */
15862306a36Sopenharmony_ci	if (req->ncounters > DRM_VC4_MAX_PERF_COUNTERS ||
15962306a36Sopenharmony_ci	    !req->ncounters)
16062306a36Sopenharmony_ci		return -EINVAL;
16162306a36Sopenharmony_ci
16262306a36Sopenharmony_ci	/* Make sure all events are valid. */
16362306a36Sopenharmony_ci	for (i = 0; i < req->ncounters; i++) {
16462306a36Sopenharmony_ci		if (req->events[i] >= VC4_PERFCNT_NUM_EVENTS)
16562306a36Sopenharmony_ci			return -EINVAL;
16662306a36Sopenharmony_ci	}
16762306a36Sopenharmony_ci
16862306a36Sopenharmony_ci	perfmon = kzalloc(struct_size(perfmon, counters, req->ncounters),
16962306a36Sopenharmony_ci			  GFP_KERNEL);
17062306a36Sopenharmony_ci	if (!perfmon)
17162306a36Sopenharmony_ci		return -ENOMEM;
17262306a36Sopenharmony_ci	perfmon->dev = vc4;
17362306a36Sopenharmony_ci
17462306a36Sopenharmony_ci	for (i = 0; i < req->ncounters; i++)
17562306a36Sopenharmony_ci		perfmon->events[i] = req->events[i];
17662306a36Sopenharmony_ci
17762306a36Sopenharmony_ci	perfmon->ncounters = req->ncounters;
17862306a36Sopenharmony_ci
17962306a36Sopenharmony_ci	refcount_set(&perfmon->refcnt, 1);
18062306a36Sopenharmony_ci
18162306a36Sopenharmony_ci	mutex_lock(&vc4file->perfmon.lock);
18262306a36Sopenharmony_ci	ret = idr_alloc(&vc4file->perfmon.idr, perfmon, VC4_PERFMONID_MIN,
18362306a36Sopenharmony_ci			VC4_PERFMONID_MAX, GFP_KERNEL);
18462306a36Sopenharmony_ci	mutex_unlock(&vc4file->perfmon.lock);
18562306a36Sopenharmony_ci
18662306a36Sopenharmony_ci	if (ret < 0) {
18762306a36Sopenharmony_ci		kfree(perfmon);
18862306a36Sopenharmony_ci		return ret;
18962306a36Sopenharmony_ci	}
19062306a36Sopenharmony_ci
19162306a36Sopenharmony_ci	req->id = ret;
19262306a36Sopenharmony_ci	return 0;
19362306a36Sopenharmony_ci}
19462306a36Sopenharmony_ci
19562306a36Sopenharmony_ciint vc4_perfmon_destroy_ioctl(struct drm_device *dev, void *data,
19662306a36Sopenharmony_ci			      struct drm_file *file_priv)
19762306a36Sopenharmony_ci{
19862306a36Sopenharmony_ci	struct vc4_dev *vc4 = to_vc4_dev(dev);
19962306a36Sopenharmony_ci	struct vc4_file *vc4file = file_priv->driver_priv;
20062306a36Sopenharmony_ci	struct drm_vc4_perfmon_destroy *req = data;
20162306a36Sopenharmony_ci	struct vc4_perfmon *perfmon;
20262306a36Sopenharmony_ci
20362306a36Sopenharmony_ci	if (WARN_ON_ONCE(vc4->is_vc5))
20462306a36Sopenharmony_ci		return -ENODEV;
20562306a36Sopenharmony_ci
20662306a36Sopenharmony_ci	if (!vc4->v3d) {
20762306a36Sopenharmony_ci		DRM_DEBUG("Destroying perfmon no VC4 V3D probed\n");
20862306a36Sopenharmony_ci		return -ENODEV;
20962306a36Sopenharmony_ci	}
21062306a36Sopenharmony_ci
21162306a36Sopenharmony_ci	mutex_lock(&vc4file->perfmon.lock);
21262306a36Sopenharmony_ci	perfmon = idr_remove(&vc4file->perfmon.idr, req->id);
21362306a36Sopenharmony_ci	mutex_unlock(&vc4file->perfmon.lock);
21462306a36Sopenharmony_ci
21562306a36Sopenharmony_ci	if (!perfmon)
21662306a36Sopenharmony_ci		return -EINVAL;
21762306a36Sopenharmony_ci
21862306a36Sopenharmony_ci	vc4_perfmon_put(perfmon);
21962306a36Sopenharmony_ci	return 0;
22062306a36Sopenharmony_ci}
22162306a36Sopenharmony_ci
22262306a36Sopenharmony_ciint vc4_perfmon_get_values_ioctl(struct drm_device *dev, void *data,
22362306a36Sopenharmony_ci				 struct drm_file *file_priv)
22462306a36Sopenharmony_ci{
22562306a36Sopenharmony_ci	struct vc4_dev *vc4 = to_vc4_dev(dev);
22662306a36Sopenharmony_ci	struct vc4_file *vc4file = file_priv->driver_priv;
22762306a36Sopenharmony_ci	struct drm_vc4_perfmon_get_values *req = data;
22862306a36Sopenharmony_ci	struct vc4_perfmon *perfmon;
22962306a36Sopenharmony_ci	int ret;
23062306a36Sopenharmony_ci
23162306a36Sopenharmony_ci	if (WARN_ON_ONCE(vc4->is_vc5))
23262306a36Sopenharmony_ci		return -ENODEV;
23362306a36Sopenharmony_ci
23462306a36Sopenharmony_ci	if (!vc4->v3d) {
23562306a36Sopenharmony_ci		DRM_DEBUG("Getting perfmon no VC4 V3D probed\n");
23662306a36Sopenharmony_ci		return -ENODEV;
23762306a36Sopenharmony_ci	}
23862306a36Sopenharmony_ci
23962306a36Sopenharmony_ci	mutex_lock(&vc4file->perfmon.lock);
24062306a36Sopenharmony_ci	perfmon = idr_find(&vc4file->perfmon.idr, req->id);
24162306a36Sopenharmony_ci	vc4_perfmon_get(perfmon);
24262306a36Sopenharmony_ci	mutex_unlock(&vc4file->perfmon.lock);
24362306a36Sopenharmony_ci
24462306a36Sopenharmony_ci	if (!perfmon)
24562306a36Sopenharmony_ci		return -EINVAL;
24662306a36Sopenharmony_ci
24762306a36Sopenharmony_ci	if (copy_to_user(u64_to_user_ptr(req->values_ptr), perfmon->counters,
24862306a36Sopenharmony_ci			 perfmon->ncounters * sizeof(u64)))
24962306a36Sopenharmony_ci		ret = -EFAULT;
25062306a36Sopenharmony_ci	else
25162306a36Sopenharmony_ci		ret = 0;
25262306a36Sopenharmony_ci
25362306a36Sopenharmony_ci	vc4_perfmon_put(perfmon);
25462306a36Sopenharmony_ci	return ret;
25562306a36Sopenharmony_ci}
256