162306a36Sopenharmony_ci// SPDX-License-Identifier: GPL-2.0
262306a36Sopenharmony_ci/*
362306a36Sopenharmony_ci * Copyright (C) 2021 Raspberry Pi
462306a36Sopenharmony_ci */
562306a36Sopenharmony_ci
662306a36Sopenharmony_ci#include "v3d_drv.h"
762306a36Sopenharmony_ci#include "v3d_regs.h"
862306a36Sopenharmony_ci
/* Lower and upper ID bounds passed to idr_alloc() when a perfmon is created. */
962306a36Sopenharmony_ci#define V3D_PERFMONID_MIN	1
1062306a36Sopenharmony_ci#define V3D_PERFMONID_MAX	U32_MAX
1162306a36Sopenharmony_ci
1262306a36Sopenharmony_civoid v3d_perfmon_get(struct v3d_perfmon *perfmon)
1362306a36Sopenharmony_ci{
1462306a36Sopenharmony_ci	if (perfmon)
1562306a36Sopenharmony_ci		refcount_inc(&perfmon->refcnt);
1662306a36Sopenharmony_ci}
1762306a36Sopenharmony_ci
1862306a36Sopenharmony_civoid v3d_perfmon_put(struct v3d_perfmon *perfmon)
1962306a36Sopenharmony_ci{
2062306a36Sopenharmony_ci	if (perfmon && refcount_dec_and_test(&perfmon->refcnt)) {
2162306a36Sopenharmony_ci		mutex_destroy(&perfmon->lock);
2262306a36Sopenharmony_ci		kfree(perfmon);
2362306a36Sopenharmony_ci	}
2462306a36Sopenharmony_ci}
2562306a36Sopenharmony_ci
2662306a36Sopenharmony_civoid v3d_perfmon_start(struct v3d_dev *v3d, struct v3d_perfmon *perfmon)
2762306a36Sopenharmony_ci{
2862306a36Sopenharmony_ci	unsigned int i;
2962306a36Sopenharmony_ci	u32 mask;
3062306a36Sopenharmony_ci	u8 ncounters;
3162306a36Sopenharmony_ci
3262306a36Sopenharmony_ci	if (WARN_ON_ONCE(!perfmon || v3d->active_perfmon))
3362306a36Sopenharmony_ci		return;
3462306a36Sopenharmony_ci
3562306a36Sopenharmony_ci	ncounters = perfmon->ncounters;
3662306a36Sopenharmony_ci	mask = GENMASK(ncounters - 1, 0);
3762306a36Sopenharmony_ci
3862306a36Sopenharmony_ci	for (i = 0; i < ncounters; i++) {
3962306a36Sopenharmony_ci		u32 source = i / 4;
4062306a36Sopenharmony_ci		u32 channel = V3D_SET_FIELD(perfmon->counters[i], V3D_PCTR_S0);
4162306a36Sopenharmony_ci
4262306a36Sopenharmony_ci		i++;
4362306a36Sopenharmony_ci		channel |= V3D_SET_FIELD(i < ncounters ? perfmon->counters[i] : 0,
4462306a36Sopenharmony_ci					 V3D_PCTR_S1);
4562306a36Sopenharmony_ci		i++;
4662306a36Sopenharmony_ci		channel |= V3D_SET_FIELD(i < ncounters ? perfmon->counters[i] : 0,
4762306a36Sopenharmony_ci					 V3D_PCTR_S2);
4862306a36Sopenharmony_ci		i++;
4962306a36Sopenharmony_ci		channel |= V3D_SET_FIELD(i < ncounters ? perfmon->counters[i] : 0,
5062306a36Sopenharmony_ci					 V3D_PCTR_S3);
5162306a36Sopenharmony_ci		V3D_CORE_WRITE(0, V3D_V4_PCTR_0_SRC_X(source), channel);
5262306a36Sopenharmony_ci	}
5362306a36Sopenharmony_ci
5462306a36Sopenharmony_ci	V3D_CORE_WRITE(0, V3D_V4_PCTR_0_CLR, mask);
5562306a36Sopenharmony_ci	V3D_CORE_WRITE(0, V3D_PCTR_0_OVERFLOW, mask);
5662306a36Sopenharmony_ci	V3D_CORE_WRITE(0, V3D_V4_PCTR_0_EN, mask);
5762306a36Sopenharmony_ci
5862306a36Sopenharmony_ci	v3d->active_perfmon = perfmon;
5962306a36Sopenharmony_ci}
6062306a36Sopenharmony_ci
6162306a36Sopenharmony_civoid v3d_perfmon_stop(struct v3d_dev *v3d, struct v3d_perfmon *perfmon,
6262306a36Sopenharmony_ci		      bool capture)
6362306a36Sopenharmony_ci{
6462306a36Sopenharmony_ci	unsigned int i;
6562306a36Sopenharmony_ci
6662306a36Sopenharmony_ci	if (!perfmon || !v3d->active_perfmon)
6762306a36Sopenharmony_ci		return;
6862306a36Sopenharmony_ci
6962306a36Sopenharmony_ci	mutex_lock(&perfmon->lock);
7062306a36Sopenharmony_ci	if (perfmon != v3d->active_perfmon) {
7162306a36Sopenharmony_ci		mutex_unlock(&perfmon->lock);
7262306a36Sopenharmony_ci		return;
7362306a36Sopenharmony_ci	}
7462306a36Sopenharmony_ci
7562306a36Sopenharmony_ci	if (capture)
7662306a36Sopenharmony_ci		for (i = 0; i < perfmon->ncounters; i++)
7762306a36Sopenharmony_ci			perfmon->values[i] += V3D_CORE_READ(0, V3D_PCTR_0_PCTRX(i));
7862306a36Sopenharmony_ci
7962306a36Sopenharmony_ci	V3D_CORE_WRITE(0, V3D_V4_PCTR_0_EN, 0);
8062306a36Sopenharmony_ci
8162306a36Sopenharmony_ci	v3d->active_perfmon = NULL;
8262306a36Sopenharmony_ci	mutex_unlock(&perfmon->lock);
8362306a36Sopenharmony_ci}
8462306a36Sopenharmony_ci
8562306a36Sopenharmony_cistruct v3d_perfmon *v3d_perfmon_find(struct v3d_file_priv *v3d_priv, int id)
8662306a36Sopenharmony_ci{
8762306a36Sopenharmony_ci	struct v3d_perfmon *perfmon;
8862306a36Sopenharmony_ci
8962306a36Sopenharmony_ci	mutex_lock(&v3d_priv->perfmon.lock);
9062306a36Sopenharmony_ci	perfmon = idr_find(&v3d_priv->perfmon.idr, id);
9162306a36Sopenharmony_ci	v3d_perfmon_get(perfmon);
9262306a36Sopenharmony_ci	mutex_unlock(&v3d_priv->perfmon.lock);
9362306a36Sopenharmony_ci
9462306a36Sopenharmony_ci	return perfmon;
9562306a36Sopenharmony_ci}
9662306a36Sopenharmony_ci
9762306a36Sopenharmony_civoid v3d_perfmon_open_file(struct v3d_file_priv *v3d_priv)
9862306a36Sopenharmony_ci{
9962306a36Sopenharmony_ci	mutex_init(&v3d_priv->perfmon.lock);
10062306a36Sopenharmony_ci	idr_init_base(&v3d_priv->perfmon.idr, 1);
10162306a36Sopenharmony_ci}
10262306a36Sopenharmony_ci
10362306a36Sopenharmony_cistatic int v3d_perfmon_idr_del(int id, void *elem, void *data)
10462306a36Sopenharmony_ci{
10562306a36Sopenharmony_ci	struct v3d_perfmon *perfmon = elem;
10662306a36Sopenharmony_ci
10762306a36Sopenharmony_ci	v3d_perfmon_put(perfmon);
10862306a36Sopenharmony_ci
10962306a36Sopenharmony_ci	return 0;
11062306a36Sopenharmony_ci}
11162306a36Sopenharmony_ci
11262306a36Sopenharmony_civoid v3d_perfmon_close_file(struct v3d_file_priv *v3d_priv)
11362306a36Sopenharmony_ci{
11462306a36Sopenharmony_ci	mutex_lock(&v3d_priv->perfmon.lock);
11562306a36Sopenharmony_ci	idr_for_each(&v3d_priv->perfmon.idr, v3d_perfmon_idr_del, NULL);
11662306a36Sopenharmony_ci	idr_destroy(&v3d_priv->perfmon.idr);
11762306a36Sopenharmony_ci	mutex_unlock(&v3d_priv->perfmon.lock);
11862306a36Sopenharmony_ci	mutex_destroy(&v3d_priv->perfmon.lock);
11962306a36Sopenharmony_ci}
12062306a36Sopenharmony_ci
12162306a36Sopenharmony_ciint v3d_perfmon_create_ioctl(struct drm_device *dev, void *data,
12262306a36Sopenharmony_ci			     struct drm_file *file_priv)
12362306a36Sopenharmony_ci{
12462306a36Sopenharmony_ci	struct v3d_file_priv *v3d_priv = file_priv->driver_priv;
12562306a36Sopenharmony_ci	struct drm_v3d_perfmon_create *req = data;
12662306a36Sopenharmony_ci	struct v3d_perfmon *perfmon;
12762306a36Sopenharmony_ci	unsigned int i;
12862306a36Sopenharmony_ci	int ret;
12962306a36Sopenharmony_ci
13062306a36Sopenharmony_ci	/* Number of monitored counters cannot exceed HW limits. */
13162306a36Sopenharmony_ci	if (req->ncounters > DRM_V3D_MAX_PERF_COUNTERS ||
13262306a36Sopenharmony_ci	    !req->ncounters)
13362306a36Sopenharmony_ci		return -EINVAL;
13462306a36Sopenharmony_ci
13562306a36Sopenharmony_ci	/* Make sure all counters are valid. */
13662306a36Sopenharmony_ci	for (i = 0; i < req->ncounters; i++) {
13762306a36Sopenharmony_ci		if (req->counters[i] >= V3D_PERFCNT_NUM)
13862306a36Sopenharmony_ci			return -EINVAL;
13962306a36Sopenharmony_ci	}
14062306a36Sopenharmony_ci
14162306a36Sopenharmony_ci	perfmon = kzalloc(struct_size(perfmon, values, req->ncounters),
14262306a36Sopenharmony_ci			  GFP_KERNEL);
14362306a36Sopenharmony_ci	if (!perfmon)
14462306a36Sopenharmony_ci		return -ENOMEM;
14562306a36Sopenharmony_ci
14662306a36Sopenharmony_ci	for (i = 0; i < req->ncounters; i++)
14762306a36Sopenharmony_ci		perfmon->counters[i] = req->counters[i];
14862306a36Sopenharmony_ci
14962306a36Sopenharmony_ci	perfmon->ncounters = req->ncounters;
15062306a36Sopenharmony_ci
15162306a36Sopenharmony_ci	refcount_set(&perfmon->refcnt, 1);
15262306a36Sopenharmony_ci	mutex_init(&perfmon->lock);
15362306a36Sopenharmony_ci
15462306a36Sopenharmony_ci	mutex_lock(&v3d_priv->perfmon.lock);
15562306a36Sopenharmony_ci	ret = idr_alloc(&v3d_priv->perfmon.idr, perfmon, V3D_PERFMONID_MIN,
15662306a36Sopenharmony_ci			V3D_PERFMONID_MAX, GFP_KERNEL);
15762306a36Sopenharmony_ci	mutex_unlock(&v3d_priv->perfmon.lock);
15862306a36Sopenharmony_ci
15962306a36Sopenharmony_ci	if (ret < 0) {
16062306a36Sopenharmony_ci		mutex_destroy(&perfmon->lock);
16162306a36Sopenharmony_ci		kfree(perfmon);
16262306a36Sopenharmony_ci		return ret;
16362306a36Sopenharmony_ci	}
16462306a36Sopenharmony_ci
16562306a36Sopenharmony_ci	req->id = ret;
16662306a36Sopenharmony_ci
16762306a36Sopenharmony_ci	return 0;
16862306a36Sopenharmony_ci}
16962306a36Sopenharmony_ci
17062306a36Sopenharmony_ciint v3d_perfmon_destroy_ioctl(struct drm_device *dev, void *data,
17162306a36Sopenharmony_ci			      struct drm_file *file_priv)
17262306a36Sopenharmony_ci{
17362306a36Sopenharmony_ci	struct v3d_file_priv *v3d_priv = file_priv->driver_priv;
17462306a36Sopenharmony_ci	struct drm_v3d_perfmon_destroy *req = data;
17562306a36Sopenharmony_ci	struct v3d_perfmon *perfmon;
17662306a36Sopenharmony_ci
17762306a36Sopenharmony_ci	mutex_lock(&v3d_priv->perfmon.lock);
17862306a36Sopenharmony_ci	perfmon = idr_remove(&v3d_priv->perfmon.idr, req->id);
17962306a36Sopenharmony_ci	mutex_unlock(&v3d_priv->perfmon.lock);
18062306a36Sopenharmony_ci
18162306a36Sopenharmony_ci	if (!perfmon)
18262306a36Sopenharmony_ci		return -EINVAL;
18362306a36Sopenharmony_ci
18462306a36Sopenharmony_ci	v3d_perfmon_put(perfmon);
18562306a36Sopenharmony_ci
18662306a36Sopenharmony_ci	return 0;
18762306a36Sopenharmony_ci}
18862306a36Sopenharmony_ci
18962306a36Sopenharmony_ciint v3d_perfmon_get_values_ioctl(struct drm_device *dev, void *data,
19062306a36Sopenharmony_ci				 struct drm_file *file_priv)
19162306a36Sopenharmony_ci{
19262306a36Sopenharmony_ci	struct v3d_dev *v3d = to_v3d_dev(dev);
19362306a36Sopenharmony_ci	struct v3d_file_priv *v3d_priv = file_priv->driver_priv;
19462306a36Sopenharmony_ci	struct drm_v3d_perfmon_get_values *req = data;
19562306a36Sopenharmony_ci	struct v3d_perfmon *perfmon;
19662306a36Sopenharmony_ci	int ret = 0;
19762306a36Sopenharmony_ci
19862306a36Sopenharmony_ci	if (req->pad != 0)
19962306a36Sopenharmony_ci		return -EINVAL;
20062306a36Sopenharmony_ci
20162306a36Sopenharmony_ci	mutex_lock(&v3d_priv->perfmon.lock);
20262306a36Sopenharmony_ci	perfmon = idr_find(&v3d_priv->perfmon.idr, req->id);
20362306a36Sopenharmony_ci	v3d_perfmon_get(perfmon);
20462306a36Sopenharmony_ci	mutex_unlock(&v3d_priv->perfmon.lock);
20562306a36Sopenharmony_ci
20662306a36Sopenharmony_ci	if (!perfmon)
20762306a36Sopenharmony_ci		return -EINVAL;
20862306a36Sopenharmony_ci
20962306a36Sopenharmony_ci	v3d_perfmon_stop(v3d, perfmon, true);
21062306a36Sopenharmony_ci
21162306a36Sopenharmony_ci	if (copy_to_user(u64_to_user_ptr(req->values_ptr), perfmon->values,
21262306a36Sopenharmony_ci			 perfmon->ncounters * sizeof(u64)))
21362306a36Sopenharmony_ci		ret = -EFAULT;
21462306a36Sopenharmony_ci
21562306a36Sopenharmony_ci	v3d_perfmon_put(perfmon);
21662306a36Sopenharmony_ci
21762306a36Sopenharmony_ci	return ret;
21862306a36Sopenharmony_ci}
219