162306a36Sopenharmony_ci// SPDX-License-Identifier: GPL-2.0 262306a36Sopenharmony_ci/* 362306a36Sopenharmony_ci * Copyright (C) 2018 Broadcom 462306a36Sopenharmony_ci */ 562306a36Sopenharmony_ci 662306a36Sopenharmony_ci/** 762306a36Sopenharmony_ci * DOC: VC4 V3D performance monitor module 862306a36Sopenharmony_ci * 962306a36Sopenharmony_ci * The V3D block provides 16 hardware counters which can count various events. 1062306a36Sopenharmony_ci */ 1162306a36Sopenharmony_ci 1262306a36Sopenharmony_ci#include "vc4_drv.h" 1362306a36Sopenharmony_ci#include "vc4_regs.h" 1462306a36Sopenharmony_ci 1562306a36Sopenharmony_ci#define VC4_PERFMONID_MIN 1 1662306a36Sopenharmony_ci#define VC4_PERFMONID_MAX U32_MAX 1762306a36Sopenharmony_ci 1862306a36Sopenharmony_civoid vc4_perfmon_get(struct vc4_perfmon *perfmon) 1962306a36Sopenharmony_ci{ 2062306a36Sopenharmony_ci struct vc4_dev *vc4; 2162306a36Sopenharmony_ci 2262306a36Sopenharmony_ci if (!perfmon) 2362306a36Sopenharmony_ci return; 2462306a36Sopenharmony_ci 2562306a36Sopenharmony_ci vc4 = perfmon->dev; 2662306a36Sopenharmony_ci if (WARN_ON_ONCE(vc4->is_vc5)) 2762306a36Sopenharmony_ci return; 2862306a36Sopenharmony_ci 2962306a36Sopenharmony_ci refcount_inc(&perfmon->refcnt); 3062306a36Sopenharmony_ci} 3162306a36Sopenharmony_ci 3262306a36Sopenharmony_civoid vc4_perfmon_put(struct vc4_perfmon *perfmon) 3362306a36Sopenharmony_ci{ 3462306a36Sopenharmony_ci struct vc4_dev *vc4; 3562306a36Sopenharmony_ci 3662306a36Sopenharmony_ci if (!perfmon) 3762306a36Sopenharmony_ci return; 3862306a36Sopenharmony_ci 3962306a36Sopenharmony_ci vc4 = perfmon->dev; 4062306a36Sopenharmony_ci if (WARN_ON_ONCE(vc4->is_vc5)) 4162306a36Sopenharmony_ci return; 4262306a36Sopenharmony_ci 4362306a36Sopenharmony_ci if (refcount_dec_and_test(&perfmon->refcnt)) 4462306a36Sopenharmony_ci kfree(perfmon); 4562306a36Sopenharmony_ci} 4662306a36Sopenharmony_ci 4762306a36Sopenharmony_civoid vc4_perfmon_start(struct vc4_dev *vc4, struct vc4_perfmon *perfmon) 4862306a36Sopenharmony_ci{ 4962306a36Sopenharmony_ci unsigned int i; 5062306a36Sopenharmony_ci u32 mask; 5162306a36Sopenharmony_ci 5262306a36Sopenharmony_ci if (WARN_ON_ONCE(vc4->is_vc5)) 5362306a36Sopenharmony_ci return; 5462306a36Sopenharmony_ci 5562306a36Sopenharmony_ci if (WARN_ON_ONCE(!perfmon || vc4->active_perfmon)) 5662306a36Sopenharmony_ci return; 5762306a36Sopenharmony_ci 5862306a36Sopenharmony_ci for (i = 0; i < perfmon->ncounters; i++) 5962306a36Sopenharmony_ci V3D_WRITE(V3D_PCTRS(i), perfmon->events[i]); 6062306a36Sopenharmony_ci 6162306a36Sopenharmony_ci mask = GENMASK(perfmon->ncounters - 1, 0); 6262306a36Sopenharmony_ci V3D_WRITE(V3D_PCTRC, mask); 6362306a36Sopenharmony_ci V3D_WRITE(V3D_PCTRE, V3D_PCTRE_EN | mask); 6462306a36Sopenharmony_ci vc4->active_perfmon = perfmon; 6562306a36Sopenharmony_ci} 6662306a36Sopenharmony_ci 6762306a36Sopenharmony_civoid vc4_perfmon_stop(struct vc4_dev *vc4, struct vc4_perfmon *perfmon, 6862306a36Sopenharmony_ci bool capture) 6962306a36Sopenharmony_ci{ 7062306a36Sopenharmony_ci unsigned int i; 7162306a36Sopenharmony_ci 7262306a36Sopenharmony_ci if (WARN_ON_ONCE(vc4->is_vc5)) 7362306a36Sopenharmony_ci return; 7462306a36Sopenharmony_ci 7562306a36Sopenharmony_ci if (WARN_ON_ONCE(!vc4->active_perfmon || 7662306a36Sopenharmony_ci perfmon != vc4->active_perfmon)) 7762306a36Sopenharmony_ci return; 7862306a36Sopenharmony_ci 7962306a36Sopenharmony_ci if (capture) { 8062306a36Sopenharmony_ci for (i = 0; i < perfmon->ncounters; i++) 8162306a36Sopenharmony_ci perfmon->counters[i] += V3D_READ(V3D_PCTR(i)); 8262306a36Sopenharmony_ci } 8362306a36Sopenharmony_ci 8462306a36Sopenharmony_ci V3D_WRITE(V3D_PCTRE, 0); 8562306a36Sopenharmony_ci vc4->active_perfmon = NULL; 8662306a36Sopenharmony_ci} 8762306a36Sopenharmony_ci 8862306a36Sopenharmony_cistruct vc4_perfmon *vc4_perfmon_find(struct vc4_file *vc4file, int id) 8962306a36Sopenharmony_ci{ 9062306a36Sopenharmony_ci struct vc4_dev *vc4 = vc4file->dev; 9162306a36Sopenharmony_ci struct vc4_perfmon *perfmon; 9262306a36Sopenharmony_ci 9362306a36Sopenharmony_ci if (WARN_ON_ONCE(vc4->is_vc5)) 9462306a36Sopenharmony_ci return NULL; 9562306a36Sopenharmony_ci 9662306a36Sopenharmony_ci mutex_lock(&vc4file->perfmon.lock); 9762306a36Sopenharmony_ci perfmon = idr_find(&vc4file->perfmon.idr, id); 9862306a36Sopenharmony_ci vc4_perfmon_get(perfmon); 9962306a36Sopenharmony_ci mutex_unlock(&vc4file->perfmon.lock); 10062306a36Sopenharmony_ci 10162306a36Sopenharmony_ci return perfmon; 10262306a36Sopenharmony_ci} 10362306a36Sopenharmony_ci 10462306a36Sopenharmony_civoid vc4_perfmon_open_file(struct vc4_file *vc4file) 10562306a36Sopenharmony_ci{ 10662306a36Sopenharmony_ci struct vc4_dev *vc4 = vc4file->dev; 10762306a36Sopenharmony_ci 10862306a36Sopenharmony_ci if (WARN_ON_ONCE(vc4->is_vc5)) 10962306a36Sopenharmony_ci return; 11062306a36Sopenharmony_ci 11162306a36Sopenharmony_ci mutex_init(&vc4file->perfmon.lock); 11262306a36Sopenharmony_ci idr_init_base(&vc4file->perfmon.idr, VC4_PERFMONID_MIN); 11362306a36Sopenharmony_ci vc4file->dev = vc4; 11462306a36Sopenharmony_ci} 11562306a36Sopenharmony_ci 11662306a36Sopenharmony_cistatic int vc4_perfmon_idr_del(int id, void *elem, void *data) 11762306a36Sopenharmony_ci{ 11862306a36Sopenharmony_ci struct vc4_perfmon *perfmon = elem; 11962306a36Sopenharmony_ci 12062306a36Sopenharmony_ci vc4_perfmon_put(perfmon); 12162306a36Sopenharmony_ci 12262306a36Sopenharmony_ci return 0; 12362306a36Sopenharmony_ci} 12462306a36Sopenharmony_ci 12562306a36Sopenharmony_civoid vc4_perfmon_close_file(struct vc4_file *vc4file) 12662306a36Sopenharmony_ci{ 12762306a36Sopenharmony_ci struct vc4_dev *vc4 = vc4file->dev; 12862306a36Sopenharmony_ci 12962306a36Sopenharmony_ci if (WARN_ON_ONCE(vc4->is_vc5)) 13062306a36Sopenharmony_ci return; 13162306a36Sopenharmony_ci 13262306a36Sopenharmony_ci mutex_lock(&vc4file->perfmon.lock); 13362306a36Sopenharmony_ci idr_for_each(&vc4file->perfmon.idr, vc4_perfmon_idr_del, NULL); 13462306a36Sopenharmony_ci idr_destroy(&vc4file->perfmon.idr); 13562306a36Sopenharmony_ci mutex_unlock(&vc4file->perfmon.lock); 13662306a36Sopenharmony_ci mutex_destroy(&vc4file->perfmon.lock); 13762306a36Sopenharmony_ci} 13862306a36Sopenharmony_ci 13962306a36Sopenharmony_ciint vc4_perfmon_create_ioctl(struct drm_device *dev, void *data, 14062306a36Sopenharmony_ci struct drm_file *file_priv) 14162306a36Sopenharmony_ci{ 14262306a36Sopenharmony_ci struct vc4_dev *vc4 = to_vc4_dev(dev); 14362306a36Sopenharmony_ci struct vc4_file *vc4file = file_priv->driver_priv; 14462306a36Sopenharmony_ci struct drm_vc4_perfmon_create *req = data; 14562306a36Sopenharmony_ci struct vc4_perfmon *perfmon; 14662306a36Sopenharmony_ci unsigned int i; 14762306a36Sopenharmony_ci int ret; 14862306a36Sopenharmony_ci 14962306a36Sopenharmony_ci if (WARN_ON_ONCE(vc4->is_vc5)) 15062306a36Sopenharmony_ci return -ENODEV; 15162306a36Sopenharmony_ci 15262306a36Sopenharmony_ci if (!vc4->v3d) { 15362306a36Sopenharmony_ci DRM_DEBUG("Creating perfmon no VC4 V3D probed\n"); 15462306a36Sopenharmony_ci return -ENODEV; 15562306a36Sopenharmony_ci } 15662306a36Sopenharmony_ci 15762306a36Sopenharmony_ci /* Number of monitored counters cannot exceed HW limits. */ 15862306a36Sopenharmony_ci if (req->ncounters > DRM_VC4_MAX_PERF_COUNTERS || 15962306a36Sopenharmony_ci !req->ncounters) 16062306a36Sopenharmony_ci return -EINVAL; 16162306a36Sopenharmony_ci 16262306a36Sopenharmony_ci /* Make sure all events are valid. */ 16362306a36Sopenharmony_ci for (i = 0; i < req->ncounters; i++) { 16462306a36Sopenharmony_ci if (req->events[i] >= VC4_PERFCNT_NUM_EVENTS) 16562306a36Sopenharmony_ci return -EINVAL; 16662306a36Sopenharmony_ci } 16762306a36Sopenharmony_ci 16862306a36Sopenharmony_ci perfmon = kzalloc(struct_size(perfmon, counters, req->ncounters), 16962306a36Sopenharmony_ci GFP_KERNEL); 17062306a36Sopenharmony_ci if (!perfmon) 17162306a36Sopenharmony_ci return -ENOMEM; 17262306a36Sopenharmony_ci perfmon->dev = vc4; 17362306a36Sopenharmony_ci 17462306a36Sopenharmony_ci for (i = 0; i < req->ncounters; i++) 17562306a36Sopenharmony_ci perfmon->events[i] = req->events[i]; 17662306a36Sopenharmony_ci 17762306a36Sopenharmony_ci perfmon->ncounters = req->ncounters; 17862306a36Sopenharmony_ci 17962306a36Sopenharmony_ci refcount_set(&perfmon->refcnt, 1); 18062306a36Sopenharmony_ci 18162306a36Sopenharmony_ci mutex_lock(&vc4file->perfmon.lock); 18262306a36Sopenharmony_ci ret = idr_alloc(&vc4file->perfmon.idr, perfmon, VC4_PERFMONID_MIN, 18362306a36Sopenharmony_ci VC4_PERFMONID_MAX, GFP_KERNEL); 18462306a36Sopenharmony_ci mutex_unlock(&vc4file->perfmon.lock); 18562306a36Sopenharmony_ci 18662306a36Sopenharmony_ci if (ret < 0) { 18762306a36Sopenharmony_ci kfree(perfmon); 18862306a36Sopenharmony_ci return ret; 18962306a36Sopenharmony_ci } 19062306a36Sopenharmony_ci 19162306a36Sopenharmony_ci req->id = ret; 19262306a36Sopenharmony_ci return 0; 19362306a36Sopenharmony_ci} 19462306a36Sopenharmony_ci 19562306a36Sopenharmony_ciint vc4_perfmon_destroy_ioctl(struct drm_device *dev, void *data, 19662306a36Sopenharmony_ci struct drm_file *file_priv) 19762306a36Sopenharmony_ci{ 19862306a36Sopenharmony_ci struct vc4_dev *vc4 = to_vc4_dev(dev); 19962306a36Sopenharmony_ci struct vc4_file *vc4file = file_priv->driver_priv; 20062306a36Sopenharmony_ci struct drm_vc4_perfmon_destroy *req = data; 20162306a36Sopenharmony_ci struct vc4_perfmon *perfmon; 20262306a36Sopenharmony_ci 20362306a36Sopenharmony_ci if (WARN_ON_ONCE(vc4->is_vc5)) 20462306a36Sopenharmony_ci return -ENODEV; 20562306a36Sopenharmony_ci 20662306a36Sopenharmony_ci if (!vc4->v3d) { 20762306a36Sopenharmony_ci DRM_DEBUG("Destroying perfmon no VC4 V3D probed\n"); 20862306a36Sopenharmony_ci return -ENODEV; 20962306a36Sopenharmony_ci } 21062306a36Sopenharmony_ci 21162306a36Sopenharmony_ci mutex_lock(&vc4file->perfmon.lock); 21262306a36Sopenharmony_ci perfmon = idr_remove(&vc4file->perfmon.idr, req->id); 21362306a36Sopenharmony_ci mutex_unlock(&vc4file->perfmon.lock); 21462306a36Sopenharmony_ci 21562306a36Sopenharmony_ci if (!perfmon) 21662306a36Sopenharmony_ci return -EINVAL; 21762306a36Sopenharmony_ci 21862306a36Sopenharmony_ci vc4_perfmon_put(perfmon); 21962306a36Sopenharmony_ci return 0; 22062306a36Sopenharmony_ci} 22162306a36Sopenharmony_ci 22262306a36Sopenharmony_ciint vc4_perfmon_get_values_ioctl(struct drm_device *dev, void *data, 22362306a36Sopenharmony_ci struct drm_file *file_priv) 22462306a36Sopenharmony_ci{ 22562306a36Sopenharmony_ci struct vc4_dev *vc4 = to_vc4_dev(dev); 22662306a36Sopenharmony_ci struct vc4_file *vc4file = file_priv->driver_priv; 22762306a36Sopenharmony_ci struct drm_vc4_perfmon_get_values *req = data; 22862306a36Sopenharmony_ci struct vc4_perfmon *perfmon; 22962306a36Sopenharmony_ci int ret; 23062306a36Sopenharmony_ci 23162306a36Sopenharmony_ci if (WARN_ON_ONCE(vc4->is_vc5)) 23262306a36Sopenharmony_ci return -ENODEV; 23362306a36Sopenharmony_ci 23462306a36Sopenharmony_ci if (!vc4->v3d) { 23562306a36Sopenharmony_ci DRM_DEBUG("Getting perfmon no VC4 V3D probed\n"); 23662306a36Sopenharmony_ci return -ENODEV; 23762306a36Sopenharmony_ci } 23862306a36Sopenharmony_ci 23962306a36Sopenharmony_ci mutex_lock(&vc4file->perfmon.lock); 24062306a36Sopenharmony_ci perfmon = idr_find(&vc4file->perfmon.idr, req->id); 24162306a36Sopenharmony_ci vc4_perfmon_get(perfmon); 24262306a36Sopenharmony_ci mutex_unlock(&vc4file->perfmon.lock); 24362306a36Sopenharmony_ci 24462306a36Sopenharmony_ci if (!perfmon) 24562306a36Sopenharmony_ci return -EINVAL; 24662306a36Sopenharmony_ci 24762306a36Sopenharmony_ci if (copy_to_user(u64_to_user_ptr(req->values_ptr), perfmon->counters, 24862306a36Sopenharmony_ci perfmon->ncounters * sizeof(u64))) 24962306a36Sopenharmony_ci ret = -EFAULT; 25062306a36Sopenharmony_ci else 25162306a36Sopenharmony_ci ret = 0; 25262306a36Sopenharmony_ci 25362306a36Sopenharmony_ci vc4_perfmon_put(perfmon); 25462306a36Sopenharmony_ci return ret; 25562306a36Sopenharmony_ci} 256