162306a36Sopenharmony_ci// SPDX-License-Identifier: GPL-2.0+ 262306a36Sopenharmony_ci/* Copyright (C) 2014-2018 Broadcom */ 362306a36Sopenharmony_ci 462306a36Sopenharmony_ci#include <linux/device.h> 562306a36Sopenharmony_ci#include <linux/dma-mapping.h> 662306a36Sopenharmony_ci#include <linux/io.h> 762306a36Sopenharmony_ci#include <linux/module.h> 862306a36Sopenharmony_ci#include <linux/platform_device.h> 962306a36Sopenharmony_ci#include <linux/reset.h> 1062306a36Sopenharmony_ci#include <linux/sched/signal.h> 1162306a36Sopenharmony_ci#include <linux/uaccess.h> 1262306a36Sopenharmony_ci 1362306a36Sopenharmony_ci#include <drm/drm_managed.h> 1462306a36Sopenharmony_ci#include <drm/drm_syncobj.h> 1562306a36Sopenharmony_ci#include <uapi/drm/v3d_drm.h> 1662306a36Sopenharmony_ci 1762306a36Sopenharmony_ci#include "v3d_drv.h" 1862306a36Sopenharmony_ci#include "v3d_regs.h" 1962306a36Sopenharmony_ci#include "v3d_trace.h" 2062306a36Sopenharmony_ci 2162306a36Sopenharmony_cistatic void 2262306a36Sopenharmony_civ3d_init_core(struct v3d_dev *v3d, int core) 2362306a36Sopenharmony_ci{ 2462306a36Sopenharmony_ci /* Set OVRTMUOUT, which means that the texture sampler uniform 2562306a36Sopenharmony_ci * configuration's tmu output type field is used, instead of 2662306a36Sopenharmony_ci * using the hardware default behavior based on the texture 2762306a36Sopenharmony_ci * type. If you want the default behavior, you can still put 2862306a36Sopenharmony_ci * "2" in the indirect texture state's output_type field. 2962306a36Sopenharmony_ci */ 3062306a36Sopenharmony_ci if (v3d->ver < 40) 3162306a36Sopenharmony_ci V3D_CORE_WRITE(core, V3D_CTL_MISCCFG, V3D_MISCCFG_OVRTMUOUT); 3262306a36Sopenharmony_ci 3362306a36Sopenharmony_ci /* Whenever we flush the L2T cache, we always want to flush 3462306a36Sopenharmony_ci * the whole thing. 3562306a36Sopenharmony_ci */ 3662306a36Sopenharmony_ci V3D_CORE_WRITE(core, V3D_CTL_L2TFLSTA, 0); 3762306a36Sopenharmony_ci V3D_CORE_WRITE(core, V3D_CTL_L2TFLEND, ~0); 3862306a36Sopenharmony_ci} 3962306a36Sopenharmony_ci 4062306a36Sopenharmony_ci/* Sets invariant state for the HW. */ 4162306a36Sopenharmony_cistatic void 4262306a36Sopenharmony_civ3d_init_hw_state(struct v3d_dev *v3d) 4362306a36Sopenharmony_ci{ 4462306a36Sopenharmony_ci v3d_init_core(v3d, 0); 4562306a36Sopenharmony_ci} 4662306a36Sopenharmony_ci 4762306a36Sopenharmony_cistatic void 4862306a36Sopenharmony_civ3d_idle_axi(struct v3d_dev *v3d, int core) 4962306a36Sopenharmony_ci{ 5062306a36Sopenharmony_ci V3D_CORE_WRITE(core, V3D_GMP_CFG, V3D_GMP_CFG_STOP_REQ); 5162306a36Sopenharmony_ci 5262306a36Sopenharmony_ci if (wait_for((V3D_CORE_READ(core, V3D_GMP_STATUS) & 5362306a36Sopenharmony_ci (V3D_GMP_STATUS_RD_COUNT_MASK | 5462306a36Sopenharmony_ci V3D_GMP_STATUS_WR_COUNT_MASK | 5562306a36Sopenharmony_ci V3D_GMP_STATUS_CFG_BUSY)) == 0, 100)) { 5662306a36Sopenharmony_ci DRM_ERROR("Failed to wait for safe GMP shutdown\n"); 5762306a36Sopenharmony_ci } 5862306a36Sopenharmony_ci} 5962306a36Sopenharmony_ci 6062306a36Sopenharmony_cistatic void 6162306a36Sopenharmony_civ3d_idle_gca(struct v3d_dev *v3d) 6262306a36Sopenharmony_ci{ 6362306a36Sopenharmony_ci if (v3d->ver >= 41) 6462306a36Sopenharmony_ci return; 6562306a36Sopenharmony_ci 6662306a36Sopenharmony_ci V3D_GCA_WRITE(V3D_GCA_SAFE_SHUTDOWN, V3D_GCA_SAFE_SHUTDOWN_EN); 6762306a36Sopenharmony_ci 6862306a36Sopenharmony_ci if (wait_for((V3D_GCA_READ(V3D_GCA_SAFE_SHUTDOWN_ACK) & 6962306a36Sopenharmony_ci V3D_GCA_SAFE_SHUTDOWN_ACK_ACKED) == 7062306a36Sopenharmony_ci V3D_GCA_SAFE_SHUTDOWN_ACK_ACKED, 100)) { 7162306a36Sopenharmony_ci DRM_ERROR("Failed to wait for safe GCA shutdown\n"); 7262306a36Sopenharmony_ci } 7362306a36Sopenharmony_ci} 7462306a36Sopenharmony_ci 7562306a36Sopenharmony_cistatic void 7662306a36Sopenharmony_civ3d_reset_by_bridge(struct v3d_dev *v3d) 7762306a36Sopenharmony_ci{ 7862306a36Sopenharmony_ci int version = V3D_BRIDGE_READ(V3D_TOP_GR_BRIDGE_REVISION); 7962306a36Sopenharmony_ci 8062306a36Sopenharmony_ci if (V3D_GET_FIELD(version, V3D_TOP_GR_BRIDGE_MAJOR) == 2) { 8162306a36Sopenharmony_ci V3D_BRIDGE_WRITE(V3D_TOP_GR_BRIDGE_SW_INIT_0, 8262306a36Sopenharmony_ci V3D_TOP_GR_BRIDGE_SW_INIT_0_V3D_CLK_108_SW_INIT); 8362306a36Sopenharmony_ci V3D_BRIDGE_WRITE(V3D_TOP_GR_BRIDGE_SW_INIT_0, 0); 8462306a36Sopenharmony_ci 8562306a36Sopenharmony_ci /* GFXH-1383: The SW_INIT may cause a stray write to address 0 8662306a36Sopenharmony_ci * of the unit, so reset it to its power-on value here. 8762306a36Sopenharmony_ci */ 8862306a36Sopenharmony_ci V3D_WRITE(V3D_HUB_AXICFG, V3D_HUB_AXICFG_MAX_LEN_MASK); 8962306a36Sopenharmony_ci } else { 9062306a36Sopenharmony_ci WARN_ON_ONCE(V3D_GET_FIELD(version, 9162306a36Sopenharmony_ci V3D_TOP_GR_BRIDGE_MAJOR) != 7); 9262306a36Sopenharmony_ci V3D_BRIDGE_WRITE(V3D_TOP_GR_BRIDGE_SW_INIT_1, 9362306a36Sopenharmony_ci V3D_TOP_GR_BRIDGE_SW_INIT_1_V3D_CLK_108_SW_INIT); 9462306a36Sopenharmony_ci V3D_BRIDGE_WRITE(V3D_TOP_GR_BRIDGE_SW_INIT_1, 0); 9562306a36Sopenharmony_ci } 9662306a36Sopenharmony_ci} 9762306a36Sopenharmony_ci 9862306a36Sopenharmony_cistatic void 9962306a36Sopenharmony_civ3d_reset_v3d(struct v3d_dev *v3d) 10062306a36Sopenharmony_ci{ 10162306a36Sopenharmony_ci if (v3d->reset) 10262306a36Sopenharmony_ci reset_control_reset(v3d->reset); 10362306a36Sopenharmony_ci else 10462306a36Sopenharmony_ci v3d_reset_by_bridge(v3d); 10562306a36Sopenharmony_ci 10662306a36Sopenharmony_ci v3d_init_hw_state(v3d); 10762306a36Sopenharmony_ci} 10862306a36Sopenharmony_ci 10962306a36Sopenharmony_civoid 11062306a36Sopenharmony_civ3d_reset(struct v3d_dev *v3d) 11162306a36Sopenharmony_ci{ 11262306a36Sopenharmony_ci struct drm_device *dev = &v3d->drm; 11362306a36Sopenharmony_ci 11462306a36Sopenharmony_ci DRM_DEV_ERROR(dev->dev, "Resetting GPU for hang.\n"); 11562306a36Sopenharmony_ci DRM_DEV_ERROR(dev->dev, "V3D_ERR_STAT: 0x%08x\n", 11662306a36Sopenharmony_ci V3D_CORE_READ(0, V3D_ERR_STAT)); 11762306a36Sopenharmony_ci trace_v3d_reset_begin(dev); 11862306a36Sopenharmony_ci 11962306a36Sopenharmony_ci /* XXX: only needed for safe powerdown, not reset. */ 12062306a36Sopenharmony_ci if (false) 12162306a36Sopenharmony_ci v3d_idle_axi(v3d, 0); 12262306a36Sopenharmony_ci 12362306a36Sopenharmony_ci v3d_idle_gca(v3d); 12462306a36Sopenharmony_ci v3d_reset_v3d(v3d); 12562306a36Sopenharmony_ci 12662306a36Sopenharmony_ci v3d_mmu_set_page_table(v3d); 12762306a36Sopenharmony_ci v3d_irq_reset(v3d); 12862306a36Sopenharmony_ci 12962306a36Sopenharmony_ci v3d_perfmon_stop(v3d, v3d->active_perfmon, false); 13062306a36Sopenharmony_ci 13162306a36Sopenharmony_ci trace_v3d_reset_end(dev); 13262306a36Sopenharmony_ci} 13362306a36Sopenharmony_ci 13462306a36Sopenharmony_cistatic void 13562306a36Sopenharmony_civ3d_flush_l3(struct v3d_dev *v3d) 13662306a36Sopenharmony_ci{ 13762306a36Sopenharmony_ci if (v3d->ver < 41) { 13862306a36Sopenharmony_ci u32 gca_ctrl = V3D_GCA_READ(V3D_GCA_CACHE_CTRL); 13962306a36Sopenharmony_ci 14062306a36Sopenharmony_ci V3D_GCA_WRITE(V3D_GCA_CACHE_CTRL, 14162306a36Sopenharmony_ci gca_ctrl | V3D_GCA_CACHE_CTRL_FLUSH); 14262306a36Sopenharmony_ci 14362306a36Sopenharmony_ci if (v3d->ver < 33) { 14462306a36Sopenharmony_ci V3D_GCA_WRITE(V3D_GCA_CACHE_CTRL, 14562306a36Sopenharmony_ci gca_ctrl & ~V3D_GCA_CACHE_CTRL_FLUSH); 14662306a36Sopenharmony_ci } 14762306a36Sopenharmony_ci } 14862306a36Sopenharmony_ci} 14962306a36Sopenharmony_ci 15062306a36Sopenharmony_ci/* Invalidates the (read-only) L2C cache. This was the L2 cache for 15162306a36Sopenharmony_ci * uniforms and instructions on V3D 3.2. 15262306a36Sopenharmony_ci */ 15362306a36Sopenharmony_cistatic void 15462306a36Sopenharmony_civ3d_invalidate_l2c(struct v3d_dev *v3d, int core) 15562306a36Sopenharmony_ci{ 15662306a36Sopenharmony_ci if (v3d->ver > 32) 15762306a36Sopenharmony_ci return; 15862306a36Sopenharmony_ci 15962306a36Sopenharmony_ci V3D_CORE_WRITE(core, V3D_CTL_L2CACTL, 16062306a36Sopenharmony_ci V3D_L2CACTL_L2CCLR | 16162306a36Sopenharmony_ci V3D_L2CACTL_L2CENA); 16262306a36Sopenharmony_ci} 16362306a36Sopenharmony_ci 16462306a36Sopenharmony_ci/* Invalidates texture L2 cachelines */ 16562306a36Sopenharmony_cistatic void 16662306a36Sopenharmony_civ3d_flush_l2t(struct v3d_dev *v3d, int core) 16762306a36Sopenharmony_ci{ 16862306a36Sopenharmony_ci /* While there is a busy bit (V3D_L2TCACTL_L2TFLS), we don't 16962306a36Sopenharmony_ci * need to wait for completion before dispatching the job -- 17062306a36Sopenharmony_ci * L2T accesses will be stalled until the flush has completed. 17162306a36Sopenharmony_ci * However, we do need to make sure we don't try to trigger a 17262306a36Sopenharmony_ci * new flush while the L2_CLEAN queue is trying to 17362306a36Sopenharmony_ci * synchronously clean after a job. 17462306a36Sopenharmony_ci */ 17562306a36Sopenharmony_ci mutex_lock(&v3d->cache_clean_lock); 17662306a36Sopenharmony_ci V3D_CORE_WRITE(core, V3D_CTL_L2TCACTL, 17762306a36Sopenharmony_ci V3D_L2TCACTL_L2TFLS | 17862306a36Sopenharmony_ci V3D_SET_FIELD(V3D_L2TCACTL_FLM_FLUSH, V3D_L2TCACTL_FLM)); 17962306a36Sopenharmony_ci mutex_unlock(&v3d->cache_clean_lock); 18062306a36Sopenharmony_ci} 18162306a36Sopenharmony_ci 18262306a36Sopenharmony_ci/* Cleans texture L1 and L2 cachelines (writing back dirty data). 18362306a36Sopenharmony_ci * 18462306a36Sopenharmony_ci * For cleaning, which happens from the CACHE_CLEAN queue after CSD has 18562306a36Sopenharmony_ci * executed, we need to make sure that the clean is done before 18662306a36Sopenharmony_ci * signaling job completion. So, we synchronously wait before 18762306a36Sopenharmony_ci * returning, and we make sure that L2 invalidates don't happen in the 18862306a36Sopenharmony_ci * meantime to confuse our are-we-done checks. 18962306a36Sopenharmony_ci */ 19062306a36Sopenharmony_civoid 19162306a36Sopenharmony_civ3d_clean_caches(struct v3d_dev *v3d) 19262306a36Sopenharmony_ci{ 19362306a36Sopenharmony_ci struct drm_device *dev = &v3d->drm; 19462306a36Sopenharmony_ci int core = 0; 19562306a36Sopenharmony_ci 19662306a36Sopenharmony_ci trace_v3d_cache_clean_begin(dev); 19762306a36Sopenharmony_ci 19862306a36Sopenharmony_ci V3D_CORE_WRITE(core, V3D_CTL_L2TCACTL, V3D_L2TCACTL_TMUWCF); 19962306a36Sopenharmony_ci if (wait_for(!(V3D_CORE_READ(core, V3D_CTL_L2TCACTL) & 20062306a36Sopenharmony_ci V3D_L2TCACTL_TMUWCF), 100)) { 20162306a36Sopenharmony_ci DRM_ERROR("Timeout waiting for TMU write combiner flush\n"); 20262306a36Sopenharmony_ci } 20362306a36Sopenharmony_ci 20462306a36Sopenharmony_ci mutex_lock(&v3d->cache_clean_lock); 20562306a36Sopenharmony_ci V3D_CORE_WRITE(core, V3D_CTL_L2TCACTL, 20662306a36Sopenharmony_ci V3D_L2TCACTL_L2TFLS | 20762306a36Sopenharmony_ci V3D_SET_FIELD(V3D_L2TCACTL_FLM_CLEAN, V3D_L2TCACTL_FLM)); 20862306a36Sopenharmony_ci 20962306a36Sopenharmony_ci if (wait_for(!(V3D_CORE_READ(core, V3D_CTL_L2TCACTL) & 21062306a36Sopenharmony_ci V3D_L2TCACTL_L2TFLS), 100)) { 21162306a36Sopenharmony_ci DRM_ERROR("Timeout waiting for L2T clean\n"); 21262306a36Sopenharmony_ci } 21362306a36Sopenharmony_ci 21462306a36Sopenharmony_ci mutex_unlock(&v3d->cache_clean_lock); 21562306a36Sopenharmony_ci 21662306a36Sopenharmony_ci trace_v3d_cache_clean_end(dev); 21762306a36Sopenharmony_ci} 21862306a36Sopenharmony_ci 21962306a36Sopenharmony_ci/* Invalidates the slice caches. These are read-only caches. */ 22062306a36Sopenharmony_cistatic void 22162306a36Sopenharmony_civ3d_invalidate_slices(struct v3d_dev *v3d, int core) 22262306a36Sopenharmony_ci{ 22362306a36Sopenharmony_ci V3D_CORE_WRITE(core, V3D_CTL_SLCACTL, 22462306a36Sopenharmony_ci V3D_SET_FIELD(0xf, V3D_SLCACTL_TVCCS) | 22562306a36Sopenharmony_ci V3D_SET_FIELD(0xf, V3D_SLCACTL_TDCCS) | 22662306a36Sopenharmony_ci V3D_SET_FIELD(0xf, V3D_SLCACTL_UCC) | 22762306a36Sopenharmony_ci V3D_SET_FIELD(0xf, V3D_SLCACTL_ICC)); 22862306a36Sopenharmony_ci} 22962306a36Sopenharmony_ci 23062306a36Sopenharmony_civoid 23162306a36Sopenharmony_civ3d_invalidate_caches(struct v3d_dev *v3d) 23262306a36Sopenharmony_ci{ 23362306a36Sopenharmony_ci /* Invalidate the caches from the outside in. That way if 23462306a36Sopenharmony_ci * another CL's concurrent use of nearby memory were to pull 23562306a36Sopenharmony_ci * an invalidated cacheline back in, we wouldn't leave stale 23662306a36Sopenharmony_ci * data in the inner cache. 23762306a36Sopenharmony_ci */ 23862306a36Sopenharmony_ci v3d_flush_l3(v3d); 23962306a36Sopenharmony_ci v3d_invalidate_l2c(v3d, 0); 24062306a36Sopenharmony_ci v3d_flush_l2t(v3d, 0); 24162306a36Sopenharmony_ci v3d_invalidate_slices(v3d, 0); 24262306a36Sopenharmony_ci} 24362306a36Sopenharmony_ci 24462306a36Sopenharmony_ci/* Takes the reservation lock on all the BOs being referenced, so that 24562306a36Sopenharmony_ci * at queue submit time we can update the reservations. 24662306a36Sopenharmony_ci * 24762306a36Sopenharmony_ci * We don't lock the RCL the tile alloc/state BOs, or overflow memory 24862306a36Sopenharmony_ci * (all of which are on exec->unref_list). They're entirely private 24962306a36Sopenharmony_ci * to v3d, so we don't attach dma-buf fences to them. 25062306a36Sopenharmony_ci */ 25162306a36Sopenharmony_cistatic int 25262306a36Sopenharmony_civ3d_lock_bo_reservations(struct v3d_job *job, 25362306a36Sopenharmony_ci struct ww_acquire_ctx *acquire_ctx) 25462306a36Sopenharmony_ci{ 25562306a36Sopenharmony_ci int i, ret; 25662306a36Sopenharmony_ci 25762306a36Sopenharmony_ci ret = drm_gem_lock_reservations(job->bo, job->bo_count, acquire_ctx); 25862306a36Sopenharmony_ci if (ret) 25962306a36Sopenharmony_ci return ret; 26062306a36Sopenharmony_ci 26162306a36Sopenharmony_ci for (i = 0; i < job->bo_count; i++) { 26262306a36Sopenharmony_ci ret = dma_resv_reserve_fences(job->bo[i]->resv, 1); 26362306a36Sopenharmony_ci if (ret) 26462306a36Sopenharmony_ci goto fail; 26562306a36Sopenharmony_ci 26662306a36Sopenharmony_ci ret = drm_sched_job_add_implicit_dependencies(&job->base, 26762306a36Sopenharmony_ci job->bo[i], true); 26862306a36Sopenharmony_ci if (ret) 26962306a36Sopenharmony_ci goto fail; 27062306a36Sopenharmony_ci } 27162306a36Sopenharmony_ci 27262306a36Sopenharmony_ci return 0; 27362306a36Sopenharmony_ci 27462306a36Sopenharmony_cifail: 27562306a36Sopenharmony_ci drm_gem_unlock_reservations(job->bo, job->bo_count, acquire_ctx); 27662306a36Sopenharmony_ci return ret; 27762306a36Sopenharmony_ci} 27862306a36Sopenharmony_ci 27962306a36Sopenharmony_ci/** 28062306a36Sopenharmony_ci * v3d_lookup_bos() - Sets up job->bo[] with the GEM objects 28162306a36Sopenharmony_ci * referenced by the job. 28262306a36Sopenharmony_ci * @dev: DRM device 28362306a36Sopenharmony_ci * @file_priv: DRM file for this fd 28462306a36Sopenharmony_ci * @job: V3D job being set up 28562306a36Sopenharmony_ci * @bo_handles: GEM handles 28662306a36Sopenharmony_ci * @bo_count: Number of GEM handles passed in 28762306a36Sopenharmony_ci * 28862306a36Sopenharmony_ci * The command validator needs to reference BOs by their index within 28962306a36Sopenharmony_ci * the submitted job's BO list. This does the validation of the job's 29062306a36Sopenharmony_ci * BO list and reference counting for the lifetime of the job. 29162306a36Sopenharmony_ci * 29262306a36Sopenharmony_ci * Note that this function doesn't need to unreference the BOs on 29362306a36Sopenharmony_ci * failure, because that will happen at v3d_exec_cleanup() time. 29462306a36Sopenharmony_ci */ 29562306a36Sopenharmony_cistatic int 29662306a36Sopenharmony_civ3d_lookup_bos(struct drm_device *dev, 29762306a36Sopenharmony_ci struct drm_file *file_priv, 29862306a36Sopenharmony_ci struct v3d_job *job, 29962306a36Sopenharmony_ci u64 bo_handles, 30062306a36Sopenharmony_ci u32 bo_count) 30162306a36Sopenharmony_ci{ 30262306a36Sopenharmony_ci job->bo_count = bo_count; 30362306a36Sopenharmony_ci 30462306a36Sopenharmony_ci if (!job->bo_count) { 30562306a36Sopenharmony_ci /* See comment on bo_index for why we have to check 30662306a36Sopenharmony_ci * this. 30762306a36Sopenharmony_ci */ 30862306a36Sopenharmony_ci DRM_DEBUG("Rendering requires BOs\n"); 30962306a36Sopenharmony_ci return -EINVAL; 31062306a36Sopenharmony_ci } 31162306a36Sopenharmony_ci 31262306a36Sopenharmony_ci return drm_gem_objects_lookup(file_priv, 31362306a36Sopenharmony_ci (void __user *)(uintptr_t)bo_handles, 31462306a36Sopenharmony_ci job->bo_count, &job->bo); 31562306a36Sopenharmony_ci} 31662306a36Sopenharmony_ci 31762306a36Sopenharmony_cistatic void 31862306a36Sopenharmony_civ3d_job_free(struct kref *ref) 31962306a36Sopenharmony_ci{ 32062306a36Sopenharmony_ci struct v3d_job *job = container_of(ref, struct v3d_job, refcount); 32162306a36Sopenharmony_ci int i; 32262306a36Sopenharmony_ci 32362306a36Sopenharmony_ci if (job->bo) { 32462306a36Sopenharmony_ci for (i = 0; i < job->bo_count; i++) 32562306a36Sopenharmony_ci drm_gem_object_put(job->bo[i]); 32662306a36Sopenharmony_ci kvfree(job->bo); 32762306a36Sopenharmony_ci } 32862306a36Sopenharmony_ci 32962306a36Sopenharmony_ci dma_fence_put(job->irq_fence); 33062306a36Sopenharmony_ci dma_fence_put(job->done_fence); 33162306a36Sopenharmony_ci 33262306a36Sopenharmony_ci if (job->perfmon) 33362306a36Sopenharmony_ci v3d_perfmon_put(job->perfmon); 33462306a36Sopenharmony_ci 33562306a36Sopenharmony_ci kfree(job); 33662306a36Sopenharmony_ci} 33762306a36Sopenharmony_ci 33862306a36Sopenharmony_cistatic void 33962306a36Sopenharmony_civ3d_render_job_free(struct kref *ref) 34062306a36Sopenharmony_ci{ 34162306a36Sopenharmony_ci struct v3d_render_job *job = container_of(ref, struct v3d_render_job, 34262306a36Sopenharmony_ci base.refcount); 34362306a36Sopenharmony_ci struct v3d_bo *bo, *save; 34462306a36Sopenharmony_ci 34562306a36Sopenharmony_ci list_for_each_entry_safe(bo, save, &job->unref_list, unref_head) { 34662306a36Sopenharmony_ci drm_gem_object_put(&bo->base.base); 34762306a36Sopenharmony_ci } 34862306a36Sopenharmony_ci 34962306a36Sopenharmony_ci v3d_job_free(ref); 35062306a36Sopenharmony_ci} 35162306a36Sopenharmony_ci 35262306a36Sopenharmony_civoid v3d_job_cleanup(struct v3d_job *job) 35362306a36Sopenharmony_ci{ 35462306a36Sopenharmony_ci if (!job) 35562306a36Sopenharmony_ci return; 35662306a36Sopenharmony_ci 35762306a36Sopenharmony_ci drm_sched_job_cleanup(&job->base); 35862306a36Sopenharmony_ci v3d_job_put(job); 35962306a36Sopenharmony_ci} 36062306a36Sopenharmony_ci 36162306a36Sopenharmony_civoid v3d_job_put(struct v3d_job *job) 36262306a36Sopenharmony_ci{ 36362306a36Sopenharmony_ci kref_put(&job->refcount, job->free); 36462306a36Sopenharmony_ci} 36562306a36Sopenharmony_ci 36662306a36Sopenharmony_ciint 36762306a36Sopenharmony_civ3d_wait_bo_ioctl(struct drm_device *dev, void *data, 36862306a36Sopenharmony_ci struct drm_file *file_priv) 36962306a36Sopenharmony_ci{ 37062306a36Sopenharmony_ci int ret; 37162306a36Sopenharmony_ci struct drm_v3d_wait_bo *args = data; 37262306a36Sopenharmony_ci ktime_t start = ktime_get(); 37362306a36Sopenharmony_ci u64 delta_ns; 37462306a36Sopenharmony_ci unsigned long timeout_jiffies = 37562306a36Sopenharmony_ci nsecs_to_jiffies_timeout(args->timeout_ns); 37662306a36Sopenharmony_ci 37762306a36Sopenharmony_ci if (args->pad != 0) 37862306a36Sopenharmony_ci return -EINVAL; 37962306a36Sopenharmony_ci 38062306a36Sopenharmony_ci ret = drm_gem_dma_resv_wait(file_priv, args->handle, 38162306a36Sopenharmony_ci true, timeout_jiffies); 38262306a36Sopenharmony_ci 38362306a36Sopenharmony_ci /* Decrement the user's timeout, in case we got interrupted 38462306a36Sopenharmony_ci * such that the ioctl will be restarted. 38562306a36Sopenharmony_ci */ 38662306a36Sopenharmony_ci delta_ns = ktime_to_ns(ktime_sub(ktime_get(), start)); 38762306a36Sopenharmony_ci if (delta_ns < args->timeout_ns) 38862306a36Sopenharmony_ci args->timeout_ns -= delta_ns; 38962306a36Sopenharmony_ci else 39062306a36Sopenharmony_ci args->timeout_ns = 0; 39162306a36Sopenharmony_ci 39262306a36Sopenharmony_ci /* Asked to wait beyond the jiffie/scheduler precision? */ 39362306a36Sopenharmony_ci if (ret == -ETIME && args->timeout_ns) 39462306a36Sopenharmony_ci ret = -EAGAIN; 39562306a36Sopenharmony_ci 39662306a36Sopenharmony_ci return ret; 39762306a36Sopenharmony_ci} 39862306a36Sopenharmony_ci 39962306a36Sopenharmony_cistatic int 40062306a36Sopenharmony_civ3d_job_init(struct v3d_dev *v3d, struct drm_file *file_priv, 40162306a36Sopenharmony_ci void **container, size_t size, void (*free)(struct kref *ref), 40262306a36Sopenharmony_ci u32 in_sync, struct v3d_submit_ext *se, enum v3d_queue queue) 40362306a36Sopenharmony_ci{ 40462306a36Sopenharmony_ci struct v3d_file_priv *v3d_priv = file_priv->driver_priv; 40562306a36Sopenharmony_ci struct v3d_job *job; 40662306a36Sopenharmony_ci bool has_multisync = se && (se->flags & DRM_V3D_EXT_ID_MULTI_SYNC); 40762306a36Sopenharmony_ci int ret, i; 40862306a36Sopenharmony_ci 40962306a36Sopenharmony_ci *container = kcalloc(1, size, GFP_KERNEL); 41062306a36Sopenharmony_ci if (!*container) { 41162306a36Sopenharmony_ci DRM_ERROR("Cannot allocate memory for v3d job."); 41262306a36Sopenharmony_ci return -ENOMEM; 41362306a36Sopenharmony_ci } 41462306a36Sopenharmony_ci 41562306a36Sopenharmony_ci job = *container; 41662306a36Sopenharmony_ci job->v3d = v3d; 41762306a36Sopenharmony_ci job->free = free; 41862306a36Sopenharmony_ci 41962306a36Sopenharmony_ci ret = drm_sched_job_init(&job->base, &v3d_priv->sched_entity[queue], 42062306a36Sopenharmony_ci v3d_priv); 42162306a36Sopenharmony_ci if (ret) 42262306a36Sopenharmony_ci goto fail; 42362306a36Sopenharmony_ci 42462306a36Sopenharmony_ci if (has_multisync) { 42562306a36Sopenharmony_ci if (se->in_sync_count && se->wait_stage == queue) { 42662306a36Sopenharmony_ci struct drm_v3d_sem __user *handle = u64_to_user_ptr(se->in_syncs); 42762306a36Sopenharmony_ci 42862306a36Sopenharmony_ci for (i = 0; i < se->in_sync_count; i++) { 42962306a36Sopenharmony_ci struct drm_v3d_sem in; 43062306a36Sopenharmony_ci 43162306a36Sopenharmony_ci if (copy_from_user(&in, handle++, sizeof(in))) { 43262306a36Sopenharmony_ci ret = -EFAULT; 43362306a36Sopenharmony_ci DRM_DEBUG("Failed to copy wait dep handle.\n"); 43462306a36Sopenharmony_ci goto fail_deps; 43562306a36Sopenharmony_ci } 43662306a36Sopenharmony_ci ret = drm_sched_job_add_syncobj_dependency(&job->base, file_priv, in.handle, 0); 43762306a36Sopenharmony_ci 43862306a36Sopenharmony_ci // TODO: Investigate why this was filtered out for the IOCTL. 43962306a36Sopenharmony_ci if (ret && ret != -ENOENT) 44062306a36Sopenharmony_ci goto fail_deps; 44162306a36Sopenharmony_ci } 44262306a36Sopenharmony_ci } 44362306a36Sopenharmony_ci } else { 44462306a36Sopenharmony_ci ret = drm_sched_job_add_syncobj_dependency(&job->base, file_priv, in_sync, 0); 44562306a36Sopenharmony_ci 44662306a36Sopenharmony_ci // TODO: Investigate why this was filtered out for the IOCTL. 44762306a36Sopenharmony_ci if (ret && ret != -ENOENT) 44862306a36Sopenharmony_ci goto fail_deps; 44962306a36Sopenharmony_ci } 45062306a36Sopenharmony_ci 45162306a36Sopenharmony_ci kref_init(&job->refcount); 45262306a36Sopenharmony_ci 45362306a36Sopenharmony_ci return 0; 45462306a36Sopenharmony_ci 45562306a36Sopenharmony_cifail_deps: 45662306a36Sopenharmony_ci drm_sched_job_cleanup(&job->base); 45762306a36Sopenharmony_cifail: 45862306a36Sopenharmony_ci kfree(*container); 45962306a36Sopenharmony_ci *container = NULL; 46062306a36Sopenharmony_ci 46162306a36Sopenharmony_ci return ret; 46262306a36Sopenharmony_ci} 46362306a36Sopenharmony_ci 46462306a36Sopenharmony_cistatic void 46562306a36Sopenharmony_civ3d_push_job(struct v3d_job *job) 46662306a36Sopenharmony_ci{ 46762306a36Sopenharmony_ci drm_sched_job_arm(&job->base); 46862306a36Sopenharmony_ci 46962306a36Sopenharmony_ci job->done_fence = dma_fence_get(&job->base.s_fence->finished); 47062306a36Sopenharmony_ci 47162306a36Sopenharmony_ci /* put by scheduler job completion */ 47262306a36Sopenharmony_ci kref_get(&job->refcount); 47362306a36Sopenharmony_ci 47462306a36Sopenharmony_ci drm_sched_entity_push_job(&job->base); 47562306a36Sopenharmony_ci} 47662306a36Sopenharmony_ci 47762306a36Sopenharmony_cistatic void 47862306a36Sopenharmony_civ3d_attach_fences_and_unlock_reservation(struct drm_file *file_priv, 47962306a36Sopenharmony_ci struct v3d_job *job, 48062306a36Sopenharmony_ci struct ww_acquire_ctx *acquire_ctx, 48162306a36Sopenharmony_ci u32 out_sync, 48262306a36Sopenharmony_ci struct v3d_submit_ext *se, 48362306a36Sopenharmony_ci struct dma_fence *done_fence) 48462306a36Sopenharmony_ci{ 48562306a36Sopenharmony_ci struct drm_syncobj *sync_out; 48662306a36Sopenharmony_ci bool has_multisync = se && (se->flags & DRM_V3D_EXT_ID_MULTI_SYNC); 48762306a36Sopenharmony_ci int i; 48862306a36Sopenharmony_ci 48962306a36Sopenharmony_ci for (i = 0; i < job->bo_count; i++) { 49062306a36Sopenharmony_ci /* XXX: Use shared fences for read-only objects. */ 49162306a36Sopenharmony_ci dma_resv_add_fence(job->bo[i]->resv, job->done_fence, 49262306a36Sopenharmony_ci DMA_RESV_USAGE_WRITE); 49362306a36Sopenharmony_ci } 49462306a36Sopenharmony_ci 49562306a36Sopenharmony_ci drm_gem_unlock_reservations(job->bo, job->bo_count, acquire_ctx); 49662306a36Sopenharmony_ci 49762306a36Sopenharmony_ci /* Update the return sync object for the job */ 49862306a36Sopenharmony_ci /* If it only supports a single signal semaphore*/ 49962306a36Sopenharmony_ci if (!has_multisync) { 50062306a36Sopenharmony_ci sync_out = drm_syncobj_find(file_priv, out_sync); 50162306a36Sopenharmony_ci if (sync_out) { 50262306a36Sopenharmony_ci drm_syncobj_replace_fence(sync_out, done_fence); 50362306a36Sopenharmony_ci drm_syncobj_put(sync_out); 50462306a36Sopenharmony_ci } 50562306a36Sopenharmony_ci return; 50662306a36Sopenharmony_ci } 50762306a36Sopenharmony_ci 50862306a36Sopenharmony_ci /* If multiple semaphores extension is supported */ 50962306a36Sopenharmony_ci if (se->out_sync_count) { 51062306a36Sopenharmony_ci for (i = 0; i < se->out_sync_count; i++) { 51162306a36Sopenharmony_ci drm_syncobj_replace_fence(se->out_syncs[i].syncobj, 51262306a36Sopenharmony_ci done_fence); 51362306a36Sopenharmony_ci drm_syncobj_put(se->out_syncs[i].syncobj); 51462306a36Sopenharmony_ci } 51562306a36Sopenharmony_ci kvfree(se->out_syncs); 51662306a36Sopenharmony_ci } 51762306a36Sopenharmony_ci} 51862306a36Sopenharmony_ci 51962306a36Sopenharmony_cistatic void 52062306a36Sopenharmony_civ3d_put_multisync_post_deps(struct v3d_submit_ext *se) 52162306a36Sopenharmony_ci{ 52262306a36Sopenharmony_ci unsigned int i; 52362306a36Sopenharmony_ci 52462306a36Sopenharmony_ci if (!(se && se->out_sync_count)) 52562306a36Sopenharmony_ci return; 52662306a36Sopenharmony_ci 52762306a36Sopenharmony_ci for (i = 0; i < se->out_sync_count; i++) 52862306a36Sopenharmony_ci drm_syncobj_put(se->out_syncs[i].syncobj); 52962306a36Sopenharmony_ci kvfree(se->out_syncs); 53062306a36Sopenharmony_ci} 53162306a36Sopenharmony_ci 53262306a36Sopenharmony_cistatic int 53362306a36Sopenharmony_civ3d_get_multisync_post_deps(struct drm_file *file_priv, 53462306a36Sopenharmony_ci struct v3d_submit_ext *se, 53562306a36Sopenharmony_ci u32 count, u64 handles) 53662306a36Sopenharmony_ci{ 53762306a36Sopenharmony_ci struct drm_v3d_sem __user *post_deps; 53862306a36Sopenharmony_ci int i, ret; 53962306a36Sopenharmony_ci 54062306a36Sopenharmony_ci if (!count) 54162306a36Sopenharmony_ci return 0; 54262306a36Sopenharmony_ci 54362306a36Sopenharmony_ci se->out_syncs = (struct v3d_submit_outsync *) 54462306a36Sopenharmony_ci kvmalloc_array(count, 54562306a36Sopenharmony_ci sizeof(struct v3d_submit_outsync), 54662306a36Sopenharmony_ci GFP_KERNEL); 54762306a36Sopenharmony_ci if (!se->out_syncs) 54862306a36Sopenharmony_ci return -ENOMEM; 54962306a36Sopenharmony_ci 55062306a36Sopenharmony_ci post_deps = u64_to_user_ptr(handles); 55162306a36Sopenharmony_ci 55262306a36Sopenharmony_ci for (i = 0; i < count; i++) { 55362306a36Sopenharmony_ci struct drm_v3d_sem out; 55462306a36Sopenharmony_ci 55562306a36Sopenharmony_ci if (copy_from_user(&out, post_deps++, sizeof(out))) { 55662306a36Sopenharmony_ci ret = -EFAULT; 55762306a36Sopenharmony_ci DRM_DEBUG("Failed to copy post dep handles\n"); 55862306a36Sopenharmony_ci goto fail; 55962306a36Sopenharmony_ci } 56062306a36Sopenharmony_ci 56162306a36Sopenharmony_ci se->out_syncs[i].syncobj = drm_syncobj_find(file_priv, 56262306a36Sopenharmony_ci out.handle); 56362306a36Sopenharmony_ci if (!se->out_syncs[i].syncobj) { 56462306a36Sopenharmony_ci ret = -EINVAL; 56562306a36Sopenharmony_ci goto fail; 56662306a36Sopenharmony_ci } 56762306a36Sopenharmony_ci } 56862306a36Sopenharmony_ci se->out_sync_count = count; 56962306a36Sopenharmony_ci 57062306a36Sopenharmony_ci return 0; 57162306a36Sopenharmony_ci 57262306a36Sopenharmony_cifail: 57362306a36Sopenharmony_ci for (i--; i >= 0; i--) 57462306a36Sopenharmony_ci drm_syncobj_put(se->out_syncs[i].syncobj); 57562306a36Sopenharmony_ci kvfree(se->out_syncs); 57662306a36Sopenharmony_ci 57762306a36Sopenharmony_ci return ret; 57862306a36Sopenharmony_ci} 57962306a36Sopenharmony_ci 58062306a36Sopenharmony_ci/* Get data for multiple binary semaphores synchronization. Parse syncobj 58162306a36Sopenharmony_ci * to be signaled when job completes (out_sync). 58262306a36Sopenharmony_ci */ 58362306a36Sopenharmony_cistatic int 58462306a36Sopenharmony_civ3d_get_multisync_submit_deps(struct drm_file *file_priv, 58562306a36Sopenharmony_ci struct drm_v3d_extension __user *ext, 58662306a36Sopenharmony_ci void *data) 58762306a36Sopenharmony_ci{ 58862306a36Sopenharmony_ci struct drm_v3d_multi_sync multisync; 58962306a36Sopenharmony_ci struct v3d_submit_ext *se = data; 59062306a36Sopenharmony_ci int ret; 59162306a36Sopenharmony_ci 59262306a36Sopenharmony_ci if (copy_from_user(&multisync, ext, sizeof(multisync))) 59362306a36Sopenharmony_ci return -EFAULT; 59462306a36Sopenharmony_ci 59562306a36Sopenharmony_ci if (multisync.pad) 59662306a36Sopenharmony_ci return -EINVAL; 59762306a36Sopenharmony_ci 59862306a36Sopenharmony_ci ret = v3d_get_multisync_post_deps(file_priv, data, multisync.out_sync_count, 59962306a36Sopenharmony_ci multisync.out_syncs); 60062306a36Sopenharmony_ci if (ret) 60162306a36Sopenharmony_ci return ret; 60262306a36Sopenharmony_ci 60362306a36Sopenharmony_ci se->in_sync_count = multisync.in_sync_count; 60462306a36Sopenharmony_ci se->in_syncs = multisync.in_syncs; 60562306a36Sopenharmony_ci se->flags |= DRM_V3D_EXT_ID_MULTI_SYNC; 60662306a36Sopenharmony_ci se->wait_stage = multisync.wait_stage; 60762306a36Sopenharmony_ci 60862306a36Sopenharmony_ci return 0; 60962306a36Sopenharmony_ci} 61062306a36Sopenharmony_ci 61162306a36Sopenharmony_ci/* Whenever userspace sets ioctl extensions, v3d_get_extensions parses data 61262306a36Sopenharmony_ci * according to the extension id (name). 61362306a36Sopenharmony_ci */ 61462306a36Sopenharmony_cistatic int 61562306a36Sopenharmony_civ3d_get_extensions(struct drm_file *file_priv, 61662306a36Sopenharmony_ci u64 ext_handles, 61762306a36Sopenharmony_ci void *data) 61862306a36Sopenharmony_ci{ 61962306a36Sopenharmony_ci struct drm_v3d_extension __user *user_ext; 62062306a36Sopenharmony_ci int ret; 62162306a36Sopenharmony_ci 62262306a36Sopenharmony_ci user_ext = u64_to_user_ptr(ext_handles); 62362306a36Sopenharmony_ci while (user_ext) { 62462306a36Sopenharmony_ci struct drm_v3d_extension ext; 62562306a36Sopenharmony_ci 62662306a36Sopenharmony_ci if (copy_from_user(&ext, user_ext, sizeof(ext))) { 62762306a36Sopenharmony_ci DRM_DEBUG("Failed to copy submit extension\n"); 62862306a36Sopenharmony_ci return -EFAULT; 62962306a36Sopenharmony_ci } 63062306a36Sopenharmony_ci 63162306a36Sopenharmony_ci switch (ext.id) { 63262306a36Sopenharmony_ci case DRM_V3D_EXT_ID_MULTI_SYNC: 63362306a36Sopenharmony_ci ret = v3d_get_multisync_submit_deps(file_priv, user_ext, data); 63462306a36Sopenharmony_ci if (ret) 63562306a36Sopenharmony_ci return ret; 63662306a36Sopenharmony_ci break; 63762306a36Sopenharmony_ci default: 63862306a36Sopenharmony_ci DRM_DEBUG_DRIVER("Unknown extension id: %d\n", ext.id); 63962306a36Sopenharmony_ci return -EINVAL; 64062306a36Sopenharmony_ci } 64162306a36Sopenharmony_ci 64262306a36Sopenharmony_ci user_ext = u64_to_user_ptr(ext.next); 64362306a36Sopenharmony_ci } 64462306a36Sopenharmony_ci 64562306a36Sopenharmony_ci return 0; 64662306a36Sopenharmony_ci} 64762306a36Sopenharmony_ci 64862306a36Sopenharmony_ci/** 64962306a36Sopenharmony_ci * v3d_submit_cl_ioctl() - Submits a job (frame) to the V3D. 65062306a36Sopenharmony_ci * @dev: DRM device 65162306a36Sopenharmony_ci * @data: ioctl argument 65262306a36Sopenharmony_ci * @file_priv: DRM file for this fd 65362306a36Sopenharmony_ci * 65462306a36Sopenharmony_ci * This is the main entrypoint for userspace to submit a 3D frame to 65562306a36Sopenharmony_ci * the GPU. Userspace provides the binner command list (if 65662306a36Sopenharmony_ci * applicable), and the kernel sets up the render command list to draw 65762306a36Sopenharmony_ci * to the framebuffer described in the ioctl, using the command lists 65862306a36Sopenharmony_ci * that the 3D engine's binner will produce. 65962306a36Sopenharmony_ci */ 66062306a36Sopenharmony_ciint 66162306a36Sopenharmony_civ3d_submit_cl_ioctl(struct drm_device *dev, void *data, 66262306a36Sopenharmony_ci struct drm_file *file_priv) 66362306a36Sopenharmony_ci{ 66462306a36Sopenharmony_ci struct v3d_dev *v3d = to_v3d_dev(dev); 66562306a36Sopenharmony_ci struct v3d_file_priv *v3d_priv = file_priv->driver_priv; 66662306a36Sopenharmony_ci struct drm_v3d_submit_cl *args = data; 66762306a36Sopenharmony_ci struct v3d_submit_ext se = {0}; 66862306a36Sopenharmony_ci struct v3d_bin_job *bin = NULL; 66962306a36Sopenharmony_ci struct v3d_render_job *render = NULL; 67062306a36Sopenharmony_ci struct v3d_job *clean_job = NULL; 67162306a36Sopenharmony_ci struct v3d_job *last_job; 67262306a36Sopenharmony_ci struct ww_acquire_ctx acquire_ctx; 67362306a36Sopenharmony_ci int ret = 0; 67462306a36Sopenharmony_ci 67562306a36Sopenharmony_ci trace_v3d_submit_cl_ioctl(&v3d->drm, args->rcl_start, args->rcl_end); 67662306a36Sopenharmony_ci 67762306a36Sopenharmony_ci if (args->pad) 67862306a36Sopenharmony_ci return -EINVAL; 67962306a36Sopenharmony_ci 68062306a36Sopenharmony_ci if (args->flags && 68162306a36Sopenharmony_ci args->flags & ~(DRM_V3D_SUBMIT_CL_FLUSH_CACHE | 68262306a36Sopenharmony_ci DRM_V3D_SUBMIT_EXTENSION)) { 68362306a36Sopenharmony_ci DRM_INFO("invalid flags: %d\n", args->flags); 68462306a36Sopenharmony_ci return -EINVAL; 68562306a36Sopenharmony_ci } 68662306a36Sopenharmony_ci 68762306a36Sopenharmony_ci if (args->flags & DRM_V3D_SUBMIT_EXTENSION) { 68862306a36Sopenharmony_ci ret = v3d_get_extensions(file_priv, args->extensions, &se); 68962306a36Sopenharmony_ci if (ret) { 69062306a36Sopenharmony_ci DRM_DEBUG("Failed to get extensions.\n"); 69162306a36Sopenharmony_ci return ret; 69262306a36Sopenharmony_ci } 69362306a36Sopenharmony_ci } 69462306a36Sopenharmony_ci 69562306a36Sopenharmony_ci ret = v3d_job_init(v3d, file_priv, (void *)&render, sizeof(*render), 69662306a36Sopenharmony_ci v3d_render_job_free, args->in_sync_rcl, &se, V3D_RENDER); 69762306a36Sopenharmony_ci if (ret) 69862306a36Sopenharmony_ci goto fail; 69962306a36Sopenharmony_ci 70062306a36Sopenharmony_ci render->start = args->rcl_start; 70162306a36Sopenharmony_ci render->end = args->rcl_end; 70262306a36Sopenharmony_ci INIT_LIST_HEAD(&render->unref_list); 70362306a36Sopenharmony_ci 70462306a36Sopenharmony_ci if (args->bcl_start != args->bcl_end) { 70562306a36Sopenharmony_ci ret = v3d_job_init(v3d, file_priv, (void *)&bin, sizeof(*bin), 70662306a36Sopenharmony_ci v3d_job_free, args->in_sync_bcl, &se, V3D_BIN); 70762306a36Sopenharmony_ci if (ret) 70862306a36Sopenharmony_ci goto fail; 70962306a36Sopenharmony_ci 71062306a36Sopenharmony_ci bin->start = args->bcl_start; 71162306a36Sopenharmony_ci bin->end = args->bcl_end; 71262306a36Sopenharmony_ci bin->qma = args->qma; 71362306a36Sopenharmony_ci bin->qms = args->qms; 71462306a36Sopenharmony_ci bin->qts = args->qts; 71562306a36Sopenharmony_ci bin->render = render; 71662306a36Sopenharmony_ci } 71762306a36Sopenharmony_ci 71862306a36Sopenharmony_ci if (args->flags & DRM_V3D_SUBMIT_CL_FLUSH_CACHE) { 71962306a36Sopenharmony_ci ret = v3d_job_init(v3d, file_priv, (void *)&clean_job, sizeof(*clean_job), 72062306a36Sopenharmony_ci v3d_job_free, 0, NULL, V3D_CACHE_CLEAN); 72162306a36Sopenharmony_ci if (ret) 72262306a36Sopenharmony_ci goto fail; 72362306a36Sopenharmony_ci 72462306a36Sopenharmony_ci last_job = clean_job; 72562306a36Sopenharmony_ci } else { 72662306a36Sopenharmony_ci last_job = &render->base; 72762306a36Sopenharmony_ci } 72862306a36Sopenharmony_ci 72962306a36Sopenharmony_ci ret = v3d_lookup_bos(dev, file_priv, last_job, 73062306a36Sopenharmony_ci args->bo_handles, args->bo_handle_count); 73162306a36Sopenharmony_ci if (ret) 73262306a36Sopenharmony_ci goto fail; 73362306a36Sopenharmony_ci 73462306a36Sopenharmony_ci ret = v3d_lock_bo_reservations(last_job, &acquire_ctx); 73562306a36Sopenharmony_ci if (ret) 73662306a36Sopenharmony_ci goto fail; 73762306a36Sopenharmony_ci 73862306a36Sopenharmony_ci if (args->perfmon_id) { 73962306a36Sopenharmony_ci render->base.perfmon = v3d_perfmon_find(v3d_priv, 74062306a36Sopenharmony_ci args->perfmon_id); 74162306a36Sopenharmony_ci 74262306a36Sopenharmony_ci if (!render->base.perfmon) { 74362306a36Sopenharmony_ci ret = -ENOENT; 74462306a36Sopenharmony_ci goto fail_perfmon; 74562306a36Sopenharmony_ci } 74662306a36Sopenharmony_ci } 74762306a36Sopenharmony_ci 74862306a36Sopenharmony_ci mutex_lock(&v3d->sched_lock); 74962306a36Sopenharmony_ci if (bin) { 75062306a36Sopenharmony_ci bin->base.perfmon = render->base.perfmon; 75162306a36Sopenharmony_ci v3d_perfmon_get(bin->base.perfmon); 75262306a36Sopenharmony_ci v3d_push_job(&bin->base); 75362306a36Sopenharmony_ci 75462306a36Sopenharmony_ci ret = drm_sched_job_add_dependency(&render->base.base, 75562306a36Sopenharmony_ci dma_fence_get(bin->base.done_fence)); 75662306a36Sopenharmony_ci if (ret) 75762306a36Sopenharmony_ci goto fail_unreserve; 75862306a36Sopenharmony_ci } 75962306a36Sopenharmony_ci 76062306a36Sopenharmony_ci v3d_push_job(&render->base); 76162306a36Sopenharmony_ci 76262306a36Sopenharmony_ci if (clean_job) { 76362306a36Sopenharmony_ci struct dma_fence *render_fence = 76462306a36Sopenharmony_ci dma_fence_get(render->base.done_fence); 76562306a36Sopenharmony_ci ret = drm_sched_job_add_dependency(&clean_job->base, 76662306a36Sopenharmony_ci render_fence); 76762306a36Sopenharmony_ci if (ret) 76862306a36Sopenharmony_ci goto fail_unreserve; 76962306a36Sopenharmony_ci clean_job->perfmon = render->base.perfmon; 77062306a36Sopenharmony_ci v3d_perfmon_get(clean_job->perfmon); 77162306a36Sopenharmony_ci v3d_push_job(clean_job); 77262306a36Sopenharmony_ci } 77362306a36Sopenharmony_ci 77462306a36Sopenharmony_ci mutex_unlock(&v3d->sched_lock); 77562306a36Sopenharmony_ci 77662306a36Sopenharmony_ci v3d_attach_fences_and_unlock_reservation(file_priv, 77762306a36Sopenharmony_ci last_job, 77862306a36Sopenharmony_ci &acquire_ctx, 77962306a36Sopenharmony_ci args->out_sync, 78062306a36Sopenharmony_ci &se, 78162306a36Sopenharmony_ci last_job->done_fence); 78262306a36Sopenharmony_ci 78362306a36Sopenharmony_ci if (bin) 78462306a36Sopenharmony_ci v3d_job_put(&bin->base); 78562306a36Sopenharmony_ci v3d_job_put(&render->base); 78662306a36Sopenharmony_ci if (clean_job) 78762306a36Sopenharmony_ci v3d_job_put(clean_job); 78862306a36Sopenharmony_ci 78962306a36Sopenharmony_ci return 0; 79062306a36Sopenharmony_ci 79162306a36Sopenharmony_cifail_unreserve: 79262306a36Sopenharmony_ci mutex_unlock(&v3d->sched_lock); 79362306a36Sopenharmony_cifail_perfmon: 79462306a36Sopenharmony_ci drm_gem_unlock_reservations(last_job->bo, 79562306a36Sopenharmony_ci last_job->bo_count, &acquire_ctx); 79662306a36Sopenharmony_cifail: 79762306a36Sopenharmony_ci v3d_job_cleanup((void *)bin); 79862306a36Sopenharmony_ci v3d_job_cleanup((void *)render); 79962306a36Sopenharmony_ci v3d_job_cleanup(clean_job); 80062306a36Sopenharmony_ci v3d_put_multisync_post_deps(&se); 80162306a36Sopenharmony_ci 80262306a36Sopenharmony_ci return ret; 80362306a36Sopenharmony_ci} 80462306a36Sopenharmony_ci 80562306a36Sopenharmony_ci/** 80662306a36Sopenharmony_ci * v3d_submit_tfu_ioctl() - Submits a TFU (texture formatting) job to the V3D. 80762306a36Sopenharmony_ci * @dev: DRM device 80862306a36Sopenharmony_ci * @data: ioctl argument 80962306a36Sopenharmony_ci * @file_priv: DRM file for this fd 81062306a36Sopenharmony_ci * 81162306a36Sopenharmony_ci * Userspace provides the register setup for the TFU, which we don't 81262306a36Sopenharmony_ci * need to validate since the TFU is behind the MMU. 81362306a36Sopenharmony_ci */ 81462306a36Sopenharmony_ciint 81562306a36Sopenharmony_civ3d_submit_tfu_ioctl(struct drm_device *dev, void *data, 81662306a36Sopenharmony_ci struct drm_file *file_priv) 81762306a36Sopenharmony_ci{ 81862306a36Sopenharmony_ci struct v3d_dev *v3d = to_v3d_dev(dev); 81962306a36Sopenharmony_ci struct drm_v3d_submit_tfu *args = data; 82062306a36Sopenharmony_ci struct v3d_submit_ext se = {0}; 82162306a36Sopenharmony_ci struct v3d_tfu_job *job = NULL; 82262306a36Sopenharmony_ci struct ww_acquire_ctx acquire_ctx; 82362306a36Sopenharmony_ci int ret = 0; 82462306a36Sopenharmony_ci 82562306a36Sopenharmony_ci trace_v3d_submit_tfu_ioctl(&v3d->drm, args->iia); 82662306a36Sopenharmony_ci 82762306a36Sopenharmony_ci if (args->flags && !(args->flags & DRM_V3D_SUBMIT_EXTENSION)) { 82862306a36Sopenharmony_ci DRM_DEBUG("invalid flags: %d\n", args->flags); 82962306a36Sopenharmony_ci return -EINVAL; 83062306a36Sopenharmony_ci } 83162306a36Sopenharmony_ci 83262306a36Sopenharmony_ci if (args->flags & DRM_V3D_SUBMIT_EXTENSION) { 83362306a36Sopenharmony_ci ret = v3d_get_extensions(file_priv, args->extensions, &se); 83462306a36Sopenharmony_ci if (ret) { 83562306a36Sopenharmony_ci DRM_DEBUG("Failed to get extensions.\n"); 83662306a36Sopenharmony_ci return ret; 83762306a36Sopenharmony_ci } 83862306a36Sopenharmony_ci } 83962306a36Sopenharmony_ci 84062306a36Sopenharmony_ci ret = v3d_job_init(v3d, file_priv, (void *)&job, sizeof(*job), 84162306a36Sopenharmony_ci v3d_job_free, args->in_sync, &se, V3D_TFU); 84262306a36Sopenharmony_ci if (ret) 84362306a36Sopenharmony_ci goto fail; 84462306a36Sopenharmony_ci 84562306a36Sopenharmony_ci job->base.bo = kcalloc(ARRAY_SIZE(args->bo_handles), 84662306a36Sopenharmony_ci sizeof(*job->base.bo), GFP_KERNEL); 84762306a36Sopenharmony_ci if (!job->base.bo) { 84862306a36Sopenharmony_ci ret = -ENOMEM; 84962306a36Sopenharmony_ci goto fail; 85062306a36Sopenharmony_ci } 85162306a36Sopenharmony_ci 85262306a36Sopenharmony_ci job->args = *args; 85362306a36Sopenharmony_ci 85462306a36Sopenharmony_ci for (job->base.bo_count = 0; 85562306a36Sopenharmony_ci job->base.bo_count < ARRAY_SIZE(args->bo_handles); 85662306a36Sopenharmony_ci job->base.bo_count++) { 85762306a36Sopenharmony_ci struct drm_gem_object *bo; 85862306a36Sopenharmony_ci 85962306a36Sopenharmony_ci if (!args->bo_handles[job->base.bo_count]) 86062306a36Sopenharmony_ci break; 86162306a36Sopenharmony_ci 86262306a36Sopenharmony_ci bo = drm_gem_object_lookup(file_priv, args->bo_handles[job->base.bo_count]); 86362306a36Sopenharmony_ci if (!bo) { 86462306a36Sopenharmony_ci DRM_DEBUG("Failed to look up GEM BO %d: %d\n", 86562306a36Sopenharmony_ci job->base.bo_count, 86662306a36Sopenharmony_ci args->bo_handles[job->base.bo_count]); 86762306a36Sopenharmony_ci ret = -ENOENT; 86862306a36Sopenharmony_ci goto fail; 86962306a36Sopenharmony_ci } 87062306a36Sopenharmony_ci job->base.bo[job->base.bo_count] = bo; 87162306a36Sopenharmony_ci } 87262306a36Sopenharmony_ci 87362306a36Sopenharmony_ci ret = v3d_lock_bo_reservations(&job->base, &acquire_ctx); 87462306a36Sopenharmony_ci if (ret) 87562306a36Sopenharmony_ci goto fail; 87662306a36Sopenharmony_ci 87762306a36Sopenharmony_ci mutex_lock(&v3d->sched_lock); 87862306a36Sopenharmony_ci v3d_push_job(&job->base); 87962306a36Sopenharmony_ci mutex_unlock(&v3d->sched_lock); 88062306a36Sopenharmony_ci 88162306a36Sopenharmony_ci v3d_attach_fences_and_unlock_reservation(file_priv, 88262306a36Sopenharmony_ci &job->base, &acquire_ctx, 88362306a36Sopenharmony_ci args->out_sync, 88462306a36Sopenharmony_ci &se, 88562306a36Sopenharmony_ci job->base.done_fence); 88662306a36Sopenharmony_ci 88762306a36Sopenharmony_ci v3d_job_put(&job->base); 88862306a36Sopenharmony_ci 88962306a36Sopenharmony_ci return 0; 89062306a36Sopenharmony_ci 89162306a36Sopenharmony_cifail: 89262306a36Sopenharmony_ci v3d_job_cleanup((void *)job); 89362306a36Sopenharmony_ci v3d_put_multisync_post_deps(&se); 89462306a36Sopenharmony_ci 89562306a36Sopenharmony_ci return ret; 89662306a36Sopenharmony_ci} 89762306a36Sopenharmony_ci 89862306a36Sopenharmony_ci/** 89962306a36Sopenharmony_ci * v3d_submit_csd_ioctl() - Submits a CSD (texture formatting) job to the V3D. 90062306a36Sopenharmony_ci * @dev: DRM device 90162306a36Sopenharmony_ci * @data: ioctl argument 90262306a36Sopenharmony_ci * @file_priv: DRM file for this fd 90362306a36Sopenharmony_ci * 90462306a36Sopenharmony_ci * Userspace provides the register setup for the CSD, which we don't 90562306a36Sopenharmony_ci * need to validate since the CSD is behind the MMU. 90662306a36Sopenharmony_ci */ 90762306a36Sopenharmony_ciint 90862306a36Sopenharmony_civ3d_submit_csd_ioctl(struct drm_device *dev, void *data, 90962306a36Sopenharmony_ci struct drm_file *file_priv) 91062306a36Sopenharmony_ci{ 91162306a36Sopenharmony_ci struct v3d_dev *v3d = to_v3d_dev(dev); 91262306a36Sopenharmony_ci struct v3d_file_priv *v3d_priv = file_priv->driver_priv; 91362306a36Sopenharmony_ci struct drm_v3d_submit_csd *args = data; 91462306a36Sopenharmony_ci struct v3d_submit_ext se = {0}; 91562306a36Sopenharmony_ci struct v3d_csd_job *job = NULL; 91662306a36Sopenharmony_ci struct v3d_job *clean_job = NULL; 91762306a36Sopenharmony_ci struct ww_acquire_ctx acquire_ctx; 91862306a36Sopenharmony_ci int ret; 91962306a36Sopenharmony_ci 92062306a36Sopenharmony_ci trace_v3d_submit_csd_ioctl(&v3d->drm, args->cfg[5], args->cfg[6]); 92162306a36Sopenharmony_ci 92262306a36Sopenharmony_ci if (args->pad) 92362306a36Sopenharmony_ci return -EINVAL; 92462306a36Sopenharmony_ci 92562306a36Sopenharmony_ci if (!v3d_has_csd(v3d)) { 92662306a36Sopenharmony_ci DRM_DEBUG("Attempting CSD submit on non-CSD hardware\n"); 92762306a36Sopenharmony_ci return -EINVAL; 92862306a36Sopenharmony_ci } 92962306a36Sopenharmony_ci 93062306a36Sopenharmony_ci if (args->flags && !(args->flags & DRM_V3D_SUBMIT_EXTENSION)) { 93162306a36Sopenharmony_ci DRM_INFO("invalid flags: %d\n", args->flags); 93262306a36Sopenharmony_ci return -EINVAL; 93362306a36Sopenharmony_ci } 93462306a36Sopenharmony_ci 93562306a36Sopenharmony_ci if (args->flags & DRM_V3D_SUBMIT_EXTENSION) { 93662306a36Sopenharmony_ci ret = v3d_get_extensions(file_priv, args->extensions, &se); 93762306a36Sopenharmony_ci if (ret) { 93862306a36Sopenharmony_ci DRM_DEBUG("Failed to get extensions.\n"); 93962306a36Sopenharmony_ci return ret; 94062306a36Sopenharmony_ci } 94162306a36Sopenharmony_ci } 94262306a36Sopenharmony_ci 94362306a36Sopenharmony_ci ret = v3d_job_init(v3d, file_priv, (void *)&job, sizeof(*job), 94462306a36Sopenharmony_ci v3d_job_free, args->in_sync, &se, V3D_CSD); 94562306a36Sopenharmony_ci if (ret) 94662306a36Sopenharmony_ci goto fail; 94762306a36Sopenharmony_ci 94862306a36Sopenharmony_ci ret = v3d_job_init(v3d, file_priv, (void *)&clean_job, sizeof(*clean_job), 94962306a36Sopenharmony_ci v3d_job_free, 0, NULL, V3D_CACHE_CLEAN); 95062306a36Sopenharmony_ci if (ret) 95162306a36Sopenharmony_ci goto fail; 95262306a36Sopenharmony_ci 95362306a36Sopenharmony_ci job->args = *args; 95462306a36Sopenharmony_ci 95562306a36Sopenharmony_ci ret = v3d_lookup_bos(dev, file_priv, clean_job, 95662306a36Sopenharmony_ci args->bo_handles, args->bo_handle_count); 95762306a36Sopenharmony_ci if (ret) 95862306a36Sopenharmony_ci goto fail; 95962306a36Sopenharmony_ci 96062306a36Sopenharmony_ci ret = v3d_lock_bo_reservations(clean_job, &acquire_ctx); 96162306a36Sopenharmony_ci if (ret) 96262306a36Sopenharmony_ci goto fail; 96362306a36Sopenharmony_ci 96462306a36Sopenharmony_ci if (args->perfmon_id) { 96562306a36Sopenharmony_ci job->base.perfmon = v3d_perfmon_find(v3d_priv, 96662306a36Sopenharmony_ci args->perfmon_id); 96762306a36Sopenharmony_ci if (!job->base.perfmon) { 96862306a36Sopenharmony_ci ret = -ENOENT; 96962306a36Sopenharmony_ci goto fail_perfmon; 97062306a36Sopenharmony_ci } 97162306a36Sopenharmony_ci } 97262306a36Sopenharmony_ci 97362306a36Sopenharmony_ci mutex_lock(&v3d->sched_lock); 97462306a36Sopenharmony_ci v3d_push_job(&job->base); 97562306a36Sopenharmony_ci 97662306a36Sopenharmony_ci ret = drm_sched_job_add_dependency(&clean_job->base, 97762306a36Sopenharmony_ci dma_fence_get(job->base.done_fence)); 97862306a36Sopenharmony_ci if (ret) 97962306a36Sopenharmony_ci goto fail_unreserve; 98062306a36Sopenharmony_ci 98162306a36Sopenharmony_ci v3d_push_job(clean_job); 98262306a36Sopenharmony_ci mutex_unlock(&v3d->sched_lock); 98362306a36Sopenharmony_ci 98462306a36Sopenharmony_ci v3d_attach_fences_and_unlock_reservation(file_priv, 98562306a36Sopenharmony_ci clean_job, 98662306a36Sopenharmony_ci &acquire_ctx, 98762306a36Sopenharmony_ci args->out_sync, 98862306a36Sopenharmony_ci &se, 98962306a36Sopenharmony_ci clean_job->done_fence); 99062306a36Sopenharmony_ci 99162306a36Sopenharmony_ci v3d_job_put(&job->base); 99262306a36Sopenharmony_ci v3d_job_put(clean_job); 99362306a36Sopenharmony_ci 99462306a36Sopenharmony_ci return 0; 99562306a36Sopenharmony_ci 99662306a36Sopenharmony_cifail_unreserve: 99762306a36Sopenharmony_ci mutex_unlock(&v3d->sched_lock); 99862306a36Sopenharmony_cifail_perfmon: 99962306a36Sopenharmony_ci drm_gem_unlock_reservations(clean_job->bo, clean_job->bo_count, 100062306a36Sopenharmony_ci &acquire_ctx); 100162306a36Sopenharmony_cifail: 100262306a36Sopenharmony_ci v3d_job_cleanup((void *)job); 100362306a36Sopenharmony_ci v3d_job_cleanup(clean_job); 100462306a36Sopenharmony_ci v3d_put_multisync_post_deps(&se); 100562306a36Sopenharmony_ci 100662306a36Sopenharmony_ci return ret; 100762306a36Sopenharmony_ci} 100862306a36Sopenharmony_ci 100962306a36Sopenharmony_ciint 101062306a36Sopenharmony_civ3d_gem_init(struct drm_device *dev) 101162306a36Sopenharmony_ci{ 101262306a36Sopenharmony_ci struct v3d_dev *v3d = to_v3d_dev(dev); 101362306a36Sopenharmony_ci u32 pt_size = 4096 * 1024; 101462306a36Sopenharmony_ci int ret, i; 101562306a36Sopenharmony_ci 101662306a36Sopenharmony_ci for (i = 0; i < V3D_MAX_QUEUES; i++) 101762306a36Sopenharmony_ci v3d->queue[i].fence_context = dma_fence_context_alloc(1); 101862306a36Sopenharmony_ci 101962306a36Sopenharmony_ci spin_lock_init(&v3d->mm_lock); 102062306a36Sopenharmony_ci spin_lock_init(&v3d->job_lock); 102162306a36Sopenharmony_ci ret = drmm_mutex_init(dev, &v3d->bo_lock); 102262306a36Sopenharmony_ci if (ret) 102362306a36Sopenharmony_ci return ret; 102462306a36Sopenharmony_ci ret = drmm_mutex_init(dev, &v3d->reset_lock); 102562306a36Sopenharmony_ci if (ret) 102662306a36Sopenharmony_ci return ret; 102762306a36Sopenharmony_ci ret = drmm_mutex_init(dev, &v3d->sched_lock); 102862306a36Sopenharmony_ci if (ret) 102962306a36Sopenharmony_ci return ret; 103062306a36Sopenharmony_ci ret = drmm_mutex_init(dev, &v3d->cache_clean_lock); 103162306a36Sopenharmony_ci if (ret) 103262306a36Sopenharmony_ci return ret; 103362306a36Sopenharmony_ci 103462306a36Sopenharmony_ci /* Note: We don't allocate address 0. Various bits of HW 103562306a36Sopenharmony_ci * treat 0 as special, such as the occlusion query counters 103662306a36Sopenharmony_ci * where 0 means "disabled". 103762306a36Sopenharmony_ci */ 103862306a36Sopenharmony_ci drm_mm_init(&v3d->mm, 1, pt_size / sizeof(u32) - 1); 103962306a36Sopenharmony_ci 104062306a36Sopenharmony_ci v3d->pt = dma_alloc_wc(v3d->drm.dev, pt_size, 104162306a36Sopenharmony_ci &v3d->pt_paddr, 104262306a36Sopenharmony_ci GFP_KERNEL | __GFP_NOWARN | __GFP_ZERO); 104362306a36Sopenharmony_ci if (!v3d->pt) { 104462306a36Sopenharmony_ci drm_mm_takedown(&v3d->mm); 104562306a36Sopenharmony_ci dev_err(v3d->drm.dev, 104662306a36Sopenharmony_ci "Failed to allocate page tables. Please ensure you have DMA enabled.\n"); 104762306a36Sopenharmony_ci return -ENOMEM; 104862306a36Sopenharmony_ci } 104962306a36Sopenharmony_ci 105062306a36Sopenharmony_ci v3d_init_hw_state(v3d); 105162306a36Sopenharmony_ci v3d_mmu_set_page_table(v3d); 105262306a36Sopenharmony_ci 105362306a36Sopenharmony_ci ret = v3d_sched_init(v3d); 105462306a36Sopenharmony_ci if (ret) { 105562306a36Sopenharmony_ci drm_mm_takedown(&v3d->mm); 105662306a36Sopenharmony_ci dma_free_coherent(v3d->drm.dev, 4096 * 1024, (void *)v3d->pt, 105762306a36Sopenharmony_ci v3d->pt_paddr); 105862306a36Sopenharmony_ci } 105962306a36Sopenharmony_ci 106062306a36Sopenharmony_ci return 0; 106162306a36Sopenharmony_ci} 106262306a36Sopenharmony_ci 106362306a36Sopenharmony_civoid 106462306a36Sopenharmony_civ3d_gem_destroy(struct drm_device *dev) 106562306a36Sopenharmony_ci{ 106662306a36Sopenharmony_ci struct v3d_dev *v3d = to_v3d_dev(dev); 106762306a36Sopenharmony_ci 106862306a36Sopenharmony_ci v3d_sched_fini(v3d); 106962306a36Sopenharmony_ci 107062306a36Sopenharmony_ci /* Waiting for jobs to finish would need to be done before 107162306a36Sopenharmony_ci * unregistering V3D. 107262306a36Sopenharmony_ci */ 107362306a36Sopenharmony_ci WARN_ON(v3d->bin_job); 107462306a36Sopenharmony_ci WARN_ON(v3d->render_job); 107562306a36Sopenharmony_ci 107662306a36Sopenharmony_ci drm_mm_takedown(&v3d->mm); 107762306a36Sopenharmony_ci 107862306a36Sopenharmony_ci dma_free_coherent(v3d->drm.dev, 4096 * 1024, (void *)v3d->pt, 107962306a36Sopenharmony_ci v3d->pt_paddr); 108062306a36Sopenharmony_ci} 1081