162306a36Sopenharmony_ci/* 262306a36Sopenharmony_ci * Copyright © 2016 Intel Corporation 362306a36Sopenharmony_ci * 462306a36Sopenharmony_ci * Permission is hereby granted, free of charge, to any person obtaining a 562306a36Sopenharmony_ci * copy of this software and associated documentation files (the "Software"), 662306a36Sopenharmony_ci * to deal in the Software without restriction, including without limitation 762306a36Sopenharmony_ci * the rights to use, copy, modify, merge, publish, distribute, sublicense, 862306a36Sopenharmony_ci * and/or sell copies of the Software, and to permit persons to whom the 962306a36Sopenharmony_ci * Software is furnished to do so, subject to the following conditions: 1062306a36Sopenharmony_ci * 1162306a36Sopenharmony_ci * The above copyright notice and this permission notice (including the next 1262306a36Sopenharmony_ci * paragraph) shall be included in all copies or substantial portions of the 1362306a36Sopenharmony_ci * Software. 1462306a36Sopenharmony_ci * 1562306a36Sopenharmony_ci * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR 1662306a36Sopenharmony_ci * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY, 1762306a36Sopenharmony_ci * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL 1862306a36Sopenharmony_ci * THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER 1962306a36Sopenharmony_ci * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING 2062306a36Sopenharmony_ci * FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS 2162306a36Sopenharmony_ci * IN THE SOFTWARE. 2262306a36Sopenharmony_ci * 2362306a36Sopenharmony_ci */ 2462306a36Sopenharmony_ci 2562306a36Sopenharmony_ci#include <linux/prime_numbers.h> 2662306a36Sopenharmony_ci#include <linux/pm_qos.h> 2762306a36Sopenharmony_ci#include <linux/sort.h> 2862306a36Sopenharmony_ci 2962306a36Sopenharmony_ci#include "gem/i915_gem_internal.h" 3062306a36Sopenharmony_ci#include "gem/i915_gem_pm.h" 3162306a36Sopenharmony_ci#include "gem/selftests/mock_context.h" 3262306a36Sopenharmony_ci 3362306a36Sopenharmony_ci#include "gt/intel_engine_heartbeat.h" 3462306a36Sopenharmony_ci#include "gt/intel_engine_pm.h" 3562306a36Sopenharmony_ci#include "gt/intel_engine_user.h" 3662306a36Sopenharmony_ci#include "gt/intel_gt.h" 3762306a36Sopenharmony_ci#include "gt/intel_gt_clock_utils.h" 3862306a36Sopenharmony_ci#include "gt/intel_gt_requests.h" 3962306a36Sopenharmony_ci#include "gt/selftest_engine_heartbeat.h" 4062306a36Sopenharmony_ci 4162306a36Sopenharmony_ci#include "i915_random.h" 4262306a36Sopenharmony_ci#include "i915_selftest.h" 4362306a36Sopenharmony_ci#include "igt_flush_test.h" 4462306a36Sopenharmony_ci#include "igt_live_test.h" 4562306a36Sopenharmony_ci#include "igt_spinner.h" 4662306a36Sopenharmony_ci#include "lib_sw_fence.h" 4762306a36Sopenharmony_ci 4862306a36Sopenharmony_ci#include "mock_drm.h" 4962306a36Sopenharmony_ci#include "mock_gem_device.h" 5062306a36Sopenharmony_ci 5162306a36Sopenharmony_cistatic unsigned int num_uabi_engines(struct drm_i915_private *i915) 5262306a36Sopenharmony_ci{ 5362306a36Sopenharmony_ci struct intel_engine_cs *engine; 5462306a36Sopenharmony_ci unsigned int count; 5562306a36Sopenharmony_ci 5662306a36Sopenharmony_ci count = 0; 5762306a36Sopenharmony_ci for_each_uabi_engine(engine, i915) 5862306a36Sopenharmony_ci count++; 5962306a36Sopenharmony_ci 6062306a36Sopenharmony_ci return count; 6162306a36Sopenharmony_ci} 6262306a36Sopenharmony_ci 6362306a36Sopenharmony_cistatic struct intel_engine_cs *rcs0(struct drm_i915_private *i915) 6462306a36Sopenharmony_ci{ 6562306a36Sopenharmony_ci return intel_engine_lookup_user(i915, I915_ENGINE_CLASS_RENDER, 0); 6662306a36Sopenharmony_ci} 6762306a36Sopenharmony_ci 6862306a36Sopenharmony_cistatic int igt_add_request(void *arg) 6962306a36Sopenharmony_ci{ 7062306a36Sopenharmony_ci struct drm_i915_private *i915 = arg; 7162306a36Sopenharmony_ci struct i915_request *request; 7262306a36Sopenharmony_ci 7362306a36Sopenharmony_ci /* Basic preliminary test to create a request and let it loose! */ 7462306a36Sopenharmony_ci 7562306a36Sopenharmony_ci request = mock_request(rcs0(i915)->kernel_context, HZ / 10); 7662306a36Sopenharmony_ci if (!request) 7762306a36Sopenharmony_ci return -ENOMEM; 7862306a36Sopenharmony_ci 7962306a36Sopenharmony_ci i915_request_add(request); 8062306a36Sopenharmony_ci 8162306a36Sopenharmony_ci return 0; 8262306a36Sopenharmony_ci} 8362306a36Sopenharmony_ci 8462306a36Sopenharmony_cistatic int igt_wait_request(void *arg) 8562306a36Sopenharmony_ci{ 8662306a36Sopenharmony_ci const long T = HZ / 4; 8762306a36Sopenharmony_ci struct drm_i915_private *i915 = arg; 8862306a36Sopenharmony_ci struct i915_request *request; 8962306a36Sopenharmony_ci int err = -EINVAL; 9062306a36Sopenharmony_ci 9162306a36Sopenharmony_ci /* Submit a request, then wait upon it */ 9262306a36Sopenharmony_ci 9362306a36Sopenharmony_ci request = mock_request(rcs0(i915)->kernel_context, T); 9462306a36Sopenharmony_ci if (!request) 9562306a36Sopenharmony_ci return -ENOMEM; 9662306a36Sopenharmony_ci 9762306a36Sopenharmony_ci i915_request_get(request); 9862306a36Sopenharmony_ci 9962306a36Sopenharmony_ci if (i915_request_wait(request, 0, 0) != -ETIME) { 10062306a36Sopenharmony_ci pr_err("request wait (busy query) succeeded (expected timeout before submit!)\n"); 10162306a36Sopenharmony_ci goto out_request; 10262306a36Sopenharmony_ci } 10362306a36Sopenharmony_ci 10462306a36Sopenharmony_ci if (i915_request_wait(request, 0, T) != -ETIME) { 10562306a36Sopenharmony_ci pr_err("request wait succeeded (expected timeout before submit!)\n"); 10662306a36Sopenharmony_ci goto out_request; 10762306a36Sopenharmony_ci } 10862306a36Sopenharmony_ci 10962306a36Sopenharmony_ci if (i915_request_completed(request)) { 11062306a36Sopenharmony_ci pr_err("request completed before submit!!\n"); 11162306a36Sopenharmony_ci goto out_request; 11262306a36Sopenharmony_ci } 11362306a36Sopenharmony_ci 11462306a36Sopenharmony_ci i915_request_add(request); 11562306a36Sopenharmony_ci 11662306a36Sopenharmony_ci if (i915_request_wait(request, 0, 0) != -ETIME) { 11762306a36Sopenharmony_ci pr_err("request wait (busy query) succeeded (expected timeout after submit!)\n"); 11862306a36Sopenharmony_ci goto out_request; 11962306a36Sopenharmony_ci } 12062306a36Sopenharmony_ci 12162306a36Sopenharmony_ci if (i915_request_completed(request)) { 12262306a36Sopenharmony_ci pr_err("request completed immediately!\n"); 12362306a36Sopenharmony_ci goto out_request; 12462306a36Sopenharmony_ci } 12562306a36Sopenharmony_ci 12662306a36Sopenharmony_ci if (i915_request_wait(request, 0, T / 2) != -ETIME) { 12762306a36Sopenharmony_ci pr_err("request wait succeeded (expected timeout!)\n"); 12862306a36Sopenharmony_ci goto out_request; 12962306a36Sopenharmony_ci } 13062306a36Sopenharmony_ci 13162306a36Sopenharmony_ci if (i915_request_wait(request, 0, T) == -ETIME) { 13262306a36Sopenharmony_ci pr_err("request wait timed out!\n"); 13362306a36Sopenharmony_ci goto out_request; 13462306a36Sopenharmony_ci } 13562306a36Sopenharmony_ci 13662306a36Sopenharmony_ci if (!i915_request_completed(request)) { 13762306a36Sopenharmony_ci pr_err("request not complete after waiting!\n"); 13862306a36Sopenharmony_ci goto out_request; 13962306a36Sopenharmony_ci } 14062306a36Sopenharmony_ci 14162306a36Sopenharmony_ci if (i915_request_wait(request, 0, T) == -ETIME) { 14262306a36Sopenharmony_ci pr_err("request wait timed out when already complete!\n"); 14362306a36Sopenharmony_ci goto out_request; 14462306a36Sopenharmony_ci } 14562306a36Sopenharmony_ci 14662306a36Sopenharmony_ci err = 0; 14762306a36Sopenharmony_ciout_request: 14862306a36Sopenharmony_ci i915_request_put(request); 14962306a36Sopenharmony_ci mock_device_flush(i915); 15062306a36Sopenharmony_ci return err; 15162306a36Sopenharmony_ci} 15262306a36Sopenharmony_ci 15362306a36Sopenharmony_cistatic int igt_fence_wait(void *arg) 15462306a36Sopenharmony_ci{ 15562306a36Sopenharmony_ci const long T = HZ / 4; 15662306a36Sopenharmony_ci struct drm_i915_private *i915 = arg; 15762306a36Sopenharmony_ci struct i915_request *request; 15862306a36Sopenharmony_ci int err = -EINVAL; 15962306a36Sopenharmony_ci 16062306a36Sopenharmony_ci /* Submit a request, treat it as a fence and wait upon it */ 16162306a36Sopenharmony_ci 16262306a36Sopenharmony_ci request = mock_request(rcs0(i915)->kernel_context, T); 16362306a36Sopenharmony_ci if (!request) 16462306a36Sopenharmony_ci return -ENOMEM; 16562306a36Sopenharmony_ci 16662306a36Sopenharmony_ci if (dma_fence_wait_timeout(&request->fence, false, T) != -ETIME) { 16762306a36Sopenharmony_ci pr_err("fence wait success before submit (expected timeout)!\n"); 16862306a36Sopenharmony_ci goto out; 16962306a36Sopenharmony_ci } 17062306a36Sopenharmony_ci 17162306a36Sopenharmony_ci i915_request_add(request); 17262306a36Sopenharmony_ci 17362306a36Sopenharmony_ci if (dma_fence_is_signaled(&request->fence)) { 17462306a36Sopenharmony_ci pr_err("fence signaled immediately!\n"); 17562306a36Sopenharmony_ci goto out; 17662306a36Sopenharmony_ci } 17762306a36Sopenharmony_ci 17862306a36Sopenharmony_ci if (dma_fence_wait_timeout(&request->fence, false, T / 2) != -ETIME) { 17962306a36Sopenharmony_ci pr_err("fence wait success after submit (expected timeout)!\n"); 18062306a36Sopenharmony_ci goto out; 18162306a36Sopenharmony_ci } 18262306a36Sopenharmony_ci 18362306a36Sopenharmony_ci if (dma_fence_wait_timeout(&request->fence, false, T) <= 0) { 18462306a36Sopenharmony_ci pr_err("fence wait timed out (expected success)!\n"); 18562306a36Sopenharmony_ci goto out; 18662306a36Sopenharmony_ci } 18762306a36Sopenharmony_ci 18862306a36Sopenharmony_ci if (!dma_fence_is_signaled(&request->fence)) { 18962306a36Sopenharmony_ci pr_err("fence unsignaled after waiting!\n"); 19062306a36Sopenharmony_ci goto out; 19162306a36Sopenharmony_ci } 19262306a36Sopenharmony_ci 19362306a36Sopenharmony_ci if (dma_fence_wait_timeout(&request->fence, false, T) <= 0) { 19462306a36Sopenharmony_ci pr_err("fence wait timed out when complete (expected success)!\n"); 19562306a36Sopenharmony_ci goto out; 19662306a36Sopenharmony_ci } 19762306a36Sopenharmony_ci 19862306a36Sopenharmony_ci err = 0; 19962306a36Sopenharmony_ciout: 20062306a36Sopenharmony_ci mock_device_flush(i915); 20162306a36Sopenharmony_ci return err; 20262306a36Sopenharmony_ci} 20362306a36Sopenharmony_ci 20462306a36Sopenharmony_cistatic int igt_request_rewind(void *arg) 20562306a36Sopenharmony_ci{ 20662306a36Sopenharmony_ci struct drm_i915_private *i915 = arg; 20762306a36Sopenharmony_ci struct i915_request *request, *vip; 20862306a36Sopenharmony_ci struct i915_gem_context *ctx[2]; 20962306a36Sopenharmony_ci struct intel_context *ce; 21062306a36Sopenharmony_ci int err = -EINVAL; 21162306a36Sopenharmony_ci 21262306a36Sopenharmony_ci ctx[0] = mock_context(i915, "A"); 21362306a36Sopenharmony_ci if (!ctx[0]) { 21462306a36Sopenharmony_ci err = -ENOMEM; 21562306a36Sopenharmony_ci goto err_ctx_0; 21662306a36Sopenharmony_ci } 21762306a36Sopenharmony_ci 21862306a36Sopenharmony_ci ce = i915_gem_context_get_engine(ctx[0], RCS0); 21962306a36Sopenharmony_ci GEM_BUG_ON(IS_ERR(ce)); 22062306a36Sopenharmony_ci request = mock_request(ce, 2 * HZ); 22162306a36Sopenharmony_ci intel_context_put(ce); 22262306a36Sopenharmony_ci if (!request) { 22362306a36Sopenharmony_ci err = -ENOMEM; 22462306a36Sopenharmony_ci goto err_context_0; 22562306a36Sopenharmony_ci } 22662306a36Sopenharmony_ci 22762306a36Sopenharmony_ci i915_request_get(request); 22862306a36Sopenharmony_ci i915_request_add(request); 22962306a36Sopenharmony_ci 23062306a36Sopenharmony_ci ctx[1] = mock_context(i915, "B"); 23162306a36Sopenharmony_ci if (!ctx[1]) { 23262306a36Sopenharmony_ci err = -ENOMEM; 23362306a36Sopenharmony_ci goto err_ctx_1; 23462306a36Sopenharmony_ci } 23562306a36Sopenharmony_ci 23662306a36Sopenharmony_ci ce = i915_gem_context_get_engine(ctx[1], RCS0); 23762306a36Sopenharmony_ci GEM_BUG_ON(IS_ERR(ce)); 23862306a36Sopenharmony_ci vip = mock_request(ce, 0); 23962306a36Sopenharmony_ci intel_context_put(ce); 24062306a36Sopenharmony_ci if (!vip) { 24162306a36Sopenharmony_ci err = -ENOMEM; 24262306a36Sopenharmony_ci goto err_context_1; 24362306a36Sopenharmony_ci } 24462306a36Sopenharmony_ci 24562306a36Sopenharmony_ci /* Simulate preemption by manual reordering */ 24662306a36Sopenharmony_ci if (!mock_cancel_request(request)) { 24762306a36Sopenharmony_ci pr_err("failed to cancel request (already executed)!\n"); 24862306a36Sopenharmony_ci i915_request_add(vip); 24962306a36Sopenharmony_ci goto err_context_1; 25062306a36Sopenharmony_ci } 25162306a36Sopenharmony_ci i915_request_get(vip); 25262306a36Sopenharmony_ci i915_request_add(vip); 25362306a36Sopenharmony_ci rcu_read_lock(); 25462306a36Sopenharmony_ci request->engine->submit_request(request); 25562306a36Sopenharmony_ci rcu_read_unlock(); 25662306a36Sopenharmony_ci 25762306a36Sopenharmony_ci 25862306a36Sopenharmony_ci if (i915_request_wait(vip, 0, HZ) == -ETIME) { 25962306a36Sopenharmony_ci pr_err("timed out waiting for high priority request\n"); 26062306a36Sopenharmony_ci goto err; 26162306a36Sopenharmony_ci } 26262306a36Sopenharmony_ci 26362306a36Sopenharmony_ci if (i915_request_completed(request)) { 26462306a36Sopenharmony_ci pr_err("low priority request already completed\n"); 26562306a36Sopenharmony_ci goto err; 26662306a36Sopenharmony_ci } 26762306a36Sopenharmony_ci 26862306a36Sopenharmony_ci err = 0; 26962306a36Sopenharmony_cierr: 27062306a36Sopenharmony_ci i915_request_put(vip); 27162306a36Sopenharmony_cierr_context_1: 27262306a36Sopenharmony_ci mock_context_close(ctx[1]); 27362306a36Sopenharmony_cierr_ctx_1: 27462306a36Sopenharmony_ci i915_request_put(request); 27562306a36Sopenharmony_cierr_context_0: 27662306a36Sopenharmony_ci mock_context_close(ctx[0]); 27762306a36Sopenharmony_cierr_ctx_0: 27862306a36Sopenharmony_ci mock_device_flush(i915); 27962306a36Sopenharmony_ci return err; 28062306a36Sopenharmony_ci} 28162306a36Sopenharmony_ci 28262306a36Sopenharmony_cistruct smoketest { 28362306a36Sopenharmony_ci struct intel_engine_cs *engine; 28462306a36Sopenharmony_ci struct i915_gem_context **contexts; 28562306a36Sopenharmony_ci atomic_long_t num_waits, num_fences; 28662306a36Sopenharmony_ci int ncontexts, max_batch; 28762306a36Sopenharmony_ci struct i915_request *(*request_alloc)(struct intel_context *ce); 28862306a36Sopenharmony_ci}; 28962306a36Sopenharmony_ci 29062306a36Sopenharmony_cistatic struct i915_request * 29162306a36Sopenharmony_ci__mock_request_alloc(struct intel_context *ce) 29262306a36Sopenharmony_ci{ 29362306a36Sopenharmony_ci return mock_request(ce, 0); 29462306a36Sopenharmony_ci} 29562306a36Sopenharmony_ci 29662306a36Sopenharmony_cistatic struct i915_request * 29762306a36Sopenharmony_ci__live_request_alloc(struct intel_context *ce) 29862306a36Sopenharmony_ci{ 29962306a36Sopenharmony_ci return intel_context_create_request(ce); 30062306a36Sopenharmony_ci} 30162306a36Sopenharmony_ci 30262306a36Sopenharmony_cistruct smoke_thread { 30362306a36Sopenharmony_ci struct kthread_worker *worker; 30462306a36Sopenharmony_ci struct kthread_work work; 30562306a36Sopenharmony_ci struct smoketest *t; 30662306a36Sopenharmony_ci bool stop; 30762306a36Sopenharmony_ci int result; 30862306a36Sopenharmony_ci}; 30962306a36Sopenharmony_ci 31062306a36Sopenharmony_cistatic void __igt_breadcrumbs_smoketest(struct kthread_work *work) 31162306a36Sopenharmony_ci{ 31262306a36Sopenharmony_ci struct smoke_thread *thread = container_of(work, typeof(*thread), work); 31362306a36Sopenharmony_ci struct smoketest *t = thread->t; 31462306a36Sopenharmony_ci const unsigned int max_batch = min(t->ncontexts, t->max_batch) - 1; 31562306a36Sopenharmony_ci const unsigned int total = 4 * t->ncontexts + 1; 31662306a36Sopenharmony_ci unsigned int num_waits = 0, num_fences = 0; 31762306a36Sopenharmony_ci struct i915_request **requests; 31862306a36Sopenharmony_ci I915_RND_STATE(prng); 31962306a36Sopenharmony_ci unsigned int *order; 32062306a36Sopenharmony_ci int err = 0; 32162306a36Sopenharmony_ci 32262306a36Sopenharmony_ci /* 32362306a36Sopenharmony_ci * A very simple test to catch the most egregious of list handling bugs. 32462306a36Sopenharmony_ci * 32562306a36Sopenharmony_ci * At its heart, we simply create oodles of requests running across 32662306a36Sopenharmony_ci * multiple kthreads and enable signaling on them, for the sole purpose 32762306a36Sopenharmony_ci * of stressing our breadcrumb handling. The only inspection we do is 32862306a36Sopenharmony_ci * that the fences were marked as signaled. 32962306a36Sopenharmony_ci */ 33062306a36Sopenharmony_ci 33162306a36Sopenharmony_ci requests = kcalloc(total, sizeof(*requests), GFP_KERNEL); 33262306a36Sopenharmony_ci if (!requests) { 33362306a36Sopenharmony_ci thread->result = -ENOMEM; 33462306a36Sopenharmony_ci return; 33562306a36Sopenharmony_ci } 33662306a36Sopenharmony_ci 33762306a36Sopenharmony_ci order = i915_random_order(total, &prng); 33862306a36Sopenharmony_ci if (!order) { 33962306a36Sopenharmony_ci err = -ENOMEM; 34062306a36Sopenharmony_ci goto out_requests; 34162306a36Sopenharmony_ci } 34262306a36Sopenharmony_ci 34362306a36Sopenharmony_ci while (!READ_ONCE(thread->stop)) { 34462306a36Sopenharmony_ci struct i915_sw_fence *submit, *wait; 34562306a36Sopenharmony_ci unsigned int n, count; 34662306a36Sopenharmony_ci 34762306a36Sopenharmony_ci submit = heap_fence_create(GFP_KERNEL); 34862306a36Sopenharmony_ci if (!submit) { 34962306a36Sopenharmony_ci err = -ENOMEM; 35062306a36Sopenharmony_ci break; 35162306a36Sopenharmony_ci } 35262306a36Sopenharmony_ci 35362306a36Sopenharmony_ci wait = heap_fence_create(GFP_KERNEL); 35462306a36Sopenharmony_ci if (!wait) { 35562306a36Sopenharmony_ci i915_sw_fence_commit(submit); 35662306a36Sopenharmony_ci heap_fence_put(submit); 35762306a36Sopenharmony_ci err = -ENOMEM; 35862306a36Sopenharmony_ci break; 35962306a36Sopenharmony_ci } 36062306a36Sopenharmony_ci 36162306a36Sopenharmony_ci i915_random_reorder(order, total, &prng); 36262306a36Sopenharmony_ci count = 1 + i915_prandom_u32_max_state(max_batch, &prng); 36362306a36Sopenharmony_ci 36462306a36Sopenharmony_ci for (n = 0; n < count; n++) { 36562306a36Sopenharmony_ci struct i915_gem_context *ctx = 36662306a36Sopenharmony_ci t->contexts[order[n] % t->ncontexts]; 36762306a36Sopenharmony_ci struct i915_request *rq; 36862306a36Sopenharmony_ci struct intel_context *ce; 36962306a36Sopenharmony_ci 37062306a36Sopenharmony_ci ce = i915_gem_context_get_engine(ctx, t->engine->legacy_idx); 37162306a36Sopenharmony_ci GEM_BUG_ON(IS_ERR(ce)); 37262306a36Sopenharmony_ci rq = t->request_alloc(ce); 37362306a36Sopenharmony_ci intel_context_put(ce); 37462306a36Sopenharmony_ci if (IS_ERR(rq)) { 37562306a36Sopenharmony_ci err = PTR_ERR(rq); 37662306a36Sopenharmony_ci count = n; 37762306a36Sopenharmony_ci break; 37862306a36Sopenharmony_ci } 37962306a36Sopenharmony_ci 38062306a36Sopenharmony_ci err = i915_sw_fence_await_sw_fence_gfp(&rq->submit, 38162306a36Sopenharmony_ci submit, 38262306a36Sopenharmony_ci GFP_KERNEL); 38362306a36Sopenharmony_ci 38462306a36Sopenharmony_ci requests[n] = i915_request_get(rq); 38562306a36Sopenharmony_ci i915_request_add(rq); 38662306a36Sopenharmony_ci 38762306a36Sopenharmony_ci if (err >= 0) 38862306a36Sopenharmony_ci err = i915_sw_fence_await_dma_fence(wait, 38962306a36Sopenharmony_ci &rq->fence, 39062306a36Sopenharmony_ci 0, 39162306a36Sopenharmony_ci GFP_KERNEL); 39262306a36Sopenharmony_ci 39362306a36Sopenharmony_ci if (err < 0) { 39462306a36Sopenharmony_ci i915_request_put(rq); 39562306a36Sopenharmony_ci count = n; 39662306a36Sopenharmony_ci break; 39762306a36Sopenharmony_ci } 39862306a36Sopenharmony_ci } 39962306a36Sopenharmony_ci 40062306a36Sopenharmony_ci i915_sw_fence_commit(submit); 40162306a36Sopenharmony_ci i915_sw_fence_commit(wait); 40262306a36Sopenharmony_ci 40362306a36Sopenharmony_ci if (!wait_event_timeout(wait->wait, 40462306a36Sopenharmony_ci i915_sw_fence_done(wait), 40562306a36Sopenharmony_ci 5 * HZ)) { 40662306a36Sopenharmony_ci struct i915_request *rq = requests[count - 1]; 40762306a36Sopenharmony_ci 40862306a36Sopenharmony_ci pr_err("waiting for %d/%d fences (last %llx:%lld) on %s timed out!\n", 40962306a36Sopenharmony_ci atomic_read(&wait->pending), count, 41062306a36Sopenharmony_ci rq->fence.context, rq->fence.seqno, 41162306a36Sopenharmony_ci t->engine->name); 41262306a36Sopenharmony_ci GEM_TRACE_DUMP(); 41362306a36Sopenharmony_ci 41462306a36Sopenharmony_ci intel_gt_set_wedged(t->engine->gt); 41562306a36Sopenharmony_ci GEM_BUG_ON(!i915_request_completed(rq)); 41662306a36Sopenharmony_ci i915_sw_fence_wait(wait); 41762306a36Sopenharmony_ci err = -EIO; 41862306a36Sopenharmony_ci } 41962306a36Sopenharmony_ci 42062306a36Sopenharmony_ci for (n = 0; n < count; n++) { 42162306a36Sopenharmony_ci struct i915_request *rq = requests[n]; 42262306a36Sopenharmony_ci 42362306a36Sopenharmony_ci if (!test_bit(DMA_FENCE_FLAG_SIGNALED_BIT, 42462306a36Sopenharmony_ci &rq->fence.flags)) { 42562306a36Sopenharmony_ci pr_err("%llu:%llu was not signaled!\n", 42662306a36Sopenharmony_ci rq->fence.context, rq->fence.seqno); 42762306a36Sopenharmony_ci err = -EINVAL; 42862306a36Sopenharmony_ci } 42962306a36Sopenharmony_ci 43062306a36Sopenharmony_ci i915_request_put(rq); 43162306a36Sopenharmony_ci } 43262306a36Sopenharmony_ci 43362306a36Sopenharmony_ci heap_fence_put(wait); 43462306a36Sopenharmony_ci heap_fence_put(submit); 43562306a36Sopenharmony_ci 43662306a36Sopenharmony_ci if (err < 0) 43762306a36Sopenharmony_ci break; 43862306a36Sopenharmony_ci 43962306a36Sopenharmony_ci num_fences += count; 44062306a36Sopenharmony_ci num_waits++; 44162306a36Sopenharmony_ci 44262306a36Sopenharmony_ci cond_resched(); 44362306a36Sopenharmony_ci } 44462306a36Sopenharmony_ci 44562306a36Sopenharmony_ci atomic_long_add(num_fences, &t->num_fences); 44662306a36Sopenharmony_ci atomic_long_add(num_waits, &t->num_waits); 44762306a36Sopenharmony_ci 44862306a36Sopenharmony_ci kfree(order); 44962306a36Sopenharmony_ciout_requests: 45062306a36Sopenharmony_ci kfree(requests); 45162306a36Sopenharmony_ci thread->result = err; 45262306a36Sopenharmony_ci} 45362306a36Sopenharmony_ci 45462306a36Sopenharmony_cistatic int mock_breadcrumbs_smoketest(void *arg) 45562306a36Sopenharmony_ci{ 45662306a36Sopenharmony_ci struct drm_i915_private *i915 = arg; 45762306a36Sopenharmony_ci struct smoketest t = { 45862306a36Sopenharmony_ci .engine = rcs0(i915), 45962306a36Sopenharmony_ci .ncontexts = 1024, 46062306a36Sopenharmony_ci .max_batch = 1024, 46162306a36Sopenharmony_ci .request_alloc = __mock_request_alloc 46262306a36Sopenharmony_ci }; 46362306a36Sopenharmony_ci unsigned int ncpus = num_online_cpus(); 46462306a36Sopenharmony_ci struct smoke_thread *threads; 46562306a36Sopenharmony_ci unsigned int n; 46662306a36Sopenharmony_ci int ret = 0; 46762306a36Sopenharmony_ci 46862306a36Sopenharmony_ci /* 46962306a36Sopenharmony_ci * Smoketest our breadcrumb/signal handling for requests across multiple 47062306a36Sopenharmony_ci * threads. A very simple test to only catch the most egregious of bugs. 47162306a36Sopenharmony_ci * See __igt_breadcrumbs_smoketest(); 47262306a36Sopenharmony_ci */ 47362306a36Sopenharmony_ci 47462306a36Sopenharmony_ci threads = kcalloc(ncpus, sizeof(*threads), GFP_KERNEL); 47562306a36Sopenharmony_ci if (!threads) 47662306a36Sopenharmony_ci return -ENOMEM; 47762306a36Sopenharmony_ci 47862306a36Sopenharmony_ci t.contexts = kcalloc(t.ncontexts, sizeof(*t.contexts), GFP_KERNEL); 47962306a36Sopenharmony_ci if (!t.contexts) { 48062306a36Sopenharmony_ci ret = -ENOMEM; 48162306a36Sopenharmony_ci goto out_threads; 48262306a36Sopenharmony_ci } 48362306a36Sopenharmony_ci 48462306a36Sopenharmony_ci for (n = 0; n < t.ncontexts; n++) { 48562306a36Sopenharmony_ci t.contexts[n] = mock_context(t.engine->i915, "mock"); 48662306a36Sopenharmony_ci if (!t.contexts[n]) { 48762306a36Sopenharmony_ci ret = -ENOMEM; 48862306a36Sopenharmony_ci goto out_contexts; 48962306a36Sopenharmony_ci } 49062306a36Sopenharmony_ci } 49162306a36Sopenharmony_ci 49262306a36Sopenharmony_ci for (n = 0; n < ncpus; n++) { 49362306a36Sopenharmony_ci struct kthread_worker *worker; 49462306a36Sopenharmony_ci 49562306a36Sopenharmony_ci worker = kthread_create_worker(0, "igt/%d", n); 49662306a36Sopenharmony_ci if (IS_ERR(worker)) { 49762306a36Sopenharmony_ci ret = PTR_ERR(worker); 49862306a36Sopenharmony_ci ncpus = n; 49962306a36Sopenharmony_ci break; 50062306a36Sopenharmony_ci } 50162306a36Sopenharmony_ci 50262306a36Sopenharmony_ci threads[n].worker = worker; 50362306a36Sopenharmony_ci threads[n].t = &t; 50462306a36Sopenharmony_ci threads[n].stop = false; 50562306a36Sopenharmony_ci threads[n].result = 0; 50662306a36Sopenharmony_ci 50762306a36Sopenharmony_ci kthread_init_work(&threads[n].work, 50862306a36Sopenharmony_ci __igt_breadcrumbs_smoketest); 50962306a36Sopenharmony_ci kthread_queue_work(worker, &threads[n].work); 51062306a36Sopenharmony_ci } 51162306a36Sopenharmony_ci 51262306a36Sopenharmony_ci msleep(jiffies_to_msecs(i915_selftest.timeout_jiffies)); 51362306a36Sopenharmony_ci 51462306a36Sopenharmony_ci for (n = 0; n < ncpus; n++) { 51562306a36Sopenharmony_ci int err; 51662306a36Sopenharmony_ci 51762306a36Sopenharmony_ci WRITE_ONCE(threads[n].stop, true); 51862306a36Sopenharmony_ci kthread_flush_work(&threads[n].work); 51962306a36Sopenharmony_ci err = READ_ONCE(threads[n].result); 52062306a36Sopenharmony_ci if (err < 0 && !ret) 52162306a36Sopenharmony_ci ret = err; 52262306a36Sopenharmony_ci 52362306a36Sopenharmony_ci kthread_destroy_worker(threads[n].worker); 52462306a36Sopenharmony_ci } 52562306a36Sopenharmony_ci pr_info("Completed %lu waits for %lu fence across %d cpus\n", 52662306a36Sopenharmony_ci atomic_long_read(&t.num_waits), 52762306a36Sopenharmony_ci atomic_long_read(&t.num_fences), 52862306a36Sopenharmony_ci ncpus); 52962306a36Sopenharmony_ci 53062306a36Sopenharmony_ciout_contexts: 53162306a36Sopenharmony_ci for (n = 0; n < t.ncontexts; n++) { 53262306a36Sopenharmony_ci if (!t.contexts[n]) 53362306a36Sopenharmony_ci break; 53462306a36Sopenharmony_ci mock_context_close(t.contexts[n]); 53562306a36Sopenharmony_ci } 53662306a36Sopenharmony_ci kfree(t.contexts); 53762306a36Sopenharmony_ciout_threads: 53862306a36Sopenharmony_ci kfree(threads); 53962306a36Sopenharmony_ci return ret; 54062306a36Sopenharmony_ci} 54162306a36Sopenharmony_ci 54262306a36Sopenharmony_ciint i915_request_mock_selftests(void) 54362306a36Sopenharmony_ci{ 54462306a36Sopenharmony_ci static const struct i915_subtest tests[] = { 54562306a36Sopenharmony_ci SUBTEST(igt_add_request), 54662306a36Sopenharmony_ci SUBTEST(igt_wait_request), 54762306a36Sopenharmony_ci SUBTEST(igt_fence_wait), 54862306a36Sopenharmony_ci SUBTEST(igt_request_rewind), 54962306a36Sopenharmony_ci SUBTEST(mock_breadcrumbs_smoketest), 55062306a36Sopenharmony_ci }; 55162306a36Sopenharmony_ci struct drm_i915_private *i915; 55262306a36Sopenharmony_ci intel_wakeref_t wakeref; 55362306a36Sopenharmony_ci int err = 0; 55462306a36Sopenharmony_ci 55562306a36Sopenharmony_ci i915 = mock_gem_device(); 55662306a36Sopenharmony_ci if (!i915) 55762306a36Sopenharmony_ci return -ENOMEM; 55862306a36Sopenharmony_ci 55962306a36Sopenharmony_ci with_intel_runtime_pm(&i915->runtime_pm, wakeref) 56062306a36Sopenharmony_ci err = i915_subtests(tests, i915); 56162306a36Sopenharmony_ci 56262306a36Sopenharmony_ci mock_destroy_device(i915); 56362306a36Sopenharmony_ci 56462306a36Sopenharmony_ci return err; 56562306a36Sopenharmony_ci} 56662306a36Sopenharmony_ci 56762306a36Sopenharmony_cistatic int live_nop_request(void *arg) 56862306a36Sopenharmony_ci{ 56962306a36Sopenharmony_ci struct drm_i915_private *i915 = arg; 57062306a36Sopenharmony_ci struct intel_engine_cs *engine; 57162306a36Sopenharmony_ci struct igt_live_test t; 57262306a36Sopenharmony_ci int err = -ENODEV; 57362306a36Sopenharmony_ci 57462306a36Sopenharmony_ci /* 57562306a36Sopenharmony_ci * Submit various sized batches of empty requests, to each engine 57662306a36Sopenharmony_ci * (individually), and wait for the batch to complete. We can check 57762306a36Sopenharmony_ci * the overhead of submitting requests to the hardware. 57862306a36Sopenharmony_ci */ 57962306a36Sopenharmony_ci 58062306a36Sopenharmony_ci for_each_uabi_engine(engine, i915) { 58162306a36Sopenharmony_ci unsigned long n, prime; 58262306a36Sopenharmony_ci IGT_TIMEOUT(end_time); 58362306a36Sopenharmony_ci ktime_t times[2] = {}; 58462306a36Sopenharmony_ci 58562306a36Sopenharmony_ci err = igt_live_test_begin(&t, i915, __func__, engine->name); 58662306a36Sopenharmony_ci if (err) 58762306a36Sopenharmony_ci return err; 58862306a36Sopenharmony_ci 58962306a36Sopenharmony_ci intel_engine_pm_get(engine); 59062306a36Sopenharmony_ci for_each_prime_number_from(prime, 1, 8192) { 59162306a36Sopenharmony_ci struct i915_request *request = NULL; 59262306a36Sopenharmony_ci 59362306a36Sopenharmony_ci times[1] = ktime_get_raw(); 59462306a36Sopenharmony_ci 59562306a36Sopenharmony_ci for (n = 0; n < prime; n++) { 59662306a36Sopenharmony_ci i915_request_put(request); 59762306a36Sopenharmony_ci request = i915_request_create(engine->kernel_context); 59862306a36Sopenharmony_ci if (IS_ERR(request)) 59962306a36Sopenharmony_ci return PTR_ERR(request); 60062306a36Sopenharmony_ci 60162306a36Sopenharmony_ci /* 60262306a36Sopenharmony_ci * This space is left intentionally blank. 60362306a36Sopenharmony_ci * 60462306a36Sopenharmony_ci * We do not actually want to perform any 60562306a36Sopenharmony_ci * action with this request, we just want 60662306a36Sopenharmony_ci * to measure the latency in allocation 60762306a36Sopenharmony_ci * and submission of our breadcrumbs - 60862306a36Sopenharmony_ci * ensuring that the bare request is sufficient 60962306a36Sopenharmony_ci * for the system to work (i.e. proper HEAD 61062306a36Sopenharmony_ci * tracking of the rings, interrupt handling, 61162306a36Sopenharmony_ci * etc). It also gives us the lowest bounds 61262306a36Sopenharmony_ci * for latency. 61362306a36Sopenharmony_ci */ 61462306a36Sopenharmony_ci 61562306a36Sopenharmony_ci i915_request_get(request); 61662306a36Sopenharmony_ci i915_request_add(request); 61762306a36Sopenharmony_ci } 61862306a36Sopenharmony_ci i915_request_wait(request, 0, MAX_SCHEDULE_TIMEOUT); 61962306a36Sopenharmony_ci i915_request_put(request); 62062306a36Sopenharmony_ci 62162306a36Sopenharmony_ci times[1] = ktime_sub(ktime_get_raw(), times[1]); 62262306a36Sopenharmony_ci if (prime == 1) 62362306a36Sopenharmony_ci times[0] = times[1]; 62462306a36Sopenharmony_ci 62562306a36Sopenharmony_ci if (__igt_timeout(end_time, NULL)) 62662306a36Sopenharmony_ci break; 62762306a36Sopenharmony_ci } 62862306a36Sopenharmony_ci intel_engine_pm_put(engine); 62962306a36Sopenharmony_ci 63062306a36Sopenharmony_ci err = igt_live_test_end(&t); 63162306a36Sopenharmony_ci if (err) 63262306a36Sopenharmony_ci return err; 63362306a36Sopenharmony_ci 63462306a36Sopenharmony_ci pr_info("Request latencies on %s: 1 = %lluns, %lu = %lluns\n", 63562306a36Sopenharmony_ci engine->name, 63662306a36Sopenharmony_ci ktime_to_ns(times[0]), 63762306a36Sopenharmony_ci prime, div64_u64(ktime_to_ns(times[1]), prime)); 63862306a36Sopenharmony_ci } 63962306a36Sopenharmony_ci 64062306a36Sopenharmony_ci return err; 64162306a36Sopenharmony_ci} 64262306a36Sopenharmony_ci 64362306a36Sopenharmony_cistatic int __cancel_inactive(struct intel_engine_cs *engine) 64462306a36Sopenharmony_ci{ 64562306a36Sopenharmony_ci struct intel_context *ce; 64662306a36Sopenharmony_ci struct igt_spinner spin; 64762306a36Sopenharmony_ci struct i915_request *rq; 64862306a36Sopenharmony_ci int err = 0; 64962306a36Sopenharmony_ci 65062306a36Sopenharmony_ci if (igt_spinner_init(&spin, engine->gt)) 65162306a36Sopenharmony_ci return -ENOMEM; 65262306a36Sopenharmony_ci 65362306a36Sopenharmony_ci ce = intel_context_create(engine); 65462306a36Sopenharmony_ci if (IS_ERR(ce)) { 65562306a36Sopenharmony_ci err = PTR_ERR(ce); 65662306a36Sopenharmony_ci goto out_spin; 65762306a36Sopenharmony_ci } 65862306a36Sopenharmony_ci 65962306a36Sopenharmony_ci rq = igt_spinner_create_request(&spin, ce, MI_ARB_CHECK); 66062306a36Sopenharmony_ci if (IS_ERR(rq)) { 66162306a36Sopenharmony_ci err = PTR_ERR(rq); 66262306a36Sopenharmony_ci goto out_ce; 66362306a36Sopenharmony_ci } 66462306a36Sopenharmony_ci 66562306a36Sopenharmony_ci pr_debug("%s: Cancelling inactive request\n", engine->name); 66662306a36Sopenharmony_ci i915_request_cancel(rq, -EINTR); 66762306a36Sopenharmony_ci i915_request_get(rq); 66862306a36Sopenharmony_ci i915_request_add(rq); 66962306a36Sopenharmony_ci 67062306a36Sopenharmony_ci if (i915_request_wait(rq, 0, HZ / 5) < 0) { 67162306a36Sopenharmony_ci struct drm_printer p = drm_info_printer(engine->i915->drm.dev); 67262306a36Sopenharmony_ci 67362306a36Sopenharmony_ci pr_err("%s: Failed to cancel inactive request\n", engine->name); 67462306a36Sopenharmony_ci intel_engine_dump(engine, &p, "%s\n", engine->name); 67562306a36Sopenharmony_ci err = -ETIME; 67662306a36Sopenharmony_ci goto out_rq; 67762306a36Sopenharmony_ci } 67862306a36Sopenharmony_ci 67962306a36Sopenharmony_ci if (rq->fence.error != -EINTR) { 68062306a36Sopenharmony_ci pr_err("%s: fence not cancelled (%u)\n", 68162306a36Sopenharmony_ci engine->name, rq->fence.error); 68262306a36Sopenharmony_ci err = -EINVAL; 68362306a36Sopenharmony_ci } 68462306a36Sopenharmony_ci 68562306a36Sopenharmony_ciout_rq: 68662306a36Sopenharmony_ci i915_request_put(rq); 68762306a36Sopenharmony_ciout_ce: 68862306a36Sopenharmony_ci intel_context_put(ce); 68962306a36Sopenharmony_ciout_spin: 69062306a36Sopenharmony_ci igt_spinner_fini(&spin); 69162306a36Sopenharmony_ci if (err) 69262306a36Sopenharmony_ci pr_err("%s: %s error %d\n", __func__, engine->name, err); 69362306a36Sopenharmony_ci return err; 69462306a36Sopenharmony_ci} 69562306a36Sopenharmony_ci 69662306a36Sopenharmony_cistatic int __cancel_active(struct intel_engine_cs *engine) 69762306a36Sopenharmony_ci{ 69862306a36Sopenharmony_ci struct intel_context *ce; 69962306a36Sopenharmony_ci struct igt_spinner spin; 70062306a36Sopenharmony_ci struct i915_request *rq; 70162306a36Sopenharmony_ci int err = 0; 70262306a36Sopenharmony_ci 70362306a36Sopenharmony_ci if (igt_spinner_init(&spin, engine->gt)) 70462306a36Sopenharmony_ci return -ENOMEM; 70562306a36Sopenharmony_ci 70662306a36Sopenharmony_ci ce = intel_context_create(engine); 70762306a36Sopenharmony_ci if (IS_ERR(ce)) { 70862306a36Sopenharmony_ci err = PTR_ERR(ce); 70962306a36Sopenharmony_ci goto out_spin; 71062306a36Sopenharmony_ci } 71162306a36Sopenharmony_ci 71262306a36Sopenharmony_ci rq = igt_spinner_create_request(&spin, ce, MI_ARB_CHECK); 71362306a36Sopenharmony_ci if (IS_ERR(rq)) { 71462306a36Sopenharmony_ci err = PTR_ERR(rq); 71562306a36Sopenharmony_ci goto out_ce; 71662306a36Sopenharmony_ci } 71762306a36Sopenharmony_ci 71862306a36Sopenharmony_ci pr_debug("%s: Cancelling active request\n", engine->name); 71962306a36Sopenharmony_ci i915_request_get(rq); 72062306a36Sopenharmony_ci i915_request_add(rq); 72162306a36Sopenharmony_ci if (!igt_wait_for_spinner(&spin, rq)) { 72262306a36Sopenharmony_ci struct drm_printer p = drm_info_printer(engine->i915->drm.dev); 72362306a36Sopenharmony_ci 72462306a36Sopenharmony_ci pr_err("Failed to start spinner on %s\n", engine->name); 72562306a36Sopenharmony_ci intel_engine_dump(engine, &p, "%s\n", engine->name); 72662306a36Sopenharmony_ci err = -ETIME; 72762306a36Sopenharmony_ci goto out_rq; 72862306a36Sopenharmony_ci } 72962306a36Sopenharmony_ci i915_request_cancel(rq, -EINTR); 73062306a36Sopenharmony_ci 73162306a36Sopenharmony_ci if (i915_request_wait(rq, 0, HZ / 5) < 0) { 73262306a36Sopenharmony_ci struct drm_printer p = drm_info_printer(engine->i915->drm.dev); 73362306a36Sopenharmony_ci 73462306a36Sopenharmony_ci pr_err("%s: Failed to cancel active request\n", engine->name); 73562306a36Sopenharmony_ci intel_engine_dump(engine, &p, "%s\n", engine->name); 73662306a36Sopenharmony_ci err = -ETIME; 73762306a36Sopenharmony_ci goto out_rq; 73862306a36Sopenharmony_ci } 73962306a36Sopenharmony_ci 74062306a36Sopenharmony_ci if (rq->fence.error != -EINTR) { 74162306a36Sopenharmony_ci pr_err("%s: fence not cancelled (%u)\n", 74262306a36Sopenharmony_ci engine->name, rq->fence.error); 74362306a36Sopenharmony_ci err = -EINVAL; 74462306a36Sopenharmony_ci } 74562306a36Sopenharmony_ci 74662306a36Sopenharmony_ciout_rq: 74762306a36Sopenharmony_ci i915_request_put(rq); 74862306a36Sopenharmony_ciout_ce: 74962306a36Sopenharmony_ci intel_context_put(ce); 75062306a36Sopenharmony_ciout_spin: 75162306a36Sopenharmony_ci igt_spinner_fini(&spin); 75262306a36Sopenharmony_ci if (err) 75362306a36Sopenharmony_ci pr_err("%s: %s error %d\n", __func__, engine->name, err); 75462306a36Sopenharmony_ci return err; 75562306a36Sopenharmony_ci} 75662306a36Sopenharmony_ci 75762306a36Sopenharmony_cistatic int __cancel_completed(struct intel_engine_cs *engine) 75862306a36Sopenharmony_ci{ 75962306a36Sopenharmony_ci struct intel_context *ce; 76062306a36Sopenharmony_ci struct igt_spinner spin; 76162306a36Sopenharmony_ci struct i915_request *rq; 76262306a36Sopenharmony_ci int err = 0; 76362306a36Sopenharmony_ci 76462306a36Sopenharmony_ci if (igt_spinner_init(&spin, engine->gt)) 76562306a36Sopenharmony_ci return -ENOMEM; 76662306a36Sopenharmony_ci 76762306a36Sopenharmony_ci ce = intel_context_create(engine); 76862306a36Sopenharmony_ci if (IS_ERR(ce)) { 76962306a36Sopenharmony_ci err = PTR_ERR(ce); 77062306a36Sopenharmony_ci goto out_spin; 77162306a36Sopenharmony_ci } 77262306a36Sopenharmony_ci 77362306a36Sopenharmony_ci rq = igt_spinner_create_request(&spin, ce, MI_ARB_CHECK); 77462306a36Sopenharmony_ci if (IS_ERR(rq)) { 77562306a36Sopenharmony_ci err = PTR_ERR(rq); 77662306a36Sopenharmony_ci goto out_ce; 77762306a36Sopenharmony_ci } 77862306a36Sopenharmony_ci igt_spinner_end(&spin); 77962306a36Sopenharmony_ci i915_request_get(rq); 78062306a36Sopenharmony_ci i915_request_add(rq); 78162306a36Sopenharmony_ci 78262306a36Sopenharmony_ci if (i915_request_wait(rq, 0, HZ / 5) < 0) { 78362306a36Sopenharmony_ci err = -ETIME; 78462306a36Sopenharmony_ci goto out_rq; 78562306a36Sopenharmony_ci } 78662306a36Sopenharmony_ci 78762306a36Sopenharmony_ci pr_debug("%s: Cancelling completed request\n", engine->name); 78862306a36Sopenharmony_ci i915_request_cancel(rq, -EINTR); 78962306a36Sopenharmony_ci if (rq->fence.error) { 79062306a36Sopenharmony_ci pr_err("%s: fence not cancelled (%u)\n", 79162306a36Sopenharmony_ci engine->name, rq->fence.error); 79262306a36Sopenharmony_ci err = -EINVAL; 79362306a36Sopenharmony_ci } 79462306a36Sopenharmony_ci 79562306a36Sopenharmony_ciout_rq: 79662306a36Sopenharmony_ci i915_request_put(rq); 79762306a36Sopenharmony_ciout_ce: 79862306a36Sopenharmony_ci intel_context_put(ce); 79962306a36Sopenharmony_ciout_spin: 80062306a36Sopenharmony_ci igt_spinner_fini(&spin); 80162306a36Sopenharmony_ci if (err) 80262306a36Sopenharmony_ci pr_err("%s: %s error %d\n", __func__, engine->name, err); 80362306a36Sopenharmony_ci return err; 80462306a36Sopenharmony_ci} 80562306a36Sopenharmony_ci 80662306a36Sopenharmony_ci/* 80762306a36Sopenharmony_ci * Test to prove a non-preemptable request can be cancelled and a subsequent 80862306a36Sopenharmony_ci * request on the same context can successfully complete after cancellation. 80962306a36Sopenharmony_ci * 81062306a36Sopenharmony_ci * Testing methodology is to create a non-preemptible request and submit it, 81162306a36Sopenharmony_ci * wait for spinner to start, create a NOP request and submit it, cancel the 81262306a36Sopenharmony_ci * spinner, wait for spinner to complete and verify it failed with an error, 81362306a36Sopenharmony_ci * finally wait for NOP request to complete verify it succeeded without an 81462306a36Sopenharmony_ci * error. Preemption timeout also reduced / restored so test runs in a timely 81562306a36Sopenharmony_ci * maner. 81662306a36Sopenharmony_ci */ 81762306a36Sopenharmony_cistatic int __cancel_reset(struct drm_i915_private *i915, 81862306a36Sopenharmony_ci struct intel_engine_cs *engine) 81962306a36Sopenharmony_ci{ 82062306a36Sopenharmony_ci struct intel_context *ce; 82162306a36Sopenharmony_ci struct igt_spinner spin; 82262306a36Sopenharmony_ci struct i915_request *rq, *nop; 82362306a36Sopenharmony_ci unsigned long preempt_timeout_ms; 82462306a36Sopenharmony_ci int err = 0; 82562306a36Sopenharmony_ci 82662306a36Sopenharmony_ci if (!CONFIG_DRM_I915_PREEMPT_TIMEOUT || 82762306a36Sopenharmony_ci !intel_has_reset_engine(engine->gt)) 82862306a36Sopenharmony_ci return 0; 82962306a36Sopenharmony_ci 83062306a36Sopenharmony_ci preempt_timeout_ms = engine->props.preempt_timeout_ms; 83162306a36Sopenharmony_ci engine->props.preempt_timeout_ms = 100; 83262306a36Sopenharmony_ci 83362306a36Sopenharmony_ci if (igt_spinner_init(&spin, engine->gt)) 83462306a36Sopenharmony_ci goto out_restore; 83562306a36Sopenharmony_ci 83662306a36Sopenharmony_ci ce = intel_context_create(engine); 83762306a36Sopenharmony_ci if (IS_ERR(ce)) { 83862306a36Sopenharmony_ci err = PTR_ERR(ce); 83962306a36Sopenharmony_ci goto out_spin; 84062306a36Sopenharmony_ci } 84162306a36Sopenharmony_ci 84262306a36Sopenharmony_ci rq = igt_spinner_create_request(&spin, ce, MI_NOOP); 84362306a36Sopenharmony_ci if (IS_ERR(rq)) { 84462306a36Sopenharmony_ci err = PTR_ERR(rq); 84562306a36Sopenharmony_ci goto out_ce; 84662306a36Sopenharmony_ci } 84762306a36Sopenharmony_ci 84862306a36Sopenharmony_ci pr_debug("%s: Cancelling active non-preemptable request\n", 84962306a36Sopenharmony_ci engine->name); 85062306a36Sopenharmony_ci i915_request_get(rq); 85162306a36Sopenharmony_ci i915_request_add(rq); 85262306a36Sopenharmony_ci if (!igt_wait_for_spinner(&spin, rq)) { 85362306a36Sopenharmony_ci struct drm_printer p = drm_info_printer(engine->i915->drm.dev); 85462306a36Sopenharmony_ci 85562306a36Sopenharmony_ci pr_err("Failed to start spinner on %s\n", engine->name); 85662306a36Sopenharmony_ci intel_engine_dump(engine, &p, "%s\n", engine->name); 85762306a36Sopenharmony_ci err = -ETIME; 85862306a36Sopenharmony_ci goto out_rq; 85962306a36Sopenharmony_ci } 86062306a36Sopenharmony_ci 86162306a36Sopenharmony_ci nop = intel_context_create_request(ce); 86262306a36Sopenharmony_ci if (IS_ERR(nop)) 86362306a36Sopenharmony_ci goto out_rq; 86462306a36Sopenharmony_ci i915_request_get(nop); 86562306a36Sopenharmony_ci i915_request_add(nop); 86662306a36Sopenharmony_ci 86762306a36Sopenharmony_ci i915_request_cancel(rq, -EINTR); 86862306a36Sopenharmony_ci 86962306a36Sopenharmony_ci if (i915_request_wait(rq, 0, HZ) < 0) { 87062306a36Sopenharmony_ci struct drm_printer p = drm_info_printer(engine->i915->drm.dev); 87162306a36Sopenharmony_ci 87262306a36Sopenharmony_ci pr_err("%s: Failed to cancel hung request\n", engine->name); 87362306a36Sopenharmony_ci intel_engine_dump(engine, &p, "%s\n", engine->name); 87462306a36Sopenharmony_ci err = -ETIME; 87562306a36Sopenharmony_ci goto out_nop; 87662306a36Sopenharmony_ci } 87762306a36Sopenharmony_ci 87862306a36Sopenharmony_ci if (rq->fence.error != -EINTR) { 87962306a36Sopenharmony_ci pr_err("%s: fence not cancelled (%u)\n", 88062306a36Sopenharmony_ci engine->name, rq->fence.error); 88162306a36Sopenharmony_ci err = -EINVAL; 88262306a36Sopenharmony_ci goto out_nop; 88362306a36Sopenharmony_ci } 88462306a36Sopenharmony_ci 88562306a36Sopenharmony_ci if (i915_request_wait(nop, 0, HZ) < 0) { 88662306a36Sopenharmony_ci struct drm_printer p = drm_info_printer(engine->i915->drm.dev); 88762306a36Sopenharmony_ci 88862306a36Sopenharmony_ci pr_err("%s: Failed to complete nop request\n", engine->name); 88962306a36Sopenharmony_ci intel_engine_dump(engine, &p, "%s\n", engine->name); 89062306a36Sopenharmony_ci err = -ETIME; 89162306a36Sopenharmony_ci goto out_nop; 89262306a36Sopenharmony_ci } 89362306a36Sopenharmony_ci 89462306a36Sopenharmony_ci if (nop->fence.error != 0) { 89562306a36Sopenharmony_ci pr_err("%s: Nop request errored (%u)\n", 89662306a36Sopenharmony_ci engine->name, nop->fence.error); 89762306a36Sopenharmony_ci err = -EINVAL; 89862306a36Sopenharmony_ci } 89962306a36Sopenharmony_ci 90062306a36Sopenharmony_ciout_nop: 90162306a36Sopenharmony_ci i915_request_put(nop); 90262306a36Sopenharmony_ciout_rq: 90362306a36Sopenharmony_ci i915_request_put(rq); 90462306a36Sopenharmony_ciout_ce: 90562306a36Sopenharmony_ci intel_context_put(ce); 90662306a36Sopenharmony_ciout_spin: 90762306a36Sopenharmony_ci igt_spinner_fini(&spin); 90862306a36Sopenharmony_ciout_restore: 90962306a36Sopenharmony_ci engine->props.preempt_timeout_ms = preempt_timeout_ms; 91062306a36Sopenharmony_ci if (err) 91162306a36Sopenharmony_ci pr_err("%s: %s error %d\n", __func__, engine->name, err); 91262306a36Sopenharmony_ci return err; 91362306a36Sopenharmony_ci} 91462306a36Sopenharmony_ci 91562306a36Sopenharmony_cistatic int live_cancel_request(void *arg) 91662306a36Sopenharmony_ci{ 91762306a36Sopenharmony_ci struct drm_i915_private *i915 = arg; 91862306a36Sopenharmony_ci struct intel_engine_cs *engine; 91962306a36Sopenharmony_ci 92062306a36Sopenharmony_ci /* 92162306a36Sopenharmony_ci * Check cancellation of requests. We expect to be able to immediately 92262306a36Sopenharmony_ci * cancel active requests, even if they are currently on the GPU. 92362306a36Sopenharmony_ci */ 92462306a36Sopenharmony_ci 92562306a36Sopenharmony_ci for_each_uabi_engine(engine, i915) { 92662306a36Sopenharmony_ci struct igt_live_test t; 92762306a36Sopenharmony_ci int err, err2; 92862306a36Sopenharmony_ci 92962306a36Sopenharmony_ci if (!intel_engine_has_preemption(engine)) 93062306a36Sopenharmony_ci continue; 93162306a36Sopenharmony_ci 93262306a36Sopenharmony_ci err = igt_live_test_begin(&t, i915, __func__, engine->name); 93362306a36Sopenharmony_ci if (err) 93462306a36Sopenharmony_ci return err; 93562306a36Sopenharmony_ci 93662306a36Sopenharmony_ci err = __cancel_inactive(engine); 93762306a36Sopenharmony_ci if (err == 0) 93862306a36Sopenharmony_ci err = __cancel_active(engine); 93962306a36Sopenharmony_ci if (err == 0) 94062306a36Sopenharmony_ci err = __cancel_completed(engine); 94162306a36Sopenharmony_ci 94262306a36Sopenharmony_ci err2 = igt_live_test_end(&t); 94362306a36Sopenharmony_ci if (err) 94462306a36Sopenharmony_ci return err; 94562306a36Sopenharmony_ci if (err2) 94662306a36Sopenharmony_ci return err2; 94762306a36Sopenharmony_ci 94862306a36Sopenharmony_ci /* Expects reset so call outside of igt_live_test_* */ 94962306a36Sopenharmony_ci err = __cancel_reset(i915, engine); 95062306a36Sopenharmony_ci if (err) 95162306a36Sopenharmony_ci return err; 95262306a36Sopenharmony_ci 95362306a36Sopenharmony_ci if (igt_flush_test(i915)) 95462306a36Sopenharmony_ci return -EIO; 95562306a36Sopenharmony_ci } 95662306a36Sopenharmony_ci 95762306a36Sopenharmony_ci return 0; 95862306a36Sopenharmony_ci} 95962306a36Sopenharmony_ci 96062306a36Sopenharmony_cistatic struct i915_vma *empty_batch(struct intel_gt *gt) 96162306a36Sopenharmony_ci{ 96262306a36Sopenharmony_ci struct drm_i915_gem_object *obj; 96362306a36Sopenharmony_ci struct i915_vma *vma; 96462306a36Sopenharmony_ci u32 *cmd; 96562306a36Sopenharmony_ci int err; 96662306a36Sopenharmony_ci 96762306a36Sopenharmony_ci obj = i915_gem_object_create_internal(gt->i915, PAGE_SIZE); 96862306a36Sopenharmony_ci if (IS_ERR(obj)) 96962306a36Sopenharmony_ci return ERR_CAST(obj); 97062306a36Sopenharmony_ci 97162306a36Sopenharmony_ci cmd = i915_gem_object_pin_map_unlocked(obj, I915_MAP_WC); 97262306a36Sopenharmony_ci if (IS_ERR(cmd)) { 97362306a36Sopenharmony_ci err = PTR_ERR(cmd); 97462306a36Sopenharmony_ci goto err; 97562306a36Sopenharmony_ci } 97662306a36Sopenharmony_ci 97762306a36Sopenharmony_ci *cmd = MI_BATCH_BUFFER_END; 97862306a36Sopenharmony_ci 97962306a36Sopenharmony_ci __i915_gem_object_flush_map(obj, 0, 64); 98062306a36Sopenharmony_ci i915_gem_object_unpin_map(obj); 98162306a36Sopenharmony_ci 98262306a36Sopenharmony_ci intel_gt_chipset_flush(gt); 98362306a36Sopenharmony_ci 98462306a36Sopenharmony_ci vma = i915_vma_instance(obj, gt->vm, NULL); 98562306a36Sopenharmony_ci if (IS_ERR(vma)) { 98662306a36Sopenharmony_ci err = PTR_ERR(vma); 98762306a36Sopenharmony_ci goto err; 98862306a36Sopenharmony_ci } 98962306a36Sopenharmony_ci 99062306a36Sopenharmony_ci err = i915_vma_pin(vma, 0, 0, PIN_USER); 99162306a36Sopenharmony_ci if (err) 99262306a36Sopenharmony_ci goto err; 99362306a36Sopenharmony_ci 99462306a36Sopenharmony_ci /* Force the wait now to avoid including it in the benchmark */ 99562306a36Sopenharmony_ci err = i915_vma_sync(vma); 99662306a36Sopenharmony_ci if (err) 99762306a36Sopenharmony_ci goto err_pin; 99862306a36Sopenharmony_ci 99962306a36Sopenharmony_ci return vma; 100062306a36Sopenharmony_ci 100162306a36Sopenharmony_cierr_pin: 100262306a36Sopenharmony_ci i915_vma_unpin(vma); 100362306a36Sopenharmony_cierr: 100462306a36Sopenharmony_ci i915_gem_object_put(obj); 100562306a36Sopenharmony_ci return ERR_PTR(err); 100662306a36Sopenharmony_ci} 100762306a36Sopenharmony_ci 100862306a36Sopenharmony_cistatic int emit_bb_start(struct i915_request *rq, struct i915_vma *batch) 100962306a36Sopenharmony_ci{ 101062306a36Sopenharmony_ci return rq->engine->emit_bb_start(rq, 101162306a36Sopenharmony_ci i915_vma_offset(batch), 101262306a36Sopenharmony_ci i915_vma_size(batch), 101362306a36Sopenharmony_ci 0); 101462306a36Sopenharmony_ci} 101562306a36Sopenharmony_ci 101662306a36Sopenharmony_cistatic struct i915_request * 101762306a36Sopenharmony_ciempty_request(struct intel_engine_cs *engine, 101862306a36Sopenharmony_ci struct i915_vma *batch) 101962306a36Sopenharmony_ci{ 102062306a36Sopenharmony_ci struct i915_request *request; 102162306a36Sopenharmony_ci int err; 102262306a36Sopenharmony_ci 102362306a36Sopenharmony_ci request = i915_request_create(engine->kernel_context); 102462306a36Sopenharmony_ci if (IS_ERR(request)) 102562306a36Sopenharmony_ci return request; 102662306a36Sopenharmony_ci 102762306a36Sopenharmony_ci err = emit_bb_start(request, batch); 102862306a36Sopenharmony_ci if (err) 102962306a36Sopenharmony_ci goto out_request; 103062306a36Sopenharmony_ci 103162306a36Sopenharmony_ci i915_request_get(request); 103262306a36Sopenharmony_ciout_request: 103362306a36Sopenharmony_ci i915_request_add(request); 103462306a36Sopenharmony_ci return err ? ERR_PTR(err) : request; 103562306a36Sopenharmony_ci} 103662306a36Sopenharmony_ci 103762306a36Sopenharmony_cistatic int live_empty_request(void *arg) 103862306a36Sopenharmony_ci{ 103962306a36Sopenharmony_ci struct drm_i915_private *i915 = arg; 104062306a36Sopenharmony_ci struct intel_engine_cs *engine; 104162306a36Sopenharmony_ci struct igt_live_test t; 104262306a36Sopenharmony_ci int err; 104362306a36Sopenharmony_ci 104462306a36Sopenharmony_ci /* 104562306a36Sopenharmony_ci * Submit various sized batches of empty requests, to each engine 104662306a36Sopenharmony_ci * (individually), and wait for the batch to complete. We can check 104762306a36Sopenharmony_ci * the overhead of submitting requests to the hardware. 104862306a36Sopenharmony_ci */ 104962306a36Sopenharmony_ci 105062306a36Sopenharmony_ci for_each_uabi_engine(engine, i915) { 105162306a36Sopenharmony_ci IGT_TIMEOUT(end_time); 105262306a36Sopenharmony_ci struct i915_request *request; 105362306a36Sopenharmony_ci struct i915_vma *batch; 105462306a36Sopenharmony_ci unsigned long n, prime; 105562306a36Sopenharmony_ci ktime_t times[2] = {}; 105662306a36Sopenharmony_ci 105762306a36Sopenharmony_ci batch = empty_batch(engine->gt); 105862306a36Sopenharmony_ci if (IS_ERR(batch)) 105962306a36Sopenharmony_ci return PTR_ERR(batch); 106062306a36Sopenharmony_ci 106162306a36Sopenharmony_ci err = igt_live_test_begin(&t, i915, __func__, engine->name); 106262306a36Sopenharmony_ci if (err) 106362306a36Sopenharmony_ci goto out_batch; 106462306a36Sopenharmony_ci 106562306a36Sopenharmony_ci intel_engine_pm_get(engine); 106662306a36Sopenharmony_ci 106762306a36Sopenharmony_ci /* Warmup / preload */ 106862306a36Sopenharmony_ci request = empty_request(engine, batch); 106962306a36Sopenharmony_ci if (IS_ERR(request)) { 107062306a36Sopenharmony_ci err = PTR_ERR(request); 107162306a36Sopenharmony_ci intel_engine_pm_put(engine); 107262306a36Sopenharmony_ci goto out_batch; 107362306a36Sopenharmony_ci } 107462306a36Sopenharmony_ci i915_request_wait(request, 0, MAX_SCHEDULE_TIMEOUT); 107562306a36Sopenharmony_ci 107662306a36Sopenharmony_ci for_each_prime_number_from(prime, 1, 8192) { 107762306a36Sopenharmony_ci times[1] = ktime_get_raw(); 107862306a36Sopenharmony_ci 107962306a36Sopenharmony_ci for (n = 0; n < prime; n++) { 108062306a36Sopenharmony_ci i915_request_put(request); 108162306a36Sopenharmony_ci request = empty_request(engine, batch); 108262306a36Sopenharmony_ci if (IS_ERR(request)) { 108362306a36Sopenharmony_ci err = PTR_ERR(request); 108462306a36Sopenharmony_ci intel_engine_pm_put(engine); 108562306a36Sopenharmony_ci goto out_batch; 108662306a36Sopenharmony_ci } 108762306a36Sopenharmony_ci } 108862306a36Sopenharmony_ci i915_request_wait(request, 0, MAX_SCHEDULE_TIMEOUT); 108962306a36Sopenharmony_ci 109062306a36Sopenharmony_ci times[1] = ktime_sub(ktime_get_raw(), times[1]); 109162306a36Sopenharmony_ci if (prime == 1) 109262306a36Sopenharmony_ci times[0] = times[1]; 109362306a36Sopenharmony_ci 109462306a36Sopenharmony_ci if (__igt_timeout(end_time, NULL)) 109562306a36Sopenharmony_ci break; 109662306a36Sopenharmony_ci } 109762306a36Sopenharmony_ci i915_request_put(request); 109862306a36Sopenharmony_ci intel_engine_pm_put(engine); 109962306a36Sopenharmony_ci 110062306a36Sopenharmony_ci err = igt_live_test_end(&t); 110162306a36Sopenharmony_ci if (err) 110262306a36Sopenharmony_ci goto out_batch; 110362306a36Sopenharmony_ci 110462306a36Sopenharmony_ci pr_info("Batch latencies on %s: 1 = %lluns, %lu = %lluns\n", 110562306a36Sopenharmony_ci engine->name, 110662306a36Sopenharmony_ci ktime_to_ns(times[0]), 110762306a36Sopenharmony_ci prime, div64_u64(ktime_to_ns(times[1]), prime)); 110862306a36Sopenharmony_ciout_batch: 110962306a36Sopenharmony_ci i915_vma_unpin(batch); 111062306a36Sopenharmony_ci i915_vma_put(batch); 111162306a36Sopenharmony_ci if (err) 111262306a36Sopenharmony_ci break; 111362306a36Sopenharmony_ci } 111462306a36Sopenharmony_ci 111562306a36Sopenharmony_ci return err; 111662306a36Sopenharmony_ci} 111762306a36Sopenharmony_ci 111862306a36Sopenharmony_cistatic struct i915_vma *recursive_batch(struct intel_gt *gt) 111962306a36Sopenharmony_ci{ 112062306a36Sopenharmony_ci struct drm_i915_gem_object *obj; 112162306a36Sopenharmony_ci const int ver = GRAPHICS_VER(gt->i915); 112262306a36Sopenharmony_ci struct i915_vma *vma; 112362306a36Sopenharmony_ci u32 *cmd; 112462306a36Sopenharmony_ci int err; 112562306a36Sopenharmony_ci 112662306a36Sopenharmony_ci obj = i915_gem_object_create_internal(gt->i915, PAGE_SIZE); 112762306a36Sopenharmony_ci if (IS_ERR(obj)) 112862306a36Sopenharmony_ci return ERR_CAST(obj); 112962306a36Sopenharmony_ci 113062306a36Sopenharmony_ci vma = i915_vma_instance(obj, gt->vm, NULL); 113162306a36Sopenharmony_ci if (IS_ERR(vma)) { 113262306a36Sopenharmony_ci err = PTR_ERR(vma); 113362306a36Sopenharmony_ci goto err; 113462306a36Sopenharmony_ci } 113562306a36Sopenharmony_ci 113662306a36Sopenharmony_ci err = i915_vma_pin(vma, 0, 0, PIN_USER); 113762306a36Sopenharmony_ci if (err) 113862306a36Sopenharmony_ci goto err; 113962306a36Sopenharmony_ci 114062306a36Sopenharmony_ci cmd = i915_gem_object_pin_map_unlocked(obj, I915_MAP_WC); 114162306a36Sopenharmony_ci if (IS_ERR(cmd)) { 114262306a36Sopenharmony_ci err = PTR_ERR(cmd); 114362306a36Sopenharmony_ci goto err; 114462306a36Sopenharmony_ci } 114562306a36Sopenharmony_ci 114662306a36Sopenharmony_ci if (ver >= 8) { 114762306a36Sopenharmony_ci *cmd++ = MI_BATCH_BUFFER_START | 1 << 8 | 1; 114862306a36Sopenharmony_ci *cmd++ = lower_32_bits(i915_vma_offset(vma)); 114962306a36Sopenharmony_ci *cmd++ = upper_32_bits(i915_vma_offset(vma)); 115062306a36Sopenharmony_ci } else if (ver >= 6) { 115162306a36Sopenharmony_ci *cmd++ = MI_BATCH_BUFFER_START | 1 << 8; 115262306a36Sopenharmony_ci *cmd++ = lower_32_bits(i915_vma_offset(vma)); 115362306a36Sopenharmony_ci } else { 115462306a36Sopenharmony_ci *cmd++ = MI_BATCH_BUFFER_START | MI_BATCH_GTT; 115562306a36Sopenharmony_ci *cmd++ = lower_32_bits(i915_vma_offset(vma)); 115662306a36Sopenharmony_ci } 115762306a36Sopenharmony_ci *cmd++ = MI_BATCH_BUFFER_END; /* terminate early in case of error */ 115862306a36Sopenharmony_ci 115962306a36Sopenharmony_ci __i915_gem_object_flush_map(obj, 0, 64); 116062306a36Sopenharmony_ci i915_gem_object_unpin_map(obj); 116162306a36Sopenharmony_ci 116262306a36Sopenharmony_ci intel_gt_chipset_flush(gt); 116362306a36Sopenharmony_ci 116462306a36Sopenharmony_ci return vma; 116562306a36Sopenharmony_ci 116662306a36Sopenharmony_cierr: 116762306a36Sopenharmony_ci i915_gem_object_put(obj); 116862306a36Sopenharmony_ci return ERR_PTR(err); 116962306a36Sopenharmony_ci} 117062306a36Sopenharmony_ci 117162306a36Sopenharmony_cistatic int recursive_batch_resolve(struct i915_vma *batch) 117262306a36Sopenharmony_ci{ 117362306a36Sopenharmony_ci u32 *cmd; 117462306a36Sopenharmony_ci 117562306a36Sopenharmony_ci cmd = i915_gem_object_pin_map_unlocked(batch->obj, I915_MAP_WC); 117662306a36Sopenharmony_ci if (IS_ERR(cmd)) 117762306a36Sopenharmony_ci return PTR_ERR(cmd); 117862306a36Sopenharmony_ci 117962306a36Sopenharmony_ci *cmd = MI_BATCH_BUFFER_END; 118062306a36Sopenharmony_ci 118162306a36Sopenharmony_ci __i915_gem_object_flush_map(batch->obj, 0, sizeof(*cmd)); 118262306a36Sopenharmony_ci i915_gem_object_unpin_map(batch->obj); 118362306a36Sopenharmony_ci 118462306a36Sopenharmony_ci intel_gt_chipset_flush(batch->vm->gt); 118562306a36Sopenharmony_ci 118662306a36Sopenharmony_ci return 0; 118762306a36Sopenharmony_ci} 118862306a36Sopenharmony_ci 118962306a36Sopenharmony_cistatic int live_all_engines(void *arg) 119062306a36Sopenharmony_ci{ 119162306a36Sopenharmony_ci struct drm_i915_private *i915 = arg; 119262306a36Sopenharmony_ci const unsigned int nengines = num_uabi_engines(i915); 119362306a36Sopenharmony_ci struct intel_engine_cs *engine; 119462306a36Sopenharmony_ci struct i915_request **request; 119562306a36Sopenharmony_ci struct igt_live_test t; 119662306a36Sopenharmony_ci unsigned int idx; 119762306a36Sopenharmony_ci int err; 119862306a36Sopenharmony_ci 119962306a36Sopenharmony_ci /* 120062306a36Sopenharmony_ci * Check we can submit requests to all engines simultaneously. We 120162306a36Sopenharmony_ci * send a recursive batch to each engine - checking that we don't 120262306a36Sopenharmony_ci * block doing so, and that they don't complete too soon. 120362306a36Sopenharmony_ci */ 120462306a36Sopenharmony_ci 120562306a36Sopenharmony_ci request = kcalloc(nengines, sizeof(*request), GFP_KERNEL); 120662306a36Sopenharmony_ci if (!request) 120762306a36Sopenharmony_ci return -ENOMEM; 120862306a36Sopenharmony_ci 120962306a36Sopenharmony_ci err = igt_live_test_begin(&t, i915, __func__, ""); 121062306a36Sopenharmony_ci if (err) 121162306a36Sopenharmony_ci goto out_free; 121262306a36Sopenharmony_ci 121362306a36Sopenharmony_ci idx = 0; 121462306a36Sopenharmony_ci for_each_uabi_engine(engine, i915) { 121562306a36Sopenharmony_ci struct i915_vma *batch; 121662306a36Sopenharmony_ci 121762306a36Sopenharmony_ci batch = recursive_batch(engine->gt); 121862306a36Sopenharmony_ci if (IS_ERR(batch)) { 121962306a36Sopenharmony_ci err = PTR_ERR(batch); 122062306a36Sopenharmony_ci pr_err("%s: Unable to create batch, err=%d\n", 122162306a36Sopenharmony_ci __func__, err); 122262306a36Sopenharmony_ci goto out_free; 122362306a36Sopenharmony_ci } 122462306a36Sopenharmony_ci 122562306a36Sopenharmony_ci i915_vma_lock(batch); 122662306a36Sopenharmony_ci request[idx] = intel_engine_create_kernel_request(engine); 122762306a36Sopenharmony_ci if (IS_ERR(request[idx])) { 122862306a36Sopenharmony_ci err = PTR_ERR(request[idx]); 122962306a36Sopenharmony_ci pr_err("%s: Request allocation failed with err=%d\n", 123062306a36Sopenharmony_ci __func__, err); 123162306a36Sopenharmony_ci goto out_unlock; 123262306a36Sopenharmony_ci } 123362306a36Sopenharmony_ci GEM_BUG_ON(request[idx]->context->vm != batch->vm); 123462306a36Sopenharmony_ci 123562306a36Sopenharmony_ci err = i915_vma_move_to_active(batch, request[idx], 0); 123662306a36Sopenharmony_ci GEM_BUG_ON(err); 123762306a36Sopenharmony_ci 123862306a36Sopenharmony_ci err = emit_bb_start(request[idx], batch); 123962306a36Sopenharmony_ci GEM_BUG_ON(err); 124062306a36Sopenharmony_ci request[idx]->batch = batch; 124162306a36Sopenharmony_ci 124262306a36Sopenharmony_ci i915_request_get(request[idx]); 124362306a36Sopenharmony_ci i915_request_add(request[idx]); 124462306a36Sopenharmony_ci idx++; 124562306a36Sopenharmony_ciout_unlock: 124662306a36Sopenharmony_ci i915_vma_unlock(batch); 124762306a36Sopenharmony_ci if (err) 124862306a36Sopenharmony_ci goto out_request; 124962306a36Sopenharmony_ci } 125062306a36Sopenharmony_ci 125162306a36Sopenharmony_ci idx = 0; 125262306a36Sopenharmony_ci for_each_uabi_engine(engine, i915) { 125362306a36Sopenharmony_ci if (i915_request_completed(request[idx])) { 125462306a36Sopenharmony_ci pr_err("%s(%s): request completed too early!\n", 125562306a36Sopenharmony_ci __func__, engine->name); 125662306a36Sopenharmony_ci err = -EINVAL; 125762306a36Sopenharmony_ci goto out_request; 125862306a36Sopenharmony_ci } 125962306a36Sopenharmony_ci idx++; 126062306a36Sopenharmony_ci } 126162306a36Sopenharmony_ci 126262306a36Sopenharmony_ci idx = 0; 126362306a36Sopenharmony_ci for_each_uabi_engine(engine, i915) { 126462306a36Sopenharmony_ci err = recursive_batch_resolve(request[idx]->batch); 126562306a36Sopenharmony_ci if (err) { 126662306a36Sopenharmony_ci pr_err("%s: failed to resolve batch, err=%d\n", 126762306a36Sopenharmony_ci __func__, err); 126862306a36Sopenharmony_ci goto out_request; 126962306a36Sopenharmony_ci } 127062306a36Sopenharmony_ci idx++; 127162306a36Sopenharmony_ci } 127262306a36Sopenharmony_ci 127362306a36Sopenharmony_ci idx = 0; 127462306a36Sopenharmony_ci for_each_uabi_engine(engine, i915) { 127562306a36Sopenharmony_ci struct i915_request *rq = request[idx]; 127662306a36Sopenharmony_ci long timeout; 127762306a36Sopenharmony_ci 127862306a36Sopenharmony_ci timeout = i915_request_wait(rq, 0, 127962306a36Sopenharmony_ci MAX_SCHEDULE_TIMEOUT); 128062306a36Sopenharmony_ci if (timeout < 0) { 128162306a36Sopenharmony_ci err = timeout; 128262306a36Sopenharmony_ci pr_err("%s: error waiting for request on %s, err=%d\n", 128362306a36Sopenharmony_ci __func__, engine->name, err); 128462306a36Sopenharmony_ci goto out_request; 128562306a36Sopenharmony_ci } 128662306a36Sopenharmony_ci 128762306a36Sopenharmony_ci GEM_BUG_ON(!i915_request_completed(rq)); 128862306a36Sopenharmony_ci i915_vma_unpin(rq->batch); 128962306a36Sopenharmony_ci i915_vma_put(rq->batch); 129062306a36Sopenharmony_ci i915_request_put(rq); 129162306a36Sopenharmony_ci request[idx] = NULL; 129262306a36Sopenharmony_ci idx++; 129362306a36Sopenharmony_ci } 129462306a36Sopenharmony_ci 129562306a36Sopenharmony_ci err = igt_live_test_end(&t); 129662306a36Sopenharmony_ci 129762306a36Sopenharmony_ciout_request: 129862306a36Sopenharmony_ci idx = 0; 129962306a36Sopenharmony_ci for_each_uabi_engine(engine, i915) { 130062306a36Sopenharmony_ci struct i915_request *rq = request[idx]; 130162306a36Sopenharmony_ci 130262306a36Sopenharmony_ci if (!rq) 130362306a36Sopenharmony_ci continue; 130462306a36Sopenharmony_ci 130562306a36Sopenharmony_ci if (rq->batch) { 130662306a36Sopenharmony_ci i915_vma_unpin(rq->batch); 130762306a36Sopenharmony_ci i915_vma_put(rq->batch); 130862306a36Sopenharmony_ci } 130962306a36Sopenharmony_ci i915_request_put(rq); 131062306a36Sopenharmony_ci idx++; 131162306a36Sopenharmony_ci } 131262306a36Sopenharmony_ciout_free: 131362306a36Sopenharmony_ci kfree(request); 131462306a36Sopenharmony_ci return err; 131562306a36Sopenharmony_ci} 131662306a36Sopenharmony_ci 131762306a36Sopenharmony_cistatic int live_sequential_engines(void *arg) 131862306a36Sopenharmony_ci{ 131962306a36Sopenharmony_ci struct drm_i915_private *i915 = arg; 132062306a36Sopenharmony_ci const unsigned int nengines = num_uabi_engines(i915); 132162306a36Sopenharmony_ci struct i915_request **request; 132262306a36Sopenharmony_ci struct i915_request *prev = NULL; 132362306a36Sopenharmony_ci struct intel_engine_cs *engine; 132462306a36Sopenharmony_ci struct igt_live_test t; 132562306a36Sopenharmony_ci unsigned int idx; 132662306a36Sopenharmony_ci int err; 132762306a36Sopenharmony_ci 132862306a36Sopenharmony_ci /* 132962306a36Sopenharmony_ci * Check we can submit requests to all engines sequentially, such 133062306a36Sopenharmony_ci * that each successive request waits for the earlier ones. This 133162306a36Sopenharmony_ci * tests that we don't execute requests out of order, even though 133262306a36Sopenharmony_ci * they are running on independent engines. 133362306a36Sopenharmony_ci */ 133462306a36Sopenharmony_ci 133562306a36Sopenharmony_ci request = kcalloc(nengines, sizeof(*request), GFP_KERNEL); 133662306a36Sopenharmony_ci if (!request) 133762306a36Sopenharmony_ci return -ENOMEM; 133862306a36Sopenharmony_ci 133962306a36Sopenharmony_ci err = igt_live_test_begin(&t, i915, __func__, ""); 134062306a36Sopenharmony_ci if (err) 134162306a36Sopenharmony_ci goto out_free; 134262306a36Sopenharmony_ci 134362306a36Sopenharmony_ci idx = 0; 134462306a36Sopenharmony_ci for_each_uabi_engine(engine, i915) { 134562306a36Sopenharmony_ci struct i915_vma *batch; 134662306a36Sopenharmony_ci 134762306a36Sopenharmony_ci batch = recursive_batch(engine->gt); 134862306a36Sopenharmony_ci if (IS_ERR(batch)) { 134962306a36Sopenharmony_ci err = PTR_ERR(batch); 135062306a36Sopenharmony_ci pr_err("%s: Unable to create batch for %s, err=%d\n", 135162306a36Sopenharmony_ci __func__, engine->name, err); 135262306a36Sopenharmony_ci goto out_free; 135362306a36Sopenharmony_ci } 135462306a36Sopenharmony_ci 135562306a36Sopenharmony_ci i915_vma_lock(batch); 135662306a36Sopenharmony_ci request[idx] = intel_engine_create_kernel_request(engine); 135762306a36Sopenharmony_ci if (IS_ERR(request[idx])) { 135862306a36Sopenharmony_ci err = PTR_ERR(request[idx]); 135962306a36Sopenharmony_ci pr_err("%s: Request allocation failed for %s with err=%d\n", 136062306a36Sopenharmony_ci __func__, engine->name, err); 136162306a36Sopenharmony_ci goto out_unlock; 136262306a36Sopenharmony_ci } 136362306a36Sopenharmony_ci GEM_BUG_ON(request[idx]->context->vm != batch->vm); 136462306a36Sopenharmony_ci 136562306a36Sopenharmony_ci if (prev) { 136662306a36Sopenharmony_ci err = i915_request_await_dma_fence(request[idx], 136762306a36Sopenharmony_ci &prev->fence); 136862306a36Sopenharmony_ci if (err) { 136962306a36Sopenharmony_ci i915_request_add(request[idx]); 137062306a36Sopenharmony_ci pr_err("%s: Request await failed for %s with err=%d\n", 137162306a36Sopenharmony_ci __func__, engine->name, err); 137262306a36Sopenharmony_ci goto out_unlock; 137362306a36Sopenharmony_ci } 137462306a36Sopenharmony_ci } 137562306a36Sopenharmony_ci 137662306a36Sopenharmony_ci err = i915_vma_move_to_active(batch, request[idx], 0); 137762306a36Sopenharmony_ci GEM_BUG_ON(err); 137862306a36Sopenharmony_ci 137962306a36Sopenharmony_ci err = emit_bb_start(request[idx], batch); 138062306a36Sopenharmony_ci GEM_BUG_ON(err); 138162306a36Sopenharmony_ci request[idx]->batch = batch; 138262306a36Sopenharmony_ci 138362306a36Sopenharmony_ci i915_request_get(request[idx]); 138462306a36Sopenharmony_ci i915_request_add(request[idx]); 138562306a36Sopenharmony_ci 138662306a36Sopenharmony_ci prev = request[idx]; 138762306a36Sopenharmony_ci idx++; 138862306a36Sopenharmony_ci 138962306a36Sopenharmony_ciout_unlock: 139062306a36Sopenharmony_ci i915_vma_unlock(batch); 139162306a36Sopenharmony_ci if (err) 139262306a36Sopenharmony_ci goto out_request; 139362306a36Sopenharmony_ci } 139462306a36Sopenharmony_ci 139562306a36Sopenharmony_ci idx = 0; 139662306a36Sopenharmony_ci for_each_uabi_engine(engine, i915) { 139762306a36Sopenharmony_ci long timeout; 139862306a36Sopenharmony_ci 139962306a36Sopenharmony_ci if (i915_request_completed(request[idx])) { 140062306a36Sopenharmony_ci pr_err("%s(%s): request completed too early!\n", 140162306a36Sopenharmony_ci __func__, engine->name); 140262306a36Sopenharmony_ci err = -EINVAL; 140362306a36Sopenharmony_ci goto out_request; 140462306a36Sopenharmony_ci } 140562306a36Sopenharmony_ci 140662306a36Sopenharmony_ci err = recursive_batch_resolve(request[idx]->batch); 140762306a36Sopenharmony_ci if (err) { 140862306a36Sopenharmony_ci pr_err("%s: failed to resolve batch, err=%d\n", 140962306a36Sopenharmony_ci __func__, err); 141062306a36Sopenharmony_ci goto out_request; 141162306a36Sopenharmony_ci } 141262306a36Sopenharmony_ci 141362306a36Sopenharmony_ci timeout = i915_request_wait(request[idx], 0, 141462306a36Sopenharmony_ci MAX_SCHEDULE_TIMEOUT); 141562306a36Sopenharmony_ci if (timeout < 0) { 141662306a36Sopenharmony_ci err = timeout; 141762306a36Sopenharmony_ci pr_err("%s: error waiting for request on %s, err=%d\n", 141862306a36Sopenharmony_ci __func__, engine->name, err); 141962306a36Sopenharmony_ci goto out_request; 142062306a36Sopenharmony_ci } 142162306a36Sopenharmony_ci 142262306a36Sopenharmony_ci GEM_BUG_ON(!i915_request_completed(request[idx])); 142362306a36Sopenharmony_ci idx++; 142462306a36Sopenharmony_ci } 142562306a36Sopenharmony_ci 142662306a36Sopenharmony_ci err = igt_live_test_end(&t); 142762306a36Sopenharmony_ci 142862306a36Sopenharmony_ciout_request: 142962306a36Sopenharmony_ci idx = 0; 143062306a36Sopenharmony_ci for_each_uabi_engine(engine, i915) { 143162306a36Sopenharmony_ci u32 *cmd; 143262306a36Sopenharmony_ci 143362306a36Sopenharmony_ci if (!request[idx]) 143462306a36Sopenharmony_ci break; 143562306a36Sopenharmony_ci 143662306a36Sopenharmony_ci cmd = i915_gem_object_pin_map_unlocked(request[idx]->batch->obj, 143762306a36Sopenharmony_ci I915_MAP_WC); 143862306a36Sopenharmony_ci if (!IS_ERR(cmd)) { 143962306a36Sopenharmony_ci *cmd = MI_BATCH_BUFFER_END; 144062306a36Sopenharmony_ci 144162306a36Sopenharmony_ci __i915_gem_object_flush_map(request[idx]->batch->obj, 144262306a36Sopenharmony_ci 0, sizeof(*cmd)); 144362306a36Sopenharmony_ci i915_gem_object_unpin_map(request[idx]->batch->obj); 144462306a36Sopenharmony_ci 144562306a36Sopenharmony_ci intel_gt_chipset_flush(engine->gt); 144662306a36Sopenharmony_ci } 144762306a36Sopenharmony_ci 144862306a36Sopenharmony_ci i915_vma_put(request[idx]->batch); 144962306a36Sopenharmony_ci i915_request_put(request[idx]); 145062306a36Sopenharmony_ci idx++; 145162306a36Sopenharmony_ci } 145262306a36Sopenharmony_ciout_free: 145362306a36Sopenharmony_ci kfree(request); 145462306a36Sopenharmony_ci return err; 145562306a36Sopenharmony_ci} 145662306a36Sopenharmony_ci 145762306a36Sopenharmony_cistruct parallel_thread { 145862306a36Sopenharmony_ci struct kthread_worker *worker; 145962306a36Sopenharmony_ci struct kthread_work work; 146062306a36Sopenharmony_ci struct intel_engine_cs *engine; 146162306a36Sopenharmony_ci int result; 146262306a36Sopenharmony_ci}; 146362306a36Sopenharmony_ci 146462306a36Sopenharmony_cistatic void __live_parallel_engine1(struct kthread_work *work) 146562306a36Sopenharmony_ci{ 146662306a36Sopenharmony_ci struct parallel_thread *thread = 146762306a36Sopenharmony_ci container_of(work, typeof(*thread), work); 146862306a36Sopenharmony_ci struct intel_engine_cs *engine = thread->engine; 146962306a36Sopenharmony_ci IGT_TIMEOUT(end_time); 147062306a36Sopenharmony_ci unsigned long count; 147162306a36Sopenharmony_ci int err = 0; 147262306a36Sopenharmony_ci 147362306a36Sopenharmony_ci count = 0; 147462306a36Sopenharmony_ci intel_engine_pm_get(engine); 147562306a36Sopenharmony_ci do { 147662306a36Sopenharmony_ci struct i915_request *rq; 147762306a36Sopenharmony_ci 147862306a36Sopenharmony_ci rq = i915_request_create(engine->kernel_context); 147962306a36Sopenharmony_ci if (IS_ERR(rq)) { 148062306a36Sopenharmony_ci err = PTR_ERR(rq); 148162306a36Sopenharmony_ci break; 148262306a36Sopenharmony_ci } 148362306a36Sopenharmony_ci 148462306a36Sopenharmony_ci i915_request_get(rq); 148562306a36Sopenharmony_ci i915_request_add(rq); 148662306a36Sopenharmony_ci 148762306a36Sopenharmony_ci err = 0; 148862306a36Sopenharmony_ci if (i915_request_wait(rq, 0, HZ) < 0) 148962306a36Sopenharmony_ci err = -ETIME; 149062306a36Sopenharmony_ci i915_request_put(rq); 149162306a36Sopenharmony_ci if (err) 149262306a36Sopenharmony_ci break; 149362306a36Sopenharmony_ci 149462306a36Sopenharmony_ci count++; 149562306a36Sopenharmony_ci } while (!__igt_timeout(end_time, NULL)); 149662306a36Sopenharmony_ci intel_engine_pm_put(engine); 149762306a36Sopenharmony_ci 149862306a36Sopenharmony_ci pr_info("%s: %lu request + sync\n", engine->name, count); 149962306a36Sopenharmony_ci thread->result = err; 150062306a36Sopenharmony_ci} 150162306a36Sopenharmony_ci 150262306a36Sopenharmony_cistatic void __live_parallel_engineN(struct kthread_work *work) 150362306a36Sopenharmony_ci{ 150462306a36Sopenharmony_ci struct parallel_thread *thread = 150562306a36Sopenharmony_ci container_of(work, typeof(*thread), work); 150662306a36Sopenharmony_ci struct intel_engine_cs *engine = thread->engine; 150762306a36Sopenharmony_ci IGT_TIMEOUT(end_time); 150862306a36Sopenharmony_ci unsigned long count; 150962306a36Sopenharmony_ci int err = 0; 151062306a36Sopenharmony_ci 151162306a36Sopenharmony_ci count = 0; 151262306a36Sopenharmony_ci intel_engine_pm_get(engine); 151362306a36Sopenharmony_ci do { 151462306a36Sopenharmony_ci struct i915_request *rq; 151562306a36Sopenharmony_ci 151662306a36Sopenharmony_ci rq = i915_request_create(engine->kernel_context); 151762306a36Sopenharmony_ci if (IS_ERR(rq)) { 151862306a36Sopenharmony_ci err = PTR_ERR(rq); 151962306a36Sopenharmony_ci break; 152062306a36Sopenharmony_ci } 152162306a36Sopenharmony_ci 152262306a36Sopenharmony_ci i915_request_add(rq); 152362306a36Sopenharmony_ci count++; 152462306a36Sopenharmony_ci } while (!__igt_timeout(end_time, NULL)); 152562306a36Sopenharmony_ci intel_engine_pm_put(engine); 152662306a36Sopenharmony_ci 152762306a36Sopenharmony_ci pr_info("%s: %lu requests\n", engine->name, count); 152862306a36Sopenharmony_ci thread->result = err; 152962306a36Sopenharmony_ci} 153062306a36Sopenharmony_ci 153162306a36Sopenharmony_cistatic bool wake_all(struct drm_i915_private *i915) 153262306a36Sopenharmony_ci{ 153362306a36Sopenharmony_ci if (atomic_dec_and_test(&i915->selftest.counter)) { 153462306a36Sopenharmony_ci wake_up_var(&i915->selftest.counter); 153562306a36Sopenharmony_ci return true; 153662306a36Sopenharmony_ci } 153762306a36Sopenharmony_ci 153862306a36Sopenharmony_ci return false; 153962306a36Sopenharmony_ci} 154062306a36Sopenharmony_ci 154162306a36Sopenharmony_cistatic int wait_for_all(struct drm_i915_private *i915) 154262306a36Sopenharmony_ci{ 154362306a36Sopenharmony_ci if (wake_all(i915)) 154462306a36Sopenharmony_ci return 0; 154562306a36Sopenharmony_ci 154662306a36Sopenharmony_ci if (wait_var_event_timeout(&i915->selftest.counter, 154762306a36Sopenharmony_ci !atomic_read(&i915->selftest.counter), 154862306a36Sopenharmony_ci i915_selftest.timeout_jiffies)) 154962306a36Sopenharmony_ci return 0; 155062306a36Sopenharmony_ci 155162306a36Sopenharmony_ci return -ETIME; 155262306a36Sopenharmony_ci} 155362306a36Sopenharmony_ci 155462306a36Sopenharmony_cistatic void __live_parallel_spin(struct kthread_work *work) 155562306a36Sopenharmony_ci{ 155662306a36Sopenharmony_ci struct parallel_thread *thread = 155762306a36Sopenharmony_ci container_of(work, typeof(*thread), work); 155862306a36Sopenharmony_ci struct intel_engine_cs *engine = thread->engine; 155962306a36Sopenharmony_ci struct igt_spinner spin; 156062306a36Sopenharmony_ci struct i915_request *rq; 156162306a36Sopenharmony_ci int err = 0; 156262306a36Sopenharmony_ci 156362306a36Sopenharmony_ci /* 156462306a36Sopenharmony_ci * Create a spinner running for eternity on each engine. If a second 156562306a36Sopenharmony_ci * spinner is incorrectly placed on the same engine, it will not be 156662306a36Sopenharmony_ci * able to start in time. 156762306a36Sopenharmony_ci */ 156862306a36Sopenharmony_ci 156962306a36Sopenharmony_ci if (igt_spinner_init(&spin, engine->gt)) { 157062306a36Sopenharmony_ci wake_all(engine->i915); 157162306a36Sopenharmony_ci thread->result = -ENOMEM; 157262306a36Sopenharmony_ci return; 157362306a36Sopenharmony_ci } 157462306a36Sopenharmony_ci 157562306a36Sopenharmony_ci intel_engine_pm_get(engine); 157662306a36Sopenharmony_ci rq = igt_spinner_create_request(&spin, 157762306a36Sopenharmony_ci engine->kernel_context, 157862306a36Sopenharmony_ci MI_NOOP); /* no preemption */ 157962306a36Sopenharmony_ci intel_engine_pm_put(engine); 158062306a36Sopenharmony_ci if (IS_ERR(rq)) { 158162306a36Sopenharmony_ci err = PTR_ERR(rq); 158262306a36Sopenharmony_ci if (err == -ENODEV) 158362306a36Sopenharmony_ci err = 0; 158462306a36Sopenharmony_ci wake_all(engine->i915); 158562306a36Sopenharmony_ci goto out_spin; 158662306a36Sopenharmony_ci } 158762306a36Sopenharmony_ci 158862306a36Sopenharmony_ci i915_request_get(rq); 158962306a36Sopenharmony_ci i915_request_add(rq); 159062306a36Sopenharmony_ci if (igt_wait_for_spinner(&spin, rq)) { 159162306a36Sopenharmony_ci /* Occupy this engine for the whole test */ 159262306a36Sopenharmony_ci err = wait_for_all(engine->i915); 159362306a36Sopenharmony_ci } else { 159462306a36Sopenharmony_ci pr_err("Failed to start spinner on %s\n", engine->name); 159562306a36Sopenharmony_ci err = -EINVAL; 159662306a36Sopenharmony_ci } 159762306a36Sopenharmony_ci igt_spinner_end(&spin); 159862306a36Sopenharmony_ci 159962306a36Sopenharmony_ci if (err == 0 && i915_request_wait(rq, 0, HZ) < 0) 160062306a36Sopenharmony_ci err = -EIO; 160162306a36Sopenharmony_ci i915_request_put(rq); 160262306a36Sopenharmony_ci 160362306a36Sopenharmony_ciout_spin: 160462306a36Sopenharmony_ci igt_spinner_fini(&spin); 160562306a36Sopenharmony_ci thread->result = err; 160662306a36Sopenharmony_ci} 160762306a36Sopenharmony_ci 160862306a36Sopenharmony_cistatic int live_parallel_engines(void *arg) 160962306a36Sopenharmony_ci{ 161062306a36Sopenharmony_ci struct drm_i915_private *i915 = arg; 161162306a36Sopenharmony_ci static void (* const func[])(struct kthread_work *) = { 161262306a36Sopenharmony_ci __live_parallel_engine1, 161362306a36Sopenharmony_ci __live_parallel_engineN, 161462306a36Sopenharmony_ci __live_parallel_spin, 161562306a36Sopenharmony_ci NULL, 161662306a36Sopenharmony_ci }; 161762306a36Sopenharmony_ci const unsigned int nengines = num_uabi_engines(i915); 161862306a36Sopenharmony_ci struct parallel_thread *threads; 161962306a36Sopenharmony_ci struct intel_engine_cs *engine; 162062306a36Sopenharmony_ci void (* const *fn)(struct kthread_work *); 162162306a36Sopenharmony_ci int err = 0; 162262306a36Sopenharmony_ci 162362306a36Sopenharmony_ci /* 162462306a36Sopenharmony_ci * Check we can submit requests to all engines concurrently. This 162562306a36Sopenharmony_ci * tests that we load up the system maximally. 162662306a36Sopenharmony_ci */ 162762306a36Sopenharmony_ci 162862306a36Sopenharmony_ci threads = kcalloc(nengines, sizeof(*threads), GFP_KERNEL); 162962306a36Sopenharmony_ci if (!threads) 163062306a36Sopenharmony_ci return -ENOMEM; 163162306a36Sopenharmony_ci 163262306a36Sopenharmony_ci for (fn = func; !err && *fn; fn++) { 163362306a36Sopenharmony_ci char name[KSYM_NAME_LEN]; 163462306a36Sopenharmony_ci struct igt_live_test t; 163562306a36Sopenharmony_ci unsigned int idx; 163662306a36Sopenharmony_ci 163762306a36Sopenharmony_ci snprintf(name, sizeof(name), "%ps", *fn); 163862306a36Sopenharmony_ci err = igt_live_test_begin(&t, i915, __func__, name); 163962306a36Sopenharmony_ci if (err) 164062306a36Sopenharmony_ci break; 164162306a36Sopenharmony_ci 164262306a36Sopenharmony_ci atomic_set(&i915->selftest.counter, nengines); 164362306a36Sopenharmony_ci 164462306a36Sopenharmony_ci idx = 0; 164562306a36Sopenharmony_ci for_each_uabi_engine(engine, i915) { 164662306a36Sopenharmony_ci struct kthread_worker *worker; 164762306a36Sopenharmony_ci 164862306a36Sopenharmony_ci worker = kthread_create_worker(0, "igt/parallel:%s", 164962306a36Sopenharmony_ci engine->name); 165062306a36Sopenharmony_ci if (IS_ERR(worker)) { 165162306a36Sopenharmony_ci err = PTR_ERR(worker); 165262306a36Sopenharmony_ci break; 165362306a36Sopenharmony_ci } 165462306a36Sopenharmony_ci 165562306a36Sopenharmony_ci threads[idx].worker = worker; 165662306a36Sopenharmony_ci threads[idx].result = 0; 165762306a36Sopenharmony_ci threads[idx].engine = engine; 165862306a36Sopenharmony_ci 165962306a36Sopenharmony_ci kthread_init_work(&threads[idx].work, *fn); 166062306a36Sopenharmony_ci kthread_queue_work(worker, &threads[idx].work); 166162306a36Sopenharmony_ci idx++; 166262306a36Sopenharmony_ci } 166362306a36Sopenharmony_ci 166462306a36Sopenharmony_ci idx = 0; 166562306a36Sopenharmony_ci for_each_uabi_engine(engine, i915) { 166662306a36Sopenharmony_ci int status; 166762306a36Sopenharmony_ci 166862306a36Sopenharmony_ci if (!threads[idx].worker) 166962306a36Sopenharmony_ci break; 167062306a36Sopenharmony_ci 167162306a36Sopenharmony_ci kthread_flush_work(&threads[idx].work); 167262306a36Sopenharmony_ci status = READ_ONCE(threads[idx].result); 167362306a36Sopenharmony_ci if (status && !err) 167462306a36Sopenharmony_ci err = status; 167562306a36Sopenharmony_ci 167662306a36Sopenharmony_ci kthread_destroy_worker(threads[idx++].worker); 167762306a36Sopenharmony_ci } 167862306a36Sopenharmony_ci 167962306a36Sopenharmony_ci if (igt_live_test_end(&t)) 168062306a36Sopenharmony_ci err = -EIO; 168162306a36Sopenharmony_ci } 168262306a36Sopenharmony_ci 168362306a36Sopenharmony_ci kfree(threads); 168462306a36Sopenharmony_ci return err; 168562306a36Sopenharmony_ci} 168662306a36Sopenharmony_ci 168762306a36Sopenharmony_cistatic int 168862306a36Sopenharmony_cimax_batches(struct i915_gem_context *ctx, struct intel_engine_cs *engine) 168962306a36Sopenharmony_ci{ 169062306a36Sopenharmony_ci struct i915_request *rq; 169162306a36Sopenharmony_ci int ret; 169262306a36Sopenharmony_ci 169362306a36Sopenharmony_ci /* 169462306a36Sopenharmony_ci * Before execlists, all contexts share the same ringbuffer. With 169562306a36Sopenharmony_ci * execlists, each context/engine has a separate ringbuffer and 169662306a36Sopenharmony_ci * for the purposes of this test, inexhaustible. 169762306a36Sopenharmony_ci * 169862306a36Sopenharmony_ci * For the global ringbuffer though, we have to be very careful 169962306a36Sopenharmony_ci * that we do not wrap while preventing the execution of requests 170062306a36Sopenharmony_ci * with a unsignaled fence. 170162306a36Sopenharmony_ci */ 170262306a36Sopenharmony_ci if (HAS_EXECLISTS(ctx->i915)) 170362306a36Sopenharmony_ci return INT_MAX; 170462306a36Sopenharmony_ci 170562306a36Sopenharmony_ci rq = igt_request_alloc(ctx, engine); 170662306a36Sopenharmony_ci if (IS_ERR(rq)) { 170762306a36Sopenharmony_ci ret = PTR_ERR(rq); 170862306a36Sopenharmony_ci } else { 170962306a36Sopenharmony_ci int sz; 171062306a36Sopenharmony_ci 171162306a36Sopenharmony_ci ret = rq->ring->size - rq->reserved_space; 171262306a36Sopenharmony_ci i915_request_add(rq); 171362306a36Sopenharmony_ci 171462306a36Sopenharmony_ci sz = rq->ring->emit - rq->head; 171562306a36Sopenharmony_ci if (sz < 0) 171662306a36Sopenharmony_ci sz += rq->ring->size; 171762306a36Sopenharmony_ci ret /= sz; 171862306a36Sopenharmony_ci ret /= 2; /* leave half spare, in case of emergency! */ 171962306a36Sopenharmony_ci } 172062306a36Sopenharmony_ci 172162306a36Sopenharmony_ci return ret; 172262306a36Sopenharmony_ci} 172362306a36Sopenharmony_ci 172462306a36Sopenharmony_cistatic int live_breadcrumbs_smoketest(void *arg) 172562306a36Sopenharmony_ci{ 172662306a36Sopenharmony_ci struct drm_i915_private *i915 = arg; 172762306a36Sopenharmony_ci const unsigned int nengines = num_uabi_engines(i915); 172862306a36Sopenharmony_ci const unsigned int ncpus = /* saturate with nengines * ncpus */ 172962306a36Sopenharmony_ci max_t(int, 2, DIV_ROUND_UP(num_online_cpus(), nengines)); 173062306a36Sopenharmony_ci unsigned long num_waits, num_fences; 173162306a36Sopenharmony_ci struct intel_engine_cs *engine; 173262306a36Sopenharmony_ci struct smoke_thread *threads; 173362306a36Sopenharmony_ci struct igt_live_test live; 173462306a36Sopenharmony_ci intel_wakeref_t wakeref; 173562306a36Sopenharmony_ci struct smoketest *smoke; 173662306a36Sopenharmony_ci unsigned int n, idx; 173762306a36Sopenharmony_ci struct file *file; 173862306a36Sopenharmony_ci int ret = 0; 173962306a36Sopenharmony_ci 174062306a36Sopenharmony_ci /* 174162306a36Sopenharmony_ci * Smoketest our breadcrumb/signal handling for requests across multiple 174262306a36Sopenharmony_ci * threads. A very simple test to only catch the most egregious of bugs. 174362306a36Sopenharmony_ci * See __igt_breadcrumbs_smoketest(); 174462306a36Sopenharmony_ci * 174562306a36Sopenharmony_ci * On real hardware this time. 174662306a36Sopenharmony_ci */ 174762306a36Sopenharmony_ci 174862306a36Sopenharmony_ci wakeref = intel_runtime_pm_get(&i915->runtime_pm); 174962306a36Sopenharmony_ci 175062306a36Sopenharmony_ci file = mock_file(i915); 175162306a36Sopenharmony_ci if (IS_ERR(file)) { 175262306a36Sopenharmony_ci ret = PTR_ERR(file); 175362306a36Sopenharmony_ci goto out_rpm; 175462306a36Sopenharmony_ci } 175562306a36Sopenharmony_ci 175662306a36Sopenharmony_ci smoke = kcalloc(nengines, sizeof(*smoke), GFP_KERNEL); 175762306a36Sopenharmony_ci if (!smoke) { 175862306a36Sopenharmony_ci ret = -ENOMEM; 175962306a36Sopenharmony_ci goto out_file; 176062306a36Sopenharmony_ci } 176162306a36Sopenharmony_ci 176262306a36Sopenharmony_ci threads = kcalloc(ncpus * nengines, sizeof(*threads), GFP_KERNEL); 176362306a36Sopenharmony_ci if (!threads) { 176462306a36Sopenharmony_ci ret = -ENOMEM; 176562306a36Sopenharmony_ci goto out_smoke; 176662306a36Sopenharmony_ci } 176762306a36Sopenharmony_ci 176862306a36Sopenharmony_ci smoke[0].request_alloc = __live_request_alloc; 176962306a36Sopenharmony_ci smoke[0].ncontexts = 64; 177062306a36Sopenharmony_ci smoke[0].contexts = kcalloc(smoke[0].ncontexts, 177162306a36Sopenharmony_ci sizeof(*smoke[0].contexts), 177262306a36Sopenharmony_ci GFP_KERNEL); 177362306a36Sopenharmony_ci if (!smoke[0].contexts) { 177462306a36Sopenharmony_ci ret = -ENOMEM; 177562306a36Sopenharmony_ci goto out_threads; 177662306a36Sopenharmony_ci } 177762306a36Sopenharmony_ci 177862306a36Sopenharmony_ci for (n = 0; n < smoke[0].ncontexts; n++) { 177962306a36Sopenharmony_ci smoke[0].contexts[n] = live_context(i915, file); 178062306a36Sopenharmony_ci if (IS_ERR(smoke[0].contexts[n])) { 178162306a36Sopenharmony_ci ret = PTR_ERR(smoke[0].contexts[n]); 178262306a36Sopenharmony_ci goto out_contexts; 178362306a36Sopenharmony_ci } 178462306a36Sopenharmony_ci } 178562306a36Sopenharmony_ci 178662306a36Sopenharmony_ci ret = igt_live_test_begin(&live, i915, __func__, ""); 178762306a36Sopenharmony_ci if (ret) 178862306a36Sopenharmony_ci goto out_contexts; 178962306a36Sopenharmony_ci 179062306a36Sopenharmony_ci idx = 0; 179162306a36Sopenharmony_ci for_each_uabi_engine(engine, i915) { 179262306a36Sopenharmony_ci smoke[idx] = smoke[0]; 179362306a36Sopenharmony_ci smoke[idx].engine = engine; 179462306a36Sopenharmony_ci smoke[idx].max_batch = 179562306a36Sopenharmony_ci max_batches(smoke[0].contexts[0], engine); 179662306a36Sopenharmony_ci if (smoke[idx].max_batch < 0) { 179762306a36Sopenharmony_ci ret = smoke[idx].max_batch; 179862306a36Sopenharmony_ci goto out_flush; 179962306a36Sopenharmony_ci } 180062306a36Sopenharmony_ci /* One ring interleaved between requests from all cpus */ 180162306a36Sopenharmony_ci smoke[idx].max_batch /= ncpus + 1; 180262306a36Sopenharmony_ci pr_debug("Limiting batches to %d requests on %s\n", 180362306a36Sopenharmony_ci smoke[idx].max_batch, engine->name); 180462306a36Sopenharmony_ci 180562306a36Sopenharmony_ci for (n = 0; n < ncpus; n++) { 180662306a36Sopenharmony_ci unsigned int i = idx * ncpus + n; 180762306a36Sopenharmony_ci struct kthread_worker *worker; 180862306a36Sopenharmony_ci 180962306a36Sopenharmony_ci worker = kthread_create_worker(0, "igt/%d.%d", idx, n); 181062306a36Sopenharmony_ci if (IS_ERR(worker)) { 181162306a36Sopenharmony_ci ret = PTR_ERR(worker); 181262306a36Sopenharmony_ci goto out_flush; 181362306a36Sopenharmony_ci } 181462306a36Sopenharmony_ci 181562306a36Sopenharmony_ci threads[i].worker = worker; 181662306a36Sopenharmony_ci threads[i].t = &smoke[idx]; 181762306a36Sopenharmony_ci 181862306a36Sopenharmony_ci kthread_init_work(&threads[i].work, 181962306a36Sopenharmony_ci __igt_breadcrumbs_smoketest); 182062306a36Sopenharmony_ci kthread_queue_work(worker, &threads[i].work); 182162306a36Sopenharmony_ci } 182262306a36Sopenharmony_ci 182362306a36Sopenharmony_ci idx++; 182462306a36Sopenharmony_ci } 182562306a36Sopenharmony_ci 182662306a36Sopenharmony_ci msleep(jiffies_to_msecs(i915_selftest.timeout_jiffies)); 182762306a36Sopenharmony_ci 182862306a36Sopenharmony_ciout_flush: 182962306a36Sopenharmony_ci idx = 0; 183062306a36Sopenharmony_ci num_waits = 0; 183162306a36Sopenharmony_ci num_fences = 0; 183262306a36Sopenharmony_ci for_each_uabi_engine(engine, i915) { 183362306a36Sopenharmony_ci for (n = 0; n < ncpus; n++) { 183462306a36Sopenharmony_ci unsigned int i = idx * ncpus + n; 183562306a36Sopenharmony_ci int err; 183662306a36Sopenharmony_ci 183762306a36Sopenharmony_ci if (!threads[i].worker) 183862306a36Sopenharmony_ci continue; 183962306a36Sopenharmony_ci 184062306a36Sopenharmony_ci WRITE_ONCE(threads[i].stop, true); 184162306a36Sopenharmony_ci kthread_flush_work(&threads[i].work); 184262306a36Sopenharmony_ci err = READ_ONCE(threads[i].result); 184362306a36Sopenharmony_ci if (err < 0 && !ret) 184462306a36Sopenharmony_ci ret = err; 184562306a36Sopenharmony_ci 184662306a36Sopenharmony_ci kthread_destroy_worker(threads[i].worker); 184762306a36Sopenharmony_ci } 184862306a36Sopenharmony_ci 184962306a36Sopenharmony_ci num_waits += atomic_long_read(&smoke[idx].num_waits); 185062306a36Sopenharmony_ci num_fences += atomic_long_read(&smoke[idx].num_fences); 185162306a36Sopenharmony_ci idx++; 185262306a36Sopenharmony_ci } 185362306a36Sopenharmony_ci pr_info("Completed %lu waits for %lu fences across %d engines and %d cpus\n", 185462306a36Sopenharmony_ci num_waits, num_fences, idx, ncpus); 185562306a36Sopenharmony_ci 185662306a36Sopenharmony_ci ret = igt_live_test_end(&live) ?: ret; 185762306a36Sopenharmony_ciout_contexts: 185862306a36Sopenharmony_ci kfree(smoke[0].contexts); 185962306a36Sopenharmony_ciout_threads: 186062306a36Sopenharmony_ci kfree(threads); 186162306a36Sopenharmony_ciout_smoke: 186262306a36Sopenharmony_ci kfree(smoke); 186362306a36Sopenharmony_ciout_file: 186462306a36Sopenharmony_ci fput(file); 186562306a36Sopenharmony_ciout_rpm: 186662306a36Sopenharmony_ci intel_runtime_pm_put(&i915->runtime_pm, wakeref); 186762306a36Sopenharmony_ci 186862306a36Sopenharmony_ci return ret; 186962306a36Sopenharmony_ci} 187062306a36Sopenharmony_ci 187162306a36Sopenharmony_ciint i915_request_live_selftests(struct drm_i915_private *i915) 187262306a36Sopenharmony_ci{ 187362306a36Sopenharmony_ci static const struct i915_subtest tests[] = { 187462306a36Sopenharmony_ci SUBTEST(live_nop_request), 187562306a36Sopenharmony_ci SUBTEST(live_all_engines), 187662306a36Sopenharmony_ci SUBTEST(live_sequential_engines), 187762306a36Sopenharmony_ci SUBTEST(live_parallel_engines), 187862306a36Sopenharmony_ci SUBTEST(live_empty_request), 187962306a36Sopenharmony_ci SUBTEST(live_cancel_request), 188062306a36Sopenharmony_ci SUBTEST(live_breadcrumbs_smoketest), 188162306a36Sopenharmony_ci }; 188262306a36Sopenharmony_ci 188362306a36Sopenharmony_ci if (intel_gt_is_wedged(to_gt(i915))) 188462306a36Sopenharmony_ci return 0; 188562306a36Sopenharmony_ci 188662306a36Sopenharmony_ci return i915_live_subtests(tests, i915); 188762306a36Sopenharmony_ci} 188862306a36Sopenharmony_ci 188962306a36Sopenharmony_cistatic int switch_to_kernel_sync(struct intel_context *ce, int err) 189062306a36Sopenharmony_ci{ 189162306a36Sopenharmony_ci struct i915_request *rq; 189262306a36Sopenharmony_ci struct dma_fence *fence; 189362306a36Sopenharmony_ci 189462306a36Sopenharmony_ci rq = intel_engine_create_kernel_request(ce->engine); 189562306a36Sopenharmony_ci if (IS_ERR(rq)) 189662306a36Sopenharmony_ci return PTR_ERR(rq); 189762306a36Sopenharmony_ci 189862306a36Sopenharmony_ci fence = i915_active_fence_get(&ce->timeline->last_request); 189962306a36Sopenharmony_ci if (fence) { 190062306a36Sopenharmony_ci i915_request_await_dma_fence(rq, fence); 190162306a36Sopenharmony_ci dma_fence_put(fence); 190262306a36Sopenharmony_ci } 190362306a36Sopenharmony_ci 190462306a36Sopenharmony_ci rq = i915_request_get(rq); 190562306a36Sopenharmony_ci i915_request_add(rq); 190662306a36Sopenharmony_ci if (i915_request_wait(rq, 0, HZ / 2) < 0 && !err) 190762306a36Sopenharmony_ci err = -ETIME; 190862306a36Sopenharmony_ci i915_request_put(rq); 190962306a36Sopenharmony_ci 191062306a36Sopenharmony_ci while (!err && !intel_engine_is_idle(ce->engine)) 191162306a36Sopenharmony_ci intel_engine_flush_submission(ce->engine); 191262306a36Sopenharmony_ci 191362306a36Sopenharmony_ci return err; 191462306a36Sopenharmony_ci} 191562306a36Sopenharmony_ci 191662306a36Sopenharmony_cistruct perf_stats { 191762306a36Sopenharmony_ci struct intel_engine_cs *engine; 191862306a36Sopenharmony_ci unsigned long count; 191962306a36Sopenharmony_ci ktime_t time; 192062306a36Sopenharmony_ci ktime_t busy; 192162306a36Sopenharmony_ci u64 runtime; 192262306a36Sopenharmony_ci}; 192362306a36Sopenharmony_ci 192462306a36Sopenharmony_cistruct perf_series { 192562306a36Sopenharmony_ci struct drm_i915_private *i915; 192662306a36Sopenharmony_ci unsigned int nengines; 192762306a36Sopenharmony_ci struct intel_context *ce[]; 192862306a36Sopenharmony_ci}; 192962306a36Sopenharmony_ci 193062306a36Sopenharmony_cistatic int cmp_u32(const void *A, const void *B) 193162306a36Sopenharmony_ci{ 193262306a36Sopenharmony_ci const u32 *a = A, *b = B; 193362306a36Sopenharmony_ci 193462306a36Sopenharmony_ci return *a - *b; 193562306a36Sopenharmony_ci} 193662306a36Sopenharmony_ci 193762306a36Sopenharmony_cistatic u32 trifilter(u32 *a) 193862306a36Sopenharmony_ci{ 193962306a36Sopenharmony_ci u64 sum; 194062306a36Sopenharmony_ci 194162306a36Sopenharmony_ci#define TF_COUNT 5 194262306a36Sopenharmony_ci sort(a, TF_COUNT, sizeof(*a), cmp_u32, NULL); 194362306a36Sopenharmony_ci 194462306a36Sopenharmony_ci sum = mul_u32_u32(a[2], 2); 194562306a36Sopenharmony_ci sum += a[1]; 194662306a36Sopenharmony_ci sum += a[3]; 194762306a36Sopenharmony_ci 194862306a36Sopenharmony_ci GEM_BUG_ON(sum > U32_MAX); 194962306a36Sopenharmony_ci return sum; 195062306a36Sopenharmony_ci#define TF_BIAS 2 195162306a36Sopenharmony_ci} 195262306a36Sopenharmony_ci 195362306a36Sopenharmony_cistatic u64 cycles_to_ns(struct intel_engine_cs *engine, u32 cycles) 195462306a36Sopenharmony_ci{ 195562306a36Sopenharmony_ci u64 ns = intel_gt_clock_interval_to_ns(engine->gt, cycles); 195662306a36Sopenharmony_ci 195762306a36Sopenharmony_ci return DIV_ROUND_CLOSEST(ns, 1 << TF_BIAS); 195862306a36Sopenharmony_ci} 195962306a36Sopenharmony_ci 196062306a36Sopenharmony_cistatic u32 *emit_timestamp_store(u32 *cs, struct intel_context *ce, u32 offset) 196162306a36Sopenharmony_ci{ 196262306a36Sopenharmony_ci *cs++ = MI_STORE_REGISTER_MEM_GEN8 | MI_USE_GGTT; 196362306a36Sopenharmony_ci *cs++ = i915_mmio_reg_offset(RING_TIMESTAMP((ce->engine->mmio_base))); 196462306a36Sopenharmony_ci *cs++ = offset; 196562306a36Sopenharmony_ci *cs++ = 0; 196662306a36Sopenharmony_ci 196762306a36Sopenharmony_ci return cs; 196862306a36Sopenharmony_ci} 196962306a36Sopenharmony_ci 197062306a36Sopenharmony_cistatic u32 *emit_store_dw(u32 *cs, u32 offset, u32 value) 197162306a36Sopenharmony_ci{ 197262306a36Sopenharmony_ci *cs++ = MI_STORE_DWORD_IMM_GEN4 | MI_USE_GGTT; 197362306a36Sopenharmony_ci *cs++ = offset; 197462306a36Sopenharmony_ci *cs++ = 0; 197562306a36Sopenharmony_ci *cs++ = value; 197662306a36Sopenharmony_ci 197762306a36Sopenharmony_ci return cs; 197862306a36Sopenharmony_ci} 197962306a36Sopenharmony_ci 198062306a36Sopenharmony_cistatic u32 *emit_semaphore_poll(u32 *cs, u32 mode, u32 value, u32 offset) 198162306a36Sopenharmony_ci{ 198262306a36Sopenharmony_ci *cs++ = MI_SEMAPHORE_WAIT | 198362306a36Sopenharmony_ci MI_SEMAPHORE_GLOBAL_GTT | 198462306a36Sopenharmony_ci MI_SEMAPHORE_POLL | 198562306a36Sopenharmony_ci mode; 198662306a36Sopenharmony_ci *cs++ = value; 198762306a36Sopenharmony_ci *cs++ = offset; 198862306a36Sopenharmony_ci *cs++ = 0; 198962306a36Sopenharmony_ci 199062306a36Sopenharmony_ci return cs; 199162306a36Sopenharmony_ci} 199262306a36Sopenharmony_ci 199362306a36Sopenharmony_cistatic u32 *emit_semaphore_poll_until(u32 *cs, u32 offset, u32 value) 199462306a36Sopenharmony_ci{ 199562306a36Sopenharmony_ci return emit_semaphore_poll(cs, MI_SEMAPHORE_SAD_EQ_SDD, value, offset); 199662306a36Sopenharmony_ci} 199762306a36Sopenharmony_ci 199862306a36Sopenharmony_cistatic void semaphore_set(u32 *sema, u32 value) 199962306a36Sopenharmony_ci{ 200062306a36Sopenharmony_ci WRITE_ONCE(*sema, value); 200162306a36Sopenharmony_ci wmb(); /* flush the update to the cache, and beyond */ 200262306a36Sopenharmony_ci} 200362306a36Sopenharmony_ci 200462306a36Sopenharmony_cistatic u32 *hwsp_scratch(const struct intel_context *ce) 200562306a36Sopenharmony_ci{ 200662306a36Sopenharmony_ci return memset32(ce->engine->status_page.addr + 1000, 0, 21); 200762306a36Sopenharmony_ci} 200862306a36Sopenharmony_ci 200962306a36Sopenharmony_cistatic u32 hwsp_offset(const struct intel_context *ce, u32 *dw) 201062306a36Sopenharmony_ci{ 201162306a36Sopenharmony_ci return (i915_ggtt_offset(ce->engine->status_page.vma) + 201262306a36Sopenharmony_ci offset_in_page(dw)); 201362306a36Sopenharmony_ci} 201462306a36Sopenharmony_ci 201562306a36Sopenharmony_cistatic int measure_semaphore_response(struct intel_context *ce) 201662306a36Sopenharmony_ci{ 201762306a36Sopenharmony_ci u32 *sema = hwsp_scratch(ce); 201862306a36Sopenharmony_ci const u32 offset = hwsp_offset(ce, sema); 201962306a36Sopenharmony_ci u32 elapsed[TF_COUNT], cycles; 202062306a36Sopenharmony_ci struct i915_request *rq; 202162306a36Sopenharmony_ci u32 *cs; 202262306a36Sopenharmony_ci int err; 202362306a36Sopenharmony_ci int i; 202462306a36Sopenharmony_ci 202562306a36Sopenharmony_ci /* 202662306a36Sopenharmony_ci * Measure how many cycles it takes for the HW to detect the change 202762306a36Sopenharmony_ci * in a semaphore value. 202862306a36Sopenharmony_ci * 202962306a36Sopenharmony_ci * A: read CS_TIMESTAMP from CPU 203062306a36Sopenharmony_ci * poke semaphore 203162306a36Sopenharmony_ci * B: read CS_TIMESTAMP on GPU 203262306a36Sopenharmony_ci * 203362306a36Sopenharmony_ci * Semaphore latency: B - A 203462306a36Sopenharmony_ci */ 203562306a36Sopenharmony_ci 203662306a36Sopenharmony_ci semaphore_set(sema, -1); 203762306a36Sopenharmony_ci 203862306a36Sopenharmony_ci rq = i915_request_create(ce); 203962306a36Sopenharmony_ci if (IS_ERR(rq)) 204062306a36Sopenharmony_ci return PTR_ERR(rq); 204162306a36Sopenharmony_ci 204262306a36Sopenharmony_ci cs = intel_ring_begin(rq, 4 + 12 * ARRAY_SIZE(elapsed)); 204362306a36Sopenharmony_ci if (IS_ERR(cs)) { 204462306a36Sopenharmony_ci i915_request_add(rq); 204562306a36Sopenharmony_ci err = PTR_ERR(cs); 204662306a36Sopenharmony_ci goto err; 204762306a36Sopenharmony_ci } 204862306a36Sopenharmony_ci 204962306a36Sopenharmony_ci cs = emit_store_dw(cs, offset, 0); 205062306a36Sopenharmony_ci for (i = 1; i <= ARRAY_SIZE(elapsed); i++) { 205162306a36Sopenharmony_ci cs = emit_semaphore_poll_until(cs, offset, i); 205262306a36Sopenharmony_ci cs = emit_timestamp_store(cs, ce, offset + i * sizeof(u32)); 205362306a36Sopenharmony_ci cs = emit_store_dw(cs, offset, 0); 205462306a36Sopenharmony_ci } 205562306a36Sopenharmony_ci 205662306a36Sopenharmony_ci intel_ring_advance(rq, cs); 205762306a36Sopenharmony_ci i915_request_add(rq); 205862306a36Sopenharmony_ci 205962306a36Sopenharmony_ci if (wait_for(READ_ONCE(*sema) == 0, 50)) { 206062306a36Sopenharmony_ci err = -EIO; 206162306a36Sopenharmony_ci goto err; 206262306a36Sopenharmony_ci } 206362306a36Sopenharmony_ci 206462306a36Sopenharmony_ci for (i = 1; i <= ARRAY_SIZE(elapsed); i++) { 206562306a36Sopenharmony_ci preempt_disable(); 206662306a36Sopenharmony_ci cycles = ENGINE_READ_FW(ce->engine, RING_TIMESTAMP); 206762306a36Sopenharmony_ci semaphore_set(sema, i); 206862306a36Sopenharmony_ci preempt_enable(); 206962306a36Sopenharmony_ci 207062306a36Sopenharmony_ci if (wait_for(READ_ONCE(*sema) == 0, 50)) { 207162306a36Sopenharmony_ci err = -EIO; 207262306a36Sopenharmony_ci goto err; 207362306a36Sopenharmony_ci } 207462306a36Sopenharmony_ci 207562306a36Sopenharmony_ci elapsed[i - 1] = sema[i] - cycles; 207662306a36Sopenharmony_ci } 207762306a36Sopenharmony_ci 207862306a36Sopenharmony_ci cycles = trifilter(elapsed); 207962306a36Sopenharmony_ci pr_info("%s: semaphore response %d cycles, %lluns\n", 208062306a36Sopenharmony_ci ce->engine->name, cycles >> TF_BIAS, 208162306a36Sopenharmony_ci cycles_to_ns(ce->engine, cycles)); 208262306a36Sopenharmony_ci 208362306a36Sopenharmony_ci return intel_gt_wait_for_idle(ce->engine->gt, HZ); 208462306a36Sopenharmony_ci 208562306a36Sopenharmony_cierr: 208662306a36Sopenharmony_ci intel_gt_set_wedged(ce->engine->gt); 208762306a36Sopenharmony_ci return err; 208862306a36Sopenharmony_ci} 208962306a36Sopenharmony_ci 209062306a36Sopenharmony_cistatic int measure_idle_dispatch(struct intel_context *ce) 209162306a36Sopenharmony_ci{ 209262306a36Sopenharmony_ci u32 *sema = hwsp_scratch(ce); 209362306a36Sopenharmony_ci const u32 offset = hwsp_offset(ce, sema); 209462306a36Sopenharmony_ci u32 elapsed[TF_COUNT], cycles; 209562306a36Sopenharmony_ci u32 *cs; 209662306a36Sopenharmony_ci int err; 209762306a36Sopenharmony_ci int i; 209862306a36Sopenharmony_ci 209962306a36Sopenharmony_ci /* 210062306a36Sopenharmony_ci * Measure how long it takes for us to submit a request while the 210162306a36Sopenharmony_ci * engine is idle, but is resting in our context. 210262306a36Sopenharmony_ci * 210362306a36Sopenharmony_ci * A: read CS_TIMESTAMP from CPU 210462306a36Sopenharmony_ci * submit request 210562306a36Sopenharmony_ci * B: read CS_TIMESTAMP on GPU 210662306a36Sopenharmony_ci * 210762306a36Sopenharmony_ci * Submission latency: B - A 210862306a36Sopenharmony_ci */ 210962306a36Sopenharmony_ci 211062306a36Sopenharmony_ci for (i = 0; i < ARRAY_SIZE(elapsed); i++) { 211162306a36Sopenharmony_ci struct i915_request *rq; 211262306a36Sopenharmony_ci 211362306a36Sopenharmony_ci err = intel_gt_wait_for_idle(ce->engine->gt, HZ / 2); 211462306a36Sopenharmony_ci if (err) 211562306a36Sopenharmony_ci return err; 211662306a36Sopenharmony_ci 211762306a36Sopenharmony_ci rq = i915_request_create(ce); 211862306a36Sopenharmony_ci if (IS_ERR(rq)) { 211962306a36Sopenharmony_ci err = PTR_ERR(rq); 212062306a36Sopenharmony_ci goto err; 212162306a36Sopenharmony_ci } 212262306a36Sopenharmony_ci 212362306a36Sopenharmony_ci cs = intel_ring_begin(rq, 4); 212462306a36Sopenharmony_ci if (IS_ERR(cs)) { 212562306a36Sopenharmony_ci i915_request_add(rq); 212662306a36Sopenharmony_ci err = PTR_ERR(cs); 212762306a36Sopenharmony_ci goto err; 212862306a36Sopenharmony_ci } 212962306a36Sopenharmony_ci 213062306a36Sopenharmony_ci cs = emit_timestamp_store(cs, ce, offset + i * sizeof(u32)); 213162306a36Sopenharmony_ci 213262306a36Sopenharmony_ci intel_ring_advance(rq, cs); 213362306a36Sopenharmony_ci 213462306a36Sopenharmony_ci preempt_disable(); 213562306a36Sopenharmony_ci local_bh_disable(); 213662306a36Sopenharmony_ci elapsed[i] = ENGINE_READ_FW(ce->engine, RING_TIMESTAMP); 213762306a36Sopenharmony_ci i915_request_add(rq); 213862306a36Sopenharmony_ci local_bh_enable(); 213962306a36Sopenharmony_ci preempt_enable(); 214062306a36Sopenharmony_ci } 214162306a36Sopenharmony_ci 214262306a36Sopenharmony_ci err = intel_gt_wait_for_idle(ce->engine->gt, HZ / 2); 214362306a36Sopenharmony_ci if (err) 214462306a36Sopenharmony_ci goto err; 214562306a36Sopenharmony_ci 214662306a36Sopenharmony_ci for (i = 0; i < ARRAY_SIZE(elapsed); i++) 214762306a36Sopenharmony_ci elapsed[i] = sema[i] - elapsed[i]; 214862306a36Sopenharmony_ci 214962306a36Sopenharmony_ci cycles = trifilter(elapsed); 215062306a36Sopenharmony_ci pr_info("%s: idle dispatch latency %d cycles, %lluns\n", 215162306a36Sopenharmony_ci ce->engine->name, cycles >> TF_BIAS, 215262306a36Sopenharmony_ci cycles_to_ns(ce->engine, cycles)); 215362306a36Sopenharmony_ci 215462306a36Sopenharmony_ci return intel_gt_wait_for_idle(ce->engine->gt, HZ); 215562306a36Sopenharmony_ci 215662306a36Sopenharmony_cierr: 215762306a36Sopenharmony_ci intel_gt_set_wedged(ce->engine->gt); 215862306a36Sopenharmony_ci return err; 215962306a36Sopenharmony_ci} 216062306a36Sopenharmony_ci 216162306a36Sopenharmony_cistatic int measure_busy_dispatch(struct intel_context *ce) 216262306a36Sopenharmony_ci{ 216362306a36Sopenharmony_ci u32 *sema = hwsp_scratch(ce); 216462306a36Sopenharmony_ci const u32 offset = hwsp_offset(ce, sema); 216562306a36Sopenharmony_ci u32 elapsed[TF_COUNT + 1], cycles; 216662306a36Sopenharmony_ci u32 *cs; 216762306a36Sopenharmony_ci int err; 216862306a36Sopenharmony_ci int i; 216962306a36Sopenharmony_ci 217062306a36Sopenharmony_ci /* 217162306a36Sopenharmony_ci * Measure how long it takes for us to submit a request while the 217262306a36Sopenharmony_ci * engine is busy, polling on a semaphore in our context. With 217362306a36Sopenharmony_ci * direct submission, this will include the cost of a lite restore. 217462306a36Sopenharmony_ci * 217562306a36Sopenharmony_ci * A: read CS_TIMESTAMP from CPU 217662306a36Sopenharmony_ci * submit request 217762306a36Sopenharmony_ci * B: read CS_TIMESTAMP on GPU 217862306a36Sopenharmony_ci * 217962306a36Sopenharmony_ci * Submission latency: B - A 218062306a36Sopenharmony_ci */ 218162306a36Sopenharmony_ci 218262306a36Sopenharmony_ci for (i = 1; i <= ARRAY_SIZE(elapsed); i++) { 218362306a36Sopenharmony_ci struct i915_request *rq; 218462306a36Sopenharmony_ci 218562306a36Sopenharmony_ci rq = i915_request_create(ce); 218662306a36Sopenharmony_ci if (IS_ERR(rq)) { 218762306a36Sopenharmony_ci err = PTR_ERR(rq); 218862306a36Sopenharmony_ci goto err; 218962306a36Sopenharmony_ci } 219062306a36Sopenharmony_ci 219162306a36Sopenharmony_ci cs = intel_ring_begin(rq, 12); 219262306a36Sopenharmony_ci if (IS_ERR(cs)) { 219362306a36Sopenharmony_ci i915_request_add(rq); 219462306a36Sopenharmony_ci err = PTR_ERR(cs); 219562306a36Sopenharmony_ci goto err; 219662306a36Sopenharmony_ci } 219762306a36Sopenharmony_ci 219862306a36Sopenharmony_ci cs = emit_store_dw(cs, offset + i * sizeof(u32), -1); 219962306a36Sopenharmony_ci cs = emit_semaphore_poll_until(cs, offset, i); 220062306a36Sopenharmony_ci cs = emit_timestamp_store(cs, ce, offset + i * sizeof(u32)); 220162306a36Sopenharmony_ci 220262306a36Sopenharmony_ci intel_ring_advance(rq, cs); 220362306a36Sopenharmony_ci 220462306a36Sopenharmony_ci if (i > 1 && wait_for(READ_ONCE(sema[i - 1]), 500)) { 220562306a36Sopenharmony_ci err = -EIO; 220662306a36Sopenharmony_ci goto err; 220762306a36Sopenharmony_ci } 220862306a36Sopenharmony_ci 220962306a36Sopenharmony_ci preempt_disable(); 221062306a36Sopenharmony_ci local_bh_disable(); 221162306a36Sopenharmony_ci elapsed[i - 1] = ENGINE_READ_FW(ce->engine, RING_TIMESTAMP); 221262306a36Sopenharmony_ci i915_request_add(rq); 221362306a36Sopenharmony_ci local_bh_enable(); 221462306a36Sopenharmony_ci semaphore_set(sema, i - 1); 221562306a36Sopenharmony_ci preempt_enable(); 221662306a36Sopenharmony_ci } 221762306a36Sopenharmony_ci 221862306a36Sopenharmony_ci wait_for(READ_ONCE(sema[i - 1]), 500); 221962306a36Sopenharmony_ci semaphore_set(sema, i - 1); 222062306a36Sopenharmony_ci 222162306a36Sopenharmony_ci for (i = 1; i <= TF_COUNT; i++) { 222262306a36Sopenharmony_ci GEM_BUG_ON(sema[i] == -1); 222362306a36Sopenharmony_ci elapsed[i - 1] = sema[i] - elapsed[i]; 222462306a36Sopenharmony_ci } 222562306a36Sopenharmony_ci 222662306a36Sopenharmony_ci cycles = trifilter(elapsed); 222762306a36Sopenharmony_ci pr_info("%s: busy dispatch latency %d cycles, %lluns\n", 222862306a36Sopenharmony_ci ce->engine->name, cycles >> TF_BIAS, 222962306a36Sopenharmony_ci cycles_to_ns(ce->engine, cycles)); 223062306a36Sopenharmony_ci 223162306a36Sopenharmony_ci return intel_gt_wait_for_idle(ce->engine->gt, HZ); 223262306a36Sopenharmony_ci 223362306a36Sopenharmony_cierr: 223462306a36Sopenharmony_ci intel_gt_set_wedged(ce->engine->gt); 223562306a36Sopenharmony_ci return err; 223662306a36Sopenharmony_ci} 223762306a36Sopenharmony_ci 223862306a36Sopenharmony_cistatic int plug(struct intel_engine_cs *engine, u32 *sema, u32 mode, int value) 223962306a36Sopenharmony_ci{ 224062306a36Sopenharmony_ci const u32 offset = 224162306a36Sopenharmony_ci i915_ggtt_offset(engine->status_page.vma) + 224262306a36Sopenharmony_ci offset_in_page(sema); 224362306a36Sopenharmony_ci struct i915_request *rq; 224462306a36Sopenharmony_ci u32 *cs; 224562306a36Sopenharmony_ci 224662306a36Sopenharmony_ci rq = i915_request_create(engine->kernel_context); 224762306a36Sopenharmony_ci if (IS_ERR(rq)) 224862306a36Sopenharmony_ci return PTR_ERR(rq); 224962306a36Sopenharmony_ci 225062306a36Sopenharmony_ci cs = intel_ring_begin(rq, 4); 225162306a36Sopenharmony_ci if (IS_ERR(cs)) { 225262306a36Sopenharmony_ci i915_request_add(rq); 225362306a36Sopenharmony_ci return PTR_ERR(cs); 225462306a36Sopenharmony_ci } 225562306a36Sopenharmony_ci 225662306a36Sopenharmony_ci cs = emit_semaphore_poll(cs, mode, value, offset); 225762306a36Sopenharmony_ci 225862306a36Sopenharmony_ci intel_ring_advance(rq, cs); 225962306a36Sopenharmony_ci i915_request_add(rq); 226062306a36Sopenharmony_ci 226162306a36Sopenharmony_ci return 0; 226262306a36Sopenharmony_ci} 226362306a36Sopenharmony_ci 226462306a36Sopenharmony_cistatic int measure_inter_request(struct intel_context *ce) 226562306a36Sopenharmony_ci{ 226662306a36Sopenharmony_ci u32 *sema = hwsp_scratch(ce); 226762306a36Sopenharmony_ci const u32 offset = hwsp_offset(ce, sema); 226862306a36Sopenharmony_ci u32 elapsed[TF_COUNT + 1], cycles; 226962306a36Sopenharmony_ci struct i915_sw_fence *submit; 227062306a36Sopenharmony_ci int i, err; 227162306a36Sopenharmony_ci 227262306a36Sopenharmony_ci /* 227362306a36Sopenharmony_ci * Measure how long it takes to advance from one request into the 227462306a36Sopenharmony_ci * next. Between each request we flush the GPU caches to memory, 227562306a36Sopenharmony_ci * update the breadcrumbs, and then invalidate those caches. 227662306a36Sopenharmony_ci * We queue up all the requests to be submitted in one batch so 227762306a36Sopenharmony_ci * it should be one set of contiguous measurements. 227862306a36Sopenharmony_ci * 227962306a36Sopenharmony_ci * A: read CS_TIMESTAMP on GPU 228062306a36Sopenharmony_ci * advance request 228162306a36Sopenharmony_ci * B: read CS_TIMESTAMP on GPU 228262306a36Sopenharmony_ci * 228362306a36Sopenharmony_ci * Request latency: B - A 228462306a36Sopenharmony_ci */ 228562306a36Sopenharmony_ci 228662306a36Sopenharmony_ci err = plug(ce->engine, sema, MI_SEMAPHORE_SAD_NEQ_SDD, 0); 228762306a36Sopenharmony_ci if (err) 228862306a36Sopenharmony_ci return err; 228962306a36Sopenharmony_ci 229062306a36Sopenharmony_ci submit = heap_fence_create(GFP_KERNEL); 229162306a36Sopenharmony_ci if (!submit) { 229262306a36Sopenharmony_ci semaphore_set(sema, 1); 229362306a36Sopenharmony_ci return -ENOMEM; 229462306a36Sopenharmony_ci } 229562306a36Sopenharmony_ci 229662306a36Sopenharmony_ci intel_engine_flush_submission(ce->engine); 229762306a36Sopenharmony_ci for (i = 1; i <= ARRAY_SIZE(elapsed); i++) { 229862306a36Sopenharmony_ci struct i915_request *rq; 229962306a36Sopenharmony_ci u32 *cs; 230062306a36Sopenharmony_ci 230162306a36Sopenharmony_ci rq = i915_request_create(ce); 230262306a36Sopenharmony_ci if (IS_ERR(rq)) { 230362306a36Sopenharmony_ci err = PTR_ERR(rq); 230462306a36Sopenharmony_ci goto err_submit; 230562306a36Sopenharmony_ci } 230662306a36Sopenharmony_ci 230762306a36Sopenharmony_ci err = i915_sw_fence_await_sw_fence_gfp(&rq->submit, 230862306a36Sopenharmony_ci submit, 230962306a36Sopenharmony_ci GFP_KERNEL); 231062306a36Sopenharmony_ci if (err < 0) { 231162306a36Sopenharmony_ci i915_request_add(rq); 231262306a36Sopenharmony_ci goto err_submit; 231362306a36Sopenharmony_ci } 231462306a36Sopenharmony_ci 231562306a36Sopenharmony_ci cs = intel_ring_begin(rq, 4); 231662306a36Sopenharmony_ci if (IS_ERR(cs)) { 231762306a36Sopenharmony_ci i915_request_add(rq); 231862306a36Sopenharmony_ci err = PTR_ERR(cs); 231962306a36Sopenharmony_ci goto err_submit; 232062306a36Sopenharmony_ci } 232162306a36Sopenharmony_ci 232262306a36Sopenharmony_ci cs = emit_timestamp_store(cs, ce, offset + i * sizeof(u32)); 232362306a36Sopenharmony_ci 232462306a36Sopenharmony_ci intel_ring_advance(rq, cs); 232562306a36Sopenharmony_ci i915_request_add(rq); 232662306a36Sopenharmony_ci } 232762306a36Sopenharmony_ci i915_sw_fence_commit(submit); 232862306a36Sopenharmony_ci intel_engine_flush_submission(ce->engine); 232962306a36Sopenharmony_ci heap_fence_put(submit); 233062306a36Sopenharmony_ci 233162306a36Sopenharmony_ci semaphore_set(sema, 1); 233262306a36Sopenharmony_ci err = intel_gt_wait_for_idle(ce->engine->gt, HZ / 2); 233362306a36Sopenharmony_ci if (err) 233462306a36Sopenharmony_ci goto err; 233562306a36Sopenharmony_ci 233662306a36Sopenharmony_ci for (i = 1; i <= TF_COUNT; i++) 233762306a36Sopenharmony_ci elapsed[i - 1] = sema[i + 1] - sema[i]; 233862306a36Sopenharmony_ci 233962306a36Sopenharmony_ci cycles = trifilter(elapsed); 234062306a36Sopenharmony_ci pr_info("%s: inter-request latency %d cycles, %lluns\n", 234162306a36Sopenharmony_ci ce->engine->name, cycles >> TF_BIAS, 234262306a36Sopenharmony_ci cycles_to_ns(ce->engine, cycles)); 234362306a36Sopenharmony_ci 234462306a36Sopenharmony_ci return intel_gt_wait_for_idle(ce->engine->gt, HZ); 234562306a36Sopenharmony_ci 234662306a36Sopenharmony_cierr_submit: 234762306a36Sopenharmony_ci i915_sw_fence_commit(submit); 234862306a36Sopenharmony_ci heap_fence_put(submit); 234962306a36Sopenharmony_ci semaphore_set(sema, 1); 235062306a36Sopenharmony_cierr: 235162306a36Sopenharmony_ci intel_gt_set_wedged(ce->engine->gt); 235262306a36Sopenharmony_ci return err; 235362306a36Sopenharmony_ci} 235462306a36Sopenharmony_ci 235562306a36Sopenharmony_cistatic int measure_context_switch(struct intel_context *ce) 235662306a36Sopenharmony_ci{ 235762306a36Sopenharmony_ci u32 *sema = hwsp_scratch(ce); 235862306a36Sopenharmony_ci const u32 offset = hwsp_offset(ce, sema); 235962306a36Sopenharmony_ci struct i915_request *fence = NULL; 236062306a36Sopenharmony_ci u32 elapsed[TF_COUNT + 1], cycles; 236162306a36Sopenharmony_ci int i, j, err; 236262306a36Sopenharmony_ci u32 *cs; 236362306a36Sopenharmony_ci 236462306a36Sopenharmony_ci /* 236562306a36Sopenharmony_ci * Measure how long it takes to advance from one request in one 236662306a36Sopenharmony_ci * context to a request in another context. This allows us to 236762306a36Sopenharmony_ci * measure how long the context save/restore take, along with all 236862306a36Sopenharmony_ci * the inter-context setup we require. 236962306a36Sopenharmony_ci * 237062306a36Sopenharmony_ci * A: read CS_TIMESTAMP on GPU 237162306a36Sopenharmony_ci * switch context 237262306a36Sopenharmony_ci * B: read CS_TIMESTAMP on GPU 237362306a36Sopenharmony_ci * 237462306a36Sopenharmony_ci * Context switch latency: B - A 237562306a36Sopenharmony_ci */ 237662306a36Sopenharmony_ci 237762306a36Sopenharmony_ci err = plug(ce->engine, sema, MI_SEMAPHORE_SAD_NEQ_SDD, 0); 237862306a36Sopenharmony_ci if (err) 237962306a36Sopenharmony_ci return err; 238062306a36Sopenharmony_ci 238162306a36Sopenharmony_ci for (i = 1; i <= ARRAY_SIZE(elapsed); i++) { 238262306a36Sopenharmony_ci struct intel_context *arr[] = { 238362306a36Sopenharmony_ci ce, ce->engine->kernel_context 238462306a36Sopenharmony_ci }; 238562306a36Sopenharmony_ci u32 addr = offset + ARRAY_SIZE(arr) * i * sizeof(u32); 238662306a36Sopenharmony_ci 238762306a36Sopenharmony_ci for (j = 0; j < ARRAY_SIZE(arr); j++) { 238862306a36Sopenharmony_ci struct i915_request *rq; 238962306a36Sopenharmony_ci 239062306a36Sopenharmony_ci rq = i915_request_create(arr[j]); 239162306a36Sopenharmony_ci if (IS_ERR(rq)) { 239262306a36Sopenharmony_ci err = PTR_ERR(rq); 239362306a36Sopenharmony_ci goto err_fence; 239462306a36Sopenharmony_ci } 239562306a36Sopenharmony_ci 239662306a36Sopenharmony_ci if (fence) { 239762306a36Sopenharmony_ci err = i915_request_await_dma_fence(rq, 239862306a36Sopenharmony_ci &fence->fence); 239962306a36Sopenharmony_ci if (err) { 240062306a36Sopenharmony_ci i915_request_add(rq); 240162306a36Sopenharmony_ci goto err_fence; 240262306a36Sopenharmony_ci } 240362306a36Sopenharmony_ci } 240462306a36Sopenharmony_ci 240562306a36Sopenharmony_ci cs = intel_ring_begin(rq, 4); 240662306a36Sopenharmony_ci if (IS_ERR(cs)) { 240762306a36Sopenharmony_ci i915_request_add(rq); 240862306a36Sopenharmony_ci err = PTR_ERR(cs); 240962306a36Sopenharmony_ci goto err_fence; 241062306a36Sopenharmony_ci } 241162306a36Sopenharmony_ci 241262306a36Sopenharmony_ci cs = emit_timestamp_store(cs, ce, addr); 241362306a36Sopenharmony_ci addr += sizeof(u32); 241462306a36Sopenharmony_ci 241562306a36Sopenharmony_ci intel_ring_advance(rq, cs); 241662306a36Sopenharmony_ci 241762306a36Sopenharmony_ci i915_request_put(fence); 241862306a36Sopenharmony_ci fence = i915_request_get(rq); 241962306a36Sopenharmony_ci 242062306a36Sopenharmony_ci i915_request_add(rq); 242162306a36Sopenharmony_ci } 242262306a36Sopenharmony_ci } 242362306a36Sopenharmony_ci i915_request_put(fence); 242462306a36Sopenharmony_ci intel_engine_flush_submission(ce->engine); 242562306a36Sopenharmony_ci 242662306a36Sopenharmony_ci semaphore_set(sema, 1); 242762306a36Sopenharmony_ci err = intel_gt_wait_for_idle(ce->engine->gt, HZ / 2); 242862306a36Sopenharmony_ci if (err) 242962306a36Sopenharmony_ci goto err; 243062306a36Sopenharmony_ci 243162306a36Sopenharmony_ci for (i = 1; i <= TF_COUNT; i++) 243262306a36Sopenharmony_ci elapsed[i - 1] = sema[2 * i + 2] - sema[2 * i + 1]; 243362306a36Sopenharmony_ci 243462306a36Sopenharmony_ci cycles = trifilter(elapsed); 243562306a36Sopenharmony_ci pr_info("%s: context switch latency %d cycles, %lluns\n", 243662306a36Sopenharmony_ci ce->engine->name, cycles >> TF_BIAS, 243762306a36Sopenharmony_ci cycles_to_ns(ce->engine, cycles)); 243862306a36Sopenharmony_ci 243962306a36Sopenharmony_ci return intel_gt_wait_for_idle(ce->engine->gt, HZ); 244062306a36Sopenharmony_ci 244162306a36Sopenharmony_cierr_fence: 244262306a36Sopenharmony_ci i915_request_put(fence); 244362306a36Sopenharmony_ci semaphore_set(sema, 1); 244462306a36Sopenharmony_cierr: 244562306a36Sopenharmony_ci intel_gt_set_wedged(ce->engine->gt); 244662306a36Sopenharmony_ci return err; 244762306a36Sopenharmony_ci} 244862306a36Sopenharmony_ci 244962306a36Sopenharmony_cistatic int measure_preemption(struct intel_context *ce) 245062306a36Sopenharmony_ci{ 245162306a36Sopenharmony_ci u32 *sema = hwsp_scratch(ce); 245262306a36Sopenharmony_ci const u32 offset = hwsp_offset(ce, sema); 245362306a36Sopenharmony_ci u32 elapsed[TF_COUNT], cycles; 245462306a36Sopenharmony_ci u32 *cs; 245562306a36Sopenharmony_ci int err; 245662306a36Sopenharmony_ci int i; 245762306a36Sopenharmony_ci 245862306a36Sopenharmony_ci /* 245962306a36Sopenharmony_ci * We measure two latencies while triggering preemption. The first 246062306a36Sopenharmony_ci * latency is how long it takes for us to submit a preempting request. 246162306a36Sopenharmony_ci * The second latency is how it takes for us to return from the 246262306a36Sopenharmony_ci * preemption back to the original context. 246362306a36Sopenharmony_ci * 246462306a36Sopenharmony_ci * A: read CS_TIMESTAMP from CPU 246562306a36Sopenharmony_ci * submit preemption 246662306a36Sopenharmony_ci * B: read CS_TIMESTAMP on GPU (in preempting context) 246762306a36Sopenharmony_ci * context switch 246862306a36Sopenharmony_ci * C: read CS_TIMESTAMP on GPU (in original context) 246962306a36Sopenharmony_ci * 247062306a36Sopenharmony_ci * Preemption dispatch latency: B - A 247162306a36Sopenharmony_ci * Preemption switch latency: C - B 247262306a36Sopenharmony_ci */ 247362306a36Sopenharmony_ci 247462306a36Sopenharmony_ci if (!intel_engine_has_preemption(ce->engine)) 247562306a36Sopenharmony_ci return 0; 247662306a36Sopenharmony_ci 247762306a36Sopenharmony_ci for (i = 1; i <= ARRAY_SIZE(elapsed); i++) { 247862306a36Sopenharmony_ci u32 addr = offset + 2 * i * sizeof(u32); 247962306a36Sopenharmony_ci struct i915_request *rq; 248062306a36Sopenharmony_ci 248162306a36Sopenharmony_ci rq = i915_request_create(ce); 248262306a36Sopenharmony_ci if (IS_ERR(rq)) { 248362306a36Sopenharmony_ci err = PTR_ERR(rq); 248462306a36Sopenharmony_ci goto err; 248562306a36Sopenharmony_ci } 248662306a36Sopenharmony_ci 248762306a36Sopenharmony_ci cs = intel_ring_begin(rq, 12); 248862306a36Sopenharmony_ci if (IS_ERR(cs)) { 248962306a36Sopenharmony_ci i915_request_add(rq); 249062306a36Sopenharmony_ci err = PTR_ERR(cs); 249162306a36Sopenharmony_ci goto err; 249262306a36Sopenharmony_ci } 249362306a36Sopenharmony_ci 249462306a36Sopenharmony_ci cs = emit_store_dw(cs, addr, -1); 249562306a36Sopenharmony_ci cs = emit_semaphore_poll_until(cs, offset, i); 249662306a36Sopenharmony_ci cs = emit_timestamp_store(cs, ce, addr + sizeof(u32)); 249762306a36Sopenharmony_ci 249862306a36Sopenharmony_ci intel_ring_advance(rq, cs); 249962306a36Sopenharmony_ci i915_request_add(rq); 250062306a36Sopenharmony_ci 250162306a36Sopenharmony_ci if (wait_for(READ_ONCE(sema[2 * i]) == -1, 500)) { 250262306a36Sopenharmony_ci err = -EIO; 250362306a36Sopenharmony_ci goto err; 250462306a36Sopenharmony_ci } 250562306a36Sopenharmony_ci 250662306a36Sopenharmony_ci rq = i915_request_create(ce->engine->kernel_context); 250762306a36Sopenharmony_ci if (IS_ERR(rq)) { 250862306a36Sopenharmony_ci err = PTR_ERR(rq); 250962306a36Sopenharmony_ci goto err; 251062306a36Sopenharmony_ci } 251162306a36Sopenharmony_ci 251262306a36Sopenharmony_ci cs = intel_ring_begin(rq, 8); 251362306a36Sopenharmony_ci if (IS_ERR(cs)) { 251462306a36Sopenharmony_ci i915_request_add(rq); 251562306a36Sopenharmony_ci err = PTR_ERR(cs); 251662306a36Sopenharmony_ci goto err; 251762306a36Sopenharmony_ci } 251862306a36Sopenharmony_ci 251962306a36Sopenharmony_ci cs = emit_timestamp_store(cs, ce, addr); 252062306a36Sopenharmony_ci cs = emit_store_dw(cs, offset, i); 252162306a36Sopenharmony_ci 252262306a36Sopenharmony_ci intel_ring_advance(rq, cs); 252362306a36Sopenharmony_ci rq->sched.attr.priority = I915_PRIORITY_BARRIER; 252462306a36Sopenharmony_ci 252562306a36Sopenharmony_ci elapsed[i - 1] = ENGINE_READ_FW(ce->engine, RING_TIMESTAMP); 252662306a36Sopenharmony_ci i915_request_add(rq); 252762306a36Sopenharmony_ci } 252862306a36Sopenharmony_ci 252962306a36Sopenharmony_ci if (wait_for(READ_ONCE(sema[2 * i - 2]) != -1, 500)) { 253062306a36Sopenharmony_ci err = -EIO; 253162306a36Sopenharmony_ci goto err; 253262306a36Sopenharmony_ci } 253362306a36Sopenharmony_ci 253462306a36Sopenharmony_ci for (i = 1; i <= TF_COUNT; i++) 253562306a36Sopenharmony_ci elapsed[i - 1] = sema[2 * i + 0] - elapsed[i - 1]; 253662306a36Sopenharmony_ci 253762306a36Sopenharmony_ci cycles = trifilter(elapsed); 253862306a36Sopenharmony_ci pr_info("%s: preemption dispatch latency %d cycles, %lluns\n", 253962306a36Sopenharmony_ci ce->engine->name, cycles >> TF_BIAS, 254062306a36Sopenharmony_ci cycles_to_ns(ce->engine, cycles)); 254162306a36Sopenharmony_ci 254262306a36Sopenharmony_ci for (i = 1; i <= TF_COUNT; i++) 254362306a36Sopenharmony_ci elapsed[i - 1] = sema[2 * i + 1] - sema[2 * i + 0]; 254462306a36Sopenharmony_ci 254562306a36Sopenharmony_ci cycles = trifilter(elapsed); 254662306a36Sopenharmony_ci pr_info("%s: preemption switch latency %d cycles, %lluns\n", 254762306a36Sopenharmony_ci ce->engine->name, cycles >> TF_BIAS, 254862306a36Sopenharmony_ci cycles_to_ns(ce->engine, cycles)); 254962306a36Sopenharmony_ci 255062306a36Sopenharmony_ci return intel_gt_wait_for_idle(ce->engine->gt, HZ); 255162306a36Sopenharmony_ci 255262306a36Sopenharmony_cierr: 255362306a36Sopenharmony_ci intel_gt_set_wedged(ce->engine->gt); 255462306a36Sopenharmony_ci return err; 255562306a36Sopenharmony_ci} 255662306a36Sopenharmony_ci 255762306a36Sopenharmony_cistruct signal_cb { 255862306a36Sopenharmony_ci struct dma_fence_cb base; 255962306a36Sopenharmony_ci bool seen; 256062306a36Sopenharmony_ci}; 256162306a36Sopenharmony_ci 256262306a36Sopenharmony_cistatic void signal_cb(struct dma_fence *fence, struct dma_fence_cb *cb) 256362306a36Sopenharmony_ci{ 256462306a36Sopenharmony_ci struct signal_cb *s = container_of(cb, typeof(*s), base); 256562306a36Sopenharmony_ci 256662306a36Sopenharmony_ci smp_store_mb(s->seen, true); /* be safe, be strong */ 256762306a36Sopenharmony_ci} 256862306a36Sopenharmony_ci 256962306a36Sopenharmony_cistatic int measure_completion(struct intel_context *ce) 257062306a36Sopenharmony_ci{ 257162306a36Sopenharmony_ci u32 *sema = hwsp_scratch(ce); 257262306a36Sopenharmony_ci const u32 offset = hwsp_offset(ce, sema); 257362306a36Sopenharmony_ci u32 elapsed[TF_COUNT], cycles; 257462306a36Sopenharmony_ci u32 *cs; 257562306a36Sopenharmony_ci int err; 257662306a36Sopenharmony_ci int i; 257762306a36Sopenharmony_ci 257862306a36Sopenharmony_ci /* 257962306a36Sopenharmony_ci * Measure how long it takes for the signal (interrupt) to be 258062306a36Sopenharmony_ci * sent from the GPU to be processed by the CPU. 258162306a36Sopenharmony_ci * 258262306a36Sopenharmony_ci * A: read CS_TIMESTAMP on GPU 258362306a36Sopenharmony_ci * signal 258462306a36Sopenharmony_ci * B: read CS_TIMESTAMP from CPU 258562306a36Sopenharmony_ci * 258662306a36Sopenharmony_ci * Completion latency: B - A 258762306a36Sopenharmony_ci */ 258862306a36Sopenharmony_ci 258962306a36Sopenharmony_ci for (i = 1; i <= ARRAY_SIZE(elapsed); i++) { 259062306a36Sopenharmony_ci struct signal_cb cb = { .seen = false }; 259162306a36Sopenharmony_ci struct i915_request *rq; 259262306a36Sopenharmony_ci 259362306a36Sopenharmony_ci rq = i915_request_create(ce); 259462306a36Sopenharmony_ci if (IS_ERR(rq)) { 259562306a36Sopenharmony_ci err = PTR_ERR(rq); 259662306a36Sopenharmony_ci goto err; 259762306a36Sopenharmony_ci } 259862306a36Sopenharmony_ci 259962306a36Sopenharmony_ci cs = intel_ring_begin(rq, 12); 260062306a36Sopenharmony_ci if (IS_ERR(cs)) { 260162306a36Sopenharmony_ci i915_request_add(rq); 260262306a36Sopenharmony_ci err = PTR_ERR(cs); 260362306a36Sopenharmony_ci goto err; 260462306a36Sopenharmony_ci } 260562306a36Sopenharmony_ci 260662306a36Sopenharmony_ci cs = emit_store_dw(cs, offset + i * sizeof(u32), -1); 260762306a36Sopenharmony_ci cs = emit_semaphore_poll_until(cs, offset, i); 260862306a36Sopenharmony_ci cs = emit_timestamp_store(cs, ce, offset + i * sizeof(u32)); 260962306a36Sopenharmony_ci 261062306a36Sopenharmony_ci intel_ring_advance(rq, cs); 261162306a36Sopenharmony_ci 261262306a36Sopenharmony_ci dma_fence_add_callback(&rq->fence, &cb.base, signal_cb); 261362306a36Sopenharmony_ci i915_request_add(rq); 261462306a36Sopenharmony_ci 261562306a36Sopenharmony_ci intel_engine_flush_submission(ce->engine); 261662306a36Sopenharmony_ci if (wait_for(READ_ONCE(sema[i]) == -1, 50)) { 261762306a36Sopenharmony_ci err = -EIO; 261862306a36Sopenharmony_ci goto err; 261962306a36Sopenharmony_ci } 262062306a36Sopenharmony_ci 262162306a36Sopenharmony_ci preempt_disable(); 262262306a36Sopenharmony_ci semaphore_set(sema, i); 262362306a36Sopenharmony_ci while (!READ_ONCE(cb.seen)) 262462306a36Sopenharmony_ci cpu_relax(); 262562306a36Sopenharmony_ci 262662306a36Sopenharmony_ci elapsed[i - 1] = ENGINE_READ_FW(ce->engine, RING_TIMESTAMP); 262762306a36Sopenharmony_ci preempt_enable(); 262862306a36Sopenharmony_ci } 262962306a36Sopenharmony_ci 263062306a36Sopenharmony_ci err = intel_gt_wait_for_idle(ce->engine->gt, HZ / 2); 263162306a36Sopenharmony_ci if (err) 263262306a36Sopenharmony_ci goto err; 263362306a36Sopenharmony_ci 263462306a36Sopenharmony_ci for (i = 0; i < ARRAY_SIZE(elapsed); i++) { 263562306a36Sopenharmony_ci GEM_BUG_ON(sema[i + 1] == -1); 263662306a36Sopenharmony_ci elapsed[i] = elapsed[i] - sema[i + 1]; 263762306a36Sopenharmony_ci } 263862306a36Sopenharmony_ci 263962306a36Sopenharmony_ci cycles = trifilter(elapsed); 264062306a36Sopenharmony_ci pr_info("%s: completion latency %d cycles, %lluns\n", 264162306a36Sopenharmony_ci ce->engine->name, cycles >> TF_BIAS, 264262306a36Sopenharmony_ci cycles_to_ns(ce->engine, cycles)); 264362306a36Sopenharmony_ci 264462306a36Sopenharmony_ci return intel_gt_wait_for_idle(ce->engine->gt, HZ); 264562306a36Sopenharmony_ci 264662306a36Sopenharmony_cierr: 264762306a36Sopenharmony_ci intel_gt_set_wedged(ce->engine->gt); 264862306a36Sopenharmony_ci return err; 264962306a36Sopenharmony_ci} 265062306a36Sopenharmony_ci 265162306a36Sopenharmony_cistatic void rps_pin(struct intel_gt *gt) 265262306a36Sopenharmony_ci{ 265362306a36Sopenharmony_ci /* Pin the frequency to max */ 265462306a36Sopenharmony_ci atomic_inc(>->rps.num_waiters); 265562306a36Sopenharmony_ci intel_uncore_forcewake_get(gt->uncore, FORCEWAKE_ALL); 265662306a36Sopenharmony_ci 265762306a36Sopenharmony_ci mutex_lock(>->rps.lock); 265862306a36Sopenharmony_ci intel_rps_set(>->rps, gt->rps.max_freq); 265962306a36Sopenharmony_ci mutex_unlock(>->rps.lock); 266062306a36Sopenharmony_ci} 266162306a36Sopenharmony_ci 266262306a36Sopenharmony_cistatic void rps_unpin(struct intel_gt *gt) 266362306a36Sopenharmony_ci{ 266462306a36Sopenharmony_ci intel_uncore_forcewake_put(gt->uncore, FORCEWAKE_ALL); 266562306a36Sopenharmony_ci atomic_dec(>->rps.num_waiters); 266662306a36Sopenharmony_ci} 266762306a36Sopenharmony_ci 266862306a36Sopenharmony_cistatic int perf_request_latency(void *arg) 266962306a36Sopenharmony_ci{ 267062306a36Sopenharmony_ci struct drm_i915_private *i915 = arg; 267162306a36Sopenharmony_ci struct intel_engine_cs *engine; 267262306a36Sopenharmony_ci struct pm_qos_request qos; 267362306a36Sopenharmony_ci int err = 0; 267462306a36Sopenharmony_ci 267562306a36Sopenharmony_ci if (GRAPHICS_VER(i915) < 8) /* per-engine CS timestamp, semaphores */ 267662306a36Sopenharmony_ci return 0; 267762306a36Sopenharmony_ci 267862306a36Sopenharmony_ci cpu_latency_qos_add_request(&qos, 0); /* disable cstates */ 267962306a36Sopenharmony_ci 268062306a36Sopenharmony_ci for_each_uabi_engine(engine, i915) { 268162306a36Sopenharmony_ci struct intel_context *ce; 268262306a36Sopenharmony_ci 268362306a36Sopenharmony_ci ce = intel_context_create(engine); 268462306a36Sopenharmony_ci if (IS_ERR(ce)) { 268562306a36Sopenharmony_ci err = PTR_ERR(ce); 268662306a36Sopenharmony_ci goto out; 268762306a36Sopenharmony_ci } 268862306a36Sopenharmony_ci 268962306a36Sopenharmony_ci err = intel_context_pin(ce); 269062306a36Sopenharmony_ci if (err) { 269162306a36Sopenharmony_ci intel_context_put(ce); 269262306a36Sopenharmony_ci goto out; 269362306a36Sopenharmony_ci } 269462306a36Sopenharmony_ci 269562306a36Sopenharmony_ci st_engine_heartbeat_disable(engine); 269662306a36Sopenharmony_ci rps_pin(engine->gt); 269762306a36Sopenharmony_ci 269862306a36Sopenharmony_ci if (err == 0) 269962306a36Sopenharmony_ci err = measure_semaphore_response(ce); 270062306a36Sopenharmony_ci if (err == 0) 270162306a36Sopenharmony_ci err = measure_idle_dispatch(ce); 270262306a36Sopenharmony_ci if (err == 0) 270362306a36Sopenharmony_ci err = measure_busy_dispatch(ce); 270462306a36Sopenharmony_ci if (err == 0) 270562306a36Sopenharmony_ci err = measure_inter_request(ce); 270662306a36Sopenharmony_ci if (err == 0) 270762306a36Sopenharmony_ci err = measure_context_switch(ce); 270862306a36Sopenharmony_ci if (err == 0) 270962306a36Sopenharmony_ci err = measure_preemption(ce); 271062306a36Sopenharmony_ci if (err == 0) 271162306a36Sopenharmony_ci err = measure_completion(ce); 271262306a36Sopenharmony_ci 271362306a36Sopenharmony_ci rps_unpin(engine->gt); 271462306a36Sopenharmony_ci st_engine_heartbeat_enable(engine); 271562306a36Sopenharmony_ci 271662306a36Sopenharmony_ci intel_context_unpin(ce); 271762306a36Sopenharmony_ci intel_context_put(ce); 271862306a36Sopenharmony_ci if (err) 271962306a36Sopenharmony_ci goto out; 272062306a36Sopenharmony_ci } 272162306a36Sopenharmony_ci 272262306a36Sopenharmony_ciout: 272362306a36Sopenharmony_ci if (igt_flush_test(i915)) 272462306a36Sopenharmony_ci err = -EIO; 272562306a36Sopenharmony_ci 272662306a36Sopenharmony_ci cpu_latency_qos_remove_request(&qos); 272762306a36Sopenharmony_ci return err; 272862306a36Sopenharmony_ci} 272962306a36Sopenharmony_ci 273062306a36Sopenharmony_cistatic int s_sync0(void *arg) 273162306a36Sopenharmony_ci{ 273262306a36Sopenharmony_ci struct perf_series *ps = arg; 273362306a36Sopenharmony_ci IGT_TIMEOUT(end_time); 273462306a36Sopenharmony_ci unsigned int idx = 0; 273562306a36Sopenharmony_ci int err = 0; 273662306a36Sopenharmony_ci 273762306a36Sopenharmony_ci GEM_BUG_ON(!ps->nengines); 273862306a36Sopenharmony_ci do { 273962306a36Sopenharmony_ci struct i915_request *rq; 274062306a36Sopenharmony_ci 274162306a36Sopenharmony_ci rq = i915_request_create(ps->ce[idx]); 274262306a36Sopenharmony_ci if (IS_ERR(rq)) { 274362306a36Sopenharmony_ci err = PTR_ERR(rq); 274462306a36Sopenharmony_ci break; 274562306a36Sopenharmony_ci } 274662306a36Sopenharmony_ci 274762306a36Sopenharmony_ci i915_request_get(rq); 274862306a36Sopenharmony_ci i915_request_add(rq); 274962306a36Sopenharmony_ci 275062306a36Sopenharmony_ci if (i915_request_wait(rq, 0, HZ / 5) < 0) 275162306a36Sopenharmony_ci err = -ETIME; 275262306a36Sopenharmony_ci i915_request_put(rq); 275362306a36Sopenharmony_ci if (err) 275462306a36Sopenharmony_ci break; 275562306a36Sopenharmony_ci 275662306a36Sopenharmony_ci if (++idx == ps->nengines) 275762306a36Sopenharmony_ci idx = 0; 275862306a36Sopenharmony_ci } while (!__igt_timeout(end_time, NULL)); 275962306a36Sopenharmony_ci 276062306a36Sopenharmony_ci return err; 276162306a36Sopenharmony_ci} 276262306a36Sopenharmony_ci 276362306a36Sopenharmony_cistatic int s_sync1(void *arg) 276462306a36Sopenharmony_ci{ 276562306a36Sopenharmony_ci struct perf_series *ps = arg; 276662306a36Sopenharmony_ci struct i915_request *prev = NULL; 276762306a36Sopenharmony_ci IGT_TIMEOUT(end_time); 276862306a36Sopenharmony_ci unsigned int idx = 0; 276962306a36Sopenharmony_ci int err = 0; 277062306a36Sopenharmony_ci 277162306a36Sopenharmony_ci GEM_BUG_ON(!ps->nengines); 277262306a36Sopenharmony_ci do { 277362306a36Sopenharmony_ci struct i915_request *rq; 277462306a36Sopenharmony_ci 277562306a36Sopenharmony_ci rq = i915_request_create(ps->ce[idx]); 277662306a36Sopenharmony_ci if (IS_ERR(rq)) { 277762306a36Sopenharmony_ci err = PTR_ERR(rq); 277862306a36Sopenharmony_ci break; 277962306a36Sopenharmony_ci } 278062306a36Sopenharmony_ci 278162306a36Sopenharmony_ci i915_request_get(rq); 278262306a36Sopenharmony_ci i915_request_add(rq); 278362306a36Sopenharmony_ci 278462306a36Sopenharmony_ci if (prev && i915_request_wait(prev, 0, HZ / 5) < 0) 278562306a36Sopenharmony_ci err = -ETIME; 278662306a36Sopenharmony_ci i915_request_put(prev); 278762306a36Sopenharmony_ci prev = rq; 278862306a36Sopenharmony_ci if (err) 278962306a36Sopenharmony_ci break; 279062306a36Sopenharmony_ci 279162306a36Sopenharmony_ci if (++idx == ps->nengines) 279262306a36Sopenharmony_ci idx = 0; 279362306a36Sopenharmony_ci } while (!__igt_timeout(end_time, NULL)); 279462306a36Sopenharmony_ci i915_request_put(prev); 279562306a36Sopenharmony_ci 279662306a36Sopenharmony_ci return err; 279762306a36Sopenharmony_ci} 279862306a36Sopenharmony_ci 279962306a36Sopenharmony_cistatic int s_many(void *arg) 280062306a36Sopenharmony_ci{ 280162306a36Sopenharmony_ci struct perf_series *ps = arg; 280262306a36Sopenharmony_ci IGT_TIMEOUT(end_time); 280362306a36Sopenharmony_ci unsigned int idx = 0; 280462306a36Sopenharmony_ci 280562306a36Sopenharmony_ci GEM_BUG_ON(!ps->nengines); 280662306a36Sopenharmony_ci do { 280762306a36Sopenharmony_ci struct i915_request *rq; 280862306a36Sopenharmony_ci 280962306a36Sopenharmony_ci rq = i915_request_create(ps->ce[idx]); 281062306a36Sopenharmony_ci if (IS_ERR(rq)) 281162306a36Sopenharmony_ci return PTR_ERR(rq); 281262306a36Sopenharmony_ci 281362306a36Sopenharmony_ci i915_request_add(rq); 281462306a36Sopenharmony_ci 281562306a36Sopenharmony_ci if (++idx == ps->nengines) 281662306a36Sopenharmony_ci idx = 0; 281762306a36Sopenharmony_ci } while (!__igt_timeout(end_time, NULL)); 281862306a36Sopenharmony_ci 281962306a36Sopenharmony_ci return 0; 282062306a36Sopenharmony_ci} 282162306a36Sopenharmony_ci 282262306a36Sopenharmony_cistatic int perf_series_engines(void *arg) 282362306a36Sopenharmony_ci{ 282462306a36Sopenharmony_ci struct drm_i915_private *i915 = arg; 282562306a36Sopenharmony_ci static int (* const func[])(void *arg) = { 282662306a36Sopenharmony_ci s_sync0, 282762306a36Sopenharmony_ci s_sync1, 282862306a36Sopenharmony_ci s_many, 282962306a36Sopenharmony_ci NULL, 283062306a36Sopenharmony_ci }; 283162306a36Sopenharmony_ci const unsigned int nengines = num_uabi_engines(i915); 283262306a36Sopenharmony_ci struct intel_engine_cs *engine; 283362306a36Sopenharmony_ci int (* const *fn)(void *arg); 283462306a36Sopenharmony_ci struct pm_qos_request qos; 283562306a36Sopenharmony_ci struct perf_stats *stats; 283662306a36Sopenharmony_ci struct perf_series *ps; 283762306a36Sopenharmony_ci unsigned int idx; 283862306a36Sopenharmony_ci int err = 0; 283962306a36Sopenharmony_ci 284062306a36Sopenharmony_ci stats = kcalloc(nengines, sizeof(*stats), GFP_KERNEL); 284162306a36Sopenharmony_ci if (!stats) 284262306a36Sopenharmony_ci return -ENOMEM; 284362306a36Sopenharmony_ci 284462306a36Sopenharmony_ci ps = kzalloc(struct_size(ps, ce, nengines), GFP_KERNEL); 284562306a36Sopenharmony_ci if (!ps) { 284662306a36Sopenharmony_ci kfree(stats); 284762306a36Sopenharmony_ci return -ENOMEM; 284862306a36Sopenharmony_ci } 284962306a36Sopenharmony_ci 285062306a36Sopenharmony_ci cpu_latency_qos_add_request(&qos, 0); /* disable cstates */ 285162306a36Sopenharmony_ci 285262306a36Sopenharmony_ci ps->i915 = i915; 285362306a36Sopenharmony_ci ps->nengines = nengines; 285462306a36Sopenharmony_ci 285562306a36Sopenharmony_ci idx = 0; 285662306a36Sopenharmony_ci for_each_uabi_engine(engine, i915) { 285762306a36Sopenharmony_ci struct intel_context *ce; 285862306a36Sopenharmony_ci 285962306a36Sopenharmony_ci ce = intel_context_create(engine); 286062306a36Sopenharmony_ci if (IS_ERR(ce)) { 286162306a36Sopenharmony_ci err = PTR_ERR(ce); 286262306a36Sopenharmony_ci goto out; 286362306a36Sopenharmony_ci } 286462306a36Sopenharmony_ci 286562306a36Sopenharmony_ci err = intel_context_pin(ce); 286662306a36Sopenharmony_ci if (err) { 286762306a36Sopenharmony_ci intel_context_put(ce); 286862306a36Sopenharmony_ci goto out; 286962306a36Sopenharmony_ci } 287062306a36Sopenharmony_ci 287162306a36Sopenharmony_ci ps->ce[idx++] = ce; 287262306a36Sopenharmony_ci } 287362306a36Sopenharmony_ci GEM_BUG_ON(idx != ps->nengines); 287462306a36Sopenharmony_ci 287562306a36Sopenharmony_ci for (fn = func; *fn && !err; fn++) { 287662306a36Sopenharmony_ci char name[KSYM_NAME_LEN]; 287762306a36Sopenharmony_ci struct igt_live_test t; 287862306a36Sopenharmony_ci 287962306a36Sopenharmony_ci snprintf(name, sizeof(name), "%ps", *fn); 288062306a36Sopenharmony_ci err = igt_live_test_begin(&t, i915, __func__, name); 288162306a36Sopenharmony_ci if (err) 288262306a36Sopenharmony_ci break; 288362306a36Sopenharmony_ci 288462306a36Sopenharmony_ci for (idx = 0; idx < nengines; idx++) { 288562306a36Sopenharmony_ci struct perf_stats *p = 288662306a36Sopenharmony_ci memset(&stats[idx], 0, sizeof(stats[idx])); 288762306a36Sopenharmony_ci struct intel_context *ce = ps->ce[idx]; 288862306a36Sopenharmony_ci 288962306a36Sopenharmony_ci p->engine = ps->ce[idx]->engine; 289062306a36Sopenharmony_ci intel_engine_pm_get(p->engine); 289162306a36Sopenharmony_ci 289262306a36Sopenharmony_ci if (intel_engine_supports_stats(p->engine)) 289362306a36Sopenharmony_ci p->busy = intel_engine_get_busy_time(p->engine, 289462306a36Sopenharmony_ci &p->time) + 1; 289562306a36Sopenharmony_ci else 289662306a36Sopenharmony_ci p->time = ktime_get(); 289762306a36Sopenharmony_ci p->runtime = -intel_context_get_total_runtime_ns(ce); 289862306a36Sopenharmony_ci } 289962306a36Sopenharmony_ci 290062306a36Sopenharmony_ci err = (*fn)(ps); 290162306a36Sopenharmony_ci if (igt_live_test_end(&t)) 290262306a36Sopenharmony_ci err = -EIO; 290362306a36Sopenharmony_ci 290462306a36Sopenharmony_ci for (idx = 0; idx < nengines; idx++) { 290562306a36Sopenharmony_ci struct perf_stats *p = &stats[idx]; 290662306a36Sopenharmony_ci struct intel_context *ce = ps->ce[idx]; 290762306a36Sopenharmony_ci int integer, decimal; 290862306a36Sopenharmony_ci u64 busy, dt, now; 290962306a36Sopenharmony_ci 291062306a36Sopenharmony_ci if (p->busy) 291162306a36Sopenharmony_ci p->busy = ktime_sub(intel_engine_get_busy_time(p->engine, 291262306a36Sopenharmony_ci &now), 291362306a36Sopenharmony_ci p->busy - 1); 291462306a36Sopenharmony_ci else 291562306a36Sopenharmony_ci now = ktime_get(); 291662306a36Sopenharmony_ci p->time = ktime_sub(now, p->time); 291762306a36Sopenharmony_ci 291862306a36Sopenharmony_ci err = switch_to_kernel_sync(ce, err); 291962306a36Sopenharmony_ci p->runtime += intel_context_get_total_runtime_ns(ce); 292062306a36Sopenharmony_ci intel_engine_pm_put(p->engine); 292162306a36Sopenharmony_ci 292262306a36Sopenharmony_ci busy = 100 * ktime_to_ns(p->busy); 292362306a36Sopenharmony_ci dt = ktime_to_ns(p->time); 292462306a36Sopenharmony_ci if (dt) { 292562306a36Sopenharmony_ci integer = div64_u64(busy, dt); 292662306a36Sopenharmony_ci busy -= integer * dt; 292762306a36Sopenharmony_ci decimal = div64_u64(100 * busy, dt); 292862306a36Sopenharmony_ci } else { 292962306a36Sopenharmony_ci integer = 0; 293062306a36Sopenharmony_ci decimal = 0; 293162306a36Sopenharmony_ci } 293262306a36Sopenharmony_ci 293362306a36Sopenharmony_ci pr_info("%s %5s: { seqno:%d, busy:%d.%02d%%, runtime:%lldms, walltime:%lldms }\n", 293462306a36Sopenharmony_ci name, p->engine->name, ce->timeline->seqno, 293562306a36Sopenharmony_ci integer, decimal, 293662306a36Sopenharmony_ci div_u64(p->runtime, 1000 * 1000), 293762306a36Sopenharmony_ci div_u64(ktime_to_ns(p->time), 1000 * 1000)); 293862306a36Sopenharmony_ci } 293962306a36Sopenharmony_ci } 294062306a36Sopenharmony_ci 294162306a36Sopenharmony_ciout: 294262306a36Sopenharmony_ci for (idx = 0; idx < nengines; idx++) { 294362306a36Sopenharmony_ci if (IS_ERR_OR_NULL(ps->ce[idx])) 294462306a36Sopenharmony_ci break; 294562306a36Sopenharmony_ci 294662306a36Sopenharmony_ci intel_context_unpin(ps->ce[idx]); 294762306a36Sopenharmony_ci intel_context_put(ps->ce[idx]); 294862306a36Sopenharmony_ci } 294962306a36Sopenharmony_ci kfree(ps); 295062306a36Sopenharmony_ci 295162306a36Sopenharmony_ci cpu_latency_qos_remove_request(&qos); 295262306a36Sopenharmony_ci kfree(stats); 295362306a36Sopenharmony_ci return err; 295462306a36Sopenharmony_ci} 295562306a36Sopenharmony_ci 295662306a36Sopenharmony_cistruct p_thread { 295762306a36Sopenharmony_ci struct perf_stats p; 295862306a36Sopenharmony_ci struct kthread_worker *worker; 295962306a36Sopenharmony_ci struct kthread_work work; 296062306a36Sopenharmony_ci struct intel_engine_cs *engine; 296162306a36Sopenharmony_ci int result; 296262306a36Sopenharmony_ci}; 296362306a36Sopenharmony_ci 296462306a36Sopenharmony_cistatic void p_sync0(struct kthread_work *work) 296562306a36Sopenharmony_ci{ 296662306a36Sopenharmony_ci struct p_thread *thread = container_of(work, typeof(*thread), work); 296762306a36Sopenharmony_ci struct perf_stats *p = &thread->p; 296862306a36Sopenharmony_ci struct intel_engine_cs *engine = p->engine; 296962306a36Sopenharmony_ci struct intel_context *ce; 297062306a36Sopenharmony_ci IGT_TIMEOUT(end_time); 297162306a36Sopenharmony_ci unsigned long count; 297262306a36Sopenharmony_ci bool busy; 297362306a36Sopenharmony_ci int err = 0; 297462306a36Sopenharmony_ci 297562306a36Sopenharmony_ci ce = intel_context_create(engine); 297662306a36Sopenharmony_ci if (IS_ERR(ce)) { 297762306a36Sopenharmony_ci thread->result = PTR_ERR(ce); 297862306a36Sopenharmony_ci return; 297962306a36Sopenharmony_ci } 298062306a36Sopenharmony_ci 298162306a36Sopenharmony_ci err = intel_context_pin(ce); 298262306a36Sopenharmony_ci if (err) { 298362306a36Sopenharmony_ci intel_context_put(ce); 298462306a36Sopenharmony_ci thread->result = err; 298562306a36Sopenharmony_ci return; 298662306a36Sopenharmony_ci } 298762306a36Sopenharmony_ci 298862306a36Sopenharmony_ci if (intel_engine_supports_stats(engine)) { 298962306a36Sopenharmony_ci p->busy = intel_engine_get_busy_time(engine, &p->time); 299062306a36Sopenharmony_ci busy = true; 299162306a36Sopenharmony_ci } else { 299262306a36Sopenharmony_ci p->time = ktime_get(); 299362306a36Sopenharmony_ci busy = false; 299462306a36Sopenharmony_ci } 299562306a36Sopenharmony_ci 299662306a36Sopenharmony_ci count = 0; 299762306a36Sopenharmony_ci do { 299862306a36Sopenharmony_ci struct i915_request *rq; 299962306a36Sopenharmony_ci 300062306a36Sopenharmony_ci rq = i915_request_create(ce); 300162306a36Sopenharmony_ci if (IS_ERR(rq)) { 300262306a36Sopenharmony_ci err = PTR_ERR(rq); 300362306a36Sopenharmony_ci break; 300462306a36Sopenharmony_ci } 300562306a36Sopenharmony_ci 300662306a36Sopenharmony_ci i915_request_get(rq); 300762306a36Sopenharmony_ci i915_request_add(rq); 300862306a36Sopenharmony_ci 300962306a36Sopenharmony_ci err = 0; 301062306a36Sopenharmony_ci if (i915_request_wait(rq, 0, HZ) < 0) 301162306a36Sopenharmony_ci err = -ETIME; 301262306a36Sopenharmony_ci i915_request_put(rq); 301362306a36Sopenharmony_ci if (err) 301462306a36Sopenharmony_ci break; 301562306a36Sopenharmony_ci 301662306a36Sopenharmony_ci count++; 301762306a36Sopenharmony_ci } while (!__igt_timeout(end_time, NULL)); 301862306a36Sopenharmony_ci 301962306a36Sopenharmony_ci if (busy) { 302062306a36Sopenharmony_ci ktime_t now; 302162306a36Sopenharmony_ci 302262306a36Sopenharmony_ci p->busy = ktime_sub(intel_engine_get_busy_time(engine, &now), 302362306a36Sopenharmony_ci p->busy); 302462306a36Sopenharmony_ci p->time = ktime_sub(now, p->time); 302562306a36Sopenharmony_ci } else { 302662306a36Sopenharmony_ci p->time = ktime_sub(ktime_get(), p->time); 302762306a36Sopenharmony_ci } 302862306a36Sopenharmony_ci 302962306a36Sopenharmony_ci err = switch_to_kernel_sync(ce, err); 303062306a36Sopenharmony_ci p->runtime = intel_context_get_total_runtime_ns(ce); 303162306a36Sopenharmony_ci p->count = count; 303262306a36Sopenharmony_ci 303362306a36Sopenharmony_ci intel_context_unpin(ce); 303462306a36Sopenharmony_ci intel_context_put(ce); 303562306a36Sopenharmony_ci thread->result = err; 303662306a36Sopenharmony_ci} 303762306a36Sopenharmony_ci 303862306a36Sopenharmony_cistatic void p_sync1(struct kthread_work *work) 303962306a36Sopenharmony_ci{ 304062306a36Sopenharmony_ci struct p_thread *thread = container_of(work, typeof(*thread), work); 304162306a36Sopenharmony_ci struct perf_stats *p = &thread->p; 304262306a36Sopenharmony_ci struct intel_engine_cs *engine = p->engine; 304362306a36Sopenharmony_ci struct i915_request *prev = NULL; 304462306a36Sopenharmony_ci struct intel_context *ce; 304562306a36Sopenharmony_ci IGT_TIMEOUT(end_time); 304662306a36Sopenharmony_ci unsigned long count; 304762306a36Sopenharmony_ci bool busy; 304862306a36Sopenharmony_ci int err = 0; 304962306a36Sopenharmony_ci 305062306a36Sopenharmony_ci ce = intel_context_create(engine); 305162306a36Sopenharmony_ci if (IS_ERR(ce)) { 305262306a36Sopenharmony_ci thread->result = PTR_ERR(ce); 305362306a36Sopenharmony_ci return; 305462306a36Sopenharmony_ci } 305562306a36Sopenharmony_ci 305662306a36Sopenharmony_ci err = intel_context_pin(ce); 305762306a36Sopenharmony_ci if (err) { 305862306a36Sopenharmony_ci intel_context_put(ce); 305962306a36Sopenharmony_ci thread->result = err; 306062306a36Sopenharmony_ci return; 306162306a36Sopenharmony_ci } 306262306a36Sopenharmony_ci 306362306a36Sopenharmony_ci if (intel_engine_supports_stats(engine)) { 306462306a36Sopenharmony_ci p->busy = intel_engine_get_busy_time(engine, &p->time); 306562306a36Sopenharmony_ci busy = true; 306662306a36Sopenharmony_ci } else { 306762306a36Sopenharmony_ci p->time = ktime_get(); 306862306a36Sopenharmony_ci busy = false; 306962306a36Sopenharmony_ci } 307062306a36Sopenharmony_ci 307162306a36Sopenharmony_ci count = 0; 307262306a36Sopenharmony_ci do { 307362306a36Sopenharmony_ci struct i915_request *rq; 307462306a36Sopenharmony_ci 307562306a36Sopenharmony_ci rq = i915_request_create(ce); 307662306a36Sopenharmony_ci if (IS_ERR(rq)) { 307762306a36Sopenharmony_ci err = PTR_ERR(rq); 307862306a36Sopenharmony_ci break; 307962306a36Sopenharmony_ci } 308062306a36Sopenharmony_ci 308162306a36Sopenharmony_ci i915_request_get(rq); 308262306a36Sopenharmony_ci i915_request_add(rq); 308362306a36Sopenharmony_ci 308462306a36Sopenharmony_ci err = 0; 308562306a36Sopenharmony_ci if (prev && i915_request_wait(prev, 0, HZ) < 0) 308662306a36Sopenharmony_ci err = -ETIME; 308762306a36Sopenharmony_ci i915_request_put(prev); 308862306a36Sopenharmony_ci prev = rq; 308962306a36Sopenharmony_ci if (err) 309062306a36Sopenharmony_ci break; 309162306a36Sopenharmony_ci 309262306a36Sopenharmony_ci count++; 309362306a36Sopenharmony_ci } while (!__igt_timeout(end_time, NULL)); 309462306a36Sopenharmony_ci i915_request_put(prev); 309562306a36Sopenharmony_ci 309662306a36Sopenharmony_ci if (busy) { 309762306a36Sopenharmony_ci ktime_t now; 309862306a36Sopenharmony_ci 309962306a36Sopenharmony_ci p->busy = ktime_sub(intel_engine_get_busy_time(engine, &now), 310062306a36Sopenharmony_ci p->busy); 310162306a36Sopenharmony_ci p->time = ktime_sub(now, p->time); 310262306a36Sopenharmony_ci } else { 310362306a36Sopenharmony_ci p->time = ktime_sub(ktime_get(), p->time); 310462306a36Sopenharmony_ci } 310562306a36Sopenharmony_ci 310662306a36Sopenharmony_ci err = switch_to_kernel_sync(ce, err); 310762306a36Sopenharmony_ci p->runtime = intel_context_get_total_runtime_ns(ce); 310862306a36Sopenharmony_ci p->count = count; 310962306a36Sopenharmony_ci 311062306a36Sopenharmony_ci intel_context_unpin(ce); 311162306a36Sopenharmony_ci intel_context_put(ce); 311262306a36Sopenharmony_ci thread->result = err; 311362306a36Sopenharmony_ci} 311462306a36Sopenharmony_ci 311562306a36Sopenharmony_cistatic void p_many(struct kthread_work *work) 311662306a36Sopenharmony_ci{ 311762306a36Sopenharmony_ci struct p_thread *thread = container_of(work, typeof(*thread), work); 311862306a36Sopenharmony_ci struct perf_stats *p = &thread->p; 311962306a36Sopenharmony_ci struct intel_engine_cs *engine = p->engine; 312062306a36Sopenharmony_ci struct intel_context *ce; 312162306a36Sopenharmony_ci IGT_TIMEOUT(end_time); 312262306a36Sopenharmony_ci unsigned long count; 312362306a36Sopenharmony_ci int err = 0; 312462306a36Sopenharmony_ci bool busy; 312562306a36Sopenharmony_ci 312662306a36Sopenharmony_ci ce = intel_context_create(engine); 312762306a36Sopenharmony_ci if (IS_ERR(ce)) { 312862306a36Sopenharmony_ci thread->result = PTR_ERR(ce); 312962306a36Sopenharmony_ci return; 313062306a36Sopenharmony_ci } 313162306a36Sopenharmony_ci 313262306a36Sopenharmony_ci err = intel_context_pin(ce); 313362306a36Sopenharmony_ci if (err) { 313462306a36Sopenharmony_ci intel_context_put(ce); 313562306a36Sopenharmony_ci thread->result = err; 313662306a36Sopenharmony_ci return; 313762306a36Sopenharmony_ci } 313862306a36Sopenharmony_ci 313962306a36Sopenharmony_ci if (intel_engine_supports_stats(engine)) { 314062306a36Sopenharmony_ci p->busy = intel_engine_get_busy_time(engine, &p->time); 314162306a36Sopenharmony_ci busy = true; 314262306a36Sopenharmony_ci } else { 314362306a36Sopenharmony_ci p->time = ktime_get(); 314462306a36Sopenharmony_ci busy = false; 314562306a36Sopenharmony_ci } 314662306a36Sopenharmony_ci 314762306a36Sopenharmony_ci count = 0; 314862306a36Sopenharmony_ci do { 314962306a36Sopenharmony_ci struct i915_request *rq; 315062306a36Sopenharmony_ci 315162306a36Sopenharmony_ci rq = i915_request_create(ce); 315262306a36Sopenharmony_ci if (IS_ERR(rq)) { 315362306a36Sopenharmony_ci err = PTR_ERR(rq); 315462306a36Sopenharmony_ci break; 315562306a36Sopenharmony_ci } 315662306a36Sopenharmony_ci 315762306a36Sopenharmony_ci i915_request_add(rq); 315862306a36Sopenharmony_ci count++; 315962306a36Sopenharmony_ci } while (!__igt_timeout(end_time, NULL)); 316062306a36Sopenharmony_ci 316162306a36Sopenharmony_ci if (busy) { 316262306a36Sopenharmony_ci ktime_t now; 316362306a36Sopenharmony_ci 316462306a36Sopenharmony_ci p->busy = ktime_sub(intel_engine_get_busy_time(engine, &now), 316562306a36Sopenharmony_ci p->busy); 316662306a36Sopenharmony_ci p->time = ktime_sub(now, p->time); 316762306a36Sopenharmony_ci } else { 316862306a36Sopenharmony_ci p->time = ktime_sub(ktime_get(), p->time); 316962306a36Sopenharmony_ci } 317062306a36Sopenharmony_ci 317162306a36Sopenharmony_ci err = switch_to_kernel_sync(ce, err); 317262306a36Sopenharmony_ci p->runtime = intel_context_get_total_runtime_ns(ce); 317362306a36Sopenharmony_ci p->count = count; 317462306a36Sopenharmony_ci 317562306a36Sopenharmony_ci intel_context_unpin(ce); 317662306a36Sopenharmony_ci intel_context_put(ce); 317762306a36Sopenharmony_ci thread->result = err; 317862306a36Sopenharmony_ci} 317962306a36Sopenharmony_ci 318062306a36Sopenharmony_cistatic int perf_parallel_engines(void *arg) 318162306a36Sopenharmony_ci{ 318262306a36Sopenharmony_ci struct drm_i915_private *i915 = arg; 318362306a36Sopenharmony_ci static void (* const func[])(struct kthread_work *) = { 318462306a36Sopenharmony_ci p_sync0, 318562306a36Sopenharmony_ci p_sync1, 318662306a36Sopenharmony_ci p_many, 318762306a36Sopenharmony_ci NULL, 318862306a36Sopenharmony_ci }; 318962306a36Sopenharmony_ci const unsigned int nengines = num_uabi_engines(i915); 319062306a36Sopenharmony_ci void (* const *fn)(struct kthread_work *); 319162306a36Sopenharmony_ci struct intel_engine_cs *engine; 319262306a36Sopenharmony_ci struct pm_qos_request qos; 319362306a36Sopenharmony_ci struct p_thread *engines; 319462306a36Sopenharmony_ci int err = 0; 319562306a36Sopenharmony_ci 319662306a36Sopenharmony_ci engines = kcalloc(nengines, sizeof(*engines), GFP_KERNEL); 319762306a36Sopenharmony_ci if (!engines) 319862306a36Sopenharmony_ci return -ENOMEM; 319962306a36Sopenharmony_ci 320062306a36Sopenharmony_ci cpu_latency_qos_add_request(&qos, 0); 320162306a36Sopenharmony_ci 320262306a36Sopenharmony_ci for (fn = func; *fn; fn++) { 320362306a36Sopenharmony_ci char name[KSYM_NAME_LEN]; 320462306a36Sopenharmony_ci struct igt_live_test t; 320562306a36Sopenharmony_ci unsigned int idx; 320662306a36Sopenharmony_ci 320762306a36Sopenharmony_ci snprintf(name, sizeof(name), "%ps", *fn); 320862306a36Sopenharmony_ci err = igt_live_test_begin(&t, i915, __func__, name); 320962306a36Sopenharmony_ci if (err) 321062306a36Sopenharmony_ci break; 321162306a36Sopenharmony_ci 321262306a36Sopenharmony_ci atomic_set(&i915->selftest.counter, nengines); 321362306a36Sopenharmony_ci 321462306a36Sopenharmony_ci idx = 0; 321562306a36Sopenharmony_ci for_each_uabi_engine(engine, i915) { 321662306a36Sopenharmony_ci struct kthread_worker *worker; 321762306a36Sopenharmony_ci 321862306a36Sopenharmony_ci intel_engine_pm_get(engine); 321962306a36Sopenharmony_ci 322062306a36Sopenharmony_ci memset(&engines[idx].p, 0, sizeof(engines[idx].p)); 322162306a36Sopenharmony_ci 322262306a36Sopenharmony_ci worker = kthread_create_worker(0, "igt:%s", 322362306a36Sopenharmony_ci engine->name); 322462306a36Sopenharmony_ci if (IS_ERR(worker)) { 322562306a36Sopenharmony_ci err = PTR_ERR(worker); 322662306a36Sopenharmony_ci intel_engine_pm_put(engine); 322762306a36Sopenharmony_ci break; 322862306a36Sopenharmony_ci } 322962306a36Sopenharmony_ci engines[idx].worker = worker; 323062306a36Sopenharmony_ci engines[idx].result = 0; 323162306a36Sopenharmony_ci engines[idx].p.engine = engine; 323262306a36Sopenharmony_ci engines[idx].engine = engine; 323362306a36Sopenharmony_ci 323462306a36Sopenharmony_ci kthread_init_work(&engines[idx].work, *fn); 323562306a36Sopenharmony_ci kthread_queue_work(worker, &engines[idx].work); 323662306a36Sopenharmony_ci idx++; 323762306a36Sopenharmony_ci } 323862306a36Sopenharmony_ci 323962306a36Sopenharmony_ci idx = 0; 324062306a36Sopenharmony_ci for_each_uabi_engine(engine, i915) { 324162306a36Sopenharmony_ci int status; 324262306a36Sopenharmony_ci 324362306a36Sopenharmony_ci if (!engines[idx].worker) 324462306a36Sopenharmony_ci break; 324562306a36Sopenharmony_ci 324662306a36Sopenharmony_ci kthread_flush_work(&engines[idx].work); 324762306a36Sopenharmony_ci status = READ_ONCE(engines[idx].result); 324862306a36Sopenharmony_ci if (status && !err) 324962306a36Sopenharmony_ci err = status; 325062306a36Sopenharmony_ci 325162306a36Sopenharmony_ci intel_engine_pm_put(engine); 325262306a36Sopenharmony_ci 325362306a36Sopenharmony_ci kthread_destroy_worker(engines[idx].worker); 325462306a36Sopenharmony_ci idx++; 325562306a36Sopenharmony_ci } 325662306a36Sopenharmony_ci 325762306a36Sopenharmony_ci if (igt_live_test_end(&t)) 325862306a36Sopenharmony_ci err = -EIO; 325962306a36Sopenharmony_ci if (err) 326062306a36Sopenharmony_ci break; 326162306a36Sopenharmony_ci 326262306a36Sopenharmony_ci idx = 0; 326362306a36Sopenharmony_ci for_each_uabi_engine(engine, i915) { 326462306a36Sopenharmony_ci struct perf_stats *p = &engines[idx].p; 326562306a36Sopenharmony_ci u64 busy = 100 * ktime_to_ns(p->busy); 326662306a36Sopenharmony_ci u64 dt = ktime_to_ns(p->time); 326762306a36Sopenharmony_ci int integer, decimal; 326862306a36Sopenharmony_ci 326962306a36Sopenharmony_ci if (dt) { 327062306a36Sopenharmony_ci integer = div64_u64(busy, dt); 327162306a36Sopenharmony_ci busy -= integer * dt; 327262306a36Sopenharmony_ci decimal = div64_u64(100 * busy, dt); 327362306a36Sopenharmony_ci } else { 327462306a36Sopenharmony_ci integer = 0; 327562306a36Sopenharmony_ci decimal = 0; 327662306a36Sopenharmony_ci } 327762306a36Sopenharmony_ci 327862306a36Sopenharmony_ci GEM_BUG_ON(engine != p->engine); 327962306a36Sopenharmony_ci pr_info("%s %5s: { count:%lu, busy:%d.%02d%%, runtime:%lldms, walltime:%lldms }\n", 328062306a36Sopenharmony_ci name, engine->name, p->count, integer, decimal, 328162306a36Sopenharmony_ci div_u64(p->runtime, 1000 * 1000), 328262306a36Sopenharmony_ci div_u64(ktime_to_ns(p->time), 1000 * 1000)); 328362306a36Sopenharmony_ci idx++; 328462306a36Sopenharmony_ci } 328562306a36Sopenharmony_ci } 328662306a36Sopenharmony_ci 328762306a36Sopenharmony_ci cpu_latency_qos_remove_request(&qos); 328862306a36Sopenharmony_ci kfree(engines); 328962306a36Sopenharmony_ci return err; 329062306a36Sopenharmony_ci} 329162306a36Sopenharmony_ci 329262306a36Sopenharmony_ciint i915_request_perf_selftests(struct drm_i915_private *i915) 329362306a36Sopenharmony_ci{ 329462306a36Sopenharmony_ci static const struct i915_subtest tests[] = { 329562306a36Sopenharmony_ci SUBTEST(perf_request_latency), 329662306a36Sopenharmony_ci SUBTEST(perf_series_engines), 329762306a36Sopenharmony_ci SUBTEST(perf_parallel_engines), 329862306a36Sopenharmony_ci }; 329962306a36Sopenharmony_ci 330062306a36Sopenharmony_ci if (intel_gt_is_wedged(to_gt(i915))) 330162306a36Sopenharmony_ci return 0; 330262306a36Sopenharmony_ci 330362306a36Sopenharmony_ci return i915_subtests(tests, i915); 330462306a36Sopenharmony_ci} 3305