162306a36Sopenharmony_ci/*
262306a36Sopenharmony_ci * Copyright © 2016 Intel Corporation
362306a36Sopenharmony_ci *
462306a36Sopenharmony_ci * Permission is hereby granted, free of charge, to any person obtaining a
562306a36Sopenharmony_ci * copy of this software and associated documentation files (the "Software"),
662306a36Sopenharmony_ci * to deal in the Software without restriction, including without limitation
762306a36Sopenharmony_ci * the rights to use, copy, modify, merge, publish, distribute, sublicense,
862306a36Sopenharmony_ci * and/or sell copies of the Software, and to permit persons to whom the
962306a36Sopenharmony_ci * Software is furnished to do so, subject to the following conditions:
1062306a36Sopenharmony_ci *
1162306a36Sopenharmony_ci * The above copyright notice and this permission notice (including the next
1262306a36Sopenharmony_ci * paragraph) shall be included in all copies or substantial portions of the
1362306a36Sopenharmony_ci * Software.
1462306a36Sopenharmony_ci *
1562306a36Sopenharmony_ci * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
1662306a36Sopenharmony_ci * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
1762306a36Sopenharmony_ci * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT.  IN NO EVENT SHALL
1862306a36Sopenharmony_ci * THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
1962306a36Sopenharmony_ci * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING
2062306a36Sopenharmony_ci * FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS
2162306a36Sopenharmony_ci * IN THE SOFTWARE.
2262306a36Sopenharmony_ci *
2362306a36Sopenharmony_ci */
2462306a36Sopenharmony_ci
2562306a36Sopenharmony_ci#include <linux/prime_numbers.h>
2662306a36Sopenharmony_ci#include <linux/pm_qos.h>
2762306a36Sopenharmony_ci#include <linux/sort.h>
2862306a36Sopenharmony_ci
2962306a36Sopenharmony_ci#include "gem/i915_gem_internal.h"
3062306a36Sopenharmony_ci#include "gem/i915_gem_pm.h"
3162306a36Sopenharmony_ci#include "gem/selftests/mock_context.h"
3262306a36Sopenharmony_ci
3362306a36Sopenharmony_ci#include "gt/intel_engine_heartbeat.h"
3462306a36Sopenharmony_ci#include "gt/intel_engine_pm.h"
3562306a36Sopenharmony_ci#include "gt/intel_engine_user.h"
3662306a36Sopenharmony_ci#include "gt/intel_gt.h"
3762306a36Sopenharmony_ci#include "gt/intel_gt_clock_utils.h"
3862306a36Sopenharmony_ci#include "gt/intel_gt_requests.h"
3962306a36Sopenharmony_ci#include "gt/selftest_engine_heartbeat.h"
4062306a36Sopenharmony_ci
4162306a36Sopenharmony_ci#include "i915_random.h"
4262306a36Sopenharmony_ci#include "i915_selftest.h"
4362306a36Sopenharmony_ci#include "igt_flush_test.h"
4462306a36Sopenharmony_ci#include "igt_live_test.h"
4562306a36Sopenharmony_ci#include "igt_spinner.h"
4662306a36Sopenharmony_ci#include "lib_sw_fence.h"
4762306a36Sopenharmony_ci
4862306a36Sopenharmony_ci#include "mock_drm.h"
4962306a36Sopenharmony_ci#include "mock_gem_device.h"
5062306a36Sopenharmony_ci
5162306a36Sopenharmony_cistatic unsigned int num_uabi_engines(struct drm_i915_private *i915)
5262306a36Sopenharmony_ci{
5362306a36Sopenharmony_ci	struct intel_engine_cs *engine;
5462306a36Sopenharmony_ci	unsigned int count;
5562306a36Sopenharmony_ci
5662306a36Sopenharmony_ci	count = 0;
5762306a36Sopenharmony_ci	for_each_uabi_engine(engine, i915)
5862306a36Sopenharmony_ci		count++;
5962306a36Sopenharmony_ci
6062306a36Sopenharmony_ci	return count;
6162306a36Sopenharmony_ci}
6262306a36Sopenharmony_ci
6362306a36Sopenharmony_cistatic struct intel_engine_cs *rcs0(struct drm_i915_private *i915)
6462306a36Sopenharmony_ci{
6562306a36Sopenharmony_ci	return intel_engine_lookup_user(i915, I915_ENGINE_CLASS_RENDER, 0);
6662306a36Sopenharmony_ci}
6762306a36Sopenharmony_ci
6862306a36Sopenharmony_cistatic int igt_add_request(void *arg)
6962306a36Sopenharmony_ci{
7062306a36Sopenharmony_ci	struct drm_i915_private *i915 = arg;
7162306a36Sopenharmony_ci	struct i915_request *request;
7262306a36Sopenharmony_ci
7362306a36Sopenharmony_ci	/* Basic preliminary test to create a request and let it loose! */
7462306a36Sopenharmony_ci
7562306a36Sopenharmony_ci	request = mock_request(rcs0(i915)->kernel_context, HZ / 10);
7662306a36Sopenharmony_ci	if (!request)
7762306a36Sopenharmony_ci		return -ENOMEM;
7862306a36Sopenharmony_ci
7962306a36Sopenharmony_ci	i915_request_add(request);
8062306a36Sopenharmony_ci
8162306a36Sopenharmony_ci	return 0;
8262306a36Sopenharmony_ci}
8362306a36Sopenharmony_ci
8462306a36Sopenharmony_cistatic int igt_wait_request(void *arg)
8562306a36Sopenharmony_ci{
8662306a36Sopenharmony_ci	const long T = HZ / 4;
8762306a36Sopenharmony_ci	struct drm_i915_private *i915 = arg;
8862306a36Sopenharmony_ci	struct i915_request *request;
8962306a36Sopenharmony_ci	int err = -EINVAL;
9062306a36Sopenharmony_ci
9162306a36Sopenharmony_ci	/* Submit a request, then wait upon it */
9262306a36Sopenharmony_ci
9362306a36Sopenharmony_ci	request = mock_request(rcs0(i915)->kernel_context, T);
9462306a36Sopenharmony_ci	if (!request)
9562306a36Sopenharmony_ci		return -ENOMEM;
9662306a36Sopenharmony_ci
9762306a36Sopenharmony_ci	i915_request_get(request);
9862306a36Sopenharmony_ci
9962306a36Sopenharmony_ci	if (i915_request_wait(request, 0, 0) != -ETIME) {
10062306a36Sopenharmony_ci		pr_err("request wait (busy query) succeeded (expected timeout before submit!)\n");
10162306a36Sopenharmony_ci		goto out_request;
10262306a36Sopenharmony_ci	}
10362306a36Sopenharmony_ci
10462306a36Sopenharmony_ci	if (i915_request_wait(request, 0, T) != -ETIME) {
10562306a36Sopenharmony_ci		pr_err("request wait succeeded (expected timeout before submit!)\n");
10662306a36Sopenharmony_ci		goto out_request;
10762306a36Sopenharmony_ci	}
10862306a36Sopenharmony_ci
10962306a36Sopenharmony_ci	if (i915_request_completed(request)) {
11062306a36Sopenharmony_ci		pr_err("request completed before submit!!\n");
11162306a36Sopenharmony_ci		goto out_request;
11262306a36Sopenharmony_ci	}
11362306a36Sopenharmony_ci
11462306a36Sopenharmony_ci	i915_request_add(request);
11562306a36Sopenharmony_ci
11662306a36Sopenharmony_ci	if (i915_request_wait(request, 0, 0) != -ETIME) {
11762306a36Sopenharmony_ci		pr_err("request wait (busy query) succeeded (expected timeout after submit!)\n");
11862306a36Sopenharmony_ci		goto out_request;
11962306a36Sopenharmony_ci	}
12062306a36Sopenharmony_ci
12162306a36Sopenharmony_ci	if (i915_request_completed(request)) {
12262306a36Sopenharmony_ci		pr_err("request completed immediately!\n");
12362306a36Sopenharmony_ci		goto out_request;
12462306a36Sopenharmony_ci	}
12562306a36Sopenharmony_ci
12662306a36Sopenharmony_ci	if (i915_request_wait(request, 0, T / 2) != -ETIME) {
12762306a36Sopenharmony_ci		pr_err("request wait succeeded (expected timeout!)\n");
12862306a36Sopenharmony_ci		goto out_request;
12962306a36Sopenharmony_ci	}
13062306a36Sopenharmony_ci
13162306a36Sopenharmony_ci	if (i915_request_wait(request, 0, T) == -ETIME) {
13262306a36Sopenharmony_ci		pr_err("request wait timed out!\n");
13362306a36Sopenharmony_ci		goto out_request;
13462306a36Sopenharmony_ci	}
13562306a36Sopenharmony_ci
13662306a36Sopenharmony_ci	if (!i915_request_completed(request)) {
13762306a36Sopenharmony_ci		pr_err("request not complete after waiting!\n");
13862306a36Sopenharmony_ci		goto out_request;
13962306a36Sopenharmony_ci	}
14062306a36Sopenharmony_ci
14162306a36Sopenharmony_ci	if (i915_request_wait(request, 0, T) == -ETIME) {
14262306a36Sopenharmony_ci		pr_err("request wait timed out when already complete!\n");
14362306a36Sopenharmony_ci		goto out_request;
14462306a36Sopenharmony_ci	}
14562306a36Sopenharmony_ci
14662306a36Sopenharmony_ci	err = 0;
14762306a36Sopenharmony_ciout_request:
14862306a36Sopenharmony_ci	i915_request_put(request);
14962306a36Sopenharmony_ci	mock_device_flush(i915);
15062306a36Sopenharmony_ci	return err;
15162306a36Sopenharmony_ci}
15262306a36Sopenharmony_ci
15362306a36Sopenharmony_cistatic int igt_fence_wait(void *arg)
15462306a36Sopenharmony_ci{
15562306a36Sopenharmony_ci	const long T = HZ / 4;
15662306a36Sopenharmony_ci	struct drm_i915_private *i915 = arg;
15762306a36Sopenharmony_ci	struct i915_request *request;
15862306a36Sopenharmony_ci	int err = -EINVAL;
15962306a36Sopenharmony_ci
16062306a36Sopenharmony_ci	/* Submit a request, treat it as a fence and wait upon it */
16162306a36Sopenharmony_ci
16262306a36Sopenharmony_ci	request = mock_request(rcs0(i915)->kernel_context, T);
16362306a36Sopenharmony_ci	if (!request)
16462306a36Sopenharmony_ci		return -ENOMEM;
16562306a36Sopenharmony_ci
16662306a36Sopenharmony_ci	if (dma_fence_wait_timeout(&request->fence, false, T) != -ETIME) {
16762306a36Sopenharmony_ci		pr_err("fence wait success before submit (expected timeout)!\n");
16862306a36Sopenharmony_ci		goto out;
16962306a36Sopenharmony_ci	}
17062306a36Sopenharmony_ci
17162306a36Sopenharmony_ci	i915_request_add(request);
17262306a36Sopenharmony_ci
17362306a36Sopenharmony_ci	if (dma_fence_is_signaled(&request->fence)) {
17462306a36Sopenharmony_ci		pr_err("fence signaled immediately!\n");
17562306a36Sopenharmony_ci		goto out;
17662306a36Sopenharmony_ci	}
17762306a36Sopenharmony_ci
17862306a36Sopenharmony_ci	if (dma_fence_wait_timeout(&request->fence, false, T / 2) != -ETIME) {
17962306a36Sopenharmony_ci		pr_err("fence wait success after submit (expected timeout)!\n");
18062306a36Sopenharmony_ci		goto out;
18162306a36Sopenharmony_ci	}
18262306a36Sopenharmony_ci
18362306a36Sopenharmony_ci	if (dma_fence_wait_timeout(&request->fence, false, T) <= 0) {
18462306a36Sopenharmony_ci		pr_err("fence wait timed out (expected success)!\n");
18562306a36Sopenharmony_ci		goto out;
18662306a36Sopenharmony_ci	}
18762306a36Sopenharmony_ci
18862306a36Sopenharmony_ci	if (!dma_fence_is_signaled(&request->fence)) {
18962306a36Sopenharmony_ci		pr_err("fence unsignaled after waiting!\n");
19062306a36Sopenharmony_ci		goto out;
19162306a36Sopenharmony_ci	}
19262306a36Sopenharmony_ci
19362306a36Sopenharmony_ci	if (dma_fence_wait_timeout(&request->fence, false, T) <= 0) {
19462306a36Sopenharmony_ci		pr_err("fence wait timed out when complete (expected success)!\n");
19562306a36Sopenharmony_ci		goto out;
19662306a36Sopenharmony_ci	}
19762306a36Sopenharmony_ci
19862306a36Sopenharmony_ci	err = 0;
19962306a36Sopenharmony_ciout:
20062306a36Sopenharmony_ci	mock_device_flush(i915);
20162306a36Sopenharmony_ci	return err;
20262306a36Sopenharmony_ci}
20362306a36Sopenharmony_ci
20462306a36Sopenharmony_cistatic int igt_request_rewind(void *arg)
20562306a36Sopenharmony_ci{
20662306a36Sopenharmony_ci	struct drm_i915_private *i915 = arg;
20762306a36Sopenharmony_ci	struct i915_request *request, *vip;
20862306a36Sopenharmony_ci	struct i915_gem_context *ctx[2];
20962306a36Sopenharmony_ci	struct intel_context *ce;
21062306a36Sopenharmony_ci	int err = -EINVAL;
21162306a36Sopenharmony_ci
21262306a36Sopenharmony_ci	ctx[0] = mock_context(i915, "A");
21362306a36Sopenharmony_ci	if (!ctx[0]) {
21462306a36Sopenharmony_ci		err = -ENOMEM;
21562306a36Sopenharmony_ci		goto err_ctx_0;
21662306a36Sopenharmony_ci	}
21762306a36Sopenharmony_ci
21862306a36Sopenharmony_ci	ce = i915_gem_context_get_engine(ctx[0], RCS0);
21962306a36Sopenharmony_ci	GEM_BUG_ON(IS_ERR(ce));
22062306a36Sopenharmony_ci	request = mock_request(ce, 2 * HZ);
22162306a36Sopenharmony_ci	intel_context_put(ce);
22262306a36Sopenharmony_ci	if (!request) {
22362306a36Sopenharmony_ci		err = -ENOMEM;
22462306a36Sopenharmony_ci		goto err_context_0;
22562306a36Sopenharmony_ci	}
22662306a36Sopenharmony_ci
22762306a36Sopenharmony_ci	i915_request_get(request);
22862306a36Sopenharmony_ci	i915_request_add(request);
22962306a36Sopenharmony_ci
23062306a36Sopenharmony_ci	ctx[1] = mock_context(i915, "B");
23162306a36Sopenharmony_ci	if (!ctx[1]) {
23262306a36Sopenharmony_ci		err = -ENOMEM;
23362306a36Sopenharmony_ci		goto err_ctx_1;
23462306a36Sopenharmony_ci	}
23562306a36Sopenharmony_ci
23662306a36Sopenharmony_ci	ce = i915_gem_context_get_engine(ctx[1], RCS0);
23762306a36Sopenharmony_ci	GEM_BUG_ON(IS_ERR(ce));
23862306a36Sopenharmony_ci	vip = mock_request(ce, 0);
23962306a36Sopenharmony_ci	intel_context_put(ce);
24062306a36Sopenharmony_ci	if (!vip) {
24162306a36Sopenharmony_ci		err = -ENOMEM;
24262306a36Sopenharmony_ci		goto err_context_1;
24362306a36Sopenharmony_ci	}
24462306a36Sopenharmony_ci
24562306a36Sopenharmony_ci	/* Simulate preemption by manual reordering */
24662306a36Sopenharmony_ci	if (!mock_cancel_request(request)) {
24762306a36Sopenharmony_ci		pr_err("failed to cancel request (already executed)!\n");
24862306a36Sopenharmony_ci		i915_request_add(vip);
24962306a36Sopenharmony_ci		goto err_context_1;
25062306a36Sopenharmony_ci	}
25162306a36Sopenharmony_ci	i915_request_get(vip);
25262306a36Sopenharmony_ci	i915_request_add(vip);
25362306a36Sopenharmony_ci	rcu_read_lock();
25462306a36Sopenharmony_ci	request->engine->submit_request(request);
25562306a36Sopenharmony_ci	rcu_read_unlock();
25662306a36Sopenharmony_ci
25762306a36Sopenharmony_ci
25862306a36Sopenharmony_ci	if (i915_request_wait(vip, 0, HZ) == -ETIME) {
25962306a36Sopenharmony_ci		pr_err("timed out waiting for high priority request\n");
26062306a36Sopenharmony_ci		goto err;
26162306a36Sopenharmony_ci	}
26262306a36Sopenharmony_ci
26362306a36Sopenharmony_ci	if (i915_request_completed(request)) {
26462306a36Sopenharmony_ci		pr_err("low priority request already completed\n");
26562306a36Sopenharmony_ci		goto err;
26662306a36Sopenharmony_ci	}
26762306a36Sopenharmony_ci
26862306a36Sopenharmony_ci	err = 0;
26962306a36Sopenharmony_cierr:
27062306a36Sopenharmony_ci	i915_request_put(vip);
27162306a36Sopenharmony_cierr_context_1:
27262306a36Sopenharmony_ci	mock_context_close(ctx[1]);
27362306a36Sopenharmony_cierr_ctx_1:
27462306a36Sopenharmony_ci	i915_request_put(request);
27562306a36Sopenharmony_cierr_context_0:
27662306a36Sopenharmony_ci	mock_context_close(ctx[0]);
27762306a36Sopenharmony_cierr_ctx_0:
27862306a36Sopenharmony_ci	mock_device_flush(i915);
27962306a36Sopenharmony_ci	return err;
28062306a36Sopenharmony_ci}
28162306a36Sopenharmony_ci
28262306a36Sopenharmony_cistruct smoketest {
28362306a36Sopenharmony_ci	struct intel_engine_cs *engine;
28462306a36Sopenharmony_ci	struct i915_gem_context **contexts;
28562306a36Sopenharmony_ci	atomic_long_t num_waits, num_fences;
28662306a36Sopenharmony_ci	int ncontexts, max_batch;
28762306a36Sopenharmony_ci	struct i915_request *(*request_alloc)(struct intel_context *ce);
28862306a36Sopenharmony_ci};
28962306a36Sopenharmony_ci
29062306a36Sopenharmony_cistatic struct i915_request *
29162306a36Sopenharmony_ci__mock_request_alloc(struct intel_context *ce)
29262306a36Sopenharmony_ci{
29362306a36Sopenharmony_ci	return mock_request(ce, 0);
29462306a36Sopenharmony_ci}
29562306a36Sopenharmony_ci
/*
 * smoketest.request_alloc implementation for live hardware: hands back
 * whatever intel_context_create_request() returns for @ce, unchanged.
 */
static struct i915_request *
__live_request_alloc(struct intel_context *ce)
{
	struct i915_request *rq = intel_context_create_request(ce);

	return rq;
}
30162306a36Sopenharmony_ci
30262306a36Sopenharmony_cistruct smoke_thread {
30362306a36Sopenharmony_ci	struct kthread_worker *worker;
30462306a36Sopenharmony_ci	struct kthread_work work;
30562306a36Sopenharmony_ci	struct smoketest *t;
30662306a36Sopenharmony_ci	bool stop;
30762306a36Sopenharmony_ci	int result;
30862306a36Sopenharmony_ci};
30962306a36Sopenharmony_ci
31062306a36Sopenharmony_cistatic void __igt_breadcrumbs_smoketest(struct kthread_work *work)
31162306a36Sopenharmony_ci{
31262306a36Sopenharmony_ci	struct smoke_thread *thread = container_of(work, typeof(*thread), work);
31362306a36Sopenharmony_ci	struct smoketest *t = thread->t;
31462306a36Sopenharmony_ci	const unsigned int max_batch = min(t->ncontexts, t->max_batch) - 1;
31562306a36Sopenharmony_ci	const unsigned int total = 4 * t->ncontexts + 1;
31662306a36Sopenharmony_ci	unsigned int num_waits = 0, num_fences = 0;
31762306a36Sopenharmony_ci	struct i915_request **requests;
31862306a36Sopenharmony_ci	I915_RND_STATE(prng);
31962306a36Sopenharmony_ci	unsigned int *order;
32062306a36Sopenharmony_ci	int err = 0;
32162306a36Sopenharmony_ci
32262306a36Sopenharmony_ci	/*
32362306a36Sopenharmony_ci	 * A very simple test to catch the most egregious of list handling bugs.
32462306a36Sopenharmony_ci	 *
32562306a36Sopenharmony_ci	 * At its heart, we simply create oodles of requests running across
32662306a36Sopenharmony_ci	 * multiple kthreads and enable signaling on them, for the sole purpose
32762306a36Sopenharmony_ci	 * of stressing our breadcrumb handling. The only inspection we do is
32862306a36Sopenharmony_ci	 * that the fences were marked as signaled.
32962306a36Sopenharmony_ci	 */
33062306a36Sopenharmony_ci
33162306a36Sopenharmony_ci	requests = kcalloc(total, sizeof(*requests), GFP_KERNEL);
33262306a36Sopenharmony_ci	if (!requests) {
33362306a36Sopenharmony_ci		thread->result = -ENOMEM;
33462306a36Sopenharmony_ci		return;
33562306a36Sopenharmony_ci	}
33662306a36Sopenharmony_ci
33762306a36Sopenharmony_ci	order = i915_random_order(total, &prng);
33862306a36Sopenharmony_ci	if (!order) {
33962306a36Sopenharmony_ci		err = -ENOMEM;
34062306a36Sopenharmony_ci		goto out_requests;
34162306a36Sopenharmony_ci	}
34262306a36Sopenharmony_ci
34362306a36Sopenharmony_ci	while (!READ_ONCE(thread->stop)) {
34462306a36Sopenharmony_ci		struct i915_sw_fence *submit, *wait;
34562306a36Sopenharmony_ci		unsigned int n, count;
34662306a36Sopenharmony_ci
34762306a36Sopenharmony_ci		submit = heap_fence_create(GFP_KERNEL);
34862306a36Sopenharmony_ci		if (!submit) {
34962306a36Sopenharmony_ci			err = -ENOMEM;
35062306a36Sopenharmony_ci			break;
35162306a36Sopenharmony_ci		}
35262306a36Sopenharmony_ci
35362306a36Sopenharmony_ci		wait = heap_fence_create(GFP_KERNEL);
35462306a36Sopenharmony_ci		if (!wait) {
35562306a36Sopenharmony_ci			i915_sw_fence_commit(submit);
35662306a36Sopenharmony_ci			heap_fence_put(submit);
35762306a36Sopenharmony_ci			err = -ENOMEM;
35862306a36Sopenharmony_ci			break;
35962306a36Sopenharmony_ci		}
36062306a36Sopenharmony_ci
36162306a36Sopenharmony_ci		i915_random_reorder(order, total, &prng);
36262306a36Sopenharmony_ci		count = 1 + i915_prandom_u32_max_state(max_batch, &prng);
36362306a36Sopenharmony_ci
36462306a36Sopenharmony_ci		for (n = 0; n < count; n++) {
36562306a36Sopenharmony_ci			struct i915_gem_context *ctx =
36662306a36Sopenharmony_ci				t->contexts[order[n] % t->ncontexts];
36762306a36Sopenharmony_ci			struct i915_request *rq;
36862306a36Sopenharmony_ci			struct intel_context *ce;
36962306a36Sopenharmony_ci
37062306a36Sopenharmony_ci			ce = i915_gem_context_get_engine(ctx, t->engine->legacy_idx);
37162306a36Sopenharmony_ci			GEM_BUG_ON(IS_ERR(ce));
37262306a36Sopenharmony_ci			rq = t->request_alloc(ce);
37362306a36Sopenharmony_ci			intel_context_put(ce);
37462306a36Sopenharmony_ci			if (IS_ERR(rq)) {
37562306a36Sopenharmony_ci				err = PTR_ERR(rq);
37662306a36Sopenharmony_ci				count = n;
37762306a36Sopenharmony_ci				break;
37862306a36Sopenharmony_ci			}
37962306a36Sopenharmony_ci
38062306a36Sopenharmony_ci			err = i915_sw_fence_await_sw_fence_gfp(&rq->submit,
38162306a36Sopenharmony_ci							       submit,
38262306a36Sopenharmony_ci							       GFP_KERNEL);
38362306a36Sopenharmony_ci
38462306a36Sopenharmony_ci			requests[n] = i915_request_get(rq);
38562306a36Sopenharmony_ci			i915_request_add(rq);
38662306a36Sopenharmony_ci
38762306a36Sopenharmony_ci			if (err >= 0)
38862306a36Sopenharmony_ci				err = i915_sw_fence_await_dma_fence(wait,
38962306a36Sopenharmony_ci								    &rq->fence,
39062306a36Sopenharmony_ci								    0,
39162306a36Sopenharmony_ci								    GFP_KERNEL);
39262306a36Sopenharmony_ci
39362306a36Sopenharmony_ci			if (err < 0) {
39462306a36Sopenharmony_ci				i915_request_put(rq);
39562306a36Sopenharmony_ci				count = n;
39662306a36Sopenharmony_ci				break;
39762306a36Sopenharmony_ci			}
39862306a36Sopenharmony_ci		}
39962306a36Sopenharmony_ci
40062306a36Sopenharmony_ci		i915_sw_fence_commit(submit);
40162306a36Sopenharmony_ci		i915_sw_fence_commit(wait);
40262306a36Sopenharmony_ci
40362306a36Sopenharmony_ci		if (!wait_event_timeout(wait->wait,
40462306a36Sopenharmony_ci					i915_sw_fence_done(wait),
40562306a36Sopenharmony_ci					5 * HZ)) {
40662306a36Sopenharmony_ci			struct i915_request *rq = requests[count - 1];
40762306a36Sopenharmony_ci
40862306a36Sopenharmony_ci			pr_err("waiting for %d/%d fences (last %llx:%lld) on %s timed out!\n",
40962306a36Sopenharmony_ci			       atomic_read(&wait->pending), count,
41062306a36Sopenharmony_ci			       rq->fence.context, rq->fence.seqno,
41162306a36Sopenharmony_ci			       t->engine->name);
41262306a36Sopenharmony_ci			GEM_TRACE_DUMP();
41362306a36Sopenharmony_ci
41462306a36Sopenharmony_ci			intel_gt_set_wedged(t->engine->gt);
41562306a36Sopenharmony_ci			GEM_BUG_ON(!i915_request_completed(rq));
41662306a36Sopenharmony_ci			i915_sw_fence_wait(wait);
41762306a36Sopenharmony_ci			err = -EIO;
41862306a36Sopenharmony_ci		}
41962306a36Sopenharmony_ci
42062306a36Sopenharmony_ci		for (n = 0; n < count; n++) {
42162306a36Sopenharmony_ci			struct i915_request *rq = requests[n];
42262306a36Sopenharmony_ci
42362306a36Sopenharmony_ci			if (!test_bit(DMA_FENCE_FLAG_SIGNALED_BIT,
42462306a36Sopenharmony_ci				      &rq->fence.flags)) {
42562306a36Sopenharmony_ci				pr_err("%llu:%llu was not signaled!\n",
42662306a36Sopenharmony_ci				       rq->fence.context, rq->fence.seqno);
42762306a36Sopenharmony_ci				err = -EINVAL;
42862306a36Sopenharmony_ci			}
42962306a36Sopenharmony_ci
43062306a36Sopenharmony_ci			i915_request_put(rq);
43162306a36Sopenharmony_ci		}
43262306a36Sopenharmony_ci
43362306a36Sopenharmony_ci		heap_fence_put(wait);
43462306a36Sopenharmony_ci		heap_fence_put(submit);
43562306a36Sopenharmony_ci
43662306a36Sopenharmony_ci		if (err < 0)
43762306a36Sopenharmony_ci			break;
43862306a36Sopenharmony_ci
43962306a36Sopenharmony_ci		num_fences += count;
44062306a36Sopenharmony_ci		num_waits++;
44162306a36Sopenharmony_ci
44262306a36Sopenharmony_ci		cond_resched();
44362306a36Sopenharmony_ci	}
44462306a36Sopenharmony_ci
44562306a36Sopenharmony_ci	atomic_long_add(num_fences, &t->num_fences);
44662306a36Sopenharmony_ci	atomic_long_add(num_waits, &t->num_waits);
44762306a36Sopenharmony_ci
44862306a36Sopenharmony_ci	kfree(order);
44962306a36Sopenharmony_ciout_requests:
45062306a36Sopenharmony_ci	kfree(requests);
45162306a36Sopenharmony_ci	thread->result = err;
45262306a36Sopenharmony_ci}
45362306a36Sopenharmony_ci
45462306a36Sopenharmony_cistatic int mock_breadcrumbs_smoketest(void *arg)
45562306a36Sopenharmony_ci{
45662306a36Sopenharmony_ci	struct drm_i915_private *i915 = arg;
45762306a36Sopenharmony_ci	struct smoketest t = {
45862306a36Sopenharmony_ci		.engine = rcs0(i915),
45962306a36Sopenharmony_ci		.ncontexts = 1024,
46062306a36Sopenharmony_ci		.max_batch = 1024,
46162306a36Sopenharmony_ci		.request_alloc = __mock_request_alloc
46262306a36Sopenharmony_ci	};
46362306a36Sopenharmony_ci	unsigned int ncpus = num_online_cpus();
46462306a36Sopenharmony_ci	struct smoke_thread *threads;
46562306a36Sopenharmony_ci	unsigned int n;
46662306a36Sopenharmony_ci	int ret = 0;
46762306a36Sopenharmony_ci
46862306a36Sopenharmony_ci	/*
46962306a36Sopenharmony_ci	 * Smoketest our breadcrumb/signal handling for requests across multiple
47062306a36Sopenharmony_ci	 * threads. A very simple test to only catch the most egregious of bugs.
47162306a36Sopenharmony_ci	 * See __igt_breadcrumbs_smoketest();
47262306a36Sopenharmony_ci	 */
47362306a36Sopenharmony_ci
47462306a36Sopenharmony_ci	threads = kcalloc(ncpus, sizeof(*threads), GFP_KERNEL);
47562306a36Sopenharmony_ci	if (!threads)
47662306a36Sopenharmony_ci		return -ENOMEM;
47762306a36Sopenharmony_ci
47862306a36Sopenharmony_ci	t.contexts = kcalloc(t.ncontexts, sizeof(*t.contexts), GFP_KERNEL);
47962306a36Sopenharmony_ci	if (!t.contexts) {
48062306a36Sopenharmony_ci		ret = -ENOMEM;
48162306a36Sopenharmony_ci		goto out_threads;
48262306a36Sopenharmony_ci	}
48362306a36Sopenharmony_ci
48462306a36Sopenharmony_ci	for (n = 0; n < t.ncontexts; n++) {
48562306a36Sopenharmony_ci		t.contexts[n] = mock_context(t.engine->i915, "mock");
48662306a36Sopenharmony_ci		if (!t.contexts[n]) {
48762306a36Sopenharmony_ci			ret = -ENOMEM;
48862306a36Sopenharmony_ci			goto out_contexts;
48962306a36Sopenharmony_ci		}
49062306a36Sopenharmony_ci	}
49162306a36Sopenharmony_ci
49262306a36Sopenharmony_ci	for (n = 0; n < ncpus; n++) {
49362306a36Sopenharmony_ci		struct kthread_worker *worker;
49462306a36Sopenharmony_ci
49562306a36Sopenharmony_ci		worker = kthread_create_worker(0, "igt/%d", n);
49662306a36Sopenharmony_ci		if (IS_ERR(worker)) {
49762306a36Sopenharmony_ci			ret = PTR_ERR(worker);
49862306a36Sopenharmony_ci			ncpus = n;
49962306a36Sopenharmony_ci			break;
50062306a36Sopenharmony_ci		}
50162306a36Sopenharmony_ci
50262306a36Sopenharmony_ci		threads[n].worker = worker;
50362306a36Sopenharmony_ci		threads[n].t = &t;
50462306a36Sopenharmony_ci		threads[n].stop = false;
50562306a36Sopenharmony_ci		threads[n].result = 0;
50662306a36Sopenharmony_ci
50762306a36Sopenharmony_ci		kthread_init_work(&threads[n].work,
50862306a36Sopenharmony_ci				  __igt_breadcrumbs_smoketest);
50962306a36Sopenharmony_ci		kthread_queue_work(worker, &threads[n].work);
51062306a36Sopenharmony_ci	}
51162306a36Sopenharmony_ci
51262306a36Sopenharmony_ci	msleep(jiffies_to_msecs(i915_selftest.timeout_jiffies));
51362306a36Sopenharmony_ci
51462306a36Sopenharmony_ci	for (n = 0; n < ncpus; n++) {
51562306a36Sopenharmony_ci		int err;
51662306a36Sopenharmony_ci
51762306a36Sopenharmony_ci		WRITE_ONCE(threads[n].stop, true);
51862306a36Sopenharmony_ci		kthread_flush_work(&threads[n].work);
51962306a36Sopenharmony_ci		err = READ_ONCE(threads[n].result);
52062306a36Sopenharmony_ci		if (err < 0 && !ret)
52162306a36Sopenharmony_ci			ret = err;
52262306a36Sopenharmony_ci
52362306a36Sopenharmony_ci		kthread_destroy_worker(threads[n].worker);
52462306a36Sopenharmony_ci	}
52562306a36Sopenharmony_ci	pr_info("Completed %lu waits for %lu fence across %d cpus\n",
52662306a36Sopenharmony_ci		atomic_long_read(&t.num_waits),
52762306a36Sopenharmony_ci		atomic_long_read(&t.num_fences),
52862306a36Sopenharmony_ci		ncpus);
52962306a36Sopenharmony_ci
53062306a36Sopenharmony_ciout_contexts:
53162306a36Sopenharmony_ci	for (n = 0; n < t.ncontexts; n++) {
53262306a36Sopenharmony_ci		if (!t.contexts[n])
53362306a36Sopenharmony_ci			break;
53462306a36Sopenharmony_ci		mock_context_close(t.contexts[n]);
53562306a36Sopenharmony_ci	}
53662306a36Sopenharmony_ci	kfree(t.contexts);
53762306a36Sopenharmony_ciout_threads:
53862306a36Sopenharmony_ci	kfree(threads);
53962306a36Sopenharmony_ci	return ret;
54062306a36Sopenharmony_ci}
54162306a36Sopenharmony_ci
54262306a36Sopenharmony_ciint i915_request_mock_selftests(void)
54362306a36Sopenharmony_ci{
54462306a36Sopenharmony_ci	static const struct i915_subtest tests[] = {
54562306a36Sopenharmony_ci		SUBTEST(igt_add_request),
54662306a36Sopenharmony_ci		SUBTEST(igt_wait_request),
54762306a36Sopenharmony_ci		SUBTEST(igt_fence_wait),
54862306a36Sopenharmony_ci		SUBTEST(igt_request_rewind),
54962306a36Sopenharmony_ci		SUBTEST(mock_breadcrumbs_smoketest),
55062306a36Sopenharmony_ci	};
55162306a36Sopenharmony_ci	struct drm_i915_private *i915;
55262306a36Sopenharmony_ci	intel_wakeref_t wakeref;
55362306a36Sopenharmony_ci	int err = 0;
55462306a36Sopenharmony_ci
55562306a36Sopenharmony_ci	i915 = mock_gem_device();
55662306a36Sopenharmony_ci	if (!i915)
55762306a36Sopenharmony_ci		return -ENOMEM;
55862306a36Sopenharmony_ci
55962306a36Sopenharmony_ci	with_intel_runtime_pm(&i915->runtime_pm, wakeref)
56062306a36Sopenharmony_ci		err = i915_subtests(tests, i915);
56162306a36Sopenharmony_ci
56262306a36Sopenharmony_ci	mock_destroy_device(i915);
56362306a36Sopenharmony_ci
56462306a36Sopenharmony_ci	return err;
56562306a36Sopenharmony_ci}
56662306a36Sopenharmony_ci
56762306a36Sopenharmony_cistatic int live_nop_request(void *arg)
56862306a36Sopenharmony_ci{
56962306a36Sopenharmony_ci	struct drm_i915_private *i915 = arg;
57062306a36Sopenharmony_ci	struct intel_engine_cs *engine;
57162306a36Sopenharmony_ci	struct igt_live_test t;
57262306a36Sopenharmony_ci	int err = -ENODEV;
57362306a36Sopenharmony_ci
57462306a36Sopenharmony_ci	/*
57562306a36Sopenharmony_ci	 * Submit various sized batches of empty requests, to each engine
57662306a36Sopenharmony_ci	 * (individually), and wait for the batch to complete. We can check
57762306a36Sopenharmony_ci	 * the overhead of submitting requests to the hardware.
57862306a36Sopenharmony_ci	 */
57962306a36Sopenharmony_ci
58062306a36Sopenharmony_ci	for_each_uabi_engine(engine, i915) {
58162306a36Sopenharmony_ci		unsigned long n, prime;
58262306a36Sopenharmony_ci		IGT_TIMEOUT(end_time);
58362306a36Sopenharmony_ci		ktime_t times[2] = {};
58462306a36Sopenharmony_ci
58562306a36Sopenharmony_ci		err = igt_live_test_begin(&t, i915, __func__, engine->name);
58662306a36Sopenharmony_ci		if (err)
58762306a36Sopenharmony_ci			return err;
58862306a36Sopenharmony_ci
58962306a36Sopenharmony_ci		intel_engine_pm_get(engine);
59062306a36Sopenharmony_ci		for_each_prime_number_from(prime, 1, 8192) {
59162306a36Sopenharmony_ci			struct i915_request *request = NULL;
59262306a36Sopenharmony_ci
59362306a36Sopenharmony_ci			times[1] = ktime_get_raw();
59462306a36Sopenharmony_ci
59562306a36Sopenharmony_ci			for (n = 0; n < prime; n++) {
59662306a36Sopenharmony_ci				i915_request_put(request);
59762306a36Sopenharmony_ci				request = i915_request_create(engine->kernel_context);
59862306a36Sopenharmony_ci				if (IS_ERR(request))
59962306a36Sopenharmony_ci					return PTR_ERR(request);
60062306a36Sopenharmony_ci
60162306a36Sopenharmony_ci				/*
60262306a36Sopenharmony_ci				 * This space is left intentionally blank.
60362306a36Sopenharmony_ci				 *
60462306a36Sopenharmony_ci				 * We do not actually want to perform any
60562306a36Sopenharmony_ci				 * action with this request, we just want
60662306a36Sopenharmony_ci				 * to measure the latency in allocation
60762306a36Sopenharmony_ci				 * and submission of our breadcrumbs -
60862306a36Sopenharmony_ci				 * ensuring that the bare request is sufficient
60962306a36Sopenharmony_ci				 * for the system to work (i.e. proper HEAD
61062306a36Sopenharmony_ci				 * tracking of the rings, interrupt handling,
61162306a36Sopenharmony_ci				 * etc). It also gives us the lowest bounds
61262306a36Sopenharmony_ci				 * for latency.
61362306a36Sopenharmony_ci				 */
61462306a36Sopenharmony_ci
61562306a36Sopenharmony_ci				i915_request_get(request);
61662306a36Sopenharmony_ci				i915_request_add(request);
61762306a36Sopenharmony_ci			}
61862306a36Sopenharmony_ci			i915_request_wait(request, 0, MAX_SCHEDULE_TIMEOUT);
61962306a36Sopenharmony_ci			i915_request_put(request);
62062306a36Sopenharmony_ci
62162306a36Sopenharmony_ci			times[1] = ktime_sub(ktime_get_raw(), times[1]);
62262306a36Sopenharmony_ci			if (prime == 1)
62362306a36Sopenharmony_ci				times[0] = times[1];
62462306a36Sopenharmony_ci
62562306a36Sopenharmony_ci			if (__igt_timeout(end_time, NULL))
62662306a36Sopenharmony_ci				break;
62762306a36Sopenharmony_ci		}
62862306a36Sopenharmony_ci		intel_engine_pm_put(engine);
62962306a36Sopenharmony_ci
63062306a36Sopenharmony_ci		err = igt_live_test_end(&t);
63162306a36Sopenharmony_ci		if (err)
63262306a36Sopenharmony_ci			return err;
63362306a36Sopenharmony_ci
63462306a36Sopenharmony_ci		pr_info("Request latencies on %s: 1 = %lluns, %lu = %lluns\n",
63562306a36Sopenharmony_ci			engine->name,
63662306a36Sopenharmony_ci			ktime_to_ns(times[0]),
63762306a36Sopenharmony_ci			prime, div64_u64(ktime_to_ns(times[1]), prime));
63862306a36Sopenharmony_ci	}
63962306a36Sopenharmony_ci
64062306a36Sopenharmony_ci	return err;
64162306a36Sopenharmony_ci}
64262306a36Sopenharmony_ci
64362306a36Sopenharmony_cistatic int __cancel_inactive(struct intel_engine_cs *engine)
64462306a36Sopenharmony_ci{
64562306a36Sopenharmony_ci	struct intel_context *ce;
64662306a36Sopenharmony_ci	struct igt_spinner spin;
64762306a36Sopenharmony_ci	struct i915_request *rq;
64862306a36Sopenharmony_ci	int err = 0;
64962306a36Sopenharmony_ci
65062306a36Sopenharmony_ci	if (igt_spinner_init(&spin, engine->gt))
65162306a36Sopenharmony_ci		return -ENOMEM;
65262306a36Sopenharmony_ci
65362306a36Sopenharmony_ci	ce = intel_context_create(engine);
65462306a36Sopenharmony_ci	if (IS_ERR(ce)) {
65562306a36Sopenharmony_ci		err = PTR_ERR(ce);
65662306a36Sopenharmony_ci		goto out_spin;
65762306a36Sopenharmony_ci	}
65862306a36Sopenharmony_ci
65962306a36Sopenharmony_ci	rq = igt_spinner_create_request(&spin, ce, MI_ARB_CHECK);
66062306a36Sopenharmony_ci	if (IS_ERR(rq)) {
66162306a36Sopenharmony_ci		err = PTR_ERR(rq);
66262306a36Sopenharmony_ci		goto out_ce;
66362306a36Sopenharmony_ci	}
66462306a36Sopenharmony_ci
66562306a36Sopenharmony_ci	pr_debug("%s: Cancelling inactive request\n", engine->name);
66662306a36Sopenharmony_ci	i915_request_cancel(rq, -EINTR);
66762306a36Sopenharmony_ci	i915_request_get(rq);
66862306a36Sopenharmony_ci	i915_request_add(rq);
66962306a36Sopenharmony_ci
67062306a36Sopenharmony_ci	if (i915_request_wait(rq, 0, HZ / 5) < 0) {
67162306a36Sopenharmony_ci		struct drm_printer p = drm_info_printer(engine->i915->drm.dev);
67262306a36Sopenharmony_ci
67362306a36Sopenharmony_ci		pr_err("%s: Failed to cancel inactive request\n", engine->name);
67462306a36Sopenharmony_ci		intel_engine_dump(engine, &p, "%s\n", engine->name);
67562306a36Sopenharmony_ci		err = -ETIME;
67662306a36Sopenharmony_ci		goto out_rq;
67762306a36Sopenharmony_ci	}
67862306a36Sopenharmony_ci
67962306a36Sopenharmony_ci	if (rq->fence.error != -EINTR) {
68062306a36Sopenharmony_ci		pr_err("%s: fence not cancelled (%u)\n",
68162306a36Sopenharmony_ci		       engine->name, rq->fence.error);
68262306a36Sopenharmony_ci		err = -EINVAL;
68362306a36Sopenharmony_ci	}
68462306a36Sopenharmony_ci
68562306a36Sopenharmony_ciout_rq:
68662306a36Sopenharmony_ci	i915_request_put(rq);
68762306a36Sopenharmony_ciout_ce:
68862306a36Sopenharmony_ci	intel_context_put(ce);
68962306a36Sopenharmony_ciout_spin:
69062306a36Sopenharmony_ci	igt_spinner_fini(&spin);
69162306a36Sopenharmony_ci	if (err)
69262306a36Sopenharmony_ci		pr_err("%s: %s error %d\n", __func__, engine->name, err);
69362306a36Sopenharmony_ci	return err;
69462306a36Sopenharmony_ci}
69562306a36Sopenharmony_ci
69662306a36Sopenharmony_cistatic int __cancel_active(struct intel_engine_cs *engine)
69762306a36Sopenharmony_ci{
69862306a36Sopenharmony_ci	struct intel_context *ce;
69962306a36Sopenharmony_ci	struct igt_spinner spin;
70062306a36Sopenharmony_ci	struct i915_request *rq;
70162306a36Sopenharmony_ci	int err = 0;
70262306a36Sopenharmony_ci
70362306a36Sopenharmony_ci	if (igt_spinner_init(&spin, engine->gt))
70462306a36Sopenharmony_ci		return -ENOMEM;
70562306a36Sopenharmony_ci
70662306a36Sopenharmony_ci	ce = intel_context_create(engine);
70762306a36Sopenharmony_ci	if (IS_ERR(ce)) {
70862306a36Sopenharmony_ci		err = PTR_ERR(ce);
70962306a36Sopenharmony_ci		goto out_spin;
71062306a36Sopenharmony_ci	}
71162306a36Sopenharmony_ci
71262306a36Sopenharmony_ci	rq = igt_spinner_create_request(&spin, ce, MI_ARB_CHECK);
71362306a36Sopenharmony_ci	if (IS_ERR(rq)) {
71462306a36Sopenharmony_ci		err = PTR_ERR(rq);
71562306a36Sopenharmony_ci		goto out_ce;
71662306a36Sopenharmony_ci	}
71762306a36Sopenharmony_ci
71862306a36Sopenharmony_ci	pr_debug("%s: Cancelling active request\n", engine->name);
71962306a36Sopenharmony_ci	i915_request_get(rq);
72062306a36Sopenharmony_ci	i915_request_add(rq);
72162306a36Sopenharmony_ci	if (!igt_wait_for_spinner(&spin, rq)) {
72262306a36Sopenharmony_ci		struct drm_printer p = drm_info_printer(engine->i915->drm.dev);
72362306a36Sopenharmony_ci
72462306a36Sopenharmony_ci		pr_err("Failed to start spinner on %s\n", engine->name);
72562306a36Sopenharmony_ci		intel_engine_dump(engine, &p, "%s\n", engine->name);
72662306a36Sopenharmony_ci		err = -ETIME;
72762306a36Sopenharmony_ci		goto out_rq;
72862306a36Sopenharmony_ci	}
72962306a36Sopenharmony_ci	i915_request_cancel(rq, -EINTR);
73062306a36Sopenharmony_ci
73162306a36Sopenharmony_ci	if (i915_request_wait(rq, 0, HZ / 5) < 0) {
73262306a36Sopenharmony_ci		struct drm_printer p = drm_info_printer(engine->i915->drm.dev);
73362306a36Sopenharmony_ci
73462306a36Sopenharmony_ci		pr_err("%s: Failed to cancel active request\n", engine->name);
73562306a36Sopenharmony_ci		intel_engine_dump(engine, &p, "%s\n", engine->name);
73662306a36Sopenharmony_ci		err = -ETIME;
73762306a36Sopenharmony_ci		goto out_rq;
73862306a36Sopenharmony_ci	}
73962306a36Sopenharmony_ci
74062306a36Sopenharmony_ci	if (rq->fence.error != -EINTR) {
74162306a36Sopenharmony_ci		pr_err("%s: fence not cancelled (%u)\n",
74262306a36Sopenharmony_ci		       engine->name, rq->fence.error);
74362306a36Sopenharmony_ci		err = -EINVAL;
74462306a36Sopenharmony_ci	}
74562306a36Sopenharmony_ci
74662306a36Sopenharmony_ciout_rq:
74762306a36Sopenharmony_ci	i915_request_put(rq);
74862306a36Sopenharmony_ciout_ce:
74962306a36Sopenharmony_ci	intel_context_put(ce);
75062306a36Sopenharmony_ciout_spin:
75162306a36Sopenharmony_ci	igt_spinner_fini(&spin);
75262306a36Sopenharmony_ci	if (err)
75362306a36Sopenharmony_ci		pr_err("%s: %s error %d\n", __func__, engine->name, err);
75462306a36Sopenharmony_ci	return err;
75562306a36Sopenharmony_ci}
75662306a36Sopenharmony_ci
75762306a36Sopenharmony_cistatic int __cancel_completed(struct intel_engine_cs *engine)
75862306a36Sopenharmony_ci{
75962306a36Sopenharmony_ci	struct intel_context *ce;
76062306a36Sopenharmony_ci	struct igt_spinner spin;
76162306a36Sopenharmony_ci	struct i915_request *rq;
76262306a36Sopenharmony_ci	int err = 0;
76362306a36Sopenharmony_ci
76462306a36Sopenharmony_ci	if (igt_spinner_init(&spin, engine->gt))
76562306a36Sopenharmony_ci		return -ENOMEM;
76662306a36Sopenharmony_ci
76762306a36Sopenharmony_ci	ce = intel_context_create(engine);
76862306a36Sopenharmony_ci	if (IS_ERR(ce)) {
76962306a36Sopenharmony_ci		err = PTR_ERR(ce);
77062306a36Sopenharmony_ci		goto out_spin;
77162306a36Sopenharmony_ci	}
77262306a36Sopenharmony_ci
77362306a36Sopenharmony_ci	rq = igt_spinner_create_request(&spin, ce, MI_ARB_CHECK);
77462306a36Sopenharmony_ci	if (IS_ERR(rq)) {
77562306a36Sopenharmony_ci		err = PTR_ERR(rq);
77662306a36Sopenharmony_ci		goto out_ce;
77762306a36Sopenharmony_ci	}
77862306a36Sopenharmony_ci	igt_spinner_end(&spin);
77962306a36Sopenharmony_ci	i915_request_get(rq);
78062306a36Sopenharmony_ci	i915_request_add(rq);
78162306a36Sopenharmony_ci
78262306a36Sopenharmony_ci	if (i915_request_wait(rq, 0, HZ / 5) < 0) {
78362306a36Sopenharmony_ci		err = -ETIME;
78462306a36Sopenharmony_ci		goto out_rq;
78562306a36Sopenharmony_ci	}
78662306a36Sopenharmony_ci
78762306a36Sopenharmony_ci	pr_debug("%s: Cancelling completed request\n", engine->name);
78862306a36Sopenharmony_ci	i915_request_cancel(rq, -EINTR);
78962306a36Sopenharmony_ci	if (rq->fence.error) {
79062306a36Sopenharmony_ci		pr_err("%s: fence not cancelled (%u)\n",
79162306a36Sopenharmony_ci		       engine->name, rq->fence.error);
79262306a36Sopenharmony_ci		err = -EINVAL;
79362306a36Sopenharmony_ci	}
79462306a36Sopenharmony_ci
79562306a36Sopenharmony_ciout_rq:
79662306a36Sopenharmony_ci	i915_request_put(rq);
79762306a36Sopenharmony_ciout_ce:
79862306a36Sopenharmony_ci	intel_context_put(ce);
79962306a36Sopenharmony_ciout_spin:
80062306a36Sopenharmony_ci	igt_spinner_fini(&spin);
80162306a36Sopenharmony_ci	if (err)
80262306a36Sopenharmony_ci		pr_err("%s: %s error %d\n", __func__, engine->name, err);
80362306a36Sopenharmony_ci	return err;
80462306a36Sopenharmony_ci}
80562306a36Sopenharmony_ci
80662306a36Sopenharmony_ci/*
80762306a36Sopenharmony_ci * Test to prove a non-preemptable request can be cancelled and a subsequent
80862306a36Sopenharmony_ci * request on the same context can successfully complete after cancellation.
80962306a36Sopenharmony_ci *
81062306a36Sopenharmony_ci * Testing methodology is to create a non-preemptible request and submit it,
81162306a36Sopenharmony_ci * wait for spinner to start, create a NOP request and submit it, cancel the
81262306a36Sopenharmony_ci * spinner, wait for spinner to complete and verify it failed with an error,
81362306a36Sopenharmony_ci * finally wait for NOP request to complete verify it succeeded without an
81462306a36Sopenharmony_ci * error. Preemption timeout also reduced / restored so test runs in a timely
81562306a36Sopenharmony_ci * maner.
81662306a36Sopenharmony_ci */
81762306a36Sopenharmony_cistatic int __cancel_reset(struct drm_i915_private *i915,
81862306a36Sopenharmony_ci			  struct intel_engine_cs *engine)
81962306a36Sopenharmony_ci{
82062306a36Sopenharmony_ci	struct intel_context *ce;
82162306a36Sopenharmony_ci	struct igt_spinner spin;
82262306a36Sopenharmony_ci	struct i915_request *rq, *nop;
82362306a36Sopenharmony_ci	unsigned long preempt_timeout_ms;
82462306a36Sopenharmony_ci	int err = 0;
82562306a36Sopenharmony_ci
82662306a36Sopenharmony_ci	if (!CONFIG_DRM_I915_PREEMPT_TIMEOUT ||
82762306a36Sopenharmony_ci	    !intel_has_reset_engine(engine->gt))
82862306a36Sopenharmony_ci		return 0;
82962306a36Sopenharmony_ci
83062306a36Sopenharmony_ci	preempt_timeout_ms = engine->props.preempt_timeout_ms;
83162306a36Sopenharmony_ci	engine->props.preempt_timeout_ms = 100;
83262306a36Sopenharmony_ci
83362306a36Sopenharmony_ci	if (igt_spinner_init(&spin, engine->gt))
83462306a36Sopenharmony_ci		goto out_restore;
83562306a36Sopenharmony_ci
83662306a36Sopenharmony_ci	ce = intel_context_create(engine);
83762306a36Sopenharmony_ci	if (IS_ERR(ce)) {
83862306a36Sopenharmony_ci		err = PTR_ERR(ce);
83962306a36Sopenharmony_ci		goto out_spin;
84062306a36Sopenharmony_ci	}
84162306a36Sopenharmony_ci
84262306a36Sopenharmony_ci	rq = igt_spinner_create_request(&spin, ce, MI_NOOP);
84362306a36Sopenharmony_ci	if (IS_ERR(rq)) {
84462306a36Sopenharmony_ci		err = PTR_ERR(rq);
84562306a36Sopenharmony_ci		goto out_ce;
84662306a36Sopenharmony_ci	}
84762306a36Sopenharmony_ci
84862306a36Sopenharmony_ci	pr_debug("%s: Cancelling active non-preemptable request\n",
84962306a36Sopenharmony_ci		 engine->name);
85062306a36Sopenharmony_ci	i915_request_get(rq);
85162306a36Sopenharmony_ci	i915_request_add(rq);
85262306a36Sopenharmony_ci	if (!igt_wait_for_spinner(&spin, rq)) {
85362306a36Sopenharmony_ci		struct drm_printer p = drm_info_printer(engine->i915->drm.dev);
85462306a36Sopenharmony_ci
85562306a36Sopenharmony_ci		pr_err("Failed to start spinner on %s\n", engine->name);
85662306a36Sopenharmony_ci		intel_engine_dump(engine, &p, "%s\n", engine->name);
85762306a36Sopenharmony_ci		err = -ETIME;
85862306a36Sopenharmony_ci		goto out_rq;
85962306a36Sopenharmony_ci	}
86062306a36Sopenharmony_ci
86162306a36Sopenharmony_ci	nop = intel_context_create_request(ce);
86262306a36Sopenharmony_ci	if (IS_ERR(nop))
86362306a36Sopenharmony_ci		goto out_rq;
86462306a36Sopenharmony_ci	i915_request_get(nop);
86562306a36Sopenharmony_ci	i915_request_add(nop);
86662306a36Sopenharmony_ci
86762306a36Sopenharmony_ci	i915_request_cancel(rq, -EINTR);
86862306a36Sopenharmony_ci
86962306a36Sopenharmony_ci	if (i915_request_wait(rq, 0, HZ) < 0) {
87062306a36Sopenharmony_ci		struct drm_printer p = drm_info_printer(engine->i915->drm.dev);
87162306a36Sopenharmony_ci
87262306a36Sopenharmony_ci		pr_err("%s: Failed to cancel hung request\n", engine->name);
87362306a36Sopenharmony_ci		intel_engine_dump(engine, &p, "%s\n", engine->name);
87462306a36Sopenharmony_ci		err = -ETIME;
87562306a36Sopenharmony_ci		goto out_nop;
87662306a36Sopenharmony_ci	}
87762306a36Sopenharmony_ci
87862306a36Sopenharmony_ci	if (rq->fence.error != -EINTR) {
87962306a36Sopenharmony_ci		pr_err("%s: fence not cancelled (%u)\n",
88062306a36Sopenharmony_ci		       engine->name, rq->fence.error);
88162306a36Sopenharmony_ci		err = -EINVAL;
88262306a36Sopenharmony_ci		goto out_nop;
88362306a36Sopenharmony_ci	}
88462306a36Sopenharmony_ci
88562306a36Sopenharmony_ci	if (i915_request_wait(nop, 0, HZ) < 0) {
88662306a36Sopenharmony_ci		struct drm_printer p = drm_info_printer(engine->i915->drm.dev);
88762306a36Sopenharmony_ci
88862306a36Sopenharmony_ci		pr_err("%s: Failed to complete nop request\n", engine->name);
88962306a36Sopenharmony_ci		intel_engine_dump(engine, &p, "%s\n", engine->name);
89062306a36Sopenharmony_ci		err = -ETIME;
89162306a36Sopenharmony_ci		goto out_nop;
89262306a36Sopenharmony_ci	}
89362306a36Sopenharmony_ci
89462306a36Sopenharmony_ci	if (nop->fence.error != 0) {
89562306a36Sopenharmony_ci		pr_err("%s: Nop request errored (%u)\n",
89662306a36Sopenharmony_ci		       engine->name, nop->fence.error);
89762306a36Sopenharmony_ci		err = -EINVAL;
89862306a36Sopenharmony_ci	}
89962306a36Sopenharmony_ci
90062306a36Sopenharmony_ciout_nop:
90162306a36Sopenharmony_ci	i915_request_put(nop);
90262306a36Sopenharmony_ciout_rq:
90362306a36Sopenharmony_ci	i915_request_put(rq);
90462306a36Sopenharmony_ciout_ce:
90562306a36Sopenharmony_ci	intel_context_put(ce);
90662306a36Sopenharmony_ciout_spin:
90762306a36Sopenharmony_ci	igt_spinner_fini(&spin);
90862306a36Sopenharmony_ciout_restore:
90962306a36Sopenharmony_ci	engine->props.preempt_timeout_ms = preempt_timeout_ms;
91062306a36Sopenharmony_ci	if (err)
91162306a36Sopenharmony_ci		pr_err("%s: %s error %d\n", __func__, engine->name, err);
91262306a36Sopenharmony_ci	return err;
91362306a36Sopenharmony_ci}
91462306a36Sopenharmony_ci
91562306a36Sopenharmony_cistatic int live_cancel_request(void *arg)
91662306a36Sopenharmony_ci{
91762306a36Sopenharmony_ci	struct drm_i915_private *i915 = arg;
91862306a36Sopenharmony_ci	struct intel_engine_cs *engine;
91962306a36Sopenharmony_ci
92062306a36Sopenharmony_ci	/*
92162306a36Sopenharmony_ci	 * Check cancellation of requests. We expect to be able to immediately
92262306a36Sopenharmony_ci	 * cancel active requests, even if they are currently on the GPU.
92362306a36Sopenharmony_ci	 */
92462306a36Sopenharmony_ci
92562306a36Sopenharmony_ci	for_each_uabi_engine(engine, i915) {
92662306a36Sopenharmony_ci		struct igt_live_test t;
92762306a36Sopenharmony_ci		int err, err2;
92862306a36Sopenharmony_ci
92962306a36Sopenharmony_ci		if (!intel_engine_has_preemption(engine))
93062306a36Sopenharmony_ci			continue;
93162306a36Sopenharmony_ci
93262306a36Sopenharmony_ci		err = igt_live_test_begin(&t, i915, __func__, engine->name);
93362306a36Sopenharmony_ci		if (err)
93462306a36Sopenharmony_ci			return err;
93562306a36Sopenharmony_ci
93662306a36Sopenharmony_ci		err = __cancel_inactive(engine);
93762306a36Sopenharmony_ci		if (err == 0)
93862306a36Sopenharmony_ci			err = __cancel_active(engine);
93962306a36Sopenharmony_ci		if (err == 0)
94062306a36Sopenharmony_ci			err = __cancel_completed(engine);
94162306a36Sopenharmony_ci
94262306a36Sopenharmony_ci		err2 = igt_live_test_end(&t);
94362306a36Sopenharmony_ci		if (err)
94462306a36Sopenharmony_ci			return err;
94562306a36Sopenharmony_ci		if (err2)
94662306a36Sopenharmony_ci			return err2;
94762306a36Sopenharmony_ci
94862306a36Sopenharmony_ci		/* Expects reset so call outside of igt_live_test_* */
94962306a36Sopenharmony_ci		err = __cancel_reset(i915, engine);
95062306a36Sopenharmony_ci		if (err)
95162306a36Sopenharmony_ci			return err;
95262306a36Sopenharmony_ci
95362306a36Sopenharmony_ci		if (igt_flush_test(i915))
95462306a36Sopenharmony_ci			return -EIO;
95562306a36Sopenharmony_ci	}
95662306a36Sopenharmony_ci
95762306a36Sopenharmony_ci	return 0;
95862306a36Sopenharmony_ci}
95962306a36Sopenharmony_ci
96062306a36Sopenharmony_cistatic struct i915_vma *empty_batch(struct intel_gt *gt)
96162306a36Sopenharmony_ci{
96262306a36Sopenharmony_ci	struct drm_i915_gem_object *obj;
96362306a36Sopenharmony_ci	struct i915_vma *vma;
96462306a36Sopenharmony_ci	u32 *cmd;
96562306a36Sopenharmony_ci	int err;
96662306a36Sopenharmony_ci
96762306a36Sopenharmony_ci	obj = i915_gem_object_create_internal(gt->i915, PAGE_SIZE);
96862306a36Sopenharmony_ci	if (IS_ERR(obj))
96962306a36Sopenharmony_ci		return ERR_CAST(obj);
97062306a36Sopenharmony_ci
97162306a36Sopenharmony_ci	cmd = i915_gem_object_pin_map_unlocked(obj, I915_MAP_WC);
97262306a36Sopenharmony_ci	if (IS_ERR(cmd)) {
97362306a36Sopenharmony_ci		err = PTR_ERR(cmd);
97462306a36Sopenharmony_ci		goto err;
97562306a36Sopenharmony_ci	}
97662306a36Sopenharmony_ci
97762306a36Sopenharmony_ci	*cmd = MI_BATCH_BUFFER_END;
97862306a36Sopenharmony_ci
97962306a36Sopenharmony_ci	__i915_gem_object_flush_map(obj, 0, 64);
98062306a36Sopenharmony_ci	i915_gem_object_unpin_map(obj);
98162306a36Sopenharmony_ci
98262306a36Sopenharmony_ci	intel_gt_chipset_flush(gt);
98362306a36Sopenharmony_ci
98462306a36Sopenharmony_ci	vma = i915_vma_instance(obj, gt->vm, NULL);
98562306a36Sopenharmony_ci	if (IS_ERR(vma)) {
98662306a36Sopenharmony_ci		err = PTR_ERR(vma);
98762306a36Sopenharmony_ci		goto err;
98862306a36Sopenharmony_ci	}
98962306a36Sopenharmony_ci
99062306a36Sopenharmony_ci	err = i915_vma_pin(vma, 0, 0, PIN_USER);
99162306a36Sopenharmony_ci	if (err)
99262306a36Sopenharmony_ci		goto err;
99362306a36Sopenharmony_ci
99462306a36Sopenharmony_ci	/* Force the wait now to avoid including it in the benchmark */
99562306a36Sopenharmony_ci	err = i915_vma_sync(vma);
99662306a36Sopenharmony_ci	if (err)
99762306a36Sopenharmony_ci		goto err_pin;
99862306a36Sopenharmony_ci
99962306a36Sopenharmony_ci	return vma;
100062306a36Sopenharmony_ci
100162306a36Sopenharmony_cierr_pin:
100262306a36Sopenharmony_ci	i915_vma_unpin(vma);
100362306a36Sopenharmony_cierr:
100462306a36Sopenharmony_ci	i915_gem_object_put(obj);
100562306a36Sopenharmony_ci	return ERR_PTR(err);
100662306a36Sopenharmony_ci}
100762306a36Sopenharmony_ci
100862306a36Sopenharmony_cistatic int emit_bb_start(struct i915_request *rq, struct i915_vma *batch)
100962306a36Sopenharmony_ci{
101062306a36Sopenharmony_ci	return rq->engine->emit_bb_start(rq,
101162306a36Sopenharmony_ci					 i915_vma_offset(batch),
101262306a36Sopenharmony_ci					 i915_vma_size(batch),
101362306a36Sopenharmony_ci					 0);
101462306a36Sopenharmony_ci}
101562306a36Sopenharmony_ci
101662306a36Sopenharmony_cistatic struct i915_request *
101762306a36Sopenharmony_ciempty_request(struct intel_engine_cs *engine,
101862306a36Sopenharmony_ci	      struct i915_vma *batch)
101962306a36Sopenharmony_ci{
102062306a36Sopenharmony_ci	struct i915_request *request;
102162306a36Sopenharmony_ci	int err;
102262306a36Sopenharmony_ci
102362306a36Sopenharmony_ci	request = i915_request_create(engine->kernel_context);
102462306a36Sopenharmony_ci	if (IS_ERR(request))
102562306a36Sopenharmony_ci		return request;
102662306a36Sopenharmony_ci
102762306a36Sopenharmony_ci	err = emit_bb_start(request, batch);
102862306a36Sopenharmony_ci	if (err)
102962306a36Sopenharmony_ci		goto out_request;
103062306a36Sopenharmony_ci
103162306a36Sopenharmony_ci	i915_request_get(request);
103262306a36Sopenharmony_ciout_request:
103362306a36Sopenharmony_ci	i915_request_add(request);
103462306a36Sopenharmony_ci	return err ? ERR_PTR(err) : request;
103562306a36Sopenharmony_ci}
103662306a36Sopenharmony_ci
103762306a36Sopenharmony_cistatic int live_empty_request(void *arg)
103862306a36Sopenharmony_ci{
103962306a36Sopenharmony_ci	struct drm_i915_private *i915 = arg;
104062306a36Sopenharmony_ci	struct intel_engine_cs *engine;
104162306a36Sopenharmony_ci	struct igt_live_test t;
104262306a36Sopenharmony_ci	int err;
104362306a36Sopenharmony_ci
104462306a36Sopenharmony_ci	/*
104562306a36Sopenharmony_ci	 * Submit various sized batches of empty requests, to each engine
104662306a36Sopenharmony_ci	 * (individually), and wait for the batch to complete. We can check
104762306a36Sopenharmony_ci	 * the overhead of submitting requests to the hardware.
104862306a36Sopenharmony_ci	 */
104962306a36Sopenharmony_ci
105062306a36Sopenharmony_ci	for_each_uabi_engine(engine, i915) {
105162306a36Sopenharmony_ci		IGT_TIMEOUT(end_time);
105262306a36Sopenharmony_ci		struct i915_request *request;
105362306a36Sopenharmony_ci		struct i915_vma *batch;
105462306a36Sopenharmony_ci		unsigned long n, prime;
105562306a36Sopenharmony_ci		ktime_t times[2] = {};
105662306a36Sopenharmony_ci
105762306a36Sopenharmony_ci		batch = empty_batch(engine->gt);
105862306a36Sopenharmony_ci		if (IS_ERR(batch))
105962306a36Sopenharmony_ci			return PTR_ERR(batch);
106062306a36Sopenharmony_ci
106162306a36Sopenharmony_ci		err = igt_live_test_begin(&t, i915, __func__, engine->name);
106262306a36Sopenharmony_ci		if (err)
106362306a36Sopenharmony_ci			goto out_batch;
106462306a36Sopenharmony_ci
106562306a36Sopenharmony_ci		intel_engine_pm_get(engine);
106662306a36Sopenharmony_ci
106762306a36Sopenharmony_ci		/* Warmup / preload */
106862306a36Sopenharmony_ci		request = empty_request(engine, batch);
106962306a36Sopenharmony_ci		if (IS_ERR(request)) {
107062306a36Sopenharmony_ci			err = PTR_ERR(request);
107162306a36Sopenharmony_ci			intel_engine_pm_put(engine);
107262306a36Sopenharmony_ci			goto out_batch;
107362306a36Sopenharmony_ci		}
107462306a36Sopenharmony_ci		i915_request_wait(request, 0, MAX_SCHEDULE_TIMEOUT);
107562306a36Sopenharmony_ci
107662306a36Sopenharmony_ci		for_each_prime_number_from(prime, 1, 8192) {
107762306a36Sopenharmony_ci			times[1] = ktime_get_raw();
107862306a36Sopenharmony_ci
107962306a36Sopenharmony_ci			for (n = 0; n < prime; n++) {
108062306a36Sopenharmony_ci				i915_request_put(request);
108162306a36Sopenharmony_ci				request = empty_request(engine, batch);
108262306a36Sopenharmony_ci				if (IS_ERR(request)) {
108362306a36Sopenharmony_ci					err = PTR_ERR(request);
108462306a36Sopenharmony_ci					intel_engine_pm_put(engine);
108562306a36Sopenharmony_ci					goto out_batch;
108662306a36Sopenharmony_ci				}
108762306a36Sopenharmony_ci			}
108862306a36Sopenharmony_ci			i915_request_wait(request, 0, MAX_SCHEDULE_TIMEOUT);
108962306a36Sopenharmony_ci
109062306a36Sopenharmony_ci			times[1] = ktime_sub(ktime_get_raw(), times[1]);
109162306a36Sopenharmony_ci			if (prime == 1)
109262306a36Sopenharmony_ci				times[0] = times[1];
109362306a36Sopenharmony_ci
109462306a36Sopenharmony_ci			if (__igt_timeout(end_time, NULL))
109562306a36Sopenharmony_ci				break;
109662306a36Sopenharmony_ci		}
109762306a36Sopenharmony_ci		i915_request_put(request);
109862306a36Sopenharmony_ci		intel_engine_pm_put(engine);
109962306a36Sopenharmony_ci
110062306a36Sopenharmony_ci		err = igt_live_test_end(&t);
110162306a36Sopenharmony_ci		if (err)
110262306a36Sopenharmony_ci			goto out_batch;
110362306a36Sopenharmony_ci
110462306a36Sopenharmony_ci		pr_info("Batch latencies on %s: 1 = %lluns, %lu = %lluns\n",
110562306a36Sopenharmony_ci			engine->name,
110662306a36Sopenharmony_ci			ktime_to_ns(times[0]),
110762306a36Sopenharmony_ci			prime, div64_u64(ktime_to_ns(times[1]), prime));
110862306a36Sopenharmony_ciout_batch:
110962306a36Sopenharmony_ci		i915_vma_unpin(batch);
111062306a36Sopenharmony_ci		i915_vma_put(batch);
111162306a36Sopenharmony_ci		if (err)
111262306a36Sopenharmony_ci			break;
111362306a36Sopenharmony_ci	}
111462306a36Sopenharmony_ci
111562306a36Sopenharmony_ci	return err;
111662306a36Sopenharmony_ci}
111762306a36Sopenharmony_ci
111862306a36Sopenharmony_cistatic struct i915_vma *recursive_batch(struct intel_gt *gt)
111962306a36Sopenharmony_ci{
112062306a36Sopenharmony_ci	struct drm_i915_gem_object *obj;
112162306a36Sopenharmony_ci	const int ver = GRAPHICS_VER(gt->i915);
112262306a36Sopenharmony_ci	struct i915_vma *vma;
112362306a36Sopenharmony_ci	u32 *cmd;
112462306a36Sopenharmony_ci	int err;
112562306a36Sopenharmony_ci
112662306a36Sopenharmony_ci	obj = i915_gem_object_create_internal(gt->i915, PAGE_SIZE);
112762306a36Sopenharmony_ci	if (IS_ERR(obj))
112862306a36Sopenharmony_ci		return ERR_CAST(obj);
112962306a36Sopenharmony_ci
113062306a36Sopenharmony_ci	vma = i915_vma_instance(obj, gt->vm, NULL);
113162306a36Sopenharmony_ci	if (IS_ERR(vma)) {
113262306a36Sopenharmony_ci		err = PTR_ERR(vma);
113362306a36Sopenharmony_ci		goto err;
113462306a36Sopenharmony_ci	}
113562306a36Sopenharmony_ci
113662306a36Sopenharmony_ci	err = i915_vma_pin(vma, 0, 0, PIN_USER);
113762306a36Sopenharmony_ci	if (err)
113862306a36Sopenharmony_ci		goto err;
113962306a36Sopenharmony_ci
114062306a36Sopenharmony_ci	cmd = i915_gem_object_pin_map_unlocked(obj, I915_MAP_WC);
114162306a36Sopenharmony_ci	if (IS_ERR(cmd)) {
114262306a36Sopenharmony_ci		err = PTR_ERR(cmd);
114362306a36Sopenharmony_ci		goto err;
114462306a36Sopenharmony_ci	}
114562306a36Sopenharmony_ci
114662306a36Sopenharmony_ci	if (ver >= 8) {
114762306a36Sopenharmony_ci		*cmd++ = MI_BATCH_BUFFER_START | 1 << 8 | 1;
114862306a36Sopenharmony_ci		*cmd++ = lower_32_bits(i915_vma_offset(vma));
114962306a36Sopenharmony_ci		*cmd++ = upper_32_bits(i915_vma_offset(vma));
115062306a36Sopenharmony_ci	} else if (ver >= 6) {
115162306a36Sopenharmony_ci		*cmd++ = MI_BATCH_BUFFER_START | 1 << 8;
115262306a36Sopenharmony_ci		*cmd++ = lower_32_bits(i915_vma_offset(vma));
115362306a36Sopenharmony_ci	} else {
115462306a36Sopenharmony_ci		*cmd++ = MI_BATCH_BUFFER_START | MI_BATCH_GTT;
115562306a36Sopenharmony_ci		*cmd++ = lower_32_bits(i915_vma_offset(vma));
115662306a36Sopenharmony_ci	}
115762306a36Sopenharmony_ci	*cmd++ = MI_BATCH_BUFFER_END; /* terminate early in case of error */
115862306a36Sopenharmony_ci
115962306a36Sopenharmony_ci	__i915_gem_object_flush_map(obj, 0, 64);
116062306a36Sopenharmony_ci	i915_gem_object_unpin_map(obj);
116162306a36Sopenharmony_ci
116262306a36Sopenharmony_ci	intel_gt_chipset_flush(gt);
116362306a36Sopenharmony_ci
116462306a36Sopenharmony_ci	return vma;
116562306a36Sopenharmony_ci
116662306a36Sopenharmony_cierr:
116762306a36Sopenharmony_ci	i915_gem_object_put(obj);
116862306a36Sopenharmony_ci	return ERR_PTR(err);
116962306a36Sopenharmony_ci}
117062306a36Sopenharmony_ci
117162306a36Sopenharmony_cistatic int recursive_batch_resolve(struct i915_vma *batch)
117262306a36Sopenharmony_ci{
117362306a36Sopenharmony_ci	u32 *cmd;
117462306a36Sopenharmony_ci
117562306a36Sopenharmony_ci	cmd = i915_gem_object_pin_map_unlocked(batch->obj, I915_MAP_WC);
117662306a36Sopenharmony_ci	if (IS_ERR(cmd))
117762306a36Sopenharmony_ci		return PTR_ERR(cmd);
117862306a36Sopenharmony_ci
117962306a36Sopenharmony_ci	*cmd = MI_BATCH_BUFFER_END;
118062306a36Sopenharmony_ci
118162306a36Sopenharmony_ci	__i915_gem_object_flush_map(batch->obj, 0, sizeof(*cmd));
118262306a36Sopenharmony_ci	i915_gem_object_unpin_map(batch->obj);
118362306a36Sopenharmony_ci
118462306a36Sopenharmony_ci	intel_gt_chipset_flush(batch->vm->gt);
118562306a36Sopenharmony_ci
118662306a36Sopenharmony_ci	return 0;
118762306a36Sopenharmony_ci}
118862306a36Sopenharmony_ci
118962306a36Sopenharmony_cistatic int live_all_engines(void *arg)
119062306a36Sopenharmony_ci{
119162306a36Sopenharmony_ci	struct drm_i915_private *i915 = arg;
119262306a36Sopenharmony_ci	const unsigned int nengines = num_uabi_engines(i915);
119362306a36Sopenharmony_ci	struct intel_engine_cs *engine;
119462306a36Sopenharmony_ci	struct i915_request **request;
119562306a36Sopenharmony_ci	struct igt_live_test t;
119662306a36Sopenharmony_ci	unsigned int idx;
119762306a36Sopenharmony_ci	int err;
119862306a36Sopenharmony_ci
119962306a36Sopenharmony_ci	/*
120062306a36Sopenharmony_ci	 * Check we can submit requests to all engines simultaneously. We
120162306a36Sopenharmony_ci	 * send a recursive batch to each engine - checking that we don't
120262306a36Sopenharmony_ci	 * block doing so, and that they don't complete too soon.
120362306a36Sopenharmony_ci	 */
120462306a36Sopenharmony_ci
120562306a36Sopenharmony_ci	request = kcalloc(nengines, sizeof(*request), GFP_KERNEL);
120662306a36Sopenharmony_ci	if (!request)
120762306a36Sopenharmony_ci		return -ENOMEM;
120862306a36Sopenharmony_ci
120962306a36Sopenharmony_ci	err = igt_live_test_begin(&t, i915, __func__, "");
121062306a36Sopenharmony_ci	if (err)
121162306a36Sopenharmony_ci		goto out_free;
121262306a36Sopenharmony_ci
121362306a36Sopenharmony_ci	idx = 0;
121462306a36Sopenharmony_ci	for_each_uabi_engine(engine, i915) {
121562306a36Sopenharmony_ci		struct i915_vma *batch;
121662306a36Sopenharmony_ci
121762306a36Sopenharmony_ci		batch = recursive_batch(engine->gt);
121862306a36Sopenharmony_ci		if (IS_ERR(batch)) {
121962306a36Sopenharmony_ci			err = PTR_ERR(batch);
122062306a36Sopenharmony_ci			pr_err("%s: Unable to create batch, err=%d\n",
122162306a36Sopenharmony_ci			       __func__, err);
122262306a36Sopenharmony_ci			goto out_free;
122362306a36Sopenharmony_ci		}
122462306a36Sopenharmony_ci
122562306a36Sopenharmony_ci		i915_vma_lock(batch);
122662306a36Sopenharmony_ci		request[idx] = intel_engine_create_kernel_request(engine);
122762306a36Sopenharmony_ci		if (IS_ERR(request[idx])) {
122862306a36Sopenharmony_ci			err = PTR_ERR(request[idx]);
122962306a36Sopenharmony_ci			pr_err("%s: Request allocation failed with err=%d\n",
123062306a36Sopenharmony_ci			       __func__, err);
123162306a36Sopenharmony_ci			goto out_unlock;
123262306a36Sopenharmony_ci		}
123362306a36Sopenharmony_ci		GEM_BUG_ON(request[idx]->context->vm != batch->vm);
123462306a36Sopenharmony_ci
123562306a36Sopenharmony_ci		err = i915_vma_move_to_active(batch, request[idx], 0);
123662306a36Sopenharmony_ci		GEM_BUG_ON(err);
123762306a36Sopenharmony_ci
123862306a36Sopenharmony_ci		err = emit_bb_start(request[idx], batch);
123962306a36Sopenharmony_ci		GEM_BUG_ON(err);
124062306a36Sopenharmony_ci		request[idx]->batch = batch;
124162306a36Sopenharmony_ci
124262306a36Sopenharmony_ci		i915_request_get(request[idx]);
124362306a36Sopenharmony_ci		i915_request_add(request[idx]);
124462306a36Sopenharmony_ci		idx++;
124562306a36Sopenharmony_ciout_unlock:
124662306a36Sopenharmony_ci		i915_vma_unlock(batch);
124762306a36Sopenharmony_ci		if (err)
124862306a36Sopenharmony_ci			goto out_request;
124962306a36Sopenharmony_ci	}
125062306a36Sopenharmony_ci
125162306a36Sopenharmony_ci	idx = 0;
125262306a36Sopenharmony_ci	for_each_uabi_engine(engine, i915) {
125362306a36Sopenharmony_ci		if (i915_request_completed(request[idx])) {
125462306a36Sopenharmony_ci			pr_err("%s(%s): request completed too early!\n",
125562306a36Sopenharmony_ci			       __func__, engine->name);
125662306a36Sopenharmony_ci			err = -EINVAL;
125762306a36Sopenharmony_ci			goto out_request;
125862306a36Sopenharmony_ci		}
125962306a36Sopenharmony_ci		idx++;
126062306a36Sopenharmony_ci	}
126162306a36Sopenharmony_ci
126262306a36Sopenharmony_ci	idx = 0;
126362306a36Sopenharmony_ci	for_each_uabi_engine(engine, i915) {
126462306a36Sopenharmony_ci		err = recursive_batch_resolve(request[idx]->batch);
126562306a36Sopenharmony_ci		if (err) {
126662306a36Sopenharmony_ci			pr_err("%s: failed to resolve batch, err=%d\n",
126762306a36Sopenharmony_ci			       __func__, err);
126862306a36Sopenharmony_ci			goto out_request;
126962306a36Sopenharmony_ci		}
127062306a36Sopenharmony_ci		idx++;
127162306a36Sopenharmony_ci	}
127262306a36Sopenharmony_ci
127362306a36Sopenharmony_ci	idx = 0;
127462306a36Sopenharmony_ci	for_each_uabi_engine(engine, i915) {
127562306a36Sopenharmony_ci		struct i915_request *rq = request[idx];
127662306a36Sopenharmony_ci		long timeout;
127762306a36Sopenharmony_ci
127862306a36Sopenharmony_ci		timeout = i915_request_wait(rq, 0,
127962306a36Sopenharmony_ci					    MAX_SCHEDULE_TIMEOUT);
128062306a36Sopenharmony_ci		if (timeout < 0) {
128162306a36Sopenharmony_ci			err = timeout;
128262306a36Sopenharmony_ci			pr_err("%s: error waiting for request on %s, err=%d\n",
128362306a36Sopenharmony_ci			       __func__, engine->name, err);
128462306a36Sopenharmony_ci			goto out_request;
128562306a36Sopenharmony_ci		}
128662306a36Sopenharmony_ci
128762306a36Sopenharmony_ci		GEM_BUG_ON(!i915_request_completed(rq));
128862306a36Sopenharmony_ci		i915_vma_unpin(rq->batch);
128962306a36Sopenharmony_ci		i915_vma_put(rq->batch);
129062306a36Sopenharmony_ci		i915_request_put(rq);
129162306a36Sopenharmony_ci		request[idx] = NULL;
129262306a36Sopenharmony_ci		idx++;
129362306a36Sopenharmony_ci	}
129462306a36Sopenharmony_ci
129562306a36Sopenharmony_ci	err = igt_live_test_end(&t);
129662306a36Sopenharmony_ci
129762306a36Sopenharmony_ciout_request:
129862306a36Sopenharmony_ci	idx = 0;
129962306a36Sopenharmony_ci	for_each_uabi_engine(engine, i915) {
130062306a36Sopenharmony_ci		struct i915_request *rq = request[idx];
130162306a36Sopenharmony_ci
130262306a36Sopenharmony_ci		if (!rq)
130362306a36Sopenharmony_ci			continue;
130462306a36Sopenharmony_ci
130562306a36Sopenharmony_ci		if (rq->batch) {
130662306a36Sopenharmony_ci			i915_vma_unpin(rq->batch);
130762306a36Sopenharmony_ci			i915_vma_put(rq->batch);
130862306a36Sopenharmony_ci		}
130962306a36Sopenharmony_ci		i915_request_put(rq);
131062306a36Sopenharmony_ci		idx++;
131162306a36Sopenharmony_ci	}
131262306a36Sopenharmony_ciout_free:
131362306a36Sopenharmony_ci	kfree(request);
131462306a36Sopenharmony_ci	return err;
131562306a36Sopenharmony_ci}
131662306a36Sopenharmony_ci
131762306a36Sopenharmony_cistatic int live_sequential_engines(void *arg)
131862306a36Sopenharmony_ci{
131962306a36Sopenharmony_ci	struct drm_i915_private *i915 = arg;
132062306a36Sopenharmony_ci	const unsigned int nengines = num_uabi_engines(i915);
132162306a36Sopenharmony_ci	struct i915_request **request;
132262306a36Sopenharmony_ci	struct i915_request *prev = NULL;
132362306a36Sopenharmony_ci	struct intel_engine_cs *engine;
132462306a36Sopenharmony_ci	struct igt_live_test t;
132562306a36Sopenharmony_ci	unsigned int idx;
132662306a36Sopenharmony_ci	int err;
132762306a36Sopenharmony_ci
132862306a36Sopenharmony_ci	/*
132962306a36Sopenharmony_ci	 * Check we can submit requests to all engines sequentially, such
133062306a36Sopenharmony_ci	 * that each successive request waits for the earlier ones. This
133162306a36Sopenharmony_ci	 * tests that we don't execute requests out of order, even though
133262306a36Sopenharmony_ci	 * they are running on independent engines.
133362306a36Sopenharmony_ci	 */
133462306a36Sopenharmony_ci
133562306a36Sopenharmony_ci	request = kcalloc(nengines, sizeof(*request), GFP_KERNEL);
133662306a36Sopenharmony_ci	if (!request)
133762306a36Sopenharmony_ci		return -ENOMEM;
133862306a36Sopenharmony_ci
133962306a36Sopenharmony_ci	err = igt_live_test_begin(&t, i915, __func__, "");
134062306a36Sopenharmony_ci	if (err)
134162306a36Sopenharmony_ci		goto out_free;
134262306a36Sopenharmony_ci
134362306a36Sopenharmony_ci	idx = 0;
134462306a36Sopenharmony_ci	for_each_uabi_engine(engine, i915) {
134562306a36Sopenharmony_ci		struct i915_vma *batch;
134662306a36Sopenharmony_ci
134762306a36Sopenharmony_ci		batch = recursive_batch(engine->gt);
134862306a36Sopenharmony_ci		if (IS_ERR(batch)) {
134962306a36Sopenharmony_ci			err = PTR_ERR(batch);
135062306a36Sopenharmony_ci			pr_err("%s: Unable to create batch for %s, err=%d\n",
135162306a36Sopenharmony_ci			       __func__, engine->name, err);
135262306a36Sopenharmony_ci			goto out_free;
135362306a36Sopenharmony_ci		}
135462306a36Sopenharmony_ci
135562306a36Sopenharmony_ci		i915_vma_lock(batch);
135662306a36Sopenharmony_ci		request[idx] = intel_engine_create_kernel_request(engine);
135762306a36Sopenharmony_ci		if (IS_ERR(request[idx])) {
135862306a36Sopenharmony_ci			err = PTR_ERR(request[idx]);
135962306a36Sopenharmony_ci			pr_err("%s: Request allocation failed for %s with err=%d\n",
136062306a36Sopenharmony_ci			       __func__, engine->name, err);
136162306a36Sopenharmony_ci			goto out_unlock;
136262306a36Sopenharmony_ci		}
136362306a36Sopenharmony_ci		GEM_BUG_ON(request[idx]->context->vm != batch->vm);
136462306a36Sopenharmony_ci
136562306a36Sopenharmony_ci		if (prev) {
136662306a36Sopenharmony_ci			err = i915_request_await_dma_fence(request[idx],
136762306a36Sopenharmony_ci							   &prev->fence);
136862306a36Sopenharmony_ci			if (err) {
136962306a36Sopenharmony_ci				i915_request_add(request[idx]);
137062306a36Sopenharmony_ci				pr_err("%s: Request await failed for %s with err=%d\n",
137162306a36Sopenharmony_ci				       __func__, engine->name, err);
137262306a36Sopenharmony_ci				goto out_unlock;
137362306a36Sopenharmony_ci			}
137462306a36Sopenharmony_ci		}
137562306a36Sopenharmony_ci
137662306a36Sopenharmony_ci		err = i915_vma_move_to_active(batch, request[idx], 0);
137762306a36Sopenharmony_ci		GEM_BUG_ON(err);
137862306a36Sopenharmony_ci
137962306a36Sopenharmony_ci		err = emit_bb_start(request[idx], batch);
138062306a36Sopenharmony_ci		GEM_BUG_ON(err);
138162306a36Sopenharmony_ci		request[idx]->batch = batch;
138262306a36Sopenharmony_ci
138362306a36Sopenharmony_ci		i915_request_get(request[idx]);
138462306a36Sopenharmony_ci		i915_request_add(request[idx]);
138562306a36Sopenharmony_ci
138662306a36Sopenharmony_ci		prev = request[idx];
138762306a36Sopenharmony_ci		idx++;
138862306a36Sopenharmony_ci
138962306a36Sopenharmony_ciout_unlock:
139062306a36Sopenharmony_ci		i915_vma_unlock(batch);
139162306a36Sopenharmony_ci		if (err)
139262306a36Sopenharmony_ci			goto out_request;
139362306a36Sopenharmony_ci	}
139462306a36Sopenharmony_ci
139562306a36Sopenharmony_ci	idx = 0;
139662306a36Sopenharmony_ci	for_each_uabi_engine(engine, i915) {
139762306a36Sopenharmony_ci		long timeout;
139862306a36Sopenharmony_ci
139962306a36Sopenharmony_ci		if (i915_request_completed(request[idx])) {
140062306a36Sopenharmony_ci			pr_err("%s(%s): request completed too early!\n",
140162306a36Sopenharmony_ci			       __func__, engine->name);
140262306a36Sopenharmony_ci			err = -EINVAL;
140362306a36Sopenharmony_ci			goto out_request;
140462306a36Sopenharmony_ci		}
140562306a36Sopenharmony_ci
140662306a36Sopenharmony_ci		err = recursive_batch_resolve(request[idx]->batch);
140762306a36Sopenharmony_ci		if (err) {
140862306a36Sopenharmony_ci			pr_err("%s: failed to resolve batch, err=%d\n",
140962306a36Sopenharmony_ci			       __func__, err);
141062306a36Sopenharmony_ci			goto out_request;
141162306a36Sopenharmony_ci		}
141262306a36Sopenharmony_ci
141362306a36Sopenharmony_ci		timeout = i915_request_wait(request[idx], 0,
141462306a36Sopenharmony_ci					    MAX_SCHEDULE_TIMEOUT);
141562306a36Sopenharmony_ci		if (timeout < 0) {
141662306a36Sopenharmony_ci			err = timeout;
141762306a36Sopenharmony_ci			pr_err("%s: error waiting for request on %s, err=%d\n",
141862306a36Sopenharmony_ci			       __func__, engine->name, err);
141962306a36Sopenharmony_ci			goto out_request;
142062306a36Sopenharmony_ci		}
142162306a36Sopenharmony_ci
142262306a36Sopenharmony_ci		GEM_BUG_ON(!i915_request_completed(request[idx]));
142362306a36Sopenharmony_ci		idx++;
142462306a36Sopenharmony_ci	}
142562306a36Sopenharmony_ci
142662306a36Sopenharmony_ci	err = igt_live_test_end(&t);
142762306a36Sopenharmony_ci
142862306a36Sopenharmony_ciout_request:
142962306a36Sopenharmony_ci	idx = 0;
143062306a36Sopenharmony_ci	for_each_uabi_engine(engine, i915) {
143162306a36Sopenharmony_ci		u32 *cmd;
143262306a36Sopenharmony_ci
143362306a36Sopenharmony_ci		if (!request[idx])
143462306a36Sopenharmony_ci			break;
143562306a36Sopenharmony_ci
143662306a36Sopenharmony_ci		cmd = i915_gem_object_pin_map_unlocked(request[idx]->batch->obj,
143762306a36Sopenharmony_ci						       I915_MAP_WC);
143862306a36Sopenharmony_ci		if (!IS_ERR(cmd)) {
143962306a36Sopenharmony_ci			*cmd = MI_BATCH_BUFFER_END;
144062306a36Sopenharmony_ci
144162306a36Sopenharmony_ci			__i915_gem_object_flush_map(request[idx]->batch->obj,
144262306a36Sopenharmony_ci						    0, sizeof(*cmd));
144362306a36Sopenharmony_ci			i915_gem_object_unpin_map(request[idx]->batch->obj);
144462306a36Sopenharmony_ci
144562306a36Sopenharmony_ci			intel_gt_chipset_flush(engine->gt);
144662306a36Sopenharmony_ci		}
144762306a36Sopenharmony_ci
144862306a36Sopenharmony_ci		i915_vma_put(request[idx]->batch);
144962306a36Sopenharmony_ci		i915_request_put(request[idx]);
145062306a36Sopenharmony_ci		idx++;
145162306a36Sopenharmony_ci	}
145262306a36Sopenharmony_ciout_free:
145362306a36Sopenharmony_ci	kfree(request);
145462306a36Sopenharmony_ci	return err;
145562306a36Sopenharmony_ci}
145662306a36Sopenharmony_ci
145762306a36Sopenharmony_cistruct parallel_thread {
145862306a36Sopenharmony_ci	struct kthread_worker *worker;
145962306a36Sopenharmony_ci	struct kthread_work work;
146062306a36Sopenharmony_ci	struct intel_engine_cs *engine;
146162306a36Sopenharmony_ci	int result;
146262306a36Sopenharmony_ci};
146362306a36Sopenharmony_ci
146462306a36Sopenharmony_cistatic void __live_parallel_engine1(struct kthread_work *work)
146562306a36Sopenharmony_ci{
146662306a36Sopenharmony_ci	struct parallel_thread *thread =
146762306a36Sopenharmony_ci		container_of(work, typeof(*thread), work);
146862306a36Sopenharmony_ci	struct intel_engine_cs *engine = thread->engine;
146962306a36Sopenharmony_ci	IGT_TIMEOUT(end_time);
147062306a36Sopenharmony_ci	unsigned long count;
147162306a36Sopenharmony_ci	int err = 0;
147262306a36Sopenharmony_ci
147362306a36Sopenharmony_ci	count = 0;
147462306a36Sopenharmony_ci	intel_engine_pm_get(engine);
147562306a36Sopenharmony_ci	do {
147662306a36Sopenharmony_ci		struct i915_request *rq;
147762306a36Sopenharmony_ci
147862306a36Sopenharmony_ci		rq = i915_request_create(engine->kernel_context);
147962306a36Sopenharmony_ci		if (IS_ERR(rq)) {
148062306a36Sopenharmony_ci			err = PTR_ERR(rq);
148162306a36Sopenharmony_ci			break;
148262306a36Sopenharmony_ci		}
148362306a36Sopenharmony_ci
148462306a36Sopenharmony_ci		i915_request_get(rq);
148562306a36Sopenharmony_ci		i915_request_add(rq);
148662306a36Sopenharmony_ci
148762306a36Sopenharmony_ci		err = 0;
148862306a36Sopenharmony_ci		if (i915_request_wait(rq, 0, HZ) < 0)
148962306a36Sopenharmony_ci			err = -ETIME;
149062306a36Sopenharmony_ci		i915_request_put(rq);
149162306a36Sopenharmony_ci		if (err)
149262306a36Sopenharmony_ci			break;
149362306a36Sopenharmony_ci
149462306a36Sopenharmony_ci		count++;
149562306a36Sopenharmony_ci	} while (!__igt_timeout(end_time, NULL));
149662306a36Sopenharmony_ci	intel_engine_pm_put(engine);
149762306a36Sopenharmony_ci
149862306a36Sopenharmony_ci	pr_info("%s: %lu request + sync\n", engine->name, count);
149962306a36Sopenharmony_ci	thread->result = err;
150062306a36Sopenharmony_ci}
150162306a36Sopenharmony_ci
150262306a36Sopenharmony_cistatic void __live_parallel_engineN(struct kthread_work *work)
150362306a36Sopenharmony_ci{
150462306a36Sopenharmony_ci	struct parallel_thread *thread =
150562306a36Sopenharmony_ci		container_of(work, typeof(*thread), work);
150662306a36Sopenharmony_ci	struct intel_engine_cs *engine = thread->engine;
150762306a36Sopenharmony_ci	IGT_TIMEOUT(end_time);
150862306a36Sopenharmony_ci	unsigned long count;
150962306a36Sopenharmony_ci	int err = 0;
151062306a36Sopenharmony_ci
151162306a36Sopenharmony_ci	count = 0;
151262306a36Sopenharmony_ci	intel_engine_pm_get(engine);
151362306a36Sopenharmony_ci	do {
151462306a36Sopenharmony_ci		struct i915_request *rq;
151562306a36Sopenharmony_ci
151662306a36Sopenharmony_ci		rq = i915_request_create(engine->kernel_context);
151762306a36Sopenharmony_ci		if (IS_ERR(rq)) {
151862306a36Sopenharmony_ci			err = PTR_ERR(rq);
151962306a36Sopenharmony_ci			break;
152062306a36Sopenharmony_ci		}
152162306a36Sopenharmony_ci
152262306a36Sopenharmony_ci		i915_request_add(rq);
152362306a36Sopenharmony_ci		count++;
152462306a36Sopenharmony_ci	} while (!__igt_timeout(end_time, NULL));
152562306a36Sopenharmony_ci	intel_engine_pm_put(engine);
152662306a36Sopenharmony_ci
152762306a36Sopenharmony_ci	pr_info("%s: %lu requests\n", engine->name, count);
152862306a36Sopenharmony_ci	thread->result = err;
152962306a36Sopenharmony_ci}
153062306a36Sopenharmony_ci
153162306a36Sopenharmony_cistatic bool wake_all(struct drm_i915_private *i915)
153262306a36Sopenharmony_ci{
153362306a36Sopenharmony_ci	if (atomic_dec_and_test(&i915->selftest.counter)) {
153462306a36Sopenharmony_ci		wake_up_var(&i915->selftest.counter);
153562306a36Sopenharmony_ci		return true;
153662306a36Sopenharmony_ci	}
153762306a36Sopenharmony_ci
153862306a36Sopenharmony_ci	return false;
153962306a36Sopenharmony_ci}
154062306a36Sopenharmony_ci
154162306a36Sopenharmony_cistatic int wait_for_all(struct drm_i915_private *i915)
154262306a36Sopenharmony_ci{
154362306a36Sopenharmony_ci	if (wake_all(i915))
154462306a36Sopenharmony_ci		return 0;
154562306a36Sopenharmony_ci
154662306a36Sopenharmony_ci	if (wait_var_event_timeout(&i915->selftest.counter,
154762306a36Sopenharmony_ci				   !atomic_read(&i915->selftest.counter),
154862306a36Sopenharmony_ci				   i915_selftest.timeout_jiffies))
154962306a36Sopenharmony_ci		return 0;
155062306a36Sopenharmony_ci
155162306a36Sopenharmony_ci	return -ETIME;
155262306a36Sopenharmony_ci}
155362306a36Sopenharmony_ci
155462306a36Sopenharmony_cistatic void __live_parallel_spin(struct kthread_work *work)
155562306a36Sopenharmony_ci{
155662306a36Sopenharmony_ci	struct parallel_thread *thread =
155762306a36Sopenharmony_ci		container_of(work, typeof(*thread), work);
155862306a36Sopenharmony_ci	struct intel_engine_cs *engine = thread->engine;
155962306a36Sopenharmony_ci	struct igt_spinner spin;
156062306a36Sopenharmony_ci	struct i915_request *rq;
156162306a36Sopenharmony_ci	int err = 0;
156262306a36Sopenharmony_ci
156362306a36Sopenharmony_ci	/*
156462306a36Sopenharmony_ci	 * Create a spinner running for eternity on each engine. If a second
156562306a36Sopenharmony_ci	 * spinner is incorrectly placed on the same engine, it will not be
156662306a36Sopenharmony_ci	 * able to start in time.
156762306a36Sopenharmony_ci	 */
156862306a36Sopenharmony_ci
156962306a36Sopenharmony_ci	if (igt_spinner_init(&spin, engine->gt)) {
157062306a36Sopenharmony_ci		wake_all(engine->i915);
157162306a36Sopenharmony_ci		thread->result = -ENOMEM;
157262306a36Sopenharmony_ci		return;
157362306a36Sopenharmony_ci	}
157462306a36Sopenharmony_ci
157562306a36Sopenharmony_ci	intel_engine_pm_get(engine);
157662306a36Sopenharmony_ci	rq = igt_spinner_create_request(&spin,
157762306a36Sopenharmony_ci					engine->kernel_context,
157862306a36Sopenharmony_ci					MI_NOOP); /* no preemption */
157962306a36Sopenharmony_ci	intel_engine_pm_put(engine);
158062306a36Sopenharmony_ci	if (IS_ERR(rq)) {
158162306a36Sopenharmony_ci		err = PTR_ERR(rq);
158262306a36Sopenharmony_ci		if (err == -ENODEV)
158362306a36Sopenharmony_ci			err = 0;
158462306a36Sopenharmony_ci		wake_all(engine->i915);
158562306a36Sopenharmony_ci		goto out_spin;
158662306a36Sopenharmony_ci	}
158762306a36Sopenharmony_ci
158862306a36Sopenharmony_ci	i915_request_get(rq);
158962306a36Sopenharmony_ci	i915_request_add(rq);
159062306a36Sopenharmony_ci	if (igt_wait_for_spinner(&spin, rq)) {
159162306a36Sopenharmony_ci		/* Occupy this engine for the whole test */
159262306a36Sopenharmony_ci		err = wait_for_all(engine->i915);
159362306a36Sopenharmony_ci	} else {
159462306a36Sopenharmony_ci		pr_err("Failed to start spinner on %s\n", engine->name);
159562306a36Sopenharmony_ci		err = -EINVAL;
159662306a36Sopenharmony_ci	}
159762306a36Sopenharmony_ci	igt_spinner_end(&spin);
159862306a36Sopenharmony_ci
159962306a36Sopenharmony_ci	if (err == 0 && i915_request_wait(rq, 0, HZ) < 0)
160062306a36Sopenharmony_ci		err = -EIO;
160162306a36Sopenharmony_ci	i915_request_put(rq);
160262306a36Sopenharmony_ci
160362306a36Sopenharmony_ciout_spin:
160462306a36Sopenharmony_ci	igt_spinner_fini(&spin);
160562306a36Sopenharmony_ci	thread->result = err;
160662306a36Sopenharmony_ci}
160762306a36Sopenharmony_ci
160862306a36Sopenharmony_cistatic int live_parallel_engines(void *arg)
160962306a36Sopenharmony_ci{
161062306a36Sopenharmony_ci	struct drm_i915_private *i915 = arg;
161162306a36Sopenharmony_ci	static void (* const func[])(struct kthread_work *) = {
161262306a36Sopenharmony_ci		__live_parallel_engine1,
161362306a36Sopenharmony_ci		__live_parallel_engineN,
161462306a36Sopenharmony_ci		__live_parallel_spin,
161562306a36Sopenharmony_ci		NULL,
161662306a36Sopenharmony_ci	};
161762306a36Sopenharmony_ci	const unsigned int nengines = num_uabi_engines(i915);
161862306a36Sopenharmony_ci	struct parallel_thread *threads;
161962306a36Sopenharmony_ci	struct intel_engine_cs *engine;
162062306a36Sopenharmony_ci	void (* const *fn)(struct kthread_work *);
162162306a36Sopenharmony_ci	int err = 0;
162262306a36Sopenharmony_ci
162362306a36Sopenharmony_ci	/*
162462306a36Sopenharmony_ci	 * Check we can submit requests to all engines concurrently. This
162562306a36Sopenharmony_ci	 * tests that we load up the system maximally.
162662306a36Sopenharmony_ci	 */
162762306a36Sopenharmony_ci
162862306a36Sopenharmony_ci	threads = kcalloc(nengines, sizeof(*threads), GFP_KERNEL);
162962306a36Sopenharmony_ci	if (!threads)
163062306a36Sopenharmony_ci		return -ENOMEM;
163162306a36Sopenharmony_ci
163262306a36Sopenharmony_ci	for (fn = func; !err && *fn; fn++) {
163362306a36Sopenharmony_ci		char name[KSYM_NAME_LEN];
163462306a36Sopenharmony_ci		struct igt_live_test t;
163562306a36Sopenharmony_ci		unsigned int idx;
163662306a36Sopenharmony_ci
163762306a36Sopenharmony_ci		snprintf(name, sizeof(name), "%ps", *fn);
163862306a36Sopenharmony_ci		err = igt_live_test_begin(&t, i915, __func__, name);
163962306a36Sopenharmony_ci		if (err)
164062306a36Sopenharmony_ci			break;
164162306a36Sopenharmony_ci
164262306a36Sopenharmony_ci		atomic_set(&i915->selftest.counter, nengines);
164362306a36Sopenharmony_ci
164462306a36Sopenharmony_ci		idx = 0;
164562306a36Sopenharmony_ci		for_each_uabi_engine(engine, i915) {
164662306a36Sopenharmony_ci			struct kthread_worker *worker;
164762306a36Sopenharmony_ci
164862306a36Sopenharmony_ci			worker = kthread_create_worker(0, "igt/parallel:%s",
164962306a36Sopenharmony_ci						       engine->name);
165062306a36Sopenharmony_ci			if (IS_ERR(worker)) {
165162306a36Sopenharmony_ci				err = PTR_ERR(worker);
165262306a36Sopenharmony_ci				break;
165362306a36Sopenharmony_ci			}
165462306a36Sopenharmony_ci
165562306a36Sopenharmony_ci			threads[idx].worker = worker;
165662306a36Sopenharmony_ci			threads[idx].result = 0;
165762306a36Sopenharmony_ci			threads[idx].engine = engine;
165862306a36Sopenharmony_ci
165962306a36Sopenharmony_ci			kthread_init_work(&threads[idx].work, *fn);
166062306a36Sopenharmony_ci			kthread_queue_work(worker, &threads[idx].work);
166162306a36Sopenharmony_ci			idx++;
166262306a36Sopenharmony_ci		}
166362306a36Sopenharmony_ci
166462306a36Sopenharmony_ci		idx = 0;
166562306a36Sopenharmony_ci		for_each_uabi_engine(engine, i915) {
166662306a36Sopenharmony_ci			int status;
166762306a36Sopenharmony_ci
166862306a36Sopenharmony_ci			if (!threads[idx].worker)
166962306a36Sopenharmony_ci				break;
167062306a36Sopenharmony_ci
167162306a36Sopenharmony_ci			kthread_flush_work(&threads[idx].work);
167262306a36Sopenharmony_ci			status = READ_ONCE(threads[idx].result);
167362306a36Sopenharmony_ci			if (status && !err)
167462306a36Sopenharmony_ci				err = status;
167562306a36Sopenharmony_ci
167662306a36Sopenharmony_ci			kthread_destroy_worker(threads[idx++].worker);
167762306a36Sopenharmony_ci		}
167862306a36Sopenharmony_ci
167962306a36Sopenharmony_ci		if (igt_live_test_end(&t))
168062306a36Sopenharmony_ci			err = -EIO;
168162306a36Sopenharmony_ci	}
168262306a36Sopenharmony_ci
168362306a36Sopenharmony_ci	kfree(threads);
168462306a36Sopenharmony_ci	return err;
168562306a36Sopenharmony_ci}
168662306a36Sopenharmony_ci
168762306a36Sopenharmony_cistatic int
168862306a36Sopenharmony_cimax_batches(struct i915_gem_context *ctx, struct intel_engine_cs *engine)
168962306a36Sopenharmony_ci{
169062306a36Sopenharmony_ci	struct i915_request *rq;
169162306a36Sopenharmony_ci	int ret;
169262306a36Sopenharmony_ci
169362306a36Sopenharmony_ci	/*
169462306a36Sopenharmony_ci	 * Before execlists, all contexts share the same ringbuffer. With
169562306a36Sopenharmony_ci	 * execlists, each context/engine has a separate ringbuffer and
169662306a36Sopenharmony_ci	 * for the purposes of this test, inexhaustible.
169762306a36Sopenharmony_ci	 *
169862306a36Sopenharmony_ci	 * For the global ringbuffer though, we have to be very careful
169962306a36Sopenharmony_ci	 * that we do not wrap while preventing the execution of requests
170062306a36Sopenharmony_ci	 * with a unsignaled fence.
170162306a36Sopenharmony_ci	 */
170262306a36Sopenharmony_ci	if (HAS_EXECLISTS(ctx->i915))
170362306a36Sopenharmony_ci		return INT_MAX;
170462306a36Sopenharmony_ci
170562306a36Sopenharmony_ci	rq = igt_request_alloc(ctx, engine);
170662306a36Sopenharmony_ci	if (IS_ERR(rq)) {
170762306a36Sopenharmony_ci		ret = PTR_ERR(rq);
170862306a36Sopenharmony_ci	} else {
170962306a36Sopenharmony_ci		int sz;
171062306a36Sopenharmony_ci
171162306a36Sopenharmony_ci		ret = rq->ring->size - rq->reserved_space;
171262306a36Sopenharmony_ci		i915_request_add(rq);
171362306a36Sopenharmony_ci
171462306a36Sopenharmony_ci		sz = rq->ring->emit - rq->head;
171562306a36Sopenharmony_ci		if (sz < 0)
171662306a36Sopenharmony_ci			sz += rq->ring->size;
171762306a36Sopenharmony_ci		ret /= sz;
171862306a36Sopenharmony_ci		ret /= 2; /* leave half spare, in case of emergency! */
171962306a36Sopenharmony_ci	}
172062306a36Sopenharmony_ci
172162306a36Sopenharmony_ci	return ret;
172262306a36Sopenharmony_ci}
172362306a36Sopenharmony_ci
172462306a36Sopenharmony_cistatic int live_breadcrumbs_smoketest(void *arg)
172562306a36Sopenharmony_ci{
172662306a36Sopenharmony_ci	struct drm_i915_private *i915 = arg;
172762306a36Sopenharmony_ci	const unsigned int nengines = num_uabi_engines(i915);
172862306a36Sopenharmony_ci	const unsigned int ncpus = /* saturate with nengines * ncpus */
172962306a36Sopenharmony_ci		max_t(int, 2, DIV_ROUND_UP(num_online_cpus(), nengines));
173062306a36Sopenharmony_ci	unsigned long num_waits, num_fences;
173162306a36Sopenharmony_ci	struct intel_engine_cs *engine;
173262306a36Sopenharmony_ci	struct smoke_thread *threads;
173362306a36Sopenharmony_ci	struct igt_live_test live;
173462306a36Sopenharmony_ci	intel_wakeref_t wakeref;
173562306a36Sopenharmony_ci	struct smoketest *smoke;
173662306a36Sopenharmony_ci	unsigned int n, idx;
173762306a36Sopenharmony_ci	struct file *file;
173862306a36Sopenharmony_ci	int ret = 0;
173962306a36Sopenharmony_ci
174062306a36Sopenharmony_ci	/*
174162306a36Sopenharmony_ci	 * Smoketest our breadcrumb/signal handling for requests across multiple
174262306a36Sopenharmony_ci	 * threads. A very simple test to only catch the most egregious of bugs.
174362306a36Sopenharmony_ci	 * See __igt_breadcrumbs_smoketest();
174462306a36Sopenharmony_ci	 *
174562306a36Sopenharmony_ci	 * On real hardware this time.
174662306a36Sopenharmony_ci	 */
174762306a36Sopenharmony_ci
174862306a36Sopenharmony_ci	wakeref = intel_runtime_pm_get(&i915->runtime_pm);
174962306a36Sopenharmony_ci
175062306a36Sopenharmony_ci	file = mock_file(i915);
175162306a36Sopenharmony_ci	if (IS_ERR(file)) {
175262306a36Sopenharmony_ci		ret = PTR_ERR(file);
175362306a36Sopenharmony_ci		goto out_rpm;
175462306a36Sopenharmony_ci	}
175562306a36Sopenharmony_ci
175662306a36Sopenharmony_ci	smoke = kcalloc(nengines, sizeof(*smoke), GFP_KERNEL);
175762306a36Sopenharmony_ci	if (!smoke) {
175862306a36Sopenharmony_ci		ret = -ENOMEM;
175962306a36Sopenharmony_ci		goto out_file;
176062306a36Sopenharmony_ci	}
176162306a36Sopenharmony_ci
176262306a36Sopenharmony_ci	threads = kcalloc(ncpus * nengines, sizeof(*threads), GFP_KERNEL);
176362306a36Sopenharmony_ci	if (!threads) {
176462306a36Sopenharmony_ci		ret = -ENOMEM;
176562306a36Sopenharmony_ci		goto out_smoke;
176662306a36Sopenharmony_ci	}
176762306a36Sopenharmony_ci
176862306a36Sopenharmony_ci	smoke[0].request_alloc = __live_request_alloc;
176962306a36Sopenharmony_ci	smoke[0].ncontexts = 64;
177062306a36Sopenharmony_ci	smoke[0].contexts = kcalloc(smoke[0].ncontexts,
177162306a36Sopenharmony_ci				    sizeof(*smoke[0].contexts),
177262306a36Sopenharmony_ci				    GFP_KERNEL);
177362306a36Sopenharmony_ci	if (!smoke[0].contexts) {
177462306a36Sopenharmony_ci		ret = -ENOMEM;
177562306a36Sopenharmony_ci		goto out_threads;
177662306a36Sopenharmony_ci	}
177762306a36Sopenharmony_ci
177862306a36Sopenharmony_ci	for (n = 0; n < smoke[0].ncontexts; n++) {
177962306a36Sopenharmony_ci		smoke[0].contexts[n] = live_context(i915, file);
178062306a36Sopenharmony_ci		if (IS_ERR(smoke[0].contexts[n])) {
178162306a36Sopenharmony_ci			ret = PTR_ERR(smoke[0].contexts[n]);
178262306a36Sopenharmony_ci			goto out_contexts;
178362306a36Sopenharmony_ci		}
178462306a36Sopenharmony_ci	}
178562306a36Sopenharmony_ci
178662306a36Sopenharmony_ci	ret = igt_live_test_begin(&live, i915, __func__, "");
178762306a36Sopenharmony_ci	if (ret)
178862306a36Sopenharmony_ci		goto out_contexts;
178962306a36Sopenharmony_ci
179062306a36Sopenharmony_ci	idx = 0;
179162306a36Sopenharmony_ci	for_each_uabi_engine(engine, i915) {
179262306a36Sopenharmony_ci		smoke[idx] = smoke[0];
179362306a36Sopenharmony_ci		smoke[idx].engine = engine;
179462306a36Sopenharmony_ci		smoke[idx].max_batch =
179562306a36Sopenharmony_ci			max_batches(smoke[0].contexts[0], engine);
179662306a36Sopenharmony_ci		if (smoke[idx].max_batch < 0) {
179762306a36Sopenharmony_ci			ret = smoke[idx].max_batch;
179862306a36Sopenharmony_ci			goto out_flush;
179962306a36Sopenharmony_ci		}
180062306a36Sopenharmony_ci		/* One ring interleaved between requests from all cpus */
180162306a36Sopenharmony_ci		smoke[idx].max_batch /= ncpus + 1;
180262306a36Sopenharmony_ci		pr_debug("Limiting batches to %d requests on %s\n",
180362306a36Sopenharmony_ci			 smoke[idx].max_batch, engine->name);
180462306a36Sopenharmony_ci
180562306a36Sopenharmony_ci		for (n = 0; n < ncpus; n++) {
180662306a36Sopenharmony_ci			unsigned int i = idx * ncpus + n;
180762306a36Sopenharmony_ci			struct kthread_worker *worker;
180862306a36Sopenharmony_ci
180962306a36Sopenharmony_ci			worker = kthread_create_worker(0, "igt/%d.%d", idx, n);
181062306a36Sopenharmony_ci			if (IS_ERR(worker)) {
181162306a36Sopenharmony_ci				ret = PTR_ERR(worker);
181262306a36Sopenharmony_ci				goto out_flush;
181362306a36Sopenharmony_ci			}
181462306a36Sopenharmony_ci
181562306a36Sopenharmony_ci			threads[i].worker = worker;
181662306a36Sopenharmony_ci			threads[i].t = &smoke[idx];
181762306a36Sopenharmony_ci
181862306a36Sopenharmony_ci			kthread_init_work(&threads[i].work,
181962306a36Sopenharmony_ci					  __igt_breadcrumbs_smoketest);
182062306a36Sopenharmony_ci			kthread_queue_work(worker, &threads[i].work);
182162306a36Sopenharmony_ci		}
182262306a36Sopenharmony_ci
182362306a36Sopenharmony_ci		idx++;
182462306a36Sopenharmony_ci	}
182562306a36Sopenharmony_ci
182662306a36Sopenharmony_ci	msleep(jiffies_to_msecs(i915_selftest.timeout_jiffies));
182762306a36Sopenharmony_ci
182862306a36Sopenharmony_ciout_flush:
182962306a36Sopenharmony_ci	idx = 0;
183062306a36Sopenharmony_ci	num_waits = 0;
183162306a36Sopenharmony_ci	num_fences = 0;
183262306a36Sopenharmony_ci	for_each_uabi_engine(engine, i915) {
183362306a36Sopenharmony_ci		for (n = 0; n < ncpus; n++) {
183462306a36Sopenharmony_ci			unsigned int i = idx * ncpus + n;
183562306a36Sopenharmony_ci			int err;
183662306a36Sopenharmony_ci
183762306a36Sopenharmony_ci			if (!threads[i].worker)
183862306a36Sopenharmony_ci				continue;
183962306a36Sopenharmony_ci
184062306a36Sopenharmony_ci			WRITE_ONCE(threads[i].stop, true);
184162306a36Sopenharmony_ci			kthread_flush_work(&threads[i].work);
184262306a36Sopenharmony_ci			err = READ_ONCE(threads[i].result);
184362306a36Sopenharmony_ci			if (err < 0 && !ret)
184462306a36Sopenharmony_ci				ret = err;
184562306a36Sopenharmony_ci
184662306a36Sopenharmony_ci			kthread_destroy_worker(threads[i].worker);
184762306a36Sopenharmony_ci		}
184862306a36Sopenharmony_ci
184962306a36Sopenharmony_ci		num_waits += atomic_long_read(&smoke[idx].num_waits);
185062306a36Sopenharmony_ci		num_fences += atomic_long_read(&smoke[idx].num_fences);
185162306a36Sopenharmony_ci		idx++;
185262306a36Sopenharmony_ci	}
185362306a36Sopenharmony_ci	pr_info("Completed %lu waits for %lu fences across %d engines and %d cpus\n",
185462306a36Sopenharmony_ci		num_waits, num_fences, idx, ncpus);
185562306a36Sopenharmony_ci
185662306a36Sopenharmony_ci	ret = igt_live_test_end(&live) ?: ret;
185762306a36Sopenharmony_ciout_contexts:
185862306a36Sopenharmony_ci	kfree(smoke[0].contexts);
185962306a36Sopenharmony_ciout_threads:
186062306a36Sopenharmony_ci	kfree(threads);
186162306a36Sopenharmony_ciout_smoke:
186262306a36Sopenharmony_ci	kfree(smoke);
186362306a36Sopenharmony_ciout_file:
186462306a36Sopenharmony_ci	fput(file);
186562306a36Sopenharmony_ciout_rpm:
186662306a36Sopenharmony_ci	intel_runtime_pm_put(&i915->runtime_pm, wakeref);
186762306a36Sopenharmony_ci
186862306a36Sopenharmony_ci	return ret;
186962306a36Sopenharmony_ci}
187062306a36Sopenharmony_ci
187162306a36Sopenharmony_ciint i915_request_live_selftests(struct drm_i915_private *i915)
187262306a36Sopenharmony_ci{
187362306a36Sopenharmony_ci	static const struct i915_subtest tests[] = {
187462306a36Sopenharmony_ci		SUBTEST(live_nop_request),
187562306a36Sopenharmony_ci		SUBTEST(live_all_engines),
187662306a36Sopenharmony_ci		SUBTEST(live_sequential_engines),
187762306a36Sopenharmony_ci		SUBTEST(live_parallel_engines),
187862306a36Sopenharmony_ci		SUBTEST(live_empty_request),
187962306a36Sopenharmony_ci		SUBTEST(live_cancel_request),
188062306a36Sopenharmony_ci		SUBTEST(live_breadcrumbs_smoketest),
188162306a36Sopenharmony_ci	};
188262306a36Sopenharmony_ci
188362306a36Sopenharmony_ci	if (intel_gt_is_wedged(to_gt(i915)))
188462306a36Sopenharmony_ci		return 0;
188562306a36Sopenharmony_ci
188662306a36Sopenharmony_ci	return i915_live_subtests(tests, i915);
188762306a36Sopenharmony_ci}
188862306a36Sopenharmony_ci
188962306a36Sopenharmony_cistatic int switch_to_kernel_sync(struct intel_context *ce, int err)
189062306a36Sopenharmony_ci{
189162306a36Sopenharmony_ci	struct i915_request *rq;
189262306a36Sopenharmony_ci	struct dma_fence *fence;
189362306a36Sopenharmony_ci
189462306a36Sopenharmony_ci	rq = intel_engine_create_kernel_request(ce->engine);
189562306a36Sopenharmony_ci	if (IS_ERR(rq))
189662306a36Sopenharmony_ci		return PTR_ERR(rq);
189762306a36Sopenharmony_ci
189862306a36Sopenharmony_ci	fence = i915_active_fence_get(&ce->timeline->last_request);
189962306a36Sopenharmony_ci	if (fence) {
190062306a36Sopenharmony_ci		i915_request_await_dma_fence(rq, fence);
190162306a36Sopenharmony_ci		dma_fence_put(fence);
190262306a36Sopenharmony_ci	}
190362306a36Sopenharmony_ci
190462306a36Sopenharmony_ci	rq = i915_request_get(rq);
190562306a36Sopenharmony_ci	i915_request_add(rq);
190662306a36Sopenharmony_ci	if (i915_request_wait(rq, 0, HZ / 2) < 0 && !err)
190762306a36Sopenharmony_ci		err = -ETIME;
190862306a36Sopenharmony_ci	i915_request_put(rq);
190962306a36Sopenharmony_ci
191062306a36Sopenharmony_ci	while (!err && !intel_engine_is_idle(ce->engine))
191162306a36Sopenharmony_ci		intel_engine_flush_submission(ce->engine);
191262306a36Sopenharmony_ci
191362306a36Sopenharmony_ci	return err;
191462306a36Sopenharmony_ci}
191562306a36Sopenharmony_ci
191662306a36Sopenharmony_cistruct perf_stats {
191762306a36Sopenharmony_ci	struct intel_engine_cs *engine;
191862306a36Sopenharmony_ci	unsigned long count;
191962306a36Sopenharmony_ci	ktime_t time;
192062306a36Sopenharmony_ci	ktime_t busy;
192162306a36Sopenharmony_ci	u64 runtime;
192262306a36Sopenharmony_ci};
192362306a36Sopenharmony_ci
/*
 * A device together with a trailing array of contexts.
 * NOTE(review): presumably @ce holds @nengines entries, one per engine;
 * confirm against the code that allocates this structure.
 */
struct perf_series {
	struct drm_i915_private *i915;
	unsigned int nengines;
	/* flexible array member: must remain the last field */
	struct intel_context *ce[];
};
192962306a36Sopenharmony_ci
/*
 * Three-way comparison of two u32 values for sort().
 *
 * Returns a negative value, zero or a positive value when *A is less than,
 * equal to or greater than *B. The values are compared explicitly rather
 * than subtracted: an unsigned difference converted to int reports the
 * wrong order once the operands are more than INT_MAX apart.
 */
static int cmp_u32(const void *A, const void *B)
{
	const u32 *a = A, *b = B;

	if (*a < *b)
		return -1;
	if (*a > *b)
		return 1;
	return 0;
}
193662306a36Sopenharmony_ci
193762306a36Sopenharmony_cistatic u32 trifilter(u32 *a)
193862306a36Sopenharmony_ci{
193962306a36Sopenharmony_ci	u64 sum;
194062306a36Sopenharmony_ci
194162306a36Sopenharmony_ci#define TF_COUNT 5
194262306a36Sopenharmony_ci	sort(a, TF_COUNT, sizeof(*a), cmp_u32, NULL);
194362306a36Sopenharmony_ci
194462306a36Sopenharmony_ci	sum = mul_u32_u32(a[2], 2);
194562306a36Sopenharmony_ci	sum += a[1];
194662306a36Sopenharmony_ci	sum += a[3];
194762306a36Sopenharmony_ci
194862306a36Sopenharmony_ci	GEM_BUG_ON(sum > U32_MAX);
194962306a36Sopenharmony_ci	return sum;
195062306a36Sopenharmony_ci#define TF_BIAS 2
195162306a36Sopenharmony_ci}
195262306a36Sopenharmony_ci
195362306a36Sopenharmony_cistatic u64 cycles_to_ns(struct intel_engine_cs *engine, u32 cycles)
195462306a36Sopenharmony_ci{
195562306a36Sopenharmony_ci	u64 ns = intel_gt_clock_interval_to_ns(engine->gt, cycles);
195662306a36Sopenharmony_ci
195762306a36Sopenharmony_ci	return DIV_ROUND_CLOSEST(ns, 1 << TF_BIAS);
195862306a36Sopenharmony_ci}
195962306a36Sopenharmony_ci
196062306a36Sopenharmony_cistatic u32 *emit_timestamp_store(u32 *cs, struct intel_context *ce, u32 offset)
196162306a36Sopenharmony_ci{
196262306a36Sopenharmony_ci	*cs++ = MI_STORE_REGISTER_MEM_GEN8 | MI_USE_GGTT;
196362306a36Sopenharmony_ci	*cs++ = i915_mmio_reg_offset(RING_TIMESTAMP((ce->engine->mmio_base)));
196462306a36Sopenharmony_ci	*cs++ = offset;
196562306a36Sopenharmony_ci	*cs++ = 0;
196662306a36Sopenharmony_ci
196762306a36Sopenharmony_ci	return cs;
196862306a36Sopenharmony_ci}
196962306a36Sopenharmony_ci
197062306a36Sopenharmony_cistatic u32 *emit_store_dw(u32 *cs, u32 offset, u32 value)
197162306a36Sopenharmony_ci{
197262306a36Sopenharmony_ci	*cs++ = MI_STORE_DWORD_IMM_GEN4 | MI_USE_GGTT;
197362306a36Sopenharmony_ci	*cs++ = offset;
197462306a36Sopenharmony_ci	*cs++ = 0;
197562306a36Sopenharmony_ci	*cs++ = value;
197662306a36Sopenharmony_ci
197762306a36Sopenharmony_ci	return cs;
197862306a36Sopenharmony_ci}
197962306a36Sopenharmony_ci
198062306a36Sopenharmony_cistatic u32 *emit_semaphore_poll(u32 *cs, u32 mode, u32 value, u32 offset)
198162306a36Sopenharmony_ci{
198262306a36Sopenharmony_ci	*cs++ = MI_SEMAPHORE_WAIT |
198362306a36Sopenharmony_ci		MI_SEMAPHORE_GLOBAL_GTT |
198462306a36Sopenharmony_ci		MI_SEMAPHORE_POLL |
198562306a36Sopenharmony_ci		mode;
198662306a36Sopenharmony_ci	*cs++ = value;
198762306a36Sopenharmony_ci	*cs++ = offset;
198862306a36Sopenharmony_ci	*cs++ = 0;
198962306a36Sopenharmony_ci
199062306a36Sopenharmony_ci	return cs;
199162306a36Sopenharmony_ci}
199262306a36Sopenharmony_ci
199362306a36Sopenharmony_cistatic u32 *emit_semaphore_poll_until(u32 *cs, u32 offset, u32 value)
199462306a36Sopenharmony_ci{
199562306a36Sopenharmony_ci	return emit_semaphore_poll(cs, MI_SEMAPHORE_SAD_EQ_SDD, value, offset);
199662306a36Sopenharmony_ci}
199762306a36Sopenharmony_ci
199862306a36Sopenharmony_cistatic void semaphore_set(u32 *sema, u32 value)
199962306a36Sopenharmony_ci{
200062306a36Sopenharmony_ci	WRITE_ONCE(*sema, value);
200162306a36Sopenharmony_ci	wmb(); /* flush the update to the cache, and beyond */
200262306a36Sopenharmony_ci}
200362306a36Sopenharmony_ci
200462306a36Sopenharmony_cistatic u32 *hwsp_scratch(const struct intel_context *ce)
200562306a36Sopenharmony_ci{
200662306a36Sopenharmony_ci	return memset32(ce->engine->status_page.addr + 1000, 0, 21);
200762306a36Sopenharmony_ci}
200862306a36Sopenharmony_ci
200962306a36Sopenharmony_cistatic u32 hwsp_offset(const struct intel_context *ce, u32 *dw)
201062306a36Sopenharmony_ci{
201162306a36Sopenharmony_ci	return (i915_ggtt_offset(ce->engine->status_page.vma) +
201262306a36Sopenharmony_ci		offset_in_page(dw));
201362306a36Sopenharmony_ci}
201462306a36Sopenharmony_ci
201562306a36Sopenharmony_cistatic int measure_semaphore_response(struct intel_context *ce)
201662306a36Sopenharmony_ci{
201762306a36Sopenharmony_ci	u32 *sema = hwsp_scratch(ce);
201862306a36Sopenharmony_ci	const u32 offset = hwsp_offset(ce, sema);
201962306a36Sopenharmony_ci	u32 elapsed[TF_COUNT], cycles;
202062306a36Sopenharmony_ci	struct i915_request *rq;
202162306a36Sopenharmony_ci	u32 *cs;
202262306a36Sopenharmony_ci	int err;
202362306a36Sopenharmony_ci	int i;
202462306a36Sopenharmony_ci
202562306a36Sopenharmony_ci	/*
202662306a36Sopenharmony_ci	 * Measure how many cycles it takes for the HW to detect the change
202762306a36Sopenharmony_ci	 * in a semaphore value.
202862306a36Sopenharmony_ci	 *
202962306a36Sopenharmony_ci	 *    A: read CS_TIMESTAMP from CPU
203062306a36Sopenharmony_ci	 *    poke semaphore
203162306a36Sopenharmony_ci	 *    B: read CS_TIMESTAMP on GPU
203262306a36Sopenharmony_ci	 *
203362306a36Sopenharmony_ci	 * Semaphore latency: B - A
203462306a36Sopenharmony_ci	 */
203562306a36Sopenharmony_ci
203662306a36Sopenharmony_ci	semaphore_set(sema, -1);
203762306a36Sopenharmony_ci
203862306a36Sopenharmony_ci	rq = i915_request_create(ce);
203962306a36Sopenharmony_ci	if (IS_ERR(rq))
204062306a36Sopenharmony_ci		return PTR_ERR(rq);
204162306a36Sopenharmony_ci
204262306a36Sopenharmony_ci	cs = intel_ring_begin(rq, 4 + 12 * ARRAY_SIZE(elapsed));
204362306a36Sopenharmony_ci	if (IS_ERR(cs)) {
204462306a36Sopenharmony_ci		i915_request_add(rq);
204562306a36Sopenharmony_ci		err = PTR_ERR(cs);
204662306a36Sopenharmony_ci		goto err;
204762306a36Sopenharmony_ci	}
204862306a36Sopenharmony_ci
204962306a36Sopenharmony_ci	cs = emit_store_dw(cs, offset, 0);
205062306a36Sopenharmony_ci	for (i = 1; i <= ARRAY_SIZE(elapsed); i++) {
205162306a36Sopenharmony_ci		cs = emit_semaphore_poll_until(cs, offset, i);
205262306a36Sopenharmony_ci		cs = emit_timestamp_store(cs, ce, offset + i * sizeof(u32));
205362306a36Sopenharmony_ci		cs = emit_store_dw(cs, offset, 0);
205462306a36Sopenharmony_ci	}
205562306a36Sopenharmony_ci
205662306a36Sopenharmony_ci	intel_ring_advance(rq, cs);
205762306a36Sopenharmony_ci	i915_request_add(rq);
205862306a36Sopenharmony_ci
205962306a36Sopenharmony_ci	if (wait_for(READ_ONCE(*sema) == 0, 50)) {
206062306a36Sopenharmony_ci		err = -EIO;
206162306a36Sopenharmony_ci		goto err;
206262306a36Sopenharmony_ci	}
206362306a36Sopenharmony_ci
206462306a36Sopenharmony_ci	for (i = 1; i <= ARRAY_SIZE(elapsed); i++) {
206562306a36Sopenharmony_ci		preempt_disable();
206662306a36Sopenharmony_ci		cycles = ENGINE_READ_FW(ce->engine, RING_TIMESTAMP);
206762306a36Sopenharmony_ci		semaphore_set(sema, i);
206862306a36Sopenharmony_ci		preempt_enable();
206962306a36Sopenharmony_ci
207062306a36Sopenharmony_ci		if (wait_for(READ_ONCE(*sema) == 0, 50)) {
207162306a36Sopenharmony_ci			err = -EIO;
207262306a36Sopenharmony_ci			goto err;
207362306a36Sopenharmony_ci		}
207462306a36Sopenharmony_ci
207562306a36Sopenharmony_ci		elapsed[i - 1] = sema[i] - cycles;
207662306a36Sopenharmony_ci	}
207762306a36Sopenharmony_ci
207862306a36Sopenharmony_ci	cycles = trifilter(elapsed);
207962306a36Sopenharmony_ci	pr_info("%s: semaphore response %d cycles, %lluns\n",
208062306a36Sopenharmony_ci		ce->engine->name, cycles >> TF_BIAS,
208162306a36Sopenharmony_ci		cycles_to_ns(ce->engine, cycles));
208262306a36Sopenharmony_ci
208362306a36Sopenharmony_ci	return intel_gt_wait_for_idle(ce->engine->gt, HZ);
208462306a36Sopenharmony_ci
208562306a36Sopenharmony_cierr:
208662306a36Sopenharmony_ci	intel_gt_set_wedged(ce->engine->gt);
208762306a36Sopenharmony_ci	return err;
208862306a36Sopenharmony_ci}
208962306a36Sopenharmony_ci
209062306a36Sopenharmony_cistatic int measure_idle_dispatch(struct intel_context *ce)
209162306a36Sopenharmony_ci{
209262306a36Sopenharmony_ci	u32 *sema = hwsp_scratch(ce);
209362306a36Sopenharmony_ci	const u32 offset = hwsp_offset(ce, sema);
209462306a36Sopenharmony_ci	u32 elapsed[TF_COUNT], cycles;
209562306a36Sopenharmony_ci	u32 *cs;
209662306a36Sopenharmony_ci	int err;
209762306a36Sopenharmony_ci	int i;
209862306a36Sopenharmony_ci
209962306a36Sopenharmony_ci	/*
210062306a36Sopenharmony_ci	 * Measure how long it takes for us to submit a request while the
210162306a36Sopenharmony_ci	 * engine is idle, but is resting in our context.
210262306a36Sopenharmony_ci	 *
210362306a36Sopenharmony_ci	 *    A: read CS_TIMESTAMP from CPU
210462306a36Sopenharmony_ci	 *    submit request
210562306a36Sopenharmony_ci	 *    B: read CS_TIMESTAMP on GPU
210662306a36Sopenharmony_ci	 *
210762306a36Sopenharmony_ci	 * Submission latency: B - A
210862306a36Sopenharmony_ci	 */
210962306a36Sopenharmony_ci
211062306a36Sopenharmony_ci	for (i = 0; i < ARRAY_SIZE(elapsed); i++) {
211162306a36Sopenharmony_ci		struct i915_request *rq;
211262306a36Sopenharmony_ci
211362306a36Sopenharmony_ci		err = intel_gt_wait_for_idle(ce->engine->gt, HZ / 2);
211462306a36Sopenharmony_ci		if (err)
211562306a36Sopenharmony_ci			return err;
211662306a36Sopenharmony_ci
211762306a36Sopenharmony_ci		rq = i915_request_create(ce);
211862306a36Sopenharmony_ci		if (IS_ERR(rq)) {
211962306a36Sopenharmony_ci			err = PTR_ERR(rq);
212062306a36Sopenharmony_ci			goto err;
212162306a36Sopenharmony_ci		}
212262306a36Sopenharmony_ci
212362306a36Sopenharmony_ci		cs = intel_ring_begin(rq, 4);
212462306a36Sopenharmony_ci		if (IS_ERR(cs)) {
212562306a36Sopenharmony_ci			i915_request_add(rq);
212662306a36Sopenharmony_ci			err = PTR_ERR(cs);
212762306a36Sopenharmony_ci			goto err;
212862306a36Sopenharmony_ci		}
212962306a36Sopenharmony_ci
213062306a36Sopenharmony_ci		cs = emit_timestamp_store(cs, ce, offset + i * sizeof(u32));
213162306a36Sopenharmony_ci
213262306a36Sopenharmony_ci		intel_ring_advance(rq, cs);
213362306a36Sopenharmony_ci
213462306a36Sopenharmony_ci		preempt_disable();
213562306a36Sopenharmony_ci		local_bh_disable();
213662306a36Sopenharmony_ci		elapsed[i] = ENGINE_READ_FW(ce->engine, RING_TIMESTAMP);
213762306a36Sopenharmony_ci		i915_request_add(rq);
213862306a36Sopenharmony_ci		local_bh_enable();
213962306a36Sopenharmony_ci		preempt_enable();
214062306a36Sopenharmony_ci	}
214162306a36Sopenharmony_ci
214262306a36Sopenharmony_ci	err = intel_gt_wait_for_idle(ce->engine->gt, HZ / 2);
214362306a36Sopenharmony_ci	if (err)
214462306a36Sopenharmony_ci		goto err;
214562306a36Sopenharmony_ci
214662306a36Sopenharmony_ci	for (i = 0; i < ARRAY_SIZE(elapsed); i++)
214762306a36Sopenharmony_ci		elapsed[i] = sema[i] - elapsed[i];
214862306a36Sopenharmony_ci
214962306a36Sopenharmony_ci	cycles = trifilter(elapsed);
215062306a36Sopenharmony_ci	pr_info("%s: idle dispatch latency %d cycles, %lluns\n",
215162306a36Sopenharmony_ci		ce->engine->name, cycles >> TF_BIAS,
215262306a36Sopenharmony_ci		cycles_to_ns(ce->engine, cycles));
215362306a36Sopenharmony_ci
215462306a36Sopenharmony_ci	return intel_gt_wait_for_idle(ce->engine->gt, HZ);
215562306a36Sopenharmony_ci
215662306a36Sopenharmony_cierr:
215762306a36Sopenharmony_ci	intel_gt_set_wedged(ce->engine->gt);
215862306a36Sopenharmony_ci	return err;
215962306a36Sopenharmony_ci}
216062306a36Sopenharmony_ci
216162306a36Sopenharmony_cistatic int measure_busy_dispatch(struct intel_context *ce)
216262306a36Sopenharmony_ci{
216362306a36Sopenharmony_ci	u32 *sema = hwsp_scratch(ce);
216462306a36Sopenharmony_ci	const u32 offset = hwsp_offset(ce, sema);
216562306a36Sopenharmony_ci	u32 elapsed[TF_COUNT + 1], cycles;
216662306a36Sopenharmony_ci	u32 *cs;
216762306a36Sopenharmony_ci	int err;
216862306a36Sopenharmony_ci	int i;
216962306a36Sopenharmony_ci
217062306a36Sopenharmony_ci	/*
217162306a36Sopenharmony_ci	 * Measure how long it takes for us to submit a request while the
217262306a36Sopenharmony_ci	 * engine is busy, polling on a semaphore in our context. With
217362306a36Sopenharmony_ci	 * direct submission, this will include the cost of a lite restore.
217462306a36Sopenharmony_ci	 *
217562306a36Sopenharmony_ci	 *    A: read CS_TIMESTAMP from CPU
217662306a36Sopenharmony_ci	 *    submit request
217762306a36Sopenharmony_ci	 *    B: read CS_TIMESTAMP on GPU
217862306a36Sopenharmony_ci	 *
217962306a36Sopenharmony_ci	 * Submission latency: B - A
218062306a36Sopenharmony_ci	 */
218162306a36Sopenharmony_ci
218262306a36Sopenharmony_ci	for (i = 1; i <= ARRAY_SIZE(elapsed); i++) {
218362306a36Sopenharmony_ci		struct i915_request *rq;
218462306a36Sopenharmony_ci
218562306a36Sopenharmony_ci		rq = i915_request_create(ce);
218662306a36Sopenharmony_ci		if (IS_ERR(rq)) {
218762306a36Sopenharmony_ci			err = PTR_ERR(rq);
218862306a36Sopenharmony_ci			goto err;
218962306a36Sopenharmony_ci		}
219062306a36Sopenharmony_ci
219162306a36Sopenharmony_ci		cs = intel_ring_begin(rq, 12);
219262306a36Sopenharmony_ci		if (IS_ERR(cs)) {
219362306a36Sopenharmony_ci			i915_request_add(rq);
219462306a36Sopenharmony_ci			err = PTR_ERR(cs);
219562306a36Sopenharmony_ci			goto err;
219662306a36Sopenharmony_ci		}
219762306a36Sopenharmony_ci
219862306a36Sopenharmony_ci		cs = emit_store_dw(cs, offset + i * sizeof(u32), -1);
219962306a36Sopenharmony_ci		cs = emit_semaphore_poll_until(cs, offset, i);
220062306a36Sopenharmony_ci		cs = emit_timestamp_store(cs, ce, offset + i * sizeof(u32));
220162306a36Sopenharmony_ci
220262306a36Sopenharmony_ci		intel_ring_advance(rq, cs);
220362306a36Sopenharmony_ci
220462306a36Sopenharmony_ci		if (i > 1 && wait_for(READ_ONCE(sema[i - 1]), 500)) {
220562306a36Sopenharmony_ci			err = -EIO;
220662306a36Sopenharmony_ci			goto err;
220762306a36Sopenharmony_ci		}
220862306a36Sopenharmony_ci
220962306a36Sopenharmony_ci		preempt_disable();
221062306a36Sopenharmony_ci		local_bh_disable();
221162306a36Sopenharmony_ci		elapsed[i - 1] = ENGINE_READ_FW(ce->engine, RING_TIMESTAMP);
221262306a36Sopenharmony_ci		i915_request_add(rq);
221362306a36Sopenharmony_ci		local_bh_enable();
221462306a36Sopenharmony_ci		semaphore_set(sema, i - 1);
221562306a36Sopenharmony_ci		preempt_enable();
221662306a36Sopenharmony_ci	}
221762306a36Sopenharmony_ci
221862306a36Sopenharmony_ci	wait_for(READ_ONCE(sema[i - 1]), 500);
221962306a36Sopenharmony_ci	semaphore_set(sema, i - 1);
222062306a36Sopenharmony_ci
222162306a36Sopenharmony_ci	for (i = 1; i <= TF_COUNT; i++) {
222262306a36Sopenharmony_ci		GEM_BUG_ON(sema[i] == -1);
222362306a36Sopenharmony_ci		elapsed[i - 1] = sema[i] - elapsed[i];
222462306a36Sopenharmony_ci	}
222562306a36Sopenharmony_ci
222662306a36Sopenharmony_ci	cycles = trifilter(elapsed);
222762306a36Sopenharmony_ci	pr_info("%s: busy dispatch latency %d cycles, %lluns\n",
222862306a36Sopenharmony_ci		ce->engine->name, cycles >> TF_BIAS,
222962306a36Sopenharmony_ci		cycles_to_ns(ce->engine, cycles));
223062306a36Sopenharmony_ci
223162306a36Sopenharmony_ci	return intel_gt_wait_for_idle(ce->engine->gt, HZ);
223262306a36Sopenharmony_ci
223362306a36Sopenharmony_cierr:
223462306a36Sopenharmony_ci	intel_gt_set_wedged(ce->engine->gt);
223562306a36Sopenharmony_ci	return err;
223662306a36Sopenharmony_ci}
223762306a36Sopenharmony_ci
223862306a36Sopenharmony_cistatic int plug(struct intel_engine_cs *engine, u32 *sema, u32 mode, int value)
223962306a36Sopenharmony_ci{
224062306a36Sopenharmony_ci	const u32 offset =
224162306a36Sopenharmony_ci		i915_ggtt_offset(engine->status_page.vma) +
224262306a36Sopenharmony_ci		offset_in_page(sema);
224362306a36Sopenharmony_ci	struct i915_request *rq;
224462306a36Sopenharmony_ci	u32 *cs;
224562306a36Sopenharmony_ci
224662306a36Sopenharmony_ci	rq = i915_request_create(engine->kernel_context);
224762306a36Sopenharmony_ci	if (IS_ERR(rq))
224862306a36Sopenharmony_ci		return PTR_ERR(rq);
224962306a36Sopenharmony_ci
225062306a36Sopenharmony_ci	cs = intel_ring_begin(rq, 4);
225162306a36Sopenharmony_ci	if (IS_ERR(cs)) {
225262306a36Sopenharmony_ci		i915_request_add(rq);
225362306a36Sopenharmony_ci		return PTR_ERR(cs);
225462306a36Sopenharmony_ci	}
225562306a36Sopenharmony_ci
225662306a36Sopenharmony_ci	cs = emit_semaphore_poll(cs, mode, value, offset);
225762306a36Sopenharmony_ci
225862306a36Sopenharmony_ci	intel_ring_advance(rq, cs);
225962306a36Sopenharmony_ci	i915_request_add(rq);
226062306a36Sopenharmony_ci
226162306a36Sopenharmony_ci	return 0;
226262306a36Sopenharmony_ci}
226362306a36Sopenharmony_ci
226462306a36Sopenharmony_cistatic int measure_inter_request(struct intel_context *ce)
226562306a36Sopenharmony_ci{
226662306a36Sopenharmony_ci	u32 *sema = hwsp_scratch(ce);
226762306a36Sopenharmony_ci	const u32 offset = hwsp_offset(ce, sema);
226862306a36Sopenharmony_ci	u32 elapsed[TF_COUNT + 1], cycles;
226962306a36Sopenharmony_ci	struct i915_sw_fence *submit;
227062306a36Sopenharmony_ci	int i, err;
227162306a36Sopenharmony_ci
227262306a36Sopenharmony_ci	/*
227362306a36Sopenharmony_ci	 * Measure how long it takes to advance from one request into the
227462306a36Sopenharmony_ci	 * next. Between each request we flush the GPU caches to memory,
227562306a36Sopenharmony_ci	 * update the breadcrumbs, and then invalidate those caches.
227662306a36Sopenharmony_ci	 * We queue up all the requests to be submitted in one batch so
227762306a36Sopenharmony_ci	 * it should be one set of contiguous measurements.
227862306a36Sopenharmony_ci	 *
227962306a36Sopenharmony_ci	 *    A: read CS_TIMESTAMP on GPU
228062306a36Sopenharmony_ci	 *    advance request
228162306a36Sopenharmony_ci	 *    B: read CS_TIMESTAMP on GPU
228262306a36Sopenharmony_ci	 *
228362306a36Sopenharmony_ci	 * Request latency: B - A
228462306a36Sopenharmony_ci	 */
228562306a36Sopenharmony_ci
228662306a36Sopenharmony_ci	err = plug(ce->engine, sema, MI_SEMAPHORE_SAD_NEQ_SDD, 0);
228762306a36Sopenharmony_ci	if (err)
228862306a36Sopenharmony_ci		return err;
228962306a36Sopenharmony_ci
229062306a36Sopenharmony_ci	submit = heap_fence_create(GFP_KERNEL);
229162306a36Sopenharmony_ci	if (!submit) {
229262306a36Sopenharmony_ci		semaphore_set(sema, 1);
229362306a36Sopenharmony_ci		return -ENOMEM;
229462306a36Sopenharmony_ci	}
229562306a36Sopenharmony_ci
229662306a36Sopenharmony_ci	intel_engine_flush_submission(ce->engine);
229762306a36Sopenharmony_ci	for (i = 1; i <= ARRAY_SIZE(elapsed); i++) {
229862306a36Sopenharmony_ci		struct i915_request *rq;
229962306a36Sopenharmony_ci		u32 *cs;
230062306a36Sopenharmony_ci
230162306a36Sopenharmony_ci		rq = i915_request_create(ce);
230262306a36Sopenharmony_ci		if (IS_ERR(rq)) {
230362306a36Sopenharmony_ci			err = PTR_ERR(rq);
230462306a36Sopenharmony_ci			goto err_submit;
230562306a36Sopenharmony_ci		}
230662306a36Sopenharmony_ci
230762306a36Sopenharmony_ci		err = i915_sw_fence_await_sw_fence_gfp(&rq->submit,
230862306a36Sopenharmony_ci						       submit,
230962306a36Sopenharmony_ci						       GFP_KERNEL);
231062306a36Sopenharmony_ci		if (err < 0) {
231162306a36Sopenharmony_ci			i915_request_add(rq);
231262306a36Sopenharmony_ci			goto err_submit;
231362306a36Sopenharmony_ci		}
231462306a36Sopenharmony_ci
231562306a36Sopenharmony_ci		cs = intel_ring_begin(rq, 4);
231662306a36Sopenharmony_ci		if (IS_ERR(cs)) {
231762306a36Sopenharmony_ci			i915_request_add(rq);
231862306a36Sopenharmony_ci			err = PTR_ERR(cs);
231962306a36Sopenharmony_ci			goto err_submit;
232062306a36Sopenharmony_ci		}
232162306a36Sopenharmony_ci
232262306a36Sopenharmony_ci		cs = emit_timestamp_store(cs, ce, offset + i * sizeof(u32));
232362306a36Sopenharmony_ci
232462306a36Sopenharmony_ci		intel_ring_advance(rq, cs);
232562306a36Sopenharmony_ci		i915_request_add(rq);
232662306a36Sopenharmony_ci	}
232762306a36Sopenharmony_ci	i915_sw_fence_commit(submit);
232862306a36Sopenharmony_ci	intel_engine_flush_submission(ce->engine);
232962306a36Sopenharmony_ci	heap_fence_put(submit);
233062306a36Sopenharmony_ci
233162306a36Sopenharmony_ci	semaphore_set(sema, 1);
233262306a36Sopenharmony_ci	err = intel_gt_wait_for_idle(ce->engine->gt, HZ / 2);
233362306a36Sopenharmony_ci	if (err)
233462306a36Sopenharmony_ci		goto err;
233562306a36Sopenharmony_ci
233662306a36Sopenharmony_ci	for (i = 1; i <= TF_COUNT; i++)
233762306a36Sopenharmony_ci		elapsed[i - 1] = sema[i + 1] - sema[i];
233862306a36Sopenharmony_ci
233962306a36Sopenharmony_ci	cycles = trifilter(elapsed);
234062306a36Sopenharmony_ci	pr_info("%s: inter-request latency %d cycles, %lluns\n",
234162306a36Sopenharmony_ci		ce->engine->name, cycles >> TF_BIAS,
234262306a36Sopenharmony_ci		cycles_to_ns(ce->engine, cycles));
234362306a36Sopenharmony_ci
234462306a36Sopenharmony_ci	return intel_gt_wait_for_idle(ce->engine->gt, HZ);
234562306a36Sopenharmony_ci
234662306a36Sopenharmony_cierr_submit:
234762306a36Sopenharmony_ci	i915_sw_fence_commit(submit);
234862306a36Sopenharmony_ci	heap_fence_put(submit);
234962306a36Sopenharmony_ci	semaphore_set(sema, 1);
235062306a36Sopenharmony_cierr:
235162306a36Sopenharmony_ci	intel_gt_set_wedged(ce->engine->gt);
235262306a36Sopenharmony_ci	return err;
235362306a36Sopenharmony_ci}
235462306a36Sopenharmony_ci
235562306a36Sopenharmony_cistatic int measure_context_switch(struct intel_context *ce)
235662306a36Sopenharmony_ci{
235762306a36Sopenharmony_ci	u32 *sema = hwsp_scratch(ce);
235862306a36Sopenharmony_ci	const u32 offset = hwsp_offset(ce, sema);
235962306a36Sopenharmony_ci	struct i915_request *fence = NULL;
236062306a36Sopenharmony_ci	u32 elapsed[TF_COUNT + 1], cycles;
236162306a36Sopenharmony_ci	int i, j, err;
236262306a36Sopenharmony_ci	u32 *cs;
236362306a36Sopenharmony_ci
236462306a36Sopenharmony_ci	/*
236562306a36Sopenharmony_ci	 * Measure how long it takes to advance from one request in one
236662306a36Sopenharmony_ci	 * context to a request in another context. This allows us to
236762306a36Sopenharmony_ci	 * measure how long the context save/restore take, along with all
236862306a36Sopenharmony_ci	 * the inter-context setup we require.
236962306a36Sopenharmony_ci	 *
237062306a36Sopenharmony_ci	 *    A: read CS_TIMESTAMP on GPU
237162306a36Sopenharmony_ci	 *    switch context
237262306a36Sopenharmony_ci	 *    B: read CS_TIMESTAMP on GPU
237362306a36Sopenharmony_ci	 *
237462306a36Sopenharmony_ci	 * Context switch latency: B - A
237562306a36Sopenharmony_ci	 */
237662306a36Sopenharmony_ci
237762306a36Sopenharmony_ci	err = plug(ce->engine, sema, MI_SEMAPHORE_SAD_NEQ_SDD, 0);
237862306a36Sopenharmony_ci	if (err)
237962306a36Sopenharmony_ci		return err;
238062306a36Sopenharmony_ci
238162306a36Sopenharmony_ci	for (i = 1; i <= ARRAY_SIZE(elapsed); i++) {
238262306a36Sopenharmony_ci		struct intel_context *arr[] = {
238362306a36Sopenharmony_ci			ce, ce->engine->kernel_context
238462306a36Sopenharmony_ci		};
238562306a36Sopenharmony_ci		u32 addr = offset + ARRAY_SIZE(arr) * i * sizeof(u32);
238662306a36Sopenharmony_ci
238762306a36Sopenharmony_ci		for (j = 0; j < ARRAY_SIZE(arr); j++) {
238862306a36Sopenharmony_ci			struct i915_request *rq;
238962306a36Sopenharmony_ci
239062306a36Sopenharmony_ci			rq = i915_request_create(arr[j]);
239162306a36Sopenharmony_ci			if (IS_ERR(rq)) {
239262306a36Sopenharmony_ci				err = PTR_ERR(rq);
239362306a36Sopenharmony_ci				goto err_fence;
239462306a36Sopenharmony_ci			}
239562306a36Sopenharmony_ci
239662306a36Sopenharmony_ci			if (fence) {
239762306a36Sopenharmony_ci				err = i915_request_await_dma_fence(rq,
239862306a36Sopenharmony_ci								   &fence->fence);
239962306a36Sopenharmony_ci				if (err) {
240062306a36Sopenharmony_ci					i915_request_add(rq);
240162306a36Sopenharmony_ci					goto err_fence;
240262306a36Sopenharmony_ci				}
240362306a36Sopenharmony_ci			}
240462306a36Sopenharmony_ci
240562306a36Sopenharmony_ci			cs = intel_ring_begin(rq, 4);
240662306a36Sopenharmony_ci			if (IS_ERR(cs)) {
240762306a36Sopenharmony_ci				i915_request_add(rq);
240862306a36Sopenharmony_ci				err = PTR_ERR(cs);
240962306a36Sopenharmony_ci				goto err_fence;
241062306a36Sopenharmony_ci			}
241162306a36Sopenharmony_ci
241262306a36Sopenharmony_ci			cs = emit_timestamp_store(cs, ce, addr);
241362306a36Sopenharmony_ci			addr += sizeof(u32);
241462306a36Sopenharmony_ci
241562306a36Sopenharmony_ci			intel_ring_advance(rq, cs);
241662306a36Sopenharmony_ci
241762306a36Sopenharmony_ci			i915_request_put(fence);
241862306a36Sopenharmony_ci			fence = i915_request_get(rq);
241962306a36Sopenharmony_ci
242062306a36Sopenharmony_ci			i915_request_add(rq);
242162306a36Sopenharmony_ci		}
242262306a36Sopenharmony_ci	}
242362306a36Sopenharmony_ci	i915_request_put(fence);
242462306a36Sopenharmony_ci	intel_engine_flush_submission(ce->engine);
242562306a36Sopenharmony_ci
242662306a36Sopenharmony_ci	semaphore_set(sema, 1);
242762306a36Sopenharmony_ci	err = intel_gt_wait_for_idle(ce->engine->gt, HZ / 2);
242862306a36Sopenharmony_ci	if (err)
242962306a36Sopenharmony_ci		goto err;
243062306a36Sopenharmony_ci
243162306a36Sopenharmony_ci	for (i = 1; i <= TF_COUNT; i++)
243262306a36Sopenharmony_ci		elapsed[i - 1] = sema[2 * i + 2] - sema[2 * i + 1];
243362306a36Sopenharmony_ci
243462306a36Sopenharmony_ci	cycles = trifilter(elapsed);
243562306a36Sopenharmony_ci	pr_info("%s: context switch latency %d cycles, %lluns\n",
243662306a36Sopenharmony_ci		ce->engine->name, cycles >> TF_BIAS,
243762306a36Sopenharmony_ci		cycles_to_ns(ce->engine, cycles));
243862306a36Sopenharmony_ci
243962306a36Sopenharmony_ci	return intel_gt_wait_for_idle(ce->engine->gt, HZ);
244062306a36Sopenharmony_ci
244162306a36Sopenharmony_cierr_fence:
244262306a36Sopenharmony_ci	i915_request_put(fence);
244362306a36Sopenharmony_ci	semaphore_set(sema, 1);
244462306a36Sopenharmony_cierr:
244562306a36Sopenharmony_ci	intel_gt_set_wedged(ce->engine->gt);
244662306a36Sopenharmony_ci	return err;
244762306a36Sopenharmony_ci}
244862306a36Sopenharmony_ci
244962306a36Sopenharmony_cistatic int measure_preemption(struct intel_context *ce)
245062306a36Sopenharmony_ci{
245162306a36Sopenharmony_ci	u32 *sema = hwsp_scratch(ce);
245262306a36Sopenharmony_ci	const u32 offset = hwsp_offset(ce, sema);
245362306a36Sopenharmony_ci	u32 elapsed[TF_COUNT], cycles;
245462306a36Sopenharmony_ci	u32 *cs;
245562306a36Sopenharmony_ci	int err;
245662306a36Sopenharmony_ci	int i;
245762306a36Sopenharmony_ci
245862306a36Sopenharmony_ci	/*
245962306a36Sopenharmony_ci	 * We measure two latencies while triggering preemption. The first
246062306a36Sopenharmony_ci	 * latency is how long it takes for us to submit a preempting request.
246162306a36Sopenharmony_ci	 * The second latency is how it takes for us to return from the
246262306a36Sopenharmony_ci	 * preemption back to the original context.
246362306a36Sopenharmony_ci	 *
246462306a36Sopenharmony_ci	 *    A: read CS_TIMESTAMP from CPU
246562306a36Sopenharmony_ci	 *    submit preemption
246662306a36Sopenharmony_ci	 *    B: read CS_TIMESTAMP on GPU (in preempting context)
246762306a36Sopenharmony_ci	 *    context switch
246862306a36Sopenharmony_ci	 *    C: read CS_TIMESTAMP on GPU (in original context)
246962306a36Sopenharmony_ci	 *
247062306a36Sopenharmony_ci	 * Preemption dispatch latency: B - A
247162306a36Sopenharmony_ci	 * Preemption switch latency: C - B
247262306a36Sopenharmony_ci	 */
247362306a36Sopenharmony_ci
247462306a36Sopenharmony_ci	if (!intel_engine_has_preemption(ce->engine))
247562306a36Sopenharmony_ci		return 0;
247662306a36Sopenharmony_ci
247762306a36Sopenharmony_ci	for (i = 1; i <= ARRAY_SIZE(elapsed); i++) {
247862306a36Sopenharmony_ci		u32 addr = offset + 2 * i * sizeof(u32);
247962306a36Sopenharmony_ci		struct i915_request *rq;
248062306a36Sopenharmony_ci
248162306a36Sopenharmony_ci		rq = i915_request_create(ce);
248262306a36Sopenharmony_ci		if (IS_ERR(rq)) {
248362306a36Sopenharmony_ci			err = PTR_ERR(rq);
248462306a36Sopenharmony_ci			goto err;
248562306a36Sopenharmony_ci		}
248662306a36Sopenharmony_ci
248762306a36Sopenharmony_ci		cs = intel_ring_begin(rq, 12);
248862306a36Sopenharmony_ci		if (IS_ERR(cs)) {
248962306a36Sopenharmony_ci			i915_request_add(rq);
249062306a36Sopenharmony_ci			err = PTR_ERR(cs);
249162306a36Sopenharmony_ci			goto err;
249262306a36Sopenharmony_ci		}
249362306a36Sopenharmony_ci
249462306a36Sopenharmony_ci		cs = emit_store_dw(cs, addr, -1);
249562306a36Sopenharmony_ci		cs = emit_semaphore_poll_until(cs, offset, i);
249662306a36Sopenharmony_ci		cs = emit_timestamp_store(cs, ce, addr + sizeof(u32));
249762306a36Sopenharmony_ci
249862306a36Sopenharmony_ci		intel_ring_advance(rq, cs);
249962306a36Sopenharmony_ci		i915_request_add(rq);
250062306a36Sopenharmony_ci
250162306a36Sopenharmony_ci		if (wait_for(READ_ONCE(sema[2 * i]) == -1, 500)) {
250262306a36Sopenharmony_ci			err = -EIO;
250362306a36Sopenharmony_ci			goto err;
250462306a36Sopenharmony_ci		}
250562306a36Sopenharmony_ci
250662306a36Sopenharmony_ci		rq = i915_request_create(ce->engine->kernel_context);
250762306a36Sopenharmony_ci		if (IS_ERR(rq)) {
250862306a36Sopenharmony_ci			err = PTR_ERR(rq);
250962306a36Sopenharmony_ci			goto err;
251062306a36Sopenharmony_ci		}
251162306a36Sopenharmony_ci
251262306a36Sopenharmony_ci		cs = intel_ring_begin(rq, 8);
251362306a36Sopenharmony_ci		if (IS_ERR(cs)) {
251462306a36Sopenharmony_ci			i915_request_add(rq);
251562306a36Sopenharmony_ci			err = PTR_ERR(cs);
251662306a36Sopenharmony_ci			goto err;
251762306a36Sopenharmony_ci		}
251862306a36Sopenharmony_ci
251962306a36Sopenharmony_ci		cs = emit_timestamp_store(cs, ce, addr);
252062306a36Sopenharmony_ci		cs = emit_store_dw(cs, offset, i);
252162306a36Sopenharmony_ci
252262306a36Sopenharmony_ci		intel_ring_advance(rq, cs);
252362306a36Sopenharmony_ci		rq->sched.attr.priority = I915_PRIORITY_BARRIER;
252462306a36Sopenharmony_ci
252562306a36Sopenharmony_ci		elapsed[i - 1] = ENGINE_READ_FW(ce->engine, RING_TIMESTAMP);
252662306a36Sopenharmony_ci		i915_request_add(rq);
252762306a36Sopenharmony_ci	}
252862306a36Sopenharmony_ci
252962306a36Sopenharmony_ci	if (wait_for(READ_ONCE(sema[2 * i - 2]) != -1, 500)) {
253062306a36Sopenharmony_ci		err = -EIO;
253162306a36Sopenharmony_ci		goto err;
253262306a36Sopenharmony_ci	}
253362306a36Sopenharmony_ci
253462306a36Sopenharmony_ci	for (i = 1; i <= TF_COUNT; i++)
253562306a36Sopenharmony_ci		elapsed[i - 1] = sema[2 * i + 0] - elapsed[i - 1];
253662306a36Sopenharmony_ci
253762306a36Sopenharmony_ci	cycles = trifilter(elapsed);
253862306a36Sopenharmony_ci	pr_info("%s: preemption dispatch latency %d cycles, %lluns\n",
253962306a36Sopenharmony_ci		ce->engine->name, cycles >> TF_BIAS,
254062306a36Sopenharmony_ci		cycles_to_ns(ce->engine, cycles));
254162306a36Sopenharmony_ci
254262306a36Sopenharmony_ci	for (i = 1; i <= TF_COUNT; i++)
254362306a36Sopenharmony_ci		elapsed[i - 1] = sema[2 * i + 1] - sema[2 * i + 0];
254462306a36Sopenharmony_ci
254562306a36Sopenharmony_ci	cycles = trifilter(elapsed);
254662306a36Sopenharmony_ci	pr_info("%s: preemption switch latency %d cycles, %lluns\n",
254762306a36Sopenharmony_ci		ce->engine->name, cycles >> TF_BIAS,
254862306a36Sopenharmony_ci		cycles_to_ns(ce->engine, cycles));
254962306a36Sopenharmony_ci
255062306a36Sopenharmony_ci	return intel_gt_wait_for_idle(ce->engine->gt, HZ);
255162306a36Sopenharmony_ci
255262306a36Sopenharmony_cierr:
255362306a36Sopenharmony_ci	intel_gt_set_wedged(ce->engine->gt);
255462306a36Sopenharmony_ci	return err;
255562306a36Sopenharmony_ci}
255662306a36Sopenharmony_ci
255762306a36Sopenharmony_cistruct signal_cb {
255862306a36Sopenharmony_ci	struct dma_fence_cb base;
255962306a36Sopenharmony_ci	bool seen;
256062306a36Sopenharmony_ci};
256162306a36Sopenharmony_ci
256262306a36Sopenharmony_cistatic void signal_cb(struct dma_fence *fence, struct dma_fence_cb *cb)
256362306a36Sopenharmony_ci{
256462306a36Sopenharmony_ci	struct signal_cb *s = container_of(cb, typeof(*s), base);
256562306a36Sopenharmony_ci
256662306a36Sopenharmony_ci	smp_store_mb(s->seen, true); /* be safe, be strong */
256762306a36Sopenharmony_ci}
256862306a36Sopenharmony_ci
256962306a36Sopenharmony_cistatic int measure_completion(struct intel_context *ce)
257062306a36Sopenharmony_ci{
257162306a36Sopenharmony_ci	u32 *sema = hwsp_scratch(ce);
257262306a36Sopenharmony_ci	const u32 offset = hwsp_offset(ce, sema);
257362306a36Sopenharmony_ci	u32 elapsed[TF_COUNT], cycles;
257462306a36Sopenharmony_ci	u32 *cs;
257562306a36Sopenharmony_ci	int err;
257662306a36Sopenharmony_ci	int i;
257762306a36Sopenharmony_ci
257862306a36Sopenharmony_ci	/*
257962306a36Sopenharmony_ci	 * Measure how long it takes for the signal (interrupt) to be
258062306a36Sopenharmony_ci	 * sent from the GPU to be processed by the CPU.
258162306a36Sopenharmony_ci	 *
258262306a36Sopenharmony_ci	 *    A: read CS_TIMESTAMP on GPU
258362306a36Sopenharmony_ci	 *    signal
258462306a36Sopenharmony_ci	 *    B: read CS_TIMESTAMP from CPU
258562306a36Sopenharmony_ci	 *
258662306a36Sopenharmony_ci	 * Completion latency: B - A
258762306a36Sopenharmony_ci	 */
258862306a36Sopenharmony_ci
258962306a36Sopenharmony_ci	for (i = 1; i <= ARRAY_SIZE(elapsed); i++) {
259062306a36Sopenharmony_ci		struct signal_cb cb = { .seen = false };
259162306a36Sopenharmony_ci		struct i915_request *rq;
259262306a36Sopenharmony_ci
259362306a36Sopenharmony_ci		rq = i915_request_create(ce);
259462306a36Sopenharmony_ci		if (IS_ERR(rq)) {
259562306a36Sopenharmony_ci			err = PTR_ERR(rq);
259662306a36Sopenharmony_ci			goto err;
259762306a36Sopenharmony_ci		}
259862306a36Sopenharmony_ci
259962306a36Sopenharmony_ci		cs = intel_ring_begin(rq, 12);
260062306a36Sopenharmony_ci		if (IS_ERR(cs)) {
260162306a36Sopenharmony_ci			i915_request_add(rq);
260262306a36Sopenharmony_ci			err = PTR_ERR(cs);
260362306a36Sopenharmony_ci			goto err;
260462306a36Sopenharmony_ci		}
260562306a36Sopenharmony_ci
260662306a36Sopenharmony_ci		cs = emit_store_dw(cs, offset + i * sizeof(u32), -1);
260762306a36Sopenharmony_ci		cs = emit_semaphore_poll_until(cs, offset, i);
260862306a36Sopenharmony_ci		cs = emit_timestamp_store(cs, ce, offset + i * sizeof(u32));
260962306a36Sopenharmony_ci
261062306a36Sopenharmony_ci		intel_ring_advance(rq, cs);
261162306a36Sopenharmony_ci
261262306a36Sopenharmony_ci		dma_fence_add_callback(&rq->fence, &cb.base, signal_cb);
261362306a36Sopenharmony_ci		i915_request_add(rq);
261462306a36Sopenharmony_ci
261562306a36Sopenharmony_ci		intel_engine_flush_submission(ce->engine);
261662306a36Sopenharmony_ci		if (wait_for(READ_ONCE(sema[i]) == -1, 50)) {
261762306a36Sopenharmony_ci			err = -EIO;
261862306a36Sopenharmony_ci			goto err;
261962306a36Sopenharmony_ci		}
262062306a36Sopenharmony_ci
262162306a36Sopenharmony_ci		preempt_disable();
262262306a36Sopenharmony_ci		semaphore_set(sema, i);
262362306a36Sopenharmony_ci		while (!READ_ONCE(cb.seen))
262462306a36Sopenharmony_ci			cpu_relax();
262562306a36Sopenharmony_ci
262662306a36Sopenharmony_ci		elapsed[i - 1] = ENGINE_READ_FW(ce->engine, RING_TIMESTAMP);
262762306a36Sopenharmony_ci		preempt_enable();
262862306a36Sopenharmony_ci	}
262962306a36Sopenharmony_ci
263062306a36Sopenharmony_ci	err = intel_gt_wait_for_idle(ce->engine->gt, HZ / 2);
263162306a36Sopenharmony_ci	if (err)
263262306a36Sopenharmony_ci		goto err;
263362306a36Sopenharmony_ci
263462306a36Sopenharmony_ci	for (i = 0; i < ARRAY_SIZE(elapsed); i++) {
263562306a36Sopenharmony_ci		GEM_BUG_ON(sema[i + 1] == -1);
263662306a36Sopenharmony_ci		elapsed[i] = elapsed[i] - sema[i + 1];
263762306a36Sopenharmony_ci	}
263862306a36Sopenharmony_ci
263962306a36Sopenharmony_ci	cycles = trifilter(elapsed);
264062306a36Sopenharmony_ci	pr_info("%s: completion latency %d cycles, %lluns\n",
264162306a36Sopenharmony_ci		ce->engine->name, cycles >> TF_BIAS,
264262306a36Sopenharmony_ci		cycles_to_ns(ce->engine, cycles));
264362306a36Sopenharmony_ci
264462306a36Sopenharmony_ci	return intel_gt_wait_for_idle(ce->engine->gt, HZ);
264562306a36Sopenharmony_ci
264662306a36Sopenharmony_cierr:
264762306a36Sopenharmony_ci	intel_gt_set_wedged(ce->engine->gt);
264862306a36Sopenharmony_ci	return err;
264962306a36Sopenharmony_ci}
265062306a36Sopenharmony_ci
265162306a36Sopenharmony_cistatic void rps_pin(struct intel_gt *gt)
265262306a36Sopenharmony_ci{
265362306a36Sopenharmony_ci	/* Pin the frequency to max */
265462306a36Sopenharmony_ci	atomic_inc(&gt->rps.num_waiters);
265562306a36Sopenharmony_ci	intel_uncore_forcewake_get(gt->uncore, FORCEWAKE_ALL);
265662306a36Sopenharmony_ci
265762306a36Sopenharmony_ci	mutex_lock(&gt->rps.lock);
265862306a36Sopenharmony_ci	intel_rps_set(&gt->rps, gt->rps.max_freq);
265962306a36Sopenharmony_ci	mutex_unlock(&gt->rps.lock);
266062306a36Sopenharmony_ci}
266162306a36Sopenharmony_ci
266262306a36Sopenharmony_cistatic void rps_unpin(struct intel_gt *gt)
266362306a36Sopenharmony_ci{
266462306a36Sopenharmony_ci	intel_uncore_forcewake_put(gt->uncore, FORCEWAKE_ALL);
266562306a36Sopenharmony_ci	atomic_dec(&gt->rps.num_waiters);
266662306a36Sopenharmony_ci}
266762306a36Sopenharmony_ci
266862306a36Sopenharmony_cistatic int perf_request_latency(void *arg)
266962306a36Sopenharmony_ci{
267062306a36Sopenharmony_ci	struct drm_i915_private *i915 = arg;
267162306a36Sopenharmony_ci	struct intel_engine_cs *engine;
267262306a36Sopenharmony_ci	struct pm_qos_request qos;
267362306a36Sopenharmony_ci	int err = 0;
267462306a36Sopenharmony_ci
267562306a36Sopenharmony_ci	if (GRAPHICS_VER(i915) < 8) /* per-engine CS timestamp, semaphores */
267662306a36Sopenharmony_ci		return 0;
267762306a36Sopenharmony_ci
267862306a36Sopenharmony_ci	cpu_latency_qos_add_request(&qos, 0); /* disable cstates */
267962306a36Sopenharmony_ci
268062306a36Sopenharmony_ci	for_each_uabi_engine(engine, i915) {
268162306a36Sopenharmony_ci		struct intel_context *ce;
268262306a36Sopenharmony_ci
268362306a36Sopenharmony_ci		ce = intel_context_create(engine);
268462306a36Sopenharmony_ci		if (IS_ERR(ce)) {
268562306a36Sopenharmony_ci			err = PTR_ERR(ce);
268662306a36Sopenharmony_ci			goto out;
268762306a36Sopenharmony_ci		}
268862306a36Sopenharmony_ci
268962306a36Sopenharmony_ci		err = intel_context_pin(ce);
269062306a36Sopenharmony_ci		if (err) {
269162306a36Sopenharmony_ci			intel_context_put(ce);
269262306a36Sopenharmony_ci			goto out;
269362306a36Sopenharmony_ci		}
269462306a36Sopenharmony_ci
269562306a36Sopenharmony_ci		st_engine_heartbeat_disable(engine);
269662306a36Sopenharmony_ci		rps_pin(engine->gt);
269762306a36Sopenharmony_ci
269862306a36Sopenharmony_ci		if (err == 0)
269962306a36Sopenharmony_ci			err = measure_semaphore_response(ce);
270062306a36Sopenharmony_ci		if (err == 0)
270162306a36Sopenharmony_ci			err = measure_idle_dispatch(ce);
270262306a36Sopenharmony_ci		if (err == 0)
270362306a36Sopenharmony_ci			err = measure_busy_dispatch(ce);
270462306a36Sopenharmony_ci		if (err == 0)
270562306a36Sopenharmony_ci			err = measure_inter_request(ce);
270662306a36Sopenharmony_ci		if (err == 0)
270762306a36Sopenharmony_ci			err = measure_context_switch(ce);
270862306a36Sopenharmony_ci		if (err == 0)
270962306a36Sopenharmony_ci			err = measure_preemption(ce);
271062306a36Sopenharmony_ci		if (err == 0)
271162306a36Sopenharmony_ci			err = measure_completion(ce);
271262306a36Sopenharmony_ci
271362306a36Sopenharmony_ci		rps_unpin(engine->gt);
271462306a36Sopenharmony_ci		st_engine_heartbeat_enable(engine);
271562306a36Sopenharmony_ci
271662306a36Sopenharmony_ci		intel_context_unpin(ce);
271762306a36Sopenharmony_ci		intel_context_put(ce);
271862306a36Sopenharmony_ci		if (err)
271962306a36Sopenharmony_ci			goto out;
272062306a36Sopenharmony_ci	}
272162306a36Sopenharmony_ci
272262306a36Sopenharmony_ciout:
272362306a36Sopenharmony_ci	if (igt_flush_test(i915))
272462306a36Sopenharmony_ci		err = -EIO;
272562306a36Sopenharmony_ci
272662306a36Sopenharmony_ci	cpu_latency_qos_remove_request(&qos);
272762306a36Sopenharmony_ci	return err;
272862306a36Sopenharmony_ci}
272962306a36Sopenharmony_ci
273062306a36Sopenharmony_cistatic int s_sync0(void *arg)
273162306a36Sopenharmony_ci{
273262306a36Sopenharmony_ci	struct perf_series *ps = arg;
273362306a36Sopenharmony_ci	IGT_TIMEOUT(end_time);
273462306a36Sopenharmony_ci	unsigned int idx = 0;
273562306a36Sopenharmony_ci	int err = 0;
273662306a36Sopenharmony_ci
273762306a36Sopenharmony_ci	GEM_BUG_ON(!ps->nengines);
273862306a36Sopenharmony_ci	do {
273962306a36Sopenharmony_ci		struct i915_request *rq;
274062306a36Sopenharmony_ci
274162306a36Sopenharmony_ci		rq = i915_request_create(ps->ce[idx]);
274262306a36Sopenharmony_ci		if (IS_ERR(rq)) {
274362306a36Sopenharmony_ci			err = PTR_ERR(rq);
274462306a36Sopenharmony_ci			break;
274562306a36Sopenharmony_ci		}
274662306a36Sopenharmony_ci
274762306a36Sopenharmony_ci		i915_request_get(rq);
274862306a36Sopenharmony_ci		i915_request_add(rq);
274962306a36Sopenharmony_ci
275062306a36Sopenharmony_ci		if (i915_request_wait(rq, 0, HZ / 5) < 0)
275162306a36Sopenharmony_ci			err = -ETIME;
275262306a36Sopenharmony_ci		i915_request_put(rq);
275362306a36Sopenharmony_ci		if (err)
275462306a36Sopenharmony_ci			break;
275562306a36Sopenharmony_ci
275662306a36Sopenharmony_ci		if (++idx == ps->nengines)
275762306a36Sopenharmony_ci			idx = 0;
275862306a36Sopenharmony_ci	} while (!__igt_timeout(end_time, NULL));
275962306a36Sopenharmony_ci
276062306a36Sopenharmony_ci	return err;
276162306a36Sopenharmony_ci}
276262306a36Sopenharmony_ci
276362306a36Sopenharmony_cistatic int s_sync1(void *arg)
276462306a36Sopenharmony_ci{
276562306a36Sopenharmony_ci	struct perf_series *ps = arg;
276662306a36Sopenharmony_ci	struct i915_request *prev = NULL;
276762306a36Sopenharmony_ci	IGT_TIMEOUT(end_time);
276862306a36Sopenharmony_ci	unsigned int idx = 0;
276962306a36Sopenharmony_ci	int err = 0;
277062306a36Sopenharmony_ci
277162306a36Sopenharmony_ci	GEM_BUG_ON(!ps->nengines);
277262306a36Sopenharmony_ci	do {
277362306a36Sopenharmony_ci		struct i915_request *rq;
277462306a36Sopenharmony_ci
277562306a36Sopenharmony_ci		rq = i915_request_create(ps->ce[idx]);
277662306a36Sopenharmony_ci		if (IS_ERR(rq)) {
277762306a36Sopenharmony_ci			err = PTR_ERR(rq);
277862306a36Sopenharmony_ci			break;
277962306a36Sopenharmony_ci		}
278062306a36Sopenharmony_ci
278162306a36Sopenharmony_ci		i915_request_get(rq);
278262306a36Sopenharmony_ci		i915_request_add(rq);
278362306a36Sopenharmony_ci
278462306a36Sopenharmony_ci		if (prev && i915_request_wait(prev, 0, HZ / 5) < 0)
278562306a36Sopenharmony_ci			err = -ETIME;
278662306a36Sopenharmony_ci		i915_request_put(prev);
278762306a36Sopenharmony_ci		prev = rq;
278862306a36Sopenharmony_ci		if (err)
278962306a36Sopenharmony_ci			break;
279062306a36Sopenharmony_ci
279162306a36Sopenharmony_ci		if (++idx == ps->nengines)
279262306a36Sopenharmony_ci			idx = 0;
279362306a36Sopenharmony_ci	} while (!__igt_timeout(end_time, NULL));
279462306a36Sopenharmony_ci	i915_request_put(prev);
279562306a36Sopenharmony_ci
279662306a36Sopenharmony_ci	return err;
279762306a36Sopenharmony_ci}
279862306a36Sopenharmony_ci
279962306a36Sopenharmony_cistatic int s_many(void *arg)
280062306a36Sopenharmony_ci{
280162306a36Sopenharmony_ci	struct perf_series *ps = arg;
280262306a36Sopenharmony_ci	IGT_TIMEOUT(end_time);
280362306a36Sopenharmony_ci	unsigned int idx = 0;
280462306a36Sopenharmony_ci
280562306a36Sopenharmony_ci	GEM_BUG_ON(!ps->nengines);
280662306a36Sopenharmony_ci	do {
280762306a36Sopenharmony_ci		struct i915_request *rq;
280862306a36Sopenharmony_ci
280962306a36Sopenharmony_ci		rq = i915_request_create(ps->ce[idx]);
281062306a36Sopenharmony_ci		if (IS_ERR(rq))
281162306a36Sopenharmony_ci			return PTR_ERR(rq);
281262306a36Sopenharmony_ci
281362306a36Sopenharmony_ci		i915_request_add(rq);
281462306a36Sopenharmony_ci
281562306a36Sopenharmony_ci		if (++idx == ps->nengines)
281662306a36Sopenharmony_ci			idx = 0;
281762306a36Sopenharmony_ci	} while (!__igt_timeout(end_time, NULL));
281862306a36Sopenharmony_ci
281962306a36Sopenharmony_ci	return 0;
282062306a36Sopenharmony_ci}
282162306a36Sopenharmony_ci
282262306a36Sopenharmony_cistatic int perf_series_engines(void *arg)
282362306a36Sopenharmony_ci{
282462306a36Sopenharmony_ci	struct drm_i915_private *i915 = arg;
282562306a36Sopenharmony_ci	static int (* const func[])(void *arg) = {
282662306a36Sopenharmony_ci		s_sync0,
282762306a36Sopenharmony_ci		s_sync1,
282862306a36Sopenharmony_ci		s_many,
282962306a36Sopenharmony_ci		NULL,
283062306a36Sopenharmony_ci	};
283162306a36Sopenharmony_ci	const unsigned int nengines = num_uabi_engines(i915);
283262306a36Sopenharmony_ci	struct intel_engine_cs *engine;
283362306a36Sopenharmony_ci	int (* const *fn)(void *arg);
283462306a36Sopenharmony_ci	struct pm_qos_request qos;
283562306a36Sopenharmony_ci	struct perf_stats *stats;
283662306a36Sopenharmony_ci	struct perf_series *ps;
283762306a36Sopenharmony_ci	unsigned int idx;
283862306a36Sopenharmony_ci	int err = 0;
283962306a36Sopenharmony_ci
284062306a36Sopenharmony_ci	stats = kcalloc(nengines, sizeof(*stats), GFP_KERNEL);
284162306a36Sopenharmony_ci	if (!stats)
284262306a36Sopenharmony_ci		return -ENOMEM;
284362306a36Sopenharmony_ci
284462306a36Sopenharmony_ci	ps = kzalloc(struct_size(ps, ce, nengines), GFP_KERNEL);
284562306a36Sopenharmony_ci	if (!ps) {
284662306a36Sopenharmony_ci		kfree(stats);
284762306a36Sopenharmony_ci		return -ENOMEM;
284862306a36Sopenharmony_ci	}
284962306a36Sopenharmony_ci
285062306a36Sopenharmony_ci	cpu_latency_qos_add_request(&qos, 0); /* disable cstates */
285162306a36Sopenharmony_ci
285262306a36Sopenharmony_ci	ps->i915 = i915;
285362306a36Sopenharmony_ci	ps->nengines = nengines;
285462306a36Sopenharmony_ci
285562306a36Sopenharmony_ci	idx = 0;
285662306a36Sopenharmony_ci	for_each_uabi_engine(engine, i915) {
285762306a36Sopenharmony_ci		struct intel_context *ce;
285862306a36Sopenharmony_ci
285962306a36Sopenharmony_ci		ce = intel_context_create(engine);
286062306a36Sopenharmony_ci		if (IS_ERR(ce)) {
286162306a36Sopenharmony_ci			err = PTR_ERR(ce);
286262306a36Sopenharmony_ci			goto out;
286362306a36Sopenharmony_ci		}
286462306a36Sopenharmony_ci
286562306a36Sopenharmony_ci		err = intel_context_pin(ce);
286662306a36Sopenharmony_ci		if (err) {
286762306a36Sopenharmony_ci			intel_context_put(ce);
286862306a36Sopenharmony_ci			goto out;
286962306a36Sopenharmony_ci		}
287062306a36Sopenharmony_ci
287162306a36Sopenharmony_ci		ps->ce[idx++] = ce;
287262306a36Sopenharmony_ci	}
287362306a36Sopenharmony_ci	GEM_BUG_ON(idx != ps->nengines);
287462306a36Sopenharmony_ci
287562306a36Sopenharmony_ci	for (fn = func; *fn && !err; fn++) {
287662306a36Sopenharmony_ci		char name[KSYM_NAME_LEN];
287762306a36Sopenharmony_ci		struct igt_live_test t;
287862306a36Sopenharmony_ci
287962306a36Sopenharmony_ci		snprintf(name, sizeof(name), "%ps", *fn);
288062306a36Sopenharmony_ci		err = igt_live_test_begin(&t, i915, __func__, name);
288162306a36Sopenharmony_ci		if (err)
288262306a36Sopenharmony_ci			break;
288362306a36Sopenharmony_ci
288462306a36Sopenharmony_ci		for (idx = 0; idx < nengines; idx++) {
288562306a36Sopenharmony_ci			struct perf_stats *p =
288662306a36Sopenharmony_ci				memset(&stats[idx], 0, sizeof(stats[idx]));
288762306a36Sopenharmony_ci			struct intel_context *ce = ps->ce[idx];
288862306a36Sopenharmony_ci
288962306a36Sopenharmony_ci			p->engine = ps->ce[idx]->engine;
289062306a36Sopenharmony_ci			intel_engine_pm_get(p->engine);
289162306a36Sopenharmony_ci
289262306a36Sopenharmony_ci			if (intel_engine_supports_stats(p->engine))
289362306a36Sopenharmony_ci				p->busy = intel_engine_get_busy_time(p->engine,
289462306a36Sopenharmony_ci								     &p->time) + 1;
289562306a36Sopenharmony_ci			else
289662306a36Sopenharmony_ci				p->time = ktime_get();
289762306a36Sopenharmony_ci			p->runtime = -intel_context_get_total_runtime_ns(ce);
289862306a36Sopenharmony_ci		}
289962306a36Sopenharmony_ci
290062306a36Sopenharmony_ci		err = (*fn)(ps);
290162306a36Sopenharmony_ci		if (igt_live_test_end(&t))
290262306a36Sopenharmony_ci			err = -EIO;
290362306a36Sopenharmony_ci
290462306a36Sopenharmony_ci		for (idx = 0; idx < nengines; idx++) {
290562306a36Sopenharmony_ci			struct perf_stats *p = &stats[idx];
290662306a36Sopenharmony_ci			struct intel_context *ce = ps->ce[idx];
290762306a36Sopenharmony_ci			int integer, decimal;
290862306a36Sopenharmony_ci			u64 busy, dt, now;
290962306a36Sopenharmony_ci
291062306a36Sopenharmony_ci			if (p->busy)
291162306a36Sopenharmony_ci				p->busy = ktime_sub(intel_engine_get_busy_time(p->engine,
291262306a36Sopenharmony_ci									       &now),
291362306a36Sopenharmony_ci						    p->busy - 1);
291462306a36Sopenharmony_ci			else
291562306a36Sopenharmony_ci				now = ktime_get();
291662306a36Sopenharmony_ci			p->time = ktime_sub(now, p->time);
291762306a36Sopenharmony_ci
291862306a36Sopenharmony_ci			err = switch_to_kernel_sync(ce, err);
291962306a36Sopenharmony_ci			p->runtime += intel_context_get_total_runtime_ns(ce);
292062306a36Sopenharmony_ci			intel_engine_pm_put(p->engine);
292162306a36Sopenharmony_ci
292262306a36Sopenharmony_ci			busy = 100 * ktime_to_ns(p->busy);
292362306a36Sopenharmony_ci			dt = ktime_to_ns(p->time);
292462306a36Sopenharmony_ci			if (dt) {
292562306a36Sopenharmony_ci				integer = div64_u64(busy, dt);
292662306a36Sopenharmony_ci				busy -= integer * dt;
292762306a36Sopenharmony_ci				decimal = div64_u64(100 * busy, dt);
292862306a36Sopenharmony_ci			} else {
292962306a36Sopenharmony_ci				integer = 0;
293062306a36Sopenharmony_ci				decimal = 0;
293162306a36Sopenharmony_ci			}
293262306a36Sopenharmony_ci
293362306a36Sopenharmony_ci			pr_info("%s %5s: { seqno:%d, busy:%d.%02d%%, runtime:%lldms, walltime:%lldms }\n",
293462306a36Sopenharmony_ci				name, p->engine->name, ce->timeline->seqno,
293562306a36Sopenharmony_ci				integer, decimal,
293662306a36Sopenharmony_ci				div_u64(p->runtime, 1000 * 1000),
293762306a36Sopenharmony_ci				div_u64(ktime_to_ns(p->time), 1000 * 1000));
293862306a36Sopenharmony_ci		}
293962306a36Sopenharmony_ci	}
294062306a36Sopenharmony_ci
294162306a36Sopenharmony_ciout:
294262306a36Sopenharmony_ci	for (idx = 0; idx < nengines; idx++) {
294362306a36Sopenharmony_ci		if (IS_ERR_OR_NULL(ps->ce[idx]))
294462306a36Sopenharmony_ci			break;
294562306a36Sopenharmony_ci
294662306a36Sopenharmony_ci		intel_context_unpin(ps->ce[idx]);
294762306a36Sopenharmony_ci		intel_context_put(ps->ce[idx]);
294862306a36Sopenharmony_ci	}
294962306a36Sopenharmony_ci	kfree(ps);
295062306a36Sopenharmony_ci
295162306a36Sopenharmony_ci	cpu_latency_qos_remove_request(&qos);
295262306a36Sopenharmony_ci	kfree(stats);
295362306a36Sopenharmony_ci	return err;
295462306a36Sopenharmony_ci}
295562306a36Sopenharmony_ci
/*
 * Per-engine state for one worker spawned by perf_parallel_engines().
 *
 * @p:      statistics filled in by the p_*() work function; p.engine also
 *          tells the work function which engine to drive
 * @worker: kthread worker created for this engine
 * @work:   work item queued on @worker; the p_*() functions recover this
 *          structure from it via container_of()
 * @engine: engine assigned to this worker (set alongside p.engine)
 * @result: 0 or negative error code stored by the work function on exit
 */
struct p_thread {
	struct perf_stats p;
	struct kthread_worker *worker;
	struct kthread_work work;
	struct intel_engine_cs *engine;
	int result;
};
296362306a36Sopenharmony_ci
296462306a36Sopenharmony_cistatic void p_sync0(struct kthread_work *work)
296562306a36Sopenharmony_ci{
296662306a36Sopenharmony_ci	struct p_thread *thread = container_of(work, typeof(*thread), work);
296762306a36Sopenharmony_ci	struct perf_stats *p = &thread->p;
296862306a36Sopenharmony_ci	struct intel_engine_cs *engine = p->engine;
296962306a36Sopenharmony_ci	struct intel_context *ce;
297062306a36Sopenharmony_ci	IGT_TIMEOUT(end_time);
297162306a36Sopenharmony_ci	unsigned long count;
297262306a36Sopenharmony_ci	bool busy;
297362306a36Sopenharmony_ci	int err = 0;
297462306a36Sopenharmony_ci
297562306a36Sopenharmony_ci	ce = intel_context_create(engine);
297662306a36Sopenharmony_ci	if (IS_ERR(ce)) {
297762306a36Sopenharmony_ci		thread->result = PTR_ERR(ce);
297862306a36Sopenharmony_ci		return;
297962306a36Sopenharmony_ci	}
298062306a36Sopenharmony_ci
298162306a36Sopenharmony_ci	err = intel_context_pin(ce);
298262306a36Sopenharmony_ci	if (err) {
298362306a36Sopenharmony_ci		intel_context_put(ce);
298462306a36Sopenharmony_ci		thread->result = err;
298562306a36Sopenharmony_ci		return;
298662306a36Sopenharmony_ci	}
298762306a36Sopenharmony_ci
298862306a36Sopenharmony_ci	if (intel_engine_supports_stats(engine)) {
298962306a36Sopenharmony_ci		p->busy = intel_engine_get_busy_time(engine, &p->time);
299062306a36Sopenharmony_ci		busy = true;
299162306a36Sopenharmony_ci	} else {
299262306a36Sopenharmony_ci		p->time = ktime_get();
299362306a36Sopenharmony_ci		busy = false;
299462306a36Sopenharmony_ci	}
299562306a36Sopenharmony_ci
299662306a36Sopenharmony_ci	count = 0;
299762306a36Sopenharmony_ci	do {
299862306a36Sopenharmony_ci		struct i915_request *rq;
299962306a36Sopenharmony_ci
300062306a36Sopenharmony_ci		rq = i915_request_create(ce);
300162306a36Sopenharmony_ci		if (IS_ERR(rq)) {
300262306a36Sopenharmony_ci			err = PTR_ERR(rq);
300362306a36Sopenharmony_ci			break;
300462306a36Sopenharmony_ci		}
300562306a36Sopenharmony_ci
300662306a36Sopenharmony_ci		i915_request_get(rq);
300762306a36Sopenharmony_ci		i915_request_add(rq);
300862306a36Sopenharmony_ci
300962306a36Sopenharmony_ci		err = 0;
301062306a36Sopenharmony_ci		if (i915_request_wait(rq, 0, HZ) < 0)
301162306a36Sopenharmony_ci			err = -ETIME;
301262306a36Sopenharmony_ci		i915_request_put(rq);
301362306a36Sopenharmony_ci		if (err)
301462306a36Sopenharmony_ci			break;
301562306a36Sopenharmony_ci
301662306a36Sopenharmony_ci		count++;
301762306a36Sopenharmony_ci	} while (!__igt_timeout(end_time, NULL));
301862306a36Sopenharmony_ci
301962306a36Sopenharmony_ci	if (busy) {
302062306a36Sopenharmony_ci		ktime_t now;
302162306a36Sopenharmony_ci
302262306a36Sopenharmony_ci		p->busy = ktime_sub(intel_engine_get_busy_time(engine, &now),
302362306a36Sopenharmony_ci				    p->busy);
302462306a36Sopenharmony_ci		p->time = ktime_sub(now, p->time);
302562306a36Sopenharmony_ci	} else {
302662306a36Sopenharmony_ci		p->time = ktime_sub(ktime_get(), p->time);
302762306a36Sopenharmony_ci	}
302862306a36Sopenharmony_ci
302962306a36Sopenharmony_ci	err = switch_to_kernel_sync(ce, err);
303062306a36Sopenharmony_ci	p->runtime = intel_context_get_total_runtime_ns(ce);
303162306a36Sopenharmony_ci	p->count = count;
303262306a36Sopenharmony_ci
303362306a36Sopenharmony_ci	intel_context_unpin(ce);
303462306a36Sopenharmony_ci	intel_context_put(ce);
303562306a36Sopenharmony_ci	thread->result = err;
303662306a36Sopenharmony_ci}
303762306a36Sopenharmony_ci
303862306a36Sopenharmony_cistatic void p_sync1(struct kthread_work *work)
303962306a36Sopenharmony_ci{
304062306a36Sopenharmony_ci	struct p_thread *thread = container_of(work, typeof(*thread), work);
304162306a36Sopenharmony_ci	struct perf_stats *p = &thread->p;
304262306a36Sopenharmony_ci	struct intel_engine_cs *engine = p->engine;
304362306a36Sopenharmony_ci	struct i915_request *prev = NULL;
304462306a36Sopenharmony_ci	struct intel_context *ce;
304562306a36Sopenharmony_ci	IGT_TIMEOUT(end_time);
304662306a36Sopenharmony_ci	unsigned long count;
304762306a36Sopenharmony_ci	bool busy;
304862306a36Sopenharmony_ci	int err = 0;
304962306a36Sopenharmony_ci
305062306a36Sopenharmony_ci	ce = intel_context_create(engine);
305162306a36Sopenharmony_ci	if (IS_ERR(ce)) {
305262306a36Sopenharmony_ci		thread->result = PTR_ERR(ce);
305362306a36Sopenharmony_ci		return;
305462306a36Sopenharmony_ci	}
305562306a36Sopenharmony_ci
305662306a36Sopenharmony_ci	err = intel_context_pin(ce);
305762306a36Sopenharmony_ci	if (err) {
305862306a36Sopenharmony_ci		intel_context_put(ce);
305962306a36Sopenharmony_ci		thread->result = err;
306062306a36Sopenharmony_ci		return;
306162306a36Sopenharmony_ci	}
306262306a36Sopenharmony_ci
306362306a36Sopenharmony_ci	if (intel_engine_supports_stats(engine)) {
306462306a36Sopenharmony_ci		p->busy = intel_engine_get_busy_time(engine, &p->time);
306562306a36Sopenharmony_ci		busy = true;
306662306a36Sopenharmony_ci	} else {
306762306a36Sopenharmony_ci		p->time = ktime_get();
306862306a36Sopenharmony_ci		busy = false;
306962306a36Sopenharmony_ci	}
307062306a36Sopenharmony_ci
307162306a36Sopenharmony_ci	count = 0;
307262306a36Sopenharmony_ci	do {
307362306a36Sopenharmony_ci		struct i915_request *rq;
307462306a36Sopenharmony_ci
307562306a36Sopenharmony_ci		rq = i915_request_create(ce);
307662306a36Sopenharmony_ci		if (IS_ERR(rq)) {
307762306a36Sopenharmony_ci			err = PTR_ERR(rq);
307862306a36Sopenharmony_ci			break;
307962306a36Sopenharmony_ci		}
308062306a36Sopenharmony_ci
308162306a36Sopenharmony_ci		i915_request_get(rq);
308262306a36Sopenharmony_ci		i915_request_add(rq);
308362306a36Sopenharmony_ci
308462306a36Sopenharmony_ci		err = 0;
308562306a36Sopenharmony_ci		if (prev && i915_request_wait(prev, 0, HZ) < 0)
308662306a36Sopenharmony_ci			err = -ETIME;
308762306a36Sopenharmony_ci		i915_request_put(prev);
308862306a36Sopenharmony_ci		prev = rq;
308962306a36Sopenharmony_ci		if (err)
309062306a36Sopenharmony_ci			break;
309162306a36Sopenharmony_ci
309262306a36Sopenharmony_ci		count++;
309362306a36Sopenharmony_ci	} while (!__igt_timeout(end_time, NULL));
309462306a36Sopenharmony_ci	i915_request_put(prev);
309562306a36Sopenharmony_ci
309662306a36Sopenharmony_ci	if (busy) {
309762306a36Sopenharmony_ci		ktime_t now;
309862306a36Sopenharmony_ci
309962306a36Sopenharmony_ci		p->busy = ktime_sub(intel_engine_get_busy_time(engine, &now),
310062306a36Sopenharmony_ci				    p->busy);
310162306a36Sopenharmony_ci		p->time = ktime_sub(now, p->time);
310262306a36Sopenharmony_ci	} else {
310362306a36Sopenharmony_ci		p->time = ktime_sub(ktime_get(), p->time);
310462306a36Sopenharmony_ci	}
310562306a36Sopenharmony_ci
310662306a36Sopenharmony_ci	err = switch_to_kernel_sync(ce, err);
310762306a36Sopenharmony_ci	p->runtime = intel_context_get_total_runtime_ns(ce);
310862306a36Sopenharmony_ci	p->count = count;
310962306a36Sopenharmony_ci
311062306a36Sopenharmony_ci	intel_context_unpin(ce);
311162306a36Sopenharmony_ci	intel_context_put(ce);
311262306a36Sopenharmony_ci	thread->result = err;
311362306a36Sopenharmony_ci}
311462306a36Sopenharmony_ci
311562306a36Sopenharmony_cistatic void p_many(struct kthread_work *work)
311662306a36Sopenharmony_ci{
311762306a36Sopenharmony_ci	struct p_thread *thread = container_of(work, typeof(*thread), work);
311862306a36Sopenharmony_ci	struct perf_stats *p = &thread->p;
311962306a36Sopenharmony_ci	struct intel_engine_cs *engine = p->engine;
312062306a36Sopenharmony_ci	struct intel_context *ce;
312162306a36Sopenharmony_ci	IGT_TIMEOUT(end_time);
312262306a36Sopenharmony_ci	unsigned long count;
312362306a36Sopenharmony_ci	int err = 0;
312462306a36Sopenharmony_ci	bool busy;
312562306a36Sopenharmony_ci
312662306a36Sopenharmony_ci	ce = intel_context_create(engine);
312762306a36Sopenharmony_ci	if (IS_ERR(ce)) {
312862306a36Sopenharmony_ci		thread->result = PTR_ERR(ce);
312962306a36Sopenharmony_ci		return;
313062306a36Sopenharmony_ci	}
313162306a36Sopenharmony_ci
313262306a36Sopenharmony_ci	err = intel_context_pin(ce);
313362306a36Sopenharmony_ci	if (err) {
313462306a36Sopenharmony_ci		intel_context_put(ce);
313562306a36Sopenharmony_ci		thread->result = err;
313662306a36Sopenharmony_ci		return;
313762306a36Sopenharmony_ci	}
313862306a36Sopenharmony_ci
313962306a36Sopenharmony_ci	if (intel_engine_supports_stats(engine)) {
314062306a36Sopenharmony_ci		p->busy = intel_engine_get_busy_time(engine, &p->time);
314162306a36Sopenharmony_ci		busy = true;
314262306a36Sopenharmony_ci	} else {
314362306a36Sopenharmony_ci		p->time = ktime_get();
314462306a36Sopenharmony_ci		busy = false;
314562306a36Sopenharmony_ci	}
314662306a36Sopenharmony_ci
314762306a36Sopenharmony_ci	count = 0;
314862306a36Sopenharmony_ci	do {
314962306a36Sopenharmony_ci		struct i915_request *rq;
315062306a36Sopenharmony_ci
315162306a36Sopenharmony_ci		rq = i915_request_create(ce);
315262306a36Sopenharmony_ci		if (IS_ERR(rq)) {
315362306a36Sopenharmony_ci			err = PTR_ERR(rq);
315462306a36Sopenharmony_ci			break;
315562306a36Sopenharmony_ci		}
315662306a36Sopenharmony_ci
315762306a36Sopenharmony_ci		i915_request_add(rq);
315862306a36Sopenharmony_ci		count++;
315962306a36Sopenharmony_ci	} while (!__igt_timeout(end_time, NULL));
316062306a36Sopenharmony_ci
316162306a36Sopenharmony_ci	if (busy) {
316262306a36Sopenharmony_ci		ktime_t now;
316362306a36Sopenharmony_ci
316462306a36Sopenharmony_ci		p->busy = ktime_sub(intel_engine_get_busy_time(engine, &now),
316562306a36Sopenharmony_ci				    p->busy);
316662306a36Sopenharmony_ci		p->time = ktime_sub(now, p->time);
316762306a36Sopenharmony_ci	} else {
316862306a36Sopenharmony_ci		p->time = ktime_sub(ktime_get(), p->time);
316962306a36Sopenharmony_ci	}
317062306a36Sopenharmony_ci
317162306a36Sopenharmony_ci	err = switch_to_kernel_sync(ce, err);
317262306a36Sopenharmony_ci	p->runtime = intel_context_get_total_runtime_ns(ce);
317362306a36Sopenharmony_ci	p->count = count;
317462306a36Sopenharmony_ci
317562306a36Sopenharmony_ci	intel_context_unpin(ce);
317662306a36Sopenharmony_ci	intel_context_put(ce);
317762306a36Sopenharmony_ci	thread->result = err;
317862306a36Sopenharmony_ci}
317962306a36Sopenharmony_ci
318062306a36Sopenharmony_cistatic int perf_parallel_engines(void *arg)
318162306a36Sopenharmony_ci{
318262306a36Sopenharmony_ci	struct drm_i915_private *i915 = arg;
318362306a36Sopenharmony_ci	static void (* const func[])(struct kthread_work *) = {
318462306a36Sopenharmony_ci		p_sync0,
318562306a36Sopenharmony_ci		p_sync1,
318662306a36Sopenharmony_ci		p_many,
318762306a36Sopenharmony_ci		NULL,
318862306a36Sopenharmony_ci	};
318962306a36Sopenharmony_ci	const unsigned int nengines = num_uabi_engines(i915);
319062306a36Sopenharmony_ci	void (* const *fn)(struct kthread_work *);
319162306a36Sopenharmony_ci	struct intel_engine_cs *engine;
319262306a36Sopenharmony_ci	struct pm_qos_request qos;
319362306a36Sopenharmony_ci	struct p_thread *engines;
319462306a36Sopenharmony_ci	int err = 0;
319562306a36Sopenharmony_ci
319662306a36Sopenharmony_ci	engines = kcalloc(nengines, sizeof(*engines), GFP_KERNEL);
319762306a36Sopenharmony_ci	if (!engines)
319862306a36Sopenharmony_ci		return -ENOMEM;
319962306a36Sopenharmony_ci
320062306a36Sopenharmony_ci	cpu_latency_qos_add_request(&qos, 0);
320162306a36Sopenharmony_ci
320262306a36Sopenharmony_ci	for (fn = func; *fn; fn++) {
320362306a36Sopenharmony_ci		char name[KSYM_NAME_LEN];
320462306a36Sopenharmony_ci		struct igt_live_test t;
320562306a36Sopenharmony_ci		unsigned int idx;
320662306a36Sopenharmony_ci
320762306a36Sopenharmony_ci		snprintf(name, sizeof(name), "%ps", *fn);
320862306a36Sopenharmony_ci		err = igt_live_test_begin(&t, i915, __func__, name);
320962306a36Sopenharmony_ci		if (err)
321062306a36Sopenharmony_ci			break;
321162306a36Sopenharmony_ci
321262306a36Sopenharmony_ci		atomic_set(&i915->selftest.counter, nengines);
321362306a36Sopenharmony_ci
321462306a36Sopenharmony_ci		idx = 0;
321562306a36Sopenharmony_ci		for_each_uabi_engine(engine, i915) {
321662306a36Sopenharmony_ci			struct kthread_worker *worker;
321762306a36Sopenharmony_ci
321862306a36Sopenharmony_ci			intel_engine_pm_get(engine);
321962306a36Sopenharmony_ci
322062306a36Sopenharmony_ci			memset(&engines[idx].p, 0, sizeof(engines[idx].p));
322162306a36Sopenharmony_ci
322262306a36Sopenharmony_ci			worker = kthread_create_worker(0, "igt:%s",
322362306a36Sopenharmony_ci						       engine->name);
322462306a36Sopenharmony_ci			if (IS_ERR(worker)) {
322562306a36Sopenharmony_ci				err = PTR_ERR(worker);
322662306a36Sopenharmony_ci				intel_engine_pm_put(engine);
322762306a36Sopenharmony_ci				break;
322862306a36Sopenharmony_ci			}
322962306a36Sopenharmony_ci			engines[idx].worker = worker;
323062306a36Sopenharmony_ci			engines[idx].result = 0;
323162306a36Sopenharmony_ci			engines[idx].p.engine = engine;
323262306a36Sopenharmony_ci			engines[idx].engine = engine;
323362306a36Sopenharmony_ci
323462306a36Sopenharmony_ci			kthread_init_work(&engines[idx].work, *fn);
323562306a36Sopenharmony_ci			kthread_queue_work(worker, &engines[idx].work);
323662306a36Sopenharmony_ci			idx++;
323762306a36Sopenharmony_ci		}
323862306a36Sopenharmony_ci
323962306a36Sopenharmony_ci		idx = 0;
324062306a36Sopenharmony_ci		for_each_uabi_engine(engine, i915) {
324162306a36Sopenharmony_ci			int status;
324262306a36Sopenharmony_ci
324362306a36Sopenharmony_ci			if (!engines[idx].worker)
324462306a36Sopenharmony_ci				break;
324562306a36Sopenharmony_ci
324662306a36Sopenharmony_ci			kthread_flush_work(&engines[idx].work);
324762306a36Sopenharmony_ci			status = READ_ONCE(engines[idx].result);
324862306a36Sopenharmony_ci			if (status && !err)
324962306a36Sopenharmony_ci				err = status;
325062306a36Sopenharmony_ci
325162306a36Sopenharmony_ci			intel_engine_pm_put(engine);
325262306a36Sopenharmony_ci
325362306a36Sopenharmony_ci			kthread_destroy_worker(engines[idx].worker);
325462306a36Sopenharmony_ci			idx++;
325562306a36Sopenharmony_ci		}
325662306a36Sopenharmony_ci
325762306a36Sopenharmony_ci		if (igt_live_test_end(&t))
325862306a36Sopenharmony_ci			err = -EIO;
325962306a36Sopenharmony_ci		if (err)
326062306a36Sopenharmony_ci			break;
326162306a36Sopenharmony_ci
326262306a36Sopenharmony_ci		idx = 0;
326362306a36Sopenharmony_ci		for_each_uabi_engine(engine, i915) {
326462306a36Sopenharmony_ci			struct perf_stats *p = &engines[idx].p;
326562306a36Sopenharmony_ci			u64 busy = 100 * ktime_to_ns(p->busy);
326662306a36Sopenharmony_ci			u64 dt = ktime_to_ns(p->time);
326762306a36Sopenharmony_ci			int integer, decimal;
326862306a36Sopenharmony_ci
326962306a36Sopenharmony_ci			if (dt) {
327062306a36Sopenharmony_ci				integer = div64_u64(busy, dt);
327162306a36Sopenharmony_ci				busy -= integer * dt;
327262306a36Sopenharmony_ci				decimal = div64_u64(100 * busy, dt);
327362306a36Sopenharmony_ci			} else {
327462306a36Sopenharmony_ci				integer = 0;
327562306a36Sopenharmony_ci				decimal = 0;
327662306a36Sopenharmony_ci			}
327762306a36Sopenharmony_ci
327862306a36Sopenharmony_ci			GEM_BUG_ON(engine != p->engine);
327962306a36Sopenharmony_ci			pr_info("%s %5s: { count:%lu, busy:%d.%02d%%, runtime:%lldms, walltime:%lldms }\n",
328062306a36Sopenharmony_ci				name, engine->name, p->count, integer, decimal,
328162306a36Sopenharmony_ci				div_u64(p->runtime, 1000 * 1000),
328262306a36Sopenharmony_ci				div_u64(ktime_to_ns(p->time), 1000 * 1000));
328362306a36Sopenharmony_ci			idx++;
328462306a36Sopenharmony_ci		}
328562306a36Sopenharmony_ci	}
328662306a36Sopenharmony_ci
328762306a36Sopenharmony_ci	cpu_latency_qos_remove_request(&qos);
328862306a36Sopenharmony_ci	kfree(engines);
328962306a36Sopenharmony_ci	return err;
329062306a36Sopenharmony_ci}
329162306a36Sopenharmony_ci
329262306a36Sopenharmony_ciint i915_request_perf_selftests(struct drm_i915_private *i915)
329362306a36Sopenharmony_ci{
329462306a36Sopenharmony_ci	static const struct i915_subtest tests[] = {
329562306a36Sopenharmony_ci		SUBTEST(perf_request_latency),
329662306a36Sopenharmony_ci		SUBTEST(perf_series_engines),
329762306a36Sopenharmony_ci		SUBTEST(perf_parallel_engines),
329862306a36Sopenharmony_ci	};
329962306a36Sopenharmony_ci
330062306a36Sopenharmony_ci	if (intel_gt_is_wedged(to_gt(i915)))
330162306a36Sopenharmony_ci		return 0;
330262306a36Sopenharmony_ci
330362306a36Sopenharmony_ci	return i915_subtests(tests, i915);
330462306a36Sopenharmony_ci}
3305