// SPDX-License-Identifier: MIT
/*
 * Copyright © 2017-2018 Intel Corporation
 */

#include <linux/prime_numbers.h>
#include <linux/string_helpers.h>

#include "intel_context.h"
#include "intel_engine_heartbeat.h"
#include "intel_engine_pm.h"
#include "intel_engine_regs.h"
#include "intel_gpu_commands.h"
#include "intel_gt.h"
#include "intel_gt_requests.h"
#include "intel_ring.h"
#include "selftest_engine_heartbeat.h"

#include "../selftests/i915_random.h"
#include "../i915_selftest.h"

#include "selftests/igt_flush_test.h"
#include "selftests/lib_sw_fence.h"
#include "selftests/mock_gem_device.h"
#include "selftests/mock_timeline.h"

/*
 * Return the page referenced by the head of the scatterlist of the object
 * backing the timeline's HWSP (tl->hwsp_ggtt->obj).
 *
 * The object's pages must already be pinned; this is asserted.
 */
static struct page *hwsp_page(struct intel_timeline *tl)
{
	struct drm_i915_gem_object *obj = tl->hwsp_ggtt->obj;

	GEM_BUG_ON(!i915_gem_object_has_pinned_pages(obj));
	return sg_page(obj->mm.pages->sgl);
}

/*
 * Compute an index identifying the seqno slot used by a timeline: the kernel
 * address of its HWSP page plus the in-page part of tl->hwsp_offset, in units
 * of TIMELINE_SEQNO_BYTES.
 *
 * The result is used as the radix-tree key for duplicate detection in
 * __mock_hwsp_timeline().
 */
static unsigned long hwsp_cacheline(struct intel_timeline *tl)
{
	unsigned long address = (unsigned long)page_address(hwsp_page(tl));

	return (address + offset_in_page(tl->hwsp_offset)) / TIMELINE_SEQNO_BYTES;
}

/*
 * Pin a timeline from selftest context.
 *
 * Locks the HWSP object under a ww acquire context and pins the timeline.
 * If either step reports -EDEADLK the context is backed off and the whole
 * sequence is retried.
 *
 * Returns 0 on success or a negative error code.
 */
static int selftest_tl_pin(struct intel_timeline *tl)
{
	struct i915_gem_ww_ctx ww;
	int err;

	i915_gem_ww_ctx_init(&ww, false);
retry:
	err = i915_gem_object_lock(tl->hwsp_ggtt->obj, &ww);
	if (!err)
		err = intel_timeline_pin(tl, &ww);

	if (err == -EDEADLK) {
		/* Only retry if the backoff itself succeeded */
		err = i915_gem_ww_ctx_backoff(&ww);
		if (!err)
			goto retry;
	}
	i915_gem_ww_ctx_fini(&ww);
	return err;
}

/* Only half of seqno's are usable, see __intel_timeline_get_seqno() */
#define CACHELINES_PER_PAGE (PAGE_SIZE / TIMELINE_SEQNO_BYTES / 2)

/*
 * Bookkeeping for the mock_hwsp_freelist() test.
 *
 * @gt:         GT on which the timelines are created
 * @cachelines: radix tree keyed by hwsp_cacheline(); an insert that fails
 *              with -EEXIST means two live timelines share a slot
 * @history:    array of @max slots holding the currently pinned timelines
 * @count:      running count of recorded timelines; (count % max) selects
 *              the history slot
 * @max:        number of entries in @history
 * @prng:       random state used for shuffling and for choosing how many
 *              timelines to release
 */
struct mock_hwsp_freelist {
	struct intel_gt *gt;
	struct radix_tree_root cachelines;
	struct intel_timeline **history;
	unsigned long count, max;
	struct rnd_state prng;
};

/* Flags for __mock_hwsp_timeline() */
enum {
	SHUFFLE = BIT(0), /* shuffle the history before releasing entries */
};

/*
 * Store @tl into history slot @idx and release whatever timeline previously
 * occupied that slot: drop it from the cacheline tree, unpin it and put the
 * reference. Passing a NULL @tl simply empties the slot.
 */
static void __mock_hwsp_record(struct mock_hwsp_freelist *state,
			       unsigned int idx,
			       struct intel_timeline *tl)
{
	/* After the exchange, tl refers to the *previous* occupant (if any) */
	tl = xchg(&state->history[idx], tl);
	if (tl) {
		radix_tree_delete(&state->cachelines, hwsp_cacheline(tl));
		intel_timeline_unpin(tl);
		intel_timeline_put(tl);
	}
}

/*
 * Allocate @count timelines, checking that each one is given a HWSP slot not
 * used by any timeline currently tracked in @state, then release a random
 * number of the tracked timelines.
 *
 * @flags: SHUFFLE to randomise the history order before releasing.
 *
 * Returns 0 on success, or a negative error code from timeline creation,
 * pinning, or the radix-tree insert (-EEXIST for a duplicate slot).
 */
static int __mock_hwsp_timeline(struct mock_hwsp_freelist *state,
				unsigned int count,
				unsigned int flags)
{
	struct intel_timeline *tl;
	unsigned int idx;

	while (count--) {
		unsigned long cacheline;
		int err;

		tl = intel_timeline_create(state->gt);
		if (IS_ERR(tl))
			return PTR_ERR(tl);

		err = selftest_tl_pin(tl);
		if (err) {
			intel_timeline_put(tl);
			return err;
		}

		cacheline = hwsp_cacheline(tl);
		err = radix_tree_insert(&state->cachelines, cacheline, tl);
		if (err) {
			if (err == -EEXIST) {
				pr_err("HWSP cacheline %lu already used; duplicate allocation!\n",
				       cacheline);
			}
			/* Not recorded in history, so release it here */
			intel_timeline_unpin(tl);
			intel_timeline_put(tl);
			return err;
		}

		/* Recording also releases any older timeline in that slot */
		idx = state->count++ % state->max;
		__mock_hwsp_record(state, idx, tl);
	}

	if (flags & SHUFFLE)
		i915_prandom_shuffle(state->history,
				     sizeof(*state->history),
				     min(state->count, state->max),
				     &state->prng);

	/* Release a random number of the most recently indexed slots */
	count = i915_prandom_u32_max_state(min(state->count, state->max),
					   &state->prng);
	while (count--) {
		idx = --state->count % state->max;
		__mock_hwsp_record(state, idx, NULL);
	}

	return 0;
}

/*
 * Mock selftest: repeatedly allocate and free batches of timelines on a mock
 * device and verify that no two live timelines are handed the same HWSP slot.
 *
 * Two phases are run, one releasing entries in recorded order ("linear") and
 * one with the history shuffled first ("shuffled"). Batch sizes are taken
 * from for_each_prime_number_from(na, 1, 2 * CACHELINES_PER_PAGE).
 *
 * Returns 0 on success or a negative error code.
 */
static int mock_hwsp_freelist(void *arg)
{
	struct mock_hwsp_freelist state;
	struct drm_i915_private *i915;
	const struct {
		const char *name;
		unsigned int flags;
	} phases[] = {
		{ "linear", 0 },
		{ "shuffled", SHUFFLE },
		{ },
	}, *p;
	unsigned int na;
	int err = 0;

	i915 = mock_gem_device();
	if (!i915)
		return -ENOMEM;

	INIT_RADIX_TREE(&state.cachelines, GFP_KERNEL);
	state.prng = I915_RND_STATE_INITIALIZER(i915_selftest.random_seed);

	state.gt = to_gt(i915);

	/*
	 * Create a bunch of timelines and check that their HWSP do not overlap.
	 * Free some, and try again.
	 */

	/* The history array is sized to occupy exactly one page of pointers */
	state.max = PAGE_SIZE / sizeof(*state.history);
	state.count = 0;
	state.history = kcalloc(state.max, sizeof(*state.history), GFP_KERNEL);
	if (!state.history) {
		err = -ENOMEM;
		goto err_put;
	}

	for (p = phases; p->name; p++) {
		pr_debug("%s(%s)\n", __func__, p->name);
		for_each_prime_number_from(na, 1, 2 * CACHELINES_PER_PAGE) {
			err = __mock_hwsp_timeline(&state, na, p->flags);
			if (err)
				goto out;
		}
	}

out:
	/* Release every timeline still held in the history */
	for (na = 0; na < state.max; na++)
		__mock_hwsp_record(&state, na, NULL);
	kfree(state.history);
err_put:
	mock_destroy_device(i915);
	return err;
}

/*
 * One step of the igt_sync() sequence.
 *
 * @name:     label printed on failure
 * @seqno:    seqno to query (and optionally record)
 * @expected: expected result of __intel_timeline_sync_is_later()
 * @set:      whether to record @seqno with __intel_timeline_sync_set()
 *            after the query
 */
struct __igt_sync {
	const char *name;
	u32 seqno;
	bool expected;
	bool set;
};

/*
 * Apply a single step @p to context id @ctx on timeline @tl.
 *
 * @name identifies the calling pass in the error message.
 *
 * Returns 0 on success, -EINVAL if the query result differs from
 * p->expected, or the error returned by __intel_timeline_sync_set().
 */
static int __igt_sync(struct intel_timeline *tl,
		      u64 ctx,
		      const struct __igt_sync *p,
		      const char *name)
{
	int ret;

	if (__intel_timeline_sync_is_later(tl, ctx, p->seqno) != p->expected) {
		pr_err("%s: %s(ctx=%llu, seqno=%u) expected passed %s but failed\n",
		       name, p->name, ctx, p->seqno, str_yes_no(p->expected));
		return -EINVAL;
	}

	if (p->set) {
		ret = __intel_timeline_sync_set(tl, ctx, p->seqno);
		if (ret)
			return ret;
	}

	return 0;
}

/*
 * Mock selftest: run a fixed sequence of sync query/set steps (including
 * values around INT_MAX and the UINT_MAX -> 0 wrap) against a mock timeline.
 *
 * Context ids are BIT_ULL(order) + offset for order 1..63 and offset in
 * {-1, 0, +1}; +1 is skipped for order 1, where 2 + 1 would equal the 4 - 1
 * generated by order 2.
 *
 * Pass "1" applies each step to every context id before moving to the next
 * step; pass "2" runs the whole step sequence for one context id before
 * moving to the next id. Each pass uses a freshly initialised timeline.
 *
 * Returns 0 on success or the first error from __igt_sync().
 */
static int igt_sync(void *arg)
{
	const struct __igt_sync pass[] = {
		{ "unset", 0, false, false },
		{ "new", 0, false, true },
		{ "0a", 0, true, true },
		{ "1a", 1, false, true },
		{ "1b", 1, true, true },
		{ "0b", 0, true, false },
		{ "2a", 2, false, true },
		{ "4", 4, false, true },
		{ "INT_MAX", INT_MAX, false, true },
		{ "INT_MAX-1", INT_MAX-1, true, false },
		{ "INT_MAX+1", (u32)INT_MAX+1, false, true },
		{ "INT_MAX", INT_MAX, true, false },
		{ "UINT_MAX", UINT_MAX, false, true },
		{ "wrap", 0, false, true },
		{ "unwrap", UINT_MAX, true, false },
		{},
	}, *p;
	struct intel_timeline tl;
	int order, offset;
	int ret = -ENODEV;

	mock_timeline_init(&tl, 0);
	for (p = pass; p->name; p++) {
		for (order = 1; order < 64; order++) {
			for (offset = -1; offset <= (order > 1); offset++) {
				u64 ctx = BIT_ULL(order) + offset;

				ret = __igt_sync(&tl, ctx, p, "1");
				if (ret)
					goto out;
			}
		}
	}
	mock_timeline_fini(&tl);

	mock_timeline_init(&tl, 0);
	for (order = 1; order < 64; order++) {
		for (offset = -1; offset <= (order > 1); offset++) {
			u64 ctx = BIT_ULL(order) + offset;

			for (p = pass; p->name; p++) {
				ret = __igt_sync(&tl, ctx, p, "2");
				if (ret)
					goto out;
			}
		}
	}

out:
	/* Reached with tl initialised on both the success and error paths */
	mock_timeline_fini(&tl);
	return ret;
}

/* Pick a pseudo-random value in [0, I915_NUM_ENGINES) from @rnd. */
static unsigned int random_engine(struct rnd_state *rnd)
{
	return i915_prandom_u32_max_state(I915_NUM_ENGINES, rnd);
}

/*
 * Mock selftest: time the timeline sync map (__intel_timeline_sync_set() and
 * __intel_timeline_sync_is_later()) under several access patterns and report
 * the per-operation cost via pr_info().
 *
 * Each timed loop runs for roughly HZ/10 jiffies. Lookups of ids that were
 * just inserted are also checked for correctness.
 *
 * Returns 0 on success or -EINVAL if such a lookup fails.
 */
static int bench_sync(void *arg)
{
	struct rnd_state prng;
	struct intel_timeline tl;
	unsigned long end_time, count;
	u64 prng32_1M;
	ktime_t kt;
	int order, last_order;

	mock_timeline_init(&tl, 0);

	/* Lookups from cache are very fast and so the random number generation
	 * and the loop itself becomes a significant factor in the per-iteration
	 * timings. We try to compensate the results by measuring the overhead
	 * of the prng and subtract it from the reported results.
	 */
	prandom_seed_state(&prng, i915_selftest.random_seed);
	count = 0;
	kt = ktime_get();
	end_time = jiffies + HZ/10;
	do {
		u32 x;

		/* Make sure the compiler doesn't optimise away the prng call */
		WRITE_ONCE(x, prandom_u32_state(&prng));

		count++;
	} while (!time_after(jiffies, end_time));
	kt = ktime_sub(ktime_get(), kt);
	pr_debug("%s: %lu random evaluations, %lluns/prng\n",
		 __func__, count, (long long)div64_ul(ktime_to_ns(kt), count));
	/* Cost of one 32-bit prng draw in ns, scaled by 2^20 (fixed point) */
	prng32_1M = div64_ul(ktime_to_ns(kt) << 20, count);

	/* Benchmark (only) setting random context ids */
	prandom_seed_state(&prng, i915_selftest.random_seed);
	count = 0;
	kt = ktime_get();
	end_time = jiffies + HZ/10;
	do {
		u64 id = i915_prandom_u64_state(&prng);

		__intel_timeline_sync_set(&tl, id, 0);
		count++;
	} while (!time_after(jiffies, end_time));
	kt = ktime_sub(ktime_get(), kt);
	/*
	 * Subtract the estimated prng overhead; the factor of 2 presumably
	 * accounts for a 64-bit id costing two 32-bit draws -- confirm
	 * against i915_prandom_u64_state().
	 */
	kt = ktime_sub_ns(kt, (count * prng32_1M * 2) >> 20);
	pr_info("%s: %lu random insertions, %lluns/insert\n",
		__func__, count, (long long)div64_ul(ktime_to_ns(kt), count));

	/* Benchmark looking up the exact same context ids as we just set */
	/* Reseeding replays the same id sequence; end_time is reused as a counter */
	prandom_seed_state(&prng, i915_selftest.random_seed);
	end_time = count;
	kt = ktime_get();
	while (end_time--) {
		u64 id = i915_prandom_u64_state(&prng);

		if (!__intel_timeline_sync_is_later(&tl, id, 0)) {
			mock_timeline_fini(&tl);
			pr_err("Lookup of %llu failed\n", id);
			return -EINVAL;
		}
	}
	kt = ktime_sub(ktime_get(), kt);
	kt = ktime_sub_ns(kt, (count * prng32_1M * 2) >> 20);
	pr_info("%s: %lu random lookups, %lluns/lookup\n",
		__func__, count, (long long)div64_ul(ktime_to_ns(kt), count));

	mock_timeline_fini(&tl);
	cond_resched();

	mock_timeline_init(&tl, 0);

	/* Benchmark setting the first N (in order) contexts */
	count = 0;
	kt = ktime_get();
	end_time = jiffies + HZ/10;
	do {
		__intel_timeline_sync_set(&tl, count++, 0);
	} while (!time_after(jiffies, end_time));
	kt = ktime_sub(ktime_get(), kt);
	pr_info("%s: %lu in-order insertions, %lluns/insert\n",
		__func__, count, (long long)div64_ul(ktime_to_ns(kt), count));

	/* Benchmark looking up the exact same context ids as we just set */
	/* Walks ids count-1 down to 0: end_time is read after the decrement */
	end_time = count;
	kt = ktime_get();
	while (end_time--) {
		if (!__intel_timeline_sync_is_later(&tl, end_time, 0)) {
			pr_err("Lookup of %lu failed\n", end_time);
			mock_timeline_fini(&tl);
			return -EINVAL;
		}
	}
	kt = ktime_sub(ktime_get(), kt);
	pr_info("%s: %lu in-order lookups, %lluns/lookup\n",
		__func__, count, (long long)div64_ul(ktime_to_ns(kt), count));

	mock_timeline_fini(&tl);
	cond_resched();

	mock_timeline_init(&tl, 0);

	/* Benchmark searching for a random context id and maybe changing it */
	prandom_seed_state(&prng, i915_selftest.random_seed);
	count = 0;
	kt = ktime_get();
	end_time = jiffies + HZ/10;
	do {
		u32 id = random_engine(&prng);
		u32 seqno = prandom_u32_state(&prng);

		if (!__intel_timeline_sync_is_later(&tl, id, seqno))
			__intel_timeline_sync_set(&tl, id, seqno);

		count++;
	} while (!time_after(jiffies, end_time));
	kt = ktime_sub(ktime_get(), kt);
	/* Two prng draws per iteration here (id and seqno) */
	kt = ktime_sub_ns(kt, (count * prng32_1M * 2) >> 20);
	pr_info("%s: %lu repeated insert/lookups, %lluns/op\n",
		__func__, count, (long long)div64_ul(ktime_to_ns(kt), count));
	mock_timeline_fini(&tl);
	cond_resched();

	/* Benchmark searching for a known context id and changing the seqno */
	/* order advances as a Fibonacci sequence: 1, 2, 3, 5, 8, 13, 21 */
	for (last_order = 1, order = 1; order < 32;
	     ({ int tmp = last_order; last_order = order; order += tmp; })) {
		unsigned int mask = BIT(order) - 1;

		mock_timeline_init(&tl, 0);

		count = 0;
		kt = ktime_get();
		end_time = jiffies + HZ/10;
		do {
			/* Without assuming too many details of the underlying
			 * implementation, try to identify its phase-changes
			 * (if any)!
			 */
			u64 id = (u64)(count & mask) << order;

			__intel_timeline_sync_is_later(&tl, id, 0);
			__intel_timeline_sync_set(&tl, id, 0);

			count++;
		} while (!time_after(jiffies, end_time));
		kt = ktime_sub(ktime_get(), kt);
		pr_info("%s: %lu cyclic/%d insert/lookups, %lluns/op\n",
			__func__, count, order,
			(long long)div64_ul(ktime_to_ns(kt), count));
		mock_timeline_fini(&tl);
		cond_resched();
	}

	return 0;
}

/*
 * Entry point for the timeline mock selftests: runs mock_hwsp_freelist,
 * igt_sync and bench_sync through i915_subtests() with a NULL argument.
 */
int intel_timeline_mock_selftests(void)
{
	static const struct i915_subtest tests[] = {
		SUBTEST(mock_hwsp_freelist),
		SUBTEST(igt_sync),
		SUBTEST(bench_sync),
	};

	return i915_subtests(tests, NULL);
}

/*
 * Emit a four-dword store-immediate command into @rq's ring that writes
 * @value to GGTT address @addr.
 *
 * The dword layout depends on the graphics version:
 *   ver >= 8: command, addr, 0, value (the zero dword is presumably the
 *             upper address bits -- confirm against the command reference)
 *   ver 4-7:  command, 0, addr, value
 *   older:    MI_STORE_DWORD_IMM | MI_MEM_VIRTUAL, addr, value, MI_NOOP
 *
 * Returns 0 on success or the error from intel_ring_begin().
 */
static int emit_ggtt_store_dw(struct i915_request *rq, u32 addr, u32 value)
{
	u32 *cs;

	cs = intel_ring_begin(rq, 4);
	if (IS_ERR(cs))
		return PTR_ERR(cs);

	if (GRAPHICS_VER(rq->i915) >= 8) {
		*cs++ = MI_STORE_DWORD_IMM_GEN4 | MI_USE_GGTT;
		*cs++ = addr;
		*cs++ = 0;
		*cs++ = value;
	} else if (GRAPHICS_VER(rq->i915) >= 4) {
		*cs++ = MI_STORE_DWORD_IMM_GEN4 | MI_USE_GGTT;
		*cs++ = 0;
		*cs++ = addr;
		*cs++ = value;
	} else {
		*cs++ = MI_STORE_DWORD_IMM | MI_MEM_VIRTUAL;
		*cs++ = addr;
		*cs++ = value;
		*cs++ = MI_NOOP; /* pad to the four dwords reserved above */
	}

	intel_ring_advance(rq, cs);

	return 0;
}

/*
 * Verify that @tl's HWSP slot currently holds tl->seqno, then submit a kernel
 * request on @engine that stores @value into that slot.
 *
 * The timeline is pinned only for the duration of this call; it is unpinned
 * again on every path on which the pin succeeded.
 *
 * Returns the submitted request with an extra reference held for the caller
 * (release with i915_request_put()), or an ERR_PTR on failure.
 */
static struct i915_request *
checked_tl_write(struct intel_timeline *tl, struct intel_engine_cs *engine, u32 value)
{
	struct i915_request *rq;
	int err;

	err = selftest_tl_pin(tl);
	if (err) {
		rq = ERR_PTR(err);
		goto out;
	}

	if (READ_ONCE(*tl->hwsp_seqno) != tl->seqno) {
		pr_err("Timeline created with incorrect breadcrumb, found %x, expected %x\n",
		       *tl->hwsp_seqno, tl->seqno);
		intel_timeline_unpin(tl);
		return ERR_PTR(-EINVAL);
	}

	rq = intel_engine_create_kernel_request(engine);
	if (IS_ERR(rq))
		goto out_unpin;

	/* Reference handed to the caller on success */
	i915_request_get(rq);

	err = emit_ggtt_store_dw(rq, tl->hwsp_offset, value);
	/* The request is added even when emission failed */
	i915_request_add(rq);
	if (err) {
		i915_request_put(rq);
		rq = ERR_PTR(err);
	}

out_unpin:
	intel_timeline_unpin(tl);
out:
	if (IS_ERR(rq))
		pr_err("Failed to write to timeline!\n");
	return rq;
}

/*
 * Live selftest: for each engine that can store a dword, create
 * NUM_TIMELINES timelines and write a unique value (the timeline's index in
 * the tracking array) into each HWSP slot. After flushing, check that every
 * slot still holds its own value.
 *
 * Engines are processed one at a time, holding an engine-pm reference across
 * all of that engine's writes.
 *
 * Returns 0 on success, -EIO if the flush fails, -EINVAL on a mismatch, or
 * another negative error code from allocation or submission.
 */
static int live_hwsp_engine(void *arg)
{
#define NUM_TIMELINES 4096
	struct intel_gt *gt = arg;
	struct intel_timeline **timelines;
	struct intel_engine_cs *engine;
	enum intel_engine_id id;
	unsigned long count, n;
	int err = 0;

	/*
	 * Create a bunch of timelines and check we can write
	 * independently to each of their breadcrumb slots.
	 */

	timelines = kvmalloc_array(NUM_TIMELINES * I915_NUM_ENGINES,
				   sizeof(*timelines),
				   GFP_KERNEL);
	if (!timelines)
		return -ENOMEM;

	count = 0;
	for_each_engine(engine, gt, id) {
		if (!intel_engine_can_store_dword(engine))
			continue;

		intel_engine_pm_get(engine);

		for (n = 0; n < NUM_TIMELINES; n++) {
			struct intel_timeline *tl;
			struct i915_request *rq;

			tl = intel_timeline_create(gt);
			if (IS_ERR(tl)) {
				err = PTR_ERR(tl);
				break;
			}

			/* The value written equals the index tl is stored at */
			rq = checked_tl_write(tl, engine, count);
			if (IS_ERR(rq)) {
				intel_timeline_put(tl);
				err = PTR_ERR(rq);
				break;
			}

			timelines[count++] = tl;
			i915_request_put(rq);
		}

		intel_engine_pm_put(engine);
		if (err)
			break;
	}

	if (igt_flush_test(gt->i915))
		err = -EIO;

	/* Verify (only while no error is pending) and release every timeline */
	for (n = 0; n < count; n++) {
		struct intel_timeline *tl = timelines[n];

		if (!err && READ_ONCE(*tl->hwsp_seqno) != n) {
			GEM_TRACE_ERR("Invalid seqno:%lu stored in timeline %llu @ %x, found 0x%x\n",
				      n, tl->fence_context, tl->hwsp_offset, *tl->hwsp_seqno);
			GEM_TRACE_DUMP();
			err = -EINVAL;
		}
		intel_timeline_put(tl);
	}

	kvfree(timelines);
	return err;
#undef NUM_TIMELINES
}

/*
 * Live selftest: like live_hwsp_engine(), but with the loops swapped so that
 * consecutive timelines are written by different engines. The engine-pm
 * reference is taken and dropped around each individual write.
 *
 * Returns 0 on success, -EIO if the flush fails, -EINVAL on a mismatch, or
 * another negative error code from allocation or submission.
 */
static int live_hwsp_alternate(void *arg)
{
#define NUM_TIMELINES 4096
	struct intel_gt *gt = arg;
	struct intel_timeline **timelines;
	struct intel_engine_cs *engine;
	enum intel_engine_id id;
	unsigned long count, n;
	int err = 0;

	/*
	 * Create a bunch of timelines and check we can write
	 * independently to each of their breadcrumb slots with adjacent
	 * engines.
	 */

	timelines = kvmalloc_array(NUM_TIMELINES * I915_NUM_ENGINES,
				   sizeof(*timelines),
				   GFP_KERNEL);
	if (!timelines)
		return -ENOMEM;

	count = 0;
	for (n = 0; n < NUM_TIMELINES; n++) {
		for_each_engine(engine, gt, id) {
			struct intel_timeline *tl;
			struct i915_request *rq;

			if (!intel_engine_can_store_dword(engine))
				continue;

			tl = intel_timeline_create(gt);
			if (IS_ERR(tl)) {
				err = PTR_ERR(tl);
				goto out;
			}

			intel_engine_pm_get(engine);
			/* The value written equals the index tl is stored at */
			rq = checked_tl_write(tl, engine, count);
			intel_engine_pm_put(engine);
			if (IS_ERR(rq)) {
				intel_timeline_put(tl);
				err = PTR_ERR(rq);
				goto out;
			}

			timelines[count++] = tl;
			i915_request_put(rq);
		}
	}

out:
	if (igt_flush_test(gt->i915))
		err = -EIO;

	/* Verify (only while no error is pending) and release every timeline */
	for (n = 0; n < count; n++) {
		struct intel_timeline *tl = timelines[n];

		if (!err && READ_ONCE(*tl->hwsp_seqno) != n) {
			GEM_TRACE_ERR("Invalid seqno:%lu stored in timeline %llu @ %x, found 0x%x\n",
				      n, tl->fence_context, tl->hwsp_offset, *tl->hwsp_seqno);
			GEM_TRACE_DUMP();
			err = -EINVAL;
		}
		intel_timeline_put(tl);
	}

	kvfree(timelines);
	return err;
#undef NUM_TIMELINES
}

/*
 * Live selftest: on each engine that can store a dword, take two consecutive
 * seqnos from one timeline positioned just below the u32 wrap point, write
 * each seqno to the HWSP location current at the time it was obtained, and
 * check that both locations end up holding their respective values.
 */
static int live_hwsp_wrap(void *arg)
{
	struct intel_gt *gt = arg;
	struct intel_engine_cs *engine;
	struct intel_timeline *tl;
	enum intel_engine_id id;
	int err = 0;

	/*
	 * Across a seqno wrap, we need to keep the old cacheline alive for
	 * foreign GPU references.
	 */

	tl = intel_timeline_create(gt);
	if (IS_ERR(tl))
		return PTR_ERR(tl);

	/* Nothing is tested for timelines without an initial breadcrumb */
	if (!tl->has_initial_breadcrumb)
		goto out_free;

	err = selftest_tl_pin(tl);
	if (err)
		goto out_free;

	for_each_engine(engine, gt, id) {
		const u32 *hwsp_seqno[2];
		struct i915_request *rq;
		u32 seqno[2];

		if (!intel_engine_can_store_dword(engine))
			continue;

		rq = intel_engine_create_kernel_request(engine);
		if (IS_ERR(rq)) {
			err = PTR_ERR(rq);
			goto out;
		}

		/*
		 * Start a few values short of the u32 wrap so that the second
		 * seqno taken below is expected to wrap (asserted further on).
		 */
		tl->seqno = -4u;

		mutex_lock_nested(&tl->mutex, SINGLE_DEPTH_NESTING);
		err = intel_timeline_get_seqno(tl, rq, &seqno[0]);
		mutex_unlock(&tl->mutex);
		if (err) {
			i915_request_add(rq);
			goto out;
		}
		pr_debug("seqno[0]:%08x, hwsp_offset:%08x\n",
			 seqno[0], tl->hwsp_offset);

		err = emit_ggtt_store_dw(rq, tl->hwsp_offset, seqno[0]);
		if (err) {
			i915_request_add(rq);
			goto out;
		}
		/* Remember where the pre-wrap seqno lives */
		hwsp_seqno[0] = tl->hwsp_seqno;

		mutex_lock_nested(&tl->mutex, SINGLE_DEPTH_NESTING);
		err = intel_timeline_get_seqno(tl, rq, &seqno[1]);
		mutex_unlock(&tl->mutex);
		if (err) {
			i915_request_add(rq);
			goto out;
		}
		pr_debug("seqno[1]:%08x, hwsp_offset:%08x\n",
			 seqno[1], tl->hwsp_offset);

		err = emit_ggtt_store_dw(rq, tl->hwsp_offset, seqno[1]);
		if (err) {
			i915_request_add(rq);
			goto out;
		}
		hwsp_seqno[1] = tl->hwsp_seqno;

		/* With wrap should come a new hwsp */
		GEM_BUG_ON(seqno[1] >= seqno[0]);
		GEM_BUG_ON(hwsp_seqno[0] == hwsp_seqno[1]);

		i915_request_add(rq);

		if (i915_request_wait(rq, 0, HZ / 5) < 0) {
			pr_err("Wait for timeline writes timed out!\n");
			err = -EIO;
			goto out;
		}

		/* Both the old and the new location must hold their own value */
		if (READ_ONCE(*hwsp_seqno[0]) != seqno[0] ||
		    READ_ONCE(*hwsp_seqno[1]) != seqno[1]) {
			pr_err("Bad timeline values: found (%x, %x), expected (%x, %x)\n",
			       *hwsp_seqno[0], *hwsp_seqno[1],
			       seqno[0], seqno[1]);
			err = -EINVAL;
			goto out;
		}

76562306a36Sopenharmony_ci intel_gt_retire_requests(gt); /* recycle HWSP */ 76662306a36Sopenharmony_ci } 76762306a36Sopenharmony_ci 76862306a36Sopenharmony_ciout: 76962306a36Sopenharmony_ci if (igt_flush_test(gt->i915)) 77062306a36Sopenharmony_ci err = -EIO; 77162306a36Sopenharmony_ci 77262306a36Sopenharmony_ci intel_timeline_unpin(tl); 77362306a36Sopenharmony_ciout_free: 77462306a36Sopenharmony_ci intel_timeline_put(tl); 77562306a36Sopenharmony_ci return err; 77662306a36Sopenharmony_ci} 77762306a36Sopenharmony_ci 77862306a36Sopenharmony_cistatic int emit_read_hwsp(struct i915_request *rq, 77962306a36Sopenharmony_ci u32 seqno, u32 hwsp, 78062306a36Sopenharmony_ci u32 *addr) 78162306a36Sopenharmony_ci{ 78262306a36Sopenharmony_ci const u32 gpr = i915_mmio_reg_offset(GEN8_RING_CS_GPR(rq->engine->mmio_base, 0)); 78362306a36Sopenharmony_ci u32 *cs; 78462306a36Sopenharmony_ci 78562306a36Sopenharmony_ci cs = intel_ring_begin(rq, 12); 78662306a36Sopenharmony_ci if (IS_ERR(cs)) 78762306a36Sopenharmony_ci return PTR_ERR(cs); 78862306a36Sopenharmony_ci 78962306a36Sopenharmony_ci *cs++ = MI_STORE_DWORD_IMM_GEN4 | MI_USE_GGTT; 79062306a36Sopenharmony_ci *cs++ = *addr; 79162306a36Sopenharmony_ci *cs++ = 0; 79262306a36Sopenharmony_ci *cs++ = seqno; 79362306a36Sopenharmony_ci *addr += 4; 79462306a36Sopenharmony_ci 79562306a36Sopenharmony_ci *cs++ = MI_LOAD_REGISTER_MEM_GEN8 | MI_USE_GGTT; 79662306a36Sopenharmony_ci *cs++ = gpr; 79762306a36Sopenharmony_ci *cs++ = hwsp; 79862306a36Sopenharmony_ci *cs++ = 0; 79962306a36Sopenharmony_ci 80062306a36Sopenharmony_ci *cs++ = MI_STORE_REGISTER_MEM_GEN8 | MI_USE_GGTT; 80162306a36Sopenharmony_ci *cs++ = gpr; 80262306a36Sopenharmony_ci *cs++ = *addr; 80362306a36Sopenharmony_ci *cs++ = 0; 80462306a36Sopenharmony_ci *addr += 4; 80562306a36Sopenharmony_ci 80662306a36Sopenharmony_ci intel_ring_advance(rq, cs); 80762306a36Sopenharmony_ci 80862306a36Sopenharmony_ci return 0; 80962306a36Sopenharmony_ci} 81062306a36Sopenharmony_ci 
81162306a36Sopenharmony_cistruct hwsp_watcher { 81262306a36Sopenharmony_ci struct i915_vma *vma; 81362306a36Sopenharmony_ci struct i915_request *rq; 81462306a36Sopenharmony_ci u32 addr; 81562306a36Sopenharmony_ci u32 *map; 81662306a36Sopenharmony_ci}; 81762306a36Sopenharmony_ci 81862306a36Sopenharmony_cistatic bool cmp_lt(u32 a, u32 b) 81962306a36Sopenharmony_ci{ 82062306a36Sopenharmony_ci return a < b; 82162306a36Sopenharmony_ci} 82262306a36Sopenharmony_ci 82362306a36Sopenharmony_cistatic bool cmp_gte(u32 a, u32 b) 82462306a36Sopenharmony_ci{ 82562306a36Sopenharmony_ci return a >= b; 82662306a36Sopenharmony_ci} 82762306a36Sopenharmony_ci 82862306a36Sopenharmony_cistatic int setup_watcher(struct hwsp_watcher *w, struct intel_gt *gt, 82962306a36Sopenharmony_ci struct intel_timeline *tl) 83062306a36Sopenharmony_ci{ 83162306a36Sopenharmony_ci struct drm_i915_gem_object *obj; 83262306a36Sopenharmony_ci struct i915_vma *vma; 83362306a36Sopenharmony_ci 83462306a36Sopenharmony_ci obj = i915_gem_object_create_internal(gt->i915, SZ_2M); 83562306a36Sopenharmony_ci if (IS_ERR(obj)) 83662306a36Sopenharmony_ci return PTR_ERR(obj); 83762306a36Sopenharmony_ci 83862306a36Sopenharmony_ci /* keep the same cache settings as timeline */ 83962306a36Sopenharmony_ci i915_gem_object_set_pat_index(obj, tl->hwsp_ggtt->obj->pat_index); 84062306a36Sopenharmony_ci w->map = i915_gem_object_pin_map_unlocked(obj, 84162306a36Sopenharmony_ci page_unmask_bits(tl->hwsp_ggtt->obj->mm.mapping)); 84262306a36Sopenharmony_ci if (IS_ERR(w->map)) { 84362306a36Sopenharmony_ci i915_gem_object_put(obj); 84462306a36Sopenharmony_ci return PTR_ERR(w->map); 84562306a36Sopenharmony_ci } 84662306a36Sopenharmony_ci 84762306a36Sopenharmony_ci vma = i915_gem_object_ggtt_pin(obj, NULL, 0, 0, 0); 84862306a36Sopenharmony_ci if (IS_ERR(vma)) { 84962306a36Sopenharmony_ci i915_gem_object_put(obj); 85062306a36Sopenharmony_ci return PTR_ERR(vma); 85162306a36Sopenharmony_ci } 85262306a36Sopenharmony_ci 
85362306a36Sopenharmony_ci w->vma = vma; 85462306a36Sopenharmony_ci w->addr = i915_ggtt_offset(vma); 85562306a36Sopenharmony_ci return 0; 85662306a36Sopenharmony_ci} 85762306a36Sopenharmony_ci 85862306a36Sopenharmony_cistatic void switch_tl_lock(struct i915_request *from, struct i915_request *to) 85962306a36Sopenharmony_ci{ 86062306a36Sopenharmony_ci /* some light mutex juggling required; think co-routines */ 86162306a36Sopenharmony_ci 86262306a36Sopenharmony_ci if (from) { 86362306a36Sopenharmony_ci lockdep_unpin_lock(&from->context->timeline->mutex, from->cookie); 86462306a36Sopenharmony_ci mutex_unlock(&from->context->timeline->mutex); 86562306a36Sopenharmony_ci } 86662306a36Sopenharmony_ci 86762306a36Sopenharmony_ci if (to) { 86862306a36Sopenharmony_ci mutex_lock(&to->context->timeline->mutex); 86962306a36Sopenharmony_ci to->cookie = lockdep_pin_lock(&to->context->timeline->mutex); 87062306a36Sopenharmony_ci } 87162306a36Sopenharmony_ci} 87262306a36Sopenharmony_ci 87362306a36Sopenharmony_cistatic int create_watcher(struct hwsp_watcher *w, 87462306a36Sopenharmony_ci struct intel_engine_cs *engine, 87562306a36Sopenharmony_ci int ringsz) 87662306a36Sopenharmony_ci{ 87762306a36Sopenharmony_ci struct intel_context *ce; 87862306a36Sopenharmony_ci 87962306a36Sopenharmony_ci ce = intel_context_create(engine); 88062306a36Sopenharmony_ci if (IS_ERR(ce)) 88162306a36Sopenharmony_ci return PTR_ERR(ce); 88262306a36Sopenharmony_ci 88362306a36Sopenharmony_ci ce->ring_size = ringsz; 88462306a36Sopenharmony_ci w->rq = intel_context_create_request(ce); 88562306a36Sopenharmony_ci intel_context_put(ce); 88662306a36Sopenharmony_ci if (IS_ERR(w->rq)) 88762306a36Sopenharmony_ci return PTR_ERR(w->rq); 88862306a36Sopenharmony_ci 88962306a36Sopenharmony_ci w->addr = i915_ggtt_offset(w->vma); 89062306a36Sopenharmony_ci 89162306a36Sopenharmony_ci switch_tl_lock(w->rq, NULL); 89262306a36Sopenharmony_ci 89362306a36Sopenharmony_ci return 0; 89462306a36Sopenharmony_ci} 
89562306a36Sopenharmony_ci 89662306a36Sopenharmony_cistatic int check_watcher(struct hwsp_watcher *w, const char *name, 89762306a36Sopenharmony_ci bool (*op)(u32 hwsp, u32 seqno)) 89862306a36Sopenharmony_ci{ 89962306a36Sopenharmony_ci struct i915_request *rq = fetch_and_zero(&w->rq); 90062306a36Sopenharmony_ci u32 offset, end; 90162306a36Sopenharmony_ci int err; 90262306a36Sopenharmony_ci 90362306a36Sopenharmony_ci GEM_BUG_ON(w->addr - i915_ggtt_offset(w->vma) > w->vma->size); 90462306a36Sopenharmony_ci 90562306a36Sopenharmony_ci i915_request_get(rq); 90662306a36Sopenharmony_ci switch_tl_lock(NULL, rq); 90762306a36Sopenharmony_ci i915_request_add(rq); 90862306a36Sopenharmony_ci 90962306a36Sopenharmony_ci if (i915_request_wait(rq, 0, HZ) < 0) { 91062306a36Sopenharmony_ci err = -ETIME; 91162306a36Sopenharmony_ci goto out; 91262306a36Sopenharmony_ci } 91362306a36Sopenharmony_ci 91462306a36Sopenharmony_ci err = 0; 91562306a36Sopenharmony_ci offset = 0; 91662306a36Sopenharmony_ci end = (w->addr - i915_ggtt_offset(w->vma)) / sizeof(*w->map); 91762306a36Sopenharmony_ci while (offset < end) { 91862306a36Sopenharmony_ci if (!op(w->map[offset + 1], w->map[offset])) { 91962306a36Sopenharmony_ci pr_err("Watcher '%s' found HWSP value %x for seqno %x\n", 92062306a36Sopenharmony_ci name, w->map[offset + 1], w->map[offset]); 92162306a36Sopenharmony_ci err = -EINVAL; 92262306a36Sopenharmony_ci } 92362306a36Sopenharmony_ci 92462306a36Sopenharmony_ci offset += 2; 92562306a36Sopenharmony_ci } 92662306a36Sopenharmony_ci 92762306a36Sopenharmony_ciout: 92862306a36Sopenharmony_ci i915_request_put(rq); 92962306a36Sopenharmony_ci return err; 93062306a36Sopenharmony_ci} 93162306a36Sopenharmony_ci 93262306a36Sopenharmony_cistatic void cleanup_watcher(struct hwsp_watcher *w) 93362306a36Sopenharmony_ci{ 93462306a36Sopenharmony_ci if (w->rq) { 93562306a36Sopenharmony_ci switch_tl_lock(NULL, w->rq); 93662306a36Sopenharmony_ci 93762306a36Sopenharmony_ci i915_request_add(w->rq); 
93862306a36Sopenharmony_ci } 93962306a36Sopenharmony_ci 94062306a36Sopenharmony_ci i915_vma_unpin_and_release(&w->vma, I915_VMA_RELEASE_MAP); 94162306a36Sopenharmony_ci} 94262306a36Sopenharmony_ci 94362306a36Sopenharmony_cistatic bool retire_requests(struct intel_timeline *tl) 94462306a36Sopenharmony_ci{ 94562306a36Sopenharmony_ci struct i915_request *rq, *rn; 94662306a36Sopenharmony_ci 94762306a36Sopenharmony_ci mutex_lock(&tl->mutex); 94862306a36Sopenharmony_ci list_for_each_entry_safe(rq, rn, &tl->requests, link) 94962306a36Sopenharmony_ci if (!i915_request_retire(rq)) 95062306a36Sopenharmony_ci break; 95162306a36Sopenharmony_ci mutex_unlock(&tl->mutex); 95262306a36Sopenharmony_ci 95362306a36Sopenharmony_ci return !i915_active_fence_isset(&tl->last_request); 95462306a36Sopenharmony_ci} 95562306a36Sopenharmony_ci 95662306a36Sopenharmony_cistatic struct i915_request *wrap_timeline(struct i915_request *rq) 95762306a36Sopenharmony_ci{ 95862306a36Sopenharmony_ci struct intel_context *ce = rq->context; 95962306a36Sopenharmony_ci struct intel_timeline *tl = ce->timeline; 96062306a36Sopenharmony_ci u32 seqno = rq->fence.seqno; 96162306a36Sopenharmony_ci 96262306a36Sopenharmony_ci while (tl->seqno >= seqno) { /* Cause a wrap */ 96362306a36Sopenharmony_ci i915_request_put(rq); 96462306a36Sopenharmony_ci rq = intel_context_create_request(ce); 96562306a36Sopenharmony_ci if (IS_ERR(rq)) 96662306a36Sopenharmony_ci return rq; 96762306a36Sopenharmony_ci 96862306a36Sopenharmony_ci i915_request_get(rq); 96962306a36Sopenharmony_ci i915_request_add(rq); 97062306a36Sopenharmony_ci } 97162306a36Sopenharmony_ci 97262306a36Sopenharmony_ci i915_request_put(rq); 97362306a36Sopenharmony_ci rq = i915_request_create(ce); 97462306a36Sopenharmony_ci if (IS_ERR(rq)) 97562306a36Sopenharmony_ci return rq; 97662306a36Sopenharmony_ci 97762306a36Sopenharmony_ci i915_request_get(rq); 97862306a36Sopenharmony_ci i915_request_add(rq); 97962306a36Sopenharmony_ci 98062306a36Sopenharmony_ci return rq; 
98162306a36Sopenharmony_ci} 98262306a36Sopenharmony_ci 98362306a36Sopenharmony_cistatic int live_hwsp_read(void *arg) 98462306a36Sopenharmony_ci{ 98562306a36Sopenharmony_ci struct intel_gt *gt = arg; 98662306a36Sopenharmony_ci struct hwsp_watcher watcher[2] = {}; 98762306a36Sopenharmony_ci struct intel_engine_cs *engine; 98862306a36Sopenharmony_ci struct intel_timeline *tl; 98962306a36Sopenharmony_ci enum intel_engine_id id; 99062306a36Sopenharmony_ci int err = 0; 99162306a36Sopenharmony_ci int i; 99262306a36Sopenharmony_ci 99362306a36Sopenharmony_ci /* 99462306a36Sopenharmony_ci * If we take a reference to the HWSP for reading on the GPU, that 99562306a36Sopenharmony_ci * read may be arbitrarily delayed (either by foreign fence or 99662306a36Sopenharmony_ci * priority saturation) and a wrap can happen within 30 minutes. 99762306a36Sopenharmony_ci * When the GPU read is finally submitted it should be correct, 99862306a36Sopenharmony_ci * even across multiple wraps. 99962306a36Sopenharmony_ci */ 100062306a36Sopenharmony_ci 100162306a36Sopenharmony_ci if (GRAPHICS_VER(gt->i915) < 8) /* CS convenience [SRM/LRM] */ 100262306a36Sopenharmony_ci return 0; 100362306a36Sopenharmony_ci 100462306a36Sopenharmony_ci tl = intel_timeline_create(gt); 100562306a36Sopenharmony_ci if (IS_ERR(tl)) 100662306a36Sopenharmony_ci return PTR_ERR(tl); 100762306a36Sopenharmony_ci 100862306a36Sopenharmony_ci if (!tl->has_initial_breadcrumb) 100962306a36Sopenharmony_ci goto out_free; 101062306a36Sopenharmony_ci 101162306a36Sopenharmony_ci selftest_tl_pin(tl); 101262306a36Sopenharmony_ci 101362306a36Sopenharmony_ci for (i = 0; i < ARRAY_SIZE(watcher); i++) { 101462306a36Sopenharmony_ci err = setup_watcher(&watcher[i], gt, tl); 101562306a36Sopenharmony_ci if (err) 101662306a36Sopenharmony_ci goto out; 101762306a36Sopenharmony_ci } 101862306a36Sopenharmony_ci 101962306a36Sopenharmony_ci for_each_engine(engine, gt, id) { 102062306a36Sopenharmony_ci struct intel_context *ce; 
102162306a36Sopenharmony_ci unsigned long count = 0; 102262306a36Sopenharmony_ci IGT_TIMEOUT(end_time); 102362306a36Sopenharmony_ci 102462306a36Sopenharmony_ci /* Create a request we can use for remote reading of the HWSP */ 102562306a36Sopenharmony_ci err = create_watcher(&watcher[1], engine, SZ_512K); 102662306a36Sopenharmony_ci if (err) 102762306a36Sopenharmony_ci goto out; 102862306a36Sopenharmony_ci 102962306a36Sopenharmony_ci do { 103062306a36Sopenharmony_ci struct i915_sw_fence *submit; 103162306a36Sopenharmony_ci struct i915_request *rq; 103262306a36Sopenharmony_ci u32 hwsp, dummy; 103362306a36Sopenharmony_ci 103462306a36Sopenharmony_ci submit = heap_fence_create(GFP_KERNEL); 103562306a36Sopenharmony_ci if (!submit) { 103662306a36Sopenharmony_ci err = -ENOMEM; 103762306a36Sopenharmony_ci goto out; 103862306a36Sopenharmony_ci } 103962306a36Sopenharmony_ci 104062306a36Sopenharmony_ci err = create_watcher(&watcher[0], engine, SZ_4K); 104162306a36Sopenharmony_ci if (err) 104262306a36Sopenharmony_ci goto out; 104362306a36Sopenharmony_ci 104462306a36Sopenharmony_ci ce = intel_context_create(engine); 104562306a36Sopenharmony_ci if (IS_ERR(ce)) { 104662306a36Sopenharmony_ci err = PTR_ERR(ce); 104762306a36Sopenharmony_ci goto out; 104862306a36Sopenharmony_ci } 104962306a36Sopenharmony_ci 105062306a36Sopenharmony_ci ce->timeline = intel_timeline_get(tl); 105162306a36Sopenharmony_ci 105262306a36Sopenharmony_ci /* Ensure timeline is mapped, done during first pin */ 105362306a36Sopenharmony_ci err = intel_context_pin(ce); 105462306a36Sopenharmony_ci if (err) { 105562306a36Sopenharmony_ci intel_context_put(ce); 105662306a36Sopenharmony_ci goto out; 105762306a36Sopenharmony_ci } 105862306a36Sopenharmony_ci 105962306a36Sopenharmony_ci /* 106062306a36Sopenharmony_ci * Start at a new wrap, and set seqno right before another wrap, 106162306a36Sopenharmony_ci * saving 30 minutes of nops 106262306a36Sopenharmony_ci */ 106362306a36Sopenharmony_ci tl->seqno = -12u + 2 * (count & 
3); 106462306a36Sopenharmony_ci __intel_timeline_get_seqno(tl, &dummy); 106562306a36Sopenharmony_ci 106662306a36Sopenharmony_ci rq = i915_request_create(ce); 106762306a36Sopenharmony_ci if (IS_ERR(rq)) { 106862306a36Sopenharmony_ci err = PTR_ERR(rq); 106962306a36Sopenharmony_ci intel_context_unpin(ce); 107062306a36Sopenharmony_ci intel_context_put(ce); 107162306a36Sopenharmony_ci goto out; 107262306a36Sopenharmony_ci } 107362306a36Sopenharmony_ci 107462306a36Sopenharmony_ci err = i915_sw_fence_await_dma_fence(&rq->submit, 107562306a36Sopenharmony_ci &watcher[0].rq->fence, 0, 107662306a36Sopenharmony_ci GFP_KERNEL); 107762306a36Sopenharmony_ci if (err < 0) { 107862306a36Sopenharmony_ci i915_request_add(rq); 107962306a36Sopenharmony_ci intel_context_unpin(ce); 108062306a36Sopenharmony_ci intel_context_put(ce); 108162306a36Sopenharmony_ci goto out; 108262306a36Sopenharmony_ci } 108362306a36Sopenharmony_ci 108462306a36Sopenharmony_ci switch_tl_lock(rq, watcher[0].rq); 108562306a36Sopenharmony_ci err = intel_timeline_read_hwsp(rq, watcher[0].rq, &hwsp); 108662306a36Sopenharmony_ci if (err == 0) 108762306a36Sopenharmony_ci err = emit_read_hwsp(watcher[0].rq, /* before */ 108862306a36Sopenharmony_ci rq->fence.seqno, hwsp, 108962306a36Sopenharmony_ci &watcher[0].addr); 109062306a36Sopenharmony_ci switch_tl_lock(watcher[0].rq, rq); 109162306a36Sopenharmony_ci if (err) { 109262306a36Sopenharmony_ci i915_request_add(rq); 109362306a36Sopenharmony_ci intel_context_unpin(ce); 109462306a36Sopenharmony_ci intel_context_put(ce); 109562306a36Sopenharmony_ci goto out; 109662306a36Sopenharmony_ci } 109762306a36Sopenharmony_ci 109862306a36Sopenharmony_ci switch_tl_lock(rq, watcher[1].rq); 109962306a36Sopenharmony_ci err = intel_timeline_read_hwsp(rq, watcher[1].rq, &hwsp); 110062306a36Sopenharmony_ci if (err == 0) 110162306a36Sopenharmony_ci err = emit_read_hwsp(watcher[1].rq, /* after */ 110262306a36Sopenharmony_ci rq->fence.seqno, hwsp, 110362306a36Sopenharmony_ci &watcher[1].addr); 
110462306a36Sopenharmony_ci switch_tl_lock(watcher[1].rq, rq); 110562306a36Sopenharmony_ci if (err) { 110662306a36Sopenharmony_ci i915_request_add(rq); 110762306a36Sopenharmony_ci intel_context_unpin(ce); 110862306a36Sopenharmony_ci intel_context_put(ce); 110962306a36Sopenharmony_ci goto out; 111062306a36Sopenharmony_ci } 111162306a36Sopenharmony_ci 111262306a36Sopenharmony_ci i915_request_get(rq); 111362306a36Sopenharmony_ci i915_request_add(rq); 111462306a36Sopenharmony_ci 111562306a36Sopenharmony_ci rq = wrap_timeline(rq); 111662306a36Sopenharmony_ci intel_context_unpin(ce); 111762306a36Sopenharmony_ci intel_context_put(ce); 111862306a36Sopenharmony_ci if (IS_ERR(rq)) { 111962306a36Sopenharmony_ci err = PTR_ERR(rq); 112062306a36Sopenharmony_ci goto out; 112162306a36Sopenharmony_ci } 112262306a36Sopenharmony_ci 112362306a36Sopenharmony_ci err = i915_sw_fence_await_dma_fence(&watcher[1].rq->submit, 112462306a36Sopenharmony_ci &rq->fence, 0, 112562306a36Sopenharmony_ci GFP_KERNEL); 112662306a36Sopenharmony_ci if (err < 0) { 112762306a36Sopenharmony_ci i915_request_put(rq); 112862306a36Sopenharmony_ci goto out; 112962306a36Sopenharmony_ci } 113062306a36Sopenharmony_ci 113162306a36Sopenharmony_ci err = check_watcher(&watcher[0], "before", cmp_lt); 113262306a36Sopenharmony_ci i915_sw_fence_commit(submit); 113362306a36Sopenharmony_ci heap_fence_put(submit); 113462306a36Sopenharmony_ci if (err) { 113562306a36Sopenharmony_ci i915_request_put(rq); 113662306a36Sopenharmony_ci goto out; 113762306a36Sopenharmony_ci } 113862306a36Sopenharmony_ci count++; 113962306a36Sopenharmony_ci 114062306a36Sopenharmony_ci /* Flush the timeline before manually wrapping again */ 114162306a36Sopenharmony_ci if (i915_request_wait(rq, 114262306a36Sopenharmony_ci I915_WAIT_INTERRUPTIBLE, 114362306a36Sopenharmony_ci HZ) < 0) { 114462306a36Sopenharmony_ci err = -ETIME; 114562306a36Sopenharmony_ci i915_request_put(rq); 114662306a36Sopenharmony_ci goto out; 114762306a36Sopenharmony_ci } 
114862306a36Sopenharmony_ci retire_requests(tl); 114962306a36Sopenharmony_ci i915_request_put(rq); 115062306a36Sopenharmony_ci 115162306a36Sopenharmony_ci /* Single requests are limited to half a ring at most */ 115262306a36Sopenharmony_ci if (8 * watcher[1].rq->ring->emit > 115362306a36Sopenharmony_ci 3 * watcher[1].rq->ring->size) 115462306a36Sopenharmony_ci break; 115562306a36Sopenharmony_ci 115662306a36Sopenharmony_ci } while (!__igt_timeout(end_time, NULL) && 115762306a36Sopenharmony_ci count < (PAGE_SIZE / TIMELINE_SEQNO_BYTES - 1) / 2); 115862306a36Sopenharmony_ci 115962306a36Sopenharmony_ci pr_info("%s: simulated %lu wraps\n", engine->name, count); 116062306a36Sopenharmony_ci err = check_watcher(&watcher[1], "after", cmp_gte); 116162306a36Sopenharmony_ci if (err) 116262306a36Sopenharmony_ci goto out; 116362306a36Sopenharmony_ci } 116462306a36Sopenharmony_ci 116562306a36Sopenharmony_ciout: 116662306a36Sopenharmony_ci for (i = 0; i < ARRAY_SIZE(watcher); i++) 116762306a36Sopenharmony_ci cleanup_watcher(&watcher[i]); 116862306a36Sopenharmony_ci 116962306a36Sopenharmony_ci intel_timeline_unpin(tl); 117062306a36Sopenharmony_ci 117162306a36Sopenharmony_ci if (igt_flush_test(gt->i915)) 117262306a36Sopenharmony_ci err = -EIO; 117362306a36Sopenharmony_ci 117462306a36Sopenharmony_ciout_free: 117562306a36Sopenharmony_ci intel_timeline_put(tl); 117662306a36Sopenharmony_ci return err; 117762306a36Sopenharmony_ci} 117862306a36Sopenharmony_ci 117962306a36Sopenharmony_cistatic int live_hwsp_rollover_kernel(void *arg) 118062306a36Sopenharmony_ci{ 118162306a36Sopenharmony_ci struct intel_gt *gt = arg; 118262306a36Sopenharmony_ci struct intel_engine_cs *engine; 118362306a36Sopenharmony_ci enum intel_engine_id id; 118462306a36Sopenharmony_ci int err = 0; 118562306a36Sopenharmony_ci 118662306a36Sopenharmony_ci /* 118762306a36Sopenharmony_ci * Run the host for long enough, and even the kernel context will 118862306a36Sopenharmony_ci * see a seqno rollover. 
118962306a36Sopenharmony_ci */ 119062306a36Sopenharmony_ci 119162306a36Sopenharmony_ci for_each_engine(engine, gt, id) { 119262306a36Sopenharmony_ci struct intel_context *ce = engine->kernel_context; 119362306a36Sopenharmony_ci struct intel_timeline *tl = ce->timeline; 119462306a36Sopenharmony_ci struct i915_request *rq[3] = {}; 119562306a36Sopenharmony_ci int i; 119662306a36Sopenharmony_ci 119762306a36Sopenharmony_ci st_engine_heartbeat_disable(engine); 119862306a36Sopenharmony_ci if (intel_gt_wait_for_idle(gt, HZ / 2)) { 119962306a36Sopenharmony_ci err = -EIO; 120062306a36Sopenharmony_ci goto out; 120162306a36Sopenharmony_ci } 120262306a36Sopenharmony_ci 120362306a36Sopenharmony_ci GEM_BUG_ON(i915_active_fence_isset(&tl->last_request)); 120462306a36Sopenharmony_ci tl->seqno = -2u; 120562306a36Sopenharmony_ci WRITE_ONCE(*(u32 *)tl->hwsp_seqno, tl->seqno); 120662306a36Sopenharmony_ci 120762306a36Sopenharmony_ci for (i = 0; i < ARRAY_SIZE(rq); i++) { 120862306a36Sopenharmony_ci struct i915_request *this; 120962306a36Sopenharmony_ci 121062306a36Sopenharmony_ci this = i915_request_create(ce); 121162306a36Sopenharmony_ci if (IS_ERR(this)) { 121262306a36Sopenharmony_ci err = PTR_ERR(this); 121362306a36Sopenharmony_ci goto out; 121462306a36Sopenharmony_ci } 121562306a36Sopenharmony_ci 121662306a36Sopenharmony_ci pr_debug("%s: create fence.seqnp:%d\n", 121762306a36Sopenharmony_ci engine->name, 121862306a36Sopenharmony_ci lower_32_bits(this->fence.seqno)); 121962306a36Sopenharmony_ci 122062306a36Sopenharmony_ci GEM_BUG_ON(rcu_access_pointer(this->timeline) != tl); 122162306a36Sopenharmony_ci 122262306a36Sopenharmony_ci rq[i] = i915_request_get(this); 122362306a36Sopenharmony_ci i915_request_add(this); 122462306a36Sopenharmony_ci } 122562306a36Sopenharmony_ci 122662306a36Sopenharmony_ci /* We expected a wrap! 
*/ 122762306a36Sopenharmony_ci GEM_BUG_ON(rq[2]->fence.seqno > rq[0]->fence.seqno); 122862306a36Sopenharmony_ci 122962306a36Sopenharmony_ci if (i915_request_wait(rq[2], 0, HZ / 5) < 0) { 123062306a36Sopenharmony_ci pr_err("Wait for timeline wrap timed out!\n"); 123162306a36Sopenharmony_ci err = -EIO; 123262306a36Sopenharmony_ci goto out; 123362306a36Sopenharmony_ci } 123462306a36Sopenharmony_ci 123562306a36Sopenharmony_ci for (i = 0; i < ARRAY_SIZE(rq); i++) { 123662306a36Sopenharmony_ci if (!i915_request_completed(rq[i])) { 123762306a36Sopenharmony_ci pr_err("Pre-wrap request not completed!\n"); 123862306a36Sopenharmony_ci err = -EINVAL; 123962306a36Sopenharmony_ci goto out; 124062306a36Sopenharmony_ci } 124162306a36Sopenharmony_ci } 124262306a36Sopenharmony_ci 124362306a36Sopenharmony_ciout: 124462306a36Sopenharmony_ci for (i = 0; i < ARRAY_SIZE(rq); i++) 124562306a36Sopenharmony_ci i915_request_put(rq[i]); 124662306a36Sopenharmony_ci st_engine_heartbeat_enable(engine); 124762306a36Sopenharmony_ci if (err) 124862306a36Sopenharmony_ci break; 124962306a36Sopenharmony_ci } 125062306a36Sopenharmony_ci 125162306a36Sopenharmony_ci if (igt_flush_test(gt->i915)) 125262306a36Sopenharmony_ci err = -EIO; 125362306a36Sopenharmony_ci 125462306a36Sopenharmony_ci return err; 125562306a36Sopenharmony_ci} 125662306a36Sopenharmony_ci 125762306a36Sopenharmony_cistatic int live_hwsp_rollover_user(void *arg) 125862306a36Sopenharmony_ci{ 125962306a36Sopenharmony_ci struct intel_gt *gt = arg; 126062306a36Sopenharmony_ci struct intel_engine_cs *engine; 126162306a36Sopenharmony_ci enum intel_engine_id id; 126262306a36Sopenharmony_ci int err = 0; 126362306a36Sopenharmony_ci 126462306a36Sopenharmony_ci /* 126562306a36Sopenharmony_ci * Simulate a long running user context, and force the seqno wrap 126662306a36Sopenharmony_ci * on the user's timeline. 
126762306a36Sopenharmony_ci */ 126862306a36Sopenharmony_ci 126962306a36Sopenharmony_ci for_each_engine(engine, gt, id) { 127062306a36Sopenharmony_ci struct i915_request *rq[3] = {}; 127162306a36Sopenharmony_ci struct intel_timeline *tl; 127262306a36Sopenharmony_ci struct intel_context *ce; 127362306a36Sopenharmony_ci int i; 127462306a36Sopenharmony_ci 127562306a36Sopenharmony_ci ce = intel_context_create(engine); 127662306a36Sopenharmony_ci if (IS_ERR(ce)) 127762306a36Sopenharmony_ci return PTR_ERR(ce); 127862306a36Sopenharmony_ci 127962306a36Sopenharmony_ci err = intel_context_alloc_state(ce); 128062306a36Sopenharmony_ci if (err) 128162306a36Sopenharmony_ci goto out; 128262306a36Sopenharmony_ci 128362306a36Sopenharmony_ci tl = ce->timeline; 128462306a36Sopenharmony_ci if (!tl->has_initial_breadcrumb) 128562306a36Sopenharmony_ci goto out; 128662306a36Sopenharmony_ci 128762306a36Sopenharmony_ci err = intel_context_pin(ce); 128862306a36Sopenharmony_ci if (err) 128962306a36Sopenharmony_ci goto out; 129062306a36Sopenharmony_ci 129162306a36Sopenharmony_ci tl->seqno = -4u; 129262306a36Sopenharmony_ci WRITE_ONCE(*(u32 *)tl->hwsp_seqno, tl->seqno); 129362306a36Sopenharmony_ci 129462306a36Sopenharmony_ci for (i = 0; i < ARRAY_SIZE(rq); i++) { 129562306a36Sopenharmony_ci struct i915_request *this; 129662306a36Sopenharmony_ci 129762306a36Sopenharmony_ci this = intel_context_create_request(ce); 129862306a36Sopenharmony_ci if (IS_ERR(this)) { 129962306a36Sopenharmony_ci err = PTR_ERR(this); 130062306a36Sopenharmony_ci goto out_unpin; 130162306a36Sopenharmony_ci } 130262306a36Sopenharmony_ci 130362306a36Sopenharmony_ci pr_debug("%s: create fence.seqnp:%d\n", 130462306a36Sopenharmony_ci engine->name, 130562306a36Sopenharmony_ci lower_32_bits(this->fence.seqno)); 130662306a36Sopenharmony_ci 130762306a36Sopenharmony_ci GEM_BUG_ON(rcu_access_pointer(this->timeline) != tl); 130862306a36Sopenharmony_ci 130962306a36Sopenharmony_ci rq[i] = i915_request_get(this); 
131062306a36Sopenharmony_ci i915_request_add(this); 131162306a36Sopenharmony_ci } 131262306a36Sopenharmony_ci 131362306a36Sopenharmony_ci /* We expected a wrap! */ 131462306a36Sopenharmony_ci GEM_BUG_ON(rq[2]->fence.seqno > rq[0]->fence.seqno); 131562306a36Sopenharmony_ci 131662306a36Sopenharmony_ci if (i915_request_wait(rq[2], 0, HZ / 5) < 0) { 131762306a36Sopenharmony_ci pr_err("Wait for timeline wrap timed out!\n"); 131862306a36Sopenharmony_ci err = -EIO; 131962306a36Sopenharmony_ci goto out_unpin; 132062306a36Sopenharmony_ci } 132162306a36Sopenharmony_ci 132262306a36Sopenharmony_ci for (i = 0; i < ARRAY_SIZE(rq); i++) { 132362306a36Sopenharmony_ci if (!i915_request_completed(rq[i])) { 132462306a36Sopenharmony_ci pr_err("Pre-wrap request not completed!\n"); 132562306a36Sopenharmony_ci err = -EINVAL; 132662306a36Sopenharmony_ci goto out_unpin; 132762306a36Sopenharmony_ci } 132862306a36Sopenharmony_ci } 132962306a36Sopenharmony_ciout_unpin: 133062306a36Sopenharmony_ci intel_context_unpin(ce); 133162306a36Sopenharmony_ciout: 133262306a36Sopenharmony_ci for (i = 0; i < ARRAY_SIZE(rq); i++) 133362306a36Sopenharmony_ci i915_request_put(rq[i]); 133462306a36Sopenharmony_ci intel_context_put(ce); 133562306a36Sopenharmony_ci if (err) 133662306a36Sopenharmony_ci break; 133762306a36Sopenharmony_ci } 133862306a36Sopenharmony_ci 133962306a36Sopenharmony_ci if (igt_flush_test(gt->i915)) 134062306a36Sopenharmony_ci err = -EIO; 134162306a36Sopenharmony_ci 134262306a36Sopenharmony_ci return err; 134362306a36Sopenharmony_ci} 134462306a36Sopenharmony_ci 134562306a36Sopenharmony_cistatic int live_hwsp_recycle(void *arg) 134662306a36Sopenharmony_ci{ 134762306a36Sopenharmony_ci struct intel_gt *gt = arg; 134862306a36Sopenharmony_ci struct intel_engine_cs *engine; 134962306a36Sopenharmony_ci enum intel_engine_id id; 135062306a36Sopenharmony_ci unsigned long count; 135162306a36Sopenharmony_ci int err = 0; 135262306a36Sopenharmony_ci 135362306a36Sopenharmony_ci /* 
135462306a36Sopenharmony_ci * Check seqno writes into one timeline at a time. We expect to 135562306a36Sopenharmony_ci * recycle the breadcrumb slot between iterations and neither 135662306a36Sopenharmony_ci * want to confuse ourselves or the GPU. 135762306a36Sopenharmony_ci */ 135862306a36Sopenharmony_ci 135962306a36Sopenharmony_ci count = 0; 136062306a36Sopenharmony_ci for_each_engine(engine, gt, id) { 136162306a36Sopenharmony_ci IGT_TIMEOUT(end_time); 136262306a36Sopenharmony_ci 136362306a36Sopenharmony_ci if (!intel_engine_can_store_dword(engine)) 136462306a36Sopenharmony_ci continue; 136562306a36Sopenharmony_ci 136662306a36Sopenharmony_ci intel_engine_pm_get(engine); 136762306a36Sopenharmony_ci 136862306a36Sopenharmony_ci do { 136962306a36Sopenharmony_ci struct intel_timeline *tl; 137062306a36Sopenharmony_ci struct i915_request *rq; 137162306a36Sopenharmony_ci 137262306a36Sopenharmony_ci tl = intel_timeline_create(gt); 137362306a36Sopenharmony_ci if (IS_ERR(tl)) { 137462306a36Sopenharmony_ci err = PTR_ERR(tl); 137562306a36Sopenharmony_ci break; 137662306a36Sopenharmony_ci } 137762306a36Sopenharmony_ci 137862306a36Sopenharmony_ci rq = checked_tl_write(tl, engine, count); 137962306a36Sopenharmony_ci if (IS_ERR(rq)) { 138062306a36Sopenharmony_ci intel_timeline_put(tl); 138162306a36Sopenharmony_ci err = PTR_ERR(rq); 138262306a36Sopenharmony_ci break; 138362306a36Sopenharmony_ci } 138462306a36Sopenharmony_ci 138562306a36Sopenharmony_ci if (i915_request_wait(rq, 0, HZ / 5) < 0) { 138662306a36Sopenharmony_ci pr_err("Wait for timeline writes timed out!\n"); 138762306a36Sopenharmony_ci i915_request_put(rq); 138862306a36Sopenharmony_ci intel_timeline_put(tl); 138962306a36Sopenharmony_ci err = -EIO; 139062306a36Sopenharmony_ci break; 139162306a36Sopenharmony_ci } 139262306a36Sopenharmony_ci 139362306a36Sopenharmony_ci if (READ_ONCE(*tl->hwsp_seqno) != count) { 139462306a36Sopenharmony_ci GEM_TRACE_ERR("Invalid seqno:%lu stored in timeline %llu @ %x found 0x%x\n", 
139562306a36Sopenharmony_ci count, tl->fence_context, 139662306a36Sopenharmony_ci tl->hwsp_offset, *tl->hwsp_seqno); 139762306a36Sopenharmony_ci GEM_TRACE_DUMP(); 139862306a36Sopenharmony_ci err = -EINVAL; 139962306a36Sopenharmony_ci } 140062306a36Sopenharmony_ci 140162306a36Sopenharmony_ci i915_request_put(rq); 140262306a36Sopenharmony_ci intel_timeline_put(tl); 140362306a36Sopenharmony_ci count++; 140462306a36Sopenharmony_ci 140562306a36Sopenharmony_ci if (err) 140662306a36Sopenharmony_ci break; 140762306a36Sopenharmony_ci } while (!__igt_timeout(end_time, NULL)); 140862306a36Sopenharmony_ci 140962306a36Sopenharmony_ci intel_engine_pm_put(engine); 141062306a36Sopenharmony_ci if (err) 141162306a36Sopenharmony_ci break; 141262306a36Sopenharmony_ci } 141362306a36Sopenharmony_ci 141462306a36Sopenharmony_ci return err; 141562306a36Sopenharmony_ci} 141662306a36Sopenharmony_ci 141762306a36Sopenharmony_ciint intel_timeline_live_selftests(struct drm_i915_private *i915) 141862306a36Sopenharmony_ci{ 141962306a36Sopenharmony_ci static const struct i915_subtest tests[] = { 142062306a36Sopenharmony_ci SUBTEST(live_hwsp_recycle), 142162306a36Sopenharmony_ci SUBTEST(live_hwsp_engine), 142262306a36Sopenharmony_ci SUBTEST(live_hwsp_alternate), 142362306a36Sopenharmony_ci SUBTEST(live_hwsp_wrap), 142462306a36Sopenharmony_ci SUBTEST(live_hwsp_read), 142562306a36Sopenharmony_ci SUBTEST(live_hwsp_rollover_kernel), 142662306a36Sopenharmony_ci SUBTEST(live_hwsp_rollover_user), 142762306a36Sopenharmony_ci }; 142862306a36Sopenharmony_ci 142962306a36Sopenharmony_ci if (intel_gt_is_wedged(to_gt(i915))) 143062306a36Sopenharmony_ci return 0; 143162306a36Sopenharmony_ci 143262306a36Sopenharmony_ci return intel_gt_live_subtests(tests, to_gt(i915)); 143362306a36Sopenharmony_ci} 1434