1d722e3fbSopenharmony_ci/*
2d722e3fbSopenharmony_ci * Copyright 2017 Advanced Micro Devices, Inc.
3d722e3fbSopenharmony_ci *
4d722e3fbSopenharmony_ci * Permission is hereby granted, free of charge, to any person obtaining a
5d722e3fbSopenharmony_ci * copy of this software and associated documentation files (the "Software"),
6d722e3fbSopenharmony_ci * to deal in the Software without restriction, including without limitation
7d722e3fbSopenharmony_ci * the rights to use, copy, modify, merge, publish, distribute, sublicense,
8d722e3fbSopenharmony_ci * and/or sell copies of the Software, and to permit persons to whom the
9d722e3fbSopenharmony_ci * Software is furnished to do so, subject to the following conditions:
10d722e3fbSopenharmony_ci *
11d722e3fbSopenharmony_ci * The above copyright notice and this permission notice shall be included in
12d722e3fbSopenharmony_ci * all copies or substantial portions of the Software.
13d722e3fbSopenharmony_ci *
14d722e3fbSopenharmony_ci * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
15d722e3fbSopenharmony_ci * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
16d722e3fbSopenharmony_ci * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT.  IN NO EVENT SHALL
17d722e3fbSopenharmony_ci * THE COPYRIGHT HOLDER(S) OR AUTHOR(S) BE LIABLE FOR ANY CLAIM, DAMAGES OR
18d722e3fbSopenharmony_ci * OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE,
19d722e3fbSopenharmony_ci * ARISING FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR
20d722e3fbSopenharmony_ci * OTHER DEALINGS IN THE SOFTWARE.
21d722e3fbSopenharmony_ci *
22d722e3fbSopenharmony_ci*/
23d722e3fbSopenharmony_ci
24d722e3fbSopenharmony_ci#include "CUnit/Basic.h"
25d722e3fbSopenharmony_ci#include "xf86drm.h"
26d722e3fbSopenharmony_ci
27d722e3fbSopenharmony_ci#include "amdgpu_test.h"
28d722e3fbSopenharmony_ci#include "amdgpu_drm.h"
29d722e3fbSopenharmony_ci#include "amdgpu_internal.h"
30d722e3fbSopenharmony_ci#include <pthread.h>
31d722e3fbSopenharmony_ci
32d722e3fbSopenharmony_cistatic  amdgpu_device_handle device_handle;
33d722e3fbSopenharmony_cistatic  uint32_t  major_version;
34d722e3fbSopenharmony_cistatic  uint32_t  minor_version;
35d722e3fbSopenharmony_ci
36d722e3fbSopenharmony_cistatic  uint32_t  family_id;
37d722e3fbSopenharmony_cistatic  uint32_t  chip_id;
38d722e3fbSopenharmony_cistatic  uint32_t  chip_rev;
39d722e3fbSopenharmony_ci
40d722e3fbSopenharmony_cistatic void amdgpu_syncobj_timeline_test(void);
41d722e3fbSopenharmony_ci
42d722e3fbSopenharmony_ciCU_BOOL suite_syncobj_timeline_tests_enable(void)
43d722e3fbSopenharmony_ci{
44d722e3fbSopenharmony_ci	int r;
45d722e3fbSopenharmony_ci	uint64_t cap = 0;
46d722e3fbSopenharmony_ci
47d722e3fbSopenharmony_ci	r = drmGetCap(drm_amdgpu[0], DRM_CAP_SYNCOBJ_TIMELINE, &cap);
48d722e3fbSopenharmony_ci	if (r || cap == 0)
49d722e3fbSopenharmony_ci		return CU_FALSE;
50d722e3fbSopenharmony_ci
51d722e3fbSopenharmony_ci	return CU_TRUE;
52d722e3fbSopenharmony_ci}
53d722e3fbSopenharmony_ci
54d722e3fbSopenharmony_ciint suite_syncobj_timeline_tests_init(void)
55d722e3fbSopenharmony_ci{
56d722e3fbSopenharmony_ci	int r;
57d722e3fbSopenharmony_ci
58d722e3fbSopenharmony_ci	r = amdgpu_device_initialize(drm_amdgpu[0], &major_version,
59d722e3fbSopenharmony_ci				   &minor_version, &device_handle);
60d722e3fbSopenharmony_ci
61d722e3fbSopenharmony_ci	if (r) {
62d722e3fbSopenharmony_ci		if ((r == -EACCES) && (errno == EACCES))
63d722e3fbSopenharmony_ci			printf("\n\nError:%s. "
64d722e3fbSopenharmony_ci				"Hint:Try to run this test program as root.",
65d722e3fbSopenharmony_ci				strerror(errno));
66d722e3fbSopenharmony_ci		return CUE_SINIT_FAILED;
67d722e3fbSopenharmony_ci	}
68d722e3fbSopenharmony_ci
69d722e3fbSopenharmony_ci	return CUE_SUCCESS;
70d722e3fbSopenharmony_ci}
71d722e3fbSopenharmony_ci
72d722e3fbSopenharmony_ciint suite_syncobj_timeline_tests_clean(void)
73d722e3fbSopenharmony_ci{
74d722e3fbSopenharmony_ci	int r = amdgpu_device_deinitialize(device_handle);
75d722e3fbSopenharmony_ci
76d722e3fbSopenharmony_ci	if (r == 0)
77d722e3fbSopenharmony_ci		return CUE_SUCCESS;
78d722e3fbSopenharmony_ci	else
79d722e3fbSopenharmony_ci		return CUE_SCLEAN_FAILED;
80d722e3fbSopenharmony_ci}
81d722e3fbSopenharmony_ci
82d722e3fbSopenharmony_ci
83d722e3fbSopenharmony_ciCU_TestInfo syncobj_timeline_tests[] = {
84d722e3fbSopenharmony_ci	{ "syncobj timeline test",  amdgpu_syncobj_timeline_test },
85d722e3fbSopenharmony_ci	CU_TEST_INFO_NULL,
86d722e3fbSopenharmony_ci};
87d722e3fbSopenharmony_ci
88d722e3fbSopenharmony_ci#define GFX_COMPUTE_NOP  0xffff1000
89d722e3fbSopenharmony_ci#define SDMA_NOP  0x0
90d722e3fbSopenharmony_cistatic int syncobj_command_submission_helper(uint32_t syncobj_handle, bool
91d722e3fbSopenharmony_ci					     wait_or_signal, uint64_t point)
92d722e3fbSopenharmony_ci{
93d722e3fbSopenharmony_ci	amdgpu_context_handle context_handle;
94d722e3fbSopenharmony_ci	amdgpu_bo_handle ib_result_handle;
95d722e3fbSopenharmony_ci	void *ib_result_cpu;
96d722e3fbSopenharmony_ci	uint64_t ib_result_mc_address;
97d722e3fbSopenharmony_ci	struct drm_amdgpu_cs_chunk chunks[2];
98d722e3fbSopenharmony_ci	struct drm_amdgpu_cs_chunk_data chunk_data;
99d722e3fbSopenharmony_ci	struct drm_amdgpu_cs_chunk_syncobj syncobj_data;
100d722e3fbSopenharmony_ci	struct amdgpu_cs_fence fence_status;
101d722e3fbSopenharmony_ci	amdgpu_bo_list_handle bo_list;
102d722e3fbSopenharmony_ci	amdgpu_va_handle va_handle;
103d722e3fbSopenharmony_ci	uint32_t expired;
104d722e3fbSopenharmony_ci	int i, r;
105d722e3fbSopenharmony_ci	uint64_t seq_no;
106d722e3fbSopenharmony_ci	static uint32_t *ptr;
107d722e3fbSopenharmony_ci	struct amdgpu_gpu_info gpu_info = {0};
108d722e3fbSopenharmony_ci	unsigned gc_ip_type;
109d722e3fbSopenharmony_ci
110d722e3fbSopenharmony_ci	r = amdgpu_query_gpu_info(device_handle, &gpu_info);
111d722e3fbSopenharmony_ci	CU_ASSERT_EQUAL(r, 0);
112d722e3fbSopenharmony_ci
113d722e3fbSopenharmony_ci	family_id = device_handle->info.family_id;
114d722e3fbSopenharmony_ci	chip_id = device_handle->info.chip_external_rev;
115d722e3fbSopenharmony_ci	chip_rev = device_handle->info.chip_rev;
116d722e3fbSopenharmony_ci
117d722e3fbSopenharmony_ci	gc_ip_type = (asic_is_gfx_pipe_removed(family_id, chip_id, chip_rev)) ?
118d722e3fbSopenharmony_ci			AMDGPU_HW_IP_COMPUTE : AMDGPU_HW_IP_GFX;
119d722e3fbSopenharmony_ci
120d722e3fbSopenharmony_ci	r = amdgpu_cs_ctx_create(device_handle, &context_handle);
121d722e3fbSopenharmony_ci	CU_ASSERT_EQUAL(r, 0);
122d722e3fbSopenharmony_ci
123d722e3fbSopenharmony_ci	r = amdgpu_bo_alloc_and_map(device_handle, 4096, 4096,
124d722e3fbSopenharmony_ci				    AMDGPU_GEM_DOMAIN_GTT, 0,
125d722e3fbSopenharmony_ci				    &ib_result_handle, &ib_result_cpu,
126d722e3fbSopenharmony_ci				    &ib_result_mc_address, &va_handle);
127d722e3fbSopenharmony_ci	CU_ASSERT_EQUAL(r, 0);
128d722e3fbSopenharmony_ci
129d722e3fbSopenharmony_ci	r = amdgpu_get_bo_list(device_handle, ib_result_handle, NULL,
130d722e3fbSopenharmony_ci			       &bo_list);
131d722e3fbSopenharmony_ci	CU_ASSERT_EQUAL(r, 0);
132d722e3fbSopenharmony_ci
133d722e3fbSopenharmony_ci	ptr = ib_result_cpu;
134d722e3fbSopenharmony_ci
135d722e3fbSopenharmony_ci	for (i = 0; i < 16; ++i)
136d722e3fbSopenharmony_ci		ptr[i] = wait_or_signal ? GFX_COMPUTE_NOP: SDMA_NOP;
137d722e3fbSopenharmony_ci
138d722e3fbSopenharmony_ci	chunks[0].chunk_id = AMDGPU_CHUNK_ID_IB;
139d722e3fbSopenharmony_ci	chunks[0].length_dw = sizeof(struct drm_amdgpu_cs_chunk_ib) / 4;
140d722e3fbSopenharmony_ci	chunks[0].chunk_data = (uint64_t)(uintptr_t)&chunk_data;
141d722e3fbSopenharmony_ci	chunk_data.ib_data._pad = 0;
142d722e3fbSopenharmony_ci	chunk_data.ib_data.va_start = ib_result_mc_address;
143d722e3fbSopenharmony_ci	chunk_data.ib_data.ib_bytes = 16 * 4;
144d722e3fbSopenharmony_ci	chunk_data.ib_data.ip_type = wait_or_signal ? gc_ip_type :
145d722e3fbSopenharmony_ci		AMDGPU_HW_IP_DMA;
146d722e3fbSopenharmony_ci	chunk_data.ib_data.ip_instance = 0;
147d722e3fbSopenharmony_ci	chunk_data.ib_data.ring = 0;
148d722e3fbSopenharmony_ci	chunk_data.ib_data.flags = AMDGPU_IB_FLAG_EMIT_MEM_SYNC;
149d722e3fbSopenharmony_ci
150d722e3fbSopenharmony_ci	chunks[1].chunk_id = wait_or_signal ?
151d722e3fbSopenharmony_ci		AMDGPU_CHUNK_ID_SYNCOBJ_TIMELINE_WAIT :
152d722e3fbSopenharmony_ci		AMDGPU_CHUNK_ID_SYNCOBJ_TIMELINE_SIGNAL;
153d722e3fbSopenharmony_ci	chunks[1].length_dw = sizeof(struct drm_amdgpu_cs_chunk_syncobj) / 4;
154d722e3fbSopenharmony_ci	chunks[1].chunk_data = (uint64_t)(uintptr_t)&syncobj_data;
155d722e3fbSopenharmony_ci	syncobj_data.handle = syncobj_handle;
156d722e3fbSopenharmony_ci	syncobj_data.point = point;
157d722e3fbSopenharmony_ci	syncobj_data.flags = DRM_SYNCOBJ_WAIT_FLAGS_WAIT_FOR_SUBMIT;
158d722e3fbSopenharmony_ci
159d722e3fbSopenharmony_ci	r = amdgpu_cs_submit_raw(device_handle,
160d722e3fbSopenharmony_ci				 context_handle,
161d722e3fbSopenharmony_ci				 bo_list,
162d722e3fbSopenharmony_ci				 2,
163d722e3fbSopenharmony_ci				 chunks,
164d722e3fbSopenharmony_ci				 &seq_no);
165d722e3fbSopenharmony_ci	CU_ASSERT_EQUAL(r, 0);
166d722e3fbSopenharmony_ci
167d722e3fbSopenharmony_ci
168d722e3fbSopenharmony_ci	memset(&fence_status, 0, sizeof(struct amdgpu_cs_fence));
169d722e3fbSopenharmony_ci	fence_status.context = context_handle;
170d722e3fbSopenharmony_ci	fence_status.ip_type = wait_or_signal ? gc_ip_type :
171d722e3fbSopenharmony_ci		AMDGPU_HW_IP_DMA;
172d722e3fbSopenharmony_ci	fence_status.ip_instance = 0;
173d722e3fbSopenharmony_ci	fence_status.ring = 0;
174d722e3fbSopenharmony_ci	fence_status.fence = seq_no;
175d722e3fbSopenharmony_ci
176d722e3fbSopenharmony_ci	r = amdgpu_cs_query_fence_status(&fence_status,
177d722e3fbSopenharmony_ci			AMDGPU_TIMEOUT_INFINITE,0, &expired);
178d722e3fbSopenharmony_ci	CU_ASSERT_EQUAL(r, 0);
179d722e3fbSopenharmony_ci
180d722e3fbSopenharmony_ci	r = amdgpu_bo_list_destroy(bo_list);
181d722e3fbSopenharmony_ci	CU_ASSERT_EQUAL(r, 0);
182d722e3fbSopenharmony_ci
183d722e3fbSopenharmony_ci	r = amdgpu_bo_unmap_and_free(ib_result_handle, va_handle,
184d722e3fbSopenharmony_ci				     ib_result_mc_address, 4096);
185d722e3fbSopenharmony_ci	CU_ASSERT_EQUAL(r, 0);
186d722e3fbSopenharmony_ci
187d722e3fbSopenharmony_ci	r = amdgpu_cs_ctx_free(context_handle);
188d722e3fbSopenharmony_ci	CU_ASSERT_EQUAL(r, 0);
189d722e3fbSopenharmony_ci
190d722e3fbSopenharmony_ci	return r;
191d722e3fbSopenharmony_ci}
192d722e3fbSopenharmony_ci
193d722e3fbSopenharmony_cistruct syncobj_point {
194d722e3fbSopenharmony_ci	uint32_t syncobj_handle;
195d722e3fbSopenharmony_ci	uint64_t point;
196d722e3fbSopenharmony_ci};
197d722e3fbSopenharmony_ci
198d722e3fbSopenharmony_cistatic void *syncobj_wait(void *data)
199d722e3fbSopenharmony_ci{
200d722e3fbSopenharmony_ci	struct syncobj_point *sp = (struct syncobj_point *)data;
201d722e3fbSopenharmony_ci	int r;
202d722e3fbSopenharmony_ci
203d722e3fbSopenharmony_ci	r = syncobj_command_submission_helper(sp->syncobj_handle, true,
204d722e3fbSopenharmony_ci					      sp->point);
205d722e3fbSopenharmony_ci	CU_ASSERT_EQUAL(r, 0);
206d722e3fbSopenharmony_ci
207d722e3fbSopenharmony_ci	return (void *)(long)r;
208d722e3fbSopenharmony_ci}
209d722e3fbSopenharmony_ci
210d722e3fbSopenharmony_cistatic void *syncobj_signal(void *data)
211d722e3fbSopenharmony_ci{
212d722e3fbSopenharmony_ci	struct syncobj_point *sp = (struct syncobj_point *)data;
213d722e3fbSopenharmony_ci	int r;
214d722e3fbSopenharmony_ci
215d722e3fbSopenharmony_ci	r = syncobj_command_submission_helper(sp->syncobj_handle, false,
216d722e3fbSopenharmony_ci					      sp->point);
217d722e3fbSopenharmony_ci	CU_ASSERT_EQUAL(r, 0);
218d722e3fbSopenharmony_ci
219d722e3fbSopenharmony_ci	return (void *)(long)r;
220d722e3fbSopenharmony_ci}
221d722e3fbSopenharmony_ci
222d722e3fbSopenharmony_cistatic void amdgpu_syncobj_timeline_test(void)
223d722e3fbSopenharmony_ci{
224d722e3fbSopenharmony_ci	static pthread_t wait_thread;
225d722e3fbSopenharmony_ci	static pthread_t signal_thread;
226d722e3fbSopenharmony_ci	static pthread_t c_thread;
227d722e3fbSopenharmony_ci	struct syncobj_point sp1, sp2, sp3;
228d722e3fbSopenharmony_ci	uint32_t syncobj_handle;
229d722e3fbSopenharmony_ci	uint64_t payload;
230d722e3fbSopenharmony_ci	uint64_t wait_point, signal_point;
231d722e3fbSopenharmony_ci	uint64_t timeout;
232d722e3fbSopenharmony_ci	struct timespec tp;
233d722e3fbSopenharmony_ci	int r, sync_fd;
234d722e3fbSopenharmony_ci	void *tmp;
235d722e3fbSopenharmony_ci
236d722e3fbSopenharmony_ci	r =  amdgpu_cs_create_syncobj2(device_handle, 0, &syncobj_handle);
237d722e3fbSopenharmony_ci	CU_ASSERT_EQUAL(r, 0);
238d722e3fbSopenharmony_ci
239d722e3fbSopenharmony_ci	// wait on point 5
240d722e3fbSopenharmony_ci	sp1.syncobj_handle = syncobj_handle;
241d722e3fbSopenharmony_ci	sp1.point = 5;
242d722e3fbSopenharmony_ci	r = pthread_create(&wait_thread, NULL, syncobj_wait, &sp1);
243d722e3fbSopenharmony_ci	CU_ASSERT_EQUAL(r, 0);
244d722e3fbSopenharmony_ci
245d722e3fbSopenharmony_ci	// signal on point 10
246d722e3fbSopenharmony_ci	sp2.syncobj_handle = syncobj_handle;
247d722e3fbSopenharmony_ci	sp2.point = 10;
248d722e3fbSopenharmony_ci	r = pthread_create(&signal_thread, NULL, syncobj_signal, &sp2);
249d722e3fbSopenharmony_ci	CU_ASSERT_EQUAL(r, 0);
250d722e3fbSopenharmony_ci
251d722e3fbSopenharmony_ci	r = pthread_join(wait_thread, &tmp);
252d722e3fbSopenharmony_ci	CU_ASSERT_EQUAL(r, 0);
253d722e3fbSopenharmony_ci	CU_ASSERT_EQUAL(tmp, 0);
254d722e3fbSopenharmony_ci
255d722e3fbSopenharmony_ci	r = pthread_join(signal_thread, &tmp);
256d722e3fbSopenharmony_ci	CU_ASSERT_EQUAL(r, 0);
257d722e3fbSopenharmony_ci	CU_ASSERT_EQUAL(tmp, 0);
258d722e3fbSopenharmony_ci
259d722e3fbSopenharmony_ci	//query timeline payload
260d722e3fbSopenharmony_ci	r = amdgpu_cs_syncobj_query(device_handle, &syncobj_handle,
261d722e3fbSopenharmony_ci				    &payload, 1);
262d722e3fbSopenharmony_ci	CU_ASSERT_EQUAL(r, 0);
263d722e3fbSopenharmony_ci	CU_ASSERT_EQUAL(payload, 10);
264d722e3fbSopenharmony_ci
265d722e3fbSopenharmony_ci	//signal on point 16
266d722e3fbSopenharmony_ci	sp3.syncobj_handle = syncobj_handle;
267d722e3fbSopenharmony_ci	sp3.point = 16;
268d722e3fbSopenharmony_ci	r = pthread_create(&c_thread, NULL, syncobj_signal, &sp3);
269d722e3fbSopenharmony_ci	CU_ASSERT_EQUAL(r, 0);
270d722e3fbSopenharmony_ci	//CPU wait on point 16
271d722e3fbSopenharmony_ci	wait_point = 16;
272d722e3fbSopenharmony_ci	timeout = 0;
273d722e3fbSopenharmony_ci	clock_gettime(CLOCK_MONOTONIC, &tp);
274d722e3fbSopenharmony_ci	timeout = tp.tv_sec * 1000000000ULL + tp.tv_nsec;
275d722e3fbSopenharmony_ci	timeout += 0x10000000000; //10s
276d722e3fbSopenharmony_ci	r = amdgpu_cs_syncobj_timeline_wait(device_handle, &syncobj_handle,
277d722e3fbSopenharmony_ci					    &wait_point, 1, timeout,
278d722e3fbSopenharmony_ci					    DRM_SYNCOBJ_WAIT_FLAGS_WAIT_ALL |
279d722e3fbSopenharmony_ci					    DRM_SYNCOBJ_WAIT_FLAGS_WAIT_FOR_SUBMIT,
280d722e3fbSopenharmony_ci					    NULL);
281d722e3fbSopenharmony_ci
282d722e3fbSopenharmony_ci	CU_ASSERT_EQUAL(r, 0);
283d722e3fbSopenharmony_ci	r = pthread_join(c_thread, &tmp);
284d722e3fbSopenharmony_ci	CU_ASSERT_EQUAL(r, 0);
285d722e3fbSopenharmony_ci	CU_ASSERT_EQUAL(tmp, 0);
286d722e3fbSopenharmony_ci
287d722e3fbSopenharmony_ci	// export point 16 and import to point 18
288d722e3fbSopenharmony_ci	r = amdgpu_cs_syncobj_export_sync_file2(device_handle, syncobj_handle,
289d722e3fbSopenharmony_ci						16,
290d722e3fbSopenharmony_ci						DRM_SYNCOBJ_WAIT_FLAGS_WAIT_FOR_SUBMIT,
291d722e3fbSopenharmony_ci						&sync_fd);
292d722e3fbSopenharmony_ci	CU_ASSERT_EQUAL(r, 0);
293d722e3fbSopenharmony_ci	r = amdgpu_cs_syncobj_import_sync_file2(device_handle, syncobj_handle,
294d722e3fbSopenharmony_ci						18, sync_fd);
295d722e3fbSopenharmony_ci	CU_ASSERT_EQUAL(r, 0);
296d722e3fbSopenharmony_ci	r = amdgpu_cs_syncobj_query(device_handle, &syncobj_handle,
297d722e3fbSopenharmony_ci				    &payload, 1);
298d722e3fbSopenharmony_ci	CU_ASSERT_EQUAL(r, 0);
299d722e3fbSopenharmony_ci	CU_ASSERT_EQUAL(payload, 18);
300d722e3fbSopenharmony_ci
301d722e3fbSopenharmony_ci	// CPU signal on point 20
302d722e3fbSopenharmony_ci	signal_point = 20;
303d722e3fbSopenharmony_ci	r = amdgpu_cs_syncobj_timeline_signal(device_handle, &syncobj_handle,
304d722e3fbSopenharmony_ci					      &signal_point, 1);
305d722e3fbSopenharmony_ci	CU_ASSERT_EQUAL(r, 0);
306d722e3fbSopenharmony_ci	r = amdgpu_cs_syncobj_query(device_handle, &syncobj_handle,
307d722e3fbSopenharmony_ci				    &payload, 1);
308d722e3fbSopenharmony_ci	CU_ASSERT_EQUAL(r, 0);
309d722e3fbSopenharmony_ci	CU_ASSERT_EQUAL(payload, 20);
310d722e3fbSopenharmony_ci
311d722e3fbSopenharmony_ci	r = amdgpu_cs_destroy_syncobj(device_handle, syncobj_handle);
312d722e3fbSopenharmony_ci	CU_ASSERT_EQUAL(r, 0);
313d722e3fbSopenharmony_ci
314d722e3fbSopenharmony_ci}
315