1d722e3fbSopenharmony_ci/* 2d722e3fbSopenharmony_ci * Copyright 2017 Advanced Micro Devices, Inc. 3d722e3fbSopenharmony_ci * 4d722e3fbSopenharmony_ci * Permission is hereby granted, free of charge, to any person obtaining a 5d722e3fbSopenharmony_ci * copy of this software and associated documentation files (the "Software"), 6d722e3fbSopenharmony_ci * to deal in the Software without restriction, including without limitation 7d722e3fbSopenharmony_ci * the rights to use, copy, modify, merge, publish, distribute, sublicense, 8d722e3fbSopenharmony_ci * and/or sell copies of the Software, and to permit persons to whom the 9d722e3fbSopenharmony_ci * Software is furnished to do so, subject to the following conditions: 10d722e3fbSopenharmony_ci * 11d722e3fbSopenharmony_ci * The above copyright notice and this permission notice shall be included in 12d722e3fbSopenharmony_ci * all copies or substantial portions of the Software. 13d722e3fbSopenharmony_ci * 14d722e3fbSopenharmony_ci * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR 15d722e3fbSopenharmony_ci * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY, 16d722e3fbSopenharmony_ci * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL 17d722e3fbSopenharmony_ci * THE COPYRIGHT HOLDER(S) OR AUTHOR(S) BE LIABLE FOR ANY CLAIM, DAMAGES OR 18d722e3fbSopenharmony_ci * OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, 19d722e3fbSopenharmony_ci * ARISING FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR 20d722e3fbSopenharmony_ci * OTHER DEALINGS IN THE SOFTWARE. 21d722e3fbSopenharmony_ci * 22d722e3fbSopenharmony_ci*/ 23d722e3fbSopenharmony_ci 24d722e3fbSopenharmony_ci#include "CUnit/Basic.h" 25d722e3fbSopenharmony_ci#include "xf86drm.h" 26d722e3fbSopenharmony_ci 27d722e3fbSopenharmony_ci#include "amdgpu_test.h" 28d722e3fbSopenharmony_ci#include "amdgpu_drm.h" 29d722e3fbSopenharmony_ci#include "amdgpu_internal.h" 30d722e3fbSopenharmony_ci#include <pthread.h> 31d722e3fbSopenharmony_ci 32d722e3fbSopenharmony_cistatic amdgpu_device_handle device_handle; 33d722e3fbSopenharmony_cistatic uint32_t major_version; 34d722e3fbSopenharmony_cistatic uint32_t minor_version; 35d722e3fbSopenharmony_ci 36d722e3fbSopenharmony_cistatic uint32_t family_id; 37d722e3fbSopenharmony_cistatic uint32_t chip_id; 38d722e3fbSopenharmony_cistatic uint32_t chip_rev; 39d722e3fbSopenharmony_ci 40d722e3fbSopenharmony_cistatic void amdgpu_syncobj_timeline_test(void); 41d722e3fbSopenharmony_ci 42d722e3fbSopenharmony_ciCU_BOOL suite_syncobj_timeline_tests_enable(void) 43d722e3fbSopenharmony_ci{ 44d722e3fbSopenharmony_ci int r; 45d722e3fbSopenharmony_ci uint64_t cap = 0; 46d722e3fbSopenharmony_ci 47d722e3fbSopenharmony_ci r = drmGetCap(drm_amdgpu[0], DRM_CAP_SYNCOBJ_TIMELINE, &cap); 48d722e3fbSopenharmony_ci if (r || cap == 0) 49d722e3fbSopenharmony_ci return CU_FALSE; 50d722e3fbSopenharmony_ci 51d722e3fbSopenharmony_ci return CU_TRUE; 52d722e3fbSopenharmony_ci} 53d722e3fbSopenharmony_ci 54d722e3fbSopenharmony_ciint suite_syncobj_timeline_tests_init(void) 55d722e3fbSopenharmony_ci{ 56d722e3fbSopenharmony_ci int r; 57d722e3fbSopenharmony_ci 58d722e3fbSopenharmony_ci r = amdgpu_device_initialize(drm_amdgpu[0], &major_version, 59d722e3fbSopenharmony_ci &minor_version, &device_handle); 60d722e3fbSopenharmony_ci 61d722e3fbSopenharmony_ci if (r) { 62d722e3fbSopenharmony_ci if ((r == -EACCES) && (errno == EACCES)) 63d722e3fbSopenharmony_ci printf("\n\nError:%s. " 64d722e3fbSopenharmony_ci "Hint:Try to run this test program as root.", 65d722e3fbSopenharmony_ci strerror(errno)); 66d722e3fbSopenharmony_ci return CUE_SINIT_FAILED; 67d722e3fbSopenharmony_ci } 68d722e3fbSopenharmony_ci 69d722e3fbSopenharmony_ci return CUE_SUCCESS; 70d722e3fbSopenharmony_ci} 71d722e3fbSopenharmony_ci 72d722e3fbSopenharmony_ciint suite_syncobj_timeline_tests_clean(void) 73d722e3fbSopenharmony_ci{ 74d722e3fbSopenharmony_ci int r = amdgpu_device_deinitialize(device_handle); 75d722e3fbSopenharmony_ci 76d722e3fbSopenharmony_ci if (r == 0) 77d722e3fbSopenharmony_ci return CUE_SUCCESS; 78d722e3fbSopenharmony_ci else 79d722e3fbSopenharmony_ci return CUE_SCLEAN_FAILED; 80d722e3fbSopenharmony_ci} 81d722e3fbSopenharmony_ci 82d722e3fbSopenharmony_ci 83d722e3fbSopenharmony_ciCU_TestInfo syncobj_timeline_tests[] = { 84d722e3fbSopenharmony_ci { "syncobj timeline test", amdgpu_syncobj_timeline_test }, 85d722e3fbSopenharmony_ci CU_TEST_INFO_NULL, 86d722e3fbSopenharmony_ci}; 87d722e3fbSopenharmony_ci 88d722e3fbSopenharmony_ci#define GFX_COMPUTE_NOP 0xffff1000 89d722e3fbSopenharmony_ci#define SDMA_NOP 0x0 90d722e3fbSopenharmony_cistatic int syncobj_command_submission_helper(uint32_t syncobj_handle, bool 91d722e3fbSopenharmony_ci wait_or_signal, uint64_t point) 92d722e3fbSopenharmony_ci{ 93d722e3fbSopenharmony_ci amdgpu_context_handle context_handle; 94d722e3fbSopenharmony_ci amdgpu_bo_handle ib_result_handle; 95d722e3fbSopenharmony_ci void *ib_result_cpu; 96d722e3fbSopenharmony_ci uint64_t ib_result_mc_address; 97d722e3fbSopenharmony_ci struct drm_amdgpu_cs_chunk chunks[2]; 98d722e3fbSopenharmony_ci struct drm_amdgpu_cs_chunk_data chunk_data; 99d722e3fbSopenharmony_ci struct drm_amdgpu_cs_chunk_syncobj syncobj_data; 100d722e3fbSopenharmony_ci struct amdgpu_cs_fence fence_status; 101d722e3fbSopenharmony_ci amdgpu_bo_list_handle bo_list; 102d722e3fbSopenharmony_ci amdgpu_va_handle va_handle; 103d722e3fbSopenharmony_ci uint32_t expired; 104d722e3fbSopenharmony_ci int i, r; 105d722e3fbSopenharmony_ci uint64_t seq_no; 106d722e3fbSopenharmony_ci static uint32_t *ptr; 107d722e3fbSopenharmony_ci struct amdgpu_gpu_info gpu_info = {0}; 108d722e3fbSopenharmony_ci unsigned gc_ip_type; 109d722e3fbSopenharmony_ci 110d722e3fbSopenharmony_ci r = amdgpu_query_gpu_info(device_handle, &gpu_info); 111d722e3fbSopenharmony_ci CU_ASSERT_EQUAL(r, 0); 112d722e3fbSopenharmony_ci 113d722e3fbSopenharmony_ci family_id = device_handle->info.family_id; 114d722e3fbSopenharmony_ci chip_id = device_handle->info.chip_external_rev; 115d722e3fbSopenharmony_ci chip_rev = device_handle->info.chip_rev; 116d722e3fbSopenharmony_ci 117d722e3fbSopenharmony_ci gc_ip_type = (asic_is_gfx_pipe_removed(family_id, chip_id, chip_rev)) ? 118d722e3fbSopenharmony_ci AMDGPU_HW_IP_COMPUTE : AMDGPU_HW_IP_GFX; 119d722e3fbSopenharmony_ci 120d722e3fbSopenharmony_ci r = amdgpu_cs_ctx_create(device_handle, &context_handle); 121d722e3fbSopenharmony_ci CU_ASSERT_EQUAL(r, 0); 122d722e3fbSopenharmony_ci 123d722e3fbSopenharmony_ci r = amdgpu_bo_alloc_and_map(device_handle, 4096, 4096, 124d722e3fbSopenharmony_ci AMDGPU_GEM_DOMAIN_GTT, 0, 125d722e3fbSopenharmony_ci &ib_result_handle, &ib_result_cpu, 126d722e3fbSopenharmony_ci &ib_result_mc_address, &va_handle); 127d722e3fbSopenharmony_ci CU_ASSERT_EQUAL(r, 0); 128d722e3fbSopenharmony_ci 129d722e3fbSopenharmony_ci r = amdgpu_get_bo_list(device_handle, ib_result_handle, NULL, 130d722e3fbSopenharmony_ci &bo_list); 131d722e3fbSopenharmony_ci CU_ASSERT_EQUAL(r, 0); 132d722e3fbSopenharmony_ci 133d722e3fbSopenharmony_ci ptr = ib_result_cpu; 134d722e3fbSopenharmony_ci 135d722e3fbSopenharmony_ci for (i = 0; i < 16; ++i) 136d722e3fbSopenharmony_ci ptr[i] = wait_or_signal ? GFX_COMPUTE_NOP: SDMA_NOP; 137d722e3fbSopenharmony_ci 138d722e3fbSopenharmony_ci chunks[0].chunk_id = AMDGPU_CHUNK_ID_IB; 139d722e3fbSopenharmony_ci chunks[0].length_dw = sizeof(struct drm_amdgpu_cs_chunk_ib) / 4; 140d722e3fbSopenharmony_ci chunks[0].chunk_data = (uint64_t)(uintptr_t)&chunk_data; 141d722e3fbSopenharmony_ci chunk_data.ib_data._pad = 0; 142d722e3fbSopenharmony_ci chunk_data.ib_data.va_start = ib_result_mc_address; 143d722e3fbSopenharmony_ci chunk_data.ib_data.ib_bytes = 16 * 4; 144d722e3fbSopenharmony_ci chunk_data.ib_data.ip_type = wait_or_signal ? gc_ip_type : 145d722e3fbSopenharmony_ci AMDGPU_HW_IP_DMA; 146d722e3fbSopenharmony_ci chunk_data.ib_data.ip_instance = 0; 147d722e3fbSopenharmony_ci chunk_data.ib_data.ring = 0; 148d722e3fbSopenharmony_ci chunk_data.ib_data.flags = AMDGPU_IB_FLAG_EMIT_MEM_SYNC; 149d722e3fbSopenharmony_ci 150d722e3fbSopenharmony_ci chunks[1].chunk_id = wait_or_signal ? 151d722e3fbSopenharmony_ci AMDGPU_CHUNK_ID_SYNCOBJ_TIMELINE_WAIT : 152d722e3fbSopenharmony_ci AMDGPU_CHUNK_ID_SYNCOBJ_TIMELINE_SIGNAL; 153d722e3fbSopenharmony_ci chunks[1].length_dw = sizeof(struct drm_amdgpu_cs_chunk_syncobj) / 4; 154d722e3fbSopenharmony_ci chunks[1].chunk_data = (uint64_t)(uintptr_t)&syncobj_data; 155d722e3fbSopenharmony_ci syncobj_data.handle = syncobj_handle; 156d722e3fbSopenharmony_ci syncobj_data.point = point; 157d722e3fbSopenharmony_ci syncobj_data.flags = DRM_SYNCOBJ_WAIT_FLAGS_WAIT_FOR_SUBMIT; 158d722e3fbSopenharmony_ci 159d722e3fbSopenharmony_ci r = amdgpu_cs_submit_raw(device_handle, 160d722e3fbSopenharmony_ci context_handle, 161d722e3fbSopenharmony_ci bo_list, 162d722e3fbSopenharmony_ci 2, 163d722e3fbSopenharmony_ci chunks, 164d722e3fbSopenharmony_ci &seq_no); 165d722e3fbSopenharmony_ci CU_ASSERT_EQUAL(r, 0); 166d722e3fbSopenharmony_ci 167d722e3fbSopenharmony_ci 168d722e3fbSopenharmony_ci memset(&fence_status, 0, sizeof(struct amdgpu_cs_fence)); 169d722e3fbSopenharmony_ci fence_status.context = context_handle; 170d722e3fbSopenharmony_ci fence_status.ip_type = wait_or_signal ? gc_ip_type : 171d722e3fbSopenharmony_ci AMDGPU_HW_IP_DMA; 172d722e3fbSopenharmony_ci fence_status.ip_instance = 0; 173d722e3fbSopenharmony_ci fence_status.ring = 0; 174d722e3fbSopenharmony_ci fence_status.fence = seq_no; 175d722e3fbSopenharmony_ci 176d722e3fbSopenharmony_ci r = amdgpu_cs_query_fence_status(&fence_status, 177d722e3fbSopenharmony_ci AMDGPU_TIMEOUT_INFINITE,0, &expired); 178d722e3fbSopenharmony_ci CU_ASSERT_EQUAL(r, 0); 179d722e3fbSopenharmony_ci 180d722e3fbSopenharmony_ci r = amdgpu_bo_list_destroy(bo_list); 181d722e3fbSopenharmony_ci CU_ASSERT_EQUAL(r, 0); 182d722e3fbSopenharmony_ci 183d722e3fbSopenharmony_ci r = amdgpu_bo_unmap_and_free(ib_result_handle, va_handle, 184d722e3fbSopenharmony_ci ib_result_mc_address, 4096); 185d722e3fbSopenharmony_ci CU_ASSERT_EQUAL(r, 0); 186d722e3fbSopenharmony_ci 187d722e3fbSopenharmony_ci r = amdgpu_cs_ctx_free(context_handle); 188d722e3fbSopenharmony_ci CU_ASSERT_EQUAL(r, 0); 189d722e3fbSopenharmony_ci 190d722e3fbSopenharmony_ci return r; 191d722e3fbSopenharmony_ci} 192d722e3fbSopenharmony_ci 193d722e3fbSopenharmony_cistruct syncobj_point { 194d722e3fbSopenharmony_ci uint32_t syncobj_handle; 195d722e3fbSopenharmony_ci uint64_t point; 196d722e3fbSopenharmony_ci}; 197d722e3fbSopenharmony_ci 198d722e3fbSopenharmony_cistatic void *syncobj_wait(void *data) 199d722e3fbSopenharmony_ci{ 200d722e3fbSopenharmony_ci struct syncobj_point *sp = (struct syncobj_point *)data; 201d722e3fbSopenharmony_ci int r; 202d722e3fbSopenharmony_ci 203d722e3fbSopenharmony_ci r = syncobj_command_submission_helper(sp->syncobj_handle, true, 204d722e3fbSopenharmony_ci sp->point); 205d722e3fbSopenharmony_ci CU_ASSERT_EQUAL(r, 0); 206d722e3fbSopenharmony_ci 207d722e3fbSopenharmony_ci return (void *)(long)r; 208d722e3fbSopenharmony_ci} 209d722e3fbSopenharmony_ci 210d722e3fbSopenharmony_cistatic void *syncobj_signal(void *data) 211d722e3fbSopenharmony_ci{ 212d722e3fbSopenharmony_ci struct syncobj_point *sp = (struct syncobj_point *)data; 213d722e3fbSopenharmony_ci int r; 214d722e3fbSopenharmony_ci 215d722e3fbSopenharmony_ci r = syncobj_command_submission_helper(sp->syncobj_handle, false, 216d722e3fbSopenharmony_ci sp->point); 217d722e3fbSopenharmony_ci CU_ASSERT_EQUAL(r, 0); 218d722e3fbSopenharmony_ci 219d722e3fbSopenharmony_ci return (void *)(long)r; 220d722e3fbSopenharmony_ci} 221d722e3fbSopenharmony_ci 222d722e3fbSopenharmony_cistatic void amdgpu_syncobj_timeline_test(void) 223d722e3fbSopenharmony_ci{ 224d722e3fbSopenharmony_ci static pthread_t wait_thread; 225d722e3fbSopenharmony_ci static pthread_t signal_thread; 226d722e3fbSopenharmony_ci static pthread_t c_thread; 227d722e3fbSopenharmony_ci struct syncobj_point sp1, sp2, sp3; 228d722e3fbSopenharmony_ci uint32_t syncobj_handle; 229d722e3fbSopenharmony_ci uint64_t payload; 230d722e3fbSopenharmony_ci uint64_t wait_point, signal_point; 231d722e3fbSopenharmony_ci uint64_t timeout; 232d722e3fbSopenharmony_ci struct timespec tp; 233d722e3fbSopenharmony_ci int r, sync_fd; 234d722e3fbSopenharmony_ci void *tmp; 235d722e3fbSopenharmony_ci 236d722e3fbSopenharmony_ci r = amdgpu_cs_create_syncobj2(device_handle, 0, &syncobj_handle); 237d722e3fbSopenharmony_ci CU_ASSERT_EQUAL(r, 0); 238d722e3fbSopenharmony_ci 239d722e3fbSopenharmony_ci // wait on point 5 240d722e3fbSopenharmony_ci sp1.syncobj_handle = syncobj_handle; 241d722e3fbSopenharmony_ci sp1.point = 5; 242d722e3fbSopenharmony_ci r = pthread_create(&wait_thread, NULL, syncobj_wait, &sp1); 243d722e3fbSopenharmony_ci CU_ASSERT_EQUAL(r, 0); 244d722e3fbSopenharmony_ci 245d722e3fbSopenharmony_ci // signal on point 10 246d722e3fbSopenharmony_ci sp2.syncobj_handle = syncobj_handle; 247d722e3fbSopenharmony_ci sp2.point = 10; 248d722e3fbSopenharmony_ci r = pthread_create(&signal_thread, NULL, syncobj_signal, &sp2); 249d722e3fbSopenharmony_ci CU_ASSERT_EQUAL(r, 0); 250d722e3fbSopenharmony_ci 251d722e3fbSopenharmony_ci r = pthread_join(wait_thread, &tmp); 252d722e3fbSopenharmony_ci CU_ASSERT_EQUAL(r, 0); 253d722e3fbSopenharmony_ci CU_ASSERT_EQUAL(tmp, 0); 254d722e3fbSopenharmony_ci 255d722e3fbSopenharmony_ci r = pthread_join(signal_thread, &tmp); 256d722e3fbSopenharmony_ci CU_ASSERT_EQUAL(r, 0); 257d722e3fbSopenharmony_ci CU_ASSERT_EQUAL(tmp, 0); 258d722e3fbSopenharmony_ci 259d722e3fbSopenharmony_ci //query timeline payload 260d722e3fbSopenharmony_ci r = amdgpu_cs_syncobj_query(device_handle, &syncobj_handle, 261d722e3fbSopenharmony_ci &payload, 1); 262d722e3fbSopenharmony_ci CU_ASSERT_EQUAL(r, 0); 263d722e3fbSopenharmony_ci CU_ASSERT_EQUAL(payload, 10); 264d722e3fbSopenharmony_ci 265d722e3fbSopenharmony_ci //signal on point 16 266d722e3fbSopenharmony_ci sp3.syncobj_handle = syncobj_handle; 267d722e3fbSopenharmony_ci sp3.point = 16; 268d722e3fbSopenharmony_ci r = pthread_create(&c_thread, NULL, syncobj_signal, &sp3); 269d722e3fbSopenharmony_ci CU_ASSERT_EQUAL(r, 0); 270d722e3fbSopenharmony_ci //CPU wait on point 16 271d722e3fbSopenharmony_ci wait_point = 16; 272d722e3fbSopenharmony_ci timeout = 0; 273d722e3fbSopenharmony_ci clock_gettime(CLOCK_MONOTONIC, &tp); 274d722e3fbSopenharmony_ci timeout = tp.tv_sec * 1000000000ULL + tp.tv_nsec; 275d722e3fbSopenharmony_ci timeout += 0x10000000000; //10s 276d722e3fbSopenharmony_ci r = amdgpu_cs_syncobj_timeline_wait(device_handle, &syncobj_handle, 277d722e3fbSopenharmony_ci &wait_point, 1, timeout, 278d722e3fbSopenharmony_ci DRM_SYNCOBJ_WAIT_FLAGS_WAIT_ALL | 279d722e3fbSopenharmony_ci DRM_SYNCOBJ_WAIT_FLAGS_WAIT_FOR_SUBMIT, 280d722e3fbSopenharmony_ci NULL); 281d722e3fbSopenharmony_ci 282d722e3fbSopenharmony_ci CU_ASSERT_EQUAL(r, 0); 283d722e3fbSopenharmony_ci r = pthread_join(c_thread, &tmp); 284d722e3fbSopenharmony_ci CU_ASSERT_EQUAL(r, 0); 285d722e3fbSopenharmony_ci CU_ASSERT_EQUAL(tmp, 0); 286d722e3fbSopenharmony_ci 287d722e3fbSopenharmony_ci // export point 16 and import to point 18 288d722e3fbSopenharmony_ci r = amdgpu_cs_syncobj_export_sync_file2(device_handle, syncobj_handle, 289d722e3fbSopenharmony_ci 16, 290d722e3fbSopenharmony_ci DRM_SYNCOBJ_WAIT_FLAGS_WAIT_FOR_SUBMIT, 291d722e3fbSopenharmony_ci &sync_fd); 292d722e3fbSopenharmony_ci CU_ASSERT_EQUAL(r, 0); 293d722e3fbSopenharmony_ci r = amdgpu_cs_syncobj_import_sync_file2(device_handle, syncobj_handle, 294d722e3fbSopenharmony_ci 18, sync_fd); 295d722e3fbSopenharmony_ci CU_ASSERT_EQUAL(r, 0); 296d722e3fbSopenharmony_ci r = amdgpu_cs_syncobj_query(device_handle, &syncobj_handle, 297d722e3fbSopenharmony_ci &payload, 1); 298d722e3fbSopenharmony_ci CU_ASSERT_EQUAL(r, 0); 299d722e3fbSopenharmony_ci CU_ASSERT_EQUAL(payload, 18); 300d722e3fbSopenharmony_ci 301d722e3fbSopenharmony_ci // CPU signal on point 20 302d722e3fbSopenharmony_ci signal_point = 20; 303d722e3fbSopenharmony_ci r = amdgpu_cs_syncobj_timeline_signal(device_handle, &syncobj_handle, 304d722e3fbSopenharmony_ci &signal_point, 1); 305d722e3fbSopenharmony_ci CU_ASSERT_EQUAL(r, 0); 306d722e3fbSopenharmony_ci r = amdgpu_cs_syncobj_query(device_handle, &syncobj_handle, 307d722e3fbSopenharmony_ci &payload, 1); 308d722e3fbSopenharmony_ci CU_ASSERT_EQUAL(r, 0); 309d722e3fbSopenharmony_ci CU_ASSERT_EQUAL(payload, 20); 310d722e3fbSopenharmony_ci 311d722e3fbSopenharmony_ci r = amdgpu_cs_destroy_syncobj(device_handle, syncobj_handle); 312d722e3fbSopenharmony_ci CU_ASSERT_EQUAL(r, 0); 313d722e3fbSopenharmony_ci 314d722e3fbSopenharmony_ci} 315