1d722e3fbSopenharmony_ci/* 2d722e3fbSopenharmony_ci * Copyright 2017 Advanced Micro Devices, Inc. 3d722e3fbSopenharmony_ci * 4d722e3fbSopenharmony_ci * Permission is hereby granted, free of charge, to any person obtaining a 5d722e3fbSopenharmony_ci * copy of this software and associated documentation files (the "Software"), 6d722e3fbSopenharmony_ci * to deal in the Software without restriction, including without limitation 7d722e3fbSopenharmony_ci * the rights to use, copy, modify, merge, publish, distribute, sublicense, 8d722e3fbSopenharmony_ci * and/or sell copies of the Software, and to permit persons to whom the 9d722e3fbSopenharmony_ci * Software is furnished to do so, subject to the following conditions: 10d722e3fbSopenharmony_ci * 11d722e3fbSopenharmony_ci * The above copyright notice and this permission notice shall be included in 12d722e3fbSopenharmony_ci * all copies or substantial portions of the Software. 13d722e3fbSopenharmony_ci * 14d722e3fbSopenharmony_ci * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR 15d722e3fbSopenharmony_ci * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY, 16d722e3fbSopenharmony_ci * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL 17d722e3fbSopenharmony_ci * THE COPYRIGHT HOLDER(S) OR AUTHOR(S) BE LIABLE FOR ANY CLAIM, DAMAGES OR 18d722e3fbSopenharmony_ci * OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, 19d722e3fbSopenharmony_ci * ARISING FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR 20d722e3fbSopenharmony_ci * OTHER DEALINGS IN THE SOFTWARE. 21d722e3fbSopenharmony_ci * 22d722e3fbSopenharmony_ci*/ 23d722e3fbSopenharmony_ci 24d722e3fbSopenharmony_ci#include <stdio.h> 25d722e3fbSopenharmony_ci#include <inttypes.h> 26d722e3fbSopenharmony_ci 27d722e3fbSopenharmony_ci#include "CUnit/Basic.h" 28d722e3fbSopenharmony_ci 29d722e3fbSopenharmony_ci#include "util_math.h" 30d722e3fbSopenharmony_ci 31d722e3fbSopenharmony_ci#include "amdgpu_test.h" 32d722e3fbSopenharmony_ci#include "amdgpu_drm.h" 33d722e3fbSopenharmony_ci#include "amdgpu_internal.h" 34d722e3fbSopenharmony_ci#include "frame.h" 35d722e3fbSopenharmony_ci#include "uve_ib.h" 36d722e3fbSopenharmony_ci 37d722e3fbSopenharmony_ci#define IB_SIZE 4096 38d722e3fbSopenharmony_ci#define MAX_RESOURCES 16 39d722e3fbSopenharmony_ci 40d722e3fbSopenharmony_cistruct amdgpu_uvd_enc_bo { 41d722e3fbSopenharmony_ci amdgpu_bo_handle handle; 42d722e3fbSopenharmony_ci amdgpu_va_handle va_handle; 43d722e3fbSopenharmony_ci uint64_t addr; 44d722e3fbSopenharmony_ci uint64_t size; 45d722e3fbSopenharmony_ci uint8_t *ptr; 46d722e3fbSopenharmony_ci}; 47d722e3fbSopenharmony_ci 48d722e3fbSopenharmony_cistruct amdgpu_uvd_enc { 49d722e3fbSopenharmony_ci unsigned width; 50d722e3fbSopenharmony_ci unsigned height; 51d722e3fbSopenharmony_ci struct amdgpu_uvd_enc_bo session; 52d722e3fbSopenharmony_ci struct amdgpu_uvd_enc_bo vbuf; 53d722e3fbSopenharmony_ci struct amdgpu_uvd_enc_bo bs; 54d722e3fbSopenharmony_ci struct amdgpu_uvd_enc_bo fb; 55d722e3fbSopenharmony_ci struct amdgpu_uvd_enc_bo cpb; 56d722e3fbSopenharmony_ci}; 57d722e3fbSopenharmony_ci 58d722e3fbSopenharmony_cistatic amdgpu_device_handle device_handle; 59d722e3fbSopenharmony_cistatic uint32_t major_version; 60d722e3fbSopenharmony_cistatic uint32_t minor_version; 61d722e3fbSopenharmony_cistatic uint32_t family_id; 62d722e3fbSopenharmony_ci 63d722e3fbSopenharmony_cistatic amdgpu_context_handle context_handle; 64d722e3fbSopenharmony_cistatic amdgpu_bo_handle ib_handle; 65d722e3fbSopenharmony_cistatic amdgpu_va_handle ib_va_handle; 66d722e3fbSopenharmony_cistatic uint64_t ib_mc_address; 67d722e3fbSopenharmony_cistatic uint32_t *ib_cpu; 68d722e3fbSopenharmony_ci 69d722e3fbSopenharmony_cistatic struct amdgpu_uvd_enc enc; 70d722e3fbSopenharmony_cistatic amdgpu_bo_handle resources[MAX_RESOURCES]; 71d722e3fbSopenharmony_cistatic unsigned num_resources; 72d722e3fbSopenharmony_ci 73d722e3fbSopenharmony_cistatic void amdgpu_cs_uvd_enc_create(void); 74d722e3fbSopenharmony_cistatic void amdgpu_cs_uvd_enc_session_init(void); 75d722e3fbSopenharmony_cistatic void amdgpu_cs_uvd_enc_encode(void); 76d722e3fbSopenharmony_cistatic void amdgpu_cs_uvd_enc_destroy(void); 77d722e3fbSopenharmony_ci 78d722e3fbSopenharmony_ci 79d722e3fbSopenharmony_ciCU_TestInfo uvd_enc_tests[] = { 80d722e3fbSopenharmony_ci { "UVD ENC create", amdgpu_cs_uvd_enc_create }, 81d722e3fbSopenharmony_ci { "UVD ENC session init", amdgpu_cs_uvd_enc_session_init }, 82d722e3fbSopenharmony_ci { "UVD ENC encode", amdgpu_cs_uvd_enc_encode }, 83d722e3fbSopenharmony_ci { "UVD ENC destroy", amdgpu_cs_uvd_enc_destroy }, 84d722e3fbSopenharmony_ci CU_TEST_INFO_NULL, 85d722e3fbSopenharmony_ci}; 86d722e3fbSopenharmony_ci 87d722e3fbSopenharmony_ciCU_BOOL suite_uvd_enc_tests_enable(void) 88d722e3fbSopenharmony_ci{ 89d722e3fbSopenharmony_ci int r; 90d722e3fbSopenharmony_ci struct drm_amdgpu_info_hw_ip info; 91d722e3fbSopenharmony_ci 92d722e3fbSopenharmony_ci if (amdgpu_device_initialize(drm_amdgpu[0], &major_version, 93d722e3fbSopenharmony_ci &minor_version, &device_handle)) 94d722e3fbSopenharmony_ci return CU_FALSE; 95d722e3fbSopenharmony_ci 96d722e3fbSopenharmony_ci r = amdgpu_query_hw_ip_info(device_handle, AMDGPU_HW_IP_UVD_ENC, 0, &info); 97d722e3fbSopenharmony_ci 98d722e3fbSopenharmony_ci if (amdgpu_device_deinitialize(device_handle)) 99d722e3fbSopenharmony_ci return CU_FALSE; 100d722e3fbSopenharmony_ci 101d722e3fbSopenharmony_ci if (!info.available_rings) 102d722e3fbSopenharmony_ci printf("\n\nThe ASIC NOT support UVD ENC, suite disabled.\n"); 103d722e3fbSopenharmony_ci 104d722e3fbSopenharmony_ci return (r == 0 && (info.available_rings ? CU_TRUE : CU_FALSE)); 105d722e3fbSopenharmony_ci} 106d722e3fbSopenharmony_ci 107d722e3fbSopenharmony_ci 108d722e3fbSopenharmony_ciint suite_uvd_enc_tests_init(void) 109d722e3fbSopenharmony_ci{ 110d722e3fbSopenharmony_ci int r; 111d722e3fbSopenharmony_ci 112d722e3fbSopenharmony_ci r = amdgpu_device_initialize(drm_amdgpu[0], &major_version, 113d722e3fbSopenharmony_ci &minor_version, &device_handle); 114d722e3fbSopenharmony_ci if (r) 115d722e3fbSopenharmony_ci return CUE_SINIT_FAILED; 116d722e3fbSopenharmony_ci 117d722e3fbSopenharmony_ci family_id = device_handle->info.family_id; 118d722e3fbSopenharmony_ci 119d722e3fbSopenharmony_ci r = amdgpu_cs_ctx_create(device_handle, &context_handle); 120d722e3fbSopenharmony_ci if (r) 121d722e3fbSopenharmony_ci return CUE_SINIT_FAILED; 122d722e3fbSopenharmony_ci 123d722e3fbSopenharmony_ci r = amdgpu_bo_alloc_and_map(device_handle, IB_SIZE, 4096, 124d722e3fbSopenharmony_ci AMDGPU_GEM_DOMAIN_GTT, 0, 125d722e3fbSopenharmony_ci &ib_handle, (void**)&ib_cpu, 126d722e3fbSopenharmony_ci &ib_mc_address, &ib_va_handle); 127d722e3fbSopenharmony_ci if (r) 128d722e3fbSopenharmony_ci return CUE_SINIT_FAILED; 129d722e3fbSopenharmony_ci 130d722e3fbSopenharmony_ci return CUE_SUCCESS; 131d722e3fbSopenharmony_ci} 132d722e3fbSopenharmony_ci 133d722e3fbSopenharmony_ciint suite_uvd_enc_tests_clean(void) 134d722e3fbSopenharmony_ci{ 135d722e3fbSopenharmony_ci int r; 136d722e3fbSopenharmony_ci 137d722e3fbSopenharmony_ci r = amdgpu_bo_unmap_and_free(ib_handle, ib_va_handle, 138d722e3fbSopenharmony_ci ib_mc_address, IB_SIZE); 139d722e3fbSopenharmony_ci if (r) 140d722e3fbSopenharmony_ci return CUE_SCLEAN_FAILED; 141d722e3fbSopenharmony_ci 142d722e3fbSopenharmony_ci r = amdgpu_cs_ctx_free(context_handle); 143d722e3fbSopenharmony_ci if (r) 144d722e3fbSopenharmony_ci return CUE_SCLEAN_FAILED; 145d722e3fbSopenharmony_ci 146d722e3fbSopenharmony_ci r = amdgpu_device_deinitialize(device_handle); 147d722e3fbSopenharmony_ci if (r) 148d722e3fbSopenharmony_ci return CUE_SCLEAN_FAILED; 149d722e3fbSopenharmony_ci 150d722e3fbSopenharmony_ci return CUE_SUCCESS; 151d722e3fbSopenharmony_ci} 152d722e3fbSopenharmony_ci 153d722e3fbSopenharmony_cistatic int submit(unsigned ndw, unsigned ip) 154d722e3fbSopenharmony_ci{ 155d722e3fbSopenharmony_ci struct amdgpu_cs_request ibs_request = {0}; 156d722e3fbSopenharmony_ci struct amdgpu_cs_ib_info ib_info = {0}; 157d722e3fbSopenharmony_ci struct amdgpu_cs_fence fence_status = {0}; 158d722e3fbSopenharmony_ci uint32_t expired; 159d722e3fbSopenharmony_ci int r; 160d722e3fbSopenharmony_ci 161d722e3fbSopenharmony_ci ib_info.ib_mc_address = ib_mc_address; 162d722e3fbSopenharmony_ci ib_info.size = ndw; 163d722e3fbSopenharmony_ci 164d722e3fbSopenharmony_ci ibs_request.ip_type = ip; 165d722e3fbSopenharmony_ci 166d722e3fbSopenharmony_ci r = amdgpu_bo_list_create(device_handle, num_resources, resources, 167d722e3fbSopenharmony_ci NULL, &ibs_request.resources); 168d722e3fbSopenharmony_ci if (r) 169d722e3fbSopenharmony_ci return r; 170d722e3fbSopenharmony_ci 171d722e3fbSopenharmony_ci ibs_request.number_of_ibs = 1; 172d722e3fbSopenharmony_ci ibs_request.ibs = &ib_info; 173d722e3fbSopenharmony_ci ibs_request.fence_info.handle = NULL; 174d722e3fbSopenharmony_ci 175d722e3fbSopenharmony_ci r = amdgpu_cs_submit(context_handle, 0, &ibs_request, 1); 176d722e3fbSopenharmony_ci if (r) 177d722e3fbSopenharmony_ci return r; 178d722e3fbSopenharmony_ci 179d722e3fbSopenharmony_ci r = amdgpu_bo_list_destroy(ibs_request.resources); 180d722e3fbSopenharmony_ci if (r) 181d722e3fbSopenharmony_ci return r; 182d722e3fbSopenharmony_ci 183d722e3fbSopenharmony_ci fence_status.context = context_handle; 184d722e3fbSopenharmony_ci fence_status.ip_type = ip; 185d722e3fbSopenharmony_ci fence_status.fence = ibs_request.seq_no; 186d722e3fbSopenharmony_ci 187d722e3fbSopenharmony_ci r = amdgpu_cs_query_fence_status(&fence_status, 188d722e3fbSopenharmony_ci AMDGPU_TIMEOUT_INFINITE, 189d722e3fbSopenharmony_ci 0, &expired); 190d722e3fbSopenharmony_ci if (r) 191d722e3fbSopenharmony_ci return r; 192d722e3fbSopenharmony_ci 193d722e3fbSopenharmony_ci return 0; 194d722e3fbSopenharmony_ci} 195d722e3fbSopenharmony_ci 196d722e3fbSopenharmony_cistatic void alloc_resource(struct amdgpu_uvd_enc_bo *uvd_enc_bo, 197d722e3fbSopenharmony_ci unsigned size, unsigned domain) 198d722e3fbSopenharmony_ci{ 199d722e3fbSopenharmony_ci struct amdgpu_bo_alloc_request req = {0}; 200d722e3fbSopenharmony_ci amdgpu_bo_handle buf_handle; 201d722e3fbSopenharmony_ci amdgpu_va_handle va_handle; 202d722e3fbSopenharmony_ci uint64_t va = 0; 203d722e3fbSopenharmony_ci int r; 204d722e3fbSopenharmony_ci 205d722e3fbSopenharmony_ci req.alloc_size = ALIGN(size, 4096); 206d722e3fbSopenharmony_ci req.preferred_heap = domain; 207d722e3fbSopenharmony_ci r = amdgpu_bo_alloc(device_handle, &req, &buf_handle); 208d722e3fbSopenharmony_ci CU_ASSERT_EQUAL(r, 0); 209d722e3fbSopenharmony_ci r = amdgpu_va_range_alloc(device_handle, 210d722e3fbSopenharmony_ci amdgpu_gpu_va_range_general, 211d722e3fbSopenharmony_ci req.alloc_size, 1, 0, &va, 212d722e3fbSopenharmony_ci &va_handle, 0); 213d722e3fbSopenharmony_ci CU_ASSERT_EQUAL(r, 0); 214d722e3fbSopenharmony_ci r = amdgpu_bo_va_op(buf_handle, 0, req.alloc_size, va, 0, 215d722e3fbSopenharmony_ci AMDGPU_VA_OP_MAP); 216d722e3fbSopenharmony_ci CU_ASSERT_EQUAL(r, 0); 217d722e3fbSopenharmony_ci uvd_enc_bo->addr = va; 218d722e3fbSopenharmony_ci uvd_enc_bo->handle = buf_handle; 219d722e3fbSopenharmony_ci uvd_enc_bo->size = req.alloc_size; 220d722e3fbSopenharmony_ci uvd_enc_bo->va_handle = va_handle; 221d722e3fbSopenharmony_ci r = amdgpu_bo_cpu_map(uvd_enc_bo->handle, (void **)&uvd_enc_bo->ptr); 222d722e3fbSopenharmony_ci CU_ASSERT_EQUAL(r, 0); 223d722e3fbSopenharmony_ci memset(uvd_enc_bo->ptr, 0, size); 224d722e3fbSopenharmony_ci r = amdgpu_bo_cpu_unmap(uvd_enc_bo->handle); 225d722e3fbSopenharmony_ci CU_ASSERT_EQUAL(r, 0); 226d722e3fbSopenharmony_ci} 227d722e3fbSopenharmony_ci 228d722e3fbSopenharmony_cistatic void free_resource(struct amdgpu_uvd_enc_bo *uvd_enc_bo) 229d722e3fbSopenharmony_ci{ 230d722e3fbSopenharmony_ci int r; 231d722e3fbSopenharmony_ci 232d722e3fbSopenharmony_ci r = amdgpu_bo_va_op(uvd_enc_bo->handle, 0, uvd_enc_bo->size, 233d722e3fbSopenharmony_ci uvd_enc_bo->addr, 0, AMDGPU_VA_OP_UNMAP); 234d722e3fbSopenharmony_ci CU_ASSERT_EQUAL(r, 0); 235d722e3fbSopenharmony_ci 236d722e3fbSopenharmony_ci r = amdgpu_va_range_free(uvd_enc_bo->va_handle); 237d722e3fbSopenharmony_ci CU_ASSERT_EQUAL(r, 0); 238d722e3fbSopenharmony_ci 239d722e3fbSopenharmony_ci r = amdgpu_bo_free(uvd_enc_bo->handle); 240d722e3fbSopenharmony_ci CU_ASSERT_EQUAL(r, 0); 241d722e3fbSopenharmony_ci memset(uvd_enc_bo, 0, sizeof(*uvd_enc_bo)); 242d722e3fbSopenharmony_ci} 243d722e3fbSopenharmony_ci 244d722e3fbSopenharmony_cistatic void amdgpu_cs_uvd_enc_create(void) 245d722e3fbSopenharmony_ci{ 246d722e3fbSopenharmony_ci enc.width = 160; 247d722e3fbSopenharmony_ci enc.height = 128; 248d722e3fbSopenharmony_ci 249d722e3fbSopenharmony_ci num_resources = 0; 250d722e3fbSopenharmony_ci alloc_resource(&enc.session, 128 * 1024, AMDGPU_GEM_DOMAIN_GTT); 251d722e3fbSopenharmony_ci resources[num_resources++] = enc.session.handle; 252d722e3fbSopenharmony_ci resources[num_resources++] = ib_handle; 253d722e3fbSopenharmony_ci} 254d722e3fbSopenharmony_ci 255d722e3fbSopenharmony_cistatic void check_result(struct amdgpu_uvd_enc *enc) 256d722e3fbSopenharmony_ci{ 257d722e3fbSopenharmony_ci uint64_t sum; 258d722e3fbSopenharmony_ci uint32_t s = 175602; 259d722e3fbSopenharmony_ci uint32_t *ptr, size; 260d722e3fbSopenharmony_ci int j, r; 261d722e3fbSopenharmony_ci 262d722e3fbSopenharmony_ci r = amdgpu_bo_cpu_map(enc->fb.handle, (void **)&enc->fb.ptr); 263d722e3fbSopenharmony_ci CU_ASSERT_EQUAL(r, 0); 264d722e3fbSopenharmony_ci ptr = (uint32_t *)enc->fb.ptr; 265d722e3fbSopenharmony_ci size = ptr[6]; 266d722e3fbSopenharmony_ci r = amdgpu_bo_cpu_unmap(enc->fb.handle); 267d722e3fbSopenharmony_ci CU_ASSERT_EQUAL(r, 0); 268d722e3fbSopenharmony_ci r = amdgpu_bo_cpu_map(enc->bs.handle, (void **)&enc->bs.ptr); 269d722e3fbSopenharmony_ci CU_ASSERT_EQUAL(r, 0); 270d722e3fbSopenharmony_ci for (j = 0, sum = 0; j < size; ++j) 271d722e3fbSopenharmony_ci sum += enc->bs.ptr[j]; 272d722e3fbSopenharmony_ci CU_ASSERT_EQUAL(sum, s); 273d722e3fbSopenharmony_ci r = amdgpu_bo_cpu_unmap(enc->bs.handle); 274d722e3fbSopenharmony_ci CU_ASSERT_EQUAL(r, 0); 275d722e3fbSopenharmony_ci 276d722e3fbSopenharmony_ci} 277d722e3fbSopenharmony_ci 278d722e3fbSopenharmony_cistatic void amdgpu_cs_uvd_enc_session_init(void) 279d722e3fbSopenharmony_ci{ 280d722e3fbSopenharmony_ci int len, r; 281d722e3fbSopenharmony_ci 282d722e3fbSopenharmony_ci len = 0; 283d722e3fbSopenharmony_ci memcpy((ib_cpu + len), uve_session_info, sizeof(uve_session_info)); 284d722e3fbSopenharmony_ci len += sizeof(uve_session_info) / 4; 285d722e3fbSopenharmony_ci ib_cpu[len++] = enc.session.addr >> 32; 286d722e3fbSopenharmony_ci ib_cpu[len++] = enc.session.addr; 287d722e3fbSopenharmony_ci 288d722e3fbSopenharmony_ci memcpy((ib_cpu + len), uve_task_info, sizeof(uve_task_info)); 289d722e3fbSopenharmony_ci len += sizeof(uve_task_info) / 4; 290d722e3fbSopenharmony_ci ib_cpu[len++] = 0x000000d8; 291d722e3fbSopenharmony_ci ib_cpu[len++] = 0x00000000; 292d722e3fbSopenharmony_ci ib_cpu[len++] = 0x00000000; 293d722e3fbSopenharmony_ci 294d722e3fbSopenharmony_ci memcpy((ib_cpu + len), uve_op_init, sizeof(uve_op_init)); 295d722e3fbSopenharmony_ci len += sizeof(uve_op_init) / 4; 296d722e3fbSopenharmony_ci 297d722e3fbSopenharmony_ci memcpy((ib_cpu + len), uve_session_init, sizeof(uve_session_init)); 298d722e3fbSopenharmony_ci len += sizeof(uve_session_init) / 4; 299d722e3fbSopenharmony_ci 300d722e3fbSopenharmony_ci memcpy((ib_cpu + len), uve_layer_ctrl, sizeof(uve_layer_ctrl)); 301d722e3fbSopenharmony_ci len += sizeof(uve_layer_ctrl) / 4; 302d722e3fbSopenharmony_ci 303d722e3fbSopenharmony_ci memcpy((ib_cpu + len), uve_slice_ctrl, sizeof(uve_slice_ctrl)); 304d722e3fbSopenharmony_ci len += sizeof(uve_slice_ctrl) / 4; 305d722e3fbSopenharmony_ci 306d722e3fbSopenharmony_ci memcpy((ib_cpu + len), uve_spec_misc, sizeof(uve_spec_misc)); 307d722e3fbSopenharmony_ci len += sizeof(uve_spec_misc) / 4; 308d722e3fbSopenharmony_ci 309d722e3fbSopenharmony_ci memcpy((ib_cpu + len), uve_rc_session_init, sizeof(uve_rc_session_init)); 310d722e3fbSopenharmony_ci len += sizeof(uve_rc_session_init) / 4; 311d722e3fbSopenharmony_ci 312d722e3fbSopenharmony_ci memcpy((ib_cpu + len), uve_deblocking_filter, sizeof(uve_deblocking_filter)); 313d722e3fbSopenharmony_ci len += sizeof(uve_deblocking_filter) / 4; 314d722e3fbSopenharmony_ci 315d722e3fbSopenharmony_ci memcpy((ib_cpu + len), uve_quality_params, sizeof(uve_quality_params)); 316d722e3fbSopenharmony_ci len += sizeof(uve_quality_params) / 4; 317d722e3fbSopenharmony_ci 318d722e3fbSopenharmony_ci memcpy((ib_cpu + len), uve_op_init_rc, sizeof(uve_op_init_rc)); 319d722e3fbSopenharmony_ci len += sizeof(uve_op_init_rc) / 4; 320d722e3fbSopenharmony_ci 321d722e3fbSopenharmony_ci memcpy((ib_cpu + len), uve_op_init_rc_vbv_level, sizeof(uve_op_init_rc_vbv_level)); 322d722e3fbSopenharmony_ci len += sizeof(uve_op_init_rc_vbv_level) / 4; 323d722e3fbSopenharmony_ci 324d722e3fbSopenharmony_ci r = submit(len, AMDGPU_HW_IP_UVD_ENC); 325d722e3fbSopenharmony_ci CU_ASSERT_EQUAL(r, 0); 326d722e3fbSopenharmony_ci} 327d722e3fbSopenharmony_ci 328d722e3fbSopenharmony_cistatic void amdgpu_cs_uvd_enc_encode(void) 329d722e3fbSopenharmony_ci{ 330d722e3fbSopenharmony_ci int len, r, i; 331d722e3fbSopenharmony_ci uint64_t luma_offset, chroma_offset; 332d722e3fbSopenharmony_ci uint32_t vbuf_size, bs_size = 0x003f4800, cpb_size; 333d722e3fbSopenharmony_ci unsigned align = (family_id >= AMDGPU_FAMILY_AI) ? 256 : 16; 334d722e3fbSopenharmony_ci vbuf_size = ALIGN(enc.width, align) * ALIGN(enc.height, 16) * 1.5; 335d722e3fbSopenharmony_ci cpb_size = vbuf_size * 10; 336d722e3fbSopenharmony_ci 337d722e3fbSopenharmony_ci 338d722e3fbSopenharmony_ci num_resources = 0; 339d722e3fbSopenharmony_ci alloc_resource(&enc.fb, 4096, AMDGPU_GEM_DOMAIN_VRAM); 340d722e3fbSopenharmony_ci resources[num_resources++] = enc.fb.handle; 341d722e3fbSopenharmony_ci alloc_resource(&enc.bs, bs_size, AMDGPU_GEM_DOMAIN_VRAM); 342d722e3fbSopenharmony_ci resources[num_resources++] = enc.bs.handle; 343d722e3fbSopenharmony_ci alloc_resource(&enc.vbuf, vbuf_size, AMDGPU_GEM_DOMAIN_VRAM); 344d722e3fbSopenharmony_ci resources[num_resources++] = enc.vbuf.handle; 345d722e3fbSopenharmony_ci alloc_resource(&enc.cpb, cpb_size, AMDGPU_GEM_DOMAIN_VRAM); 346d722e3fbSopenharmony_ci resources[num_resources++] = enc.cpb.handle; 347d722e3fbSopenharmony_ci resources[num_resources++] = ib_handle; 348d722e3fbSopenharmony_ci 349d722e3fbSopenharmony_ci r = amdgpu_bo_cpu_map(enc.vbuf.handle, (void **)&enc.vbuf.ptr); 350d722e3fbSopenharmony_ci CU_ASSERT_EQUAL(r, 0); 351d722e3fbSopenharmony_ci 352d722e3fbSopenharmony_ci memset(enc.vbuf.ptr, 0, vbuf_size); 353d722e3fbSopenharmony_ci for (i = 0; i < enc.height; ++i) { 354d722e3fbSopenharmony_ci memcpy(enc.vbuf.ptr, (frame + i * enc.width), enc.width); 355d722e3fbSopenharmony_ci enc.vbuf.ptr += ALIGN(enc.width, align); 356d722e3fbSopenharmony_ci } 357d722e3fbSopenharmony_ci for (i = 0; i < enc.height / 2; ++i) { 358d722e3fbSopenharmony_ci memcpy(enc.vbuf.ptr, ((frame + enc.height * enc.width) + i * enc.width), enc.width); 359d722e3fbSopenharmony_ci enc.vbuf.ptr += ALIGN(enc.width, align); 360d722e3fbSopenharmony_ci } 361d722e3fbSopenharmony_ci 362d722e3fbSopenharmony_ci r = amdgpu_bo_cpu_unmap(enc.vbuf.handle); 363d722e3fbSopenharmony_ci CU_ASSERT_EQUAL(r, 0); 364d722e3fbSopenharmony_ci 365d722e3fbSopenharmony_ci len = 0; 366d722e3fbSopenharmony_ci memcpy((ib_cpu + len), uve_session_info, sizeof(uve_session_info)); 367d722e3fbSopenharmony_ci len += sizeof(uve_session_info) / 4; 368d722e3fbSopenharmony_ci ib_cpu[len++] = enc.session.addr >> 32; 369d722e3fbSopenharmony_ci ib_cpu[len++] = enc.session.addr; 370d722e3fbSopenharmony_ci 371d722e3fbSopenharmony_ci memcpy((ib_cpu + len), uve_task_info, sizeof(uve_task_info)); 372d722e3fbSopenharmony_ci len += sizeof(uve_task_info) / 4; 373d722e3fbSopenharmony_ci ib_cpu[len++] = 0x000005e0; 374d722e3fbSopenharmony_ci ib_cpu[len++] = 0x00000001; 375d722e3fbSopenharmony_ci ib_cpu[len++] = 0x00000001; 376d722e3fbSopenharmony_ci 377d722e3fbSopenharmony_ci memcpy((ib_cpu + len), uve_nalu_buffer_1, sizeof(uve_nalu_buffer_1)); 378d722e3fbSopenharmony_ci len += sizeof(uve_nalu_buffer_1) / 4; 379d722e3fbSopenharmony_ci 380d722e3fbSopenharmony_ci memcpy((ib_cpu + len), uve_nalu_buffer_2, sizeof(uve_nalu_buffer_2)); 381d722e3fbSopenharmony_ci len += sizeof(uve_nalu_buffer_2) / 4; 382d722e3fbSopenharmony_ci 383d722e3fbSopenharmony_ci memcpy((ib_cpu + len), uve_nalu_buffer_3, sizeof(uve_nalu_buffer_3)); 384d722e3fbSopenharmony_ci len += sizeof(uve_nalu_buffer_3) / 4; 385d722e3fbSopenharmony_ci 386d722e3fbSopenharmony_ci memcpy((ib_cpu + len), uve_nalu_buffer_4, sizeof(uve_nalu_buffer_4)); 387d722e3fbSopenharmony_ci len += sizeof(uve_nalu_buffer_4) / 4; 388d722e3fbSopenharmony_ci 389d722e3fbSopenharmony_ci memcpy((ib_cpu + len), uve_slice_header, sizeof(uve_slice_header)); 390d722e3fbSopenharmony_ci len += sizeof(uve_slice_header) / 4; 391d722e3fbSopenharmony_ci 392d722e3fbSopenharmony_ci ib_cpu[len++] = 0x00000254; 393d722e3fbSopenharmony_ci ib_cpu[len++] = 0x00000010; 394d722e3fbSopenharmony_ci ib_cpu[len++] = enc.cpb.addr >> 32; 395d722e3fbSopenharmony_ci ib_cpu[len++] = enc.cpb.addr; 396d722e3fbSopenharmony_ci memcpy((ib_cpu + len), uve_ctx_buffer, sizeof(uve_ctx_buffer)); 397d722e3fbSopenharmony_ci len += sizeof(uve_ctx_buffer) / 4; 398d722e3fbSopenharmony_ci 399d722e3fbSopenharmony_ci memcpy((ib_cpu + len), uve_bitstream_buffer, sizeof(uve_bitstream_buffer)); 400d722e3fbSopenharmony_ci len += sizeof(uve_bitstream_buffer) / 4; 401d722e3fbSopenharmony_ci ib_cpu[len++] = 0x00000000; 402d722e3fbSopenharmony_ci ib_cpu[len++] = enc.bs.addr >> 32; 403d722e3fbSopenharmony_ci ib_cpu[len++] = enc.bs.addr; 404d722e3fbSopenharmony_ci ib_cpu[len++] = 0x003f4800; 405d722e3fbSopenharmony_ci ib_cpu[len++] = 0x00000000; 406d722e3fbSopenharmony_ci 407d722e3fbSopenharmony_ci memcpy((ib_cpu + len), uve_feedback_buffer, sizeof(uve_feedback_buffer)); 408d722e3fbSopenharmony_ci len += sizeof(uve_feedback_buffer) / 4; 409d722e3fbSopenharmony_ci ib_cpu[len++] = enc.fb.addr >> 32; 410d722e3fbSopenharmony_ci ib_cpu[len++] = enc.fb.addr; 411d722e3fbSopenharmony_ci ib_cpu[len++] = 0x00000010; 412d722e3fbSopenharmony_ci ib_cpu[len++] = 0x00000028; 413d722e3fbSopenharmony_ci 414d722e3fbSopenharmony_ci memcpy((ib_cpu + len), uve_feedback_buffer_additional, sizeof(uve_feedback_buffer_additional)); 415d722e3fbSopenharmony_ci len += sizeof(uve_feedback_buffer_additional) / 4; 416d722e3fbSopenharmony_ci 417d722e3fbSopenharmony_ci memcpy((ib_cpu + len), uve_intra_refresh, sizeof(uve_intra_refresh)); 418d722e3fbSopenharmony_ci len += sizeof(uve_intra_refresh) / 4; 419d722e3fbSopenharmony_ci 420d722e3fbSopenharmony_ci memcpy((ib_cpu + len), uve_layer_select, sizeof(uve_layer_select)); 421d722e3fbSopenharmony_ci len += sizeof(uve_layer_select) / 4; 422d722e3fbSopenharmony_ci 423d722e3fbSopenharmony_ci memcpy((ib_cpu + len), uve_rc_layer_init, sizeof(uve_rc_layer_init)); 424d722e3fbSopenharmony_ci len += sizeof(uve_rc_layer_init) / 4; 425d722e3fbSopenharmony_ci 426d722e3fbSopenharmony_ci memcpy((ib_cpu + len), uve_layer_select, sizeof(uve_layer_select)); 427d722e3fbSopenharmony_ci len += sizeof(uve_layer_select) / 4; 428d722e3fbSopenharmony_ci 429d722e3fbSopenharmony_ci memcpy((ib_cpu + len), uve_rc_per_pic, sizeof(uve_rc_per_pic)); 430d722e3fbSopenharmony_ci len += sizeof(uve_rc_per_pic) / 4; 431d722e3fbSopenharmony_ci 432d722e3fbSopenharmony_ci unsigned luma_size = ALIGN(enc.width, align) * ALIGN(enc.height, 16); 433d722e3fbSopenharmony_ci luma_offset = enc.vbuf.addr; 434d722e3fbSopenharmony_ci chroma_offset = luma_offset + luma_size; 435d722e3fbSopenharmony_ci ib_cpu[len++] = 0x00000054; 436d722e3fbSopenharmony_ci ib_cpu[len++] = 0x0000000c; 437d722e3fbSopenharmony_ci ib_cpu[len++] = 0x00000002; 438d722e3fbSopenharmony_ci ib_cpu[len++] = 0x003f4800; 439d722e3fbSopenharmony_ci ib_cpu[len++] = luma_offset >> 32; 440d722e3fbSopenharmony_ci ib_cpu[len++] = luma_offset; 441d722e3fbSopenharmony_ci ib_cpu[len++] = chroma_offset >> 32; 442d722e3fbSopenharmony_ci ib_cpu[len++] = chroma_offset; 443d722e3fbSopenharmony_ci memcpy((ib_cpu + len), uve_encode_param, sizeof(uve_encode_param)); 444d722e3fbSopenharmony_ci ib_cpu[len] = ALIGN(enc.width, align); 445d722e3fbSopenharmony_ci ib_cpu[len + 1] = ALIGN(enc.width, align); 446d722e3fbSopenharmony_ci len += sizeof(uve_encode_param) / 4; 447d722e3fbSopenharmony_ci 448d722e3fbSopenharmony_ci memcpy((ib_cpu + len), uve_op_speed_enc_mode, sizeof(uve_op_speed_enc_mode)); 449d722e3fbSopenharmony_ci len += sizeof(uve_op_speed_enc_mode) / 4; 450d722e3fbSopenharmony_ci 451d722e3fbSopenharmony_ci memcpy((ib_cpu + len), uve_op_encode, sizeof(uve_op_encode)); 452d722e3fbSopenharmony_ci len += sizeof(uve_op_encode) / 4; 453d722e3fbSopenharmony_ci 454d722e3fbSopenharmony_ci r = submit(len, AMDGPU_HW_IP_UVD_ENC); 455d722e3fbSopenharmony_ci CU_ASSERT_EQUAL(r, 0); 456d722e3fbSopenharmony_ci 457d722e3fbSopenharmony_ci check_result(&enc); 458d722e3fbSopenharmony_ci 459d722e3fbSopenharmony_ci free_resource(&enc.fb); 460d722e3fbSopenharmony_ci free_resource(&enc.bs); 461d722e3fbSopenharmony_ci free_resource(&enc.vbuf); 462d722e3fbSopenharmony_ci free_resource(&enc.cpb); 463d722e3fbSopenharmony_ci} 464d722e3fbSopenharmony_ci 465d722e3fbSopenharmony_cistatic void amdgpu_cs_uvd_enc_destroy(void) 466d722e3fbSopenharmony_ci{ 467d722e3fbSopenharmony_ci int len, r; 468d722e3fbSopenharmony_ci 469d722e3fbSopenharmony_ci num_resources = 0; 470d722e3fbSopenharmony_ci resources[num_resources++] = ib_handle; 471d722e3fbSopenharmony_ci 472d722e3fbSopenharmony_ci len = 0; 473d722e3fbSopenharmony_ci memcpy((ib_cpu + len), uve_session_info, sizeof(uve_session_info)); 474d722e3fbSopenharmony_ci len += sizeof(uve_session_info) / 4; 475d722e3fbSopenharmony_ci ib_cpu[len++] = enc.session.addr >> 32; 476d722e3fbSopenharmony_ci ib_cpu[len++] = enc.session.addr; 477d722e3fbSopenharmony_ci 478d722e3fbSopenharmony_ci memcpy((ib_cpu + len), uve_task_info, sizeof(uve_task_info)); 479d722e3fbSopenharmony_ci len += sizeof(uve_task_info) / 4; 480d722e3fbSopenharmony_ci ib_cpu[len++] = 0xffffffff; 481d722e3fbSopenharmony_ci ib_cpu[len++] = 0x00000002; 482d722e3fbSopenharmony_ci ib_cpu[len++] = 0x00000000; 483d722e3fbSopenharmony_ci 484d722e3fbSopenharmony_ci memcpy((ib_cpu + len), uve_op_close, sizeof(uve_op_close)); 485d722e3fbSopenharmony_ci len += sizeof(uve_op_close) / 4; 486d722e3fbSopenharmony_ci 487d722e3fbSopenharmony_ci r = submit(len, AMDGPU_HW_IP_UVD_ENC); 488d722e3fbSopenharmony_ci CU_ASSERT_EQUAL(r, 0); 489d722e3fbSopenharmony_ci 490d722e3fbSopenharmony_ci free_resource(&enc.session); 491d722e3fbSopenharmony_ci} 492