1d722e3fbSopenharmony_ci/*
2d722e3fbSopenharmony_ci * Copyright 2017 Advanced Micro Devices, Inc.
3d722e3fbSopenharmony_ci *
4d722e3fbSopenharmony_ci * Permission is hereby granted, free of charge, to any person obtaining a
5d722e3fbSopenharmony_ci * copy of this software and associated documentation files (the "Software"),
6d722e3fbSopenharmony_ci * to deal in the Software without restriction, including without limitation
7d722e3fbSopenharmony_ci * the rights to use, copy, modify, merge, publish, distribute, sublicense,
8d722e3fbSopenharmony_ci * and/or sell copies of the Software, and to permit persons to whom the
9d722e3fbSopenharmony_ci * Software is furnished to do so, subject to the following conditions:
10d722e3fbSopenharmony_ci *
11d722e3fbSopenharmony_ci * The above copyright notice and this permission notice shall be included in
12d722e3fbSopenharmony_ci * all copies or substantial portions of the Software.
13d722e3fbSopenharmony_ci *
14d722e3fbSopenharmony_ci * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
15d722e3fbSopenharmony_ci * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
16d722e3fbSopenharmony_ci * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT.  IN NO EVENT SHALL
17d722e3fbSopenharmony_ci * THE COPYRIGHT HOLDER(S) OR AUTHOR(S) BE LIABLE FOR ANY CLAIM, DAMAGES OR
18d722e3fbSopenharmony_ci * OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE,
19d722e3fbSopenharmony_ci * ARISING FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR
20d722e3fbSopenharmony_ci * OTHER DEALINGS IN THE SOFTWARE.
21d722e3fbSopenharmony_ci *
22d722e3fbSopenharmony_ci*/
23d722e3fbSopenharmony_ci
24d722e3fbSopenharmony_ci#include <stdio.h>
25d722e3fbSopenharmony_ci#include <inttypes.h>
26d722e3fbSopenharmony_ci
27d722e3fbSopenharmony_ci#include "CUnit/Basic.h"
28d722e3fbSopenharmony_ci
29d722e3fbSopenharmony_ci#include "util_math.h"
30d722e3fbSopenharmony_ci
31d722e3fbSopenharmony_ci#include "amdgpu_test.h"
32d722e3fbSopenharmony_ci#include "amdgpu_drm.h"
33d722e3fbSopenharmony_ci#include "amdgpu_internal.h"
34d722e3fbSopenharmony_ci#include "frame.h"
35d722e3fbSopenharmony_ci#include "uve_ib.h"
36d722e3fbSopenharmony_ci
/* Allocation size requested for the indirect buffer shared by all tests. */
#define IB_SIZE		4096
/* Number of slots in the resources[] array handed to submit(). */
#define MAX_RESOURCES	16
39d722e3fbSopenharmony_ci
40d722e3fbSopenharmony_cistruct amdgpu_uvd_enc_bo {
41d722e3fbSopenharmony_ci	amdgpu_bo_handle handle;
42d722e3fbSopenharmony_ci	amdgpu_va_handle va_handle;
43d722e3fbSopenharmony_ci	uint64_t addr;
44d722e3fbSopenharmony_ci	uint64_t size;
45d722e3fbSopenharmony_ci	uint8_t *ptr;
46d722e3fbSopenharmony_ci};
47d722e3fbSopenharmony_ci
48d722e3fbSopenharmony_cistruct amdgpu_uvd_enc {
49d722e3fbSopenharmony_ci	unsigned width;
50d722e3fbSopenharmony_ci	unsigned height;
51d722e3fbSopenharmony_ci	struct amdgpu_uvd_enc_bo session;
52d722e3fbSopenharmony_ci	struct amdgpu_uvd_enc_bo vbuf;
53d722e3fbSopenharmony_ci	struct amdgpu_uvd_enc_bo bs;
54d722e3fbSopenharmony_ci	struct amdgpu_uvd_enc_bo fb;
55d722e3fbSopenharmony_ci	struct amdgpu_uvd_enc_bo cpb;
56d722e3fbSopenharmony_ci};
57d722e3fbSopenharmony_ci
58d722e3fbSopenharmony_cistatic amdgpu_device_handle device_handle;
59d722e3fbSopenharmony_cistatic uint32_t major_version;
60d722e3fbSopenharmony_cistatic uint32_t minor_version;
61d722e3fbSopenharmony_cistatic uint32_t family_id;
62d722e3fbSopenharmony_ci
63d722e3fbSopenharmony_cistatic amdgpu_context_handle context_handle;
64d722e3fbSopenharmony_cistatic amdgpu_bo_handle ib_handle;
65d722e3fbSopenharmony_cistatic amdgpu_va_handle ib_va_handle;
66d722e3fbSopenharmony_cistatic uint64_t ib_mc_address;
67d722e3fbSopenharmony_cistatic uint32_t *ib_cpu;
68d722e3fbSopenharmony_ci
69d722e3fbSopenharmony_cistatic struct amdgpu_uvd_enc enc;
70d722e3fbSopenharmony_cistatic amdgpu_bo_handle resources[MAX_RESOURCES];
71d722e3fbSopenharmony_cistatic unsigned num_resources;
72d722e3fbSopenharmony_ci
73d722e3fbSopenharmony_cistatic void amdgpu_cs_uvd_enc_create(void);
74d722e3fbSopenharmony_cistatic void amdgpu_cs_uvd_enc_session_init(void);
75d722e3fbSopenharmony_cistatic void amdgpu_cs_uvd_enc_encode(void);
76d722e3fbSopenharmony_cistatic void amdgpu_cs_uvd_enc_destroy(void);
77d722e3fbSopenharmony_ci
78d722e3fbSopenharmony_ci
79d722e3fbSopenharmony_ciCU_TestInfo uvd_enc_tests[] = {
80d722e3fbSopenharmony_ci	{ "UVD ENC create",  amdgpu_cs_uvd_enc_create },
81d722e3fbSopenharmony_ci	{ "UVD ENC session init",  amdgpu_cs_uvd_enc_session_init },
82d722e3fbSopenharmony_ci	{ "UVD ENC encode",  amdgpu_cs_uvd_enc_encode },
83d722e3fbSopenharmony_ci	{ "UVD ENC destroy",  amdgpu_cs_uvd_enc_destroy },
84d722e3fbSopenharmony_ci	CU_TEST_INFO_NULL,
85d722e3fbSopenharmony_ci};
86d722e3fbSopenharmony_ci
87d722e3fbSopenharmony_ciCU_BOOL suite_uvd_enc_tests_enable(void)
88d722e3fbSopenharmony_ci{
89d722e3fbSopenharmony_ci	int r;
90d722e3fbSopenharmony_ci	struct drm_amdgpu_info_hw_ip info;
91d722e3fbSopenharmony_ci
92d722e3fbSopenharmony_ci	if (amdgpu_device_initialize(drm_amdgpu[0], &major_version,
93d722e3fbSopenharmony_ci					     &minor_version, &device_handle))
94d722e3fbSopenharmony_ci		return CU_FALSE;
95d722e3fbSopenharmony_ci
96d722e3fbSopenharmony_ci	r = amdgpu_query_hw_ip_info(device_handle, AMDGPU_HW_IP_UVD_ENC, 0, &info);
97d722e3fbSopenharmony_ci
98d722e3fbSopenharmony_ci	if (amdgpu_device_deinitialize(device_handle))
99d722e3fbSopenharmony_ci		return CU_FALSE;
100d722e3fbSopenharmony_ci
101d722e3fbSopenharmony_ci	if (!info.available_rings)
102d722e3fbSopenharmony_ci		printf("\n\nThe ASIC NOT support UVD ENC, suite disabled.\n");
103d722e3fbSopenharmony_ci
104d722e3fbSopenharmony_ci	return (r == 0 && (info.available_rings ? CU_TRUE : CU_FALSE));
105d722e3fbSopenharmony_ci}
106d722e3fbSopenharmony_ci
107d722e3fbSopenharmony_ci
108d722e3fbSopenharmony_ciint suite_uvd_enc_tests_init(void)
109d722e3fbSopenharmony_ci{
110d722e3fbSopenharmony_ci	int r;
111d722e3fbSopenharmony_ci
112d722e3fbSopenharmony_ci	r = amdgpu_device_initialize(drm_amdgpu[0], &major_version,
113d722e3fbSopenharmony_ci				     &minor_version, &device_handle);
114d722e3fbSopenharmony_ci	if (r)
115d722e3fbSopenharmony_ci		return CUE_SINIT_FAILED;
116d722e3fbSopenharmony_ci
117d722e3fbSopenharmony_ci	family_id = device_handle->info.family_id;
118d722e3fbSopenharmony_ci
119d722e3fbSopenharmony_ci	r = amdgpu_cs_ctx_create(device_handle, &context_handle);
120d722e3fbSopenharmony_ci	if (r)
121d722e3fbSopenharmony_ci		return CUE_SINIT_FAILED;
122d722e3fbSopenharmony_ci
123d722e3fbSopenharmony_ci	r = amdgpu_bo_alloc_and_map(device_handle, IB_SIZE, 4096,
124d722e3fbSopenharmony_ci				    AMDGPU_GEM_DOMAIN_GTT, 0,
125d722e3fbSopenharmony_ci				    &ib_handle, (void**)&ib_cpu,
126d722e3fbSopenharmony_ci				    &ib_mc_address, &ib_va_handle);
127d722e3fbSopenharmony_ci	if (r)
128d722e3fbSopenharmony_ci		return CUE_SINIT_FAILED;
129d722e3fbSopenharmony_ci
130d722e3fbSopenharmony_ci	return CUE_SUCCESS;
131d722e3fbSopenharmony_ci}
132d722e3fbSopenharmony_ci
133d722e3fbSopenharmony_ciint suite_uvd_enc_tests_clean(void)
134d722e3fbSopenharmony_ci{
135d722e3fbSopenharmony_ci	int r;
136d722e3fbSopenharmony_ci
137d722e3fbSopenharmony_ci	r = amdgpu_bo_unmap_and_free(ib_handle, ib_va_handle,
138d722e3fbSopenharmony_ci				     ib_mc_address, IB_SIZE);
139d722e3fbSopenharmony_ci	if (r)
140d722e3fbSopenharmony_ci		return CUE_SCLEAN_FAILED;
141d722e3fbSopenharmony_ci
142d722e3fbSopenharmony_ci	r = amdgpu_cs_ctx_free(context_handle);
143d722e3fbSopenharmony_ci	if (r)
144d722e3fbSopenharmony_ci		return CUE_SCLEAN_FAILED;
145d722e3fbSopenharmony_ci
146d722e3fbSopenharmony_ci	r = amdgpu_device_deinitialize(device_handle);
147d722e3fbSopenharmony_ci	if (r)
148d722e3fbSopenharmony_ci		return CUE_SCLEAN_FAILED;
149d722e3fbSopenharmony_ci
150d722e3fbSopenharmony_ci	return CUE_SUCCESS;
151d722e3fbSopenharmony_ci}
152d722e3fbSopenharmony_ci
153d722e3fbSopenharmony_cistatic int submit(unsigned ndw, unsigned ip)
154d722e3fbSopenharmony_ci{
155d722e3fbSopenharmony_ci	struct amdgpu_cs_request ibs_request = {0};
156d722e3fbSopenharmony_ci	struct amdgpu_cs_ib_info ib_info = {0};
157d722e3fbSopenharmony_ci	struct amdgpu_cs_fence fence_status = {0};
158d722e3fbSopenharmony_ci	uint32_t expired;
159d722e3fbSopenharmony_ci	int r;
160d722e3fbSopenharmony_ci
161d722e3fbSopenharmony_ci	ib_info.ib_mc_address = ib_mc_address;
162d722e3fbSopenharmony_ci	ib_info.size = ndw;
163d722e3fbSopenharmony_ci
164d722e3fbSopenharmony_ci	ibs_request.ip_type = ip;
165d722e3fbSopenharmony_ci
166d722e3fbSopenharmony_ci	r = amdgpu_bo_list_create(device_handle, num_resources, resources,
167d722e3fbSopenharmony_ci				  NULL, &ibs_request.resources);
168d722e3fbSopenharmony_ci	if (r)
169d722e3fbSopenharmony_ci		return r;
170d722e3fbSopenharmony_ci
171d722e3fbSopenharmony_ci	ibs_request.number_of_ibs = 1;
172d722e3fbSopenharmony_ci	ibs_request.ibs = &ib_info;
173d722e3fbSopenharmony_ci	ibs_request.fence_info.handle = NULL;
174d722e3fbSopenharmony_ci
175d722e3fbSopenharmony_ci	r = amdgpu_cs_submit(context_handle, 0, &ibs_request, 1);
176d722e3fbSopenharmony_ci	if (r)
177d722e3fbSopenharmony_ci		return r;
178d722e3fbSopenharmony_ci
179d722e3fbSopenharmony_ci	r = amdgpu_bo_list_destroy(ibs_request.resources);
180d722e3fbSopenharmony_ci	if (r)
181d722e3fbSopenharmony_ci		return r;
182d722e3fbSopenharmony_ci
183d722e3fbSopenharmony_ci	fence_status.context = context_handle;
184d722e3fbSopenharmony_ci	fence_status.ip_type = ip;
185d722e3fbSopenharmony_ci	fence_status.fence = ibs_request.seq_no;
186d722e3fbSopenharmony_ci
187d722e3fbSopenharmony_ci	r = amdgpu_cs_query_fence_status(&fence_status,
188d722e3fbSopenharmony_ci					 AMDGPU_TIMEOUT_INFINITE,
189d722e3fbSopenharmony_ci					 0, &expired);
190d722e3fbSopenharmony_ci	if (r)
191d722e3fbSopenharmony_ci		return r;
192d722e3fbSopenharmony_ci
193d722e3fbSopenharmony_ci	return 0;
194d722e3fbSopenharmony_ci}
195d722e3fbSopenharmony_ci
196d722e3fbSopenharmony_cistatic void alloc_resource(struct amdgpu_uvd_enc_bo *uvd_enc_bo,
197d722e3fbSopenharmony_ci			unsigned size, unsigned domain)
198d722e3fbSopenharmony_ci{
199d722e3fbSopenharmony_ci	struct amdgpu_bo_alloc_request req = {0};
200d722e3fbSopenharmony_ci	amdgpu_bo_handle buf_handle;
201d722e3fbSopenharmony_ci	amdgpu_va_handle va_handle;
202d722e3fbSopenharmony_ci	uint64_t va = 0;
203d722e3fbSopenharmony_ci	int r;
204d722e3fbSopenharmony_ci
205d722e3fbSopenharmony_ci	req.alloc_size = ALIGN(size, 4096);
206d722e3fbSopenharmony_ci	req.preferred_heap = domain;
207d722e3fbSopenharmony_ci	r = amdgpu_bo_alloc(device_handle, &req, &buf_handle);
208d722e3fbSopenharmony_ci	CU_ASSERT_EQUAL(r, 0);
209d722e3fbSopenharmony_ci	r = amdgpu_va_range_alloc(device_handle,
210d722e3fbSopenharmony_ci				  amdgpu_gpu_va_range_general,
211d722e3fbSopenharmony_ci				  req.alloc_size, 1, 0, &va,
212d722e3fbSopenharmony_ci				  &va_handle, 0);
213d722e3fbSopenharmony_ci	CU_ASSERT_EQUAL(r, 0);
214d722e3fbSopenharmony_ci	r = amdgpu_bo_va_op(buf_handle, 0, req.alloc_size, va, 0,
215d722e3fbSopenharmony_ci			    AMDGPU_VA_OP_MAP);
216d722e3fbSopenharmony_ci	CU_ASSERT_EQUAL(r, 0);
217d722e3fbSopenharmony_ci	uvd_enc_bo->addr = va;
218d722e3fbSopenharmony_ci	uvd_enc_bo->handle = buf_handle;
219d722e3fbSopenharmony_ci	uvd_enc_bo->size = req.alloc_size;
220d722e3fbSopenharmony_ci	uvd_enc_bo->va_handle = va_handle;
221d722e3fbSopenharmony_ci	r = amdgpu_bo_cpu_map(uvd_enc_bo->handle, (void **)&uvd_enc_bo->ptr);
222d722e3fbSopenharmony_ci	CU_ASSERT_EQUAL(r, 0);
223d722e3fbSopenharmony_ci	memset(uvd_enc_bo->ptr, 0, size);
224d722e3fbSopenharmony_ci	r = amdgpu_bo_cpu_unmap(uvd_enc_bo->handle);
225d722e3fbSopenharmony_ci	CU_ASSERT_EQUAL(r, 0);
226d722e3fbSopenharmony_ci}
227d722e3fbSopenharmony_ci
228d722e3fbSopenharmony_cistatic void free_resource(struct amdgpu_uvd_enc_bo *uvd_enc_bo)
229d722e3fbSopenharmony_ci{
230d722e3fbSopenharmony_ci	int r;
231d722e3fbSopenharmony_ci
232d722e3fbSopenharmony_ci	r = amdgpu_bo_va_op(uvd_enc_bo->handle, 0, uvd_enc_bo->size,
233d722e3fbSopenharmony_ci			    uvd_enc_bo->addr, 0, AMDGPU_VA_OP_UNMAP);
234d722e3fbSopenharmony_ci	CU_ASSERT_EQUAL(r, 0);
235d722e3fbSopenharmony_ci
236d722e3fbSopenharmony_ci	r = amdgpu_va_range_free(uvd_enc_bo->va_handle);
237d722e3fbSopenharmony_ci	CU_ASSERT_EQUAL(r, 0);
238d722e3fbSopenharmony_ci
239d722e3fbSopenharmony_ci	r = amdgpu_bo_free(uvd_enc_bo->handle);
240d722e3fbSopenharmony_ci	CU_ASSERT_EQUAL(r, 0);
241d722e3fbSopenharmony_ci	memset(uvd_enc_bo, 0, sizeof(*uvd_enc_bo));
242d722e3fbSopenharmony_ci}
243d722e3fbSopenharmony_ci
244d722e3fbSopenharmony_cistatic void amdgpu_cs_uvd_enc_create(void)
245d722e3fbSopenharmony_ci{
246d722e3fbSopenharmony_ci	enc.width = 160;
247d722e3fbSopenharmony_ci	enc.height = 128;
248d722e3fbSopenharmony_ci
249d722e3fbSopenharmony_ci	num_resources  = 0;
250d722e3fbSopenharmony_ci	alloc_resource(&enc.session, 128 * 1024, AMDGPU_GEM_DOMAIN_GTT);
251d722e3fbSopenharmony_ci	resources[num_resources++] = enc.session.handle;
252d722e3fbSopenharmony_ci	resources[num_resources++] = ib_handle;
253d722e3fbSopenharmony_ci}
254d722e3fbSopenharmony_ci
255d722e3fbSopenharmony_cistatic void check_result(struct amdgpu_uvd_enc *enc)
256d722e3fbSopenharmony_ci{
257d722e3fbSopenharmony_ci	uint64_t sum;
258d722e3fbSopenharmony_ci	uint32_t s = 175602;
259d722e3fbSopenharmony_ci	uint32_t *ptr, size;
260d722e3fbSopenharmony_ci	int j, r;
261d722e3fbSopenharmony_ci
262d722e3fbSopenharmony_ci	r = amdgpu_bo_cpu_map(enc->fb.handle, (void **)&enc->fb.ptr);
263d722e3fbSopenharmony_ci	CU_ASSERT_EQUAL(r, 0);
264d722e3fbSopenharmony_ci	ptr = (uint32_t *)enc->fb.ptr;
265d722e3fbSopenharmony_ci	size = ptr[6];
266d722e3fbSopenharmony_ci	r = amdgpu_bo_cpu_unmap(enc->fb.handle);
267d722e3fbSopenharmony_ci	CU_ASSERT_EQUAL(r, 0);
268d722e3fbSopenharmony_ci	r = amdgpu_bo_cpu_map(enc->bs.handle, (void **)&enc->bs.ptr);
269d722e3fbSopenharmony_ci	CU_ASSERT_EQUAL(r, 0);
270d722e3fbSopenharmony_ci	for (j = 0, sum = 0; j < size; ++j)
271d722e3fbSopenharmony_ci		sum += enc->bs.ptr[j];
272d722e3fbSopenharmony_ci	CU_ASSERT_EQUAL(sum, s);
273d722e3fbSopenharmony_ci	r = amdgpu_bo_cpu_unmap(enc->bs.handle);
274d722e3fbSopenharmony_ci	CU_ASSERT_EQUAL(r, 0);
275d722e3fbSopenharmony_ci
276d722e3fbSopenharmony_ci}
277d722e3fbSopenharmony_ci
278d722e3fbSopenharmony_cistatic void amdgpu_cs_uvd_enc_session_init(void)
279d722e3fbSopenharmony_ci{
280d722e3fbSopenharmony_ci	int len, r;
281d722e3fbSopenharmony_ci
282d722e3fbSopenharmony_ci	len = 0;
283d722e3fbSopenharmony_ci	memcpy((ib_cpu + len), uve_session_info, sizeof(uve_session_info));
284d722e3fbSopenharmony_ci	len += sizeof(uve_session_info) / 4;
285d722e3fbSopenharmony_ci	ib_cpu[len++] = enc.session.addr >> 32;
286d722e3fbSopenharmony_ci	ib_cpu[len++] = enc.session.addr;
287d722e3fbSopenharmony_ci
288d722e3fbSopenharmony_ci	memcpy((ib_cpu + len), uve_task_info, sizeof(uve_task_info));
289d722e3fbSopenharmony_ci	len += sizeof(uve_task_info) / 4;
290d722e3fbSopenharmony_ci	ib_cpu[len++] = 0x000000d8;
291d722e3fbSopenharmony_ci	ib_cpu[len++] = 0x00000000;
292d722e3fbSopenharmony_ci	ib_cpu[len++] = 0x00000000;
293d722e3fbSopenharmony_ci
294d722e3fbSopenharmony_ci	memcpy((ib_cpu + len), uve_op_init, sizeof(uve_op_init));
295d722e3fbSopenharmony_ci	len += sizeof(uve_op_init) / 4;
296d722e3fbSopenharmony_ci
297d722e3fbSopenharmony_ci	memcpy((ib_cpu + len), uve_session_init, sizeof(uve_session_init));
298d722e3fbSopenharmony_ci	len += sizeof(uve_session_init) / 4;
299d722e3fbSopenharmony_ci
300d722e3fbSopenharmony_ci	memcpy((ib_cpu + len), uve_layer_ctrl, sizeof(uve_layer_ctrl));
301d722e3fbSopenharmony_ci	len += sizeof(uve_layer_ctrl) / 4;
302d722e3fbSopenharmony_ci
303d722e3fbSopenharmony_ci	memcpy((ib_cpu + len), uve_slice_ctrl, sizeof(uve_slice_ctrl));
304d722e3fbSopenharmony_ci	len += sizeof(uve_slice_ctrl) / 4;
305d722e3fbSopenharmony_ci
306d722e3fbSopenharmony_ci	memcpy((ib_cpu + len), uve_spec_misc, sizeof(uve_spec_misc));
307d722e3fbSopenharmony_ci	len += sizeof(uve_spec_misc) / 4;
308d722e3fbSopenharmony_ci
309d722e3fbSopenharmony_ci	memcpy((ib_cpu + len), uve_rc_session_init, sizeof(uve_rc_session_init));
310d722e3fbSopenharmony_ci	len += sizeof(uve_rc_session_init) / 4;
311d722e3fbSopenharmony_ci
312d722e3fbSopenharmony_ci	memcpy((ib_cpu + len), uve_deblocking_filter, sizeof(uve_deblocking_filter));
313d722e3fbSopenharmony_ci	len += sizeof(uve_deblocking_filter) / 4;
314d722e3fbSopenharmony_ci
315d722e3fbSopenharmony_ci	memcpy((ib_cpu + len), uve_quality_params, sizeof(uve_quality_params));
316d722e3fbSopenharmony_ci	len += sizeof(uve_quality_params) / 4;
317d722e3fbSopenharmony_ci
318d722e3fbSopenharmony_ci	memcpy((ib_cpu + len), uve_op_init_rc, sizeof(uve_op_init_rc));
319d722e3fbSopenharmony_ci	len += sizeof(uve_op_init_rc) / 4;
320d722e3fbSopenharmony_ci
321d722e3fbSopenharmony_ci	memcpy((ib_cpu + len), uve_op_init_rc_vbv_level, sizeof(uve_op_init_rc_vbv_level));
322d722e3fbSopenharmony_ci	len += sizeof(uve_op_init_rc_vbv_level) / 4;
323d722e3fbSopenharmony_ci
324d722e3fbSopenharmony_ci	r = submit(len, AMDGPU_HW_IP_UVD_ENC);
325d722e3fbSopenharmony_ci	CU_ASSERT_EQUAL(r, 0);
326d722e3fbSopenharmony_ci}
327d722e3fbSopenharmony_ci
328d722e3fbSopenharmony_cistatic void amdgpu_cs_uvd_enc_encode(void)
329d722e3fbSopenharmony_ci{
330d722e3fbSopenharmony_ci	int len, r, i;
331d722e3fbSopenharmony_ci	uint64_t luma_offset, chroma_offset;
332d722e3fbSopenharmony_ci	uint32_t vbuf_size, bs_size = 0x003f4800, cpb_size;
333d722e3fbSopenharmony_ci	unsigned align = (family_id >= AMDGPU_FAMILY_AI) ? 256 : 16;
334d722e3fbSopenharmony_ci	vbuf_size = ALIGN(enc.width, align) * ALIGN(enc.height, 16) * 1.5;
335d722e3fbSopenharmony_ci	cpb_size = vbuf_size * 10;
336d722e3fbSopenharmony_ci
337d722e3fbSopenharmony_ci
338d722e3fbSopenharmony_ci	num_resources  = 0;
339d722e3fbSopenharmony_ci	alloc_resource(&enc.fb, 4096, AMDGPU_GEM_DOMAIN_VRAM);
340d722e3fbSopenharmony_ci	resources[num_resources++] = enc.fb.handle;
341d722e3fbSopenharmony_ci	alloc_resource(&enc.bs, bs_size, AMDGPU_GEM_DOMAIN_VRAM);
342d722e3fbSopenharmony_ci	resources[num_resources++] = enc.bs.handle;
343d722e3fbSopenharmony_ci	alloc_resource(&enc.vbuf, vbuf_size, AMDGPU_GEM_DOMAIN_VRAM);
344d722e3fbSopenharmony_ci	resources[num_resources++] = enc.vbuf.handle;
345d722e3fbSopenharmony_ci	alloc_resource(&enc.cpb, cpb_size, AMDGPU_GEM_DOMAIN_VRAM);
346d722e3fbSopenharmony_ci	resources[num_resources++] = enc.cpb.handle;
347d722e3fbSopenharmony_ci	resources[num_resources++] = ib_handle;
348d722e3fbSopenharmony_ci
349d722e3fbSopenharmony_ci	r = amdgpu_bo_cpu_map(enc.vbuf.handle, (void **)&enc.vbuf.ptr);
350d722e3fbSopenharmony_ci	CU_ASSERT_EQUAL(r, 0);
351d722e3fbSopenharmony_ci
352d722e3fbSopenharmony_ci	memset(enc.vbuf.ptr, 0, vbuf_size);
353d722e3fbSopenharmony_ci	for (i = 0; i < enc.height; ++i) {
354d722e3fbSopenharmony_ci		memcpy(enc.vbuf.ptr, (frame + i * enc.width), enc.width);
355d722e3fbSopenharmony_ci		enc.vbuf.ptr += ALIGN(enc.width, align);
356d722e3fbSopenharmony_ci	}
357d722e3fbSopenharmony_ci	for (i = 0; i < enc.height / 2; ++i) {
358d722e3fbSopenharmony_ci		memcpy(enc.vbuf.ptr, ((frame + enc.height * enc.width) + i * enc.width), enc.width);
359d722e3fbSopenharmony_ci		enc.vbuf.ptr += ALIGN(enc.width, align);
360d722e3fbSopenharmony_ci	}
361d722e3fbSopenharmony_ci
362d722e3fbSopenharmony_ci	r = amdgpu_bo_cpu_unmap(enc.vbuf.handle);
363d722e3fbSopenharmony_ci	CU_ASSERT_EQUAL(r, 0);
364d722e3fbSopenharmony_ci
365d722e3fbSopenharmony_ci	len = 0;
366d722e3fbSopenharmony_ci	memcpy((ib_cpu + len), uve_session_info, sizeof(uve_session_info));
367d722e3fbSopenharmony_ci	len += sizeof(uve_session_info) / 4;
368d722e3fbSopenharmony_ci	ib_cpu[len++] = enc.session.addr >> 32;
369d722e3fbSopenharmony_ci	ib_cpu[len++] = enc.session.addr;
370d722e3fbSopenharmony_ci
371d722e3fbSopenharmony_ci	memcpy((ib_cpu + len), uve_task_info, sizeof(uve_task_info));
372d722e3fbSopenharmony_ci	len += sizeof(uve_task_info) / 4;
373d722e3fbSopenharmony_ci	ib_cpu[len++] = 0x000005e0;
374d722e3fbSopenharmony_ci	ib_cpu[len++] = 0x00000001;
375d722e3fbSopenharmony_ci	ib_cpu[len++] = 0x00000001;
376d722e3fbSopenharmony_ci
377d722e3fbSopenharmony_ci	memcpy((ib_cpu + len), uve_nalu_buffer_1, sizeof(uve_nalu_buffer_1));
378d722e3fbSopenharmony_ci	len += sizeof(uve_nalu_buffer_1) / 4;
379d722e3fbSopenharmony_ci
380d722e3fbSopenharmony_ci	memcpy((ib_cpu + len), uve_nalu_buffer_2, sizeof(uve_nalu_buffer_2));
381d722e3fbSopenharmony_ci	len += sizeof(uve_nalu_buffer_2) / 4;
382d722e3fbSopenharmony_ci
383d722e3fbSopenharmony_ci	memcpy((ib_cpu + len), uve_nalu_buffer_3, sizeof(uve_nalu_buffer_3));
384d722e3fbSopenharmony_ci	len += sizeof(uve_nalu_buffer_3) / 4;
385d722e3fbSopenharmony_ci
386d722e3fbSopenharmony_ci	memcpy((ib_cpu + len), uve_nalu_buffer_4, sizeof(uve_nalu_buffer_4));
387d722e3fbSopenharmony_ci	len += sizeof(uve_nalu_buffer_4) / 4;
388d722e3fbSopenharmony_ci
389d722e3fbSopenharmony_ci	memcpy((ib_cpu + len), uve_slice_header, sizeof(uve_slice_header));
390d722e3fbSopenharmony_ci	len += sizeof(uve_slice_header) / 4;
391d722e3fbSopenharmony_ci
392d722e3fbSopenharmony_ci	ib_cpu[len++] = 0x00000254;
393d722e3fbSopenharmony_ci	ib_cpu[len++] = 0x00000010;
394d722e3fbSopenharmony_ci	ib_cpu[len++] = enc.cpb.addr >> 32;
395d722e3fbSopenharmony_ci	ib_cpu[len++] = enc.cpb.addr;
396d722e3fbSopenharmony_ci	memcpy((ib_cpu + len), uve_ctx_buffer, sizeof(uve_ctx_buffer));
397d722e3fbSopenharmony_ci	len += sizeof(uve_ctx_buffer) / 4;
398d722e3fbSopenharmony_ci
399d722e3fbSopenharmony_ci	memcpy((ib_cpu + len), uve_bitstream_buffer, sizeof(uve_bitstream_buffer));
400d722e3fbSopenharmony_ci	len += sizeof(uve_bitstream_buffer) / 4;
401d722e3fbSopenharmony_ci	ib_cpu[len++] = 0x00000000;
402d722e3fbSopenharmony_ci	ib_cpu[len++] = enc.bs.addr >> 32;
403d722e3fbSopenharmony_ci	ib_cpu[len++] = enc.bs.addr;
404d722e3fbSopenharmony_ci	ib_cpu[len++] = 0x003f4800;
405d722e3fbSopenharmony_ci	ib_cpu[len++] = 0x00000000;
406d722e3fbSopenharmony_ci
407d722e3fbSopenharmony_ci	memcpy((ib_cpu + len), uve_feedback_buffer, sizeof(uve_feedback_buffer));
408d722e3fbSopenharmony_ci	len += sizeof(uve_feedback_buffer) / 4;
409d722e3fbSopenharmony_ci	ib_cpu[len++] = enc.fb.addr >> 32;
410d722e3fbSopenharmony_ci	ib_cpu[len++] = enc.fb.addr;
411d722e3fbSopenharmony_ci	ib_cpu[len++] = 0x00000010;
412d722e3fbSopenharmony_ci	ib_cpu[len++] = 0x00000028;
413d722e3fbSopenharmony_ci
414d722e3fbSopenharmony_ci	memcpy((ib_cpu + len), uve_feedback_buffer_additional, sizeof(uve_feedback_buffer_additional));
415d722e3fbSopenharmony_ci	len += sizeof(uve_feedback_buffer_additional) / 4;
416d722e3fbSopenharmony_ci
417d722e3fbSopenharmony_ci	memcpy((ib_cpu + len), uve_intra_refresh, sizeof(uve_intra_refresh));
418d722e3fbSopenharmony_ci	len += sizeof(uve_intra_refresh) / 4;
419d722e3fbSopenharmony_ci
420d722e3fbSopenharmony_ci	memcpy((ib_cpu + len), uve_layer_select, sizeof(uve_layer_select));
421d722e3fbSopenharmony_ci	len += sizeof(uve_layer_select) / 4;
422d722e3fbSopenharmony_ci
423d722e3fbSopenharmony_ci	memcpy((ib_cpu + len), uve_rc_layer_init, sizeof(uve_rc_layer_init));
424d722e3fbSopenharmony_ci	len += sizeof(uve_rc_layer_init) / 4;
425d722e3fbSopenharmony_ci
426d722e3fbSopenharmony_ci	memcpy((ib_cpu + len), uve_layer_select, sizeof(uve_layer_select));
427d722e3fbSopenharmony_ci	len += sizeof(uve_layer_select) / 4;
428d722e3fbSopenharmony_ci
429d722e3fbSopenharmony_ci	memcpy((ib_cpu + len), uve_rc_per_pic, sizeof(uve_rc_per_pic));
430d722e3fbSopenharmony_ci	len += sizeof(uve_rc_per_pic) / 4;
431d722e3fbSopenharmony_ci
432d722e3fbSopenharmony_ci	unsigned luma_size = ALIGN(enc.width, align) * ALIGN(enc.height, 16);
433d722e3fbSopenharmony_ci	luma_offset = enc.vbuf.addr;
434d722e3fbSopenharmony_ci	chroma_offset = luma_offset + luma_size;
435d722e3fbSopenharmony_ci	ib_cpu[len++] = 0x00000054;
436d722e3fbSopenharmony_ci	ib_cpu[len++] = 0x0000000c;
437d722e3fbSopenharmony_ci	ib_cpu[len++] = 0x00000002;
438d722e3fbSopenharmony_ci	ib_cpu[len++] = 0x003f4800;
439d722e3fbSopenharmony_ci	ib_cpu[len++] = luma_offset >> 32;
440d722e3fbSopenharmony_ci	ib_cpu[len++] = luma_offset;
441d722e3fbSopenharmony_ci	ib_cpu[len++] = chroma_offset >> 32;
442d722e3fbSopenharmony_ci	ib_cpu[len++] = chroma_offset;
443d722e3fbSopenharmony_ci	memcpy((ib_cpu + len), uve_encode_param, sizeof(uve_encode_param));
444d722e3fbSopenharmony_ci	ib_cpu[len] = ALIGN(enc.width, align);
445d722e3fbSopenharmony_ci	ib_cpu[len + 1] = ALIGN(enc.width, align);
446d722e3fbSopenharmony_ci	len += sizeof(uve_encode_param) / 4;
447d722e3fbSopenharmony_ci
448d722e3fbSopenharmony_ci	memcpy((ib_cpu + len), uve_op_speed_enc_mode, sizeof(uve_op_speed_enc_mode));
449d722e3fbSopenharmony_ci	len += sizeof(uve_op_speed_enc_mode) / 4;
450d722e3fbSopenharmony_ci
451d722e3fbSopenharmony_ci	memcpy((ib_cpu + len), uve_op_encode, sizeof(uve_op_encode));
452d722e3fbSopenharmony_ci	len += sizeof(uve_op_encode) / 4;
453d722e3fbSopenharmony_ci
454d722e3fbSopenharmony_ci	r = submit(len, AMDGPU_HW_IP_UVD_ENC);
455d722e3fbSopenharmony_ci	CU_ASSERT_EQUAL(r, 0);
456d722e3fbSopenharmony_ci
457d722e3fbSopenharmony_ci	check_result(&enc);
458d722e3fbSopenharmony_ci
459d722e3fbSopenharmony_ci	free_resource(&enc.fb);
460d722e3fbSopenharmony_ci	free_resource(&enc.bs);
461d722e3fbSopenharmony_ci	free_resource(&enc.vbuf);
462d722e3fbSopenharmony_ci	free_resource(&enc.cpb);
463d722e3fbSopenharmony_ci}
464d722e3fbSopenharmony_ci
465d722e3fbSopenharmony_cistatic void amdgpu_cs_uvd_enc_destroy(void)
466d722e3fbSopenharmony_ci{
467d722e3fbSopenharmony_ci	int len, r;
468d722e3fbSopenharmony_ci
469d722e3fbSopenharmony_ci	num_resources  = 0;
470d722e3fbSopenharmony_ci	resources[num_resources++] = ib_handle;
471d722e3fbSopenharmony_ci
472d722e3fbSopenharmony_ci	len = 0;
473d722e3fbSopenharmony_ci	memcpy((ib_cpu + len), uve_session_info, sizeof(uve_session_info));
474d722e3fbSopenharmony_ci	len += sizeof(uve_session_info) / 4;
475d722e3fbSopenharmony_ci	ib_cpu[len++] = enc.session.addr >> 32;
476d722e3fbSopenharmony_ci	ib_cpu[len++] = enc.session.addr;
477d722e3fbSopenharmony_ci
478d722e3fbSopenharmony_ci	memcpy((ib_cpu + len), uve_task_info, sizeof(uve_task_info));
479d722e3fbSopenharmony_ci	len += sizeof(uve_task_info) / 4;
480d722e3fbSopenharmony_ci	ib_cpu[len++] = 0xffffffff;
481d722e3fbSopenharmony_ci	ib_cpu[len++] = 0x00000002;
482d722e3fbSopenharmony_ci	ib_cpu[len++] = 0x00000000;
483d722e3fbSopenharmony_ci
484d722e3fbSopenharmony_ci	memcpy((ib_cpu + len), uve_op_close, sizeof(uve_op_close));
485d722e3fbSopenharmony_ci	len += sizeof(uve_op_close) / 4;
486d722e3fbSopenharmony_ci
487d722e3fbSopenharmony_ci	r = submit(len, AMDGPU_HW_IP_UVD_ENC);
488d722e3fbSopenharmony_ci	CU_ASSERT_EQUAL(r, 0);
489d722e3fbSopenharmony_ci
490d722e3fbSopenharmony_ci	free_resource(&enc.session);
491d722e3fbSopenharmony_ci}
492