1d722e3fbSopenharmony_ci/*
2d722e3fbSopenharmony_ci * Copyright 2014 Advanced Micro Devices, Inc.
3d722e3fbSopenharmony_ci *
4d722e3fbSopenharmony_ci * Permission is hereby granted, free of charge, to any person obtaining a
5d722e3fbSopenharmony_ci * copy of this software and associated documentation files (the "Software"),
6d722e3fbSopenharmony_ci * to deal in the Software without restriction, including without limitation
7d722e3fbSopenharmony_ci * the rights to use, copy, modify, merge, publish, distribute, sublicense,
8d722e3fbSopenharmony_ci * and/or sell copies of the Software, and to permit persons to whom the
9d722e3fbSopenharmony_ci * Software is furnished to do so, subject to the following conditions:
10d722e3fbSopenharmony_ci *
11d722e3fbSopenharmony_ci * The above copyright notice and this permission notice shall be included in
12d722e3fbSopenharmony_ci * all copies or substantial portions of the Software.
13d722e3fbSopenharmony_ci *
14d722e3fbSopenharmony_ci * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
15d722e3fbSopenharmony_ci * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
16d722e3fbSopenharmony_ci * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT.  IN NO EVENT SHALL
17d722e3fbSopenharmony_ci * THE COPYRIGHT HOLDER(S) OR AUTHOR(S) BE LIABLE FOR ANY CLAIM, DAMAGES OR
18d722e3fbSopenharmony_ci * OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE,
19d722e3fbSopenharmony_ci * ARISING FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR
20d722e3fbSopenharmony_ci * OTHER DEALINGS IN THE SOFTWARE.
21d722e3fbSopenharmony_ci *
22d722e3fbSopenharmony_ci*/
23d722e3fbSopenharmony_ci
24d722e3fbSopenharmony_ci#include <stdio.h>
25d722e3fbSopenharmony_ci#include <stdlib.h>
26d722e3fbSopenharmony_ci#include <unistd.h>
27d722e3fbSopenharmony_ci#include <sys/types.h>
28d722e3fbSopenharmony_ci#ifdef MAJOR_IN_SYSMACROS
29d722e3fbSopenharmony_ci#include <sys/sysmacros.h>
30d722e3fbSopenharmony_ci#endif
31d722e3fbSopenharmony_ci#include <sys/stat.h>
32d722e3fbSopenharmony_ci#include <fcntl.h>
33d722e3fbSopenharmony_ci#if HAVE_ALLOCA_H
34d722e3fbSopenharmony_ci# include <alloca.h>
35d722e3fbSopenharmony_ci#endif
36d722e3fbSopenharmony_ci#include <sys/wait.h>
37d722e3fbSopenharmony_ci
38d722e3fbSopenharmony_ci#include "CUnit/Basic.h"
39d722e3fbSopenharmony_ci
40d722e3fbSopenharmony_ci#include "amdgpu_test.h"
41d722e3fbSopenharmony_ci#include "amdgpu_drm.h"
42d722e3fbSopenharmony_ci#include "amdgpu_internal.h"
43d722e3fbSopenharmony_ci#include "util_math.h"
44d722e3fbSopenharmony_ci
45d722e3fbSopenharmony_cistatic  amdgpu_device_handle device_handle;
46d722e3fbSopenharmony_cistatic  uint32_t  major_version;
47d722e3fbSopenharmony_cistatic  uint32_t  minor_version;
48d722e3fbSopenharmony_cistatic  uint32_t  family_id;
49d722e3fbSopenharmony_cistatic  uint32_t  chip_id;
50d722e3fbSopenharmony_cistatic  uint32_t  chip_rev;
51d722e3fbSopenharmony_ci
52d722e3fbSopenharmony_cistatic void amdgpu_query_info_test(void);
53d722e3fbSopenharmony_cistatic void amdgpu_command_submission_gfx(void);
54d722e3fbSopenharmony_cistatic void amdgpu_command_submission_compute(void);
55d722e3fbSopenharmony_cistatic void amdgpu_command_submission_multi_fence(void);
56d722e3fbSopenharmony_cistatic void amdgpu_command_submission_sdma(void);
57d722e3fbSopenharmony_cistatic void amdgpu_userptr_test(void);
58d722e3fbSopenharmony_cistatic void amdgpu_semaphore_test(void);
59d722e3fbSopenharmony_cistatic void amdgpu_sync_dependency_test(void);
60d722e3fbSopenharmony_cistatic void amdgpu_bo_eviction_test(void);
61d722e3fbSopenharmony_cistatic void amdgpu_compute_dispatch_test(void);
62d722e3fbSopenharmony_cistatic void amdgpu_gfx_dispatch_test(void);
63d722e3fbSopenharmony_cistatic void amdgpu_draw_test(void);
64d722e3fbSopenharmony_cistatic void amdgpu_gpu_reset_test(void);
65d722e3fbSopenharmony_cistatic void amdgpu_stable_pstate_test(void);
66d722e3fbSopenharmony_ci
67d722e3fbSopenharmony_cistatic void amdgpu_command_submission_write_linear_helper(unsigned ip_type);
68d722e3fbSopenharmony_cistatic void amdgpu_command_submission_const_fill_helper(unsigned ip_type);
69d722e3fbSopenharmony_cistatic void amdgpu_command_submission_copy_linear_helper(unsigned ip_type);
70d722e3fbSopenharmony_cistatic void amdgpu_test_exec_cs_helper(amdgpu_context_handle context_handle,
71d722e3fbSopenharmony_ci				       unsigned ip_type,
72d722e3fbSopenharmony_ci				       int instance, int pm4_dw, uint32_t *pm4_src,
73d722e3fbSopenharmony_ci				       int res_cnt, amdgpu_bo_handle *resources,
74d722e3fbSopenharmony_ci				       struct amdgpu_cs_ib_info *ib_info,
75d722e3fbSopenharmony_ci				       struct amdgpu_cs_request *ibs_request);
76d722e3fbSopenharmony_ci
77d722e3fbSopenharmony_ciCU_TestInfo basic_tests[] = {
78d722e3fbSopenharmony_ci	{ "Query Info Test",  amdgpu_query_info_test },
79d722e3fbSopenharmony_ci	{ "Userptr Test",  amdgpu_userptr_test },
80d722e3fbSopenharmony_ci	{ "bo eviction Test",  amdgpu_bo_eviction_test },
81d722e3fbSopenharmony_ci	{ "Command submission Test (GFX)",  amdgpu_command_submission_gfx },
82d722e3fbSopenharmony_ci	{ "Command submission Test (Compute)", amdgpu_command_submission_compute },
83d722e3fbSopenharmony_ci	{ "Command submission Test (Multi-Fence)", amdgpu_command_submission_multi_fence },
84d722e3fbSopenharmony_ci	{ "Command submission Test (SDMA)", amdgpu_command_submission_sdma },
85d722e3fbSopenharmony_ci	{ "SW semaphore Test",  amdgpu_semaphore_test },
86d722e3fbSopenharmony_ci	{ "Sync dependency Test",  amdgpu_sync_dependency_test },
87d722e3fbSopenharmony_ci	{ "Dispatch Test (Compute)",  amdgpu_compute_dispatch_test },
88d722e3fbSopenharmony_ci	{ "Dispatch Test (GFX)",  amdgpu_gfx_dispatch_test },
89d722e3fbSopenharmony_ci	{ "Draw Test",  amdgpu_draw_test },
90d722e3fbSopenharmony_ci	{ "GPU reset Test", amdgpu_gpu_reset_test },
91d722e3fbSopenharmony_ci	{ "Stable pstate Test", amdgpu_stable_pstate_test },
92d722e3fbSopenharmony_ci	CU_TEST_INFO_NULL,
93d722e3fbSopenharmony_ci};
94d722e3fbSopenharmony_ci#define BUFFER_SIZE (MAX2(8 * 1024, getpagesize()))
95d722e3fbSopenharmony_ci#define SDMA_PKT_HEADER_op_offset 0
96d722e3fbSopenharmony_ci#define SDMA_PKT_HEADER_op_mask   0x000000FF
97d722e3fbSopenharmony_ci#define SDMA_PKT_HEADER_op_shift  0
98d722e3fbSopenharmony_ci#define SDMA_PKT_HEADER_OP(x) (((x) & SDMA_PKT_HEADER_op_mask) << SDMA_PKT_HEADER_op_shift)
99d722e3fbSopenharmony_ci#define SDMA_OPCODE_CONSTANT_FILL  11
100d722e3fbSopenharmony_ci#       define SDMA_CONSTANT_FILL_EXTRA_SIZE(x)           ((x) << 14)
101d722e3fbSopenharmony_ci	/* 0 = byte fill
102d722e3fbSopenharmony_ci	 * 2 = DW fill
103d722e3fbSopenharmony_ci	 */
104d722e3fbSopenharmony_ci#define SDMA_PACKET(op, sub_op, e)	((((e) & 0xFFFF) << 16) |	\
105d722e3fbSopenharmony_ci					(((sub_op) & 0xFF) << 8) |	\
106d722e3fbSopenharmony_ci					(((op) & 0xFF) << 0))
107d722e3fbSopenharmony_ci#define	SDMA_OPCODE_WRITE				  2
108d722e3fbSopenharmony_ci#       define SDMA_WRITE_SUB_OPCODE_LINEAR               0
109d722e3fbSopenharmony_ci#       define SDMA_WRTIE_SUB_OPCODE_TILED                1
110d722e3fbSopenharmony_ci
111d722e3fbSopenharmony_ci#define	SDMA_OPCODE_COPY				  1
112d722e3fbSopenharmony_ci#       define SDMA_COPY_SUB_OPCODE_LINEAR                0
113d722e3fbSopenharmony_ci
114d722e3fbSopenharmony_ci#define	SDMA_OPCODE_ATOMIC				  10
115d722e3fbSopenharmony_ci#		define SDMA_ATOMIC_LOOP(x)               ((x) << 0)
116d722e3fbSopenharmony_ci        /* 0 - single_pass_atomic.
117d722e3fbSopenharmony_ci         * 1 - loop_until_compare_satisfied.
118d722e3fbSopenharmony_ci         */
119d722e3fbSopenharmony_ci#		define SDMA_ATOMIC_TMZ(x)                ((x) << 2)
120d722e3fbSopenharmony_ci		/* 0 - non-TMZ.
121d722e3fbSopenharmony_ci		 * 1 - TMZ.
122d722e3fbSopenharmony_ci	     */
123d722e3fbSopenharmony_ci#		define SDMA_ATOMIC_OPCODE(x)             ((x) << 9)
124d722e3fbSopenharmony_ci		/* TC_OP_ATOMIC_CMPSWAP_RTN_32 0x00000008
125d722e3fbSopenharmony_ci		 * same as Packet 3
126d722e3fbSopenharmony_ci		 */
127d722e3fbSopenharmony_ci
128d722e3fbSopenharmony_ci#define GFX_COMPUTE_NOP  0xffff1000
129d722e3fbSopenharmony_ci#define SDMA_NOP  0x0
130d722e3fbSopenharmony_ci
131d722e3fbSopenharmony_ci/* PM4 */
132d722e3fbSopenharmony_ci#define	PACKET_TYPE0	0
133d722e3fbSopenharmony_ci#define	PACKET_TYPE1	1
134d722e3fbSopenharmony_ci#define	PACKET_TYPE2	2
135d722e3fbSopenharmony_ci#define	PACKET_TYPE3	3
136d722e3fbSopenharmony_ci
137d722e3fbSopenharmony_ci#define CP_PACKET_GET_TYPE(h) (((h) >> 30) & 3)
138d722e3fbSopenharmony_ci#define CP_PACKET_GET_COUNT(h) (((h) >> 16) & 0x3FFF)
139d722e3fbSopenharmony_ci#define CP_PACKET0_GET_REG(h) ((h) & 0xFFFF)
140d722e3fbSopenharmony_ci#define CP_PACKET3_GET_OPCODE(h) (((h) >> 8) & 0xFF)
141d722e3fbSopenharmony_ci#define PACKET0(reg, n)	((PACKET_TYPE0 << 30) |				\
142d722e3fbSopenharmony_ci			 ((reg) & 0xFFFF) |			\
143d722e3fbSopenharmony_ci			 ((n) & 0x3FFF) << 16)
144d722e3fbSopenharmony_ci#define CP_PACKET2			0x80000000
145d722e3fbSopenharmony_ci#define		PACKET2_PAD_SHIFT		0
146d722e3fbSopenharmony_ci#define		PACKET2_PAD_MASK		(0x3fffffff << 0)
147d722e3fbSopenharmony_ci
148d722e3fbSopenharmony_ci#define PACKET2(v)	(CP_PACKET2 | REG_SET(PACKET2_PAD, (v)))
149d722e3fbSopenharmony_ci
150d722e3fbSopenharmony_ci#define PACKET3(op, n)	((PACKET_TYPE3 << 30) |				\
151d722e3fbSopenharmony_ci			 (((op) & 0xFF) << 8) |				\
152d722e3fbSopenharmony_ci			 ((n) & 0x3FFF) << 16)
153d722e3fbSopenharmony_ci#define PACKET3_COMPUTE(op, n) PACKET3(op, n) | (1 << 1)
154d722e3fbSopenharmony_ci
155d722e3fbSopenharmony_ci/* Packet 3 types */
156d722e3fbSopenharmony_ci#define	PACKET3_NOP					0x10
157d722e3fbSopenharmony_ci
158d722e3fbSopenharmony_ci#define	PACKET3_WRITE_DATA				0x37
159d722e3fbSopenharmony_ci#define		WRITE_DATA_DST_SEL(x)                   ((x) << 8)
160d722e3fbSopenharmony_ci		/* 0 - register
161d722e3fbSopenharmony_ci		 * 1 - memory (sync - via GRBM)
162d722e3fbSopenharmony_ci		 * 2 - gl2
163d722e3fbSopenharmony_ci		 * 3 - gds
164d722e3fbSopenharmony_ci		 * 4 - reserved
165d722e3fbSopenharmony_ci		 * 5 - memory (async - direct)
166d722e3fbSopenharmony_ci		 */
167d722e3fbSopenharmony_ci#define		WR_ONE_ADDR                             (1 << 16)
168d722e3fbSopenharmony_ci#define		WR_CONFIRM                              (1 << 20)
169d722e3fbSopenharmony_ci#define		WRITE_DATA_CACHE_POLICY(x)              ((x) << 25)
170d722e3fbSopenharmony_ci		/* 0 - LRU
171d722e3fbSopenharmony_ci		 * 1 - Stream
172d722e3fbSopenharmony_ci		 */
173d722e3fbSopenharmony_ci#define		WRITE_DATA_ENGINE_SEL(x)                ((x) << 30)
174d722e3fbSopenharmony_ci		/* 0 - me
175d722e3fbSopenharmony_ci		 * 1 - pfp
176d722e3fbSopenharmony_ci		 * 2 - ce
177d722e3fbSopenharmony_ci		 */
178d722e3fbSopenharmony_ci
179d722e3fbSopenharmony_ci#define	PACKET3_ATOMIC_MEM				0x1E
180d722e3fbSopenharmony_ci#define     TC_OP_ATOMIC_CMPSWAP_RTN_32          0x00000008
181d722e3fbSopenharmony_ci#define     ATOMIC_MEM_COMMAND(x)               ((x) << 8)
182d722e3fbSopenharmony_ci            /* 0 - single_pass_atomic.
183d722e3fbSopenharmony_ci             * 1 - loop_until_compare_satisfied.
184d722e3fbSopenharmony_ci             */
185d722e3fbSopenharmony_ci#define     ATOMIC_MEM_CACHEPOLICAY(x)          ((x) << 25)
186d722e3fbSopenharmony_ci            /* 0 - lru.
187d722e3fbSopenharmony_ci             * 1 - stream.
188d722e3fbSopenharmony_ci             */
189d722e3fbSopenharmony_ci#define     ATOMIC_MEM_ENGINESEL(x)             ((x) << 30)
190d722e3fbSopenharmony_ci            /* 0 - micro_engine.
191d722e3fbSopenharmony_ci			 */
192d722e3fbSopenharmony_ci
193d722e3fbSopenharmony_ci#define	PACKET3_DMA_DATA				0x50
194d722e3fbSopenharmony_ci/* 1. header
195d722e3fbSopenharmony_ci * 2. CONTROL
196d722e3fbSopenharmony_ci * 3. SRC_ADDR_LO or DATA [31:0]
197d722e3fbSopenharmony_ci * 4. SRC_ADDR_HI [31:0]
198d722e3fbSopenharmony_ci * 5. DST_ADDR_LO [31:0]
199d722e3fbSopenharmony_ci * 6. DST_ADDR_HI [7:0]
200d722e3fbSopenharmony_ci * 7. COMMAND [30:21] | BYTE_COUNT [20:0]
201d722e3fbSopenharmony_ci */
202d722e3fbSopenharmony_ci/* CONTROL */
203d722e3fbSopenharmony_ci#              define PACKET3_DMA_DATA_ENGINE(x)     ((x) << 0)
204d722e3fbSopenharmony_ci		/* 0 - ME
205d722e3fbSopenharmony_ci		 * 1 - PFP
206d722e3fbSopenharmony_ci		 */
207d722e3fbSopenharmony_ci#              define PACKET3_DMA_DATA_SRC_CACHE_POLICY(x) ((x) << 13)
208d722e3fbSopenharmony_ci		/* 0 - LRU
209d722e3fbSopenharmony_ci		 * 1 - Stream
210d722e3fbSopenharmony_ci		 * 2 - Bypass
211d722e3fbSopenharmony_ci		 */
212d722e3fbSopenharmony_ci#              define PACKET3_DMA_DATA_SRC_VOLATILE (1 << 15)
213d722e3fbSopenharmony_ci#              define PACKET3_DMA_DATA_DST_SEL(x)  ((x) << 20)
214d722e3fbSopenharmony_ci		/* 0 - DST_ADDR using DAS
215d722e3fbSopenharmony_ci		 * 1 - GDS
216d722e3fbSopenharmony_ci		 * 3 - DST_ADDR using L2
217d722e3fbSopenharmony_ci		 */
218d722e3fbSopenharmony_ci#              define PACKET3_DMA_DATA_DST_CACHE_POLICY(x) ((x) << 25)
219d722e3fbSopenharmony_ci		/* 0 - LRU
220d722e3fbSopenharmony_ci		 * 1 - Stream
221d722e3fbSopenharmony_ci		 * 2 - Bypass
222d722e3fbSopenharmony_ci		 */
223d722e3fbSopenharmony_ci#              define PACKET3_DMA_DATA_DST_VOLATILE (1 << 27)
224d722e3fbSopenharmony_ci#              define PACKET3_DMA_DATA_SRC_SEL(x)  ((x) << 29)
225d722e3fbSopenharmony_ci		/* 0 - SRC_ADDR using SAS
226d722e3fbSopenharmony_ci		 * 1 - GDS
227d722e3fbSopenharmony_ci		 * 2 - DATA
228d722e3fbSopenharmony_ci		 * 3 - SRC_ADDR using L2
229d722e3fbSopenharmony_ci		 */
230d722e3fbSopenharmony_ci#              define PACKET3_DMA_DATA_CP_SYNC     (1 << 31)
231d722e3fbSopenharmony_ci/* COMMAND */
232d722e3fbSopenharmony_ci#              define PACKET3_DMA_DATA_DIS_WC      (1 << 21)
233d722e3fbSopenharmony_ci#              define PACKET3_DMA_DATA_CMD_SRC_SWAP(x) ((x) << 22)
234d722e3fbSopenharmony_ci		/* 0 - none
235d722e3fbSopenharmony_ci		 * 1 - 8 in 16
236d722e3fbSopenharmony_ci		 * 2 - 8 in 32
237d722e3fbSopenharmony_ci		 * 3 - 8 in 64
238d722e3fbSopenharmony_ci		 */
239d722e3fbSopenharmony_ci#              define PACKET3_DMA_DATA_CMD_DST_SWAP(x) ((x) << 24)
240d722e3fbSopenharmony_ci		/* 0 - none
241d722e3fbSopenharmony_ci		 * 1 - 8 in 16
242d722e3fbSopenharmony_ci		 * 2 - 8 in 32
243d722e3fbSopenharmony_ci		 * 3 - 8 in 64
244d722e3fbSopenharmony_ci		 */
245d722e3fbSopenharmony_ci#              define PACKET3_DMA_DATA_CMD_SAS     (1 << 26)
246d722e3fbSopenharmony_ci		/* 0 - memory
247d722e3fbSopenharmony_ci		 * 1 - register
248d722e3fbSopenharmony_ci		 */
249d722e3fbSopenharmony_ci#              define PACKET3_DMA_DATA_CMD_DAS     (1 << 27)
250d722e3fbSopenharmony_ci		/* 0 - memory
251d722e3fbSopenharmony_ci		 * 1 - register
252d722e3fbSopenharmony_ci		 */
253d722e3fbSopenharmony_ci#              define PACKET3_DMA_DATA_CMD_SAIC    (1 << 28)
254d722e3fbSopenharmony_ci#              define PACKET3_DMA_DATA_CMD_DAIC    (1 << 29)
255d722e3fbSopenharmony_ci#              define PACKET3_DMA_DATA_CMD_RAW_WAIT  (1 << 30)
256d722e3fbSopenharmony_ci
257d722e3fbSopenharmony_ci#define SDMA_PACKET_SI(op, b, t, s, cnt)	((((op) & 0xF) << 28) |	\
258d722e3fbSopenharmony_ci						(((b) & 0x1) << 26) |		\
259d722e3fbSopenharmony_ci						(((t) & 0x1) << 23) |		\
260d722e3fbSopenharmony_ci						(((s) & 0x1) << 22) |		\
261d722e3fbSopenharmony_ci						(((cnt) & 0xFFFFF) << 0))
262d722e3fbSopenharmony_ci#define	SDMA_OPCODE_COPY_SI	3
263d722e3fbSopenharmony_ci#define SDMA_OPCODE_CONSTANT_FILL_SI	13
264d722e3fbSopenharmony_ci#define SDMA_NOP_SI  0xf
265d722e3fbSopenharmony_ci#define GFX_COMPUTE_NOP_SI 0x80000000
266d722e3fbSopenharmony_ci#define	PACKET3_DMA_DATA_SI	0x41
267d722e3fbSopenharmony_ci#              define PACKET3_DMA_DATA_SI_ENGINE(x)     ((x) << 27)
268d722e3fbSopenharmony_ci		/* 0 - ME
269d722e3fbSopenharmony_ci		 * 1 - PFP
270d722e3fbSopenharmony_ci		 */
271d722e3fbSopenharmony_ci#              define PACKET3_DMA_DATA_SI_DST_SEL(x)  ((x) << 20)
272d722e3fbSopenharmony_ci		/* 0 - DST_ADDR using DAS
273d722e3fbSopenharmony_ci		 * 1 - GDS
274d722e3fbSopenharmony_ci		 * 3 - DST_ADDR using L2
275d722e3fbSopenharmony_ci		 */
276d722e3fbSopenharmony_ci#              define PACKET3_DMA_DATA_SI_SRC_SEL(x)  ((x) << 29)
277d722e3fbSopenharmony_ci		/* 0 - SRC_ADDR using SAS
278d722e3fbSopenharmony_ci		 * 1 - GDS
279d722e3fbSopenharmony_ci		 * 2 - DATA
280d722e3fbSopenharmony_ci		 * 3 - SRC_ADDR using L2
281d722e3fbSopenharmony_ci		 */
282d722e3fbSopenharmony_ci#              define PACKET3_DMA_DATA_SI_CP_SYNC     (1 << 31)
283d722e3fbSopenharmony_ci
284d722e3fbSopenharmony_ci
285d722e3fbSopenharmony_ci#define PKT3_CONTEXT_CONTROL                   0x28
286d722e3fbSopenharmony_ci#define     CONTEXT_CONTROL_LOAD_ENABLE(x)     (((unsigned)(x) & 0x1) << 31)
287d722e3fbSopenharmony_ci#define     CONTEXT_CONTROL_LOAD_CE_RAM(x)     (((unsigned)(x) & 0x1) << 28)
288d722e3fbSopenharmony_ci#define     CONTEXT_CONTROL_SHADOW_ENABLE(x)   (((unsigned)(x) & 0x1) << 31)
289d722e3fbSopenharmony_ci
290d722e3fbSopenharmony_ci#define PKT3_CLEAR_STATE                       0x12
291d722e3fbSopenharmony_ci
292d722e3fbSopenharmony_ci#define PKT3_SET_SH_REG                        0x76
293d722e3fbSopenharmony_ci#define		PACKET3_SET_SH_REG_START			0x00002c00
294d722e3fbSopenharmony_ci
295d722e3fbSopenharmony_ci#define PKT3_SET_SH_REG_INDEX			0x9B
296d722e3fbSopenharmony_ci
297d722e3fbSopenharmony_ci#define	PACKET3_DISPATCH_DIRECT				0x15
298d722e3fbSopenharmony_ci#define PACKET3_EVENT_WRITE				0x46
299d722e3fbSopenharmony_ci#define PACKET3_ACQUIRE_MEM				0x58
300d722e3fbSopenharmony_ci#define PACKET3_SET_CONTEXT_REG				0x69
301d722e3fbSopenharmony_ci#define PACKET3_SET_UCONFIG_REG				0x79
302d722e3fbSopenharmony_ci#define PACKET3_DRAW_INDEX_AUTO				0x2D
303d722e3fbSopenharmony_ci/* gfx 8 */
304d722e3fbSopenharmony_ci#define mmCOMPUTE_PGM_LO                                                        0x2e0c
305d722e3fbSopenharmony_ci#define mmCOMPUTE_PGM_RSRC1                                                     0x2e12
306d722e3fbSopenharmony_ci#define mmCOMPUTE_TMPRING_SIZE                                                  0x2e18
307d722e3fbSopenharmony_ci#define mmCOMPUTE_USER_DATA_0                                                   0x2e40
308d722e3fbSopenharmony_ci#define mmCOMPUTE_USER_DATA_1                                                   0x2e41
309d722e3fbSopenharmony_ci#define mmCOMPUTE_RESOURCE_LIMITS                                               0x2e15
310d722e3fbSopenharmony_ci#define mmCOMPUTE_NUM_THREAD_X                                                  0x2e07
311d722e3fbSopenharmony_ci
312d722e3fbSopenharmony_ci
313d722e3fbSopenharmony_ci
314d722e3fbSopenharmony_ci#define SWAP_32(num) (((num & 0xff000000) >> 24) | \
315d722e3fbSopenharmony_ci		      ((num & 0x0000ff00) << 8) | \
316d722e3fbSopenharmony_ci		      ((num & 0x00ff0000) >> 8) | \
317d722e3fbSopenharmony_ci		      ((num & 0x000000ff) << 24))
318d722e3fbSopenharmony_ci
319d722e3fbSopenharmony_ci
320d722e3fbSopenharmony_ci/* Shader code
321d722e3fbSopenharmony_ci * void main()
322d722e3fbSopenharmony_ci{
323d722e3fbSopenharmony_ci
324d722e3fbSopenharmony_ci	float x = some_input;
325d722e3fbSopenharmony_ci		for (unsigned i = 0; i < 1000000; i++)
326d722e3fbSopenharmony_ci  	x = sin(x);
327d722e3fbSopenharmony_ci
328d722e3fbSopenharmony_ci	u[0] = 42u;
329d722e3fbSopenharmony_ci}
330d722e3fbSopenharmony_ci*/
331d722e3fbSopenharmony_ci
332d722e3fbSopenharmony_cistatic  uint32_t shader_bin[] = {
333d722e3fbSopenharmony_ci	SWAP_32(0x800082be), SWAP_32(0x02ff08bf), SWAP_32(0x7f969800), SWAP_32(0x040085bf),
334d722e3fbSopenharmony_ci	SWAP_32(0x02810281), SWAP_32(0x02ff08bf), SWAP_32(0x7f969800), SWAP_32(0xfcff84bf),
335d722e3fbSopenharmony_ci	SWAP_32(0xff0083be), SWAP_32(0x00f00000), SWAP_32(0xc10082be), SWAP_32(0xaa02007e),
336d722e3fbSopenharmony_ci	SWAP_32(0x000070e0), SWAP_32(0x00000080), SWAP_32(0x000081bf)
337d722e3fbSopenharmony_ci};
338d722e3fbSopenharmony_ci
339d722e3fbSopenharmony_ci#define CODE_OFFSET 512
340d722e3fbSopenharmony_ci#define DATA_OFFSET 1024
341d722e3fbSopenharmony_ci
342d722e3fbSopenharmony_cienum cs_type {
343d722e3fbSopenharmony_ci	CS_BUFFERCLEAR,
344d722e3fbSopenharmony_ci	CS_BUFFERCOPY,
345d722e3fbSopenharmony_ci	CS_HANG,
346d722e3fbSopenharmony_ci	CS_HANG_SLOW
347d722e3fbSopenharmony_ci};
348d722e3fbSopenharmony_ci
349d722e3fbSopenharmony_cistatic const uint32_t bufferclear_cs_shader_gfx9[] = {
350d722e3fbSopenharmony_ci    0x260000ff, 0x000003ff, 0xd1fd0000, 0x04010c08,
351d722e3fbSopenharmony_ci    0x7e020280, 0x7e040204, 0x7e060205, 0x7e080206,
352d722e3fbSopenharmony_ci    0x7e0a0207, 0xe01c2000, 0x80000200, 0xbf8c0000,
353d722e3fbSopenharmony_ci    0xbf810000
354d722e3fbSopenharmony_ci};
355d722e3fbSopenharmony_ci
356d722e3fbSopenharmony_cistatic const uint32_t bufferclear_cs_shader_gfx10[] = {
357d722e3fbSopenharmony_ci	0xD7460004, 0x04010C08, 0x7E000204, 0x7E020205,
358d722e3fbSopenharmony_ci	0x7E040206, 0x7E060207, 0xE01C2000, 0x80000004,
359d722e3fbSopenharmony_ci	0xBF810000
360d722e3fbSopenharmony_ci};
361d722e3fbSopenharmony_ci
362d722e3fbSopenharmony_cistatic const uint32_t bufferclear_cs_shader_registers_gfx9[][2] = {
363d722e3fbSopenharmony_ci	{0x2e12, 0x000C0041},	//{ mmCOMPUTE_PGM_RSRC1,	  0x000C0041 },
364d722e3fbSopenharmony_ci	{0x2e13, 0x00000090},	//{ mmCOMPUTE_PGM_RSRC2,	  0x00000090 },
365d722e3fbSopenharmony_ci	{0x2e07, 0x00000040},	//{ mmCOMPUTE_NUM_THREAD_X, 0x00000040 },
366d722e3fbSopenharmony_ci	{0x2e08, 0x00000001},	//{ mmCOMPUTE_NUM_THREAD_Y, 0x00000001 },
367d722e3fbSopenharmony_ci	{0x2e09, 0x00000001},	//{ mmCOMPUTE_NUM_THREAD_Z, 0x00000001 }
368d722e3fbSopenharmony_ci};
369d722e3fbSopenharmony_ci
370d722e3fbSopenharmony_cistatic const uint32_t bufferclear_cs_shader_registers_num_gfx9 = 5;
371d722e3fbSopenharmony_ci
372d722e3fbSopenharmony_cistatic const uint32_t buffercopy_cs_shader_gfx9[] = {
373d722e3fbSopenharmony_ci    0x260000ff, 0x000003ff, 0xd1fd0000, 0x04010c08,
374d722e3fbSopenharmony_ci    0x7e020280, 0xe00c2000, 0x80000200, 0xbf8c0f70,
375d722e3fbSopenharmony_ci    0xe01c2000, 0x80010200, 0xbf810000
376d722e3fbSopenharmony_ci};
377d722e3fbSopenharmony_ci
378d722e3fbSopenharmony_cistatic const uint32_t buffercopy_cs_shader_gfx10[] = {
379d722e3fbSopenharmony_ci	0xD7460001, 0x04010C08, 0xE00C2000, 0x80000201,
380d722e3fbSopenharmony_ci	0xBF8C3F70, 0xE01C2000, 0x80010201, 0xBF810000
381d722e3fbSopenharmony_ci};
382d722e3fbSopenharmony_ci
383d722e3fbSopenharmony_cistatic const uint32_t preamblecache_gfx9[] = {
384d722e3fbSopenharmony_ci	0xc0026900, 0x81, 0x80000000, 0x40004000, 0xc0026900, 0x8c, 0xaa99aaaa, 0x0,
385d722e3fbSopenharmony_ci	0xc0026900, 0x90, 0x80000000, 0x40004000, 0xc0026900, 0x94, 0x80000000, 0x40004000,
386d722e3fbSopenharmony_ci	0xc0026900, 0xb4,  0x0, 0x3f800000, 0xc0016900, 0x103, 0x0,
387d722e3fbSopenharmony_ci	0xc0016900, 0x208, 0x0, 0xc0016900, 0x290, 0x0,
388d722e3fbSopenharmony_ci	0xc0016900, 0x2a1, 0x0, 0xc0026900, 0x2ad, 0x0, 0x0,
389d722e3fbSopenharmony_ci	0xc0016900, 0x2d5, 0x10000, 0xc0016900,  0x2dc, 0x0,
390d722e3fbSopenharmony_ci	0xc0066900, 0x2de, 0x0, 0x0, 0x0, 0x0, 0x0, 0x0, 0xc0026900, 0x2e5, 0x0, 0x0,
391d722e3fbSopenharmony_ci	0xc0056900, 0x2f9, 0x5, 0x3f800000, 0x3f800000, 0x3f800000, 0x3f800000,
392d722e3fbSopenharmony_ci	0xc0036900, 0x311, 0x3, 0, 0x100000, 0xc0026900, 0x316, 0x1e, 0x20,
393d722e3fbSopenharmony_ci	0xc0016900, 0x349, 0x0, 0xc0016900, 0x358, 0x0, 0xc0016900, 0x367, 0x0,
394d722e3fbSopenharmony_ci	0xc0016900, 0x376, 0x0, 0xc0016900, 0x385, 0x0, 0xc0016900, 0x19, 0x0,
395d722e3fbSopenharmony_ci	0xc0056900, 0xe8, 0x0, 0x0, 0x0, 0x0, 0x0,
396d722e3fbSopenharmony_ci	0xc0076900, 0x1e1, 0x0, 0x0, 0x0, 0x0, 0x0, 0x0, 0x0,
397d722e3fbSopenharmony_ci	0xc0026900, 0x204, 0x90000, 0x4, 0xc0046900, 0x20c, 0x0, 0x0, 0x0, 0x0,
398d722e3fbSopenharmony_ci	0xc0016900, 0x2b2, 0x0, 0xc0026900, 0x30e, 0xffffffff, 0xffffffff,
399d722e3fbSopenharmony_ci	0xc0016900, 0x314, 0x0, 0xc0016900, 0x2a6, 0, 0xc0016900, 0x210, 0,
400d722e3fbSopenharmony_ci	0xc0002f00, 0x1, 0xc0016900, 0x1, 0x1,
401d722e3fbSopenharmony_ci	0xc0016900, 0x18, 0x2, 0xc0016900, 0x206, 0x300, 0xc0017900, 0x20000243, 0x0,
402d722e3fbSopenharmony_ci	0xc0017900, 0x248, 0xffffffff, 0xc0017900, 0x249, 0x0, 0xc0017900, 0x24a, 0x0,
403d722e3fbSopenharmony_ci	0xc0017900, 0x24b, 0x0
404d722e3fbSopenharmony_ci};
405d722e3fbSopenharmony_ci
406d722e3fbSopenharmony_cistatic const uint32_t preamblecache_gfx10[] = {
407d722e3fbSopenharmony_ci	0xc0026900, 0x81, 0x80000000, 0x40004000, 0xc0026900, 0x8c, 0xaa99aaaa, 0x0,
408d722e3fbSopenharmony_ci	0xc0026900, 0x90, 0x80000000, 0x40004000, 0xc0026900, 0x94, 0x80000000, 0x40004000,
409d722e3fbSopenharmony_ci	0xc0026900, 0xb4, 0x0, 0x3f800000, 0xc0016900, 0x103, 0x0,
410d722e3fbSopenharmony_ci	0xc0016900, 0x208, 0x0, 0xc0016900, 0x290, 0x0,
411d722e3fbSopenharmony_ci	0xc0016900, 0x2a1, 0x0, 0xc0026900, 0x2ad, 0x0, 0x0,
412d722e3fbSopenharmony_ci	0xc0016900, 0x2d5, 0x10000, 0xc0016900, 0x2dc, 0x0,
413d722e3fbSopenharmony_ci	0xc0066900, 0x2de, 0x0, 0x0, 0x0, 0x0, 0x0, 0x0, 0xc0026900, 0x2e5, 0x0, 0x0,
414d722e3fbSopenharmony_ci	0xc0056900, 0x2f9, 0x5, 0x3f800000, 0x3f800000, 0x3f800000, 0x3f800000,
415d722e3fbSopenharmony_ci	0xc0046900, 0x310, 0, 0x3, 0, 0x100000, 0xc0026900, 0x316, 0xe, 0x20,
416d722e3fbSopenharmony_ci	0xc0016900, 0x349, 0x0, 0xc0016900, 0x358, 0x0, 0xc0016900, 0x367, 0x0,
417d722e3fbSopenharmony_ci	0xc0016900, 0x376, 0x0, 0xc0016900, 0x385, 0x0, 0xc0016900, 0x6, 0x0,
418d722e3fbSopenharmony_ci	0xc0056900, 0xe8, 0x0, 0x0, 0x0, 0x0, 0x0,
419d722e3fbSopenharmony_ci	0xc0076900, 0x1e1, 0x0, 0x0, 0x0, 0x0, 0x0, 0x0, 0x0,
420d722e3fbSopenharmony_ci	0xc0026900, 0x204, 0x90000, 0x4, 0xc0046900, 0x20c, 0x0, 0x0, 0x0, 0x0,
421d722e3fbSopenharmony_ci	0xc0016900, 0x2b2, 0x0, 0xc0026900, 0x30e, 0xffffffff, 0xffffffff,
422d722e3fbSopenharmony_ci	0xc0016900, 0x314, 0x0, 0xc0016900, 0x10a, 0, 0xc0016900, 0x2a6, 0, 0xc0016900, 0x210, 0,
423d722e3fbSopenharmony_ci	0xc0016900, 0x2db, 0, 0xc0016900, 0x1d4, 0, 0xc0002f00, 0x1, 0xc0016900, 0x1, 0x1, 0xc0016900, 0xe, 0x2,
424d722e3fbSopenharmony_ci	0xc0016900, 0x206, 0x300, 0xc0016900, 0x212, 0x200, 0xc0017900, 0x7b, 0x20, 0xc0017a00, 0x20000243, 0x0,
425d722e3fbSopenharmony_ci	0xc0017900, 0x249, 0, 0xc0017900, 0x24a, 0, 0xc0017900, 0x24b, 0, 0xc0017900, 0x259, 0xffffffff,
426d722e3fbSopenharmony_ci	0xc0017900, 0x25f, 0, 0xc0017900, 0x260, 0, 0xc0017900, 0x262, 0,
427d722e3fbSopenharmony_ci	0xc0017600, 0x45, 0x0, 0xc0017600, 0x6, 0x0,
428d722e3fbSopenharmony_ci	0xc0067600, 0x70, 0x0, 0x0, 0x0, 0x0, 0x0, 0x0,
429d722e3fbSopenharmony_ci	0xc0067600, 0x30, 0x0, 0x0, 0x0, 0x0, 0x0, 0x0
430d722e3fbSopenharmony_ci};
431d722e3fbSopenharmony_ci
432d722e3fbSopenharmony_cienum ps_type {
433d722e3fbSopenharmony_ci	PS_CONST,
434d722e3fbSopenharmony_ci	PS_TEX,
435d722e3fbSopenharmony_ci	PS_HANG,
436d722e3fbSopenharmony_ci	PS_HANG_SLOW
437d722e3fbSopenharmony_ci};
438d722e3fbSopenharmony_ci
439d722e3fbSopenharmony_cistatic const uint32_t ps_const_shader_gfx9[] = {
440d722e3fbSopenharmony_ci    0x7E000200, 0x7E020201, 0x7E040202, 0x7E060203,
441d722e3fbSopenharmony_ci    0xD2960000, 0x00020300, 0xD2960001, 0x00020702,
442d722e3fbSopenharmony_ci    0xC4001C0F, 0x00000100, 0xBF810000
443d722e3fbSopenharmony_ci};
444d722e3fbSopenharmony_ci
445d722e3fbSopenharmony_cistatic const uint32_t ps_const_shader_patchinfo_code_size_gfx9 = 6;
446d722e3fbSopenharmony_ci
447d722e3fbSopenharmony_cistatic const uint32_t ps_const_shader_patchinfo_code_gfx9[][10][6] = {
448d722e3fbSopenharmony_ci    {{ 0xBF800000, 0xBF800000, 0xBF800000, 0xBF800000, 0xC4001890, 0x00000000 },
449d722e3fbSopenharmony_ci     { 0xBF800000, 0xBF800000, 0xBF800000, 0xBF800000, 0xC4001801, 0x00000000 },
450d722e3fbSopenharmony_ci     { 0xBF800000, 0xBF800000, 0xBF800000, 0xBF800000, 0xC4001803, 0x00000100 },
451d722e3fbSopenharmony_ci     { 0xBF800000, 0xBF800000, 0xBF800000, 0xBF800000, 0xC4001803, 0x00000300 },
452d722e3fbSopenharmony_ci     { 0xD2960000, 0x00020300, 0xD2960001, 0x00020702, 0xC4001C0F, 0x00000100 },
453d722e3fbSopenharmony_ci     { 0xD2950000, 0x00020300, 0xD2950001, 0x00020702, 0xC4001C0F, 0x00000100 },
454d722e3fbSopenharmony_ci     { 0xD2940000, 0x00020300, 0xD2940001, 0x00020702, 0xC4001C0F, 0x00000100 },
455d722e3fbSopenharmony_ci     { 0xD2970000, 0x00020300, 0xD2970001, 0x00020702, 0xC4001C0F, 0x00000100 },
456d722e3fbSopenharmony_ci     { 0xD2980000, 0x00020300, 0xD2980001, 0x00020702, 0xC4001C0F, 0x00000100 },
457d722e3fbSopenharmony_ci     { 0xBF800000, 0xBF800000, 0xBF800000, 0xBF800000, 0xC400180F, 0x03020100 }
458d722e3fbSopenharmony_ci    }
459d722e3fbSopenharmony_ci};
460d722e3fbSopenharmony_ci
461d722e3fbSopenharmony_cistatic const uint32_t ps_const_shader_patchinfo_offset_gfx9[] = {
462d722e3fbSopenharmony_ci    0x00000004
463d722e3fbSopenharmony_ci};
464d722e3fbSopenharmony_ci
465d722e3fbSopenharmony_cistatic const uint32_t ps_num_sh_registers_gfx9 = 2;
466d722e3fbSopenharmony_ci
467d722e3fbSopenharmony_cistatic const uint32_t ps_const_sh_registers_gfx9[][2] = {
468d722e3fbSopenharmony_ci    {0x2C0A, 0x000C0040},//{ mmSPI_SHADER_PGM_RSRC1_PS, 0x000C0040 },
469d722e3fbSopenharmony_ci    {0x2C0B, 0x00000008}, //{ mmSPI_SHADER_PGM_RSRC2_PS, 0x00000008 }
470d722e3fbSopenharmony_ci};
471d722e3fbSopenharmony_ci
472d722e3fbSopenharmony_cistatic const uint32_t ps_num_context_registers_gfx9 = 7;
473d722e3fbSopenharmony_ci
474d722e3fbSopenharmony_cistatic const uint32_t ps_const_context_reg_gfx9[][2] = {
475d722e3fbSopenharmony_ci    {0xA1B4, 0x00000002}, //{ mmSPI_PS_INPUT_ADDR,       0x00000002 },
476d722e3fbSopenharmony_ci    {0xA1B6, 0x00000000}, //{ mmSPI_PS_IN_CONTROL,       0x00000000 },
477d722e3fbSopenharmony_ci    {0xA08F, 0x0000000F}, //{ mmCB_SHADER_MASK,          0x0000000F },
478d722e3fbSopenharmony_ci    {0xA203, 0x00000010}, //{ mmDB_SHADER_CONTROL,       0x00000010 },
479d722e3fbSopenharmony_ci    {0xA1C4, 0x00000000}, //{ mmSPI_SHADER_Z_FORMAT,     0x00000000 },
480d722e3fbSopenharmony_ci    {0xA1B8, 0x00000000}, //{ mmSPI_BARYC_CNTL,          0x00000000 /* Always 0 for now */},
481d722e3fbSopenharmony_ci    {0xA1C5, 0x00000004}, //{ mmSPI_SHADER_COL_FORMAT,   0x00000004 }
482d722e3fbSopenharmony_ci};
483d722e3fbSopenharmony_ci
484d722e3fbSopenharmony_cistatic const uint32_t ps_const_shader_gfx10[] = {
485d722e3fbSopenharmony_ci    0x7E000200, 0x7E020201, 0x7E040202, 0x7E060203,
486d722e3fbSopenharmony_ci    0x5E000300, 0x5E020702, 0xBF800000, 0xBF800000,
487d722e3fbSopenharmony_ci    0xF8001C0F, 0x00000100, 0xBF810000
488d722e3fbSopenharmony_ci};
489d722e3fbSopenharmony_ci
490d722e3fbSopenharmony_cistatic const uint32_t ps_const_shader_patchinfo_code_size_gfx10 = 6;
491d722e3fbSopenharmony_ci
492d722e3fbSopenharmony_cistatic const uint32_t ps_const_shader_patchinfo_code_gfx10[][10][6] = {
493d722e3fbSopenharmony_ci    {{ 0xBF800000, 0xBF800000, 0xBF800000, 0xBF800000, 0xF8001890, 0x00000000 },
494d722e3fbSopenharmony_ci     { 0xBF800000, 0xBF800000, 0xBF800000, 0xBF800000, 0xF8001801, 0x00000000 },
495d722e3fbSopenharmony_ci     { 0xBF800000, 0xBF800000, 0xBF800000, 0xBF800000, 0xF8001803, 0x00000100 },
496d722e3fbSopenharmony_ci     { 0xBF800000, 0xBF800000, 0xBF800000, 0xBF800000, 0xF8001803, 0x00000300 },
497d722e3fbSopenharmony_ci     { 0x5E000300, 0x5E020702, 0xBF800000, 0xBF800000, 0xF8001C0F, 0x00000100 },
498d722e3fbSopenharmony_ci     { 0xD7690000, 0x00020300, 0xD7690001, 0x00020702, 0xF8001C0F, 0x00000100 },
499d722e3fbSopenharmony_ci     { 0xD7680000, 0x00020300, 0xD7680001, 0x00020702, 0xF8001C0F, 0x00000100 },
500d722e3fbSopenharmony_ci     { 0xD76A0000, 0x00020300, 0xD76A0001, 0x00020702, 0xF8001C0F, 0x00000100 },
501d722e3fbSopenharmony_ci     { 0xD76B0000, 0x00020300, 0xD76B0001, 0x00020702, 0xF8001C0F, 0x00000100 },
502d722e3fbSopenharmony_ci     { 0xBF800000, 0xBF800000, 0xBF800000, 0xBF800000, 0xF800180F, 0x03020100 }
503d722e3fbSopenharmony_ci    }
504d722e3fbSopenharmony_ci};
505d722e3fbSopenharmony_ci
506d722e3fbSopenharmony_cistatic const uint32_t ps_const_shader_patchinfo_offset_gfx10[] = {
507d722e3fbSopenharmony_ci    0x00000004
508d722e3fbSopenharmony_ci};
509d722e3fbSopenharmony_ci
510d722e3fbSopenharmony_cistatic const uint32_t ps_num_sh_registers_gfx10 = 2;
511d722e3fbSopenharmony_ci
512d722e3fbSopenharmony_cistatic const uint32_t ps_const_sh_registers_gfx10[][2] = {
513d722e3fbSopenharmony_ci    {0x2C0A, 0x000C0000},//{ mmSPI_SHADER_PGM_RSRC1_PS, 0x000C0000 },
514d722e3fbSopenharmony_ci    {0x2C0B, 0x00000008}, //{ mmSPI_SHADER_PGM_RSRC2_PS, 0x00000008 }
515d722e3fbSopenharmony_ci};
516d722e3fbSopenharmony_ci
517d722e3fbSopenharmony_cistatic const uint32_t ps_tex_shader_gfx9[] = {
518d722e3fbSopenharmony_ci    0xBEFC000C, 0xBE8E017E, 0xBEFE077E, 0xD4180000,
519d722e3fbSopenharmony_ci    0xD4190001, 0xD41C0100, 0xD41D0101, 0xF0800F00,
520d722e3fbSopenharmony_ci    0x00400206, 0xBEFE010E, 0xBF8C0F70, 0xD2960000,
521d722e3fbSopenharmony_ci    0x00020702, 0xD2960001, 0x00020B04, 0xC4001C0F,
522d722e3fbSopenharmony_ci    0x00000100, 0xBF810000
523d722e3fbSopenharmony_ci};
524d722e3fbSopenharmony_ci
525d722e3fbSopenharmony_cistatic const uint32_t ps_tex_shader_patchinfo_offset_gfx9[] = {
526d722e3fbSopenharmony_ci    0x0000000B
527d722e3fbSopenharmony_ci};
528d722e3fbSopenharmony_ci
529d722e3fbSopenharmony_cistatic const uint32_t ps_tex_shader_patchinfo_code_size_gfx9 = 6;
530d722e3fbSopenharmony_ci
531d722e3fbSopenharmony_cistatic const uint32_t ps_tex_shader_patchinfo_code_gfx9[][10][6] = {
532d722e3fbSopenharmony_ci    {{ 0xBF800000, 0xBF800000, 0xBF800000, 0xBF800000, 0xC4001890, 0x00000000 },
533d722e3fbSopenharmony_ci     { 0xBF800000, 0xBF800000, 0xBF800000, 0xBF800000, 0xC4001801, 0x00000002 },
534d722e3fbSopenharmony_ci     { 0xBF800000, 0xBF800000, 0xBF800000, 0xBF800000, 0xC4001803, 0x00000302 },
535d722e3fbSopenharmony_ci     { 0xBF800000, 0xBF800000, 0xBF800000, 0xBF800000, 0xC4001803, 0x00000502 },
536d722e3fbSopenharmony_ci     { 0xD2960000, 0x00020702, 0xD2960001, 0x00020B04, 0xC4001C0F, 0x00000100 },
537d722e3fbSopenharmony_ci     { 0xD2950000, 0x00020702, 0xD2950001, 0x00020B04, 0xC4001C0F, 0x00000100 },
538d722e3fbSopenharmony_ci     { 0xD2940000, 0x00020702, 0xD2940001, 0x00020B04, 0xC4001C0F, 0x00000100 },
539d722e3fbSopenharmony_ci     { 0xD2970000, 0x00020702, 0xD2970001, 0x00020B04, 0xC4001C0F, 0x00000100 },
540d722e3fbSopenharmony_ci     { 0xD2980000, 0x00020702, 0xD2980001, 0x00020B04, 0xC4001C0F, 0x00000100 },
541d722e3fbSopenharmony_ci     { 0xBF800000, 0xBF800000, 0xBF800000, 0xBF800000, 0xC400180F, 0x05040302 }
542d722e3fbSopenharmony_ci    }
543d722e3fbSopenharmony_ci};
544d722e3fbSopenharmony_ci
545d722e3fbSopenharmony_cistatic const uint32_t ps_tex_sh_registers_gfx9[][2] = {
546d722e3fbSopenharmony_ci    {0x2C0A, 0x000C0081},//{ mmSPI_SHADER_PGM_RSRC1_PS, 0x000C0081 },
547d722e3fbSopenharmony_ci    {0x2C0B, 0x00000018}, //{ mmSPI_SHADER_PGM_RSRC2_PS, 0x00000018 }
548d722e3fbSopenharmony_ci};
549d722e3fbSopenharmony_ci
550d722e3fbSopenharmony_cistatic const uint32_t ps_tex_context_reg_gfx9[][2] = {
551d722e3fbSopenharmony_ci    {0xA1B4, 0x00000002}, //{ mmSPI_PS_INPUT_ADDR,       0x00000002 },
552d722e3fbSopenharmony_ci    {0xA1B6, 0x00000001}, //{ mmSPI_PS_IN_CONTROL,       0x00000001 },
553d722e3fbSopenharmony_ci    {0xA08F, 0x0000000F}, //{ mmCB_SHADER_MASK,          0x0000000F },
554d722e3fbSopenharmony_ci    {0xA203, 0x00000010}, //{ mmDB_SHADER_CONTROL,       0x00000010 },
555d722e3fbSopenharmony_ci    {0xA1C4, 0x00000000}, //{ mmSPI_SHADER_Z_FORMAT,     0x00000000 },
556d722e3fbSopenharmony_ci    {0xA1B8, 0x00000000}, //{ mmSPI_BARYC_CNTL,          0x00000000 /* Always 0 for now */},
557d722e3fbSopenharmony_ci    {0xA1C5, 0x00000004}, //{ mmSPI_SHADER_COL_FORMAT,   0x00000004  }
558d722e3fbSopenharmony_ci};
559d722e3fbSopenharmony_ci
560d722e3fbSopenharmony_cistatic const uint32_t ps_tex_shader_gfx10[] = {
561d722e3fbSopenharmony_ci    0xBEFC030C, 0xBE8E047E, 0xBEFE0A7E, 0xC8080000,
562d722e3fbSopenharmony_ci    0xC80C0100, 0xC8090001, 0xC80D0101, 0xF0800F0A,
563d722e3fbSopenharmony_ci    0x00400402, 0x00000003, 0xBEFE040E, 0xBF8C0F70,
564d722e3fbSopenharmony_ci    0x5E000B04, 0x5E020F06, 0xBF800000, 0xBF800000,
565d722e3fbSopenharmony_ci    0xF8001C0F, 0x00000100, 0xBF810000
566d722e3fbSopenharmony_ci};
567d722e3fbSopenharmony_ci
568d722e3fbSopenharmony_cistatic const uint32_t ps_tex_shader_patchinfo_offset_gfx10[] = {
569d722e3fbSopenharmony_ci    0x0000000C
570d722e3fbSopenharmony_ci};
571d722e3fbSopenharmony_ci
572d722e3fbSopenharmony_cistatic const uint32_t ps_tex_shader_patchinfo_code_size_gfx10 = 6;
573d722e3fbSopenharmony_ci
574d722e3fbSopenharmony_cistatic const uint32_t ps_tex_shader_patchinfo_code_gfx10[][10][6] = {
575d722e3fbSopenharmony_ci    {{ 0xBF800000, 0xBF800000, 0xBF800000, 0xBF800000, 0xF8001890, 0x00000000 },
576d722e3fbSopenharmony_ci     { 0xBF800000, 0xBF800000, 0xBF800000, 0xBF800000, 0xF8001801, 0x00000004 },
577d722e3fbSopenharmony_ci     { 0xBF800000, 0xBF800000, 0xBF800000, 0xBF800000, 0xF8001803, 0x00000504 },
578d722e3fbSopenharmony_ci     { 0xBF800000, 0xBF800000, 0xBF800000, 0xBF800000, 0xF8001803, 0x00000704 },
579d722e3fbSopenharmony_ci     { 0x5E000B04, 0x5E020F06, 0xBF800000, 0xBF800000, 0xF8001C0F, 0x00000100 },
580d722e3fbSopenharmony_ci     { 0xD7690000, 0x00020B04, 0xD7690001, 0x00020F06, 0xF8001C0F, 0x00000100 },
581d722e3fbSopenharmony_ci     { 0xD7680000, 0x00020B04, 0xD7680001, 0x00020F06, 0xF8001C0F, 0x00000100 },
582d722e3fbSopenharmony_ci     { 0xD76A0000, 0x00020B04, 0xD76A0001, 0x00020F06, 0xF8001C0F, 0x00000100 },
583d722e3fbSopenharmony_ci     { 0xD76B0000, 0x00020B04, 0xD76B0001, 0x00020F06, 0xF8001C0F, 0x00000100 },
584d722e3fbSopenharmony_ci     { 0xBF800000, 0xBF800000, 0xBF800000, 0xBF800000, 0xF800180F, 0x07060504 }
585d722e3fbSopenharmony_ci    }
586d722e3fbSopenharmony_ci};
587d722e3fbSopenharmony_ci
588d722e3fbSopenharmony_cistatic const uint32_t vs_RectPosTexFast_shader_gfx9[] = {
589d722e3fbSopenharmony_ci    0x7E000B00, 0x020000F3, 0xD042000A, 0x00010100,
590d722e3fbSopenharmony_ci    0x7E020202, 0x7E040200, 0x020000F3, 0x7E060206,
591d722e3fbSopenharmony_ci    0x7E080204, 0xD1000001, 0x002A0302, 0x7C840080,
592d722e3fbSopenharmony_ci    0x7E000200, 0x7E040203, 0x7E0A0201, 0xD1000003,
593d722e3fbSopenharmony_ci    0x002A0704, 0x7E0C0207, 0x7E0E0205, 0x00000101,
594d722e3fbSopenharmony_ci    0x00020505, 0x7E040208, 0x7E0A02F2, 0x00060903,
595d722e3fbSopenharmony_ci    0x00080D07, 0x7E0C0209, 0xC40008CF, 0x05020100,
596d722e3fbSopenharmony_ci    0xC400020F, 0x05060403, 0xBF810000
597d722e3fbSopenharmony_ci};
598d722e3fbSopenharmony_ci
599d722e3fbSopenharmony_cistatic const uint32_t vs_RectPosTexFast_shader_gfx10[] = {
600d722e3fbSopenharmony_ci    0x7E000B00, 0x060000F3, 0x7E020202, 0x7E040206,
601d722e3fbSopenharmony_ci    0x7C040080, 0x060000F3, 0xD5010001, 0x01AA0200,
602d722e3fbSopenharmony_ci    0x7E060203, 0xD5010002, 0x01AA0404, 0x7E080207,
603d722e3fbSopenharmony_ci    0x7C040080, 0xD5010000, 0x01A80101, 0xD5010001,
604d722e3fbSopenharmony_ci    0x01AA0601, 0x7E060208, 0x7E0A02F2, 0xD5010002,
605d722e3fbSopenharmony_ci    0x01A80902, 0xD5010004, 0x01AA0805, 0x7E0C0209,
606d722e3fbSopenharmony_ci    0xF80008CF, 0x05030100, 0xF800020F, 0x05060402,
607d722e3fbSopenharmony_ci    0xBF810000
608d722e3fbSopenharmony_ci};
609d722e3fbSopenharmony_ci
610d722e3fbSopenharmony_cistatic const uint32_t cached_cmd_gfx9[] = {
611d722e3fbSopenharmony_ci	0xc0016900, 0x0, 0x0, 0xc0026900, 0x3, 0x2a, 0x0,
612d722e3fbSopenharmony_ci	0xc0046900, 0xa, 0x0, 0x0, 0x0, 0x200020,
613d722e3fbSopenharmony_ci	0xc0016900, 0x83, 0xffff, 0xc0026900, 0x8e, 0xf, 0xf,
614d722e3fbSopenharmony_ci	0xc0056900, 0x105, 0x0, 0x0,  0x0, 0x0, 0x12,
615d722e3fbSopenharmony_ci	0xc0026900, 0x10b, 0x0, 0x0, 0xc0016900, 0x1e0, 0x0,
616d722e3fbSopenharmony_ci	0xc0036900, 0x200, 0x0, 0x10000, 0xcc0011,
617d722e3fbSopenharmony_ci	0xc0026900, 0x292, 0x20, 0x60201b8,
618d722e3fbSopenharmony_ci	0xc0026900, 0x2b0, 0x0, 0x0, 0xc0016900, 0x2f8, 0x0
619d722e3fbSopenharmony_ci};
620d722e3fbSopenharmony_ci
621d722e3fbSopenharmony_cistatic const uint32_t cached_cmd_gfx10[] = {
622d722e3fbSopenharmony_ci	0xc0016900, 0x0, 0x0, 0xc0026900, 0x3, 0x2a, 0x0,
623d722e3fbSopenharmony_ci	0xc0046900, 0xa, 0x0, 0x0, 0x0, 0x200020,
624d722e3fbSopenharmony_ci	0xc0016900, 0x83, 0xffff, 0xc0026900, 0x8e, 0xf, 0xf,
625d722e3fbSopenharmony_ci	0xc0056900, 0x105, 0x0, 0x0, 0x0, 0x0, 0x18,
626d722e3fbSopenharmony_ci	0xc0026900, 0x10b, 0x0, 0x0, 0xc0016900, 0x1e0, 0x0,
627d722e3fbSopenharmony_ci	0xc0036900, 0x200, 0x0, 0x10000, 0xcc0011,
628d722e3fbSopenharmony_ci	0xc0026900, 0x292, 0x20, 0x6020000,
629d722e3fbSopenharmony_ci	0xc0026900, 0x2b0, 0x0, 0x0, 0xc0016900, 0x2f8, 0x0
630d722e3fbSopenharmony_ci};
631d722e3fbSopenharmony_ci
632d722e3fbSopenharmony_ciunsigned int memcpy_ps_hang[] = {
633d722e3fbSopenharmony_ci        0xFFFFFFFF, 0xBEFE0A7E, 0xBEFC0304, 0xC0C20100,
634d722e3fbSopenharmony_ci        0xC0800300, 0xC8080000, 0xC80C0100, 0xC8090001,
635d722e3fbSopenharmony_ci        0xC80D0101, 0xBF8C007F, 0xF0800F00, 0x00010002,
636d722e3fbSopenharmony_ci        0xBEFE040C, 0xBF8C0F70, 0xBF800000, 0xBF800000,
637d722e3fbSopenharmony_ci        0xF800180F, 0x03020100, 0xBF810000
638d722e3fbSopenharmony_ci};
639d722e3fbSopenharmony_ci
640d722e3fbSopenharmony_cistruct amdgpu_test_shader {
641d722e3fbSopenharmony_ci	uint32_t *shader;
642d722e3fbSopenharmony_ci	uint32_t header_length;
643d722e3fbSopenharmony_ci	uint32_t body_length;
644d722e3fbSopenharmony_ci	uint32_t foot_length;
645d722e3fbSopenharmony_ci};
646d722e3fbSopenharmony_ci
647d722e3fbSopenharmony_ciunsigned int memcpy_cs_hang_slow_ai_codes[] = {
648d722e3fbSopenharmony_ci    0xd1fd0000, 0x04010c08, 0xe00c2000, 0x80000100,
649d722e3fbSopenharmony_ci    0xbf8c0f70, 0xe01c2000, 0x80010100, 0xbf810000
650d722e3fbSopenharmony_ci};
651d722e3fbSopenharmony_ci
652d722e3fbSopenharmony_cistruct amdgpu_test_shader memcpy_cs_hang_slow_ai = {
653d722e3fbSopenharmony_ci        memcpy_cs_hang_slow_ai_codes,
654d722e3fbSopenharmony_ci        4,
655d722e3fbSopenharmony_ci        3,
656d722e3fbSopenharmony_ci        1
657d722e3fbSopenharmony_ci};
658d722e3fbSopenharmony_ci
659d722e3fbSopenharmony_ciunsigned int memcpy_cs_hang_slow_rv_codes[] = {
660d722e3fbSopenharmony_ci    0x8e00860c, 0x32000000, 0xe00c2000, 0x80010100,
661d722e3fbSopenharmony_ci    0xbf8c0f70, 0xe01c2000, 0x80020100, 0xbf810000
662d722e3fbSopenharmony_ci};
663d722e3fbSopenharmony_ci
664d722e3fbSopenharmony_cistruct amdgpu_test_shader memcpy_cs_hang_slow_rv = {
665d722e3fbSopenharmony_ci        memcpy_cs_hang_slow_rv_codes,
666d722e3fbSopenharmony_ci        4,
667d722e3fbSopenharmony_ci        3,
668d722e3fbSopenharmony_ci        1
669d722e3fbSopenharmony_ci};
670d722e3fbSopenharmony_ci
671d722e3fbSopenharmony_ciunsigned int memcpy_cs_hang_slow_nv_codes[] = {
672d722e3fbSopenharmony_ci    0xd7460000, 0x04010c08, 0xe00c2000, 0x80000100,
673d722e3fbSopenharmony_ci    0xbf8c0f70, 0xe01ca000, 0x80010100, 0xbf810000
674d722e3fbSopenharmony_ci};
675d722e3fbSopenharmony_ci
676d722e3fbSopenharmony_cistruct amdgpu_test_shader memcpy_cs_hang_slow_nv = {
677d722e3fbSopenharmony_ci        memcpy_cs_hang_slow_nv_codes,
678d722e3fbSopenharmony_ci        4,
679d722e3fbSopenharmony_ci        3,
680d722e3fbSopenharmony_ci        1
681d722e3fbSopenharmony_ci};
682d722e3fbSopenharmony_ci
683d722e3fbSopenharmony_ciunsigned int memcpy_ps_hang_slow_ai_codes[] = {
684d722e3fbSopenharmony_ci        0xbefc000c, 0xbe8e017e, 0xbefe077e, 0xd4080000,
685d722e3fbSopenharmony_ci        0xd4090001, 0xd40c0100, 0xd40d0101, 0xf0800f00,
686d722e3fbSopenharmony_ci        0x00400002, 0xbefe010e, 0xbf8c0f70, 0xbf800000,
687d722e3fbSopenharmony_ci        0xbf800000, 0xbf800000, 0xbf800000, 0xc400180f,
688d722e3fbSopenharmony_ci        0x03020100, 0xbf810000
689d722e3fbSopenharmony_ci};
690d722e3fbSopenharmony_ci
691d722e3fbSopenharmony_cistruct amdgpu_test_shader memcpy_ps_hang_slow_ai = {
692d722e3fbSopenharmony_ci        memcpy_ps_hang_slow_ai_codes,
693d722e3fbSopenharmony_ci        7,
694d722e3fbSopenharmony_ci        2,
695d722e3fbSopenharmony_ci        9
696d722e3fbSopenharmony_ci};
697d722e3fbSopenharmony_ci
698d722e3fbSopenharmony_ciint amdgpu_bo_alloc_and_map_raw(amdgpu_device_handle dev, unsigned size,
699d722e3fbSopenharmony_ci			unsigned alignment, unsigned heap, uint64_t alloc_flags,
700d722e3fbSopenharmony_ci			uint64_t mapping_flags, amdgpu_bo_handle *bo, void **cpu,
701d722e3fbSopenharmony_ci			uint64_t *mc_address,
702d722e3fbSopenharmony_ci			amdgpu_va_handle *va_handle)
703d722e3fbSopenharmony_ci{
704d722e3fbSopenharmony_ci	struct amdgpu_bo_alloc_request request = {};
705d722e3fbSopenharmony_ci	amdgpu_bo_handle buf_handle;
706d722e3fbSopenharmony_ci	amdgpu_va_handle handle;
707d722e3fbSopenharmony_ci	uint64_t vmc_addr;
708d722e3fbSopenharmony_ci	int r;
709d722e3fbSopenharmony_ci
710d722e3fbSopenharmony_ci	request.alloc_size = size;
711d722e3fbSopenharmony_ci	request.phys_alignment = alignment;
712d722e3fbSopenharmony_ci	request.preferred_heap = heap;
713d722e3fbSopenharmony_ci	request.flags = alloc_flags;
714d722e3fbSopenharmony_ci
715d722e3fbSopenharmony_ci	r = amdgpu_bo_alloc(dev, &request, &buf_handle);
716d722e3fbSopenharmony_ci	if (r)
717d722e3fbSopenharmony_ci		return r;
718d722e3fbSopenharmony_ci
719d722e3fbSopenharmony_ci	r = amdgpu_va_range_alloc(dev,
720d722e3fbSopenharmony_ci				  amdgpu_gpu_va_range_general,
721d722e3fbSopenharmony_ci				  size, alignment, 0, &vmc_addr,
722d722e3fbSopenharmony_ci				  &handle, 0);
723d722e3fbSopenharmony_ci	if (r)
724d722e3fbSopenharmony_ci		goto error_va_alloc;
725d722e3fbSopenharmony_ci
726d722e3fbSopenharmony_ci	r = amdgpu_bo_va_op_raw(dev, buf_handle, 0,  ALIGN(size, getpagesize()), vmc_addr,
727d722e3fbSopenharmony_ci				   AMDGPU_VM_PAGE_READABLE |
728d722e3fbSopenharmony_ci				   AMDGPU_VM_PAGE_WRITEABLE |
729d722e3fbSopenharmony_ci				   AMDGPU_VM_PAGE_EXECUTABLE |
730d722e3fbSopenharmony_ci				   mapping_flags,
731d722e3fbSopenharmony_ci				   AMDGPU_VA_OP_MAP);
732d722e3fbSopenharmony_ci	if (r)
733d722e3fbSopenharmony_ci		goto error_va_map;
734d722e3fbSopenharmony_ci
735d722e3fbSopenharmony_ci	r = amdgpu_bo_cpu_map(buf_handle, cpu);
736d722e3fbSopenharmony_ci	if (r)
737d722e3fbSopenharmony_ci		goto error_cpu_map;
738d722e3fbSopenharmony_ci
739d722e3fbSopenharmony_ci	*bo = buf_handle;
740d722e3fbSopenharmony_ci	*mc_address = vmc_addr;
741d722e3fbSopenharmony_ci	*va_handle = handle;
742d722e3fbSopenharmony_ci
743d722e3fbSopenharmony_ci	return 0;
744d722e3fbSopenharmony_ci
745d722e3fbSopenharmony_ci error_cpu_map:
746d722e3fbSopenharmony_ci	amdgpu_bo_cpu_unmap(buf_handle);
747d722e3fbSopenharmony_ci
748d722e3fbSopenharmony_ci error_va_map:
749d722e3fbSopenharmony_ci	amdgpu_bo_va_op(buf_handle, 0, size, vmc_addr, 0, AMDGPU_VA_OP_UNMAP);
750d722e3fbSopenharmony_ci
751d722e3fbSopenharmony_ci error_va_alloc:
752d722e3fbSopenharmony_ci	amdgpu_bo_free(buf_handle);
753d722e3fbSopenharmony_ci	return r;
754d722e3fbSopenharmony_ci}
755d722e3fbSopenharmony_ci
756d722e3fbSopenharmony_ci
757d722e3fbSopenharmony_ci
758d722e3fbSopenharmony_ciCU_BOOL suite_basic_tests_enable(void)
759d722e3fbSopenharmony_ci{
760d722e3fbSopenharmony_ci
761d722e3fbSopenharmony_ci	if (amdgpu_device_initialize(drm_amdgpu[0], &major_version,
762d722e3fbSopenharmony_ci					     &minor_version, &device_handle))
763d722e3fbSopenharmony_ci		return CU_FALSE;
764d722e3fbSopenharmony_ci
765d722e3fbSopenharmony_ci
766d722e3fbSopenharmony_ci	family_id = device_handle->info.family_id;
767d722e3fbSopenharmony_ci	chip_id = device_handle->info.chip_external_rev;
768d722e3fbSopenharmony_ci	chip_rev = device_handle->info.chip_rev;
769d722e3fbSopenharmony_ci
770d722e3fbSopenharmony_ci	if (amdgpu_device_deinitialize(device_handle))
771d722e3fbSopenharmony_ci		return CU_FALSE;
772d722e3fbSopenharmony_ci
773d722e3fbSopenharmony_ci	/* disable gfx engine basic test cases for some asics have no CPG */
774d722e3fbSopenharmony_ci	if (asic_is_gfx_pipe_removed(family_id, chip_id, chip_rev)) {
775d722e3fbSopenharmony_ci		if (amdgpu_set_test_active("Basic Tests",
776d722e3fbSopenharmony_ci					"Command submission Test (GFX)",
777d722e3fbSopenharmony_ci					CU_FALSE))
778d722e3fbSopenharmony_ci			fprintf(stderr, "test deactivation failed - %s\n",
779d722e3fbSopenharmony_ci				CU_get_error_msg());
780d722e3fbSopenharmony_ci
781d722e3fbSopenharmony_ci		if (amdgpu_set_test_active("Basic Tests",
782d722e3fbSopenharmony_ci					"Command submission Test (Multi-Fence)",
783d722e3fbSopenharmony_ci					CU_FALSE))
784d722e3fbSopenharmony_ci			fprintf(stderr, "test deactivation failed - %s\n",
785d722e3fbSopenharmony_ci				CU_get_error_msg());
786d722e3fbSopenharmony_ci
787d722e3fbSopenharmony_ci		if (amdgpu_set_test_active("Basic Tests",
788d722e3fbSopenharmony_ci					"Sync dependency Test",
789d722e3fbSopenharmony_ci					CU_FALSE))
790d722e3fbSopenharmony_ci			fprintf(stderr, "test deactivation failed - %s\n",
791d722e3fbSopenharmony_ci				CU_get_error_msg());
792d722e3fbSopenharmony_ci	}
793d722e3fbSopenharmony_ci
794d722e3fbSopenharmony_ci	return CU_TRUE;
795d722e3fbSopenharmony_ci}
796d722e3fbSopenharmony_ci
797d722e3fbSopenharmony_ciint suite_basic_tests_init(void)
798d722e3fbSopenharmony_ci{
799d722e3fbSopenharmony_ci	struct amdgpu_gpu_info gpu_info = {0};
800d722e3fbSopenharmony_ci	int r;
801d722e3fbSopenharmony_ci
802d722e3fbSopenharmony_ci	r = amdgpu_device_initialize(drm_amdgpu[0], &major_version,
803d722e3fbSopenharmony_ci				   &minor_version, &device_handle);
804d722e3fbSopenharmony_ci
805d722e3fbSopenharmony_ci	if (r) {
806d722e3fbSopenharmony_ci		if ((r == -EACCES) && (errno == EACCES))
807d722e3fbSopenharmony_ci			printf("\n\nError:%s. "
808d722e3fbSopenharmony_ci				"Hint:Try to run this test program as root.",
809d722e3fbSopenharmony_ci				strerror(errno));
810d722e3fbSopenharmony_ci		return CUE_SINIT_FAILED;
811d722e3fbSopenharmony_ci	}
812d722e3fbSopenharmony_ci
813d722e3fbSopenharmony_ci	r = amdgpu_query_gpu_info(device_handle, &gpu_info);
814d722e3fbSopenharmony_ci	if (r)
815d722e3fbSopenharmony_ci		return CUE_SINIT_FAILED;
816d722e3fbSopenharmony_ci
817d722e3fbSopenharmony_ci	family_id = gpu_info.family_id;
818d722e3fbSopenharmony_ci
819d722e3fbSopenharmony_ci	return CUE_SUCCESS;
820d722e3fbSopenharmony_ci}
821d722e3fbSopenharmony_ci
822d722e3fbSopenharmony_ciint suite_basic_tests_clean(void)
823d722e3fbSopenharmony_ci{
824d722e3fbSopenharmony_ci	int r = amdgpu_device_deinitialize(device_handle);
825d722e3fbSopenharmony_ci
826d722e3fbSopenharmony_ci	if (r == 0)
827d722e3fbSopenharmony_ci		return CUE_SUCCESS;
828d722e3fbSopenharmony_ci	else
829d722e3fbSopenharmony_ci		return CUE_SCLEAN_FAILED;
830d722e3fbSopenharmony_ci}
831d722e3fbSopenharmony_ci
832d722e3fbSopenharmony_cistatic void amdgpu_query_info_test(void)
833d722e3fbSopenharmony_ci{
834d722e3fbSopenharmony_ci	struct amdgpu_gpu_info gpu_info = {0};
835d722e3fbSopenharmony_ci	uint32_t version, feature;
836d722e3fbSopenharmony_ci	int r;
837d722e3fbSopenharmony_ci
838d722e3fbSopenharmony_ci	r = amdgpu_query_gpu_info(device_handle, &gpu_info);
839d722e3fbSopenharmony_ci	CU_ASSERT_EQUAL(r, 0);
840d722e3fbSopenharmony_ci
841d722e3fbSopenharmony_ci	r = amdgpu_query_firmware_version(device_handle, AMDGPU_INFO_FW_VCE, 0,
842d722e3fbSopenharmony_ci					  0, &version, &feature);
843d722e3fbSopenharmony_ci	CU_ASSERT_EQUAL(r, 0);
844d722e3fbSopenharmony_ci}
845d722e3fbSopenharmony_ci
846d722e3fbSopenharmony_cistatic void amdgpu_command_submission_gfx_separate_ibs(void)
847d722e3fbSopenharmony_ci{
848d722e3fbSopenharmony_ci	amdgpu_context_handle context_handle;
849d722e3fbSopenharmony_ci	amdgpu_bo_handle ib_result_handle, ib_result_ce_handle;
850d722e3fbSopenharmony_ci	void *ib_result_cpu, *ib_result_ce_cpu;
851d722e3fbSopenharmony_ci	uint64_t ib_result_mc_address, ib_result_ce_mc_address;
852d722e3fbSopenharmony_ci	struct amdgpu_cs_request ibs_request = {0};
853d722e3fbSopenharmony_ci	struct amdgpu_cs_ib_info ib_info[2];
854d722e3fbSopenharmony_ci	struct amdgpu_cs_fence fence_status = {0};
855d722e3fbSopenharmony_ci	uint32_t *ptr;
856d722e3fbSopenharmony_ci	uint32_t expired;
857d722e3fbSopenharmony_ci	amdgpu_bo_list_handle bo_list;
858d722e3fbSopenharmony_ci	amdgpu_va_handle va_handle, va_handle_ce;
859d722e3fbSopenharmony_ci	int r, i = 0;
860d722e3fbSopenharmony_ci
861d722e3fbSopenharmony_ci	r = amdgpu_cs_ctx_create(device_handle, &context_handle);
862d722e3fbSopenharmony_ci	CU_ASSERT_EQUAL(r, 0);
863d722e3fbSopenharmony_ci
864d722e3fbSopenharmony_ci	r = amdgpu_bo_alloc_and_map(device_handle, 4096, 4096,
865d722e3fbSopenharmony_ci				    AMDGPU_GEM_DOMAIN_GTT, 0,
866d722e3fbSopenharmony_ci				    &ib_result_handle, &ib_result_cpu,
867d722e3fbSopenharmony_ci				    &ib_result_mc_address, &va_handle);
868d722e3fbSopenharmony_ci	CU_ASSERT_EQUAL(r, 0);
869d722e3fbSopenharmony_ci
870d722e3fbSopenharmony_ci	r = amdgpu_bo_alloc_and_map(device_handle, 4096, 4096,
871d722e3fbSopenharmony_ci				    AMDGPU_GEM_DOMAIN_GTT, 0,
872d722e3fbSopenharmony_ci				    &ib_result_ce_handle, &ib_result_ce_cpu,
873d722e3fbSopenharmony_ci				    &ib_result_ce_mc_address, &va_handle_ce);
874d722e3fbSopenharmony_ci	CU_ASSERT_EQUAL(r, 0);
875d722e3fbSopenharmony_ci
876d722e3fbSopenharmony_ci	r = amdgpu_get_bo_list(device_handle, ib_result_handle,
877d722e3fbSopenharmony_ci			       ib_result_ce_handle, &bo_list);
878d722e3fbSopenharmony_ci	CU_ASSERT_EQUAL(r, 0);
879d722e3fbSopenharmony_ci
880d722e3fbSopenharmony_ci	memset(ib_info, 0, 2 * sizeof(struct amdgpu_cs_ib_info));
881d722e3fbSopenharmony_ci
882d722e3fbSopenharmony_ci	/* IT_SET_CE_DE_COUNTERS */
883d722e3fbSopenharmony_ci	ptr = ib_result_ce_cpu;
884d722e3fbSopenharmony_ci	if (family_id != AMDGPU_FAMILY_SI) {
885d722e3fbSopenharmony_ci		ptr[i++] = 0xc0008900;
886d722e3fbSopenharmony_ci		ptr[i++] = 0;
887d722e3fbSopenharmony_ci	}
888d722e3fbSopenharmony_ci	ptr[i++] = 0xc0008400;
889d722e3fbSopenharmony_ci	ptr[i++] = 1;
890d722e3fbSopenharmony_ci	ib_info[0].ib_mc_address = ib_result_ce_mc_address;
891d722e3fbSopenharmony_ci	ib_info[0].size = i;
892d722e3fbSopenharmony_ci	ib_info[0].flags = AMDGPU_IB_FLAG_CE;
893d722e3fbSopenharmony_ci
894d722e3fbSopenharmony_ci	/* IT_WAIT_ON_CE_COUNTER */
895d722e3fbSopenharmony_ci	ptr = ib_result_cpu;
896d722e3fbSopenharmony_ci	ptr[0] = 0xc0008600;
897d722e3fbSopenharmony_ci	ptr[1] = 0x00000001;
898d722e3fbSopenharmony_ci	ib_info[1].ib_mc_address = ib_result_mc_address;
899d722e3fbSopenharmony_ci	ib_info[1].size = 2;
900d722e3fbSopenharmony_ci
901d722e3fbSopenharmony_ci	ibs_request.ip_type = AMDGPU_HW_IP_GFX;
902d722e3fbSopenharmony_ci	ibs_request.number_of_ibs = 2;
903d722e3fbSopenharmony_ci	ibs_request.ibs = ib_info;
904d722e3fbSopenharmony_ci	ibs_request.resources = bo_list;
905d722e3fbSopenharmony_ci	ibs_request.fence_info.handle = NULL;
906d722e3fbSopenharmony_ci
907d722e3fbSopenharmony_ci	r = amdgpu_cs_submit(context_handle, 0,&ibs_request, 1);
908d722e3fbSopenharmony_ci
909d722e3fbSopenharmony_ci	CU_ASSERT_EQUAL(r, 0);
910d722e3fbSopenharmony_ci
911d722e3fbSopenharmony_ci	fence_status.context = context_handle;
912d722e3fbSopenharmony_ci	fence_status.ip_type = AMDGPU_HW_IP_GFX;
913d722e3fbSopenharmony_ci	fence_status.ip_instance = 0;
914d722e3fbSopenharmony_ci	fence_status.fence = ibs_request.seq_no;
915d722e3fbSopenharmony_ci
916d722e3fbSopenharmony_ci	r = amdgpu_cs_query_fence_status(&fence_status,
917d722e3fbSopenharmony_ci					 AMDGPU_TIMEOUT_INFINITE,
918d722e3fbSopenharmony_ci					 0, &expired);
919d722e3fbSopenharmony_ci	CU_ASSERT_EQUAL(r, 0);
920d722e3fbSopenharmony_ci
921d722e3fbSopenharmony_ci	r = amdgpu_bo_unmap_and_free(ib_result_handle, va_handle,
922d722e3fbSopenharmony_ci				     ib_result_mc_address, 4096);
923d722e3fbSopenharmony_ci	CU_ASSERT_EQUAL(r, 0);
924d722e3fbSopenharmony_ci
925d722e3fbSopenharmony_ci	r = amdgpu_bo_unmap_and_free(ib_result_ce_handle, va_handle_ce,
926d722e3fbSopenharmony_ci				     ib_result_ce_mc_address, 4096);
927d722e3fbSopenharmony_ci	CU_ASSERT_EQUAL(r, 0);
928d722e3fbSopenharmony_ci
929d722e3fbSopenharmony_ci	r = amdgpu_bo_list_destroy(bo_list);
930d722e3fbSopenharmony_ci	CU_ASSERT_EQUAL(r, 0);
931d722e3fbSopenharmony_ci
932d722e3fbSopenharmony_ci	r = amdgpu_cs_ctx_free(context_handle);
933d722e3fbSopenharmony_ci	CU_ASSERT_EQUAL(r, 0);
934d722e3fbSopenharmony_ci
935d722e3fbSopenharmony_ci}
936d722e3fbSopenharmony_ci
937d722e3fbSopenharmony_cistatic void amdgpu_command_submission_gfx_shared_ib(void)
938d722e3fbSopenharmony_ci{
939d722e3fbSopenharmony_ci	amdgpu_context_handle context_handle;
940d722e3fbSopenharmony_ci	amdgpu_bo_handle ib_result_handle;
941d722e3fbSopenharmony_ci	void *ib_result_cpu;
942d722e3fbSopenharmony_ci	uint64_t ib_result_mc_address;
943d722e3fbSopenharmony_ci	struct amdgpu_cs_request ibs_request = {0};
944d722e3fbSopenharmony_ci	struct amdgpu_cs_ib_info ib_info[2];
945d722e3fbSopenharmony_ci	struct amdgpu_cs_fence fence_status = {0};
946d722e3fbSopenharmony_ci	uint32_t *ptr;
947d722e3fbSopenharmony_ci	uint32_t expired;
948d722e3fbSopenharmony_ci	amdgpu_bo_list_handle bo_list;
949d722e3fbSopenharmony_ci	amdgpu_va_handle va_handle;
950d722e3fbSopenharmony_ci	int r, i = 0;
951d722e3fbSopenharmony_ci
952d722e3fbSopenharmony_ci	r = amdgpu_cs_ctx_create(device_handle, &context_handle);
953d722e3fbSopenharmony_ci	CU_ASSERT_EQUAL(r, 0);
954d722e3fbSopenharmony_ci
955d722e3fbSopenharmony_ci	r = amdgpu_bo_alloc_and_map(device_handle, 4096, 4096,
956d722e3fbSopenharmony_ci				    AMDGPU_GEM_DOMAIN_GTT, 0,
957d722e3fbSopenharmony_ci				    &ib_result_handle, &ib_result_cpu,
958d722e3fbSopenharmony_ci				    &ib_result_mc_address, &va_handle);
959d722e3fbSopenharmony_ci	CU_ASSERT_EQUAL(r, 0);
960d722e3fbSopenharmony_ci
961d722e3fbSopenharmony_ci	r = amdgpu_get_bo_list(device_handle, ib_result_handle, NULL,
962d722e3fbSopenharmony_ci			       &bo_list);
963d722e3fbSopenharmony_ci	CU_ASSERT_EQUAL(r, 0);
964d722e3fbSopenharmony_ci
965d722e3fbSopenharmony_ci	memset(ib_info, 0, 2 * sizeof(struct amdgpu_cs_ib_info));
966d722e3fbSopenharmony_ci
967d722e3fbSopenharmony_ci	/* IT_SET_CE_DE_COUNTERS */
968d722e3fbSopenharmony_ci	ptr = ib_result_cpu;
969d722e3fbSopenharmony_ci	if (family_id != AMDGPU_FAMILY_SI) {
970d722e3fbSopenharmony_ci		ptr[i++] = 0xc0008900;
971d722e3fbSopenharmony_ci		ptr[i++] = 0;
972d722e3fbSopenharmony_ci	}
973d722e3fbSopenharmony_ci	ptr[i++] = 0xc0008400;
974d722e3fbSopenharmony_ci	ptr[i++] = 1;
975d722e3fbSopenharmony_ci	ib_info[0].ib_mc_address = ib_result_mc_address;
976d722e3fbSopenharmony_ci	ib_info[0].size = i;
977d722e3fbSopenharmony_ci	ib_info[0].flags = AMDGPU_IB_FLAG_CE;
978d722e3fbSopenharmony_ci
979d722e3fbSopenharmony_ci	ptr = (uint32_t *)ib_result_cpu + 4;
980d722e3fbSopenharmony_ci	ptr[0] = 0xc0008600;
981d722e3fbSopenharmony_ci	ptr[1] = 0x00000001;
982d722e3fbSopenharmony_ci	ib_info[1].ib_mc_address = ib_result_mc_address + 16;
983d722e3fbSopenharmony_ci	ib_info[1].size = 2;
984d722e3fbSopenharmony_ci
985d722e3fbSopenharmony_ci	ibs_request.ip_type = AMDGPU_HW_IP_GFX;
986d722e3fbSopenharmony_ci	ibs_request.number_of_ibs = 2;
987d722e3fbSopenharmony_ci	ibs_request.ibs = ib_info;
988d722e3fbSopenharmony_ci	ibs_request.resources = bo_list;
989d722e3fbSopenharmony_ci	ibs_request.fence_info.handle = NULL;
990d722e3fbSopenharmony_ci
991d722e3fbSopenharmony_ci	r = amdgpu_cs_submit(context_handle, 0, &ibs_request, 1);
992d722e3fbSopenharmony_ci
993d722e3fbSopenharmony_ci	CU_ASSERT_EQUAL(r, 0);
994d722e3fbSopenharmony_ci
995d722e3fbSopenharmony_ci	fence_status.context = context_handle;
996d722e3fbSopenharmony_ci	fence_status.ip_type = AMDGPU_HW_IP_GFX;
997d722e3fbSopenharmony_ci	fence_status.ip_instance = 0;
998d722e3fbSopenharmony_ci	fence_status.fence = ibs_request.seq_no;
999d722e3fbSopenharmony_ci
1000d722e3fbSopenharmony_ci	r = amdgpu_cs_query_fence_status(&fence_status,
1001d722e3fbSopenharmony_ci					 AMDGPU_TIMEOUT_INFINITE,
1002d722e3fbSopenharmony_ci					 0, &expired);
1003d722e3fbSopenharmony_ci	CU_ASSERT_EQUAL(r, 0);
1004d722e3fbSopenharmony_ci
1005d722e3fbSopenharmony_ci	r = amdgpu_bo_unmap_and_free(ib_result_handle, va_handle,
1006d722e3fbSopenharmony_ci				     ib_result_mc_address, 4096);
1007d722e3fbSopenharmony_ci	CU_ASSERT_EQUAL(r, 0);
1008d722e3fbSopenharmony_ci
1009d722e3fbSopenharmony_ci	r = amdgpu_bo_list_destroy(bo_list);
1010d722e3fbSopenharmony_ci	CU_ASSERT_EQUAL(r, 0);
1011d722e3fbSopenharmony_ci
1012d722e3fbSopenharmony_ci	r = amdgpu_cs_ctx_free(context_handle);
1013d722e3fbSopenharmony_ci	CU_ASSERT_EQUAL(r, 0);
1014d722e3fbSopenharmony_ci}
1015d722e3fbSopenharmony_ci
1016d722e3fbSopenharmony_cistatic void amdgpu_command_submission_gfx_cp_write_data(void)
1017d722e3fbSopenharmony_ci{
1018d722e3fbSopenharmony_ci	amdgpu_command_submission_write_linear_helper(AMDGPU_HW_IP_GFX);
1019d722e3fbSopenharmony_ci}
1020d722e3fbSopenharmony_ci
1021d722e3fbSopenharmony_cistatic void amdgpu_command_submission_gfx_cp_const_fill(void)
1022d722e3fbSopenharmony_ci{
1023d722e3fbSopenharmony_ci	amdgpu_command_submission_const_fill_helper(AMDGPU_HW_IP_GFX);
1024d722e3fbSopenharmony_ci}
1025d722e3fbSopenharmony_ci
1026d722e3fbSopenharmony_cistatic void amdgpu_command_submission_gfx_cp_copy_data(void)
1027d722e3fbSopenharmony_ci{
1028d722e3fbSopenharmony_ci	amdgpu_command_submission_copy_linear_helper(AMDGPU_HW_IP_GFX);
1029d722e3fbSopenharmony_ci}
1030d722e3fbSopenharmony_ci
1031d722e3fbSopenharmony_cistatic void amdgpu_bo_eviction_test(void)
1032d722e3fbSopenharmony_ci{
1033d722e3fbSopenharmony_ci	const int sdma_write_length = 1024;
1034d722e3fbSopenharmony_ci	const int pm4_dw = 256;
1035d722e3fbSopenharmony_ci	amdgpu_context_handle context_handle;
1036d722e3fbSopenharmony_ci	amdgpu_bo_handle bo1, bo2, vram_max[2], gtt_max[2];
1037d722e3fbSopenharmony_ci	amdgpu_bo_handle *resources;
1038d722e3fbSopenharmony_ci	uint32_t *pm4;
1039d722e3fbSopenharmony_ci	struct amdgpu_cs_ib_info *ib_info;
1040d722e3fbSopenharmony_ci	struct amdgpu_cs_request *ibs_request;
1041d722e3fbSopenharmony_ci	uint64_t bo1_mc, bo2_mc;
1042d722e3fbSopenharmony_ci	volatile unsigned char *bo1_cpu, *bo2_cpu;
1043d722e3fbSopenharmony_ci	int i, j, r, loop1, loop2;
1044d722e3fbSopenharmony_ci	uint64_t gtt_flags[2] = {0, AMDGPU_GEM_CREATE_CPU_GTT_USWC};
1045d722e3fbSopenharmony_ci	amdgpu_va_handle bo1_va_handle, bo2_va_handle;
1046d722e3fbSopenharmony_ci	struct amdgpu_heap_info vram_info, gtt_info;
1047d722e3fbSopenharmony_ci
1048d722e3fbSopenharmony_ci	pm4 = calloc(pm4_dw, sizeof(*pm4));
1049d722e3fbSopenharmony_ci	CU_ASSERT_NOT_EQUAL(pm4, NULL);
1050d722e3fbSopenharmony_ci
1051d722e3fbSopenharmony_ci	ib_info = calloc(1, sizeof(*ib_info));
1052d722e3fbSopenharmony_ci	CU_ASSERT_NOT_EQUAL(ib_info, NULL);
1053d722e3fbSopenharmony_ci
1054d722e3fbSopenharmony_ci	ibs_request = calloc(1, sizeof(*ibs_request));
1055d722e3fbSopenharmony_ci	CU_ASSERT_NOT_EQUAL(ibs_request, NULL);
1056d722e3fbSopenharmony_ci
1057d722e3fbSopenharmony_ci	r = amdgpu_cs_ctx_create(device_handle, &context_handle);
1058d722e3fbSopenharmony_ci	CU_ASSERT_EQUAL(r, 0);
1059d722e3fbSopenharmony_ci
1060d722e3fbSopenharmony_ci	/* prepare resource */
1061d722e3fbSopenharmony_ci	resources = calloc(4, sizeof(amdgpu_bo_handle));
1062d722e3fbSopenharmony_ci	CU_ASSERT_NOT_EQUAL(resources, NULL);
1063d722e3fbSopenharmony_ci
1064d722e3fbSopenharmony_ci	r = amdgpu_query_heap_info(device_handle, AMDGPU_GEM_DOMAIN_VRAM,
1065d722e3fbSopenharmony_ci				   0, &vram_info);
1066d722e3fbSopenharmony_ci	CU_ASSERT_EQUAL(r, 0);
1067d722e3fbSopenharmony_ci
1068d722e3fbSopenharmony_ci	r = amdgpu_bo_alloc_wrap(device_handle, vram_info.max_allocation, 4096,
1069d722e3fbSopenharmony_ci				 AMDGPU_GEM_DOMAIN_VRAM, 0, &vram_max[0]);
1070d722e3fbSopenharmony_ci	CU_ASSERT_EQUAL(r, 0);
1071d722e3fbSopenharmony_ci	r = amdgpu_bo_alloc_wrap(device_handle, vram_info.max_allocation, 4096,
1072d722e3fbSopenharmony_ci				 AMDGPU_GEM_DOMAIN_VRAM, 0, &vram_max[1]);
1073d722e3fbSopenharmony_ci	CU_ASSERT_EQUAL(r, 0);
1074d722e3fbSopenharmony_ci
1075d722e3fbSopenharmony_ci	r = amdgpu_query_heap_info(device_handle, AMDGPU_GEM_DOMAIN_GTT,
1076d722e3fbSopenharmony_ci				   0, &gtt_info);
1077d722e3fbSopenharmony_ci	CU_ASSERT_EQUAL(r, 0);
1078d722e3fbSopenharmony_ci
1079d722e3fbSopenharmony_ci	r = amdgpu_bo_alloc_wrap(device_handle, gtt_info.max_allocation, 4096,
1080d722e3fbSopenharmony_ci				 AMDGPU_GEM_DOMAIN_GTT, 0, &gtt_max[0]);
1081d722e3fbSopenharmony_ci	CU_ASSERT_EQUAL(r, 0);
1082d722e3fbSopenharmony_ci	r = amdgpu_bo_alloc_wrap(device_handle, gtt_info.max_allocation, 4096,
1083d722e3fbSopenharmony_ci				 AMDGPU_GEM_DOMAIN_GTT, 0, &gtt_max[1]);
1084d722e3fbSopenharmony_ci	CU_ASSERT_EQUAL(r, 0);
1085d722e3fbSopenharmony_ci
1086d722e3fbSopenharmony_ci
1087d722e3fbSopenharmony_ci
1088d722e3fbSopenharmony_ci	loop1 = loop2 = 0;
1089d722e3fbSopenharmony_ci	/* run 9 circle to test all mapping combination */
1090d722e3fbSopenharmony_ci	while(loop1 < 2) {
1091d722e3fbSopenharmony_ci		while(loop2 < 2) {
1092d722e3fbSopenharmony_ci			/* allocate UC bo1for sDMA use */
1093d722e3fbSopenharmony_ci			r = amdgpu_bo_alloc_and_map(device_handle,
1094d722e3fbSopenharmony_ci						    sdma_write_length, 4096,
1095d722e3fbSopenharmony_ci						    AMDGPU_GEM_DOMAIN_GTT,
1096d722e3fbSopenharmony_ci						    gtt_flags[loop1], &bo1,
1097d722e3fbSopenharmony_ci						    (void**)&bo1_cpu, &bo1_mc,
1098d722e3fbSopenharmony_ci						    &bo1_va_handle);
1099d722e3fbSopenharmony_ci			CU_ASSERT_EQUAL(r, 0);
1100d722e3fbSopenharmony_ci
1101d722e3fbSopenharmony_ci			/* set bo1 */
1102d722e3fbSopenharmony_ci			memset((void*)bo1_cpu, 0xaa, sdma_write_length);
1103d722e3fbSopenharmony_ci
1104d722e3fbSopenharmony_ci			/* allocate UC bo2 for sDMA use */
1105d722e3fbSopenharmony_ci			r = amdgpu_bo_alloc_and_map(device_handle,
1106d722e3fbSopenharmony_ci						    sdma_write_length, 4096,
1107d722e3fbSopenharmony_ci						    AMDGPU_GEM_DOMAIN_GTT,
1108d722e3fbSopenharmony_ci						    gtt_flags[loop2], &bo2,
1109d722e3fbSopenharmony_ci						    (void**)&bo2_cpu, &bo2_mc,
1110d722e3fbSopenharmony_ci						    &bo2_va_handle);
1111d722e3fbSopenharmony_ci			CU_ASSERT_EQUAL(r, 0);
1112d722e3fbSopenharmony_ci
1113d722e3fbSopenharmony_ci			/* clear bo2 */
1114d722e3fbSopenharmony_ci			memset((void*)bo2_cpu, 0, sdma_write_length);
1115d722e3fbSopenharmony_ci
1116d722e3fbSopenharmony_ci			resources[0] = bo1;
1117d722e3fbSopenharmony_ci			resources[1] = bo2;
1118d722e3fbSopenharmony_ci			resources[2] = vram_max[loop2];
1119d722e3fbSopenharmony_ci			resources[3] = gtt_max[loop2];
1120d722e3fbSopenharmony_ci
1121d722e3fbSopenharmony_ci			/* fulfill PM4: test DMA copy linear */
1122d722e3fbSopenharmony_ci			i = j = 0;
1123d722e3fbSopenharmony_ci			if (family_id == AMDGPU_FAMILY_SI) {
1124d722e3fbSopenharmony_ci				pm4[i++] = SDMA_PACKET_SI(SDMA_OPCODE_COPY_SI, 0, 0, 0,
1125d722e3fbSopenharmony_ci							  sdma_write_length);
1126d722e3fbSopenharmony_ci				pm4[i++] = 0xffffffff & bo2_mc;
1127d722e3fbSopenharmony_ci				pm4[i++] = 0xffffffff & bo1_mc;
1128d722e3fbSopenharmony_ci				pm4[i++] = (0xffffffff00000000 & bo2_mc) >> 32;
1129d722e3fbSopenharmony_ci				pm4[i++] = (0xffffffff00000000 & bo1_mc) >> 32;
1130d722e3fbSopenharmony_ci			} else {
1131d722e3fbSopenharmony_ci				pm4[i++] = SDMA_PACKET(SDMA_OPCODE_COPY, SDMA_COPY_SUB_OPCODE_LINEAR, 0);
1132d722e3fbSopenharmony_ci				if (family_id >= AMDGPU_FAMILY_AI)
1133d722e3fbSopenharmony_ci					pm4[i++] = sdma_write_length - 1;
1134d722e3fbSopenharmony_ci				else
1135d722e3fbSopenharmony_ci					pm4[i++] = sdma_write_length;
1136d722e3fbSopenharmony_ci				pm4[i++] = 0;
1137d722e3fbSopenharmony_ci				pm4[i++] = 0xffffffff & bo1_mc;
1138d722e3fbSopenharmony_ci				pm4[i++] = (0xffffffff00000000 & bo1_mc) >> 32;
1139d722e3fbSopenharmony_ci				pm4[i++] = 0xffffffff & bo2_mc;
1140d722e3fbSopenharmony_ci				pm4[i++] = (0xffffffff00000000 & bo2_mc) >> 32;
1141d722e3fbSopenharmony_ci			}
1142d722e3fbSopenharmony_ci
1143d722e3fbSopenharmony_ci			amdgpu_test_exec_cs_helper(context_handle,
1144d722e3fbSopenharmony_ci						   AMDGPU_HW_IP_DMA, 0,
1145d722e3fbSopenharmony_ci						   i, pm4,
1146d722e3fbSopenharmony_ci						   4, resources,
1147d722e3fbSopenharmony_ci						   ib_info, ibs_request);
1148d722e3fbSopenharmony_ci
1149d722e3fbSopenharmony_ci			/* verify if SDMA test result meets with expected */
1150d722e3fbSopenharmony_ci			i = 0;
1151d722e3fbSopenharmony_ci			while(i < sdma_write_length) {
1152d722e3fbSopenharmony_ci				CU_ASSERT_EQUAL(bo2_cpu[i++], 0xaa);
1153d722e3fbSopenharmony_ci			}
1154d722e3fbSopenharmony_ci			r = amdgpu_bo_unmap_and_free(bo1, bo1_va_handle, bo1_mc,
1155d722e3fbSopenharmony_ci						     sdma_write_length);
1156d722e3fbSopenharmony_ci			CU_ASSERT_EQUAL(r, 0);
1157d722e3fbSopenharmony_ci			r = amdgpu_bo_unmap_and_free(bo2, bo2_va_handle, bo2_mc,
1158d722e3fbSopenharmony_ci						     sdma_write_length);
1159d722e3fbSopenharmony_ci			CU_ASSERT_EQUAL(r, 0);
1160d722e3fbSopenharmony_ci			loop2++;
1161d722e3fbSopenharmony_ci		}
1162d722e3fbSopenharmony_ci		loop2 = 0;
1163d722e3fbSopenharmony_ci		loop1++;
1164d722e3fbSopenharmony_ci	}
1165d722e3fbSopenharmony_ci	amdgpu_bo_free(vram_max[0]);
1166d722e3fbSopenharmony_ci	amdgpu_bo_free(vram_max[1]);
1167d722e3fbSopenharmony_ci	amdgpu_bo_free(gtt_max[0]);
1168d722e3fbSopenharmony_ci	amdgpu_bo_free(gtt_max[1]);
1169d722e3fbSopenharmony_ci	/* clean resources */
1170d722e3fbSopenharmony_ci	free(resources);
1171d722e3fbSopenharmony_ci	free(ibs_request);
1172d722e3fbSopenharmony_ci	free(ib_info);
1173d722e3fbSopenharmony_ci	free(pm4);
1174d722e3fbSopenharmony_ci
1175d722e3fbSopenharmony_ci	/* end of test */
1176d722e3fbSopenharmony_ci	r = amdgpu_cs_ctx_free(context_handle);
1177d722e3fbSopenharmony_ci	CU_ASSERT_EQUAL(r, 0);
1178d722e3fbSopenharmony_ci}
1179d722e3fbSopenharmony_ci
1180d722e3fbSopenharmony_ci
1181d722e3fbSopenharmony_cistatic void amdgpu_command_submission_gfx(void)
1182d722e3fbSopenharmony_ci{
1183d722e3fbSopenharmony_ci	/* write data using the CP */
1184d722e3fbSopenharmony_ci	amdgpu_command_submission_gfx_cp_write_data();
1185d722e3fbSopenharmony_ci	/* const fill using the CP */
1186d722e3fbSopenharmony_ci	amdgpu_command_submission_gfx_cp_const_fill();
1187d722e3fbSopenharmony_ci	/* copy data using the CP */
1188d722e3fbSopenharmony_ci	amdgpu_command_submission_gfx_cp_copy_data();
1189d722e3fbSopenharmony_ci	/* separate IB buffers for multi-IB submission */
1190d722e3fbSopenharmony_ci	amdgpu_command_submission_gfx_separate_ibs();
1191d722e3fbSopenharmony_ci	/* shared IB buffer for multi-IB submission */
1192d722e3fbSopenharmony_ci	amdgpu_command_submission_gfx_shared_ib();
1193d722e3fbSopenharmony_ci}
1194d722e3fbSopenharmony_ci
1195d722e3fbSopenharmony_cistatic void amdgpu_semaphore_test(void)
1196d722e3fbSopenharmony_ci{
1197d722e3fbSopenharmony_ci	amdgpu_context_handle context_handle[2];
1198d722e3fbSopenharmony_ci	amdgpu_semaphore_handle sem;
1199d722e3fbSopenharmony_ci	amdgpu_bo_handle ib_result_handle[2];
1200d722e3fbSopenharmony_ci	void *ib_result_cpu[2];
1201d722e3fbSopenharmony_ci	uint64_t ib_result_mc_address[2];
1202d722e3fbSopenharmony_ci	struct amdgpu_cs_request ibs_request[2] = {0};
1203d722e3fbSopenharmony_ci	struct amdgpu_cs_ib_info ib_info[2] = {0};
1204d722e3fbSopenharmony_ci	struct amdgpu_cs_fence fence_status = {0};
1205d722e3fbSopenharmony_ci	uint32_t *ptr;
1206d722e3fbSopenharmony_ci	uint32_t expired;
1207d722e3fbSopenharmony_ci	uint32_t sdma_nop, gfx_nop;
1208d722e3fbSopenharmony_ci	amdgpu_bo_list_handle bo_list[2];
1209d722e3fbSopenharmony_ci	amdgpu_va_handle va_handle[2];
1210d722e3fbSopenharmony_ci	int r, i;
1211d722e3fbSopenharmony_ci	struct amdgpu_gpu_info gpu_info = {0};
1212d722e3fbSopenharmony_ci	unsigned gc_ip_type;
1213d722e3fbSopenharmony_ci
1214d722e3fbSopenharmony_ci	r = amdgpu_query_gpu_info(device_handle, &gpu_info);
1215d722e3fbSopenharmony_ci	CU_ASSERT_EQUAL(r, 0);
1216d722e3fbSopenharmony_ci
1217d722e3fbSopenharmony_ci	gc_ip_type = (asic_is_gfx_pipe_removed(family_id, chip_id, chip_rev)) ?
1218d722e3fbSopenharmony_ci			AMDGPU_HW_IP_COMPUTE : AMDGPU_HW_IP_GFX;
1219d722e3fbSopenharmony_ci
1220d722e3fbSopenharmony_ci	if (family_id == AMDGPU_FAMILY_SI) {
1221d722e3fbSopenharmony_ci		sdma_nop = SDMA_PACKET_SI(SDMA_NOP_SI, 0, 0, 0, 0);
1222d722e3fbSopenharmony_ci		gfx_nop = GFX_COMPUTE_NOP_SI;
1223d722e3fbSopenharmony_ci	} else {
1224d722e3fbSopenharmony_ci		sdma_nop = SDMA_PKT_HEADER_OP(SDMA_NOP);
1225d722e3fbSopenharmony_ci		gfx_nop = GFX_COMPUTE_NOP;
1226d722e3fbSopenharmony_ci	}
1227d722e3fbSopenharmony_ci
1228d722e3fbSopenharmony_ci	r = amdgpu_cs_create_semaphore(&sem);
1229d722e3fbSopenharmony_ci	CU_ASSERT_EQUAL(r, 0);
1230d722e3fbSopenharmony_ci	for (i = 0; i < 2; i++) {
1231d722e3fbSopenharmony_ci		r = amdgpu_cs_ctx_create(device_handle, &context_handle[i]);
1232d722e3fbSopenharmony_ci		CU_ASSERT_EQUAL(r, 0);
1233d722e3fbSopenharmony_ci
1234d722e3fbSopenharmony_ci		r = amdgpu_bo_alloc_and_map(device_handle, 4096, 4096,
1235d722e3fbSopenharmony_ci					    AMDGPU_GEM_DOMAIN_GTT, 0,
1236d722e3fbSopenharmony_ci					    &ib_result_handle[i], &ib_result_cpu[i],
1237d722e3fbSopenharmony_ci					    &ib_result_mc_address[i], &va_handle[i]);
1238d722e3fbSopenharmony_ci		CU_ASSERT_EQUAL(r, 0);
1239d722e3fbSopenharmony_ci
1240d722e3fbSopenharmony_ci		r = amdgpu_get_bo_list(device_handle, ib_result_handle[i],
1241d722e3fbSopenharmony_ci				       NULL, &bo_list[i]);
1242d722e3fbSopenharmony_ci		CU_ASSERT_EQUAL(r, 0);
1243d722e3fbSopenharmony_ci	}
1244d722e3fbSopenharmony_ci
1245d722e3fbSopenharmony_ci	/* 1. same context different engine */
1246d722e3fbSopenharmony_ci	ptr = ib_result_cpu[0];
1247d722e3fbSopenharmony_ci	ptr[0] = sdma_nop;
1248d722e3fbSopenharmony_ci	ib_info[0].ib_mc_address = ib_result_mc_address[0];
1249d722e3fbSopenharmony_ci	ib_info[0].size = 1;
1250d722e3fbSopenharmony_ci
1251d722e3fbSopenharmony_ci	ibs_request[0].ip_type = AMDGPU_HW_IP_DMA;
1252d722e3fbSopenharmony_ci	ibs_request[0].number_of_ibs = 1;
1253d722e3fbSopenharmony_ci	ibs_request[0].ibs = &ib_info[0];
1254d722e3fbSopenharmony_ci	ibs_request[0].resources = bo_list[0];
1255d722e3fbSopenharmony_ci	ibs_request[0].fence_info.handle = NULL;
1256d722e3fbSopenharmony_ci	r = amdgpu_cs_submit(context_handle[0], 0,&ibs_request[0], 1);
1257d722e3fbSopenharmony_ci	CU_ASSERT_EQUAL(r, 0);
1258d722e3fbSopenharmony_ci	r = amdgpu_cs_signal_semaphore(context_handle[0], AMDGPU_HW_IP_DMA, 0, 0, sem);
1259d722e3fbSopenharmony_ci	CU_ASSERT_EQUAL(r, 0);
1260d722e3fbSopenharmony_ci
1261d722e3fbSopenharmony_ci	r = amdgpu_cs_wait_semaphore(context_handle[0], gc_ip_type, 0, 0, sem);
1262d722e3fbSopenharmony_ci	CU_ASSERT_EQUAL(r, 0);
1263d722e3fbSopenharmony_ci	ptr = ib_result_cpu[1];
1264d722e3fbSopenharmony_ci	ptr[0] = gfx_nop;
1265d722e3fbSopenharmony_ci	ib_info[1].ib_mc_address = ib_result_mc_address[1];
1266d722e3fbSopenharmony_ci	ib_info[1].size = 1;
1267d722e3fbSopenharmony_ci
1268d722e3fbSopenharmony_ci	ibs_request[1].ip_type = gc_ip_type;
1269d722e3fbSopenharmony_ci	ibs_request[1].number_of_ibs = 1;
1270d722e3fbSopenharmony_ci	ibs_request[1].ibs = &ib_info[1];
1271d722e3fbSopenharmony_ci	ibs_request[1].resources = bo_list[1];
1272d722e3fbSopenharmony_ci	ibs_request[1].fence_info.handle = NULL;
1273d722e3fbSopenharmony_ci
1274d722e3fbSopenharmony_ci	r = amdgpu_cs_submit(context_handle[0], 0,&ibs_request[1], 1);
1275d722e3fbSopenharmony_ci	CU_ASSERT_EQUAL(r, 0);
1276d722e3fbSopenharmony_ci
1277d722e3fbSopenharmony_ci	fence_status.context = context_handle[0];
1278d722e3fbSopenharmony_ci	fence_status.ip_type = gc_ip_type;
1279d722e3fbSopenharmony_ci	fence_status.ip_instance = 0;
1280d722e3fbSopenharmony_ci	fence_status.fence = ibs_request[1].seq_no;
1281d722e3fbSopenharmony_ci	r = amdgpu_cs_query_fence_status(&fence_status,
1282d722e3fbSopenharmony_ci					 500000000, 0, &expired);
1283d722e3fbSopenharmony_ci	CU_ASSERT_EQUAL(r, 0);
1284d722e3fbSopenharmony_ci	CU_ASSERT_EQUAL(expired, true);
1285d722e3fbSopenharmony_ci
1286d722e3fbSopenharmony_ci	/* 2. same engine different context */
1287d722e3fbSopenharmony_ci	ptr = ib_result_cpu[0];
1288d722e3fbSopenharmony_ci	ptr[0] = gfx_nop;
1289d722e3fbSopenharmony_ci	ib_info[0].ib_mc_address = ib_result_mc_address[0];
1290d722e3fbSopenharmony_ci	ib_info[0].size = 1;
1291d722e3fbSopenharmony_ci
1292d722e3fbSopenharmony_ci	ibs_request[0].ip_type = gc_ip_type;
1293d722e3fbSopenharmony_ci	ibs_request[0].number_of_ibs = 1;
1294d722e3fbSopenharmony_ci	ibs_request[0].ibs = &ib_info[0];
1295d722e3fbSopenharmony_ci	ibs_request[0].resources = bo_list[0];
1296d722e3fbSopenharmony_ci	ibs_request[0].fence_info.handle = NULL;
1297d722e3fbSopenharmony_ci	r = amdgpu_cs_submit(context_handle[0], 0,&ibs_request[0], 1);
1298d722e3fbSopenharmony_ci	CU_ASSERT_EQUAL(r, 0);
1299d722e3fbSopenharmony_ci	r = amdgpu_cs_signal_semaphore(context_handle[0], gc_ip_type, 0, 0, sem);
1300d722e3fbSopenharmony_ci	CU_ASSERT_EQUAL(r, 0);
1301d722e3fbSopenharmony_ci
1302d722e3fbSopenharmony_ci	r = amdgpu_cs_wait_semaphore(context_handle[1], gc_ip_type, 0, 0, sem);
1303d722e3fbSopenharmony_ci	CU_ASSERT_EQUAL(r, 0);
1304d722e3fbSopenharmony_ci	ptr = ib_result_cpu[1];
1305d722e3fbSopenharmony_ci	ptr[0] = gfx_nop;
1306d722e3fbSopenharmony_ci	ib_info[1].ib_mc_address = ib_result_mc_address[1];
1307d722e3fbSopenharmony_ci	ib_info[1].size = 1;
1308d722e3fbSopenharmony_ci
1309d722e3fbSopenharmony_ci	ibs_request[1].ip_type = gc_ip_type;
1310d722e3fbSopenharmony_ci	ibs_request[1].number_of_ibs = 1;
1311d722e3fbSopenharmony_ci	ibs_request[1].ibs = &ib_info[1];
1312d722e3fbSopenharmony_ci	ibs_request[1].resources = bo_list[1];
1313d722e3fbSopenharmony_ci	ibs_request[1].fence_info.handle = NULL;
1314d722e3fbSopenharmony_ci	r = amdgpu_cs_submit(context_handle[1], 0,&ibs_request[1], 1);
1315d722e3fbSopenharmony_ci
1316d722e3fbSopenharmony_ci	CU_ASSERT_EQUAL(r, 0);
1317d722e3fbSopenharmony_ci
1318d722e3fbSopenharmony_ci	fence_status.context = context_handle[1];
1319d722e3fbSopenharmony_ci	fence_status.ip_type = gc_ip_type;
1320d722e3fbSopenharmony_ci	fence_status.ip_instance = 0;
1321d722e3fbSopenharmony_ci	fence_status.fence = ibs_request[1].seq_no;
1322d722e3fbSopenharmony_ci	r = amdgpu_cs_query_fence_status(&fence_status,
1323d722e3fbSopenharmony_ci					 500000000, 0, &expired);
1324d722e3fbSopenharmony_ci	CU_ASSERT_EQUAL(r, 0);
1325d722e3fbSopenharmony_ci	CU_ASSERT_EQUAL(expired, true);
1326d722e3fbSopenharmony_ci
1327d722e3fbSopenharmony_ci	for (i = 0; i < 2; i++) {
1328d722e3fbSopenharmony_ci		r = amdgpu_bo_unmap_and_free(ib_result_handle[i], va_handle[i],
1329d722e3fbSopenharmony_ci					     ib_result_mc_address[i], 4096);
1330d722e3fbSopenharmony_ci		CU_ASSERT_EQUAL(r, 0);
1331d722e3fbSopenharmony_ci
1332d722e3fbSopenharmony_ci		r = amdgpu_bo_list_destroy(bo_list[i]);
1333d722e3fbSopenharmony_ci		CU_ASSERT_EQUAL(r, 0);
1334d722e3fbSopenharmony_ci
1335d722e3fbSopenharmony_ci		r = amdgpu_cs_ctx_free(context_handle[i]);
1336d722e3fbSopenharmony_ci		CU_ASSERT_EQUAL(r, 0);
1337d722e3fbSopenharmony_ci	}
1338d722e3fbSopenharmony_ci
1339d722e3fbSopenharmony_ci	r = amdgpu_cs_destroy_semaphore(sem);
1340d722e3fbSopenharmony_ci	CU_ASSERT_EQUAL(r, 0);
1341d722e3fbSopenharmony_ci}
1342d722e3fbSopenharmony_ci
1343d722e3fbSopenharmony_cistatic void amdgpu_command_submission_compute_nop(void)
1344d722e3fbSopenharmony_ci{
1345d722e3fbSopenharmony_ci	amdgpu_context_handle context_handle;
1346d722e3fbSopenharmony_ci	amdgpu_bo_handle ib_result_handle;
1347d722e3fbSopenharmony_ci	void *ib_result_cpu;
1348d722e3fbSopenharmony_ci	uint64_t ib_result_mc_address;
1349d722e3fbSopenharmony_ci	struct amdgpu_cs_request ibs_request;
1350d722e3fbSopenharmony_ci	struct amdgpu_cs_ib_info ib_info;
1351d722e3fbSopenharmony_ci	struct amdgpu_cs_fence fence_status;
1352d722e3fbSopenharmony_ci	uint32_t *ptr;
1353d722e3fbSopenharmony_ci	uint32_t expired;
1354d722e3fbSopenharmony_ci	int r, instance;
1355d722e3fbSopenharmony_ci	amdgpu_bo_list_handle bo_list;
1356d722e3fbSopenharmony_ci	amdgpu_va_handle va_handle;
1357d722e3fbSopenharmony_ci	struct drm_amdgpu_info_hw_ip info;
1358d722e3fbSopenharmony_ci
1359d722e3fbSopenharmony_ci	r = amdgpu_query_hw_ip_info(device_handle, AMDGPU_HW_IP_COMPUTE, 0, &info);
1360d722e3fbSopenharmony_ci	CU_ASSERT_EQUAL(r, 0);
1361d722e3fbSopenharmony_ci
1362d722e3fbSopenharmony_ci	r = amdgpu_cs_ctx_create(device_handle, &context_handle);
1363d722e3fbSopenharmony_ci	CU_ASSERT_EQUAL(r, 0);
1364d722e3fbSopenharmony_ci
1365d722e3fbSopenharmony_ci	for (instance = 0; (1 << instance) & info.available_rings; instance++) {
1366d722e3fbSopenharmony_ci		r = amdgpu_bo_alloc_and_map(device_handle, 4096, 4096,
1367d722e3fbSopenharmony_ci					    AMDGPU_GEM_DOMAIN_GTT, 0,
1368d722e3fbSopenharmony_ci					    &ib_result_handle, &ib_result_cpu,
1369d722e3fbSopenharmony_ci					    &ib_result_mc_address, &va_handle);
1370d722e3fbSopenharmony_ci		CU_ASSERT_EQUAL(r, 0);
1371d722e3fbSopenharmony_ci
1372d722e3fbSopenharmony_ci		r = amdgpu_get_bo_list(device_handle, ib_result_handle, NULL,
1373d722e3fbSopenharmony_ci				       &bo_list);
1374d722e3fbSopenharmony_ci		CU_ASSERT_EQUAL(r, 0);
1375d722e3fbSopenharmony_ci
1376d722e3fbSopenharmony_ci		ptr = ib_result_cpu;
1377d722e3fbSopenharmony_ci		memset(ptr, 0, 16);
1378d722e3fbSopenharmony_ci		ptr[0]=PACKET3(PACKET3_NOP, 14);
1379d722e3fbSopenharmony_ci
1380d722e3fbSopenharmony_ci		memset(&ib_info, 0, sizeof(struct amdgpu_cs_ib_info));
1381d722e3fbSopenharmony_ci		ib_info.ib_mc_address = ib_result_mc_address;
1382d722e3fbSopenharmony_ci		ib_info.size = 16;
1383d722e3fbSopenharmony_ci
1384d722e3fbSopenharmony_ci		memset(&ibs_request, 0, sizeof(struct amdgpu_cs_request));
1385d722e3fbSopenharmony_ci		ibs_request.ip_type = AMDGPU_HW_IP_COMPUTE;
1386d722e3fbSopenharmony_ci		ibs_request.ring = instance;
1387d722e3fbSopenharmony_ci		ibs_request.number_of_ibs = 1;
1388d722e3fbSopenharmony_ci		ibs_request.ibs = &ib_info;
1389d722e3fbSopenharmony_ci		ibs_request.resources = bo_list;
1390d722e3fbSopenharmony_ci		ibs_request.fence_info.handle = NULL;
1391d722e3fbSopenharmony_ci
1392d722e3fbSopenharmony_ci		memset(&fence_status, 0, sizeof(struct amdgpu_cs_fence));
1393d722e3fbSopenharmony_ci		r = amdgpu_cs_submit(context_handle, 0,&ibs_request, 1);
1394d722e3fbSopenharmony_ci		CU_ASSERT_EQUAL(r, 0);
1395d722e3fbSopenharmony_ci
1396d722e3fbSopenharmony_ci		fence_status.context = context_handle;
1397d722e3fbSopenharmony_ci		fence_status.ip_type = AMDGPU_HW_IP_COMPUTE;
1398d722e3fbSopenharmony_ci		fence_status.ip_instance = 0;
1399d722e3fbSopenharmony_ci		fence_status.ring = instance;
1400d722e3fbSopenharmony_ci		fence_status.fence = ibs_request.seq_no;
1401d722e3fbSopenharmony_ci
1402d722e3fbSopenharmony_ci		r = amdgpu_cs_query_fence_status(&fence_status,
1403d722e3fbSopenharmony_ci						 AMDGPU_TIMEOUT_INFINITE,
1404d722e3fbSopenharmony_ci						 0, &expired);
1405d722e3fbSopenharmony_ci		CU_ASSERT_EQUAL(r, 0);
1406d722e3fbSopenharmony_ci
1407d722e3fbSopenharmony_ci		r = amdgpu_bo_list_destroy(bo_list);
1408d722e3fbSopenharmony_ci		CU_ASSERT_EQUAL(r, 0);
1409d722e3fbSopenharmony_ci
1410d722e3fbSopenharmony_ci		r = amdgpu_bo_unmap_and_free(ib_result_handle, va_handle,
1411d722e3fbSopenharmony_ci					     ib_result_mc_address, 4096);
1412d722e3fbSopenharmony_ci		CU_ASSERT_EQUAL(r, 0);
1413d722e3fbSopenharmony_ci	}
1414d722e3fbSopenharmony_ci
1415d722e3fbSopenharmony_ci	r = amdgpu_cs_ctx_free(context_handle);
1416d722e3fbSopenharmony_ci	CU_ASSERT_EQUAL(r, 0);
1417d722e3fbSopenharmony_ci}
1418d722e3fbSopenharmony_ci
1419d722e3fbSopenharmony_cistatic void amdgpu_command_submission_compute_cp_write_data(void)
1420d722e3fbSopenharmony_ci{
1421d722e3fbSopenharmony_ci	amdgpu_command_submission_write_linear_helper(AMDGPU_HW_IP_COMPUTE);
1422d722e3fbSopenharmony_ci}
1423d722e3fbSopenharmony_ci
1424d722e3fbSopenharmony_cistatic void amdgpu_command_submission_compute_cp_const_fill(void)
1425d722e3fbSopenharmony_ci{
1426d722e3fbSopenharmony_ci	amdgpu_command_submission_const_fill_helper(AMDGPU_HW_IP_COMPUTE);
1427d722e3fbSopenharmony_ci}
1428d722e3fbSopenharmony_ci
1429d722e3fbSopenharmony_cistatic void amdgpu_command_submission_compute_cp_copy_data(void)
1430d722e3fbSopenharmony_ci{
1431d722e3fbSopenharmony_ci	amdgpu_command_submission_copy_linear_helper(AMDGPU_HW_IP_COMPUTE);
1432d722e3fbSopenharmony_ci}
1433d722e3fbSopenharmony_ci
1434d722e3fbSopenharmony_cistatic void amdgpu_command_submission_compute(void)
1435d722e3fbSopenharmony_ci{
1436d722e3fbSopenharmony_ci	/* write data using the CP */
1437d722e3fbSopenharmony_ci	amdgpu_command_submission_compute_cp_write_data();
1438d722e3fbSopenharmony_ci	/* const fill using the CP */
1439d722e3fbSopenharmony_ci	amdgpu_command_submission_compute_cp_const_fill();
1440d722e3fbSopenharmony_ci	/* copy data using the CP */
1441d722e3fbSopenharmony_ci	amdgpu_command_submission_compute_cp_copy_data();
1442d722e3fbSopenharmony_ci	/* nop test */
1443d722e3fbSopenharmony_ci	amdgpu_command_submission_compute_nop();
1444d722e3fbSopenharmony_ci}
1445d722e3fbSopenharmony_ci
1446d722e3fbSopenharmony_ci/*
1447d722e3fbSopenharmony_ci * caller need create/release:
1448d722e3fbSopenharmony_ci * pm4_src, resources, ib_info, and ibs_request
1449d722e3fbSopenharmony_ci * submit command stream described in ibs_request and wait for this IB accomplished
1450d722e3fbSopenharmony_ci */
1451d722e3fbSopenharmony_civoid
1452d722e3fbSopenharmony_ciamdgpu_test_exec_cs_helper_raw(amdgpu_device_handle device_handle,
1453d722e3fbSopenharmony_ci			       amdgpu_context_handle context_handle,
1454d722e3fbSopenharmony_ci			       unsigned ip_type, int instance, int pm4_dw,
1455d722e3fbSopenharmony_ci			       uint32_t *pm4_src, int res_cnt,
1456d722e3fbSopenharmony_ci			       amdgpu_bo_handle *resources,
1457d722e3fbSopenharmony_ci			       struct amdgpu_cs_ib_info *ib_info,
1458d722e3fbSopenharmony_ci			       struct amdgpu_cs_request *ibs_request,
1459d722e3fbSopenharmony_ci			       bool secure)
1460d722e3fbSopenharmony_ci{
1461d722e3fbSopenharmony_ci	int r;
1462d722e3fbSopenharmony_ci	uint32_t expired;
1463d722e3fbSopenharmony_ci	uint32_t *ring_ptr;
1464d722e3fbSopenharmony_ci	amdgpu_bo_handle ib_result_handle;
1465d722e3fbSopenharmony_ci	void *ib_result_cpu;
1466d722e3fbSopenharmony_ci	uint64_t ib_result_mc_address;
1467d722e3fbSopenharmony_ci	struct amdgpu_cs_fence fence_status = {0};
1468d722e3fbSopenharmony_ci	amdgpu_bo_handle *all_res = alloca(sizeof(resources[0]) * (res_cnt + 1));
1469d722e3fbSopenharmony_ci	amdgpu_va_handle va_handle;
1470d722e3fbSopenharmony_ci
1471d722e3fbSopenharmony_ci	/* prepare CS */
1472d722e3fbSopenharmony_ci	CU_ASSERT_NOT_EQUAL(pm4_src, NULL);
1473d722e3fbSopenharmony_ci	CU_ASSERT_NOT_EQUAL(resources, NULL);
1474d722e3fbSopenharmony_ci	CU_ASSERT_NOT_EQUAL(ib_info, NULL);
1475d722e3fbSopenharmony_ci	CU_ASSERT_NOT_EQUAL(ibs_request, NULL);
1476d722e3fbSopenharmony_ci	CU_ASSERT_TRUE(pm4_dw <= 1024);
1477d722e3fbSopenharmony_ci
1478d722e3fbSopenharmony_ci	/* allocate IB */
1479d722e3fbSopenharmony_ci	r = amdgpu_bo_alloc_and_map(device_handle, 4096, 4096,
1480d722e3fbSopenharmony_ci				    AMDGPU_GEM_DOMAIN_GTT, 0,
1481d722e3fbSopenharmony_ci				    &ib_result_handle, &ib_result_cpu,
1482d722e3fbSopenharmony_ci				    &ib_result_mc_address, &va_handle);
1483d722e3fbSopenharmony_ci	CU_ASSERT_EQUAL(r, 0);
1484d722e3fbSopenharmony_ci
1485d722e3fbSopenharmony_ci	/* copy PM4 packet to ring from caller */
1486d722e3fbSopenharmony_ci	ring_ptr = ib_result_cpu;
1487d722e3fbSopenharmony_ci	memcpy(ring_ptr, pm4_src, pm4_dw * sizeof(*pm4_src));
1488d722e3fbSopenharmony_ci
1489d722e3fbSopenharmony_ci	ib_info->ib_mc_address = ib_result_mc_address;
1490d722e3fbSopenharmony_ci	ib_info->size = pm4_dw;
1491d722e3fbSopenharmony_ci	if (secure)
1492d722e3fbSopenharmony_ci		ib_info->flags |= AMDGPU_IB_FLAGS_SECURE;
1493d722e3fbSopenharmony_ci
1494d722e3fbSopenharmony_ci	ibs_request->ip_type = ip_type;
1495d722e3fbSopenharmony_ci	ibs_request->ring = instance;
1496d722e3fbSopenharmony_ci	ibs_request->number_of_ibs = 1;
1497d722e3fbSopenharmony_ci	ibs_request->ibs = ib_info;
1498d722e3fbSopenharmony_ci	ibs_request->fence_info.handle = NULL;
1499d722e3fbSopenharmony_ci
1500d722e3fbSopenharmony_ci	memcpy(all_res, resources, sizeof(resources[0]) * res_cnt);
1501d722e3fbSopenharmony_ci	all_res[res_cnt] = ib_result_handle;
1502d722e3fbSopenharmony_ci
1503d722e3fbSopenharmony_ci	r = amdgpu_bo_list_create(device_handle, res_cnt+1, all_res,
1504d722e3fbSopenharmony_ci				  NULL, &ibs_request->resources);
1505d722e3fbSopenharmony_ci	CU_ASSERT_EQUAL(r, 0);
1506d722e3fbSopenharmony_ci
1507d722e3fbSopenharmony_ci	CU_ASSERT_NOT_EQUAL(ibs_request, NULL);
1508d722e3fbSopenharmony_ci
1509d722e3fbSopenharmony_ci	/* submit CS */
1510d722e3fbSopenharmony_ci	r = amdgpu_cs_submit(context_handle, 0, ibs_request, 1);
1511d722e3fbSopenharmony_ci	CU_ASSERT_EQUAL(r, 0);
1512d722e3fbSopenharmony_ci
1513d722e3fbSopenharmony_ci	r = amdgpu_bo_list_destroy(ibs_request->resources);
1514d722e3fbSopenharmony_ci	CU_ASSERT_EQUAL(r, 0);
1515d722e3fbSopenharmony_ci
1516d722e3fbSopenharmony_ci	fence_status.ip_type = ip_type;
1517d722e3fbSopenharmony_ci	fence_status.ip_instance = 0;
1518d722e3fbSopenharmony_ci	fence_status.ring = ibs_request->ring;
1519d722e3fbSopenharmony_ci	fence_status.context = context_handle;
1520d722e3fbSopenharmony_ci	fence_status.fence = ibs_request->seq_no;
1521d722e3fbSopenharmony_ci
1522d722e3fbSopenharmony_ci	/* wait for IB accomplished */
1523d722e3fbSopenharmony_ci	r = amdgpu_cs_query_fence_status(&fence_status,
1524d722e3fbSopenharmony_ci					 AMDGPU_TIMEOUT_INFINITE,
1525d722e3fbSopenharmony_ci					 0, &expired);
1526d722e3fbSopenharmony_ci	CU_ASSERT_EQUAL(r, 0);
1527d722e3fbSopenharmony_ci	CU_ASSERT_EQUAL(expired, true);
1528d722e3fbSopenharmony_ci
1529d722e3fbSopenharmony_ci	r = amdgpu_bo_unmap_and_free(ib_result_handle, va_handle,
1530d722e3fbSopenharmony_ci				     ib_result_mc_address, 4096);
1531d722e3fbSopenharmony_ci	CU_ASSERT_EQUAL(r, 0);
1532d722e3fbSopenharmony_ci}
1533d722e3fbSopenharmony_ci
1534d722e3fbSopenharmony_cistatic void
1535d722e3fbSopenharmony_ciamdgpu_test_exec_cs_helper(amdgpu_context_handle context_handle,
1536d722e3fbSopenharmony_ci			   unsigned ip_type, int instance, int pm4_dw,
1537d722e3fbSopenharmony_ci			   uint32_t *pm4_src, int res_cnt,
1538d722e3fbSopenharmony_ci			   amdgpu_bo_handle *resources,
1539d722e3fbSopenharmony_ci			   struct amdgpu_cs_ib_info *ib_info,
1540d722e3fbSopenharmony_ci			   struct amdgpu_cs_request *ibs_request)
1541d722e3fbSopenharmony_ci{
1542d722e3fbSopenharmony_ci	amdgpu_test_exec_cs_helper_raw(device_handle, context_handle,
1543d722e3fbSopenharmony_ci				       ip_type, instance, pm4_dw, pm4_src,
1544d722e3fbSopenharmony_ci				       res_cnt, resources, ib_info,
1545d722e3fbSopenharmony_ci				       ibs_request, false);
1546d722e3fbSopenharmony_ci}
1547d722e3fbSopenharmony_ci
1548d722e3fbSopenharmony_civoid
1549d722e3fbSopenharmony_ciamdgpu_command_submission_write_linear_helper_with_secure(amdgpu_device_handle
1550d722e3fbSopenharmony_ci							  device, unsigned
1551d722e3fbSopenharmony_ci							  ip_type, bool secure)
1552d722e3fbSopenharmony_ci{
1553d722e3fbSopenharmony_ci	const int sdma_write_length = 128;
1554d722e3fbSopenharmony_ci	const int pm4_dw = 256;
1555d722e3fbSopenharmony_ci	amdgpu_context_handle context_handle;
1556d722e3fbSopenharmony_ci	amdgpu_bo_handle bo;
1557d722e3fbSopenharmony_ci	amdgpu_bo_handle *resources;
1558d722e3fbSopenharmony_ci	uint32_t *pm4;
1559d722e3fbSopenharmony_ci	struct amdgpu_cs_ib_info *ib_info;
1560d722e3fbSopenharmony_ci	struct amdgpu_cs_request *ibs_request;
1561d722e3fbSopenharmony_ci	uint64_t bo_mc;
1562d722e3fbSopenharmony_ci	volatile uint32_t *bo_cpu;
1563d722e3fbSopenharmony_ci	uint32_t bo_cpu_origin;
1564d722e3fbSopenharmony_ci	int i, j, r, loop, ring_id;
1565d722e3fbSopenharmony_ci	uint64_t gtt_flags[2] = {0, AMDGPU_GEM_CREATE_CPU_GTT_USWC};
1566d722e3fbSopenharmony_ci	amdgpu_va_handle va_handle;
1567d722e3fbSopenharmony_ci	struct drm_amdgpu_info_hw_ip hw_ip_info;
1568d722e3fbSopenharmony_ci
1569d722e3fbSopenharmony_ci	pm4 = calloc(pm4_dw, sizeof(*pm4));
1570d722e3fbSopenharmony_ci	CU_ASSERT_NOT_EQUAL(pm4, NULL);
1571d722e3fbSopenharmony_ci
1572d722e3fbSopenharmony_ci	ib_info = calloc(1, sizeof(*ib_info));
1573d722e3fbSopenharmony_ci	CU_ASSERT_NOT_EQUAL(ib_info, NULL);
1574d722e3fbSopenharmony_ci
1575d722e3fbSopenharmony_ci	ibs_request = calloc(1, sizeof(*ibs_request));
1576d722e3fbSopenharmony_ci	CU_ASSERT_NOT_EQUAL(ibs_request, NULL);
1577d722e3fbSopenharmony_ci
1578d722e3fbSopenharmony_ci	r = amdgpu_query_hw_ip_info(device, ip_type, 0, &hw_ip_info);
1579d722e3fbSopenharmony_ci	CU_ASSERT_EQUAL(r, 0);
1580d722e3fbSopenharmony_ci
1581d722e3fbSopenharmony_ci	for (i = 0; secure && (i < 2); i++)
1582d722e3fbSopenharmony_ci		gtt_flags[i] |= AMDGPU_GEM_CREATE_ENCRYPTED;
1583d722e3fbSopenharmony_ci
1584d722e3fbSopenharmony_ci	r = amdgpu_cs_ctx_create(device, &context_handle);
1585d722e3fbSopenharmony_ci
1586d722e3fbSopenharmony_ci	CU_ASSERT_EQUAL(r, 0);
1587d722e3fbSopenharmony_ci
1588d722e3fbSopenharmony_ci	/* prepare resource */
1589d722e3fbSopenharmony_ci	resources = calloc(1, sizeof(amdgpu_bo_handle));
1590d722e3fbSopenharmony_ci	CU_ASSERT_NOT_EQUAL(resources, NULL);
1591d722e3fbSopenharmony_ci
1592d722e3fbSopenharmony_ci	for (ring_id = 0; (1 << ring_id) & hw_ip_info.available_rings; ring_id++) {
1593d722e3fbSopenharmony_ci		loop = 0;
1594d722e3fbSopenharmony_ci		while(loop < 2) {
1595d722e3fbSopenharmony_ci			/* allocate UC bo for sDMA use */
1596d722e3fbSopenharmony_ci			r = amdgpu_bo_alloc_and_map(device,
1597d722e3fbSopenharmony_ci						    sdma_write_length * sizeof(uint32_t),
1598d722e3fbSopenharmony_ci						    4096, AMDGPU_GEM_DOMAIN_GTT,
1599d722e3fbSopenharmony_ci						    gtt_flags[loop], &bo, (void**)&bo_cpu,
1600d722e3fbSopenharmony_ci						    &bo_mc, &va_handle);
1601d722e3fbSopenharmony_ci			CU_ASSERT_EQUAL(r, 0);
1602d722e3fbSopenharmony_ci
1603d722e3fbSopenharmony_ci			/* clear bo */
1604d722e3fbSopenharmony_ci			memset((void*)bo_cpu, 0, sdma_write_length * sizeof(uint32_t));
1605d722e3fbSopenharmony_ci
1606d722e3fbSopenharmony_ci			resources[0] = bo;
1607d722e3fbSopenharmony_ci
1608d722e3fbSopenharmony_ci			/* fulfill PM4: test DMA write-linear */
1609d722e3fbSopenharmony_ci			i = j = 0;
1610d722e3fbSopenharmony_ci			if (ip_type == AMDGPU_HW_IP_DMA) {
1611d722e3fbSopenharmony_ci				if (family_id == AMDGPU_FAMILY_SI)
1612d722e3fbSopenharmony_ci					pm4[i++] = SDMA_PACKET_SI(SDMA_OPCODE_WRITE, 0, 0, 0,
1613d722e3fbSopenharmony_ci								  sdma_write_length);
1614d722e3fbSopenharmony_ci				else
1615d722e3fbSopenharmony_ci					pm4[i++] = SDMA_PACKET(SDMA_OPCODE_WRITE,
1616d722e3fbSopenharmony_ci							       SDMA_WRITE_SUB_OPCODE_LINEAR,
1617d722e3fbSopenharmony_ci							       secure ? SDMA_ATOMIC_TMZ(1) : 0);
1618d722e3fbSopenharmony_ci				pm4[i++] = 0xfffffffc & bo_mc;
1619d722e3fbSopenharmony_ci				pm4[i++] = (0xffffffff00000000 & bo_mc) >> 32;
1620d722e3fbSopenharmony_ci				if (family_id >= AMDGPU_FAMILY_AI)
1621d722e3fbSopenharmony_ci					pm4[i++] = sdma_write_length - 1;
1622d722e3fbSopenharmony_ci				else if (family_id != AMDGPU_FAMILY_SI)
1623d722e3fbSopenharmony_ci					pm4[i++] = sdma_write_length;
1624d722e3fbSopenharmony_ci				while(j++ < sdma_write_length)
1625d722e3fbSopenharmony_ci					pm4[i++] = 0xdeadbeaf;
1626d722e3fbSopenharmony_ci			} else if ((ip_type == AMDGPU_HW_IP_GFX) ||
1627d722e3fbSopenharmony_ci				    (ip_type == AMDGPU_HW_IP_COMPUTE)) {
1628d722e3fbSopenharmony_ci				pm4[i++] = PACKET3(PACKET3_WRITE_DATA, 2 + sdma_write_length);
1629d722e3fbSopenharmony_ci				pm4[i++] = WRITE_DATA_DST_SEL(5) | WR_CONFIRM;
1630d722e3fbSopenharmony_ci				pm4[i++] = 0xfffffffc & bo_mc;
1631d722e3fbSopenharmony_ci				pm4[i++] = (0xffffffff00000000 & bo_mc) >> 32;
1632d722e3fbSopenharmony_ci				while(j++ < sdma_write_length)
1633d722e3fbSopenharmony_ci					pm4[i++] = 0xdeadbeaf;
1634d722e3fbSopenharmony_ci			}
1635d722e3fbSopenharmony_ci
1636d722e3fbSopenharmony_ci			amdgpu_test_exec_cs_helper_raw(device, context_handle,
1637d722e3fbSopenharmony_ci						       ip_type, ring_id, i, pm4,
1638d722e3fbSopenharmony_ci						       1, resources, ib_info,
1639d722e3fbSopenharmony_ci						       ibs_request, secure);
1640d722e3fbSopenharmony_ci
1641d722e3fbSopenharmony_ci			/* verify if SDMA test result meets with expected */
1642d722e3fbSopenharmony_ci			i = 0;
1643d722e3fbSopenharmony_ci			if (!secure) {
1644d722e3fbSopenharmony_ci				while(i < sdma_write_length) {
1645d722e3fbSopenharmony_ci					CU_ASSERT_EQUAL(bo_cpu[i++], 0xdeadbeaf);
1646d722e3fbSopenharmony_ci				}
1647d722e3fbSopenharmony_ci			} else if (ip_type == AMDGPU_HW_IP_GFX) {
1648d722e3fbSopenharmony_ci				memset((void*)pm4, 0, pm4_dw * sizeof(uint32_t));
1649d722e3fbSopenharmony_ci				pm4[i++] = PACKET3(PACKET3_ATOMIC_MEM, 7);
1650d722e3fbSopenharmony_ci				/* atomic opcode for 32b w/ RTN and ATOMIC_SWAPCMP_RTN
1651d722e3fbSopenharmony_ci				 * command, 1-loop_until_compare_satisfied.
1652d722e3fbSopenharmony_ci				 * single_pass_atomic, 0-lru
1653d722e3fbSopenharmony_ci				 * engine_sel, 0-micro_engine
1654d722e3fbSopenharmony_ci				 */
1655d722e3fbSopenharmony_ci				pm4[i++] = (TC_OP_ATOMIC_CMPSWAP_RTN_32 |
1656d722e3fbSopenharmony_ci							ATOMIC_MEM_COMMAND(1) |
1657d722e3fbSopenharmony_ci							ATOMIC_MEM_CACHEPOLICAY(0) |
1658d722e3fbSopenharmony_ci							ATOMIC_MEM_ENGINESEL(0));
1659d722e3fbSopenharmony_ci				pm4[i++] = 0xfffffffc & bo_mc;
1660d722e3fbSopenharmony_ci				pm4[i++] = (0xffffffff00000000 & bo_mc) >> 32;
1661d722e3fbSopenharmony_ci				pm4[i++] = 0x12345678;
1662d722e3fbSopenharmony_ci				pm4[i++] = 0x0;
1663d722e3fbSopenharmony_ci				pm4[i++] = 0xdeadbeaf;
1664d722e3fbSopenharmony_ci				pm4[i++] = 0x0;
1665d722e3fbSopenharmony_ci				pm4[i++] = 0x100;
1666d722e3fbSopenharmony_ci				amdgpu_test_exec_cs_helper_raw(device, context_handle,
1667d722e3fbSopenharmony_ci							ip_type, ring_id, i, pm4,
1668d722e3fbSopenharmony_ci							1, resources, ib_info,
1669d722e3fbSopenharmony_ci							ibs_request, true);
1670d722e3fbSopenharmony_ci			} else if (ip_type == AMDGPU_HW_IP_DMA) {
1671d722e3fbSopenharmony_ci				/* restore the bo_cpu to compare */
1672d722e3fbSopenharmony_ci				bo_cpu_origin = bo_cpu[0];
1673d722e3fbSopenharmony_ci				memset((void*)pm4, 0, pm4_dw * sizeof(uint32_t));
1674d722e3fbSopenharmony_ci				/* atomic opcode for 32b w/ RTN and ATOMIC_SWAPCMP_RTN
1675d722e3fbSopenharmony_ci				 * loop, 1-loop_until_compare_satisfied.
1676d722e3fbSopenharmony_ci				 * single_pass_atomic, 0-lru
1677d722e3fbSopenharmony_ci				 */
1678d722e3fbSopenharmony_ci				pm4[i++] = SDMA_PACKET(SDMA_OPCODE_ATOMIC,
1679d722e3fbSopenharmony_ci							       0,
1680d722e3fbSopenharmony_ci							       SDMA_ATOMIC_LOOP(1) |
1681d722e3fbSopenharmony_ci							       SDMA_ATOMIC_TMZ(1) |
1682d722e3fbSopenharmony_ci							       SDMA_ATOMIC_OPCODE(TC_OP_ATOMIC_CMPSWAP_RTN_32));
1683d722e3fbSopenharmony_ci				pm4[i++] = 0xfffffffc & bo_mc;
1684d722e3fbSopenharmony_ci				pm4[i++] = (0xffffffff00000000 & bo_mc) >> 32;
1685d722e3fbSopenharmony_ci				pm4[i++] = 0x12345678;
1686d722e3fbSopenharmony_ci				pm4[i++] = 0x0;
1687d722e3fbSopenharmony_ci				pm4[i++] = 0xdeadbeaf;
1688d722e3fbSopenharmony_ci				pm4[i++] = 0x0;
1689d722e3fbSopenharmony_ci				pm4[i++] = 0x100;
1690d722e3fbSopenharmony_ci				amdgpu_test_exec_cs_helper_raw(device, context_handle,
1691d722e3fbSopenharmony_ci							ip_type, ring_id, i, pm4,
1692d722e3fbSopenharmony_ci							1, resources, ib_info,
1693d722e3fbSopenharmony_ci							ibs_request, true);
1694d722e3fbSopenharmony_ci				/* DMA's atomic behavir is unlike GFX
1695d722e3fbSopenharmony_ci				 * If the comparing data is not equal to destination data,
1696d722e3fbSopenharmony_ci				 * For GFX, loop again till gfx timeout(system hang).
1697d722e3fbSopenharmony_ci				 * For DMA, loop again till timer expired and then send interrupt.
1698d722e3fbSopenharmony_ci				 * So testcase can't use interrupt mechanism.
1699d722e3fbSopenharmony_ci				 * We take another way to verify. When the comparing data is not
1700d722e3fbSopenharmony_ci				 * equal to destination data, overwrite the source data to the destination
1701d722e3fbSopenharmony_ci				 * buffer. Otherwise, original destination data unchanged.
1702d722e3fbSopenharmony_ci				 * So if the bo_cpu data is overwritten, the result is passed.
1703d722e3fbSopenharmony_ci				 */
1704d722e3fbSopenharmony_ci				CU_ASSERT_NOT_EQUAL(bo_cpu[0], bo_cpu_origin);
1705d722e3fbSopenharmony_ci
1706d722e3fbSopenharmony_ci				/* compare again for the case of dest_data != cmp_data */
1707d722e3fbSopenharmony_ci				i = 0;
1708d722e3fbSopenharmony_ci				/* restore again, here dest_data should be */
1709d722e3fbSopenharmony_ci				bo_cpu_origin = bo_cpu[0];
1710d722e3fbSopenharmony_ci				memset((void*)pm4, 0, pm4_dw * sizeof(uint32_t));
1711d722e3fbSopenharmony_ci				pm4[i++] = SDMA_PACKET(SDMA_OPCODE_ATOMIC,
1712d722e3fbSopenharmony_ci							       0,
1713d722e3fbSopenharmony_ci							       SDMA_ATOMIC_LOOP(1) |
1714d722e3fbSopenharmony_ci							       SDMA_ATOMIC_TMZ(1) |
1715d722e3fbSopenharmony_ci							       SDMA_ATOMIC_OPCODE(TC_OP_ATOMIC_CMPSWAP_RTN_32));
1716d722e3fbSopenharmony_ci				pm4[i++] = 0xfffffffc & bo_mc;
1717d722e3fbSopenharmony_ci				pm4[i++] = (0xffffffff00000000 & bo_mc) >> 32;
1718d722e3fbSopenharmony_ci				pm4[i++] = 0x87654321;
1719d722e3fbSopenharmony_ci				pm4[i++] = 0x0;
1720d722e3fbSopenharmony_ci				pm4[i++] = 0xdeadbeaf;
1721d722e3fbSopenharmony_ci				pm4[i++] = 0x0;
1722d722e3fbSopenharmony_ci				pm4[i++] = 0x100;
1723d722e3fbSopenharmony_ci				amdgpu_test_exec_cs_helper_raw(device, context_handle,
1724d722e3fbSopenharmony_ci							ip_type, ring_id, i, pm4,
1725d722e3fbSopenharmony_ci							1, resources, ib_info,
1726d722e3fbSopenharmony_ci							ibs_request, true);
1727d722e3fbSopenharmony_ci				/* here bo_cpu[0] should be unchanged, still is 0x12345678, otherwise failed*/
1728d722e3fbSopenharmony_ci				CU_ASSERT_EQUAL(bo_cpu[0], bo_cpu_origin);
1729d722e3fbSopenharmony_ci			}
1730d722e3fbSopenharmony_ci
1731d722e3fbSopenharmony_ci			r = amdgpu_bo_unmap_and_free(bo, va_handle, bo_mc,
1732d722e3fbSopenharmony_ci						     sdma_write_length * sizeof(uint32_t));
1733d722e3fbSopenharmony_ci			CU_ASSERT_EQUAL(r, 0);
1734d722e3fbSopenharmony_ci			loop++;
1735d722e3fbSopenharmony_ci		}
1736d722e3fbSopenharmony_ci	}
1737d722e3fbSopenharmony_ci	/* clean resources */
1738d722e3fbSopenharmony_ci	free(resources);
1739d722e3fbSopenharmony_ci	free(ibs_request);
1740d722e3fbSopenharmony_ci	free(ib_info);
1741d722e3fbSopenharmony_ci	free(pm4);
1742d722e3fbSopenharmony_ci
1743d722e3fbSopenharmony_ci	/* end of test */
1744d722e3fbSopenharmony_ci	r = amdgpu_cs_ctx_free(context_handle);
1745d722e3fbSopenharmony_ci	CU_ASSERT_EQUAL(r, 0);
1746d722e3fbSopenharmony_ci}
1747d722e3fbSopenharmony_ci
1748d722e3fbSopenharmony_cistatic void amdgpu_command_submission_write_linear_helper(unsigned ip_type)
1749d722e3fbSopenharmony_ci{
1750d722e3fbSopenharmony_ci	amdgpu_command_submission_write_linear_helper_with_secure(device_handle,
1751d722e3fbSopenharmony_ci								  ip_type,
1752d722e3fbSopenharmony_ci								  false);
1753d722e3fbSopenharmony_ci}
1754d722e3fbSopenharmony_ci
1755d722e3fbSopenharmony_cistatic void amdgpu_command_submission_sdma_write_linear(void)
1756d722e3fbSopenharmony_ci{
1757d722e3fbSopenharmony_ci	amdgpu_command_submission_write_linear_helper(AMDGPU_HW_IP_DMA);
1758d722e3fbSopenharmony_ci}
1759d722e3fbSopenharmony_ci
1760d722e3fbSopenharmony_cistatic void amdgpu_command_submission_const_fill_helper(unsigned ip_type)
1761d722e3fbSopenharmony_ci{
1762d722e3fbSopenharmony_ci	const int sdma_write_length = 1024 * 1024;
1763d722e3fbSopenharmony_ci	const int pm4_dw = 256;
1764d722e3fbSopenharmony_ci	amdgpu_context_handle context_handle;
1765d722e3fbSopenharmony_ci	amdgpu_bo_handle bo;
1766d722e3fbSopenharmony_ci	amdgpu_bo_handle *resources;
1767d722e3fbSopenharmony_ci	uint32_t *pm4;
1768d722e3fbSopenharmony_ci	struct amdgpu_cs_ib_info *ib_info;
1769d722e3fbSopenharmony_ci	struct amdgpu_cs_request *ibs_request;
1770d722e3fbSopenharmony_ci	uint64_t bo_mc;
1771d722e3fbSopenharmony_ci	volatile uint32_t *bo_cpu;
1772d722e3fbSopenharmony_ci	int i, j, r, loop, ring_id;
1773d722e3fbSopenharmony_ci	uint64_t gtt_flags[2] = {0, AMDGPU_GEM_CREATE_CPU_GTT_USWC};
1774d722e3fbSopenharmony_ci	amdgpu_va_handle va_handle;
1775d722e3fbSopenharmony_ci	struct drm_amdgpu_info_hw_ip hw_ip_info;
1776d722e3fbSopenharmony_ci
1777d722e3fbSopenharmony_ci	pm4 = calloc(pm4_dw, sizeof(*pm4));
1778d722e3fbSopenharmony_ci	CU_ASSERT_NOT_EQUAL(pm4, NULL);
1779d722e3fbSopenharmony_ci
1780d722e3fbSopenharmony_ci	ib_info = calloc(1, sizeof(*ib_info));
1781d722e3fbSopenharmony_ci	CU_ASSERT_NOT_EQUAL(ib_info, NULL);
1782d722e3fbSopenharmony_ci
1783d722e3fbSopenharmony_ci	ibs_request = calloc(1, sizeof(*ibs_request));
1784d722e3fbSopenharmony_ci	CU_ASSERT_NOT_EQUAL(ibs_request, NULL);
1785d722e3fbSopenharmony_ci
1786d722e3fbSopenharmony_ci	r = amdgpu_query_hw_ip_info(device_handle, ip_type, 0, &hw_ip_info);
1787d722e3fbSopenharmony_ci	CU_ASSERT_EQUAL(r, 0);
1788d722e3fbSopenharmony_ci
1789d722e3fbSopenharmony_ci	r = amdgpu_cs_ctx_create(device_handle, &context_handle);
1790d722e3fbSopenharmony_ci	CU_ASSERT_EQUAL(r, 0);
1791d722e3fbSopenharmony_ci
1792d722e3fbSopenharmony_ci	/* prepare resource */
1793d722e3fbSopenharmony_ci	resources = calloc(1, sizeof(amdgpu_bo_handle));
1794d722e3fbSopenharmony_ci	CU_ASSERT_NOT_EQUAL(resources, NULL);
1795d722e3fbSopenharmony_ci
1796d722e3fbSopenharmony_ci	for (ring_id = 0; (1 << ring_id) & hw_ip_info.available_rings; ring_id++) {
1797d722e3fbSopenharmony_ci		loop = 0;
1798d722e3fbSopenharmony_ci		while(loop < 2) {
1799d722e3fbSopenharmony_ci			/* allocate UC bo for sDMA use */
1800d722e3fbSopenharmony_ci			r = amdgpu_bo_alloc_and_map(device_handle,
1801d722e3fbSopenharmony_ci						    sdma_write_length, 4096,
1802d722e3fbSopenharmony_ci						    AMDGPU_GEM_DOMAIN_GTT,
1803d722e3fbSopenharmony_ci						    gtt_flags[loop], &bo, (void**)&bo_cpu,
1804d722e3fbSopenharmony_ci						    &bo_mc, &va_handle);
1805d722e3fbSopenharmony_ci			CU_ASSERT_EQUAL(r, 0);
1806d722e3fbSopenharmony_ci
1807d722e3fbSopenharmony_ci			/* clear bo */
1808d722e3fbSopenharmony_ci			memset((void*)bo_cpu, 0, sdma_write_length);
1809d722e3fbSopenharmony_ci
1810d722e3fbSopenharmony_ci			resources[0] = bo;
1811d722e3fbSopenharmony_ci
1812d722e3fbSopenharmony_ci			/* fulfill PM4: test DMA const fill */
1813d722e3fbSopenharmony_ci			i = j = 0;
1814d722e3fbSopenharmony_ci			if (ip_type == AMDGPU_HW_IP_DMA) {
1815d722e3fbSopenharmony_ci				if (family_id == AMDGPU_FAMILY_SI) {
1816d722e3fbSopenharmony_ci					pm4[i++] = SDMA_PACKET_SI(SDMA_OPCODE_CONSTANT_FILL_SI,
1817d722e3fbSopenharmony_ci								  0, 0, 0,
1818d722e3fbSopenharmony_ci								  sdma_write_length / 4);
1819d722e3fbSopenharmony_ci					pm4[i++] = 0xfffffffc & bo_mc;
1820d722e3fbSopenharmony_ci					pm4[i++] = 0xdeadbeaf;
1821d722e3fbSopenharmony_ci					pm4[i++] = (0xffffffff00000000 & bo_mc) >> 16;
1822d722e3fbSopenharmony_ci				} else {
1823d722e3fbSopenharmony_ci					pm4[i++] = SDMA_PACKET(SDMA_OPCODE_CONSTANT_FILL, 0,
1824d722e3fbSopenharmony_ci							       SDMA_CONSTANT_FILL_EXTRA_SIZE(2));
1825d722e3fbSopenharmony_ci					pm4[i++] = 0xffffffff & bo_mc;
1826d722e3fbSopenharmony_ci					pm4[i++] = (0xffffffff00000000 & bo_mc) >> 32;
1827d722e3fbSopenharmony_ci					pm4[i++] = 0xdeadbeaf;
1828d722e3fbSopenharmony_ci					if (family_id >= AMDGPU_FAMILY_AI)
1829d722e3fbSopenharmony_ci						pm4[i++] = sdma_write_length - 1;
1830d722e3fbSopenharmony_ci					else
1831d722e3fbSopenharmony_ci						pm4[i++] = sdma_write_length;
1832d722e3fbSopenharmony_ci				}
1833d722e3fbSopenharmony_ci			} else if ((ip_type == AMDGPU_HW_IP_GFX) ||
1834d722e3fbSopenharmony_ci				   (ip_type == AMDGPU_HW_IP_COMPUTE)) {
1835d722e3fbSopenharmony_ci				if (family_id == AMDGPU_FAMILY_SI) {
1836d722e3fbSopenharmony_ci					pm4[i++] = PACKET3(PACKET3_DMA_DATA_SI, 4);
1837d722e3fbSopenharmony_ci					pm4[i++] = 0xdeadbeaf;
1838d722e3fbSopenharmony_ci					pm4[i++] = PACKET3_DMA_DATA_SI_ENGINE(0) |
1839d722e3fbSopenharmony_ci						   PACKET3_DMA_DATA_SI_DST_SEL(0) |
1840d722e3fbSopenharmony_ci						   PACKET3_DMA_DATA_SI_SRC_SEL(2) |
1841d722e3fbSopenharmony_ci						   PACKET3_DMA_DATA_SI_CP_SYNC;
1842d722e3fbSopenharmony_ci					pm4[i++] = 0xffffffff & bo_mc;
1843d722e3fbSopenharmony_ci					pm4[i++] = (0xffffffff00000000 & bo_mc) >> 32;
1844d722e3fbSopenharmony_ci					pm4[i++] = sdma_write_length;
1845d722e3fbSopenharmony_ci				} else {
1846d722e3fbSopenharmony_ci					pm4[i++] = PACKET3(PACKET3_DMA_DATA, 5);
1847d722e3fbSopenharmony_ci					pm4[i++] = PACKET3_DMA_DATA_ENGINE(0) |
1848d722e3fbSopenharmony_ci						   PACKET3_DMA_DATA_DST_SEL(0) |
1849d722e3fbSopenharmony_ci						   PACKET3_DMA_DATA_SRC_SEL(2) |
1850d722e3fbSopenharmony_ci						   PACKET3_DMA_DATA_CP_SYNC;
1851d722e3fbSopenharmony_ci					pm4[i++] = 0xdeadbeaf;
1852d722e3fbSopenharmony_ci					pm4[i++] = 0;
1853d722e3fbSopenharmony_ci					pm4[i++] = 0xfffffffc & bo_mc;
1854d722e3fbSopenharmony_ci					pm4[i++] = (0xffffffff00000000 & bo_mc) >> 32;
1855d722e3fbSopenharmony_ci					pm4[i++] = sdma_write_length;
1856d722e3fbSopenharmony_ci				}
1857d722e3fbSopenharmony_ci			}
1858d722e3fbSopenharmony_ci
1859d722e3fbSopenharmony_ci			amdgpu_test_exec_cs_helper(context_handle,
1860d722e3fbSopenharmony_ci						   ip_type, ring_id,
1861d722e3fbSopenharmony_ci						   i, pm4,
1862d722e3fbSopenharmony_ci						   1, resources,
1863d722e3fbSopenharmony_ci						   ib_info, ibs_request);
1864d722e3fbSopenharmony_ci
1865d722e3fbSopenharmony_ci			/* verify if SDMA test result meets with expected */
1866d722e3fbSopenharmony_ci			i = 0;
1867d722e3fbSopenharmony_ci			while(i < (sdma_write_length / 4)) {
1868d722e3fbSopenharmony_ci				CU_ASSERT_EQUAL(bo_cpu[i++], 0xdeadbeaf);
1869d722e3fbSopenharmony_ci			}
1870d722e3fbSopenharmony_ci
1871d722e3fbSopenharmony_ci			r = amdgpu_bo_unmap_and_free(bo, va_handle, bo_mc,
1872d722e3fbSopenharmony_ci						     sdma_write_length);
1873d722e3fbSopenharmony_ci			CU_ASSERT_EQUAL(r, 0);
1874d722e3fbSopenharmony_ci			loop++;
1875d722e3fbSopenharmony_ci		}
1876d722e3fbSopenharmony_ci	}
1877d722e3fbSopenharmony_ci	/* clean resources */
1878d722e3fbSopenharmony_ci	free(resources);
1879d722e3fbSopenharmony_ci	free(ibs_request);
1880d722e3fbSopenharmony_ci	free(ib_info);
1881d722e3fbSopenharmony_ci	free(pm4);
1882d722e3fbSopenharmony_ci
1883d722e3fbSopenharmony_ci	/* end of test */
1884d722e3fbSopenharmony_ci	r = amdgpu_cs_ctx_free(context_handle);
1885d722e3fbSopenharmony_ci	CU_ASSERT_EQUAL(r, 0);
1886d722e3fbSopenharmony_ci}
1887d722e3fbSopenharmony_ci
1888d722e3fbSopenharmony_cistatic void amdgpu_command_submission_sdma_const_fill(void)
1889d722e3fbSopenharmony_ci{
1890d722e3fbSopenharmony_ci	amdgpu_command_submission_const_fill_helper(AMDGPU_HW_IP_DMA);
1891d722e3fbSopenharmony_ci}
1892d722e3fbSopenharmony_ci
1893d722e3fbSopenharmony_cistatic void amdgpu_command_submission_copy_linear_helper(unsigned ip_type)
1894d722e3fbSopenharmony_ci{
1895d722e3fbSopenharmony_ci	const int sdma_write_length = 1024;
1896d722e3fbSopenharmony_ci	const int pm4_dw = 256;
1897d722e3fbSopenharmony_ci	amdgpu_context_handle context_handle;
1898d722e3fbSopenharmony_ci	amdgpu_bo_handle bo1, bo2;
1899d722e3fbSopenharmony_ci	amdgpu_bo_handle *resources;
1900d722e3fbSopenharmony_ci	uint32_t *pm4;
1901d722e3fbSopenharmony_ci	struct amdgpu_cs_ib_info *ib_info;
1902d722e3fbSopenharmony_ci	struct amdgpu_cs_request *ibs_request;
1903d722e3fbSopenharmony_ci	uint64_t bo1_mc, bo2_mc;
1904d722e3fbSopenharmony_ci	volatile unsigned char *bo1_cpu, *bo2_cpu;
1905d722e3fbSopenharmony_ci	int i, j, r, loop1, loop2, ring_id;
1906d722e3fbSopenharmony_ci	uint64_t gtt_flags[2] = {0, AMDGPU_GEM_CREATE_CPU_GTT_USWC};
1907d722e3fbSopenharmony_ci	amdgpu_va_handle bo1_va_handle, bo2_va_handle;
1908d722e3fbSopenharmony_ci	struct drm_amdgpu_info_hw_ip hw_ip_info;
1909d722e3fbSopenharmony_ci
1910d722e3fbSopenharmony_ci	pm4 = calloc(pm4_dw, sizeof(*pm4));
1911d722e3fbSopenharmony_ci	CU_ASSERT_NOT_EQUAL(pm4, NULL);
1912d722e3fbSopenharmony_ci
1913d722e3fbSopenharmony_ci	ib_info = calloc(1, sizeof(*ib_info));
1914d722e3fbSopenharmony_ci	CU_ASSERT_NOT_EQUAL(ib_info, NULL);
1915d722e3fbSopenharmony_ci
1916d722e3fbSopenharmony_ci	ibs_request = calloc(1, sizeof(*ibs_request));
1917d722e3fbSopenharmony_ci	CU_ASSERT_NOT_EQUAL(ibs_request, NULL);
1918d722e3fbSopenharmony_ci
1919d722e3fbSopenharmony_ci	r = amdgpu_query_hw_ip_info(device_handle, ip_type, 0, &hw_ip_info);
1920d722e3fbSopenharmony_ci	CU_ASSERT_EQUAL(r, 0);
1921d722e3fbSopenharmony_ci
1922d722e3fbSopenharmony_ci	r = amdgpu_cs_ctx_create(device_handle, &context_handle);
1923d722e3fbSopenharmony_ci	CU_ASSERT_EQUAL(r, 0);
1924d722e3fbSopenharmony_ci
1925d722e3fbSopenharmony_ci	/* prepare resource */
1926d722e3fbSopenharmony_ci	resources = calloc(2, sizeof(amdgpu_bo_handle));
1927d722e3fbSopenharmony_ci	CU_ASSERT_NOT_EQUAL(resources, NULL);
1928d722e3fbSopenharmony_ci
1929d722e3fbSopenharmony_ci	for (ring_id = 0; (1 << ring_id) & hw_ip_info.available_rings; ring_id++) {
1930d722e3fbSopenharmony_ci		loop1 = loop2 = 0;
1931d722e3fbSopenharmony_ci		/* run 9 circle to test all mapping combination */
1932d722e3fbSopenharmony_ci		while(loop1 < 2) {
1933d722e3fbSopenharmony_ci			while(loop2 < 2) {
1934d722e3fbSopenharmony_ci				/* allocate UC bo1for sDMA use */
1935d722e3fbSopenharmony_ci				r = amdgpu_bo_alloc_and_map(device_handle,
1936d722e3fbSopenharmony_ci							    sdma_write_length, 4096,
1937d722e3fbSopenharmony_ci							    AMDGPU_GEM_DOMAIN_GTT,
1938d722e3fbSopenharmony_ci							    gtt_flags[loop1], &bo1,
1939d722e3fbSopenharmony_ci							    (void**)&bo1_cpu, &bo1_mc,
1940d722e3fbSopenharmony_ci							    &bo1_va_handle);
1941d722e3fbSopenharmony_ci				CU_ASSERT_EQUAL(r, 0);
1942d722e3fbSopenharmony_ci
1943d722e3fbSopenharmony_ci				/* set bo1 */
1944d722e3fbSopenharmony_ci				memset((void*)bo1_cpu, 0xaa, sdma_write_length);
1945d722e3fbSopenharmony_ci
1946d722e3fbSopenharmony_ci				/* allocate UC bo2 for sDMA use */
1947d722e3fbSopenharmony_ci				r = amdgpu_bo_alloc_and_map(device_handle,
1948d722e3fbSopenharmony_ci							    sdma_write_length, 4096,
1949d722e3fbSopenharmony_ci							    AMDGPU_GEM_DOMAIN_GTT,
1950d722e3fbSopenharmony_ci							    gtt_flags[loop2], &bo2,
1951d722e3fbSopenharmony_ci							    (void**)&bo2_cpu, &bo2_mc,
1952d722e3fbSopenharmony_ci							    &bo2_va_handle);
1953d722e3fbSopenharmony_ci				CU_ASSERT_EQUAL(r, 0);
1954d722e3fbSopenharmony_ci
1955d722e3fbSopenharmony_ci				/* clear bo2 */
1956d722e3fbSopenharmony_ci				memset((void*)bo2_cpu, 0, sdma_write_length);
1957d722e3fbSopenharmony_ci
1958d722e3fbSopenharmony_ci				resources[0] = bo1;
1959d722e3fbSopenharmony_ci				resources[1] = bo2;
1960d722e3fbSopenharmony_ci
1961d722e3fbSopenharmony_ci				/* fulfill PM4: test DMA copy linear */
1962d722e3fbSopenharmony_ci				i = j = 0;
1963d722e3fbSopenharmony_ci				if (ip_type == AMDGPU_HW_IP_DMA) {
1964d722e3fbSopenharmony_ci					if (family_id == AMDGPU_FAMILY_SI) {
1965d722e3fbSopenharmony_ci						pm4[i++] = SDMA_PACKET_SI(SDMA_OPCODE_COPY_SI,
1966d722e3fbSopenharmony_ci									  0, 0, 0,
1967d722e3fbSopenharmony_ci									  sdma_write_length);
1968d722e3fbSopenharmony_ci						pm4[i++] = 0xffffffff & bo2_mc;
1969d722e3fbSopenharmony_ci						pm4[i++] = 0xffffffff & bo1_mc;
1970d722e3fbSopenharmony_ci						pm4[i++] = (0xffffffff00000000 & bo2_mc) >> 32;
1971d722e3fbSopenharmony_ci						pm4[i++] = (0xffffffff00000000 & bo1_mc) >> 32;
1972d722e3fbSopenharmony_ci					} else {
1973d722e3fbSopenharmony_ci						pm4[i++] = SDMA_PACKET(SDMA_OPCODE_COPY,
1974d722e3fbSopenharmony_ci								       SDMA_COPY_SUB_OPCODE_LINEAR,
1975d722e3fbSopenharmony_ci								       0);
1976d722e3fbSopenharmony_ci						if (family_id >= AMDGPU_FAMILY_AI)
1977d722e3fbSopenharmony_ci							pm4[i++] = sdma_write_length - 1;
1978d722e3fbSopenharmony_ci						else
1979d722e3fbSopenharmony_ci							pm4[i++] = sdma_write_length;
1980d722e3fbSopenharmony_ci						pm4[i++] = 0;
1981d722e3fbSopenharmony_ci						pm4[i++] = 0xffffffff & bo1_mc;
1982d722e3fbSopenharmony_ci						pm4[i++] = (0xffffffff00000000 & bo1_mc) >> 32;
1983d722e3fbSopenharmony_ci						pm4[i++] = 0xffffffff & bo2_mc;
1984d722e3fbSopenharmony_ci						pm4[i++] = (0xffffffff00000000 & bo2_mc) >> 32;
1985d722e3fbSopenharmony_ci					}
1986d722e3fbSopenharmony_ci				} else if ((ip_type == AMDGPU_HW_IP_GFX) ||
1987d722e3fbSopenharmony_ci					   (ip_type == AMDGPU_HW_IP_COMPUTE)) {
1988d722e3fbSopenharmony_ci					if (family_id == AMDGPU_FAMILY_SI) {
1989d722e3fbSopenharmony_ci						pm4[i++] = PACKET3(PACKET3_DMA_DATA_SI, 4);
1990d722e3fbSopenharmony_ci						pm4[i++] = 0xfffffffc & bo1_mc;
1991d722e3fbSopenharmony_ci						pm4[i++] = PACKET3_DMA_DATA_SI_ENGINE(0) |
1992d722e3fbSopenharmony_ci							   PACKET3_DMA_DATA_SI_DST_SEL(0) |
1993d722e3fbSopenharmony_ci							   PACKET3_DMA_DATA_SI_SRC_SEL(0) |
1994d722e3fbSopenharmony_ci							   PACKET3_DMA_DATA_SI_CP_SYNC |
1995d722e3fbSopenharmony_ci							   (0xffff00000000 & bo1_mc) >> 32;
1996d722e3fbSopenharmony_ci						pm4[i++] = 0xfffffffc & bo2_mc;
1997d722e3fbSopenharmony_ci						pm4[i++] = (0xffffffff00000000 & bo2_mc) >> 32;
1998d722e3fbSopenharmony_ci						pm4[i++] = sdma_write_length;
1999d722e3fbSopenharmony_ci					} else {
2000d722e3fbSopenharmony_ci						pm4[i++] = PACKET3(PACKET3_DMA_DATA, 5);
2001d722e3fbSopenharmony_ci						pm4[i++] = PACKET3_DMA_DATA_ENGINE(0) |
2002d722e3fbSopenharmony_ci							   PACKET3_DMA_DATA_DST_SEL(0) |
2003d722e3fbSopenharmony_ci							   PACKET3_DMA_DATA_SRC_SEL(0) |
2004d722e3fbSopenharmony_ci							   PACKET3_DMA_DATA_CP_SYNC;
2005d722e3fbSopenharmony_ci						pm4[i++] = 0xfffffffc & bo1_mc;
2006d722e3fbSopenharmony_ci						pm4[i++] = (0xffffffff00000000 & bo1_mc) >> 32;
2007d722e3fbSopenharmony_ci						pm4[i++] = 0xfffffffc & bo2_mc;
2008d722e3fbSopenharmony_ci						pm4[i++] = (0xffffffff00000000 & bo2_mc) >> 32;
2009d722e3fbSopenharmony_ci						pm4[i++] = sdma_write_length;
2010d722e3fbSopenharmony_ci					}
2011d722e3fbSopenharmony_ci				}
2012d722e3fbSopenharmony_ci
2013d722e3fbSopenharmony_ci				amdgpu_test_exec_cs_helper(context_handle,
2014d722e3fbSopenharmony_ci							   ip_type, ring_id,
2015d722e3fbSopenharmony_ci							   i, pm4,
2016d722e3fbSopenharmony_ci							   2, resources,
2017d722e3fbSopenharmony_ci							   ib_info, ibs_request);
2018d722e3fbSopenharmony_ci
2019d722e3fbSopenharmony_ci				/* verify if SDMA test result meets with expected */
2020d722e3fbSopenharmony_ci				i = 0;
2021d722e3fbSopenharmony_ci				while(i < sdma_write_length) {
2022d722e3fbSopenharmony_ci					CU_ASSERT_EQUAL(bo2_cpu[i++], 0xaa);
2023d722e3fbSopenharmony_ci				}
2024d722e3fbSopenharmony_ci				r = amdgpu_bo_unmap_and_free(bo1, bo1_va_handle, bo1_mc,
2025d722e3fbSopenharmony_ci							     sdma_write_length);
2026d722e3fbSopenharmony_ci				CU_ASSERT_EQUAL(r, 0);
2027d722e3fbSopenharmony_ci				r = amdgpu_bo_unmap_and_free(bo2, bo2_va_handle, bo2_mc,
2028d722e3fbSopenharmony_ci							     sdma_write_length);
2029d722e3fbSopenharmony_ci				CU_ASSERT_EQUAL(r, 0);
2030d722e3fbSopenharmony_ci				loop2++;
2031d722e3fbSopenharmony_ci			}
2032d722e3fbSopenharmony_ci			loop1++;
2033d722e3fbSopenharmony_ci		}
2034d722e3fbSopenharmony_ci	}
2035d722e3fbSopenharmony_ci	/* clean resources */
2036d722e3fbSopenharmony_ci	free(resources);
2037d722e3fbSopenharmony_ci	free(ibs_request);
2038d722e3fbSopenharmony_ci	free(ib_info);
2039d722e3fbSopenharmony_ci	free(pm4);
2040d722e3fbSopenharmony_ci
2041d722e3fbSopenharmony_ci	/* end of test */
2042d722e3fbSopenharmony_ci	r = amdgpu_cs_ctx_free(context_handle);
2043d722e3fbSopenharmony_ci	CU_ASSERT_EQUAL(r, 0);
2044d722e3fbSopenharmony_ci}
2045d722e3fbSopenharmony_ci
2046d722e3fbSopenharmony_cistatic void amdgpu_command_submission_sdma_copy_linear(void)
2047d722e3fbSopenharmony_ci{
2048d722e3fbSopenharmony_ci	amdgpu_command_submission_copy_linear_helper(AMDGPU_HW_IP_DMA);
2049d722e3fbSopenharmony_ci}
2050d722e3fbSopenharmony_ci
2051d722e3fbSopenharmony_cistatic void amdgpu_command_submission_sdma(void)
2052d722e3fbSopenharmony_ci{
2053d722e3fbSopenharmony_ci	amdgpu_command_submission_sdma_write_linear();
2054d722e3fbSopenharmony_ci	amdgpu_command_submission_sdma_const_fill();
2055d722e3fbSopenharmony_ci	amdgpu_command_submission_sdma_copy_linear();
2056d722e3fbSopenharmony_ci}
2057d722e3fbSopenharmony_ci
2058d722e3fbSopenharmony_cistatic void amdgpu_command_submission_multi_fence_wait_all(bool wait_all)
2059d722e3fbSopenharmony_ci{
2060d722e3fbSopenharmony_ci	amdgpu_context_handle context_handle;
2061d722e3fbSopenharmony_ci	amdgpu_bo_handle ib_result_handle, ib_result_ce_handle;
2062d722e3fbSopenharmony_ci	void *ib_result_cpu, *ib_result_ce_cpu;
2063d722e3fbSopenharmony_ci	uint64_t ib_result_mc_address, ib_result_ce_mc_address;
2064d722e3fbSopenharmony_ci	struct amdgpu_cs_request ibs_request[2] = {0};
2065d722e3fbSopenharmony_ci	struct amdgpu_cs_ib_info ib_info[2];
2066d722e3fbSopenharmony_ci	struct amdgpu_cs_fence fence_status[2] = {0};
2067d722e3fbSopenharmony_ci	uint32_t *ptr;
2068d722e3fbSopenharmony_ci	uint32_t expired;
2069d722e3fbSopenharmony_ci	amdgpu_bo_list_handle bo_list;
2070d722e3fbSopenharmony_ci	amdgpu_va_handle va_handle, va_handle_ce;
2071d722e3fbSopenharmony_ci	int r;
2072d722e3fbSopenharmony_ci	int i = 0, ib_cs_num = 2;
2073d722e3fbSopenharmony_ci
2074d722e3fbSopenharmony_ci	r = amdgpu_cs_ctx_create(device_handle, &context_handle);
2075d722e3fbSopenharmony_ci	CU_ASSERT_EQUAL(r, 0);
2076d722e3fbSopenharmony_ci
2077d722e3fbSopenharmony_ci	r = amdgpu_bo_alloc_and_map(device_handle, 4096, 4096,
2078d722e3fbSopenharmony_ci				    AMDGPU_GEM_DOMAIN_GTT, 0,
2079d722e3fbSopenharmony_ci				    &ib_result_handle, &ib_result_cpu,
2080d722e3fbSopenharmony_ci				    &ib_result_mc_address, &va_handle);
2081d722e3fbSopenharmony_ci	CU_ASSERT_EQUAL(r, 0);
2082d722e3fbSopenharmony_ci
2083d722e3fbSopenharmony_ci	r = amdgpu_bo_alloc_and_map(device_handle, 4096, 4096,
2084d722e3fbSopenharmony_ci				    AMDGPU_GEM_DOMAIN_GTT, 0,
2085d722e3fbSopenharmony_ci				    &ib_result_ce_handle, &ib_result_ce_cpu,
2086d722e3fbSopenharmony_ci				    &ib_result_ce_mc_address, &va_handle_ce);
2087d722e3fbSopenharmony_ci	CU_ASSERT_EQUAL(r, 0);
2088d722e3fbSopenharmony_ci
2089d722e3fbSopenharmony_ci	r = amdgpu_get_bo_list(device_handle, ib_result_handle,
2090d722e3fbSopenharmony_ci			       ib_result_ce_handle, &bo_list);
2091d722e3fbSopenharmony_ci	CU_ASSERT_EQUAL(r, 0);
2092d722e3fbSopenharmony_ci
2093d722e3fbSopenharmony_ci	memset(ib_info, 0, 2 * sizeof(struct amdgpu_cs_ib_info));
2094d722e3fbSopenharmony_ci
2095d722e3fbSopenharmony_ci	/* IT_SET_CE_DE_COUNTERS */
2096d722e3fbSopenharmony_ci	ptr = ib_result_ce_cpu;
2097d722e3fbSopenharmony_ci	if (family_id != AMDGPU_FAMILY_SI) {
2098d722e3fbSopenharmony_ci		ptr[i++] = 0xc0008900;
2099d722e3fbSopenharmony_ci		ptr[i++] = 0;
2100d722e3fbSopenharmony_ci	}
2101d722e3fbSopenharmony_ci	ptr[i++] = 0xc0008400;
2102d722e3fbSopenharmony_ci	ptr[i++] = 1;
2103d722e3fbSopenharmony_ci	ib_info[0].ib_mc_address = ib_result_ce_mc_address;
2104d722e3fbSopenharmony_ci	ib_info[0].size = i;
2105d722e3fbSopenharmony_ci	ib_info[0].flags = AMDGPU_IB_FLAG_CE;
2106d722e3fbSopenharmony_ci
2107d722e3fbSopenharmony_ci	/* IT_WAIT_ON_CE_COUNTER */
2108d722e3fbSopenharmony_ci	ptr = ib_result_cpu;
2109d722e3fbSopenharmony_ci	ptr[0] = 0xc0008600;
2110d722e3fbSopenharmony_ci	ptr[1] = 0x00000001;
2111d722e3fbSopenharmony_ci	ib_info[1].ib_mc_address = ib_result_mc_address;
2112d722e3fbSopenharmony_ci	ib_info[1].size = 2;
2113d722e3fbSopenharmony_ci
2114d722e3fbSopenharmony_ci	for (i = 0; i < ib_cs_num; i++) {
2115d722e3fbSopenharmony_ci		ibs_request[i].ip_type = AMDGPU_HW_IP_GFX;
2116d722e3fbSopenharmony_ci		ibs_request[i].number_of_ibs = 2;
2117d722e3fbSopenharmony_ci		ibs_request[i].ibs = ib_info;
2118d722e3fbSopenharmony_ci		ibs_request[i].resources = bo_list;
2119d722e3fbSopenharmony_ci		ibs_request[i].fence_info.handle = NULL;
2120d722e3fbSopenharmony_ci	}
2121d722e3fbSopenharmony_ci
2122d722e3fbSopenharmony_ci	r = amdgpu_cs_submit(context_handle, 0,ibs_request, ib_cs_num);
2123d722e3fbSopenharmony_ci
2124d722e3fbSopenharmony_ci	CU_ASSERT_EQUAL(r, 0);
2125d722e3fbSopenharmony_ci
2126d722e3fbSopenharmony_ci	for (i = 0; i < ib_cs_num; i++) {
2127d722e3fbSopenharmony_ci		fence_status[i].context = context_handle;
2128d722e3fbSopenharmony_ci		fence_status[i].ip_type = AMDGPU_HW_IP_GFX;
2129d722e3fbSopenharmony_ci		fence_status[i].fence = ibs_request[i].seq_no;
2130d722e3fbSopenharmony_ci	}
2131d722e3fbSopenharmony_ci
2132d722e3fbSopenharmony_ci	r = amdgpu_cs_wait_fences(fence_status, ib_cs_num, wait_all,
2133d722e3fbSopenharmony_ci				AMDGPU_TIMEOUT_INFINITE,
2134d722e3fbSopenharmony_ci				&expired, NULL);
2135d722e3fbSopenharmony_ci	CU_ASSERT_EQUAL(r, 0);
2136d722e3fbSopenharmony_ci
2137d722e3fbSopenharmony_ci	r = amdgpu_bo_unmap_and_free(ib_result_handle, va_handle,
2138d722e3fbSopenharmony_ci				     ib_result_mc_address, 4096);
2139d722e3fbSopenharmony_ci	CU_ASSERT_EQUAL(r, 0);
2140d722e3fbSopenharmony_ci
2141d722e3fbSopenharmony_ci	r = amdgpu_bo_unmap_and_free(ib_result_ce_handle, va_handle_ce,
2142d722e3fbSopenharmony_ci				     ib_result_ce_mc_address, 4096);
2143d722e3fbSopenharmony_ci	CU_ASSERT_EQUAL(r, 0);
2144d722e3fbSopenharmony_ci
2145d722e3fbSopenharmony_ci	r = amdgpu_bo_list_destroy(bo_list);
2146d722e3fbSopenharmony_ci	CU_ASSERT_EQUAL(r, 0);
2147d722e3fbSopenharmony_ci
2148d722e3fbSopenharmony_ci	r = amdgpu_cs_ctx_free(context_handle);
2149d722e3fbSopenharmony_ci	CU_ASSERT_EQUAL(r, 0);
2150d722e3fbSopenharmony_ci}
2151d722e3fbSopenharmony_ci
2152d722e3fbSopenharmony_cistatic void amdgpu_command_submission_multi_fence(void)
2153d722e3fbSopenharmony_ci{
2154d722e3fbSopenharmony_ci	amdgpu_command_submission_multi_fence_wait_all(true);
2155d722e3fbSopenharmony_ci	amdgpu_command_submission_multi_fence_wait_all(false);
2156d722e3fbSopenharmony_ci}
2157d722e3fbSopenharmony_ci
2158d722e3fbSopenharmony_cistatic void amdgpu_userptr_test(void)
2159d722e3fbSopenharmony_ci{
2160d722e3fbSopenharmony_ci	int i, r, j;
2161d722e3fbSopenharmony_ci	uint32_t *pm4 = NULL;
2162d722e3fbSopenharmony_ci	uint64_t bo_mc;
2163d722e3fbSopenharmony_ci	void *ptr = NULL;
2164d722e3fbSopenharmony_ci	int pm4_dw = 256;
2165d722e3fbSopenharmony_ci	int sdma_write_length = 4;
2166d722e3fbSopenharmony_ci	amdgpu_bo_handle handle;
2167d722e3fbSopenharmony_ci	amdgpu_context_handle context_handle;
2168d722e3fbSopenharmony_ci	struct amdgpu_cs_ib_info *ib_info;
2169d722e3fbSopenharmony_ci	struct amdgpu_cs_request *ibs_request;
2170d722e3fbSopenharmony_ci	amdgpu_bo_handle buf_handle;
2171d722e3fbSopenharmony_ci	amdgpu_va_handle va_handle;
2172d722e3fbSopenharmony_ci
2173d722e3fbSopenharmony_ci	pm4 = calloc(pm4_dw, sizeof(*pm4));
2174d722e3fbSopenharmony_ci	CU_ASSERT_NOT_EQUAL(pm4, NULL);
2175d722e3fbSopenharmony_ci
2176d722e3fbSopenharmony_ci	ib_info = calloc(1, sizeof(*ib_info));
2177d722e3fbSopenharmony_ci	CU_ASSERT_NOT_EQUAL(ib_info, NULL);
2178d722e3fbSopenharmony_ci
2179d722e3fbSopenharmony_ci	ibs_request = calloc(1, sizeof(*ibs_request));
2180d722e3fbSopenharmony_ci	CU_ASSERT_NOT_EQUAL(ibs_request, NULL);
2181d722e3fbSopenharmony_ci
2182d722e3fbSopenharmony_ci	r = amdgpu_cs_ctx_create(device_handle, &context_handle);
2183d722e3fbSopenharmony_ci	CU_ASSERT_EQUAL(r, 0);
2184d722e3fbSopenharmony_ci
2185d722e3fbSopenharmony_ci	posix_memalign(&ptr, sysconf(_SC_PAGE_SIZE), BUFFER_SIZE);
2186d722e3fbSopenharmony_ci	CU_ASSERT_NOT_EQUAL(ptr, NULL);
2187d722e3fbSopenharmony_ci	memset(ptr, 0, BUFFER_SIZE);
2188d722e3fbSopenharmony_ci
2189d722e3fbSopenharmony_ci	r = amdgpu_create_bo_from_user_mem(device_handle,
2190d722e3fbSopenharmony_ci					   ptr, BUFFER_SIZE, &buf_handle);
2191d722e3fbSopenharmony_ci	CU_ASSERT_EQUAL(r, 0);
2192d722e3fbSopenharmony_ci
2193d722e3fbSopenharmony_ci	r = amdgpu_va_range_alloc(device_handle,
2194d722e3fbSopenharmony_ci				  amdgpu_gpu_va_range_general,
2195d722e3fbSopenharmony_ci				  BUFFER_SIZE, 1, 0, &bo_mc,
2196d722e3fbSopenharmony_ci				  &va_handle, 0);
2197d722e3fbSopenharmony_ci	CU_ASSERT_EQUAL(r, 0);
2198d722e3fbSopenharmony_ci
2199d722e3fbSopenharmony_ci	r = amdgpu_bo_va_op(buf_handle, 0, BUFFER_SIZE, bo_mc, 0, AMDGPU_VA_OP_MAP);
2200d722e3fbSopenharmony_ci	CU_ASSERT_EQUAL(r, 0);
2201d722e3fbSopenharmony_ci
2202d722e3fbSopenharmony_ci	handle = buf_handle;
2203d722e3fbSopenharmony_ci
2204d722e3fbSopenharmony_ci	j = i = 0;
2205d722e3fbSopenharmony_ci
2206d722e3fbSopenharmony_ci	if (family_id == AMDGPU_FAMILY_SI)
2207d722e3fbSopenharmony_ci		pm4[i++] = SDMA_PACKET_SI(SDMA_OPCODE_WRITE, 0, 0, 0,
2208d722e3fbSopenharmony_ci				sdma_write_length);
2209d722e3fbSopenharmony_ci	else
2210d722e3fbSopenharmony_ci		pm4[i++] = SDMA_PACKET(SDMA_OPCODE_WRITE,
2211d722e3fbSopenharmony_ci				SDMA_WRITE_SUB_OPCODE_LINEAR, 0);
2212d722e3fbSopenharmony_ci	pm4[i++] = 0xffffffff & bo_mc;
2213d722e3fbSopenharmony_ci	pm4[i++] = (0xffffffff00000000 & bo_mc) >> 32;
2214d722e3fbSopenharmony_ci	if (family_id >= AMDGPU_FAMILY_AI)
2215d722e3fbSopenharmony_ci		pm4[i++] = sdma_write_length - 1;
2216d722e3fbSopenharmony_ci	else if (family_id != AMDGPU_FAMILY_SI)
2217d722e3fbSopenharmony_ci		pm4[i++] = sdma_write_length;
2218d722e3fbSopenharmony_ci
2219d722e3fbSopenharmony_ci	while (j++ < sdma_write_length)
2220d722e3fbSopenharmony_ci		pm4[i++] = 0xdeadbeaf;
2221d722e3fbSopenharmony_ci
2222d722e3fbSopenharmony_ci	if (!fork()) {
2223d722e3fbSopenharmony_ci		pm4[0] = 0x0;
2224d722e3fbSopenharmony_ci		exit(0);
2225d722e3fbSopenharmony_ci	}
2226d722e3fbSopenharmony_ci
2227d722e3fbSopenharmony_ci	amdgpu_test_exec_cs_helper(context_handle,
2228d722e3fbSopenharmony_ci				   AMDGPU_HW_IP_DMA, 0,
2229d722e3fbSopenharmony_ci				   i, pm4,
2230d722e3fbSopenharmony_ci				   1, &handle,
2231d722e3fbSopenharmony_ci				   ib_info, ibs_request);
2232d722e3fbSopenharmony_ci	i = 0;
2233d722e3fbSopenharmony_ci	while (i < sdma_write_length) {
2234d722e3fbSopenharmony_ci		CU_ASSERT_EQUAL(((int*)ptr)[i++], 0xdeadbeaf);
2235d722e3fbSopenharmony_ci	}
2236d722e3fbSopenharmony_ci	free(ibs_request);
2237d722e3fbSopenharmony_ci	free(ib_info);
2238d722e3fbSopenharmony_ci	free(pm4);
2239d722e3fbSopenharmony_ci
2240d722e3fbSopenharmony_ci	r = amdgpu_bo_va_op(buf_handle, 0, BUFFER_SIZE, bo_mc, 0, AMDGPU_VA_OP_UNMAP);
2241d722e3fbSopenharmony_ci	CU_ASSERT_EQUAL(r, 0);
2242d722e3fbSopenharmony_ci	r = amdgpu_va_range_free(va_handle);
2243d722e3fbSopenharmony_ci	CU_ASSERT_EQUAL(r, 0);
2244d722e3fbSopenharmony_ci	r = amdgpu_bo_free(buf_handle);
2245d722e3fbSopenharmony_ci	CU_ASSERT_EQUAL(r, 0);
2246d722e3fbSopenharmony_ci	free(ptr);
2247d722e3fbSopenharmony_ci
2248d722e3fbSopenharmony_ci	r = amdgpu_cs_ctx_free(context_handle);
2249d722e3fbSopenharmony_ci	CU_ASSERT_EQUAL(r, 0);
2250d722e3fbSopenharmony_ci
2251d722e3fbSopenharmony_ci	wait(NULL);
2252d722e3fbSopenharmony_ci}
2253d722e3fbSopenharmony_ci
2254d722e3fbSopenharmony_cistatic void amdgpu_sync_dependency_test(void)
2255d722e3fbSopenharmony_ci{
2256d722e3fbSopenharmony_ci	amdgpu_context_handle context_handle[2];
2257d722e3fbSopenharmony_ci	amdgpu_bo_handle ib_result_handle;
2258d722e3fbSopenharmony_ci	void *ib_result_cpu;
2259d722e3fbSopenharmony_ci	uint64_t ib_result_mc_address;
2260d722e3fbSopenharmony_ci	struct amdgpu_cs_request ibs_request;
2261d722e3fbSopenharmony_ci	struct amdgpu_cs_ib_info ib_info;
2262d722e3fbSopenharmony_ci	struct amdgpu_cs_fence fence_status;
2263d722e3fbSopenharmony_ci	uint32_t expired;
2264d722e3fbSopenharmony_ci	int i, j, r;
2265d722e3fbSopenharmony_ci	amdgpu_bo_list_handle bo_list;
2266d722e3fbSopenharmony_ci	amdgpu_va_handle va_handle;
2267d722e3fbSopenharmony_ci	static uint32_t *ptr;
2268d722e3fbSopenharmony_ci	uint64_t seq_no;
2269d722e3fbSopenharmony_ci
2270d722e3fbSopenharmony_ci	r = amdgpu_cs_ctx_create(device_handle, &context_handle[0]);
2271d722e3fbSopenharmony_ci	CU_ASSERT_EQUAL(r, 0);
2272d722e3fbSopenharmony_ci	r = amdgpu_cs_ctx_create(device_handle, &context_handle[1]);
2273d722e3fbSopenharmony_ci	CU_ASSERT_EQUAL(r, 0);
2274d722e3fbSopenharmony_ci
2275d722e3fbSopenharmony_ci	r = amdgpu_bo_alloc_and_map(device_handle, 8192, 4096,
2276d722e3fbSopenharmony_ci			AMDGPU_GEM_DOMAIN_GTT, 0,
2277d722e3fbSopenharmony_ci						    &ib_result_handle, &ib_result_cpu,
2278d722e3fbSopenharmony_ci						    &ib_result_mc_address, &va_handle);
2279d722e3fbSopenharmony_ci	CU_ASSERT_EQUAL(r, 0);
2280d722e3fbSopenharmony_ci
2281d722e3fbSopenharmony_ci	r = amdgpu_get_bo_list(device_handle, ib_result_handle, NULL,
2282d722e3fbSopenharmony_ci			       &bo_list);
2283d722e3fbSopenharmony_ci	CU_ASSERT_EQUAL(r, 0);
2284d722e3fbSopenharmony_ci
2285d722e3fbSopenharmony_ci	ptr = ib_result_cpu;
2286d722e3fbSopenharmony_ci	i = 0;
2287d722e3fbSopenharmony_ci
2288d722e3fbSopenharmony_ci	memcpy(ptr + CODE_OFFSET , shader_bin, sizeof(shader_bin));
2289d722e3fbSopenharmony_ci
2290d722e3fbSopenharmony_ci	/* Dispatch minimal init config and verify it's executed */
2291d722e3fbSopenharmony_ci	ptr[i++] = PACKET3(PKT3_CONTEXT_CONTROL, 1);
2292d722e3fbSopenharmony_ci	ptr[i++] = 0x80000000;
2293d722e3fbSopenharmony_ci	ptr[i++] = 0x80000000;
2294d722e3fbSopenharmony_ci
2295d722e3fbSopenharmony_ci	ptr[i++] = PACKET3(PKT3_CLEAR_STATE, 0);
2296d722e3fbSopenharmony_ci	ptr[i++] = 0x80000000;
2297d722e3fbSopenharmony_ci
2298d722e3fbSopenharmony_ci
2299d722e3fbSopenharmony_ci	/* Program compute regs */
2300d722e3fbSopenharmony_ci	ptr[i++] = PACKET3(PKT3_SET_SH_REG, 2);
2301d722e3fbSopenharmony_ci	ptr[i++] = mmCOMPUTE_PGM_LO - PACKET3_SET_SH_REG_START;
2302d722e3fbSopenharmony_ci	ptr[i++] = (ib_result_mc_address + CODE_OFFSET * 4) >> 8;
2303d722e3fbSopenharmony_ci	ptr[i++] = (ib_result_mc_address + CODE_OFFSET * 4) >> 40;
2304d722e3fbSopenharmony_ci
2305d722e3fbSopenharmony_ci
2306d722e3fbSopenharmony_ci	ptr[i++] = PACKET3(PKT3_SET_SH_REG, 2);
2307d722e3fbSopenharmony_ci	ptr[i++] = mmCOMPUTE_PGM_RSRC1 - PACKET3_SET_SH_REG_START;
2308d722e3fbSopenharmony_ci	/*
2309d722e3fbSopenharmony_ci	 * 002c0040         COMPUTE_PGM_RSRC1 <- VGPRS = 0
2310d722e3fbSopenharmony_ci	                                      SGPRS = 1
2311d722e3fbSopenharmony_ci	                                      PRIORITY = 0
2312d722e3fbSopenharmony_ci	                                      FLOAT_MODE = 192 (0xc0)
2313d722e3fbSopenharmony_ci	                                      PRIV = 0
2314d722e3fbSopenharmony_ci	                                      DX10_CLAMP = 1
2315d722e3fbSopenharmony_ci	                                      DEBUG_MODE = 0
2316d722e3fbSopenharmony_ci	                                      IEEE_MODE = 0
2317d722e3fbSopenharmony_ci	                                      BULKY = 0
2318d722e3fbSopenharmony_ci	                                      CDBG_USER = 0
2319d722e3fbSopenharmony_ci	 *
2320d722e3fbSopenharmony_ci	 */
2321d722e3fbSopenharmony_ci	ptr[i++] = 0x002c0040;
2322d722e3fbSopenharmony_ci
2323d722e3fbSopenharmony_ci
2324d722e3fbSopenharmony_ci	/*
2325d722e3fbSopenharmony_ci	 * 00000010         COMPUTE_PGM_RSRC2 <- SCRATCH_EN = 0
2326d722e3fbSopenharmony_ci	                                      USER_SGPR = 8
2327d722e3fbSopenharmony_ci	                                      TRAP_PRESENT = 0
2328d722e3fbSopenharmony_ci	                                      TGID_X_EN = 0
2329d722e3fbSopenharmony_ci	                                      TGID_Y_EN = 0
2330d722e3fbSopenharmony_ci	                                      TGID_Z_EN = 0
2331d722e3fbSopenharmony_ci	                                      TG_SIZE_EN = 0
2332d722e3fbSopenharmony_ci	                                      TIDIG_COMP_CNT = 0
2333d722e3fbSopenharmony_ci	                                      EXCP_EN_MSB = 0
2334d722e3fbSopenharmony_ci	                                      LDS_SIZE = 0
2335d722e3fbSopenharmony_ci	                                      EXCP_EN = 0
2336d722e3fbSopenharmony_ci	 *
2337d722e3fbSopenharmony_ci	 */
2338d722e3fbSopenharmony_ci	ptr[i++] = 0x00000010;
2339d722e3fbSopenharmony_ci
2340d722e3fbSopenharmony_ci
2341d722e3fbSopenharmony_ci/*
2342d722e3fbSopenharmony_ci * 00000100         COMPUTE_TMPRING_SIZE <- WAVES = 256 (0x100)
2343d722e3fbSopenharmony_ci                                         WAVESIZE = 0
2344d722e3fbSopenharmony_ci *
2345d722e3fbSopenharmony_ci */
2346d722e3fbSopenharmony_ci	ptr[i++] = PACKET3(PKT3_SET_SH_REG, 1);
2347d722e3fbSopenharmony_ci	ptr[i++] = mmCOMPUTE_TMPRING_SIZE - PACKET3_SET_SH_REG_START;
2348d722e3fbSopenharmony_ci	ptr[i++] = 0x00000100;
2349d722e3fbSopenharmony_ci
2350d722e3fbSopenharmony_ci	ptr[i++] = PACKET3(PKT3_SET_SH_REG, 2);
2351d722e3fbSopenharmony_ci	ptr[i++] = mmCOMPUTE_USER_DATA_0 - PACKET3_SET_SH_REG_START;
2352d722e3fbSopenharmony_ci	ptr[i++] = 0xffffffff & (ib_result_mc_address + DATA_OFFSET * 4);
2353d722e3fbSopenharmony_ci	ptr[i++] = (0xffffffff00000000 & (ib_result_mc_address + DATA_OFFSET * 4)) >> 32;
2354d722e3fbSopenharmony_ci
2355d722e3fbSopenharmony_ci	ptr[i++] = PACKET3(PKT3_SET_SH_REG, 1);
2356d722e3fbSopenharmony_ci	ptr[i++] = mmCOMPUTE_RESOURCE_LIMITS - PACKET3_SET_SH_REG_START;
2357d722e3fbSopenharmony_ci	ptr[i++] = 0;
2358d722e3fbSopenharmony_ci
2359d722e3fbSopenharmony_ci	ptr[i++] = PACKET3(PKT3_SET_SH_REG, 3);
2360d722e3fbSopenharmony_ci	ptr[i++] = mmCOMPUTE_NUM_THREAD_X - PACKET3_SET_SH_REG_START;
2361d722e3fbSopenharmony_ci	ptr[i++] = 1;
2362d722e3fbSopenharmony_ci	ptr[i++] = 1;
2363d722e3fbSopenharmony_ci	ptr[i++] = 1;
2364d722e3fbSopenharmony_ci
2365d722e3fbSopenharmony_ci
2366d722e3fbSopenharmony_ci	/* Dispatch */
2367d722e3fbSopenharmony_ci	ptr[i++] = PACKET3(PACKET3_DISPATCH_DIRECT, 3);
2368d722e3fbSopenharmony_ci	ptr[i++] = 1;
2369d722e3fbSopenharmony_ci	ptr[i++] = 1;
2370d722e3fbSopenharmony_ci	ptr[i++] = 1;
2371d722e3fbSopenharmony_ci	ptr[i++] = 0x00000045; /* DISPATCH DIRECT field */
2372d722e3fbSopenharmony_ci
2373d722e3fbSopenharmony_ci
2374d722e3fbSopenharmony_ci	while (i & 7)
2375d722e3fbSopenharmony_ci		ptr[i++] =  0xffff1000; /* type3 nop packet */
2376d722e3fbSopenharmony_ci
2377d722e3fbSopenharmony_ci	memset(&ib_info, 0, sizeof(struct amdgpu_cs_ib_info));
2378d722e3fbSopenharmony_ci	ib_info.ib_mc_address = ib_result_mc_address;
2379d722e3fbSopenharmony_ci	ib_info.size = i;
2380d722e3fbSopenharmony_ci
2381d722e3fbSopenharmony_ci	memset(&ibs_request, 0, sizeof(struct amdgpu_cs_request));
2382d722e3fbSopenharmony_ci	ibs_request.ip_type = AMDGPU_HW_IP_GFX;
2383d722e3fbSopenharmony_ci	ibs_request.ring = 0;
2384d722e3fbSopenharmony_ci	ibs_request.number_of_ibs = 1;
2385d722e3fbSopenharmony_ci	ibs_request.ibs = &ib_info;
2386d722e3fbSopenharmony_ci	ibs_request.resources = bo_list;
2387d722e3fbSopenharmony_ci	ibs_request.fence_info.handle = NULL;
2388d722e3fbSopenharmony_ci
2389d722e3fbSopenharmony_ci	r = amdgpu_cs_submit(context_handle[1], 0,&ibs_request, 1);
2390d722e3fbSopenharmony_ci	CU_ASSERT_EQUAL(r, 0);
2391d722e3fbSopenharmony_ci	seq_no = ibs_request.seq_no;
2392d722e3fbSopenharmony_ci
2393d722e3fbSopenharmony_ci
2394d722e3fbSopenharmony_ci
2395d722e3fbSopenharmony_ci	/* Prepare second command with dependency on the first */
2396d722e3fbSopenharmony_ci	j = i;
2397d722e3fbSopenharmony_ci	ptr[i++] = PACKET3(PACKET3_WRITE_DATA, 3);
2398d722e3fbSopenharmony_ci	ptr[i++] = WRITE_DATA_DST_SEL(5) | WR_CONFIRM;
2399d722e3fbSopenharmony_ci	ptr[i++] =          0xfffffffc & (ib_result_mc_address + DATA_OFFSET * 4);
2400d722e3fbSopenharmony_ci	ptr[i++] = (0xffffffff00000000 & (ib_result_mc_address + DATA_OFFSET * 4)) >> 32;
2401d722e3fbSopenharmony_ci	ptr[i++] = 99;
2402d722e3fbSopenharmony_ci
2403d722e3fbSopenharmony_ci	while (i & 7)
2404d722e3fbSopenharmony_ci		ptr[i++] =  0xffff1000; /* type3 nop packet */
2405d722e3fbSopenharmony_ci
2406d722e3fbSopenharmony_ci	memset(&ib_info, 0, sizeof(struct amdgpu_cs_ib_info));
2407d722e3fbSopenharmony_ci	ib_info.ib_mc_address = ib_result_mc_address + j * 4;
2408d722e3fbSopenharmony_ci	ib_info.size = i - j;
2409d722e3fbSopenharmony_ci
2410d722e3fbSopenharmony_ci	memset(&ibs_request, 0, sizeof(struct amdgpu_cs_request));
2411d722e3fbSopenharmony_ci	ibs_request.ip_type = AMDGPU_HW_IP_GFX;
2412d722e3fbSopenharmony_ci	ibs_request.ring = 0;
2413d722e3fbSopenharmony_ci	ibs_request.number_of_ibs = 1;
2414d722e3fbSopenharmony_ci	ibs_request.ibs = &ib_info;
2415d722e3fbSopenharmony_ci	ibs_request.resources = bo_list;
2416d722e3fbSopenharmony_ci	ibs_request.fence_info.handle = NULL;
2417d722e3fbSopenharmony_ci
2418d722e3fbSopenharmony_ci	ibs_request.number_of_dependencies = 1;
2419d722e3fbSopenharmony_ci
2420d722e3fbSopenharmony_ci	ibs_request.dependencies = calloc(1, sizeof(*ibs_request.dependencies));
2421d722e3fbSopenharmony_ci	ibs_request.dependencies[0].context = context_handle[1];
2422d722e3fbSopenharmony_ci	ibs_request.dependencies[0].ip_instance = 0;
2423d722e3fbSopenharmony_ci	ibs_request.dependencies[0].ring = 0;
2424d722e3fbSopenharmony_ci	ibs_request.dependencies[0].fence = seq_no;
2425d722e3fbSopenharmony_ci
2426d722e3fbSopenharmony_ci
2427d722e3fbSopenharmony_ci	r = amdgpu_cs_submit(context_handle[0], 0,&ibs_request, 1);
2428d722e3fbSopenharmony_ci	CU_ASSERT_EQUAL(r, 0);
2429d722e3fbSopenharmony_ci
2430d722e3fbSopenharmony_ci
2431d722e3fbSopenharmony_ci	memset(&fence_status, 0, sizeof(struct amdgpu_cs_fence));
2432d722e3fbSopenharmony_ci	fence_status.context = context_handle[0];
2433d722e3fbSopenharmony_ci	fence_status.ip_type = AMDGPU_HW_IP_GFX;
2434d722e3fbSopenharmony_ci	fence_status.ip_instance = 0;
2435d722e3fbSopenharmony_ci	fence_status.ring = 0;
2436d722e3fbSopenharmony_ci	fence_status.fence = ibs_request.seq_no;
2437d722e3fbSopenharmony_ci
2438d722e3fbSopenharmony_ci	r = amdgpu_cs_query_fence_status(&fence_status,
2439d722e3fbSopenharmony_ci		       AMDGPU_TIMEOUT_INFINITE,0, &expired);
2440d722e3fbSopenharmony_ci	CU_ASSERT_EQUAL(r, 0);
2441d722e3fbSopenharmony_ci
2442d722e3fbSopenharmony_ci	/* Expect the second command to wait for shader to complete */
2443d722e3fbSopenharmony_ci	CU_ASSERT_EQUAL(ptr[DATA_OFFSET], 99);
2444d722e3fbSopenharmony_ci
2445d722e3fbSopenharmony_ci	r = amdgpu_bo_list_destroy(bo_list);
2446d722e3fbSopenharmony_ci	CU_ASSERT_EQUAL(r, 0);
2447d722e3fbSopenharmony_ci
2448d722e3fbSopenharmony_ci	r = amdgpu_bo_unmap_and_free(ib_result_handle, va_handle,
2449d722e3fbSopenharmony_ci				     ib_result_mc_address, 4096);
2450d722e3fbSopenharmony_ci	CU_ASSERT_EQUAL(r, 0);
2451d722e3fbSopenharmony_ci
2452d722e3fbSopenharmony_ci	r = amdgpu_cs_ctx_free(context_handle[0]);
2453d722e3fbSopenharmony_ci	CU_ASSERT_EQUAL(r, 0);
2454d722e3fbSopenharmony_ci	r = amdgpu_cs_ctx_free(context_handle[1]);
2455d722e3fbSopenharmony_ci	CU_ASSERT_EQUAL(r, 0);
2456d722e3fbSopenharmony_ci
2457d722e3fbSopenharmony_ci	free(ibs_request.dependencies);
2458d722e3fbSopenharmony_ci}
2459d722e3fbSopenharmony_ci
2460d722e3fbSopenharmony_cistatic int amdgpu_dispatch_load_cs_shader_hang_slow(uint32_t *ptr, int family)
2461d722e3fbSopenharmony_ci{
2462d722e3fbSopenharmony_ci	struct amdgpu_test_shader *shader;
2463d722e3fbSopenharmony_ci	int i, loop = 0x10000;
2464d722e3fbSopenharmony_ci
2465d722e3fbSopenharmony_ci	switch (family) {
2466d722e3fbSopenharmony_ci		case AMDGPU_FAMILY_AI:
2467d722e3fbSopenharmony_ci			shader = &memcpy_cs_hang_slow_ai;
2468d722e3fbSopenharmony_ci			break;
2469d722e3fbSopenharmony_ci		case AMDGPU_FAMILY_RV:
2470d722e3fbSopenharmony_ci			shader = &memcpy_cs_hang_slow_rv;
2471d722e3fbSopenharmony_ci			break;
2472d722e3fbSopenharmony_ci		case AMDGPU_FAMILY_NV:
2473d722e3fbSopenharmony_ci			shader = &memcpy_cs_hang_slow_nv;
2474d722e3fbSopenharmony_ci			break;
2475d722e3fbSopenharmony_ci		default:
2476d722e3fbSopenharmony_ci			return -1;
2477d722e3fbSopenharmony_ci			break;
2478d722e3fbSopenharmony_ci	}
2479d722e3fbSopenharmony_ci
2480d722e3fbSopenharmony_ci	memcpy(ptr, shader->shader, shader->header_length * sizeof(uint32_t));
2481d722e3fbSopenharmony_ci
2482d722e3fbSopenharmony_ci	for (i = 0; i < loop; i++)
2483d722e3fbSopenharmony_ci		memcpy(ptr + shader->header_length + shader->body_length * i,
2484d722e3fbSopenharmony_ci			shader->shader + shader->header_length,
2485d722e3fbSopenharmony_ci			shader->body_length * sizeof(uint32_t));
2486d722e3fbSopenharmony_ci
2487d722e3fbSopenharmony_ci	memcpy(ptr + shader->header_length + shader->body_length * loop,
2488d722e3fbSopenharmony_ci		shader->shader + shader->header_length + shader->body_length,
2489d722e3fbSopenharmony_ci		shader->foot_length * sizeof(uint32_t));
2490d722e3fbSopenharmony_ci
2491d722e3fbSopenharmony_ci	return 0;
2492d722e3fbSopenharmony_ci}
2493d722e3fbSopenharmony_ci
2494d722e3fbSopenharmony_cistatic int amdgpu_dispatch_load_cs_shader(uint8_t *ptr,
2495d722e3fbSopenharmony_ci					   int cs_type,
2496d722e3fbSopenharmony_ci					   uint32_t version)
2497d722e3fbSopenharmony_ci{
2498d722e3fbSopenharmony_ci	uint32_t shader_size;
2499d722e3fbSopenharmony_ci	const uint32_t *shader;
2500d722e3fbSopenharmony_ci
2501d722e3fbSopenharmony_ci	switch (cs_type) {
2502d722e3fbSopenharmony_ci		case CS_BUFFERCLEAR:
2503d722e3fbSopenharmony_ci			if (version == 9) {
2504d722e3fbSopenharmony_ci				shader = bufferclear_cs_shader_gfx9;
2505d722e3fbSopenharmony_ci				shader_size = sizeof(bufferclear_cs_shader_gfx9);
2506d722e3fbSopenharmony_ci			} else if (version == 10) {
2507d722e3fbSopenharmony_ci				shader = bufferclear_cs_shader_gfx10;
2508d722e3fbSopenharmony_ci				shader_size = sizeof(bufferclear_cs_shader_gfx10);
2509d722e3fbSopenharmony_ci			}
2510d722e3fbSopenharmony_ci			break;
2511d722e3fbSopenharmony_ci		case CS_BUFFERCOPY:
2512d722e3fbSopenharmony_ci			if (version == 9) {
2513d722e3fbSopenharmony_ci				shader = buffercopy_cs_shader_gfx9;
2514d722e3fbSopenharmony_ci				shader_size = sizeof(buffercopy_cs_shader_gfx9);
2515d722e3fbSopenharmony_ci			} else if (version == 10) {
2516d722e3fbSopenharmony_ci				shader = buffercopy_cs_shader_gfx10;
2517d722e3fbSopenharmony_ci				shader_size = sizeof(buffercopy_cs_shader_gfx10);
2518d722e3fbSopenharmony_ci			}
2519d722e3fbSopenharmony_ci			break;
2520d722e3fbSopenharmony_ci		case CS_HANG:
2521d722e3fbSopenharmony_ci			shader = memcpy_ps_hang;
2522d722e3fbSopenharmony_ci			shader_size = sizeof(memcpy_ps_hang);
2523d722e3fbSopenharmony_ci			break;
2524d722e3fbSopenharmony_ci		default:
2525d722e3fbSopenharmony_ci			return -1;
2526d722e3fbSopenharmony_ci			break;
2527d722e3fbSopenharmony_ci	}
2528d722e3fbSopenharmony_ci
2529d722e3fbSopenharmony_ci	memcpy(ptr, shader, shader_size);
2530d722e3fbSopenharmony_ci	return 0;
2531d722e3fbSopenharmony_ci}
2532d722e3fbSopenharmony_ci
2533d722e3fbSopenharmony_cistatic int amdgpu_dispatch_init(uint32_t *ptr, uint32_t ip_type, uint32_t version)
2534d722e3fbSopenharmony_ci{
2535d722e3fbSopenharmony_ci	int i = 0;
2536d722e3fbSopenharmony_ci
2537d722e3fbSopenharmony_ci	/* Write context control and load shadowing register if necessary */
2538d722e3fbSopenharmony_ci	if (ip_type == AMDGPU_HW_IP_GFX) {
2539d722e3fbSopenharmony_ci		ptr[i++] = PACKET3(PKT3_CONTEXT_CONTROL, 1);
2540d722e3fbSopenharmony_ci		ptr[i++] = 0x80000000;
2541d722e3fbSopenharmony_ci		ptr[i++] = 0x80000000;
2542d722e3fbSopenharmony_ci	}
2543d722e3fbSopenharmony_ci
2544d722e3fbSopenharmony_ci	/* Issue commands to set default compute state. */
2545d722e3fbSopenharmony_ci	/* clear mmCOMPUTE_START_Z - mmCOMPUTE_START_X */
2546d722e3fbSopenharmony_ci	ptr[i++] = PACKET3_COMPUTE(PKT3_SET_SH_REG, 3);
2547d722e3fbSopenharmony_ci	ptr[i++] = 0x204;
2548d722e3fbSopenharmony_ci	i += 3;
2549d722e3fbSopenharmony_ci
2550d722e3fbSopenharmony_ci	/* clear mmCOMPUTE_TMPRING_SIZE */
2551d722e3fbSopenharmony_ci	ptr[i++] = PACKET3_COMPUTE(PKT3_SET_SH_REG, 1);
2552d722e3fbSopenharmony_ci	ptr[i++] = 0x218;
2553d722e3fbSopenharmony_ci	ptr[i++] = 0;
2554d722e3fbSopenharmony_ci
2555d722e3fbSopenharmony_ci	/* Set new sh registers in GFX10 to 0 */
2556d722e3fbSopenharmony_ci	if (version == 10) {
2557d722e3fbSopenharmony_ci		/* mmCOMPUTE_SHADER_CHKSUM */
2558d722e3fbSopenharmony_ci		ptr[i++] = PACKET3_COMPUTE(PKT3_SET_SH_REG, 1);
2559d722e3fbSopenharmony_ci		ptr[i++] = 0x22a;
2560d722e3fbSopenharmony_ci		ptr[i++] = 0;
2561d722e3fbSopenharmony_ci		/* mmCOMPUTE_REQ_CTRL */
2562d722e3fbSopenharmony_ci		ptr[i++] = PACKET3_COMPUTE(PKT3_SET_SH_REG, 6);
2563d722e3fbSopenharmony_ci		ptr[i++] = 0x222;
2564d722e3fbSopenharmony_ci		i += 6;
2565d722e3fbSopenharmony_ci		/* mmCP_COHER_START_DELAY */
2566d722e3fbSopenharmony_ci		ptr[i++] = PACKET3(PACKET3_SET_UCONFIG_REG, 1);
2567d722e3fbSopenharmony_ci		ptr[i++] = 0x7b;
2568d722e3fbSopenharmony_ci		ptr[i++] = 0x20;
2569d722e3fbSopenharmony_ci	}
2570d722e3fbSopenharmony_ci	return i;
2571d722e3fbSopenharmony_ci}
2572d722e3fbSopenharmony_ci
2573d722e3fbSopenharmony_cistatic int amdgpu_dispatch_write_cumask(uint32_t *ptr, uint32_t version)
2574d722e3fbSopenharmony_ci{
2575d722e3fbSopenharmony_ci	int i = 0;
2576d722e3fbSopenharmony_ci
2577d722e3fbSopenharmony_ci	/*  Issue commands to set cu mask used in current dispatch */
2578d722e3fbSopenharmony_ci	if (version == 9) {
2579d722e3fbSopenharmony_ci		/* set mmCOMPUTE_STATIC_THREAD_MGMT_SE1 - mmCOMPUTE_STATIC_THREAD_MGMT_SE0 */
2580d722e3fbSopenharmony_ci		ptr[i++] = PACKET3_COMPUTE(PKT3_SET_SH_REG, 2);
2581d722e3fbSopenharmony_ci		ptr[i++] = 0x216;
2582d722e3fbSopenharmony_ci		ptr[i++] = 0xffffffff;
2583d722e3fbSopenharmony_ci		ptr[i++] = 0xffffffff;
2584d722e3fbSopenharmony_ci		/* set mmCOMPUTE_STATIC_THREAD_MGMT_SE3 - mmCOMPUTE_STATIC_THREAD_MGMT_SE2 */
2585d722e3fbSopenharmony_ci		ptr[i++] = PACKET3_COMPUTE(PKT3_SET_SH_REG, 2);
2586d722e3fbSopenharmony_ci		ptr[i++] = 0x219;
2587d722e3fbSopenharmony_ci		ptr[i++] = 0xffffffff;
2588d722e3fbSopenharmony_ci		ptr[i++] = 0xffffffff;
2589d722e3fbSopenharmony_ci	} else if (version == 10) {
2590d722e3fbSopenharmony_ci		/* set mmCOMPUTE_STATIC_THREAD_MGMT_SE1 - mmCOMPUTE_STATIC_THREAD_MGMT_SE0 */
2591d722e3fbSopenharmony_ci		ptr[i++] = PACKET3_COMPUTE(PKT3_SET_SH_REG_INDEX, 2);
2592d722e3fbSopenharmony_ci		ptr[i++] = 0x30000216;
2593d722e3fbSopenharmony_ci		ptr[i++] = 0xffffffff;
2594d722e3fbSopenharmony_ci		ptr[i++] = 0xffffffff;
2595d722e3fbSopenharmony_ci		/* set mmCOMPUTE_STATIC_THREAD_MGMT_SE3 - mmCOMPUTE_STATIC_THREAD_MGMT_SE2 */
2596d722e3fbSopenharmony_ci		ptr[i++] = PACKET3_COMPUTE(PKT3_SET_SH_REG_INDEX, 2);
2597d722e3fbSopenharmony_ci		ptr[i++] = 0x30000219;
2598d722e3fbSopenharmony_ci		ptr[i++] = 0xffffffff;
2599d722e3fbSopenharmony_ci		ptr[i++] = 0xffffffff;
2600d722e3fbSopenharmony_ci	}
2601d722e3fbSopenharmony_ci
2602d722e3fbSopenharmony_ci	return i;
2603d722e3fbSopenharmony_ci}
2604d722e3fbSopenharmony_ci
2605d722e3fbSopenharmony_cistatic int amdgpu_dispatch_write2hw(uint32_t *ptr, uint64_t shader_addr, uint32_t version)
2606d722e3fbSopenharmony_ci{
2607d722e3fbSopenharmony_ci	int i, j;
2608d722e3fbSopenharmony_ci
2609d722e3fbSopenharmony_ci	i = 0;
2610d722e3fbSopenharmony_ci
2611d722e3fbSopenharmony_ci	/* Writes shader state to HW */
2612d722e3fbSopenharmony_ci	/* set mmCOMPUTE_PGM_HI - mmCOMPUTE_PGM_LO */
2613d722e3fbSopenharmony_ci	ptr[i++] = PACKET3_COMPUTE(PKT3_SET_SH_REG, 2);
2614d722e3fbSopenharmony_ci	ptr[i++] = 0x20c;
2615d722e3fbSopenharmony_ci	ptr[i++] = (shader_addr >> 8);
2616d722e3fbSopenharmony_ci	ptr[i++] = (shader_addr >> 40);
2617d722e3fbSopenharmony_ci	/* write sh regs*/
2618d722e3fbSopenharmony_ci	for (j = 0; j < bufferclear_cs_shader_registers_num_gfx9; j++) {
2619d722e3fbSopenharmony_ci		ptr[i++] = PACKET3_COMPUTE(PKT3_SET_SH_REG, 1);
2620d722e3fbSopenharmony_ci		/* - Gfx9ShRegBase */
2621d722e3fbSopenharmony_ci		ptr[i++] = bufferclear_cs_shader_registers_gfx9[j][0] - 0x2c00;
2622d722e3fbSopenharmony_ci		ptr[i++] = bufferclear_cs_shader_registers_gfx9[j][1];
2623d722e3fbSopenharmony_ci	}
2624d722e3fbSopenharmony_ci
2625d722e3fbSopenharmony_ci	if (version == 10) {
2626d722e3fbSopenharmony_ci		/* mmCOMPUTE_PGM_RSRC3 */
2627d722e3fbSopenharmony_ci		ptr[i++] = PACKET3_COMPUTE(PKT3_SET_SH_REG, 1);
2628d722e3fbSopenharmony_ci		ptr[i++] = 0x228;
2629d722e3fbSopenharmony_ci		ptr[i++] = 0;
2630d722e3fbSopenharmony_ci	}
2631d722e3fbSopenharmony_ci
2632d722e3fbSopenharmony_ci	return i;
2633d722e3fbSopenharmony_ci}
2634d722e3fbSopenharmony_ci
2635d722e3fbSopenharmony_cistatic void amdgpu_memset_dispatch_test(amdgpu_device_handle device_handle,
2636d722e3fbSopenharmony_ci					 uint32_t ip_type,
2637d722e3fbSopenharmony_ci					 uint32_t ring,
2638d722e3fbSopenharmony_ci					 uint32_t version)
2639d722e3fbSopenharmony_ci{
2640d722e3fbSopenharmony_ci	amdgpu_context_handle context_handle;
2641d722e3fbSopenharmony_ci	amdgpu_bo_handle bo_dst, bo_shader, bo_cmd, resources[3];
2642d722e3fbSopenharmony_ci	volatile unsigned char *ptr_dst;
2643d722e3fbSopenharmony_ci	void *ptr_shader;
2644d722e3fbSopenharmony_ci	uint32_t *ptr_cmd;
2645d722e3fbSopenharmony_ci	uint64_t mc_address_dst, mc_address_shader, mc_address_cmd;
2646d722e3fbSopenharmony_ci	amdgpu_va_handle va_dst, va_shader, va_cmd;
2647d722e3fbSopenharmony_ci	int i, r;
2648d722e3fbSopenharmony_ci	int bo_dst_size = 16384;
2649d722e3fbSopenharmony_ci	int bo_shader_size = 4096;
2650d722e3fbSopenharmony_ci	int bo_cmd_size = 4096;
2651d722e3fbSopenharmony_ci	struct amdgpu_cs_request ibs_request = {0};
2652d722e3fbSopenharmony_ci	struct amdgpu_cs_ib_info ib_info= {0};
2653d722e3fbSopenharmony_ci	amdgpu_bo_list_handle bo_list;
2654d722e3fbSopenharmony_ci	struct amdgpu_cs_fence fence_status = {0};
2655d722e3fbSopenharmony_ci	uint32_t expired;
2656d722e3fbSopenharmony_ci
2657d722e3fbSopenharmony_ci	r = amdgpu_cs_ctx_create(device_handle, &context_handle);
2658d722e3fbSopenharmony_ci	CU_ASSERT_EQUAL(r, 0);
2659d722e3fbSopenharmony_ci
2660d722e3fbSopenharmony_ci	r = amdgpu_bo_alloc_and_map(device_handle, bo_cmd_size, 4096,
2661d722e3fbSopenharmony_ci					AMDGPU_GEM_DOMAIN_GTT, 0,
2662d722e3fbSopenharmony_ci					&bo_cmd, (void **)&ptr_cmd,
2663d722e3fbSopenharmony_ci					&mc_address_cmd, &va_cmd);
2664d722e3fbSopenharmony_ci	CU_ASSERT_EQUAL(r, 0);
2665d722e3fbSopenharmony_ci	memset(ptr_cmd, 0, bo_cmd_size);
2666d722e3fbSopenharmony_ci
2667d722e3fbSopenharmony_ci	r = amdgpu_bo_alloc_and_map(device_handle, bo_shader_size, 4096,
2668d722e3fbSopenharmony_ci					AMDGPU_GEM_DOMAIN_VRAM, 0,
2669d722e3fbSopenharmony_ci					&bo_shader, &ptr_shader,
2670d722e3fbSopenharmony_ci					&mc_address_shader, &va_shader);
2671d722e3fbSopenharmony_ci	CU_ASSERT_EQUAL(r, 0);
2672d722e3fbSopenharmony_ci	memset(ptr_shader, 0, bo_shader_size);
2673d722e3fbSopenharmony_ci
2674d722e3fbSopenharmony_ci	r = amdgpu_dispatch_load_cs_shader(ptr_shader, CS_BUFFERCLEAR, version);
2675d722e3fbSopenharmony_ci	CU_ASSERT_EQUAL(r, 0);
2676d722e3fbSopenharmony_ci
2677d722e3fbSopenharmony_ci	r = amdgpu_bo_alloc_and_map(device_handle, bo_dst_size, 4096,
2678d722e3fbSopenharmony_ci					AMDGPU_GEM_DOMAIN_VRAM, 0,
2679d722e3fbSopenharmony_ci					&bo_dst, (void **)&ptr_dst,
2680d722e3fbSopenharmony_ci					&mc_address_dst, &va_dst);
2681d722e3fbSopenharmony_ci	CU_ASSERT_EQUAL(r, 0);
2682d722e3fbSopenharmony_ci
2683d722e3fbSopenharmony_ci	i = 0;
2684d722e3fbSopenharmony_ci	i += amdgpu_dispatch_init(ptr_cmd + i, ip_type, version);
2685d722e3fbSopenharmony_ci
2686d722e3fbSopenharmony_ci	/*  Issue commands to set cu mask used in current dispatch */
2687d722e3fbSopenharmony_ci	i += amdgpu_dispatch_write_cumask(ptr_cmd + i, version);
2688d722e3fbSopenharmony_ci
2689d722e3fbSopenharmony_ci	/* Writes shader state to HW */
2690d722e3fbSopenharmony_ci	i += amdgpu_dispatch_write2hw(ptr_cmd + i, mc_address_shader, version);
2691d722e3fbSopenharmony_ci
2692d722e3fbSopenharmony_ci	/* Write constant data */
2693d722e3fbSopenharmony_ci	/* Writes the UAV constant data to the SGPRs. */
2694d722e3fbSopenharmony_ci	ptr_cmd[i++] = PACKET3_COMPUTE(PKT3_SET_SH_REG, 4);
2695d722e3fbSopenharmony_ci	ptr_cmd[i++] = 0x240;
2696d722e3fbSopenharmony_ci	ptr_cmd[i++] = mc_address_dst;
2697d722e3fbSopenharmony_ci	ptr_cmd[i++] = (mc_address_dst >> 32) | 0x100000;
2698d722e3fbSopenharmony_ci	ptr_cmd[i++] = 0x400;
2699d722e3fbSopenharmony_ci	if (version == 9)
2700d722e3fbSopenharmony_ci		ptr_cmd[i++] = 0x74fac;
2701d722e3fbSopenharmony_ci	else if (version == 10)
2702d722e3fbSopenharmony_ci		ptr_cmd[i++] = 0x1104bfac;
2703d722e3fbSopenharmony_ci
2704d722e3fbSopenharmony_ci	/* Sets a range of pixel shader constants */
2705d722e3fbSopenharmony_ci	ptr_cmd[i++] = PACKET3_COMPUTE(PKT3_SET_SH_REG, 4);
2706d722e3fbSopenharmony_ci	ptr_cmd[i++] = 0x244;
2707d722e3fbSopenharmony_ci	ptr_cmd[i++] = 0x22222222;
2708d722e3fbSopenharmony_ci	ptr_cmd[i++] = 0x22222222;
2709d722e3fbSopenharmony_ci	ptr_cmd[i++] = 0x22222222;
2710d722e3fbSopenharmony_ci	ptr_cmd[i++] = 0x22222222;
2711d722e3fbSopenharmony_ci
2712d722e3fbSopenharmony_ci	/* clear mmCOMPUTE_RESOURCE_LIMITS */
2713d722e3fbSopenharmony_ci	ptr_cmd[i++] = PACKET3_COMPUTE(PKT3_SET_SH_REG, 1);
2714d722e3fbSopenharmony_ci	ptr_cmd[i++] = 0x215;
2715d722e3fbSopenharmony_ci	ptr_cmd[i++] = 0;
2716d722e3fbSopenharmony_ci
2717d722e3fbSopenharmony_ci	/* dispatch direct command */
2718d722e3fbSopenharmony_ci	ptr_cmd[i++] = PACKET3_COMPUTE(PACKET3_DISPATCH_DIRECT, 3);
2719d722e3fbSopenharmony_ci	ptr_cmd[i++] = 0x10;
2720d722e3fbSopenharmony_ci	ptr_cmd[i++] = 1;
2721d722e3fbSopenharmony_ci	ptr_cmd[i++] = 1;
2722d722e3fbSopenharmony_ci	ptr_cmd[i++] = 1;
2723d722e3fbSopenharmony_ci
2724d722e3fbSopenharmony_ci	while (i & 7)
2725d722e3fbSopenharmony_ci		ptr_cmd[i++] = 0xffff1000; /* type3 nop packet */
2726d722e3fbSopenharmony_ci
2727d722e3fbSopenharmony_ci	resources[0] = bo_dst;
2728d722e3fbSopenharmony_ci	resources[1] = bo_shader;
2729d722e3fbSopenharmony_ci	resources[2] = bo_cmd;
2730d722e3fbSopenharmony_ci	r = amdgpu_bo_list_create(device_handle, 3, resources, NULL, &bo_list);
2731d722e3fbSopenharmony_ci	CU_ASSERT_EQUAL(r, 0);
2732d722e3fbSopenharmony_ci
2733d722e3fbSopenharmony_ci	ib_info.ib_mc_address = mc_address_cmd;
2734d722e3fbSopenharmony_ci	ib_info.size = i;
2735d722e3fbSopenharmony_ci	ibs_request.ip_type = ip_type;
2736d722e3fbSopenharmony_ci	ibs_request.ring = ring;
2737d722e3fbSopenharmony_ci	ibs_request.resources = bo_list;
2738d722e3fbSopenharmony_ci	ibs_request.number_of_ibs = 1;
2739d722e3fbSopenharmony_ci	ibs_request.ibs = &ib_info;
2740d722e3fbSopenharmony_ci	ibs_request.fence_info.handle = NULL;
2741d722e3fbSopenharmony_ci
2742d722e3fbSopenharmony_ci	/* submit CS */
2743d722e3fbSopenharmony_ci	r = amdgpu_cs_submit(context_handle, 0, &ibs_request, 1);
2744d722e3fbSopenharmony_ci	CU_ASSERT_EQUAL(r, 0);
2745d722e3fbSopenharmony_ci
2746d722e3fbSopenharmony_ci	r = amdgpu_bo_list_destroy(bo_list);
2747d722e3fbSopenharmony_ci	CU_ASSERT_EQUAL(r, 0);
2748d722e3fbSopenharmony_ci
2749d722e3fbSopenharmony_ci	fence_status.ip_type = ip_type;
2750d722e3fbSopenharmony_ci	fence_status.ip_instance = 0;
2751d722e3fbSopenharmony_ci	fence_status.ring = ring;
2752d722e3fbSopenharmony_ci	fence_status.context = context_handle;
2753d722e3fbSopenharmony_ci	fence_status.fence = ibs_request.seq_no;
2754d722e3fbSopenharmony_ci
2755d722e3fbSopenharmony_ci	/* wait for IB accomplished */
2756d722e3fbSopenharmony_ci	r = amdgpu_cs_query_fence_status(&fence_status,
2757d722e3fbSopenharmony_ci					 AMDGPU_TIMEOUT_INFINITE,
2758d722e3fbSopenharmony_ci					 0, &expired);
2759d722e3fbSopenharmony_ci	CU_ASSERT_EQUAL(r, 0);
2760d722e3fbSopenharmony_ci	CU_ASSERT_EQUAL(expired, true);
2761d722e3fbSopenharmony_ci
2762d722e3fbSopenharmony_ci	/* verify if memset test result meets with expected */
2763d722e3fbSopenharmony_ci	i = 0;
2764d722e3fbSopenharmony_ci	while(i < bo_dst_size) {
2765d722e3fbSopenharmony_ci		CU_ASSERT_EQUAL(ptr_dst[i++], 0x22);
2766d722e3fbSopenharmony_ci	}
2767d722e3fbSopenharmony_ci
2768d722e3fbSopenharmony_ci	r = amdgpu_bo_unmap_and_free(bo_dst, va_dst, mc_address_dst, bo_dst_size);
2769d722e3fbSopenharmony_ci	CU_ASSERT_EQUAL(r, 0);
2770d722e3fbSopenharmony_ci
2771d722e3fbSopenharmony_ci	r = amdgpu_bo_unmap_and_free(bo_shader, va_shader, mc_address_shader, bo_shader_size);
2772d722e3fbSopenharmony_ci	CU_ASSERT_EQUAL(r, 0);
2773d722e3fbSopenharmony_ci
2774d722e3fbSopenharmony_ci	r = amdgpu_bo_unmap_and_free(bo_cmd, va_cmd, mc_address_cmd, bo_cmd_size);
2775d722e3fbSopenharmony_ci	CU_ASSERT_EQUAL(r, 0);
2776d722e3fbSopenharmony_ci
2777d722e3fbSopenharmony_ci	r = amdgpu_cs_ctx_free(context_handle);
2778d722e3fbSopenharmony_ci	CU_ASSERT_EQUAL(r, 0);
2779d722e3fbSopenharmony_ci}
2780d722e3fbSopenharmony_ci
2781d722e3fbSopenharmony_cistatic void amdgpu_memcpy_dispatch_test(amdgpu_device_handle device_handle,
2782d722e3fbSopenharmony_ci					uint32_t ip_type,
2783d722e3fbSopenharmony_ci					uint32_t ring,
2784d722e3fbSopenharmony_ci					uint32_t version,
2785d722e3fbSopenharmony_ci					int hang)
2786d722e3fbSopenharmony_ci{
2787d722e3fbSopenharmony_ci	amdgpu_context_handle context_handle;
2788d722e3fbSopenharmony_ci	amdgpu_bo_handle bo_src, bo_dst, bo_shader, bo_cmd, resources[4];
2789d722e3fbSopenharmony_ci	volatile unsigned char *ptr_dst;
2790d722e3fbSopenharmony_ci	void *ptr_shader;
2791d722e3fbSopenharmony_ci	unsigned char *ptr_src;
2792d722e3fbSopenharmony_ci	uint32_t *ptr_cmd;
2793d722e3fbSopenharmony_ci	uint64_t mc_address_src, mc_address_dst, mc_address_shader, mc_address_cmd;
2794d722e3fbSopenharmony_ci	amdgpu_va_handle va_src, va_dst, va_shader, va_cmd;
2795d722e3fbSopenharmony_ci	int i, r;
2796d722e3fbSopenharmony_ci	int bo_dst_size = 16384;
2797d722e3fbSopenharmony_ci	int bo_shader_size = 4096;
2798d722e3fbSopenharmony_ci	int bo_cmd_size = 4096;
2799d722e3fbSopenharmony_ci	struct amdgpu_cs_request ibs_request = {0};
2800d722e3fbSopenharmony_ci	struct amdgpu_cs_ib_info ib_info= {0};
2801d722e3fbSopenharmony_ci	uint32_t expired, hang_state, hangs;
2802d722e3fbSopenharmony_ci	enum cs_type cs_type;
2803d722e3fbSopenharmony_ci	amdgpu_bo_list_handle bo_list;
2804d722e3fbSopenharmony_ci	struct amdgpu_cs_fence fence_status = {0};
2805d722e3fbSopenharmony_ci
2806d722e3fbSopenharmony_ci	r = amdgpu_cs_ctx_create(device_handle, &context_handle);
2807d722e3fbSopenharmony_ci	CU_ASSERT_EQUAL(r, 0);
2808d722e3fbSopenharmony_ci
2809d722e3fbSopenharmony_ci	r = amdgpu_bo_alloc_and_map(device_handle, bo_cmd_size, 4096,
2810d722e3fbSopenharmony_ci				    AMDGPU_GEM_DOMAIN_GTT, 0,
2811d722e3fbSopenharmony_ci				    &bo_cmd, (void **)&ptr_cmd,
2812d722e3fbSopenharmony_ci				    &mc_address_cmd, &va_cmd);
2813d722e3fbSopenharmony_ci	CU_ASSERT_EQUAL(r, 0);
2814d722e3fbSopenharmony_ci	memset(ptr_cmd, 0, bo_cmd_size);
2815d722e3fbSopenharmony_ci
2816d722e3fbSopenharmony_ci	r = amdgpu_bo_alloc_and_map(device_handle, bo_shader_size, 4096,
2817d722e3fbSopenharmony_ci					AMDGPU_GEM_DOMAIN_VRAM, 0,
2818d722e3fbSopenharmony_ci					&bo_shader, &ptr_shader,
2819d722e3fbSopenharmony_ci					&mc_address_shader, &va_shader);
2820d722e3fbSopenharmony_ci	CU_ASSERT_EQUAL(r, 0);
2821d722e3fbSopenharmony_ci	memset(ptr_shader, 0, bo_shader_size);
2822d722e3fbSopenharmony_ci
2823d722e3fbSopenharmony_ci	cs_type = hang ? CS_HANG : CS_BUFFERCOPY;
2824d722e3fbSopenharmony_ci	r = amdgpu_dispatch_load_cs_shader(ptr_shader, cs_type, version);
2825d722e3fbSopenharmony_ci	CU_ASSERT_EQUAL(r, 0);
2826d722e3fbSopenharmony_ci
2827d722e3fbSopenharmony_ci	r = amdgpu_bo_alloc_and_map(device_handle, bo_dst_size, 4096,
2828d722e3fbSopenharmony_ci					AMDGPU_GEM_DOMAIN_VRAM, 0,
2829d722e3fbSopenharmony_ci					&bo_src, (void **)&ptr_src,
2830d722e3fbSopenharmony_ci					&mc_address_src, &va_src);
2831d722e3fbSopenharmony_ci	CU_ASSERT_EQUAL(r, 0);
2832d722e3fbSopenharmony_ci
2833d722e3fbSopenharmony_ci	r = amdgpu_bo_alloc_and_map(device_handle, bo_dst_size, 4096,
2834d722e3fbSopenharmony_ci					AMDGPU_GEM_DOMAIN_VRAM, 0,
2835d722e3fbSopenharmony_ci					&bo_dst, (void **)&ptr_dst,
2836d722e3fbSopenharmony_ci					&mc_address_dst, &va_dst);
2837d722e3fbSopenharmony_ci	CU_ASSERT_EQUAL(r, 0);
2838d722e3fbSopenharmony_ci
2839d722e3fbSopenharmony_ci	memset(ptr_src, 0x55, bo_dst_size);
2840d722e3fbSopenharmony_ci
2841d722e3fbSopenharmony_ci	i = 0;
2842d722e3fbSopenharmony_ci	i += amdgpu_dispatch_init(ptr_cmd + i, ip_type, version);
2843d722e3fbSopenharmony_ci
2844d722e3fbSopenharmony_ci	/*  Issue commands to set cu mask used in current dispatch */
2845d722e3fbSopenharmony_ci	i += amdgpu_dispatch_write_cumask(ptr_cmd + i, version);
2846d722e3fbSopenharmony_ci
2847d722e3fbSopenharmony_ci	/* Writes shader state to HW */
2848d722e3fbSopenharmony_ci	i += amdgpu_dispatch_write2hw(ptr_cmd + i, mc_address_shader, version);
2849d722e3fbSopenharmony_ci
2850d722e3fbSopenharmony_ci	/* Write constant data */
2851d722e3fbSopenharmony_ci	/* Writes the texture resource constants data to the SGPRs */
2852d722e3fbSopenharmony_ci	ptr_cmd[i++] = PACKET3_COMPUTE(PKT3_SET_SH_REG, 4);
2853d722e3fbSopenharmony_ci	ptr_cmd[i++] = 0x240;
2854d722e3fbSopenharmony_ci	ptr_cmd[i++] = mc_address_src;
2855d722e3fbSopenharmony_ci	ptr_cmd[i++] = (mc_address_src >> 32) | 0x100000;
2856d722e3fbSopenharmony_ci	ptr_cmd[i++] = 0x400;
2857d722e3fbSopenharmony_ci	if (version == 9)
2858d722e3fbSopenharmony_ci		ptr_cmd[i++] = 0x74fac;
2859d722e3fbSopenharmony_ci	else if (version == 10)
2860d722e3fbSopenharmony_ci		ptr_cmd[i++] = 0x1104bfac;
2861d722e3fbSopenharmony_ci
2862d722e3fbSopenharmony_ci	/* Writes the UAV constant data to the SGPRs. */
2863d722e3fbSopenharmony_ci	ptr_cmd[i++] = PACKET3_COMPUTE(PKT3_SET_SH_REG, 4);
2864d722e3fbSopenharmony_ci	ptr_cmd[i++] = 0x244;
2865d722e3fbSopenharmony_ci	ptr_cmd[i++] = mc_address_dst;
2866d722e3fbSopenharmony_ci	ptr_cmd[i++] = (mc_address_dst >> 32) | 0x100000;
2867d722e3fbSopenharmony_ci	ptr_cmd[i++] = 0x400;
2868d722e3fbSopenharmony_ci	if (version == 9)
2869d722e3fbSopenharmony_ci		ptr_cmd[i++] = 0x74fac;
2870d722e3fbSopenharmony_ci	else if (version == 10)
2871d722e3fbSopenharmony_ci		ptr_cmd[i++] = 0x1104bfac;
2872d722e3fbSopenharmony_ci
2873d722e3fbSopenharmony_ci	/* clear mmCOMPUTE_RESOURCE_LIMITS */
2874d722e3fbSopenharmony_ci	ptr_cmd[i++] = PACKET3_COMPUTE(PKT3_SET_SH_REG, 1);
2875d722e3fbSopenharmony_ci	ptr_cmd[i++] = 0x215;
2876d722e3fbSopenharmony_ci	ptr_cmd[i++] = 0;
2877d722e3fbSopenharmony_ci
2878d722e3fbSopenharmony_ci	/* dispatch direct command */
2879d722e3fbSopenharmony_ci	ptr_cmd[i++] = PACKET3_COMPUTE(PACKET3_DISPATCH_DIRECT, 3);
2880d722e3fbSopenharmony_ci	ptr_cmd[i++] = 0x10;
2881d722e3fbSopenharmony_ci	ptr_cmd[i++] = 1;
2882d722e3fbSopenharmony_ci	ptr_cmd[i++] = 1;
2883d722e3fbSopenharmony_ci	ptr_cmd[i++] = 1;
2884d722e3fbSopenharmony_ci
2885d722e3fbSopenharmony_ci	while (i & 7)
2886d722e3fbSopenharmony_ci		ptr_cmd[i++] = 0xffff1000; /* type3 nop packet */
2887d722e3fbSopenharmony_ci
2888d722e3fbSopenharmony_ci	resources[0] = bo_shader;
2889d722e3fbSopenharmony_ci	resources[1] = bo_src;
2890d722e3fbSopenharmony_ci	resources[2] = bo_dst;
2891d722e3fbSopenharmony_ci	resources[3] = bo_cmd;
2892d722e3fbSopenharmony_ci	r = amdgpu_bo_list_create(device_handle, 4, resources, NULL, &bo_list);
2893d722e3fbSopenharmony_ci	CU_ASSERT_EQUAL(r, 0);
2894d722e3fbSopenharmony_ci
2895d722e3fbSopenharmony_ci	ib_info.ib_mc_address = mc_address_cmd;
2896d722e3fbSopenharmony_ci	ib_info.size = i;
2897d722e3fbSopenharmony_ci	ibs_request.ip_type = ip_type;
2898d722e3fbSopenharmony_ci	ibs_request.ring = ring;
2899d722e3fbSopenharmony_ci	ibs_request.resources = bo_list;
2900d722e3fbSopenharmony_ci	ibs_request.number_of_ibs = 1;
2901d722e3fbSopenharmony_ci	ibs_request.ibs = &ib_info;
2902d722e3fbSopenharmony_ci	ibs_request.fence_info.handle = NULL;
2903d722e3fbSopenharmony_ci	r = amdgpu_cs_submit(context_handle, 0, &ibs_request, 1);
2904d722e3fbSopenharmony_ci	CU_ASSERT_EQUAL(r, 0);
2905d722e3fbSopenharmony_ci
2906d722e3fbSopenharmony_ci	fence_status.ip_type = ip_type;
2907d722e3fbSopenharmony_ci	fence_status.ip_instance = 0;
2908d722e3fbSopenharmony_ci	fence_status.ring = ring;
2909d722e3fbSopenharmony_ci	fence_status.context = context_handle;
2910d722e3fbSopenharmony_ci	fence_status.fence = ibs_request.seq_no;
2911d722e3fbSopenharmony_ci
2912d722e3fbSopenharmony_ci	/* wait for IB accomplished */
2913d722e3fbSopenharmony_ci	r = amdgpu_cs_query_fence_status(&fence_status,
2914d722e3fbSopenharmony_ci					 AMDGPU_TIMEOUT_INFINITE,
2915d722e3fbSopenharmony_ci					 0, &expired);
2916d722e3fbSopenharmony_ci
2917d722e3fbSopenharmony_ci	if (!hang) {
2918d722e3fbSopenharmony_ci		CU_ASSERT_EQUAL(r, 0);
2919d722e3fbSopenharmony_ci		CU_ASSERT_EQUAL(expired, true);
2920d722e3fbSopenharmony_ci
2921d722e3fbSopenharmony_ci		/* verify if memcpy test result meets with expected */
2922d722e3fbSopenharmony_ci		i = 0;
2923d722e3fbSopenharmony_ci		while(i < bo_dst_size) {
2924d722e3fbSopenharmony_ci			CU_ASSERT_EQUAL(ptr_dst[i], ptr_src[i]);
2925d722e3fbSopenharmony_ci			i++;
2926d722e3fbSopenharmony_ci		}
2927d722e3fbSopenharmony_ci	} else {
2928d722e3fbSopenharmony_ci		r = amdgpu_cs_query_reset_state(context_handle, &hang_state, &hangs);
2929d722e3fbSopenharmony_ci		CU_ASSERT_EQUAL(r, 0);
2930d722e3fbSopenharmony_ci		CU_ASSERT_EQUAL(hang_state, AMDGPU_CTX_UNKNOWN_RESET);
2931d722e3fbSopenharmony_ci	}
2932d722e3fbSopenharmony_ci
2933d722e3fbSopenharmony_ci	r = amdgpu_bo_list_destroy(bo_list);
2934d722e3fbSopenharmony_ci	CU_ASSERT_EQUAL(r, 0);
2935d722e3fbSopenharmony_ci
2936d722e3fbSopenharmony_ci	r = amdgpu_bo_unmap_and_free(bo_src, va_src, mc_address_src, bo_dst_size);
2937d722e3fbSopenharmony_ci	CU_ASSERT_EQUAL(r, 0);
2938d722e3fbSopenharmony_ci	r = amdgpu_bo_unmap_and_free(bo_dst, va_dst, mc_address_dst, bo_dst_size);
2939d722e3fbSopenharmony_ci	CU_ASSERT_EQUAL(r, 0);
2940d722e3fbSopenharmony_ci
2941d722e3fbSopenharmony_ci	r = amdgpu_bo_unmap_and_free(bo_cmd, va_cmd, mc_address_cmd, bo_cmd_size);
2942d722e3fbSopenharmony_ci	CU_ASSERT_EQUAL(r, 0);
2943d722e3fbSopenharmony_ci
2944d722e3fbSopenharmony_ci	r = amdgpu_bo_unmap_and_free(bo_shader, va_shader, mc_address_shader, bo_shader_size);
2945d722e3fbSopenharmony_ci	CU_ASSERT_EQUAL(r, 0);
2946d722e3fbSopenharmony_ci
2947d722e3fbSopenharmony_ci	r = amdgpu_cs_ctx_free(context_handle);
2948d722e3fbSopenharmony_ci	CU_ASSERT_EQUAL(r, 0);
2949d722e3fbSopenharmony_ci}
2950d722e3fbSopenharmony_ci
2951d722e3fbSopenharmony_cistatic void amdgpu_compute_dispatch_test(void)
2952d722e3fbSopenharmony_ci{
2953d722e3fbSopenharmony_ci	int r;
2954d722e3fbSopenharmony_ci	struct drm_amdgpu_info_hw_ip info;
2955d722e3fbSopenharmony_ci	uint32_t ring_id, version;
2956d722e3fbSopenharmony_ci
2957d722e3fbSopenharmony_ci	r = amdgpu_query_hw_ip_info(device_handle, AMDGPU_HW_IP_COMPUTE, 0, &info);
2958d722e3fbSopenharmony_ci	CU_ASSERT_EQUAL(r, 0);
2959d722e3fbSopenharmony_ci	if (!info.available_rings)
2960d722e3fbSopenharmony_ci		printf("SKIP ... as there's no compute ring\n");
2961d722e3fbSopenharmony_ci
2962d722e3fbSopenharmony_ci	version = info.hw_ip_version_major;
2963d722e3fbSopenharmony_ci	if (version != 9 && version != 10) {
2964d722e3fbSopenharmony_ci		printf("SKIP ... unsupported gfx version %d\n", version);
2965d722e3fbSopenharmony_ci		return;
2966d722e3fbSopenharmony_ci	}
2967d722e3fbSopenharmony_ci
2968d722e3fbSopenharmony_ci	for (ring_id = 0; (1 << ring_id) & info.available_rings; ring_id++) {
2969d722e3fbSopenharmony_ci		amdgpu_memset_dispatch_test(device_handle, AMDGPU_HW_IP_COMPUTE, ring_id, version);
2970d722e3fbSopenharmony_ci		amdgpu_memcpy_dispatch_test(device_handle, AMDGPU_HW_IP_COMPUTE, ring_id, version, 0);
2971d722e3fbSopenharmony_ci	}
2972d722e3fbSopenharmony_ci}
2973d722e3fbSopenharmony_ci
2974d722e3fbSopenharmony_cistatic void amdgpu_gfx_dispatch_test(void)
2975d722e3fbSopenharmony_ci{
2976d722e3fbSopenharmony_ci	int r;
2977d722e3fbSopenharmony_ci	struct drm_amdgpu_info_hw_ip info;
2978d722e3fbSopenharmony_ci	uint32_t ring_id, version;
2979d722e3fbSopenharmony_ci
2980d722e3fbSopenharmony_ci	r = amdgpu_query_hw_ip_info(device_handle, AMDGPU_HW_IP_GFX, 0, &info);
2981d722e3fbSopenharmony_ci	CU_ASSERT_EQUAL(r, 0);
2982d722e3fbSopenharmony_ci	if (!info.available_rings)
2983d722e3fbSopenharmony_ci		printf("SKIP ... as there's no graphics ring\n");
2984d722e3fbSopenharmony_ci
2985d722e3fbSopenharmony_ci	version = info.hw_ip_version_major;
2986d722e3fbSopenharmony_ci	if (version != 9 && version != 10) {
2987d722e3fbSopenharmony_ci		printf("SKIP ... unsupported gfx version %d\n", version);
2988d722e3fbSopenharmony_ci		return;
2989d722e3fbSopenharmony_ci	}
2990d722e3fbSopenharmony_ci
2991d722e3fbSopenharmony_ci	for (ring_id = 0; (1 << ring_id) & info.available_rings; ring_id++) {
2992d722e3fbSopenharmony_ci		amdgpu_memset_dispatch_test(device_handle, AMDGPU_HW_IP_GFX, ring_id, version);
2993d722e3fbSopenharmony_ci		amdgpu_memcpy_dispatch_test(device_handle, AMDGPU_HW_IP_GFX, ring_id, version, 0);
2994d722e3fbSopenharmony_ci	}
2995d722e3fbSopenharmony_ci}
2996d722e3fbSopenharmony_ci
2997d722e3fbSopenharmony_civoid amdgpu_dispatch_hang_helper(amdgpu_device_handle device_handle, uint32_t ip_type)
2998d722e3fbSopenharmony_ci{
2999d722e3fbSopenharmony_ci	int r;
3000d722e3fbSopenharmony_ci	struct drm_amdgpu_info_hw_ip info;
3001d722e3fbSopenharmony_ci	uint32_t ring_id, version;
3002d722e3fbSopenharmony_ci
3003d722e3fbSopenharmony_ci	r = amdgpu_query_hw_ip_info(device_handle, ip_type, 0, &info);
3004d722e3fbSopenharmony_ci	CU_ASSERT_EQUAL(r, 0);
3005d722e3fbSopenharmony_ci	if (!info.available_rings)
3006d722e3fbSopenharmony_ci		printf("SKIP ... as there's no ring for ip %d\n", ip_type);
3007d722e3fbSopenharmony_ci
3008d722e3fbSopenharmony_ci	version = info.hw_ip_version_major;
3009d722e3fbSopenharmony_ci	if (version != 9 && version != 10) {
3010d722e3fbSopenharmony_ci		printf("SKIP ... unsupported gfx version %d\n", version);
3011d722e3fbSopenharmony_ci		return;
3012d722e3fbSopenharmony_ci	}
3013d722e3fbSopenharmony_ci
3014d722e3fbSopenharmony_ci	for (ring_id = 0; (1 << ring_id) & info.available_rings; ring_id++) {
3015d722e3fbSopenharmony_ci		amdgpu_memcpy_dispatch_test(device_handle, ip_type, ring_id, version, 0);
3016d722e3fbSopenharmony_ci		amdgpu_memcpy_dispatch_test(device_handle, ip_type, ring_id, version, 1);
3017d722e3fbSopenharmony_ci		amdgpu_memcpy_dispatch_test(device_handle, ip_type, ring_id, version, 0);
3018d722e3fbSopenharmony_ci	}
3019d722e3fbSopenharmony_ci}
3020d722e3fbSopenharmony_ci
3021d722e3fbSopenharmony_cistatic void amdgpu_memcpy_dispatch_hang_slow_test(amdgpu_device_handle device_handle,
3022d722e3fbSopenharmony_ci						  uint32_t ip_type, uint32_t ring, int version)
3023d722e3fbSopenharmony_ci{
3024d722e3fbSopenharmony_ci	amdgpu_context_handle context_handle;
3025d722e3fbSopenharmony_ci	amdgpu_bo_handle bo_src, bo_dst, bo_shader, bo_cmd, resources[4];
3026d722e3fbSopenharmony_ci	volatile unsigned char *ptr_dst;
3027d722e3fbSopenharmony_ci	void *ptr_shader;
3028d722e3fbSopenharmony_ci	unsigned char *ptr_src;
3029d722e3fbSopenharmony_ci	uint32_t *ptr_cmd;
3030d722e3fbSopenharmony_ci	uint64_t mc_address_src, mc_address_dst, mc_address_shader, mc_address_cmd;
3031d722e3fbSopenharmony_ci	amdgpu_va_handle va_src, va_dst, va_shader, va_cmd;
3032d722e3fbSopenharmony_ci	int i, r;
3033d722e3fbSopenharmony_ci	int bo_dst_size = 0x4000000;
3034d722e3fbSopenharmony_ci	int bo_shader_size = 0x400000;
3035d722e3fbSopenharmony_ci	int bo_cmd_size = 4096;
3036d722e3fbSopenharmony_ci	struct amdgpu_cs_request ibs_request = {0};
3037d722e3fbSopenharmony_ci	struct amdgpu_cs_ib_info ib_info= {0};
3038d722e3fbSopenharmony_ci	uint32_t hang_state, hangs, expired;
3039d722e3fbSopenharmony_ci	struct amdgpu_gpu_info gpu_info = {0};
3040d722e3fbSopenharmony_ci	amdgpu_bo_list_handle bo_list;
3041d722e3fbSopenharmony_ci	struct amdgpu_cs_fence fence_status = {0};
3042d722e3fbSopenharmony_ci
3043d722e3fbSopenharmony_ci	r = amdgpu_query_gpu_info(device_handle, &gpu_info);
3044d722e3fbSopenharmony_ci	CU_ASSERT_EQUAL(r, 0);
3045d722e3fbSopenharmony_ci
3046d722e3fbSopenharmony_ci	r = amdgpu_cs_ctx_create(device_handle, &context_handle);
3047d722e3fbSopenharmony_ci	CU_ASSERT_EQUAL(r, 0);
3048d722e3fbSopenharmony_ci
3049d722e3fbSopenharmony_ci	r = amdgpu_bo_alloc_and_map(device_handle, bo_cmd_size, 4096,
3050d722e3fbSopenharmony_ci				    AMDGPU_GEM_DOMAIN_GTT, 0,
3051d722e3fbSopenharmony_ci				    &bo_cmd, (void **)&ptr_cmd,
3052d722e3fbSopenharmony_ci				    &mc_address_cmd, &va_cmd);
3053d722e3fbSopenharmony_ci	CU_ASSERT_EQUAL(r, 0);
3054d722e3fbSopenharmony_ci	memset(ptr_cmd, 0, bo_cmd_size);
3055d722e3fbSopenharmony_ci
3056d722e3fbSopenharmony_ci	r = amdgpu_bo_alloc_and_map(device_handle, bo_shader_size, 4096,
3057d722e3fbSopenharmony_ci					AMDGPU_GEM_DOMAIN_VRAM, 0,
3058d722e3fbSopenharmony_ci					&bo_shader, &ptr_shader,
3059d722e3fbSopenharmony_ci					&mc_address_shader, &va_shader);
3060d722e3fbSopenharmony_ci	CU_ASSERT_EQUAL(r, 0);
3061d722e3fbSopenharmony_ci	memset(ptr_shader, 0, bo_shader_size);
3062d722e3fbSopenharmony_ci
3063d722e3fbSopenharmony_ci	r = amdgpu_dispatch_load_cs_shader_hang_slow(ptr_shader, gpu_info.family_id);
3064d722e3fbSopenharmony_ci	CU_ASSERT_EQUAL(r, 0);
3065d722e3fbSopenharmony_ci
3066d722e3fbSopenharmony_ci	r = amdgpu_bo_alloc_and_map(device_handle, bo_dst_size, 4096,
3067d722e3fbSopenharmony_ci					AMDGPU_GEM_DOMAIN_VRAM, 0,
3068d722e3fbSopenharmony_ci					&bo_src, (void **)&ptr_src,
3069d722e3fbSopenharmony_ci					&mc_address_src, &va_src);
3070d722e3fbSopenharmony_ci	CU_ASSERT_EQUAL(r, 0);
3071d722e3fbSopenharmony_ci
3072d722e3fbSopenharmony_ci	r = amdgpu_bo_alloc_and_map(device_handle, bo_dst_size, 4096,
3073d722e3fbSopenharmony_ci					AMDGPU_GEM_DOMAIN_VRAM, 0,
3074d722e3fbSopenharmony_ci					&bo_dst, (void **)&ptr_dst,
3075d722e3fbSopenharmony_ci					&mc_address_dst, &va_dst);
3076d722e3fbSopenharmony_ci	CU_ASSERT_EQUAL(r, 0);
3077d722e3fbSopenharmony_ci
3078d722e3fbSopenharmony_ci	memset(ptr_src, 0x55, bo_dst_size);
3079d722e3fbSopenharmony_ci
3080d722e3fbSopenharmony_ci	i = 0;
3081d722e3fbSopenharmony_ci	i += amdgpu_dispatch_init(ptr_cmd + i, ip_type, version);
3082d722e3fbSopenharmony_ci
3083d722e3fbSopenharmony_ci	/*  Issue commands to set cu mask used in current dispatch */
3084d722e3fbSopenharmony_ci	i += amdgpu_dispatch_write_cumask(ptr_cmd + i, version);
3085d722e3fbSopenharmony_ci
3086d722e3fbSopenharmony_ci	/* Writes shader state to HW */
3087d722e3fbSopenharmony_ci	i += amdgpu_dispatch_write2hw(ptr_cmd + i, mc_address_shader, version);
3088d722e3fbSopenharmony_ci
3089d722e3fbSopenharmony_ci	/* Write constant data */
3090d722e3fbSopenharmony_ci	/* Writes the texture resource constants data to the SGPRs */
3091d722e3fbSopenharmony_ci	ptr_cmd[i++] = PACKET3_COMPUTE(PKT3_SET_SH_REG, 4);
3092d722e3fbSopenharmony_ci	ptr_cmd[i++] = 0x240;
3093d722e3fbSopenharmony_ci	ptr_cmd[i++] = mc_address_src;
3094d722e3fbSopenharmony_ci	ptr_cmd[i++] = (mc_address_src >> 32) | 0x100000;
3095d722e3fbSopenharmony_ci	ptr_cmd[i++] = 0x400000;
3096d722e3fbSopenharmony_ci	if (version == 9)
3097d722e3fbSopenharmony_ci		ptr_cmd[i++] = 0x74fac;
3098d722e3fbSopenharmony_ci	else if (version == 10)
3099d722e3fbSopenharmony_ci		ptr_cmd[i++] = 0x1104bfac;
3100d722e3fbSopenharmony_ci
3101d722e3fbSopenharmony_ci	/* Writes the UAV constant data to the SGPRs. */
3102d722e3fbSopenharmony_ci	ptr_cmd[i++] = PACKET3_COMPUTE(PKT3_SET_SH_REG, 4);
3103d722e3fbSopenharmony_ci	ptr_cmd[i++] = 0x244;
3104d722e3fbSopenharmony_ci	ptr_cmd[i++] = mc_address_dst;
3105d722e3fbSopenharmony_ci	ptr_cmd[i++] = (mc_address_dst >> 32) | 0x100000;
3106d722e3fbSopenharmony_ci	ptr_cmd[i++] = 0x400000;
3107d722e3fbSopenharmony_ci	if (version == 9)
3108d722e3fbSopenharmony_ci		ptr_cmd[i++] = 0x74fac;
3109d722e3fbSopenharmony_ci	else if (version == 10)
3110d722e3fbSopenharmony_ci		ptr_cmd[i++] = 0x1104bfac;
3111d722e3fbSopenharmony_ci
3112d722e3fbSopenharmony_ci	/* clear mmCOMPUTE_RESOURCE_LIMITS */
3113d722e3fbSopenharmony_ci	ptr_cmd[i++] = PACKET3_COMPUTE(PKT3_SET_SH_REG, 1);
3114d722e3fbSopenharmony_ci	ptr_cmd[i++] = 0x215;
3115d722e3fbSopenharmony_ci	ptr_cmd[i++] = 0;
3116d722e3fbSopenharmony_ci
3117d722e3fbSopenharmony_ci	/* dispatch direct command */
3118d722e3fbSopenharmony_ci	ptr_cmd[i++] = PACKET3_COMPUTE(PACKET3_DISPATCH_DIRECT, 3);
3119d722e3fbSopenharmony_ci	ptr_cmd[i++] = 0x10000;
3120d722e3fbSopenharmony_ci	ptr_cmd[i++] = 1;
3121d722e3fbSopenharmony_ci	ptr_cmd[i++] = 1;
3122d722e3fbSopenharmony_ci	ptr_cmd[i++] = 1;
3123d722e3fbSopenharmony_ci
3124d722e3fbSopenharmony_ci	while (i & 7)
3125d722e3fbSopenharmony_ci		ptr_cmd[i++] = 0xffff1000; /* type3 nop packet */
3126d722e3fbSopenharmony_ci
3127d722e3fbSopenharmony_ci	resources[0] = bo_shader;
3128d722e3fbSopenharmony_ci	resources[1] = bo_src;
3129d722e3fbSopenharmony_ci	resources[2] = bo_dst;
3130d722e3fbSopenharmony_ci	resources[3] = bo_cmd;
3131d722e3fbSopenharmony_ci	r = amdgpu_bo_list_create(device_handle, 4, resources, NULL, &bo_list);
3132d722e3fbSopenharmony_ci	CU_ASSERT_EQUAL(r, 0);
3133d722e3fbSopenharmony_ci
3134d722e3fbSopenharmony_ci	ib_info.ib_mc_address = mc_address_cmd;
3135d722e3fbSopenharmony_ci	ib_info.size = i;
3136d722e3fbSopenharmony_ci	ibs_request.ip_type = ip_type;
3137d722e3fbSopenharmony_ci	ibs_request.ring = ring;
3138d722e3fbSopenharmony_ci	ibs_request.resources = bo_list;
3139d722e3fbSopenharmony_ci	ibs_request.number_of_ibs = 1;
3140d722e3fbSopenharmony_ci	ibs_request.ibs = &ib_info;
3141d722e3fbSopenharmony_ci	ibs_request.fence_info.handle = NULL;
3142d722e3fbSopenharmony_ci	r = amdgpu_cs_submit(context_handle, 0, &ibs_request, 1);
3143d722e3fbSopenharmony_ci	CU_ASSERT_EQUAL(r, 0);
3144d722e3fbSopenharmony_ci
3145d722e3fbSopenharmony_ci	fence_status.ip_type = ip_type;
3146d722e3fbSopenharmony_ci	fence_status.ip_instance = 0;
3147d722e3fbSopenharmony_ci	fence_status.ring = ring;
3148d722e3fbSopenharmony_ci	fence_status.context = context_handle;
3149d722e3fbSopenharmony_ci	fence_status.fence = ibs_request.seq_no;
3150d722e3fbSopenharmony_ci
3151d722e3fbSopenharmony_ci	/* wait for IB accomplished */
3152d722e3fbSopenharmony_ci	r = amdgpu_cs_query_fence_status(&fence_status,
3153d722e3fbSopenharmony_ci					 AMDGPU_TIMEOUT_INFINITE,
3154d722e3fbSopenharmony_ci					 0, &expired);
3155d722e3fbSopenharmony_ci
3156d722e3fbSopenharmony_ci	r = amdgpu_cs_query_reset_state(context_handle, &hang_state, &hangs);
3157d722e3fbSopenharmony_ci	CU_ASSERT_EQUAL(r, 0);
3158d722e3fbSopenharmony_ci	CU_ASSERT_EQUAL(hang_state, AMDGPU_CTX_UNKNOWN_RESET);
3159d722e3fbSopenharmony_ci
3160d722e3fbSopenharmony_ci	r = amdgpu_bo_list_destroy(bo_list);
3161d722e3fbSopenharmony_ci	CU_ASSERT_EQUAL(r, 0);
3162d722e3fbSopenharmony_ci
3163d722e3fbSopenharmony_ci	r = amdgpu_bo_unmap_and_free(bo_src, va_src, mc_address_src, bo_dst_size);
3164d722e3fbSopenharmony_ci	CU_ASSERT_EQUAL(r, 0);
3165d722e3fbSopenharmony_ci	r = amdgpu_bo_unmap_and_free(bo_dst, va_dst, mc_address_dst, bo_dst_size);
3166d722e3fbSopenharmony_ci	CU_ASSERT_EQUAL(r, 0);
3167d722e3fbSopenharmony_ci
3168d722e3fbSopenharmony_ci	r = amdgpu_bo_unmap_and_free(bo_cmd, va_cmd, mc_address_cmd, bo_cmd_size);
3169d722e3fbSopenharmony_ci	CU_ASSERT_EQUAL(r, 0);
3170d722e3fbSopenharmony_ci
3171d722e3fbSopenharmony_ci	r = amdgpu_bo_unmap_and_free(bo_shader, va_shader, mc_address_shader, bo_shader_size);
3172d722e3fbSopenharmony_ci	CU_ASSERT_EQUAL(r, 0);
3173d722e3fbSopenharmony_ci
3174d722e3fbSopenharmony_ci	r = amdgpu_cs_ctx_free(context_handle);
3175d722e3fbSopenharmony_ci	CU_ASSERT_EQUAL(r, 0);
3176d722e3fbSopenharmony_ci}
3177d722e3fbSopenharmony_ci
3178d722e3fbSopenharmony_civoid amdgpu_dispatch_hang_slow_helper(amdgpu_device_handle device_handle, uint32_t ip_type)
3179d722e3fbSopenharmony_ci{
3180d722e3fbSopenharmony_ci	int r;
3181d722e3fbSopenharmony_ci	struct drm_amdgpu_info_hw_ip info;
3182d722e3fbSopenharmony_ci	uint32_t ring_id, version;
3183d722e3fbSopenharmony_ci
3184d722e3fbSopenharmony_ci	r = amdgpu_query_hw_ip_info(device_handle, ip_type, 0, &info);
3185d722e3fbSopenharmony_ci	CU_ASSERT_EQUAL(r, 0);
3186d722e3fbSopenharmony_ci	if (!info.available_rings)
3187d722e3fbSopenharmony_ci		printf("SKIP ... as there's no ring for ip %d\n", ip_type);
3188d722e3fbSopenharmony_ci
3189d722e3fbSopenharmony_ci	version = info.hw_ip_version_major;
3190d722e3fbSopenharmony_ci	if (version != 9 && version != 10) {
3191d722e3fbSopenharmony_ci		printf("SKIP ... unsupported gfx version %d\n", version);
3192d722e3fbSopenharmony_ci		return;
3193d722e3fbSopenharmony_ci	}
3194d722e3fbSopenharmony_ci
3195d722e3fbSopenharmony_ci	for (ring_id = 0; (1 << ring_id) & info.available_rings; ring_id++) {
3196d722e3fbSopenharmony_ci		amdgpu_memcpy_dispatch_test(device_handle, ip_type, ring_id, version, 0);
3197d722e3fbSopenharmony_ci		amdgpu_memcpy_dispatch_hang_slow_test(device_handle, ip_type, ring_id, version);
3198d722e3fbSopenharmony_ci		amdgpu_memcpy_dispatch_test(device_handle, ip_type, ring_id, version, 0);
3199d722e3fbSopenharmony_ci	}
3200d722e3fbSopenharmony_ci}
3201d722e3fbSopenharmony_ci
3202d722e3fbSopenharmony_cistatic int amdgpu_draw_load_ps_shader_hang_slow(uint32_t *ptr, int family)
3203d722e3fbSopenharmony_ci{
3204d722e3fbSopenharmony_ci	struct amdgpu_test_shader *shader;
3205d722e3fbSopenharmony_ci	int i, loop = 0x40000;
3206d722e3fbSopenharmony_ci
3207d722e3fbSopenharmony_ci	switch (family) {
3208d722e3fbSopenharmony_ci		case AMDGPU_FAMILY_AI:
3209d722e3fbSopenharmony_ci		case AMDGPU_FAMILY_RV:
3210d722e3fbSopenharmony_ci			shader = &memcpy_ps_hang_slow_ai;
3211d722e3fbSopenharmony_ci			break;
3212d722e3fbSopenharmony_ci		default:
3213d722e3fbSopenharmony_ci			return -1;
3214d722e3fbSopenharmony_ci			break;
3215d722e3fbSopenharmony_ci	}
3216d722e3fbSopenharmony_ci
3217d722e3fbSopenharmony_ci	memcpy(ptr, shader->shader, shader->header_length * sizeof(uint32_t));
3218d722e3fbSopenharmony_ci
3219d722e3fbSopenharmony_ci	for (i = 0; i < loop; i++)
3220d722e3fbSopenharmony_ci		memcpy(ptr + shader->header_length + shader->body_length * i,
3221d722e3fbSopenharmony_ci			shader->shader + shader->header_length,
3222d722e3fbSopenharmony_ci			shader->body_length * sizeof(uint32_t));
3223d722e3fbSopenharmony_ci
3224d722e3fbSopenharmony_ci	memcpy(ptr + shader->header_length + shader->body_length * loop,
3225d722e3fbSopenharmony_ci		shader->shader + shader->header_length + shader->body_length,
3226d722e3fbSopenharmony_ci		shader->foot_length * sizeof(uint32_t));
3227d722e3fbSopenharmony_ci
3228d722e3fbSopenharmony_ci	return 0;
3229d722e3fbSopenharmony_ci}
3230d722e3fbSopenharmony_ci
3231d722e3fbSopenharmony_cistatic int amdgpu_draw_load_ps_shader(uint8_t *ptr, int ps_type, uint32_t version)
3232d722e3fbSopenharmony_ci{
3233d722e3fbSopenharmony_ci	int i;
3234d722e3fbSopenharmony_ci	uint32_t shader_offset= 256;
3235d722e3fbSopenharmony_ci	uint32_t mem_offset, patch_code_offset;
3236d722e3fbSopenharmony_ci	uint32_t shader_size, patchinfo_code_size;
3237d722e3fbSopenharmony_ci	const uint32_t *shader;
3238d722e3fbSopenharmony_ci	const uint32_t *patchinfo_code;
3239d722e3fbSopenharmony_ci	const uint32_t *patchcode_offset;
3240d722e3fbSopenharmony_ci
3241d722e3fbSopenharmony_ci	switch (ps_type) {
3242d722e3fbSopenharmony_ci		case PS_CONST:
3243d722e3fbSopenharmony_ci			if (version == 9) {
3244d722e3fbSopenharmony_ci				shader = ps_const_shader_gfx9;
3245d722e3fbSopenharmony_ci				shader_size = sizeof(ps_const_shader_gfx9);
3246d722e3fbSopenharmony_ci				patchinfo_code = (const uint32_t *)ps_const_shader_patchinfo_code_gfx9;
3247d722e3fbSopenharmony_ci				patchinfo_code_size = ps_const_shader_patchinfo_code_size_gfx9;
3248d722e3fbSopenharmony_ci				patchcode_offset = ps_const_shader_patchinfo_offset_gfx9;
3249d722e3fbSopenharmony_ci			} else if (version == 10){
3250d722e3fbSopenharmony_ci				shader = ps_const_shader_gfx10;
3251d722e3fbSopenharmony_ci				shader_size = sizeof(ps_const_shader_gfx10);
3252d722e3fbSopenharmony_ci				patchinfo_code = (const uint32_t *)ps_const_shader_patchinfo_code_gfx10;
3253d722e3fbSopenharmony_ci				patchinfo_code_size = ps_const_shader_patchinfo_code_size_gfx10;
3254d722e3fbSopenharmony_ci				patchcode_offset = ps_const_shader_patchinfo_offset_gfx10;
3255d722e3fbSopenharmony_ci			}
3256d722e3fbSopenharmony_ci			break;
3257d722e3fbSopenharmony_ci		case PS_TEX:
3258d722e3fbSopenharmony_ci			if (version == 9) {
3259d722e3fbSopenharmony_ci				shader = ps_tex_shader_gfx9;
3260d722e3fbSopenharmony_ci				shader_size = sizeof(ps_tex_shader_gfx9);
3261d722e3fbSopenharmony_ci				patchinfo_code = (const uint32_t *)ps_tex_shader_patchinfo_code_gfx9;
3262d722e3fbSopenharmony_ci				patchinfo_code_size = ps_tex_shader_patchinfo_code_size_gfx9;
3263d722e3fbSopenharmony_ci				patchcode_offset = ps_tex_shader_patchinfo_offset_gfx9;
3264d722e3fbSopenharmony_ci			} else if (version == 10) {
3265d722e3fbSopenharmony_ci				shader = ps_tex_shader_gfx10;
3266d722e3fbSopenharmony_ci				shader_size = sizeof(ps_tex_shader_gfx10);
3267d722e3fbSopenharmony_ci				patchinfo_code = (const uint32_t *)ps_tex_shader_patchinfo_code_gfx10;
3268d722e3fbSopenharmony_ci				patchinfo_code_size = ps_tex_shader_patchinfo_code_size_gfx10;
3269d722e3fbSopenharmony_ci				patchcode_offset = ps_tex_shader_patchinfo_offset_gfx10;
3270d722e3fbSopenharmony_ci			}
3271d722e3fbSopenharmony_ci			break;
3272d722e3fbSopenharmony_ci		case PS_HANG:
3273d722e3fbSopenharmony_ci			shader = memcpy_ps_hang;
3274d722e3fbSopenharmony_ci			shader_size = sizeof(memcpy_ps_hang);
3275d722e3fbSopenharmony_ci
3276d722e3fbSopenharmony_ci			memcpy(ptr, shader, shader_size);
3277d722e3fbSopenharmony_ci			return 0;
3278d722e3fbSopenharmony_ci		default:
3279d722e3fbSopenharmony_ci			return -1;
3280d722e3fbSopenharmony_ci			break;
3281d722e3fbSopenharmony_ci	}
3282d722e3fbSopenharmony_ci
3283d722e3fbSopenharmony_ci	/* write main shader program */
3284d722e3fbSopenharmony_ci	for (i = 0 ; i < 10; i++) {
3285d722e3fbSopenharmony_ci		mem_offset = i * shader_offset;
3286d722e3fbSopenharmony_ci		memcpy(ptr + mem_offset, shader, shader_size);
3287d722e3fbSopenharmony_ci	}
3288d722e3fbSopenharmony_ci
3289d722e3fbSopenharmony_ci	/* overwrite patch codes */
3290d722e3fbSopenharmony_ci	for (i = 0 ; i < 10; i++) {
3291d722e3fbSopenharmony_ci		mem_offset = i * shader_offset + patchcode_offset[0] * sizeof(uint32_t);
3292d722e3fbSopenharmony_ci		patch_code_offset = i * patchinfo_code_size;
3293d722e3fbSopenharmony_ci		memcpy(ptr + mem_offset,
3294d722e3fbSopenharmony_ci			patchinfo_code + patch_code_offset,
3295d722e3fbSopenharmony_ci			patchinfo_code_size * sizeof(uint32_t));
3296d722e3fbSopenharmony_ci	}
3297d722e3fbSopenharmony_ci
3298d722e3fbSopenharmony_ci	return 0;
3299d722e3fbSopenharmony_ci}
3300d722e3fbSopenharmony_ci
3301d722e3fbSopenharmony_ci/* load RectPosTexFast_VS */
3302d722e3fbSopenharmony_cistatic int amdgpu_draw_load_vs_shader(uint8_t *ptr, uint32_t version)
3303d722e3fbSopenharmony_ci{
3304d722e3fbSopenharmony_ci	const uint32_t *shader;
3305d722e3fbSopenharmony_ci	uint32_t shader_size;
3306d722e3fbSopenharmony_ci
3307d722e3fbSopenharmony_ci	if (version == 9) {
3308d722e3fbSopenharmony_ci		shader = vs_RectPosTexFast_shader_gfx9;
3309d722e3fbSopenharmony_ci		shader_size = sizeof(vs_RectPosTexFast_shader_gfx9);
3310d722e3fbSopenharmony_ci	} else if (version == 10) {
3311d722e3fbSopenharmony_ci		shader = vs_RectPosTexFast_shader_gfx10;
3312d722e3fbSopenharmony_ci		shader_size = sizeof(vs_RectPosTexFast_shader_gfx10);
3313d722e3fbSopenharmony_ci	}
3314d722e3fbSopenharmony_ci
3315d722e3fbSopenharmony_ci	memcpy(ptr, shader, shader_size);
3316d722e3fbSopenharmony_ci
3317d722e3fbSopenharmony_ci	return 0;
3318d722e3fbSopenharmony_ci}
3319d722e3fbSopenharmony_ci
3320d722e3fbSopenharmony_cistatic int amdgpu_draw_init(uint32_t *ptr, uint32_t version)
3321d722e3fbSopenharmony_ci{
3322d722e3fbSopenharmony_ci	int i = 0;
3323d722e3fbSopenharmony_ci	const uint32_t *preamblecache_ptr;
3324d722e3fbSopenharmony_ci	uint32_t preamblecache_size;
3325d722e3fbSopenharmony_ci
3326d722e3fbSopenharmony_ci	/* Write context control and load shadowing register if necessary */
3327d722e3fbSopenharmony_ci	ptr[i++] = PACKET3(PKT3_CONTEXT_CONTROL, 1);
3328d722e3fbSopenharmony_ci	ptr[i++] = 0x80000000;
3329d722e3fbSopenharmony_ci	ptr[i++] = 0x80000000;
3330d722e3fbSopenharmony_ci
3331d722e3fbSopenharmony_ci	if (version == 9) {
3332d722e3fbSopenharmony_ci		preamblecache_ptr = preamblecache_gfx9;
3333d722e3fbSopenharmony_ci		preamblecache_size = sizeof(preamblecache_gfx9);
3334d722e3fbSopenharmony_ci	} else if (version == 10) {
3335d722e3fbSopenharmony_ci		preamblecache_ptr = preamblecache_gfx10;
3336d722e3fbSopenharmony_ci		preamblecache_size = sizeof(preamblecache_gfx10);
3337d722e3fbSopenharmony_ci	}
3338d722e3fbSopenharmony_ci
3339d722e3fbSopenharmony_ci	memcpy(ptr + i, preamblecache_ptr, preamblecache_size);
3340d722e3fbSopenharmony_ci	return i + preamblecache_size/sizeof(uint32_t);
3341d722e3fbSopenharmony_ci}
3342d722e3fbSopenharmony_ci
3343d722e3fbSopenharmony_cistatic int amdgpu_draw_setup_and_write_drawblt_surf_info(uint32_t *ptr,
3344d722e3fbSopenharmony_ci							 uint64_t dst_addr,
3345d722e3fbSopenharmony_ci							 uint32_t version,
3346d722e3fbSopenharmony_ci							 int hang_slow)
3347d722e3fbSopenharmony_ci{
3348d722e3fbSopenharmony_ci	int i = 0;
3349d722e3fbSopenharmony_ci
3350d722e3fbSopenharmony_ci	/* setup color buffer */
3351d722e3fbSopenharmony_ci	if (version == 9) {
3352d722e3fbSopenharmony_ci		/* offset   reg
3353d722e3fbSopenharmony_ci		   0xA318   CB_COLOR0_BASE
3354d722e3fbSopenharmony_ci		   0xA319   CB_COLOR0_BASE_EXT
3355d722e3fbSopenharmony_ci		   0xA31A   CB_COLOR0_ATTRIB2
3356d722e3fbSopenharmony_ci		   0xA31B   CB_COLOR0_VIEW
3357d722e3fbSopenharmony_ci		   0xA31C   CB_COLOR0_INFO
3358d722e3fbSopenharmony_ci		   0xA31D   CB_COLOR0_ATTRIB
3359d722e3fbSopenharmony_ci		   0xA31E   CB_COLOR0_DCC_CONTROL
3360d722e3fbSopenharmony_ci		   0xA31F   CB_COLOR0_CMASK
3361d722e3fbSopenharmony_ci		   0xA320   CB_COLOR0_CMASK_BASE_EXT
3362d722e3fbSopenharmony_ci		   0xA321   CB_COLOR0_FMASK
3363d722e3fbSopenharmony_ci		   0xA322   CB_COLOR0_FMASK_BASE_EXT
3364d722e3fbSopenharmony_ci		   0xA323   CB_COLOR0_CLEAR_WORD0
3365d722e3fbSopenharmony_ci		   0xA324   CB_COLOR0_CLEAR_WORD1
3366d722e3fbSopenharmony_ci		   0xA325   CB_COLOR0_DCC_BASE
3367d722e3fbSopenharmony_ci		   0xA326   CB_COLOR0_DCC_BASE_EXT */
3368d722e3fbSopenharmony_ci		ptr[i++] = PACKET3(PACKET3_SET_CONTEXT_REG, 15);
3369d722e3fbSopenharmony_ci		ptr[i++] = 0x318;
3370d722e3fbSopenharmony_ci		ptr[i++] = dst_addr >> 8;
3371d722e3fbSopenharmony_ci		ptr[i++] = dst_addr >> 40;
3372d722e3fbSopenharmony_ci		ptr[i++] = hang_slow ? 0x3ffc7ff : 0x7c01f;
3373d722e3fbSopenharmony_ci		ptr[i++] = 0;
3374d722e3fbSopenharmony_ci		ptr[i++] = 0x50438;
3375d722e3fbSopenharmony_ci		ptr[i++] = 0x10140000;
3376d722e3fbSopenharmony_ci		i += 9;
3377d722e3fbSopenharmony_ci
3378d722e3fbSopenharmony_ci		/* mmCB_MRT0_EPITCH */
3379d722e3fbSopenharmony_ci		ptr[i++] = PACKET3(PACKET3_SET_CONTEXT_REG, 1);
3380d722e3fbSopenharmony_ci		ptr[i++] = 0x1e8;
3381d722e3fbSopenharmony_ci		ptr[i++] = hang_slow ? 0xfff : 0x1f;
3382d722e3fbSopenharmony_ci	} else if (version == 10) {
3383d722e3fbSopenharmony_ci		/* 0xA318   CB_COLOR0_BASE
3384d722e3fbSopenharmony_ci		   0xA319   CB_COLOR0_PITCH
3385d722e3fbSopenharmony_ci		   0xA31A   CB_COLOR0_SLICE
3386d722e3fbSopenharmony_ci		   0xA31B   CB_COLOR0_VIEW
3387d722e3fbSopenharmony_ci		   0xA31C   CB_COLOR0_INFO
3388d722e3fbSopenharmony_ci		   0xA31D   CB_COLOR0_ATTRIB
3389d722e3fbSopenharmony_ci		   0xA31E   CB_COLOR0_DCC_CONTROL
3390d722e3fbSopenharmony_ci		   0xA31F   CB_COLOR0_CMASK
3391d722e3fbSopenharmony_ci		   0xA320   CB_COLOR0_CMASK_SLICE
3392d722e3fbSopenharmony_ci		   0xA321   CB_COLOR0_FMASK
3393d722e3fbSopenharmony_ci		   0xA322   CB_COLOR0_FMASK_SLICE
3394d722e3fbSopenharmony_ci		   0xA323   CB_COLOR0_CLEAR_WORD0
3395d722e3fbSopenharmony_ci		   0xA324   CB_COLOR0_CLEAR_WORD1
3396d722e3fbSopenharmony_ci		   0xA325   CB_COLOR0_DCC_BASE */
3397d722e3fbSopenharmony_ci		ptr[i++] = PACKET3(PACKET3_SET_CONTEXT_REG, 14);
3398d722e3fbSopenharmony_ci		ptr[i++] = 0x318;
3399d722e3fbSopenharmony_ci		ptr[i++] = dst_addr >> 8;
3400d722e3fbSopenharmony_ci		i += 3;
3401d722e3fbSopenharmony_ci		ptr[i++] = 0x50438;
3402d722e3fbSopenharmony_ci		i += 9;
3403d722e3fbSopenharmony_ci
3404d722e3fbSopenharmony_ci		/* 0xA390   CB_COLOR0_BASE_EXT */
3405d722e3fbSopenharmony_ci		ptr[i++] = PACKET3(PACKET3_SET_CONTEXT_REG, 1);
3406d722e3fbSopenharmony_ci		ptr[i++] = 0x390;
3407d722e3fbSopenharmony_ci		ptr[i++] = dst_addr >> 40;
3408d722e3fbSopenharmony_ci
3409d722e3fbSopenharmony_ci		/* 0xA398   CB_COLOR0_CMASK_BASE_EXT */
3410d722e3fbSopenharmony_ci		ptr[i++] = PACKET3(PACKET3_SET_CONTEXT_REG, 1);
3411d722e3fbSopenharmony_ci		ptr[i++] = 0x398;
3412d722e3fbSopenharmony_ci		ptr[i++] = 0;
3413d722e3fbSopenharmony_ci
3414d722e3fbSopenharmony_ci		/* 0xA3A0   CB_COLOR0_FMASK_BASE_EXT */
3415d722e3fbSopenharmony_ci		ptr[i++] = PACKET3(PACKET3_SET_CONTEXT_REG, 1);
3416d722e3fbSopenharmony_ci		ptr[i++] = 0x3a0;
3417d722e3fbSopenharmony_ci		ptr[i++] = 0;
3418d722e3fbSopenharmony_ci
3419d722e3fbSopenharmony_ci		/* 0xA3A8   CB_COLOR0_DCC_BASE_EXT */
3420d722e3fbSopenharmony_ci		ptr[i++] = PACKET3(PACKET3_SET_CONTEXT_REG, 1);
3421d722e3fbSopenharmony_ci		ptr[i++] = 0x3a8;
3422d722e3fbSopenharmony_ci		ptr[i++] = 0;
3423d722e3fbSopenharmony_ci
3424d722e3fbSopenharmony_ci		/* 0xA3B0   CB_COLOR0_ATTRIB2 */
3425d722e3fbSopenharmony_ci		ptr[i++] = PACKET3(PACKET3_SET_CONTEXT_REG, 1);
3426d722e3fbSopenharmony_ci		ptr[i++] = 0x3b0;
3427d722e3fbSopenharmony_ci		ptr[i++] = hang_slow ? 0x3ffc7ff : 0x7c01f;
3428d722e3fbSopenharmony_ci
3429d722e3fbSopenharmony_ci		/* 0xA3B8   CB_COLOR0_ATTRIB3 */
3430d722e3fbSopenharmony_ci		ptr[i++] = PACKET3(PACKET3_SET_CONTEXT_REG, 1);
3431d722e3fbSopenharmony_ci		ptr[i++] = 0x3b8;
3432d722e3fbSopenharmony_ci		ptr[i++] = 0x9014000;
3433d722e3fbSopenharmony_ci	}
3434d722e3fbSopenharmony_ci
3435d722e3fbSopenharmony_ci	/* 0xA32B   CB_COLOR1_BASE */
3436d722e3fbSopenharmony_ci	ptr[i++] = PACKET3(PACKET3_SET_CONTEXT_REG, 1);
3437d722e3fbSopenharmony_ci	ptr[i++] = 0x32b;
3438d722e3fbSopenharmony_ci	ptr[i++] = 0;
3439d722e3fbSopenharmony_ci
3440d722e3fbSopenharmony_ci	/* 0xA33A   CB_COLOR1_BASE */
3441d722e3fbSopenharmony_ci	ptr[i++] = PACKET3(PACKET3_SET_CONTEXT_REG, 1);
3442d722e3fbSopenharmony_ci	ptr[i++] = 0x33a;
3443d722e3fbSopenharmony_ci	ptr[i++] = 0;
3444d722e3fbSopenharmony_ci
3445d722e3fbSopenharmony_ci	/* SPI_SHADER_COL_FORMAT */
3446d722e3fbSopenharmony_ci	ptr[i++] = PACKET3(PACKET3_SET_CONTEXT_REG, 1);
3447d722e3fbSopenharmony_ci	ptr[i++] = 0x1c5;
3448d722e3fbSopenharmony_ci	ptr[i++] = 9;
3449d722e3fbSopenharmony_ci
3450d722e3fbSopenharmony_ci	/* Setup depth buffer */
3451d722e3fbSopenharmony_ci	if (version == 9) {
3452d722e3fbSopenharmony_ci		/* mmDB_Z_INFO */
3453d722e3fbSopenharmony_ci		ptr[i++] = PACKET3(PACKET3_SET_CONTEXT_REG, 2);
3454d722e3fbSopenharmony_ci		ptr[i++] = 0xe;
3455d722e3fbSopenharmony_ci		i += 2;
3456d722e3fbSopenharmony_ci	} else if (version == 10) {
3457d722e3fbSopenharmony_ci		/* mmDB_Z_INFO */
3458d722e3fbSopenharmony_ci		ptr[i++] = PACKET3(PACKET3_SET_CONTEXT_REG, 2);
3459d722e3fbSopenharmony_ci		ptr[i++] = 0x10;
3460d722e3fbSopenharmony_ci		i += 2;
3461d722e3fbSopenharmony_ci	}
3462d722e3fbSopenharmony_ci
3463d722e3fbSopenharmony_ci	return i;
3464d722e3fbSopenharmony_ci}
3465d722e3fbSopenharmony_ci
3466d722e3fbSopenharmony_cistatic int amdgpu_draw_setup_and_write_drawblt_state(uint32_t *ptr,
3467d722e3fbSopenharmony_ci						     uint32_t version,
3468d722e3fbSopenharmony_ci						     int hang_slow)
3469d722e3fbSopenharmony_ci{
3470d722e3fbSopenharmony_ci	int i = 0;
3471d722e3fbSopenharmony_ci	const uint32_t *cached_cmd_ptr;
3472d722e3fbSopenharmony_ci	uint32_t cached_cmd_size;
3473d722e3fbSopenharmony_ci
3474d722e3fbSopenharmony_ci	/* mmPA_SC_TILE_STEERING_OVERRIDE */
3475d722e3fbSopenharmony_ci	ptr[i++] = PACKET3(PACKET3_SET_CONTEXT_REG, 1);
3476d722e3fbSopenharmony_ci	ptr[i++] = 0xd7;
3477d722e3fbSopenharmony_ci	ptr[i++] = 0;
3478d722e3fbSopenharmony_ci
3479d722e3fbSopenharmony_ci	ptr[i++] = 0xffff1000;
3480d722e3fbSopenharmony_ci	ptr[i++] = 0xc0021000;
3481d722e3fbSopenharmony_ci
3482d722e3fbSopenharmony_ci	ptr[i++] = PACKET3(PACKET3_SET_CONTEXT_REG, 1);
3483d722e3fbSopenharmony_ci	ptr[i++] = 0xd7;
3484d722e3fbSopenharmony_ci	if (version == 9)
3485d722e3fbSopenharmony_ci		ptr[i++] = 1;
3486d722e3fbSopenharmony_ci	else if (version == 10)
3487d722e3fbSopenharmony_ci		ptr[i++] = 0;
3488d722e3fbSopenharmony_ci
3489d722e3fbSopenharmony_ci	/* mmPA_SC_AA_SAMPLE_LOCS_PIXEL_X0Y0_0 */
3490d722e3fbSopenharmony_ci	ptr[i++] = PACKET3(PACKET3_SET_CONTEXT_REG, 16);
3491d722e3fbSopenharmony_ci	ptr[i++] = 0x2fe;
3492d722e3fbSopenharmony_ci	i += 16;
3493d722e3fbSopenharmony_ci
3494d722e3fbSopenharmony_ci	/* mmPA_SC_CENTROID_PRIORITY_0 */
3495d722e3fbSopenharmony_ci	ptr[i++] = PACKET3(PACKET3_SET_CONTEXT_REG, 2);
3496d722e3fbSopenharmony_ci	ptr[i++] = 0x2f5;
3497d722e3fbSopenharmony_ci	i += 2;
3498d722e3fbSopenharmony_ci
3499d722e3fbSopenharmony_ci	if (version == 9) {
3500d722e3fbSopenharmony_ci		cached_cmd_ptr = cached_cmd_gfx9;
3501d722e3fbSopenharmony_ci		cached_cmd_size = sizeof(cached_cmd_gfx9);
3502d722e3fbSopenharmony_ci	} else if (version == 10) {
3503d722e3fbSopenharmony_ci		cached_cmd_ptr = cached_cmd_gfx10;
3504d722e3fbSopenharmony_ci		cached_cmd_size = sizeof(cached_cmd_gfx10);
3505d722e3fbSopenharmony_ci	}
3506d722e3fbSopenharmony_ci
3507d722e3fbSopenharmony_ci	memcpy(ptr + i, cached_cmd_ptr, cached_cmd_size);
3508d722e3fbSopenharmony_ci	if (hang_slow)
3509d722e3fbSopenharmony_ci		*(ptr + i + 12) = 0x8000800;
3510d722e3fbSopenharmony_ci	i += cached_cmd_size/sizeof(uint32_t);
3511d722e3fbSopenharmony_ci
3512d722e3fbSopenharmony_ci	if (version == 10) {
3513d722e3fbSopenharmony_ci		/* mmCB_RMI_GL2_CACHE_CONTROL */
3514d722e3fbSopenharmony_ci		ptr[i++] = PACKET3(PACKET3_SET_CONTEXT_REG, 1);
3515d722e3fbSopenharmony_ci		ptr[i++] = 0x104;
3516d722e3fbSopenharmony_ci		ptr[i++] = 0x40aa0055;
3517d722e3fbSopenharmony_ci		/* mmDB_RMI_L2_CACHE_CONTROL */
3518d722e3fbSopenharmony_ci		ptr[i++] = PACKET3(PACKET3_SET_CONTEXT_REG, 1);
3519d722e3fbSopenharmony_ci		ptr[i++] = 0x1f;
3520d722e3fbSopenharmony_ci		ptr[i++] = 0x2a0055;
3521d722e3fbSopenharmony_ci	}
3522d722e3fbSopenharmony_ci
3523d722e3fbSopenharmony_ci	return i;
3524d722e3fbSopenharmony_ci}
3525d722e3fbSopenharmony_ci
3526d722e3fbSopenharmony_cistatic int amdgpu_draw_vs_RectPosTexFast_write2hw(uint32_t *ptr,
3527d722e3fbSopenharmony_ci						  int ps_type,
3528d722e3fbSopenharmony_ci						  uint64_t shader_addr,
3529d722e3fbSopenharmony_ci						  uint32_t version,
3530d722e3fbSopenharmony_ci						  int hang_slow)
3531d722e3fbSopenharmony_ci{
3532d722e3fbSopenharmony_ci	int i = 0;
3533d722e3fbSopenharmony_ci
3534d722e3fbSopenharmony_ci	/* mmPA_CL_VS_OUT_CNTL */
3535d722e3fbSopenharmony_ci	ptr[i++] = PACKET3(PACKET3_SET_CONTEXT_REG, 1);
3536d722e3fbSopenharmony_ci	ptr[i++] = 0x207;
3537d722e3fbSopenharmony_ci	ptr[i++] = 0;
3538d722e3fbSopenharmony_ci
3539d722e3fbSopenharmony_ci	if (version == 9) {
3540d722e3fbSopenharmony_ci		/* mmSPI_SHADER_PGM_RSRC3_VS */
3541d722e3fbSopenharmony_ci		ptr[i++] = PACKET3(PKT3_SET_SH_REG, 1);
3542d722e3fbSopenharmony_ci		ptr[i++] = 0x46;
3543d722e3fbSopenharmony_ci		ptr[i++] = 0xffff;
3544d722e3fbSopenharmony_ci	} else if (version == 10) {
3545d722e3fbSopenharmony_ci		/* mmSPI_SHADER_PGM_RSRC3_VS */
3546d722e3fbSopenharmony_ci		ptr[i++] = PACKET3(PKT3_SET_SH_REG_INDEX, 1);
3547d722e3fbSopenharmony_ci		ptr[i++] = 0x30000046;
3548d722e3fbSopenharmony_ci		ptr[i++] = 0xffff;
3549d722e3fbSopenharmony_ci		/* mmSPI_SHADER_PGM_RSRC4_VS */
3550d722e3fbSopenharmony_ci		ptr[i++] = PACKET3(PKT3_SET_SH_REG_INDEX, 1);
3551d722e3fbSopenharmony_ci		ptr[i++] = 0x30000041;
3552d722e3fbSopenharmony_ci		ptr[i++] = 0xffff;
3553d722e3fbSopenharmony_ci	}
3554d722e3fbSopenharmony_ci
3555d722e3fbSopenharmony_ci	/* mmSPI_SHADER_PGM_LO_VS...mmSPI_SHADER_PGM_HI_VS */
3556d722e3fbSopenharmony_ci	ptr[i++] = PACKET3(PKT3_SET_SH_REG, 2);
3557d722e3fbSopenharmony_ci	ptr[i++] = 0x48;
3558d722e3fbSopenharmony_ci	ptr[i++] = shader_addr >> 8;
3559d722e3fbSopenharmony_ci	ptr[i++] = shader_addr >> 40;
3560d722e3fbSopenharmony_ci
3561d722e3fbSopenharmony_ci	/* mmSPI_SHADER_PGM_RSRC1_VS */
3562d722e3fbSopenharmony_ci	ptr[i++] = PACKET3(PKT3_SET_SH_REG, 1);
3563d722e3fbSopenharmony_ci	ptr[i++] = 0x4a;
3564d722e3fbSopenharmony_ci	if (version == 9)
3565d722e3fbSopenharmony_ci		ptr[i++] = 0xc0081;
3566d722e3fbSopenharmony_ci	else if (version == 10)
3567d722e3fbSopenharmony_ci		ptr[i++] = 0xc0041;
3568d722e3fbSopenharmony_ci	/* mmSPI_SHADER_PGM_RSRC2_VS */
3569d722e3fbSopenharmony_ci	ptr[i++] = PACKET3(PKT3_SET_SH_REG, 1);
3570d722e3fbSopenharmony_ci	ptr[i++] = 0x4b;
3571d722e3fbSopenharmony_ci	ptr[i++] = 0x18;
3572d722e3fbSopenharmony_ci
3573d722e3fbSopenharmony_ci	/* mmSPI_VS_OUT_CONFIG */
3574d722e3fbSopenharmony_ci	ptr[i++] = PACKET3(PACKET3_SET_CONTEXT_REG, 1);
3575d722e3fbSopenharmony_ci	ptr[i++] = 0x1b1;
3576d722e3fbSopenharmony_ci	ptr[i++] = 2;
3577d722e3fbSopenharmony_ci
3578d722e3fbSopenharmony_ci	/* mmSPI_SHADER_POS_FORMAT */
3579d722e3fbSopenharmony_ci	ptr[i++] = PACKET3(PACKET3_SET_CONTEXT_REG, 1);
3580d722e3fbSopenharmony_ci	ptr[i++] = 0x1c3;
3581d722e3fbSopenharmony_ci	ptr[i++] = 4;
3582d722e3fbSopenharmony_ci
3583d722e3fbSopenharmony_ci	ptr[i++] = PACKET3(PKT3_SET_SH_REG, 4);
3584d722e3fbSopenharmony_ci	ptr[i++] = 0x4c;
3585d722e3fbSopenharmony_ci	i += 2;
3586d722e3fbSopenharmony_ci	ptr[i++] = hang_slow ? 0x45000000 : 0x42000000;
3587d722e3fbSopenharmony_ci	ptr[i++] = hang_slow ? 0x45000000 : 0x42000000;
3588d722e3fbSopenharmony_ci
3589d722e3fbSopenharmony_ci	ptr[i++] = PACKET3(PKT3_SET_SH_REG, 4);
3590d722e3fbSopenharmony_ci	ptr[i++] = 0x50;
3591d722e3fbSopenharmony_ci	i += 2;
3592d722e3fbSopenharmony_ci	if (ps_type == PS_CONST) {
3593d722e3fbSopenharmony_ci		i += 2;
3594d722e3fbSopenharmony_ci	} else if (ps_type == PS_TEX) {
3595d722e3fbSopenharmony_ci		ptr[i++] = 0x3f800000;
3596d722e3fbSopenharmony_ci		ptr[i++] = 0x3f800000;
3597d722e3fbSopenharmony_ci	}
3598d722e3fbSopenharmony_ci
3599d722e3fbSopenharmony_ci	ptr[i++] = PACKET3(PKT3_SET_SH_REG, 4);
3600d722e3fbSopenharmony_ci	ptr[i++] = 0x54;
3601d722e3fbSopenharmony_ci	i += 4;
3602d722e3fbSopenharmony_ci
3603d722e3fbSopenharmony_ci	return i;
3604d722e3fbSopenharmony_ci}
3605d722e3fbSopenharmony_ci
3606d722e3fbSopenharmony_cistatic int amdgpu_draw_ps_write2hw(uint32_t *ptr,
3607d722e3fbSopenharmony_ci				   int ps_type,
3608d722e3fbSopenharmony_ci				   uint64_t shader_addr,
3609d722e3fbSopenharmony_ci				   uint32_t version)
3610d722e3fbSopenharmony_ci{
3611d722e3fbSopenharmony_ci	int i, j;
3612d722e3fbSopenharmony_ci	const uint32_t *sh_registers;
3613d722e3fbSopenharmony_ci	const uint32_t *context_registers;
3614d722e3fbSopenharmony_ci	uint32_t num_sh_reg, num_context_reg;
3615d722e3fbSopenharmony_ci
3616d722e3fbSopenharmony_ci	if (ps_type == PS_CONST) {
3617d722e3fbSopenharmony_ci		if (version == 9) {
3618d722e3fbSopenharmony_ci			sh_registers = (const uint32_t *)ps_const_sh_registers_gfx9;
3619d722e3fbSopenharmony_ci			num_sh_reg = ps_num_sh_registers_gfx9;
3620d722e3fbSopenharmony_ci		} else if (version == 10) {
3621d722e3fbSopenharmony_ci			sh_registers = (const uint32_t *)ps_const_sh_registers_gfx10;
3622d722e3fbSopenharmony_ci			num_sh_reg = ps_num_sh_registers_gfx10;
3623d722e3fbSopenharmony_ci		}
3624d722e3fbSopenharmony_ci		context_registers = (const uint32_t *)ps_const_context_reg_gfx9;
3625d722e3fbSopenharmony_ci		num_context_reg = ps_num_context_registers_gfx9;
3626d722e3fbSopenharmony_ci	} else if (ps_type == PS_TEX) {
3627d722e3fbSopenharmony_ci		sh_registers = (const uint32_t *)ps_tex_sh_registers_gfx9;
3628d722e3fbSopenharmony_ci		context_registers = (const uint32_t *)ps_tex_context_reg_gfx9;
3629d722e3fbSopenharmony_ci		num_sh_reg = ps_num_sh_registers_gfx9;
3630d722e3fbSopenharmony_ci		num_context_reg = ps_num_context_registers_gfx9;
3631d722e3fbSopenharmony_ci	}
3632d722e3fbSopenharmony_ci
3633d722e3fbSopenharmony_ci	i = 0;
3634d722e3fbSopenharmony_ci
3635d722e3fbSopenharmony_ci	if (version == 9) {
3636d722e3fbSopenharmony_ci		/* 0x2c07   SPI_SHADER_PGM_RSRC3_PS
3637d722e3fbSopenharmony_ci		   0x2c08   SPI_SHADER_PGM_LO_PS
3638d722e3fbSopenharmony_ci		   0x2c09   SPI_SHADER_PGM_HI_PS */
3639d722e3fbSopenharmony_ci		/* multiplicator 9 is from  SPI_SHADER_COL_FORMAT */
3640d722e3fbSopenharmony_ci		shader_addr += 256 * 9;
3641d722e3fbSopenharmony_ci		ptr[i++] = PACKET3(PKT3_SET_SH_REG, 3);
3642d722e3fbSopenharmony_ci		ptr[i++] = 0x7;
3643d722e3fbSopenharmony_ci		ptr[i++] = 0xffff;
3644d722e3fbSopenharmony_ci		ptr[i++] = shader_addr >> 8;
3645d722e3fbSopenharmony_ci		ptr[i++] = shader_addr >> 40;
3646d722e3fbSopenharmony_ci	} else if (version == 10) {
3647d722e3fbSopenharmony_ci		shader_addr += 256 * 9;
3648d722e3fbSopenharmony_ci		/* 0x2c08	 SPI_SHADER_PGM_LO_PS
3649d722e3fbSopenharmony_ci		     0x2c09	 SPI_SHADER_PGM_HI_PS */
3650d722e3fbSopenharmony_ci		ptr[i++] = PACKET3(PKT3_SET_SH_REG, 2);
3651d722e3fbSopenharmony_ci		ptr[i++] = 0x8;
3652d722e3fbSopenharmony_ci		ptr[i++] = shader_addr >> 8;
3653d722e3fbSopenharmony_ci		ptr[i++] = shader_addr >> 40;
3654d722e3fbSopenharmony_ci
3655d722e3fbSopenharmony_ci		/* mmSPI_SHADER_PGM_RSRC3_PS */
3656d722e3fbSopenharmony_ci		ptr[i++] = PACKET3(PKT3_SET_SH_REG_INDEX, 1);
3657d722e3fbSopenharmony_ci		ptr[i++] = 0x30000007;
3658d722e3fbSopenharmony_ci		ptr[i++] = 0xffff;
3659d722e3fbSopenharmony_ci		/* mmSPI_SHADER_PGM_RSRC4_PS */
3660d722e3fbSopenharmony_ci		ptr[i++] = PACKET3(PKT3_SET_SH_REG_INDEX, 1);
3661d722e3fbSopenharmony_ci		ptr[i++] = 0x30000001;
3662d722e3fbSopenharmony_ci		ptr[i++] = 0xffff;
3663d722e3fbSopenharmony_ci	}
3664d722e3fbSopenharmony_ci
3665d722e3fbSopenharmony_ci	for (j = 0; j < num_sh_reg; j++) {
3666d722e3fbSopenharmony_ci		ptr[i++] = PACKET3(PKT3_SET_SH_REG, 1);
3667d722e3fbSopenharmony_ci		ptr[i++] = sh_registers[j * 2] - 0x2c00;
3668d722e3fbSopenharmony_ci		ptr[i++] = sh_registers[j * 2 + 1];
3669d722e3fbSopenharmony_ci	}
3670d722e3fbSopenharmony_ci
3671d722e3fbSopenharmony_ci	for (j = 0; j < num_context_reg; j++) {
3672d722e3fbSopenharmony_ci		if (context_registers[j * 2] != 0xA1C5) {
3673d722e3fbSopenharmony_ci			ptr[i++] = PACKET3(PACKET3_SET_CONTEXT_REG, 1);
3674d722e3fbSopenharmony_ci			ptr[i++] = context_registers[j * 2] - 0xa000;
3675d722e3fbSopenharmony_ci			ptr[i++] = context_registers[j * 2 + 1];
3676d722e3fbSopenharmony_ci		}
3677d722e3fbSopenharmony_ci
3678d722e3fbSopenharmony_ci		if (context_registers[j * 2] == 0xA1B4) {
3679d722e3fbSopenharmony_ci			ptr[i++] = PACKET3(PACKET3_SET_CONTEXT_REG, 1);
3680d722e3fbSopenharmony_ci			ptr[i++] = 0x1b3;
3681d722e3fbSopenharmony_ci			ptr[i++] = 2;
3682d722e3fbSopenharmony_ci		}
3683d722e3fbSopenharmony_ci	}
3684d722e3fbSopenharmony_ci
3685d722e3fbSopenharmony_ci	return i;
3686d722e3fbSopenharmony_ci}
3687d722e3fbSopenharmony_ci
3688d722e3fbSopenharmony_cistatic int amdgpu_draw_draw(uint32_t *ptr, uint32_t version)
3689d722e3fbSopenharmony_ci{
3690d722e3fbSopenharmony_ci	int i = 0;
3691d722e3fbSopenharmony_ci
3692d722e3fbSopenharmony_ci	if (version == 9) {
3693d722e3fbSopenharmony_ci		/* mmIA_MULTI_VGT_PARAM */
3694d722e3fbSopenharmony_ci		ptr[i++] = PACKET3(PACKET3_SET_UCONFIG_REG, 1);
3695d722e3fbSopenharmony_ci		ptr[i++] = 0x40000258;
3696d722e3fbSopenharmony_ci		ptr[i++] = 0xd00ff;
3697d722e3fbSopenharmony_ci		/* mmVGT_PRIMITIVE_TYPE */
3698d722e3fbSopenharmony_ci		ptr[i++] = PACKET3(PACKET3_SET_UCONFIG_REG, 1);
3699d722e3fbSopenharmony_ci		ptr[i++] = 0x10000242;
3700d722e3fbSopenharmony_ci		ptr[i++] = 0x11;
3701d722e3fbSopenharmony_ci	} else if (version == 10) {
3702d722e3fbSopenharmony_ci		/* mmGE_CNTL */
3703d722e3fbSopenharmony_ci		ptr[i++] = PACKET3(PACKET3_SET_UCONFIG_REG, 1);
3704d722e3fbSopenharmony_ci		ptr[i++] = 0x25b;
3705d722e3fbSopenharmony_ci		ptr[i++] = 0xff;
3706d722e3fbSopenharmony_ci		/* mmVGT_PRIMITIVE_TYPE */
3707d722e3fbSopenharmony_ci		ptr[i++] = PACKET3(PACKET3_SET_UCONFIG_REG, 1);
3708d722e3fbSopenharmony_ci		ptr[i++] = 0x242;
3709d722e3fbSopenharmony_ci		ptr[i++] = 0x11;
3710d722e3fbSopenharmony_ci	}
3711d722e3fbSopenharmony_ci
3712d722e3fbSopenharmony_ci	ptr[i++] = PACKET3(PACKET3_DRAW_INDEX_AUTO, 1);
3713d722e3fbSopenharmony_ci	ptr[i++] = 3;
3714d722e3fbSopenharmony_ci	ptr[i++] = 2;
3715d722e3fbSopenharmony_ci
3716d722e3fbSopenharmony_ci	return i;
3717d722e3fbSopenharmony_ci}
3718d722e3fbSopenharmony_ci
3719d722e3fbSopenharmony_civoid amdgpu_memset_draw(amdgpu_device_handle device_handle,
3720d722e3fbSopenharmony_ci			amdgpu_bo_handle bo_shader_ps,
3721d722e3fbSopenharmony_ci			amdgpu_bo_handle bo_shader_vs,
3722d722e3fbSopenharmony_ci			uint64_t mc_address_shader_ps,
3723d722e3fbSopenharmony_ci			uint64_t mc_address_shader_vs,
3724d722e3fbSopenharmony_ci			uint32_t ring_id, uint32_t version)
3725d722e3fbSopenharmony_ci{
3726d722e3fbSopenharmony_ci	amdgpu_context_handle context_handle;
3727d722e3fbSopenharmony_ci	amdgpu_bo_handle bo_dst, bo_cmd, resources[4];
3728d722e3fbSopenharmony_ci	volatile unsigned char *ptr_dst;
3729d722e3fbSopenharmony_ci	uint32_t *ptr_cmd;
3730d722e3fbSopenharmony_ci	uint64_t mc_address_dst, mc_address_cmd;
3731d722e3fbSopenharmony_ci	amdgpu_va_handle va_dst, va_cmd;
3732d722e3fbSopenharmony_ci	int i, r;
3733d722e3fbSopenharmony_ci	int bo_dst_size = 16384;
3734d722e3fbSopenharmony_ci	int bo_cmd_size = 4096;
3735d722e3fbSopenharmony_ci	struct amdgpu_cs_request ibs_request = {0};
3736d722e3fbSopenharmony_ci	struct amdgpu_cs_ib_info ib_info = {0};
3737d722e3fbSopenharmony_ci	struct amdgpu_cs_fence fence_status = {0};
3738d722e3fbSopenharmony_ci	uint32_t expired;
3739d722e3fbSopenharmony_ci	amdgpu_bo_list_handle bo_list;
3740d722e3fbSopenharmony_ci
3741d722e3fbSopenharmony_ci	r = amdgpu_cs_ctx_create(device_handle, &context_handle);
3742d722e3fbSopenharmony_ci	CU_ASSERT_EQUAL(r, 0);
3743d722e3fbSopenharmony_ci
3744d722e3fbSopenharmony_ci	r = amdgpu_bo_alloc_and_map(device_handle, bo_cmd_size, 4096,
3745d722e3fbSopenharmony_ci					AMDGPU_GEM_DOMAIN_GTT, 0,
3746d722e3fbSopenharmony_ci					&bo_cmd, (void **)&ptr_cmd,
3747d722e3fbSopenharmony_ci					&mc_address_cmd, &va_cmd);
3748d722e3fbSopenharmony_ci	CU_ASSERT_EQUAL(r, 0);
3749d722e3fbSopenharmony_ci	memset(ptr_cmd, 0, bo_cmd_size);
3750d722e3fbSopenharmony_ci
3751d722e3fbSopenharmony_ci	r = amdgpu_bo_alloc_and_map(device_handle, bo_dst_size, 4096,
3752d722e3fbSopenharmony_ci					AMDGPU_GEM_DOMAIN_VRAM, 0,
3753d722e3fbSopenharmony_ci					&bo_dst, (void **)&ptr_dst,
3754d722e3fbSopenharmony_ci					&mc_address_dst, &va_dst);
3755d722e3fbSopenharmony_ci	CU_ASSERT_EQUAL(r, 0);
3756d722e3fbSopenharmony_ci
3757d722e3fbSopenharmony_ci	i = 0;
3758d722e3fbSopenharmony_ci	i += amdgpu_draw_init(ptr_cmd + i, version);
3759d722e3fbSopenharmony_ci
3760d722e3fbSopenharmony_ci	i += amdgpu_draw_setup_and_write_drawblt_surf_info(ptr_cmd + i, mc_address_dst, version, 0);
3761d722e3fbSopenharmony_ci
3762d722e3fbSopenharmony_ci	i += amdgpu_draw_setup_and_write_drawblt_state(ptr_cmd + i, version, 0);
3763d722e3fbSopenharmony_ci
3764d722e3fbSopenharmony_ci	i += amdgpu_draw_vs_RectPosTexFast_write2hw(ptr_cmd + i, PS_CONST, mc_address_shader_vs,
3765d722e3fbSopenharmony_ci						    version, 0);
3766d722e3fbSopenharmony_ci
3767d722e3fbSopenharmony_ci	i += amdgpu_draw_ps_write2hw(ptr_cmd + i, PS_CONST, mc_address_shader_ps, version);
3768d722e3fbSopenharmony_ci
3769d722e3fbSopenharmony_ci	ptr_cmd[i++] = PACKET3(PKT3_SET_SH_REG, 4);
3770d722e3fbSopenharmony_ci	ptr_cmd[i++] = 0xc;
3771d722e3fbSopenharmony_ci	ptr_cmd[i++] = 0x33333333;
3772d722e3fbSopenharmony_ci	ptr_cmd[i++] = 0x33333333;
3773d722e3fbSopenharmony_ci	ptr_cmd[i++] = 0x33333333;
3774d722e3fbSopenharmony_ci	ptr_cmd[i++] = 0x33333333;
3775d722e3fbSopenharmony_ci
3776d722e3fbSopenharmony_ci	i += amdgpu_draw_draw(ptr_cmd + i, version);
3777d722e3fbSopenharmony_ci
3778d722e3fbSopenharmony_ci	while (i & 7)
3779d722e3fbSopenharmony_ci		ptr_cmd[i++] = 0xffff1000; /* type3 nop packet */
3780d722e3fbSopenharmony_ci
3781d722e3fbSopenharmony_ci	resources[0] = bo_dst;
3782d722e3fbSopenharmony_ci	resources[1] = bo_shader_ps;
3783d722e3fbSopenharmony_ci	resources[2] = bo_shader_vs;
3784d722e3fbSopenharmony_ci	resources[3] = bo_cmd;
3785d722e3fbSopenharmony_ci	r = amdgpu_bo_list_create(device_handle, 4, resources, NULL, &bo_list);
3786d722e3fbSopenharmony_ci	CU_ASSERT_EQUAL(r, 0);
3787d722e3fbSopenharmony_ci
3788d722e3fbSopenharmony_ci	ib_info.ib_mc_address = mc_address_cmd;
3789d722e3fbSopenharmony_ci	ib_info.size = i;
3790d722e3fbSopenharmony_ci	ibs_request.ip_type = AMDGPU_HW_IP_GFX;
3791d722e3fbSopenharmony_ci	ibs_request.ring = ring_id;
3792d722e3fbSopenharmony_ci	ibs_request.resources = bo_list;
3793d722e3fbSopenharmony_ci	ibs_request.number_of_ibs = 1;
3794d722e3fbSopenharmony_ci	ibs_request.ibs = &ib_info;
3795d722e3fbSopenharmony_ci	ibs_request.fence_info.handle = NULL;
3796d722e3fbSopenharmony_ci
3797d722e3fbSopenharmony_ci	/* submit CS */
3798d722e3fbSopenharmony_ci	r = amdgpu_cs_submit(context_handle, 0, &ibs_request, 1);
3799d722e3fbSopenharmony_ci	CU_ASSERT_EQUAL(r, 0);
3800d722e3fbSopenharmony_ci
3801d722e3fbSopenharmony_ci	r = amdgpu_bo_list_destroy(bo_list);
3802d722e3fbSopenharmony_ci	CU_ASSERT_EQUAL(r, 0);
3803d722e3fbSopenharmony_ci
3804d722e3fbSopenharmony_ci	fence_status.ip_type = AMDGPU_HW_IP_GFX;
3805d722e3fbSopenharmony_ci	fence_status.ip_instance = 0;
3806d722e3fbSopenharmony_ci	fence_status.ring = ring_id;
3807d722e3fbSopenharmony_ci	fence_status.context = context_handle;
3808d722e3fbSopenharmony_ci	fence_status.fence = ibs_request.seq_no;
3809d722e3fbSopenharmony_ci
3810d722e3fbSopenharmony_ci	/* wait for IB accomplished */
3811d722e3fbSopenharmony_ci	r = amdgpu_cs_query_fence_status(&fence_status,
3812d722e3fbSopenharmony_ci					 AMDGPU_TIMEOUT_INFINITE,
3813d722e3fbSopenharmony_ci					 0, &expired);
3814d722e3fbSopenharmony_ci	CU_ASSERT_EQUAL(r, 0);
3815d722e3fbSopenharmony_ci	CU_ASSERT_EQUAL(expired, true);
3816d722e3fbSopenharmony_ci
3817d722e3fbSopenharmony_ci	/* verify if memset test result meets with expected */
3818d722e3fbSopenharmony_ci	i = 0;
3819d722e3fbSopenharmony_ci	while(i < bo_dst_size) {
3820d722e3fbSopenharmony_ci		CU_ASSERT_EQUAL(ptr_dst[i++], 0x33);
3821d722e3fbSopenharmony_ci	}
3822d722e3fbSopenharmony_ci
3823d722e3fbSopenharmony_ci	r = amdgpu_bo_unmap_and_free(bo_dst, va_dst, mc_address_dst, bo_dst_size);
3824d722e3fbSopenharmony_ci	CU_ASSERT_EQUAL(r, 0);
3825d722e3fbSopenharmony_ci
3826d722e3fbSopenharmony_ci	r = amdgpu_bo_unmap_and_free(bo_cmd, va_cmd, mc_address_cmd, bo_cmd_size);
3827d722e3fbSopenharmony_ci	CU_ASSERT_EQUAL(r, 0);
3828d722e3fbSopenharmony_ci
3829d722e3fbSopenharmony_ci	r = amdgpu_cs_ctx_free(context_handle);
3830d722e3fbSopenharmony_ci	CU_ASSERT_EQUAL(r, 0);
3831d722e3fbSopenharmony_ci}
3832d722e3fbSopenharmony_ci
3833d722e3fbSopenharmony_cistatic void amdgpu_memset_draw_test(amdgpu_device_handle device_handle,
3834d722e3fbSopenharmony_ci				    uint32_t ring, int version)
3835d722e3fbSopenharmony_ci{
3836d722e3fbSopenharmony_ci	amdgpu_bo_handle bo_shader_ps, bo_shader_vs;
3837d722e3fbSopenharmony_ci	void *ptr_shader_ps;
3838d722e3fbSopenharmony_ci	void *ptr_shader_vs;
3839d722e3fbSopenharmony_ci	uint64_t mc_address_shader_ps, mc_address_shader_vs;
3840d722e3fbSopenharmony_ci	amdgpu_va_handle va_shader_ps, va_shader_vs;
3841d722e3fbSopenharmony_ci	int r;
3842d722e3fbSopenharmony_ci	int bo_shader_size = 4096;
3843d722e3fbSopenharmony_ci
3844d722e3fbSopenharmony_ci	r = amdgpu_bo_alloc_and_map(device_handle, bo_shader_size, 4096,
3845d722e3fbSopenharmony_ci					AMDGPU_GEM_DOMAIN_VRAM, 0,
3846d722e3fbSopenharmony_ci					&bo_shader_ps, &ptr_shader_ps,
3847d722e3fbSopenharmony_ci					&mc_address_shader_ps, &va_shader_ps);
3848d722e3fbSopenharmony_ci	CU_ASSERT_EQUAL(r, 0);
3849d722e3fbSopenharmony_ci	memset(ptr_shader_ps, 0, bo_shader_size);
3850d722e3fbSopenharmony_ci
3851d722e3fbSopenharmony_ci	r = amdgpu_bo_alloc_and_map(device_handle, bo_shader_size, 4096,
3852d722e3fbSopenharmony_ci					AMDGPU_GEM_DOMAIN_VRAM, 0,
3853d722e3fbSopenharmony_ci					&bo_shader_vs, &ptr_shader_vs,
3854d722e3fbSopenharmony_ci					&mc_address_shader_vs, &va_shader_vs);
3855d722e3fbSopenharmony_ci	CU_ASSERT_EQUAL(r, 0);
3856d722e3fbSopenharmony_ci	memset(ptr_shader_vs, 0, bo_shader_size);
3857d722e3fbSopenharmony_ci
3858d722e3fbSopenharmony_ci	r = amdgpu_draw_load_ps_shader(ptr_shader_ps, PS_CONST, version);
3859d722e3fbSopenharmony_ci	CU_ASSERT_EQUAL(r, 0);
3860d722e3fbSopenharmony_ci
3861d722e3fbSopenharmony_ci	r = amdgpu_draw_load_vs_shader(ptr_shader_vs, version);
3862d722e3fbSopenharmony_ci	CU_ASSERT_EQUAL(r, 0);
3863d722e3fbSopenharmony_ci
3864d722e3fbSopenharmony_ci	amdgpu_memset_draw(device_handle, bo_shader_ps, bo_shader_vs,
3865d722e3fbSopenharmony_ci			mc_address_shader_ps, mc_address_shader_vs,
3866d722e3fbSopenharmony_ci			ring, version);
3867d722e3fbSopenharmony_ci
3868d722e3fbSopenharmony_ci	r = amdgpu_bo_unmap_and_free(bo_shader_ps, va_shader_ps, mc_address_shader_ps, bo_shader_size);
3869d722e3fbSopenharmony_ci	CU_ASSERT_EQUAL(r, 0);
3870d722e3fbSopenharmony_ci
3871d722e3fbSopenharmony_ci	r = amdgpu_bo_unmap_and_free(bo_shader_vs, va_shader_vs, mc_address_shader_vs, bo_shader_size);
3872d722e3fbSopenharmony_ci	CU_ASSERT_EQUAL(r, 0);
3873d722e3fbSopenharmony_ci}
3874d722e3fbSopenharmony_ci
3875d722e3fbSopenharmony_cistatic void amdgpu_memcpy_draw(amdgpu_device_handle device_handle,
3876d722e3fbSopenharmony_ci			       amdgpu_bo_handle bo_shader_ps,
3877d722e3fbSopenharmony_ci			       amdgpu_bo_handle bo_shader_vs,
3878d722e3fbSopenharmony_ci			       uint64_t mc_address_shader_ps,
3879d722e3fbSopenharmony_ci			       uint64_t mc_address_shader_vs,
3880d722e3fbSopenharmony_ci			       uint32_t ring, int version, int hang)
3881d722e3fbSopenharmony_ci{
3882d722e3fbSopenharmony_ci	amdgpu_context_handle context_handle;
3883d722e3fbSopenharmony_ci	amdgpu_bo_handle bo_dst, bo_src, bo_cmd, resources[5];
3884d722e3fbSopenharmony_ci	volatile unsigned char *ptr_dst;
3885d722e3fbSopenharmony_ci	unsigned char *ptr_src;
3886d722e3fbSopenharmony_ci	uint32_t *ptr_cmd;
3887d722e3fbSopenharmony_ci	uint64_t mc_address_dst, mc_address_src, mc_address_cmd;
3888d722e3fbSopenharmony_ci	amdgpu_va_handle va_dst, va_src, va_cmd;
3889d722e3fbSopenharmony_ci	int i, r;
3890d722e3fbSopenharmony_ci	int bo_size = 16384;
3891d722e3fbSopenharmony_ci	int bo_cmd_size = 4096;
3892d722e3fbSopenharmony_ci	struct amdgpu_cs_request ibs_request = {0};
3893d722e3fbSopenharmony_ci	struct amdgpu_cs_ib_info ib_info= {0};
3894d722e3fbSopenharmony_ci	uint32_t hang_state, hangs;
3895d722e3fbSopenharmony_ci	uint32_t expired;
3896d722e3fbSopenharmony_ci	amdgpu_bo_list_handle bo_list;
3897d722e3fbSopenharmony_ci	struct amdgpu_cs_fence fence_status = {0};
3898d722e3fbSopenharmony_ci
3899d722e3fbSopenharmony_ci	r = amdgpu_cs_ctx_create(device_handle, &context_handle);
3900d722e3fbSopenharmony_ci	CU_ASSERT_EQUAL(r, 0);
3901d722e3fbSopenharmony_ci
3902d722e3fbSopenharmony_ci	r = amdgpu_bo_alloc_and_map(device_handle, bo_cmd_size, 4096,
3903d722e3fbSopenharmony_ci				    AMDGPU_GEM_DOMAIN_GTT, 0,
3904d722e3fbSopenharmony_ci				    &bo_cmd, (void **)&ptr_cmd,
3905d722e3fbSopenharmony_ci				    &mc_address_cmd, &va_cmd);
3906d722e3fbSopenharmony_ci	CU_ASSERT_EQUAL(r, 0);
3907d722e3fbSopenharmony_ci	memset(ptr_cmd, 0, bo_cmd_size);
3908d722e3fbSopenharmony_ci
3909d722e3fbSopenharmony_ci	r = amdgpu_bo_alloc_and_map(device_handle, bo_size, 4096,
3910d722e3fbSopenharmony_ci					AMDGPU_GEM_DOMAIN_VRAM, 0,
3911d722e3fbSopenharmony_ci					&bo_src, (void **)&ptr_src,
3912d722e3fbSopenharmony_ci					&mc_address_src, &va_src);
3913d722e3fbSopenharmony_ci	CU_ASSERT_EQUAL(r, 0);
3914d722e3fbSopenharmony_ci
3915d722e3fbSopenharmony_ci	r = amdgpu_bo_alloc_and_map(device_handle, bo_size, 4096,
3916d722e3fbSopenharmony_ci					AMDGPU_GEM_DOMAIN_VRAM, 0,
3917d722e3fbSopenharmony_ci					&bo_dst, (void **)&ptr_dst,
3918d722e3fbSopenharmony_ci					&mc_address_dst, &va_dst);
3919d722e3fbSopenharmony_ci	CU_ASSERT_EQUAL(r, 0);
3920d722e3fbSopenharmony_ci
3921d722e3fbSopenharmony_ci	memset(ptr_src, 0x55, bo_size);
3922d722e3fbSopenharmony_ci
3923d722e3fbSopenharmony_ci	i = 0;
3924d722e3fbSopenharmony_ci	i += amdgpu_draw_init(ptr_cmd + i, version);
3925d722e3fbSopenharmony_ci
3926d722e3fbSopenharmony_ci	i += amdgpu_draw_setup_and_write_drawblt_surf_info(ptr_cmd + i, mc_address_dst, version, 0);
3927d722e3fbSopenharmony_ci
3928d722e3fbSopenharmony_ci	i += amdgpu_draw_setup_and_write_drawblt_state(ptr_cmd + i, version, 0);
3929d722e3fbSopenharmony_ci
3930d722e3fbSopenharmony_ci	i += amdgpu_draw_vs_RectPosTexFast_write2hw(ptr_cmd + i, PS_TEX, mc_address_shader_vs,
3931d722e3fbSopenharmony_ci						    version, 0);
3932d722e3fbSopenharmony_ci
3933d722e3fbSopenharmony_ci	i += amdgpu_draw_ps_write2hw(ptr_cmd + i, PS_TEX, mc_address_shader_ps, version);
3934d722e3fbSopenharmony_ci
3935d722e3fbSopenharmony_ci	ptr_cmd[i++] = PACKET3(PKT3_SET_SH_REG, 8);
3936d722e3fbSopenharmony_ci	if (version == 9) {
3937d722e3fbSopenharmony_ci		ptr_cmd[i++] = 0xc;
3938d722e3fbSopenharmony_ci		ptr_cmd[i++] = mc_address_src >> 8;
3939d722e3fbSopenharmony_ci		ptr_cmd[i++] = mc_address_src >> 40 | 0x10e00000;
3940d722e3fbSopenharmony_ci		ptr_cmd[i++] = 0x7c01f;
3941d722e3fbSopenharmony_ci		ptr_cmd[i++] = 0x90500fac;
3942d722e3fbSopenharmony_ci		ptr_cmd[i++] = 0x3e000;
3943d722e3fbSopenharmony_ci		i += 3;
3944d722e3fbSopenharmony_ci	} else if (version == 10) {
3945d722e3fbSopenharmony_ci		ptr_cmd[i++] = 0xc;
3946d722e3fbSopenharmony_ci		ptr_cmd[i++] = mc_address_src >> 8;
3947d722e3fbSopenharmony_ci		ptr_cmd[i++] = mc_address_src >> 40 | 0xc4b00000;
3948d722e3fbSopenharmony_ci		ptr_cmd[i++] = 0x8007c007;
3949d722e3fbSopenharmony_ci		ptr_cmd[i++] = 0x90500fac;
3950d722e3fbSopenharmony_ci		i += 2;
3951d722e3fbSopenharmony_ci		ptr_cmd[i++] = 0x400;
3952d722e3fbSopenharmony_ci		i++;
3953d722e3fbSopenharmony_ci	}
3954d722e3fbSopenharmony_ci
3955d722e3fbSopenharmony_ci	ptr_cmd[i++] = PACKET3(PKT3_SET_SH_REG, 4);
3956d722e3fbSopenharmony_ci	ptr_cmd[i++] = 0x14;
3957d722e3fbSopenharmony_ci	ptr_cmd[i++] = 0x92;
3958d722e3fbSopenharmony_ci	i += 3;
3959d722e3fbSopenharmony_ci
3960d722e3fbSopenharmony_ci	ptr_cmd[i++] = PACKET3(PACKET3_SET_CONTEXT_REG, 1);
3961d722e3fbSopenharmony_ci	ptr_cmd[i++] = 0x191;
3962d722e3fbSopenharmony_ci	ptr_cmd[i++] = 0;
3963d722e3fbSopenharmony_ci
3964d722e3fbSopenharmony_ci	i += amdgpu_draw_draw(ptr_cmd + i, version);
3965d722e3fbSopenharmony_ci
3966d722e3fbSopenharmony_ci	while (i & 7)
3967d722e3fbSopenharmony_ci		ptr_cmd[i++] = 0xffff1000; /* type3 nop packet */
3968d722e3fbSopenharmony_ci
3969d722e3fbSopenharmony_ci	resources[0] = bo_dst;
3970d722e3fbSopenharmony_ci	resources[1] = bo_src;
3971d722e3fbSopenharmony_ci	resources[2] = bo_shader_ps;
3972d722e3fbSopenharmony_ci	resources[3] = bo_shader_vs;
3973d722e3fbSopenharmony_ci	resources[4] = bo_cmd;
3974d722e3fbSopenharmony_ci	r = amdgpu_bo_list_create(device_handle, 5, resources, NULL, &bo_list);
3975d722e3fbSopenharmony_ci	CU_ASSERT_EQUAL(r, 0);
3976d722e3fbSopenharmony_ci
3977d722e3fbSopenharmony_ci	ib_info.ib_mc_address = mc_address_cmd;
3978d722e3fbSopenharmony_ci	ib_info.size = i;
3979d722e3fbSopenharmony_ci	ibs_request.ip_type = AMDGPU_HW_IP_GFX;
3980d722e3fbSopenharmony_ci	ibs_request.ring = ring;
3981d722e3fbSopenharmony_ci	ibs_request.resources = bo_list;
3982d722e3fbSopenharmony_ci	ibs_request.number_of_ibs = 1;
3983d722e3fbSopenharmony_ci	ibs_request.ibs = &ib_info;
3984d722e3fbSopenharmony_ci	ibs_request.fence_info.handle = NULL;
3985d722e3fbSopenharmony_ci	r = amdgpu_cs_submit(context_handle, 0, &ibs_request, 1);
3986d722e3fbSopenharmony_ci	CU_ASSERT_EQUAL(r, 0);
3987d722e3fbSopenharmony_ci
3988d722e3fbSopenharmony_ci	fence_status.ip_type = AMDGPU_HW_IP_GFX;
3989d722e3fbSopenharmony_ci	fence_status.ip_instance = 0;
3990d722e3fbSopenharmony_ci	fence_status.ring = ring;
3991d722e3fbSopenharmony_ci	fence_status.context = context_handle;
3992d722e3fbSopenharmony_ci	fence_status.fence = ibs_request.seq_no;
3993d722e3fbSopenharmony_ci
3994d722e3fbSopenharmony_ci	/* wait for IB accomplished */
3995d722e3fbSopenharmony_ci	r = amdgpu_cs_query_fence_status(&fence_status,
3996d722e3fbSopenharmony_ci					 AMDGPU_TIMEOUT_INFINITE,
3997d722e3fbSopenharmony_ci					 0, &expired);
3998d722e3fbSopenharmony_ci	if (!hang) {
3999d722e3fbSopenharmony_ci		CU_ASSERT_EQUAL(r, 0);
4000d722e3fbSopenharmony_ci		CU_ASSERT_EQUAL(expired, true);
4001d722e3fbSopenharmony_ci
4002d722e3fbSopenharmony_ci		/* verify if memcpy test result meets with expected */
4003d722e3fbSopenharmony_ci		i = 0;
4004d722e3fbSopenharmony_ci		while(i < bo_size) {
4005d722e3fbSopenharmony_ci			CU_ASSERT_EQUAL(ptr_dst[i], ptr_src[i]);
4006d722e3fbSopenharmony_ci			i++;
4007d722e3fbSopenharmony_ci		}
4008d722e3fbSopenharmony_ci	} else {
4009d722e3fbSopenharmony_ci		r = amdgpu_cs_query_reset_state(context_handle, &hang_state, &hangs);
4010d722e3fbSopenharmony_ci		CU_ASSERT_EQUAL(r, 0);
4011d722e3fbSopenharmony_ci		CU_ASSERT_EQUAL(hang_state, AMDGPU_CTX_UNKNOWN_RESET);
4012d722e3fbSopenharmony_ci	}
4013d722e3fbSopenharmony_ci
4014d722e3fbSopenharmony_ci	r = amdgpu_bo_list_destroy(bo_list);
4015d722e3fbSopenharmony_ci	CU_ASSERT_EQUAL(r, 0);
4016d722e3fbSopenharmony_ci
4017d722e3fbSopenharmony_ci	r = amdgpu_bo_unmap_and_free(bo_src, va_src, mc_address_src, bo_size);
4018d722e3fbSopenharmony_ci	CU_ASSERT_EQUAL(r, 0);
4019d722e3fbSopenharmony_ci	r = amdgpu_bo_unmap_and_free(bo_dst, va_dst, mc_address_dst, bo_size);
4020d722e3fbSopenharmony_ci	CU_ASSERT_EQUAL(r, 0);
4021d722e3fbSopenharmony_ci
4022d722e3fbSopenharmony_ci	r = amdgpu_bo_unmap_and_free(bo_cmd, va_cmd, mc_address_cmd, bo_cmd_size);
4023d722e3fbSopenharmony_ci	CU_ASSERT_EQUAL(r, 0);
4024d722e3fbSopenharmony_ci
4025d722e3fbSopenharmony_ci	r = amdgpu_cs_ctx_free(context_handle);
4026d722e3fbSopenharmony_ci	CU_ASSERT_EQUAL(r, 0);
4027d722e3fbSopenharmony_ci}
4028d722e3fbSopenharmony_ci
4029d722e3fbSopenharmony_civoid amdgpu_memcpy_draw_test(amdgpu_device_handle device_handle, uint32_t ring,
4030d722e3fbSopenharmony_ci			     int version, int hang)
4031d722e3fbSopenharmony_ci{
4032d722e3fbSopenharmony_ci	amdgpu_bo_handle bo_shader_ps, bo_shader_vs;
4033d722e3fbSopenharmony_ci	void *ptr_shader_ps;
4034d722e3fbSopenharmony_ci	void *ptr_shader_vs;
4035d722e3fbSopenharmony_ci	uint64_t mc_address_shader_ps, mc_address_shader_vs;
4036d722e3fbSopenharmony_ci	amdgpu_va_handle va_shader_ps, va_shader_vs;
4037d722e3fbSopenharmony_ci	int bo_shader_size = 4096;
4038d722e3fbSopenharmony_ci	enum ps_type ps_type = hang ? PS_HANG : PS_TEX;
4039d722e3fbSopenharmony_ci	int r;
4040d722e3fbSopenharmony_ci
4041d722e3fbSopenharmony_ci	r = amdgpu_bo_alloc_and_map(device_handle, bo_shader_size, 4096,
4042d722e3fbSopenharmony_ci					AMDGPU_GEM_DOMAIN_VRAM, 0,
4043d722e3fbSopenharmony_ci					&bo_shader_ps, &ptr_shader_ps,
4044d722e3fbSopenharmony_ci					&mc_address_shader_ps, &va_shader_ps);
4045d722e3fbSopenharmony_ci	CU_ASSERT_EQUAL(r, 0);
4046d722e3fbSopenharmony_ci	memset(ptr_shader_ps, 0, bo_shader_size);
4047d722e3fbSopenharmony_ci
4048d722e3fbSopenharmony_ci	r = amdgpu_bo_alloc_and_map(device_handle, bo_shader_size, 4096,
4049d722e3fbSopenharmony_ci					AMDGPU_GEM_DOMAIN_VRAM, 0,
4050d722e3fbSopenharmony_ci					&bo_shader_vs, &ptr_shader_vs,
4051d722e3fbSopenharmony_ci					&mc_address_shader_vs, &va_shader_vs);
4052d722e3fbSopenharmony_ci	CU_ASSERT_EQUAL(r, 0);
4053d722e3fbSopenharmony_ci	memset(ptr_shader_vs, 0, bo_shader_size);
4054d722e3fbSopenharmony_ci
4055d722e3fbSopenharmony_ci	r = amdgpu_draw_load_ps_shader(ptr_shader_ps, ps_type, version);
4056d722e3fbSopenharmony_ci	CU_ASSERT_EQUAL(r, 0);
4057d722e3fbSopenharmony_ci
4058d722e3fbSopenharmony_ci	r = amdgpu_draw_load_vs_shader(ptr_shader_vs, version);
4059d722e3fbSopenharmony_ci	CU_ASSERT_EQUAL(r, 0);
4060d722e3fbSopenharmony_ci
4061d722e3fbSopenharmony_ci	amdgpu_memcpy_draw(device_handle, bo_shader_ps, bo_shader_vs,
4062d722e3fbSopenharmony_ci			mc_address_shader_ps, mc_address_shader_vs,
4063d722e3fbSopenharmony_ci			ring, version, hang);
4064d722e3fbSopenharmony_ci
4065d722e3fbSopenharmony_ci	r = amdgpu_bo_unmap_and_free(bo_shader_ps, va_shader_ps, mc_address_shader_ps, bo_shader_size);
4066d722e3fbSopenharmony_ci	CU_ASSERT_EQUAL(r, 0);
4067d722e3fbSopenharmony_ci
4068d722e3fbSopenharmony_ci	r = amdgpu_bo_unmap_and_free(bo_shader_vs, va_shader_vs, mc_address_shader_vs, bo_shader_size);
4069d722e3fbSopenharmony_ci	CU_ASSERT_EQUAL(r, 0);
4070d722e3fbSopenharmony_ci}
4071d722e3fbSopenharmony_ci
4072d722e3fbSopenharmony_cistatic void amdgpu_draw_test(void)
4073d722e3fbSopenharmony_ci{
4074d722e3fbSopenharmony_ci	int r;
4075d722e3fbSopenharmony_ci	struct drm_amdgpu_info_hw_ip info;
4076d722e3fbSopenharmony_ci	uint32_t ring_id, version;
4077d722e3fbSopenharmony_ci
4078d722e3fbSopenharmony_ci	r = amdgpu_query_hw_ip_info(device_handle, AMDGPU_HW_IP_GFX, 0, &info);
4079d722e3fbSopenharmony_ci	CU_ASSERT_EQUAL(r, 0);
4080d722e3fbSopenharmony_ci	if (!info.available_rings)
4081d722e3fbSopenharmony_ci		printf("SKIP ... as there's no graphics ring\n");
4082d722e3fbSopenharmony_ci
4083d722e3fbSopenharmony_ci	version = info.hw_ip_version_major;
4084d722e3fbSopenharmony_ci	if (version != 9 && version != 10) {
4085d722e3fbSopenharmony_ci		printf("SKIP ... unsupported gfx version %d\n", version);
4086d722e3fbSopenharmony_ci		return;
4087d722e3fbSopenharmony_ci	}
4088d722e3fbSopenharmony_ci
4089d722e3fbSopenharmony_ci	for (ring_id = 0; (1 << ring_id) & info.available_rings; ring_id++) {
4090d722e3fbSopenharmony_ci		amdgpu_memset_draw_test(device_handle, ring_id, version);
4091d722e3fbSopenharmony_ci		amdgpu_memcpy_draw_test(device_handle, ring_id, version, 0);
4092d722e3fbSopenharmony_ci	}
4093d722e3fbSopenharmony_ci}
4094d722e3fbSopenharmony_ci
4095d722e3fbSopenharmony_civoid amdgpu_memcpy_draw_hang_slow_test(amdgpu_device_handle device_handle, uint32_t ring, int version)
4096d722e3fbSopenharmony_ci{
4097d722e3fbSopenharmony_ci	amdgpu_context_handle context_handle;
4098d722e3fbSopenharmony_ci	amdgpu_bo_handle bo_shader_ps, bo_shader_vs;
4099d722e3fbSopenharmony_ci	amdgpu_bo_handle bo_dst, bo_src, bo_cmd, resources[5];
4100d722e3fbSopenharmony_ci	void *ptr_shader_ps;
4101d722e3fbSopenharmony_ci	void *ptr_shader_vs;
4102d722e3fbSopenharmony_ci	volatile unsigned char *ptr_dst;
4103d722e3fbSopenharmony_ci	unsigned char *ptr_src;
4104d722e3fbSopenharmony_ci	uint32_t *ptr_cmd;
4105d722e3fbSopenharmony_ci	uint64_t mc_address_dst, mc_address_src, mc_address_cmd;
4106d722e3fbSopenharmony_ci	uint64_t mc_address_shader_ps, mc_address_shader_vs;
4107d722e3fbSopenharmony_ci	amdgpu_va_handle va_shader_ps, va_shader_vs;
4108d722e3fbSopenharmony_ci	amdgpu_va_handle va_dst, va_src, va_cmd;
4109d722e3fbSopenharmony_ci	struct amdgpu_gpu_info gpu_info = {0};
4110d722e3fbSopenharmony_ci	int i, r;
4111d722e3fbSopenharmony_ci	int bo_size = 0x4000000;
4112d722e3fbSopenharmony_ci	int bo_shader_ps_size = 0x400000;
4113d722e3fbSopenharmony_ci	int bo_shader_vs_size = 4096;
4114d722e3fbSopenharmony_ci	int bo_cmd_size = 4096;
4115d722e3fbSopenharmony_ci	struct amdgpu_cs_request ibs_request = {0};
4116d722e3fbSopenharmony_ci	struct amdgpu_cs_ib_info ib_info= {0};
4117d722e3fbSopenharmony_ci	uint32_t hang_state, hangs, expired;
4118d722e3fbSopenharmony_ci	amdgpu_bo_list_handle bo_list;
4119d722e3fbSopenharmony_ci	struct amdgpu_cs_fence fence_status = {0};
4120d722e3fbSopenharmony_ci
4121d722e3fbSopenharmony_ci	r = amdgpu_query_gpu_info(device_handle, &gpu_info);
4122d722e3fbSopenharmony_ci	CU_ASSERT_EQUAL(r, 0);
4123d722e3fbSopenharmony_ci
4124d722e3fbSopenharmony_ci	r = amdgpu_cs_ctx_create(device_handle, &context_handle);
4125d722e3fbSopenharmony_ci	CU_ASSERT_EQUAL(r, 0);
4126d722e3fbSopenharmony_ci
4127d722e3fbSopenharmony_ci	r = amdgpu_bo_alloc_and_map(device_handle, bo_cmd_size, 4096,
4128d722e3fbSopenharmony_ci				    AMDGPU_GEM_DOMAIN_GTT, 0,
4129d722e3fbSopenharmony_ci				    &bo_cmd, (void **)&ptr_cmd,
4130d722e3fbSopenharmony_ci				    &mc_address_cmd, &va_cmd);
4131d722e3fbSopenharmony_ci	CU_ASSERT_EQUAL(r, 0);
4132d722e3fbSopenharmony_ci	memset(ptr_cmd, 0, bo_cmd_size);
4133d722e3fbSopenharmony_ci
4134d722e3fbSopenharmony_ci	r = amdgpu_bo_alloc_and_map(device_handle, bo_shader_ps_size, 4096,
4135d722e3fbSopenharmony_ci					AMDGPU_GEM_DOMAIN_VRAM, 0,
4136d722e3fbSopenharmony_ci					&bo_shader_ps, &ptr_shader_ps,
4137d722e3fbSopenharmony_ci					&mc_address_shader_ps, &va_shader_ps);
4138d722e3fbSopenharmony_ci	CU_ASSERT_EQUAL(r, 0);
4139d722e3fbSopenharmony_ci	memset(ptr_shader_ps, 0, bo_shader_ps_size);
4140d722e3fbSopenharmony_ci
4141d722e3fbSopenharmony_ci	r = amdgpu_bo_alloc_and_map(device_handle, bo_shader_vs_size, 4096,
4142d722e3fbSopenharmony_ci					AMDGPU_GEM_DOMAIN_VRAM, 0,
4143d722e3fbSopenharmony_ci					&bo_shader_vs, &ptr_shader_vs,
4144d722e3fbSopenharmony_ci					&mc_address_shader_vs, &va_shader_vs);
4145d722e3fbSopenharmony_ci	CU_ASSERT_EQUAL(r, 0);
4146d722e3fbSopenharmony_ci	memset(ptr_shader_vs, 0, bo_shader_vs_size);
4147d722e3fbSopenharmony_ci
4148d722e3fbSopenharmony_ci	r = amdgpu_draw_load_ps_shader_hang_slow(ptr_shader_ps, gpu_info.family_id);
4149d722e3fbSopenharmony_ci	CU_ASSERT_EQUAL(r, 0);
4150d722e3fbSopenharmony_ci
4151d722e3fbSopenharmony_ci	r = amdgpu_draw_load_vs_shader(ptr_shader_vs, version);
4152d722e3fbSopenharmony_ci	CU_ASSERT_EQUAL(r, 0);
4153d722e3fbSopenharmony_ci
4154d722e3fbSopenharmony_ci	r = amdgpu_bo_alloc_and_map(device_handle, bo_size, 4096,
4155d722e3fbSopenharmony_ci					AMDGPU_GEM_DOMAIN_VRAM, 0,
4156d722e3fbSopenharmony_ci					&bo_src, (void **)&ptr_src,
4157d722e3fbSopenharmony_ci					&mc_address_src, &va_src);
4158d722e3fbSopenharmony_ci	CU_ASSERT_EQUAL(r, 0);
4159d722e3fbSopenharmony_ci
4160d722e3fbSopenharmony_ci	r = amdgpu_bo_alloc_and_map(device_handle, bo_size, 4096,
4161d722e3fbSopenharmony_ci					AMDGPU_GEM_DOMAIN_VRAM, 0,
4162d722e3fbSopenharmony_ci					&bo_dst, (void **)&ptr_dst,
4163d722e3fbSopenharmony_ci					&mc_address_dst, &va_dst);
4164d722e3fbSopenharmony_ci	CU_ASSERT_EQUAL(r, 0);
4165d722e3fbSopenharmony_ci
4166d722e3fbSopenharmony_ci	memset(ptr_src, 0x55, bo_size);
4167d722e3fbSopenharmony_ci
4168d722e3fbSopenharmony_ci	i = 0;
4169d722e3fbSopenharmony_ci	i += amdgpu_draw_init(ptr_cmd + i, version);
4170d722e3fbSopenharmony_ci
4171d722e3fbSopenharmony_ci	i += amdgpu_draw_setup_and_write_drawblt_surf_info(ptr_cmd + i, mc_address_dst, version, 1);
4172d722e3fbSopenharmony_ci
4173d722e3fbSopenharmony_ci	i += amdgpu_draw_setup_and_write_drawblt_state(ptr_cmd + i, version, 1);
4174d722e3fbSopenharmony_ci
4175d722e3fbSopenharmony_ci	i += amdgpu_draw_vs_RectPosTexFast_write2hw(ptr_cmd + i, PS_TEX,
4176d722e3fbSopenharmony_ci							mc_address_shader_vs, version, 1);
4177d722e3fbSopenharmony_ci
4178d722e3fbSopenharmony_ci	i += amdgpu_draw_ps_write2hw(ptr_cmd + i, PS_TEX, mc_address_shader_ps, version);
4179d722e3fbSopenharmony_ci
4180d722e3fbSopenharmony_ci	ptr_cmd[i++] = PACKET3(PKT3_SET_SH_REG, 8);
4181d722e3fbSopenharmony_ci
4182d722e3fbSopenharmony_ci	if (version == 9) {
4183d722e3fbSopenharmony_ci		ptr_cmd[i++] = 0xc;
4184d722e3fbSopenharmony_ci		ptr_cmd[i++] = mc_address_src >> 8;
4185d722e3fbSopenharmony_ci		ptr_cmd[i++] = mc_address_src >> 40 | 0x10e00000;
4186d722e3fbSopenharmony_ci		ptr_cmd[i++] = 0x1ffcfff;
4187d722e3fbSopenharmony_ci		ptr_cmd[i++] = 0x90500fac;
4188d722e3fbSopenharmony_ci		ptr_cmd[i++] = 0x1ffe000;
4189d722e3fbSopenharmony_ci		i += 3;
4190d722e3fbSopenharmony_ci	} else if (version == 10) {
4191d722e3fbSopenharmony_ci		ptr_cmd[i++] = 0xc;
4192d722e3fbSopenharmony_ci		ptr_cmd[i++] = mc_address_src >> 8;
4193d722e3fbSopenharmony_ci		ptr_cmd[i++] = mc_address_src >> 40 | 0xc4b00000;
4194d722e3fbSopenharmony_ci		ptr_cmd[i++] = 0x81ffc1ff;
4195d722e3fbSopenharmony_ci		ptr_cmd[i++] = 0x90500fac;
4196d722e3fbSopenharmony_ci		i += 4;
4197d722e3fbSopenharmony_ci	}
4198d722e3fbSopenharmony_ci
4199d722e3fbSopenharmony_ci	ptr_cmd[i++] = PACKET3(PKT3_SET_SH_REG, 4);
4200d722e3fbSopenharmony_ci	ptr_cmd[i++] = 0x14;
4201d722e3fbSopenharmony_ci	ptr_cmd[i++] = 0x92;
4202d722e3fbSopenharmony_ci	i += 3;
4203d722e3fbSopenharmony_ci
4204d722e3fbSopenharmony_ci	ptr_cmd[i++] = PACKET3(PACKET3_SET_CONTEXT_REG, 1);
4205d722e3fbSopenharmony_ci	ptr_cmd[i++] = 0x191;
4206d722e3fbSopenharmony_ci	ptr_cmd[i++] = 0;
4207d722e3fbSopenharmony_ci
4208d722e3fbSopenharmony_ci	i += amdgpu_draw_draw(ptr_cmd + i, version);
4209d722e3fbSopenharmony_ci
4210d722e3fbSopenharmony_ci	while (i & 7)
4211d722e3fbSopenharmony_ci		ptr_cmd[i++] = 0xffff1000; /* type3 nop packet */
4212d722e3fbSopenharmony_ci
4213d722e3fbSopenharmony_ci	resources[0] = bo_dst;
4214d722e3fbSopenharmony_ci	resources[1] = bo_src;
4215d722e3fbSopenharmony_ci	resources[2] = bo_shader_ps;
4216d722e3fbSopenharmony_ci	resources[3] = bo_shader_vs;
4217d722e3fbSopenharmony_ci	resources[4] = bo_cmd;
4218d722e3fbSopenharmony_ci	r = amdgpu_bo_list_create(device_handle, 5, resources, NULL, &bo_list);
4219d722e3fbSopenharmony_ci	CU_ASSERT_EQUAL(r, 0);
4220d722e3fbSopenharmony_ci
4221d722e3fbSopenharmony_ci	ib_info.ib_mc_address = mc_address_cmd;
4222d722e3fbSopenharmony_ci	ib_info.size = i;
4223d722e3fbSopenharmony_ci	ibs_request.ip_type = AMDGPU_HW_IP_GFX;
4224d722e3fbSopenharmony_ci	ibs_request.ring = ring;
4225d722e3fbSopenharmony_ci	ibs_request.resources = bo_list;
4226d722e3fbSopenharmony_ci	ibs_request.number_of_ibs = 1;
4227d722e3fbSopenharmony_ci	ibs_request.ibs = &ib_info;
4228d722e3fbSopenharmony_ci	ibs_request.fence_info.handle = NULL;
4229d722e3fbSopenharmony_ci	r = amdgpu_cs_submit(context_handle, 0, &ibs_request, 1);
4230d722e3fbSopenharmony_ci	CU_ASSERT_EQUAL(r, 0);
4231d722e3fbSopenharmony_ci
4232d722e3fbSopenharmony_ci	fence_status.ip_type = AMDGPU_HW_IP_GFX;
4233d722e3fbSopenharmony_ci	fence_status.ip_instance = 0;
4234d722e3fbSopenharmony_ci	fence_status.ring = ring;
4235d722e3fbSopenharmony_ci	fence_status.context = context_handle;
4236d722e3fbSopenharmony_ci	fence_status.fence = ibs_request.seq_no;
4237d722e3fbSopenharmony_ci
4238d722e3fbSopenharmony_ci	/* wait for IB accomplished */
4239d722e3fbSopenharmony_ci	r = amdgpu_cs_query_fence_status(&fence_status,
4240d722e3fbSopenharmony_ci					 AMDGPU_TIMEOUT_INFINITE,
4241d722e3fbSopenharmony_ci					 0, &expired);
4242d722e3fbSopenharmony_ci
4243d722e3fbSopenharmony_ci	r = amdgpu_cs_query_reset_state(context_handle, &hang_state, &hangs);
4244d722e3fbSopenharmony_ci	CU_ASSERT_EQUAL(r, 0);
4245d722e3fbSopenharmony_ci	CU_ASSERT_EQUAL(hang_state, AMDGPU_CTX_UNKNOWN_RESET);
4246d722e3fbSopenharmony_ci
4247d722e3fbSopenharmony_ci	r = amdgpu_bo_list_destroy(bo_list);
4248d722e3fbSopenharmony_ci	CU_ASSERT_EQUAL(r, 0);
4249d722e3fbSopenharmony_ci
4250d722e3fbSopenharmony_ci	r = amdgpu_bo_unmap_and_free(bo_dst, va_dst, mc_address_dst, bo_size);
4251d722e3fbSopenharmony_ci	CU_ASSERT_EQUAL(r, 0);
4252d722e3fbSopenharmony_ci	r = amdgpu_bo_unmap_and_free(bo_src, va_src, mc_address_src, bo_size);
4253d722e3fbSopenharmony_ci	CU_ASSERT_EQUAL(r, 0);
4254d722e3fbSopenharmony_ci
4255d722e3fbSopenharmony_ci	r = amdgpu_bo_unmap_and_free(bo_cmd, va_cmd, mc_address_cmd, bo_cmd_size);
4256d722e3fbSopenharmony_ci	CU_ASSERT_EQUAL(r, 0);
4257d722e3fbSopenharmony_ci
4258d722e3fbSopenharmony_ci	r = amdgpu_bo_unmap_and_free(bo_shader_ps, va_shader_ps, mc_address_shader_ps, bo_shader_ps_size);
4259d722e3fbSopenharmony_ci	CU_ASSERT_EQUAL(r, 0);
4260d722e3fbSopenharmony_ci	r = amdgpu_bo_unmap_and_free(bo_shader_vs, va_shader_vs, mc_address_shader_vs, bo_shader_vs_size);
4261d722e3fbSopenharmony_ci	CU_ASSERT_EQUAL(r, 0);
4262d722e3fbSopenharmony_ci
4263d722e3fbSopenharmony_ci	r = amdgpu_cs_ctx_free(context_handle);
4264d722e3fbSopenharmony_ci	CU_ASSERT_EQUAL(r, 0);
4265d722e3fbSopenharmony_ci}
4266d722e3fbSopenharmony_ci
4267d722e3fbSopenharmony_cistatic void amdgpu_gpu_reset_test(void)
4268d722e3fbSopenharmony_ci{
4269d722e3fbSopenharmony_ci	int r;
4270d722e3fbSopenharmony_ci	char debugfs_path[256], tmp[10];
4271d722e3fbSopenharmony_ci	int fd;
4272d722e3fbSopenharmony_ci	struct stat sbuf;
4273d722e3fbSopenharmony_ci	amdgpu_context_handle context_handle;
4274d722e3fbSopenharmony_ci	uint32_t hang_state, hangs;
4275d722e3fbSopenharmony_ci
4276d722e3fbSopenharmony_ci	r = amdgpu_cs_ctx_create(device_handle, &context_handle);
4277d722e3fbSopenharmony_ci	CU_ASSERT_EQUAL(r, 0);
4278d722e3fbSopenharmony_ci
4279d722e3fbSopenharmony_ci	r = fstat(drm_amdgpu[0], &sbuf);
4280d722e3fbSopenharmony_ci	CU_ASSERT_EQUAL(r, 0);
4281d722e3fbSopenharmony_ci
4282d722e3fbSopenharmony_ci	sprintf(debugfs_path, "/sys/kernel/debug/dri/%d/amdgpu_gpu_recover", minor(sbuf.st_rdev));
4283d722e3fbSopenharmony_ci	fd = open(debugfs_path, O_RDONLY);
4284d722e3fbSopenharmony_ci	CU_ASSERT(fd >= 0);
4285d722e3fbSopenharmony_ci
4286d722e3fbSopenharmony_ci	r = read(fd, tmp, sizeof(tmp)/sizeof(char));
4287d722e3fbSopenharmony_ci	CU_ASSERT(r > 0);
4288d722e3fbSopenharmony_ci
4289d722e3fbSopenharmony_ci	r = amdgpu_cs_query_reset_state(context_handle, &hang_state, &hangs);
4290d722e3fbSopenharmony_ci	CU_ASSERT_EQUAL(r, 0);
4291d722e3fbSopenharmony_ci	CU_ASSERT_EQUAL(hang_state, AMDGPU_CTX_UNKNOWN_RESET);
4292d722e3fbSopenharmony_ci
4293d722e3fbSopenharmony_ci	close(fd);
4294d722e3fbSopenharmony_ci	r = amdgpu_cs_ctx_free(context_handle);
4295d722e3fbSopenharmony_ci	CU_ASSERT_EQUAL(r, 0);
4296d722e3fbSopenharmony_ci
4297d722e3fbSopenharmony_ci	amdgpu_compute_dispatch_test();
4298d722e3fbSopenharmony_ci	amdgpu_gfx_dispatch_test();
4299d722e3fbSopenharmony_ci}
4300d722e3fbSopenharmony_ci
4301d722e3fbSopenharmony_cistatic void amdgpu_stable_pstate_test(void)
4302d722e3fbSopenharmony_ci{
4303d722e3fbSopenharmony_ci	int r;
4304d722e3fbSopenharmony_ci	amdgpu_context_handle context_handle;
4305d722e3fbSopenharmony_ci	uint32_t current_pstate = 0, new_pstate = 0;
4306d722e3fbSopenharmony_ci
4307d722e3fbSopenharmony_ci	r = amdgpu_cs_ctx_create(device_handle, &context_handle);
4308d722e3fbSopenharmony_ci	CU_ASSERT_EQUAL(r, 0);
4309d722e3fbSopenharmony_ci
4310d722e3fbSopenharmony_ci	r = amdgpu_cs_ctx_stable_pstate(context_handle,
4311d722e3fbSopenharmony_ci					AMDGPU_CTX_OP_GET_STABLE_PSTATE,
4312d722e3fbSopenharmony_ci					0, &current_pstate);
4313d722e3fbSopenharmony_ci	CU_ASSERT_EQUAL(r, 0);
4314d722e3fbSopenharmony_ci	CU_ASSERT_EQUAL(new_pstate, AMDGPU_CTX_STABLE_PSTATE_NONE);
4315d722e3fbSopenharmony_ci
4316d722e3fbSopenharmony_ci	r = amdgpu_cs_ctx_stable_pstate(context_handle,
4317d722e3fbSopenharmony_ci					AMDGPU_CTX_OP_SET_STABLE_PSTATE,
4318d722e3fbSopenharmony_ci					AMDGPU_CTX_STABLE_PSTATE_PEAK, NULL);
4319d722e3fbSopenharmony_ci	CU_ASSERT_EQUAL(r, 0);
4320d722e3fbSopenharmony_ci
4321d722e3fbSopenharmony_ci	r = amdgpu_cs_ctx_stable_pstate(context_handle,
4322d722e3fbSopenharmony_ci					AMDGPU_CTX_OP_GET_STABLE_PSTATE,
4323d722e3fbSopenharmony_ci					0, &new_pstate);
4324d722e3fbSopenharmony_ci	CU_ASSERT_EQUAL(r, 0);
4325d722e3fbSopenharmony_ci	CU_ASSERT_EQUAL(new_pstate, AMDGPU_CTX_STABLE_PSTATE_PEAK);
4326d722e3fbSopenharmony_ci
4327d722e3fbSopenharmony_ci	r = amdgpu_cs_ctx_free(context_handle);
4328d722e3fbSopenharmony_ci	CU_ASSERT_EQUAL(r, 0);
4329d722e3fbSopenharmony_ci}
4330