1e5c31af7Sopenharmony_ci/*------------------------------------------------------------------------
2e5c31af7Sopenharmony_ci * OpenGL Conformance Tests
3e5c31af7Sopenharmony_ci * ------------------------
4e5c31af7Sopenharmony_ci *
5e5c31af7Sopenharmony_ci * Copyright (c) 2017-2019 The Khronos Group Inc.
6e5c31af7Sopenharmony_ci * Copyright (c) 2017 Codeplay Software Ltd.
7e5c31af7Sopenharmony_ci * Copyright (c) 2019 NVIDIA Corporation.
8e5c31af7Sopenharmony_ci *
9e5c31af7Sopenharmony_ci * Licensed under the Apache License, Version 2.0 (the "License");
10e5c31af7Sopenharmony_ci * you may not use this file except in compliance with the License.
11e5c31af7Sopenharmony_ci * You may obtain a copy of the License at
12e5c31af7Sopenharmony_ci *
13e5c31af7Sopenharmony_ci *      http://www.apache.org/licenses/LICENSE-2.0
14e5c31af7Sopenharmony_ci *
15e5c31af7Sopenharmony_ci * Unless required by applicable law or agreed to in writing, software
16e5c31af7Sopenharmony_ci * distributed under the License is distributed on an "AS IS" BASIS,
17e5c31af7Sopenharmony_ci * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
18e5c31af7Sopenharmony_ci * See the License for the specific language governing permissions and
19e5c31af7Sopenharmony_ci * limitations under the License.
20e5c31af7Sopenharmony_ci *
21e5c31af7Sopenharmony_ci */ /*!
22e5c31af7Sopenharmony_ci * \file
23e5c31af7Sopenharmony_ci * \brief Subgroups Tests
24e5c31af7Sopenharmony_ci */ /*--------------------------------------------------------------------*/
25e5c31af7Sopenharmony_ci
26e5c31af7Sopenharmony_ci#include "glcSubgroupsBallotBroadcastTests.hpp"
27e5c31af7Sopenharmony_ci#include "glcSubgroupsTestsUtils.hpp"
28e5c31af7Sopenharmony_ci
29e5c31af7Sopenharmony_ci#include <string>
30e5c31af7Sopenharmony_ci#include <vector>
31e5c31af7Sopenharmony_ci
32e5c31af7Sopenharmony_ciusing namespace tcu;
33e5c31af7Sopenharmony_ciusing namespace std;
34e5c31af7Sopenharmony_ci
35e5c31af7Sopenharmony_cinamespace glc
36e5c31af7Sopenharmony_ci{
37e5c31af7Sopenharmony_cinamespace subgroups
38e5c31af7Sopenharmony_ci{
39e5c31af7Sopenharmony_cinamespace
40e5c31af7Sopenharmony_ci{
/** Subgroup broadcast built-in exercised by a test case. */
enum OpType
{
	OPTYPE_BROADCAST,		//!< subgroupBroadcast
	OPTYPE_BROADCAST_FIRST,	//!< subgroupBroadcastFirst
	OPTYPE_LAST				//!< Number of operations; used as the loop bound when generating cases.
};
47e5c31af7Sopenharmony_ci
48e5c31af7Sopenharmony_cistatic bool checkVertexPipelineStages(std::vector<const void*> datas,
49e5c31af7Sopenharmony_ci									  deUint32 width, deUint32)
50e5c31af7Sopenharmony_ci{
51e5c31af7Sopenharmony_ci	return glc::subgroups::check(datas, width, 3);
52e5c31af7Sopenharmony_ci}
53e5c31af7Sopenharmony_ci
54e5c31af7Sopenharmony_cistatic bool checkComputeStages(std::vector<const void*> datas,
55e5c31af7Sopenharmony_ci						 const deUint32 numWorkgroups[3], const deUint32 localSize[3],
56e5c31af7Sopenharmony_ci						 deUint32)
57e5c31af7Sopenharmony_ci{
58e5c31af7Sopenharmony_ci	return glc::subgroups::checkCompute(datas, numWorkgroups, localSize, 3);
59e5c31af7Sopenharmony_ci}
60e5c31af7Sopenharmony_ci
61e5c31af7Sopenharmony_cistd::string getOpTypeName(int opType)
62e5c31af7Sopenharmony_ci{
63e5c31af7Sopenharmony_ci	switch (opType)
64e5c31af7Sopenharmony_ci	{
65e5c31af7Sopenharmony_ci		default:
66e5c31af7Sopenharmony_ci			DE_FATAL("Unsupported op type");
67e5c31af7Sopenharmony_ci			return "";
68e5c31af7Sopenharmony_ci		case OPTYPE_BROADCAST:
69e5c31af7Sopenharmony_ci			return "subgroupBroadcast";
70e5c31af7Sopenharmony_ci		case OPTYPE_BROADCAST_FIRST:
71e5c31af7Sopenharmony_ci			return "subgroupBroadcastFirst";
72e5c31af7Sopenharmony_ci	}
73e5c31af7Sopenharmony_ci}
74e5c31af7Sopenharmony_ci
75e5c31af7Sopenharmony_cistruct CaseDefinition
76e5c31af7Sopenharmony_ci{
77e5c31af7Sopenharmony_ci	int					opType;
78e5c31af7Sopenharmony_ci	ShaderStageFlags	shaderStage;
79e5c31af7Sopenharmony_ci	Format				format;
80e5c31af7Sopenharmony_ci};
81e5c31af7Sopenharmony_ci
82e5c31af7Sopenharmony_cistd::string getBodySource(CaseDefinition caseDef)
83e5c31af7Sopenharmony_ci{
84e5c31af7Sopenharmony_ci	std::ostringstream bdy;
85e5c31af7Sopenharmony_ci
86e5c31af7Sopenharmony_ci	bdy << "  uvec4 mask = subgroupBallot(true);\n";
87e5c31af7Sopenharmony_ci	bdy << "  uint tempResult = 0u;\n";
88e5c31af7Sopenharmony_ci
89e5c31af7Sopenharmony_ci	if (OPTYPE_BROADCAST == caseDef.opType)
90e5c31af7Sopenharmony_ci	{
91e5c31af7Sopenharmony_ci		bdy	<< "  tempResult = 0x3u;\n";
92e5c31af7Sopenharmony_ci		for (int i = 0; i < (int)subgroups::maxSupportedSubgroupSize(); i++)
93e5c31af7Sopenharmony_ci		{
94e5c31af7Sopenharmony_ci			bdy << "  {\n"
95e5c31af7Sopenharmony_ci			<< "    const uint id = "<< i << "u;\n"
96e5c31af7Sopenharmony_ci			<< "    " << subgroups::getFormatNameForGLSL(caseDef.format)
97e5c31af7Sopenharmony_ci			<< " op = subgroupBroadcast(data1[gl_SubgroupInvocationID], id);\n"
98e5c31af7Sopenharmony_ci			<< "    if ((id < gl_SubgroupSize) && subgroupBallotBitExtract(mask, id))\n"
99e5c31af7Sopenharmony_ci			<< "    {\n"
100e5c31af7Sopenharmony_ci			<< "      if (op != data1[id])\n"
101e5c31af7Sopenharmony_ci			<< "      {\n"
102e5c31af7Sopenharmony_ci			<< "        tempResult = 0u;\n"
103e5c31af7Sopenharmony_ci			<< "      }\n"
104e5c31af7Sopenharmony_ci			<< "    }\n"
105e5c31af7Sopenharmony_ci			<< "  }\n";
106e5c31af7Sopenharmony_ci		}
107e5c31af7Sopenharmony_ci	}
108e5c31af7Sopenharmony_ci	else
109e5c31af7Sopenharmony_ci	{
110e5c31af7Sopenharmony_ci		bdy	<< "  uint firstActive = 0u;\n"
111e5c31af7Sopenharmony_ci			<< "  for (uint i = 0u; i < gl_SubgroupSize; i++)\n"
112e5c31af7Sopenharmony_ci			<< "  {\n"
113e5c31af7Sopenharmony_ci			<< "    if (subgroupBallotBitExtract(mask, i))\n"
114e5c31af7Sopenharmony_ci			<< "    {\n"
115e5c31af7Sopenharmony_ci			<< "      firstActive = i;\n"
116e5c31af7Sopenharmony_ci			<< "      break;\n"
117e5c31af7Sopenharmony_ci			<< "    }\n"
118e5c31af7Sopenharmony_ci			<< "  }\n"
119e5c31af7Sopenharmony_ci			<< "  tempResult |= (subgroupBroadcastFirst(data1[gl_SubgroupInvocationID]) == data1[firstActive]) ? 0x1u : 0u;\n"
120e5c31af7Sopenharmony_ci			<< "  // make the firstActive invocation inactive now\n"
121e5c31af7Sopenharmony_ci			<< "  if (firstActive == gl_SubgroupInvocationID)\n"
122e5c31af7Sopenharmony_ci			<< "  {\n"
123e5c31af7Sopenharmony_ci			<< "    for (uint i = 0u; i < gl_SubgroupSize; i++)\n"
124e5c31af7Sopenharmony_ci			<< "    {\n"
125e5c31af7Sopenharmony_ci			<< "      if (subgroupBallotBitExtract(mask, i))\n"
126e5c31af7Sopenharmony_ci			<< "      {\n"
127e5c31af7Sopenharmony_ci			<< "        firstActive = i;\n"
128e5c31af7Sopenharmony_ci			<< "        break;\n"
129e5c31af7Sopenharmony_ci			<< "      }\n"
130e5c31af7Sopenharmony_ci			<< "    }\n"
131e5c31af7Sopenharmony_ci			<< "    tempResult |= (subgroupBroadcastFirst(data1[gl_SubgroupInvocationID]) == data1[firstActive]) ? 0x2u : 0u;\n"
132e5c31af7Sopenharmony_ci			<< "  }\n"
133e5c31af7Sopenharmony_ci			<< "  else\n"
134e5c31af7Sopenharmony_ci			<< "  {\n"
135e5c31af7Sopenharmony_ci			<< "    // the firstActive invocation didn't partake in the second result so set it to true\n"
136e5c31af7Sopenharmony_ci			<< "    tempResult |= 0x2u;\n"
137e5c31af7Sopenharmony_ci			<< "  }\n";
138e5c31af7Sopenharmony_ci	}
139e5c31af7Sopenharmony_ci   return bdy.str();
140e5c31af7Sopenharmony_ci}
141e5c31af7Sopenharmony_ci
142e5c31af7Sopenharmony_civoid initFrameBufferPrograms(SourceCollections& programCollection, CaseDefinition caseDef)
143e5c31af7Sopenharmony_ci{
144e5c31af7Sopenharmony_ci	subgroups::setFragmentShaderFrameBuffer(programCollection);
145e5c31af7Sopenharmony_ci
146e5c31af7Sopenharmony_ci	if (SHADER_STAGE_VERTEX_BIT != caseDef.shaderStage)
147e5c31af7Sopenharmony_ci		subgroups::setVertexShaderFrameBuffer(programCollection);
148e5c31af7Sopenharmony_ci
149e5c31af7Sopenharmony_ci	std::string bdyStr = getBodySource(caseDef);
150e5c31af7Sopenharmony_ci
151e5c31af7Sopenharmony_ci	if (SHADER_STAGE_VERTEX_BIT == caseDef.shaderStage)
152e5c31af7Sopenharmony_ci	{
153e5c31af7Sopenharmony_ci		std::ostringstream				vertex;
154e5c31af7Sopenharmony_ci		vertex << "${VERSION_DECL}\n"
155e5c31af7Sopenharmony_ci			<< "#extension GL_KHR_shader_subgroup_ballot: enable\n"
156e5c31af7Sopenharmony_ci			<< "layout(location = 0) in highp vec4 in_position;\n"
157e5c31af7Sopenharmony_ci			<< "layout(location = 0) out float out_color;\n"
158e5c31af7Sopenharmony_ci			<< "layout(binding = 0, std140) uniform Buffer0\n"
159e5c31af7Sopenharmony_ci			<< "{\n"
160e5c31af7Sopenharmony_ci			<< "  " << subgroups::getFormatNameForGLSL(caseDef.format) << " data1[" << subgroups::maxSupportedSubgroupSize() << "];\n"
161e5c31af7Sopenharmony_ci			<< "};\n"
162e5c31af7Sopenharmony_ci			<< "\n"
163e5c31af7Sopenharmony_ci			<< "void main (void)\n"
164e5c31af7Sopenharmony_ci			<< "{\n"
165e5c31af7Sopenharmony_ci			<< bdyStr
166e5c31af7Sopenharmony_ci			<< "  out_color = float(tempResult);\n"
167e5c31af7Sopenharmony_ci			<< "  gl_Position = in_position;\n"
168e5c31af7Sopenharmony_ci			<< "  gl_PointSize = 1.0f;\n"
169e5c31af7Sopenharmony_ci			<< "}\n";
170e5c31af7Sopenharmony_ci		programCollection.add("vert") << glu::VertexSource(vertex.str());
171e5c31af7Sopenharmony_ci	}
172e5c31af7Sopenharmony_ci	else if (SHADER_STAGE_GEOMETRY_BIT == caseDef.shaderStage)
173e5c31af7Sopenharmony_ci	{
174e5c31af7Sopenharmony_ci		std::ostringstream geometry;
175e5c31af7Sopenharmony_ci
176e5c31af7Sopenharmony_ci		geometry << "${VERSION_DECL}\n"
177e5c31af7Sopenharmony_ci			<< "#extension GL_KHR_shader_subgroup_ballot: enable\n"
178e5c31af7Sopenharmony_ci			<< "layout(points) in;\n"
179e5c31af7Sopenharmony_ci			<< "layout(points, max_vertices = 1) out;\n"
180e5c31af7Sopenharmony_ci			<< "layout(location = 0) out float out_color;\n"
181e5c31af7Sopenharmony_ci			<< "layout(binding = 0, std140) uniform Buffer0\n"
182e5c31af7Sopenharmony_ci			<< "{\n"
183e5c31af7Sopenharmony_ci			<< "  " << subgroups::getFormatNameForGLSL(caseDef.format) << " data1[" <<subgroups::maxSupportedSubgroupSize() << "];\n"
184e5c31af7Sopenharmony_ci			<< "};\n"
185e5c31af7Sopenharmony_ci			<< "\n"
186e5c31af7Sopenharmony_ci			<< "void main (void)\n"
187e5c31af7Sopenharmony_ci			<< "{\n"
188e5c31af7Sopenharmony_ci			<< bdyStr
189e5c31af7Sopenharmony_ci			<< "  out_color = float(tempResult);\n"
190e5c31af7Sopenharmony_ci			<< "  gl_Position = gl_in[0].gl_Position;\n"
191e5c31af7Sopenharmony_ci			<< "  EmitVertex();\n"
192e5c31af7Sopenharmony_ci			<< "  EndPrimitive();\n"
193e5c31af7Sopenharmony_ci			<< "}\n";
194e5c31af7Sopenharmony_ci
195e5c31af7Sopenharmony_ci		programCollection.add("geometry") << glu::GeometrySource(geometry.str());
196e5c31af7Sopenharmony_ci	}
197e5c31af7Sopenharmony_ci	else if (SHADER_STAGE_TESS_CONTROL_BIT == caseDef.shaderStage)
198e5c31af7Sopenharmony_ci	{
199e5c31af7Sopenharmony_ci		std::ostringstream controlSource;
200e5c31af7Sopenharmony_ci
201e5c31af7Sopenharmony_ci		controlSource << "${VERSION_DECL}\n"
202e5c31af7Sopenharmony_ci			<< "#extension GL_KHR_shader_subgroup_ballot: enable\n"
203e5c31af7Sopenharmony_ci			<< "layout(vertices = 2) out;\n"
204e5c31af7Sopenharmony_ci			<< "layout(location = 0) out float out_color[];\n"
205e5c31af7Sopenharmony_ci			<< "layout(binding = 0, std140) uniform Buffer0\n"
206e5c31af7Sopenharmony_ci			<< "{\n"
207e5c31af7Sopenharmony_ci			<< "  " << subgroups::getFormatNameForGLSL(caseDef.format) << " data1[" <<subgroups::maxSupportedSubgroupSize() << "];\n"
208e5c31af7Sopenharmony_ci			<< "};\n"
209e5c31af7Sopenharmony_ci			<< "\n"
210e5c31af7Sopenharmony_ci			<< "void main (void)\n"
211e5c31af7Sopenharmony_ci			<< "{\n"
212e5c31af7Sopenharmony_ci			<< "  if (gl_InvocationID == 0)\n"
213e5c31af7Sopenharmony_ci			<< "  {\n"
214e5c31af7Sopenharmony_ci			<< "    gl_TessLevelOuter[0] = 1.0f;\n"
215e5c31af7Sopenharmony_ci			<< "    gl_TessLevelOuter[1] = 1.0f;\n"
216e5c31af7Sopenharmony_ci			<< "  }\n"
217e5c31af7Sopenharmony_ci			<< bdyStr
218e5c31af7Sopenharmony_ci			<< "  out_color[gl_InvocationID ] = float(tempResult);\n"
219e5c31af7Sopenharmony_ci			<< "  gl_out[gl_InvocationID].gl_Position = gl_in[gl_InvocationID].gl_Position;\n"
220e5c31af7Sopenharmony_ci			<< "}\n";
221e5c31af7Sopenharmony_ci
222e5c31af7Sopenharmony_ci		programCollection.add("tesc") << glu::TessellationControlSource(controlSource.str());
223e5c31af7Sopenharmony_ci		subgroups::setTesEvalShaderFrameBuffer(programCollection);
224e5c31af7Sopenharmony_ci	}
225e5c31af7Sopenharmony_ci	else if (SHADER_STAGE_TESS_EVALUATION_BIT == caseDef.shaderStage)
226e5c31af7Sopenharmony_ci	{
227e5c31af7Sopenharmony_ci		std::ostringstream evaluationSource;
228e5c31af7Sopenharmony_ci		evaluationSource << "${VERSION_DECL}\n"
229e5c31af7Sopenharmony_ci			<< "#extension GL_KHR_shader_subgroup_ballot: enable\n"
230e5c31af7Sopenharmony_ci			<< "layout(isolines, equal_spacing, ccw ) in;\n"
231e5c31af7Sopenharmony_ci			<< "layout(location = 0) out float out_color;\n"
232e5c31af7Sopenharmony_ci			<< "layout(binding = 0, std140) uniform Buffer0\n"
233e5c31af7Sopenharmony_ci			<< "{\n"
234e5c31af7Sopenharmony_ci			<< "  " << subgroups::getFormatNameForGLSL(caseDef.format) << " data1[" <<subgroups::maxSupportedSubgroupSize() << "];\n"
235e5c31af7Sopenharmony_ci			<< "};\n"
236e5c31af7Sopenharmony_ci			<< "\n"
237e5c31af7Sopenharmony_ci			<< "void main (void)\n"
238e5c31af7Sopenharmony_ci			<< "{\n"
239e5c31af7Sopenharmony_ci			<< bdyStr
240e5c31af7Sopenharmony_ci			<< "  out_color  = float(tempResult);\n"
241e5c31af7Sopenharmony_ci			<< "  gl_Position = mix(gl_in[0].gl_Position, gl_in[1].gl_Position, gl_TessCoord.x);\n"
242e5c31af7Sopenharmony_ci			<< "}\n";
243e5c31af7Sopenharmony_ci
244e5c31af7Sopenharmony_ci		subgroups::setTesCtrlShaderFrameBuffer(programCollection);
245e5c31af7Sopenharmony_ci		programCollection.add("tese") << glu::TessellationEvaluationSource(evaluationSource.str());
246e5c31af7Sopenharmony_ci	}
247e5c31af7Sopenharmony_ci	else
248e5c31af7Sopenharmony_ci	{
249e5c31af7Sopenharmony_ci		DE_FATAL("Unsupported shader stage");
250e5c31af7Sopenharmony_ci	}
251e5c31af7Sopenharmony_ci}
252e5c31af7Sopenharmony_ci
253e5c31af7Sopenharmony_civoid initPrograms(SourceCollections& programCollection, CaseDefinition caseDef)
254e5c31af7Sopenharmony_ci{
255e5c31af7Sopenharmony_ci	std::string bdyStr = getBodySource(caseDef);
256e5c31af7Sopenharmony_ci
257e5c31af7Sopenharmony_ci	if (SHADER_STAGE_COMPUTE_BIT == caseDef.shaderStage)
258e5c31af7Sopenharmony_ci	{
259e5c31af7Sopenharmony_ci		std::ostringstream src;
260e5c31af7Sopenharmony_ci
261e5c31af7Sopenharmony_ci		src << "${VERSION_DECL}\n"
262e5c31af7Sopenharmony_ci			<< "#extension GL_KHR_shader_subgroup_ballot: enable\n"
263e5c31af7Sopenharmony_ci			<< "layout (${LOCAL_SIZE_X}, ${LOCAL_SIZE_Y}, ${LOCAL_SIZE_Z}) in;\n"
264e5c31af7Sopenharmony_ci			<< "layout(binding = 0, std430) buffer Buffer0\n"
265e5c31af7Sopenharmony_ci			<< "{\n"
266e5c31af7Sopenharmony_ci			<< "  uint result[];\n"
267e5c31af7Sopenharmony_ci			<< "};\n"
268e5c31af7Sopenharmony_ci			<< "layout(binding = 1, std430) buffer Buffer1\n"
269e5c31af7Sopenharmony_ci			<< "{\n"
270e5c31af7Sopenharmony_ci			<< "  " << subgroups::getFormatNameForGLSL(caseDef.format) << " data1[];\n"
271e5c31af7Sopenharmony_ci			<< "};\n"
272e5c31af7Sopenharmony_ci			<< "\n"
273e5c31af7Sopenharmony_ci			<< "void main (void)\n"
274e5c31af7Sopenharmony_ci			<< "{\n"
275e5c31af7Sopenharmony_ci			<< "  uvec3 globalSize = gl_NumWorkGroups * gl_WorkGroupSize;\n"
276e5c31af7Sopenharmony_ci			<< "  highp uint offset = globalSize.x * ((globalSize.y * "
277e5c31af7Sopenharmony_ci			"gl_GlobalInvocationID.z) + gl_GlobalInvocationID.y) + "
278e5c31af7Sopenharmony_ci			"gl_GlobalInvocationID.x;\n"
279e5c31af7Sopenharmony_ci			<< bdyStr
280e5c31af7Sopenharmony_ci			<< "  result[offset] = tempResult;\n"
281e5c31af7Sopenharmony_ci			<< "}\n";
282e5c31af7Sopenharmony_ci
283e5c31af7Sopenharmony_ci		programCollection.add("comp") << glu::ComputeSource(src.str());
284e5c31af7Sopenharmony_ci	}
285e5c31af7Sopenharmony_ci	else
286e5c31af7Sopenharmony_ci	{
287e5c31af7Sopenharmony_ci		const string vertex =
288e5c31af7Sopenharmony_ci			"${VERSION_DECL}\n"
289e5c31af7Sopenharmony_ci			"#extension GL_KHR_shader_subgroup_ballot: enable\n"
290e5c31af7Sopenharmony_ci			"layout(binding = 0, std430) buffer Buffer0\n"
291e5c31af7Sopenharmony_ci			"{\n"
292e5c31af7Sopenharmony_ci			"  uint result[];\n"
293e5c31af7Sopenharmony_ci			"} b0;\n"
294e5c31af7Sopenharmony_ci			"layout(binding = 4, std430) readonly buffer Buffer4\n"
295e5c31af7Sopenharmony_ci			"{\n"
296e5c31af7Sopenharmony_ci			"  " + subgroups::getFormatNameForGLSL(caseDef.format) + " data1[];\n"
297e5c31af7Sopenharmony_ci			"};\n"
298e5c31af7Sopenharmony_ci			"\n"
299e5c31af7Sopenharmony_ci			"void main (void)\n"
300e5c31af7Sopenharmony_ci			"{\n"
301e5c31af7Sopenharmony_ci			+ bdyStr +
302e5c31af7Sopenharmony_ci			"  b0.result[gl_VertexID] = tempResult;\n"
303e5c31af7Sopenharmony_ci			"  float pixelSize = 2.0f/1024.0f;\n"
304e5c31af7Sopenharmony_ci			"  float pixelPosition = pixelSize/2.0f - 1.0f;\n"
305e5c31af7Sopenharmony_ci			"  gl_Position = vec4(float(gl_VertexID) * pixelSize + pixelPosition, 0.0f, 0.0f, 1.0f);\n"
306e5c31af7Sopenharmony_ci			"  gl_PointSize = 1.0f;\n"
307e5c31af7Sopenharmony_ci			"}\n";
308e5c31af7Sopenharmony_ci
309e5c31af7Sopenharmony_ci		const string tesc =
310e5c31af7Sopenharmony_ci			"${VERSION_DECL}\n"
311e5c31af7Sopenharmony_ci			"#extension GL_KHR_shader_subgroup_ballot: enable\n"
312e5c31af7Sopenharmony_ci			"layout(vertices=1) out;\n"
313e5c31af7Sopenharmony_ci			"layout(binding = 1, std430) buffer Buffer1\n"
314e5c31af7Sopenharmony_ci			"{\n"
315e5c31af7Sopenharmony_ci			"  uint result[];\n"
316e5c31af7Sopenharmony_ci			"} b1;\n"
317e5c31af7Sopenharmony_ci			"layout(binding = 4, std430) readonly buffer Buffer4\n"
318e5c31af7Sopenharmony_ci			"{\n"
319e5c31af7Sopenharmony_ci			"  " + subgroups::getFormatNameForGLSL(caseDef.format) + " data1[];\n"
320e5c31af7Sopenharmony_ci			"};\n"
321e5c31af7Sopenharmony_ci			"\n"
322e5c31af7Sopenharmony_ci			"void main (void)\n"
323e5c31af7Sopenharmony_ci			"{\n"
324e5c31af7Sopenharmony_ci			+ bdyStr +
325e5c31af7Sopenharmony_ci			"  b1.result[gl_PrimitiveID] = tempResult;\n"
326e5c31af7Sopenharmony_ci			"  if (gl_InvocationID == 0)\n"
327e5c31af7Sopenharmony_ci			"  {\n"
328e5c31af7Sopenharmony_ci			"    gl_TessLevelOuter[0] = 1.0f;\n"
329e5c31af7Sopenharmony_ci			"    gl_TessLevelOuter[1] = 1.0f;\n"
330e5c31af7Sopenharmony_ci			"  }\n"
331e5c31af7Sopenharmony_ci			"  gl_out[gl_InvocationID].gl_Position = gl_in[gl_InvocationID].gl_Position;\n"
332e5c31af7Sopenharmony_ci			"}\n";
333e5c31af7Sopenharmony_ci
334e5c31af7Sopenharmony_ci		const string tese =
335e5c31af7Sopenharmony_ci			"${VERSION_DECL}\n"
336e5c31af7Sopenharmony_ci			"#extension GL_KHR_shader_subgroup_ballot: enable\n"
337e5c31af7Sopenharmony_ci			"layout(isolines) in;\n"
338e5c31af7Sopenharmony_ci			"layout(binding = 2, std430) buffer Buffer2\n"
339e5c31af7Sopenharmony_ci			"{\n"
340e5c31af7Sopenharmony_ci			"  uint result[];\n"
341e5c31af7Sopenharmony_ci			"} b2;\n"
342e5c31af7Sopenharmony_ci			"layout(binding = 4, std430) readonly buffer Buffer4\n"
343e5c31af7Sopenharmony_ci			"{\n"
344e5c31af7Sopenharmony_ci			"  " + subgroups::getFormatNameForGLSL(caseDef.format) + " data1[];\n"
345e5c31af7Sopenharmony_ci			"};\n"
346e5c31af7Sopenharmony_ci			"\n"
347e5c31af7Sopenharmony_ci			"void main (void)\n"
348e5c31af7Sopenharmony_ci			"{\n"
349e5c31af7Sopenharmony_ci			+ bdyStr +
350e5c31af7Sopenharmony_ci			"  b2.result[gl_PrimitiveID * 2 + int(gl_TessCoord.x + 0.5)] = tempResult;\n"
351e5c31af7Sopenharmony_ci			"  float pixelSize = 2.0f/1024.0f;\n"
352e5c31af7Sopenharmony_ci			"  gl_Position = gl_in[0].gl_Position + gl_TessCoord.x * pixelSize / 2.0f;\n"
353e5c31af7Sopenharmony_ci			"}\n";
354e5c31af7Sopenharmony_ci
355e5c31af7Sopenharmony_ci		const string geometry =
356e5c31af7Sopenharmony_ci			//version string added by addGeometryShadersFromTemplate
357e5c31af7Sopenharmony_ci			"#extension GL_KHR_shader_subgroup_ballot: enable\n"
358e5c31af7Sopenharmony_ci			"layout(${TOPOLOGY}) in;\n"
359e5c31af7Sopenharmony_ci			"layout(points, max_vertices = 1) out;\n"
360e5c31af7Sopenharmony_ci			"layout(binding = 3, std430) buffer Buffer3\n"
361e5c31af7Sopenharmony_ci			"{\n"
362e5c31af7Sopenharmony_ci			"  uint result[];\n"
363e5c31af7Sopenharmony_ci			"} b3;\n"
364e5c31af7Sopenharmony_ci			"layout(binding = 4, std430) readonly buffer Buffer4\n"
365e5c31af7Sopenharmony_ci			"{\n"
366e5c31af7Sopenharmony_ci			"  " + subgroups::getFormatNameForGLSL(caseDef.format) + " data1[];\n"
367e5c31af7Sopenharmony_ci			"};\n"
368e5c31af7Sopenharmony_ci			"\n"
369e5c31af7Sopenharmony_ci			"void main (void)\n"
370e5c31af7Sopenharmony_ci			"{\n"
371e5c31af7Sopenharmony_ci			+ bdyStr +
372e5c31af7Sopenharmony_ci			"  b3.result[gl_PrimitiveIDIn] = tempResult;\n"
373e5c31af7Sopenharmony_ci			"  gl_Position = gl_in[0].gl_Position;\n"
374e5c31af7Sopenharmony_ci			"  EmitVertex();\n"
375e5c31af7Sopenharmony_ci			"  EndPrimitive();\n"
376e5c31af7Sopenharmony_ci			"}\n";
377e5c31af7Sopenharmony_ci
378e5c31af7Sopenharmony_ci		const string fragment =
379e5c31af7Sopenharmony_ci			"${VERSION_DECL}\n"
380e5c31af7Sopenharmony_ci			"#extension GL_KHR_shader_subgroup_ballot: enable\n"
381e5c31af7Sopenharmony_ci			"precision highp int;\n"
382e5c31af7Sopenharmony_ci			"precision highp float;\n"
383e5c31af7Sopenharmony_ci			"layout(location = 0) out uint result;\n"
384e5c31af7Sopenharmony_ci			"layout(binding = 4, std430) readonly buffer Buffer4\n"
385e5c31af7Sopenharmony_ci			"{\n"
386e5c31af7Sopenharmony_ci			"  " + subgroups::getFormatNameForGLSL(caseDef.format) + " data1[];\n"
387e5c31af7Sopenharmony_ci			"};\n"
388e5c31af7Sopenharmony_ci			"void main (void)\n"
389e5c31af7Sopenharmony_ci			"{\n"
390e5c31af7Sopenharmony_ci			+ bdyStr +
391e5c31af7Sopenharmony_ci			"  result = tempResult;\n"
392e5c31af7Sopenharmony_ci			"}\n";
393e5c31af7Sopenharmony_ci
394e5c31af7Sopenharmony_ci		subgroups::addNoSubgroupShader(programCollection);
395e5c31af7Sopenharmony_ci
396e5c31af7Sopenharmony_ci		programCollection.add("vert") << glu::VertexSource(vertex);
397e5c31af7Sopenharmony_ci		programCollection.add("tesc") << glu::TessellationControlSource(tesc);
398e5c31af7Sopenharmony_ci		programCollection.add("tese") << glu::TessellationEvaluationSource(tese);
399e5c31af7Sopenharmony_ci		subgroups::addGeometryShadersFromTemplate(geometry, programCollection);
400e5c31af7Sopenharmony_ci		programCollection.add("fragment") << glu::FragmentSource(fragment);
401e5c31af7Sopenharmony_ci	}
402e5c31af7Sopenharmony_ci}
403e5c31af7Sopenharmony_ci
404e5c31af7Sopenharmony_civoid supportedCheck (Context& context, CaseDefinition caseDef)
405e5c31af7Sopenharmony_ci{
406e5c31af7Sopenharmony_ci	if (!subgroups::isSubgroupSupported(context))
407e5c31af7Sopenharmony_ci		TCU_THROW(NotSupportedError, "Subgroup operations are not supported");
408e5c31af7Sopenharmony_ci
409e5c31af7Sopenharmony_ci	if (!subgroups::isSubgroupFeatureSupportedForDevice(context, SUBGROUP_FEATURE_BALLOT_BIT))
410e5c31af7Sopenharmony_ci	{
411e5c31af7Sopenharmony_ci		TCU_THROW(NotSupportedError, "Device does not support subgroup ballot operations");
412e5c31af7Sopenharmony_ci	}
413e5c31af7Sopenharmony_ci
414e5c31af7Sopenharmony_ci	if (subgroups::isDoubleFormat(caseDef.format) &&
415e5c31af7Sopenharmony_ci		!subgroups::isDoubleSupportedForDevice(context))
416e5c31af7Sopenharmony_ci	{
417e5c31af7Sopenharmony_ci		TCU_THROW(NotSupportedError, "Device does not support subgroup double operations");
418e5c31af7Sopenharmony_ci	}
419e5c31af7Sopenharmony_ci}
420e5c31af7Sopenharmony_ci
421e5c31af7Sopenharmony_citcu::TestStatus noSSBOtest (Context& context, const CaseDefinition caseDef)
422e5c31af7Sopenharmony_ci{
423e5c31af7Sopenharmony_ci	if (!subgroups::areSubgroupOperationsSupportedForStage(
424e5c31af7Sopenharmony_ci			context, caseDef.shaderStage))
425e5c31af7Sopenharmony_ci	{
426e5c31af7Sopenharmony_ci		if (subgroups::areSubgroupOperationsRequiredForStage(caseDef.shaderStage))
427e5c31af7Sopenharmony_ci		{
428e5c31af7Sopenharmony_ci			return tcu::TestStatus::fail(
429e5c31af7Sopenharmony_ci					   "Shader stage " +
430e5c31af7Sopenharmony_ci					   subgroups::getShaderStageName(caseDef.shaderStage) +
431e5c31af7Sopenharmony_ci					   " is required to support subgroup operations!");
432e5c31af7Sopenharmony_ci		}
433e5c31af7Sopenharmony_ci		else
434e5c31af7Sopenharmony_ci		{
435e5c31af7Sopenharmony_ci			TCU_THROW(NotSupportedError, "Device does not support subgroup operations for this stage");
436e5c31af7Sopenharmony_ci		}
437e5c31af7Sopenharmony_ci	}
438e5c31af7Sopenharmony_ci
439e5c31af7Sopenharmony_ci	subgroups::SSBOData inputData[1];
440e5c31af7Sopenharmony_ci	inputData[0].format = caseDef.format;
441e5c31af7Sopenharmony_ci	inputData[0].layout = subgroups::SSBOData::LayoutStd140;
442e5c31af7Sopenharmony_ci	inputData[0].numElements = subgroups::maxSupportedSubgroupSize();
443e5c31af7Sopenharmony_ci	inputData[0].initializeType = subgroups::SSBOData::InitializeNonZero;
444e5c31af7Sopenharmony_ci
445e5c31af7Sopenharmony_ci	if (SHADER_STAGE_VERTEX_BIT == caseDef.shaderStage)
446e5c31af7Sopenharmony_ci		return subgroups::makeVertexFrameBufferTest(context, FORMAT_R32_UINT, inputData, 1, checkVertexPipelineStages);
447e5c31af7Sopenharmony_ci	else if (SHADER_STAGE_GEOMETRY_BIT == caseDef.shaderStage)
448e5c31af7Sopenharmony_ci		return subgroups::makeGeometryFrameBufferTest(context, FORMAT_R32_UINT, inputData, 1, checkVertexPipelineStages);
449e5c31af7Sopenharmony_ci	else if (SHADER_STAGE_TESS_CONTROL_BIT == caseDef.shaderStage)
450e5c31af7Sopenharmony_ci		return subgroups::makeTessellationEvaluationFrameBufferTest(context, FORMAT_R32_UINT, inputData, 1, checkVertexPipelineStages, SHADER_STAGE_TESS_CONTROL_BIT);
451e5c31af7Sopenharmony_ci	else if (SHADER_STAGE_TESS_EVALUATION_BIT == caseDef.shaderStage)
452e5c31af7Sopenharmony_ci		return subgroups::makeTessellationEvaluationFrameBufferTest(context, FORMAT_R32_UINT, inputData, 1, checkVertexPipelineStages, SHADER_STAGE_TESS_EVALUATION_BIT);
453e5c31af7Sopenharmony_ci	else
454e5c31af7Sopenharmony_ci		TCU_THROW(InternalError, "Unhandled shader stage");
455e5c31af7Sopenharmony_ci}
456e5c31af7Sopenharmony_ci
457e5c31af7Sopenharmony_ci
458e5c31af7Sopenharmony_citcu::TestStatus test(Context& context, const CaseDefinition caseDef)
459e5c31af7Sopenharmony_ci{
460e5c31af7Sopenharmony_ci	if (SHADER_STAGE_COMPUTE_BIT == caseDef.shaderStage)
461e5c31af7Sopenharmony_ci	{
462e5c31af7Sopenharmony_ci		if (!subgroups::areSubgroupOperationsSupportedForStage(context, caseDef.shaderStage))
463e5c31af7Sopenharmony_ci		{
464e5c31af7Sopenharmony_ci			if (subgroups::areSubgroupOperationsRequiredForStage(caseDef.shaderStage))
465e5c31af7Sopenharmony_ci			{
466e5c31af7Sopenharmony_ci				return tcu::TestStatus::fail(
467e5c31af7Sopenharmony_ci						   "Shader stage " +
468e5c31af7Sopenharmony_ci						   subgroups::getShaderStageName(caseDef.shaderStage) +
469e5c31af7Sopenharmony_ci						   " is required to support subgroup operations!");
470e5c31af7Sopenharmony_ci			}
471e5c31af7Sopenharmony_ci			else
472e5c31af7Sopenharmony_ci			{
473e5c31af7Sopenharmony_ci				TCU_THROW(NotSupportedError, "Device does not support subgroup operations for this stage");
474e5c31af7Sopenharmony_ci			}
475e5c31af7Sopenharmony_ci		}
476e5c31af7Sopenharmony_ci		subgroups::SSBOData inputData[1];
477e5c31af7Sopenharmony_ci		inputData[0].format = caseDef.format;
478e5c31af7Sopenharmony_ci		inputData[0].layout = subgroups::SSBOData::LayoutStd430;
479e5c31af7Sopenharmony_ci		inputData[0].numElements = subgroups::maxSupportedSubgroupSize();
480e5c31af7Sopenharmony_ci		inputData[0].initializeType = subgroups::SSBOData::InitializeNonZero;
481e5c31af7Sopenharmony_ci		inputData[0].binding = 1u;
482e5c31af7Sopenharmony_ci
483e5c31af7Sopenharmony_ci		return subgroups::makeComputeTest(context, FORMAT_R32_UINT, inputData, 1, checkComputeStages);
484e5c31af7Sopenharmony_ci	}
485e5c31af7Sopenharmony_ci	else
486e5c31af7Sopenharmony_ci	{
487e5c31af7Sopenharmony_ci		int supportedStages = context.getDeqpContext().getContextInfo().getInt(GL_SUBGROUP_SUPPORTED_STAGES_KHR);
488e5c31af7Sopenharmony_ci
489e5c31af7Sopenharmony_ci		ShaderStageFlags stages = (ShaderStageFlags)(caseDef.shaderStage & supportedStages);
490e5c31af7Sopenharmony_ci
491e5c31af7Sopenharmony_ci		if ( SHADER_STAGE_FRAGMENT_BIT != stages && !subgroups::isVertexSSBOSupportedForDevice(context))
492e5c31af7Sopenharmony_ci		{
493e5c31af7Sopenharmony_ci			if ( (stages & SHADER_STAGE_FRAGMENT_BIT) == 0)
494e5c31af7Sopenharmony_ci				TCU_THROW(NotSupportedError, "Device does not support vertex stage SSBO writes");
495e5c31af7Sopenharmony_ci			else
496e5c31af7Sopenharmony_ci				stages = SHADER_STAGE_FRAGMENT_BIT;
497e5c31af7Sopenharmony_ci		}
498e5c31af7Sopenharmony_ci
499e5c31af7Sopenharmony_ci		if ((ShaderStageFlags)0u == stages)
500e5c31af7Sopenharmony_ci			TCU_THROW(NotSupportedError, "Subgroup operations are not supported for any graphic shader");
501e5c31af7Sopenharmony_ci
502e5c31af7Sopenharmony_ci		subgroups::SSBOData inputData;
503e5c31af7Sopenharmony_ci		inputData.format			= caseDef.format;
504e5c31af7Sopenharmony_ci		inputData.layout			= subgroups::SSBOData::LayoutStd430;
505e5c31af7Sopenharmony_ci		inputData.numElements		= subgroups::maxSupportedSubgroupSize();
506e5c31af7Sopenharmony_ci		inputData.initializeType	= subgroups::SSBOData::InitializeNonZero;
507e5c31af7Sopenharmony_ci		inputData.binding			= 4u;
508e5c31af7Sopenharmony_ci		inputData.stages			= stages;
509e5c31af7Sopenharmony_ci
510e5c31af7Sopenharmony_ci		return subgroups::allStages(context, FORMAT_R32_UINT, &inputData, 1, checkVertexPipelineStages, stages);
511e5c31af7Sopenharmony_ci	}
512e5c31af7Sopenharmony_ci}
513e5c31af7Sopenharmony_ci}
514e5c31af7Sopenharmony_ci
515e5c31af7Sopenharmony_cideqp::TestCaseGroup* createSubgroupsBallotBroadcastTests(deqp::Context& testCtx)
516e5c31af7Sopenharmony_ci{
517e5c31af7Sopenharmony_ci	de::MovePtr<deqp::TestCaseGroup> graphicGroup(new deqp::TestCaseGroup(
518e5c31af7Sopenharmony_ci		testCtx, "graphics", "Subgroup ballot broadcast category tests: graphics"));
519e5c31af7Sopenharmony_ci	de::MovePtr<deqp::TestCaseGroup> computeGroup(new deqp::TestCaseGroup(
520e5c31af7Sopenharmony_ci		testCtx, "compute", "Subgroup ballot broadcast category tests: compute"));
521e5c31af7Sopenharmony_ci	de::MovePtr<deqp::TestCaseGroup> framebufferGroup(new deqp::TestCaseGroup(
522e5c31af7Sopenharmony_ci		testCtx, "framebuffer", "Subgroup ballot broadcast category tests: framebuffer"));
523e5c31af7Sopenharmony_ci
524e5c31af7Sopenharmony_ci	const ShaderStageFlags stages[] =
525e5c31af7Sopenharmony_ci	{
526e5c31af7Sopenharmony_ci		SHADER_STAGE_VERTEX_BIT,
527e5c31af7Sopenharmony_ci		SHADER_STAGE_TESS_EVALUATION_BIT,
528e5c31af7Sopenharmony_ci		SHADER_STAGE_TESS_CONTROL_BIT,
529e5c31af7Sopenharmony_ci		SHADER_STAGE_GEOMETRY_BIT,
530e5c31af7Sopenharmony_ci	};
531e5c31af7Sopenharmony_ci
532e5c31af7Sopenharmony_ci	const Format formats[] =
533e5c31af7Sopenharmony_ci	{
534e5c31af7Sopenharmony_ci		FORMAT_R32_SINT, FORMAT_R32G32_SINT, FORMAT_R32G32B32_SINT,
535e5c31af7Sopenharmony_ci		FORMAT_R32G32B32A32_SINT, FORMAT_R32_UINT, FORMAT_R32G32_UINT,
536e5c31af7Sopenharmony_ci		FORMAT_R32G32B32_UINT, FORMAT_R32G32B32A32_UINT,
537e5c31af7Sopenharmony_ci		FORMAT_R32_SFLOAT, FORMAT_R32G32_SFLOAT,
538e5c31af7Sopenharmony_ci		FORMAT_R32G32B32_SFLOAT, FORMAT_R32G32B32A32_SFLOAT,
539e5c31af7Sopenharmony_ci		FORMAT_R64_SFLOAT, FORMAT_R64G64_SFLOAT,
540e5c31af7Sopenharmony_ci		FORMAT_R64G64B64_SFLOAT, FORMAT_R64G64B64A64_SFLOAT,
541e5c31af7Sopenharmony_ci		FORMAT_R32_BOOL, FORMAT_R32G32_BOOL,
542e5c31af7Sopenharmony_ci		FORMAT_R32G32B32_BOOL, FORMAT_R32G32B32A32_BOOL,
543e5c31af7Sopenharmony_ci	};
544e5c31af7Sopenharmony_ci
545e5c31af7Sopenharmony_ci	for (int formatIndex = 0; formatIndex < DE_LENGTH_OF_ARRAY(formats); ++formatIndex)
546e5c31af7Sopenharmony_ci	{
547e5c31af7Sopenharmony_ci		const Format format = formats[formatIndex];
548e5c31af7Sopenharmony_ci
549e5c31af7Sopenharmony_ci		for (int opTypeIndex = 0; opTypeIndex < OPTYPE_LAST; ++opTypeIndex)
550e5c31af7Sopenharmony_ci		{
551e5c31af7Sopenharmony_ci			const std::string op = de::toLower(getOpTypeName(opTypeIndex));
552e5c31af7Sopenharmony_ci			const std::string name = op + "_" + subgroups::getFormatNameForGLSL(format);
553e5c31af7Sopenharmony_ci
554e5c31af7Sopenharmony_ci			{
555e5c31af7Sopenharmony_ci				CaseDefinition caseDef = {opTypeIndex, SHADER_STAGE_COMPUTE_BIT, format};
556e5c31af7Sopenharmony_ci				SubgroupFactory<CaseDefinition>::addFunctionCaseWithPrograms(computeGroup.get(), name, "", supportedCheck, initPrograms, test, caseDef);
557e5c31af7Sopenharmony_ci			}
558e5c31af7Sopenharmony_ci
559e5c31af7Sopenharmony_ci			{
560e5c31af7Sopenharmony_ci				const CaseDefinition caseDef = {opTypeIndex, SHADER_STAGE_ALL_GRAPHICS, format};
561e5c31af7Sopenharmony_ci				SubgroupFactory<CaseDefinition>::addFunctionCaseWithPrograms(graphicGroup.get(), name, "", supportedCheck, initPrograms, test, caseDef);
562e5c31af7Sopenharmony_ci			}
563e5c31af7Sopenharmony_ci
564e5c31af7Sopenharmony_ci			for (int stageIndex = 0; stageIndex < DE_LENGTH_OF_ARRAY(stages); ++stageIndex)
565e5c31af7Sopenharmony_ci			{
566e5c31af7Sopenharmony_ci				const CaseDefinition caseDef = {opTypeIndex, stages[stageIndex], format};
567e5c31af7Sopenharmony_ci				SubgroupFactory<CaseDefinition>::addFunctionCaseWithPrograms(framebufferGroup.get(), name + getShaderStageName(caseDef.shaderStage), "",
568e5c31af7Sopenharmony_ci							supportedCheck, initFrameBufferPrograms, noSSBOtest, caseDef);
569e5c31af7Sopenharmony_ci			}
570e5c31af7Sopenharmony_ci		}
571e5c31af7Sopenharmony_ci	}
572e5c31af7Sopenharmony_ci
573e5c31af7Sopenharmony_ci	de::MovePtr<deqp::TestCaseGroup> group(new deqp::TestCaseGroup(
574e5c31af7Sopenharmony_ci		testCtx, "ballot_broadcast", "Subgroup ballot broadcast category tests"));
575e5c31af7Sopenharmony_ci
576e5c31af7Sopenharmony_ci	group->addChild(graphicGroup.release());
577e5c31af7Sopenharmony_ci	group->addChild(computeGroup.release());
578e5c31af7Sopenharmony_ci	group->addChild(framebufferGroup.release());
579e5c31af7Sopenharmony_ci	return group.release();
580e5c31af7Sopenharmony_ci}
581e5c31af7Sopenharmony_ci
582e5c31af7Sopenharmony_ci} // subgroups
583e5c31af7Sopenharmony_ci} // glc
584