1e5c31af7Sopenharmony_ci/*------------------------------------------------------------------------ 2e5c31af7Sopenharmony_ci * OpenGL Conformance Tests 3e5c31af7Sopenharmony_ci * ------------------------ 4e5c31af7Sopenharmony_ci * 5e5c31af7Sopenharmony_ci * Copyright (c) 2017-2019 The Khronos Group Inc. 6e5c31af7Sopenharmony_ci * Copyright (c) 2017 Codeplay Software Ltd. 7e5c31af7Sopenharmony_ci * Copyright (c) 2019 NVIDIA Corporation. 8e5c31af7Sopenharmony_ci * 9e5c31af7Sopenharmony_ci * Licensed under the Apache License, Version 2.0 (the "License"); 10e5c31af7Sopenharmony_ci * you may not use this file except in compliance with the License. 11e5c31af7Sopenharmony_ci * You may obtain a copy of the License at 12e5c31af7Sopenharmony_ci * 13e5c31af7Sopenharmony_ci * http://www.apache.org/licenses/LICENSE-2.0 14e5c31af7Sopenharmony_ci * 15e5c31af7Sopenharmony_ci * Unless required by applicable law or agreed to in writing, software 16e5c31af7Sopenharmony_ci * distributed under the License is distributed on an "AS IS" BASIS, 17e5c31af7Sopenharmony_ci * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. 18e5c31af7Sopenharmony_ci * See the License for the specific language governing permissions and 19e5c31af7Sopenharmony_ci * limitations under the License. 20e5c31af7Sopenharmony_ci * 21e5c31af7Sopenharmony_ci */ /*! 22e5c31af7Sopenharmony_ci * \file 23e5c31af7Sopenharmony_ci * \brief Subgroups Tests 24e5c31af7Sopenharmony_ci */ /*--------------------------------------------------------------------*/ 25e5c31af7Sopenharmony_ci 26e5c31af7Sopenharmony_ci#include "glcSubgroupsBallotBroadcastTests.hpp" 27e5c31af7Sopenharmony_ci#include "glcSubgroupsTestsUtils.hpp" 28e5c31af7Sopenharmony_ci 29e5c31af7Sopenharmony_ci#include <string> 30e5c31af7Sopenharmony_ci#include <vector> 31e5c31af7Sopenharmony_ci 32e5c31af7Sopenharmony_ciusing namespace tcu; 33e5c31af7Sopenharmony_ciusing namespace std; 34e5c31af7Sopenharmony_ci 35e5c31af7Sopenharmony_cinamespace glc 36e5c31af7Sopenharmony_ci{ 37e5c31af7Sopenharmony_cinamespace subgroups 38e5c31af7Sopenharmony_ci{ 39e5c31af7Sopenharmony_cinamespace 40e5c31af7Sopenharmony_ci{ 41e5c31af7Sopenharmony_cienum OpType 42e5c31af7Sopenharmony_ci{ 43e5c31af7Sopenharmony_ci OPTYPE_BROADCAST = 0, 44e5c31af7Sopenharmony_ci OPTYPE_BROADCAST_FIRST, 45e5c31af7Sopenharmony_ci OPTYPE_LAST 46e5c31af7Sopenharmony_ci}; 47e5c31af7Sopenharmony_ci 48e5c31af7Sopenharmony_cistatic bool checkVertexPipelineStages(std::vector<const void*> datas, 49e5c31af7Sopenharmony_ci deUint32 width, deUint32) 50e5c31af7Sopenharmony_ci{ 51e5c31af7Sopenharmony_ci return glc::subgroups::check(datas, width, 3); 52e5c31af7Sopenharmony_ci} 53e5c31af7Sopenharmony_ci 54e5c31af7Sopenharmony_cistatic bool checkComputeStages(std::vector<const void*> datas, 55e5c31af7Sopenharmony_ci const deUint32 numWorkgroups[3], const deUint32 localSize[3], 56e5c31af7Sopenharmony_ci deUint32) 57e5c31af7Sopenharmony_ci{ 58e5c31af7Sopenharmony_ci return glc::subgroups::checkCompute(datas, numWorkgroups, localSize, 3); 59e5c31af7Sopenharmony_ci} 60e5c31af7Sopenharmony_ci 61e5c31af7Sopenharmony_cistd::string getOpTypeName(int opType) 62e5c31af7Sopenharmony_ci{ 63e5c31af7Sopenharmony_ci switch (opType) 64e5c31af7Sopenharmony_ci { 65e5c31af7Sopenharmony_ci default: 66e5c31af7Sopenharmony_ci DE_FATAL("Unsupported op type"); 67e5c31af7Sopenharmony_ci return ""; 68e5c31af7Sopenharmony_ci case OPTYPE_BROADCAST: 69e5c31af7Sopenharmony_ci return "subgroupBroadcast"; 70e5c31af7Sopenharmony_ci case OPTYPE_BROADCAST_FIRST: 71e5c31af7Sopenharmony_ci return "subgroupBroadcastFirst"; 72e5c31af7Sopenharmony_ci } 73e5c31af7Sopenharmony_ci} 74e5c31af7Sopenharmony_ci 75e5c31af7Sopenharmony_cistruct CaseDefinition 76e5c31af7Sopenharmony_ci{ 77e5c31af7Sopenharmony_ci int opType; 78e5c31af7Sopenharmony_ci ShaderStageFlags shaderStage; 79e5c31af7Sopenharmony_ci Format format; 80e5c31af7Sopenharmony_ci}; 81e5c31af7Sopenharmony_ci 82e5c31af7Sopenharmony_cistd::string getBodySource(CaseDefinition caseDef) 83e5c31af7Sopenharmony_ci{ 84e5c31af7Sopenharmony_ci std::ostringstream bdy; 85e5c31af7Sopenharmony_ci 86e5c31af7Sopenharmony_ci bdy << " uvec4 mask = subgroupBallot(true);\n"; 87e5c31af7Sopenharmony_ci bdy << " uint tempResult = 0u;\n"; 88e5c31af7Sopenharmony_ci 89e5c31af7Sopenharmony_ci if (OPTYPE_BROADCAST == caseDef.opType) 90e5c31af7Sopenharmony_ci { 91e5c31af7Sopenharmony_ci bdy << " tempResult = 0x3u;\n"; 92e5c31af7Sopenharmony_ci for (int i = 0; i < (int)subgroups::maxSupportedSubgroupSize(); i++) 93e5c31af7Sopenharmony_ci { 94e5c31af7Sopenharmony_ci bdy << " {\n" 95e5c31af7Sopenharmony_ci << " const uint id = "<< i << "u;\n" 96e5c31af7Sopenharmony_ci << " " << subgroups::getFormatNameForGLSL(caseDef.format) 97e5c31af7Sopenharmony_ci << " op = subgroupBroadcast(data1[gl_SubgroupInvocationID], id);\n" 98e5c31af7Sopenharmony_ci << " if ((id < gl_SubgroupSize) && subgroupBallotBitExtract(mask, id))\n" 99e5c31af7Sopenharmony_ci << " {\n" 100e5c31af7Sopenharmony_ci << " if (op != data1[id])\n" 101e5c31af7Sopenharmony_ci << " {\n" 102e5c31af7Sopenharmony_ci << " tempResult = 0u;\n" 103e5c31af7Sopenharmony_ci << " }\n" 104e5c31af7Sopenharmony_ci << " }\n" 105e5c31af7Sopenharmony_ci << " }\n"; 106e5c31af7Sopenharmony_ci } 107e5c31af7Sopenharmony_ci } 108e5c31af7Sopenharmony_ci else 109e5c31af7Sopenharmony_ci { 110e5c31af7Sopenharmony_ci bdy << " uint firstActive = 0u;\n" 111e5c31af7Sopenharmony_ci << " for (uint i = 0u; i < gl_SubgroupSize; i++)\n" 112e5c31af7Sopenharmony_ci << " {\n" 113e5c31af7Sopenharmony_ci << " if (subgroupBallotBitExtract(mask, i))\n" 114e5c31af7Sopenharmony_ci << " {\n" 115e5c31af7Sopenharmony_ci << " firstActive = i;\n" 116e5c31af7Sopenharmony_ci << " break;\n" 117e5c31af7Sopenharmony_ci << " }\n" 118e5c31af7Sopenharmony_ci << " }\n" 119e5c31af7Sopenharmony_ci << " tempResult |= (subgroupBroadcastFirst(data1[gl_SubgroupInvocationID]) == data1[firstActive]) ? 0x1u : 0u;\n" 120e5c31af7Sopenharmony_ci << " // make the firstActive invocation inactive now\n" 121e5c31af7Sopenharmony_ci << " if (firstActive == gl_SubgroupInvocationID)\n" 122e5c31af7Sopenharmony_ci << " {\n" 123e5c31af7Sopenharmony_ci << " for (uint i = 0u; i < gl_SubgroupSize; i++)\n" 124e5c31af7Sopenharmony_ci << " {\n" 125e5c31af7Sopenharmony_ci << " if (subgroupBallotBitExtract(mask, i))\n" 126e5c31af7Sopenharmony_ci << " {\n" 127e5c31af7Sopenharmony_ci << " firstActive = i;\n" 128e5c31af7Sopenharmony_ci << " break;\n" 129e5c31af7Sopenharmony_ci << " }\n" 130e5c31af7Sopenharmony_ci << " }\n" 131e5c31af7Sopenharmony_ci << " tempResult |= (subgroupBroadcastFirst(data1[gl_SubgroupInvocationID]) == data1[firstActive]) ? 0x2u : 0u;\n" 132e5c31af7Sopenharmony_ci << " }\n" 133e5c31af7Sopenharmony_ci << " else\n" 134e5c31af7Sopenharmony_ci << " {\n" 135e5c31af7Sopenharmony_ci << " // the firstActive invocation didn't partake in the second result so set it to true\n" 136e5c31af7Sopenharmony_ci << " tempResult |= 0x2u;\n" 137e5c31af7Sopenharmony_ci << " }\n"; 138e5c31af7Sopenharmony_ci } 139e5c31af7Sopenharmony_ci return bdy.str(); 140e5c31af7Sopenharmony_ci} 141e5c31af7Sopenharmony_ci 142e5c31af7Sopenharmony_civoid initFrameBufferPrograms(SourceCollections& programCollection, CaseDefinition caseDef) 143e5c31af7Sopenharmony_ci{ 144e5c31af7Sopenharmony_ci subgroups::setFragmentShaderFrameBuffer(programCollection); 145e5c31af7Sopenharmony_ci 146e5c31af7Sopenharmony_ci if (SHADER_STAGE_VERTEX_BIT != caseDef.shaderStage) 147e5c31af7Sopenharmony_ci subgroups::setVertexShaderFrameBuffer(programCollection); 148e5c31af7Sopenharmony_ci 149e5c31af7Sopenharmony_ci std::string bdyStr = getBodySource(caseDef); 150e5c31af7Sopenharmony_ci 151e5c31af7Sopenharmony_ci if (SHADER_STAGE_VERTEX_BIT == caseDef.shaderStage) 152e5c31af7Sopenharmony_ci { 153e5c31af7Sopenharmony_ci std::ostringstream vertex; 154e5c31af7Sopenharmony_ci vertex << "${VERSION_DECL}\n" 155e5c31af7Sopenharmony_ci << "#extension GL_KHR_shader_subgroup_ballot: enable\n" 156e5c31af7Sopenharmony_ci << "layout(location = 0) in highp vec4 in_position;\n" 157e5c31af7Sopenharmony_ci << "layout(location = 0) out float out_color;\n" 158e5c31af7Sopenharmony_ci << "layout(binding = 0, std140) uniform Buffer0\n" 159e5c31af7Sopenharmony_ci << "{\n" 160e5c31af7Sopenharmony_ci << " " << subgroups::getFormatNameForGLSL(caseDef.format) << " data1[" << subgroups::maxSupportedSubgroupSize() << "];\n" 161e5c31af7Sopenharmony_ci << "};\n" 162e5c31af7Sopenharmony_ci << "\n" 163e5c31af7Sopenharmony_ci << "void main (void)\n" 164e5c31af7Sopenharmony_ci << "{\n" 165e5c31af7Sopenharmony_ci << bdyStr 166e5c31af7Sopenharmony_ci << " out_color = float(tempResult);\n" 167e5c31af7Sopenharmony_ci << " gl_Position = in_position;\n" 168e5c31af7Sopenharmony_ci << " gl_PointSize = 1.0f;\n" 169e5c31af7Sopenharmony_ci << "}\n"; 170e5c31af7Sopenharmony_ci programCollection.add("vert") << glu::VertexSource(vertex.str()); 171e5c31af7Sopenharmony_ci } 172e5c31af7Sopenharmony_ci else if (SHADER_STAGE_GEOMETRY_BIT == caseDef.shaderStage) 173e5c31af7Sopenharmony_ci { 174e5c31af7Sopenharmony_ci std::ostringstream geometry; 175e5c31af7Sopenharmony_ci 176e5c31af7Sopenharmony_ci geometry << "${VERSION_DECL}\n" 177e5c31af7Sopenharmony_ci << "#extension GL_KHR_shader_subgroup_ballot: enable\n" 178e5c31af7Sopenharmony_ci << "layout(points) in;\n" 179e5c31af7Sopenharmony_ci << "layout(points, max_vertices = 1) out;\n" 180e5c31af7Sopenharmony_ci << "layout(location = 0) out float out_color;\n" 181e5c31af7Sopenharmony_ci << "layout(binding = 0, std140) uniform Buffer0\n" 182e5c31af7Sopenharmony_ci << "{\n" 183e5c31af7Sopenharmony_ci << " " << subgroups::getFormatNameForGLSL(caseDef.format) << " data1[" <<subgroups::maxSupportedSubgroupSize() << "];\n" 184e5c31af7Sopenharmony_ci << "};\n" 185e5c31af7Sopenharmony_ci << "\n" 186e5c31af7Sopenharmony_ci << "void main (void)\n" 187e5c31af7Sopenharmony_ci << "{\n" 188e5c31af7Sopenharmony_ci << bdyStr 189e5c31af7Sopenharmony_ci << " out_color = float(tempResult);\n" 190e5c31af7Sopenharmony_ci << " gl_Position = gl_in[0].gl_Position;\n" 191e5c31af7Sopenharmony_ci << " EmitVertex();\n" 192e5c31af7Sopenharmony_ci << " EndPrimitive();\n" 193e5c31af7Sopenharmony_ci << "}\n"; 194e5c31af7Sopenharmony_ci 195e5c31af7Sopenharmony_ci programCollection.add("geometry") << glu::GeometrySource(geometry.str()); 196e5c31af7Sopenharmony_ci } 197e5c31af7Sopenharmony_ci else if (SHADER_STAGE_TESS_CONTROL_BIT == caseDef.shaderStage) 198e5c31af7Sopenharmony_ci { 199e5c31af7Sopenharmony_ci std::ostringstream controlSource; 200e5c31af7Sopenharmony_ci 201e5c31af7Sopenharmony_ci controlSource << "${VERSION_DECL}\n" 202e5c31af7Sopenharmony_ci << "#extension GL_KHR_shader_subgroup_ballot: enable\n" 203e5c31af7Sopenharmony_ci << "layout(vertices = 2) out;\n" 204e5c31af7Sopenharmony_ci << "layout(location = 0) out float out_color[];\n" 205e5c31af7Sopenharmony_ci << "layout(binding = 0, std140) uniform Buffer0\n" 206e5c31af7Sopenharmony_ci << "{\n" 207e5c31af7Sopenharmony_ci << " " << subgroups::getFormatNameForGLSL(caseDef.format) << " data1[" <<subgroups::maxSupportedSubgroupSize() << "];\n" 208e5c31af7Sopenharmony_ci << "};\n" 209e5c31af7Sopenharmony_ci << "\n" 210e5c31af7Sopenharmony_ci << "void main (void)\n" 211e5c31af7Sopenharmony_ci << "{\n" 212e5c31af7Sopenharmony_ci << " if (gl_InvocationID == 0)\n" 213e5c31af7Sopenharmony_ci << " {\n" 214e5c31af7Sopenharmony_ci << " gl_TessLevelOuter[0] = 1.0f;\n" 215e5c31af7Sopenharmony_ci << " gl_TessLevelOuter[1] = 1.0f;\n" 216e5c31af7Sopenharmony_ci << " }\n" 217e5c31af7Sopenharmony_ci << bdyStr 218e5c31af7Sopenharmony_ci << " out_color[gl_InvocationID ] = float(tempResult);\n" 219e5c31af7Sopenharmony_ci << " gl_out[gl_InvocationID].gl_Position = gl_in[gl_InvocationID].gl_Position;\n" 220e5c31af7Sopenharmony_ci << "}\n"; 221e5c31af7Sopenharmony_ci 222e5c31af7Sopenharmony_ci programCollection.add("tesc") << glu::TessellationControlSource(controlSource.str()); 223e5c31af7Sopenharmony_ci subgroups::setTesEvalShaderFrameBuffer(programCollection); 224e5c31af7Sopenharmony_ci } 225e5c31af7Sopenharmony_ci else if (SHADER_STAGE_TESS_EVALUATION_BIT == caseDef.shaderStage) 226e5c31af7Sopenharmony_ci { 227e5c31af7Sopenharmony_ci std::ostringstream evaluationSource; 228e5c31af7Sopenharmony_ci evaluationSource << "${VERSION_DECL}\n" 229e5c31af7Sopenharmony_ci << "#extension GL_KHR_shader_subgroup_ballot: enable\n" 230e5c31af7Sopenharmony_ci << "layout(isolines, equal_spacing, ccw ) in;\n" 231e5c31af7Sopenharmony_ci << "layout(location = 0) out float out_color;\n" 232e5c31af7Sopenharmony_ci << "layout(binding = 0, std140) uniform Buffer0\n" 233e5c31af7Sopenharmony_ci << "{\n" 234e5c31af7Sopenharmony_ci << " " << subgroups::getFormatNameForGLSL(caseDef.format) << " data1[" <<subgroups::maxSupportedSubgroupSize() << "];\n" 235e5c31af7Sopenharmony_ci << "};\n" 236e5c31af7Sopenharmony_ci << "\n" 237e5c31af7Sopenharmony_ci << "void main (void)\n" 238e5c31af7Sopenharmony_ci << "{\n" 239e5c31af7Sopenharmony_ci << bdyStr 240e5c31af7Sopenharmony_ci << " out_color = float(tempResult);\n" 241e5c31af7Sopenharmony_ci << " gl_Position = mix(gl_in[0].gl_Position, gl_in[1].gl_Position, gl_TessCoord.x);\n" 242e5c31af7Sopenharmony_ci << "}\n"; 243e5c31af7Sopenharmony_ci 244e5c31af7Sopenharmony_ci subgroups::setTesCtrlShaderFrameBuffer(programCollection); 245e5c31af7Sopenharmony_ci programCollection.add("tese") << glu::TessellationEvaluationSource(evaluationSource.str()); 246e5c31af7Sopenharmony_ci } 247e5c31af7Sopenharmony_ci else 248e5c31af7Sopenharmony_ci { 249e5c31af7Sopenharmony_ci DE_FATAL("Unsupported shader stage"); 250e5c31af7Sopenharmony_ci } 251e5c31af7Sopenharmony_ci} 252e5c31af7Sopenharmony_ci 253e5c31af7Sopenharmony_civoid initPrograms(SourceCollections& programCollection, CaseDefinition caseDef) 254e5c31af7Sopenharmony_ci{ 255e5c31af7Sopenharmony_ci std::string bdyStr = getBodySource(caseDef); 256e5c31af7Sopenharmony_ci 257e5c31af7Sopenharmony_ci if (SHADER_STAGE_COMPUTE_BIT == caseDef.shaderStage) 258e5c31af7Sopenharmony_ci { 259e5c31af7Sopenharmony_ci std::ostringstream src; 260e5c31af7Sopenharmony_ci 261e5c31af7Sopenharmony_ci src << "${VERSION_DECL}\n" 262e5c31af7Sopenharmony_ci << "#extension GL_KHR_shader_subgroup_ballot: enable\n" 263e5c31af7Sopenharmony_ci << "layout (${LOCAL_SIZE_X}, ${LOCAL_SIZE_Y}, ${LOCAL_SIZE_Z}) in;\n" 264e5c31af7Sopenharmony_ci << "layout(binding = 0, std430) buffer Buffer0\n" 265e5c31af7Sopenharmony_ci << "{\n" 266e5c31af7Sopenharmony_ci << " uint result[];\n" 267e5c31af7Sopenharmony_ci << "};\n" 268e5c31af7Sopenharmony_ci << "layout(binding = 1, std430) buffer Buffer1\n" 269e5c31af7Sopenharmony_ci << "{\n" 270e5c31af7Sopenharmony_ci << " " << subgroups::getFormatNameForGLSL(caseDef.format) << " data1[];\n" 271e5c31af7Sopenharmony_ci << "};\n" 272e5c31af7Sopenharmony_ci << "\n" 273e5c31af7Sopenharmony_ci << "void main (void)\n" 274e5c31af7Sopenharmony_ci << "{\n" 275e5c31af7Sopenharmony_ci << " uvec3 globalSize = gl_NumWorkGroups * gl_WorkGroupSize;\n" 276e5c31af7Sopenharmony_ci << " highp uint offset = globalSize.x * ((globalSize.y * " 277e5c31af7Sopenharmony_ci "gl_GlobalInvocationID.z) + gl_GlobalInvocationID.y) + " 278e5c31af7Sopenharmony_ci "gl_GlobalInvocationID.x;\n" 279e5c31af7Sopenharmony_ci << bdyStr 280e5c31af7Sopenharmony_ci << " result[offset] = tempResult;\n" 281e5c31af7Sopenharmony_ci << "}\n"; 282e5c31af7Sopenharmony_ci 283e5c31af7Sopenharmony_ci programCollection.add("comp") << glu::ComputeSource(src.str()); 284e5c31af7Sopenharmony_ci } 285e5c31af7Sopenharmony_ci else 286e5c31af7Sopenharmony_ci { 287e5c31af7Sopenharmony_ci const string vertex = 288e5c31af7Sopenharmony_ci "${VERSION_DECL}\n" 289e5c31af7Sopenharmony_ci "#extension GL_KHR_shader_subgroup_ballot: enable\n" 290e5c31af7Sopenharmony_ci "layout(binding = 0, std430) buffer Buffer0\n" 291e5c31af7Sopenharmony_ci "{\n" 292e5c31af7Sopenharmony_ci " uint result[];\n" 293e5c31af7Sopenharmony_ci "} b0;\n" 294e5c31af7Sopenharmony_ci "layout(binding = 4, std430) readonly buffer Buffer4\n" 295e5c31af7Sopenharmony_ci "{\n" 296e5c31af7Sopenharmony_ci " " + subgroups::getFormatNameForGLSL(caseDef.format) + " data1[];\n" 297e5c31af7Sopenharmony_ci "};\n" 298e5c31af7Sopenharmony_ci "\n" 299e5c31af7Sopenharmony_ci "void main (void)\n" 300e5c31af7Sopenharmony_ci "{\n" 301e5c31af7Sopenharmony_ci + bdyStr + 302e5c31af7Sopenharmony_ci " b0.result[gl_VertexID] = tempResult;\n" 303e5c31af7Sopenharmony_ci " float pixelSize = 2.0f/1024.0f;\n" 304e5c31af7Sopenharmony_ci " float pixelPosition = pixelSize/2.0f - 1.0f;\n" 305e5c31af7Sopenharmony_ci " gl_Position = vec4(float(gl_VertexID) * pixelSize + pixelPosition, 0.0f, 0.0f, 1.0f);\n" 306e5c31af7Sopenharmony_ci " gl_PointSize = 1.0f;\n" 307e5c31af7Sopenharmony_ci "}\n"; 308e5c31af7Sopenharmony_ci 309e5c31af7Sopenharmony_ci const string tesc = 310e5c31af7Sopenharmony_ci "${VERSION_DECL}\n" 311e5c31af7Sopenharmony_ci "#extension GL_KHR_shader_subgroup_ballot: enable\n" 312e5c31af7Sopenharmony_ci "layout(vertices=1) out;\n" 313e5c31af7Sopenharmony_ci "layout(binding = 1, std430) buffer Buffer1\n" 314e5c31af7Sopenharmony_ci "{\n" 315e5c31af7Sopenharmony_ci " uint result[];\n" 316e5c31af7Sopenharmony_ci "} b1;\n" 317e5c31af7Sopenharmony_ci "layout(binding = 4, std430) readonly buffer Buffer4\n" 318e5c31af7Sopenharmony_ci "{\n" 319e5c31af7Sopenharmony_ci " " + subgroups::getFormatNameForGLSL(caseDef.format) + " data1[];\n" 320e5c31af7Sopenharmony_ci "};\n" 321e5c31af7Sopenharmony_ci "\n" 322e5c31af7Sopenharmony_ci "void main (void)\n" 323e5c31af7Sopenharmony_ci "{\n" 324e5c31af7Sopenharmony_ci + bdyStr + 325e5c31af7Sopenharmony_ci " b1.result[gl_PrimitiveID] = tempResult;\n" 326e5c31af7Sopenharmony_ci " if (gl_InvocationID == 0)\n" 327e5c31af7Sopenharmony_ci " {\n" 328e5c31af7Sopenharmony_ci " gl_TessLevelOuter[0] = 1.0f;\n" 329e5c31af7Sopenharmony_ci " gl_TessLevelOuter[1] = 1.0f;\n" 330e5c31af7Sopenharmony_ci " }\n" 331e5c31af7Sopenharmony_ci " gl_out[gl_InvocationID].gl_Position = gl_in[gl_InvocationID].gl_Position;\n" 332e5c31af7Sopenharmony_ci "}\n"; 333e5c31af7Sopenharmony_ci 334e5c31af7Sopenharmony_ci const string tese = 335e5c31af7Sopenharmony_ci "${VERSION_DECL}\n" 336e5c31af7Sopenharmony_ci "#extension GL_KHR_shader_subgroup_ballot: enable\n" 337e5c31af7Sopenharmony_ci "layout(isolines) in;\n" 338e5c31af7Sopenharmony_ci "layout(binding = 2, std430) buffer Buffer2\n" 339e5c31af7Sopenharmony_ci "{\n" 340e5c31af7Sopenharmony_ci " uint result[];\n" 341e5c31af7Sopenharmony_ci "} b2;\n" 342e5c31af7Sopenharmony_ci "layout(binding = 4, std430) readonly buffer Buffer4\n" 343e5c31af7Sopenharmony_ci "{\n" 344e5c31af7Sopenharmony_ci " " + subgroups::getFormatNameForGLSL(caseDef.format) + " data1[];\n" 345e5c31af7Sopenharmony_ci "};\n" 346e5c31af7Sopenharmony_ci "\n" 347e5c31af7Sopenharmony_ci "void main (void)\n" 348e5c31af7Sopenharmony_ci "{\n" 349e5c31af7Sopenharmony_ci + bdyStr + 350e5c31af7Sopenharmony_ci " b2.result[gl_PrimitiveID * 2 + int(gl_TessCoord.x + 0.5)] = tempResult;\n" 351e5c31af7Sopenharmony_ci " float pixelSize = 2.0f/1024.0f;\n" 352e5c31af7Sopenharmony_ci " gl_Position = gl_in[0].gl_Position + gl_TessCoord.x * pixelSize / 2.0f;\n" 353e5c31af7Sopenharmony_ci "}\n"; 354e5c31af7Sopenharmony_ci 355e5c31af7Sopenharmony_ci const string geometry = 356e5c31af7Sopenharmony_ci //version string added by addGeometryShadersFromTemplate 357e5c31af7Sopenharmony_ci "#extension GL_KHR_shader_subgroup_ballot: enable\n" 358e5c31af7Sopenharmony_ci "layout(${TOPOLOGY}) in;\n" 359e5c31af7Sopenharmony_ci "layout(points, max_vertices = 1) out;\n" 360e5c31af7Sopenharmony_ci "layout(binding = 3, std430) buffer Buffer3\n" 361e5c31af7Sopenharmony_ci "{\n" 362e5c31af7Sopenharmony_ci " uint result[];\n" 363e5c31af7Sopenharmony_ci "} b3;\n" 364e5c31af7Sopenharmony_ci "layout(binding = 4, std430) readonly buffer Buffer4\n" 365e5c31af7Sopenharmony_ci "{\n" 366e5c31af7Sopenharmony_ci " " + subgroups::getFormatNameForGLSL(caseDef.format) + " data1[];\n" 367e5c31af7Sopenharmony_ci "};\n" 368e5c31af7Sopenharmony_ci "\n" 369e5c31af7Sopenharmony_ci "void main (void)\n" 370e5c31af7Sopenharmony_ci "{\n" 371e5c31af7Sopenharmony_ci + bdyStr + 372e5c31af7Sopenharmony_ci " b3.result[gl_PrimitiveIDIn] = tempResult;\n" 373e5c31af7Sopenharmony_ci " gl_Position = gl_in[0].gl_Position;\n" 374e5c31af7Sopenharmony_ci " EmitVertex();\n" 375e5c31af7Sopenharmony_ci " EndPrimitive();\n" 376e5c31af7Sopenharmony_ci "}\n"; 377e5c31af7Sopenharmony_ci 378e5c31af7Sopenharmony_ci const string fragment = 379e5c31af7Sopenharmony_ci "${VERSION_DECL}\n" 380e5c31af7Sopenharmony_ci "#extension GL_KHR_shader_subgroup_ballot: enable\n" 381e5c31af7Sopenharmony_ci "precision highp int;\n" 382e5c31af7Sopenharmony_ci "precision highp float;\n" 383e5c31af7Sopenharmony_ci "layout(location = 0) out uint result;\n" 384e5c31af7Sopenharmony_ci "layout(binding = 4, std430) readonly buffer Buffer4\n" 385e5c31af7Sopenharmony_ci "{\n" 386e5c31af7Sopenharmony_ci " " + subgroups::getFormatNameForGLSL(caseDef.format) + " data1[];\n" 387e5c31af7Sopenharmony_ci "};\n" 388e5c31af7Sopenharmony_ci "void main (void)\n" 389e5c31af7Sopenharmony_ci "{\n" 390e5c31af7Sopenharmony_ci + bdyStr + 391e5c31af7Sopenharmony_ci " result = tempResult;\n" 392e5c31af7Sopenharmony_ci "}\n"; 393e5c31af7Sopenharmony_ci 394e5c31af7Sopenharmony_ci subgroups::addNoSubgroupShader(programCollection); 395e5c31af7Sopenharmony_ci 396e5c31af7Sopenharmony_ci programCollection.add("vert") << glu::VertexSource(vertex); 397e5c31af7Sopenharmony_ci programCollection.add("tesc") << glu::TessellationControlSource(tesc); 398e5c31af7Sopenharmony_ci programCollection.add("tese") << glu::TessellationEvaluationSource(tese); 399e5c31af7Sopenharmony_ci subgroups::addGeometryShadersFromTemplate(geometry, programCollection); 400e5c31af7Sopenharmony_ci programCollection.add("fragment") << glu::FragmentSource(fragment); 401e5c31af7Sopenharmony_ci } 402e5c31af7Sopenharmony_ci} 403e5c31af7Sopenharmony_ci 404e5c31af7Sopenharmony_civoid supportedCheck (Context& context, CaseDefinition caseDef) 405e5c31af7Sopenharmony_ci{ 406e5c31af7Sopenharmony_ci if (!subgroups::isSubgroupSupported(context)) 407e5c31af7Sopenharmony_ci TCU_THROW(NotSupportedError, "Subgroup operations are not supported"); 408e5c31af7Sopenharmony_ci 409e5c31af7Sopenharmony_ci if (!subgroups::isSubgroupFeatureSupportedForDevice(context, SUBGROUP_FEATURE_BALLOT_BIT)) 410e5c31af7Sopenharmony_ci { 411e5c31af7Sopenharmony_ci TCU_THROW(NotSupportedError, "Device does not support subgroup ballot operations"); 412e5c31af7Sopenharmony_ci } 413e5c31af7Sopenharmony_ci 414e5c31af7Sopenharmony_ci if (subgroups::isDoubleFormat(caseDef.format) && 415e5c31af7Sopenharmony_ci !subgroups::isDoubleSupportedForDevice(context)) 416e5c31af7Sopenharmony_ci { 417e5c31af7Sopenharmony_ci TCU_THROW(NotSupportedError, "Device does not support subgroup double operations"); 418e5c31af7Sopenharmony_ci } 419e5c31af7Sopenharmony_ci} 420e5c31af7Sopenharmony_ci 421e5c31af7Sopenharmony_citcu::TestStatus noSSBOtest (Context& context, const CaseDefinition caseDef) 422e5c31af7Sopenharmony_ci{ 423e5c31af7Sopenharmony_ci if (!subgroups::areSubgroupOperationsSupportedForStage( 424e5c31af7Sopenharmony_ci context, caseDef.shaderStage)) 425e5c31af7Sopenharmony_ci { 426e5c31af7Sopenharmony_ci if (subgroups::areSubgroupOperationsRequiredForStage(caseDef.shaderStage)) 427e5c31af7Sopenharmony_ci { 428e5c31af7Sopenharmony_ci return tcu::TestStatus::fail( 429e5c31af7Sopenharmony_ci "Shader stage " + 430e5c31af7Sopenharmony_ci subgroups::getShaderStageName(caseDef.shaderStage) + 431e5c31af7Sopenharmony_ci " is required to support subgroup operations!"); 432e5c31af7Sopenharmony_ci } 433e5c31af7Sopenharmony_ci else 434e5c31af7Sopenharmony_ci { 435e5c31af7Sopenharmony_ci TCU_THROW(NotSupportedError, "Device does not support subgroup operations for this stage"); 436e5c31af7Sopenharmony_ci } 437e5c31af7Sopenharmony_ci } 438e5c31af7Sopenharmony_ci 439e5c31af7Sopenharmony_ci subgroups::SSBOData inputData[1]; 440e5c31af7Sopenharmony_ci inputData[0].format = caseDef.format; 441e5c31af7Sopenharmony_ci inputData[0].layout = subgroups::SSBOData::LayoutStd140; 442e5c31af7Sopenharmony_ci inputData[0].numElements = subgroups::maxSupportedSubgroupSize(); 443e5c31af7Sopenharmony_ci inputData[0].initializeType = subgroups::SSBOData::InitializeNonZero; 444e5c31af7Sopenharmony_ci 445e5c31af7Sopenharmony_ci if (SHADER_STAGE_VERTEX_BIT == caseDef.shaderStage) 446e5c31af7Sopenharmony_ci return subgroups::makeVertexFrameBufferTest(context, FORMAT_R32_UINT, inputData, 1, checkVertexPipelineStages); 447e5c31af7Sopenharmony_ci else if (SHADER_STAGE_GEOMETRY_BIT == caseDef.shaderStage) 448e5c31af7Sopenharmony_ci return subgroups::makeGeometryFrameBufferTest(context, FORMAT_R32_UINT, inputData, 1, checkVertexPipelineStages); 449e5c31af7Sopenharmony_ci else if (SHADER_STAGE_TESS_CONTROL_BIT == caseDef.shaderStage) 450e5c31af7Sopenharmony_ci return subgroups::makeTessellationEvaluationFrameBufferTest(context, FORMAT_R32_UINT, inputData, 1, checkVertexPipelineStages, SHADER_STAGE_TESS_CONTROL_BIT); 451e5c31af7Sopenharmony_ci else if (SHADER_STAGE_TESS_EVALUATION_BIT == caseDef.shaderStage) 452e5c31af7Sopenharmony_ci return subgroups::makeTessellationEvaluationFrameBufferTest(context, FORMAT_R32_UINT, inputData, 1, checkVertexPipelineStages, SHADER_STAGE_TESS_EVALUATION_BIT); 453e5c31af7Sopenharmony_ci else 454e5c31af7Sopenharmony_ci TCU_THROW(InternalError, "Unhandled shader stage"); 455e5c31af7Sopenharmony_ci} 456e5c31af7Sopenharmony_ci 457e5c31af7Sopenharmony_ci 458e5c31af7Sopenharmony_citcu::TestStatus test(Context& context, const CaseDefinition caseDef) 459e5c31af7Sopenharmony_ci{ 460e5c31af7Sopenharmony_ci if (SHADER_STAGE_COMPUTE_BIT == caseDef.shaderStage) 461e5c31af7Sopenharmony_ci { 462e5c31af7Sopenharmony_ci if (!subgroups::areSubgroupOperationsSupportedForStage(context, caseDef.shaderStage)) 463e5c31af7Sopenharmony_ci { 464e5c31af7Sopenharmony_ci if (subgroups::areSubgroupOperationsRequiredForStage(caseDef.shaderStage)) 465e5c31af7Sopenharmony_ci { 466e5c31af7Sopenharmony_ci return tcu::TestStatus::fail( 467e5c31af7Sopenharmony_ci "Shader stage " + 468e5c31af7Sopenharmony_ci subgroups::getShaderStageName(caseDef.shaderStage) + 469e5c31af7Sopenharmony_ci " is required to support subgroup operations!"); 470e5c31af7Sopenharmony_ci } 471e5c31af7Sopenharmony_ci else 472e5c31af7Sopenharmony_ci { 473e5c31af7Sopenharmony_ci TCU_THROW(NotSupportedError, "Device does not support subgroup operations for this stage"); 474e5c31af7Sopenharmony_ci } 475e5c31af7Sopenharmony_ci } 476e5c31af7Sopenharmony_ci subgroups::SSBOData inputData[1]; 477e5c31af7Sopenharmony_ci inputData[0].format = caseDef.format; 478e5c31af7Sopenharmony_ci inputData[0].layout = subgroups::SSBOData::LayoutStd430; 479e5c31af7Sopenharmony_ci inputData[0].numElements = subgroups::maxSupportedSubgroupSize(); 480e5c31af7Sopenharmony_ci inputData[0].initializeType = subgroups::SSBOData::InitializeNonZero; 481e5c31af7Sopenharmony_ci inputData[0].binding = 1u; 482e5c31af7Sopenharmony_ci 483e5c31af7Sopenharmony_ci return subgroups::makeComputeTest(context, FORMAT_R32_UINT, inputData, 1, checkComputeStages); 484e5c31af7Sopenharmony_ci } 485e5c31af7Sopenharmony_ci else 486e5c31af7Sopenharmony_ci { 487e5c31af7Sopenharmony_ci int supportedStages = context.getDeqpContext().getContextInfo().getInt(GL_SUBGROUP_SUPPORTED_STAGES_KHR); 488e5c31af7Sopenharmony_ci 489e5c31af7Sopenharmony_ci ShaderStageFlags stages = (ShaderStageFlags)(caseDef.shaderStage & supportedStages); 490e5c31af7Sopenharmony_ci 491e5c31af7Sopenharmony_ci if ( SHADER_STAGE_FRAGMENT_BIT != stages && !subgroups::isVertexSSBOSupportedForDevice(context)) 492e5c31af7Sopenharmony_ci { 493e5c31af7Sopenharmony_ci if ( (stages & SHADER_STAGE_FRAGMENT_BIT) == 0) 494e5c31af7Sopenharmony_ci TCU_THROW(NotSupportedError, "Device does not support vertex stage SSBO writes"); 495e5c31af7Sopenharmony_ci else 496e5c31af7Sopenharmony_ci stages = SHADER_STAGE_FRAGMENT_BIT; 497e5c31af7Sopenharmony_ci } 498e5c31af7Sopenharmony_ci 499e5c31af7Sopenharmony_ci if ((ShaderStageFlags)0u == stages) 500e5c31af7Sopenharmony_ci TCU_THROW(NotSupportedError, "Subgroup operations are not supported for any graphic shader"); 501e5c31af7Sopenharmony_ci 502e5c31af7Sopenharmony_ci subgroups::SSBOData inputData; 503e5c31af7Sopenharmony_ci inputData.format = caseDef.format; 504e5c31af7Sopenharmony_ci inputData.layout = subgroups::SSBOData::LayoutStd430; 505e5c31af7Sopenharmony_ci inputData.numElements = subgroups::maxSupportedSubgroupSize(); 506e5c31af7Sopenharmony_ci inputData.initializeType = subgroups::SSBOData::InitializeNonZero; 507e5c31af7Sopenharmony_ci inputData.binding = 4u; 508e5c31af7Sopenharmony_ci inputData.stages = stages; 509e5c31af7Sopenharmony_ci 510e5c31af7Sopenharmony_ci return subgroups::allStages(context, FORMAT_R32_UINT, &inputData, 1, checkVertexPipelineStages, stages); 511e5c31af7Sopenharmony_ci } 512e5c31af7Sopenharmony_ci} 513e5c31af7Sopenharmony_ci} 514e5c31af7Sopenharmony_ci 515e5c31af7Sopenharmony_cideqp::TestCaseGroup* createSubgroupsBallotBroadcastTests(deqp::Context& testCtx) 516e5c31af7Sopenharmony_ci{ 517e5c31af7Sopenharmony_ci de::MovePtr<deqp::TestCaseGroup> graphicGroup(new deqp::TestCaseGroup( 518e5c31af7Sopenharmony_ci testCtx, "graphics", "Subgroup ballot broadcast category tests: graphics")); 519e5c31af7Sopenharmony_ci de::MovePtr<deqp::TestCaseGroup> computeGroup(new deqp::TestCaseGroup( 520e5c31af7Sopenharmony_ci testCtx, "compute", "Subgroup ballot broadcast category tests: compute")); 521e5c31af7Sopenharmony_ci de::MovePtr<deqp::TestCaseGroup> framebufferGroup(new deqp::TestCaseGroup( 522e5c31af7Sopenharmony_ci testCtx, "framebuffer", "Subgroup ballot broadcast category tests: framebuffer")); 523e5c31af7Sopenharmony_ci 524e5c31af7Sopenharmony_ci const ShaderStageFlags stages[] = 525e5c31af7Sopenharmony_ci { 526e5c31af7Sopenharmony_ci SHADER_STAGE_VERTEX_BIT, 527e5c31af7Sopenharmony_ci SHADER_STAGE_TESS_EVALUATION_BIT, 528e5c31af7Sopenharmony_ci SHADER_STAGE_TESS_CONTROL_BIT, 529e5c31af7Sopenharmony_ci SHADER_STAGE_GEOMETRY_BIT, 530e5c31af7Sopenharmony_ci }; 531e5c31af7Sopenharmony_ci 532e5c31af7Sopenharmony_ci const Format formats[] = 533e5c31af7Sopenharmony_ci { 534e5c31af7Sopenharmony_ci FORMAT_R32_SINT, FORMAT_R32G32_SINT, FORMAT_R32G32B32_SINT, 535e5c31af7Sopenharmony_ci FORMAT_R32G32B32A32_SINT, FORMAT_R32_UINT, FORMAT_R32G32_UINT, 536e5c31af7Sopenharmony_ci FORMAT_R32G32B32_UINT, FORMAT_R32G32B32A32_UINT, 537e5c31af7Sopenharmony_ci FORMAT_R32_SFLOAT, FORMAT_R32G32_SFLOAT, 538e5c31af7Sopenharmony_ci FORMAT_R32G32B32_SFLOAT, FORMAT_R32G32B32A32_SFLOAT, 539e5c31af7Sopenharmony_ci FORMAT_R64_SFLOAT, FORMAT_R64G64_SFLOAT, 540e5c31af7Sopenharmony_ci FORMAT_R64G64B64_SFLOAT, FORMAT_R64G64B64A64_SFLOAT, 541e5c31af7Sopenharmony_ci FORMAT_R32_BOOL, FORMAT_R32G32_BOOL, 542e5c31af7Sopenharmony_ci FORMAT_R32G32B32_BOOL, FORMAT_R32G32B32A32_BOOL, 543e5c31af7Sopenharmony_ci }; 544e5c31af7Sopenharmony_ci 545e5c31af7Sopenharmony_ci for (int formatIndex = 0; formatIndex < DE_LENGTH_OF_ARRAY(formats); ++formatIndex) 546e5c31af7Sopenharmony_ci { 547e5c31af7Sopenharmony_ci const Format format = formats[formatIndex]; 548e5c31af7Sopenharmony_ci 549e5c31af7Sopenharmony_ci for (int opTypeIndex = 0; opTypeIndex < OPTYPE_LAST; ++opTypeIndex) 550e5c31af7Sopenharmony_ci { 551e5c31af7Sopenharmony_ci const std::string op = de::toLower(getOpTypeName(opTypeIndex)); 552e5c31af7Sopenharmony_ci const std::string name = op + "_" + subgroups::getFormatNameForGLSL(format); 553e5c31af7Sopenharmony_ci 554e5c31af7Sopenharmony_ci { 555e5c31af7Sopenharmony_ci CaseDefinition caseDef = {opTypeIndex, SHADER_STAGE_COMPUTE_BIT, format}; 556e5c31af7Sopenharmony_ci SubgroupFactory<CaseDefinition>::addFunctionCaseWithPrograms(computeGroup.get(), name, "", supportedCheck, initPrograms, test, caseDef); 557e5c31af7Sopenharmony_ci } 558e5c31af7Sopenharmony_ci 559e5c31af7Sopenharmony_ci { 560e5c31af7Sopenharmony_ci const CaseDefinition caseDef = {opTypeIndex, SHADER_STAGE_ALL_GRAPHICS, format}; 561e5c31af7Sopenharmony_ci SubgroupFactory<CaseDefinition>::addFunctionCaseWithPrograms(graphicGroup.get(), name, "", supportedCheck, initPrograms, test, caseDef); 562e5c31af7Sopenharmony_ci } 563e5c31af7Sopenharmony_ci 564e5c31af7Sopenharmony_ci for (int stageIndex = 0; stageIndex < DE_LENGTH_OF_ARRAY(stages); ++stageIndex) 565e5c31af7Sopenharmony_ci { 566e5c31af7Sopenharmony_ci const CaseDefinition caseDef = {opTypeIndex, stages[stageIndex], format}; 567e5c31af7Sopenharmony_ci SubgroupFactory<CaseDefinition>::addFunctionCaseWithPrograms(framebufferGroup.get(), name + getShaderStageName(caseDef.shaderStage), "", 568e5c31af7Sopenharmony_ci supportedCheck, initFrameBufferPrograms, noSSBOtest, caseDef); 569e5c31af7Sopenharmony_ci } 570e5c31af7Sopenharmony_ci } 571e5c31af7Sopenharmony_ci } 572e5c31af7Sopenharmony_ci 573e5c31af7Sopenharmony_ci de::MovePtr<deqp::TestCaseGroup> group(new deqp::TestCaseGroup( 574e5c31af7Sopenharmony_ci testCtx, "ballot_broadcast", "Subgroup ballot broadcast category tests")); 575e5c31af7Sopenharmony_ci 576e5c31af7Sopenharmony_ci group->addChild(graphicGroup.release()); 577e5c31af7Sopenharmony_ci group->addChild(computeGroup.release()); 578e5c31af7Sopenharmony_ci group->addChild(framebufferGroup.release()); 579e5c31af7Sopenharmony_ci return group.release(); 580e5c31af7Sopenharmony_ci} 581e5c31af7Sopenharmony_ci 582e5c31af7Sopenharmony_ci} // subgroups 583e5c31af7Sopenharmony_ci} // glc 584