| /*------------------------------------------------------------------------ |
| * Vulkan Conformance Tests |
| * ------------------------ |
| * |
| * Copyright (c) 2019 The Khronos Group Inc. |
| * Copyright (c) 2019 Google Inc. |
| * Copyright (c) 2017 Codeplay Software Ltd. |
| * |
| * Licensed under the Apache License, Version 2.0 (the "License"); |
| * you may not use this file except in compliance with the License. |
| * You may obtain a copy of the License at |
| * |
| * http://www.apache.org/licenses/LICENSE-2.0 |
| * |
| * Unless required by applicable law or agreed to in writing, software |
| * distributed under the License is distributed on an "AS IS" BASIS, |
| * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. |
| * See the License for the specific language governing permissions and |
| * limitations under the License. |
| * |
| */ /*! |
| * \file |
| * \brief Subgroups Tests |
| */ /*--------------------------------------------------------------------*/ |
| |
| #include "vktSubgroupsBallotTests.hpp" |
| #include "vktSubgroupsTestsUtils.hpp" |
| |
| #include <string> |
| #include <vector> |
| |
| using namespace tcu; |
| using namespace std; |
| using namespace vk; |
| using namespace vkt; |
| |
| namespace |
| { |
| static bool checkVertexPipelineStages(const void* internalData, std::vector<const void*> datas, |
| deUint32 width, deUint32) |
| { |
| DE_UNREF(internalData); |
| return vkt::subgroups::check(datas, width, 0x7); |
| } |
| |
| static bool checkCompute(const void* internalData, std::vector<const void*> datas, |
| const deUint32 numWorkgroups[3], const deUint32 localSize[3], |
| deUint32) |
| { |
| DE_UNREF(internalData); |
| return vkt::subgroups::checkCompute(datas, numWorkgroups, localSize, 0x7); |
| } |
| |
| struct CaseDefinition |
| { |
| VkShaderStageFlags shaderStage; |
| de::SharedPtr<bool> geometryPointSizeSupported; |
| deBool extShaderSubGroupBallotTests; |
| deBool requiredSubgroupSize; |
| }; |
| |
| |
| void initFrameBufferPrograms(SourceCollections& programCollection, CaseDefinition caseDef) |
| { |
| const vk::SpirVAsmBuildOptions buildOptionsSpr (programCollection.usedVulkanVersion, vk::SPIRV_VERSION_1_3); |
| std::ostringstream subgroupSizeStr; |
| subgroupSizeStr << subgroups::maxSupportedSubgroupSize(); |
| const string extensionHeader = (caseDef.extShaderSubGroupBallotTests ? "OpExtension \"SPV_KHR_shader_ballot\"\n" : ""); |
| const string capabilityBallotHeader = (caseDef.extShaderSubGroupBallotTests ? "OpCapability SubgroupBallotKHR\n" : "OpCapability GroupNonUniformBallot\n"); |
| |
| subgroups::setFragmentShaderFrameBuffer(programCollection); |
| |
| if (VK_SHADER_STAGE_VERTEX_BIT != caseDef.shaderStage) |
| subgroups::setVertexShaderFrameBuffer(programCollection); |
| |
| if (VK_SHADER_STAGE_VERTEX_BIT == caseDef.shaderStage) |
| { |
| /* |
| "#extension GL_KHR_shader_subgroup_ballot: enable\n" |
| "layout(location = 0) in highp vec4 in_position;\n" |
| "layout(location = 0) out float out_color;\n" |
| "layout(set = 0, binding = 0) uniform Buffer1\n" |
| "{\n" |
| " uint data[" << subgroups::maxSupportedSubgroupSize() << "];\n" |
| "};\n" |
| "\n" |
| "void main (void)\n" |
| "{\n" |
| " uint tempResult = 0;\n" |
| " tempResult |= !bool(uvec4(0) == subgroupBallot(true)) ? 0x1 : 0;\n" |
| " bool bData = data[gl_SubgroupInvocationID] != 0;\n" |
| " tempResult |= !bool(uvec4(0) == subgroupBallot(bData)) ? 0x2 : 0;\n" |
| " tempResult |= uvec4(0) == subgroupBallot(false) ? 0x4 : 0;\n" |
| " out_color = float(tempResult);\n" |
| " gl_Position = in_position;\n" |
| " gl_PointSize = 1.0f;\n" |
| "}\n"; |
| */ |
| const string vertex = |
| "; SPIR-V\n" |
| "; Version: 1.3\n" |
| "; Generator: Khronos Glslang Reference Front End; 2\n" |
| "; Bound: 76\n" |
| "; Schema: 0\n" |
| "OpCapability Shader\n" |
| "OpCapability GroupNonUniform\n" |
| + capabilityBallotHeader |
| + extensionHeader + |
| "%1 = OpExtInstImport \"GLSL.std.450\"\n" |
| "OpMemoryModel Logical GLSL450\n" |
| "OpEntryPoint Vertex %4 \"main\" %35 %62 %70 %72\n" |
| "OpDecorate %30 ArrayStride 16\n" |
| "OpMemberDecorate %31 0 Offset 0\n" |
| "OpDecorate %31 Block\n" |
| "OpDecorate %33 DescriptorSet 0\n" |
| "OpDecorate %33 Binding 0\n" |
| "OpDecorate %35 RelaxedPrecision\n" |
| "OpDecorate %35 BuiltIn SubgroupLocalInvocationId\n" |
| "OpDecorate %36 RelaxedPrecision\n" |
| "OpDecorate %62 Location 0\n" |
| "OpMemberDecorate %68 0 BuiltIn Position\n" |
| "OpMemberDecorate %68 1 BuiltIn PointSize\n" |
| "OpMemberDecorate %68 2 BuiltIn ClipDistance\n" |
| "OpMemberDecorate %68 3 BuiltIn CullDistance\n" |
| "OpDecorate %68 Block\n" |
| "OpDecorate %72 Location 0\n" |
| "%2 = OpTypeVoid\n" |
| "%3 = OpTypeFunction %2\n" |
| "%6 = OpTypeInt 32 0\n" |
| "%7 = OpTypePointer Function %6\n" |
| "%9 = OpConstant %6 0\n" |
| "%10 = OpTypeVector %6 4\n" |
| "%11 = OpConstantComposite %10 %9 %9 %9 %9\n" |
| "%12 = OpTypeBool\n" |
| "%13 = OpConstantTrue %12\n" |
| "%14 = OpConstant %6 3\n" |
| "%16 = OpTypeVector %12 4\n" |
| "%20 = OpTypeInt 32 1\n" |
| "%21 = OpConstant %20 1\n" |
| "%22 = OpConstant %20 0\n" |
| "%27 = OpTypePointer Function %12\n" |
| "%29 = OpConstant %6 " + subgroupSizeStr.str() + "\n" |
| "%30 = OpTypeArray %6 %29\n" |
| "%31 = OpTypeStruct %30\n" |
| "%32 = OpTypePointer Uniform %31\n" |
| "%33 = OpVariable %32 Uniform\n" |
| "%34 = OpTypePointer Input %6\n" |
| "%35 = OpVariable %34 Input\n" |
| "%37 = OpTypePointer Uniform %6\n" |
| "%46 = OpConstant %20 2\n" |
| "%51 = OpConstantFalse %12\n" |
| "%55 = OpConstant %20 4\n" |
| "%60 = OpTypeFloat 32\n" |
| "%61 = OpTypePointer Output %60\n" |
| "%62 = OpVariable %61 Output\n" |
| "%65 = OpTypeVector %60 4\n" |
| "%66 = OpConstant %6 1\n" |
| "%67 = OpTypeArray %60 %66\n" |
| "%68 = OpTypeStruct %65 %60 %67 %67\n" |
| "%69 = OpTypePointer Output %68\n" |
| "%70 = OpVariable %69 Output\n" |
| "%71 = OpTypePointer Input %65\n" |
| "%72 = OpVariable %71 Input\n" |
| "%74 = OpTypePointer Output %65\n" |
| "%76 = OpConstant %60 1\n" |
| "%4 = OpFunction %2 None %3\n" |
| "%5 = OpLabel\n" |
| "%8 = OpVariable %7 Function\n" |
| "%28 = OpVariable %27 Function\n" |
| "OpStore %8 %9\n" |
| "%15 = " + (caseDef.extShaderSubGroupBallotTests ? "OpSubgroupBallotKHR %10 %13" : "OpGroupNonUniformBallot %10 %14 %13") + "\n" |
| "%17 = OpIEqual %16 %11 %15\n" |
| "%18 = OpAll %12 %17\n" |
| "%19 = OpLogicalNot %12 %18\n" |
| "%23 = OpSelect %20 %19 %21 %22\n" |
| "%24 = OpBitcast %6 %23\n" |
| "%25 = OpLoad %6 %8\n" |
| "%26 = OpBitwiseOr %6 %25 %24\n" |
| "OpStore %8 %26\n" |
| "%36 = OpLoad %6 %35\n" |
| "%38 = OpAccessChain %37 %33 %22 %36\n" |
| "%39 = OpLoad %6 %38\n" |
| "%40 = OpINotEqual %12 %39 %9\n" |
| "OpStore %28 %40\n" |
| "%41 = OpLoad %12 %28\n" |
| "%42 = " + (caseDef.extShaderSubGroupBallotTests ? "OpSubgroupBallotKHR %10 %41" : "OpGroupNonUniformBallot %10 %14 %41") + "\n" |
| "%43 = OpIEqual %16 %11 %42\n" |
| "%44 = OpAll %12 %43\n" |
| "%45 = OpLogicalNot %12 %44\n" |
| "%47 = OpSelect %20 %45 %46 %22\n" |
| "%48 = OpBitcast %6 %47\n" |
| "%49 = OpLoad %6 %8\n" |
| "%50 = OpBitwiseOr %6 %49 %48\n" |
| "OpStore %8 %50\n" |
| "%52 = " + (caseDef.extShaderSubGroupBallotTests ? "OpSubgroupBallotKHR %10 %51" : "OpGroupNonUniformBallot %10 %14 %51") + "\n" |
| "%53 = OpIEqual %16 %11 %52\n" |
| "%54 = OpAll %12 %53\n" |
| "%56 = OpSelect %20 %54 %55 %22\n" |
| "%57 = OpBitcast %6 %56\n" |
| "%58 = OpLoad %6 %8\n" |
| "%59 = OpBitwiseOr %6 %58 %57\n" |
| "OpStore %8 %59\n" |
| "%63 = OpLoad %6 %8\n" |
| "%64 = OpConvertUToF %60 %63\n" |
| "OpStore %62 %64\n" |
| "%73 = OpLoad %65 %72\n" |
| "%75 = OpAccessChain %74 %70 %22\n" |
| "OpStore %75 %73\n" |
| "%77 = OpAccessChain %61 %70 %21\n" |
| "OpStore %77 %76\n" |
| "OpReturn\n" |
| "OpFunctionEnd\n"; |
| programCollection.spirvAsmSources.add("vert") << vertex << buildOptionsSpr; |
| } |
| else if (VK_SHADER_STAGE_GEOMETRY_BIT == caseDef.shaderStage) |
| { |
| /* |
| "#extension GL_KHR_shader_subgroup_ballot: enable\n" |
| "layout(points) in;\n" |
| "layout(points, max_vertices = 1) out;\n" |
| "layout(location = 0) out float out_color;\n" |
| "layout(set = 0, binding = 0) uniform Buffer1\n" |
| "{\n" |
| " uint data[" << subgroups::maxSupportedSubgroupSize() << "];\n" |
| "};\n" |
| "\n" |
| "void main (void)\n" |
| "{\n" |
| " uint tempResult = 0;\n" |
| " tempResult |= !bool(uvec4(0) == subgroupBallot(true)) ? 0x1 : 0;\n" |
| " bool bData = data[gl_SubgroupInvocationID] != 0;\n" |
| " tempResult |= !bool(uvec4(0) == subgroupBallot(bData)) ? 0x2 : 0;\n" |
| " tempResult |= uvec4(0) == subgroupBallot(false) ? 0x4 : 0;\n" |
| " out_color = float(tempResult);\n" |
| " gl_Position = gl_in[0].gl_Position;\n" |
| " gl_PointSize = gl_in[0].gl_PointSize;\n" |
| " EmitVertex();\n" |
| " EndPrimitive();\n" |
| "}\n"; |
| */ |
| std::ostringstream geometry; |
| geometry |
| << "; SPIR-V\n" |
| << "; Version: 1.3\n" |
| << "; Generator: Khronos Glslang Reference Front End; 2\n" |
| << "; Bound: 80\n" |
| << "; Schema: 0\n" |
| << "OpCapability Geometry\n" |
| << (*caseDef.geometryPointSizeSupported ? "OpCapability GeometryPointSize\n" : "") |
| << "OpCapability GroupNonUniform\n" |
| << capabilityBallotHeader.c_str() |
| << extensionHeader.c_str() |
| << "%1 = OpExtInstImport \"GLSL.std.450\"\n" |
| << "OpMemoryModel Logical GLSL450\n" |
| << "OpEntryPoint Geometry %4 \"main\" %35 %62 %70 %74\n" |
| << "OpExecutionMode %4 InputPoints\n" |
| << "OpExecutionMode %4 Invocations 1\n" |
| << "OpExecutionMode %4 OutputPoints\n" |
| << "OpExecutionMode %4 OutputVertices 1\n" |
| << "OpDecorate %30 ArrayStride 16\n" |
| << "OpMemberDecorate %31 0 Offset 0\n" |
| << "OpDecorate %31 Block\n" |
| << "OpDecorate %33 DescriptorSet 0\n" |
| << "OpDecorate %33 Binding 0\n" |
| << "OpDecorate %35 RelaxedPrecision\n" |
| << "OpDecorate %35 BuiltIn SubgroupLocalInvocationId\n" |
| << "OpDecorate %36 RelaxedPrecision\n" |
| << "OpDecorate %62 Location 0\n" |
| << "OpMemberDecorate %68 0 BuiltIn Position\n" |
| << "OpMemberDecorate %68 1 BuiltIn PointSize\n" |
| << "OpMemberDecorate %68 2 BuiltIn ClipDistance\n" |
| << "OpMemberDecorate %68 3 BuiltIn CullDistance\n" |
| << "OpDecorate %68 Block\n" |
| << "OpMemberDecorate %71 0 BuiltIn Position\n" |
| << "OpMemberDecorate %71 1 BuiltIn PointSize\n" |
| << "OpMemberDecorate %71 2 BuiltIn ClipDistance\n" |
| << "OpMemberDecorate %71 3 BuiltIn CullDistance\n" |
| << "OpDecorate %71 Block\n" |
| << "%2 = OpTypeVoid\n" |
| << "%3 = OpTypeFunction %2\n" |
| << "%6 = OpTypeInt 32 0\n" |
| << "%7 = OpTypePointer Function %6\n" |
| << "%9 = OpConstant %6 0\n" |
| << "%10 = OpTypeVector %6 4\n" |
| << "%11 = OpConstantComposite %10 %9 %9 %9 %9\n" |
| << "%12 = OpTypeBool\n" |
| << "%13 = OpConstantTrue %12\n" |
| << "%14 = OpConstant %6 3\n" |
| << "%16 = OpTypeVector %12 4\n" |
| << "%20 = OpTypeInt 32 1\n" |
| << "%21 = OpConstant %20 1\n" |
| << "%22 = OpConstant %20 0\n" |
| << "%27 = OpTypePointer Function %12\n" |
| << "%29 = OpConstant %6 " << subgroupSizeStr.str() << "\n" |
| << "%30 = OpTypeArray %6 %29\n" |
| << "%31 = OpTypeStruct %30\n" |
| << "%32 = OpTypePointer Uniform %31\n" |
| << "%33 = OpVariable %32 Uniform\n" |
| << "%34 = OpTypePointer Input %6\n" |
| << "%35 = OpVariable %34 Input\n" |
| << "%37 = OpTypePointer Uniform %6\n" |
| << "%46 = OpConstant %20 2\n" |
| << "%51 = OpConstantFalse %12\n" |
| << "%55 = OpConstant %20 4\n" |
| << "%60 = OpTypeFloat 32\n" |
| << "%61 = OpTypePointer Output %60\n" |
| << "%62 = OpVariable %61 Output\n" |
| << "%65 = OpTypeVector %60 4\n" |
| << "%66 = OpConstant %6 1\n" |
| << "%67 = OpTypeArray %60 %66\n" |
| << "%68 = OpTypeStruct %65 %60 %67 %67\n" |
| << "%69 = OpTypePointer Output %68\n" |
| << "%70 = OpVariable %69 Output\n" |
| << "%71 = OpTypeStruct %65 %60 %67 %67\n" |
| << "%72 = OpTypeArray %71 %66\n" |
| << "%73 = OpTypePointer Input %72\n" |
| << "%74 = OpVariable %73 Input\n" |
| << "%75 = OpTypePointer Input %65\n" |
| << "%78 = OpTypePointer Output %65\n" |
| << (*caseDef.geometryPointSizeSupported ? |
| "%80 = OpTypePointer Input %60\n" |
| "%81 = OpTypePointer Output %60\n" : "") |
| << "%4 = OpFunction %2 None %3\n" |
| << "%5 = OpLabel\n" |
| << "%8 = OpVariable %7 Function\n" |
| << "%28 = OpVariable %27 Function\n" |
| << "OpStore %8 %9\n" |
| << "%15 = " << (caseDef.extShaderSubGroupBallotTests ? "OpSubgroupBallotKHR %10 %13" : "OpGroupNonUniformBallot %10 %14 %13") << "\n" |
| << "%17 = OpIEqual %16 %11 %15\n" |
| << "%18 = OpAll %12 %17\n" |
| << "%19 = OpLogicalNot %12 %18\n" |
| << "%23 = OpSelect %20 %19 %21 %22\n" |
| << "%24 = OpBitcast %6 %23\n" |
| << "%25 = OpLoad %6 %8\n" |
| << "%26 = OpBitwiseOr %6 %25 %24\n" |
| << "OpStore %8 %26\n" |
| << "%36 = OpLoad %6 %35\n" |
| << "%38 = OpAccessChain %37 %33 %22 %36\n" |
| << "%39 = OpLoad %6 %38\n" |
| << "%40 = OpINotEqual %12 %39 %9\n" |
| << "OpStore %28 %40\n" |
| << "%41 = OpLoad %12 %28\n" |
| << "%42 = " << (caseDef.extShaderSubGroupBallotTests ? "OpSubgroupBallotKHR %10 %41" : "OpGroupNonUniformBallot %10 %14 %41") << "\n" |
| << "%43 = OpIEqual %16 %11 %42\n" |
| << "%44 = OpAll %12 %43\n" |
| << "%45 = OpLogicalNot %12 %44\n" |
| << "%47 = OpSelect %20 %45 %46 %22\n" |
| << "%48 = OpBitcast %6 %47\n" |
| << "%49 = OpLoad %6 %8\n" |
| << "%50 = OpBitwiseOr %6 %49 %48\n" |
| << "OpStore %8 %50\n" |
| << "%52 = " << (caseDef.extShaderSubGroupBallotTests ? "OpSubgroupBallotKHR %10 %51" : "OpGroupNonUniformBallot %10 %14 %51") << "\n" |
| << "%53 = OpIEqual %16 %11 %52\n" |
| << "%54 = OpAll %12 %53\n" |
| << "%56 = OpSelect %20 %54 %55 %22\n" |
| << "%57 = OpBitcast %6 %56\n" |
| << "%58 = OpLoad %6 %8\n" |
| << "%59 = OpBitwiseOr %6 %58 %57\n" |
| << "OpStore %8 %59\n" |
| << "%63 = OpLoad %6 %8\n" |
| << "%64 = OpConvertUToF %60 %63\n" |
| << "OpStore %62 %64\n" |
| << "%76 = OpAccessChain %75 %74 %22 %22\n" |
| << "%77 = OpLoad %65 %76\n" |
| << "%79 = OpAccessChain %78 %70 %22\n" |
| << "OpStore %79 %77\n" |
| << (*caseDef.geometryPointSizeSupported ? |
| "%82 = OpAccessChain %80 %74 %22 %21\n" |
| "%83 = OpLoad %60 %82\n" |
| "%84 = OpAccessChain %81 %70 %21\n" |
| "OpStore %84 %83\n" : "") |
| << "OpEmitVertex\n" |
| << "OpEndPrimitive\n" |
| << "OpReturn\n" |
| << "OpFunctionEnd\n"; |
| programCollection.spirvAsmSources.add("geometry") << geometry.str() << buildOptionsSpr; |
| } |
| else if (VK_SHADER_STAGE_TESSELLATION_CONTROL_BIT == caseDef.shaderStage) |
| { |
| /* |
| "#extension GL_KHR_shader_subgroup_ballot: enable\n" |
| "layout(vertices = 2) out;\n" |
| "layout(location = 0) out float out_color[];\n" |
| "layout(set = 0, binding = 0) uniform Buffer1\n" |
| "{\n" |
| " uint data[" << subgroups::maxSupportedSubgroupSize() << "];\n" |
| "};\n" |
| "\n" |
| "void main (void)\n" |
| "{\n" |
| " if (gl_InvocationID == 0)\n" |
| {\n" |
| " gl_TessLevelOuter[0] = 1.0f;\n" |
| " gl_TessLevelOuter[1] = 1.0f;\n" |
| " }\n" |
| " uint tempResult = 0;\n" |
| " tempResult |= !bool(uvec4(0) == subgroupBallot(true)) ? 0x1 : 0;\n" |
| " bool bData = data[gl_SubgroupInvocationID] != 0;\n" |
| " tempResult |= !bool(uvec4(0) == subgroupBallot(bData)) ? 0x2 : 0;\n" |
| " tempResult |= uvec4(0) == subgroupBallot(false) ? 0x4 : 0;\n" |
| " out_color[gl_InvocationID] = float(tempResult);\n" |
| " gl_out[gl_InvocationID].gl_Position = gl_in[gl_InvocationID].gl_Position;\n" |
| "}\n"; |
| */ |
| const string controlSource = |
| "; SPIR-V\n" |
| "; Version: 1.3\n" |
| "; Generator: Khronos Glslang Reference Front End; 2\n" |
| "; Bound: 102\n" |
| "; Schema: 0\n" |
| "OpCapability Tessellation\n" |
| "OpCapability GroupNonUniform\n" |
| + capabilityBallotHeader |
| + extensionHeader + |
| "%1 = OpExtInstImport \"GLSL.std.450\"\n" |
| "OpMemoryModel Logical GLSL450\n" |
| "OpEntryPoint TessellationControl %4 \"main\" %8 %20 %50 %78 %89 %95\n" |
| "OpExecutionMode %4 OutputVertices 2\n" |
| "OpDecorate %8 BuiltIn InvocationId\n" |
| "OpDecorate %20 Patch\n" |
| "OpDecorate %20 BuiltIn TessLevelOuter\n" |
| "OpDecorate %45 ArrayStride 16\n" |
| "OpMemberDecorate %46 0 Offset 0\n" |
| "OpDecorate %46 Block\n" |
| "OpDecorate %48 DescriptorSet 0\n" |
| "OpDecorate %48 Binding 0\n" |
| "OpDecorate %50 RelaxedPrecision\n" |
| "OpDecorate %50 BuiltIn SubgroupLocalInvocationId\n" |
| "OpDecorate %51 RelaxedPrecision\n" |
| "OpDecorate %78 Location 0\n" |
| "OpMemberDecorate %86 0 BuiltIn Position\n" |
| "OpMemberDecorate %86 1 BuiltIn PointSize\n" |
| "OpMemberDecorate %86 2 BuiltIn ClipDistance\n" |
| "OpMemberDecorate %86 3 BuiltIn CullDistance\n" |
| "OpDecorate %86 Block\n" |
| "OpMemberDecorate %91 0 BuiltIn Position\n" |
| "OpMemberDecorate %91 1 BuiltIn PointSize\n" |
| "OpMemberDecorate %91 2 BuiltIn ClipDistance\n" |
| "OpMemberDecorate %91 3 BuiltIn CullDistance\n" |
| "OpDecorate %91 Block\n" |
| "%2 = OpTypeVoid\n" |
| "%3 = OpTypeFunction %2\n" |
| "%6 = OpTypeInt 32 1\n" |
| "%7 = OpTypePointer Input %6\n" |
| "%8 = OpVariable %7 Input\n" |
| "%10 = OpConstant %6 0\n" |
| "%11 = OpTypeBool\n" |
| "%15 = OpTypeFloat 32\n" |
| "%16 = OpTypeInt 32 0\n" |
| "%17 = OpConstant %16 4\n" |
| "%18 = OpTypeArray %15 %17\n" |
| "%19 = OpTypePointer Output %18\n" |
| "%20 = OpVariable %19 Output\n" |
| "%21 = OpConstant %15 1\n" |
| "%22 = OpTypePointer Output %15\n" |
| "%24 = OpConstant %6 1\n" |
| "%26 = OpTypePointer Function %16\n" |
| "%28 = OpConstant %16 0\n" |
| "%29 = OpTypeVector %16 4\n" |
| "%30 = OpConstantComposite %29 %28 %28 %28 %28\n" |
| "%31 = OpConstantTrue %11\n" |
| "%32 = OpConstant %16 3\n" |
| "%34 = OpTypeVector %11 4\n" |
| "%42 = OpTypePointer Function %11\n" |
| "%44 = OpConstant %16 " + subgroupSizeStr.str() + "\n" |
| "%45 = OpTypeArray %16 %44\n" |
| "%46 = OpTypeStruct %45\n" |
| "%47 = OpTypePointer Uniform %46\n" |
| "%48 = OpVariable %47 Uniform\n" |
| "%49 = OpTypePointer Input %16\n" |
| "%50 = OpVariable %49 Input\n" |
| "%52 = OpTypePointer Uniform %16\n" |
| "%61 = OpConstant %6 2\n" |
| "%66 = OpConstantFalse %11\n" |
| "%70 = OpConstant %6 4\n" |
| "%75 = OpConstant %16 2\n" |
| "%76 = OpTypeArray %15 %75\n" |
| "%77 = OpTypePointer Output %76\n" |
| "%78 = OpVariable %77 Output\n" |
| "%83 = OpTypeVector %15 4\n" |
| "%84 = OpConstant %16 1\n" |
| "%85 = OpTypeArray %15 %84\n" |
| "%86 = OpTypeStruct %83 %15 %85 %85\n" |
| "%87 = OpTypeArray %86 %75\n" |
| "%88 = OpTypePointer Output %87\n" |
| "%89 = OpVariable %88 Output\n" |
| "%91 = OpTypeStruct %83 %15 %85 %85\n" |
| "%92 = OpConstant %16 32\n" |
| "%93 = OpTypeArray %91 %92\n" |
| "%94 = OpTypePointer Input %93\n" |
| "%95 = OpVariable %94 Input\n" |
| "%97 = OpTypePointer Input %83\n" |
| "%100 = OpTypePointer Output %83\n" |
| "%4 = OpFunction %2 None %3\n" |
| "%5 = OpLabel\n" |
| "%27 = OpVariable %26 Function\n" |
| "%43 = OpVariable %42 Function\n" |
| "%9 = OpLoad %6 %8\n" |
| "%12 = OpIEqual %11 %9 %10\n" |
| "OpSelectionMerge %14 None\n" |
| "OpBranchConditional %12 %13 %14\n" |
| "%13 = OpLabel\n" |
| "%23 = OpAccessChain %22 %20 %10\n" |
| "OpStore %23 %21\n" |
| "%25 = OpAccessChain %22 %20 %24\n" |
| "OpStore %25 %21\n" |
| "OpBranch %14\n" |
| "%14 = OpLabel\n" |
| "OpStore %27 %28\n" |
| "%33 = " + (caseDef.extShaderSubGroupBallotTests ? "OpSubgroupBallotKHR %29 %31" : "OpGroupNonUniformBallot %29 %32 %31") + "\n" |
| "%35 = OpIEqual %34 %30 %33\n" |
| "%36 = OpAll %11 %35\n" |
| "%37 = OpLogicalNot %11 %36\n" |
| "%38 = OpSelect %6 %37 %24 %10\n" |
| "%39 = OpBitcast %16 %38\n" |
| "%40 = OpLoad %16 %27\n" |
| "%41 = OpBitwiseOr %16 %40 %39\n" |
| "OpStore %27 %41\n" |
| "%51 = OpLoad %16 %50\n" |
| "%53 = OpAccessChain %52 %48 %10 %51\n" |
| "%54 = OpLoad %16 %53\n" |
| "%55 = OpINotEqual %11 %54 %28\n" |
| "OpStore %43 %55\n" |
| "%56 = OpLoad %11 %43\n" |
| "%57 = " + (caseDef.extShaderSubGroupBallotTests ? "OpSubgroupBallotKHR %29 %56" : "OpGroupNonUniformBallot %29 %32 %56") + "\n" |
| "%58 = OpIEqual %34 %30 %57\n" |
| "%59 = OpAll %11 %58\n" |
| "%60 = OpLogicalNot %11 %59\n" |
| "%62 = OpSelect %6 %60 %61 %10\n" |
| "%63 = OpBitcast %16 %62\n" |
| "%64 = OpLoad %16 %27\n" |
| "%65 = OpBitwiseOr %16 %64 %63\n" |
| "OpStore %27 %65\n" |
| "%67 = " + (caseDef.extShaderSubGroupBallotTests ? "OpSubgroupBallotKHR %29 %66" : "OpGroupNonUniformBallot %29 %32 %66") + "\n" |
| "%68 = OpIEqual %34 %30 %67\n" |
| "%69 = OpAll %11 %68\n" |
| "%71 = OpSelect %6 %69 %70 %10\n" |
| "%72 = OpBitcast %16 %71\n" |
| "%73 = OpLoad %16 %27\n" |
| "%74 = OpBitwiseOr %16 %73 %72\n" |
| "OpStore %27 %74\n" |
| "%79 = OpLoad %6 %8\n" |
| "%80 = OpLoad %16 %27\n" |
| "%81 = OpConvertUToF %15 %80\n" |
| "%82 = OpAccessChain %22 %78 %79\n" |
| "OpStore %82 %81\n" |
| "%90 = OpLoad %6 %8\n" |
| "%96 = OpLoad %6 %8\n" |
| "%98 = OpAccessChain %97 %95 %96 %10\n" |
| "%99 = OpLoad %83 %98\n" |
| "%101 = OpAccessChain %100 %89 %90 %10\n" |
| "OpStore %101 %99\n" |
| "OpReturn\n" |
| "OpFunctionEnd\n"; |
| |
| programCollection.spirvAsmSources.add("tesc") << controlSource << buildOptionsSpr; |
| subgroups::setTesEvalShaderFrameBuffer(programCollection); |
| |
| } |
| else if (VK_SHADER_STAGE_TESSELLATION_EVALUATION_BIT == caseDef.shaderStage) |
| { |
| /* |
| "#extension GL_KHR_shader_subgroup_ballot: enable\n" |
| "layout(isolines, equal_spacing, ccw ) in;\n" |
| "layout(location = 0) out float out_color;\n" |
| "layout(set = 0, binding = 0) uniform Buffer1\n" |
| "{\n" |
| " uint data[" << subgroups::maxSupportedSubgroupSize() << "];\n" |
| "};\n" |
| "\n" |
| "void main (void)\n" |
| "{\n" |
| " uint tempResult = 0;\n" |
| " tempResult |= !bool(uvec4(0) == subgroupBallot(true)) ? 0x1 : 0;\n" |
| " bool bData = data[gl_SubgroupInvocationID] != 0;\n" |
| " tempResult |= !bool(uvec4(0) == subgroupBallot(bData)) ? 0x2 : 0;\n" |
| " tempResult |= uvec4(0) == subgroupBallot(false) ? 0x4 : 0;\n" |
| " out_color = float(tempResult);\n" |
| " gl_Position = mix(gl_in[0].gl_Position, gl_in[1].gl_Position, gl_TessCoord.x);\n" |
| "}\n"; |
| */ |
| const string evaluationSource = |
| "; SPIR-V\n" |
| "; Version: 1.3\n" |
| "; Generator: Khronos Glslang Reference Front End; 2\n" |
| "; Bound: 91\n" |
| "; Schema: 0\n" |
| "OpCapability Tessellation\n" |
| "OpCapability GroupNonUniform\n" |
| + capabilityBallotHeader |
| + extensionHeader + |
| "%1 = OpExtInstImport \"GLSL.std.450\"\n" |
| "OpMemoryModel Logical GLSL450\n" |
| "OpEntryPoint TessellationEvaluation %4 \"main\" %35 %62 %70 %75 %83\n" |
| "OpExecutionMode %4 Isolines\n" |
| "OpExecutionMode %4 SpacingEqual\n" |
| "OpExecutionMode %4 VertexOrderCcw\n" |
| "OpDecorate %30 ArrayStride 16\n" |
| "OpMemberDecorate %31 0 Offset 0\n" |
| "OpDecorate %31 Block\n" |
| "OpDecorate %33 DescriptorSet 0\n" |
| "OpDecorate %33 Binding 0\n" |
| "OpDecorate %35 RelaxedPrecision\n" |
| "OpDecorate %35 BuiltIn SubgroupLocalInvocationId\n" |
| "OpDecorate %36 RelaxedPrecision\n" |
| "OpDecorate %62 Location 0\n" |
| "OpMemberDecorate %68 0 BuiltIn Position\n" |
| "OpMemberDecorate %68 1 BuiltIn PointSize\n" |
| "OpMemberDecorate %68 2 BuiltIn ClipDistance\n" |
| "OpMemberDecorate %68 3 BuiltIn CullDistance\n" |
| "OpDecorate %68 Block\n" |
| "OpMemberDecorate %71 0 BuiltIn Position\n" |
| "OpMemberDecorate %71 1 BuiltIn PointSize\n" |
| "OpMemberDecorate %71 2 BuiltIn ClipDistance\n" |
| "OpMemberDecorate %71 3 BuiltIn CullDistance\n" |
| "OpDecorate %71 Block\n" |
| "OpDecorate %83 BuiltIn TessCoord\n" |
| "%2 = OpTypeVoid\n" |
| "%3 = OpTypeFunction %2\n" |
| "%6 = OpTypeInt 32 0\n" |
| "%7 = OpTypePointer Function %6\n" |
| "%9 = OpConstant %6 0\n" |
| "%10 = OpTypeVector %6 4\n" |
| "%11 = OpConstantComposite %10 %9 %9 %9 %9\n" |
| "%12 = OpTypeBool\n" |
| "%13 = OpConstantTrue %12\n" |
| "%14 = OpConstant %6 3\n" |
| "%16 = OpTypeVector %12 4\n" |
| "%20 = OpTypeInt 32 1\n" |
| "%21 = OpConstant %20 1\n" |
| "%22 = OpConstant %20 0\n" |
| "%27 = OpTypePointer Function %12\n" |
| "%29 = OpConstant %6 " + subgroupSizeStr.str() + "\n" |
| "%30 = OpTypeArray %6 %29\n" |
| "%31 = OpTypeStruct %30\n" |
| "%32 = OpTypePointer Uniform %31\n" |
| "%33 = OpVariable %32 Uniform\n" |
| "%34 = OpTypePointer Input %6\n" |
| "%35 = OpVariable %34 Input\n" |
| "%37 = OpTypePointer Uniform %6\n" |
| "%46 = OpConstant %20 2\n" |
| "%51 = OpConstantFalse %12\n" |
| "%55 = OpConstant %20 4\n" |
| "%60 = OpTypeFloat 32\n" |
| "%61 = OpTypePointer Output %60\n" |
| "%62 = OpVariable %61 Output\n" |
| "%65 = OpTypeVector %60 4\n" |
| "%66 = OpConstant %6 1\n" |
| "%67 = OpTypeArray %60 %66\n" |
| "%68 = OpTypeStruct %65 %60 %67 %67\n" |
| "%69 = OpTypePointer Output %68\n" |
| "%70 = OpVariable %69 Output\n" |
| "%71 = OpTypeStruct %65 %60 %67 %67\n" |
| "%72 = OpConstant %6 32\n" |
| "%73 = OpTypeArray %71 %72\n" |
| "%74 = OpTypePointer Input %73\n" |
| "%75 = OpVariable %74 Input\n" |
| "%76 = OpTypePointer Input %65\n" |
| "%81 = OpTypeVector %60 3\n" |
| "%82 = OpTypePointer Input %81\n" |
| "%83 = OpVariable %82 Input\n" |
| "%84 = OpTypePointer Input %60\n" |
| "%89 = OpTypePointer Output %65\n" |
| "%4 = OpFunction %2 None %3\n" |
| "%5 = OpLabel\n" |
| "%8 = OpVariable %7 Function\n" |
| "%28 = OpVariable %27 Function\n" |
| "OpStore %8 %9\n" |
| "%15 = " + (caseDef.extShaderSubGroupBallotTests ? "OpSubgroupBallotKHR %10 %13" : "OpGroupNonUniformBallot %10 %14 %13") + "\n" |
| "%17 = OpIEqual %16 %11 %15\n" |
| "%18 = OpAll %12 %17\n" |
| "%19 = OpLogicalNot %12 %18\n" |
| "%23 = OpSelect %20 %19 %21 %22\n" |
| "%24 = OpBitcast %6 %23\n" |
| "%25 = OpLoad %6 %8\n" |
| "%26 = OpBitwiseOr %6 %25 %24\n" |
| "OpStore %8 %26\n" |
| "%36 = OpLoad %6 %35\n" |
| "%38 = OpAccessChain %37 %33 %22 %36\n" |
| "%39 = OpLoad %6 %38\n" |
| "%40 = OpINotEqual %12 %39 %9\n" |
| "OpStore %28 %40\n" |
| "%41 = OpLoad %12 %28\n" |
| "%42 = " + (caseDef.extShaderSubGroupBallotTests ? "OpSubgroupBallotKHR %10 %41" : "OpGroupNonUniformBallot %10 %14 %41") + "\n" |
| "%43 = OpIEqual %16 %11 %42\n" |
| "%44 = OpAll %12 %43\n" |
| "%45 = OpLogicalNot %12 %44\n" |
| "%47 = OpSelect %20 %45 %46 %22\n" |
| "%48 = OpBitcast %6 %47\n" |
| "%49 = OpLoad %6 %8\n" |
| "%50 = OpBitwiseOr %6 %49 %48\n" |
| "OpStore %8 %50\n" |
| "%52 = " + (caseDef.extShaderSubGroupBallotTests ? "OpSubgroupBallotKHR %10 %51" : "OpGroupNonUniformBallot %10 %14 %51") + "\n" |
| "%53 = OpIEqual %16 %11 %52\n" |
| "%54 = OpAll %12 %53\n" |
| "%56 = OpSelect %20 %54 %55 %22\n" |
| "%57 = OpBitcast %6 %56\n" |
| "%58 = OpLoad %6 %8\n" |
| "%59 = OpBitwiseOr %6 %58 %57\n" |
| "OpStore %8 %59\n" |
| "%63 = OpLoad %6 %8\n" |
| "%64 = OpConvertUToF %60 %63\n" |
| "OpStore %62 %64\n" |
| "%77 = OpAccessChain %76 %75 %22 %22\n" |
| "%78 = OpLoad %65 %77\n" |
| "%79 = OpAccessChain %76 %75 %21 %22\n" |
| "%80 = OpLoad %65 %79\n" |
| "%85 = OpAccessChain %84 %83 %9\n" |
| "%86 = OpLoad %60 %85\n" |
| "%87 = OpCompositeConstruct %65 %86 %86 %86 %86\n" |
| "%88 = OpExtInst %65 %1 FMix %78 %80 %87\n" |
| "%90 = OpAccessChain %89 %70 %22\n" |
| "OpStore %90 %88\n" |
| "OpReturn\n" |
| "OpFunctionEnd\n"; |
| subgroups::setTesCtrlShaderFrameBuffer(programCollection); |
| programCollection.spirvAsmSources.add("tese") << evaluationSource << buildOptionsSpr; |
| } |
| else |
| { |
| DE_FATAL("Unsupported shader stage"); |
| } |
| } |
| |
| |
| void initPrograms(SourceCollections& programCollection, CaseDefinition caseDef) |
| { |
| const string extensionHeader = (caseDef.extShaderSubGroupBallotTests ? |
| "#extension GL_ARB_shader_ballot: enable\n" |
| "#extension GL_ARB_gpu_shader_int64: enable\n" |
| "#extension GL_KHR_shader_subgroup_basic: enable\n" |
| : |
| "#extension GL_KHR_shader_subgroup_ballot: enable\n"); |
| |
| if (VK_SHADER_STAGE_COMPUTE_BIT == caseDef.shaderStage) |
| { |
| std::ostringstream src; |
| |
| src << "#version 450\n" |
| << extensionHeader.c_str() |
| << "layout (local_size_x_id = 0, local_size_y_id = 1, " |
| "local_size_z_id = 2) in;\n" |
| << "layout(set = 0, binding = 0, std430) buffer Buffer1\n" |
| << "{\n" |
| << " uint result[];\n" |
| << "};\n" |
| << "layout(set = 0, binding = 1, std430) buffer Buffer2\n" |
| << "{\n" |
| << " uint data[];\n" |
| << "};\n" |
| << "\n" |
| << (caseDef.extShaderSubGroupBallotTests ? subgroups::getSharedMemoryBallotHelperARB() : subgroups::getSharedMemoryBallotHelper()) |
| << "void main (void)\n" |
| << "{\n" |
| << " uvec3 globalSize = gl_NumWorkGroups * gl_WorkGroupSize;\n" |
| << " highp uint offset = globalSize.x * ((globalSize.y * " |
| "gl_GlobalInvocationID.z) + gl_GlobalInvocationID.y) + " |
| "gl_GlobalInvocationID.x;\n" |
| << " uint tempResult = 0;\n" |
| << " tempResult |= sharedMemoryBallot(true) == " << (caseDef.extShaderSubGroupBallotTests ? "ballotARB" : "subgroupBallot") << "(true) ? 0x1 : 0;\n" |
| << " bool bData = data[gl_SubgroupInvocationID] != 0;\n" |
| << " tempResult |= sharedMemoryBallot(bData) == " << (caseDef.extShaderSubGroupBallotTests ? "ballotARB" : "subgroupBallot") << "(bData) ? 0x2 : 0;\n" |
| << " tempResult |= " << (caseDef.extShaderSubGroupBallotTests ? "uint64_t(0) == ballotARB" : "uvec4(0) == subgroupBallot") << "(false) ? 0x4 : 0;\n" |
| << " result[offset] = tempResult;\n" |
| << "}\n"; |
| |
| programCollection.glslSources.add("comp") |
| << glu::ComputeSource(src.str()) << vk::ShaderBuildOptions(programCollection.usedVulkanVersion, vk::SPIRV_VERSION_1_3, 0u); |
| } |
| else |
| { |
| const string cmpStr = (caseDef.extShaderSubGroupBallotTests ? "uint64_t(0) == ballotARB" : "uvec4(0) == subgroupBallot"); |
| const string testSrc = |
| " uint tempResult = 0;\n" |
| " tempResult |= !bool(" + cmpStr + "(true)) ? 0x1 : 0;\n" |
| " bool bData = data[gl_SubgroupInvocationID] != 0;\n" |
| " tempResult |= !bool(" + cmpStr + "(bData)) ? 0x2 : 0;\n" |
| " tempResult |= " + cmpStr + "(false) ? 0x4 : 0;\n"; |
| |
| const string vertex = |
| "#version 450\n" |
| + extensionHeader + |
| "layout(set = 0, binding = 0, std430) buffer Buffer1\n" |
| "{\n" |
| " uint result[];\n" |
| "};\n" |
| "layout(set = 0, binding = 4, std430) readonly buffer Buffer2\n" |
| "{\n" |
| " uint data[];\n" |
| "};\n" |
| "\n" |
| "void main (void)\n" |
| "{\n" |
| + testSrc + |
| " result[gl_VertexIndex] = tempResult;\n" |
| " float pixelSize = 2.0f/1024.0f;\n" |
| " float pixelPosition = pixelSize/2.0f - 1.0f;\n" |
| " gl_Position = vec4(float(gl_VertexIndex) * pixelSize + pixelPosition, 0.0f, 0.0f, 1.0f);\n" |
| " gl_PointSize = 1.0f;\n" |
| "}\n"; |
| |
| const string tesc = |
| "#version 450\n" |
| + extensionHeader + |
| "layout(vertices=1) out;\n" |
| "layout(set = 0, binding = 1, std430) buffer Buffer1\n" |
| "{\n" |
| " uint result[];\n" |
| "};\n" |
| "layout(set = 0, binding = 4, std430) readonly buffer Buffer2\n" |
| "{\n" |
| " uint data[];\n" |
| "};\n" |
| "\n" |
| "void main (void)\n" |
| "{\n" |
| + testSrc + |
| " result[gl_PrimitiveID] = tempResult;\n" |
| " if (gl_InvocationID == 0)\n" |
| " {\n" |
| " gl_TessLevelOuter[0] = 1.0f;\n" |
| " gl_TessLevelOuter[1] = 1.0f;\n" |
| " }\n" |
| " gl_out[gl_InvocationID].gl_Position = gl_in[gl_InvocationID].gl_Position;\n" |
| "}\n"; |
| |
| const string tese = |
| "#version 450\n" |
| + extensionHeader + |
| "layout(isolines) in;\n" |
| "layout(set = 0, binding = 2, std430) buffer Buffer1\n" |
| "{\n" |
| " uint result[];\n" |
| "};\n" |
| "layout(set = 0, binding = 4, std430) readonly buffer Buffer2\n" |
| "{\n" |
| " uint data[];\n" |
| "};\n" |
| "\n" |
| "void main (void)\n" |
| "{\n" |
| + testSrc + |
| " result[gl_PrimitiveID * 2 + uint(gl_TessCoord.x + 0.5)] = tempResult;\n" |
| " float pixelSize = 2.0f/1024.0f;\n" |
| " gl_Position = gl_in[0].gl_Position + gl_TessCoord.x * pixelSize / 2.0f;\n" |
| "}\n"; |
| |
| const string geometry = |
| "#version 450\n" |
| + extensionHeader + |
| "layout(${TOPOLOGY}) in;\n" |
| "layout(points, max_vertices = 1) out;\n" |
| "layout(set = 0, binding = 3, std430) buffer Buffer1\n" |
| "{\n" |
| " uint result[];\n" |
| "};\n" |
| "layout(set = 0, binding = 4, std430) readonly buffer Buffer2\n" |
| "{\n" |
| " uint data[];\n" |
| "};\n" |
| "\n" |
| "void main (void)\n" |
| "{\n" |
| + testSrc + |
| " result[gl_PrimitiveIDIn] = tempResult;\n" |
| " gl_Position = gl_in[0].gl_Position;\n" |
| " EmitVertex();\n" |
| " EndPrimitive();\n" |
| "}\n"; |
| |
| const string fragment = |
| "#version 450\n" |
| + extensionHeader + |
| "layout(location = 0) out uint result;\n" |
| "layout(set = 0, binding = 4, std430) readonly buffer Buffer1\n" |
| "{\n" |
| " uint data[];\n" |
| "};\n" |
| "void main (void)\n" |
| "{\n" |
| + testSrc + |
| " result = tempResult;\n" |
| "}\n"; |
| |
| subgroups::addNoSubgroupShader(programCollection); |
| |
| programCollection.glslSources.add("vert") |
| << glu::VertexSource(vertex) << vk::ShaderBuildOptions(programCollection.usedVulkanVersion, vk::SPIRV_VERSION_1_3, 0u); |
| programCollection.glslSources.add("tesc") |
| << glu::TessellationControlSource(tesc) << vk::ShaderBuildOptions(programCollection.usedVulkanVersion, vk::SPIRV_VERSION_1_3, 0u); |
| programCollection.glslSources.add("tese") |
| << glu::TessellationEvaluationSource(tese) << vk::ShaderBuildOptions(programCollection.usedVulkanVersion, vk::SPIRV_VERSION_1_3, 0u); |
| subgroups::addGeometryShadersFromTemplate(geometry, vk::ShaderBuildOptions(programCollection.usedVulkanVersion, vk::SPIRV_VERSION_1_3, 0u), |
| programCollection.glslSources); |
| programCollection.glslSources.add("fragment") |
| << glu::FragmentSource(fragment)<< vk::ShaderBuildOptions(programCollection.usedVulkanVersion, vk::SPIRV_VERSION_1_3, 0u); |
| } |
| } |
| |
| void supportedCheck (Context& context, CaseDefinition caseDef) |
| { |
| if (!subgroups::isSubgroupSupported(context)) |
| TCU_THROW(NotSupportedError, "Subgroup operations are not supported"); |
| |
| if (!subgroups::isSubgroupFeatureSupportedForDevice(context, VK_SUBGROUP_FEATURE_BALLOT_BIT)) |
| { |
| TCU_THROW(NotSupportedError, "Device does not support subgroup ballot operations"); |
| } |
| |
| if (caseDef.extShaderSubGroupBallotTests && !context.requireDeviceFunctionality("VK_EXT_shader_subgroup_ballot")) |
| { |
| TCU_THROW(NotSupportedError, "Device does not support VK_EXT_shader_subgroup_ballot extension"); |
| } |
| |
| if (caseDef.extShaderSubGroupBallotTests && !subgroups::isInt64SupportedForDevice(context)) |
| { |
| TCU_THROW(NotSupportedError, "Device does not support int64 data types"); |
| } |
| |
| if (caseDef.requiredSubgroupSize) |
| { |
| if (!context.requireDeviceFunctionality("VK_EXT_subgroup_size_control")) |
| TCU_THROW(NotSupportedError, "Device does not support VK_EXT_subgroup_size_control extension"); |
| VkPhysicalDeviceSubgroupSizeControlFeaturesEXT subgroupSizeControlFeatures; |
| subgroupSizeControlFeatures.sType = VK_STRUCTURE_TYPE_PHYSICAL_DEVICE_SUBGROUP_SIZE_CONTROL_FEATURES_EXT; |
| subgroupSizeControlFeatures.pNext = DE_NULL; |
| |
| VkPhysicalDeviceFeatures2 features; |
| features.sType = VK_STRUCTURE_TYPE_PHYSICAL_DEVICE_FEATURES_2; |
| features.pNext = &subgroupSizeControlFeatures; |
| |
| context.getInstanceInterface().getPhysicalDeviceFeatures2(context.getPhysicalDevice(), &features); |
| |
| if (subgroupSizeControlFeatures.subgroupSizeControl == DE_FALSE) |
| TCU_THROW(NotSupportedError, "Device does not support varying subgroup sizes nor required subgroup size"); |
| |
| if (subgroupSizeControlFeatures.computeFullSubgroups == DE_FALSE) |
| TCU_THROW(NotSupportedError, "Device does not support full subgroups in compute shaders"); |
| } |
| |
| *caseDef.geometryPointSizeSupported = subgroups::isTessellationAndGeometryPointSizeSupported(context); |
| } |
| |
| tcu::TestStatus noSSBOtest (Context& context, const CaseDefinition caseDef) |
| { |
| if (!subgroups::areSubgroupOperationsSupportedForStage( |
| context, caseDef.shaderStage)) |
| { |
| if (subgroups::areSubgroupOperationsRequiredForStage(caseDef.shaderStage)) |
| { |
| return tcu::TestStatus::fail( |
| "Shader stage " + |
| subgroups::getShaderStageName(caseDef.shaderStage) + |
| " is required to support subgroup operations!"); |
| } |
| else |
| { |
| TCU_THROW(NotSupportedError, "Device does not support subgroup operations for this stage"); |
| } |
| } |
| |
| subgroups::SSBOData inputData[1]; |
| inputData[0].format = VK_FORMAT_R32_UINT; |
| inputData[0].layout = subgroups::SSBOData::LayoutStd140; |
| inputData[0].numElements = subgroups::maxSupportedSubgroupSize(); |
| inputData[0].initializeType = subgroups::SSBOData::InitializeNonZero; |
| |
| if (VK_SHADER_STAGE_VERTEX_BIT == caseDef.shaderStage) |
| return subgroups::makeVertexFrameBufferTest(context, VK_FORMAT_R32_UINT, inputData, 1, DE_NULL, checkVertexPipelineStages); |
| else if (VK_SHADER_STAGE_GEOMETRY_BIT == caseDef.shaderStage) |
| return subgroups::makeGeometryFrameBufferTest(context, VK_FORMAT_R32_UINT, inputData, 1, DE_NULL, checkVertexPipelineStages); |
| else if (VK_SHADER_STAGE_TESSELLATION_CONTROL_BIT == caseDef.shaderStage) |
| return subgroups::makeTessellationEvaluationFrameBufferTest(context, VK_FORMAT_R32_UINT, inputData, 1, DE_NULL, checkVertexPipelineStages, VK_SHADER_STAGE_TESSELLATION_CONTROL_BIT); |
| else if (VK_SHADER_STAGE_TESSELLATION_EVALUATION_BIT == caseDef.shaderStage) |
| return subgroups::makeTessellationEvaluationFrameBufferTest(context, VK_FORMAT_R32_UINT, inputData, 1, DE_NULL, checkVertexPipelineStages, VK_SHADER_STAGE_TESSELLATION_EVALUATION_BIT); |
| else |
| TCU_THROW(InternalError, "Unhandled shader stage"); |
| } |
| |
| tcu::TestStatus test(Context& context, const CaseDefinition caseDef) |
| { |
| if (VK_SHADER_STAGE_COMPUTE_BIT == caseDef.shaderStage) |
| { |
| if (!subgroups::areSubgroupOperationsSupportedForStage(context, caseDef.shaderStage)) |
| { |
| return tcu::TestStatus::fail( |
| "Shader stage " + |
| subgroups::getShaderStageName(caseDef.shaderStage) + |
| " is required to support subgroup operations!"); |
| } |
| subgroups::SSBOData inputData[1]; |
| inputData[0].format = VK_FORMAT_R32_UINT; |
| inputData[0].layout = subgroups::SSBOData::LayoutStd430; |
| inputData[0].numElements = subgroups::maxSupportedSubgroupSize(); |
| inputData[0].initializeType = subgroups::SSBOData::InitializeNonZero; |
| |
| if (caseDef.requiredSubgroupSize == DE_FALSE) |
| return subgroups::makeComputeTest(context, VK_FORMAT_R32_UINT, inputData, 1, DE_NULL, checkCompute); |
| |
| tcu::TestLog& log = context.getTestContext().getLog(); |
| VkPhysicalDeviceSubgroupSizeControlPropertiesEXT subgroupSizeControlProperties; |
| subgroupSizeControlProperties.sType = VK_STRUCTURE_TYPE_PHYSICAL_DEVICE_SUBGROUP_SIZE_CONTROL_PROPERTIES_EXT; |
| subgroupSizeControlProperties.pNext = DE_NULL; |
| VkPhysicalDeviceProperties2 properties; |
| properties.sType = VK_STRUCTURE_TYPE_PHYSICAL_DEVICE_PROPERTIES_2; |
| properties.pNext = &subgroupSizeControlProperties; |
| |
| context.getInstanceInterface().getPhysicalDeviceProperties2(context.getPhysicalDevice(), &properties); |
| |
| log << tcu::TestLog::Message << "Testing required subgroup size range [" << subgroupSizeControlProperties.minSubgroupSize << ", " |
| << subgroupSizeControlProperties.maxSubgroupSize << "]" << tcu::TestLog::EndMessage; |
| |
| // According to the spec, requiredSubgroupSize must be a power-of-two integer. |
| for (deUint32 size = subgroupSizeControlProperties.minSubgroupSize; size <= subgroupSizeControlProperties.maxSubgroupSize; size *= 2) |
| { |
| tcu::TestStatus result = subgroups::makeComputeTest(context, VK_FORMAT_R32_UINT, inputData, 1, DE_NULL, checkCompute, |
| size, VK_PIPELINE_SHADER_STAGE_CREATE_REQUIRE_FULL_SUBGROUPS_BIT_EXT); |
| if (result.getCode() != QP_TEST_RESULT_PASS) |
| { |
| log << tcu::TestLog::Message << "subgroupSize " << size << " failed" << tcu::TestLog::EndMessage; |
| return result; |
| } |
| } |
| |
| return tcu::TestStatus::pass("OK"); |
| } |
| else |
| { |
| VkPhysicalDeviceSubgroupProperties subgroupProperties; |
| subgroupProperties.sType = VK_STRUCTURE_TYPE_PHYSICAL_DEVICE_SUBGROUP_PROPERTIES; |
| subgroupProperties.pNext = DE_NULL; |
| |
| VkPhysicalDeviceProperties2 properties; |
| properties.sType = VK_STRUCTURE_TYPE_PHYSICAL_DEVICE_PROPERTIES_2; |
| properties.pNext = &subgroupProperties; |
| |
| context.getInstanceInterface().getPhysicalDeviceProperties2(context.getPhysicalDevice(), &properties); |
| |
| VkShaderStageFlagBits stages = (VkShaderStageFlagBits)(caseDef.shaderStage & subgroupProperties.supportedStages); |
| |
| if ( VK_SHADER_STAGE_FRAGMENT_BIT != stages && !subgroups::isVertexSSBOSupportedForDevice(context)) |
| { |
| if ( (stages & VK_SHADER_STAGE_FRAGMENT_BIT) == 0) |
| TCU_THROW(NotSupportedError, "Device does not support vertex stage SSBO writes"); |
| else |
| stages = VK_SHADER_STAGE_FRAGMENT_BIT; |
| } |
| |
| if ((VkShaderStageFlagBits)0u == stages) |
| TCU_THROW(NotSupportedError, "Subgroup operations are not supported for any graphic shader"); |
| |
| subgroups::SSBOData inputData; |
| inputData.format = VK_FORMAT_R32_UINT; |
| inputData.layout = subgroups::SSBOData::LayoutStd430; |
| inputData.numElements = subgroups::maxSupportedSubgroupSize(); |
| inputData.initializeType = subgroups::SSBOData::InitializeNonZero; |
| inputData.binding = 4u; |
| inputData.stages = stages; |
| |
| return subgroups::allStages(context, VK_FORMAT_R32_UINT, &inputData, 1, DE_NULL, checkVertexPipelineStages, stages); |
| } |
| } |
| } |
| |
| namespace vkt |
| { |
| namespace subgroups |
| { |
| tcu::TestCaseGroup* createSubgroupsBallotTests(tcu::TestContext& testCtx) |
| { |
| de::MovePtr<tcu::TestCaseGroup> graphicGroup(new tcu::TestCaseGroup( |
| testCtx, "graphics", "Subgroup ballot category tests: graphics")); |
| de::MovePtr<tcu::TestCaseGroup> computeGroup(new tcu::TestCaseGroup( |
| testCtx, "compute", "Subgroup ballot category tests: compute")); |
| de::MovePtr<tcu::TestCaseGroup> framebufferGroup(new tcu::TestCaseGroup( |
| testCtx, "framebuffer", "Subgroup ballot category tests: framebuffer")); |
| |
| de::MovePtr<tcu::TestCaseGroup> graphicGroupEXT(new tcu::TestCaseGroup( |
| testCtx, "graphics", "VK_EXT_shader_subgroups_ballot category tests: graphics")); |
| de::MovePtr<tcu::TestCaseGroup> computeGroupEXT(new tcu::TestCaseGroup( |
| testCtx, "compute", "VK_EXT_shader_subgroups_ballot category tests: compute")); |
| de::MovePtr<tcu::TestCaseGroup> framebufferGroupEXT(new tcu::TestCaseGroup( |
| testCtx, "framebuffer", "VK_EXT_shader_subgroups_ballot category tests: framebuffer")); |
| |
| const VkShaderStageFlags stages[] = |
| { |
| VK_SHADER_STAGE_TESSELLATION_EVALUATION_BIT, |
| VK_SHADER_STAGE_TESSELLATION_CONTROL_BIT, |
| VK_SHADER_STAGE_GEOMETRY_BIT, |
| VK_SHADER_STAGE_VERTEX_BIT |
| }; |
| |
| |
| { |
| CaseDefinition caseDef = {VK_SHADER_STAGE_COMPUTE_BIT, de::SharedPtr<bool>(new bool), DE_FALSE, DE_FALSE}; |
| addFunctionCaseWithPrograms(computeGroup.get(), getShaderStageName(caseDef.shaderStage), "", supportedCheck, initPrograms, test, caseDef); |
| caseDef.extShaderSubGroupBallotTests = DE_TRUE; |
| addFunctionCaseWithPrograms(computeGroupEXT.get(), getShaderStageName(caseDef.shaderStage), "", supportedCheck, initPrograms, test, caseDef); |
| |
| caseDef.requiredSubgroupSize = DE_TRUE; |
| caseDef.extShaderSubGroupBallotTests = DE_FALSE; |
| addFunctionCaseWithPrograms(computeGroup.get(), getShaderStageName(caseDef.shaderStage) + "_requiredsubgroupsize", "", supportedCheck, initPrograms, test, caseDef); |
| caseDef.extShaderSubGroupBallotTests = DE_TRUE; |
| addFunctionCaseWithPrograms(computeGroupEXT.get(), getShaderStageName(caseDef.shaderStage) + "_requiredsubgroupsize", "", supportedCheck, initPrograms, test, caseDef); |
| } |
| |
| { |
| CaseDefinition caseDef = {VK_SHADER_STAGE_ALL_GRAPHICS, de::SharedPtr<bool>(new bool), DE_FALSE, DE_FALSE}; |
| addFunctionCaseWithPrograms(graphicGroup.get(), "graphic", "", supportedCheck, initPrograms, test, caseDef); |
| caseDef.extShaderSubGroupBallotTests = DE_TRUE; |
| addFunctionCaseWithPrograms(graphicGroupEXT.get(), "graphic", "", supportedCheck, initPrograms, test, caseDef); |
| } |
| |
| for (int stageIndex = 0; stageIndex < DE_LENGTH_OF_ARRAY(stages); ++stageIndex) |
| { |
| CaseDefinition caseDef = {stages[stageIndex],de::SharedPtr<bool>(new bool), DE_FALSE, DE_FALSE}; |
| addFunctionCaseWithPrograms(framebufferGroup.get(), getShaderStageName(caseDef.shaderStage), "", |
| supportedCheck, initFrameBufferPrograms, noSSBOtest, caseDef); |
| caseDef.extShaderSubGroupBallotTests = DE_TRUE; |
| addFunctionCaseWithPrograms(framebufferGroupEXT.get(), getShaderStageName(caseDef.shaderStage), "", |
| supportedCheck, initFrameBufferPrograms, noSSBOtest, caseDef); |
| |
| } |
| |
| de::MovePtr<tcu::TestCaseGroup> groupEXT(new tcu::TestCaseGroup( |
| testCtx, "ext_shader_subgroup_ballot", "VK_EXT_shader_subgroups_ballot category tests")); |
| |
| groupEXT->addChild(graphicGroupEXT.release()); |
| groupEXT->addChild(computeGroupEXT.release()); |
| groupEXT->addChild(framebufferGroupEXT.release()); |
| |
| de::MovePtr<tcu::TestCaseGroup> group(new tcu::TestCaseGroup( |
| testCtx, "ballot", "Subgroup ballot category tests")); |
| |
| group->addChild(graphicGroup.release()); |
| group->addChild(computeGroup.release()); |
| group->addChild(framebufferGroup.release()); |
| |
| group->addChild(groupEXT.release()); |
| |
| return group.release(); |
| } |
| |
| } // subgroups |
| } // vkt |