| // Copyright 2021 The SwiftShader Authors. All Rights Reserved. |
| // |
| // Licensed under the Apache License, Version 2.0 (the "License"); |
| // you may not use this file except in compliance with the License. |
| // You may obtain a copy of the License at |
| // |
| // http://www.apache.org/licenses/LICENSE-2.0 |
| // |
| // Unless required by applicable law or agreed to in writing, software |
| // distributed under the License is distributed on an "AS IS" BASIS, |
| // WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. |
| // See the License for the specific language governing permissions and |
| // limitations under the License. |
| |
| #include "Device.hpp" |
| #include "Driver.hpp" |
| |
| #include "gmock/gmock.h" |
| #include "gtest/gtest.h" |
| |
| #include "spirv-tools/libspirv.hpp" |
| |
| #include <cstring> |
| #include <sstream> |
| |
| namespace { |
| size_t alignUp(size_t val, size_t alignment) |
| { |
| return alignment * ((val + alignment - 1) / alignment); |
| } |
| } // anonymous namespace |
| |
| struct ComputeParams |
| { |
| size_t numElements; |
| int localSizeX; |
| int localSizeY; |
| int localSizeZ; |
| |
| friend std::ostream &operator<<(std::ostream &os, const ComputeParams ¶ms) |
| { |
| return os << "ComputeParams{" |
| << "numElements: " << params.numElements << ", " |
| << "localSizeX: " << params.localSizeX << ", " |
| << "localSizeY: " << params.localSizeY << ", " |
| << "localSizeZ: " << params.localSizeZ << "}"; |
| } |
| }; |
| |
| class ComputeTest : public testing::TestWithParam<ComputeParams> |
| { |
| protected: |
| static Driver driver; |
| |
| static void SetUpTestSuite() |
| { |
| ASSERT_TRUE(driver.loadSwiftShader()); |
| } |
| |
| static void TearDownTestSuite() |
| { |
| driver.unload(); |
| } |
| }; |
| |
| Driver ComputeTest::driver; |
| |
| std::vector<uint32_t> compileSpirv(const char *assembly) |
| { |
| spvtools::SpirvTools core(SPV_ENV_VULKAN_1_0); |
| |
| core.SetMessageConsumer([](spv_message_level_t, const char *, const spv_position_t &p, const char *m) { |
| FAIL() << p.line << ":" << p.column << ": " << m; |
| }); |
| |
| std::vector<uint32_t> spirv; |
| EXPECT_TRUE(core.Assemble(assembly, &spirv)); |
| EXPECT_TRUE(core.Validate(spirv)); |
| |
| // Warn if the disassembly does not match the source assembly. |
| // We do this as debugging tests in the debugger is often made much harder |
| // if the SSA names (%X) in the debugger do not match the source. |
| std::string disassembled; |
| core.Disassemble(spirv, &disassembled, SPV_BINARY_TO_TEXT_OPTION_NO_HEADER); |
| if(disassembled != assembly) |
| { |
| printf("-- WARNING: Disassembly does not match assembly: ---\n\n"); |
| |
| auto splitLines = [](const std::string &str) -> std::vector<std::string> { |
| std::stringstream ss(str); |
| std::vector<std::string> out; |
| std::string line; |
| while(std::getline(ss, line, '\n')) { out.push_back(line); } |
| return out; |
| }; |
| |
| auto srcLines = splitLines(std::string(assembly)); |
| auto disLines = splitLines(disassembled); |
| |
| for(size_t line = 0; line < srcLines.size() && line < disLines.size(); line++) |
| { |
| auto srcLine = (line < srcLines.size()) ? srcLines[line] : "<missing>"; |
| auto disLine = (line < disLines.size()) ? disLines[line] : "<missing>"; |
| if(srcLine != disLine) |
| { |
| printf("%zu: '%s' != '%s'\n", line, srcLine.c_str(), disLine.c_str()); |
| } |
| } |
| printf("\n\n---\nExpected:\n\n%s", disassembled.c_str()); |
| } |
| |
| return spirv; |
| } |
| |
| #define VK_ASSERT(x) ASSERT_EQ(x, VK_SUCCESS) |
| |
| // Base class for compute tests that read from an input buffer and write to an |
| // output buffer of same length. |
| class SwiftShaderVulkanBufferToBufferComputeTest : public ComputeTest |
| { |
| public: |
| void test(const std::string &shader, |
| std::function<uint32_t(uint32_t idx)> input, |
| std::function<uint32_t(uint32_t idx)> expected); |
| }; |
| |
| void SwiftShaderVulkanBufferToBufferComputeTest::test( |
| const std::string &shader, |
| std::function<uint32_t(uint32_t idx)> input, |
| std::function<uint32_t(uint32_t idx)> expected) |
| { |
| auto code = compileSpirv(shader.c_str()); |
| |
| const VkInstanceCreateInfo createInfo = { |
| VK_STRUCTURE_TYPE_INSTANCE_CREATE_INFO, // sType |
| nullptr, // pNext |
| 0, // flags |
| nullptr, // pApplicationInfo |
| 0, // enabledLayerCount |
| nullptr, // ppEnabledLayerNames |
| 0, // enabledExtensionCount |
| nullptr, // ppEnabledExtensionNames |
| }; |
| |
| VkInstance instance = VK_NULL_HANDLE; |
| VK_ASSERT(driver.vkCreateInstance(&createInfo, nullptr, &instance)); |
| |
| ASSERT_TRUE(driver.resolve(instance)); |
| |
| std::unique_ptr<Device> device; |
| VK_ASSERT(Device::CreateComputeDevice(&driver, instance, device)); |
| ASSERT_TRUE(device->IsValid()); |
| |
| // struct Buffers |
| // { |
| // uint32_t pad0[63]; |
| // uint32_t magic0; |
| // uint32_t in[NUM_ELEMENTS]; // Aligned to 0x100 |
| // uint32_t magic1; |
| // uint32_t pad1[N]; |
| // uint32_t magic2; |
| // uint32_t out[NUM_ELEMENTS]; // Aligned to 0x100 |
| // uint32_t magic3; |
| // }; |
| static constexpr uint32_t magic0 = 0x01234567; |
| static constexpr uint32_t magic1 = 0x89abcdef; |
| static constexpr uint32_t magic2 = 0xfedcba99; |
| static constexpr uint32_t magic3 = 0x87654321; |
| size_t numElements = GetParam().numElements; |
| size_t alignElements = 0x100 / sizeof(uint32_t); |
| size_t magic0Offset = alignElements - 1; |
| size_t inOffset = 1 + magic0Offset; |
| size_t magic1Offset = numElements + inOffset; |
| size_t magic2Offset = alignUp(magic1Offset + 1, alignElements) - 1; |
| size_t outOffset = 1 + magic2Offset; |
| size_t magic3Offset = numElements + outOffset; |
| size_t buffersTotalElements = alignUp(1 + magic3Offset, alignElements); |
| size_t buffersSize = sizeof(uint32_t) * buffersTotalElements; |
| |
| VkDeviceMemory memory; |
| VK_ASSERT(device->AllocateMemory(buffersSize, |
| VK_MEMORY_PROPERTY_HOST_VISIBLE_BIT | VK_MEMORY_PROPERTY_HOST_COHERENT_BIT, |
| &memory)); |
| |
| uint32_t *buffers; |
| VK_ASSERT(device->MapMemory(memory, 0, buffersSize, 0, (void **)&buffers)); |
| |
| memset(buffers, 0, buffersSize); |
| |
| buffers[magic0Offset] = magic0; |
| buffers[magic1Offset] = magic1; |
| buffers[magic2Offset] = magic2; |
| buffers[magic3Offset] = magic3; |
| |
| for(size_t i = 0; i < numElements; i++) |
| { |
| buffers[inOffset + i] = input((uint32_t)i); |
| } |
| |
| device->UnmapMemory(memory); |
| buffers = nullptr; |
| |
| VkBuffer bufferIn; |
| VK_ASSERT(device->CreateStorageBuffer(memory, |
| sizeof(uint32_t) * numElements, |
| sizeof(uint32_t) * inOffset, |
| &bufferIn)); |
| |
| VkBuffer bufferOut; |
| VK_ASSERT(device->CreateStorageBuffer(memory, |
| sizeof(uint32_t) * numElements, |
| sizeof(uint32_t) * outOffset, |
| &bufferOut)); |
| |
| VkShaderModule shaderModule; |
| VK_ASSERT(device->CreateShaderModule(code, &shaderModule)); |
| |
| std::vector<VkDescriptorSetLayoutBinding> descriptorSetLayoutBindings = { |
| { |
| 0, // binding |
| VK_DESCRIPTOR_TYPE_STORAGE_BUFFER, // descriptorType |
| 1, // descriptorCount |
| VK_SHADER_STAGE_COMPUTE_BIT, // stageFlags |
| 0, // pImmutableSamplers |
| }, |
| { |
| 1, // binding |
| VK_DESCRIPTOR_TYPE_STORAGE_BUFFER, // descriptorType |
| 1, // descriptorCount |
| VK_SHADER_STAGE_COMPUTE_BIT, // stageFlags |
| 0, // pImmutableSamplers |
| } |
| }; |
| |
| VkDescriptorSetLayout descriptorSetLayout; |
| VK_ASSERT(device->CreateDescriptorSetLayout(descriptorSetLayoutBindings, &descriptorSetLayout)); |
| |
| VkPipelineLayout pipelineLayout; |
| VK_ASSERT(device->CreatePipelineLayout(descriptorSetLayout, &pipelineLayout)); |
| |
| VkPipeline pipeline; |
| VK_ASSERT(device->CreateComputePipeline(shaderModule, pipelineLayout, &pipeline)); |
| |
| VkDescriptorPool descriptorPool; |
| VK_ASSERT(device->CreateStorageBufferDescriptorPool(2, &descriptorPool)); |
| |
| VkDescriptorSet descriptorSet; |
| VK_ASSERT(device->AllocateDescriptorSet(descriptorPool, descriptorSetLayout, &descriptorSet)); |
| |
| std::vector<VkDescriptorBufferInfo> descriptorBufferInfos = { |
| { |
| bufferIn, // buffer |
| 0, // offset |
| VK_WHOLE_SIZE, // range |
| }, |
| { |
| bufferOut, // buffer |
| 0, // offset |
| VK_WHOLE_SIZE, // range |
| } |
| }; |
| device->UpdateStorageBufferDescriptorSets(descriptorSet, descriptorBufferInfos); |
| |
| VkCommandPool commandPool; |
| VK_ASSERT(device->CreateCommandPool(&commandPool)); |
| |
| VkCommandBuffer commandBuffer; |
| VK_ASSERT(device->AllocateCommandBuffer(commandPool, &commandBuffer)); |
| |
| VK_ASSERT(device->BeginCommandBuffer(VK_COMMAND_BUFFER_USAGE_ONE_TIME_SUBMIT_BIT, commandBuffer)); |
| |
| driver.vkCmdBindPipeline(commandBuffer, VK_PIPELINE_BIND_POINT_COMPUTE, pipeline); |
| |
| driver.vkCmdBindDescriptorSets(commandBuffer, VK_PIPELINE_BIND_POINT_COMPUTE, pipelineLayout, 0, 1, &descriptorSet, |
| 0, nullptr); |
| |
| driver.vkCmdDispatch(commandBuffer, (uint32_t)(numElements / GetParam().localSizeX), 1, 1); |
| |
| VK_ASSERT(driver.vkEndCommandBuffer(commandBuffer)); |
| |
| VK_ASSERT(device->QueueSubmitAndWait(commandBuffer)); |
| |
| VK_ASSERT(device->MapMemory(memory, 0, buffersSize, 0, (void **)&buffers)); |
| |
| for(size_t i = 0; i < numElements; ++i) |
| { |
| auto got = buffers[i + outOffset]; |
| EXPECT_EQ(expected((uint32_t)i), got) << "Unexpected output at " << i; |
| } |
| |
| // Check for writes outside of bounds. |
| EXPECT_EQ(buffers[magic0Offset], magic0); |
| EXPECT_EQ(buffers[magic1Offset], magic1); |
| EXPECT_EQ(buffers[magic2Offset], magic2); |
| EXPECT_EQ(buffers[magic3Offset], magic3); |
| |
| device->UnmapMemory(memory); |
| buffers = nullptr; |
| |
| device->FreeCommandBuffer(commandPool, commandBuffer); |
| device->FreeMemory(memory); |
| device->DestroyPipeline(pipeline); |
| device->DestroyCommandPool(commandPool); |
| device->DestroyPipelineLayout(pipelineLayout); |
| device->DestroyDescriptorSetLayout(descriptorSetLayout); |
| device->DestroyDescriptorPool(descriptorPool); |
| device->DestroyBuffer(bufferIn); |
| device->DestroyBuffer(bufferOut); |
| device->DestroyShaderModule(shaderModule); |
| device.reset(nullptr); |
| driver.vkDestroyInstance(instance, nullptr); |
| } |
| |
| INSTANTIATE_TEST_SUITE_P(ComputeParams, SwiftShaderVulkanBufferToBufferComputeTest, testing::Values(ComputeParams{ 512, 1, 1, 1 }, ComputeParams{ 512, 2, 1, 1 }, ComputeParams{ 512, 4, 1, 1 }, ComputeParams{ 512, 8, 1, 1 }, ComputeParams{ 512, 16, 1, 1 }, ComputeParams{ 512, 32, 1, 1 }, |
| |
| // Non-multiple of SIMD-lane. |
| ComputeParams{ 3, 1, 1, 1 }, ComputeParams{ 2, 1, 1, 1 })); |
| |
| TEST_P(SwiftShaderVulkanBufferToBufferComputeTest, Memcpy) |
| { |
| std::stringstream src; |
| // #version 450 |
| // layout(local_size_x = 1, local_size_y = 1, local_size_z = 1) in; |
| // layout(binding = 0, std430) buffer InBuffer |
| // { |
| // int Data[]; |
| // } In; |
| // layout(binding = 1, std430) buffer OutBuffer |
| // { |
| // int Data[]; |
| // } Out; |
| // void main() |
| // { |
| // Out.Data[gl_GlobalInvocationID.x] = In.Data[gl_GlobalInvocationID.x]; |
| // } |
| // clang-format off |
| src << |
| "OpCapability Shader\n" |
| "OpMemoryModel Logical GLSL450\n" |
| "OpEntryPoint GLCompute %1 \"main\" %2\n" |
| "OpExecutionMode %1 LocalSize " << |
| GetParam().localSizeX << " " << |
| GetParam().localSizeY << " " << |
| GetParam().localSizeZ << "\n" << |
| "OpDecorate %3 ArrayStride 4\n" |
| "OpMemberDecorate %4 0 Offset 0\n" |
| "OpDecorate %4 BufferBlock\n" |
| "OpDecorate %5 DescriptorSet 0\n" |
| "OpDecorate %5 Binding 1\n" |
| "OpDecorate %2 BuiltIn GlobalInvocationId\n" |
| "OpDecorate %6 DescriptorSet 0\n" |
| "OpDecorate %6 Binding 0\n" |
| "%7 = OpTypeVoid\n" |
| "%8 = OpTypeFunction %7\n" // void() |
| "%9 = OpTypeInt 32 1\n" // int32 |
| "%10 = OpTypeInt 32 0\n" // uint32 |
| "%3 = OpTypeRuntimeArray %9\n" // int32[] |
| "%4 = OpTypeStruct %3\n" // struct{ int32[] } |
| "%11 = OpTypePointer Uniform %4\n" // struct{ int32[] }* |
| "%5 = OpVariable %11 Uniform\n" // struct{ int32[] }* in |
| "%12 = OpConstant %9 0\n" // int32(0) |
| "%13 = OpConstant %10 0\n" // uint32(0) |
| "%14 = OpTypeVector %10 3\n" // vec3<int32> |
| "%15 = OpTypePointer Input %14\n" // vec3<int32>* |
| "%2 = OpVariable %15 Input\n" // gl_GlobalInvocationId |
| "%16 = OpTypePointer Input %10\n" // uint32* |
| "%6 = OpVariable %11 Uniform\n" // struct{ int32[] }* out |
| "%17 = OpTypePointer Uniform %9\n" // int32* |
| "%1 = OpFunction %7 None %8\n" // -- Function begin -- |
| "%18 = OpLabel\n" |
| "%19 = OpAccessChain %16 %2 %13\n" // &gl_GlobalInvocationId.x |
| "%20 = OpLoad %10 %19\n" // gl_GlobalInvocationId.x |
| "%21 = OpAccessChain %17 %6 %12 %20\n" // &in.arr[gl_GlobalInvocationId.x] |
| "%22 = OpLoad %9 %21\n" // in.arr[gl_GlobalInvocationId.x] |
| "%23 = OpAccessChain %17 %5 %12 %20\n" // &out.arr[gl_GlobalInvocationId.x] |
| "OpStore %23 %22\n" // out.arr[gl_GlobalInvocationId.x] = in[gl_GlobalInvocationId.x] |
| "OpReturn\n" |
| "OpFunctionEnd\n"; |
| // clang-format on |
| |
| test( |
| src.str(), [](uint32_t i) { return i; }, [](uint32_t i) { return i; }); |
| } |
| |
| TEST_P(SwiftShaderVulkanBufferToBufferComputeTest, GlobalInvocationId) |
| { |
| std::stringstream src; |
| // clang-format off |
| src << |
| "OpCapability Shader\n" |
| "OpMemoryModel Logical GLSL450\n" |
| "OpEntryPoint GLCompute %1 \"main\" %2\n" |
| "OpExecutionMode %1 LocalSize " << |
| GetParam().localSizeX << " " << |
| GetParam().localSizeY << " " << |
| GetParam().localSizeZ << "\n" << |
| "OpDecorate %3 ArrayStride 4\n" |
| "OpMemberDecorate %4 0 Offset 0\n" |
| "OpDecorate %4 BufferBlock\n" |
| "OpDecorate %5 DescriptorSet 0\n" |
| "OpDecorate %5 Binding 1\n" |
| "OpDecorate %2 BuiltIn GlobalInvocationId\n" |
| "OpDecorate %6 DescriptorSet 0\n" |
| "OpDecorate %6 Binding 0\n" |
| "%7 = OpTypeVoid\n" |
| "%8 = OpTypeFunction %7\n" // void() |
| "%9 = OpTypeInt 32 1\n" // int32 |
| "%10 = OpTypeInt 32 0\n" // uint32 |
| "%3 = OpTypeRuntimeArray %9\n" // int32[] |
| "%4 = OpTypeStruct %3\n" // struct{ int32[] } |
| "%11 = OpTypePointer Uniform %4\n" // struct{ int32[] }* |
| "%5 = OpVariable %11 Uniform\n" // struct{ int32[] }* in |
| "%12 = OpConstant %9 0\n" // int32(0) |
| "%13 = OpConstant %9 1\n" // int32(1) |
| "%14 = OpConstant %10 0\n" // uint32(0) |
| "%15 = OpConstant %10 1\n" // uint32(1) |
| "%16 = OpConstant %10 2\n" // uint32(2) |
| "%17 = OpTypeVector %10 3\n" // vec3<int32> |
| "%18 = OpTypePointer Input %17\n" // vec3<int32>* |
| "%2 = OpVariable %18 Input\n" // gl_GlobalInvocationId |
| "%19 = OpTypePointer Input %10\n" // uint32* |
| "%6 = OpVariable %11 Uniform\n" // struct{ int32[] }* out |
| "%20 = OpTypePointer Uniform %9\n" // int32* |
| "%1 = OpFunction %7 None %8\n" // -- Function begin -- |
| "%21 = OpLabel\n" |
| "%22 = OpAccessChain %19 %2 %14\n" // &gl_GlobalInvocationId.x |
| "%23 = OpAccessChain %19 %2 %15\n" // &gl_GlobalInvocationId.y |
| "%24 = OpAccessChain %19 %2 %16\n" // &gl_GlobalInvocationId.z |
| "%25 = OpLoad %10 %22\n" // gl_GlobalInvocationId.x |
| "%26 = OpLoad %10 %23\n" // gl_GlobalInvocationId.y |
| "%27 = OpLoad %10 %24\n" // gl_GlobalInvocationId.z |
| "%28 = OpAccessChain %20 %6 %12 %25\n" // &in.arr[gl_GlobalInvocationId.x] |
| "%29 = OpLoad %9 %28\n" // out.arr[gl_GlobalInvocationId.x] |
| "%30 = OpIAdd %9 %29 %26\n" // in[gl_GlobalInvocationId.x] + gl_GlobalInvocationId.y |
| "%31 = OpIAdd %9 %30 %27\n" // in[gl_GlobalInvocationId.x] + gl_GlobalInvocationId.y + gl_GlobalInvocationId.z |
| "%32 = OpAccessChain %20 %5 %12 %25\n" // &out.arr[gl_GlobalInvocationId.x] |
| "OpStore %32 %31\n" // out.arr[gl_GlobalInvocationId.x] = in[gl_GlobalInvocationId.x] + gl_GlobalInvocationId.y + gl_GlobalInvocationId.z |
| "OpReturn\n" |
| "OpFunctionEnd\n"; |
| // clang-format on |
| |
| // gl_GlobalInvocationId.y and gl_GlobalInvocationId.z should both be zero. |
| test( |
| src.str(), [](uint32_t i) { return i; }, [](uint32_t i) { return i; }); |
| } |
| |
| TEST_P(SwiftShaderVulkanBufferToBufferComputeTest, BranchSimple) |
| { |
| std::stringstream src; |
| // clang-format off |
| src << |
| "OpCapability Shader\n" |
| "OpMemoryModel Logical GLSL450\n" |
| "OpEntryPoint GLCompute %1 \"main\" %2\n" |
| "OpExecutionMode %1 LocalSize " << |
| GetParam().localSizeX << " " << |
| GetParam().localSizeY << " " << |
| GetParam().localSizeZ << "\n" << |
| "OpDecorate %3 ArrayStride 4\n" |
| "OpMemberDecorate %4 0 Offset 0\n" |
| "OpDecorate %4 BufferBlock\n" |
| "OpDecorate %5 DescriptorSet 0\n" |
| "OpDecorate %5 Binding 1\n" |
| "OpDecorate %2 BuiltIn GlobalInvocationId\n" |
| "OpDecorate %6 DescriptorSet 0\n" |
| "OpDecorate %6 Binding 0\n" |
| "%7 = OpTypeVoid\n" |
| "%8 = OpTypeFunction %7\n" // void() |
| "%9 = OpTypeInt 32 1\n" // int32 |
| "%10 = OpTypeInt 32 0\n" // uint32 |
| "%3 = OpTypeRuntimeArray %9\n" // int32[] |
| "%4 = OpTypeStruct %3\n" // struct{ int32[] } |
| "%11 = OpTypePointer Uniform %4\n" // struct{ int32[] }* |
| "%5 = OpVariable %11 Uniform\n" // struct{ int32[] }* in |
| "%12 = OpConstant %9 0\n" // int32(0) |
| "%13 = OpConstant %10 0\n" // uint32(0) |
| "%14 = OpTypeVector %10 3\n" // vec3<int32> |
| "%15 = OpTypePointer Input %14\n" // vec3<int32>* |
| "%2 = OpVariable %15 Input\n" // gl_GlobalInvocationId |
| "%16 = OpTypePointer Input %10\n" // uint32* |
| "%6 = OpVariable %11 Uniform\n" // struct{ int32[] }* out |
| "%17 = OpTypePointer Uniform %9\n" // int32* |
| "%1 = OpFunction %7 None %8\n" // -- Function begin -- |
| "%18 = OpLabel\n" |
| "%19 = OpAccessChain %16 %2 %13\n" // &gl_GlobalInvocationId.x |
| "%20 = OpLoad %10 %19\n" // gl_GlobalInvocationId.x |
| "%21 = OpAccessChain %17 %6 %12 %20\n" // &in.arr[gl_GlobalInvocationId.x] |
| "%22 = OpLoad %9 %21\n" // in.arr[gl_GlobalInvocationId.x] |
| "%23 = OpAccessChain %17 %5 %12 %20\n" // &out.arr[gl_GlobalInvocationId.x] |
| // Start of branch logic |
| // %22 = in value |
| "OpBranch %24\n" |
| "%24 = OpLabel\n" |
| "OpBranch %25\n" |
| "%25 = OpLabel\n" |
| "OpBranch %26\n" |
| "%26 = OpLabel\n" |
| // %22 = out value |
| // End of branch logic |
| "OpStore %23 %22\n" |
| "OpReturn\n" |
| "OpFunctionEnd\n"; |
| // clang-format on |
| |
| test( |
| src.str(), [](uint32_t i) { return i; }, [](uint32_t i) { return i; }); |
| } |
| |
| TEST_P(SwiftShaderVulkanBufferToBufferComputeTest, BranchDeclareSSA) |
| { |
| std::stringstream src; |
| // clang-format off |
| src << |
| "OpCapability Shader\n" |
| "OpMemoryModel Logical GLSL450\n" |
| "OpEntryPoint GLCompute %1 \"main\" %2\n" |
| "OpExecutionMode %1 LocalSize " << |
| GetParam().localSizeX << " " << |
| GetParam().localSizeY << " " << |
| GetParam().localSizeZ << "\n" << |
| "OpDecorate %3 ArrayStride 4\n" |
| "OpMemberDecorate %4 0 Offset 0\n" |
| "OpDecorate %4 BufferBlock\n" |
| "OpDecorate %5 DescriptorSet 0\n" |
| "OpDecorate %5 Binding 1\n" |
| "OpDecorate %2 BuiltIn GlobalInvocationId\n" |
| "OpDecorate %6 DescriptorSet 0\n" |
| "OpDecorate %6 Binding 0\n" |
| "%7 = OpTypeVoid\n" |
| "%8 = OpTypeFunction %7\n" // void() |
| "%9 = OpTypeInt 32 1\n" // int32 |
| "%10 = OpTypeInt 32 0\n" // uint32 |
| "%3 = OpTypeRuntimeArray %9\n" // int32[] |
| "%4 = OpTypeStruct %3\n" // struct{ int32[] } |
| "%11 = OpTypePointer Uniform %4\n" // struct{ int32[] }* |
| "%5 = OpVariable %11 Uniform\n" // struct{ int32[] }* in |
| "%12 = OpConstant %9 0\n" // int32(0) |
| "%13 = OpConstant %10 0\n" // uint32(0) |
| "%14 = OpTypeVector %10 3\n" // vec3<int32> |
| "%15 = OpTypePointer Input %14\n" // vec3<int32>* |
| "%2 = OpVariable %15 Input\n" // gl_GlobalInvocationId |
| "%16 = OpTypePointer Input %10\n" // uint32* |
| "%6 = OpVariable %11 Uniform\n" // struct{ int32[] }* out |
| "%17 = OpTypePointer Uniform %9\n" // int32* |
| "%1 = OpFunction %7 None %8\n" // -- Function begin -- |
| "%18 = OpLabel\n" |
| "%19 = OpAccessChain %16 %2 %13\n" // &gl_GlobalInvocationId.x |
| "%20 = OpLoad %10 %19\n" // gl_GlobalInvocationId.x |
| "%21 = OpAccessChain %17 %6 %12 %20\n" // &in.arr[gl_GlobalInvocationId.x] |
| "%22 = OpLoad %9 %21\n" // in.arr[gl_GlobalInvocationId.x] |
| "%23 = OpAccessChain %17 %5 %12 %20\n" // &out.arr[gl_GlobalInvocationId.x] |
| // Start of branch logic |
| // %22 = in value |
| "OpBranch %24\n" |
| "%24 = OpLabel\n" |
| "%25 = OpIAdd %9 %22 %22\n" // %25 = in*2 |
| "OpBranch %26\n" |
| "%26 = OpLabel\n" |
| "OpBranch %27\n" |
| "%27 = OpLabel\n" |
| // %25 = out value |
| // End of branch logic |
| "OpStore %23 %25\n" // use SSA value from previous block |
| "OpReturn\n" |
| "OpFunctionEnd\n"; |
| // clang-format on |
| |
| test( |
| src.str(), [](uint32_t i) { return i; }, [](uint32_t i) { return i * 2; }); |
| } |
| |
| TEST_P(SwiftShaderVulkanBufferToBufferComputeTest, BranchConditionalSimple) |
| { |
| std::stringstream src; |
| // clang-format off |
| src << |
| "OpCapability Shader\n" |
| "OpMemoryModel Logical GLSL450\n" |
| "OpEntryPoint GLCompute %1 \"main\" %2\n" |
| "OpExecutionMode %1 LocalSize " << |
| GetParam().localSizeX << " " << |
| GetParam().localSizeY << " " << |
| GetParam().localSizeZ << "\n" << |
| "OpDecorate %3 ArrayStride 4\n" |
| "OpMemberDecorate %4 0 Offset 0\n" |
| "OpDecorate %4 BufferBlock\n" |
| "OpDecorate %5 DescriptorSet 0\n" |
| "OpDecorate %5 Binding 1\n" |
| "OpDecorate %2 BuiltIn GlobalInvocationId\n" |
| "OpDecorate %6 DescriptorSet 0\n" |
| "OpDecorate %6 Binding 0\n" |
| "%7 = OpTypeVoid\n" |
| "%8 = OpTypeFunction %7\n" // void() |
| "%9 = OpTypeInt 32 1\n" // int32 |
| "%10 = OpTypeInt 32 0\n" // uint32 |
| "%11 = OpTypeBool\n" |
| "%3 = OpTypeRuntimeArray %9\n" // int32[] |
| "%4 = OpTypeStruct %3\n" // struct{ int32[] } |
| "%12 = OpTypePointer Uniform %4\n" // struct{ int32[] }* |
| "%5 = OpVariable %12 Uniform\n" // struct{ int32[] }* in |
| "%13 = OpConstant %9 0\n" // int32(0) |
| "%14 = OpConstant %9 2\n" // int32(2) |
| "%15 = OpConstant %10 0\n" // uint32(0) |
| "%16 = OpTypeVector %10 3\n" // vec4<int32> |
| "%17 = OpTypePointer Input %16\n" // vec4<int32>* |
| "%2 = OpVariable %17 Input\n" // gl_GlobalInvocationId |
| "%18 = OpTypePointer Input %10\n" // uint32* |
| "%6 = OpVariable %12 Uniform\n" // struct{ int32[] }* out |
| "%19 = OpTypePointer Uniform %9\n" // int32* |
| "%1 = OpFunction %7 None %8\n" // -- Function begin -- |
| "%20 = OpLabel\n" |
| "%21 = OpAccessChain %18 %2 %15\n" // &gl_GlobalInvocationId.x |
| "%22 = OpLoad %10 %21\n" // gl_GlobalInvocationId.x |
| "%23 = OpAccessChain %19 %6 %13 %22\n" // &in.arr[gl_GlobalInvocationId.x] |
| "%24 = OpLoad %9 %23\n" // in.arr[gl_GlobalInvocationId.x] |
| "%25 = OpAccessChain %19 %5 %13 %22\n" // &out.arr[gl_GlobalInvocationId.x] |
| // Start of branch logic |
| // %24 = in value |
| "%26 = OpSMod %9 %24 %14\n" // in % 2 |
| "%27 = OpIEqual %11 %26 %13\n" // (in % 2) == 0 |
| "OpSelectionMerge %28 None\n" |
| "OpBranchConditional %27 %28 %28\n" // Both go to %28 |
| "%28 = OpLabel\n" |
| // %26 = out value |
| // End of branch logic |
| "OpStore %25 %26\n" // use SSA value from previous block |
| "OpReturn\n" |
| "OpFunctionEnd\n"; |
| // clang-format on |
| |
| test( |
| src.str(), [](uint32_t i) { return i; }, [](uint32_t i) { return i % 2; }); |
| } |
| |
| TEST_P(SwiftShaderVulkanBufferToBufferComputeTest, BranchConditionalTwoEmptyBlocks) |
| { |
| std::stringstream src; |
| // clang-format off |
| src << |
| "OpCapability Shader\n" |
| "OpMemoryModel Logical GLSL450\n" |
| "OpEntryPoint GLCompute %1 \"main\" %2\n" |
| "OpExecutionMode %1 LocalSize " << |
| GetParam().localSizeX << " " << |
| GetParam().localSizeY << " " << |
| GetParam().localSizeZ << "\n" << |
| "OpDecorate %3 ArrayStride 4\n" |
| "OpMemberDecorate %4 0 Offset 0\n" |
| "OpDecorate %4 BufferBlock\n" |
| "OpDecorate %5 DescriptorSet 0\n" |
| "OpDecorate %5 Binding 1\n" |
| "OpDecorate %2 BuiltIn GlobalInvocationId\n" |
| "OpDecorate %6 DescriptorSet 0\n" |
| "OpDecorate %6 Binding 0\n" |
| "%7 = OpTypeVoid\n" |
| "%8 = OpTypeFunction %7\n" // void() |
| "%9 = OpTypeInt 32 1\n" // int32 |
| "%10 = OpTypeInt 32 0\n" // uint32 |
| "%11 = OpTypeBool\n" |
| "%3 = OpTypeRuntimeArray %9\n" // int32[] |
| "%4 = OpTypeStruct %3\n" // struct{ int32[] } |
| "%12 = OpTypePointer Uniform %4\n" // struct{ int32[] }* |
| "%5 = OpVariable %12 Uniform\n" // struct{ int32[] }* in |
| "%13 = OpConstant %9 0\n" // int32(0) |
| "%14 = OpConstant %9 2\n" // int32(2) |
| "%15 = OpConstant %10 0\n" // uint32(0) |
| "%16 = OpTypeVector %10 3\n" // vec4<int32> |
| "%17 = OpTypePointer Input %16\n" // vec4<int32>* |
| "%2 = OpVariable %17 Input\n" // gl_GlobalInvocationId |
| "%18 = OpTypePointer Input %10\n" // uint32* |
| "%6 = OpVariable %12 Uniform\n" // struct{ int32[] }* out |
| "%19 = OpTypePointer Uniform %9\n" // int32* |
| "%1 = OpFunction %7 None %8\n" // -- Function begin -- |
| "%20 = OpLabel\n" |
| "%21 = OpAccessChain %18 %2 %15\n" // &gl_GlobalInvocationId.x |
| "%22 = OpLoad %10 %21\n" // gl_GlobalInvocationId.x |
| "%23 = OpAccessChain %19 %6 %13 %22\n" // &in.arr[gl_GlobalInvocationId.x] |
| "%24 = OpLoad %9 %23\n" // in.arr[gl_GlobalInvocationId.x] |
| "%25 = OpAccessChain %19 %5 %13 %22\n" // &out.arr[gl_GlobalInvocationId.x] |
| // Start of branch logic |
| // %24 = in value |
| "%26 = OpSMod %9 %24 %14\n" // in % 2 |
| "%27 = OpIEqual %11 %26 %13\n" // (in % 2) == 0 |
| "OpSelectionMerge %28 None\n" |
| "OpBranchConditional %27 %29 %30\n" |
| "%29 = OpLabel\n" // (in % 2) == 0 |
| "OpBranch %28\n" |
| "%30 = OpLabel\n" // (in % 2) != 0 |
| "OpBranch %28\n" |
| "%28 = OpLabel\n" |
| // %26 = out value |
| // End of branch logic |
| "OpStore %25 %26\n" // use SSA value from previous block |
| "OpReturn\n" |
| "OpFunctionEnd\n"; |
| // clang-format on |
| |
| test( |
| src.str(), [](uint32_t i) { return i; }, [](uint32_t i) { return i % 2; }); |
| } |
| |
| // TODO: Test for parallel assignment |
| TEST_P(SwiftShaderVulkanBufferToBufferComputeTest, BranchConditionalStore) |
| { |
| std::stringstream src; |
| // clang-format off |
| src << |
| "OpCapability Shader\n" |
| "OpMemoryModel Logical GLSL450\n" |
| "OpEntryPoint GLCompute %1 \"main\" %2\n" |
| "OpExecutionMode %1 LocalSize " << |
| GetParam().localSizeX << " " << |
| GetParam().localSizeY << " " << |
| GetParam().localSizeZ << "\n" << |
| "OpDecorate %3 ArrayStride 4\n" |
| "OpMemberDecorate %4 0 Offset 0\n" |
| "OpDecorate %4 BufferBlock\n" |
| "OpDecorate %5 DescriptorSet 0\n" |
| "OpDecorate %5 Binding 1\n" |
| "OpDecorate %2 BuiltIn GlobalInvocationId\n" |
| "OpDecorate %6 DescriptorSet 0\n" |
| "OpDecorate %6 Binding 0\n" |
| "%7 = OpTypeVoid\n" |
| "%8 = OpTypeFunction %7\n" // void() |
| "%9 = OpTypeInt 32 1\n" // int32 |
| "%10 = OpTypeInt 32 0\n" // uint32 |
| "%11 = OpTypeBool\n" |
| "%3 = OpTypeRuntimeArray %9\n" // int32[] |
| "%4 = OpTypeStruct %3\n" // struct{ int32[] } |
| "%12 = OpTypePointer Uniform %4\n" // struct{ int32[] }* |
| "%5 = OpVariable %12 Uniform\n" // struct{ int32[] }* in |
| "%13 = OpConstant %9 0\n" // int32(0) |
| "%14 = OpConstant %9 1\n" // int32(1) |
| "%15 = OpConstant %9 2\n" // int32(2) |
| "%16 = OpConstant %10 0\n" // uint32(0) |
| "%17 = OpTypeVector %10 3\n" // vec4<int32> |
| "%18 = OpTypePointer Input %17\n" // vec4<int32>* |
| "%2 = OpVariable %18 Input\n" // gl_GlobalInvocationId |
| "%19 = OpTypePointer Input %10\n" // uint32* |
| "%6 = OpVariable %12 Uniform\n" // struct{ int32[] }* out |
| "%20 = OpTypePointer Uniform %9\n" // int32* |
| "%1 = OpFunction %7 None %8\n" // -- Function begin -- |
| "%21 = OpLabel\n" |
| "%22 = OpAccessChain %19 %2 %16\n" // &gl_GlobalInvocationId.x |
| "%23 = OpLoad %10 %22\n" // gl_GlobalInvocationId.x |
| "%24 = OpAccessChain %20 %6 %13 %23\n" // &in.arr[gl_GlobalInvocationId.x] |
| "%25 = OpLoad %9 %24\n" // in.arr[gl_GlobalInvocationId.x] |
| "%26 = OpAccessChain %20 %5 %13 %23\n" // &out.arr[gl_GlobalInvocationId.x] |
| // Start of branch logic |
| // %25 = in value |
| "%27 = OpSMod %9 %25 %15\n" // in % 2 |
| "%28 = OpIEqual %11 %27 %13\n" // (in % 2) == 0 |
| "OpSelectionMerge %29 None\n" |
| "OpBranchConditional %28 %30 %31\n" |
| "%30 = OpLabel\n" // (in % 2) == 0 |
| "OpStore %26 %14\n" // write 1 |
| "OpBranch %29\n" |
| "%31 = OpLabel\n" // (in % 2) != 0 |
| "OpStore %26 %15\n" // write 2 |
| "OpBranch %29\n" |
| "%29 = OpLabel\n" |
| // End of branch logic |
| "OpReturn\n" |
| "OpFunctionEnd\n"; |
| // clang-format on |
| |
| test( |
| src.str(), [](uint32_t i) { return i; }, [](uint32_t i) { return (i % 2) == 0 ? 1 : 2; }); |
| } |
| |
| TEST_P(SwiftShaderVulkanBufferToBufferComputeTest, BranchConditionalReturnTrue) |
| { |
| std::stringstream src; |
| // clang-format off |
| src << |
| "OpCapability Shader\n" |
| "OpMemoryModel Logical GLSL450\n" |
| "OpEntryPoint GLCompute %1 \"main\" %2\n" |
| "OpExecutionMode %1 LocalSize " << |
| GetParam().localSizeX << " " << |
| GetParam().localSizeY << " " << |
| GetParam().localSizeZ << "\n" << |
| "OpDecorate %3 ArrayStride 4\n" |
| "OpMemberDecorate %4 0 Offset 0\n" |
| "OpDecorate %4 BufferBlock\n" |
| "OpDecorate %5 DescriptorSet 0\n" |
| "OpDecorate %5 Binding 1\n" |
| "OpDecorate %2 BuiltIn GlobalInvocationId\n" |
| "OpDecorate %6 DescriptorSet 0\n" |
| "OpDecorate %6 Binding 0\n" |
| "%7 = OpTypeVoid\n" |
| "%8 = OpTypeFunction %7\n" // void() |
| "%9 = OpTypeInt 32 1\n" // int32 |
| "%10 = OpTypeInt 32 0\n" // uint32 |
| "%11 = OpTypeBool\n" |
| "%3 = OpTypeRuntimeArray %9\n" // int32[] |
| "%4 = OpTypeStruct %3\n" // struct{ int32[] } |
| "%12 = OpTypePointer Uniform %4\n" // struct{ int32[] }* |
| "%5 = OpVariable %12 Uniform\n" // struct{ int32[] }* in |
| "%13 = OpConstant %9 0\n" // int32(0) |
| "%14 = OpConstant %9 1\n" // int32(1) |
| "%15 = OpConstant %9 2\n" // int32(2) |
| "%16 = OpConstant %10 0\n" // uint32(0) |
| "%17 = OpTypeVector %10 3\n" // vec4<int32> |
| "%18 = OpTypePointer Input %17\n" // vec4<int32>* |
| "%2 = OpVariable %18 Input\n" // gl_GlobalInvocationId |
| "%19 = OpTypePointer Input %10\n" // uint32* |
| "%6 = OpVariable %12 Uniform\n" // struct{ int32[] }* out |
| "%20 = OpTypePointer Uniform %9\n" // int32* |
| "%1 = OpFunction %7 None %8\n" // -- Function begin -- |
| "%21 = OpLabel\n" |
| "%22 = OpAccessChain %19 %2 %16\n" // &gl_GlobalInvocationId.x |
| "%23 = OpLoad %10 %22\n" // gl_GlobalInvocationId.x |
| "%24 = OpAccessChain %20 %6 %13 %23\n" // &in.arr[gl_GlobalInvocationId.x] |
| "%25 = OpLoad %9 %24\n" // in.arr[gl_GlobalInvocationId.x] |
| "%26 = OpAccessChain %20 %5 %13 %23\n" // &out.arr[gl_GlobalInvocationId.x] |
| // Start of branch logic |
| // %25 = in value |
| "%27 = OpSMod %9 %25 %15\n" // in % 2 |
| "%28 = OpIEqual %11 %27 %13\n" // (in % 2) == 0 |
| "OpSelectionMerge %29 None\n" |
| "OpBranchConditional %28 %30 %29\n" |
| "%30 = OpLabel\n" // (in % 2) == 0 |
| "OpReturn\n" |
| "%29 = OpLabel\n" // merge |
| "OpStore %26 %15\n" // write 2 |
| // End of branch logic |
| "OpReturn\n" |
| "OpFunctionEnd\n"; |
| // clang-format on |
| |
| test( |
| src.str(), [](uint32_t i) { return i; }, [](uint32_t i) { return (i % 2) == 0 ? 0 : 2; }); |
| } |
| |
| // TODO: Test for parallel assignment |
| TEST_P(SwiftShaderVulkanBufferToBufferComputeTest, BranchConditionalPhi) |
| { |
| std::stringstream src; |
| // clang-format off |
| src << |
| "OpCapability Shader\n" |
| "OpMemoryModel Logical GLSL450\n" |
| "OpEntryPoint GLCompute %1 \"main\" %2\n" |
| "OpExecutionMode %1 LocalSize " << |
| GetParam().localSizeX << " " << |
| GetParam().localSizeY << " " << |
| GetParam().localSizeZ << "\n" << |
| "OpDecorate %3 ArrayStride 4\n" |
| "OpMemberDecorate %4 0 Offset 0\n" |
| "OpDecorate %4 BufferBlock\n" |
| "OpDecorate %5 DescriptorSet 0\n" |
| "OpDecorate %5 Binding 1\n" |
| "OpDecorate %2 BuiltIn GlobalInvocationId\n" |
| "OpDecorate %6 DescriptorSet 0\n" |
| "OpDecorate %6 Binding 0\n" |
| "%7 = OpTypeVoid\n" |
| "%8 = OpTypeFunction %7\n" // void() |
| "%9 = OpTypeInt 32 1\n" // int32 |
| "%10 = OpTypeInt 32 0\n" // uint32 |
| "%11 = OpTypeBool\n" |
| "%3 = OpTypeRuntimeArray %9\n" // int32[] |
| "%4 = OpTypeStruct %3\n" // struct{ int32[] } |
| "%12 = OpTypePointer Uniform %4\n" // struct{ int32[] }* |
| "%5 = OpVariable %12 Uniform\n" // struct{ int32[] }* in |
| "%13 = OpConstant %9 0\n" // int32(0) |
| "%14 = OpConstant %9 1\n" // int32(1) |
| "%15 = OpConstant %9 2\n" // int32(2) |
| "%16 = OpConstant %10 0\n" // uint32(0) |
| "%17 = OpTypeVector %10 3\n" // vec4<int32> |
| "%18 = OpTypePointer Input %17\n" // vec4<int32>* |
| "%2 = OpVariable %18 Input\n" // gl_GlobalInvocationId |
| "%19 = OpTypePointer Input %10\n" // uint32* |
| "%6 = OpVariable %12 Uniform\n" // struct{ int32[] }* out |
| "%20 = OpTypePointer Uniform %9\n" // int32* |
| "%1 = OpFunction %7 None %8\n" // -- Function begin -- |
| "%21 = OpLabel\n" |
| "%22 = OpAccessChain %19 %2 %16\n" // &gl_GlobalInvocationId.x |
| "%23 = OpLoad %10 %22\n" // gl_GlobalInvocationId.x |
| "%24 = OpAccessChain %20 %6 %13 %23\n" // &in.arr[gl_GlobalInvocationId.x] |
| "%25 = OpLoad %9 %24\n" // in.arr[gl_GlobalInvocationId.x] |
| "%26 = OpAccessChain %20 %5 %13 %23\n" // &out.arr[gl_GlobalInvocationId.x] |
| // Start of branch logic |
| // %25 = in value |
| "%27 = OpSMod %9 %25 %15\n" // in % 2 |
| "%28 = OpIEqual %11 %27 %13\n" // (in % 2) == 0 |
| "OpSelectionMerge %29 None\n" |
| "OpBranchConditional %28 %30 %31\n" |
| "%30 = OpLabel\n" // (in % 2) == 0 |
| "OpBranch %29\n" |
| "%31 = OpLabel\n" // (in % 2) != 0 |
| "OpBranch %29\n" |
| "%29 = OpLabel\n" |
| "%32 = OpPhi %9 %14 %30 %15 %31\n" // (in % 2) == 0 ? 1 : 2 |
| // End of branch logic |
| "OpStore %26 %32\n" |
| "OpReturn\n" |
| "OpFunctionEnd\n"; |
| // clang-format on |
| |
| test( |
| src.str(), [](uint32_t i) { return i; }, [](uint32_t i) { return (i % 2) == 0 ? 1 : 2; }); |
| } |
| |
| TEST_P(SwiftShaderVulkanBufferToBufferComputeTest, SwitchEmptyCases) |
| { |
| std::stringstream src; |
| // clang-format off |
| src << |
| "OpCapability Shader\n" |
| "OpMemoryModel Logical GLSL450\n" |
| "OpEntryPoint GLCompute %1 \"main\" %2\n" |
| "OpExecutionMode %1 LocalSize " << |
| GetParam().localSizeX << " " << |
| GetParam().localSizeY << " " << |
| GetParam().localSizeZ << "\n" << |
| "OpDecorate %3 ArrayStride 4\n" |
| "OpMemberDecorate %4 0 Offset 0\n" |
| "OpDecorate %4 BufferBlock\n" |
| "OpDecorate %5 DescriptorSet 0\n" |
| "OpDecorate %5 Binding 1\n" |
| "OpDecorate %2 BuiltIn GlobalInvocationId\n" |
| "OpDecorate %6 DescriptorSet 0\n" |
| "OpDecorate %6 Binding 0\n" |
| "%7 = OpTypeVoid\n" |
| "%8 = OpTypeFunction %7\n" // void() |
| "%9 = OpTypeInt 32 1\n" // int32 |
| "%10 = OpTypeInt 32 0\n" // uint32 |
| "%11 = OpTypeBool\n" |
| "%3 = OpTypeRuntimeArray %9\n" // int32[] |
| "%4 = OpTypeStruct %3\n" // struct{ int32[] } |
| "%12 = OpTypePointer Uniform %4\n" // struct{ int32[] }* |
| "%5 = OpVariable %12 Uniform\n" // struct{ int32[] }* in |
| "%13 = OpConstant %9 0\n" // int32(0) |
| "%14 = OpConstant %9 2\n" // int32(2) |
| "%15 = OpConstant %10 0\n" // uint32(0) |
| "%16 = OpTypeVector %10 3\n" // vec4<int32> |
| "%17 = OpTypePointer Input %16\n" // vec4<int32>* |
| "%2 = OpVariable %17 Input\n" // gl_GlobalInvocationId |
| "%18 = OpTypePointer Input %10\n" // uint32* |
| "%6 = OpVariable %12 Uniform\n" // struct{ int32[] }* out |
| "%19 = OpTypePointer Uniform %9\n" // int32* |
| "%1 = OpFunction %7 None %8\n" // -- Function begin -- |
| "%20 = OpLabel\n" |
| "%21 = OpAccessChain %18 %2 %15\n" // &gl_GlobalInvocationId.x |
| "%22 = OpLoad %10 %21\n" // gl_GlobalInvocationId.x |
| "%23 = OpAccessChain %19 %6 %13 %22\n" // &in.arr[gl_GlobalInvocationId.x] |
| "%24 = OpLoad %9 %23\n" // in.arr[gl_GlobalInvocationId.x] |
| "%25 = OpAccessChain %19 %5 %13 %22\n" // &out.arr[gl_GlobalInvocationId.x] |
| // Start of branch logic |
| // %24 = in value |
| "%26 = OpSMod %9 %24 %14\n" // in % 2 |
| "OpSelectionMerge %27 None\n" |
| "OpSwitch %26 %27 0 %28 1 %29\n" |
| "%28 = OpLabel\n" // (in % 2) == 0 |
| "OpBranch %27\n" |
| "%29 = OpLabel\n" // (in % 2) == 1 |
| "OpBranch %27\n" |
| "%27 = OpLabel\n" |
| // %26 = out value |
| // End of branch logic |
| "OpStore %25 %26\n" // use SSA value from previous block |
| "OpReturn\n" |
| "OpFunctionEnd\n"; |
| // clang-format on |
| |
| test( |
| src.str(), [](uint32_t i) { return i; }, [](uint32_t i) { return i % 2; }); |
| } |
| |
| TEST_P(SwiftShaderVulkanBufferToBufferComputeTest, SwitchStore) |
| { |
| std::stringstream src; |
| // clang-format off |
| src << |
| "OpCapability Shader\n" |
| "OpMemoryModel Logical GLSL450\n" |
| "OpEntryPoint GLCompute %1 \"main\" %2\n" |
| "OpExecutionMode %1 LocalSize " << |
| GetParam().localSizeX << " " << |
| GetParam().localSizeY << " " << |
| GetParam().localSizeZ << "\n" << |
| "OpDecorate %3 ArrayStride 4\n" |
| "OpMemberDecorate %4 0 Offset 0\n" |
| "OpDecorate %4 BufferBlock\n" |
| "OpDecorate %5 DescriptorSet 0\n" |
| "OpDecorate %5 Binding 1\n" |
| "OpDecorate %2 BuiltIn GlobalInvocationId\n" |
| "OpDecorate %6 DescriptorSet 0\n" |
| "OpDecorate %6 Binding 0\n" |
| "%7 = OpTypeVoid\n" |
| "%8 = OpTypeFunction %7\n" // void() |
| "%9 = OpTypeInt 32 1\n" // int32 |
| "%10 = OpTypeInt 32 0\n" // uint32 |
| "%11 = OpTypeBool\n" |
| "%3 = OpTypeRuntimeArray %9\n" // int32[] |
| "%4 = OpTypeStruct %3\n" // struct{ int32[] } |
| "%12 = OpTypePointer Uniform %4\n" // struct{ int32[] }* |
| "%5 = OpVariable %12 Uniform\n" // struct{ int32[] }* in |
| "%13 = OpConstant %9 0\n" // int32(0) |
| "%14 = OpConstant %9 1\n" // int32(1) |
| "%15 = OpConstant %9 2\n" // int32(2) |
| "%16 = OpConstant %10 0\n" // uint32(0) |
| "%17 = OpTypeVector %10 3\n" // vec4<int32> |
| "%18 = OpTypePointer Input %17\n" // vec4<int32>* |
| "%2 = OpVariable %18 Input\n" // gl_GlobalInvocationId |
| "%19 = OpTypePointer Input %10\n" // uint32* |
| "%6 = OpVariable %12 Uniform\n" // struct{ int32[] }* out |
| "%20 = OpTypePointer Uniform %9\n" // int32* |
| "%1 = OpFunction %7 None %8\n" // -- Function begin -- |
| "%21 = OpLabel\n" |
| "%22 = OpAccessChain %19 %2 %16\n" // &gl_GlobalInvocationId.x |
| "%23 = OpLoad %10 %22\n" // gl_GlobalInvocationId.x |
| "%24 = OpAccessChain %20 %6 %13 %23\n" // &in.arr[gl_GlobalInvocationId.x] |
| "%25 = OpLoad %9 %24\n" // in.arr[gl_GlobalInvocationId.x] |
| "%26 = OpAccessChain %20 %5 %13 %23\n" // &out.arr[gl_GlobalInvocationId.x] |
| // Start of branch logic |
| // %25 = in value |
| "%27 = OpSMod %9 %25 %15\n" // in % 2 |
| "OpSelectionMerge %28 None\n" |
| "OpSwitch %27 %28 0 %29 1 %30\n" |
| "%29 = OpLabel\n" // (in % 2) == 0 |
| "OpStore %26 %15\n" // write 2 |
| "OpBranch %28\n" |
| "%30 = OpLabel\n" // (in % 2) == 1 |
| "OpStore %26 %14\n" // write 1 |
| "OpBranch %28\n" |
| "%28 = OpLabel\n" |
| // End of branch logic |
| "OpReturn\n" |
| "OpFunctionEnd\n"; |
| // clang-format on |
| |
| test( |
| src.str(), [](uint32_t i) { return i; }, [](uint32_t i) { return (i % 2) == 0 ? 2 : 1; }); |
| } |
| |
| TEST_P(SwiftShaderVulkanBufferToBufferComputeTest, SwitchCaseReturn) |
| { |
| std::stringstream src; |
| // clang-format off |
| src << |
| "OpCapability Shader\n" |
| "OpMemoryModel Logical GLSL450\n" |
| "OpEntryPoint GLCompute %1 \"main\" %2\n" |
| "OpExecutionMode %1 LocalSize " << |
| GetParam().localSizeX << " " << |
| GetParam().localSizeY << " " << |
| GetParam().localSizeZ << "\n" << |
| "OpDecorate %3 ArrayStride 4\n" |
| "OpMemberDecorate %4 0 Offset 0\n" |
| "OpDecorate %4 BufferBlock\n" |
| "OpDecorate %5 DescriptorSet 0\n" |
| "OpDecorate %5 Binding 1\n" |
| "OpDecorate %2 BuiltIn GlobalInvocationId\n" |
| "OpDecorate %6 DescriptorSet 0\n" |
| "OpDecorate %6 Binding 0\n" |
| "%7 = OpTypeVoid\n" |
| "%8 = OpTypeFunction %7\n" // void() |
| "%9 = OpTypeInt 32 1\n" // int32 |
| "%10 = OpTypeInt 32 0\n" // uint32 |
| "%11 = OpTypeBool\n" |
| "%3 = OpTypeRuntimeArray %9\n" // int32[] |
| "%4 = OpTypeStruct %3\n" // struct{ int32[] } |
| "%12 = OpTypePointer Uniform %4\n" // struct{ int32[] }* |
| "%5 = OpVariable %12 Uniform\n" // struct{ int32[] }* in |
| "%13 = OpConstant %9 0\n" // int32(0) |
| "%14 = OpConstant %9 1\n" // int32(1) |
| "%15 = OpConstant %9 2\n" // int32(2) |
| "%16 = OpConstant %10 0\n" // uint32(0) |
| "%17 = OpTypeVector %10 3\n" // vec4<int32> |
| "%18 = OpTypePointer Input %17\n" // vec4<int32>* |
| "%2 = OpVariable %18 Input\n" // gl_GlobalInvocationId |
| "%19 = OpTypePointer Input %10\n" // uint32* |
| "%6 = OpVariable %12 Uniform\n" // struct{ int32[] }* out |
| "%20 = OpTypePointer Uniform %9\n" // int32* |
| "%1 = OpFunction %7 None %8\n" // -- Function begin -- |
| "%21 = OpLabel\n" |
| "%22 = OpAccessChain %19 %2 %16\n" // &gl_GlobalInvocationId.x |
| "%23 = OpLoad %10 %22\n" // gl_GlobalInvocationId.x |
| "%24 = OpAccessChain %20 %6 %13 %23\n" // &in.arr[gl_GlobalInvocationId.x] |
| "%25 = OpLoad %9 %24\n" // in.arr[gl_GlobalInvocationId.x] |
| "%26 = OpAccessChain %20 %5 %13 %23\n" // &out.arr[gl_GlobalInvocationId.x] |
| // Start of branch logic |
| // %25 = in value |
| "%27 = OpSMod %9 %25 %15\n" // in % 2 |
| "OpSelectionMerge %28 None\n" |
| "OpSwitch %27 %28 0 %29 1 %30\n" |
| "%29 = OpLabel\n" // (in % 2) == 0 |
| "OpBranch %28\n" |
| "%30 = OpLabel\n" // (in % 2) == 1 |
| "OpReturn\n" |
| "%28 = OpLabel\n" |
| "OpStore %26 %14\n" // write 1 |
| // End of branch logic |
| "OpReturn\n" |
| "OpFunctionEnd\n"; |
| // clang-format on |
| |
| test( |
| src.str(), [](uint32_t i) { return i; }, [](uint32_t i) { return (i % 2) == 1 ? 0 : 1; }); |
| } |
| |
| TEST_P(SwiftShaderVulkanBufferToBufferComputeTest, SwitchDefaultReturn) |
| { |
| std::stringstream src; |
| // clang-format off |
| src << |
| "OpCapability Shader\n" |
| "OpMemoryModel Logical GLSL450\n" |
| "OpEntryPoint GLCompute %1 \"main\" %2\n" |
| "OpExecutionMode %1 LocalSize " << |
| GetParam().localSizeX << " " << |
| GetParam().localSizeY << " " << |
| GetParam().localSizeZ << "\n" << |
| "OpDecorate %3 ArrayStride 4\n" |
| "OpMemberDecorate %4 0 Offset 0\n" |
| "OpDecorate %4 BufferBlock\n" |
| "OpDecorate %5 DescriptorSet 0\n" |
| "OpDecorate %5 Binding 1\n" |
| "OpDecorate %2 BuiltIn GlobalInvocationId\n" |
| "OpDecorate %6 DescriptorSet 0\n" |
| "OpDecorate %6 Binding 0\n" |
| "%7 = OpTypeVoid\n" |
| "%8 = OpTypeFunction %7\n" // void() |
| "%9 = OpTypeInt 32 1\n" // int32 |
| "%10 = OpTypeInt 32 0\n" // uint32 |
| "%11 = OpTypeBool\n" |
| "%3 = OpTypeRuntimeArray %9\n" // int32[] |
| "%4 = OpTypeStruct %3\n" // struct{ int32[] } |
| "%12 = OpTypePointer Uniform %4\n" // struct{ int32[] }* |
| "%5 = OpVariable %12 Uniform\n" // struct{ int32[] }* in |
| "%13 = OpConstant %9 0\n" // int32(0) |
| "%14 = OpConstant %9 1\n" // int32(1) |
| "%15 = OpConstant %9 2\n" // int32(2) |
| "%16 = OpConstant %10 0\n" // uint32(0) |
| "%17 = OpTypeVector %10 3\n" // vec4<int32> |
| "%18 = OpTypePointer Input %17\n" // vec4<int32>* |
| "%2 = OpVariable %18 Input\n" // gl_GlobalInvocationId |
| "%19 = OpTypePointer Input %10\n" // uint32* |
| "%6 = OpVariable %12 Uniform\n" // struct{ int32[] }* out |
| "%20 = OpTypePointer Uniform %9\n" // int32* |
| "%1 = OpFunction %7 None %8\n" // -- Function begin -- |
| "%21 = OpLabel\n" |
| "%22 = OpAccessChain %19 %2 %16\n" // &gl_GlobalInvocationId.x |
| "%23 = OpLoad %10 %22\n" // gl_GlobalInvocationId.x |
| "%24 = OpAccessChain %20 %6 %13 %23\n" // &in.arr[gl_GlobalInvocationId.x] |
| "%25 = OpLoad %9 %24\n" // in.arr[gl_GlobalInvocationId.x] |
| "%26 = OpAccessChain %20 %5 %13 %23\n" // &out.arr[gl_GlobalInvocationId.x] |
| // Start of branch logic |
| // %25 = in value |
| "%27 = OpSMod %9 %25 %15\n" // in % 2 |
| "OpSelectionMerge %28 None\n" |
| "OpSwitch %27 %29 1 %30\n" |
| "%30 = OpLabel\n" // (in % 2) == 1 |
| "OpBranch %28\n" |
| "%29 = OpLabel\n" // (in % 2) != 1 |
| "OpReturn\n" |
| "%28 = OpLabel\n" // merge |
| "OpStore %26 %14\n" // write 1 |
| // End of branch logic |
| "OpReturn\n" |
| "OpFunctionEnd\n"; |
| // clang-format on |
| |
| test( |
| src.str(), [](uint32_t i) { return i; }, [](uint32_t i) { return (i % 2) == 1 ? 1 : 0; }); |
| } |
| |
| TEST_P(SwiftShaderVulkanBufferToBufferComputeTest, SwitchCaseFallthrough) |
| { |
| std::stringstream src; |
| // clang-format off |
| src << |
| "OpCapability Shader\n" |
| "OpMemoryModel Logical GLSL450\n" |
| "OpEntryPoint GLCompute %1 \"main\" %2\n" |
| "OpExecutionMode %1 LocalSize " << |
| GetParam().localSizeX << " " << |
| GetParam().localSizeY << " " << |
| GetParam().localSizeZ << "\n" << |
| "OpDecorate %3 ArrayStride 4\n" |
| "OpMemberDecorate %4 0 Offset 0\n" |
| "OpDecorate %4 BufferBlock\n" |
| "OpDecorate %5 DescriptorSet 0\n" |
| "OpDecorate %5 Binding 1\n" |
| "OpDecorate %2 BuiltIn GlobalInvocationId\n" |
| "OpDecorate %6 DescriptorSet 0\n" |
| "OpDecorate %6 Binding 0\n" |
| "%7 = OpTypeVoid\n" |
| "%8 = OpTypeFunction %7\n" // void() |
| "%9 = OpTypeInt 32 1\n" // int32 |
| "%10 = OpTypeInt 32 0\n" // uint32 |
| "%11 = OpTypeBool\n" |
| "%3 = OpTypeRuntimeArray %9\n" // int32[] |
| "%4 = OpTypeStruct %3\n" // struct{ int32[] } |
| "%12 = OpTypePointer Uniform %4\n" // struct{ int32[] }* |
| "%5 = OpVariable %12 Uniform\n" // struct{ int32[] }* in |
| "%13 = OpConstant %9 0\n" // int32(0) |
| "%14 = OpConstant %9 1\n" // int32(1) |
| "%15 = OpConstant %9 2\n" // int32(2) |
| "%16 = OpConstant %10 0\n" // uint32(0) |
| "%17 = OpTypeVector %10 3\n" // vec4<int32> |
| "%18 = OpTypePointer Input %17\n" // vec4<int32>* |
| "%2 = OpVariable %18 Input\n" // gl_GlobalInvocationId |
| "%19 = OpTypePointer Input %10\n" // uint32* |
| "%6 = OpVariable %12 Uniform\n" // struct{ int32[] }* out |
| "%20 = OpTypePointer Uniform %9\n" // int32* |
| "%1 = OpFunction %7 None %8\n" // -- Function begin -- |
| "%21 = OpLabel\n" |
| "%22 = OpAccessChain %19 %2 %16\n" // &gl_GlobalInvocationId.x |
| "%23 = OpLoad %10 %22\n" // gl_GlobalInvocationId.x |
| "%24 = OpAccessChain %20 %6 %13 %23\n" // &in.arr[gl_GlobalInvocationId.x] |
| "%25 = OpLoad %9 %24\n" // in.arr[gl_GlobalInvocationId.x] |
| "%26 = OpAccessChain %20 %5 %13 %23\n" // &out.arr[gl_GlobalInvocationId.x] |
| // Start of branch logic |
| // %25 = in value |
| "%27 = OpSMod %9 %25 %15\n" // in % 2 |
| "OpSelectionMerge %28 None\n" |
| "OpSwitch %27 %29 0 %30 1 %31\n" |
| "%30 = OpLabel\n" // (in % 2) == 0 |
| "%32 = OpIAdd %9 %27 %14\n" // generate an intermediate |
| "OpStore %26 %32\n" // write a value (overwritten later) |
| "OpBranch %31\n" // fallthrough |
| "%31 = OpLabel\n" // (in % 2) == 1 |
| "OpStore %26 %15\n" // write 2 |
| "OpBranch %28\n" |
| "%29 = OpLabel\n" // unreachable |
| "OpUnreachable\n" |
| "%28 = OpLabel\n" // merge |
| // End of branch logic |
| "OpReturn\n" |
| "OpFunctionEnd\n"; |
| // clang-format on |
| |
| test( |
| src.str(), [](uint32_t i) { return i; }, [](uint32_t i) { return 2; }); |
| } |
| |
| TEST_P(SwiftShaderVulkanBufferToBufferComputeTest, SwitchDefaultFallthrough) |
| { |
| std::stringstream src; |
| // clang-format off |
| src << |
| "OpCapability Shader\n" |
| "OpMemoryModel Logical GLSL450\n" |
| "OpEntryPoint GLCompute %1 \"main\" %2\n" |
| "OpExecutionMode %1 LocalSize " << |
| GetParam().localSizeX << " " << |
| GetParam().localSizeY << " " << |
| GetParam().localSizeZ << "\n" << |
| "OpDecorate %3 ArrayStride 4\n" |
| "OpMemberDecorate %4 0 Offset 0\n" |
| "OpDecorate %4 BufferBlock\n" |
| "OpDecorate %5 DescriptorSet 0\n" |
| "OpDecorate %5 Binding 1\n" |
| "OpDecorate %2 BuiltIn GlobalInvocationId\n" |
| "OpDecorate %6 DescriptorSet 0\n" |
| "OpDecorate %6 Binding 0\n" |
| "%7 = OpTypeVoid\n" |
| "%8 = OpTypeFunction %7\n" // void() |
| "%9 = OpTypeInt 32 1\n" // int32 |
| "%10 = OpTypeInt 32 0\n" // uint32 |
| "%11 = OpTypeBool\n" |
| "%3 = OpTypeRuntimeArray %9\n" // int32[] |
| "%4 = OpTypeStruct %3\n" // struct{ int32[] } |
| "%12 = OpTypePointer Uniform %4\n" // struct{ int32[] }* |
| "%5 = OpVariable %12 Uniform\n" // struct{ int32[] }* in |
| "%13 = OpConstant %9 0\n" // int32(0) |
| "%14 = OpConstant %9 1\n" // int32(1) |
| "%15 = OpConstant %9 2\n" // int32(2) |
| "%16 = OpConstant %10 0\n" // uint32(0) |
| "%17 = OpTypeVector %10 3\n" // vec4<int32> |
| "%18 = OpTypePointer Input %17\n" // vec4<int32>* |
| "%2 = OpVariable %18 Input\n" // gl_GlobalInvocationId |
| "%19 = OpTypePointer Input %10\n" // uint32* |
| "%6 = OpVariable %12 Uniform\n" // struct{ int32[] }* out |
| "%20 = OpTypePointer Uniform %9\n" // int32* |
| "%1 = OpFunction %7 None %8\n" // -- Function begin -- |
| "%21 = OpLabel\n" |
| "%22 = OpAccessChain %19 %2 %16\n" // &gl_GlobalInvocationId.x |
| "%23 = OpLoad %10 %22\n" // gl_GlobalInvocationId.x |
| "%24 = OpAccessChain %20 %6 %13 %23\n" // &in.arr[gl_GlobalInvocationId.x] |
| "%25 = OpLoad %9 %24\n" // in.arr[gl_GlobalInvocationId.x] |
| "%26 = OpAccessChain %20 %5 %13 %23\n" // &out.arr[gl_GlobalInvocationId.x] |
| // Start of branch logic |
| // %25 = in value |
| "%27 = OpSMod %9 %25 %15\n" // in % 2 |
| "OpSelectionMerge %28 None\n" |
| "OpSwitch %27 %29 0 %30 1 %31\n" |
| "%30 = OpLabel\n" // (in % 2) == 0 |
| "%32 = OpIAdd %9 %27 %14\n" // generate an intermediate |
| "OpStore %26 %32\n" // write a value (overwritten later) |
| "OpBranch %29\n" // fallthrough |
| "%29 = OpLabel\n" // default |
| "%33 = OpIAdd %9 %27 %14\n" // generate an intermediate |
| "OpStore %26 %33\n" // write a value (overwritten later) |
| "OpBranch %31\n" // fallthrough |
| "%31 = OpLabel\n" // (in % 2) == 1 |
| "OpStore %26 %15\n" // write 2 |
| "OpBranch %28\n" |
| "%28 = OpLabel\n" // merge |
| // End of branch logic |
| "OpReturn\n" |
| "OpFunctionEnd\n"; |
| // clang-format on |
| |
| test( |
| src.str(), [](uint32_t i) { return i; }, [](uint32_t i) { return 2; }); |
| } |
| |
| TEST_P(SwiftShaderVulkanBufferToBufferComputeTest, SwitchPhi) |
| { |
| std::stringstream src; |
| // clang-format off |
| src << |
| "OpCapability Shader\n" |
| "OpMemoryModel Logical GLSL450\n" |
| "OpEntryPoint GLCompute %1 \"main\" %2\n" |
| "OpExecutionMode %1 LocalSize " << |
| GetParam().localSizeX << " " << |
| GetParam().localSizeY << " " << |
| GetParam().localSizeZ << "\n" << |
| "OpDecorate %3 ArrayStride 4\n" |
| "OpMemberDecorate %4 0 Offset 0\n" |
| "OpDecorate %4 BufferBlock\n" |
| "OpDecorate %5 DescriptorSet 0\n" |
| "OpDecorate %5 Binding 1\n" |
| "OpDecorate %2 BuiltIn GlobalInvocationId\n" |
| "OpDecorate %6 DescriptorSet 0\n" |
| "OpDecorate %6 Binding 0\n" |
| "%7 = OpTypeVoid\n" |
| "%8 = OpTypeFunction %7\n" // void() |
| "%9 = OpTypeInt 32 1\n" // int32 |
| "%10 = OpTypeInt 32 0\n" // uint32 |
| "%11 = OpTypeBool\n" |
| "%3 = OpTypeRuntimeArray %9\n" // int32[] |
| "%4 = OpTypeStruct %3\n" // struct{ int32[] } |
| "%12 = OpTypePointer Uniform %4\n" // struct{ int32[] }* |
| "%5 = OpVariable %12 Uniform\n" // struct{ int32[] }* in |
| "%13 = OpConstant %9 0\n" // int32(0) |
| "%14 = OpConstant %9 1\n" // int32(1) |
| "%15 = OpConstant %9 2\n" // int32(2) |
| "%16 = OpConstant %10 0\n" // uint32(0) |
| "%17 = OpTypeVector %10 3\n" // vec4<int32> |
| "%18 = OpTypePointer Input %17\n" // vec4<int32>* |
| "%2 = OpVariable %18 Input\n" // gl_GlobalInvocationId |
| "%19 = OpTypePointer Input %10\n" // uint32* |
| "%6 = OpVariable %12 Uniform\n" // struct{ int32[] }* out |
| "%20 = OpTypePointer Uniform %9\n" // int32* |
| "%1 = OpFunction %7 None %8\n" // -- Function begin -- |
| "%21 = OpLabel\n" |
| "%22 = OpAccessChain %19 %2 %16\n" // &gl_GlobalInvocationId.x |
| "%23 = OpLoad %10 %22\n" // gl_GlobalInvocationId.x |
| "%24 = OpAccessChain %20 %6 %13 %23\n" // &in.arr[gl_GlobalInvocationId.x] |
| "%25 = OpLoad %9 %24\n" // in.arr[gl_GlobalInvocationId.x] |
| "%26 = OpAccessChain %20 %5 %13 %23\n" // &out.arr[gl_GlobalInvocationId.x] |
| // Start of branch logic |
| // %25 = in value |
| "%27 = OpSMod %9 %25 %15\n" // in % 2 |
| "OpSelectionMerge %28 None\n" |
| "OpSwitch %27 %29 1 %30\n" |
| "%30 = OpLabel\n" // (in % 2) == 1 |
| "OpBranch %28\n" |
| "%29 = OpLabel\n" // (in % 2) != 1 |
| "OpBranch %28\n" |
| "%28 = OpLabel\n" // merge |
| "%31 = OpPhi %9 %14 %30 %15 %29\n" // (in % 2) == 1 ? 1 : 2 |
| "OpStore %26 %31\n" |
| // End of branch logic |
| "OpReturn\n" |
| "OpFunctionEnd\n"; |
| // clang-format on |
| |
| test( |
| src.str(), [](uint32_t i) { return i; }, [](uint32_t i) { return (i % 2) == 1 ? 1 : 2; }); |
| } |
| |
| TEST_P(SwiftShaderVulkanBufferToBufferComputeTest, LoopDivergentMergePhi) |
| { |
| // #version 450 |
| // layout(local_size_x = 1, local_size_y = 1, local_size_z = 1) in; |
| // layout(binding = 0, std430) buffer InBuffer |
| // { |
| // int Data[]; |
| // } In; |
| // layout(binding = 1, std430) buffer OutBuffer |
| // { |
| // int Data[]; |
| // } Out; |
| // void main() |
| // { |
| // int phi = 0; |
| // uint lane = gl_GlobalInvocationID.x % 4; |
| // for (uint i = 0; i < 4; i++) |
| // { |
| // if (lane == i) |
| // { |
| // phi = In.Data[gl_GlobalInvocationID.x]; |
| // break; |
| // } |
| // } |
| // Out.Data[gl_GlobalInvocationID.x] = phi; |
| // } |
| std::stringstream src; |
| // clang-format off |
| src << |
| "OpCapability Shader\n" |
| "%1 = OpExtInstImport \"GLSL.std.450\"\n" |
| "OpMemoryModel Logical GLSL450\n" |
| "OpEntryPoint GLCompute %2 \"main\" %3\n" |
| "OpExecutionMode %2 LocalSize " << |
| GetParam().localSizeX << " " << |
| GetParam().localSizeY << " " << |
| GetParam().localSizeZ << "\n" << |
| "OpDecorate %3 BuiltIn GlobalInvocationId\n" |
| "OpDecorate %4 ArrayStride 4\n" |
| "OpMemberDecorate %5 0 Offset 0\n" |
| "OpDecorate %5 BufferBlock\n" |
| "OpDecorate %6 DescriptorSet 0\n" |
| "OpDecorate %6 Binding 0\n" |
| "OpDecorate %7 ArrayStride 4\n" |
| "OpMemberDecorate %8 0 Offset 0\n" |
| "OpDecorate %8 BufferBlock\n" |
| "OpDecorate %9 DescriptorSet 0\n" |
| "OpDecorate %9 Binding 1\n" |
| "%10 = OpTypeVoid\n" |
| "%11 = OpTypeFunction %10\n" |
| "%12 = OpTypeInt 32 1\n" |
| "%13 = OpConstant %12 0\n" |
| "%14 = OpTypeInt 32 0\n" |
| "%15 = OpTypeVector %14 3\n" |
| "%16 = OpTypePointer Input %15\n" |
| "%3 = OpVariable %16 Input\n" |
| "%17 = OpConstant %14 0\n" |
| "%18 = OpTypePointer Input %14\n" |
| "%19 = OpConstant %14 4\n" |
| "%20 = OpTypeBool\n" |
| "%4 = OpTypeRuntimeArray %12\n" |
| "%5 = OpTypeStruct %4\n" |
| "%21 = OpTypePointer Uniform %5\n" |
| "%6 = OpVariable %21 Uniform\n" |
| "%22 = OpTypePointer Uniform %12\n" |
| "%23 = OpConstant %12 1\n" |
| "%7 = OpTypeRuntimeArray %12\n" |
| "%8 = OpTypeStruct %7\n" |
| "%24 = OpTypePointer Uniform %8\n" |
| "%9 = OpVariable %24 Uniform\n" |
| "%2 = OpFunction %10 None %11\n" |
| "%25 = OpLabel\n" |
| "%26 = OpAccessChain %18 %3 %17\n" |
| "%27 = OpLoad %14 %26\n" |
| "%28 = OpUMod %14 %27 %19\n" |
| "OpBranch %29\n" |
| "%29 = OpLabel\n" |
| "%30 = OpPhi %14 %17 %25 %31 %32\n" |
| "%33 = OpULessThan %20 %30 %19\n" |
| "OpLoopMerge %34 %32 None\n" |
| "OpBranchConditional %33 %35 %34\n" |
| "%35 = OpLabel\n" |
| "%36 = OpIEqual %20 %28 %30\n" |
| "OpSelectionMerge %37 None\n" |
| "OpBranchConditional %36 %38 %37\n" |
| "%38 = OpLabel\n" |
| "%39 = OpAccessChain %22 %6 %13 %27\n" |
| "%40 = OpLoad %12 %39\n" |
| "OpBranch %34\n" |
| "%37 = OpLabel\n" |
| "OpBranch %32\n" |
| "%32 = OpLabel\n" |
| "%31 = OpIAdd %14 %30 %23\n" |
| "OpBranch %29\n" |
| "%34 = OpLabel\n" |
| "%41 = OpPhi %12 %13 %29 %40 %38\n" // %40: phi |
| "%42 = OpAccessChain %22 %9 %13 %27\n" |
| "OpStore %42 %41\n" |
| "OpReturn\n" |
| "OpFunctionEnd\n"; |
| // clang-format on |
| |
| test( |
| src.str(), [](uint32_t i) { return i; }, [](uint32_t i) { return i; }); |
| } |