You can not select more than 25 topics
Topics must start with a letter or number, can include dashes ('-') and can be up to 35 characters long.
1482 lines
63 KiB
1482 lines
63 KiB
// Copyright 2021 The SwiftShader Authors. All Rights Reserved.
|
|
//
|
|
// Licensed under the Apache License, Version 2.0 (the "License");
|
|
// you may not use this file except in compliance with the License.
|
|
// You may obtain a copy of the License at
|
|
//
|
|
// http://www.apache.org/licenses/LICENSE-2.0
|
|
//
|
|
// Unless required by applicable law or agreed to in writing, software
|
|
// distributed under the License is distributed on an "AS IS" BASIS,
|
|
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
|
|
// See the License for the specific language governing permissions and
|
|
// limitations under the License.
|
|
|
|
#include "Device.hpp"
|
|
#include "Driver.hpp"
|
|
|
|
#include "gmock/gmock.h"
|
|
#include "gtest/gtest.h"
|
|
|
|
#include "spirv-tools/libspirv.hpp"
|
|
|
|
#include <cstring>
|
|
#include <sstream>
|
|
|
|
namespace {
|
|
size_t alignUp(size_t val, size_t alignment)
|
|
{
|
|
return alignment * ((val + alignment - 1) / alignment);
|
|
}
|
|
} // anonymous namespace
|
|
|
|
struct ComputeParams
|
|
{
|
|
size_t numElements;
|
|
int localSizeX;
|
|
int localSizeY;
|
|
int localSizeZ;
|
|
|
|
friend std::ostream &operator<<(std::ostream &os, const ComputeParams ¶ms)
|
|
{
|
|
return os << "ComputeParams{"
|
|
<< "numElements: " << params.numElements << ", "
|
|
<< "localSizeX: " << params.localSizeX << ", "
|
|
<< "localSizeY: " << params.localSizeY << ", "
|
|
<< "localSizeZ: " << params.localSizeZ << "}";
|
|
}
|
|
};
|
|
|
|
class ComputeTest : public testing::TestWithParam<ComputeParams>
|
|
{
|
|
protected:
|
|
static Driver driver;
|
|
|
|
static void SetUpTestSuite()
|
|
{
|
|
ASSERT_TRUE(driver.loadSwiftShader());
|
|
}
|
|
|
|
static void TearDownTestSuite()
|
|
{
|
|
driver.unload();
|
|
}
|
|
};
|
|
|
|
Driver ComputeTest::driver;
|
|
|
|
std::vector<uint32_t> compileSpirv(const char *assembly)
|
|
{
|
|
spvtools::SpirvTools core(SPV_ENV_VULKAN_1_0);
|
|
|
|
core.SetMessageConsumer([](spv_message_level_t, const char *, const spv_position_t &p, const char *m) {
|
|
FAIL() << p.line << ":" << p.column << ": " << m;
|
|
});
|
|
|
|
std::vector<uint32_t> spirv;
|
|
EXPECT_TRUE(core.Assemble(assembly, &spirv));
|
|
EXPECT_TRUE(core.Validate(spirv));
|
|
|
|
// Warn if the disassembly does not match the source assembly.
|
|
// We do this as debugging tests in the debugger is often made much harder
|
|
// if the SSA names (%X) in the debugger do not match the source.
|
|
std::string disassembled;
|
|
core.Disassemble(spirv, &disassembled, SPV_BINARY_TO_TEXT_OPTION_NO_HEADER);
|
|
if(disassembled != assembly)
|
|
{
|
|
printf("-- WARNING: Disassembly does not match assembly: ---\n\n");
|
|
|
|
auto splitLines = [](const std::string &str) -> std::vector<std::string> {
|
|
std::stringstream ss(str);
|
|
std::vector<std::string> out;
|
|
std::string line;
|
|
while(std::getline(ss, line, '\n')) { out.push_back(line); }
|
|
return out;
|
|
};
|
|
|
|
auto srcLines = splitLines(std::string(assembly));
|
|
auto disLines = splitLines(disassembled);
|
|
|
|
for(size_t line = 0; line < srcLines.size() && line < disLines.size(); line++)
|
|
{
|
|
auto srcLine = (line < srcLines.size()) ? srcLines[line] : "<missing>";
|
|
auto disLine = (line < disLines.size()) ? disLines[line] : "<missing>";
|
|
if(srcLine != disLine)
|
|
{
|
|
printf("%zu: '%s' != '%s'\n", line, srcLine.c_str(), disLine.c_str());
|
|
}
|
|
}
|
|
printf("\n\n---\nExpected:\n\n%s", disassembled.c_str());
|
|
}
|
|
|
|
return spirv;
|
|
}
|
|
|
|
#define VK_ASSERT(x) ASSERT_EQ(x, VK_SUCCESS)
|
|
|
|
// Base class for compute tests that read from an input buffer and write to an
|
|
// output buffer of same length.
|
|
class SwiftShaderVulkanBufferToBufferComputeTest : public ComputeTest
|
|
{
|
|
public:
|
|
void test(const std::string &shader,
|
|
std::function<uint32_t(uint32_t idx)> input,
|
|
std::function<uint32_t(uint32_t idx)> expected);
|
|
};
|
|
|
|
void SwiftShaderVulkanBufferToBufferComputeTest::test(
|
|
const std::string &shader,
|
|
std::function<uint32_t(uint32_t idx)> input,
|
|
std::function<uint32_t(uint32_t idx)> expected)
|
|
{
|
|
auto code = compileSpirv(shader.c_str());
|
|
|
|
const VkInstanceCreateInfo createInfo = {
|
|
VK_STRUCTURE_TYPE_INSTANCE_CREATE_INFO, // sType
|
|
nullptr, // pNext
|
|
0, // flags
|
|
nullptr, // pApplicationInfo
|
|
0, // enabledLayerCount
|
|
nullptr, // ppEnabledLayerNames
|
|
0, // enabledExtensionCount
|
|
nullptr, // ppEnabledExtensionNames
|
|
};
|
|
|
|
VkInstance instance = VK_NULL_HANDLE;
|
|
VK_ASSERT(driver.vkCreateInstance(&createInfo, nullptr, &instance));
|
|
|
|
ASSERT_TRUE(driver.resolve(instance));
|
|
|
|
std::unique_ptr<Device> device;
|
|
VK_ASSERT(Device::CreateComputeDevice(&driver, instance, device));
|
|
ASSERT_TRUE(device->IsValid());
|
|
|
|
// struct Buffers
|
|
// {
|
|
// uint32_t pad0[63];
|
|
// uint32_t magic0;
|
|
// uint32_t in[NUM_ELEMENTS]; // Aligned to 0x100
|
|
// uint32_t magic1;
|
|
// uint32_t pad1[N];
|
|
// uint32_t magic2;
|
|
// uint32_t out[NUM_ELEMENTS]; // Aligned to 0x100
|
|
// uint32_t magic3;
|
|
// };
|
|
static constexpr uint32_t magic0 = 0x01234567;
|
|
static constexpr uint32_t magic1 = 0x89abcdef;
|
|
static constexpr uint32_t magic2 = 0xfedcba99;
|
|
static constexpr uint32_t magic3 = 0x87654321;
|
|
size_t numElements = GetParam().numElements;
|
|
size_t alignElements = 0x100 / sizeof(uint32_t);
|
|
size_t magic0Offset = alignElements - 1;
|
|
size_t inOffset = 1 + magic0Offset;
|
|
size_t magic1Offset = numElements + inOffset;
|
|
size_t magic2Offset = alignUp(magic1Offset + 1, alignElements) - 1;
|
|
size_t outOffset = 1 + magic2Offset;
|
|
size_t magic3Offset = numElements + outOffset;
|
|
size_t buffersTotalElements = alignUp(1 + magic3Offset, alignElements);
|
|
size_t buffersSize = sizeof(uint32_t) * buffersTotalElements;
|
|
|
|
VkDeviceMemory memory;
|
|
VK_ASSERT(device->AllocateMemory(buffersSize,
|
|
VK_MEMORY_PROPERTY_HOST_VISIBLE_BIT | VK_MEMORY_PROPERTY_HOST_COHERENT_BIT,
|
|
&memory));
|
|
|
|
uint32_t *buffers;
|
|
VK_ASSERT(device->MapMemory(memory, 0, buffersSize, 0, (void **)&buffers));
|
|
|
|
buffers[magic0Offset] = magic0;
|
|
buffers[magic1Offset] = magic1;
|
|
buffers[magic2Offset] = magic2;
|
|
buffers[magic3Offset] = magic3;
|
|
|
|
for(size_t i = 0; i < numElements; i++)
|
|
{
|
|
buffers[inOffset + i] = input((uint32_t)i);
|
|
}
|
|
|
|
device->UnmapMemory(memory);
|
|
buffers = nullptr;
|
|
|
|
VkBuffer bufferIn;
|
|
VK_ASSERT(device->CreateStorageBuffer(memory,
|
|
sizeof(uint32_t) * numElements,
|
|
sizeof(uint32_t) * inOffset,
|
|
&bufferIn));
|
|
|
|
VkBuffer bufferOut;
|
|
VK_ASSERT(device->CreateStorageBuffer(memory,
|
|
sizeof(uint32_t) * numElements,
|
|
sizeof(uint32_t) * outOffset,
|
|
&bufferOut));
|
|
|
|
VkShaderModule shaderModule;
|
|
VK_ASSERT(device->CreateShaderModule(code, &shaderModule));
|
|
|
|
std::vector<VkDescriptorSetLayoutBinding> descriptorSetLayoutBindings = {
|
|
{
|
|
0, // binding
|
|
VK_DESCRIPTOR_TYPE_STORAGE_BUFFER, // descriptorType
|
|
1, // descriptorCount
|
|
VK_SHADER_STAGE_COMPUTE_BIT, // stageFlags
|
|
0, // pImmutableSamplers
|
|
},
|
|
{
|
|
1, // binding
|
|
VK_DESCRIPTOR_TYPE_STORAGE_BUFFER, // descriptorType
|
|
1, // descriptorCount
|
|
VK_SHADER_STAGE_COMPUTE_BIT, // stageFlags
|
|
0, // pImmutableSamplers
|
|
}
|
|
};
|
|
|
|
VkDescriptorSetLayout descriptorSetLayout;
|
|
VK_ASSERT(device->CreateDescriptorSetLayout(descriptorSetLayoutBindings, &descriptorSetLayout));
|
|
|
|
VkPipelineLayout pipelineLayout;
|
|
VK_ASSERT(device->CreatePipelineLayout(descriptorSetLayout, &pipelineLayout));
|
|
|
|
VkPipeline pipeline;
|
|
VK_ASSERT(device->CreateComputePipeline(shaderModule, pipelineLayout, &pipeline));
|
|
|
|
VkDescriptorPool descriptorPool;
|
|
VK_ASSERT(device->CreateStorageBufferDescriptorPool(2, &descriptorPool));
|
|
|
|
VkDescriptorSet descriptorSet;
|
|
VK_ASSERT(device->AllocateDescriptorSet(descriptorPool, descriptorSetLayout, &descriptorSet));
|
|
|
|
std::vector<VkDescriptorBufferInfo> descriptorBufferInfos = {
|
|
{
|
|
bufferIn, // buffer
|
|
0, // offset
|
|
VK_WHOLE_SIZE, // range
|
|
},
|
|
{
|
|
bufferOut, // buffer
|
|
0, // offset
|
|
VK_WHOLE_SIZE, // range
|
|
}
|
|
};
|
|
device->UpdateStorageBufferDescriptorSets(descriptorSet, descriptorBufferInfos);
|
|
|
|
VkCommandPool commandPool;
|
|
VK_ASSERT(device->CreateCommandPool(&commandPool));
|
|
|
|
VkCommandBuffer commandBuffer;
|
|
VK_ASSERT(device->AllocateCommandBuffer(commandPool, &commandBuffer));
|
|
|
|
VK_ASSERT(device->BeginCommandBuffer(VK_COMMAND_BUFFER_USAGE_ONE_TIME_SUBMIT_BIT, commandBuffer));
|
|
|
|
driver.vkCmdBindPipeline(commandBuffer, VK_PIPELINE_BIND_POINT_COMPUTE, pipeline);
|
|
|
|
driver.vkCmdBindDescriptorSets(commandBuffer, VK_PIPELINE_BIND_POINT_COMPUTE, pipelineLayout, 0, 1, &descriptorSet,
|
|
0, nullptr);
|
|
|
|
driver.vkCmdDispatch(commandBuffer, (uint32_t)(numElements / GetParam().localSizeX), 1, 1);
|
|
|
|
VK_ASSERT(driver.vkEndCommandBuffer(commandBuffer));
|
|
|
|
VK_ASSERT(device->QueueSubmitAndWait(commandBuffer));
|
|
|
|
VK_ASSERT(device->MapMemory(memory, 0, buffersSize, 0, (void **)&buffers));
|
|
|
|
for(size_t i = 0; i < numElements; ++i)
|
|
{
|
|
auto got = buffers[i + outOffset];
|
|
EXPECT_EQ(expected((uint32_t)i), got) << "Unexpected output at " << i;
|
|
}
|
|
|
|
// Check for writes outside of bounds.
|
|
EXPECT_EQ(buffers[magic0Offset], magic0);
|
|
EXPECT_EQ(buffers[magic1Offset], magic1);
|
|
EXPECT_EQ(buffers[magic2Offset], magic2);
|
|
EXPECT_EQ(buffers[magic3Offset], magic3);
|
|
|
|
device->UnmapMemory(memory);
|
|
buffers = nullptr;
|
|
|
|
device->FreeCommandBuffer(commandPool, commandBuffer);
|
|
device->FreeMemory(memory);
|
|
device->DestroyPipeline(pipeline);
|
|
device->DestroyCommandPool(commandPool);
|
|
device->DestroyPipelineLayout(pipelineLayout);
|
|
device->DestroyDescriptorSetLayout(descriptorSetLayout);
|
|
device->DestroyDescriptorPool(descriptorPool);
|
|
device->DestroyBuffer(bufferIn);
|
|
device->DestroyBuffer(bufferOut);
|
|
device->DestroyShaderModule(shaderModule);
|
|
device.reset(nullptr);
|
|
driver.vkDestroyInstance(instance, nullptr);
|
|
}
|
|
|
|
INSTANTIATE_TEST_SUITE_P(ComputeParams, SwiftShaderVulkanBufferToBufferComputeTest, testing::Values(ComputeParams{ 512, 1, 1, 1 }, ComputeParams{ 512, 2, 1, 1 }, ComputeParams{ 512, 4, 1, 1 }, ComputeParams{ 512, 8, 1, 1 }, ComputeParams{ 512, 16, 1, 1 }, ComputeParams{ 512, 32, 1, 1 },
|
|
|
|
// Non-multiple of SIMD-lane.
|
|
ComputeParams{ 3, 1, 1, 1 }, ComputeParams{ 2, 1, 1, 1 }));
|
|
|
|
TEST_P(SwiftShaderVulkanBufferToBufferComputeTest, Memcpy)
|
|
{
|
|
std::stringstream src;
|
|
// #version 450
|
|
// layout(local_size_x = 1, local_size_y = 1, local_size_z = 1) in;
|
|
// layout(binding = 0, std430) buffer InBuffer
|
|
// {
|
|
// int Data[];
|
|
// } In;
|
|
// layout(binding = 1, std430) buffer OutBuffer
|
|
// {
|
|
// int Data[];
|
|
// } Out;
|
|
// void main()
|
|
// {
|
|
// Out.Data[gl_GlobalInvocationID.x] = In.Data[gl_GlobalInvocationID.x];
|
|
// }
|
|
// clang-format off
|
|
src <<
|
|
"OpCapability Shader\n"
|
|
"OpMemoryModel Logical GLSL450\n"
|
|
"OpEntryPoint GLCompute %1 \"main\" %2\n"
|
|
"OpExecutionMode %1 LocalSize " <<
|
|
GetParam().localSizeX << " " <<
|
|
GetParam().localSizeY << " " <<
|
|
GetParam().localSizeZ << "\n" <<
|
|
"OpDecorate %3 ArrayStride 4\n"
|
|
"OpMemberDecorate %4 0 Offset 0\n"
|
|
"OpDecorate %4 BufferBlock\n"
|
|
"OpDecorate %5 DescriptorSet 0\n"
|
|
"OpDecorate %5 Binding 1\n"
|
|
"OpDecorate %2 BuiltIn GlobalInvocationId\n"
|
|
"OpDecorate %6 DescriptorSet 0\n"
|
|
"OpDecorate %6 Binding 0\n"
|
|
"%7 = OpTypeVoid\n"
|
|
"%8 = OpTypeFunction %7\n" // void()
|
|
"%9 = OpTypeInt 32 1\n" // int32
|
|
"%10 = OpTypeInt 32 0\n" // uint32
|
|
"%3 = OpTypeRuntimeArray %9\n" // int32[]
|
|
"%4 = OpTypeStruct %3\n" // struct{ int32[] }
|
|
"%11 = OpTypePointer Uniform %4\n" // struct{ int32[] }*
|
|
"%5 = OpVariable %11 Uniform\n" // struct{ int32[] }* in
|
|
"%12 = OpConstant %9 0\n" // int32(0)
|
|
"%13 = OpConstant %10 0\n" // uint32(0)
|
|
"%14 = OpTypeVector %10 3\n" // vec3<int32>
|
|
"%15 = OpTypePointer Input %14\n" // vec3<int32>*
|
|
"%2 = OpVariable %15 Input\n" // gl_GlobalInvocationId
|
|
"%16 = OpTypePointer Input %10\n" // uint32*
|
|
"%6 = OpVariable %11 Uniform\n" // struct{ int32[] }* out
|
|
"%17 = OpTypePointer Uniform %9\n" // int32*
|
|
"%1 = OpFunction %7 None %8\n" // -- Function begin --
|
|
"%18 = OpLabel\n"
|
|
"%19 = OpAccessChain %16 %2 %13\n" // &gl_GlobalInvocationId.x
|
|
"%20 = OpLoad %10 %19\n" // gl_GlobalInvocationId.x
|
|
"%21 = OpAccessChain %17 %6 %12 %20\n" // &in.arr[gl_GlobalInvocationId.x]
|
|
"%22 = OpLoad %9 %21\n" // in.arr[gl_GlobalInvocationId.x]
|
|
"%23 = OpAccessChain %17 %5 %12 %20\n" // &out.arr[gl_GlobalInvocationId.x]
|
|
"OpStore %23 %22\n" // out.arr[gl_GlobalInvocationId.x] = in[gl_GlobalInvocationId.x]
|
|
"OpReturn\n"
|
|
"OpFunctionEnd\n";
|
|
// clang-format on
|
|
|
|
test(
|
|
src.str(), [](uint32_t i) { return i; }, [](uint32_t i) { return i; });
|
|
}
|
|
|
|
TEST_P(SwiftShaderVulkanBufferToBufferComputeTest, GlobalInvocationId)
|
|
{
|
|
std::stringstream src;
|
|
// clang-format off
|
|
src <<
|
|
"OpCapability Shader\n"
|
|
"OpMemoryModel Logical GLSL450\n"
|
|
"OpEntryPoint GLCompute %1 \"main\" %2\n"
|
|
"OpExecutionMode %1 LocalSize " <<
|
|
GetParam().localSizeX << " " <<
|
|
GetParam().localSizeY << " " <<
|
|
GetParam().localSizeZ << "\n" <<
|
|
"OpDecorate %3 ArrayStride 4\n"
|
|
"OpMemberDecorate %4 0 Offset 0\n"
|
|
"OpDecorate %4 BufferBlock\n"
|
|
"OpDecorate %5 DescriptorSet 0\n"
|
|
"OpDecorate %5 Binding 1\n"
|
|
"OpDecorate %2 BuiltIn GlobalInvocationId\n"
|
|
"OpDecorate %6 DescriptorSet 0\n"
|
|
"OpDecorate %6 Binding 0\n"
|
|
"%7 = OpTypeVoid\n"
|
|
"%8 = OpTypeFunction %7\n" // void()
|
|
"%9 = OpTypeInt 32 1\n" // int32
|
|
"%10 = OpTypeInt 32 0\n" // uint32
|
|
"%3 = OpTypeRuntimeArray %9\n" // int32[]
|
|
"%4 = OpTypeStruct %3\n" // struct{ int32[] }
|
|
"%11 = OpTypePointer Uniform %4\n" // struct{ int32[] }*
|
|
"%5 = OpVariable %11 Uniform\n" // struct{ int32[] }* in
|
|
"%12 = OpConstant %9 0\n" // int32(0)
|
|
"%13 = OpConstant %9 1\n" // int32(1)
|
|
"%14 = OpConstant %10 0\n" // uint32(0)
|
|
"%15 = OpConstant %10 1\n" // uint32(1)
|
|
"%16 = OpConstant %10 2\n" // uint32(2)
|
|
"%17 = OpTypeVector %10 3\n" // vec3<int32>
|
|
"%18 = OpTypePointer Input %17\n" // vec3<int32>*
|
|
"%2 = OpVariable %18 Input\n" // gl_GlobalInvocationId
|
|
"%19 = OpTypePointer Input %10\n" // uint32*
|
|
"%6 = OpVariable %11 Uniform\n" // struct{ int32[] }* out
|
|
"%20 = OpTypePointer Uniform %9\n" // int32*
|
|
"%1 = OpFunction %7 None %8\n" // -- Function begin --
|
|
"%21 = OpLabel\n"
|
|
"%22 = OpAccessChain %19 %2 %14\n" // &gl_GlobalInvocationId.x
|
|
"%23 = OpAccessChain %19 %2 %15\n" // &gl_GlobalInvocationId.y
|
|
"%24 = OpAccessChain %19 %2 %16\n" // &gl_GlobalInvocationId.z
|
|
"%25 = OpLoad %10 %22\n" // gl_GlobalInvocationId.x
|
|
"%26 = OpLoad %10 %23\n" // gl_GlobalInvocationId.y
|
|
"%27 = OpLoad %10 %24\n" // gl_GlobalInvocationId.z
|
|
"%28 = OpAccessChain %20 %6 %12 %25\n" // &in.arr[gl_GlobalInvocationId.x]
|
|
"%29 = OpLoad %9 %28\n" // out.arr[gl_GlobalInvocationId.x]
|
|
"%30 = OpIAdd %9 %29 %26\n" // in[gl_GlobalInvocationId.x] + gl_GlobalInvocationId.y
|
|
"%31 = OpIAdd %9 %30 %27\n" // in[gl_GlobalInvocationId.x] + gl_GlobalInvocationId.y + gl_GlobalInvocationId.z
|
|
"%32 = OpAccessChain %20 %5 %12 %25\n" // &out.arr[gl_GlobalInvocationId.x]
|
|
"OpStore %32 %31\n" // out.arr[gl_GlobalInvocationId.x] = in[gl_GlobalInvocationId.x] + gl_GlobalInvocationId.y + gl_GlobalInvocationId.z
|
|
"OpReturn\n"
|
|
"OpFunctionEnd\n";
|
|
// clang-format on
|
|
|
|
// gl_GlobalInvocationId.y and gl_GlobalInvocationId.z should both be zero.
|
|
test(
|
|
src.str(), [](uint32_t i) { return i; }, [](uint32_t i) { return i; });
|
|
}
|
|
|
|
TEST_P(SwiftShaderVulkanBufferToBufferComputeTest, BranchSimple)
|
|
{
|
|
std::stringstream src;
|
|
// clang-format off
|
|
src <<
|
|
"OpCapability Shader\n"
|
|
"OpMemoryModel Logical GLSL450\n"
|
|
"OpEntryPoint GLCompute %1 \"main\" %2\n"
|
|
"OpExecutionMode %1 LocalSize " <<
|
|
GetParam().localSizeX << " " <<
|
|
GetParam().localSizeY << " " <<
|
|
GetParam().localSizeZ << "\n" <<
|
|
"OpDecorate %3 ArrayStride 4\n"
|
|
"OpMemberDecorate %4 0 Offset 0\n"
|
|
"OpDecorate %4 BufferBlock\n"
|
|
"OpDecorate %5 DescriptorSet 0\n"
|
|
"OpDecorate %5 Binding 1\n"
|
|
"OpDecorate %2 BuiltIn GlobalInvocationId\n"
|
|
"OpDecorate %6 DescriptorSet 0\n"
|
|
"OpDecorate %6 Binding 0\n"
|
|
"%7 = OpTypeVoid\n"
|
|
"%8 = OpTypeFunction %7\n" // void()
|
|
"%9 = OpTypeInt 32 1\n" // int32
|
|
"%10 = OpTypeInt 32 0\n" // uint32
|
|
"%3 = OpTypeRuntimeArray %9\n" // int32[]
|
|
"%4 = OpTypeStruct %3\n" // struct{ int32[] }
|
|
"%11 = OpTypePointer Uniform %4\n" // struct{ int32[] }*
|
|
"%5 = OpVariable %11 Uniform\n" // struct{ int32[] }* in
|
|
"%12 = OpConstant %9 0\n" // int32(0)
|
|
"%13 = OpConstant %10 0\n" // uint32(0)
|
|
"%14 = OpTypeVector %10 3\n" // vec3<int32>
|
|
"%15 = OpTypePointer Input %14\n" // vec3<int32>*
|
|
"%2 = OpVariable %15 Input\n" // gl_GlobalInvocationId
|
|
"%16 = OpTypePointer Input %10\n" // uint32*
|
|
"%6 = OpVariable %11 Uniform\n" // struct{ int32[] }* out
|
|
"%17 = OpTypePointer Uniform %9\n" // int32*
|
|
"%1 = OpFunction %7 None %8\n" // -- Function begin --
|
|
"%18 = OpLabel\n"
|
|
"%19 = OpAccessChain %16 %2 %13\n" // &gl_GlobalInvocationId.x
|
|
"%20 = OpLoad %10 %19\n" // gl_GlobalInvocationId.x
|
|
"%21 = OpAccessChain %17 %6 %12 %20\n" // &in.arr[gl_GlobalInvocationId.x]
|
|
"%22 = OpLoad %9 %21\n" // in.arr[gl_GlobalInvocationId.x]
|
|
"%23 = OpAccessChain %17 %5 %12 %20\n" // &out.arr[gl_GlobalInvocationId.x]
|
|
// Start of branch logic
|
|
// %22 = in value
|
|
"OpBranch %24\n"
|
|
"%24 = OpLabel\n"
|
|
"OpBranch %25\n"
|
|
"%25 = OpLabel\n"
|
|
"OpBranch %26\n"
|
|
"%26 = OpLabel\n"
|
|
// %22 = out value
|
|
// End of branch logic
|
|
"OpStore %23 %22\n"
|
|
"OpReturn\n"
|
|
"OpFunctionEnd\n";
|
|
// clang-format on
|
|
|
|
test(
|
|
src.str(), [](uint32_t i) { return i; }, [](uint32_t i) { return i; });
|
|
}
|
|
|
|
TEST_P(SwiftShaderVulkanBufferToBufferComputeTest, BranchDeclareSSA)
|
|
{
|
|
std::stringstream src;
|
|
// clang-format off
|
|
src <<
|
|
"OpCapability Shader\n"
|
|
"OpMemoryModel Logical GLSL450\n"
|
|
"OpEntryPoint GLCompute %1 \"main\" %2\n"
|
|
"OpExecutionMode %1 LocalSize " <<
|
|
GetParam().localSizeX << " " <<
|
|
GetParam().localSizeY << " " <<
|
|
GetParam().localSizeZ << "\n" <<
|
|
"OpDecorate %3 ArrayStride 4\n"
|
|
"OpMemberDecorate %4 0 Offset 0\n"
|
|
"OpDecorate %4 BufferBlock\n"
|
|
"OpDecorate %5 DescriptorSet 0\n"
|
|
"OpDecorate %5 Binding 1\n"
|
|
"OpDecorate %2 BuiltIn GlobalInvocationId\n"
|
|
"OpDecorate %6 DescriptorSet 0\n"
|
|
"OpDecorate %6 Binding 0\n"
|
|
"%7 = OpTypeVoid\n"
|
|
"%8 = OpTypeFunction %7\n" // void()
|
|
"%9 = OpTypeInt 32 1\n" // int32
|
|
"%10 = OpTypeInt 32 0\n" // uint32
|
|
"%3 = OpTypeRuntimeArray %9\n" // int32[]
|
|
"%4 = OpTypeStruct %3\n" // struct{ int32[] }
|
|
"%11 = OpTypePointer Uniform %4\n" // struct{ int32[] }*
|
|
"%5 = OpVariable %11 Uniform\n" // struct{ int32[] }* in
|
|
"%12 = OpConstant %9 0\n" // int32(0)
|
|
"%13 = OpConstant %10 0\n" // uint32(0)
|
|
"%14 = OpTypeVector %10 3\n" // vec3<int32>
|
|
"%15 = OpTypePointer Input %14\n" // vec3<int32>*
|
|
"%2 = OpVariable %15 Input\n" // gl_GlobalInvocationId
|
|
"%16 = OpTypePointer Input %10\n" // uint32*
|
|
"%6 = OpVariable %11 Uniform\n" // struct{ int32[] }* out
|
|
"%17 = OpTypePointer Uniform %9\n" // int32*
|
|
"%1 = OpFunction %7 None %8\n" // -- Function begin --
|
|
"%18 = OpLabel\n"
|
|
"%19 = OpAccessChain %16 %2 %13\n" // &gl_GlobalInvocationId.x
|
|
"%20 = OpLoad %10 %19\n" // gl_GlobalInvocationId.x
|
|
"%21 = OpAccessChain %17 %6 %12 %20\n" // &in.arr[gl_GlobalInvocationId.x]
|
|
"%22 = OpLoad %9 %21\n" // in.arr[gl_GlobalInvocationId.x]
|
|
"%23 = OpAccessChain %17 %5 %12 %20\n" // &out.arr[gl_GlobalInvocationId.x]
|
|
// Start of branch logic
|
|
// %22 = in value
|
|
"OpBranch %24\n"
|
|
"%24 = OpLabel\n"
|
|
"%25 = OpIAdd %9 %22 %22\n" // %25 = in*2
|
|
"OpBranch %26\n"
|
|
"%26 = OpLabel\n"
|
|
"OpBranch %27\n"
|
|
"%27 = OpLabel\n"
|
|
// %25 = out value
|
|
// End of branch logic
|
|
"OpStore %23 %25\n" // use SSA value from previous block
|
|
"OpReturn\n"
|
|
"OpFunctionEnd\n";
|
|
// clang-format on
|
|
|
|
test(
|
|
src.str(), [](uint32_t i) { return i; }, [](uint32_t i) { return i * 2; });
|
|
}
|
|
|
|
TEST_P(SwiftShaderVulkanBufferToBufferComputeTest, BranchConditionalSimple)
|
|
{
|
|
std::stringstream src;
|
|
// clang-format off
|
|
src <<
|
|
"OpCapability Shader\n"
|
|
"OpMemoryModel Logical GLSL450\n"
|
|
"OpEntryPoint GLCompute %1 \"main\" %2\n"
|
|
"OpExecutionMode %1 LocalSize " <<
|
|
GetParam().localSizeX << " " <<
|
|
GetParam().localSizeY << " " <<
|
|
GetParam().localSizeZ << "\n" <<
|
|
"OpDecorate %3 ArrayStride 4\n"
|
|
"OpMemberDecorate %4 0 Offset 0\n"
|
|
"OpDecorate %4 BufferBlock\n"
|
|
"OpDecorate %5 DescriptorSet 0\n"
|
|
"OpDecorate %5 Binding 1\n"
|
|
"OpDecorate %2 BuiltIn GlobalInvocationId\n"
|
|
"OpDecorate %6 DescriptorSet 0\n"
|
|
"OpDecorate %6 Binding 0\n"
|
|
"%7 = OpTypeVoid\n"
|
|
"%8 = OpTypeFunction %7\n" // void()
|
|
"%9 = OpTypeInt 32 1\n" // int32
|
|
"%10 = OpTypeInt 32 0\n" // uint32
|
|
"%11 = OpTypeBool\n"
|
|
"%3 = OpTypeRuntimeArray %9\n" // int32[]
|
|
"%4 = OpTypeStruct %3\n" // struct{ int32[] }
|
|
"%12 = OpTypePointer Uniform %4\n" // struct{ int32[] }*
|
|
"%5 = OpVariable %12 Uniform\n" // struct{ int32[] }* in
|
|
"%13 = OpConstant %9 0\n" // int32(0)
|
|
"%14 = OpConstant %9 2\n" // int32(2)
|
|
"%15 = OpConstant %10 0\n" // uint32(0)
|
|
"%16 = OpTypeVector %10 3\n" // vec4<int32>
|
|
"%17 = OpTypePointer Input %16\n" // vec4<int32>*
|
|
"%2 = OpVariable %17 Input\n" // gl_GlobalInvocationId
|
|
"%18 = OpTypePointer Input %10\n" // uint32*
|
|
"%6 = OpVariable %12 Uniform\n" // struct{ int32[] }* out
|
|
"%19 = OpTypePointer Uniform %9\n" // int32*
|
|
"%1 = OpFunction %7 None %8\n" // -- Function begin --
|
|
"%20 = OpLabel\n"
|
|
"%21 = OpAccessChain %18 %2 %15\n" // &gl_GlobalInvocationId.x
|
|
"%22 = OpLoad %10 %21\n" // gl_GlobalInvocationId.x
|
|
"%23 = OpAccessChain %19 %6 %13 %22\n" // &in.arr[gl_GlobalInvocationId.x]
|
|
"%24 = OpLoad %9 %23\n" // in.arr[gl_GlobalInvocationId.x]
|
|
"%25 = OpAccessChain %19 %5 %13 %22\n" // &out.arr[gl_GlobalInvocationId.x]
|
|
// Start of branch logic
|
|
// %24 = in value
|
|
"%26 = OpSMod %9 %24 %14\n" // in % 2
|
|
"%27 = OpIEqual %11 %26 %13\n" // (in % 2) == 0
|
|
"OpSelectionMerge %28 None\n"
|
|
"OpBranchConditional %27 %28 %28\n" // Both go to %28
|
|
"%28 = OpLabel\n"
|
|
// %26 = out value
|
|
// End of branch logic
|
|
"OpStore %25 %26\n" // use SSA value from previous block
|
|
"OpReturn\n"
|
|
"OpFunctionEnd\n";
|
|
// clang-format on
|
|
|
|
test(
|
|
src.str(), [](uint32_t i) { return i; }, [](uint32_t i) { return i % 2; });
|
|
}
|
|
|
|
TEST_P(SwiftShaderVulkanBufferToBufferComputeTest, BranchConditionalTwoEmptyBlocks)
|
|
{
|
|
std::stringstream src;
|
|
// clang-format off
|
|
src <<
|
|
"OpCapability Shader\n"
|
|
"OpMemoryModel Logical GLSL450\n"
|
|
"OpEntryPoint GLCompute %1 \"main\" %2\n"
|
|
"OpExecutionMode %1 LocalSize " <<
|
|
GetParam().localSizeX << " " <<
|
|
GetParam().localSizeY << " " <<
|
|
GetParam().localSizeZ << "\n" <<
|
|
"OpDecorate %3 ArrayStride 4\n"
|
|
"OpMemberDecorate %4 0 Offset 0\n"
|
|
"OpDecorate %4 BufferBlock\n"
|
|
"OpDecorate %5 DescriptorSet 0\n"
|
|
"OpDecorate %5 Binding 1\n"
|
|
"OpDecorate %2 BuiltIn GlobalInvocationId\n"
|
|
"OpDecorate %6 DescriptorSet 0\n"
|
|
"OpDecorate %6 Binding 0\n"
|
|
"%7 = OpTypeVoid\n"
|
|
"%8 = OpTypeFunction %7\n" // void()
|
|
"%9 = OpTypeInt 32 1\n" // int32
|
|
"%10 = OpTypeInt 32 0\n" // uint32
|
|
"%11 = OpTypeBool\n"
|
|
"%3 = OpTypeRuntimeArray %9\n" // int32[]
|
|
"%4 = OpTypeStruct %3\n" // struct{ int32[] }
|
|
"%12 = OpTypePointer Uniform %4\n" // struct{ int32[] }*
|
|
"%5 = OpVariable %12 Uniform\n" // struct{ int32[] }* in
|
|
"%13 = OpConstant %9 0\n" // int32(0)
|
|
"%14 = OpConstant %9 2\n" // int32(2)
|
|
"%15 = OpConstant %10 0\n" // uint32(0)
|
|
"%16 = OpTypeVector %10 3\n" // vec4<int32>
|
|
"%17 = OpTypePointer Input %16\n" // vec4<int32>*
|
|
"%2 = OpVariable %17 Input\n" // gl_GlobalInvocationId
|
|
"%18 = OpTypePointer Input %10\n" // uint32*
|
|
"%6 = OpVariable %12 Uniform\n" // struct{ int32[] }* out
|
|
"%19 = OpTypePointer Uniform %9\n" // int32*
|
|
"%1 = OpFunction %7 None %8\n" // -- Function begin --
|
|
"%20 = OpLabel\n"
|
|
"%21 = OpAccessChain %18 %2 %15\n" // &gl_GlobalInvocationId.x
|
|
"%22 = OpLoad %10 %21\n" // gl_GlobalInvocationId.x
|
|
"%23 = OpAccessChain %19 %6 %13 %22\n" // &in.arr[gl_GlobalInvocationId.x]
|
|
"%24 = OpLoad %9 %23\n" // in.arr[gl_GlobalInvocationId.x]
|
|
"%25 = OpAccessChain %19 %5 %13 %22\n" // &out.arr[gl_GlobalInvocationId.x]
|
|
// Start of branch logic
|
|
// %24 = in value
|
|
"%26 = OpSMod %9 %24 %14\n" // in % 2
|
|
"%27 = OpIEqual %11 %26 %13\n" // (in % 2) == 0
|
|
"OpSelectionMerge %28 None\n"
|
|
"OpBranchConditional %27 %29 %30\n"
|
|
"%29 = OpLabel\n" // (in % 2) == 0
|
|
"OpBranch %28\n"
|
|
"%30 = OpLabel\n" // (in % 2) != 0
|
|
"OpBranch %28\n"
|
|
"%28 = OpLabel\n"
|
|
// %26 = out value
|
|
// End of branch logic
|
|
"OpStore %25 %26\n" // use SSA value from previous block
|
|
"OpReturn\n"
|
|
"OpFunctionEnd\n";
|
|
// clang-format on
|
|
|
|
test(
|
|
src.str(), [](uint32_t i) { return i; }, [](uint32_t i) { return i % 2; });
|
|
}
|
|
|
|
// TODO: Test for parallel assignment
|
|
TEST_P(SwiftShaderVulkanBufferToBufferComputeTest, BranchConditionalStore)
|
|
{
|
|
std::stringstream src;
|
|
// clang-format off
|
|
src <<
|
|
"OpCapability Shader\n"
|
|
"OpMemoryModel Logical GLSL450\n"
|
|
"OpEntryPoint GLCompute %1 \"main\" %2\n"
|
|
"OpExecutionMode %1 LocalSize " <<
|
|
GetParam().localSizeX << " " <<
|
|
GetParam().localSizeY << " " <<
|
|
GetParam().localSizeZ << "\n" <<
|
|
"OpDecorate %3 ArrayStride 4\n"
|
|
"OpMemberDecorate %4 0 Offset 0\n"
|
|
"OpDecorate %4 BufferBlock\n"
|
|
"OpDecorate %5 DescriptorSet 0\n"
|
|
"OpDecorate %5 Binding 1\n"
|
|
"OpDecorate %2 BuiltIn GlobalInvocationId\n"
|
|
"OpDecorate %6 DescriptorSet 0\n"
|
|
"OpDecorate %6 Binding 0\n"
|
|
"%7 = OpTypeVoid\n"
|
|
"%8 = OpTypeFunction %7\n" // void()
|
|
"%9 = OpTypeInt 32 1\n" // int32
|
|
"%10 = OpTypeInt 32 0\n" // uint32
|
|
"%11 = OpTypeBool\n"
|
|
"%3 = OpTypeRuntimeArray %9\n" // int32[]
|
|
"%4 = OpTypeStruct %3\n" // struct{ int32[] }
|
|
"%12 = OpTypePointer Uniform %4\n" // struct{ int32[] }*
|
|
"%5 = OpVariable %12 Uniform\n" // struct{ int32[] }* in
|
|
"%13 = OpConstant %9 0\n" // int32(0)
|
|
"%14 = OpConstant %9 1\n" // int32(1)
|
|
"%15 = OpConstant %9 2\n" // int32(2)
|
|
"%16 = OpConstant %10 0\n" // uint32(0)
|
|
"%17 = OpTypeVector %10 3\n" // vec4<int32>
|
|
"%18 = OpTypePointer Input %17\n" // vec4<int32>*
|
|
"%2 = OpVariable %18 Input\n" // gl_GlobalInvocationId
|
|
"%19 = OpTypePointer Input %10\n" // uint32*
|
|
"%6 = OpVariable %12 Uniform\n" // struct{ int32[] }* out
|
|
"%20 = OpTypePointer Uniform %9\n" // int32*
|
|
"%1 = OpFunction %7 None %8\n" // -- Function begin --
|
|
"%21 = OpLabel\n"
|
|
"%22 = OpAccessChain %19 %2 %16\n" // &gl_GlobalInvocationId.x
|
|
"%23 = OpLoad %10 %22\n" // gl_GlobalInvocationId.x
|
|
"%24 = OpAccessChain %20 %6 %13 %23\n" // &in.arr[gl_GlobalInvocationId.x]
|
|
"%25 = OpLoad %9 %24\n" // in.arr[gl_GlobalInvocationId.x]
|
|
"%26 = OpAccessChain %20 %5 %13 %23\n" // &out.arr[gl_GlobalInvocationId.x]
|
|
// Start of branch logic
|
|
// %25 = in value
|
|
"%27 = OpSMod %9 %25 %15\n" // in % 2
|
|
"%28 = OpIEqual %11 %27 %13\n" // (in % 2) == 0
|
|
"OpSelectionMerge %29 None\n"
|
|
"OpBranchConditional %28 %30 %31\n"
|
|
"%30 = OpLabel\n" // (in % 2) == 0
|
|
"OpStore %26 %14\n" // write 1
|
|
"OpBranch %29\n"
|
|
"%31 = OpLabel\n" // (in % 2) != 0
|
|
"OpStore %26 %15\n" // write 2
|
|
"OpBranch %29\n"
|
|
"%29 = OpLabel\n"
|
|
// End of branch logic
|
|
"OpReturn\n"
|
|
"OpFunctionEnd\n";
|
|
// clang-format on
|
|
|
|
test(
|
|
src.str(), [](uint32_t i) { return i; }, [](uint32_t i) { return (i % 2) == 0 ? 1 : 2; });
|
|
}
|
|
|
|
TEST_P(SwiftShaderVulkanBufferToBufferComputeTest, BranchConditionalReturnTrue)
|
|
{
|
|
std::stringstream src;
|
|
// clang-format off
|
|
src <<
|
|
"OpCapability Shader\n"
|
|
"OpMemoryModel Logical GLSL450\n"
|
|
"OpEntryPoint GLCompute %1 \"main\" %2\n"
|
|
"OpExecutionMode %1 LocalSize " <<
|
|
GetParam().localSizeX << " " <<
|
|
GetParam().localSizeY << " " <<
|
|
GetParam().localSizeZ << "\n" <<
|
|
"OpDecorate %3 ArrayStride 4\n"
|
|
"OpMemberDecorate %4 0 Offset 0\n"
|
|
"OpDecorate %4 BufferBlock\n"
|
|
"OpDecorate %5 DescriptorSet 0\n"
|
|
"OpDecorate %5 Binding 1\n"
|
|
"OpDecorate %2 BuiltIn GlobalInvocationId\n"
|
|
"OpDecorate %6 DescriptorSet 0\n"
|
|
"OpDecorate %6 Binding 0\n"
|
|
"%7 = OpTypeVoid\n"
|
|
"%8 = OpTypeFunction %7\n" // void()
|
|
"%9 = OpTypeInt 32 1\n" // int32
|
|
"%10 = OpTypeInt 32 0\n" // uint32
|
|
"%11 = OpTypeBool\n"
|
|
"%3 = OpTypeRuntimeArray %9\n" // int32[]
|
|
"%4 = OpTypeStruct %3\n" // struct{ int32[] }
|
|
"%12 = OpTypePointer Uniform %4\n" // struct{ int32[] }*
|
|
"%5 = OpVariable %12 Uniform\n" // struct{ int32[] }* in
|
|
"%13 = OpConstant %9 0\n" // int32(0)
|
|
"%14 = OpConstant %9 1\n" // int32(1)
|
|
"%15 = OpConstant %9 2\n" // int32(2)
|
|
"%16 = OpConstant %10 0\n" // uint32(0)
|
|
"%17 = OpTypeVector %10 3\n" // vec4<int32>
|
|
"%18 = OpTypePointer Input %17\n" // vec4<int32>*
|
|
"%2 = OpVariable %18 Input\n" // gl_GlobalInvocationId
|
|
"%19 = OpTypePointer Input %10\n" // uint32*
|
|
"%6 = OpVariable %12 Uniform\n" // struct{ int32[] }* out
|
|
"%20 = OpTypePointer Uniform %9\n" // int32*
|
|
"%1 = OpFunction %7 None %8\n" // -- Function begin --
|
|
"%21 = OpLabel\n"
|
|
"%22 = OpAccessChain %19 %2 %16\n" // &gl_GlobalInvocationId.x
|
|
"%23 = OpLoad %10 %22\n" // gl_GlobalInvocationId.x
|
|
"%24 = OpAccessChain %20 %6 %13 %23\n" // &in.arr[gl_GlobalInvocationId.x]
|
|
"%25 = OpLoad %9 %24\n" // in.arr[gl_GlobalInvocationId.x]
|
|
"%26 = OpAccessChain %20 %5 %13 %23\n" // &out.arr[gl_GlobalInvocationId.x]
|
|
// Start of branch logic
|
|
// %25 = in value
|
|
"%27 = OpSMod %9 %25 %15\n" // in % 2
|
|
"%28 = OpIEqual %11 %27 %13\n" // (in % 2) == 0
|
|
"OpSelectionMerge %29 None\n"
|
|
"OpBranchConditional %28 %30 %29\n"
|
|
"%30 = OpLabel\n" // (in % 2) == 0
|
|
"OpReturn\n"
|
|
"%29 = OpLabel\n" // merge
|
|
"OpStore %26 %15\n" // write 2
|
|
// End of branch logic
|
|
"OpReturn\n"
|
|
"OpFunctionEnd\n";
|
|
// clang-format on
|
|
|
|
test(
|
|
src.str(), [](uint32_t i) { return i; }, [](uint32_t i) { return (i % 2) == 0 ? 0 : 2; });
|
|
}
|
|
|
|
// TODO: Test for parallel assignment
|
|
TEST_P(SwiftShaderVulkanBufferToBufferComputeTest, BranchConditionalPhi)
|
|
{
|
|
std::stringstream src;
|
|
// clang-format off
|
|
src <<
|
|
"OpCapability Shader\n"
|
|
"OpMemoryModel Logical GLSL450\n"
|
|
"OpEntryPoint GLCompute %1 \"main\" %2\n"
|
|
"OpExecutionMode %1 LocalSize " <<
|
|
GetParam().localSizeX << " " <<
|
|
GetParam().localSizeY << " " <<
|
|
GetParam().localSizeZ << "\n" <<
|
|
"OpDecorate %3 ArrayStride 4\n"
|
|
"OpMemberDecorate %4 0 Offset 0\n"
|
|
"OpDecorate %4 BufferBlock\n"
|
|
"OpDecorate %5 DescriptorSet 0\n"
|
|
"OpDecorate %5 Binding 1\n"
|
|
"OpDecorate %2 BuiltIn GlobalInvocationId\n"
|
|
"OpDecorate %6 DescriptorSet 0\n"
|
|
"OpDecorate %6 Binding 0\n"
|
|
"%7 = OpTypeVoid\n"
|
|
"%8 = OpTypeFunction %7\n" // void()
|
|
"%9 = OpTypeInt 32 1\n" // int32
|
|
"%10 = OpTypeInt 32 0\n" // uint32
|
|
"%11 = OpTypeBool\n"
|
|
"%3 = OpTypeRuntimeArray %9\n" // int32[]
|
|
"%4 = OpTypeStruct %3\n" // struct{ int32[] }
|
|
"%12 = OpTypePointer Uniform %4\n" // struct{ int32[] }*
|
|
"%5 = OpVariable %12 Uniform\n" // struct{ int32[] }* in
|
|
"%13 = OpConstant %9 0\n" // int32(0)
|
|
"%14 = OpConstant %9 1\n" // int32(1)
|
|
"%15 = OpConstant %9 2\n" // int32(2)
|
|
"%16 = OpConstant %10 0\n" // uint32(0)
|
|
"%17 = OpTypeVector %10 3\n" // vec4<int32>
|
|
"%18 = OpTypePointer Input %17\n" // vec4<int32>*
|
|
"%2 = OpVariable %18 Input\n" // gl_GlobalInvocationId
|
|
"%19 = OpTypePointer Input %10\n" // uint32*
|
|
"%6 = OpVariable %12 Uniform\n" // struct{ int32[] }* out
|
|
"%20 = OpTypePointer Uniform %9\n" // int32*
|
|
"%1 = OpFunction %7 None %8\n" // -- Function begin --
|
|
"%21 = OpLabel\n"
|
|
"%22 = OpAccessChain %19 %2 %16\n" // &gl_GlobalInvocationId.x
|
|
"%23 = OpLoad %10 %22\n" // gl_GlobalInvocationId.x
|
|
"%24 = OpAccessChain %20 %6 %13 %23\n" // &in.arr[gl_GlobalInvocationId.x]
|
|
"%25 = OpLoad %9 %24\n" // in.arr[gl_GlobalInvocationId.x]
|
|
"%26 = OpAccessChain %20 %5 %13 %23\n" // &out.arr[gl_GlobalInvocationId.x]
|
|
// Start of branch logic
|
|
// %25 = in value
|
|
"%27 = OpSMod %9 %25 %15\n" // in % 2
|
|
"%28 = OpIEqual %11 %27 %13\n" // (in % 2) == 0
|
|
"OpSelectionMerge %29 None\n"
|
|
"OpBranchConditional %28 %30 %31\n"
|
|
"%30 = OpLabel\n" // (in % 2) == 0
|
|
"OpBranch %29\n"
|
|
"%31 = OpLabel\n" // (in % 2) != 0
|
|
"OpBranch %29\n"
|
|
"%29 = OpLabel\n"
|
|
"%32 = OpPhi %9 %14 %30 %15 %31\n" // (in % 2) == 0 ? 1 : 2
|
|
// End of branch logic
|
|
"OpStore %26 %32\n"
|
|
"OpReturn\n"
|
|
"OpFunctionEnd\n";
|
|
// clang-format on
|
|
|
|
test(
|
|
src.str(), [](uint32_t i) { return i; }, [](uint32_t i) { return (i % 2) == 0 ? 1 : 2; });
|
|
}
|
|
|
|
TEST_P(SwiftShaderVulkanBufferToBufferComputeTest, SwitchEmptyCases)
|
|
{
|
|
std::stringstream src;
|
|
// clang-format off
|
|
src <<
|
|
"OpCapability Shader\n"
|
|
"OpMemoryModel Logical GLSL450\n"
|
|
"OpEntryPoint GLCompute %1 \"main\" %2\n"
|
|
"OpExecutionMode %1 LocalSize " <<
|
|
GetParam().localSizeX << " " <<
|
|
GetParam().localSizeY << " " <<
|
|
GetParam().localSizeZ << "\n" <<
|
|
"OpDecorate %3 ArrayStride 4\n"
|
|
"OpMemberDecorate %4 0 Offset 0\n"
|
|
"OpDecorate %4 BufferBlock\n"
|
|
"OpDecorate %5 DescriptorSet 0\n"
|
|
"OpDecorate %5 Binding 1\n"
|
|
"OpDecorate %2 BuiltIn GlobalInvocationId\n"
|
|
"OpDecorate %6 DescriptorSet 0\n"
|
|
"OpDecorate %6 Binding 0\n"
|
|
"%7 = OpTypeVoid\n"
|
|
"%8 = OpTypeFunction %7\n" // void()
|
|
"%9 = OpTypeInt 32 1\n" // int32
|
|
"%10 = OpTypeInt 32 0\n" // uint32
|
|
"%11 = OpTypeBool\n"
|
|
"%3 = OpTypeRuntimeArray %9\n" // int32[]
|
|
"%4 = OpTypeStruct %3\n" // struct{ int32[] }
|
|
"%12 = OpTypePointer Uniform %4\n" // struct{ int32[] }*
|
|
"%5 = OpVariable %12 Uniform\n" // struct{ int32[] }* in
|
|
"%13 = OpConstant %9 0\n" // int32(0)
|
|
"%14 = OpConstant %9 2\n" // int32(2)
|
|
"%15 = OpConstant %10 0\n" // uint32(0)
|
|
"%16 = OpTypeVector %10 3\n" // vec4<int32>
|
|
"%17 = OpTypePointer Input %16\n" // vec4<int32>*
|
|
"%2 = OpVariable %17 Input\n" // gl_GlobalInvocationId
|
|
"%18 = OpTypePointer Input %10\n" // uint32*
|
|
"%6 = OpVariable %12 Uniform\n" // struct{ int32[] }* out
|
|
"%19 = OpTypePointer Uniform %9\n" // int32*
|
|
"%1 = OpFunction %7 None %8\n" // -- Function begin --
|
|
"%20 = OpLabel\n"
|
|
"%21 = OpAccessChain %18 %2 %15\n" // &gl_GlobalInvocationId.x
|
|
"%22 = OpLoad %10 %21\n" // gl_GlobalInvocationId.x
|
|
"%23 = OpAccessChain %19 %6 %13 %22\n" // &in.arr[gl_GlobalInvocationId.x]
|
|
"%24 = OpLoad %9 %23\n" // in.arr[gl_GlobalInvocationId.x]
|
|
"%25 = OpAccessChain %19 %5 %13 %22\n" // &out.arr[gl_GlobalInvocationId.x]
|
|
// Start of branch logic
|
|
// %24 = in value
|
|
"%26 = OpSMod %9 %24 %14\n" // in % 2
|
|
"OpSelectionMerge %27 None\n"
|
|
"OpSwitch %26 %27 0 %28 1 %29\n"
|
|
"%28 = OpLabel\n" // (in % 2) == 0
|
|
"OpBranch %27\n"
|
|
"%29 = OpLabel\n" // (in % 2) == 1
|
|
"OpBranch %27\n"
|
|
"%27 = OpLabel\n"
|
|
// %26 = out value
|
|
// End of branch logic
|
|
"OpStore %25 %26\n" // use SSA value from previous block
|
|
"OpReturn\n"
|
|
"OpFunctionEnd\n";
|
|
// clang-format on
|
|
|
|
test(
|
|
src.str(), [](uint32_t i) { return i; }, [](uint32_t i) { return i % 2; });
|
|
}
|
|
|
|
TEST_P(SwiftShaderVulkanBufferToBufferComputeTest, SwitchStore)
|
|
{
|
|
std::stringstream src;
|
|
// clang-format off
|
|
src <<
|
|
"OpCapability Shader\n"
|
|
"OpMemoryModel Logical GLSL450\n"
|
|
"OpEntryPoint GLCompute %1 \"main\" %2\n"
|
|
"OpExecutionMode %1 LocalSize " <<
|
|
GetParam().localSizeX << " " <<
|
|
GetParam().localSizeY << " " <<
|
|
GetParam().localSizeZ << "\n" <<
|
|
"OpDecorate %3 ArrayStride 4\n"
|
|
"OpMemberDecorate %4 0 Offset 0\n"
|
|
"OpDecorate %4 BufferBlock\n"
|
|
"OpDecorate %5 DescriptorSet 0\n"
|
|
"OpDecorate %5 Binding 1\n"
|
|
"OpDecorate %2 BuiltIn GlobalInvocationId\n"
|
|
"OpDecorate %6 DescriptorSet 0\n"
|
|
"OpDecorate %6 Binding 0\n"
|
|
"%7 = OpTypeVoid\n"
|
|
"%8 = OpTypeFunction %7\n" // void()
|
|
"%9 = OpTypeInt 32 1\n" // int32
|
|
"%10 = OpTypeInt 32 0\n" // uint32
|
|
"%11 = OpTypeBool\n"
|
|
"%3 = OpTypeRuntimeArray %9\n" // int32[]
|
|
"%4 = OpTypeStruct %3\n" // struct{ int32[] }
|
|
"%12 = OpTypePointer Uniform %4\n" // struct{ int32[] }*
|
|
"%5 = OpVariable %12 Uniform\n" // struct{ int32[] }* in
|
|
"%13 = OpConstant %9 0\n" // int32(0)
|
|
"%14 = OpConstant %9 1\n" // int32(1)
|
|
"%15 = OpConstant %9 2\n" // int32(2)
|
|
"%16 = OpConstant %10 0\n" // uint32(0)
|
|
"%17 = OpTypeVector %10 3\n" // vec4<int32>
|
|
"%18 = OpTypePointer Input %17\n" // vec4<int32>*
|
|
"%2 = OpVariable %18 Input\n" // gl_GlobalInvocationId
|
|
"%19 = OpTypePointer Input %10\n" // uint32*
|
|
"%6 = OpVariable %12 Uniform\n" // struct{ int32[] }* out
|
|
"%20 = OpTypePointer Uniform %9\n" // int32*
|
|
"%1 = OpFunction %7 None %8\n" // -- Function begin --
|
|
"%21 = OpLabel\n"
|
|
"%22 = OpAccessChain %19 %2 %16\n" // &gl_GlobalInvocationId.x
|
|
"%23 = OpLoad %10 %22\n" // gl_GlobalInvocationId.x
|
|
"%24 = OpAccessChain %20 %6 %13 %23\n" // &in.arr[gl_GlobalInvocationId.x]
|
|
"%25 = OpLoad %9 %24\n" // in.arr[gl_GlobalInvocationId.x]
|
|
"%26 = OpAccessChain %20 %5 %13 %23\n" // &out.arr[gl_GlobalInvocationId.x]
|
|
// Start of branch logic
|
|
// %25 = in value
|
|
"%27 = OpSMod %9 %25 %15\n" // in % 2
|
|
"OpSelectionMerge %28 None\n"
|
|
"OpSwitch %27 %28 0 %29 1 %30\n"
|
|
"%29 = OpLabel\n" // (in % 2) == 0
|
|
"OpStore %26 %15\n" // write 2
|
|
"OpBranch %28\n"
|
|
"%30 = OpLabel\n" // (in % 2) == 1
|
|
"OpStore %26 %14\n" // write 1
|
|
"OpBranch %28\n"
|
|
"%28 = OpLabel\n"
|
|
// End of branch logic
|
|
"OpReturn\n"
|
|
"OpFunctionEnd\n";
|
|
// clang-format on
|
|
|
|
test(
|
|
src.str(), [](uint32_t i) { return i; }, [](uint32_t i) { return (i % 2) == 0 ? 2 : 1; });
|
|
}
|
|
|
|
TEST_P(SwiftShaderVulkanBufferToBufferComputeTest, SwitchCaseReturn)
|
|
{
|
|
std::stringstream src;
|
|
// clang-format off
|
|
src <<
|
|
"OpCapability Shader\n"
|
|
"OpMemoryModel Logical GLSL450\n"
|
|
"OpEntryPoint GLCompute %1 \"main\" %2\n"
|
|
"OpExecutionMode %1 LocalSize " <<
|
|
GetParam().localSizeX << " " <<
|
|
GetParam().localSizeY << " " <<
|
|
GetParam().localSizeZ << "\n" <<
|
|
"OpDecorate %3 ArrayStride 4\n"
|
|
"OpMemberDecorate %4 0 Offset 0\n"
|
|
"OpDecorate %4 BufferBlock\n"
|
|
"OpDecorate %5 DescriptorSet 0\n"
|
|
"OpDecorate %5 Binding 1\n"
|
|
"OpDecorate %2 BuiltIn GlobalInvocationId\n"
|
|
"OpDecorate %6 DescriptorSet 0\n"
|
|
"OpDecorate %6 Binding 0\n"
|
|
"%7 = OpTypeVoid\n"
|
|
"%8 = OpTypeFunction %7\n" // void()
|
|
"%9 = OpTypeInt 32 1\n" // int32
|
|
"%10 = OpTypeInt 32 0\n" // uint32
|
|
"%11 = OpTypeBool\n"
|
|
"%3 = OpTypeRuntimeArray %9\n" // int32[]
|
|
"%4 = OpTypeStruct %3\n" // struct{ int32[] }
|
|
"%12 = OpTypePointer Uniform %4\n" // struct{ int32[] }*
|
|
"%5 = OpVariable %12 Uniform\n" // struct{ int32[] }* in
|
|
"%13 = OpConstant %9 0\n" // int32(0)
|
|
"%14 = OpConstant %9 1\n" // int32(1)
|
|
"%15 = OpConstant %9 2\n" // int32(2)
|
|
"%16 = OpConstant %10 0\n" // uint32(0)
|
|
"%17 = OpTypeVector %10 3\n" // vec4<int32>
|
|
"%18 = OpTypePointer Input %17\n" // vec4<int32>*
|
|
"%2 = OpVariable %18 Input\n" // gl_GlobalInvocationId
|
|
"%19 = OpTypePointer Input %10\n" // uint32*
|
|
"%6 = OpVariable %12 Uniform\n" // struct{ int32[] }* out
|
|
"%20 = OpTypePointer Uniform %9\n" // int32*
|
|
"%1 = OpFunction %7 None %8\n" // -- Function begin --
|
|
"%21 = OpLabel\n"
|
|
"%22 = OpAccessChain %19 %2 %16\n" // &gl_GlobalInvocationId.x
|
|
"%23 = OpLoad %10 %22\n" // gl_GlobalInvocationId.x
|
|
"%24 = OpAccessChain %20 %6 %13 %23\n" // &in.arr[gl_GlobalInvocationId.x]
|
|
"%25 = OpLoad %9 %24\n" // in.arr[gl_GlobalInvocationId.x]
|
|
"%26 = OpAccessChain %20 %5 %13 %23\n" // &out.arr[gl_GlobalInvocationId.x]
|
|
// Start of branch logic
|
|
// %25 = in value
|
|
"%27 = OpSMod %9 %25 %15\n" // in % 2
|
|
"OpSelectionMerge %28 None\n"
|
|
"OpSwitch %27 %28 0 %29 1 %30\n"
|
|
"%29 = OpLabel\n" // (in % 2) == 0
|
|
"OpBranch %28\n"
|
|
"%30 = OpLabel\n" // (in % 2) == 1
|
|
"OpReturn\n"
|
|
"%28 = OpLabel\n"
|
|
"OpStore %26 %14\n" // write 1
|
|
// End of branch logic
|
|
"OpReturn\n"
|
|
"OpFunctionEnd\n";
|
|
// clang-format on
|
|
|
|
test(
|
|
src.str(), [](uint32_t i) { return i; }, [](uint32_t i) { return (i % 2) == 1 ? 0 : 1; });
|
|
}
|
|
|
|
TEST_P(SwiftShaderVulkanBufferToBufferComputeTest, SwitchDefaultReturn)
|
|
{
|
|
std::stringstream src;
|
|
// clang-format off
|
|
src <<
|
|
"OpCapability Shader\n"
|
|
"OpMemoryModel Logical GLSL450\n"
|
|
"OpEntryPoint GLCompute %1 \"main\" %2\n"
|
|
"OpExecutionMode %1 LocalSize " <<
|
|
GetParam().localSizeX << " " <<
|
|
GetParam().localSizeY << " " <<
|
|
GetParam().localSizeZ << "\n" <<
|
|
"OpDecorate %3 ArrayStride 4\n"
|
|
"OpMemberDecorate %4 0 Offset 0\n"
|
|
"OpDecorate %4 BufferBlock\n"
|
|
"OpDecorate %5 DescriptorSet 0\n"
|
|
"OpDecorate %5 Binding 1\n"
|
|
"OpDecorate %2 BuiltIn GlobalInvocationId\n"
|
|
"OpDecorate %6 DescriptorSet 0\n"
|
|
"OpDecorate %6 Binding 0\n"
|
|
"%7 = OpTypeVoid\n"
|
|
"%8 = OpTypeFunction %7\n" // void()
|
|
"%9 = OpTypeInt 32 1\n" // int32
|
|
"%10 = OpTypeInt 32 0\n" // uint32
|
|
"%11 = OpTypeBool\n"
|
|
"%3 = OpTypeRuntimeArray %9\n" // int32[]
|
|
"%4 = OpTypeStruct %3\n" // struct{ int32[] }
|
|
"%12 = OpTypePointer Uniform %4\n" // struct{ int32[] }*
|
|
"%5 = OpVariable %12 Uniform\n" // struct{ int32[] }* in
|
|
"%13 = OpConstant %9 0\n" // int32(0)
|
|
"%14 = OpConstant %9 1\n" // int32(1)
|
|
"%15 = OpConstant %9 2\n" // int32(2)
|
|
"%16 = OpConstant %10 0\n" // uint32(0)
|
|
"%17 = OpTypeVector %10 3\n" // vec4<int32>
|
|
"%18 = OpTypePointer Input %17\n" // vec4<int32>*
|
|
"%2 = OpVariable %18 Input\n" // gl_GlobalInvocationId
|
|
"%19 = OpTypePointer Input %10\n" // uint32*
|
|
"%6 = OpVariable %12 Uniform\n" // struct{ int32[] }* out
|
|
"%20 = OpTypePointer Uniform %9\n" // int32*
|
|
"%1 = OpFunction %7 None %8\n" // -- Function begin --
|
|
"%21 = OpLabel\n"
|
|
"%22 = OpAccessChain %19 %2 %16\n" // &gl_GlobalInvocationId.x
|
|
"%23 = OpLoad %10 %22\n" // gl_GlobalInvocationId.x
|
|
"%24 = OpAccessChain %20 %6 %13 %23\n" // &in.arr[gl_GlobalInvocationId.x]
|
|
"%25 = OpLoad %9 %24\n" // in.arr[gl_GlobalInvocationId.x]
|
|
"%26 = OpAccessChain %20 %5 %13 %23\n" // &out.arr[gl_GlobalInvocationId.x]
|
|
// Start of branch logic
|
|
// %25 = in value
|
|
"%27 = OpSMod %9 %25 %15\n" // in % 2
|
|
"OpSelectionMerge %28 None\n"
|
|
"OpSwitch %27 %29 1 %30\n"
|
|
"%30 = OpLabel\n" // (in % 2) == 1
|
|
"OpBranch %28\n"
|
|
"%29 = OpLabel\n" // (in % 2) != 1
|
|
"OpReturn\n"
|
|
"%28 = OpLabel\n" // merge
|
|
"OpStore %26 %14\n" // write 1
|
|
// End of branch logic
|
|
"OpReturn\n"
|
|
"OpFunctionEnd\n";
|
|
// clang-format on
|
|
|
|
test(
|
|
src.str(), [](uint32_t i) { return i; }, [](uint32_t i) { return (i % 2) == 1 ? 1 : 0; });
|
|
}
|
|
|
|
TEST_P(SwiftShaderVulkanBufferToBufferComputeTest, SwitchCaseFallthrough)
|
|
{
|
|
std::stringstream src;
|
|
// clang-format off
|
|
src <<
|
|
"OpCapability Shader\n"
|
|
"OpMemoryModel Logical GLSL450\n"
|
|
"OpEntryPoint GLCompute %1 \"main\" %2\n"
|
|
"OpExecutionMode %1 LocalSize " <<
|
|
GetParam().localSizeX << " " <<
|
|
GetParam().localSizeY << " " <<
|
|
GetParam().localSizeZ << "\n" <<
|
|
"OpDecorate %3 ArrayStride 4\n"
|
|
"OpMemberDecorate %4 0 Offset 0\n"
|
|
"OpDecorate %4 BufferBlock\n"
|
|
"OpDecorate %5 DescriptorSet 0\n"
|
|
"OpDecorate %5 Binding 1\n"
|
|
"OpDecorate %2 BuiltIn GlobalInvocationId\n"
|
|
"OpDecorate %6 DescriptorSet 0\n"
|
|
"OpDecorate %6 Binding 0\n"
|
|
"%7 = OpTypeVoid\n"
|
|
"%8 = OpTypeFunction %7\n" // void()
|
|
"%9 = OpTypeInt 32 1\n" // int32
|
|
"%10 = OpTypeInt 32 0\n" // uint32
|
|
"%11 = OpTypeBool\n"
|
|
"%3 = OpTypeRuntimeArray %9\n" // int32[]
|
|
"%4 = OpTypeStruct %3\n" // struct{ int32[] }
|
|
"%12 = OpTypePointer Uniform %4\n" // struct{ int32[] }*
|
|
"%5 = OpVariable %12 Uniform\n" // struct{ int32[] }* in
|
|
"%13 = OpConstant %9 0\n" // int32(0)
|
|
"%14 = OpConstant %9 1\n" // int32(1)
|
|
"%15 = OpConstant %9 2\n" // int32(2)
|
|
"%16 = OpConstant %10 0\n" // uint32(0)
|
|
"%17 = OpTypeVector %10 3\n" // vec4<int32>
|
|
"%18 = OpTypePointer Input %17\n" // vec4<int32>*
|
|
"%2 = OpVariable %18 Input\n" // gl_GlobalInvocationId
|
|
"%19 = OpTypePointer Input %10\n" // uint32*
|
|
"%6 = OpVariable %12 Uniform\n" // struct{ int32[] }* out
|
|
"%20 = OpTypePointer Uniform %9\n" // int32*
|
|
"%1 = OpFunction %7 None %8\n" // -- Function begin --
|
|
"%21 = OpLabel\n"
|
|
"%22 = OpAccessChain %19 %2 %16\n" // &gl_GlobalInvocationId.x
|
|
"%23 = OpLoad %10 %22\n" // gl_GlobalInvocationId.x
|
|
"%24 = OpAccessChain %20 %6 %13 %23\n" // &in.arr[gl_GlobalInvocationId.x]
|
|
"%25 = OpLoad %9 %24\n" // in.arr[gl_GlobalInvocationId.x]
|
|
"%26 = OpAccessChain %20 %5 %13 %23\n" // &out.arr[gl_GlobalInvocationId.x]
|
|
// Start of branch logic
|
|
// %25 = in value
|
|
"%27 = OpSMod %9 %25 %15\n" // in % 2
|
|
"OpSelectionMerge %28 None\n"
|
|
"OpSwitch %27 %29 0 %30 1 %31\n"
|
|
"%30 = OpLabel\n" // (in % 2) == 0
|
|
"%32 = OpIAdd %9 %27 %14\n" // generate an intermediate
|
|
"OpStore %26 %32\n" // write a value (overwritten later)
|
|
"OpBranch %31\n" // fallthrough
|
|
"%31 = OpLabel\n" // (in % 2) == 1
|
|
"OpStore %26 %15\n" // write 2
|
|
"OpBranch %28\n"
|
|
"%29 = OpLabel\n" // unreachable
|
|
"OpUnreachable\n"
|
|
"%28 = OpLabel\n" // merge
|
|
// End of branch logic
|
|
"OpReturn\n"
|
|
"OpFunctionEnd\n";
|
|
// clang-format on
|
|
|
|
test(
|
|
src.str(), [](uint32_t i) { return i; }, [](uint32_t i) { return 2; });
|
|
}
|
|
|
|
TEST_P(SwiftShaderVulkanBufferToBufferComputeTest, SwitchDefaultFallthrough)
|
|
{
|
|
std::stringstream src;
|
|
// clang-format off
|
|
src <<
|
|
"OpCapability Shader\n"
|
|
"OpMemoryModel Logical GLSL450\n"
|
|
"OpEntryPoint GLCompute %1 \"main\" %2\n"
|
|
"OpExecutionMode %1 LocalSize " <<
|
|
GetParam().localSizeX << " " <<
|
|
GetParam().localSizeY << " " <<
|
|
GetParam().localSizeZ << "\n" <<
|
|
"OpDecorate %3 ArrayStride 4\n"
|
|
"OpMemberDecorate %4 0 Offset 0\n"
|
|
"OpDecorate %4 BufferBlock\n"
|
|
"OpDecorate %5 DescriptorSet 0\n"
|
|
"OpDecorate %5 Binding 1\n"
|
|
"OpDecorate %2 BuiltIn GlobalInvocationId\n"
|
|
"OpDecorate %6 DescriptorSet 0\n"
|
|
"OpDecorate %6 Binding 0\n"
|
|
"%7 = OpTypeVoid\n"
|
|
"%8 = OpTypeFunction %7\n" // void()
|
|
"%9 = OpTypeInt 32 1\n" // int32
|
|
"%10 = OpTypeInt 32 0\n" // uint32
|
|
"%11 = OpTypeBool\n"
|
|
"%3 = OpTypeRuntimeArray %9\n" // int32[]
|
|
"%4 = OpTypeStruct %3\n" // struct{ int32[] }
|
|
"%12 = OpTypePointer Uniform %4\n" // struct{ int32[] }*
|
|
"%5 = OpVariable %12 Uniform\n" // struct{ int32[] }* in
|
|
"%13 = OpConstant %9 0\n" // int32(0)
|
|
"%14 = OpConstant %9 1\n" // int32(1)
|
|
"%15 = OpConstant %9 2\n" // int32(2)
|
|
"%16 = OpConstant %10 0\n" // uint32(0)
|
|
"%17 = OpTypeVector %10 3\n" // vec4<int32>
|
|
"%18 = OpTypePointer Input %17\n" // vec4<int32>*
|
|
"%2 = OpVariable %18 Input\n" // gl_GlobalInvocationId
|
|
"%19 = OpTypePointer Input %10\n" // uint32*
|
|
"%6 = OpVariable %12 Uniform\n" // struct{ int32[] }* out
|
|
"%20 = OpTypePointer Uniform %9\n" // int32*
|
|
"%1 = OpFunction %7 None %8\n" // -- Function begin --
|
|
"%21 = OpLabel\n"
|
|
"%22 = OpAccessChain %19 %2 %16\n" // &gl_GlobalInvocationId.x
|
|
"%23 = OpLoad %10 %22\n" // gl_GlobalInvocationId.x
|
|
"%24 = OpAccessChain %20 %6 %13 %23\n" // &in.arr[gl_GlobalInvocationId.x]
|
|
"%25 = OpLoad %9 %24\n" // in.arr[gl_GlobalInvocationId.x]
|
|
"%26 = OpAccessChain %20 %5 %13 %23\n" // &out.arr[gl_GlobalInvocationId.x]
|
|
// Start of branch logic
|
|
// %25 = in value
|
|
"%27 = OpSMod %9 %25 %15\n" // in % 2
|
|
"OpSelectionMerge %28 None\n"
|
|
"OpSwitch %27 %29 0 %30 1 %31\n"
|
|
"%30 = OpLabel\n" // (in % 2) == 0
|
|
"%32 = OpIAdd %9 %27 %14\n" // generate an intermediate
|
|
"OpStore %26 %32\n" // write a value (overwritten later)
|
|
"OpBranch %29\n" // fallthrough
|
|
"%29 = OpLabel\n" // default
|
|
"%33 = OpIAdd %9 %27 %14\n" // generate an intermediate
|
|
"OpStore %26 %33\n" // write a value (overwritten later)
|
|
"OpBranch %31\n" // fallthrough
|
|
"%31 = OpLabel\n" // (in % 2) == 1
|
|
"OpStore %26 %15\n" // write 2
|
|
"OpBranch %28\n"
|
|
"%28 = OpLabel\n" // merge
|
|
// End of branch logic
|
|
"OpReturn\n"
|
|
"OpFunctionEnd\n";
|
|
// clang-format on
|
|
|
|
test(
|
|
src.str(), [](uint32_t i) { return i; }, [](uint32_t i) { return 2; });
|
|
}
|
|
|
|
TEST_P(SwiftShaderVulkanBufferToBufferComputeTest, SwitchPhi)
|
|
{
|
|
std::stringstream src;
|
|
// clang-format off
|
|
src <<
|
|
"OpCapability Shader\n"
|
|
"OpMemoryModel Logical GLSL450\n"
|
|
"OpEntryPoint GLCompute %1 \"main\" %2\n"
|
|
"OpExecutionMode %1 LocalSize " <<
|
|
GetParam().localSizeX << " " <<
|
|
GetParam().localSizeY << " " <<
|
|
GetParam().localSizeZ << "\n" <<
|
|
"OpDecorate %3 ArrayStride 4\n"
|
|
"OpMemberDecorate %4 0 Offset 0\n"
|
|
"OpDecorate %4 BufferBlock\n"
|
|
"OpDecorate %5 DescriptorSet 0\n"
|
|
"OpDecorate %5 Binding 1\n"
|
|
"OpDecorate %2 BuiltIn GlobalInvocationId\n"
|
|
"OpDecorate %6 DescriptorSet 0\n"
|
|
"OpDecorate %6 Binding 0\n"
|
|
"%7 = OpTypeVoid\n"
|
|
"%8 = OpTypeFunction %7\n" // void()
|
|
"%9 = OpTypeInt 32 1\n" // int32
|
|
"%10 = OpTypeInt 32 0\n" // uint32
|
|
"%11 = OpTypeBool\n"
|
|
"%3 = OpTypeRuntimeArray %9\n" // int32[]
|
|
"%4 = OpTypeStruct %3\n" // struct{ int32[] }
|
|
"%12 = OpTypePointer Uniform %4\n" // struct{ int32[] }*
|
|
"%5 = OpVariable %12 Uniform\n" // struct{ int32[] }* in
|
|
"%13 = OpConstant %9 0\n" // int32(0)
|
|
"%14 = OpConstant %9 1\n" // int32(1)
|
|
"%15 = OpConstant %9 2\n" // int32(2)
|
|
"%16 = OpConstant %10 0\n" // uint32(0)
|
|
"%17 = OpTypeVector %10 3\n" // vec4<int32>
|
|
"%18 = OpTypePointer Input %17\n" // vec4<int32>*
|
|
"%2 = OpVariable %18 Input\n" // gl_GlobalInvocationId
|
|
"%19 = OpTypePointer Input %10\n" // uint32*
|
|
"%6 = OpVariable %12 Uniform\n" // struct{ int32[] }* out
|
|
"%20 = OpTypePointer Uniform %9\n" // int32*
|
|
"%1 = OpFunction %7 None %8\n" // -- Function begin --
|
|
"%21 = OpLabel\n"
|
|
"%22 = OpAccessChain %19 %2 %16\n" // &gl_GlobalInvocationId.x
|
|
"%23 = OpLoad %10 %22\n" // gl_GlobalInvocationId.x
|
|
"%24 = OpAccessChain %20 %6 %13 %23\n" // &in.arr[gl_GlobalInvocationId.x]
|
|
"%25 = OpLoad %9 %24\n" // in.arr[gl_GlobalInvocationId.x]
|
|
"%26 = OpAccessChain %20 %5 %13 %23\n" // &out.arr[gl_GlobalInvocationId.x]
|
|
// Start of branch logic
|
|
// %25 = in value
|
|
"%27 = OpSMod %9 %25 %15\n" // in % 2
|
|
"OpSelectionMerge %28 None\n"
|
|
"OpSwitch %27 %29 1 %30\n"
|
|
"%30 = OpLabel\n" // (in % 2) == 1
|
|
"OpBranch %28\n"
|
|
"%29 = OpLabel\n" // (in % 2) != 1
|
|
"OpBranch %28\n"
|
|
"%28 = OpLabel\n" // merge
|
|
"%31 = OpPhi %9 %14 %30 %15 %29\n" // (in % 2) == 1 ? 1 : 2
|
|
"OpStore %26 %31\n"
|
|
// End of branch logic
|
|
"OpReturn\n"
|
|
"OpFunctionEnd\n";
|
|
// clang-format on
|
|
|
|
test(
|
|
src.str(), [](uint32_t i) { return i; }, [](uint32_t i) { return (i % 2) == 1 ? 1 : 2; });
|
|
}
|
|
|
|
TEST_P(SwiftShaderVulkanBufferToBufferComputeTest, LoopDivergentMergePhi)
|
|
{
|
|
// #version 450
|
|
// layout(local_size_x = 1, local_size_y = 1, local_size_z = 1) in;
|
|
// layout(binding = 0, std430) buffer InBuffer
|
|
// {
|
|
// int Data[];
|
|
// } In;
|
|
// layout(binding = 1, std430) buffer OutBuffer
|
|
// {
|
|
// int Data[];
|
|
// } Out;
|
|
// void main()
|
|
// {
|
|
// int phi = 0;
|
|
// uint lane = gl_GlobalInvocationID.x % 4;
|
|
// for (uint i = 0; i < 4; i++)
|
|
// {
|
|
// if (lane == i)
|
|
// {
|
|
// phi = In.Data[gl_GlobalInvocationID.x];
|
|
// break;
|
|
// }
|
|
// }
|
|
// Out.Data[gl_GlobalInvocationID.x] = phi;
|
|
// }
|
|
std::stringstream src;
|
|
// clang-format off
|
|
src <<
|
|
"OpCapability Shader\n"
|
|
"%1 = OpExtInstImport \"GLSL.std.450\"\n"
|
|
"OpMemoryModel Logical GLSL450\n"
|
|
"OpEntryPoint GLCompute %2 \"main\" %3\n"
|
|
"OpExecutionMode %2 LocalSize " <<
|
|
GetParam().localSizeX << " " <<
|
|
GetParam().localSizeY << " " <<
|
|
GetParam().localSizeZ << "\n" <<
|
|
"OpDecorate %3 BuiltIn GlobalInvocationId\n"
|
|
"OpDecorate %4 ArrayStride 4\n"
|
|
"OpMemberDecorate %5 0 Offset 0\n"
|
|
"OpDecorate %5 BufferBlock\n"
|
|
"OpDecorate %6 DescriptorSet 0\n"
|
|
"OpDecorate %6 Binding 0\n"
|
|
"OpDecorate %7 ArrayStride 4\n"
|
|
"OpMemberDecorate %8 0 Offset 0\n"
|
|
"OpDecorate %8 BufferBlock\n"
|
|
"OpDecorate %9 DescriptorSet 0\n"
|
|
"OpDecorate %9 Binding 1\n"
|
|
"%10 = OpTypeVoid\n"
|
|
"%11 = OpTypeFunction %10\n"
|
|
"%12 = OpTypeInt 32 1\n"
|
|
"%13 = OpConstant %12 0\n"
|
|
"%14 = OpTypeInt 32 0\n"
|
|
"%15 = OpTypeVector %14 3\n"
|
|
"%16 = OpTypePointer Input %15\n"
|
|
"%3 = OpVariable %16 Input\n"
|
|
"%17 = OpConstant %14 0\n"
|
|
"%18 = OpTypePointer Input %14\n"
|
|
"%19 = OpConstant %14 4\n"
|
|
"%20 = OpTypeBool\n"
|
|
"%4 = OpTypeRuntimeArray %12\n"
|
|
"%5 = OpTypeStruct %4\n"
|
|
"%21 = OpTypePointer Uniform %5\n"
|
|
"%6 = OpVariable %21 Uniform\n"
|
|
"%22 = OpTypePointer Uniform %12\n"
|
|
"%23 = OpConstant %12 1\n"
|
|
"%7 = OpTypeRuntimeArray %12\n"
|
|
"%8 = OpTypeStruct %7\n"
|
|
"%24 = OpTypePointer Uniform %8\n"
|
|
"%9 = OpVariable %24 Uniform\n"
|
|
"%2 = OpFunction %10 None %11\n"
|
|
"%25 = OpLabel\n"
|
|
"%26 = OpAccessChain %18 %3 %17\n"
|
|
"%27 = OpLoad %14 %26\n"
|
|
"%28 = OpUMod %14 %27 %19\n"
|
|
"OpBranch %29\n"
|
|
"%29 = OpLabel\n"
|
|
"%30 = OpPhi %14 %17 %25 %31 %32\n"
|
|
"%33 = OpULessThan %20 %30 %19\n"
|
|
"OpLoopMerge %34 %32 None\n"
|
|
"OpBranchConditional %33 %35 %34\n"
|
|
"%35 = OpLabel\n"
|
|
"%36 = OpIEqual %20 %28 %30\n"
|
|
"OpSelectionMerge %37 None\n"
|
|
"OpBranchConditional %36 %38 %37\n"
|
|
"%38 = OpLabel\n"
|
|
"%39 = OpAccessChain %22 %6 %13 %27\n"
|
|
"%40 = OpLoad %12 %39\n"
|
|
"OpBranch %34\n"
|
|
"%37 = OpLabel\n"
|
|
"OpBranch %32\n"
|
|
"%32 = OpLabel\n"
|
|
"%31 = OpIAdd %14 %30 %23\n"
|
|
"OpBranch %29\n"
|
|
"%34 = OpLabel\n"
|
|
"%41 = OpPhi %12 %13 %29 %40 %38\n" // %40: phi
|
|
"%42 = OpAccessChain %22 %9 %13 %27\n"
|
|
"OpStore %42 %41\n"
|
|
"OpReturn\n"
|
|
"OpFunctionEnd\n";
|
|
// clang-format on
|
|
|
|
test(
|
|
src.str(), [](uint32_t i) { return i; }, [](uint32_t i) { return i; });
|
|
}
|