Add more SPIR-V assembly tests based on compute shader.

author Lei Zhang <antiagainst@google.com>

Fri, 20 Nov 2015 15:44:30 +0000 (10:44 -0500)

committer Lei Zhang <antiagainst@google.com>

Tue, 15 Dec 2015 16:46:27 +0000 (11:46 -0500)
author Lei Zhang <antiagainst@google.com>
Fri, 20 Nov 2015 15:44:30 +0000 (10:44 -0500)
committer Lei Zhang <antiagainst@google.com>
Tue, 15 Dec 2015 16:46:27 +0000 (11:46 -0500)
diff --git a/external/vulkancts/modules/vulkan/spirv_assembly/vktSpvAsmComputeShaderCase.cpp b/external/vulkancts/modules/vulkan/spirv_assembly/vktSpvAsmComputeShaderCase.cpp

index 23872a5..d848695 100644 (file)
--- a/external/vulkancts/modules/vulkan/spirv_assembly/vktSpvAsmComputeShaderCase.cpp
+++ b/external/vulkancts/modules/vulkan/spirv_assembly/vktSpvAsmComputeShaderCase.cpp
@@ -91,11 +91,11 @@ void setMemory (const DeviceInterface& vkdi, const VkDevice& device, Allocation*
         flushMappedMemoryRange(vkdi, device, destAlloc->getMemory(), destAlloc->getOffset(), numBytes);
  }
  
-void clearMemory (const DeviceInterface& vkdi, const VkDevice& device, Allocation* destAlloc, size_t numBytes)
+void fillMemoryWithValue (const DeviceInterface& vkdi, const VkDevice& device, Allocation* destAlloc, size_t numBytes, deUint8 value)
  {
         void* const hostPtr = destAlloc->getHostPtr();
  
-       deMemset((deUint8*)hostPtr, 0, numBytes);
+       deMemset((deUint8*)hostPtr, value, numBytes);
         flushMappedMemoryRange(vkdi, device, destAlloc->getMemory(), destAlloc->getOffset(), numBytes);
  }
  
@@ -177,17 +177,38 @@ Move<VkDescriptorSet> createDescriptorSet (const DeviceInterface& vkdi, const Vk
  /*--------------------------------------------------------------------*//*!
   * \brief Create a compute pipeline based on the given shader
   *//*--------------------------------------------------------------------*/
-Move<VkPipeline> createComputePipeline (const DeviceInterface& vkdi, const VkDevice& device, VkPipelineLayout pipelineLayout, VkShaderModule shader)
+Move<VkPipeline> createComputePipeline (const DeviceInterface& vkdi, const VkDevice& device, VkPipelineLayout pipelineLayout, VkShaderModule shader, const char* entryPoint, const vector<deUint32>& specConstants)
  {
+       const deUint32                                                  numSpecConstants                                = (deUint32)specConstants.size();
+       vector<VkSpecializationMapEntry>                entries;
+       VkSpecializationInfo                                    specInfo;
+
+       if (numSpecConstants != 0)
+       {
+               entries.reserve(numSpecConstants);
+
+               for (deUint32 ndx = 0; ndx < numSpecConstants; ++ndx)
+               {
+                       entries[ndx].constantID = ndx;
+                       entries[ndx].offset             = ndx * (deUint32)sizeof(deUint32);
+                       entries[ndx].size               = sizeof(deUint32);
+               }
+
+               specInfo.mapEntryCount          = numSpecConstants;
+               specInfo.pMapEntries            = &entries[0];
+               specInfo.dataSize                       = numSpecConstants * sizeof(deUint32);
+               specInfo.pData                          = specConstants.data();
+       }
+
         const VkPipelineShaderStageCreateInfo   pipelineShaderStageCreateInfo   =
         {
                 VK_STRUCTURE_TYPE_PIPELINE_SHADER_STAGE_CREATE_INFO,    // sType
                 DE_NULL,                                                                                                // pNext
-               (VkPipelineShaderStageCreateFlags)0,
+               (VkPipelineShaderStageCreateFlags)0,                                    // flags
                 VK_SHADER_STAGE_COMPUTE_BIT,                                                    // stage
-               shader,                                                                                                 // shader
-               "main",
-               DE_NULL,                                                                                                // pSpecializationInfo
+               shader,                                                                                                 // module
+               entryPoint,                                                                                             // pName
+               (numSpecConstants == 0) ? DE_NULL : &specInfo,                  // pSpecializationInfo
         };
         const VkComputePipelineCreateInfo               pipelineCreateInfo                              =
         {
@@ -313,7 +334,7 @@ tcu::TestStatus SpvAsmComputeShaderInstance::iterate (void)
                 const size_t            numBytes        = output->getNumBytes();
                 BufferHandleUp*         buffer          = new BufferHandleUp(createBufferAndBindMemory(vkdi, device, allocator, numBytes, &alloc));
  
-               clearMemory(vkdi, device, &*alloc, numBytes);
+               fillMemoryWithValue(vkdi, device, &*alloc, numBytes, 0xff);
                 descriptorInfos.push_back(vk::makeDescriptorBufferInfo(**buffer, 0u, numBytes));
                 outputBuffers.push_back(BufferHandleSp(buffer));
                 outputAllocs.push_back(de::SharedPtr<Allocation>(alloc.release()));
@@ -331,7 +352,7 @@ tcu::TestStatus SpvAsmComputeShaderInstance::iterate (void)
         const ProgramBinary&                            binary                          = m_context.getBinaryCollection().get("compute");
         Unique<VkShaderModule>                          module                          (createShaderModule(vkdi, device, binary, (VkShaderModuleCreateFlags)0u));
  
-       Unique<VkPipeline>                                      computePipeline         (createComputePipeline(vkdi, device, *pipelineLayout, *module));
+       Unique<VkPipeline>                                      computePipeline         (createComputePipeline(vkdi, device, *pipelineLayout, *module, m_shaderSpec.entryPoint.c_str(), m_shaderSpec.specConstants));
  
         // Create command buffer and record commands
  
diff --git a/external/vulkancts/modules/vulkan/spirv_assembly/vktSpvAsmComputeShaderTestUtil.hpp b/external/vulkancts/modules/vulkan/spirv_assembly/vktSpvAsmComputeShaderTestUtil.hpp

index fbfa5c0..01af95d 100644 (file)
--- a/external/vulkancts/modules/vulkan/spirv_assembly/vktSpvAsmComputeShaderTestUtil.hpp
+++ b/external/vulkancts/modules/vulkan/spirv_assembly/vktSpvAsmComputeShaderTestUtil.hpp
@@ -78,7 +78,11 @@ private:
         std::vector<E>          m_elements;
  };
  
-typedef Buffer<float>  Float32Buffer;
+DE_STATIC_ASSERT(sizeof(tcu::Vec4) == 4 * sizeof(float));
+
+typedef Buffer<float>          Float32Buffer;
+typedef Buffer<deInt32>                Int32Buffer;
+typedef Buffer<tcu::Vec4>      Vec4Buffer;
  
  
  /*--------------------------------------------------------------------*//*!
@@ -90,9 +94,11 @@ typedef Buffer<float>        Float32Buffer;
  struct ComputeShaderSpec
  {
         std::string                             assembly;
+       std::string                             entryPoint;
         std::vector<BufferSp>   inputs;
         std::vector<BufferSp>   outputs;
         tcu::IVec3                              numWorkGroups;
+       std::vector<deUint32>   specConstants;
  };
  
  } // SpirVAssembly
diff --git a/external/vulkancts/modules/vulkan/spirv_assembly/vktSpvAsmInstructionTests.cpp b/external/vulkancts/modules/vulkan/spirv_assembly/vktSpvAsmInstructionTests.cpp

index 56f74cf..20a28fa 100644 (file)
--- a/external/vulkancts/modules/vulkan/spirv_assembly/vktSpvAsmInstructionTests.cpp
+++ b/external/vulkancts/modules/vulkan/spirv_assembly/vktSpvAsmInstructionTests.cpp
@@ -57,6 +57,8 @@
  #include "deUniquePtr.hpp"
  #include "tcuStringTemplate.hpp"
  
+#include <cmath>
+
  #include "vktSpvAsmComputeShaderCase.hpp"
  #include "vktSpvAsmComputeShaderTestUtil.hpp"
  #include "vktTestCaseUtil.hpp"
@@ -85,6 +87,7 @@ using tcu::TestStatus;
  using tcu::Vec4;
  using de::UniquePtr;
  using tcu::StringTemplate;
+using tcu::Vec4;
  
  typedef Unique<VkShaderModule>                 ModuleHandleUp;
  typedef de::SharedPtr<ModuleHandleUp>  ModuleHandleSp;
@@ -92,7 +95,6 @@ typedef de::SharedPtr<ModuleHandleUp> ModuleHandleSp;
  template<typename T>   T                       randomScalar    (de::Random& rnd, T minValue, T maxValue);
  template<> inline              float           randomScalar    (de::Random& rnd, float minValue, float maxValue)               { return rnd.getFloat(minValue, maxValue);      }
  template<> inline              deInt32         randomScalar    (de::Random& rnd, deInt32 minValue, deInt32 maxValue)   { return rnd.getInt(minValue, maxValue);        }
-template<> inline              deUint32        randomScalar    (de::Random& rnd, deUint32 minValue, deUint32 maxValue) { return minValue + rnd.getUint32() % (maxValue - minValue + 1); }
  
  template<typename T>
  static void fillRandomScalars (de::Random& rnd, T minValue, T maxValue, void* dst, int numValues, int offset = 0)
@@ -102,6 +104,14 @@ static void fillRandomScalars (de::Random& rnd, T minValue, T maxValue, void* ds
                 typedPtr[offset + ndx] = randomScalar<T>(rnd, minValue, maxValue);
  }
  
+struct CaseParameter
+{
+       const char*             name;
+       string                  param;
+
+       CaseParameter   (const char* case_, const string& param_) : name(case_), param(param_) {}
+};
+
  // Assembly code used for testing OpNop, OpConstant{Null|Composite}, Op[No]Line, OpSource[Continued], OpSourceExtension, OpUndef is based on GLSL source code:
  //
  // #version 430
@@ -207,6 +217,7 @@ tcu::TestCaseGroup* createOpNopGroup (tcu::TestContext& testCtx)
         spec.inputs.push_back(BufferSp(new Float32Buffer(positiveFloats)));
         spec.outputs.push_back(BufferSp(new Float32Buffer(negativeFloats)));
         spec.numWorkGroups = IVec3(numElements, 1, 1);
+       spec.entryPoint = "main";
  
         group->addChild(new SpvAsmComputeShaderCase(testCtx, "all", "OpNop appearing at different places", spec));
  
@@ -271,6 +282,7 @@ tcu::TestCaseGroup* createOpLineGroup (tcu::TestContext& testCtx)
         spec.inputs.push_back(BufferSp(new Float32Buffer(positiveFloats)));
         spec.outputs.push_back(BufferSp(new Float32Buffer(negativeFloats)));
         spec.numWorkGroups = IVec3(numElements, 1, 1);
+       spec.entryPoint = "main";
  
         group->addChild(new SpvAsmComputeShaderCase(testCtx, "all", "OpLine appearing at different places", spec));
  
@@ -337,12 +349,399 @@ tcu::TestCaseGroup* createOpNoLineGroup (tcu::TestContext& testCtx)
         spec.inputs.push_back(BufferSp(new Float32Buffer(positiveFloats)));
         spec.outputs.push_back(BufferSp(new Float32Buffer(negativeFloats)));
         spec.numWorkGroups = IVec3(numElements, 1, 1);
+       spec.entryPoint = "main";
  
         group->addChild(new SpvAsmComputeShaderCase(testCtx, "all", "OpNoLine appearing at different places", spec));
  
         return group.release();
  }
  
+tcu::TestCaseGroup* createNoContractionGroup (tcu::TestContext& testCtx)
+{
+       de::MovePtr<tcu::TestCaseGroup> group                   (new tcu::TestCaseGroup(testCtx, "nocontraction", "Test the NoContraction decoration"));
+       vector<CaseParameter>                   cases;
+       de::Random                                              rnd                             (deStringHash(group->getName()));
+       const int                                               numElements             = 100;
+       vector<float>                                   inputFloats1    (numElements, 0);
+       vector<float>                                   inputFloats2    (numElements, 0);
+       vector<float>                                   outputFloats    (numElements, 0);
+       const StringTemplate                    shaderTemplate  (
+               string(s_ShaderPreamble) +
+
+               "OpName %main           \"main\"\n"
+               "OpName %id             \"gl_GlobalInvocationID\"\n"
+
+               "OpDecorate %id BuiltIn GlobalInvocationId\n"
+
+               "${DECORATION}\n"
+
+               "OpDecorate %inbuf1 BufferBlock\n"
+               "OpDecorate %indata1 DescriptorSet 0\n"
+               "OpDecorate %indata1 Binding 0\n"
+               "OpDecorate %inbuf2 BufferBlock\n"
+               "OpDecorate %indata2 DescriptorSet 0\n"
+               "OpDecorate %indata2 Binding 1\n"
+               "OpDecorate %outbuf BufferBlock\n"
+               "OpDecorate %outdata DescriptorSet 0\n"
+               "OpDecorate %outdata Binding 2\n"
+               "OpDecorate %f32arr ArrayStride 4\n"
+               "OpMemberDecorate %inbuf1 0 Offset 0\n"
+               "OpMemberDecorate %inbuf2 0 Offset 0\n"
+               "OpMemberDecorate %outbuf 0 Offset 0\n"
+
+               + string(s_CommonTypes) +
+
+               "%inbuf1     = OpTypeStruct %f32arr\n"
+               "%inbufptr1  = OpTypePointer Uniform %inbuf1\n"
+               "%indata1    = OpVariable %inbufptr1 Uniform\n"
+               "%inbuf2     = OpTypeStruct %f32arr\n"
+               "%inbufptr2  = OpTypePointer Uniform %inbuf2\n"
+               "%indata2    = OpVariable %inbufptr2 Uniform\n"
+               "%outbuf     = OpTypeStruct %f32arr\n"
+               "%outbufptr  = OpTypePointer Uniform %outbuf\n"
+               "%outdata    = OpVariable %outbufptr Uniform\n"
+
+               "%id         = OpVariable %uvec3ptr Input\n"
+               "%zero       = OpConstant %i32 0\n"
+               "%c_f_m1     = OpConstant %f32 -1.\n"
+
+               "%main       = OpFunction %void None %voidf\n"
+               "%label      = OpLabel\n"
+               "%idval      = OpLoad %uvec3 %id\n"
+               "%x          = OpCompositeExtract %u32 %idval 0\n"
+               "%inloc1     = OpAccessChain %f32ptr %indata1 %zero %x\n"
+               "%inval1     = OpLoad %f32 %inloc1\n"
+               "%inloc2     = OpAccessChain %f32ptr %indata2 %zero %x\n"
+               "%inval2     = OpLoad %f32 %inloc2\n"
+               "%mul        = OpFMul %f32 %inval1 %inval2\n"
+               "%add        = OpFAdd %f32 %mul %c_f_m1\n"
+               "%outloc     = OpAccessChain %f32ptr %outdata %zero %x\n"
+               "              OpStore %outloc %add\n"
+               "              OpReturn\n"
+               "              OpFunctionEnd\n");
+
+       cases.push_back(CaseParameter("multiplication", "OpDecorate %mul NoContraction"));
+       cases.push_back(CaseParameter("addition",               "OpDecorate %add NoContraction"));
+       cases.push_back(CaseParameter("both",                   "OpDecorate %mul NoContraction\nOpDecorate %add NoContraction"));
+
+       for (size_t ndx = 0; ndx < numElements; ++ndx)
+       {
+               inputFloats1[ndx]       = 1.f + std::ldexp(1.f, -23); // 1 + 2^-23.
+               inputFloats2[ndx]       = 1.f - std::ldexp(1.f, -23); // 1 - 2^-23.
+               // Result for (1 + 2^-23) * (1 - 2^-23) - 1. With NoContraction, the multiplication will be
+               // conducted separately and the result is rounded to 1. So the final result will be 0.f.
+               // If the operation is combined into a precise fused multiply-add, then the result would be
+               // 2^-46 (0xa8800000).
+               outputFloats[ndx]       = 0.f;
+       }
+
+       for (size_t caseNdx = 0; caseNdx < cases.size(); ++caseNdx)
+       {
+               map<string, string>             specializations;
+               ComputeShaderSpec               spec;
+
+               specializations["DECORATION"] = cases[caseNdx].param;
+               spec.assembly = shaderTemplate.specialize(specializations);
+               spec.inputs.push_back(BufferSp(new Float32Buffer(inputFloats1)));
+               spec.inputs.push_back(BufferSp(new Float32Buffer(inputFloats2)));
+               spec.outputs.push_back(BufferSp(new Float32Buffer(outputFloats)));
+               spec.numWorkGroups = IVec3(numElements, 1, 1);
+               spec.entryPoint = "main";
+
+               group->addChild(new SpvAsmComputeShaderCase(testCtx, cases[caseNdx].name, cases[caseNdx].name, spec));
+       }
+       return group.release();
+}
+
+// Copy contents in the input buffer to the output buffer.
+tcu::TestCaseGroup* createOpCopyMemoryGroup (tcu::TestContext& testCtx)
+{
+       de::MovePtr<tcu::TestCaseGroup> group                   (new tcu::TestCaseGroup(testCtx, "opcopymemory", "Test the OpCopyMemory instruction"));
+       de::Random                                              rnd                             (deStringHash(group->getName()));
+       const int                                               numElements             = 100;
+
+       // The following case adds vec4(0., 0.5, 1.5, 2.5) to each of the elements in the input buffer and writes output to the output buffer.
+       ComputeShaderSpec                               spec1;
+       vector<Vec4>                                    inputFloats1    (numElements);
+       vector<Vec4>                                    outputFloats1   (numElements);
+
+       fillRandomScalars(rnd, -200.f, 200.f, &inputFloats1[0], numElements * 4);
+
+       for (size_t ndx = 0; ndx < numElements; ++ndx)
+               outputFloats1[ndx] = inputFloats1[ndx] + Vec4(0.f, 0.5f, 1.5f, 2.5f);
+
+       spec1.assembly =
+               string(s_ShaderPreamble) +
+
+               "OpName %main           \"main\"\n"
+               "OpName %id             \"gl_GlobalInvocationID\"\n"
+
+               "OpDecorate %id BuiltIn GlobalInvocationId\n"
+
+               + string(s_InputOutputBufferTraits) + string(s_CommonTypes) +
+
+               "%vec4       = OpTypeVector %f32 4\n"
+               "%vec4ptr_u  = OpTypePointer Uniform %vec4\n"
+               "%vec4ptr_f  = OpTypePointer Function %vec4\n"
+               "%vec4arr    = OpTypeRuntimeArray %vec4\n"
+               "%inbuf      = OpTypeStruct %vec4arr\n"
+               "%inbufptr   = OpTypePointer Uniform %inbuf\n"
+               "%indata     = OpVariable %inbufptr Uniform\n"
+               "%outbuf     = OpTypeStruct %vec4arr\n"
+               "%outbufptr  = OpTypePointer Uniform %outbuf\n"
+               "%outdata    = OpVariable %outbufptr Uniform\n"
+
+               "%id         = OpVariable %uvec3ptr Input\n"
+               "%zero       = OpConstant %i32 0\n"
+               "%c_f_0      = OpConstant %f32 0.\n"
+               "%c_f_0_5    = OpConstant %f32 0.5\n"
+               "%c_f_1_5    = OpConstant %f32 1.5\n"
+               "%c_f_2_5    = OpConstant %f32 2.5\n"
+               "%c_vec4     = OpConstantComposite %vec4 %c_f_0 %c_f_0_5 %c_f_1_5 %c_f_2_5\n"
+
+               "%main       = OpFunction %void None %voidf\n"
+               "%label      = OpLabel\n"
+               "%v_vec4     = OpVariable %vec4ptr_f Function\n"
+               "%idval      = OpLoad %uvec3 %id\n"
+               "%x          = OpCompositeExtract %u32 %idval 0\n"
+               "%inloc      = OpAccessChain %vec4ptr_u %indata %zero %x\n"
+               "%outloc     = OpAccessChain %vec4ptr_u %outdata %zero %x\n"
+               "              OpCopyMemory %v_vec4 %inloc\n"
+               "%v_vec4_val = OpLoad %vec4 %v_vec4\n"
+               "%add        = OpFAdd %vec4 %v_vec4_val %c_vec4\n"
+               "              OpStore %outloc %add\n"
+               "              OpReturn\n"
+               "              OpFunctionEnd\n";
+
+       spec1.inputs.push_back(BufferSp(new Vec4Buffer(inputFloats1)));
+       spec1.outputs.push_back(BufferSp(new Vec4Buffer(outputFloats1)));
+       spec1.numWorkGroups = IVec3(numElements, 1, 1);
+       spec1.entryPoint = "main";
+
+       group->addChild(new SpvAsmComputeShaderCase(testCtx, "vector", "OpCopyMemory elements of vector type", spec1));
+
+       // The following case copies a float[100] variable from the input buffer to the output buffer.
+       ComputeShaderSpec                               spec2;
+       vector<float>                                   inputFloats2    (numElements);
+       vector<float>                                   outputFloats2   (numElements);
+
+       fillRandomScalars(rnd, -200.f, 200.f, &inputFloats2[0], numElements);
+
+       for (size_t ndx = 0; ndx < numElements; ++ndx)
+               outputFloats2[ndx] = inputFloats2[ndx];
+
+       spec2.assembly =
+               string(s_ShaderPreamble) +
+
+               "OpName %main           \"main\"\n"
+               "OpName %id             \"gl_GlobalInvocationID\"\n"
+
+               "OpDecorate %id BuiltIn GlobalInvocationId\n"
+
+               + string(s_InputOutputBufferTraits) + string(s_CommonTypes) +
+
+               "%hundred        = OpConstant %u32 100\n"
+               "%f32arr100      = OpTypeArray %f32 %hundred\n"
+               "%f32arr100ptr_f = OpTypePointer Function %f32arr100\n"
+               "%f32arr100ptr_u = OpTypePointer Uniform %f32arr100\n"
+               "%inbuf          = OpTypeStruct %f32arr100\n"
+               "%inbufptr       = OpTypePointer Uniform %inbuf\n"
+               "%indata         = OpVariable %inbufptr Uniform\n"
+               "%outbuf         = OpTypeStruct %f32arr100\n"
+               "%outbufptr      = OpTypePointer Uniform %outbuf\n"
+               "%outdata        = OpVariable %outbufptr Uniform\n"
+
+               "%id             = OpVariable %uvec3ptr Input\n"
+               "%zero           = OpConstant %i32 0\n"
+
+               "%main           = OpFunction %void None %voidf\n"
+               "%label          = OpLabel\n"
+               "%var            = OpVariable %f32arr100ptr_f Function\n"
+               "%inarr          = OpAccessChain %f32arr100ptr_u %indata %zero\n"
+               "%outarr         = OpAccessChain %f32arr100ptr_u %outdata %zero\n"
+               "                  OpCopyMemory %var %inarr\n"
+               "                  OpCopyMemory %outarr %var\n"
+               "                  OpReturn\n"
+               "                  OpFunctionEnd\n";
+
+       spec2.inputs.push_back(BufferSp(new Float32Buffer(inputFloats2)));
+       spec2.outputs.push_back(BufferSp(new Float32Buffer(outputFloats2)));
+       spec2.numWorkGroups = IVec3(1, 1, 1);
+       spec2.entryPoint = "main";
+
+       group->addChild(new SpvAsmComputeShaderCase(testCtx, "array", "OpCopyMemory elements of array type", spec2));
+
+       // The following case copies a struct{vec4, vec4, vec4, vec4} variable from the input buffer to the output buffer.
+       ComputeShaderSpec                               spec3;
+       vector<float>                                   inputFloats3    (16);
+       vector<float>                                   outputFloats3   (16);
+
+       fillRandomScalars(rnd, -200.f, 200.f, &inputFloats3[0], 16);
+
+       for (size_t ndx = 0; ndx < 16; ++ndx)
+               outputFloats3[ndx] = -inputFloats3[ndx];
+
+       spec3.assembly =
+               string(s_ShaderPreamble) +
+
+               "OpName %main           \"main\"\n"
+               "OpName %id             \"gl_GlobalInvocationID\"\n"
+
+               "OpDecorate %id BuiltIn GlobalInvocationId\n"
+
+               + string(s_InputOutputBufferTraits) + string(s_CommonTypes) +
+
+               "%vec4      = OpTypeVector %f32 4\n"
+               "%inbuf     = OpTypeStruct %vec4 %vec4 %vec4 %vec4\n"
+               "%inbufptr  = OpTypePointer Uniform %inbuf\n"
+               "%indata    = OpVariable %inbufptr Uniform\n"
+               "%outbuf    = OpTypeStruct %vec4 %vec4 %vec4 %vec4\n"
+               "%outbufptr = OpTypePointer Uniform %outbuf\n"
+               "%outdata   = OpVariable %outbufptr Uniform\n"
+               "%vec4stptr = OpTypePointer Function %inbuf\n"
+
+               "%id        = OpVariable %uvec3ptr Input\n"
+               "%zero      = OpConstant %i32 0\n"
+
+               "%main      = OpFunction %void None %voidf\n"
+               "%label     = OpLabel\n"
+               "%var       = OpVariable %vec4stptr Function\n"
+               "             OpCopyMemory %var %indata\n"
+               "             OpCopyMemory %outdata %var\n"
+               "             OpReturn\n"
+               "             OpFunctionEnd\n";
+
+       spec3.inputs.push_back(BufferSp(new Float32Buffer(inputFloats3)));
+       spec3.outputs.push_back(BufferSp(new Float32Buffer(outputFloats3)));
+       spec3.numWorkGroups = IVec3(1, 1, 1);
+       spec3.entryPoint = "main";
+
+       group->addChild(new SpvAsmComputeShaderCase(testCtx, "struct", "OpCopyMemory elements of struct type", spec3));
+
+       // The following case negates multiple float variables from the input buffer and stores the results to the output buffer.
+       ComputeShaderSpec                               spec4;
+       vector<float>                                   inputFloats4    (numElements);
+       vector<float>                                   outputFloats4   (numElements);
+
+       fillRandomScalars(rnd, -200.f, 200.f, &inputFloats4[0], numElements);
+
+       for (size_t ndx = 0; ndx < numElements; ++ndx)
+               outputFloats4[ndx] = -inputFloats4[ndx];
+
+       spec4.assembly =
+               string(s_ShaderPreamble) +
+
+               "OpName %main           \"main\"\n"
+               "OpName %id             \"gl_GlobalInvocationID\"\n"
+
+               "OpDecorate %id BuiltIn GlobalInvocationId\n"
+
+               + string(s_InputOutputBufferTraits) + string(s_CommonTypes) + string(s_InputOutputBuffer) +
+
+               "%f32ptr_f  = OpTypePointer Function %f32\n"
+               "%id        = OpVariable %uvec3ptr Input\n"
+               "%zero      = OpConstant %i32 0\n"
+
+               "%main      = OpFunction %void None %voidf\n"
+               "%label     = OpLabel\n"
+               "%var       = OpVariable %f32ptr_f Function\n"
+               "%idval     = OpLoad %uvec3 %id\n"
+               "%x         = OpCompositeExtract %u32 %idval 0\n"
+               "%inloc     = OpAccessChain %f32ptr %indata %zero %x\n"
+               "%outloc    = OpAccessChain %f32ptr %outdata %zero %x\n"
+               "             OpCopyMemory %var %inloc\n"
+               "%val       = OpLoad %f32 %var\n"
+               "%neg       = OpFNegate %f32 %val\n"
+               "             OpStore %outloc %neg\n"
+               "             OpReturn\n"
+               "             OpFunctionEnd\n";
+
+       spec4.inputs.push_back(BufferSp(new Float32Buffer(inputFloats4)));
+       spec4.outputs.push_back(BufferSp(new Float32Buffer(outputFloats4)));
+       spec4.numWorkGroups = IVec3(numElements, 1, 1);
+       spec4.entryPoint = "main";
+
+       group->addChild(new SpvAsmComputeShaderCase(testCtx, "float", "OpCopyMemory elements of float type", spec4));
+
+       return group.release();
+}
+
+tcu::TestCaseGroup* createOpCopyObjectGroup (tcu::TestContext& testCtx)
+{
+       de::MovePtr<tcu::TestCaseGroup> group                   (new tcu::TestCaseGroup(testCtx, "opcopyobject", "Test the OpCopyObject instruction"));
+       ComputeShaderSpec                               spec;
+       de::Random                                              rnd                             (deStringHash(group->getName()));
+       const int                                               numElements             = 100;
+       vector<float>                                   inputFloats             (numElements, 0);
+       vector<float>                                   outputFloats    (numElements, 0);
+
+       fillRandomScalars(rnd, -200.f, 200.f, &inputFloats[0], numElements);
+
+       for (size_t ndx = 0; ndx < numElements; ++ndx)
+               outputFloats[ndx] = inputFloats[ndx] + 7.5f;
+
+       spec.assembly =
+               string(s_ShaderPreamble) +
+
+               "OpName %main           \"main\"\n"
+               "OpName %id             \"gl_GlobalInvocationID\"\n"
+
+               "OpDecorate %id BuiltIn GlobalInvocationId\n"
+
+               + string(s_InputOutputBufferTraits) + string(s_CommonTypes) +
+
+               "%fvec3    = OpTypeVector %f32 3\n"
+               "%fmat     = OpTypeMatrix %fvec3 3\n"
+               "%three    = OpConstant %u32 3\n"
+               "%farr     = OpTypeArray %f32 %three\n"
+               "%fst      = OpTypeStruct %f32 %f32\n"
+
+               + string(s_InputOutputBuffer) +
+
+               "%id            = OpVariable %uvec3ptr Input\n"
+               "%zero          = OpConstant %i32 0\n"
+               "%c_f           = OpConstant %f32 1.5\n"
+               "%c_fvec3       = OpConstantComposite %fvec3 %c_f %c_f %c_f\n"
+               "%c_fmat        = OpConstantComposite %fmat %c_fvec3 %c_fvec3 %c_fvec3\n"
+               "%c_farr        = OpConstantComposite %farr %c_f %c_f %c_f\n"
+               "%c_fst         = OpConstantComposite %fst %c_f %c_f\n"
+
+               "%main          = OpFunction %void None %voidf\n"
+               "%label         = OpLabel\n"
+               "%c_f_copy      = OpCopyObject %f32   %c_f\n"
+               "%c_fvec3_copy  = OpCopyObject %fvec3 %c_fvec3\n"
+               "%c_fmat_copy   = OpCopyObject %fmat  %c_fmat\n"
+               "%c_farr_copy   = OpCopyObject %farr  %c_farr\n"
+               "%c_fst_copy    = OpCopyObject %fst   %c_fst\n"
+               "%fvec3_elem    = OpCompositeExtract %f32 %c_fvec3_copy 0\n"
+               "%fmat_elem     = OpCompositeExtract %f32 %c_fmat_copy 1 2\n"
+               "%farr_elem     = OpCompositeExtract %f32 %c_fmat_copy 2\n"
+               "%fst_elem      = OpCompositeExtract %f32 %c_fmat_copy 1\n"
+               // Add up. 1.5 * 5 = 7.5.
+               "%add1          = OpFAdd %f32 %c_f_copy %fvec3_elem\n"
+               "%add2          = OpFAdd %f32 %add1     %fmat_elem\n"
+               "%add3          = OpFAdd %f32 %add2     %farr_elem\n"
+               "%add4          = OpFAdd %f32 %add3     %fst_elem\n"
+
+               "%idval         = OpLoad %uvec3 %id\n"
+               "%x             = OpCompositeExtract %u32 %idval 0\n"
+               "%inloc         = OpAccessChain %f32ptr %indata %zero %x\n"
+               "%outloc        = OpAccessChain %f32ptr %outdata %zero %x\n"
+               "%inval         = OpLoad %f32 %inloc\n"
+               "%add           = OpFAdd %f32 %add4 %inval\n"
+               "                 OpStore %outloc %add\n"
+               "                 OpReturn\n"
+               "                 OpFunctionEnd\n";
+       spec.inputs.push_back(BufferSp(new Float32Buffer(inputFloats)));
+       spec.outputs.push_back(BufferSp(new Float32Buffer(outputFloats)));
+       spec.numWorkGroups = IVec3(numElements, 1, 1);
+       spec.entryPoint = "main";
+
+       group->addChild(new SpvAsmComputeShaderCase(testCtx, "spotcheck", "OpCopyObject on different types", spec));
+
+       return group.release();
+}
+
  // Assembly code used for testing OpUnreachable is based on GLSL source code:
  //
  // #version 430
@@ -488,6 +887,7 @@ tcu::TestCaseGroup* createOpUnreachableGroup (tcu::TestContext& testCtx)
         spec.inputs.push_back(BufferSp(new Float32Buffer(positiveFloats)));
         spec.outputs.push_back(BufferSp(new Float32Buffer(negativeFloats)));
         spec.numWorkGroups = IVec3(numElements, 1, 1);
+       spec.entryPoint = "main";
  
         group->addChild(new SpvAsmComputeShaderCase(testCtx, "all", "OpUnreachable appearing at different places", spec));
  
@@ -649,13 +1049,238 @@ tcu::TestCaseGroup* createDecorationGroupGroup (tcu::TestContext& testCtx)
         spec.inputs.push_back(BufferSp(new Float32Buffer(inputFloats4)));
         spec.outputs.push_back(BufferSp(new Float32Buffer(outputFloats)));
         spec.numWorkGroups = IVec3(numElements, 1, 1);
+       spec.entryPoint = "main";
  
         group->addChild(new SpvAsmComputeShaderCase(testCtx, "all", "decoration group cases", spec));
  
         return group.release();
  }
  
-tcu::TestCaseGroup* createOpPhiGroup (tcu::TestContext& testCtx)
+struct SpecConstantTwoIntCase
+{
+       const char*             caseName;
+       const char*             scDefinition0;
+       const char*             scDefinition1;
+       const char*             scResultType;
+       const char*             scOperation;
+       deInt32                 scActualValue0;
+       deInt32                 scActualValue1;
+       const char*             resultOperation;
+       vector<deInt32> expectedOutput;
+
+                                       SpecConstantTwoIntCase (const char* name,
+                                                                                       const char* definition0,
+                                                                                       const char* definition1,
+                                                                                       const char* resultType,
+                                                                                       const char* operation,
+                                                                                       deInt32 value0,
+                                                                                       deInt32 value1,
+                                                                                       const char* resultOp,
+                                                                                       const vector<deInt32>& output)
+                                               : caseName                      (name)
+                                               , scDefinition0         (definition0)
+                                               , scDefinition1         (definition1)
+                                               , scResultType          (resultType)
+                                               , scOperation           (operation)
+                                               , scActualValue0        (value0)
+                                               , scActualValue1        (value1)
+                                               , resultOperation       (resultOp)
+                                               , expectedOutput        (output) {}
+};
+
+tcu::TestCaseGroup* createSpecConstantGroup (tcu::TestContext& testCtx)
+{
+       de::MovePtr<tcu::TestCaseGroup> group                   (new tcu::TestCaseGroup(testCtx, "opspecconstantop", "Test the OpSpecConstantOp instruction"));
+       vector<SpecConstantTwoIntCase>  cases;
+       de::Random                                              rnd                             (deStringHash(group->getName()));
+       const int                                               numElements             = 100;
+       vector<deInt32>                                 inputInts               (numElements, 0);
+       vector<deInt32>                                 outputInts1             (numElements, 0);
+       vector<deInt32>                                 outputInts2             (numElements, 0);
+       vector<deInt32>                                 outputInts3             (numElements, 0);
+       vector<deInt32>                                 outputInts4             (numElements, 0);
+       vector<deInt32>                                 outputInts5             (numElements, 0);
+       const StringTemplate                    shaderTemplate  (
+               string(s_ShaderPreamble) +
+
+               "OpName %main           \"main\"\n"
+               "OpName %id             \"gl_GlobalInvocationID\"\n"
+
+               "OpDecorate %id BuiltIn GlobalInvocationId\n"
+               "OpDecorate %sc_0  SpecId 0\n"
+               "OpDecorate %sc_1  SpecId 1\n"
+
+               + string(s_InputOutputBufferTraits) + string(s_CommonTypes) +
+
+               "%i32ptr    = OpTypePointer Uniform %i32\n"
+               "%i32arr    = OpTypeRuntimeArray %i32\n"
+               "%boolptr   = OpTypePointer Uniform %bool\n"
+               "%boolarr   = OpTypeRuntimeArray %bool\n"
+               "%inbuf     = OpTypeStruct %i32arr\n"
+               "%inbufptr  = OpTypePointer Uniform %inbuf\n"
+               "%indata    = OpVariable %inbufptr Uniform\n"
+               "%outbuf    = OpTypeStruct %i32arr\n"
+               "%outbufptr = OpTypePointer Uniform %outbuf\n"
+               "%outdata   = OpVariable %outbufptr Uniform\n"
+
+               "%id        = OpVariable %uvec3ptr Input\n"
+               "%zero      = OpConstant %i32 0\n"
+
+               "%sc_0      = OpSpecConstant${SC_DEF0}\n"
+               "%sc_1      = OpSpecConstant${SC_DEF1}\n"
+               "%sc_final  = OpSpecConstantOp ${SC_RESULT_TYPE} ${SC_OP}\n"
+
+               "%main      = OpFunction %void None %voidf\n"
+               "%label     = OpLabel\n"
+               "%idval     = OpLoad %uvec3 %id\n"
+               "%x         = OpCompositeExtract %u32 %idval 0\n"
+               "%inloc     = OpAccessChain %i32ptr %indata %zero %x\n"
+               "%inval     = OpLoad %i32 %inloc\n"
+               "%final     = ${GEN_RESULT}\n"
+               "%outloc    = OpAccessChain %i32ptr %outdata %zero %x\n"
+               "             OpStore %outloc %final\n"
+               "             OpReturn\n"
+               "             OpFunctionEnd\n");
+
+       fillRandomScalars(rnd, -65536, 65536, &inputInts[0], numElements);
+
+       for (size_t ndx = 0; ndx < numElements; ++ndx)
+       {
+               outputInts1[ndx] = inputInts[ndx] + 42;
+               outputInts2[ndx] = inputInts[ndx];
+               outputInts3[ndx] = inputInts[ndx] - 11200;
+               outputInts4[ndx] = inputInts[ndx] + 1;
+               outputInts5[ndx] = inputInts[ndx] - 2;
+       }
+
+       const char addScToInput[]               = "OpIAdd %i32 %inval %sc_final";
+       const char selectTrueUsingSc[]  = "OpSelect %i32 %sc_final %inval %zero";
+       const char selectFalseUsingSc[] = "OpSelect %i32 %sc_final %zero %inval";
+
+       cases.push_back(SpecConstantTwoIntCase("iadd",                                  " %i32 0",              " %i32 0",              "%i32",         "IAdd                 %sc_0 %sc_1",                     62,             -20,    addScToInput,           outputInts1));
+       cases.push_back(SpecConstantTwoIntCase("isub",                                  " %i32 0",              " %i32 0",              "%i32",         "ISub                 %sc_0 %sc_1",                     100,    58,             addScToInput,           outputInts1));
+       cases.push_back(SpecConstantTwoIntCase("imul",                                  " %i32 0",              " %i32 0",              "%i32",         "IMul                 %sc_0 %sc_1",                     -2,             -21,    addScToInput,           outputInts1));
+       cases.push_back(SpecConstantTwoIntCase("sdiv",                                  " %i32 0",              " %i32 0",              "%i32",         "SDiv                 %sc_0 %sc_1",                     -126,   -3,             addScToInput,           outputInts1));
+       cases.push_back(SpecConstantTwoIntCase("udiv",                                  " %i32 0",              " %i32 0",              "%i32",         "UDiv                 %sc_0 %sc_1",                     126,    3,              addScToInput,           outputInts1));
+       cases.push_back(SpecConstantTwoIntCase("srem",                                  " %i32 0",              " %i32 0",              "%i32",         "SRem                 %sc_0 %sc_1",                     7,              -3,             addScToInput,           outputInts4));
+       cases.push_back(SpecConstantTwoIntCase("smod",                                  " %i32 0",              " %i32 0",              "%i32",         "SMod                 %sc_0 %sc_1",                     7,              -3,             addScToInput,           outputInts5));
+       cases.push_back(SpecConstantTwoIntCase("umod",                                  " %i32 0",              " %i32 0",              "%i32",         "UMod                 %sc_0 %sc_1",                     342,    50,             addScToInput,           outputInts1));
+       cases.push_back(SpecConstantTwoIntCase("bitwiseand",                    " %i32 0",              " %i32 0",              "%i32",         "BitwiseAnd           %sc_0 %sc_1",                     42,             63,             addScToInput,           outputInts1));
+       cases.push_back(SpecConstantTwoIntCase("bitwiseor",                             " %i32 0",              " %i32 0",              "%i32",         "BitwiseOr            %sc_0 %sc_1",                     34,             8,              addScToInput,           outputInts1));
+       cases.push_back(SpecConstantTwoIntCase("bitwisexor",                    " %i32 0",              " %i32 0",              "%i32",         "BitwiseAnd           %sc_0 %sc_1",                     18,             56,             addScToInput,           outputInts1));
+       cases.push_back(SpecConstantTwoIntCase("shiftrightlogical",             " %i32 0",              " %i32 0",              "%i32",         "ShiftRightLogical    %sc_0 %sc_1",                     168,    2,              addScToInput,           outputInts1));
+       cases.push_back(SpecConstantTwoIntCase("shiftrightarithmetic",  " %i32 0",              " %i32 0",              "%i32",         "ShiftRightArithmetic %sc_0 %sc_1",                     168,    2,              addScToInput,           outputInts1));
+       cases.push_back(SpecConstantTwoIntCase("shiftleftlogical",              " %i32 0",              " %i32 0",              "%i32",         "ShiftLeftLogical     %sc_0 %sc_1",                     21,             1,              addScToInput,           outputInts1));
+       cases.push_back(SpecConstantTwoIntCase("slessthan",                             " %i32 0",              " %i32 0",              "%bool",        "SLessThan            %sc_0 %sc_1",                     -20,    -10,    selectTrueUsingSc,      outputInts2));
+       cases.push_back(SpecConstantTwoIntCase("ulessthan",                             " %i32 0",              " %i32 0",              "%bool",        "ULessThan            %sc_0 %sc_1",                     10,             20,             selectTrueUsingSc,      outputInts2));
+       cases.push_back(SpecConstantTwoIntCase("sgreaterthan",                  " %i32 0",              " %i32 0",              "%bool",        "SGreaterThan         %sc_0 %sc_1",                     -1000,  50,             selectFalseUsingSc,     outputInts2));
+       cases.push_back(SpecConstantTwoIntCase("ugreaterthan",                  " %i32 0",              " %i32 0",              "%bool",        "UGreaterThan         %sc_0 %sc_1",                     10,             5,              selectTrueUsingSc,      outputInts2));
+       cases.push_back(SpecConstantTwoIntCase("slessthanequal",                " %i32 0",              " %i32 0",              "%bool",        "SLessThanEqual       %sc_0 %sc_1",                     -10,    -10,    selectTrueUsingSc,      outputInts2));
+       cases.push_back(SpecConstantTwoIntCase("ulessthanequal",                " %i32 0",              " %i32 0",              "%bool",        "ULessThanEqual       %sc_0 %sc_1",                     50,             100,    selectTrueUsingSc,      outputInts2));
+       cases.push_back(SpecConstantTwoIntCase("sgreaterthanequal",             " %i32 0",              " %i32 0",              "%bool",        "SGreaterThanEqual    %sc_0 %sc_1",                     -1000,  50,             selectFalseUsingSc,     outputInts2));
+       cases.push_back(SpecConstantTwoIntCase("ugreaterthanequal",             " %i32 0",              " %i32 0",              "%bool",        "UGreaterThanEqual    %sc_0 %sc_1",                     10,             10,             selectTrueUsingSc,      outputInts2));
+       cases.push_back(SpecConstantTwoIntCase("iequal",                                " %i32 0",              " %i32 0",              "%bool",        "IEqual               %sc_0 %sc_1",                     42,             24,             selectFalseUsingSc,     outputInts2));
+       cases.push_back(SpecConstantTwoIntCase("logicaland",                    "True %bool",   "True %bool",   "%bool",        "LogicalAnd           %sc_0 %sc_1",                     0,              1,              selectFalseUsingSc,     outputInts2));
+       cases.push_back(SpecConstantTwoIntCase("logicalor",                             "False %bool",  "False %bool",  "%bool",        "LogicalOr            %sc_0 %sc_1",                     1,              0,              selectTrueUsingSc,      outputInts2));
+       cases.push_back(SpecConstantTwoIntCase("logicalequal",                  "True %bool",   "True %bool",   "%bool",        "LogicalEqual         %sc_0 %sc_1",                     0,              1,              selectFalseUsingSc,     outputInts2));
+       cases.push_back(SpecConstantTwoIntCase("logicalnotequal",               "False %bool",  "False %bool",  "%bool",        "LogicalNotEqual      %sc_0 %sc_1",                     1,              0,              selectTrueUsingSc,      outputInts2));
+       cases.push_back(SpecConstantTwoIntCase("snegate",                               " %i32 0",              " %i32 0",              "%i32",         "SNegate              %sc_0",                           -42,    0,              addScToInput,           outputInts1));
+       cases.push_back(SpecConstantTwoIntCase("not",                                   " %i32 0",              " %i32 0",              "%i32",         "Not                  %sc_0",                           -43,    0,              addScToInput,           outputInts1));
+       cases.push_back(SpecConstantTwoIntCase("logicalnot",                    "False %bool",  "False %bool",  "%bool",        "LogicalNot           %sc_0",                           1,              0,              selectFalseUsingSc,     outputInts2));
+       cases.push_back(SpecConstantTwoIntCase("select",                                "False %bool",  " %i32 0",              "%i32",         "Select               %sc_0 %sc_1 %zero",       1,              42,             addScToInput,           outputInts1));
+       // OpSConvert, OpFConvert: these two instructions involve ints/floats of different bitwidths.
+       // \todo[2015-12-1 antiagainst] OpQuantizeToF16
+
+       for (size_t caseNdx = 0; caseNdx < cases.size(); ++caseNdx)
+       {
+               map<string, string>             specializations;
+               ComputeShaderSpec               spec;
+
+               specializations["SC_DEF0"]                      = cases[caseNdx].scDefinition0;
+               specializations["SC_DEF1"]                      = cases[caseNdx].scDefinition1;
+               specializations["SC_RESULT_TYPE"]       = cases[caseNdx].scResultType;
+               specializations["SC_OP"]                        = cases[caseNdx].scOperation;
+               specializations["GEN_RESULT"]           = cases[caseNdx].resultOperation;
+
+               spec.assembly = shaderTemplate.specialize(specializations);
+               spec.inputs.push_back(BufferSp(new Int32Buffer(inputInts)));
+               spec.outputs.push_back(BufferSp(new Int32Buffer(cases[caseNdx].expectedOutput)));
+               spec.numWorkGroups = IVec3(numElements, 1, 1);
+               spec.entryPoint = "main";
+               spec.specConstants.push_back(cases[caseNdx].scActualValue0);
+               spec.specConstants.push_back(cases[caseNdx].scActualValue1);
+
+               group->addChild(new SpvAsmComputeShaderCase(testCtx, cases[caseNdx].caseName, cases[caseNdx].caseName, spec));
+       }
+
+       ComputeShaderSpec                               spec;
+
+       spec.assembly =
+               string(s_ShaderPreamble) +
+
+               "OpName %main           \"main\"\n"
+               "OpName %id             \"gl_GlobalInvocationID\"\n"
+
+               "OpDecorate %id BuiltIn GlobalInvocationId\n"
+               "OpDecorate %sc_0  SpecId 0\n"
+               "OpDecorate %sc_1  SpecId 1\n"
+               "OpDecorate %sc_2  SpecId 2\n"
+
+               + string(s_InputOutputBufferTraits) + string(s_CommonTypes) +
+
+               "%ivec3     = OpTypeVector %i32 3\n"
+               "%i32ptr    = OpTypePointer Uniform %i32\n"
+               "%i32arr    = OpTypeRuntimeArray %i32\n"
+               "%boolptr   = OpTypePointer Uniform %bool\n"
+               "%boolarr   = OpTypeRuntimeArray %bool\n"
+               "%inbuf     = OpTypeStruct %i32arr\n"
+               "%inbufptr  = OpTypePointer Uniform %inbuf\n"
+               "%indata    = OpVariable %inbufptr Uniform\n"
+               "%outbuf    = OpTypeStruct %i32arr\n"
+               "%outbufptr = OpTypePointer Uniform %outbuf\n"
+               "%outdata   = OpVariable %outbufptr Uniform\n"
+
+               "%id        = OpVariable %uvec3ptr Input\n"
+               "%zero      = OpConstant %i32 0\n"
+               "%ivec3_0   = OpConstantComposite %ivec3 %zero %zero %zero\n"
+
+               "%sc_0        = OpSpecConstant %i32 0\n"
+               "%sc_1        = OpSpecConstant %i32 0\n"
+               "%sc_2        = OpSpecConstant %i32 0\n"
+               "%sc_vec3_0   = OpSpecConstantOp %ivec3 CompositeInsert  %sc_0        %ivec3_0   0\n"     // (sc_0, 0, 0)
+               "%sc_vec3_1   = OpSpecConstantOp %ivec3 CompositeInsert  %sc_1        %ivec3_0   1\n"     // (0, sc_1, 0)
+               "%sc_vec3_2   = OpSpecConstantOp %ivec3 CompositeInsert  %sc_2        %ivec3_0   2\n"     // (0, 0, sc_2)
+               "%sc_vec3_01  = OpSpecConstantOp %ivec3 VectorShuffle    %sc_vec3_0   %sc_vec3_1 1 0 4\n" // (0,    sc_0, sc_1)
+               "%sc_vec3_012 = OpSpecConstantOp %ivec3 VectorShuffle    %sc_vec3_01  %sc_vec3_2 5 1 2\n" // (sc_2, sc_0, sc_1)
+               "%sc_ext_0    = OpSpecConstantOp %i32   CompositeExtract %sc_vec3_012            0\n"     // sc_2
+               "%sc_ext_1    = OpSpecConstantOp %i32   CompositeExtract %sc_vec3_012            1\n"     // sc_0
+               "%sc_ext_2    = OpSpecConstantOp %i32   CompositeExtract %sc_vec3_012            2\n"     // sc_1
+               "%sc_sub      = OpSpecConstantOp %i32   ISub             %sc_ext_0    %sc_ext_1\n"        // (sc_2 - sc_0)
+               "%sc_final    = OpSpecConstantOp %i32   IMul             %sc_sub      %sc_ext_2\n"        // (sc_2 - sc_0) * sc_1
+
+               "%main      = OpFunction %void None %voidf\n"
+               "%label     = OpLabel\n"
+               "%idval     = OpLoad %uvec3 %id\n"
+               "%x         = OpCompositeExtract %u32 %idval 0\n"
+               "%inloc     = OpAccessChain %i32ptr %indata %zero %x\n"
+               "%inval     = OpLoad %i32 %inloc\n"
+               "%final     = OpIAdd %i32 %inval %sc_final\n"
+               "%outloc    = OpAccessChain %i32ptr %outdata %zero %x\n"
+               "             OpStore %outloc %final\n"
+               "             OpReturn\n"
+               "             OpFunctionEnd\n";
+       spec.inputs.push_back(BufferSp(new Int32Buffer(inputInts)));
+       spec.outputs.push_back(BufferSp(new Int32Buffer(outputInts3)));
+       spec.numWorkGroups = IVec3(numElements, 1, 1);
+       spec.entryPoint = "main";
+       spec.specConstants.push_back(123);
+       spec.specConstants.push_back(56);
+       spec.specConstants.push_back(-77);
+
+       group->addChild(new SpvAsmComputeShaderCase(testCtx, "vector_related", "VectorShuffle, CompositeExtract, & CompositeInsert", spec));
+
+       return group.release();
+} tcu::TestCaseGroup* createOpPhiGroup (tcu::TestContext& testCtx)
  {
         de::MovePtr<tcu::TestCaseGroup> group                   (new tcu::TestCaseGroup(testCtx, "opphi", "Test the OpPhi instruction"));
         ComputeShaderSpec                               spec;
@@ -734,6 +1359,7 @@ tcu::TestCaseGroup* createOpPhiGroup (tcu::TestContext& testCtx)
         spec.inputs.push_back(BufferSp(new Float32Buffer(inputFloats)));
         spec.outputs.push_back(BufferSp(new Float32Buffer(outputFloats)));
         spec.numWorkGroups = IVec3(numElements, 1, 1);
+       spec.entryPoint = "main";
  
         group->addChild(new SpvAsmComputeShaderCase(testCtx, "all", "OpPhi corner cases", spec));
  
@@ -892,19 +1518,129 @@ tcu::TestCaseGroup* createBlockOrderGroup (tcu::TestContext& testCtx)
         spec.inputs.push_back(BufferSp(new Float32Buffer(inputFloats)));
         spec.outputs.push_back(BufferSp(new Float32Buffer(outputFloats)));
         spec.numWorkGroups = IVec3(numElements, 1, 1);
+       spec.entryPoint = "main";
  
         group->addChild(new SpvAsmComputeShaderCase(testCtx, "all", "various out-of-order blocks", spec));
  
         return group.release();
  }
  
-struct CaseParameter
+tcu::TestCaseGroup* createMultipleShaderGroup (tcu::TestContext& testCtx)
  {
-       const char*             name;
-       string                  param;
+       de::MovePtr<tcu::TestCaseGroup> group                   (new tcu::TestCaseGroup(testCtx, "multiple_shaders", "Test multiple shaders in the same module"));
+       ComputeShaderSpec                               spec1;
+       ComputeShaderSpec                               spec2;
+       de::Random                                              rnd                             (deStringHash(group->getName()));
+       const int                                               numElements             = 100;
+       vector<float>                                   inputFloats             (numElements, 0);
+       vector<float>                                   outputFloats1   (numElements, 0);
+       vector<float>                                   outputFloats2   (numElements, 0);
  
-       CaseParameter   (const char* case_, const string& param_) : name(case_), param(param_) {}
-};
+       fillRandomScalars(rnd, -500.f, 500.f, &inputFloats[0], numElements);
+
+       for (size_t ndx = 0; ndx < numElements; ++ndx)
+       {
+               outputFloats1[ndx] = inputFloats[ndx] + inputFloats[ndx];
+               outputFloats2[ndx] = -inputFloats[ndx];
+       }
+
+       const string assembly =
+               "OpCapability Shader\n"
+               "OpMemoryModel Logical GLSL450\n"
+               "OpEntryPoint GLCompute %comp_main1 \"entrypoint1\" %id\n"
+               "OpEntryPoint GLCompute %comp_main2 \"entrypoint2\" %id\n"
+               // A module cannot have two OpEntryPoint instructions with the same Execution Model and the same Name string.
+               "OpEntryPoint Vertex    %vert_main  \"entrypoint2\" %vert_builtins %vertexID %instanceID\n"
+               "OpExecutionMode %main LocalSize 1 1 1\n";
+
+               "OpName %comp_main1              \"entrypoint1\"\n"
+               "OpName %comp_main2              \"entrypoint2\"\n"
+               "OpName %vert_main               \"entrypoint2\"\n"
+               "OpName %id                      \"gl_GlobalInvocationID\"\n"
+               "OpName %vert_builtin_st         \"gl_PerVertex\"\n"
+               "OpName %vertexID                \"gl_VertexID\"\n"
+               "OpName %instanceID              \"gl_InstanceID\"\n"
+               "OpMemberName %vert_builtin_st 0 \"gl_Position\"\n"
+               "OpMemberName %vert_builtin_st 1 \"gl_PointSize\"\n"
+               "OpMemberName %vert_builtin_st 2 \"gl_ClipDistance\"\n"
+
+               "OpDecorate %id                      BuiltIn GlobalInvocationId\n"
+               "OpDecorate %vertexID                BuiltIn VertexId\n"
+               "OpDecorate %instanceID              BuiltIn InstanceId\n"
+               "OpDecorate %vert_builtin_st         Block\n"
+               "OpMemberDecorate %vert_builtin_st 0 BuiltIn Position\n"
+               "OpMemberDecorate %vert_builtin_st 1 BuiltIn PointSize\n"
+               "OpMemberDecorate %vert_builtin_st 2 BuiltIn ClipDistance\n"
+
+               + string(s_InputOutputBufferTraits) + string(s_CommonTypes) + string(s_InputOutputBuffer) +
+
+               "%i32ptr              = OpTypePointer Input %i32\n"
+               "%vec4                = OpTypeVector %f32 4\n"
+               "%vec4ptr             = OpTypePointer Output %vec4\n"
+               "%f32arr1             = OpTypeArray %f32 %one\n"
+               "%vert_builtin_st     = OpTypeStruct %vec4 %f32 %f32arr1\n"
+               "%vert_builtin_st_ptr = OpTypePointer Output %vert_builtin_st\n"
+               "%vert_builtins       = OpVariable %vert_builtin_st_ptr Output\n"
+
+               "%id         = OpVariable %uvec3ptr Input\n"
+               "%vertexID   = OpVariable %i32ptr Input\n"
+               "%instanceID = OpVariable %i32ptr Input\n"
+               "%zero       = OpConstant %i32 0\n"
+               "%one        = OpConstant %u32 1\n"
+               "%c_f32_1    = OpConstant %f32 1\n"
+               "%c_vec4_1   = OpConstantComposite %vec4 %c_f32_1 %c_f32_1 %c_f32_1 %c_f32_1\n"
+
+               // gl_Position = vec4(1.);
+               "%vert_main  = OpFunction %void None %voidf\n"
+               "%vert_entry = OpLabel\n"
+               "%position   = OpAccessChain %vec4ptr %vert_builtins %zero\n"
+               "              OpStore %position %c_vec4_1\n"
+               "              OpReturn\n"
+               "              OpFunctionEnd\n"
+
+               // Double inputs.
+               "%comp_main1  = OpFunction %void None %voidf\n"
+               "%comp1_entry = OpLabel\n"
+               "%idval1      = OpLoad %uvec3 %id\n"
+               "%x1          = OpCompositeExtract %u32 %idval1 0\n"
+               "%inloc1      = OpAccessChain %f32ptr %indata %zero %x1\n"
+               "%inval1      = OpLoad %f32 %inloc1\n"
+               "%add         = OpFAdd %f32 %inval1 %inval1\n"
+               "%outloc1     = OpAccessChain %f32ptr %outdata %zero %x1\n"
+               "               OpStore %outloc1 %add\n"
+               "               OpReturn\n"
+               "               OpFunctionEnd\n"
+
+               // Negate inputs.
+               "%comp_main2  = OpFunction %void None %voidf\n"
+               "%comp2_entry = OpLabel\n"
+               "%idval2      = OpLoad %uvec3 %id\n"
+               "%x2          = OpCompositeExtract %u32 %idval2 0\n"
+               "%inloc2      = OpAccessChain %f32ptr %indata %zero %x2\n"
+               "%inval2      = OpLoad %f32 %inloc2\n"
+               "%neg         = OpFNegate %f32 %inval2\n"
+               "%outloc2     = OpAccessChain %f32ptr %outdata %zero %x2\n"
+               "               OpStore %outloc2 %neg\n"
+               "               OpReturn\n"
+               "               OpFunctionEnd\n";
+
+       spec1.assembly = assembly;
+       spec1.inputs.push_back(BufferSp(new Float32Buffer(inputFloats)));
+       spec1.outputs.push_back(BufferSp(new Float32Buffer(outputFloats1)));
+       spec1.numWorkGroups = IVec3(numElements, 1, 1);
+       spec1.entryPoint = "entrypoint1";
+
+       spec2.assembly = assembly;
+       spec2.inputs.push_back(BufferSp(new Float32Buffer(inputFloats)));
+       spec2.outputs.push_back(BufferSp(new Float32Buffer(outputFloats2)));
+       spec2.numWorkGroups = IVec3(numElements, 1, 1);
+       spec2.entryPoint = "entrypoint2";
+
+       group->addChild(new SpvAsmComputeShaderCase(testCtx, "shader1", "multiple shaders in the same module", spec1));
+       group->addChild(new SpvAsmComputeShaderCase(testCtx, "shader2", "multiple shaders in the same module", spec2));
+
+       return group.release();
+}
  
  tcu::TestCaseGroup* createOpSourceGroup (tcu::TestContext& testCtx)
  {
@@ -995,6 +1731,7 @@ tcu::TestCaseGroup* createOpSourceGroup (tcu::TestContext& testCtx)
                 spec.inputs.push_back(BufferSp(new Float32Buffer(positiveFloats)));
                 spec.outputs.push_back(BufferSp(new Float32Buffer(negativeFloats)));
                 spec.numWorkGroups = IVec3(numElements, 1, 1);
+               spec.entryPoint = "main";
  
                 group->addChild(new SpvAsmComputeShaderCase(testCtx, cases[caseNdx].name, cases[caseNdx].name, spec));
         }
@@ -1058,6 +1795,7 @@ tcu::TestCaseGroup* createOpSourceExtensionGroup (tcu::TestContext& testCtx)
                 spec.inputs.push_back(BufferSp(new Float32Buffer(inputFloats)));
                 spec.outputs.push_back(BufferSp(new Float32Buffer(outputFloats)));
                 spec.numWorkGroups = IVec3(numElements, 1, 1);
+               spec.entryPoint = "main";
  
                 group->addChild(new SpvAsmComputeShaderCase(testCtx, cases[caseNdx].name, cases[caseNdx].name, spec));
         }
@@ -1132,6 +1870,7 @@ tcu::TestCaseGroup* createOpConstantNullGroup (tcu::TestContext& testCtx)
                 spec.inputs.push_back(BufferSp(new Float32Buffer(positiveFloats)));
                 spec.outputs.push_back(BufferSp(new Float32Buffer(negativeFloats)));
                 spec.numWorkGroups = IVec3(numElements, 1, 1);
+               spec.entryPoint = "main";
  
                 group->addChild(new SpvAsmComputeShaderCase(testCtx, cases[caseNdx].name, cases[caseNdx].name, spec));
         }
@@ -1214,6 +1953,7 @@ tcu::TestCaseGroup* createOpConstantCompositeGroup (tcu::TestContext& testCtx)
                 spec.inputs.push_back(BufferSp(new Float32Buffer(positiveFloats)));
                 spec.outputs.push_back(BufferSp(new Float32Buffer(negativeFloats)));
                 spec.numWorkGroups = IVec3(numElements, 1, 1);
+               spec.entryPoint = "main";
  
                 group->addChild(new SpvAsmComputeShaderCase(testCtx, cases[caseNdx].name, cases[caseNdx].name, spec));
         }
@@ -1306,6 +2046,7 @@ tcu::TestCaseGroup* createOpConstantUsageGroup (tcu::TestContext& testCtx)
         spec.inputs.push_back(BufferSp(new Float32Buffer(positiveFloats)));
         spec.outputs.push_back(BufferSp(new Float32Buffer(negativeFloats)));
         spec.numWorkGroups = IVec3(numElements, 1, 1);
+       spec.entryPoint = "main";
  
         group->addChild(new SpvAsmComputeShaderCase(testCtx, "spotcheck", "Check that values constructed via OpConstantNull & OpConstantComposite can be used", spec));
  
@@ -1404,6 +2145,7 @@ tcu::TestCaseGroup* createLoopControlGroup (tcu::TestContext& testCtx)
                 spec.inputs.push_back(BufferSp(new Float32Buffer(inputFloats)));
                 spec.outputs.push_back(BufferSp(new Float32Buffer(outputFloats)));
                 spec.numWorkGroups = IVec3(numElements, 1, 1);
+               spec.entryPoint = "main";
  
                 group->addChild(new SpvAsmComputeShaderCase(testCtx, cases[caseNdx].name, cases[caseNdx].name, spec));
         }
@@ -1496,6 +2238,7 @@ tcu::TestCaseGroup* createSelectionControlGroup (tcu::TestContext& testCtx)
                 spec.inputs.push_back(BufferSp(new Float32Buffer(inputFloats)));
                 spec.outputs.push_back(BufferSp(new Float32Buffer(outputFloats)));
                 spec.numWorkGroups = IVec3(numElements, 1, 1);
+               spec.entryPoint = "main";
  
                 group->addChild(new SpvAsmComputeShaderCase(testCtx, cases[caseNdx].name, cases[caseNdx].name, spec));
         }
@@ -1588,6 +2331,78 @@ tcu::TestCaseGroup* createFunctionControlGroup (tcu::TestContext& testCtx)
                 spec.inputs.push_back(BufferSp(new Float32Buffer(inputFloats)));
                 spec.outputs.push_back(BufferSp(new Float32Buffer(outputFloats)));
                 spec.numWorkGroups = IVec3(numElements, 1, 1);
+               spec.entryPoint = "main";
+
+               group->addChild(new SpvAsmComputeShaderCase(testCtx, cases[caseNdx].name, cases[caseNdx].name, spec));
+       }
+
+       return group.release();
+}
+
+tcu::TestCaseGroup* createMemoryAccessGroup (tcu::TestContext& testCtx)
+{
+       de::MovePtr<tcu::TestCaseGroup> group                   (new tcu::TestCaseGroup(testCtx, "memory_access", "Tests memory access cases"));
+       vector<CaseParameter>                   cases;
+       de::Random                                              rnd                             (deStringHash(group->getName()));
+       const int                                               numElements             = 100;
+       vector<float>                                   inputFloats             (numElements, 0);
+       vector<float>                                   outputFloats    (numElements, 0);
+       const StringTemplate                    shaderTemplate  (
+               string(s_ShaderPreamble) +
+
+               "OpSource GLSL 430\n"
+               "OpName %main           \"main\"\n"
+               "OpName %id             \"gl_GlobalInvocationID\"\n"
+
+               "OpDecorate %id BuiltIn GlobalInvocationId\n"
+
+               + string(s_InputOutputBufferTraits) + string(s_CommonTypes) + string(s_InputOutputBuffer) +
+
+               "%f32ptr_f  = OpTypePointer Function %f32\n"
+
+               "%id        = OpVariable %uvec3ptr Input\n"
+               "%zero      = OpConstant %i32 0\n"
+               "%four      = OpConstant %i32 4\n"
+
+               "%main      = OpFunction %void None %voidf\n"
+               "%label     = OpLabel\n"
+               "%copy      = OpVariable %f32ptr_f Function\n"
+               "%idval     = OpLoad %uvec3 %id ${ACCESS}\n"
+               "%x         = OpCompositeExtract %u32 %idval 0\n"
+               "%inloc     = OpAccessChain %f32ptr %indata  %zero %x\n"
+               "%outloc    = OpAccessChain %f32ptr %outdata %zero %x\n"
+               "             OpCopyMemory %copy %inloc ${ACCESS}\n"
+               "%val1      = OpLoad %f32 %copy\n"
+               "%val2      = OpLoad %f32 %inloc\n"
+               "%add       = OpFAdd %f32 %val1 %val2\n"
+               "             OpStore %outloc %add ${ACCESS}\n"
+               "             OpReturn\n"
+               "             OpFunctionEnd\n");
+
+       cases.push_back(CaseParameter("null",                                   ""));
+       cases.push_back(CaseParameter("none",                                   "None"));
+       cases.push_back(CaseParameter("volatile",                               "Volatile"));
+       cases.push_back(CaseParameter("aligned",                                "Aligned 4"));
+       cases.push_back(CaseParameter("nontemporal",                    "Nontemporal"));
+       cases.push_back(CaseParameter("aligned_nontemporal",    "Aligned|Nontemporal 4"));
+       cases.push_back(CaseParameter("aligned_volatile",               "Volatile|Aligned 4"));
+
+       fillRandomScalars(rnd, -100.f, 100.f, &inputFloats[0], numElements);
+
+       for (size_t ndx = 0; ndx < numElements; ++ndx)
+               outputFloats[ndx] = inputFloats[ndx] + inputFloats[ndx];
+
+       for (size_t caseNdx = 0; caseNdx < cases.size(); ++caseNdx)
+       {
+               map<string, string>             specializations;
+               ComputeShaderSpec               spec;
+
+               specializations["ACCESS"] = cases[caseNdx].param;
+               spec.assembly = shaderTemplate.specialize(specializations);
+               spec.inputs.push_back(BufferSp(new Float32Buffer(inputFloats)));
+               spec.outputs.push_back(BufferSp(new Float32Buffer(outputFloats)));
+               spec.numWorkGroups = IVec3(numElements, 1, 1);
+               spec.entryPoint = "main";
  
                 group->addChild(new SpvAsmComputeShaderCase(testCtx, cases[caseNdx].name, cases[caseNdx].name, spec));
         }
@@ -1669,6 +2484,7 @@ tcu::TestCaseGroup* createOpUndefGroup (tcu::TestContext& testCtx)
         spec.inputs.push_back(BufferSp(new Float32Buffer(positiveFloats)));
         spec.outputs.push_back(BufferSp(new Float32Buffer(negativeFloats)));
                 spec.numWorkGroups = IVec3(numElements, 1, 1);
+               spec.entryPoint = "main";
  
                 group->addChild(new SpvAsmComputeShaderCase(testCtx, cases[caseNdx].name, cases[caseNdx].name, spec));
         }
@@ -3012,6 +3828,7 @@ tcu::TestCaseGroup* createInstructionTests (tcu::TestContext& testCtx)
         instructionTests->addChild(createOpConstantNullGroup(testCtx));
         instructionTests->addChild(createOpConstantCompositeGroup(testCtx));
         instructionTests->addChild(createOpConstantUsageGroup(testCtx));
+       instructionTests->addChild(createSpecConstantGroup(testCtx));
         instructionTests->addChild(createOpSourceGroup(testCtx));
         instructionTests->addChild(createOpSourceExtensionGroup(testCtx));
         instructionTests->addChild(createDecorationGroupGroup(testCtx));
@@ -3020,6 +3837,11 @@ tcu::TestCaseGroup* createInstructionTests (tcu::TestContext& testCtx)
         instructionTests->addChild(createFunctionControlGroup(testCtx));
         instructionTests->addChild(createSelectionControlGroup(testCtx));
         instructionTests->addChild(createBlockOrderGroup(testCtx));
+       instructionTests->addChild(createMultipleShaderGroup(testCtx));
+       instructionTests->addChild(createMemoryAccessGroup(testCtx));
+       instructionTests->addChild(createOpCopyMemoryGroup(testCtx));
+       instructionTests->addChild(createOpCopyObjectGroup(testCtx));
+       instructionTests->addChild(createNoContractionGroup(testCtx));
         instructionTests->addChild(createOpUndefGroup(testCtx));
         instructionTests->addChild(createOpUnreachableGroup(testCtx));
author	Lei Zhang <antiagainst@google.com>
	Fri, 20 Nov 2015 15:44:30 +0000 (10:44 -0500)
committer	Lei Zhang <antiagainst@google.com>
	Tue, 15 Dec 2015 16:46:27 +0000 (11:46 -0500)
external/vulkancts/modules/vulkan/spirv_assembly/vktSpvAsmComputeShaderCase.cpp		patch \| blob \| history
external/vulkancts/modules/vulkan/spirv_assembly/vktSpvAsmComputeShaderTestUtil.hpp		patch \| blob \| history
external/vulkancts/modules/vulkan/spirv_assembly/vktSpvAsmInstructionTests.cpp		patch \| blob \| history