Merge vk-gl-cts/vulkan-cts-1.2.8 into vk-gl-cts/vulkan-cts-1.3.0
[platform/upstream/VK-GL-CTS.git] / external / vulkancts / modules / vulkan / fragment_shading_rate / vktFragmentShadingRateBasic.cpp
1 /*------------------------------------------------------------------------
2  * Vulkan Conformance Tests
3  * ------------------------
4  *
5  * Copyright (c) 2017-2019 The Khronos Group Inc.
6  * Copyright (c) 2018-2020 NVIDIA Corporation
7  *
8  * Licensed under the Apache License, Version 2.0 (the "License");
9  * you may not use this file except in compliance with the License.
10  * You may obtain a copy of the License at
11  *
12  *        http://www.apache.org/licenses/LICENSE-2.0
13  *
14  * Unless required by applicable law or agreed to in writing, software
15  * distributed under the License is distributed on an "AS IS" BASIS,
16  * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
17  * See the License for the specific language governing permissions and
18  * limitations under the License.
19  *
20  *//*!
21  * \file
22  * \brief Tests for VK_KHR_fragment_shading_rate
23  * The test renders 9*9 triangles, where each triangle has one of the valid
24  * fragment sizes ({1,2,4},{1,2,4}) (clamped to implementation limits) for
25  * each of the pipeline shading rate and the primitive shading rate. The
26  * fragment shader does an atomic add to a memory location to get a unique
27  * identifier for the fragment, and outputs the primitive ID, atomic counter,
28  * fragment size, and some other info to the color output. Then a compute
29  * shader copies this to buffer memory, and the host verifies several
30  * properties of the output. For example, if a sample has a particular
31  * primitive ID and atomic value, then all other samples in the tile with
32  * the same primitive ID should have the same atomic value.
33  *//*--------------------------------------------------------------------*/
34
35 #include "vktFragmentShadingRateBasic.hpp"
36
37 #include "vkBufferWithMemory.hpp"
38 #include "vkImageWithMemory.hpp"
39 #include "vkQueryUtil.hpp"
40 #include "vkBuilderUtil.hpp"
41 #include "vkCmdUtil.hpp"
42 #include "vkTypeUtil.hpp"
43 #include "vkObjUtil.hpp"
44 #include "vkImageUtil.hpp"
45
46 #include "vktTestGroupUtil.hpp"
47 #include "vktTestCase.hpp"
48
49 #include "deDefs.h"
50 #include "deMath.h"
51 #include "deRandom.h"
52 #include "deSharedPtr.hpp"
53 #include "deString.h"
54
55 #include "tcuTestCase.hpp"
56 #include "tcuTestLog.hpp"
57
58 #include <string>
59 #include <sstream>
60
61 namespace vkt
62 {
63 namespace FragmentShadingRate
64 {
65 namespace
66 {
67 using namespace vk;
68 using namespace std;
69
// Number of triangles used by the test (a 9 x 9 set, see the file header).
#define NUM_TRIANGLES (9 * 9)
71
// Selects how a test case treats the shading rate attachment. Only
// WITH_ATTACHMENT counts as "attachment in use" (see CaseDef::useAttachment()).
// NOTE(review): the difference between the two NO_ATTACHMENT variants is
// decided by code outside this part of the file - confirm there.
enum class AttachmentUsage
{
	NO_ATTACHMENT		= 0,
	NO_ATTACHMENT_PTR	= 1,
	WITH_ATTACHMENT		= 2,
};
78
79 struct CaseDef
80 {
81         deInt32 seed;
82         VkExtent2D framebufferDim;
83         VkSampleCountFlagBits samples;
84         VkFragmentShadingRateCombinerOpKHR combinerOp[2];
85         AttachmentUsage attachmentUsage;
86         bool shaderWritesRate;
87         bool geometryShader;
88         bool useDynamicState;
89         bool useDynamicRendering;
90         bool useApiSampleMask;
91         bool useSampleMaskIn;
92         bool conservativeEnable;
93         VkConservativeRasterizationModeEXT conservativeMode;
94         bool useDepthStencil; // == fragDepth || fragStencil
95         bool fragDepth;
96         bool fragStencil;
97         bool multiViewport;
98         bool colorLayered;
99         bool srLayered; // colorLayered must also be true
100         deUint32 numColorLayers;
101         bool multiView;
102         bool interlock;
103         bool sampleLocations;
104         bool sampleShadingEnable;
105         bool sampleShadingInput;
106         bool sampleMaskTest;
107
108         bool useAttachment () const
109         {
110                 return (attachmentUsage == AttachmentUsage::WITH_ATTACHMENT);
111         }
112 };
113
114 class FSRTestInstance : public TestInstance
115 {
116 public:
117                                                 FSRTestInstance         (Context& context, const CaseDef& data);
118                                                 ~FSRTestInstance        (void);
119         tcu::TestStatus         iterate                         (void);
120
121 private:
122         // Test parameters
123         CaseDef                         m_data;
124
125         // Cache simulated combiner operations, to avoid recomputing per-sample
126         deInt32                         m_simulateValueCount;
127         vector<deInt32>         m_simulateCache;
128         // Cache mapping of primitive ID to pipeline/primitive shading rate
129         vector<deInt32>         m_primIDToPrimitiveShadingRate;
130         vector<deInt32>         m_primIDToPipelineShadingRate;
131         deUint32                        m_supportedFragmentShadingRateCount;
132         vector<VkPhysicalDeviceFragmentShadingRateKHR>  m_supportedFragmentShadingRates;
133         VkPhysicalDeviceFragmentShadingRatePropertiesKHR        m_shadingRateProperties;
134
135         deInt32                         PrimIDToPrimitiveShadingRate    (deInt32 primID);
136         deInt32                         PrimIDToPipelineShadingRate             (deInt32 primID);
137         VkExtent2D                      SanitizeExtent          (VkExtent2D ext) const;
138         deInt32                         SanitizeRate            (deInt32 rate) const;
139         deInt32                         ShadingRateExtentToClampedMask  (VkExtent2D ext, bool allowSwap) const;
140         deInt32                         ShadingRateExtentToEnum (VkExtent2D ext) const;
141         VkExtent2D                      ShadingRateEnumToExtent (deInt32 rate) const;
142         deInt32                         Simulate                        (deInt32 rate0, deInt32 rate1, deInt32 rate2);
143         VkExtent2D                      Combine                         (VkExtent2D ext0, VkExtent2D ext1, VkFragmentShadingRateCombinerOpKHR comb) const;
144         bool                            Force1x1                        () const;
145 };
146
147 FSRTestInstance::FSRTestInstance (Context& context, const CaseDef& data)
148         : vkt::TestInstance             (context)
149         , m_data                                (data)
150         , m_simulateValueCount  (((4 * 4) | 4) + 1)
151         , m_simulateCache               (m_simulateValueCount*m_simulateValueCount*m_simulateValueCount, ~0)
152         , m_primIDToPrimitiveShadingRate(NUM_TRIANGLES, ~0)
153         , m_primIDToPipelineShadingRate(NUM_TRIANGLES, ~0)
154 {
155         m_supportedFragmentShadingRateCount = 0;
156         m_context.getInstanceInterface().getPhysicalDeviceFragmentShadingRatesKHR(m_context.getPhysicalDevice(), &m_supportedFragmentShadingRateCount, DE_NULL);
157
158         if (m_supportedFragmentShadingRateCount < 3)
159                 TCU_THROW(TestError, "*pFragmentShadingRateCount too small");
160
161         m_supportedFragmentShadingRates.resize(m_supportedFragmentShadingRateCount);
162         for (deUint32 i = 0; i < m_supportedFragmentShadingRateCount; ++i)
163         {
164                 m_supportedFragmentShadingRates[i].sType = VK_STRUCTURE_TYPE_PHYSICAL_DEVICE_FRAGMENT_SHADING_RATE_KHR;
165                 m_supportedFragmentShadingRates[i].pNext = nullptr;
166         }
167         m_context.getInstanceInterface().getPhysicalDeviceFragmentShadingRatesKHR(m_context.getPhysicalDevice(), &m_supportedFragmentShadingRateCount, &m_supportedFragmentShadingRates[0]);
168
169         m_shadingRateProperties = m_context.getFragmentShadingRateProperties();
170 }
171
172 FSRTestInstance::~FSRTestInstance (void)
173 {
174 }
175
176 class FSRTestCase : public TestCase
177 {
178         public:
179                                                                 FSRTestCase             (tcu::TestContext& context, const char* name, const char* desc, const CaseDef data);
180                                                                 ~FSRTestCase    (void);
181         virtual void                            initPrograms    (SourceCollections& programCollection) const;
182         virtual TestInstance*           createInstance  (Context& context) const;
183         virtual void                            checkSupport    (Context& context) const;
184
185 private:
186         CaseDef                                         m_data;
187 };
188
189 FSRTestCase::FSRTestCase (tcu::TestContext& context, const char* name, const char* desc, const CaseDef data)
190         : vkt::TestCase (context, name, desc)
191         , m_data                (data)
192 {
193 }
194
195 FSRTestCase::~FSRTestCase       (void)
196 {
197 }
198
199 bool FSRTestInstance::Force1x1() const
200 {
201         if (m_data.useApiSampleMask && !m_context.getFragmentShadingRateProperties().fragmentShadingRateWithSampleMask)
202                 return true;
203
204         if (m_data.useSampleMaskIn && !m_context.getFragmentShadingRateProperties().fragmentShadingRateWithShaderSampleMask)
205                 return true;
206
207         if (m_data.conservativeEnable && !m_context.getFragmentShadingRateProperties().fragmentShadingRateWithConservativeRasterization)
208                 return true;
209
210         if (m_data.useDepthStencil && !m_context.getFragmentShadingRateProperties().fragmentShadingRateWithShaderDepthStencilWrites)
211                 return true;
212
213         if (m_data.interlock && !m_context.getFragmentShadingRateProperties().fragmentShadingRateWithFragmentShaderInterlock)
214                 return true;
215
216         if (m_data.sampleLocations && !m_context.getFragmentShadingRateProperties().fragmentShadingRateWithCustomSampleLocations)
217                 return true;
218
219         if (m_data.sampleShadingEnable || m_data.sampleShadingInput)
220                 return true;
221
222         return false;
223 }
224
225 static VkImageUsageFlags cbUsage = VK_IMAGE_USAGE_COLOR_ATTACHMENT_BIT |
226                                                                    VK_IMAGE_USAGE_SAMPLED_BIT |
227                                                                    VK_IMAGE_USAGE_TRANSFER_DST_BIT |
228                                                                    VK_IMAGE_USAGE_TRANSFER_SRC_BIT;
229
230 void FSRTestCase::checkSupport(Context& context) const
231 {
232         context.requireDeviceFunctionality("VK_KHR_fragment_shading_rate");
233
234         if (m_data.useDynamicRendering)
235                 context.requireDeviceFunctionality("VK_KHR_dynamic_rendering");
236
237         if (!context.getFragmentShadingRateFeatures().pipelineFragmentShadingRate)
238                 TCU_THROW(NotSupportedError, "pipelineFragmentShadingRate not supported");
239
240         if (m_data.shaderWritesRate &&
241                 !context.getFragmentShadingRateFeatures().primitiveFragmentShadingRate)
242                 TCU_THROW(NotSupportedError, "primitiveFragmentShadingRate not supported");
243
244         if (!context.getFragmentShadingRateFeatures().primitiveFragmentShadingRate &&
245                 m_data.combinerOp[0] != VK_FRAGMENT_SHADING_RATE_COMBINER_OP_KEEP_KHR)
246                 TCU_THROW(NotSupportedError, "primitiveFragmentShadingRate not supported");
247
248         if (!context.getFragmentShadingRateFeatures().attachmentFragmentShadingRate &&
249                 m_data.combinerOp[1] != VK_FRAGMENT_SHADING_RATE_COMBINER_OP_KEEP_KHR)
250                 TCU_THROW(NotSupportedError, "attachmentFragmentShadingRate not supported");
251
252         VkImageFormatProperties imageProperties;
253         VkResult result = context.getInstanceInterface().getPhysicalDeviceImageFormatProperties(context.getPhysicalDevice(), VK_FORMAT_R32G32B32A32_UINT, VK_IMAGE_TYPE_2D,
254                                                                                                                                                                                         VK_IMAGE_TILING_OPTIMAL, cbUsage, 0, &imageProperties);
255
256         if (result == VK_ERROR_FORMAT_NOT_SUPPORTED)
257                 TCU_THROW(NotSupportedError, "VK_FORMAT_R32G32B32A32_UINT not supported");
258
259         if (!(imageProperties.sampleCounts & m_data.samples))
260                 TCU_THROW(NotSupportedError, "color buffer sample count not supported");
261
262         if (m_data.numColorLayers > imageProperties.maxArrayLayers)
263                 TCU_THROW(NotSupportedError, "color buffer layers not supported");
264
265         if (m_data.useAttachment() && !context.getFragmentShadingRateFeatures().attachmentFragmentShadingRate)
266                 TCU_THROW(NotSupportedError, "attachmentFragmentShadingRate not supported");
267
268         if (!context.getFragmentShadingRateProperties().fragmentShadingRateNonTrivialCombinerOps &&
269                 ((m_data.combinerOp[0] != VK_FRAGMENT_SHADING_RATE_COMBINER_OP_KEEP_KHR && m_data.combinerOp[0] != VK_FRAGMENT_SHADING_RATE_COMBINER_OP_REPLACE_KHR) ||
270                  (m_data.combinerOp[1] != VK_FRAGMENT_SHADING_RATE_COMBINER_OP_KEEP_KHR && m_data.combinerOp[1] != VK_FRAGMENT_SHADING_RATE_COMBINER_OP_REPLACE_KHR)))
271                 TCU_THROW(NotSupportedError, "fragmentShadingRateNonTrivialCombinerOps not supported");
272
273         if (m_data.conservativeEnable)
274         {
275                 context.requireDeviceFunctionality("VK_EXT_conservative_rasterization");
276                 if (m_data.conservativeMode == VK_CONSERVATIVE_RASTERIZATION_MODE_UNDERESTIMATE_EXT &&
277                         !context.getConservativeRasterizationPropertiesEXT().primitiveUnderestimation)
278                         TCU_THROW(NotSupportedError, "primitiveUnderestimation not supported");
279         }
280
281         if (m_data.fragStencil)
282                 context.requireDeviceFunctionality("VK_EXT_shader_stencil_export");
283
284         if (m_data.multiViewport &&
285                 !context.getFragmentShadingRateProperties().primitiveFragmentShadingRateWithMultipleViewports)
286                 TCU_THROW(NotSupportedError, "primitiveFragmentShadingRateWithMultipleViewports not supported");
287
288         if (m_data.srLayered &&
289                 !context.getFragmentShadingRateProperties().layeredShadingRateAttachments)
290                 TCU_THROW(NotSupportedError, "layeredShadingRateAttachments not supported");
291
292         if ((m_data.multiViewport || m_data.colorLayered) &&
293                 !m_data.geometryShader)
294                 context.requireDeviceFunctionality("VK_EXT_shader_viewport_index_layer");
295
296         if (m_data.multiView && m_data.geometryShader &&
297                 !context.getMultiviewFeatures().multiviewGeometryShader)
298                 TCU_THROW(NotSupportedError, "multiviewGeometryShader not supported");
299
300         if (m_data.interlock &&
301                 !context.getFragmentShaderInterlockFeaturesEXT().fragmentShaderPixelInterlock)
302                 TCU_THROW(NotSupportedError, "fragmentShaderPixelInterlock not supported");
303
304         if (m_data.sampleLocations)
305         {
306                 context.requireDeviceFunctionality("VK_EXT_sample_locations");
307                 if (!(m_data.samples & context.getSampleLocationsPropertiesEXT().sampleLocationSampleCounts))
308                         TCU_THROW(NotSupportedError, "samples not supported in sampleLocationSampleCounts");
309         }
310
311         if (m_data.sampleMaskTest && !context.getFragmentShadingRateProperties().fragmentShadingRateWithSampleMask)
312                 TCU_THROW(NotSupportedError, "fragmentShadingRateWithSampleMask not supported");
313 }
314
// Error codes written by the fragment shader into the W component of its
// color output (see initPrograms()).
enum
{
	ERROR_NONE						= 0,
	ERROR_FRAGCOORD_CENTER			= 1,
	ERROR_VTG_READBACK				= 2,
	ERROR_FRAGCOORD_DERIV			= 3,
	ERROR_FRAGCOORD_IMPLICIT_DERIV	= 4,
};
324
325 void FSRTestCase::initPrograms (SourceCollections& programCollection) const
326 {
327         std::stringstream vss;
328
329         vss <<
330                 "#version 450 core\n"
331                 "#extension GL_EXT_fragment_shading_rate : enable\n"
332                 "#extension GL_ARB_shader_viewport_layer_array : enable\n"
333                 "layout(push_constant) uniform PC {\n"
334                 "       int shadingRate;\n"
335                 "} pc;\n"
336                 "layout(location = 0) in vec2 pos;\n"
337                 "layout(location = 0) out int instanceIndex;\n"
338                 "layout(location = 1) out int readbackok;\n"
339                 "layout(location = 2) out float zero;\n"
340                 "out gl_PerVertex\n"
341                 "{\n"
342                 "   vec4 gl_Position;\n"
343                 "};\n"
344                 "void main()\n"
345                 "{\n"
346                 "  gl_Position = vec4(pos, 0, 1);\n"
347                 "  instanceIndex = gl_InstanceIndex;\n"
348                 "  readbackok = 1;\n"
349                 "  zero = 0;\n";
350
351         if (m_data.shaderWritesRate)
352         {
353                 vss << "  gl_PrimitiveShadingRateEXT = pc.shadingRate;\n";
354
355                 // Verify that we can read from the output variable
356                 vss << "  if (gl_PrimitiveShadingRateEXT != pc.shadingRate) readbackok = 0;\n";
357
358                 if (!m_data.geometryShader)
359                 {
360                         if (m_data.multiViewport)
361                                 vss << "  gl_ViewportIndex = instanceIndex & 1;\n";
362                         if (m_data.colorLayered)
363                                 vss << "  gl_Layer = (instanceIndex & 2) >> 1;\n";
364                 }
365         }
366
367         vss << "}\n";
368
369         programCollection.glslSources.add("vert") << glu::VertexSource(vss.str());
370
371         if (m_data.geometryShader)
372         {
373                 std::string writeShadingRate = "";
374                 if (m_data.shaderWritesRate)
375                 {
376                         writeShadingRate =
377                                 "  gl_PrimitiveShadingRateEXT = pc.shadingRate;\n"
378                                 "  if (gl_PrimitiveShadingRateEXT != pc.shadingRate) readbackok = 0;\n";
379
380                         if (m_data.multiViewport)
381                                 writeShadingRate += "  gl_ViewportIndex = inInstanceIndex[0] & 1;\n";
382
383                         if (m_data.colorLayered)
384                                 writeShadingRate += "  gl_Layer = (inInstanceIndex[0] & 2) >> 1;\n";
385                 }
386
387                 std::stringstream gss;
388                 gss <<
389                         "#version 450 core\n"
390                         "#extension GL_EXT_fragment_shading_rate : enable\n"
391                         "\n"
392                         "layout(push_constant) uniform PC {\n"
393                         "       int shadingRate;\n"
394                         "} pc;\n"
395                         "\n"
396                         "in gl_PerVertex\n"
397                         "{\n"
398                         "   vec4 gl_Position;\n"
399                         "} gl_in[3];\n"
400                         "\n"
401                         "layout(location = 0) in int inInstanceIndex[];\n"
402                         "layout(location = 0) out int outInstanceIndex;\n"
403                         "layout(location = 1) out int readbackok;\n"
404                         "layout(location = 2) out float zero;\n"
405                         "layout(triangles) in;\n"
406                         "layout(triangle_strip, max_vertices=3) out;\n"
407                         "\n"
408                         "out gl_PerVertex {\n"
409                         "   vec4 gl_Position;\n"
410                         "};\n"
411                         "\n"
412                         "void main(void)\n"
413                         "{\n"
414                         "   gl_Position = gl_in[0].gl_Position;\n"
415                         "   outInstanceIndex = inInstanceIndex[0];\n"
416                         "   readbackok  = 1;\n"
417                         "   zero = 0;\n"
418                         << writeShadingRate <<
419                         "   EmitVertex();"
420                         "\n"
421                         "   gl_Position = gl_in[1].gl_Position;\n"
422                         "   outInstanceIndex = inInstanceIndex[1];\n"
423                         "   readbackok = 1;\n"
424                         "   zero = 0;\n"
425                         << writeShadingRate <<
426                         "   EmitVertex();"
427                         "\n"
428                         "   gl_Position = gl_in[2].gl_Position;\n"
429                         "   outInstanceIndex = inInstanceIndex[2];\n"
430                         "   readbackok = 1;\n"
431                         "   zero = 0;\n"
432                         << writeShadingRate <<
433                         "   EmitVertex();"
434                         "}\n";
435
436                 programCollection.glslSources.add("geom") << glu::GeometrySource(gss.str());
437         }
438
439         std::stringstream fss;
440
441         fss <<
442                 "#version 450 core\n"
443                 "#extension GL_EXT_fragment_shading_rate : enable\n"
444                 "#extension GL_ARB_shader_stencil_export : enable\n"
445                 "#extension GL_ARB_fragment_shader_interlock : enable\n"
446                 "layout(location = 0) out uvec4 col0;\n"
447                 "layout(set = 0, binding = 0) buffer Block { uint counter; } buf;\n"
448                 "layout(set = 0, binding = 3) uniform usampler2D tex;\n"
449                 "layout(location = 0) flat in int instanceIndex;\n"
450                 "layout(location = 1) flat in int readbackok;\n"
451                 "layout(location = 2) " << (m_data.sampleShadingInput ? "sample " : "") << "in float zero;\n";
452
453         if (m_data.interlock)
454                 fss << "layout(pixel_interlock_ordered) in;\n";
455
456         fss <<
457                 "void main()\n"
458                 "{\n";
459
460         if (m_data.interlock)
461                 fss << "  beginInvocationInterlockARB();\n";
462
463         fss <<
464                 // X component gets shading rate enum
465                 "  col0.x = gl_ShadingRateEXT;\n"
466                 "  col0.y = 0;\n"
467                 // Z component gets packed primitiveID | atomic value
468                 "  col0.z = (instanceIndex << 24) | ((atomicAdd(buf.counter, 1) + 1) & 0x00FFFFFFu);\n"
469                 "  ivec2 fragCoordXY = ivec2(gl_FragCoord.xy);\n"
470                 "  ivec2 fragSize = ivec2(1<<((gl_ShadingRateEXT/4)&3), 1<<(gl_ShadingRateEXT&3));\n"
471                 // W component gets error code
472                 "  col0.w = uint(zero)" << (m_data.sampleShadingInput ? " * gl_SampleID" : "") << ";\n"
473                 "  if (((fragCoordXY - fragSize / 2) % fragSize) != ivec2(0,0))\n"
474                 "    col0.w = " << ERROR_FRAGCOORD_CENTER << ";\n";
475
476         if (m_data.shaderWritesRate)
477         {
478                 fss <<
479                         "  if (readbackok != 1)\n"
480                         "    col0.w = " << ERROR_VTG_READBACK << ";\n";
481         }
482
483         // When sample shading, gl_FragCoord is more likely to give bad derivatives,
484         // e.g. due to a partially covered quad having some pixels center sample and
485         // some sample at a sample location.
486         if (!m_data.sampleShadingEnable && !m_data.sampleShadingInput)
487         {
488                 fss << "  if (dFdx(gl_FragCoord.xy) != ivec2(fragSize.x, 0) || dFdy(gl_FragCoord.xy) != ivec2(0, fragSize.y))\n"
489                            "    col0.w = (fragSize.y << 26) | (fragSize.x << 20) | (int(dFdx(gl_FragCoord.xy)) << 14) | (int(dFdx(gl_FragCoord.xy)) << 8) | " << ERROR_FRAGCOORD_DERIV << ";\n";
490
491                 fss << "  uint implicitDerivX = texture(tex, vec2(gl_FragCoord.x / textureSize(tex, 0).x, 0)).x;\n"
492                            "  uint implicitDerivY = texture(tex, vec2(0, gl_FragCoord.y / textureSize(tex, 0).y)).x;\n"
493                            "  if (implicitDerivX != fragSize.x || implicitDerivY != fragSize.y)\n"
494                            "    col0.w = (fragSize.y << 26) | (fragSize.x << 20) | (implicitDerivY << 14) | (implicitDerivX << 8) | " << ERROR_FRAGCOORD_IMPLICIT_DERIV << ";\n";
495         }
496         // Y component gets sample mask value
497         if (m_data.useSampleMaskIn)
498                 fss << "  col0.y = gl_SampleMaskIn[0];\n";
499
500         if (m_data.fragDepth)
501                 fss << "  gl_FragDepth = float(instanceIndex) / float(" << NUM_TRIANGLES << ");\n";
502
503         if (m_data.fragStencil)
504                 fss << "  gl_FragStencilRefARB = instanceIndex;\n";
505
506         if (m_data.interlock)
507                 fss << "  endInvocationInterlockARB();\n";
508
509         fss <<
510                 "}\n";
511
512         programCollection.glslSources.add("frag") << glu::FragmentSource(fss.str());
513
514         std::stringstream css;
515
516         std::string fsampType = m_data.samples > 1 ?  "texture2DMSArray" :  "texture2DArray";
517         std::string usampType = m_data.samples > 1 ? "utexture2DMSArray" : "utexture2DArray";
518
519         // Compute shader copies color/depth/stencil to linear layout in buffer memory
520         css <<
521                 "#version 450 core\n"
522                 "#extension GL_EXT_samplerless_texture_functions : enable\n"
523                 "layout(set = 0, binding = 1) uniform " << usampType << " colorTex;\n"
524                 "layout(set = 0, binding = 2, std430) buffer Block0 { uvec4 b[]; } colorbuf;\n"
525                 "layout(set = 0, binding = 4, std430) buffer Block1 { float b[]; } depthbuf;\n"
526                 "layout(set = 0, binding = 5, std430) buffer Block2 { uint b[]; } stencilbuf;\n"
527                 "layout(set = 0, binding = 6) uniform " << fsampType << " depthTex;\n"
528                 "layout(set = 0, binding = 7) uniform " << usampType << " stencilTex;\n"
529                 "layout(local_size_x = 1, local_size_y = 1, local_size_z = 1) in;\n"
530                 "void main()\n"
531                 "{\n"
532                 "   for (int i = 0; i < " << m_data.samples << "; ++i) {\n"
533                 "      uint idx = ((gl_GlobalInvocationID.z * " << m_data.framebufferDim.height << " + gl_GlobalInvocationID.y) * " << m_data.framebufferDim.width << " + gl_GlobalInvocationID.x) * " << m_data.samples << " + i;\n"
534                 "      colorbuf.b[idx] = texelFetch(colorTex, ivec3(gl_GlobalInvocationID.xyz), i);\n";
535
536         if (m_data.fragDepth)
537                 css << "      depthbuf.b[idx] = texelFetch(depthTex, ivec3(gl_GlobalInvocationID.xyz), i).x;\n";
538
539         if (m_data.fragStencil)
540                 css << "      stencilbuf.b[idx] = texelFetch(stencilTex, ivec3(gl_GlobalInvocationID.xyz), i).x;\n";
541
542         css <<
543                 "   }\n"
544                 "}\n";
545
546         programCollection.glslSources.add("comp") << glu::ComputeSource(css.str());
547 }
548
549 TestInstance* FSRTestCase::createInstance (Context& context) const
550 {
551         return new FSRTestInstance(context, m_data);
552 }
553
554 deInt32 FSRTestInstance::ShadingRateExtentToEnum(VkExtent2D ext) const
555 {
556         ext.width = deCtz32(ext.width);
557         ext.height = deCtz32(ext.height);
558
559         return (ext.width << 2) | ext.height;
560 }
561
562 VkExtent2D FSRTestInstance::ShadingRateEnumToExtent(deInt32 rate) const
563 {
564         VkExtent2D ret;
565         ret.width = 1 << ((rate/4) & 3);
566         ret.height = 1 << (rate & 3);
567
568         return ret;
569 }
570
571 VkExtent2D FSRTestInstance::Combine(VkExtent2D ext0, VkExtent2D ext1, VkFragmentShadingRateCombinerOpKHR comb) const
572 {
573         VkExtent2D ret;
574         switch (comb)
575         {
576         default:
577                 DE_ASSERT(0);
578                 // fallthrough
579         case VK_FRAGMENT_SHADING_RATE_COMBINER_OP_KEEP_KHR:
580                 return ext0;
581         case VK_FRAGMENT_SHADING_RATE_COMBINER_OP_REPLACE_KHR:
582                 return ext1;
583         case VK_FRAGMENT_SHADING_RATE_COMBINER_OP_MIN_KHR:
584                 ret = { de::min(ext0.width, ext1.width), de::min(ext0.height, ext1.height) };
585                 return ret;
586         case VK_FRAGMENT_SHADING_RATE_COMBINER_OP_MAX_KHR:
587                 ret = { de::max(ext0.width, ext1.width), de::max(ext0.height, ext1.height) };
588                 return ret;
589         case VK_FRAGMENT_SHADING_RATE_COMBINER_OP_MUL_KHR:
590                 ret = { ext0.width * ext1.width, ext0.height * ext1.height };
591                 if (!m_shadingRateProperties.fragmentShadingRateStrictMultiplyCombiner)
592                 {
593                         if (ext0.width == 1 && ext1.width == 1)
594                                 ret.width = 2;
595                         if (ext0.height == 1 && ext1.height == 1)
596                                 ret.height = 2;
597                 }
598                 return ret;
599         }
600 }
601
602 deInt32 FSRTestInstance::Simulate(deInt32 rate0, deInt32 rate1, deInt32 rate2)
603 {
604         deInt32 &cachedRate = m_simulateCache[(rate2*m_simulateValueCount + rate1)*m_simulateValueCount + rate0];
605         if (cachedRate != ~0)
606                 return cachedRate;
607
608         VkExtent2D extent0 = ShadingRateEnumToExtent(rate0);
609         VkExtent2D extent1 = ShadingRateEnumToExtent(rate1);
610         VkExtent2D extent2 = ShadingRateEnumToExtent(rate2);
611
612         deInt32 finalMask = 0;
613         // Simulate once for implementations that don't allow swapping rate xy,
614         // and once for those that do. Any of those results is allowed.
615         for (deUint32 allowSwap = 0; allowSwap <= 1; ++allowSwap)
616         {
617                 // Combine rate 0 and 1, get a mask of possible clamped rates
618                 VkExtent2D intermed = Combine(extent0, extent1, m_data.combinerOp[0]);
619                 deInt32 intermedMask = ShadingRateExtentToClampedMask(intermed, allowSwap == 1);
620
621                 // For each clamped rate, combine that with rate 2 and accumulate the possible clamped rates
622                 for (int i = 0; i < 16; ++i)
623                 {
624                         if (intermedMask & (1<<i))
625                         {
626                                 VkExtent2D final = Combine(ShadingRateEnumToExtent(i), extent2, m_data.combinerOp[1]);
627                                 finalMask |= ShadingRateExtentToClampedMask(final, allowSwap == 1);
628                         }
629                 }
630                 {
631                         // unclamped intermediate value is also permitted
632                         VkExtent2D final = Combine(intermed, extent2, m_data.combinerOp[1]);
633                         finalMask |= ShadingRateExtentToClampedMask(final, allowSwap == 1);
634                 }
635         }
636
637         if (Force1x1())
638                 finalMask = 0x1;
639
640         cachedRate = finalMask;
641         return finalMask;
642 }
643
644 // If a rate is not valid (<=4x4), clamp it to something valid.
645 // This is only used for "inputs" to the system, not to mimic
646 // how the implementation internally clamps intermediate values.
647 VkExtent2D FSRTestInstance::SanitizeExtent(VkExtent2D ext) const
648 {
649         DE_ASSERT(ext.width > 0 && ext.height > 0);
650
651         ext.width = de::min(ext.width, 4u);
652         ext.height = de::min(ext.height, 4u);
653
654         return ext;
655 }
656
657 // Map an extent to a mask of all modes smaller than or equal to it in either dimension
658 deInt32 FSRTestInstance::ShadingRateExtentToClampedMask(VkExtent2D ext, bool allowSwap) const
659 {
660         deUint32 desiredSize = ext.width * ext.height;
661
662         deInt32 mask = 0;
663
664         while (desiredSize > 0)
665         {
666                 // First, find modes that maximize the area
667                 for (deUint32 i = 0; i < m_supportedFragmentShadingRateCount; ++i)
668                 {
669                         const VkPhysicalDeviceFragmentShadingRateKHR &supportedRate = m_supportedFragmentShadingRates[i];
670                         if ((supportedRate.sampleCounts & m_data.samples) &&
671                                 supportedRate.fragmentSize.width * supportedRate.fragmentSize.height == desiredSize &&
672                                 ((supportedRate.fragmentSize.width  <= ext.width && supportedRate.fragmentSize.height <= ext.height) ||
673                                  (supportedRate.fragmentSize.height <= ext.width && supportedRate.fragmentSize.width  <= ext.height && allowSwap)))
674                         {
675                                 mask |= 1 << ShadingRateExtentToEnum(supportedRate.fragmentSize);
676                         }
677                 }
678                 if (mask)
679                 {
680                         // Amongst the modes that maximize the area, pick the ones that
681                         // minimize the aspect ratio. Prefer ratio of 1, then 2, then 4.
682                         // 1x1 = 0, 2x2 = 5, 4x4 = 10
683                         static const deUint32 aspectMaskRatio1 = 0x421;
684                         // 2x1 = 4, 1x2 = 1, 4x2 = 9, 2x4 = 6
685                         static const deUint32 aspectMaskRatio2 = 0x252;
686                         // 4x1 = 8, 1x4 = 2,
687                         static const deUint32 aspectMaskRatio4 = 0x104;
688
689                         if (mask & aspectMaskRatio1)
690                         {
691                                 mask &= aspectMaskRatio1;
692                                 break;
693                         }
694                         if (mask & aspectMaskRatio2)
695                         {
696                                 mask &= aspectMaskRatio2;
697                                 break;
698                         }
699                         if (mask & aspectMaskRatio4)
700                         {
701                                 mask &= aspectMaskRatio4;
702                                 break;
703                         }
704                         DE_ASSERT(0);
705                 }
706                 desiredSize /= 2;
707         }
708
709         return mask;
710 }
711
712
713 deInt32 FSRTestInstance::SanitizeRate(deInt32 rate) const
714 {
715         VkExtent2D extent = ShadingRateEnumToExtent(rate);
716
717         extent = SanitizeExtent(extent);
718
719         return ShadingRateExtentToEnum(extent);
720 }
721
722 // Map primID % 9 to primitive shading rate
723 deInt32 FSRTestInstance::PrimIDToPrimitiveShadingRate(deInt32 primID)
724 {
725         deInt32 &cachedRate = m_primIDToPrimitiveShadingRate[primID];
726         if (cachedRate != ~0)
727                 return cachedRate;
728
729         VkExtent2D extent;
730         extent.width = 1 << (primID % 3);
731         extent.height = 1 << ((primID/3) % 3);
732
733         cachedRate = ShadingRateExtentToEnum(extent);
734         return cachedRate;
735 }
736
737 // Map primID / 9 to pipeline shading rate
738 deInt32 FSRTestInstance::PrimIDToPipelineShadingRate(deInt32 primID)
739 {
740         deInt32 &cachedRate = m_primIDToPipelineShadingRate[primID];
741         if (cachedRate != ~0)
742                 return cachedRate;
743
744         primID /= 9;
745         VkExtent2D extent;
746         extent.width = 1 << (primID % 3);
747         extent.height = 1 << ((primID/3) % 3);
748
749         cachedRate = ShadingRateExtentToEnum(extent);
750         return cachedRate;
751 }
752
753 static de::MovePtr<BufferWithMemory> CreateCachedBuffer(const vk::DeviceInterface&              vk,
754                                                                                                                 const vk::VkDevice                              device,
755                                                                                                                 vk::Allocator&                                  allocator,
756                                                                                                                 const vk::VkBufferCreateInfo&   bufferCreateInfo)
757 {
758         try
759         {
760                 return de::MovePtr<BufferWithMemory>(new BufferWithMemory(
761                         vk, device, allocator, bufferCreateInfo, MemoryRequirement::HostVisible | MemoryRequirement::Cached));
762         }
763         catch (const tcu::NotSupportedError&)
764         {
765                 return de::MovePtr<BufferWithMemory>(new BufferWithMemory(
766                         vk, device, allocator, bufferCreateInfo, MemoryRequirement::HostVisible));
767         }
768 }
769
770 tcu::TestStatus FSRTestInstance::iterate (void)
771 {
772         const DeviceInterface&  vk                                              = m_context.getDeviceInterface();
773         const VkDevice                  device                                  = m_context.getDevice();
774         tcu::TestLog&                   log                                             = m_context.getTestContext().getLog();
775         Allocator&                              allocator                               = m_context.getDefaultAllocator();
776         VkFlags                                 allShaderStages                 = VK_SHADER_STAGE_VERTEX_BIT | VK_SHADER_STAGE_FRAGMENT_BIT | VK_SHADER_STAGE_COMPUTE_BIT;
777         VkFlags                                 allPipelineStages               = VK_PIPELINE_STAGE_VERTEX_SHADER_BIT |
778                                                                                                           VK_PIPELINE_STAGE_FRAGMENT_SHADER_BIT |
779                                                                                                           VK_PIPELINE_STAGE_COLOR_ATTACHMENT_OUTPUT_BIT |
780                                                                                                           VK_PIPELINE_STAGE_EARLY_FRAGMENT_TESTS_BIT |
781                                                                                                           VK_PIPELINE_STAGE_LATE_FRAGMENT_TESTS_BIT |
782                                                                                                           VK_PIPELINE_STAGE_COMPUTE_SHADER_BIT |
783                                                                                                           VK_PIPELINE_STAGE_SHADING_RATE_IMAGE_BIT_NV;
784         const VkFormat                  cbFormat                                = VK_FORMAT_R32G32B32A32_UINT;
785         const VkFormat                  dsFormat                                = VK_FORMAT_D32_SFLOAT_S8_UINT;
786
787         if (m_data.geometryShader)
788         {
789                 allShaderStages |= VK_SHADER_STAGE_GEOMETRY_BIT;
790                 allPipelineStages |= VK_PIPELINE_STAGE_GEOMETRY_SHADER_BIT;
791         }
792
793         deRandom rnd;
794         deRandom_init(&rnd, m_data.seed);
795
796         qpTestResult res = QP_TEST_RESULT_PASS;
797         deUint32 numUnexpected1x1Samples = 0;
798         deUint32 numTotalSamples = 0;
799
800         enum AttachmentModes
801         {
802                 ATTACHMENT_MODE_DEFAULT = 0,
803                 ATTACHMENT_MODE_LAYOUT_OPTIMAL,
804                 ATTACHMENT_MODE_IMAGELESS,
805                 ATTACHMENT_MODE_2DARRAY,
806                 ATTACHMENT_MODE_TILING_LINEAR,
807
808                 ATTACHMENT_MODE_COUNT,
809         };
810
811         deUint32 numSRLayers = m_data.srLayered ? 2u : 1u;
812
813         VkExtent2D minFragmentShadingRateAttachmentTexelSize = {1, 1};
814         VkExtent2D maxFragmentShadingRateAttachmentTexelSize = {1, 1};
815         deUint32 maxFragmentShadingRateAttachmentTexelSizeAspectRatio = 1;
816         if (m_context.getFragmentShadingRateFeatures().attachmentFragmentShadingRate)
817         {
818                 minFragmentShadingRateAttachmentTexelSize = m_context.getFragmentShadingRateProperties().minFragmentShadingRateAttachmentTexelSize;
819                 maxFragmentShadingRateAttachmentTexelSize = m_context.getFragmentShadingRateProperties().maxFragmentShadingRateAttachmentTexelSize;
820                 maxFragmentShadingRateAttachmentTexelSizeAspectRatio = m_context.getFragmentShadingRateProperties().maxFragmentShadingRateAttachmentTexelSizeAspectRatio;
821         }
822
823         VkDeviceSize atomicBufferSize = sizeof(deUint32);
824
825         de::MovePtr<BufferWithMemory> atomicBuffer;
826         atomicBuffer = de::MovePtr<BufferWithMemory>(new BufferWithMemory(
827                 vk, device, allocator, makeBufferCreateInfo(atomicBufferSize, VK_BUFFER_USAGE_TRANSFER_SRC_BIT | VK_BUFFER_USAGE_STORAGE_BUFFER_BIT), MemoryRequirement::HostVisible | MemoryRequirement::Coherent));
828
829         deUint32 *abuf = (deUint32 *)atomicBuffer->getAllocation().getHostPtr();
830
831         // NUM_TRIANGLES triangles, 3 vertices, 2 components of float position
832         VkDeviceSize vertexBufferSize = NUM_TRIANGLES * 3 * 2 * sizeof(float);
833
834         de::MovePtr<BufferWithMemory> vertexBuffer;
835         vertexBuffer = de::MovePtr<BufferWithMemory>(new BufferWithMemory(
836                 vk, device, allocator, makeBufferCreateInfo(vertexBufferSize, VK_BUFFER_USAGE_TRANSFER_SRC_BIT | VK_BUFFER_USAGE_VERTEX_BUFFER_BIT), MemoryRequirement::HostVisible | MemoryRequirement::Coherent));
837
838         float *vbuf = (float *)vertexBuffer->getAllocation().getHostPtr();
839         for (deInt32 i = 0; i < (deInt32)(vertexBufferSize / sizeof(float)); ++i)
840         {
841                 vbuf[i] = deRandom_getFloat(&rnd)*2.0f - 1.0f;
842         }
843         flushAlloc(vk, device, vertexBuffer->getAllocation());
844
845         VkDeviceSize colorOutputBufferSize = m_data.framebufferDim.width * m_data.framebufferDim.height * m_data.samples * 4 * sizeof(deUint32) * m_data.numColorLayers;
846         de::MovePtr<BufferWithMemory> colorOutputBuffer = CreateCachedBuffer(vk, device, allocator, makeBufferCreateInfo(colorOutputBufferSize, VK_BUFFER_USAGE_TRANSFER_DST_BIT | VK_BUFFER_USAGE_STORAGE_BUFFER_BIT));
847
848         VkDeviceSize depthOutputBufferSize = 0, stencilOutputBufferSize = 0;
849         de::MovePtr<BufferWithMemory> depthOutputBuffer, stencilOutputBuffer;
850         if (m_data.useDepthStencil)
851         {
852                 depthOutputBufferSize = m_data.framebufferDim.width * m_data.framebufferDim.height * m_data.samples * sizeof(float) * m_data.numColorLayers;
853                 depthOutputBuffer = CreateCachedBuffer(vk, device, allocator, makeBufferCreateInfo(depthOutputBufferSize, VK_BUFFER_USAGE_TRANSFER_DST_BIT | VK_BUFFER_USAGE_STORAGE_BUFFER_BIT));
854
855                 stencilOutputBufferSize = m_data.framebufferDim.width * m_data.framebufferDim.height * m_data.samples * sizeof(deUint32) * m_data.numColorLayers;
856                 stencilOutputBuffer = CreateCachedBuffer(vk, device, allocator, makeBufferCreateInfo(stencilOutputBufferSize, VK_BUFFER_USAGE_TRANSFER_DST_BIT | VK_BUFFER_USAGE_STORAGE_BUFFER_BIT));
857         }
858
859         deUint32 minSRTexelWidth = minFragmentShadingRateAttachmentTexelSize.width;
860         deUint32 minSRTexelHeight = minFragmentShadingRateAttachmentTexelSize.height;
861         deUint32 maxSRWidth = (m_data.framebufferDim.width + minSRTexelWidth - 1) / minSRTexelWidth;
862         deUint32 maxSRHeight = (m_data.framebufferDim.height + minSRTexelHeight - 1) / minSRTexelHeight;
863
864         // max size over all formats
865         VkDeviceSize srFillBufferSize = numSRLayers * maxSRWidth * maxSRHeight * 32/*4 component 64-bit*/;
866         de::MovePtr<BufferWithMemory> srFillBuffer;
867         deUint8 *fillPtr = DE_NULL;
868         if (m_data.useAttachment())
869         {
870                 srFillBuffer = CreateCachedBuffer(vk, device, allocator, makeBufferCreateInfo(srFillBufferSize, VK_BUFFER_USAGE_TRANSFER_SRC_BIT));
871                 fillPtr = (deUint8 *)srFillBuffer->getAllocation().getHostPtr();
872         }
873
874         de::MovePtr<ImageWithMemory> cbImage;
875         Move<VkImageView> cbImageView;
876         {
877                 const VkImageCreateInfo                 imageCreateInfo                 =
878                 {
879                         VK_STRUCTURE_TYPE_IMAGE_CREATE_INFO,    // VkStructureType                      sType;
880                         DE_NULL,                                                                // const void*                          pNext;
881                         (VkImageCreateFlags)0u,                                 // VkImageCreateFlags           flags;
882                         VK_IMAGE_TYPE_2D,                                               // VkImageType                          imageType;
883                         cbFormat,                                                               // VkFormat                                     format;
884                         {
885                                 m_data.framebufferDim.width,            // deUint32     width;
886                                 m_data.framebufferDim.height,           // deUint32     height;
887                                 1u                                                                      // deUint32     depth;
888                         },                                                                              // VkExtent3D                           extent;
889                         1u,                                                                             // deUint32                                     mipLevels;
890                         m_data.numColorLayers,                                  // deUint32                                     arrayLayers;
891                         m_data.samples,                                                 // VkSampleCountFlagBits        samples;
892                         VK_IMAGE_TILING_OPTIMAL,                                // VkImageTiling                        tiling;
893                         cbUsage,                                                                // VkImageUsageFlags            usage;
894                         VK_SHARING_MODE_EXCLUSIVE,                              // VkSharingMode                        sharingMode;
895                         0u,                                                                             // deUint32                                     queueFamilyIndexCount;
896                         DE_NULL,                                                                // const deUint32*                      pQueueFamilyIndices;
897                         VK_IMAGE_LAYOUT_UNDEFINED                               // VkImageLayout                        initialLayout;
898                 };
899                 cbImage = de::MovePtr<ImageWithMemory>(new ImageWithMemory(
900                         vk, device, allocator, imageCreateInfo, MemoryRequirement::Any));
901
902                 VkImageViewCreateInfo           imageViewCreateInfo             =
903                 {
904                         VK_STRUCTURE_TYPE_IMAGE_VIEW_CREATE_INFO,       // VkStructureType                      sType;
905                         DE_NULL,                                                                        // const void*                          pNext;
906                         (VkImageViewCreateFlags)0u,                                     // VkImageViewCreateFlags       flags;
907                         **cbImage,                                                                      // VkImage                                      image;
908                         VK_IMAGE_VIEW_TYPE_2D_ARRAY,                            // VkImageViewType                      viewType;
909                         cbFormat,                                                                       // VkFormat                                     format;
910                         {
911                                 VK_COMPONENT_SWIZZLE_R,                                 // VkComponentSwizzle   r;
912                                 VK_COMPONENT_SWIZZLE_G,                                 // VkComponentSwizzle   g;
913                                 VK_COMPONENT_SWIZZLE_B,                                 // VkComponentSwizzle   b;
914                                 VK_COMPONENT_SWIZZLE_A                                  // VkComponentSwizzle   a;
915                         },                                                                                      // VkComponentMapping            components;
916                         {
917                                 VK_IMAGE_ASPECT_COLOR_BIT,                              // VkImageAspectFlags   aspectMask;
918                                 0u,                                                                             // deUint32                             baseMipLevel;
919                                 1u,                                                                             // deUint32                             levelCount;
920                                 0u,                                                                             // deUint32                             baseArrayLayer;
921                                 m_data.numColorLayers                                   // deUint32                             layerCount;
922                         }                                                                                       // VkImageSubresourceRange      subresourceRange;
923                 };
924                 cbImageView = createImageView(vk, device, &imageViewCreateInfo, NULL);
925         }
926
927         de::MovePtr<ImageWithMemory> dsImage;
928         Move<VkImageView> dsImageView, dImageView, sImageView;
929         VkImageUsageFlags dsUsage = VK_IMAGE_USAGE_DEPTH_STENCIL_ATTACHMENT_BIT |
930                                                                 VK_IMAGE_USAGE_SAMPLED_BIT |
931                                                                 VK_IMAGE_USAGE_TRANSFER_SRC_BIT |
932                                                                 VK_IMAGE_USAGE_TRANSFER_DST_BIT;
933         if (m_data.useDepthStencil)
934         {
935                 const VkImageCreateInfo                 imageCreateInfo                 =
936                 {
937                         VK_STRUCTURE_TYPE_IMAGE_CREATE_INFO,    // VkStructureType                      sType;
938                         DE_NULL,                                                                // const void*                          pNext;
939                         (VkImageCreateFlags)0u,                                 // VkImageCreateFlags           flags;
940                         VK_IMAGE_TYPE_2D,                                               // VkImageType                          imageType;
941                         dsFormat,                                                               // VkFormat                                     format;
942                         {
943                                 m_data.framebufferDim.width,            // deUint32     width;
944                                 m_data.framebufferDim.height,           // deUint32     height;
945                                 1u                                                                      // deUint32     depth;
946                         },                                                                              // VkExtent3D                           extent;
947                         1u,                                                                             // deUint32                                     mipLevels;
948                         m_data.numColorLayers,                                  // deUint32                                     arrayLayers;
949                         m_data.samples,                                                 // VkSampleCountFlagBits        samples;
950                         VK_IMAGE_TILING_OPTIMAL,                                // VkImageTiling                        tiling;
951                         dsUsage,                                                                // VkImageUsageFlags            usage;
952                         VK_SHARING_MODE_EXCLUSIVE,                              // VkSharingMode                        sharingMode;
953                         0u,                                                                             // deUint32                                     queueFamilyIndexCount;
954                         DE_NULL,                                                                // const deUint32*                      pQueueFamilyIndices;
955                         VK_IMAGE_LAYOUT_UNDEFINED                               // VkImageLayout                        initialLayout;
956                 };
957                 dsImage = de::MovePtr<ImageWithMemory>(new ImageWithMemory(
958                         vk, device, allocator, imageCreateInfo, MemoryRequirement::Any));
959
960                 VkImageViewCreateInfo           imageViewCreateInfo             =
961                 {
962                         VK_STRUCTURE_TYPE_IMAGE_VIEW_CREATE_INFO,       // VkStructureType                      sType;
963                         DE_NULL,                                                                        // const void*                          pNext;
964                         (VkImageViewCreateFlags)0u,                                     // VkImageViewCreateFlags       flags;
965                         **dsImage,                                                                      // VkImage                                      image;
966                         VK_IMAGE_VIEW_TYPE_2D_ARRAY,                            // VkImageViewType                      viewType;
967                         dsFormat,                                                                       // VkFormat                                     format;
968                         {
969                                 VK_COMPONENT_SWIZZLE_R,                                 // VkComponentSwizzle   r;
970                                 VK_COMPONENT_SWIZZLE_G,                                 // VkComponentSwizzle   g;
971                                 VK_COMPONENT_SWIZZLE_B,                                 // VkComponentSwizzle   b;
972                                 VK_COMPONENT_SWIZZLE_A                                  // VkComponentSwizzle   a;
973                         },                                                                                      // VkComponentMapping            components;
974                         {
975                                 VK_IMAGE_ASPECT_DEPTH_BIT | VK_IMAGE_ASPECT_STENCIL_BIT,        // VkImageAspectFlags   aspectMask;
976                                 0u,                                                                             // deUint32                             baseMipLevel;
977                                 1u,                                                                             // deUint32                             levelCount;
978                                 0u,                                                                             // deUint32                             baseArrayLayer;
979                                 m_data.numColorLayers                                   // deUint32                             layerCount;
980                         }                                                                                       // VkImageSubresourceRange      subresourceRange;
981                 };
982                 dsImageView = createImageView(vk, device, &imageViewCreateInfo, NULL);
983                 imageViewCreateInfo.subresourceRange.aspectMask = VK_IMAGE_ASPECT_DEPTH_BIT;
984                 dImageView = createImageView(vk, device, &imageViewCreateInfo, NULL);
985                 imageViewCreateInfo.subresourceRange.aspectMask = VK_IMAGE_ASPECT_STENCIL_BIT;
986                 sImageView = createImageView(vk, device, &imageViewCreateInfo, NULL);
987         }
988
989         // Image used to test implicit derivative calculations.
990         // Filled with a value of 1<<lod.
991         de::MovePtr<ImageWithMemory> derivImage;
992         Move<VkImageView> derivImageView;
993         VkImageUsageFlags derivUsage = VK_IMAGE_USAGE_SAMPLED_BIT |
994                                                                    VK_IMAGE_USAGE_TRANSFER_DST_BIT;
995         deUint32 derivNumLevels;
996         {
997                 deUint32 maxDim = de::max(m_context.getFragmentShadingRateProperties().maxFragmentSize.width, m_context.getFragmentShadingRateProperties().maxFragmentSize.height);
998                 derivNumLevels = 1 + deCtz32(maxDim);
999                 const VkImageCreateInfo                 imageCreateInfo                 =
1000                 {
1001                         VK_STRUCTURE_TYPE_IMAGE_CREATE_INFO,    // VkStructureType                      sType;
1002                         DE_NULL,                                                                // const void*                          pNext;
1003                         (VkImageCreateFlags)0u,                                 // VkImageCreateFlags           flags;
1004                         VK_IMAGE_TYPE_2D,                                               // VkImageType                          imageType;
1005                         VK_FORMAT_R32_UINT,                                             // VkFormat                                     format;
1006                         {
1007                                 m_context.getFragmentShadingRateProperties().maxFragmentSize.width,             // deUint32     width;
1008                                 m_context.getFragmentShadingRateProperties().maxFragmentSize.height,    // deUint32     height;
1009                                 1u                                                                      // deUint32     depth;
1010                         },                                                                              // VkExtent3D                           extent;
1011                         derivNumLevels,                                                 // deUint32                                     mipLevels;
1012                         1u,                                                                             // deUint32                                     arrayLayers;
1013                         VK_SAMPLE_COUNT_1_BIT,                                  // VkSampleCountFlagBits        samples;
1014                         VK_IMAGE_TILING_OPTIMAL,                                // VkImageTiling                        tiling;
1015                         derivUsage,                                                             // VkImageUsageFlags            usage;
1016                         VK_SHARING_MODE_EXCLUSIVE,                              // VkSharingMode                        sharingMode;
1017                         0u,                                                                             // deUint32                                     queueFamilyIndexCount;
1018                         DE_NULL,                                                                // const deUint32*                      pQueueFamilyIndices;
1019                         VK_IMAGE_LAYOUT_UNDEFINED                               // VkImageLayout                        initialLayout;
1020                 };
1021                 derivImage = de::MovePtr<ImageWithMemory>(new ImageWithMemory(
1022                         vk, device, allocator, imageCreateInfo, MemoryRequirement::Any));
1023
1024                 VkImageViewCreateInfo           imageViewCreateInfo             =
1025                 {
1026                         VK_STRUCTURE_TYPE_IMAGE_VIEW_CREATE_INFO,       // VkStructureType                      sType;
1027                         DE_NULL,                                                                        // const void*                          pNext;
1028                         (VkImageViewCreateFlags)0u,                                     // VkImageViewCreateFlags       flags;
1029                         **derivImage,                                                           // VkImage                                      image;
1030                         VK_IMAGE_VIEW_TYPE_2D,                                          // VkImageViewType                      viewType;
1031                         VK_FORMAT_R32_UINT,                                                     // VkFormat                                     format;
1032                         {
1033                                 VK_COMPONENT_SWIZZLE_R,                                 // VkComponentSwizzle   r;
1034                                 VK_COMPONENT_SWIZZLE_G,                                 // VkComponentSwizzle   g;
1035                                 VK_COMPONENT_SWIZZLE_B,                                 // VkComponentSwizzle   b;
1036                                 VK_COMPONENT_SWIZZLE_A                                  // VkComponentSwizzle   a;
1037                         },                                                                                      // VkComponentMapping            components;
1038                         {
1039                                 VK_IMAGE_ASPECT_COLOR_BIT,                              // VkImageAspectFlags   aspectMask;
1040                                 0u,                                                                             // deUint32                             baseMipLevel;
1041                                 derivNumLevels,                                                 // deUint32                             levelCount;
1042                                 0u,                                                                             // deUint32                             baseArrayLayer;
1043                                 1u                                                                              // deUint32                             layerCount;
1044                         }                                                                                       // VkImageSubresourceRange      subresourceRange;
1045                 };
1046                 derivImageView = createImageView(vk, device, &imageViewCreateInfo, NULL);
1047         }
1048
1049         // sampler used with derivImage
1050         const struct VkSamplerCreateInfo                samplerInfo     =
1051         {
1052                 VK_STRUCTURE_TYPE_SAMPLER_CREATE_INFO,          // sType
1053                 DE_NULL,                                                                        // pNext
1054                 0u,                                                                                     // flags
1055                 VK_FILTER_NEAREST,                                                      // magFilter
1056                 VK_FILTER_NEAREST,                                                      // minFilter
1057                 VK_SAMPLER_MIPMAP_MODE_NEAREST,                         // mipmapMode
1058                 VK_SAMPLER_ADDRESS_MODE_CLAMP_TO_EDGE,          // addressModeU
1059                 VK_SAMPLER_ADDRESS_MODE_CLAMP_TO_EDGE,          // addressModeV
1060                 VK_SAMPLER_ADDRESS_MODE_CLAMP_TO_EDGE,          // addressModeW
1061                 0.0f,                                                                           // mipLodBias
1062                 VK_FALSE,                                                                       // anisotropyEnable
1063                 1.0f,                                                                           // maxAnisotropy
1064                 DE_FALSE,                                                                       // compareEnable
1065                 VK_COMPARE_OP_ALWAYS,                                           // compareOp
1066                 0.0f,                                                                           // minLod
1067                 (float)derivNumLevels,                                          // maxLod
1068                 VK_BORDER_COLOR_INT_TRANSPARENT_BLACK,          // borderColor
1069                 VK_FALSE,                                                                       // unnormalizedCoords
1070         };
1071
1072         Move<VkSampler>                 sampler = createSampler(vk, device, &samplerInfo);
1073
1074         Move<vk::VkDescriptorSetLayout> descriptorSetLayout;
1075         VkDescriptorSetLayoutCreateFlags layoutCreateFlags = 0;
1076
1077         const VkDescriptorSetLayoutBinding bindings[] =
1078         {
1079                 {
1080                         0u,                                                                             // binding
1081                         VK_DESCRIPTOR_TYPE_STORAGE_BUFFER,              // descriptorType
1082                         1u,                                                                             // descriptorCount
1083                         allShaderStages,                                                // stageFlags
1084                         DE_NULL,                                                                // pImmutableSamplers
1085                 },
1086                 {
1087                         1u,                                                                             // binding
1088                         VK_DESCRIPTOR_TYPE_SAMPLED_IMAGE,               // descriptorType
1089                         1u,                                                                             // descriptorCount
1090                         allShaderStages,                                                // stageFlags
1091                         DE_NULL,                                                                // pImmutableSamplers
1092                 },
1093                 {
1094                         2u,                                                                             // binding
1095                         VK_DESCRIPTOR_TYPE_STORAGE_BUFFER,              // descriptorType
1096                         1u,                                                                             // descriptorCount
1097                         allShaderStages,                                                // stageFlags
1098                         DE_NULL,                                                                // pImmutableSamplers
1099                 },
1100                 {
1101                         3u,                                                                             // binding
1102                         VK_DESCRIPTOR_TYPE_COMBINED_IMAGE_SAMPLER,      // descriptorType
1103                         1u,                                                                             // descriptorCount
1104                         allShaderStages,                                                // stageFlags
1105                         DE_NULL,                                                                // pImmutableSamplers
1106                 },
1107                 {
1108                         4u,                                                                             // binding
1109                         VK_DESCRIPTOR_TYPE_STORAGE_BUFFER,              // descriptorType
1110                         1u,                                                                             // descriptorCount
1111                         allShaderStages,                                                // stageFlags
1112                         DE_NULL,                                                                // pImmutableSamplers
1113                 },
1114                 {
1115                         5u,                                                                             // binding
1116                         VK_DESCRIPTOR_TYPE_STORAGE_BUFFER,              // descriptorType
1117                         1u,                                                                             // descriptorCount
1118                         allShaderStages,                                                // stageFlags
1119                         DE_NULL,                                                                // pImmutableSamplers
1120                 },
1121                 {
1122                         6u,                                                                             // binding
1123                         VK_DESCRIPTOR_TYPE_SAMPLED_IMAGE,               // descriptorType
1124                         1u,                                                                             // descriptorCount
1125                         allShaderStages,                                                // stageFlags
1126                         DE_NULL,                                                                // pImmutableSamplers
1127                 },
1128                 {
1129                         7u,                                                                             // binding
1130                         VK_DESCRIPTOR_TYPE_SAMPLED_IMAGE,               // descriptorType
1131                         1u,                                                                             // descriptorCount
1132                         allShaderStages,                                                // stageFlags
1133                         DE_NULL,                                                                // pImmutableSamplers
1134                 },
1135         };
1136
1137         // Create a layout and allocate a descriptor set for it.
1138         const VkDescriptorSetLayoutCreateInfo setLayoutCreateInfo =
1139         {
1140                 vk::VK_STRUCTURE_TYPE_DESCRIPTOR_SET_LAYOUT_CREATE_INFO,        // sType
1141                 DE_NULL,                                                                                                        // pNext
1142                 layoutCreateFlags,                                                                                      // flags
1143                 sizeof(bindings)/sizeof(bindings[0]),                                           // bindingCount
1144                 &bindings[0]                                                                                            // pBindings
1145         };
1146
1147         descriptorSetLayout = vk::createDescriptorSetLayout(vk, device, &setLayoutCreateInfo);
1148
1149         const VkPushConstantRange                               pushConstantRange                               =
1150         {
1151                 allShaderStages,                                                                                        // VkShaderStageFlags                                   stageFlags;
1152                 0u,                                                                                                                     // deUint32                                                             offset;
1153                 sizeof(deInt32)                                                                                         // deUint32                                                             size;
1154         };
1155
1156         const VkPipelineLayoutCreateInfo pipelineLayoutCreateInfo =
1157         {
1158                 VK_STRUCTURE_TYPE_PIPELINE_LAYOUT_CREATE_INFO,                          // sType
1159                 DE_NULL,                                                                                                        // pNext
1160                 (VkPipelineLayoutCreateFlags)0,
1161                 1,                                                                                                                      // setLayoutCount
1162                 &descriptorSetLayout.get(),                                                                     // pSetLayouts
1163                 1u,                                                                                                                     // pushConstantRangeCount
1164                 &pushConstantRange,                                                                                     // pPushConstantRanges
1165         };
1166
1167         Move<VkPipelineLayout> pipelineLayout = createPipelineLayout(vk, device, &pipelineLayoutCreateInfo, NULL);
1168
1169         const Unique<VkShaderModule>    cs                                              (createShaderModule(vk, device, m_context.getBinaryCollection().get("comp"), 0));
1170
1171         const VkPipelineShaderStageCreateInfo   csShaderCreateInfo =
1172         {
1173                 VK_STRUCTURE_TYPE_PIPELINE_SHADER_STAGE_CREATE_INFO,
1174                 DE_NULL,
1175                 (VkPipelineShaderStageCreateFlags)0,
1176                 VK_SHADER_STAGE_COMPUTE_BIT,                                                            // stage
1177                 *cs,                                                                                                            // shader
1178                 "main",
1179                 DE_NULL,                                                                                                        // pSpecializationInfo
1180         };
1181
1182         const VkComputePipelineCreateInfo               pipelineCreateInfo =
1183         {
1184                 VK_STRUCTURE_TYPE_COMPUTE_PIPELINE_CREATE_INFO,
1185                 DE_NULL,
1186                 0u,                                                                                                                     // flags
1187                 csShaderCreateInfo,                                                                                     // cs
1188                 *pipelineLayout,                                                                                        // layout
1189                 (vk::VkPipeline)0,                                                                                      // basePipelineHandle
1190                 0u,                                                                                                                     // basePipelineIndex
1191         };
1192         Move<VkPipeline> computePipeline = createComputePipeline(vk, device, DE_NULL, &pipelineCreateInfo, NULL);
1193
1194         for (deUint32 modeIdx = 0; modeIdx < ATTACHMENT_MODE_COUNT; ++modeIdx)
1195         {
1196                 // If we're not using an attachment, don't test all the different attachment modes
1197                 if (modeIdx != ATTACHMENT_MODE_DEFAULT && !m_data.useAttachment())
1198                         continue;
1199
1200                 // Consider all uint formats possible
1201                 static const VkFormat srFillFormats[] =
1202                 {
1203                         VK_FORMAT_R8_UINT,
1204                         VK_FORMAT_R8G8_UINT,
1205                         VK_FORMAT_R8G8B8_UINT,
1206                         VK_FORMAT_R8G8B8A8_UINT,
1207                         VK_FORMAT_R16_UINT,
1208                         VK_FORMAT_R16G16_UINT,
1209                         VK_FORMAT_R16G16B16_UINT,
1210                         VK_FORMAT_R16G16B16A16_UINT,
1211                         VK_FORMAT_R32_UINT,
1212                         VK_FORMAT_R32G32_UINT,
1213                         VK_FORMAT_R32G32B32_UINT,
1214                         VK_FORMAT_R32G32B32A32_UINT,
1215                         VK_FORMAT_R64_UINT,
1216                         VK_FORMAT_R64G64_UINT,
1217                         VK_FORMAT_R64G64B64_UINT,
1218                         VK_FORMAT_R64G64B64A64_UINT,
1219                 };
1220                 // Only test all formats in the default mode
1221                 deUint32 numFillFormats = modeIdx == ATTACHMENT_MODE_DEFAULT ? (deUint32)(sizeof(srFillFormats)/sizeof(srFillFormats[0])) : 1u;
1222
1223                 // Iterate over all supported tile sizes and formats
1224                 for (deUint32 srTexelWidth  = minFragmentShadingRateAttachmentTexelSize.width;
1225                                           srTexelWidth <= maxFragmentShadingRateAttachmentTexelSize.width;
1226                                           srTexelWidth *= 2)
1227                 for (deUint32 srTexelHeight  = minFragmentShadingRateAttachmentTexelSize.height;
1228                                           srTexelHeight <= maxFragmentShadingRateAttachmentTexelSize.height;
1229                                           srTexelHeight *= 2)
1230                 for (deUint32 formatIdx = 0; formatIdx < numFillFormats; ++formatIdx)
1231                 {
1232
1233                         deUint32 aspectRatio = (srTexelHeight > srTexelWidth) ? (srTexelHeight / srTexelWidth) : (srTexelWidth / srTexelHeight);
1234                         if (aspectRatio > maxFragmentShadingRateAttachmentTexelSizeAspectRatio)
1235                                 continue;
1236
1237                         // Go through the loop only once when not using an attachment
1238                         if (!m_data.useAttachment() &&
1239                                 (srTexelWidth != minFragmentShadingRateAttachmentTexelSize.width ||
1240                                  srTexelHeight != minFragmentShadingRateAttachmentTexelSize.height ||
1241                                  formatIdx != 0))
1242                                  continue;
1243
1244                         bool imagelessFB = modeIdx == ATTACHMENT_MODE_IMAGELESS;
1245
1246                         deUint32 srWidth = (m_data.framebufferDim.width + srTexelWidth - 1) / srTexelWidth;
1247                         deUint32 srHeight = (m_data.framebufferDim.height + srTexelHeight - 1) / srTexelHeight;
1248
1249                         VkFormat srFormat = srFillFormats[formatIdx];
1250                         deUint32 srFillBpp = tcu::getPixelSize(mapVkFormat(srFormat));
1251
1252                         VkImageLayout srLayout = modeIdx == ATTACHMENT_MODE_LAYOUT_OPTIMAL ? VK_IMAGE_LAYOUT_FRAGMENT_SHADING_RATE_ATTACHMENT_OPTIMAL_KHR : VK_IMAGE_LAYOUT_GENERAL;
1253                         VkImageViewType srViewType = modeIdx == ATTACHMENT_MODE_2DARRAY ? VK_IMAGE_VIEW_TYPE_2D_ARRAY : VK_IMAGE_VIEW_TYPE_2D;
1254                         VkImageTiling srTiling = (modeIdx == ATTACHMENT_MODE_TILING_LINEAR) ? VK_IMAGE_TILING_LINEAR : VK_IMAGE_TILING_OPTIMAL;
1255
1256                         VkFormatProperties srFormatProperties;
1257                         m_context.getInstanceInterface().getPhysicalDeviceFormatProperties(m_context.getPhysicalDevice(), srFormat, &srFormatProperties);
1258                         VkFormatFeatureFlags srFormatFeatures = srTiling == VK_IMAGE_TILING_LINEAR ? srFormatProperties.linearTilingFeatures : srFormatProperties.optimalTilingFeatures;
1259
1260                         if (m_context.getFragmentShadingRateFeatures().attachmentFragmentShadingRate &&
1261                                 !(srFormatFeatures & VK_FORMAT_FEATURE_FRAGMENT_SHADING_RATE_ATTACHMENT_BIT_KHR))
1262                         {
1263                                 if (srFormat == VK_FORMAT_R8_UINT && srTiling == VK_IMAGE_TILING_OPTIMAL)
1264                                 {
1265                                         log << tcu::TestLog::Message << "VK_FORMAT_R8_UINT/VK_IMAGE_TILING_OPTIMAL don't support VK_FORMAT_FEATURE_FRAGMENT_SHADING_RATE_ATTACHMENT_BIT_KHR" << tcu::TestLog::EndMessage;
1266                                         res = QP_TEST_RESULT_FAIL;
1267                                 }
1268                                 continue;
1269                         }
1270
1271                         Move<vk::VkDescriptorPool>              descriptorPool;
1272                         Move<vk::VkDescriptorSet>               descriptorSet;
1273                         VkDescriptorPoolCreateFlags poolCreateFlags = VK_DESCRIPTOR_POOL_CREATE_FREE_DESCRIPTOR_SET_BIT;
1274
1275                         vk::DescriptorPoolBuilder poolBuilder;
1276                         for (deInt32 i = 0; i < (deInt32)(sizeof(bindings)/sizeof(bindings[0])); ++i)
1277                                 poolBuilder.addType(bindings[i].descriptorType, bindings[i].descriptorCount);
1278
1279                         descriptorPool = poolBuilder.build(vk, device, poolCreateFlags, 1u);
1280                         descriptorSet = makeDescriptorSet(vk, device, *descriptorPool, *descriptorSetLayout);
1281
1282                         de::MovePtr<ImageWithMemory> srImage;
1283                         Move<VkImageView> srImageView;
1284                         VkImageUsageFlags srUsage = VK_IMAGE_USAGE_FRAGMENT_SHADING_RATE_ATTACHMENT_BIT_KHR |
1285                                                                                 VK_IMAGE_USAGE_TRANSFER_DST_BIT |
1286                                                                                 VK_IMAGE_USAGE_TRANSFER_SRC_BIT;
1287
1288                         if (m_data.useAttachment())
1289                         {
1290                                 const VkImageCreateInfo                 imageCreateInfo                 =
1291                                 {
1292                                         VK_STRUCTURE_TYPE_IMAGE_CREATE_INFO,    // VkStructureType                      sType;
1293                                         DE_NULL,                                                                // const void*                          pNext;
1294                                         (VkImageCreateFlags)0u,                                 // VkImageCreateFlags           flags;
1295                                         VK_IMAGE_TYPE_2D,                                               // VkImageType                          imageType;
1296                                         srFormat,                                                               // VkFormat                                     format;
1297                                         {
1298                                                 srWidth,                                                        // deUint32     width;
1299                                                 srHeight,                                                       // deUint32     height;
1300                                                 1u                                                                      // deUint32     depth;
1301                                         },                                                                              // VkExtent3D                           extent;
1302                                         1u,                                                                             // deUint32                                     mipLevels;
1303                                         numSRLayers,                                                    // deUint32                                     arrayLayers;
1304                                         VK_SAMPLE_COUNT_1_BIT,                                  // VkSampleCountFlagBits        samples;
1305                                         srTiling,                                                               // VkImageTiling                        tiling;
1306                                         srUsage,                                                                // VkImageUsageFlags            usage;
1307                                         VK_SHARING_MODE_EXCLUSIVE,                              // VkSharingMode                        sharingMode;
1308                                         0u,                                                                             // deUint32                                     queueFamilyIndexCount;
1309                                         DE_NULL,                                                                // const deUint32*                      pQueueFamilyIndices;
1310                                         VK_IMAGE_LAYOUT_UNDEFINED                               // VkImageLayout                        initialLayout;
1311                                 };
1312                                 srImage = de::MovePtr<ImageWithMemory>(new ImageWithMemory(
1313                                         vk, device, allocator, imageCreateInfo, MemoryRequirement::Any));
1314
1315                                 VkImageViewCreateInfo           imageViewCreateInfo             =
1316                                 {
1317                                         VK_STRUCTURE_TYPE_IMAGE_VIEW_CREATE_INFO,       // VkStructureType                      sType;
1318                                         DE_NULL,                                                                        // const void*                          pNext;
1319                                         (VkImageViewCreateFlags)0u,                                     // VkImageViewCreateFlags       flags;
1320                                         **srImage,                                                                      // VkImage                                      image;
1321                                         srViewType,                                                                     // VkImageViewType                      viewType;
1322                                         srFormat,                                                                       // VkFormat                                     format;
1323                                         {
1324                                                 VK_COMPONENT_SWIZZLE_R,                                 // VkComponentSwizzle   r;
1325                                                 VK_COMPONENT_SWIZZLE_G,                                 // VkComponentSwizzle   g;
1326                                                 VK_COMPONENT_SWIZZLE_B,                                 // VkComponentSwizzle   b;
1327                                                 VK_COMPONENT_SWIZZLE_A                                  // VkComponentSwizzle   a;
1328                                         },                                                                                      // VkComponentMapping            components;
1329                                         {
1330                                                 VK_IMAGE_ASPECT_COLOR_BIT,                              // VkImageAspectFlags   aspectMask;
1331                                                 0u,                                                                             // deUint32                             baseMipLevel;
1332                                                 1u,                                                                             // deUint32                             levelCount;
1333                                                 0u,                                                                             // deUint32                             baseArrayLayer;
1334                                                 srViewType == VK_IMAGE_VIEW_TYPE_2D ?
1335                                                 1 : numSRLayers,                                                // deUint32                             layerCount;
1336                                         }                                                                                       // VkImageSubresourceRange      subresourceRange;
1337                                 };
1338                                 srImageView = createImageView(vk, device, &imageViewCreateInfo, NULL);
1339                         }
1340
1341                         VkDescriptorImageInfo imageInfo;
1342                         VkDescriptorBufferInfo bufferInfo;
1343
1344                         VkWriteDescriptorSet w =
1345                         {
1346                                 VK_STRUCTURE_TYPE_WRITE_DESCRIPTOR_SET,                                                 // sType
1347                                 DE_NULL,                                                                                                                // pNext
1348                                 *descriptorSet,                                                                                                 // dstSet
1349                                 (deUint32)0,                                                                                                    // dstBinding
1350                                 0,                                                                                                                              // dstArrayElement
1351                                 1u,                                                                                                                             // descriptorCount
1352                                 bindings[0].descriptorType,                                                                             // descriptorType
1353                                 &imageInfo,                                                                                                             // pImageInfo
1354                                 &bufferInfo,                                                                                                    // pBufferInfo
1355                                 DE_NULL,                                                                                                                // pTexelBufferView
1356                         };
1357
1358                         abuf[0] = 0;
1359                         flushAlloc(vk, device, atomicBuffer->getAllocation());
1360
1361                         bufferInfo = makeDescriptorBufferInfo(**atomicBuffer, 0, atomicBufferSize);
1362                         w.dstBinding = 0;
1363                         w.descriptorType = bindings[0].descriptorType;
1364                         vk.updateDescriptorSets(device, 1, &w, 0, NULL);
1365
1366                         imageInfo = makeDescriptorImageInfo(DE_NULL, *cbImageView, VK_IMAGE_LAYOUT_GENERAL);
1367                         w.dstBinding = 1;
1368                         w.descriptorType = bindings[1].descriptorType;
1369                         vk.updateDescriptorSets(device, 1, &w, 0, NULL);
1370
1371                         bufferInfo = makeDescriptorBufferInfo(**colorOutputBuffer, 0, colorOutputBufferSize);
1372                         w.dstBinding = 2;
1373                         w.descriptorType = bindings[2].descriptorType;
1374                         vk.updateDescriptorSets(device, 1, &w, 0, NULL);
1375
1376                         imageInfo = makeDescriptorImageInfo(*sampler, *derivImageView, VK_IMAGE_LAYOUT_GENERAL);
1377                         w.dstBinding = 3;
1378                         w.descriptorType = bindings[3].descriptorType;
1379                         vk.updateDescriptorSets(device, 1, &w, 0, NULL);
1380
1381                         if (m_data.useDepthStencil)
1382                         {
1383                                 bufferInfo = makeDescriptorBufferInfo(**depthOutputBuffer, 0, depthOutputBufferSize);
1384                                 w.dstBinding = 4;
1385                                 w.descriptorType = bindings[4].descriptorType;
1386                                 vk.updateDescriptorSets(device, 1, &w, 0, NULL);
1387
1388                                 bufferInfo = makeDescriptorBufferInfo(**stencilOutputBuffer, 0, stencilOutputBufferSize);
1389                                 w.dstBinding = 5;
1390                                 w.descriptorType = bindings[5].descriptorType;
1391                                 vk.updateDescriptorSets(device, 1, &w, 0, NULL);
1392
1393                                 imageInfo = makeDescriptorImageInfo(DE_NULL, *dImageView, VK_IMAGE_LAYOUT_GENERAL);
1394                                 w.dstBinding = 6;
1395                                 w.descriptorType = bindings[6].descriptorType;
1396                                 vk.updateDescriptorSets(device, 1, &w, 0, NULL);
1397
1398                                 imageInfo = makeDescriptorImageInfo(DE_NULL, *sImageView, VK_IMAGE_LAYOUT_GENERAL);
1399                                 w.dstBinding = 7;
1400                                 w.descriptorType = bindings[7].descriptorType;
1401                                 vk.updateDescriptorSets(device, 1, &w, 0, NULL);
1402                         }
1403
1404                         Move<VkRenderPass> renderPass;
1405                         Move<VkFramebuffer> framebuffer;
1406
1407                         std::vector<VkImageView> attachments;
1408                         attachments.push_back(*cbImageView);
1409                         deUint32 dsAttachmentIdx = 0, srAttachmentIdx = 0;
1410                         if (m_data.useAttachment())
1411                         {
1412                                 srAttachmentIdx = (deUint32)attachments.size();
1413                                 attachments.push_back(*srImageView);
1414                         }
1415                         if (m_data.useDepthStencil)
1416                         {
1417                                 dsAttachmentIdx = (deUint32)attachments.size();
1418                                 attachments.push_back(*dsImageView);
1419                         }
1420
1421                         if (!m_data.useDynamicRendering)
1422                         {
1423                                 const vk::VkAttachmentReference2 colorAttachmentReference
1424                                 {
1425                                         VK_STRUCTURE_TYPE_ATTACHMENT_REFERENCE_2,                                       // sType
1426                                         DE_NULL,                                                                                                        // pNext
1427                                         0,                                                                                                                      // attachment
1428                                         vk::VK_IMAGE_LAYOUT_GENERAL,                                                            // layout
1429                                         0,                                                                                                                      // aspectMask
1430                                 };
1431
1432                                 const vk::VkAttachmentReference2 fragmentShadingRateAttachment =
1433                                 {
1434                                         VK_STRUCTURE_TYPE_ATTACHMENT_REFERENCE_2,                                       // sType
1435                                         DE_NULL,                                                                                                        // pNext
1436                                         srAttachmentIdx,                                                                                        // attachment
1437                                         srLayout,                                                                                                       // layout
1438                                         0,                                                                                                                      // aspectMask
1439                                 };
1440
1441                                 const vk::VkAttachmentReference2 depthAttachmentReference =
1442                                 {
1443                                         VK_STRUCTURE_TYPE_ATTACHMENT_REFERENCE_2,                                       // sType
1444                                         DE_NULL,                                                                                                        // pNext
1445                                         dsAttachmentIdx,                                                                                        // attachment
1446                                         vk::VK_IMAGE_LAYOUT_GENERAL,                                                            // layout
1447                                         0,                                                                                                                      // aspectMask
1448                                 };
1449
1450                                 const bool                                                                              noAttachmentPtr                         = (m_data.attachmentUsage == AttachmentUsage::NO_ATTACHMENT_PTR);
1451                                 const VkFragmentShadingRateAttachmentInfoKHR    shadingRateAttachmentInfo       =
1452                                 {
1453                                         VK_STRUCTURE_TYPE_FRAGMENT_SHADING_RATE_ATTACHMENT_INFO_KHR,                                                    // VkStructureType                                sType;
1454                                         DE_NULL,                                                                                                                                                                // const void*                                    pNext;
1455                                         (noAttachmentPtr ? nullptr : &fragmentShadingRateAttachment),                                                   // const VkAttachmentReference2*        pFragmentShadingRateAttachment;
1456                                         { srTexelWidth, srTexelHeight },                                                                                                                // VkExtent2D                                      shadingRateAttachmentTexelSize;
1457                                 };
1458
1459                                 const bool                                              useAttachmentInfo       = (m_data.attachmentUsage != AttachmentUsage::NO_ATTACHMENT);
1460                                 const VkSubpassDescription2             subpassDesc                     =
1461                                 {
1462                                         VK_STRUCTURE_TYPE_SUBPASS_DESCRIPTION_2,                                                // sType
1463                                         (useAttachmentInfo ? &shadingRateAttachmentInfo : nullptr),             // pNext;
1464                                         (vk::VkSubpassDescriptionFlags)0,                                                               // flags
1465                                         vk::VK_PIPELINE_BIND_POINT_GRAPHICS,                                                    // pipelineBindPoint
1466                                         m_data.multiView ? 0x3 : 0u,                                                                    // viewMask
1467                                         0u,                                                                                                                             // inputCount
1468                                         DE_NULL,                                                                                                                // pInputAttachments
1469                                         1,                                                                                                                              // colorCount
1470                                         &colorAttachmentReference,                                                                              // pColorAttachments
1471                                         DE_NULL,                                                                                                                // pResolveAttachments
1472                                         m_data.useDepthStencil ? &depthAttachmentReference : DE_NULL,   // depthStencilAttachment
1473                                         0u,                                                                                                                             // preserveCount
1474                                         DE_NULL,                                                                                                                // pPreserveAttachments
1475                                 };
1476
1477                                 std::vector<VkAttachmentDescription2> attachmentDescriptions
1478                                 {
1479                                         {
1480                                                 VK_STRUCTURE_TYPE_ATTACHMENT_DESCRIPTION_2,     // VkStructureType sType;
1481                                                 DE_NULL,                                                                        // const void* pNext;
1482                                                 (VkAttachmentDescriptionFlags)0u,                       // VkAttachmentDescriptionFlags         flags;
1483                                                 cbFormat,                                       // VkFormat                                                     format;
1484                                                 m_data.samples,                                                         // VkSampleCountFlagBits                        samples;
1485                                                 VK_ATTACHMENT_LOAD_OP_LOAD,                                     // VkAttachmentLoadOp                           loadOp;
1486                                                 VK_ATTACHMENT_STORE_OP_STORE,                           // VkAttachmentStoreOp                          storeOp;
1487                                                 VK_ATTACHMENT_LOAD_OP_DONT_CARE,                        // VkAttachmentLoadOp                           stencilLoadOp;
1488                                                 VK_ATTACHMENT_STORE_OP_DONT_CARE,                       // VkAttachmentStoreOp                          stencilStoreOp;
1489                                                 VK_IMAGE_LAYOUT_GENERAL,                                        // VkImageLayout                                        initialLayout;
1490                                                 VK_IMAGE_LAYOUT_GENERAL                                         // VkImageLayout                                        finalLayout;
1491                                         }
1492                                 };
1493                                 if (m_data.useAttachment())
1494                                         attachmentDescriptions.push_back(
1495                                         {
1496                                                 VK_STRUCTURE_TYPE_ATTACHMENT_DESCRIPTION_2,     // VkStructureType sType;
1497                                                 DE_NULL,                                                                        // const void* pNext;
1498                                                 (VkAttachmentDescriptionFlags)0u,                       // VkAttachmentDescriptionFlags         flags;
1499                                                 srFormat,                                                                       // VkFormat                                                     format;
1500                                                 VK_SAMPLE_COUNT_1_BIT,                                          // VkSampleCountFlagBits                        samples;
1501                                                 VK_ATTACHMENT_LOAD_OP_LOAD,                                     // VkAttachmentLoadOp                           loadOp;
1502                                                 VK_ATTACHMENT_STORE_OP_STORE,                           // VkAttachmentStoreOp                          storeOp;
1503                                                 VK_ATTACHMENT_LOAD_OP_DONT_CARE,                        // VkAttachmentLoadOp                           stencilLoadOp;
1504                                                 VK_ATTACHMENT_STORE_OP_DONT_CARE,                       // VkAttachmentStoreOp                          stencilStoreOp;
1505                                                 srLayout,                                                                       // VkImageLayout                                        initialLayout;
1506                                                 srLayout                                                                        // VkImageLayout                                        finalLayout;
1507                                         }
1508                                         );
1509
1510                                 if (m_data.useDepthStencil)
1511                                         attachmentDescriptions.push_back(
1512                                         {
1513                                                 VK_STRUCTURE_TYPE_ATTACHMENT_DESCRIPTION_2,     // VkStructureType sType;
1514                                                 DE_NULL,                                                                        // const void* pNext;
1515                                                 (VkAttachmentDescriptionFlags)0u,                       // VkAttachmentDescriptionFlags         flags;
1516                                                 dsFormat,                                       // VkFormat                                                     format;
1517                                                 m_data.samples,                                                         // VkSampleCountFlagBits                        samples;
1518                                                 VK_ATTACHMENT_LOAD_OP_LOAD,                                     // VkAttachmentLoadOp                           loadOp;
1519                                                 VK_ATTACHMENT_STORE_OP_STORE,                           // VkAttachmentStoreOp                          storeOp;
1520                                                 VK_ATTACHMENT_LOAD_OP_LOAD,                                     // VkAttachmentLoadOp                           stencilLoadOp;
1521                                                 VK_ATTACHMENT_STORE_OP_STORE,                           // VkAttachmentStoreOp                          stencilStoreOp;
1522                                                 VK_IMAGE_LAYOUT_GENERAL,                                        // VkImageLayout                                        initialLayout;
1523                                                 VK_IMAGE_LAYOUT_GENERAL                                         // VkImageLayout                                        finalLayout;
1524                                         }
1525                                         );
1526
1527                                 const VkRenderPassCreateInfo2   renderPassParams        =
1528                                 {
1529                                         VK_STRUCTURE_TYPE_RENDER_PASS_CREATE_INFO_2,                    // sType
1530                                         DE_NULL,                                                                                                // pNext
1531                                         (vk::VkRenderPassCreateFlags)0,
1532                                         (deUint32)attachmentDescriptions.size(),                                // attachmentCount
1533                                         &attachmentDescriptions[0],                                                             // pAttachments
1534                                         1u,                                                                                                             // subpassCount
1535                                         &subpassDesc,                                                                                   // pSubpasses
1536                                         0u,                                                                                                             // dependencyCount
1537                                         DE_NULL,                                                                                                // pDependencies
1538                                         0u,                                                                                                             // correlatedViewMaskCount
1539                                         DE_NULL,                                                                                                // pCorrelatedViewMasks
1540                                 };
1541
1542                                 renderPass = createRenderPass2(vk, device, &renderPassParams);
1543
1544                                 std::vector<VkFramebufferAttachmentImageInfo> framebufferAttachmentImageInfo;
1545                                 framebufferAttachmentImageInfo.push_back(
1546                                         {
1547                                                 VK_STRUCTURE_TYPE_FRAMEBUFFER_ATTACHMENT_IMAGE_INFO,            //  VkStructureType             sType;
1548                                                 DE_NULL,                                                                                                        //  const void*                 pNext;
1549                                                 (VkImageCreateFlags)0u,                                                                         //  VkImageCreateFlags  flags;
1550                                                 cbUsage,                                                                                                        //  VkImageUsageFlags   usage;
1551                                                 m_data.framebufferDim.width,                                                            //  deUint32                    width;
1552                                                 m_data.framebufferDim.height,                                                           //  deUint32                    height;
1553                                                 m_data.numColorLayers,                                                                          //  deUint32                    layerCount;
1554                                                 1u,                                                                                                                     //  deUint32                    viewFormatCount;
1555                                                 &cbFormat                                                                                                       //  const VkFormat*             pViewFormats;
1556                                         }
1557                                 );
1558                                 if (m_data.useAttachment())
1559                                         framebufferAttachmentImageInfo.push_back(
1560                                         {
1561                                                 VK_STRUCTURE_TYPE_FRAMEBUFFER_ATTACHMENT_IMAGE_INFO,            //  VkStructureType             sType;
1562                                                 DE_NULL,                                                                                                        //  const void*                 pNext;
1563                                                 (VkImageCreateFlags)0u,                                                                         //  VkImageCreateFlags  flags;
1564                                                 srUsage,                                                                                                        //  VkImageUsageFlags   usage;
1565                                                 srWidth,                                                                                                        //  deUint32                    width;
1566                                                 srHeight,                                                                                                       //  deUint32                    height;
1567                                                 numSRLayers,                                                                                            //  deUint32                    layerCount;
1568                                                 1u,                                                                                                                     //  deUint32                    viewFormatCount;
1569                                                 &srFormat                                                                                                       //  const VkFormat*             pViewFormats;
1570                                         }
1571                                         );
1572
1573                                 if (m_data.useDepthStencil)
1574                                         framebufferAttachmentImageInfo.push_back(
1575                                         {
1576                                                 VK_STRUCTURE_TYPE_FRAMEBUFFER_ATTACHMENT_IMAGE_INFO,            //  VkStructureType             sType;
1577                                                 DE_NULL,                                                                                                        //  const void*                 pNext;
1578                                                 (VkImageCreateFlags)0u,                                                                         //  VkImageCreateFlags  flags;
1579                                                 dsUsage,                                                                                                        //  VkImageUsageFlags   usage;
1580                                                 m_data.framebufferDim.width,                                                            //  deUint32                    width;
1581                                                 m_data.framebufferDim.height,                                                           //  deUint32                    height;
1582                                                 m_data.numColorLayers,                                                                          //  deUint32                    layerCount;
1583                                                 1u,                                                                                                                     //  deUint32                    viewFormatCount;
1584                                                 &dsFormat                                                                                                       //  const VkFormat*             pViewFormats;
1585                                         }
1586                                         );
1587
1588                                 const VkFramebufferAttachmentsCreateInfo                                framebufferAttachmentsCreateInfo        =
1589                                 {
1590                                         VK_STRUCTURE_TYPE_FRAMEBUFFER_ATTACHMENTS_CREATE_INFO,          //  VkStructureType                                                             sType;
1591                                         DE_NULL,                                                                                                        //  const void*                                                                 pNext;
1592                                         (deUint32)framebufferAttachmentImageInfo.size(),                        //  deUint32                                                                    attachmentImageInfoCount;
1593                                         &framebufferAttachmentImageInfo[0]                                                      //  const VkFramebufferAttachmentImageInfo*             pAttachmentImageInfos;
1594                                 };
1595
1596                                 const vk::VkFramebufferCreateInfo       framebufferParams       =
1597                                 {
1598                                         vk::VK_STRUCTURE_TYPE_FRAMEBUFFER_CREATE_INFO,  // sType
1599                                         imagelessFB ? &framebufferAttachmentsCreateInfo : DE_NULL,                              // pNext
1600                                         (vk::VkFramebufferCreateFlags)(imagelessFB ? VK_FRAMEBUFFER_CREATE_IMAGELESS_BIT : 0),
1601                                         *renderPass,                                                                    // renderPass
1602                                         (deUint32)attachments.size(),                                   // attachmentCount
1603                                         imagelessFB ? DE_NULL : &attachments[0],                // pAttachments
1604                                         m_data.framebufferDim.width,                                    // width
1605                                         m_data.framebufferDim.height,                                   // height
1606                                         m_data.multiView ? 1 : m_data.numColorLayers,   // layers
1607                                 };
1608
1609                                 framebuffer = createFramebuffer(vk, device, &framebufferParams);
1610                         }
1611
1612                         const VkVertexInputBindingDescription           vertexBinding =
1613                         {
1614                                 0u,                                                     // deUint32                             binding;
1615                                 sizeof(float) * 2,                      // deUint32                             stride;
1616                                 VK_VERTEX_INPUT_RATE_VERTEX     // VkVertexInputRate    inputRate;
1617                         };
1618                         const VkVertexInputAttributeDescription         vertexInputAttributeDescription =
1619                         {
1620                                 0u,                                                     // deUint32     location;
1621                                 0u,                                                     // deUint32     binding;
1622                                 VK_FORMAT_R32G32_SFLOAT,        // VkFormat     format;
1623                                 0u                                                      // deUint32     offset;
1624                         };
1625
1626                         const VkPipelineVertexInputStateCreateInfo              vertexInputStateCreateInfo              =
1627                         {
1628                                 VK_STRUCTURE_TYPE_PIPELINE_VERTEX_INPUT_STATE_CREATE_INFO,      // VkStructureType                                                      sType;
1629                                 DE_NULL,                                                                                                        // const void*                                                          pNext;
1630                                 (VkPipelineVertexInputStateCreateFlags)0,                                       // VkPipelineVertexInputStateCreateFlags        flags;
1631                                 1u,                                                                                                                     // deUint32                                                                     vertexBindingDescriptionCount;
1632                                 &vertexBinding,                                                                                         // const VkVertexInputBindingDescription*       pVertexBindingDescriptions;
1633                                 1u,                                                                                                                     // deUint32                                                                     vertexAttributeDescriptionCount;
1634                                 &vertexInputAttributeDescription                                                        // const VkVertexInputAttributeDescription*     pVertexAttributeDescriptions;
1635                         };
1636
1637                         const VkPipelineInputAssemblyStateCreateInfo    inputAssemblyStateCreateInfo    =
1638                         {
1639                                 VK_STRUCTURE_TYPE_PIPELINE_INPUT_ASSEMBLY_STATE_CREATE_INFO,    // VkStructureType                                                      sType;
1640                                 DE_NULL,                                                                                                                // const void*                                                          pNext;
1641                                 (VkPipelineInputAssemblyStateCreateFlags)0,                                             // VkPipelineInputAssemblyStateCreateFlags      flags;
1642                                 VK_PRIMITIVE_TOPOLOGY_TRIANGLE_LIST,                                                    // VkPrimitiveTopology                                          topology;
1643                                 VK_FALSE                                                                                                                // VkBool32                                                                     primitiveRestartEnable;
1644                         };
1645
1646                         const VkPipelineRasterizationConservativeStateCreateInfoEXT consRastState =
1647                         {
1648                                 VK_STRUCTURE_TYPE_PIPELINE_RASTERIZATION_CONSERVATIVE_STATE_CREATE_INFO_EXT,    // VkStructureType                                                                                 sType;
1649                                 DE_NULL,                                                                                                                                                // const void*                                                                                     pNext;
1650                                 (VkPipelineRasterizationConservativeStateCreateFlagsEXT)0,                                              // VkPipelineRasterizationConservativeStateCreateFlagsEXT       flags;
1651                                 m_data.conservativeMode,                                                                                                                // VkConservativeRasterizationModeEXT                                           conservativeRasterizationMode;
1652                                 0.0f,                                                                                                                                                   // float                                                                                                         extraPrimitiveOverestimationSize;
1653                         };
1654
1655                         const VkPipelineRasterizationStateCreateInfo    rasterizationStateCreateInfo    =
1656                         {
1657                                 VK_STRUCTURE_TYPE_PIPELINE_RASTERIZATION_STATE_CREATE_INFO,             // VkStructureType                                                      sType;
1658                                 m_data.conservativeEnable ? &consRastState : DE_NULL,                   // const void*                                                          pNext;
1659                                 (VkPipelineRasterizationStateCreateFlags)0,                                             // VkPipelineRasterizationStateCreateFlags      flags;
1660                                 VK_FALSE,                                                                                                               // VkBool32                                                                     depthClampEnable;
1661                                 VK_FALSE,                                                                                                               // VkBool32                                                                     rasterizerDiscardEnable;
1662                                 VK_POLYGON_MODE_FILL,                                                                                   // VkPolygonMode                                                        polygonMode;
1663                                 VK_CULL_MODE_NONE,                                                                                              // VkCullModeFlags                                                      cullMode;
1664                                 VK_FRONT_FACE_CLOCKWISE,                                                                                // VkFrontFace                                                          frontFace;
1665                                 VK_FALSE,                                                                                                               // VkBool32                                                                     depthBiasEnable;
1666                                 0.0f,                                                                                                                   // float                                                                        depthBiasConstantFactor;
1667                                 0.0f,                                                                                                                   // float                                                                        depthBiasClamp;
1668                                 0.0f,                                                                                                                   // float                                                                        depthBiasSlopeFactor;
1669                                 1.0f                                                                                                                    // float                                                                        lineWidth;
1670                         };
1671
1672                         // Kill some bits from each AA mode
1673                         const VkSampleMask      sampleMask      = m_data.sampleMaskTest ? 0x9 : 0x7D56;
1674                         const VkSampleMask*     pSampleMask = m_data.useApiSampleMask ? &sampleMask : DE_NULL;
1675
1676                         // All samples at pixel center. We'll validate that pixels are fully covered or uncovered.
1677                         std::vector<VkSampleLocationEXT> sampleLocations(m_data.samples, { 0.5f, 0.5f });
1678                         const VkSampleLocationsInfoEXT sampleLocationsInfo =
1679                         {
1680                                 VK_STRUCTURE_TYPE_SAMPLE_LOCATIONS_INFO_EXT,    // VkStructureType                              sType;
1681                                 DE_NULL,                                                                                // const void*                                  pNext;
1682                                 (VkSampleCountFlagBits)m_data.samples,                  // VkSampleCountFlagBits                sampleLocationsPerPixel;
1683                                 { 1, 1 },                                                                               // VkExtent2D                                   sampleLocationGridSize;
1684                                 (deUint32)m_data.samples,                                               // uint32_t                                             sampleLocationsCount;
1685                                 &sampleLocations[0],                                                    // const VkSampleLocationEXT*   pSampleLocations;
1686                         };
1687
1688                         const VkPipelineSampleLocationsStateCreateInfoEXT pipelineSampleLocationsCreateInfo =
1689                         {
1690                                 VK_STRUCTURE_TYPE_PIPELINE_SAMPLE_LOCATIONS_STATE_CREATE_INFO_EXT,      // VkStructureType                      sType;
1691                                 DE_NULL,                                                                                                                        // const void*                          pNext;
1692                                 VK_TRUE,                                                                                                                        // VkBool32                                     sampleLocationsEnable;
1693                                 sampleLocationsInfo,                                                                                            // VkSampleLocationsInfoEXT     sampleLocationsInfo;
1694                         };
1695
1696                         const VkPipelineMultisampleStateCreateInfo              multisampleStateCreateInfo =
1697                         {
1698                                 VK_STRUCTURE_TYPE_PIPELINE_MULTISAMPLE_STATE_CREATE_INFO,       // VkStructureType                                                      sType
1699                                 m_data.sampleLocations ? &pipelineSampleLocationsCreateInfo : DE_NULL,  // const void*                                  pNext
1700                                 0u,                                                                                                                     // VkPipelineMultisampleStateCreateFlags        flags
1701                                 (VkSampleCountFlagBits)m_data.samples,                                          // VkSampleCountFlagBits                                        rasterizationSamples
1702                                 (VkBool32)m_data.sampleShadingEnable,                                           // VkBool32                                                                     sampleShadingEnable
1703                                 1.0f,                                                                                                           // float                                                                        minSampleShading
1704                                 pSampleMask,                                                                                            // const VkSampleMask*                                          pSampleMask
1705                                 VK_FALSE,                                                                                                       // VkBool32                                                                     alphaToCoverageEnable
1706                                 VK_FALSE                                                                                                        // VkBool32                                                                     alphaToOneEnable
1707                         };
1708
1709                         std::vector<VkViewport> viewports;
1710                         std::vector<VkRect2D> scissors;
1711                         if (m_data.multiViewport)
1712                         {
1713                                 // Split the viewport into left and right halves
1714                                 int x0 = 0, x1 = m_data.framebufferDim.width/2, x2 = m_data.framebufferDim.width;
1715
1716                                 viewports.push_back(makeViewport((float)x0, 0, (float)(x1-x0), (float)m_data.framebufferDim.height, 0.0f, 1.0f));
1717                                 scissors.push_back(makeRect2D(x0, 0, x1-x0, m_data.framebufferDim.height));
1718
1719                                 viewports.push_back(makeViewport((float)x1, 0, (float)(x2-x1), (float)m_data.framebufferDim.height, 0.0f, 1.0f));
1720                                 scissors.push_back(makeRect2D(x1, 0, x2-x1, m_data.framebufferDim.height));
1721                         }
1722                         else
1723                         {
1724                                 viewports.push_back(makeViewport(m_data.framebufferDim.width, m_data.framebufferDim.height));
1725                                 scissors.push_back(makeRect2D(m_data.framebufferDim.width, m_data.framebufferDim.height));
1726                         }
1727
1728                         const VkPipelineViewportStateCreateInfo                 viewportStateCreateInfo                         =
1729                         {
1730                                 VK_STRUCTURE_TYPE_PIPELINE_VIEWPORT_STATE_CREATE_INFO,          // VkStructureType                                                      sType
1731                                 DE_NULL,                                                                                                        // const void*                                                          pNext
1732                                 (VkPipelineViewportStateCreateFlags)0,                                          // VkPipelineViewportStateCreateFlags           flags
1733                                 (deUint32)viewports.size(),                                                                     // deUint32                                                                     viewportCount
1734                                 &viewports[0],                                                                                          // const VkViewport*                                            pViewports
1735                                 (deUint32)scissors.size(),                                                                      // deUint32                                                                     scissorCount
1736                                 &scissors[0]                                                                                            // const VkRect2D*                                                      pScissors
1737                         };
1738
1739                         Move<VkShaderModule> fragShader = createShaderModule(vk, device, m_context.getBinaryCollection().get("frag"), 0);
1740                         Move<VkShaderModule> vertShader = createShaderModule(vk, device, m_context.getBinaryCollection().get("vert"), 0);
1741                         Move<VkShaderModule> geomShader;
1742                         if (m_data.geometryShader)
1743                                 geomShader = createShaderModule(vk, device, m_context.getBinaryCollection().get("geom"), 0);
1744
1745                         deUint32 numStages = m_data.geometryShader ? 3 : 2u;
1746
1747                         const VkPipelineShaderStageCreateInfo   shaderCreateInfo[3] =
1748                         {
1749                                 {
1750                                         VK_STRUCTURE_TYPE_PIPELINE_SHADER_STAGE_CREATE_INFO,
1751                                         DE_NULL,
1752                                         (VkPipelineShaderStageCreateFlags)0,
1753                                         VK_SHADER_STAGE_VERTEX_BIT,                                                                     // stage
1754                                         *vertShader,                                                                                            // shader
1755                                         "main",
1756                                         DE_NULL,                                                                                                        // pSpecializationInfo
1757                                 },
1758                                 {
1759                                         VK_STRUCTURE_TYPE_PIPELINE_SHADER_STAGE_CREATE_INFO,
1760                                         DE_NULL,
1761                                         (VkPipelineShaderStageCreateFlags)0,
1762                                         VK_SHADER_STAGE_FRAGMENT_BIT,                                                           // stage
1763                                         *fragShader,                                                                                            // shader
1764                                         "main",
1765                                         DE_NULL,                                                                                                        // pSpecializationInfo
1766                                 },
1767                                 {
1768                                         VK_STRUCTURE_TYPE_PIPELINE_SHADER_STAGE_CREATE_INFO,
1769                                         DE_NULL,
1770                                         (VkPipelineShaderStageCreateFlags)0,
1771                                         VK_SHADER_STAGE_GEOMETRY_BIT,                                                           // stage
1772                                         *geomShader,                                                                                            // shader
1773                                         "main",
1774                                         DE_NULL,                                                                                                        // pSpecializationInfo
1775                                 }
1776                         };
1777
1778                         const VkPipelineColorBlendAttachmentState               colorBlendAttachmentState               =
1779                         {
1780                                 VK_FALSE,                               // VkBool32                                      blendEnable;
1781                                 VK_BLEND_FACTOR_ZERO,   // VkBlendFactor                        srcColorBlendFactor;
1782                                 VK_BLEND_FACTOR_ZERO,   // VkBlendFactor                        dstColorBlendFactor;
1783                                 VK_BLEND_OP_ADD,                // VkBlendOp                            colorBlendOp;
1784                                 VK_BLEND_FACTOR_ZERO,   // VkBlendFactor                        srcAlphaBlendFactor;
1785                                 VK_BLEND_FACTOR_ZERO,   // VkBlendFactor                        dstAlphaBlendFactor;
1786                                 VK_BLEND_OP_ADD,                // VkBlendOp                            alphaBlendOp;
1787                                 0xf                                             // VkColorComponentFlags        colorWriteMask;
1788                         };
1789
1790                         const VkPipelineColorBlendStateCreateInfo               colorBlendStateCreateInfo               =
1791                         {
1792                                 VK_STRUCTURE_TYPE_PIPELINE_COLOR_BLEND_STATE_CREATE_INFO,       // VkStructureType                                                              sType;
1793                                 DE_NULL,                                                                                                        // const void*                                                                  pNext;
1794                                 0u,                                                                                                                     // VkPipelineColorBlendStateCreateFlags                 flags;
1795                                 VK_FALSE,                                                                                                       // VkBool32                                                                             logicOpEnable;
1796                                 VK_LOGIC_OP_COPY,                                                                                       // VkLogicOp                                                                    logicOp;
1797                                 1u,                                                                                                                     // deUint32                                                                             attachmentCount;
1798                                 &colorBlendAttachmentState,                                                                     // const VkPipelineColorBlendAttachmentState*   pAttachments;
1799                                 { 1.0f, 1.0f, 1.0f, 1.0f }                                                                      // float                                                                                blendConstants[4];
1800                         };
1801
1802                         const deUint32 fragSizeWH = m_data.sampleMaskTest ? 2 : 0;
1803
1804                         VkPipelineRenderingCreateInfoKHR renderingCreateInfo
1805                         {
1806                                 VK_STRUCTURE_TYPE_PIPELINE_RENDERING_CREATE_INFO_KHR,
1807                                 DE_NULL,
1808                                 m_data.multiView ? 0x3 : 0u,
1809                                 1u,
1810                                 &cbFormat,
1811                                 m_data.useDepthStencil ? dsFormat : VK_FORMAT_UNDEFINED,
1812                                 m_data.useDepthStencil ? dsFormat : VK_FORMAT_UNDEFINED
1813                         };
1814
1815                         VkPipelineFragmentShadingRateStateCreateInfoKHR shadingRateStateCreateInfo =
1816                         {
1817                                 VK_STRUCTURE_TYPE_PIPELINE_FRAGMENT_SHADING_RATE_STATE_CREATE_INFO_KHR, // VkStructureType                                              sType;
1818                                 m_data.useDynamicRendering ? &renderingCreateInfo : DE_NULL,                    // const void*                                                  pNext;
1819                                 { fragSizeWH, fragSizeWH },                                                                                             // VkExtent2D                                                   fragmentSize;
1820                                 { m_data.combinerOp[0], m_data.combinerOp[1] },                                                 // VkFragmentShadingRateCombinerOpKHR   combinerOps[2];
1821                         };
1822
1823                         VkDynamicState dynamicState = VK_DYNAMIC_STATE_FRAGMENT_SHADING_RATE_KHR;
1824                         const VkPipelineDynamicStateCreateInfo dynamicStateCreateInfo =
1825                         {
1826                                 VK_STRUCTURE_TYPE_PIPELINE_DYNAMIC_STATE_CREATE_INFO,           // VkStructureType                                              sType;
1827                                 DE_NULL,                                                                                                        // const void*                                                  pNext;
1828                                 (VkPipelineDynamicStateCreateFlags)0,                                           // VkPipelineDynamicStateCreateFlags    flags;
1829                                 m_data.useDynamicState ? 1u : 0u,                                                       // uint32_t                                                             dynamicStateCount;
1830                                 &dynamicState,                                                                                          // const VkDynamicState*                                pDynamicStates;
1831                         };
1832
1833                         // Enable depth/stencil writes, always passing
1834                         VkPipelineDepthStencilStateCreateInfo           depthStencilStateParams                         =
1835                         {
1836                                 VK_STRUCTURE_TYPE_PIPELINE_DEPTH_STENCIL_STATE_CREATE_INFO,     // VkStructureType                                                      sType;
1837                                 DE_NULL,                                                                                                        // const void*                                                          pNext;
1838                                 0u,                                                                                                                     // VkPipelineDepthStencilStateCreateFlags       flags;
1839                                 VK_TRUE,                                                                                                        // VkBool32                                                                     depthTestEnable;
1840                                 VK_TRUE,                                                                                                        // VkBool32                                                                     depthWriteEnable;
1841                                 VK_COMPARE_OP_ALWAYS,                                                                           // VkCompareOp                                                          depthCompareOp;
1842                                 VK_FALSE,                                                                                                       // VkBool32                                                                     depthBoundsTestEnable;
1843                                 VK_TRUE,                                                                                                        // VkBool32                                                                     stencilTestEnable;
1844                                 // VkStencilOpState     front;
1845                                 {
1846                                         VK_STENCIL_OP_REPLACE,  // VkStencilOp  failOp;
1847                                         VK_STENCIL_OP_REPLACE,  // VkStencilOp  passOp;
1848                                         VK_STENCIL_OP_REPLACE,  // VkStencilOp  depthFailOp;
1849                                         VK_COMPARE_OP_ALWAYS,   // VkCompareOp  compareOp;
1850                                         0u,                                             // deUint32             compareMask;
1851                                         0xFFu,                                  // deUint32             writeMask;
1852                                         0xFFu,                                  // deUint32             reference;
1853                                 },
1854                                 // VkStencilOpState     back;
1855                                 {
1856                                         VK_STENCIL_OP_REPLACE,  // VkStencilOp  failOp;
1857                                         VK_STENCIL_OP_REPLACE,  // VkStencilOp  passOp;
1858                                         VK_STENCIL_OP_REPLACE,  // VkStencilOp  depthFailOp;
1859                                         VK_COMPARE_OP_ALWAYS,   // VkCompareOp  compareOp;
1860                                         0u,                                             // deUint32             compareMask;
1861                                         0xFFu,                                  // deUint32             writeMask;
1862                                         0xFFu,                                  // deUint32             reference;
1863                                 },
1864                                 0.0f,                                           // float                        minDepthBounds;
1865                                 0.0f,                                           // float                        maxDepthBounds;
1866                         };
1867
1868                         VkGraphicsPipelineCreateInfo graphicsPipelineCreateInfo =
1869                         {
1870                                 VK_STRUCTURE_TYPE_GRAPHICS_PIPELINE_CREATE_INFO,        // VkStructureType                                                                      sType;
1871                                 &shadingRateStateCreateInfo,                                            // const void*                                                                          pNext;
1872                                 (VkPipelineCreateFlags)0,                                                       // VkPipelineCreateFlags                                                        flags;
1873                                 numStages,                                                                                      // deUint32                                                                                     stageCount;
1874                                 &shaderCreateInfo[0],                                                           // const VkPipelineShaderStageCreateInfo*                       pStages;
1875                                 &vertexInputStateCreateInfo,                                            // const VkPipelineVertexInputStateCreateInfo*          pVertexInputState;
1876                                 &inputAssemblyStateCreateInfo,                                          // const VkPipelineInputAssemblyStateCreateInfo*        pInputAssemblyState;
1877                                 DE_NULL,                                                                                        // const VkPipelineTessellationStateCreateInfo*         pTessellationState;
1878                                 &viewportStateCreateInfo,                                                       // const VkPipelineViewportStateCreateInfo*                     pViewportState;
1879                                 &rasterizationStateCreateInfo,                                          // const VkPipelineRasterizationStateCreateInfo*        pRasterizationState;
1880                                 &multisampleStateCreateInfo,                                            // const VkPipelineMultisampleStateCreateInfo*          pMultisampleState;
1881                                 &depthStencilStateParams,                                                       // const VkPipelineDepthStencilStateCreateInfo*         pDepthStencilState;
1882                                 &colorBlendStateCreateInfo,                                                     // const VkPipelineColorBlendStateCreateInfo*           pColorBlendState;
1883                                 &dynamicStateCreateInfo,                                                        // const VkPipelineDynamicStateCreateInfo*                      pDynamicState;
1884                                 pipelineLayout.get(),                                                           // VkPipelineLayout                                                                     layout;
1885                                 renderPass.get(),                                                                       // VkRenderPass                                                                         renderPass;
1886                                 0u,                                                                                                     // deUint32                                                                                     subpass;
1887                                 DE_NULL,                                                                                        // VkPipeline                                                                           basePipelineHandle;
1888                                 0                                                                                                       // int                                                                                          basePipelineIndex;
1889                         };
1890
1891                         if (m_data.useDynamicRendering)
1892                                 graphicsPipelineCreateInfo.flags |= VK_PIPELINE_CREATE_RENDERING_FRAGMENT_SHADING_RATE_ATTACHMENT_BIT_KHR;
1893
1894                         VkImageMemoryBarrier imageBarrier =
1895                         {
1896                                 VK_STRUCTURE_TYPE_IMAGE_MEMORY_BARRIER,                         // VkStructureType              sType
1897                                 DE_NULL,                                                                                        // const void*                  pNext
1898                                 0u,                                                                                                     // VkAccessFlags                srcAccessMask
1899                                 VK_ACCESS_TRANSFER_WRITE_BIT,                                           // VkAccessFlags                dstAccessMask
1900                                 VK_IMAGE_LAYOUT_UNDEFINED,                                                      // VkImageLayout                oldLayout
1901                                 VK_IMAGE_LAYOUT_GENERAL,                                                        // VkImageLayout                newLayout
1902                                 VK_QUEUE_FAMILY_IGNORED,                                                        // uint32_t                             srcQueueFamilyIndex
1903                                 VK_QUEUE_FAMILY_IGNORED,                                                        // uint32_t                             dstQueueFamilyIndex
1904                                 **cbImage,                                                                                      // VkImage                              image
1905                                 {
1906                                         VK_IMAGE_ASPECT_COLOR_BIT,                              // VkImageAspectFlags   aspectMask
1907                                         0u,                                                                             // uint32_t                             baseMipLevel
1908                                         VK_REMAINING_MIP_LEVELS,                                // uint32_t                             mipLevels,
1909                                         0u,                                                                             // uint32_t                             baseArray
1910                                         VK_REMAINING_ARRAY_LAYERS,                              // uint32_t                             arraySize
1911                                 }
1912                         };
1913
1914                         const VkQueue                                   queue                                   = m_context.getUniversalQueue();
1915                         Move<VkCommandPool>                             cmdPool                                 = createCommandPool(vk, device, VK_COMMAND_POOL_CREATE_RESET_COMMAND_BUFFER_BIT, m_context.getUniversalQueueFamilyIndex());
1916                         Move<VkCommandBuffer>                   cmdBuffer                               = allocateCommandBuffer(vk, device, *cmdPool, VK_COMMAND_BUFFER_LEVEL_PRIMARY);
1917                         VkClearValue                                    clearColor                              = makeClearValueColorU32(0, 0, 0, 0);
1918                         VkClearValue                                    clearDepthStencil               = makeClearValueDepthStencil(0.0, 0);
1919
1920                         beginCommandBuffer(vk, *cmdBuffer, 0u);
1921
1922                         vk.cmdPipelineBarrier(*cmdBuffer, VK_PIPELINE_STAGE_TOP_OF_PIPE_BIT, VK_PIPELINE_STAGE_TRANSFER_BIT,
1923                                                                         (VkDependencyFlags)0,
1924                                                                         0, (const VkMemoryBarrier*)DE_NULL,
1925                                                                         0, (const VkBufferMemoryBarrier*)DE_NULL,
1926                                                                         1, &imageBarrier);
1927
1928                         imageBarrier.image = **derivImage;
1929                         imageBarrier.newLayout = VK_IMAGE_LAYOUT_GENERAL;
1930
1931                         vk.cmdPipelineBarrier(*cmdBuffer, VK_PIPELINE_STAGE_TOP_OF_PIPE_BIT, VK_PIPELINE_STAGE_TRANSFER_BIT,
1932                                                                         (VkDependencyFlags)0,
1933                                                                         0, (const VkMemoryBarrier*)DE_NULL,
1934                                                                         0, (const VkBufferMemoryBarrier*)DE_NULL,
1935                                                                         1, &imageBarrier);
1936
1937                         // Clear level to 1<<level
1938                         for (deUint32 i = 0; i < derivNumLevels; ++i)
1939                         {
1940                                 VkImageSubresourceRange range = makeImageSubresourceRange(VK_IMAGE_ASPECT_COLOR_BIT, i, 1u, 0u, 1u);
1941                                 VkClearValue clearLevelColor = makeClearValueColorU32(1<<i,0,0,0);
1942                                 vk.cmdClearColorImage(*cmdBuffer, **derivImage, VK_IMAGE_LAYOUT_GENERAL, &clearLevelColor.color, 1, &range);
1943                         }
1944
1945                         // Clear color buffer to transparent black
1946                         {
1947                                 VkImageSubresourceRange range = makeImageSubresourceRange(VK_IMAGE_ASPECT_COLOR_BIT, 0u, 1u, 0u, VK_REMAINING_ARRAY_LAYERS);
1948                                 vk.cmdClearColorImage(*cmdBuffer, **cbImage, VK_IMAGE_LAYOUT_GENERAL, &clearColor.color, 1, &range);
1949                         }
1950
1951                         // Clear depth and stencil
1952                         if (m_data.useDepthStencil)
1953                         {
1954                                 VkImageSubresourceRange range = makeImageSubresourceRange(VK_IMAGE_ASPECT_DEPTH_BIT | VK_IMAGE_ASPECT_STENCIL_BIT, 0u, 1u, 0u, VK_REMAINING_ARRAY_LAYERS);
1955                                 VkImageMemoryBarrier dsBarrier = imageBarrier;
1956                                 dsBarrier.image = **dsImage;
1957                                 dsBarrier.newLayout = VK_IMAGE_LAYOUT_GENERAL;
1958                                 dsBarrier.subresourceRange = range;
1959                                 vk.cmdPipelineBarrier(*cmdBuffer, VK_PIPELINE_STAGE_TOP_OF_PIPE_BIT, VK_PIPELINE_STAGE_TRANSFER_BIT,
1960                                                                                 0u, // dependencyFlags
1961                                                                                 0u, nullptr,
1962                                                                                 0u, nullptr,
1963                                                                                 1u, &dsBarrier);
1964                                 vk.cmdClearDepthStencilImage(*cmdBuffer, **dsImage, VK_IMAGE_LAYOUT_GENERAL, &clearDepthStencil.depthStencil, 1, &range);
1965                         }
1966
1967                         // Initialize shading rate image with varying values
1968                         if (m_data.useAttachment())
1969                         {
1970                                 imageBarrier.image = **srImage;
1971                                 imageBarrier.newLayout = VK_IMAGE_LAYOUT_GENERAL;
1972
1973                                 vk.cmdPipelineBarrier(*cmdBuffer, VK_PIPELINE_STAGE_BOTTOM_OF_PIPE_BIT, VK_PIPELINE_STAGE_TRANSFER_BIT,
1974                                                                                 (VkDependencyFlags)0,
1975                                                                                 0, (const VkMemoryBarrier*)DE_NULL,
1976                                                                                 0, (const VkBufferMemoryBarrier*)DE_NULL,
1977                                                                                 1, &imageBarrier);
1978
1979                                 deMemset(fillPtr, 0, (size_t)srFillBufferSize);
1980                                 for (deUint32 layer = 0; layer < numSRLayers; ++layer)
1981                                 {
1982                                         for (deUint32 x = 0; x < srWidth; ++x)
1983                                         {
1984                                                 for (deUint32 y = 0; y < srHeight; ++y)
1985                                                 {
1986                                                         deUint32 idx = (layer*srHeight + y)*srWidth + x;
1987                                                         deUint8 val = (deUint8)SanitizeRate(idx & 0xF);
1988                                                         // actual shading rate is always in the LSBs of the first byte of a texel
1989                                                         fillPtr[srFillBpp*idx] = val;
1990                                                 }
1991                                         }
1992                                 }
1993                                 flushAlloc(vk, device, srFillBuffer->getAllocation());
1994
1995                                 const VkBufferImageCopy                         copyRegion                                                      =
1996                                 {
1997                                         0u,                                                                                                                                     // VkDeviceSize                 bufferOffset;
1998                                         0u,                                                                                                                                     // deUint32                             bufferRowLength;
1999                                         0u,                                                                                                                                     // deUint32                             bufferImageHeight;
2000                                         {
2001                                                 VK_IMAGE_ASPECT_COLOR_BIT,                                                                              // VkImageAspectFlags   aspect;
2002                                                 0u,                                                                                                                             // deUint32                             mipLevel;
2003                                                 0u,                                                                                                                             // deUint32                             baseArrayLayer;
2004                                                 numSRLayers,                                                                                                    // deUint32                             layerCount;
2005                                         },                                                                                                                                      // VkImageSubresourceLayers imageSubresource;
2006                                         { 0, 0, 0 },                                                                                                            // VkOffset3D                   imageOffset;
2007                                         { srWidth, srHeight, 1 },                                                                                       // VkExtent3D                   imageExtent;
2008                                 };
2009
2010                                 vk.cmdCopyBufferToImage(*cmdBuffer, **srFillBuffer, **srImage, VK_IMAGE_LAYOUT_GENERAL, 1, &copyRegion);
2011
2012                                 imageBarrier.oldLayout = VK_IMAGE_LAYOUT_GENERAL;
2013                                 imageBarrier.newLayout = srLayout;
2014
2015                                 vk.cmdPipelineBarrier(*cmdBuffer, VK_PIPELINE_STAGE_BOTTOM_OF_PIPE_BIT, VK_PIPELINE_STAGE_TRANSFER_BIT,
2016                                                                                 (VkDependencyFlags)0,
2017                                                                                 0, (const VkMemoryBarrier*)DE_NULL,
2018                                                                                 0, (const VkBufferMemoryBarrier*)DE_NULL,
2019                                                                                 1, &imageBarrier);
2020                         }
2021
2022                         VkMemoryBarrier                                 memBarrier =
2023                         {
2024                                 VK_STRUCTURE_TYPE_MEMORY_BARRIER,       // sType
2025                                 DE_NULL,                                                        // pNext
2026                                 0u,                                                                     // srcAccessMask
2027                                 0u,                                                                     // dstAccessMask
2028                         };
2029
2030                         memBarrier.srcAccessMask = VK_ACCESS_TRANSFER_WRITE_BIT;
2031                         memBarrier.dstAccessMask = VK_ACCESS_SHADER_READ_BIT | VK_ACCESS_SHADER_WRITE_BIT | VK_ACCESS_FRAGMENT_SHADING_RATE_ATTACHMENT_READ_BIT_KHR;
2032                         vk.cmdPipelineBarrier(*cmdBuffer, VK_PIPELINE_STAGE_TRANSFER_BIT, allPipelineStages,
2033                                 0, 1, &memBarrier, 0, DE_NULL, 0, DE_NULL);
2034
2035                         vk.cmdBindDescriptorSets(*cmdBuffer, VK_PIPELINE_BIND_POINT_GRAPHICS, *pipelineLayout, 0, 1, &descriptorSet.get(), 0, DE_NULL);
2036
2037                         vector<Move<VkPipeline>> pipelines;
2038
2039                         // If using dynamic state, create a single graphics pipeline and bind it
2040                         if (m_data.useDynamicState)
2041                         {
2042                                 pipelines.push_back(createGraphicsPipeline(vk, device, DE_NULL, &graphicsPipelineCreateInfo));
2043                                 vk.cmdBindPipeline(*cmdBuffer, VK_PIPELINE_BIND_POINT_GRAPHICS, *pipelines[0]);
2044                         }
2045
2046                         VkRect2D renderArea = makeRect2D(m_data.framebufferDim.width, m_data.framebufferDim.height);
2047                         if (m_data.useDynamicRendering)
2048                         {
2049                                 VkRenderingFragmentShadingRateAttachmentInfoKHR shadingRateAttachmentInfo
2050                                 {
2051                                         VK_STRUCTURE_TYPE_RENDERING_FRAGMENT_SHADING_RATE_ATTACHMENT_INFO_KHR,  // VkStructureType              sType;
2052                                         DE_NULL,                                                                                                                                // const void*                  pNext;
2053                                         *srImageView,                                                                                                                   // VkImageView                  imageView;
2054                                         srLayout,                                                                                                                               // VkImageLayout                imageLayout;
2055                                         { srTexelWidth, srTexelHeight }                                                                                 // VkExtent2D                   shadingRateAttachmentTexelSize;
2056                                 };
2057
2058                                 VkRenderingAttachmentInfoKHR colorAttachment
2059                                 {
2060                                         vk::VK_STRUCTURE_TYPE_RENDERING_ATTACHMENT_INFO_KHR,                                    // VkStructureType                                              sType;
2061                                         DE_NULL,                                                                                                                                // const void*                                                  pNext;
2062                                         *cbImageView,                                                                                                                   // VkImageView                                                  imageView;
2063                                         VK_IMAGE_LAYOUT_GENERAL,                                                                                                // VkImageLayout                                                imageLayout;
2064                                         VK_RESOLVE_MODE_NONE,                                                                                                   // VkResolveModeFlagBits                                resolveMode;
2065                                         DE_NULL,                                                                                                                                // VkImageView                                                  resolveImageView;
2066                                         VK_IMAGE_LAYOUT_UNDEFINED,                                                                                              // VkImageLayout                                                resolveImageLayout;
2067                                         VK_ATTACHMENT_LOAD_OP_LOAD,                                                                                             // VkAttachmentLoadOp                                   loadOp;
2068                                         VK_ATTACHMENT_STORE_OP_STORE,                                                                                   // VkAttachmentStoreOp                                  storeOp;
2069                                         clearColor                                                                                                                              // VkClearValue                                                 clearValue;
2070                                 };
2071
2072                                 std::vector<VkRenderingAttachmentInfoKHR> depthStencilAttachments(2,
2073                                 {
2074                                         VK_STRUCTURE_TYPE_RENDERING_ATTACHMENT_INFO_KHR,                                                // VkStructureType                                              sType;
2075                                         DE_NULL,                                                                                                                                // const void*                                                  pNext;
2076                                         *dsImageView,                                                                                                                   // VkImageView                                                  imageView;
2077                                         VK_IMAGE_LAYOUT_GENERAL,                                                                                                // VkImageLayout                                                imageLayout;
2078                                         VK_RESOLVE_MODE_NONE,                                                                                                   // VkResolveModeFlagBits                                resolveMode;
2079                                         DE_NULL,                                                                                                                                // VkImageView                                                  resolveImageView;
2080                                         VK_IMAGE_LAYOUT_UNDEFINED,                                                                                              // VkImageLayout                                                resolveImageLayout;
2081                                         VK_ATTACHMENT_LOAD_OP_LOAD,                                                                                             // VkAttachmentLoadOp                                   loadOp;
2082                                         VK_ATTACHMENT_STORE_OP_STORE,                                                                                   // VkAttachmentStoreOp                                  storeOp;
2083                                         clearDepthStencil                                                                                                               // VkClearValue                                                 clearValue;
2084                                 });
2085
2086                                 vk::VkRenderingInfoKHR renderingInfo
2087                                 {
2088                                         vk::VK_STRUCTURE_TYPE_RENDERING_INFO_KHR,
2089                                         m_data.useAttachment() ? &shadingRateAttachmentInfo : DE_NULL,
2090                                         0,                                                                                                                                              // VkRenderingFlagsKHR                                  flags;
2091                                         renderArea,                                                                                                                             // VkRect2D                                                             renderArea;
2092                                         m_data.multiView ? 1 : m_data.numColorLayers,                                                   // deUint32                                                             layerCount;
2093                                         m_data.multiView ? 0x3 : 0u,                                                                                    // deUint32                                                             viewMask;
2094                                         1u,                                                                                                                                             // deUint32                                                             colorAttachmentCount;
2095                                         &colorAttachment,                                                                                                               // const VkRenderingAttachmentInfoKHR*  pColorAttachments;
2096                                         m_data.useDepthStencil ? &depthStencilAttachments[0] : DE_NULL,                 // const VkRenderingAttachmentInfoKHR*  pDepthAttachment;
2097                                         m_data.useDepthStencil ? &depthStencilAttachments[1] : DE_NULL,                 // const VkRenderingAttachmentInfoKHR*  pStencilAttachment;
2098                                 };
2099
2100                                 vk.cmdBeginRendering(*cmdBuffer, &renderingInfo);
2101                         }
2102                         else
2103                         {
2104                                 const VkRenderPassAttachmentBeginInfo renderPassAttachmentBeginInfo
2105                                 {
2106                                         VK_STRUCTURE_TYPE_RENDER_PASS_ATTACHMENT_BEGIN_INFO,            //  VkStructureType             sType;
2107                                         DE_NULL,                                                                                                        //  const void*                 pNext;
2108                                         (deUint32)attachments.size(),                                                           //  deUint32                    attachmentCount;
2109                                         &attachments[0]                                                                                         //  const VkImageView*  pAttachments;
2110                                 };
2111
2112                                 beginRenderPass(vk, *cmdBuffer, *renderPass, *framebuffer, renderArea,
2113                                                                 0, DE_NULL, VK_SUBPASS_CONTENTS_INLINE, imagelessFB ? &renderPassAttachmentBeginInfo : DE_NULL);
2114                         }
2115
2116                         for (deInt32 i = 0; i < NUM_TRIANGLES; ++i)
2117                         {
2118                                 // Bind vertex attributes pointing to the next triangle
2119                                 VkDeviceSize vertexBufferOffset = i*3*2*sizeof(float);
2120                                 VkBuffer vb = **vertexBuffer;
2121                                 vk.cmdBindVertexBuffers(*cmdBuffer, 0, 1, &vb, &vertexBufferOffset);
2122
2123                                 // Put primitive shading rate in a push constant
2124                                 deInt32 shadingRatePC = PrimIDToPrimitiveShadingRate(i);
2125                                 vk.cmdPushConstants(*cmdBuffer, *pipelineLayout, allShaderStages, 0, sizeof(shadingRatePC), &shadingRatePC);
2126
2127                                 if (m_data.useDynamicState)
2128                                 {
2129                                         VkExtent2D fragmentSize = ShadingRateEnumToExtent(PrimIDToPipelineShadingRate(i));
2130                                         vk.cmdSetFragmentShadingRateKHR(*cmdBuffer, &fragmentSize, m_data.combinerOp);
2131                                 }
2132                                 else
2133                                 {
2134                                         // Create a new pipeline with the desired pipeline shading rate
2135                                         shadingRateStateCreateInfo.fragmentSize = ShadingRateEnumToExtent(PrimIDToPipelineShadingRate(i));
2136                                         pipelines.push_back(createGraphicsPipeline(vk, device, DE_NULL, &graphicsPipelineCreateInfo));
2137                                         vk.cmdBindPipeline(*cmdBuffer, VK_PIPELINE_BIND_POINT_GRAPHICS, *pipelines.back());
2138                                 }
2139
2140                                 // Draw one triangle, with "primitive ID" in gl_InstanceIndex
2141                                 vk.cmdDraw(*cmdBuffer, 3u, 1, 0u, i);
2142                         }
2143
2144                         if (m_data.useDynamicRendering)
2145                                 endRendering(vk, *cmdBuffer);
2146                         else
2147                                 endRenderPass(vk, *cmdBuffer);
2148
2149                         memBarrier.srcAccessMask = VK_ACCESS_SHADER_READ_BIT | VK_ACCESS_SHADER_WRITE_BIT | VK_ACCESS_COLOR_ATTACHMENT_WRITE_BIT | VK_ACCESS_DEPTH_STENCIL_ATTACHMENT_WRITE_BIT;
2150                         memBarrier.dstAccessMask = VK_ACCESS_SHADER_READ_BIT | VK_ACCESS_SHADER_WRITE_BIT;
2151                         vk.cmdPipelineBarrier(*cmdBuffer, allPipelineStages, allPipelineStages,
2152                                 0, 1, &memBarrier, 0, DE_NULL, 0, DE_NULL);
2153
2154                         vk.cmdBindDescriptorSets(*cmdBuffer, VK_PIPELINE_BIND_POINT_COMPUTE, *pipelineLayout, 0u, 1, &*descriptorSet, 0u, DE_NULL);
2155                         vk.cmdBindPipeline(*cmdBuffer, VK_PIPELINE_BIND_POINT_COMPUTE, *computePipeline);
2156
2157                         // Copy color/depth/stencil buffers to buffer memory
2158                         vk.cmdDispatch(*cmdBuffer, m_data.framebufferDim.width, m_data.framebufferDim.height, m_data.numColorLayers);
2159
2160                         memBarrier.srcAccessMask = VK_ACCESS_SHADER_WRITE_BIT;
2161                         memBarrier.dstAccessMask = VK_ACCESS_HOST_READ_BIT;
2162                         vk.cmdPipelineBarrier(*cmdBuffer, VK_PIPELINE_STAGE_COMPUTE_SHADER_BIT, VK_PIPELINE_STAGE_HOST_BIT,
2163                                 0, 1, &memBarrier, 0, DE_NULL, 0, DE_NULL);
2164
2165                         endCommandBuffer(vk, *cmdBuffer);
2166
2167                         submitCommandsAndWait(vk, device, queue, cmdBuffer.get());
2168
2169                         deUint32 *colorptr = (deUint32 *)colorOutputBuffer->getAllocation().getHostPtr();
2170                         invalidateAlloc(vk, device, colorOutputBuffer->getAllocation());
2171
2172                         invalidateAlloc(vk, device, atomicBuffer->getAllocation());
2173
2174                         float *depthptr = DE_NULL;
2175                         deUint32 *stencilptr = DE_NULL;
2176
2177                         if (m_data.useDepthStencil)
2178                         {
2179                                 depthptr = (float *)depthOutputBuffer->getAllocation().getHostPtr();
2180                                 invalidateAlloc(vk, device, depthOutputBuffer->getAllocation());
2181
2182                                 stencilptr = (deUint32 *)stencilOutputBuffer->getAllocation().getHostPtr();
2183                                 invalidateAlloc(vk, device, stencilOutputBuffer->getAllocation());
2184                         }
2185
2186                         // Loop over all samples and validate the output
2187                         for (deUint32 layer = 0; layer < m_data.numColorLayers && res == QP_TEST_RESULT_PASS; ++layer)
2188                         {
2189                                 for (deUint32 y = 0; y < m_data.framebufferDim.height && res == QP_TEST_RESULT_PASS; ++y)
2190                                 {
2191                                         for (deUint32 x = 0; x < m_data.framebufferDim.width && res == QP_TEST_RESULT_PASS; ++x)
2192                                         {
2193                                                 for (deInt32 s = 0; s < m_data.samples && res == QP_TEST_RESULT_PASS; ++s)
2194                                                 {
2195                                                         deUint32 *sample = &colorptr[4*(((layer * m_data.framebufferDim.height + y) * m_data.framebufferDim.width + x)*m_data.samples + s)];
2196
2197                                                         // If testing the rasterizer sample mask, if this sample is not set in the
2198                                                         // mask then it shouldn't have written anything.
2199                                                         if (m_data.useApiSampleMask && !(sampleMask & (1 << s)) && sample[2] != 0)
2200                                                         {
2201                                                                 log << tcu::TestLog::Message << std::hex << "sample written despite pSampleMask (" << x << "," << y << ",sample " << s << ")" << tcu::TestLog::EndMessage;
2202                                                                 res = QP_TEST_RESULT_FAIL;
2203                                                                 continue;
2204                                                         }
2205
2206                                                         // The sample isn't covered by any primitives, skip it
2207                                                         if (sample[2] == 0)
2208                                                                 continue;
2209
2210                                                         // skip samples that have the same value as sample zero - it would be redundant to check them.
2211                                                         if (s > 0)
2212                                                         {
2213                                                                 deUint32 *sample0 = &colorptr[4*(((layer * m_data.framebufferDim.height + y) * m_data.framebufferDim.width + x)*m_data.samples + 0)];
2214                                                                 bool same = deMemCmp(sample, sample0, 16) == 0;
2215
2216                                                                 if (m_data.fragDepth)
2217                                                                 {
2218                                                                         float *dsample = &depthptr[((layer * m_data.framebufferDim.height + y) * m_data.framebufferDim.width + x)*m_data.samples + s];
2219                                                                         float *dsample0 = &depthptr[((layer * m_data.framebufferDim.height + y) * m_data.framebufferDim.width + x)*m_data.samples + 0];
2220                                                                         same = same && (*dsample == *dsample0);
2221                                                                 }
2222
2223                                                                 if (m_data.fragStencil)
2224                                                                 {
2225                                                                         deUint32 *ssample = &stencilptr[((layer * m_data.framebufferDim.height + y) * m_data.framebufferDim.width + x)*m_data.samples + s];
2226                                                                         deUint32 *ssample0 = &stencilptr[((layer * m_data.framebufferDim.height + y) * m_data.framebufferDim.width + x)*m_data.samples + 0];
2227                                                                         same = same && (*ssample == *ssample0);
2228                                                                 }
2229
2230                                                                 if (same)
2231                                                                         continue;
2232                                                         }
2233
2234                                                         // Fragment shader writes error codes to .w component.
2235                                                         // All nonzero values are unconditionally failures
2236                                                         if (sample[3] != 0)
2237                                                         {
2238                                                                 if (sample[3] == ERROR_FRAGCOORD_CENTER)
2239                                                                         log << tcu::TestLog::Message << std::hex << "fragcoord test failed pixel (0x" << x << ",0x" << y << ",sample 0x" << s << ")" << tcu::TestLog::EndMessage;
2240                                                                 else if (sample[3] == ERROR_VTG_READBACK)
2241                                                                         log << tcu::TestLog::Message << std::hex << "vs/gs output readback test failed pixel (0x" << x << ",0x" << y << ",sample 0x" << s << ")" << tcu::TestLog::EndMessage;
2242                                                                 else if ((sample[3] & 0xFF) == ERROR_FRAGCOORD_DERIV)
2243                                                                         log << tcu::TestLog::Message << std::hex << "fragcoord derivative test failed pixel (0x" << x << ",0x" << y << ",sample 0x" << s << ")="
2244                                                                                                                                                                 "(0x" << ((sample[3] >>  8) & 0x3F) << ",0x" << ((sample[3] >> 14) & 0x3F) << "), expected="
2245                                                                                                                                                                 "(0x" << ((sample[3] >> 20) & 0x3F) << ",0x" << ((sample[3] >> 26) & 0x3F) << ")" << tcu::TestLog::EndMessage;
2246                                                                 else if ((sample[3] & 0xFF) == ERROR_FRAGCOORD_IMPLICIT_DERIV)
2247                                                                         log << tcu::TestLog::Message << std::hex << "implicit derivative test failed pixel (0x" << x << ",0x" << y << ",sample 0x" << s << ")="
2248                                                                                                                                                                 "(0x" << ((sample[3] >>  8) & 0x3F) << ",0x" << ((sample[3] >> 14) & 0x3F) << "), expected="
2249                                                                                                                                                                 "(0x" << ((sample[3] >> 20) & 0x3F) << ",0x" << ((sample[3] >> 26) & 0x3F) << ")" << tcu::TestLog::EndMessage;
2250                                                                 else
2251                                                                         log << tcu::TestLog::Message << std::hex << "w coord unknown test failed pixel (0x" << x << ",0x" << y << ",sample 0x" << s << ")" << tcu::TestLog::EndMessage;
2252                                                                 res = QP_TEST_RESULT_FAIL;
2253                                                                 continue;
2254                                                         }
2255
2256                                                         // x component of sample
2257                                                         deUint32 rate = sample[0];
2258                                                         // fragment size
2259                                                         deUint32 pixelsX = 1 << ((rate/4)&3);
2260                                                         deUint32 pixelsY = 1 << (rate&3);
2261
2262                                                         // Fragment region
2263                                                         deUint32 fragMinX = x & ~(pixelsX-1);
2264                                                         deUint32 fragMinY = y & ~(pixelsY-1);
2265                                                         deUint32 fragMaxX = fragMinX + pixelsX;
2266                                                         deUint32 fragMaxY = fragMinY + pixelsY;
2267
2268                                                         // Clamp to FB dimension for odd sizes
2269                                                         if (fragMaxX > m_data.framebufferDim.width)
2270                                                                 fragMaxX = m_data.framebufferDim.width;
2271                                                         if (fragMaxY > m_data.framebufferDim.height)
2272                                                                 fragMaxY = m_data.framebufferDim.height;
2273
2274                                                         // z component of sample
2275                                                         deUint32 primID = sample[2] >> 24;
2276                                                         deUint32 atomVal = sample[2] & 0xFFFFFF;
2277
2278                                                         // Compute pipeline and primitive rate from primitive ID, and attachment
2279                                                         // rate from the x/y coordinate
2280                                                         deInt32 pipelineRate = PrimIDToPipelineShadingRate(primID);
2281                                                         deInt32 primitiveRate = m_data.shaderWritesRate ? PrimIDToPrimitiveShadingRate(primID) : 0;
2282
2283                                                         deInt32 attachmentLayer = (m_data.srLayered && modeIdx == ATTACHMENT_MODE_2DARRAY) ? layer : 0;
2284                                                         deInt32 attachmentRate = m_data.useAttachment() ? fillPtr[srFillBpp*((attachmentLayer * srHeight + (y / srTexelHeight)) * srWidth + (x / srTexelWidth))] : 0;
2285
2286                                                         // Get mask of allowed shading rates
2287                                                         deInt32 expectedMasks = Simulate(pipelineRate, primitiveRate, attachmentRate);
2288
2289                                                         if (!(expectedMasks & (1 << rate)))
2290                                                         {
2291                                                                 log << tcu::TestLog::Message << std::hex << "unexpected shading rate. failed pixel (0x" << x << ",0x" << y << ",sample 0x" << s << ") "
2292                                                                                                                                                         "result rate 0x" << rate << " mask of expected rates 0x" << expectedMasks <<
2293                                                                                                                                                         " pipelineRate=0x" << pipelineRate << " primitiveRate=0x" << primitiveRate << " attachmentRate =0x" << attachmentRate << tcu::TestLog::EndMessage;
2294                                                                 res = QP_TEST_RESULT_FAIL;
2295                                                                 continue;
2296                                                         }
2297                                                         // Check that not all fragments are downgraded to 1x1
2298                                                         if (rate == 0 && expectedMasks != 1)
2299                                                                 numUnexpected1x1Samples++;
2300                                                         numTotalSamples++;
2301
2302                                                         // Check that gl_FragDepth = primID / NUM_TRIANGLES
2303                                                         if (m_data.fragDepth)
2304                                                         {
2305                                                                 float *dsample = &depthptr[((layer * m_data.framebufferDim.height + y) * m_data.framebufferDim.width + x)*m_data.samples + s];
2306                                                                 float expected = (float)primID / NUM_TRIANGLES;
2307                                                                 if (fabs(*dsample - expected) > 0.01)
2308                                                                 {
2309                                                                         log << tcu::TestLog::Message << std::hex << "depth write failed pixel (0x" << x << ",0x" << y << ",sample 0x" << s << ")=" << *dsample << " expected " << expected << tcu::TestLog::EndMessage;
2310                                                                         res = QP_TEST_RESULT_FAIL;
2311                                                                         continue;
2312                                                                 }
2313                                                         }
2314
2315                                                         // Check that stencil value = primID
2316                                                         if (m_data.fragStencil)
2317                                                         {
2318                                                                 deUint32 *ssample = &stencilptr[((layer * m_data.framebufferDim.height + y) * m_data.framebufferDim.width + x)*m_data.samples + s];
2319                                                                 if (*ssample != primID)
2320                                                                 {
2321                                                                         log << tcu::TestLog::Message << std::hex << "stencil write failed pixel (0x" << x << ",0x" << y << ",sample 0x" << s << ")=" << *ssample << " expected " << primID << tcu::TestLog::EndMessage;
2322                                                                         res = QP_TEST_RESULT_FAIL;
2323                                                                         continue;
2324                                                                 }
2325                                                         }
2326
2327                                                         // Check that primitives are in the right viewport/scissor
2328                                                         if (m_data.multiViewport)
2329                                                         {
2330                                                                 VkRect2D *scissor = &scissors[primID & 1];
2331                                                                 if ((int)x < scissor->offset.x || (int)x >= (int)(scissor->offset.x + scissor->extent.width) ||
2332                                                                         (int)y < scissor->offset.y || (int)y >= (int)(scissor->offset.y + scissor->extent.height))
2333                                                                 {
2334                                                                         log << tcu::TestLog::Message << std::hex << "primitive found outside of expected viewport (0x" << x << ",0x" << y << ",sample 0x" << s << ") primID=" << primID << tcu::TestLog::EndMessage;
2335                                                                         res = QP_TEST_RESULT_FAIL;
2336                                                                         continue;
2337                                                                 }
2338                                                         }
2339
2340                                                         // Check that primitives are in the right layer
2341                                                         if (m_data.colorLayered)
2342                                                         {
2343                                                                 if (layer != ((primID & 2)>>1))
2344                                                                 {
2345                                                                         log << tcu::TestLog::Message << std::hex << "primitive found in wrong layer (0x" << x << ",0x" << y << ",sample 0x" << s << ") primID=" << primID << " layer=" << layer << tcu::TestLog::EndMessage;
2346                                                                         res = QP_TEST_RESULT_FAIL;
2347                                                                         continue;
2348                                                                 }
2349                                                         }
2350
2351                                                         // Check that multiview broadcasts the same primitive to both layers
2352                                                         if (m_data.multiView)
2353                                                         {
2354                                                                 deUint32 otherLayer = layer^1;
2355                                                                 deUint32 *othersample = &colorptr[4*(((otherLayer * m_data.framebufferDim.height + y) * m_data.framebufferDim.width + x)*m_data.samples + s)];
2356                                                                 deUint32 otherPrimID = othersample[2] >> 24;
2357                                                                 if (primID != otherPrimID)
2358                                                                 {
2359                                                                         log << tcu::TestLog::Message << std::hex << "multiview primitive mismatch (0x" << x << ",0x" << y << ",sample 0x" << s << ") primID=" << primID << "  otherPrimID=" << otherPrimID << tcu::TestLog::EndMessage;
2360                                                                         res = QP_TEST_RESULT_FAIL;
2361                                                                         continue;
2362                                                                 }
2363                                                         }
2364
2365                                                         // Loop over all samples in the same fragment
2366                                                         for (deUint32 fx = fragMinX; fx < fragMaxX; ++fx)
2367                                                         {
2368                                                                 for (deUint32 fy = fragMinY; fy < fragMaxY; ++fy)
2369                                                                 {
2370                                                                         for (deInt32 fs = 0; fs < m_data.samples; ++fs)
2371                                                                         {
2372                                                                                 deUint32 *fsample = &colorptr[4*(((layer * m_data.framebufferDim.height + fy) * m_data.framebufferDim.width + fx)*m_data.samples + fs)];
2373                                                                                 deUint32 frate = fsample[0];
2374                                                                                 deUint32 fprimID = fsample[2] >> 24;
2375                                                                                 deUint32 fatomVal = fsample[2] & 0xFFFFFF;
2376
2377                                                                                 // If we write out the sample mask value, check that the samples in the
2378                                                                                 // mask must not be uncovered, and that samples not in the mask must not
2379                                                                                 // be covered by this primitive
2380                                                                                 if (m_data.useSampleMaskIn)
2381                                                                                 {
2382                                                                                         int p = pixelsX * pixelsY - ((fx - fragMinX) + pixelsX * (fy - fragMinY)) - 1;
2383                                                                                         int sampleIdx = fs + m_data.samples * p;
2384
2385                                                                                         if ((sample[1] & (1 << sampleIdx)) && fsample[2] == 0)
2386                                                                                         {
2387                                                                                                 log << tcu::TestLog::Message << std::hex << "sample set in sampleMask but not written (0x" << fx << ",0x" << fy << ",sample 0x" << fs << ")" << tcu::TestLog::EndMessage;
2388                                                                                                 res = QP_TEST_RESULT_FAIL;
2389                                                                                                 continue;
2390                                                                                         }
2391                                                                                         if (!(sample[1] & (1 << sampleIdx)) && fsample[2] != 0 && fprimID == primID)
2392                                                                                         {
2393                                                                                                 log << tcu::TestLog::Message << std::hex << "sample not set in sampleMask but written with same primID (0x" << fx << ",0x" << fy << ",sample 0x" << fs << ")" << tcu::TestLog::EndMessage;
2394                                                                                                 res = QP_TEST_RESULT_FAIL;
2395                                                                                                 continue;
2396                                                                                         }
2397                                                                                 }
2398
2399                                                                                 // If conservative raster is enabled, or custom sample locations all at the center, check that
2400                                                                                 // samples in the same pixel must be covered.
2401                                                                                 if (m_data.conservativeEnable ||
2402                                                                                         (m_data.sampleLocations && m_context.getFragmentShadingRateProperties().fragmentShadingRateWithCustomSampleLocations))
2403                                                                                 {
2404                                                                                         // If it's in the same pixel, expect it to be fully covered.
2405                                                                                         if (fx == x && fy == y && fsample[2] == 0)
2406                                                                                         {
2407                                                                                                 log << tcu::TestLog::Message << std::hex << "pixel not fully covered (0x" << fx << ",0x" << fy << ",sample 0x" << fs << ")" << tcu::TestLog::EndMessage;
2408                                                                                                 res = QP_TEST_RESULT_FAIL;
2409                                                                                                 continue;
2410                                                                                         }
2411                                                                                 }
2412
2413                                                                                 if (fsample[2] == 0)
2414                                                                                         continue;
2415
2416                                                                                 // If the primitive matches this sample, then it must have the same rate and
2417                                                                                 // atomic value
2418                                                                                 if (fprimID == primID)
2419                                                                                 {
2420                                                                                         if (rate != frate || (atomVal != fatomVal && !(m_data.sampleShadingEnable || m_data.sampleShadingInput)))
2421                                                                                         {
2422                                                                                                 log << tcu::TestLog::Message << std::hex << "failed pixel (0x" << x << ",0x" << y << ",sample " << s << ")=0x" << ((primID<<24)|atomVal) <<
2423                                                                                                                                                                                         " compared to (0x" << fx << ",0x" << fy << ",sample " << fs << ")=0x" << ((fprimID<<24)|fatomVal) <<
2424                                                                                                                                                                                         " pipelineRate=0x" << pipelineRate << " primitiveRate=0x" << primitiveRate << " attachmentRate =0x" << attachmentRate <<
2425                                                                                                                                                                                         tcu::TestLog::EndMessage;
2426                                                                                                 res = QP_TEST_RESULT_FAIL;
2427                                                                                         }
2428                                                                                 }
2429                                                                         }
2430                                                                 }
2431                                                         }
2432                                                 }
2433                                         }
2434                                 }
2435                         }
2436                         if (res == QP_TEST_RESULT_FAIL)
2437                                 break;
2438                 }
2439         }
2440         // All samples were coerced to 1x1, unexpected
2441         if (res == QP_TEST_RESULT_PASS &&
2442                 numTotalSamples != 0 &&
2443                 numUnexpected1x1Samples == numTotalSamples &&
2444                 numTotalSamples > 16)
2445         {
2446                 log << tcu::TestLog::Message << std::hex << "Quality warning - all fragments used 1x1" << tcu::TestLog::EndMessage;
2447                 res = QP_TEST_RESULT_QUALITY_WARNING;
2448         }
2449
2450         return tcu::TestStatus(res, qpGetTestResultName(res));
2451 }
2452
2453 }       // anonymous namespace
2454
2455 void createBasicTests (tcu::TestContext& testCtx, tcu::TestCaseGroup* parentGroup, bool useDynamicRendering)
2456 {
2457         typedef struct
2458         {
2459                 deUint32                                count;
2460                 const char*                             name;
2461                 const char*                             description;
2462         } TestGroupCase;
2463
2464         typedef struct
2465         {
2466                 VkExtent2D                              count;
2467                 const char*                             name;
2468                 const char*                             description;
2469         } TestGroupCase2D;
2470
2471         typedef struct
2472         {
2473                 AttachmentUsage                 usage;
2474                 const char*                             name;
2475                 const char*                             description;
2476         } TestGroupUsageCase;
2477
2478         TestGroupCase groupCases[] =
2479         {
2480                 { 0,    "basic",                                "basic tests"                                   },
2481                 { 1,    "apisamplemask",                "use pSampleMask"                               },
2482                 { 2,    "samplemaskin",                 "use gl_SampleMaskIn"                   },
2483                 { 3,    "conservativeunder",    "conservative underestimation"  },
2484                 { 4,    "conservativeover",             "conservative overestimation"   },
2485                 { 5,    "fragdepth",                    "depth shader output"                   },
2486                 { 6,    "fragstencil",                  "stencil shader output"                 },
2487                 { 7,    "multiviewport",                "multiple viewports and gl_ViewportIndex"       },
2488                 { 8,    "colorlayered",                 "multiple layer color, single layer shading rate"       },
2489                 { 9,    "srlayered",                    "multiple layer color, multiple layers shading rate"    },
2490                 { 10,   "multiview",                    "multiview"     },
2491                 { 11,   "multiviewsrlayered",   "multiview and multilayer shading rate" },
2492                 { 12,   "interlock",                    "fragment shader interlock"     },
2493                 { 13,   "samplelocations",              "custom sample locations"       },
2494                 { 14,   "sampleshadingenable",  "enable sample shading in createinfo"   },
2495                 { 15,   "sampleshadinginput",   "enable sample shading by using gl_SampleID"    },
2496         };
2497
2498         TestGroupCase dynCases[] =
2499         {
2500                 { 1,    "dynamic",      "uses dynamic shading rate state"       },
2501                 { 0,    "static",       "uses static shading rate state"        },
2502         };
2503
2504         TestGroupUsageCase attCases[] =
2505         {
2506                 { AttachmentUsage::NO_ATTACHMENT,               "noattachment",         "no shading rate attachment"                    },
2507                 { AttachmentUsage::WITH_ATTACHMENT,             "attachment",           "has shading rate attachment"                   },
2508                 { AttachmentUsage::NO_ATTACHMENT_PTR,   "noattachmentptr",      "no shading rate attachment pointer"    },
2509         };
2510
2511         TestGroupCase shdCases[] =
2512         {
2513                 { 0,    "noshaderrate", "shader doesn't write rate"     },
2514                 { 1,    "shaderrate",   "shader writes rate"    },
2515         };
2516
2517         TestGroupCase combCases[] =
2518         {
2519                 { VK_FRAGMENT_SHADING_RATE_COMBINER_OP_KEEP_KHR,        "keep",         "keep"  },
2520                 { VK_FRAGMENT_SHADING_RATE_COMBINER_OP_REPLACE_KHR,     "replace",      "replace"       },
2521                 { VK_FRAGMENT_SHADING_RATE_COMBINER_OP_MIN_KHR,         "min",          "min"   },
2522                 { VK_FRAGMENT_SHADING_RATE_COMBINER_OP_MAX_KHR,         "max",          "max"   },
2523                 { VK_FRAGMENT_SHADING_RATE_COMBINER_OP_MUL_KHR,         "mul",          "mul"   },
2524         };
2525
2526         TestGroupCase2D extentCases[] =
2527         {
2528                 { {1,   1},             "1x1",          "1x1"           },
2529                 { {4,   4},             "4x4",          "4x4"           },
2530                 { {33,  35},    "33x35",        "33x35"         },
2531                 { {151, 431},   "151x431",      "151x431"       },
2532                 { {256, 256},   "256x256",      "256x256"       },
2533         };
2534
2535         TestGroupCase sampCases[] =
2536         {
2537                 { VK_SAMPLE_COUNT_1_BIT,        "samples1",             "1 raster sample"       },
2538                 { VK_SAMPLE_COUNT_2_BIT,        "samples2",             "2 raster samples"      },
2539                 { VK_SAMPLE_COUNT_4_BIT,        "samples4",             "4 raster samples"      },
2540                 { VK_SAMPLE_COUNT_8_BIT,        "samples8",             "8 raster samples"      },
2541                 { VK_SAMPLE_COUNT_16_BIT,       "samples16",    "16 raster samples"     },
2542         };
2543
2544         TestGroupCase geomCases[] =
2545         {
2546                 { 0,    "vs",   "vertex shader only"    },
2547                 { 1,    "gs",   "vertex and geometry shader"    },
2548         };
2549
2550         deInt32 seed = 0;
2551
2552         for (int groupNdx = 0; groupNdx < DE_LENGTH_OF_ARRAY(groupCases); groupNdx++)
2553         {
2554                 de::MovePtr<tcu::TestCaseGroup> group(new tcu::TestCaseGroup(testCtx, groupCases[groupNdx].name, groupCases[groupNdx].description));
2555                 for (int dynNdx = 0; dynNdx < DE_LENGTH_OF_ARRAY(dynCases); dynNdx++)
2556                 {
2557                         de::MovePtr<tcu::TestCaseGroup> dynGroup(new tcu::TestCaseGroup(testCtx, dynCases[dynNdx].name, dynCases[dynNdx].description));
2558                         for (int attNdx = 0; attNdx < DE_LENGTH_OF_ARRAY(attCases); attNdx++)
2559                         {
2560                                 if (useDynamicRendering && attCases[attNdx].usage == AttachmentUsage::NO_ATTACHMENT_PTR)
2561                                         continue;
2562
2563                                 de::MovePtr<tcu::TestCaseGroup> attGroup(new tcu::TestCaseGroup(testCtx, attCases[attNdx].name, attCases[attNdx].description));
2564                                 for (int shdNdx = 0; shdNdx < DE_LENGTH_OF_ARRAY(shdCases); shdNdx++)
2565                                 {
2566                                         de::MovePtr<tcu::TestCaseGroup> shdGroup(new tcu::TestCaseGroup(testCtx, shdCases[shdNdx].name, shdCases[shdNdx].description));
2567                                         for (int cmb0Ndx = 0; cmb0Ndx < DE_LENGTH_OF_ARRAY(combCases); cmb0Ndx++)
2568                                         {
2569                                                 de::MovePtr<tcu::TestCaseGroup> cmb0Group(new tcu::TestCaseGroup(testCtx, combCases[cmb0Ndx].name, combCases[cmb0Ndx].description));
2570                                                 for (int cmb1Ndx = 0; cmb1Ndx < DE_LENGTH_OF_ARRAY(combCases); cmb1Ndx++)
2571                                                 {
2572                                                         de::MovePtr<tcu::TestCaseGroup> cmb1Group(new tcu::TestCaseGroup(testCtx, combCases[cmb1Ndx].name, combCases[cmb1Ndx].description));
2573                                                         for (int extNdx = 0; extNdx < DE_LENGTH_OF_ARRAY(extentCases); extNdx++)
2574                                                         {
2575                                                                 de::MovePtr<tcu::TestCaseGroup> extGroup(new tcu::TestCaseGroup(testCtx, extentCases[extNdx].name, extentCases[extNdx].description));
2576                                                                 for (int sampNdx = 0; sampNdx < DE_LENGTH_OF_ARRAY(sampCases); sampNdx++)
2577                                                                 {
2578                                                                         de::MovePtr<tcu::TestCaseGroup> sampGroup(new tcu::TestCaseGroup(testCtx, sampCases[sampNdx].name, sampCases[sampNdx].description));
2579                                                                         for (int geomNdx = 0; geomNdx < DE_LENGTH_OF_ARRAY(geomCases); geomNdx++)
2580                                                                         {
2581                                                                                 bool useApiSampleMask = groupNdx == 1;
2582                                                                                 bool useSampleMaskIn = groupNdx == 2;
2583                                                                                 bool consRast = groupNdx == 3 || groupNdx == 4;
2584                                                                                 bool fragDepth = groupNdx == 5;
2585                                                                                 bool fragStencil = groupNdx == 6;
2586                                                                                 bool multiViewport = groupNdx == 7;
2587                                                                                 bool colorLayered = groupNdx == 8 || groupNdx == 9;
2588                                                                                 bool srLayered = groupNdx == 9 || groupNdx == 11;
2589                                                                                 bool multiView = groupNdx == 10 || groupNdx == 11;
2590                                                                                 bool interlock = groupNdx == 12;
2591                                                                                 bool sampleLocations = groupNdx == 13;
2592                                                                                 bool sampleShadingEnable = groupNdx == 14;
2593                                                                                 bool sampleShadingInput = groupNdx == 15;
2594                                                                                 VkConservativeRasterizationModeEXT conservativeMode = (groupNdx == 3) ? VK_CONSERVATIVE_RASTERIZATION_MODE_UNDERESTIMATE_EXT : VK_CONSERVATIVE_RASTERIZATION_MODE_OVERESTIMATE_EXT;
2595                                                                                 deUint32 numColorLayers = (colorLayered || multiView) ? 2u : 1u;
2596
2597                                                                                 // Don't bother with geometry shader if we're not testing shader writes
2598                                                                                 if (geomCases[geomNdx].count && !shdCases[shdNdx].count)
2599                                                                                         continue;
2600
2601                                                                                 // reduce number of tests
2602                                                                                 if ((groupNdx != 0) &&
2603                                                                                         (!dynCases[dynNdx].count ||
2604                                                                                          !(combCases[cmb0Ndx].count == VK_FRAGMENT_SHADING_RATE_COMBINER_OP_KEEP_KHR || combCases[cmb0Ndx].count == VK_FRAGMENT_SHADING_RATE_COMBINER_OP_REPLACE_KHR) ||
2605                                                                                          !(combCases[cmb1Ndx].count == VK_FRAGMENT_SHADING_RATE_COMBINER_OP_KEEP_KHR || combCases[cmb1Ndx].count == VK_FRAGMENT_SHADING_RATE_COMBINER_OP_REPLACE_KHR)))
2606                                                                                         continue;
2607
2608                                                                                 // Don't bother with geometry shader if we're testing conservative raster, sample mask, depth/stencil
2609                                                                                 if (geomCases[geomNdx].count && (useApiSampleMask || useSampleMaskIn || consRast || fragDepth || fragStencil))
2610                                                                                         continue;
2611
2612                                                                                 // Don't bother with geometry shader if we're testing non-dynamic state
2613                                                                                 if (geomCases[geomNdx].count && !dynCases[dynNdx].count)
2614                                                                                         continue;
2615
2616                                                                                 // Only test multiViewport/layered with shaderWritesRate
2617                                                                                 if ((multiViewport || colorLayered) && !shdCases[shdNdx].count)
2618                                                                                         continue;
2619
2620                                                                                 // Can't test layered shading rate attachment without an attachment
2621                                                                                 if (srLayered && attCases[attNdx].usage != AttachmentUsage::WITH_ATTACHMENT)
2622                                                                                         continue;
2623
2624                                                                                 CaseDef c =
2625                                                                                 {
2626                                                                                         seed++,                                                                                                 // deInt32 seed;
2627                                                                                         extentCases[extNdx].count,                                                              // VkExtent2D framebufferDim;
2628                                                                                         (VkSampleCountFlagBits)sampCases[sampNdx].count,                // VkSampleCountFlagBits samples;
2629                                                                                         {
2630                                                                                                 (VkFragmentShadingRateCombinerOpKHR)combCases[cmb0Ndx].count,
2631                                                                                                 (VkFragmentShadingRateCombinerOpKHR)combCases[cmb1Ndx].count
2632                                                                                         },                                                                                                              // VkFragmentShadingRateCombinerOpKHR combinerOp[2];
2633                                                                                         attCases[attNdx].usage,                                                                 // AttachmentUsage attachmentUsage;
2634                                                                                         (bool)shdCases[shdNdx].count,                                                   // bool shaderWritesRate;
2635                                                                                         (bool)geomCases[geomNdx].count,                                                 // bool geometryShader;
2636                                                                                         (bool)dynCases[dynNdx].count,                                                   // bool useDynamicState;
2637                                                                                         useDynamicRendering,                                                                    // bool useDynamicRendering;
2638                                                                                         useApiSampleMask,                                                                               // bool useApiSampleMask;
2639                                                                                         useSampleMaskIn,                                                                                // bool useSampleMaskIn;
2640                                                                                         consRast,                                                                                               // bool conservativeEnable;
2641                                                                                         conservativeMode,                                                                               // VkConservativeRasterizationModeEXT conservativeMode;
2642                                                                                         fragDepth || fragStencil,                                                               // bool useDepthStencil;
2643                                                                                         fragDepth,                                                                                              // bool fragDepth;
2644                                                                                         fragStencil,                                                                                    // bool fragStencil;
2645                                                                                         multiViewport,                                                                                  // bool multiViewport;
2646                                                                                         colorLayered,                                                                                   // bool colorLayered;
2647                                                                                         srLayered,                                                                                              // bool srLayered;
2648                                                                                         numColorLayers,                                                                                 // deUint32 numColorLayers;
2649                                                                                         multiView,                                                                                              // bool multiView;
2650                                                                                         interlock,                                                                                              // bool interlock;
2651                                                                                         sampleLocations,                                                                                // bool sampleLocations;
2652                                                                                         sampleShadingEnable,                                                                    // bool sampleShadingEnable;
2653                                                                                         sampleShadingInput,                                                                             // bool sampleShadingInput;
2654                                                                                         false,                                                                                                  // bool sampleMaskTest;
2655                                                                                 };
2656
2657                                                                                 sampGroup->addChild(new FSRTestCase(testCtx, geomCases[geomNdx].name, geomCases[geomNdx].description, c));
2658                                                                         }
2659                                                                         extGroup->addChild(sampGroup.release());
2660                                                                 }
2661                                                                 cmb1Group->addChild(extGroup.release());
2662                                                         }
2663                                                         cmb0Group->addChild(cmb1Group.release());
2664                                                 }
2665                                                 shdGroup->addChild(cmb0Group.release());
2666                                         }
2667                                         attGroup->addChild(shdGroup.release());
2668                                 }
2669                                 dynGroup->addChild(attGroup.release());
2670                         }
2671                         group->addChild(dynGroup.release());
2672                 }
2673                 parentGroup->addChild(group.release());
2674         }
2675
2676         de::MovePtr<tcu::TestCaseGroup> group(new tcu::TestCaseGroup(testCtx, "misc_tests", "Single tests that don't need to be part of above test matrix"));
2677         group->addChild(new FSRTestCase(testCtx, "sample_mask_test", "", {
2678                 123,                                                                                                    // deInt32 seed;
2679                 {32,  33},                                                                                              // VkExtent2D framebufferDim;
2680                 VK_SAMPLE_COUNT_4_BIT,                                                                  // VkSampleCountFlagBits samples;
2681                 {
2682                         VK_FRAGMENT_SHADING_RATE_COMBINER_OP_KEEP_KHR,
2683                         VK_FRAGMENT_SHADING_RATE_COMBINER_OP_KEEP_KHR
2684                 },                                                                                                              // VkFragmentShadingRateCombinerOpKHR combinerOp[2];
2685                 AttachmentUsage::NO_ATTACHMENT,                                                 // AttachmentUsage attachmentUsage;
2686                 true,                                                                                                   // bool shaderWritesRate;
2687                 false,                                                                                                  // bool geometryShader;
2688                 false,                                                                                                  // bool useDynamicState;
2689                 false,                                                                                                  // bool useDynamicRendering;
2690                 true,                                                                                                   // bool useApiSampleMask;
2691                 false,                                                                                                  // bool useSampleMaskIn;
2692                 false,                                                                                                  // bool conservativeEnable;
2693                 VK_CONSERVATIVE_RASTERIZATION_MODE_UNDERESTIMATE_EXT,   // VkConservativeRasterizationModeEXT conservativeMode;
2694                 false,                                                                                                  // bool useDepthStencil;
2695                 false,                                                                                                  // bool fragDepth;
2696                 false,                                                                                                  // bool fragStencil;
2697                 false,                                                                                                  // bool multiViewport;
2698                 false,                                                                                                  // bool colorLayered;
2699                 false,                                                                                                  // bool srLayered;
2700                 1u,                                                                                                             // deUint32 numColorLayers;
2701                 false,                                                                                                  // bool multiView;
2702                 false,                                                                                                  // bool interlock;
2703                 false,                                                                                                  // bool sampleLocations;
2704                 false,                                                                                                  // bool sampleShadingEnable;
2705                 false,                                                                                                  // bool sampleShadingInput;
2706                 true,                                                                                                   // bool sampleMaskTest;
2707         }));
2708
2709         parentGroup->addChild(group.release());
2710 }
2711
2712 }       // FragmentShadingRate
2713 }       // vkt