1 /*------------------------------------------------------------------------
2 * Vulkan Conformance Tests
3 * ------------------------
5 * Copyright (c) 2017-2019 The Khronos Group Inc.
6 * Copyright (c) 2018-2020 NVIDIA Corporation
8 * Licensed under the Apache License, Version 2.0 (the "License");
9 * you may not use this file except in compliance with the License.
10 * You may obtain a copy of the License at
12 * http://www.apache.org/licenses/LICENSE-2.0
14 * Unless required by applicable law or agreed to in writing, software
15 * distributed under the License is distributed on an "AS IS" BASIS,
16 * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
17 * See the License for the specific language governing permissions and
18 * limitations under the License.
22 * \brief Tests for VK_KHR_fragment_shading_rate
23 * The test renders 9*9 triangles, where each triangle has one of the valid
24 * fragment sizes ({1,2,4},{1,2,4}) (clamped to implementation limits) for
25 * each of the pipeline shading rate and the primitive shading rate. The
26 * fragment shader does an atomic add to a memory location to get a unique
27 * identifier for the fragment, and outputs the primitive ID, atomic counter,
28 * fragment size, and some other info the the color output. Then a compute
29 * shader copies this to buffer memory, and the host verifies several
30 * properties of the output. For example, if a sample has a particular
31 * primitive ID and atomic value, then all other samples in the tile with
32 * the same primitive ID should have the same atomic value.
33 *//*--------------------------------------------------------------------*/
35 #include "vktFragmentShadingRateBasic.hpp"
37 #include "vkBufferWithMemory.hpp"
38 #include "vkImageWithMemory.hpp"
39 #include "vkQueryUtil.hpp"
40 #include "vkBuilderUtil.hpp"
41 #include "vkCmdUtil.hpp"
42 #include "vkTypeUtil.hpp"
43 #include "vkObjUtil.hpp"
44 #include "vkImageUtil.hpp"
46 #include "vktTestGroupUtil.hpp"
47 #include "vktTestCase.hpp"
52 #include "deSharedPtr.hpp"
55 #include "tcuTestCase.hpp"
56 #include "tcuTestLog.hpp"
64 namespace FragmentShadingRate
71 #define NUM_TRIANGLES (9*9)
73 enum class AttachmentUsage
82 SharedGroupParams groupParams;
84 VkExtent2D framebufferDim;
85 VkSampleCountFlagBits samples;
86 VkFragmentShadingRateCombinerOpKHR combinerOp[2];
87 AttachmentUsage attachmentUsage;
88 bool shaderWritesRate;
91 bool useApiSampleMask;
93 bool conservativeEnable;
94 VkConservativeRasterizationModeEXT conservativeMode;
95 bool useDepthStencil; // == fragDepth || fragStencil
100 bool srLayered; // colorLayered must also be true
101 deUint32 numColorLayers;
103 bool correlationMask;
105 bool sampleLocations;
106 bool sampleShadingEnable;
107 bool sampleShadingInput;
110 bool useAttachment () const
112 return (attachmentUsage == AttachmentUsage::WITH_ATTACHMENT);
116 class FSRTestInstance : public TestInstance
119 FSRTestInstance (Context& context, const CaseDef& data);
120 ~FSRTestInstance (void);
121 tcu::TestStatus iterate (void);
127 // Cache simulated combiner operations, to avoid recomputing per-sample
128 deInt32 m_simulateValueCount;
129 vector<deInt32> m_simulateCache;
130 // Cache mapping of primitive ID to pipeline/primitive shading rate
131 vector<deInt32> m_primIDToPrimitiveShadingRate;
132 vector<deInt32> m_primIDToPipelineShadingRate;
133 deUint32 m_supportedFragmentShadingRateCount;
134 vector<VkPhysicalDeviceFragmentShadingRateKHR> m_supportedFragmentShadingRates;
135 VkPhysicalDeviceFragmentShadingRatePropertiesKHR m_shadingRateProperties;
139 void beginSecondaryCmdBuffer (VkCommandBuffer cmdBuffer,
142 VkRenderingFlagsKHR renderingFlags = 0u) const;
143 void preRenderCommands (VkCommandBuffer cmdBuffer,
144 ImageWithMemory* cbImage,
145 ImageWithMemory* dsImage,
146 ImageWithMemory* derivImage,
147 deUint32 derivNumLevels,
148 ImageWithMemory* srImage,
149 VkImageLayout srLayout,
150 BufferWithMemory* srFillBuffer,
151 deUint32 numSRLayers,
155 const VkClearValue& clearColor,
156 const VkClearValue& clearDepthStencil);
157 void beginRender (VkCommandBuffer cmdBuffer,
158 VkRenderPass renderPass,
159 VkFramebuffer framebuffer,
160 VkImageView srImageView,
161 VkImageLayout srImageLayout,
162 const VkExtent2D& srTexelSize,
163 VkImageView cbImageView,
164 VkImageView dsImageView,
166 const VkClearValue& clearColor,
167 const VkClearValue& clearDepthStencil,
168 VkRenderingFlagsKHR renderingFlags = 0u) const;
169 void drawCommands (VkCommandBuffer cmdBuffer,
170 std::vector<GraphicsPipelineWrapper>& pipelines,
171 const std::vector<VkViewport>& viewports,
172 const std::vector<VkRect2D>& scissors,
173 const VkPipelineLayout pipelineLayout,
174 const VkRenderPass renderPass,
175 const VkPipelineVertexInputStateCreateInfo* vertexInputState,
176 const VkPipelineDynamicStateCreateInfo* dynamicState,
177 const VkPipelineRasterizationStateCreateInfo* rasterizationState,
178 const VkPipelineDepthStencilStateCreateInfo* depthStencilState,
179 const VkPipelineMultisampleStateCreateInfo* multisampleState,
180 VkPipelineFragmentShadingRateStateCreateInfoKHR* shadingRateState,
181 VkPipelineRenderingCreateInfoKHR* dynamicRendering,
182 const VkShaderModule vertShader,
183 const VkShaderModule geomShader,
184 const VkShaderModule fragShader,
185 VkDescriptorSet descriptorSet,
186 VkBuffer vertexBuffer);
187 void endRender (VkCommandBuffer cmdBuffer) const;
189 deInt32 PrimIDToPrimitiveShadingRate (deInt32 primID);
190 deInt32 PrimIDToPipelineShadingRate (deInt32 primID);
191 VkExtent2D SanitizeExtent (VkExtent2D ext) const;
192 deInt32 SanitizeRate (deInt32 rate) const;
193 deInt32 ShadingRateExtentToClampedMask (VkExtent2D ext, bool allowSwap) const;
194 deInt32 ShadingRateExtentToEnum (VkExtent2D ext) const;
195 VkExtent2D ShadingRateEnumToExtent (deInt32 rate) const;
196 deInt32 Simulate (deInt32 rate0, deInt32 rate1, deInt32 rate2);
197 VkExtent2D Combine (VkExtent2D ext0, VkExtent2D ext1, VkFragmentShadingRateCombinerOpKHR comb) const;
198 bool Force1x1 () const;
201 FSRTestInstance::FSRTestInstance (Context& context, const CaseDef& data)
202 : vkt::TestInstance (context)
204 , m_simulateValueCount (((4 * 4) | 4) + 1)
205 , m_simulateCache (m_simulateValueCount*m_simulateValueCount*m_simulateValueCount, ~0)
206 , m_primIDToPrimitiveShadingRate(NUM_TRIANGLES, ~0)
207 , m_primIDToPipelineShadingRate(NUM_TRIANGLES, ~0)
209 m_supportedFragmentShadingRateCount = 0;
210 m_context.getInstanceInterface().getPhysicalDeviceFragmentShadingRatesKHR(m_context.getPhysicalDevice(), &m_supportedFragmentShadingRateCount, DE_NULL);
212 if (m_supportedFragmentShadingRateCount < 3)
213 TCU_THROW(TestError, "*pFragmentShadingRateCount too small");
215 m_supportedFragmentShadingRates.resize(m_supportedFragmentShadingRateCount);
216 for (deUint32 i = 0; i < m_supportedFragmentShadingRateCount; ++i)
218 m_supportedFragmentShadingRates[i].sType = VK_STRUCTURE_TYPE_PHYSICAL_DEVICE_FRAGMENT_SHADING_RATE_KHR;
219 m_supportedFragmentShadingRates[i].pNext = nullptr;
221 m_context.getInstanceInterface().getPhysicalDeviceFragmentShadingRatesKHR(m_context.getPhysicalDevice(), &m_supportedFragmentShadingRateCount, &m_supportedFragmentShadingRates[0]);
223 m_shadingRateProperties = m_context.getFragmentShadingRateProperties();
226 FSRTestInstance::~FSRTestInstance (void)
230 class FSRTestCase : public TestCase
233 FSRTestCase (tcu::TestContext& context, const char* name, const char* desc, const CaseDef data);
235 virtual void initPrograms (SourceCollections& programCollection) const;
236 virtual TestInstance* createInstance (Context& context) const;
237 virtual void checkSupport (Context& context) const;
243 FSRTestCase::FSRTestCase (tcu::TestContext& context, const char* name, const char* desc, const CaseDef data)
244 : vkt::TestCase (context, name, desc)
249 FSRTestCase::~FSRTestCase (void)
253 bool FSRTestInstance::Force1x1() const
255 if (m_data.useApiSampleMask && !m_context.getFragmentShadingRateProperties().fragmentShadingRateWithSampleMask)
258 if (m_data.useSampleMaskIn && !m_context.getFragmentShadingRateProperties().fragmentShadingRateWithShaderSampleMask)
261 if (m_data.conservativeEnable && !m_context.getFragmentShadingRateProperties().fragmentShadingRateWithConservativeRasterization)
264 if (m_data.useDepthStencil && !m_context.getFragmentShadingRateProperties().fragmentShadingRateWithShaderDepthStencilWrites)
267 if (m_data.interlock && !m_context.getFragmentShadingRateProperties().fragmentShadingRateWithFragmentShaderInterlock)
270 if (m_data.sampleLocations && !m_context.getFragmentShadingRateProperties().fragmentShadingRateWithCustomSampleLocations)
273 if (m_data.sampleShadingEnable || m_data.sampleShadingInput)
279 static VkImageUsageFlags cbUsage = VK_IMAGE_USAGE_COLOR_ATTACHMENT_BIT |
280 VK_IMAGE_USAGE_SAMPLED_BIT |
281 VK_IMAGE_USAGE_TRANSFER_DST_BIT |
282 VK_IMAGE_USAGE_TRANSFER_SRC_BIT;
284 void FSRTestCase::checkSupport(Context& context) const
286 context.requireDeviceFunctionality("VK_KHR_fragment_shading_rate");
288 checkPipelineLibraryRequirements(context.getInstanceInterface(), context.getPhysicalDevice(), m_data.groupParams->pipelineConstructionType);
290 if (m_data.groupParams->useDynamicRendering)
291 context.requireDeviceFunctionality("VK_KHR_dynamic_rendering");
293 if (!context.getFragmentShadingRateFeatures().pipelineFragmentShadingRate)
294 TCU_THROW(NotSupportedError, "pipelineFragmentShadingRate not supported");
296 if (m_data.shaderWritesRate &&
297 !context.getFragmentShadingRateFeatures().primitiveFragmentShadingRate)
298 TCU_THROW(NotSupportedError, "primitiveFragmentShadingRate not supported");
300 if (!context.getFragmentShadingRateFeatures().primitiveFragmentShadingRate &&
301 m_data.combinerOp[0] != VK_FRAGMENT_SHADING_RATE_COMBINER_OP_KEEP_KHR)
302 TCU_THROW(NotSupportedError, "primitiveFragmentShadingRate not supported");
304 if (!context.getFragmentShadingRateFeatures().attachmentFragmentShadingRate &&
305 m_data.combinerOp[1] != VK_FRAGMENT_SHADING_RATE_COMBINER_OP_KEEP_KHR)
306 TCU_THROW(NotSupportedError, "attachmentFragmentShadingRate not supported");
308 const auto& vki = context.getInstanceInterface();
309 const auto physicalDevice = context.getPhysicalDevice();
311 VkImageFormatProperties imageProperties;
312 VkResult result = vki.getPhysicalDeviceImageFormatProperties(physicalDevice, VK_FORMAT_R32G32B32A32_UINT, VK_IMAGE_TYPE_2D,
313 VK_IMAGE_TILING_OPTIMAL, cbUsage, 0, &imageProperties);
315 if (result == VK_ERROR_FORMAT_NOT_SUPPORTED)
316 TCU_THROW(NotSupportedError, "VK_FORMAT_R32G32B32A32_UINT not supported");
318 if (m_data.geometryShader)
319 context.requireDeviceCoreFeature(DEVICE_CORE_FEATURE_GEOMETRY_SHADER);
321 if (!(imageProperties.sampleCounts & m_data.samples))
322 TCU_THROW(NotSupportedError, "color buffer sample count not supported");
324 if (m_data.numColorLayers > imageProperties.maxArrayLayers)
325 TCU_THROW(NotSupportedError, "color buffer layers not supported");
327 if (m_data.useAttachment() && !context.getFragmentShadingRateFeatures().attachmentFragmentShadingRate)
328 TCU_THROW(NotSupportedError, "attachmentFragmentShadingRate not supported");
330 if (!context.getFragmentShadingRateProperties().fragmentShadingRateNonTrivialCombinerOps &&
331 ((m_data.combinerOp[0] != VK_FRAGMENT_SHADING_RATE_COMBINER_OP_KEEP_KHR && m_data.combinerOp[0] != VK_FRAGMENT_SHADING_RATE_COMBINER_OP_REPLACE_KHR) ||
332 (m_data.combinerOp[1] != VK_FRAGMENT_SHADING_RATE_COMBINER_OP_KEEP_KHR && m_data.combinerOp[1] != VK_FRAGMENT_SHADING_RATE_COMBINER_OP_REPLACE_KHR)))
333 TCU_THROW(NotSupportedError, "fragmentShadingRateNonTrivialCombinerOps not supported");
335 if (m_data.conservativeEnable)
337 context.requireDeviceFunctionality("VK_EXT_conservative_rasterization");
338 if (m_data.conservativeMode == VK_CONSERVATIVE_RASTERIZATION_MODE_UNDERESTIMATE_EXT &&
339 !context.getConservativeRasterizationPropertiesEXT().primitiveUnderestimation)
340 TCU_THROW(NotSupportedError, "primitiveUnderestimation not supported");
343 if (m_data.fragStencil)
344 context.requireDeviceFunctionality("VK_EXT_shader_stencil_export");
346 if (m_data.multiViewport &&
347 !context.getFragmentShadingRateProperties().primitiveFragmentShadingRateWithMultipleViewports)
348 TCU_THROW(NotSupportedError, "primitiveFragmentShadingRateWithMultipleViewports not supported");
350 if (m_data.srLayered &&
351 !context.getFragmentShadingRateProperties().layeredShadingRateAttachments)
352 TCU_THROW(NotSupportedError, "layeredShadingRateAttachments not supported");
354 if ((m_data.multiViewport || m_data.colorLayered) &&
355 !m_data.geometryShader)
356 context.requireDeviceFunctionality("VK_EXT_shader_viewport_index_layer");
358 if (m_data.multiView && m_data.geometryShader &&
359 !context.getMultiviewFeatures().multiviewGeometryShader)
360 TCU_THROW(NotSupportedError, "multiviewGeometryShader not supported");
362 if (m_data.interlock &&
363 !context.getFragmentShaderInterlockFeaturesEXT().fragmentShaderPixelInterlock)
364 TCU_THROW(NotSupportedError, "fragmentShaderPixelInterlock not supported");
366 if (m_data.sampleLocations)
368 context.requireDeviceFunctionality("VK_EXT_sample_locations");
369 if (!(m_data.samples & context.getSampleLocationsPropertiesEXT().sampleLocationSampleCounts))
370 TCU_THROW(NotSupportedError, "samples not supported in sampleLocationSampleCounts");
373 if (m_data.sampleMaskTest && !context.getFragmentShadingRateProperties().fragmentShadingRateWithSampleMask)
374 TCU_THROW(NotSupportedError, "fragmentShadingRateWithSampleMask not supported");
376 checkPipelineLibraryRequirements(vki, physicalDevice, m_data.groupParams->pipelineConstructionType);
379 // Error codes writted by the fragment shader
383 ERROR_FRAGCOORD_CENTER = 1,
384 ERROR_VTG_READBACK = 2,
385 ERROR_FRAGCOORD_DERIV = 3,
386 ERROR_FRAGCOORD_IMPLICIT_DERIV = 4,
389 void FSRTestCase::initPrograms (SourceCollections& programCollection) const
391 std::stringstream vss;
394 "#version 450 core\n"
395 "#extension GL_EXT_fragment_shading_rate : enable\n"
396 "#extension GL_ARB_shader_viewport_layer_array : enable\n"
397 "layout(push_constant) uniform PC {\n"
398 " int shadingRate;\n"
400 "layout(location = 0) in vec2 pos;\n"
401 "layout(location = 0) out int instanceIndex;\n"
402 "layout(location = 1) out int readbackok;\n"
403 "layout(location = 2) out float zero;\n"
406 " vec4 gl_Position;\n"
410 " gl_Position = vec4(pos, 0, 1);\n"
411 " instanceIndex = gl_InstanceIndex;\n"
415 if (m_data.shaderWritesRate)
417 vss << " gl_PrimitiveShadingRateEXT = pc.shadingRate;\n";
419 // Verify that we can read from the output variable
420 vss << " if (gl_PrimitiveShadingRateEXT != pc.shadingRate) readbackok = 0;\n";
422 if (!m_data.geometryShader)
424 if (m_data.multiViewport)
425 vss << " gl_ViewportIndex = instanceIndex & 1;\n";
426 if (m_data.colorLayered)
427 vss << " gl_Layer = (instanceIndex & 2) >> 1;\n";
433 programCollection.glslSources.add("vert") << glu::VertexSource(vss.str());
435 if (m_data.geometryShader)
437 std::string writeShadingRate = "";
438 if (m_data.shaderWritesRate)
441 " gl_PrimitiveShadingRateEXT = pc.shadingRate;\n"
442 " if (gl_PrimitiveShadingRateEXT != pc.shadingRate) readbackok = 0;\n";
444 if (m_data.multiViewport)
445 writeShadingRate += " gl_ViewportIndex = inInstanceIndex[0] & 1;\n";
447 if (m_data.colorLayered)
448 writeShadingRate += " gl_Layer = (inInstanceIndex[0] & 2) >> 1;\n";
451 std::stringstream gss;
453 "#version 450 core\n"
454 "#extension GL_EXT_fragment_shading_rate : enable\n"
456 "layout(push_constant) uniform PC {\n"
457 " int shadingRate;\n"
462 " vec4 gl_Position;\n"
465 "layout(location = 0) in int inInstanceIndex[];\n"
466 "layout(location = 0) out int outInstanceIndex;\n"
467 "layout(location = 1) out int readbackok;\n"
468 "layout(location = 2) out float zero;\n"
469 "layout(triangles) in;\n"
470 "layout(triangle_strip, max_vertices=3) out;\n"
472 "out gl_PerVertex {\n"
473 " vec4 gl_Position;\n"
478 " gl_Position = gl_in[0].gl_Position;\n"
479 " outInstanceIndex = inInstanceIndex[0];\n"
482 << writeShadingRate <<
485 " gl_Position = gl_in[1].gl_Position;\n"
486 " outInstanceIndex = inInstanceIndex[1];\n"
489 << writeShadingRate <<
492 " gl_Position = gl_in[2].gl_Position;\n"
493 " outInstanceIndex = inInstanceIndex[2];\n"
496 << writeShadingRate <<
500 programCollection.glslSources.add("geom") << glu::GeometrySource(gss.str());
503 std::stringstream fss;
506 "#version 450 core\n"
507 "#extension GL_EXT_fragment_shading_rate : enable\n"
508 "#extension GL_ARB_shader_stencil_export : enable\n"
509 "#extension GL_ARB_fragment_shader_interlock : enable\n"
510 "layout(location = 0) out uvec4 col0;\n"
511 "layout(set = 0, binding = 0) buffer Block { uint counter; } buf;\n"
512 "layout(set = 0, binding = 3) uniform usampler2D tex;\n"
513 "layout(location = 0) flat in int instanceIndex;\n"
514 "layout(location = 1) flat in int readbackok;\n"
515 "layout(location = 2) " << (m_data.sampleShadingInput ? "sample " : "") << "in float zero;\n";
517 if (m_data.interlock)
518 fss << "layout(pixel_interlock_ordered) in;\n";
524 if (m_data.interlock)
525 fss << " beginInvocationInterlockARB();\n";
528 // X component gets shading rate enum
529 " col0.x = gl_ShadingRateEXT;\n"
531 // Z component gets packed primitiveID | atomic value
532 " col0.z = (instanceIndex << 24) | ((atomicAdd(buf.counter, 1) + 1) & 0x00FFFFFFu);\n"
533 " ivec2 fragCoordXY = ivec2(gl_FragCoord.xy);\n"
534 " ivec2 fragSize = ivec2(1<<((gl_ShadingRateEXT/4)&3), 1<<(gl_ShadingRateEXT&3));\n"
535 // W component gets error code
536 " col0.w = uint(zero)" << (m_data.sampleShadingInput ? " * gl_SampleID" : "") << ";\n"
537 " if (((fragCoordXY - fragSize / 2) % fragSize) != ivec2(0,0))\n"
538 " col0.w = " << ERROR_FRAGCOORD_CENTER << ";\n";
540 if (m_data.shaderWritesRate)
543 " if (readbackok != 1)\n"
544 " col0.w = " << ERROR_VTG_READBACK << ";\n";
547 // When sample shading, gl_FragCoord is more likely to give bad derivatives,
548 // e.g. due to a partially covered quad having some pixels center sample and
549 // some sample at a sample location.
550 if (!m_data.sampleShadingEnable && !m_data.sampleShadingInput)
552 fss << " if (dFdx(gl_FragCoord.xy) != ivec2(fragSize.x, 0) || dFdy(gl_FragCoord.xy) != ivec2(0, fragSize.y))\n"
553 " col0.w = (fragSize.y << 26) | (fragSize.x << 20) | (int(dFdx(gl_FragCoord.xy)) << 14) | (int(dFdx(gl_FragCoord.xy)) << 8) | " << ERROR_FRAGCOORD_DERIV << ";\n";
555 fss << " uint implicitDerivX = texture(tex, vec2(gl_FragCoord.x / textureSize(tex, 0).x, 0)).x;\n"
556 " uint implicitDerivY = texture(tex, vec2(0, gl_FragCoord.y / textureSize(tex, 0).y)).x;\n"
557 " if (implicitDerivX != fragSize.x || implicitDerivY != fragSize.y)\n"
558 " col0.w = (fragSize.y << 26) | (fragSize.x << 20) | (implicitDerivY << 14) | (implicitDerivX << 8) | " << ERROR_FRAGCOORD_IMPLICIT_DERIV << ";\n";
560 // Y component gets sample mask value
561 if (m_data.useSampleMaskIn)
562 fss << " col0.y = gl_SampleMaskIn[0];\n";
564 if (m_data.fragDepth)
565 fss << " gl_FragDepth = float(instanceIndex) / float(" << NUM_TRIANGLES << ");\n";
567 if (m_data.fragStencil)
568 fss << " gl_FragStencilRefARB = instanceIndex;\n";
570 if (m_data.interlock)
571 fss << " endInvocationInterlockARB();\n";
576 programCollection.glslSources.add("frag") << glu::FragmentSource(fss.str());
578 std::stringstream css;
580 std::string fsampType = m_data.samples > 1 ? "texture2DMSArray" : "texture2DArray";
581 std::string usampType = m_data.samples > 1 ? "utexture2DMSArray" : "utexture2DArray";
583 // Compute shader copies color/depth/stencil to linear layout in buffer memory
585 "#version 450 core\n"
586 "#extension GL_EXT_samplerless_texture_functions : enable\n"
587 "layout(set = 0, binding = 1) uniform " << usampType << " colorTex;\n"
588 "layout(set = 0, binding = 2, std430) buffer Block0 { uvec4 b[]; } colorbuf;\n"
589 "layout(set = 0, binding = 4, std430) buffer Block1 { float b[]; } depthbuf;\n"
590 "layout(set = 0, binding = 5, std430) buffer Block2 { uint b[]; } stencilbuf;\n"
591 "layout(set = 0, binding = 6) uniform " << fsampType << " depthTex;\n"
592 "layout(set = 0, binding = 7) uniform " << usampType << " stencilTex;\n"
593 "layout(local_size_x = 1, local_size_y = 1, local_size_z = 1) in;\n"
596 " for (int i = 0; i < " << m_data.samples << "; ++i) {\n"
597 " uint idx = ((gl_GlobalInvocationID.z * " << m_data.framebufferDim.height << " + gl_GlobalInvocationID.y) * " << m_data.framebufferDim.width << " + gl_GlobalInvocationID.x) * " << m_data.samples << " + i;\n"
598 " colorbuf.b[idx] = texelFetch(colorTex, ivec3(gl_GlobalInvocationID.xyz), i);\n";
600 if (m_data.fragDepth)
601 css << " depthbuf.b[idx] = texelFetch(depthTex, ivec3(gl_GlobalInvocationID.xyz), i).x;\n";
603 if (m_data.fragStencil)
604 css << " stencilbuf.b[idx] = texelFetch(stencilTex, ivec3(gl_GlobalInvocationID.xyz), i).x;\n";
610 programCollection.glslSources.add("comp") << glu::ComputeSource(css.str());
613 TestInstance* FSRTestCase::createInstance (Context& context) const
615 return new FSRTestInstance(context, m_data);
618 deInt32 FSRTestInstance::ShadingRateExtentToEnum(VkExtent2D ext) const
620 ext.width = deCtz32(ext.width);
621 ext.height = deCtz32(ext.height);
623 return (ext.width << 2) | ext.height;
626 VkExtent2D FSRTestInstance::ShadingRateEnumToExtent(deInt32 rate) const
629 ret.width = 1 << ((rate/4) & 3);
630 ret.height = 1 << (rate & 3);
635 VkExtent2D FSRTestInstance::Combine(VkExtent2D ext0, VkExtent2D ext1, VkFragmentShadingRateCombinerOpKHR comb) const
643 case VK_FRAGMENT_SHADING_RATE_COMBINER_OP_KEEP_KHR:
645 case VK_FRAGMENT_SHADING_RATE_COMBINER_OP_REPLACE_KHR:
647 case VK_FRAGMENT_SHADING_RATE_COMBINER_OP_MIN_KHR:
648 ret = { de::min(ext0.width, ext1.width), de::min(ext0.height, ext1.height) };
650 case VK_FRAGMENT_SHADING_RATE_COMBINER_OP_MAX_KHR:
651 ret = { de::max(ext0.width, ext1.width), de::max(ext0.height, ext1.height) };
653 case VK_FRAGMENT_SHADING_RATE_COMBINER_OP_MUL_KHR:
654 ret = { ext0.width * ext1.width, ext0.height * ext1.height };
655 if (!m_shadingRateProperties.fragmentShadingRateStrictMultiplyCombiner)
657 if (ext0.width == 1 && ext1.width == 1)
659 if (ext0.height == 1 && ext1.height == 1)
666 deInt32 FSRTestInstance::Simulate(deInt32 rate0, deInt32 rate1, deInt32 rate2)
668 deInt32 &cachedRate = m_simulateCache[(rate2*m_simulateValueCount + rate1)*m_simulateValueCount + rate0];
669 if (cachedRate != ~0)
672 VkExtent2D extent0 = ShadingRateEnumToExtent(rate0);
673 VkExtent2D extent1 = ShadingRateEnumToExtent(rate1);
674 VkExtent2D extent2 = ShadingRateEnumToExtent(rate2);
676 deInt32 finalMask = 0;
677 // Simulate once for implementations that don't allow swapping rate xy,
678 // and once for those that do. Any of those results is allowed.
679 for (deUint32 allowSwap = 0; allowSwap <= 1; ++allowSwap)
681 // Combine rate 0 and 1, get a mask of possible clamped rates
682 VkExtent2D intermed = Combine(extent0, extent1, m_data.combinerOp[0]);
683 deInt32 intermedMask = ShadingRateExtentToClampedMask(intermed, allowSwap == 1);
685 // For each clamped rate, combine that with rate 2 and accumulate the possible clamped rates
686 for (int i = 0; i < 16; ++i)
688 if (intermedMask & (1<<i))
690 VkExtent2D final = Combine(ShadingRateEnumToExtent(i), extent2, m_data.combinerOp[1]);
691 finalMask |= ShadingRateExtentToClampedMask(final, allowSwap == 1);
695 // unclamped intermediate value is also permitted
696 VkExtent2D final = Combine(intermed, extent2, m_data.combinerOp[1]);
697 finalMask |= ShadingRateExtentToClampedMask(final, allowSwap == 1);
704 cachedRate = finalMask;
708 // If a rate is not valid (<=4x4), clamp it to something valid.
709 // This is only used for "inputs" to the system, not to mimic
710 // how the implementation internally clamps intermediate values.
711 VkExtent2D FSRTestInstance::SanitizeExtent(VkExtent2D ext) const
713 DE_ASSERT(ext.width > 0 && ext.height > 0);
715 ext.width = de::min(ext.width, 4u);
716 ext.height = de::min(ext.height, 4u);
721 // Map an extent to a mask of all modes smaller than or equal to it in either dimension
722 deInt32 FSRTestInstance::ShadingRateExtentToClampedMask(VkExtent2D ext, bool allowSwap) const
724 deUint32 desiredSize = ext.width * ext.height;
728 while (desiredSize > 0)
730 // First, find modes that maximize the area
731 for (deUint32 i = 0; i < m_supportedFragmentShadingRateCount; ++i)
733 const VkPhysicalDeviceFragmentShadingRateKHR &supportedRate = m_supportedFragmentShadingRates[i];
734 if ((supportedRate.sampleCounts & m_data.samples) &&
735 supportedRate.fragmentSize.width * supportedRate.fragmentSize.height == desiredSize &&
736 ((supportedRate.fragmentSize.width <= ext.width && supportedRate.fragmentSize.height <= ext.height) ||
737 (supportedRate.fragmentSize.height <= ext.width && supportedRate.fragmentSize.width <= ext.height && allowSwap)))
739 mask |= 1 << ShadingRateExtentToEnum(supportedRate.fragmentSize);
744 // Amongst the modes that maximize the area, pick the ones that
745 // minimize the aspect ratio. Prefer ratio of 1, then 2, then 4.
746 // 1x1 = 0, 2x2 = 5, 4x4 = 10
747 static const deUint32 aspectMaskRatio1 = 0x421;
748 // 2x1 = 4, 1x2 = 1, 4x2 = 9, 2x4 = 6
749 static const deUint32 aspectMaskRatio2 = 0x252;
751 static const deUint32 aspectMaskRatio4 = 0x104;
753 if (mask & aspectMaskRatio1)
755 mask &= aspectMaskRatio1;
758 if (mask & aspectMaskRatio2)
760 mask &= aspectMaskRatio2;
763 if (mask & aspectMaskRatio4)
765 mask &= aspectMaskRatio4;
777 deInt32 FSRTestInstance::SanitizeRate(deInt32 rate) const
779 VkExtent2D extent = ShadingRateEnumToExtent(rate);
781 extent = SanitizeExtent(extent);
783 return ShadingRateExtentToEnum(extent);
786 // Map primID % 9 to primitive shading rate
787 deInt32 FSRTestInstance::PrimIDToPrimitiveShadingRate(deInt32 primID)
789 deInt32 &cachedRate = m_primIDToPrimitiveShadingRate[primID];
790 if (cachedRate != ~0)
794 extent.width = 1 << (primID % 3);
795 extent.height = 1 << ((primID/3) % 3);
797 cachedRate = ShadingRateExtentToEnum(extent);
801 // Map primID / 9 to pipeline shading rate
802 deInt32 FSRTestInstance::PrimIDToPipelineShadingRate(deInt32 primID)
804 deInt32 &cachedRate = m_primIDToPipelineShadingRate[primID];
805 if (cachedRate != ~0)
810 extent.width = 1 << (primID % 3);
811 extent.height = 1 << ((primID/3) % 3);
813 cachedRate = ShadingRateExtentToEnum(extent);
817 static de::MovePtr<BufferWithMemory> CreateCachedBuffer(const vk::DeviceInterface& vk,
818 const vk::VkDevice device,
819 vk::Allocator& allocator,
820 const vk::VkBufferCreateInfo& bufferCreateInfo)
824 return de::MovePtr<BufferWithMemory>(new BufferWithMemory(
825 vk, device, allocator, bufferCreateInfo, MemoryRequirement::HostVisible | MemoryRequirement::Cached));
827 catch (const tcu::NotSupportedError&)
829 return de::MovePtr<BufferWithMemory>(new BufferWithMemory(
830 vk, device, allocator, bufferCreateInfo, MemoryRequirement::HostVisible));
834 tcu::TestStatus FSRTestInstance::iterate (void)
836 const DeviceInterface& vk = m_context.getDeviceInterface();
837 const VkDevice device = m_context.getDevice();
838 tcu::TestLog& log = m_context.getTestContext().getLog();
839 Allocator& allocator = m_context.getDefaultAllocator();
840 VkFlags allShaderStages = VK_SHADER_STAGE_VERTEX_BIT | VK_SHADER_STAGE_FRAGMENT_BIT | VK_SHADER_STAGE_COMPUTE_BIT;
841 VkFlags allPipelineStages = VK_PIPELINE_STAGE_VERTEX_SHADER_BIT |
842 VK_PIPELINE_STAGE_FRAGMENT_SHADER_BIT |
843 VK_PIPELINE_STAGE_COLOR_ATTACHMENT_OUTPUT_BIT |
844 VK_PIPELINE_STAGE_EARLY_FRAGMENT_TESTS_BIT |
845 VK_PIPELINE_STAGE_LATE_FRAGMENT_TESTS_BIT |
846 VK_PIPELINE_STAGE_COMPUTE_SHADER_BIT |
847 VK_IMAGE_USAGE_FRAGMENT_SHADING_RATE_ATTACHMENT_BIT_KHR;
848 const VkFormat cbFormat = VK_FORMAT_R32G32B32A32_UINT;
849 VkFormat dsFormat = VK_FORMAT_UNDEFINED;
851 if (m_data.geometryShader)
853 allShaderStages |= VK_SHADER_STAGE_GEOMETRY_BIT;
854 allPipelineStages |= VK_PIPELINE_STAGE_GEOMETRY_SHADER_BIT;
857 if (m_data.useDepthStencil)
859 VkFormatProperties formatProps;
860 m_context.getInstanceInterface().getPhysicalDeviceFormatProperties(m_context.getPhysicalDevice(), VK_FORMAT_D32_SFLOAT_S8_UINT, &formatProps);
861 if (formatProps.optimalTilingFeatures & VK_FORMAT_FEATURE_DEPTH_STENCIL_ATTACHMENT_BIT)
863 dsFormat = VK_FORMAT_D32_SFLOAT_S8_UINT;
867 dsFormat = VK_FORMAT_D24_UNORM_S8_UINT;
872 deRandom_init(&rnd, m_data.seed);
874 qpTestResult res = QP_TEST_RESULT_PASS;
875 deUint32 numUnexpected1x1Samples = 0;
876 deUint32 numTotalSamples = 0;
880 ATTACHMENT_MODE_DEFAULT = 0,
881 ATTACHMENT_MODE_LAYOUT_OPTIMAL,
882 ATTACHMENT_MODE_IMAGELESS,
883 ATTACHMENT_MODE_2DARRAY,
884 ATTACHMENT_MODE_TILING_LINEAR,
886 ATTACHMENT_MODE_COUNT,
889 deUint32 numSRLayers = m_data.srLayered ? 2u : 1u;
891 VkExtent2D minFragmentShadingRateAttachmentTexelSize = {1, 1};
892 VkExtent2D maxFragmentShadingRateAttachmentTexelSize = {1, 1};
893 deUint32 maxFragmentShadingRateAttachmentTexelSizeAspectRatio = 1;
894 if (m_context.getFragmentShadingRateFeatures().attachmentFragmentShadingRate)
896 minFragmentShadingRateAttachmentTexelSize = m_context.getFragmentShadingRateProperties().minFragmentShadingRateAttachmentTexelSize;
897 maxFragmentShadingRateAttachmentTexelSize = m_context.getFragmentShadingRateProperties().maxFragmentShadingRateAttachmentTexelSize;
898 maxFragmentShadingRateAttachmentTexelSizeAspectRatio = m_context.getFragmentShadingRateProperties().maxFragmentShadingRateAttachmentTexelSizeAspectRatio;
901 VkDeviceSize atomicBufferSize = sizeof(deUint32);
903 de::MovePtr<BufferWithMemory> atomicBuffer;
904 atomicBuffer = de::MovePtr<BufferWithMemory>(new BufferWithMemory(
905 vk, device, allocator, makeBufferCreateInfo(atomicBufferSize, VK_BUFFER_USAGE_TRANSFER_SRC_BIT | VK_BUFFER_USAGE_STORAGE_BUFFER_BIT), MemoryRequirement::HostVisible | MemoryRequirement::Coherent));
907 deUint32 *abuf = (deUint32 *)atomicBuffer->getAllocation().getHostPtr();
909 // NUM_TRIANGLES triangles, 3 vertices, 2 components of float position
910 VkDeviceSize vertexBufferSize = NUM_TRIANGLES * 3 * 2 * sizeof(float);
912 de::MovePtr<BufferWithMemory> vertexBuffer;
913 vertexBuffer = de::MovePtr<BufferWithMemory>(new BufferWithMemory(
914 vk, device, allocator, makeBufferCreateInfo(vertexBufferSize, VK_BUFFER_USAGE_TRANSFER_SRC_BIT | VK_BUFFER_USAGE_VERTEX_BUFFER_BIT), MemoryRequirement::HostVisible | MemoryRequirement::Coherent));
916 float *vbuf = (float *)vertexBuffer->getAllocation().getHostPtr();
917 for (deInt32 i = 0; i < (deInt32)(vertexBufferSize / sizeof(float)); ++i)
919 vbuf[i] = deRandom_getFloat(&rnd)*2.0f - 1.0f;
921 flushAlloc(vk, device, vertexBuffer->getAllocation());
923 VkDeviceSize colorOutputBufferSize = m_data.framebufferDim.width * m_data.framebufferDim.height * m_data.samples * 4 * sizeof(deUint32) * m_data.numColorLayers;
924 de::MovePtr<BufferWithMemory> colorOutputBuffer = CreateCachedBuffer(vk, device, allocator, makeBufferCreateInfo(colorOutputBufferSize, VK_BUFFER_USAGE_TRANSFER_DST_BIT | VK_BUFFER_USAGE_STORAGE_BUFFER_BIT));
926 VkDeviceSize depthOutputBufferSize = 0, stencilOutputBufferSize = 0;
927 de::MovePtr<BufferWithMemory> depthOutputBuffer, stencilOutputBuffer;
928 if (m_data.useDepthStencil)
930 depthOutputBufferSize = m_data.framebufferDim.width * m_data.framebufferDim.height * m_data.samples * sizeof(float) * m_data.numColorLayers;
931 depthOutputBuffer = CreateCachedBuffer(vk, device, allocator, makeBufferCreateInfo(depthOutputBufferSize, VK_BUFFER_USAGE_TRANSFER_DST_BIT | VK_BUFFER_USAGE_STORAGE_BUFFER_BIT));
933 stencilOutputBufferSize = m_data.framebufferDim.width * m_data.framebufferDim.height * m_data.samples * sizeof(deUint32) * m_data.numColorLayers;
934 stencilOutputBuffer = CreateCachedBuffer(vk, device, allocator, makeBufferCreateInfo(stencilOutputBufferSize, VK_BUFFER_USAGE_TRANSFER_DST_BIT | VK_BUFFER_USAGE_STORAGE_BUFFER_BIT));
937 deUint32 minSRTexelWidth = minFragmentShadingRateAttachmentTexelSize.width;
938 deUint32 minSRTexelHeight = minFragmentShadingRateAttachmentTexelSize.height;
939 deUint32 maxSRWidth = (m_data.framebufferDim.width + minSRTexelWidth - 1) / minSRTexelWidth;
940 deUint32 maxSRHeight = (m_data.framebufferDim.height + minSRTexelHeight - 1) / minSRTexelHeight;
942 // max size over all formats
943 VkDeviceSize srFillBufferSize = numSRLayers * maxSRWidth * maxSRHeight * 32/*4 component 64-bit*/;
944 de::MovePtr<BufferWithMemory> srFillBuffer;
945 deUint8 *fillPtr = DE_NULL;
946 if (m_data.useAttachment())
948 srFillBuffer = CreateCachedBuffer(vk, device, allocator, makeBufferCreateInfo(srFillBufferSize, VK_BUFFER_USAGE_TRANSFER_SRC_BIT));
949 fillPtr = (deUint8 *)srFillBuffer->getAllocation().getHostPtr();
952 de::MovePtr<ImageWithMemory> cbImage;
953 Move<VkImageView> cbImageView;
955 const VkImageCreateInfo imageCreateInfo =
957 VK_STRUCTURE_TYPE_IMAGE_CREATE_INFO, // VkStructureType sType;
958 DE_NULL, // const void* pNext;
959 (VkImageCreateFlags)0u, // VkImageCreateFlags flags;
960 VK_IMAGE_TYPE_2D, // VkImageType imageType;
961 cbFormat, // VkFormat format;
963 m_data.framebufferDim.width, // deUint32 width;
964 m_data.framebufferDim.height, // deUint32 height;
965 1u // deUint32 depth;
966 }, // VkExtent3D extent;
967 1u, // deUint32 mipLevels;
968 m_data.numColorLayers, // deUint32 arrayLayers;
969 m_data.samples, // VkSampleCountFlagBits samples;
970 VK_IMAGE_TILING_OPTIMAL, // VkImageTiling tiling;
971 cbUsage, // VkImageUsageFlags usage;
972 VK_SHARING_MODE_EXCLUSIVE, // VkSharingMode sharingMode;
973 0u, // deUint32 queueFamilyIndexCount;
974 DE_NULL, // const deUint32* pQueueFamilyIndices;
975 VK_IMAGE_LAYOUT_UNDEFINED // VkImageLayout initialLayout;
977 cbImage = de::MovePtr<ImageWithMemory>(new ImageWithMemory(
978 vk, device, allocator, imageCreateInfo, MemoryRequirement::Any));
980 VkImageViewCreateInfo imageViewCreateInfo =
982 VK_STRUCTURE_TYPE_IMAGE_VIEW_CREATE_INFO, // VkStructureType sType;
983 DE_NULL, // const void* pNext;
984 (VkImageViewCreateFlags)0u, // VkImageViewCreateFlags flags;
985 **cbImage, // VkImage image;
986 VK_IMAGE_VIEW_TYPE_2D_ARRAY, // VkImageViewType viewType;
987 cbFormat, // VkFormat format;
989 VK_COMPONENT_SWIZZLE_R, // VkComponentSwizzle r;
990 VK_COMPONENT_SWIZZLE_G, // VkComponentSwizzle g;
991 VK_COMPONENT_SWIZZLE_B, // VkComponentSwizzle b;
992 VK_COMPONENT_SWIZZLE_A // VkComponentSwizzle a;
993 }, // VkComponentMapping components;
995 VK_IMAGE_ASPECT_COLOR_BIT, // VkImageAspectFlags aspectMask;
996 0u, // deUint32 baseMipLevel;
997 1u, // deUint32 levelCount;
998 0u, // deUint32 baseArrayLayer;
999 m_data.numColorLayers // deUint32 layerCount;
1000 } // VkImageSubresourceRange subresourceRange;
1002 cbImageView = createImageView(vk, device, &imageViewCreateInfo, NULL);
1005 de::MovePtr<ImageWithMemory> dsImage;
1006 Move<VkImageView> dsImageView, dImageView, sImageView;
1007 VkImageUsageFlags dsUsage = VK_IMAGE_USAGE_DEPTH_STENCIL_ATTACHMENT_BIT |
1008 VK_IMAGE_USAGE_SAMPLED_BIT |
1009 VK_IMAGE_USAGE_TRANSFER_SRC_BIT |
1010 VK_IMAGE_USAGE_TRANSFER_DST_BIT;
1011 if (m_data.useDepthStencil)
1013 const VkImageCreateInfo imageCreateInfo =
1015 VK_STRUCTURE_TYPE_IMAGE_CREATE_INFO, // VkStructureType sType;
1016 DE_NULL, // const void* pNext;
1017 (VkImageCreateFlags)0u, // VkImageCreateFlags flags;
1018 VK_IMAGE_TYPE_2D, // VkImageType imageType;
1019 dsFormat, // VkFormat format;
1021 m_data.framebufferDim.width, // deUint32 width;
1022 m_data.framebufferDim.height, // deUint32 height;
1023 1u // deUint32 depth;
1024 }, // VkExtent3D extent;
1025 1u, // deUint32 mipLevels;
1026 m_data.numColorLayers, // deUint32 arrayLayers;
1027 m_data.samples, // VkSampleCountFlagBits samples;
1028 VK_IMAGE_TILING_OPTIMAL, // VkImageTiling tiling;
1029 dsUsage, // VkImageUsageFlags usage;
1030 VK_SHARING_MODE_EXCLUSIVE, // VkSharingMode sharingMode;
1031 0u, // deUint32 queueFamilyIndexCount;
1032 DE_NULL, // const deUint32* pQueueFamilyIndices;
1033 VK_IMAGE_LAYOUT_UNDEFINED // VkImageLayout initialLayout;
1035 dsImage = de::MovePtr<ImageWithMemory>(new ImageWithMemory(
1036 vk, device, allocator, imageCreateInfo, MemoryRequirement::Any));
1038 VkImageViewCreateInfo imageViewCreateInfo =
1040 VK_STRUCTURE_TYPE_IMAGE_VIEW_CREATE_INFO, // VkStructureType sType;
1041 DE_NULL, // const void* pNext;
1042 (VkImageViewCreateFlags)0u, // VkImageViewCreateFlags flags;
1043 **dsImage, // VkImage image;
1044 VK_IMAGE_VIEW_TYPE_2D_ARRAY, // VkImageViewType viewType;
1045 dsFormat, // VkFormat format;
1047 VK_COMPONENT_SWIZZLE_R, // VkComponentSwizzle r;
1048 VK_COMPONENT_SWIZZLE_G, // VkComponentSwizzle g;
1049 VK_COMPONENT_SWIZZLE_B, // VkComponentSwizzle b;
1050 VK_COMPONENT_SWIZZLE_A // VkComponentSwizzle a;
1051 }, // VkComponentMapping components;
1053 VK_IMAGE_ASPECT_DEPTH_BIT | VK_IMAGE_ASPECT_STENCIL_BIT, // VkImageAspectFlags aspectMask;
1054 0u, // deUint32 baseMipLevel;
1055 1u, // deUint32 levelCount;
1056 0u, // deUint32 baseArrayLayer;
1057 m_data.numColorLayers // deUint32 layerCount;
1058 } // VkImageSubresourceRange subresourceRange;
1060 dsImageView = createImageView(vk, device, &imageViewCreateInfo, NULL);
1061 imageViewCreateInfo.subresourceRange.aspectMask = VK_IMAGE_ASPECT_DEPTH_BIT;
1062 dImageView = createImageView(vk, device, &imageViewCreateInfo, NULL);
1063 imageViewCreateInfo.subresourceRange.aspectMask = VK_IMAGE_ASPECT_STENCIL_BIT;
1064 sImageView = createImageView(vk, device, &imageViewCreateInfo, NULL);
1067 // Image used to test implicit derivative calculations.
1068 // Filled with a value of 1<<lod.
1069 de::MovePtr<ImageWithMemory> derivImage;
1070 Move<VkImageView> derivImageView;
1071 VkImageUsageFlags derivUsage = VK_IMAGE_USAGE_SAMPLED_BIT |
1072 VK_IMAGE_USAGE_TRANSFER_DST_BIT;
1073 deUint32 derivNumLevels;
1075 deUint32 maxDim = de::max(m_context.getFragmentShadingRateProperties().maxFragmentSize.width, m_context.getFragmentShadingRateProperties().maxFragmentSize.height);
1076 derivNumLevels = 1 + deCtz32(maxDim);
1077 const VkImageCreateInfo imageCreateInfo =
1079 VK_STRUCTURE_TYPE_IMAGE_CREATE_INFO, // VkStructureType sType;
1080 DE_NULL, // const void* pNext;
1081 (VkImageCreateFlags)0u, // VkImageCreateFlags flags;
1082 VK_IMAGE_TYPE_2D, // VkImageType imageType;
1083 VK_FORMAT_R32_UINT, // VkFormat format;
1085 m_context.getFragmentShadingRateProperties().maxFragmentSize.width, // deUint32 width;
1086 m_context.getFragmentShadingRateProperties().maxFragmentSize.height, // deUint32 height;
1087 1u // deUint32 depth;
1088 }, // VkExtent3D extent;
1089 derivNumLevels, // deUint32 mipLevels;
1090 1u, // deUint32 arrayLayers;
1091 VK_SAMPLE_COUNT_1_BIT, // VkSampleCountFlagBits samples;
1092 VK_IMAGE_TILING_OPTIMAL, // VkImageTiling tiling;
1093 derivUsage, // VkImageUsageFlags usage;
1094 VK_SHARING_MODE_EXCLUSIVE, // VkSharingMode sharingMode;
1095 0u, // deUint32 queueFamilyIndexCount;
1096 DE_NULL, // const deUint32* pQueueFamilyIndices;
1097 VK_IMAGE_LAYOUT_UNDEFINED // VkImageLayout initialLayout;
1099 derivImage = de::MovePtr<ImageWithMemory>(new ImageWithMemory(
1100 vk, device, allocator, imageCreateInfo, MemoryRequirement::Any));
1102 VkImageViewCreateInfo imageViewCreateInfo =
1104 VK_STRUCTURE_TYPE_IMAGE_VIEW_CREATE_INFO, // VkStructureType sType;
1105 DE_NULL, // const void* pNext;
1106 (VkImageViewCreateFlags)0u, // VkImageViewCreateFlags flags;
1107 **derivImage, // VkImage image;
1108 VK_IMAGE_VIEW_TYPE_2D, // VkImageViewType viewType;
1109 VK_FORMAT_R32_UINT, // VkFormat format;
1111 VK_COMPONENT_SWIZZLE_R, // VkComponentSwizzle r;
1112 VK_COMPONENT_SWIZZLE_G, // VkComponentSwizzle g;
1113 VK_COMPONENT_SWIZZLE_B, // VkComponentSwizzle b;
1114 VK_COMPONENT_SWIZZLE_A // VkComponentSwizzle a;
1115 }, // VkComponentMapping components;
1117 VK_IMAGE_ASPECT_COLOR_BIT, // VkImageAspectFlags aspectMask;
1118 0u, // deUint32 baseMipLevel;
1119 derivNumLevels, // deUint32 levelCount;
1120 0u, // deUint32 baseArrayLayer;
1121 1u // deUint32 layerCount;
1122 } // VkImageSubresourceRange subresourceRange;
1124 derivImageView = createImageView(vk, device, &imageViewCreateInfo, NULL);
1127 // sampler used with derivImage
1128 const struct VkSamplerCreateInfo samplerInfo =
1130 VK_STRUCTURE_TYPE_SAMPLER_CREATE_INFO, // sType
1133 VK_FILTER_NEAREST, // magFilter
1134 VK_FILTER_NEAREST, // minFilter
1135 VK_SAMPLER_MIPMAP_MODE_NEAREST, // mipmapMode
1136 VK_SAMPLER_ADDRESS_MODE_CLAMP_TO_EDGE, // addressModeU
1137 VK_SAMPLER_ADDRESS_MODE_CLAMP_TO_EDGE, // addressModeV
1138 VK_SAMPLER_ADDRESS_MODE_CLAMP_TO_EDGE, // addressModeW
1140 VK_FALSE, // anisotropyEnable
1141 1.0f, // maxAnisotropy
1142 DE_FALSE, // compareEnable
1143 VK_COMPARE_OP_ALWAYS, // compareOp
1145 (float)derivNumLevels, // maxLod
1146 VK_BORDER_COLOR_INT_TRANSPARENT_BLACK, // borderColor
1147 VK_FALSE, // unnormalizedCoords
1150 Move<VkSampler> sampler = createSampler(vk, device, &samplerInfo);
1152 Move<vk::VkDescriptorSetLayout> descriptorSetLayout;
1153 VkDescriptorSetLayoutCreateFlags layoutCreateFlags = 0;
1155 const VkDescriptorSetLayoutBinding bindings[] =
1159 VK_DESCRIPTOR_TYPE_STORAGE_BUFFER, // descriptorType
1160 1u, // descriptorCount
1161 allShaderStages, // stageFlags
1162 DE_NULL, // pImmutableSamplers
1166 VK_DESCRIPTOR_TYPE_SAMPLED_IMAGE, // descriptorType
1167 1u, // descriptorCount
1168 allShaderStages, // stageFlags
1169 DE_NULL, // pImmutableSamplers
1173 VK_DESCRIPTOR_TYPE_STORAGE_BUFFER, // descriptorType
1174 1u, // descriptorCount
1175 allShaderStages, // stageFlags
1176 DE_NULL, // pImmutableSamplers
1180 VK_DESCRIPTOR_TYPE_COMBINED_IMAGE_SAMPLER, // descriptorType
1181 1u, // descriptorCount
1182 allShaderStages, // stageFlags
1183 DE_NULL, // pImmutableSamplers
1187 VK_DESCRIPTOR_TYPE_STORAGE_BUFFER, // descriptorType
1188 1u, // descriptorCount
1189 allShaderStages, // stageFlags
1190 DE_NULL, // pImmutableSamplers
1194 VK_DESCRIPTOR_TYPE_STORAGE_BUFFER, // descriptorType
1195 1u, // descriptorCount
1196 allShaderStages, // stageFlags
1197 DE_NULL, // pImmutableSamplers
1201 VK_DESCRIPTOR_TYPE_SAMPLED_IMAGE, // descriptorType
1202 1u, // descriptorCount
1203 allShaderStages, // stageFlags
1204 DE_NULL, // pImmutableSamplers
1208 VK_DESCRIPTOR_TYPE_SAMPLED_IMAGE, // descriptorType
1209 1u, // descriptorCount
1210 allShaderStages, // stageFlags
1211 DE_NULL, // pImmutableSamplers
1215 // Create a layout and allocate a descriptor set for it.
1216 const VkDescriptorSetLayoutCreateInfo setLayoutCreateInfo =
1218 vk::VK_STRUCTURE_TYPE_DESCRIPTOR_SET_LAYOUT_CREATE_INFO, // sType
1220 layoutCreateFlags, // flags
1221 sizeof(bindings)/sizeof(bindings[0]), // bindingCount
1222 &bindings[0] // pBindings
1225 descriptorSetLayout = vk::createDescriptorSetLayout(vk, device, &setLayoutCreateInfo);
1227 const VkPushConstantRange pushConstantRange =
1229 allShaderStages, // VkShaderStageFlags stageFlags;
1230 0u, // deUint32 offset;
1231 sizeof(deInt32) // deUint32 size;
1234 const VkPipelineLayoutCreateInfo pipelineLayoutCreateInfo =
1236 VK_STRUCTURE_TYPE_PIPELINE_LAYOUT_CREATE_INFO, // sType
1238 (VkPipelineLayoutCreateFlags)0,
1239 1, // setLayoutCount
1240 &descriptorSetLayout.get(), // pSetLayouts
1241 1u, // pushConstantRangeCount
1242 &pushConstantRange, // pPushConstantRanges
1245 Move<VkPipelineLayout> pipelineLayout = createPipelineLayout(vk, device, &pipelineLayoutCreateInfo, NULL);
1247 const Unique<VkShaderModule> cs (createShaderModule(vk, device, m_context.getBinaryCollection().get("comp"), 0));
1249 const VkPipelineShaderStageCreateInfo csShaderCreateInfo =
1251 VK_STRUCTURE_TYPE_PIPELINE_SHADER_STAGE_CREATE_INFO,
1253 (VkPipelineShaderStageCreateFlags)0,
1254 VK_SHADER_STAGE_COMPUTE_BIT, // stage
1257 DE_NULL, // pSpecializationInfo
1260 const VkComputePipelineCreateInfo pipelineCreateInfo =
1262 VK_STRUCTURE_TYPE_COMPUTE_PIPELINE_CREATE_INFO,
1265 csShaderCreateInfo, // cs
1266 *pipelineLayout, // layout
1267 (vk::VkPipeline)0, // basePipelineHandle
1268 0u, // basePipelineIndex
1270 Move<VkPipeline> computePipeline = createComputePipeline(vk, device, DE_NULL, &pipelineCreateInfo, NULL);
1272 for (deUint32 modeIdx = 0; modeIdx < ATTACHMENT_MODE_COUNT; ++modeIdx)
1274 // If we're not using an attachment, don't test all the different attachment modes
1275 if (modeIdx != ATTACHMENT_MODE_DEFAULT && !m_data.useAttachment())
1278 // Consider all uint formats possible
1279 static const VkFormat srFillFormats[] =
1282 VK_FORMAT_R8G8_UINT,
1283 VK_FORMAT_R8G8B8_UINT,
1284 VK_FORMAT_R8G8B8A8_UINT,
1286 VK_FORMAT_R16G16_UINT,
1287 VK_FORMAT_R16G16B16_UINT,
1288 VK_FORMAT_R16G16B16A16_UINT,
1290 VK_FORMAT_R32G32_UINT,
1291 VK_FORMAT_R32G32B32_UINT,
1292 VK_FORMAT_R32G32B32A32_UINT,
1294 VK_FORMAT_R64G64_UINT,
1295 VK_FORMAT_R64G64B64_UINT,
1296 VK_FORMAT_R64G64B64A64_UINT,
1298 // Only test all formats in the default mode
1299 deUint32 numFillFormats = modeIdx == ATTACHMENT_MODE_DEFAULT ? (deUint32)(sizeof(srFillFormats)/sizeof(srFillFormats[0])) : 1u;
1301 // Iterate over all supported tile sizes and formats
1302 for (deUint32 srTexelWidth = minFragmentShadingRateAttachmentTexelSize.width;
1303 srTexelWidth <= maxFragmentShadingRateAttachmentTexelSize.width;
1305 for (deUint32 srTexelHeight = minFragmentShadingRateAttachmentTexelSize.height;
1306 srTexelHeight <= maxFragmentShadingRateAttachmentTexelSize.height;
1308 for (deUint32 formatIdx = 0; formatIdx < numFillFormats; ++formatIdx)
1310 deUint32 aspectRatio = (srTexelHeight > srTexelWidth) ? (srTexelHeight / srTexelWidth) : (srTexelWidth / srTexelHeight);
1311 if (aspectRatio > maxFragmentShadingRateAttachmentTexelSizeAspectRatio)
1314 // Go through the loop only once when not using an attachment
1315 if (!m_data.useAttachment() &&
1316 (srTexelWidth != minFragmentShadingRateAttachmentTexelSize.width ||
1317 srTexelHeight != minFragmentShadingRateAttachmentTexelSize.height ||
1321 bool imagelessFB = modeIdx == ATTACHMENT_MODE_IMAGELESS;
1323 deUint32 srWidth = (m_data.framebufferDim.width + srTexelWidth - 1) / srTexelWidth;
1324 deUint32 srHeight = (m_data.framebufferDim.height + srTexelHeight - 1) / srTexelHeight;
1326 VkFormat srFormat = srFillFormats[formatIdx];
1327 deUint32 srFillBpp = tcu::getPixelSize(mapVkFormat(srFormat));
1329 VkImageLayout srLayout = modeIdx == ATTACHMENT_MODE_LAYOUT_OPTIMAL ? VK_IMAGE_LAYOUT_FRAGMENT_SHADING_RATE_ATTACHMENT_OPTIMAL_KHR : VK_IMAGE_LAYOUT_GENERAL;
1330 VkImageViewType srViewType = (modeIdx == ATTACHMENT_MODE_2DARRAY || numSRLayers > 1u) ? VK_IMAGE_VIEW_TYPE_2D_ARRAY : VK_IMAGE_VIEW_TYPE_2D;
1331 VkImageTiling srTiling = (modeIdx == ATTACHMENT_MODE_TILING_LINEAR) ? VK_IMAGE_TILING_LINEAR : VK_IMAGE_TILING_OPTIMAL;
1333 VkFormatProperties srFormatProperties;
1334 m_context.getInstanceInterface().getPhysicalDeviceFormatProperties(m_context.getPhysicalDevice(), srFormat, &srFormatProperties);
1335 VkFormatFeatureFlags srFormatFeatures = srTiling == VK_IMAGE_TILING_LINEAR ? srFormatProperties.linearTilingFeatures : srFormatProperties.optimalTilingFeatures;
1337 if (m_context.getFragmentShadingRateFeatures().attachmentFragmentShadingRate &&
1338 !(srFormatFeatures & VK_FORMAT_FEATURE_FRAGMENT_SHADING_RATE_ATTACHMENT_BIT_KHR))
1340 if (srFormat == VK_FORMAT_R8_UINT && srTiling == VK_IMAGE_TILING_OPTIMAL)
1342 log << tcu::TestLog::Message << "VK_FORMAT_R8_UINT/VK_IMAGE_TILING_OPTIMAL don't support VK_FORMAT_FEATURE_FRAGMENT_SHADING_RATE_ATTACHMENT_BIT_KHR" << tcu::TestLog::EndMessage;
1343 res = QP_TEST_RESULT_FAIL;
1348 Move<vk::VkDescriptorPool> descriptorPool;
1349 Move<vk::VkDescriptorSet> descriptorSet;
1350 VkDescriptorPoolCreateFlags poolCreateFlags = VK_DESCRIPTOR_POOL_CREATE_FREE_DESCRIPTOR_SET_BIT;
1352 vk::DescriptorPoolBuilder poolBuilder;
1353 for (deInt32 i = 0; i < (deInt32)(sizeof(bindings)/sizeof(bindings[0])); ++i)
1354 poolBuilder.addType(bindings[i].descriptorType, bindings[i].descriptorCount);
1356 descriptorPool = poolBuilder.build(vk, device, poolCreateFlags, 1u);
1357 descriptorSet = makeDescriptorSet(vk, device, *descriptorPool, *descriptorSetLayout);
1359 de::MovePtr<ImageWithMemory> srImage;
1360 Move<VkImageView> srImageView;
1361 VkImageUsageFlags srUsage = VK_IMAGE_USAGE_FRAGMENT_SHADING_RATE_ATTACHMENT_BIT_KHR |
1362 VK_IMAGE_USAGE_TRANSFER_DST_BIT |
1363 VK_IMAGE_USAGE_TRANSFER_SRC_BIT;
1365 if (m_data.useAttachment())
1367 const VkImageCreateInfo imageCreateInfo =
1369 VK_STRUCTURE_TYPE_IMAGE_CREATE_INFO, // VkStructureType sType;
1370 DE_NULL, // const void* pNext;
1371 (VkImageCreateFlags)0u, // VkImageCreateFlags flags;
1372 VK_IMAGE_TYPE_2D, // VkImageType imageType;
1373 srFormat, // VkFormat format;
1375 srWidth, // deUint32 width;
1376 srHeight, // deUint32 height;
1377 1u // deUint32 depth;
1378 }, // VkExtent3D extent;
1379 1u, // deUint32 mipLevels;
1380 numSRLayers, // deUint32 arrayLayers;
1381 VK_SAMPLE_COUNT_1_BIT, // VkSampleCountFlagBits samples;
1382 srTiling, // VkImageTiling tiling;
1383 srUsage, // VkImageUsageFlags usage;
1384 VK_SHARING_MODE_EXCLUSIVE, // VkSharingMode sharingMode;
1385 0u, // deUint32 queueFamilyIndexCount;
1386 DE_NULL, // const deUint32* pQueueFamilyIndices;
1387 VK_IMAGE_LAYOUT_UNDEFINED // VkImageLayout initialLayout;
1389 srImage = de::MovePtr<ImageWithMemory>(new ImageWithMemory(
1390 vk, device, allocator, imageCreateInfo, MemoryRequirement::Any));
1392 VkImageViewCreateInfo imageViewCreateInfo =
1394 VK_STRUCTURE_TYPE_IMAGE_VIEW_CREATE_INFO, // VkStructureType sType;
1395 DE_NULL, // const void* pNext;
1396 (VkImageViewCreateFlags)0u, // VkImageViewCreateFlags flags;
1397 **srImage, // VkImage image;
1398 srViewType, // VkImageViewType viewType;
1399 srFormat, // VkFormat format;
1401 VK_COMPONENT_SWIZZLE_R, // VkComponentSwizzle r;
1402 VK_COMPONENT_SWIZZLE_G, // VkComponentSwizzle g;
1403 VK_COMPONENT_SWIZZLE_B, // VkComponentSwizzle b;
1404 VK_COMPONENT_SWIZZLE_A // VkComponentSwizzle a;
1405 }, // VkComponentMapping components;
1407 VK_IMAGE_ASPECT_COLOR_BIT, // VkImageAspectFlags aspectMask;
1408 0u, // deUint32 baseMipLevel;
1409 1u, // deUint32 levelCount;
1410 0u, // deUint32 baseArrayLayer;
1411 srViewType == VK_IMAGE_VIEW_TYPE_2D ?
1412 1 : numSRLayers, // deUint32 layerCount;
1413 } // VkImageSubresourceRange subresourceRange;
1415 srImageView = createImageView(vk, device, &imageViewCreateInfo, NULL);
1418 VkDescriptorImageInfo imageInfo;
1419 VkDescriptorBufferInfo bufferInfo;
1421 VkWriteDescriptorSet w =
1423 VK_STRUCTURE_TYPE_WRITE_DESCRIPTOR_SET, // sType
1425 *descriptorSet, // dstSet
1426 (deUint32)0, // dstBinding
1427 0, // dstArrayElement
1428 1u, // descriptorCount
1429 bindings[0].descriptorType, // descriptorType
1430 &imageInfo, // pImageInfo
1431 &bufferInfo, // pBufferInfo
1432 DE_NULL, // pTexelBufferView
1436 flushAlloc(vk, device, atomicBuffer->getAllocation());
1438 bufferInfo = makeDescriptorBufferInfo(**atomicBuffer, 0, atomicBufferSize);
1440 w.descriptorType = bindings[0].descriptorType;
1441 vk.updateDescriptorSets(device, 1, &w, 0, NULL);
1443 imageInfo = makeDescriptorImageInfo(DE_NULL, *cbImageView, VK_IMAGE_LAYOUT_GENERAL);
1445 w.descriptorType = bindings[1].descriptorType;
1446 vk.updateDescriptorSets(device, 1, &w, 0, NULL);
1448 bufferInfo = makeDescriptorBufferInfo(**colorOutputBuffer, 0, colorOutputBufferSize);
1450 w.descriptorType = bindings[2].descriptorType;
1451 vk.updateDescriptorSets(device, 1, &w, 0, NULL);
1453 imageInfo = makeDescriptorImageInfo(*sampler, *derivImageView, VK_IMAGE_LAYOUT_GENERAL);
1455 w.descriptorType = bindings[3].descriptorType;
1456 vk.updateDescriptorSets(device, 1, &w, 0, NULL);
1458 if (m_data.useDepthStencil)
1460 bufferInfo = makeDescriptorBufferInfo(**depthOutputBuffer, 0, depthOutputBufferSize);
1462 w.descriptorType = bindings[4].descriptorType;
1463 vk.updateDescriptorSets(device, 1, &w, 0, NULL);
1465 bufferInfo = makeDescriptorBufferInfo(**stencilOutputBuffer, 0, stencilOutputBufferSize);
1467 w.descriptorType = bindings[5].descriptorType;
1468 vk.updateDescriptorSets(device, 1, &w, 0, NULL);
1470 imageInfo = makeDescriptorImageInfo(DE_NULL, *dImageView, VK_IMAGE_LAYOUT_GENERAL);
1472 w.descriptorType = bindings[6].descriptorType;
1473 vk.updateDescriptorSets(device, 1, &w, 0, NULL);
1475 imageInfo = makeDescriptorImageInfo(DE_NULL, *sImageView, VK_IMAGE_LAYOUT_GENERAL);
1477 w.descriptorType = bindings[7].descriptorType;
1478 vk.updateDescriptorSets(device, 1, &w, 0, NULL);
1481 Move<VkRenderPass> renderPass;
1482 Move<VkFramebuffer> framebuffer;
1484 std::vector<VkImageView> attachments;
1485 attachments.push_back(*cbImageView);
1486 deUint32 dsAttachmentIdx = 0, srAttachmentIdx = 0;
1487 if (m_data.useAttachment())
1489 srAttachmentIdx = (deUint32)attachments.size();
1490 attachments.push_back(*srImageView);
1492 if (m_data.useDepthStencil)
1494 dsAttachmentIdx = (deUint32)attachments.size();
1495 attachments.push_back(*dsImageView);
1498 if (!m_data.groupParams->useDynamicRendering)
1500 const vk::VkAttachmentReference2 colorAttachmentReference
1502 VK_STRUCTURE_TYPE_ATTACHMENT_REFERENCE_2, // sType
1505 vk::VK_IMAGE_LAYOUT_GENERAL, // layout
1509 const vk::VkAttachmentReference2 fragmentShadingRateAttachment =
1511 VK_STRUCTURE_TYPE_ATTACHMENT_REFERENCE_2, // sType
1513 srAttachmentIdx, // attachment
1518 const vk::VkAttachmentReference2 depthAttachmentReference =
1520 VK_STRUCTURE_TYPE_ATTACHMENT_REFERENCE_2, // sType
1522 dsAttachmentIdx, // attachment
1523 vk::VK_IMAGE_LAYOUT_GENERAL, // layout
1527 const bool noAttachmentPtr = (m_data.attachmentUsage == AttachmentUsage::NO_ATTACHMENT_PTR);
1528 const VkFragmentShadingRateAttachmentInfoKHR shadingRateAttachmentInfo =
1530 VK_STRUCTURE_TYPE_FRAGMENT_SHADING_RATE_ATTACHMENT_INFO_KHR, // VkStructureType sType;
1531 DE_NULL, // const void* pNext;
1532 (noAttachmentPtr ? nullptr : &fragmentShadingRateAttachment), // const VkAttachmentReference2* pFragmentShadingRateAttachment;
1533 { srTexelWidth, srTexelHeight }, // VkExtent2D shadingRateAttachmentTexelSize;
1536 const bool useAttachmentInfo = (m_data.attachmentUsage != AttachmentUsage::NO_ATTACHMENT);
1537 const VkSubpassDescription2 subpassDesc =
1539 VK_STRUCTURE_TYPE_SUBPASS_DESCRIPTION_2, // sType
1540 (useAttachmentInfo ? &shadingRateAttachmentInfo : nullptr), // pNext;
1541 (vk::VkSubpassDescriptionFlags)0, // flags
1542 vk::VK_PIPELINE_BIND_POINT_GRAPHICS, // pipelineBindPoint
1543 m_data.multiView ? 0x3 : 0u, // viewMask
1545 DE_NULL, // pInputAttachments
1547 &colorAttachmentReference, // pColorAttachments
1548 DE_NULL, // pResolveAttachments
1549 m_data.useDepthStencil ? &depthAttachmentReference : DE_NULL, // depthStencilAttachment
1550 0u, // preserveCount
1551 DE_NULL, // pPreserveAttachments
1554 std::vector<VkAttachmentDescription2> attachmentDescriptions
1557 VK_STRUCTURE_TYPE_ATTACHMENT_DESCRIPTION_2, // VkStructureType sType;
1558 DE_NULL, // const void* pNext;
1559 (VkAttachmentDescriptionFlags)0u, // VkAttachmentDescriptionFlags flags;
1560 cbFormat, // VkFormat format;
1561 m_data.samples, // VkSampleCountFlagBits samples;
1562 VK_ATTACHMENT_LOAD_OP_LOAD, // VkAttachmentLoadOp loadOp;
1563 VK_ATTACHMENT_STORE_OP_STORE, // VkAttachmentStoreOp storeOp;
1564 VK_ATTACHMENT_LOAD_OP_DONT_CARE, // VkAttachmentLoadOp stencilLoadOp;
1565 VK_ATTACHMENT_STORE_OP_DONT_CARE, // VkAttachmentStoreOp stencilStoreOp;
1566 VK_IMAGE_LAYOUT_GENERAL, // VkImageLayout initialLayout;
1567 VK_IMAGE_LAYOUT_GENERAL // VkImageLayout finalLayout;
1570 if (m_data.useAttachment())
1571 attachmentDescriptions.push_back(
1573 VK_STRUCTURE_TYPE_ATTACHMENT_DESCRIPTION_2, // VkStructureType sType;
1574 DE_NULL, // const void* pNext;
1575 (VkAttachmentDescriptionFlags)0u, // VkAttachmentDescriptionFlags flags;
1576 srFormat, // VkFormat format;
1577 VK_SAMPLE_COUNT_1_BIT, // VkSampleCountFlagBits samples;
1578 VK_ATTACHMENT_LOAD_OP_LOAD, // VkAttachmentLoadOp loadOp;
1579 VK_ATTACHMENT_STORE_OP_STORE, // VkAttachmentStoreOp storeOp;
1580 VK_ATTACHMENT_LOAD_OP_DONT_CARE, // VkAttachmentLoadOp stencilLoadOp;
1581 VK_ATTACHMENT_STORE_OP_DONT_CARE, // VkAttachmentStoreOp stencilStoreOp;
1582 srLayout, // VkImageLayout initialLayout;
1583 srLayout // VkImageLayout finalLayout;
1587 if (m_data.useDepthStencil)
1588 attachmentDescriptions.push_back(
1590 VK_STRUCTURE_TYPE_ATTACHMENT_DESCRIPTION_2, // VkStructureType sType;
1591 DE_NULL, // const void* pNext;
1592 (VkAttachmentDescriptionFlags)0u, // VkAttachmentDescriptionFlags flags;
1593 dsFormat, // VkFormat format;
1594 m_data.samples, // VkSampleCountFlagBits samples;
1595 VK_ATTACHMENT_LOAD_OP_LOAD, // VkAttachmentLoadOp loadOp;
1596 VK_ATTACHMENT_STORE_OP_STORE, // VkAttachmentStoreOp storeOp;
1597 VK_ATTACHMENT_LOAD_OP_LOAD, // VkAttachmentLoadOp stencilLoadOp;
1598 VK_ATTACHMENT_STORE_OP_STORE, // VkAttachmentStoreOp stencilStoreOp;
1599 VK_IMAGE_LAYOUT_GENERAL, // VkImageLayout initialLayout;
1600 VK_IMAGE_LAYOUT_GENERAL // VkImageLayout finalLayout;
1604 const deUint32 correlatedViewMask = 0x3;
1605 const VkRenderPassCreateInfo2 renderPassParams =
1607 VK_STRUCTURE_TYPE_RENDER_PASS_CREATE_INFO_2, // sType
1609 (vk::VkRenderPassCreateFlags)0,
1610 (deUint32)attachmentDescriptions.size(), // attachmentCount
1611 &attachmentDescriptions[0], // pAttachments
1613 &subpassDesc, // pSubpasses
1614 0u, // dependencyCount
1615 DE_NULL, // pDependencies
1616 m_data.correlationMask, // correlatedViewMaskCount
1617 m_data.correlationMask ? &correlatedViewMask : DE_NULL // pCorrelatedViewMasks
1620 renderPass = createRenderPass2(vk, device, &renderPassParams);
1622 std::vector<VkFramebufferAttachmentImageInfo> framebufferAttachmentImageInfo;
1623 framebufferAttachmentImageInfo.push_back(
1625 VK_STRUCTURE_TYPE_FRAMEBUFFER_ATTACHMENT_IMAGE_INFO, // VkStructureType sType;
1626 DE_NULL, // const void* pNext;
1627 (VkImageCreateFlags)0u, // VkImageCreateFlags flags;
1628 cbUsage, // VkImageUsageFlags usage;
1629 m_data.framebufferDim.width, // deUint32 width;
1630 m_data.framebufferDim.height, // deUint32 height;
1631 m_data.numColorLayers, // deUint32 layerCount;
1632 1u, // deUint32 viewFormatCount;
1633 &cbFormat // const VkFormat* pViewFormats;
1636 if (m_data.useAttachment())
1637 framebufferAttachmentImageInfo.push_back(
1639 VK_STRUCTURE_TYPE_FRAMEBUFFER_ATTACHMENT_IMAGE_INFO, // VkStructureType sType;
1640 DE_NULL, // const void* pNext;
1641 (VkImageCreateFlags)0u, // VkImageCreateFlags flags;
1642 srUsage, // VkImageUsageFlags usage;
1643 srWidth, // deUint32 width;
1644 srHeight, // deUint32 height;
1645 numSRLayers, // deUint32 layerCount;
1646 srViewType == VK_IMAGE_VIEW_TYPE_2D ? 1 : numSRLayers, // deUint32 viewFormatCount;
1647 &srFormat // const VkFormat* pViewFormats;
1651 if (m_data.useDepthStencil)
1652 framebufferAttachmentImageInfo.push_back(
1654 VK_STRUCTURE_TYPE_FRAMEBUFFER_ATTACHMENT_IMAGE_INFO, // VkStructureType sType;
1655 DE_NULL, // const void* pNext;
1656 (VkImageCreateFlags)0u, // VkImageCreateFlags flags;
1657 dsUsage, // VkImageUsageFlags usage;
1658 m_data.framebufferDim.width, // deUint32 width;
1659 m_data.framebufferDim.height, // deUint32 height;
1660 m_data.numColorLayers, // deUint32 layerCount;
1661 1u, // deUint32 viewFormatCount;
1662 &dsFormat // const VkFormat* pViewFormats;
1666 const VkFramebufferAttachmentsCreateInfo framebufferAttachmentsCreateInfo =
1668 VK_STRUCTURE_TYPE_FRAMEBUFFER_ATTACHMENTS_CREATE_INFO, // VkStructureType sType;
1669 DE_NULL, // const void* pNext;
1670 (deUint32)framebufferAttachmentImageInfo.size(), // deUint32 attachmentImageInfoCount;
1671 &framebufferAttachmentImageInfo[0] // const VkFramebufferAttachmentImageInfo* pAttachmentImageInfos;
1674 const vk::VkFramebufferCreateInfo framebufferParams =
1676 vk::VK_STRUCTURE_TYPE_FRAMEBUFFER_CREATE_INFO, // sType
1677 imagelessFB ? &framebufferAttachmentsCreateInfo : DE_NULL, // pNext
1678 (vk::VkFramebufferCreateFlags)(imagelessFB ? VK_FRAMEBUFFER_CREATE_IMAGELESS_BIT : 0),
1679 *renderPass, // renderPass
1680 (deUint32)attachments.size(), // attachmentCount
1681 imagelessFB ? DE_NULL : &attachments[0], // pAttachments
1682 m_data.framebufferDim.width, // width
1683 m_data.framebufferDim.height, // height
1684 m_data.multiView ? 1 : m_data.numColorLayers, // layers
1687 framebuffer = createFramebuffer(vk, device, &framebufferParams);
1690 const VkVertexInputBindingDescription vertexBinding =
1692 0u, // deUint32 binding;
1693 sizeof(float) * 2, // deUint32 stride;
1694 VK_VERTEX_INPUT_RATE_VERTEX // VkVertexInputRate inputRate;
1696 const VkVertexInputAttributeDescription vertexInputAttributeDescription =
1698 0u, // deUint32 location;
1699 0u, // deUint32 binding;
1700 VK_FORMAT_R32G32_SFLOAT, // VkFormat format;
1701 0u // deUint32 offset;
1704 const VkPipelineVertexInputStateCreateInfo vertexInputStateCreateInfo =
1706 VK_STRUCTURE_TYPE_PIPELINE_VERTEX_INPUT_STATE_CREATE_INFO, // VkStructureType sType;
1707 DE_NULL, // const void* pNext;
1708 (VkPipelineVertexInputStateCreateFlags)0, // VkPipelineVertexInputStateCreateFlags flags;
1709 1u, // deUint32 vertexBindingDescriptionCount;
1710 &vertexBinding, // const VkVertexInputBindingDescription* pVertexBindingDescriptions;
1711 1u, // deUint32 vertexAttributeDescriptionCount;
1712 &vertexInputAttributeDescription // const VkVertexInputAttributeDescription* pVertexAttributeDescriptions;
1715 const VkPipelineRasterizationConservativeStateCreateInfoEXT consRastState =
1717 VK_STRUCTURE_TYPE_PIPELINE_RASTERIZATION_CONSERVATIVE_STATE_CREATE_INFO_EXT, // VkStructureType sType;
1718 DE_NULL, // const void* pNext;
1719 (VkPipelineRasterizationConservativeStateCreateFlagsEXT)0, // VkPipelineRasterizationConservativeStateCreateFlagsEXT flags;
1720 m_data.conservativeMode, // VkConservativeRasterizationModeEXT conservativeRasterizationMode;
1721 0.0f, // float extraPrimitiveOverestimationSize;
1724 const VkPipelineRasterizationStateCreateInfo rasterizationStateCreateInfo =
1726 VK_STRUCTURE_TYPE_PIPELINE_RASTERIZATION_STATE_CREATE_INFO, // VkStructureType sType;
1727 m_data.conservativeEnable ? &consRastState : DE_NULL, // const void* pNext;
1728 (VkPipelineRasterizationStateCreateFlags)0, // VkPipelineRasterizationStateCreateFlags flags;
1729 VK_FALSE, // VkBool32 depthClampEnable;
1730 VK_FALSE, // VkBool32 rasterizerDiscardEnable;
1731 VK_POLYGON_MODE_FILL, // VkPolygonMode polygonMode;
1732 VK_CULL_MODE_NONE, // VkCullModeFlags cullMode;
1733 VK_FRONT_FACE_CLOCKWISE, // VkFrontFace frontFace;
1734 VK_FALSE, // VkBool32 depthBiasEnable;
1735 0.0f, // float depthBiasConstantFactor;
1736 0.0f, // float depthBiasClamp;
1737 0.0f, // float depthBiasSlopeFactor;
1738 1.0f // float lineWidth;
1741 // Kill some bits from each AA mode
1742 const VkSampleMask sampleMask = m_data.sampleMaskTest ? 0x9 : 0x7D56;
1743 const VkSampleMask* pSampleMask = m_data.useApiSampleMask ? &sampleMask : DE_NULL;
1745 // All samples at pixel center. We'll validate that pixels are fully covered or uncovered.
1746 std::vector<VkSampleLocationEXT> sampleLocations(m_data.samples, { 0.5f, 0.5f });
1747 const VkSampleLocationsInfoEXT sampleLocationsInfo =
1749 VK_STRUCTURE_TYPE_SAMPLE_LOCATIONS_INFO_EXT, // VkStructureType sType;
1750 DE_NULL, // const void* pNext;
1751 (VkSampleCountFlagBits)m_data.samples, // VkSampleCountFlagBits sampleLocationsPerPixel;
1752 { 1, 1 }, // VkExtent2D sampleLocationGridSize;
1753 (deUint32)m_data.samples, // uint32_t sampleLocationsCount;
1754 &sampleLocations[0], // const VkSampleLocationEXT* pSampleLocations;
1757 const VkPipelineSampleLocationsStateCreateInfoEXT pipelineSampleLocationsCreateInfo =
1759 VK_STRUCTURE_TYPE_PIPELINE_SAMPLE_LOCATIONS_STATE_CREATE_INFO_EXT, // VkStructureType sType;
1760 DE_NULL, // const void* pNext;
1761 VK_TRUE, // VkBool32 sampleLocationsEnable;
1762 sampleLocationsInfo, // VkSampleLocationsInfoEXT sampleLocationsInfo;
1765 const VkPipelineMultisampleStateCreateInfo multisampleStateCreateInfo =
1767 VK_STRUCTURE_TYPE_PIPELINE_MULTISAMPLE_STATE_CREATE_INFO, // VkStructureType sType
1768 m_data.sampleLocations ? &pipelineSampleLocationsCreateInfo : DE_NULL, // const void* pNext
1769 0u, // VkPipelineMultisampleStateCreateFlags flags
1770 (VkSampleCountFlagBits)m_data.samples, // VkSampleCountFlagBits rasterizationSamples
1771 (VkBool32)m_data.sampleShadingEnable, // VkBool32 sampleShadingEnable
1772 1.0f, // float minSampleShading
1773 pSampleMask, // const VkSampleMask* pSampleMask
1774 VK_FALSE, // VkBool32 alphaToCoverageEnable
1775 VK_FALSE // VkBool32 alphaToOneEnable
1778 std::vector<VkViewport> viewports;
1779 std::vector<VkRect2D> scissors;
1780 if (m_data.multiViewport)
1782 // Split the viewport into left and right halves
1783 int x0 = 0, x1 = m_data.framebufferDim.width/2, x2 = m_data.framebufferDim.width;
1785 viewports.push_back(makeViewport((float)x0, 0, std::max((float)(x1 - x0), 1.0f), (float)m_data.framebufferDim.height, 0.0f, 1.0f));
1786 scissors.push_back(makeRect2D(x0, 0, x1 - x0, m_data.framebufferDim.height));
1788 viewports.push_back(makeViewport((float)x1, 0, std::max((float)(x2 - x1), 1.0f), (float)m_data.framebufferDim.height, 0.0f, 1.0f));
1789 scissors.push_back(makeRect2D(x1, 0, x2 - x1, m_data.framebufferDim.height));
1793 viewports.push_back(makeViewport(m_data.framebufferDim.width, m_data.framebufferDim.height));
1794 scissors.push_back(makeRect2D(m_data.framebufferDim.width, m_data.framebufferDim.height));
1797 Move<VkShaderModule> fragShader = createShaderModule(vk, device, m_context.getBinaryCollection().get("frag"), 0);
1798 Move<VkShaderModule> vertShader = createShaderModule(vk, device, m_context.getBinaryCollection().get("vert"), 0);
1799 Move<VkShaderModule> geomShader;
1800 if (m_data.geometryShader)
1801 geomShader = createShaderModule(vk, device, m_context.getBinaryCollection().get("geom"), 0);
1803 const deUint32 fragSizeWH = m_data.sampleMaskTest ? 2 : 0;
1805 #ifndef CTS_USES_VULKANSC
1806 VkPipelineRenderingCreateInfoKHR renderingCreateInfo
1808 VK_STRUCTURE_TYPE_PIPELINE_RENDERING_CREATE_INFO_KHR,
1810 m_data.multiView ? 0x3 : 0u,
1816 #endif // CTS_USES_VULKANSC
1818 VkPipelineFragmentShadingRateStateCreateInfoKHR shadingRateStateCreateInfo
1820 VK_STRUCTURE_TYPE_PIPELINE_FRAGMENT_SHADING_RATE_STATE_CREATE_INFO_KHR, // VkStructureType sType;
1821 #ifndef CTS_USES_VULKANSC
1822 m_data.groupParams->useDynamicRendering ? &renderingCreateInfo : DE_NULL, // const void* pNext;
1824 DE_NULL, // const void* pNext;
1825 #endif // CTS_USES_VULKANSC
1826 { fragSizeWH, fragSizeWH }, // VkExtent2D fragmentSize;
1827 { m_data.combinerOp[0], m_data.combinerOp[1] }, // VkFragmentShadingRateCombinerOpKHR combinerOps[2];
1830 VkDynamicState dynamicState = VK_DYNAMIC_STATE_FRAGMENT_SHADING_RATE_KHR;
1831 const VkPipelineDynamicStateCreateInfo dynamicStateCreateInfo
1833 VK_STRUCTURE_TYPE_PIPELINE_DYNAMIC_STATE_CREATE_INFO, // VkStructureType sType;
1834 DE_NULL, // const void* pNext;
1835 (VkPipelineDynamicStateCreateFlags)0, // VkPipelineDynamicStateCreateFlags flags;
1836 m_data.useDynamicState ? 1u : 0u, // uint32_t dynamicStateCount;
1837 &dynamicState, // const VkDynamicState* pDynamicStates;
1839 vk::VkPipelineRenderingCreateInfoKHR* pDynamicRendering = (m_data.groupParams->useDynamicRendering ? &renderingCreateInfo : DE_NULL);
1841 // Enable depth/stencil writes, always passing
1842 VkPipelineDepthStencilStateCreateInfo depthStencilStateParams =
1844 VK_STRUCTURE_TYPE_PIPELINE_DEPTH_STENCIL_STATE_CREATE_INFO, // VkStructureType sType;
1845 DE_NULL, // const void* pNext;
1846 0u, // VkPipelineDepthStencilStateCreateFlags flags;
1847 VK_TRUE, // VkBool32 depthTestEnable;
1848 VK_TRUE, // VkBool32 depthWriteEnable;
1849 VK_COMPARE_OP_ALWAYS, // VkCompareOp depthCompareOp;
1850 VK_FALSE, // VkBool32 depthBoundsTestEnable;
1851 VK_TRUE, // VkBool32 stencilTestEnable;
1852 // VkStencilOpState front;
1854 VK_STENCIL_OP_REPLACE, // VkStencilOp failOp;
1855 VK_STENCIL_OP_REPLACE, // VkStencilOp passOp;
1856 VK_STENCIL_OP_REPLACE, // VkStencilOp depthFailOp;
1857 VK_COMPARE_OP_ALWAYS, // VkCompareOp compareOp;
1858 0u, // deUint32 compareMask;
1859 0xFFu, // deUint32 writeMask;
1860 0xFFu, // deUint32 reference;
1862 // VkStencilOpState back;
1864 VK_STENCIL_OP_REPLACE, // VkStencilOp failOp;
1865 VK_STENCIL_OP_REPLACE, // VkStencilOp passOp;
1866 VK_STENCIL_OP_REPLACE, // VkStencilOp depthFailOp;
1867 VK_COMPARE_OP_ALWAYS, // VkCompareOp compareOp;
1868 0u, // deUint32 compareMask;
1869 0xFFu, // deUint32 writeMask;
1870 0xFFu, // deUint32 reference;
1872 0.0f, // float minDepthBounds;
1873 0.0f, // float maxDepthBounds;
1876 const VkQueue queue = m_context.getUniversalQueue();
1877 Move<VkCommandPool> cmdPool = createCommandPool(vk, device, VK_COMMAND_POOL_CREATE_RESET_COMMAND_BUFFER_BIT, m_context.getUniversalQueueFamilyIndex());
1878 Move<VkCommandBuffer> cmdBuffer = allocateCommandBuffer(vk, device, *cmdPool, VK_COMMAND_BUFFER_LEVEL_PRIMARY);
1879 Move<VkCommandBuffer> secCmdBuffer;
1880 VkClearValue clearColor = makeClearValueColorU32(0, 0, 0, 0);
1881 VkClearValue clearDepthStencil = makeClearValueDepthStencil(0.0, 0);
1882 const VkExtent2D srTexelSize { srTexelWidth, srTexelHeight };
1884 std::vector<GraphicsPipelineWrapper> pipelines;
1885 pipelines.reserve(m_data.useDynamicState ? 1u : NUM_TRIANGLES);
1887 if (m_data.groupParams->useSecondaryCmdBuffer)
1889 secCmdBuffer = allocateCommandBuffer(vk, device, *cmdPool, VK_COMMAND_BUFFER_LEVEL_SECONDARY);
1891 // record secondary command buffer
1892 if (m_data.groupParams->secondaryCmdBufferCompletelyContainsDynamicRenderpass)
1894 beginSecondaryCmdBuffer(*secCmdBuffer, cbFormat, dsFormat, VK_RENDERING_CONTENTS_SECONDARY_COMMAND_BUFFERS_BIT);
1895 beginRender(*secCmdBuffer, *renderPass, *framebuffer, *srImageView, srLayout, srTexelSize,
1896 *cbImageView, *dsImageView, imagelessFB, clearColor, clearDepthStencil);
1899 beginSecondaryCmdBuffer(*secCmdBuffer, cbFormat, dsFormat);
1901 drawCommands(*secCmdBuffer, pipelines, viewports, scissors, *pipelineLayout, *renderPass,
1902 &vertexInputStateCreateInfo, &dynamicStateCreateInfo, &rasterizationStateCreateInfo,
1903 &depthStencilStateParams, &multisampleStateCreateInfo, &shadingRateStateCreateInfo,
1904 pDynamicRendering, *vertShader, *geomShader, *fragShader, *descriptorSet, **vertexBuffer);
1906 if (m_data.groupParams->secondaryCmdBufferCompletelyContainsDynamicRenderpass)
1907 endRender(*secCmdBuffer);
1909 endCommandBuffer(vk, *secCmdBuffer);
1911 // record primary command buffer
1912 beginCommandBuffer(vk, *cmdBuffer, 0u);
1914 preRenderCommands(*cmdBuffer, cbImage.get(), dsImage.get(), derivImage.get(), derivNumLevels, srImage.get(), srLayout,
1915 srFillBuffer.get(), numSRLayers, srWidth, srHeight, srFillBpp, clearColor, clearDepthStencil);
1916 if (!m_data.groupParams->secondaryCmdBufferCompletelyContainsDynamicRenderpass)
1917 beginRender(*cmdBuffer, *renderPass, *framebuffer, *srImageView, srLayout, srTexelSize,
1918 *cbImageView, *dsImageView, imagelessFB, clearColor, clearDepthStencil, VK_SUBPASS_CONTENTS_SECONDARY_COMMAND_BUFFERS);
1920 vk.cmdExecuteCommands(*cmdBuffer, 1u, &*secCmdBuffer);
1922 if (!m_data.groupParams->secondaryCmdBufferCompletelyContainsDynamicRenderpass)
1923 endRender(*cmdBuffer);
1927 beginCommandBuffer(vk, *cmdBuffer);
1928 preRenderCommands(*cmdBuffer, cbImage.get(), dsImage.get(), derivImage.get(), derivNumLevels, srImage.get(), srLayout,
1929 srFillBuffer.get(), numSRLayers, srWidth, srHeight, srFillBpp, clearColor, clearDepthStencil);
1930 beginRender(*cmdBuffer, *renderPass, *framebuffer, *srImageView, srLayout, srTexelSize,
1931 *cbImageView, *dsImageView, imagelessFB, clearColor, clearDepthStencil);
1932 drawCommands(*cmdBuffer, pipelines, viewports, scissors, *pipelineLayout, *renderPass,
1933 &vertexInputStateCreateInfo, &dynamicStateCreateInfo, &rasterizationStateCreateInfo,
1934 &depthStencilStateParams, &multisampleStateCreateInfo, &shadingRateStateCreateInfo,
1935 pDynamicRendering, *vertShader, *geomShader, *fragShader, *descriptorSet, **vertexBuffer);
1936 endRender(*cmdBuffer);
1939 VkMemoryBarrier memBarrier
1941 VK_STRUCTURE_TYPE_MEMORY_BARRIER,
1943 VK_ACCESS_SHADER_READ_BIT | VK_ACCESS_SHADER_WRITE_BIT | VK_ACCESS_COLOR_ATTACHMENT_WRITE_BIT | VK_ACCESS_DEPTH_STENCIL_ATTACHMENT_WRITE_BIT,
1944 VK_ACCESS_SHADER_READ_BIT | VK_ACCESS_SHADER_WRITE_BIT
1946 vk.cmdPipelineBarrier(*cmdBuffer, allPipelineStages, allPipelineStages, 0, 1, &memBarrier, 0, DE_NULL, 0, DE_NULL);
1948 vk.cmdBindDescriptorSets(*cmdBuffer, VK_PIPELINE_BIND_POINT_COMPUTE, *pipelineLayout, 0u, 1, &*descriptorSet, 0u, DE_NULL);
1949 vk.cmdBindPipeline(*cmdBuffer, VK_PIPELINE_BIND_POINT_COMPUTE, *computePipeline);
1951 // Copy color/depth/stencil buffers to buffer memory
1952 vk.cmdDispatch(*cmdBuffer, m_data.framebufferDim.width, m_data.framebufferDim.height, m_data.numColorLayers);
1954 memBarrier.srcAccessMask = VK_ACCESS_SHADER_WRITE_BIT;
1955 memBarrier.dstAccessMask = VK_ACCESS_HOST_READ_BIT;
1956 vk.cmdPipelineBarrier(*cmdBuffer, VK_PIPELINE_STAGE_COMPUTE_SHADER_BIT, VK_PIPELINE_STAGE_HOST_BIT,
1957 0, 1, &memBarrier, 0, DE_NULL, 0, DE_NULL);
1959 endCommandBuffer(vk, *cmdBuffer);
1961 submitCommandsAndWait(vk, device, queue, cmdBuffer.get());
1963 deUint32 *colorptr = (deUint32 *)colorOutputBuffer->getAllocation().getHostPtr();
1964 invalidateAlloc(vk, device, colorOutputBuffer->getAllocation());
1966 invalidateAlloc(vk, device, atomicBuffer->getAllocation());
1968 float *depthptr = DE_NULL;
1969 deUint32 *stencilptr = DE_NULL;
1971 if (m_data.useDepthStencil)
1973 depthptr = (float *)depthOutputBuffer->getAllocation().getHostPtr();
1974 invalidateAlloc(vk, device, depthOutputBuffer->getAllocation());
1976 stencilptr = (deUint32 *)stencilOutputBuffer->getAllocation().getHostPtr();
1977 invalidateAlloc(vk, device, stencilOutputBuffer->getAllocation());
1980 // Loop over all samples and validate the output
1981 for (deUint32 layer = 0; layer < m_data.numColorLayers && res == QP_TEST_RESULT_PASS; ++layer)
1983 for (deUint32 y = 0; y < m_data.framebufferDim.height && res == QP_TEST_RESULT_PASS; ++y)
1985 for (deUint32 x = 0; x < m_data.framebufferDim.width && res == QP_TEST_RESULT_PASS; ++x)
1987 for (deInt32 s = 0; s < m_data.samples && res == QP_TEST_RESULT_PASS; ++s)
1989 deUint32 *sample = &colorptr[4*(((layer * m_data.framebufferDim.height + y) * m_data.framebufferDim.width + x)*m_data.samples + s)];
1991 // If testing the rasterizer sample mask, if this sample is not set in the
1992 // mask then it shouldn't have written anything.
1993 if (m_data.useApiSampleMask && !(sampleMask & (1 << s)) && sample[2] != 0)
1995 log << tcu::TestLog::Message << std::hex << "sample written despite pSampleMask (" << x << "," << y << ",sample " << s << ")" << tcu::TestLog::EndMessage;
1996 res = QP_TEST_RESULT_FAIL;
2000 // The same isn't covered by any primitives, skip it
2004 // skip samples that have the same value as sample zero - it would be redundant to check them.
2007 deUint32 *sample0 = &colorptr[4*(((layer * m_data.framebufferDim.height + y) * m_data.framebufferDim.width + x)*m_data.samples + 0)];
2008 bool same = deMemCmp(sample, sample0, 16) == 0;
2010 if (m_data.fragDepth)
2012 float *dsample = &depthptr[((layer * m_data.framebufferDim.height + y) * m_data.framebufferDim.width + x)*m_data.samples + s];
2013 float *dsample0 = &depthptr[((layer * m_data.framebufferDim.height + y) * m_data.framebufferDim.width + x)*m_data.samples + 0];
2014 same = same && (*dsample == *dsample0);
2017 if (m_data.fragStencil)
2019 deUint32 *ssample = &stencilptr[((layer * m_data.framebufferDim.height + y) * m_data.framebufferDim.width + x)*m_data.samples + s];
2020 deUint32 *ssample0 = &stencilptr[((layer * m_data.framebufferDim.height + y) * m_data.framebufferDim.width + x)*m_data.samples + 0];
2021 same = same && (*ssample == *ssample0);
2028 // Fragment shader writes error codes to .w component.
2029 // All nonzero values are unconditionally failures
2032 if (sample[3] == ERROR_FRAGCOORD_CENTER)
2033 log << tcu::TestLog::Message << std::hex << "fragcoord test failed pixel (0x" << x << ",0x" << y << ",sample 0x" << s << ")" << tcu::TestLog::EndMessage;
2034 else if (sample[3] == ERROR_VTG_READBACK)
2035 log << tcu::TestLog::Message << std::hex << "vs/gs output readback test failed pixel (0x" << x << ",0x" << y << ",sample 0x" << s << ")" << tcu::TestLog::EndMessage;
2036 else if ((sample[3] & 0xFF) == ERROR_FRAGCOORD_DERIV)
2037 log << tcu::TestLog::Message << std::hex << "fragcoord derivative test failed pixel (0x" << x << ",0x" << y << ",sample 0x" << s << ")="
2038 "(0x" << ((sample[3] >> 8) & 0x3F) << ",0x" << ((sample[3] >> 14) & 0x3F) << "), expected="
2039 "(0x" << ((sample[3] >> 20) & 0x3F) << ",0x" << ((sample[3] >> 26) & 0x3F) << ")" << tcu::TestLog::EndMessage;
2040 else if ((sample[3] & 0xFF) == ERROR_FRAGCOORD_IMPLICIT_DERIV)
2041 log << tcu::TestLog::Message << std::hex << "implicit derivative test failed pixel (0x" << x << ",0x" << y << ",sample 0x" << s << ")="
2042 "(0x" << ((sample[3] >> 8) & 0x3F) << ",0x" << ((sample[3] >> 14) & 0x3F) << "), expected="
2043 "(0x" << ((sample[3] >> 20) & 0x3F) << ",0x" << ((sample[3] >> 26) & 0x3F) << ")" << tcu::TestLog::EndMessage;
2045 log << tcu::TestLog::Message << std::hex << "w coord unknown test failed pixel (0x" << x << ",0x" << y << ",sample 0x" << s << ")" << tcu::TestLog::EndMessage;
2046 res = QP_TEST_RESULT_FAIL;
2050 // x component of sample
2051 deUint32 rate = sample[0];
2053 deUint32 pixelsX = 1 << ((rate/4)&3);
2054 deUint32 pixelsY = 1 << (rate&3);
2057 deUint32 fragMinX = x & ~(pixelsX-1);
2058 deUint32 fragMinY = y & ~(pixelsY-1);
2059 deUint32 fragMaxX = fragMinX + pixelsX;
2060 deUint32 fragMaxY = fragMinY + pixelsY;
2062 // Clamp to FB dimension for odd sizes
2063 if (fragMaxX > m_data.framebufferDim.width)
2064 fragMaxX = m_data.framebufferDim.width;
2065 if (fragMaxY > m_data.framebufferDim.height)
2066 fragMaxY = m_data.framebufferDim.height;
2068 // z component of sample
2069 deUint32 primID = sample[2] >> 24;
2070 deUint32 atomVal = sample[2] & 0xFFFFFF;
2072 // Compute pipeline and primitive rate from primitive ID, and attachment
2073 // rate from the x/y coordinate
2074 deInt32 pipelineRate = PrimIDToPipelineShadingRate(primID);
2075 deInt32 primitiveRate = m_data.shaderWritesRate ? PrimIDToPrimitiveShadingRate(primID) : 0;
2077 deInt32 attachmentLayer = (m_data.srLayered && modeIdx == ATTACHMENT_MODE_2DARRAY) ? layer : 0;
2078 deInt32 attachmentRate = m_data.useAttachment() ? fillPtr[srFillBpp*((attachmentLayer * srHeight + (y / srTexelHeight)) * srWidth + (x / srTexelWidth))] : 0;
2080 // Get mask of allowed shading rates
2081 deInt32 expectedMasks = Simulate(pipelineRate, primitiveRate, attachmentRate);
2083 if (!(expectedMasks & (1 << rate)))
2085 log << tcu::TestLog::Message << std::hex << "unexpected shading rate. failed pixel (0x" << x << ",0x" << y << ",sample 0x" << s << ") "
2086 "result rate 0x" << rate << " mask of expected rates 0x" << expectedMasks <<
2087 " pipelineRate=0x" << pipelineRate << " primitiveRate=0x" << primitiveRate << " attachmentRate =0x" << attachmentRate << tcu::TestLog::EndMessage;
2088 res = QP_TEST_RESULT_FAIL;
2091 // Check that not all fragments are downgraded to 1x1
2092 if (rate == 0 && expectedMasks != 1)
2093 numUnexpected1x1Samples++;
2096 // Check that gl_FragDepth = primID / NUM_TRIANGLES
2097 if (m_data.fragDepth)
2099 float *dsample = &depthptr[((layer * m_data.framebufferDim.height + y) * m_data.framebufferDim.width + x)*m_data.samples + s];
2100 float expected = (float)primID / NUM_TRIANGLES;
2101 if (fabs(*dsample - expected) > 0.01)
2103 log << tcu::TestLog::Message << std::hex << "depth write failed pixel (0x" << x << ",0x" << y << ",sample 0x" << s << ")=" << *dsample << " expected " << expected << tcu::TestLog::EndMessage;
2104 res = QP_TEST_RESULT_FAIL;
2109 // Check that stencil value = primID
2110 if (m_data.fragStencil)
2112 deUint32 *ssample = &stencilptr[((layer * m_data.framebufferDim.height + y) * m_data.framebufferDim.width + x)*m_data.samples + s];
2113 if (*ssample != primID)
2115 log << tcu::TestLog::Message << std::hex << "stencil write failed pixel (0x" << x << ",0x" << y << ",sample 0x" << s << ")=" << *ssample << " expected " << primID << tcu::TestLog::EndMessage;
2116 res = QP_TEST_RESULT_FAIL;
2121 // Check that primitives are in the right viewport/scissor
2122 if (m_data.multiViewport)
2124 VkRect2D *scissor = &scissors[primID & 1];
2125 if ((int)x < scissor->offset.x || (int)x >= (int)(scissor->offset.x + scissor->extent.width) ||
2126 (int)y < scissor->offset.y || (int)y >= (int)(scissor->offset.y + scissor->extent.height))
2128 log << tcu::TestLog::Message << std::hex << "primitive found outside of expected viewport (0x" << x << ",0x" << y << ",sample 0x" << s << ") primID=" << primID << tcu::TestLog::EndMessage;
2129 res = QP_TEST_RESULT_FAIL;
2134 // Check that primitives are in the right layer
2135 if (m_data.colorLayered)
2137 if (layer != ((primID & 2)>>1))
2139 log << tcu::TestLog::Message << std::hex << "primitive found in wrong layer (0x" << x << ",0x" << y << ",sample 0x" << s << ") primID=" << primID << " layer=" << layer << tcu::TestLog::EndMessage;
2140 res = QP_TEST_RESULT_FAIL;
2145 // Check that multiview broadcasts the same primitive to both layers
2146 if (m_data.multiView)
2148 deUint32 otherLayer = layer^1;
2149 deUint32 *othersample = &colorptr[4*(((otherLayer * m_data.framebufferDim.height + y) * m_data.framebufferDim.width + x)*m_data.samples + s)];
2150 deUint32 otherPrimID = othersample[2] >> 24;
2151 if (primID != otherPrimID)
2153 log << tcu::TestLog::Message << std::hex << "multiview primitive mismatch (0x" << x << ",0x" << y << ",sample 0x" << s << ") primID=" << primID << " otherPrimID=" << otherPrimID << tcu::TestLog::EndMessage;
2154 res = QP_TEST_RESULT_FAIL;
2159 // Loop over all samples in the same fragment
2160 for (deUint32 fx = fragMinX; fx < fragMaxX; ++fx)
2162 for (deUint32 fy = fragMinY; fy < fragMaxY; ++fy)
2164 for (deInt32 fs = 0; fs < m_data.samples; ++fs)
2166 deUint32 *fsample = &colorptr[4*(((layer * m_data.framebufferDim.height + fy) * m_data.framebufferDim.width + fx)*m_data.samples + fs)];
2167 deUint32 frate = fsample[0];
2168 deUint32 fprimID = fsample[2] >> 24;
2169 deUint32 fatomVal = fsample[2] & 0xFFFFFF;
2171 // If we write out the sample mask value, check that the samples in the
2172 // mask must not be uncovered, and that samples not in the mask must not
2173 // be covered by this primitive
2174 if (m_data.useSampleMaskIn)
2176 int p = pixelsX * pixelsY - ((fx - fragMinX) + pixelsX * (fy - fragMinY)) - 1;
2177 int sampleIdx = fs + m_data.samples * p;
2179 if ((sample[1] & (1 << sampleIdx)) && fsample[2] == 0)
2181 log << tcu::TestLog::Message << std::hex << "sample set in sampleMask but not written (0x" << fx << ",0x" << fy << ",sample 0x" << fs << ")" << tcu::TestLog::EndMessage;
2182 res = QP_TEST_RESULT_FAIL;
2185 if (!(sample[1] & (1 << sampleIdx)) && fsample[2] != 0 && fprimID == primID)
2187 log << tcu::TestLog::Message << std::hex << "sample not set in sampleMask but written with same primID (0x" << fx << ",0x" << fy << ",sample 0x" << fs << ")" << tcu::TestLog::EndMessage;
2188 res = QP_TEST_RESULT_FAIL;
2193 // If conservative raster is enabled, or custom sample locations all at the center, check that
2194 // samples in the same pixel must be covered.
2195 if (m_data.conservativeEnable ||
2196 (m_data.sampleLocations && m_context.getFragmentShadingRateProperties().fragmentShadingRateWithCustomSampleLocations))
2198 // If it's in the same pixel, expect it to be fully covered.
2199 if (fx == x && fy == y && fsample[2] == 0)
2201 log << tcu::TestLog::Message << std::hex << "pixel not fully covered (0x" << fx << ",0x" << fy << ",sample 0x" << fs << ")" << tcu::TestLog::EndMessage;
2202 res = QP_TEST_RESULT_FAIL;
2207 if (fsample[2] == 0)
2210 // If the primitive matches this sample, then it must have the same rate and
2212 if (fprimID == primID)
2214 if (rate != frate || (atomVal != fatomVal && !(m_data.sampleShadingEnable || m_data.sampleShadingInput)))
2216 log << tcu::TestLog::Message << std::hex << "failed pixel (0x" << x << ",0x" << y << ",sample " << s << ")=0x" << ((primID<<24)|atomVal) <<
2217 " compared to (0x" << fx << ",0x" << fy << ",sample " << fs << ")=0x" << ((fprimID<<24)|fatomVal) <<
2218 " pipelineRate=0x" << pipelineRate << " primitiveRate=0x" << primitiveRate << " attachmentRate =0x" << attachmentRate <<
2219 tcu::TestLog::EndMessage;
2220 res = QP_TEST_RESULT_FAIL;
2230 if (res == QP_TEST_RESULT_FAIL)
2234 // All samples were coerced to 1x1, unexpected
2235 if (res == QP_TEST_RESULT_PASS &&
2236 numTotalSamples != 0 &&
2237 numUnexpected1x1Samples == numTotalSamples &&
2238 numTotalSamples > 16)
2240 log << tcu::TestLog::Message << std::hex << "Quality warning - all fragments used 1x1" << tcu::TestLog::EndMessage;
2241 res = QP_TEST_RESULT_QUALITY_WARNING;
2244 return tcu::TestStatus(res, qpGetTestResultName(res));
2247 void FSRTestInstance::beginSecondaryCmdBuffer(VkCommandBuffer cmdBuffer, VkFormat cbFormat, VkFormat dsFormat, VkRenderingFlagsKHR renderingFlags) const
2249 VkCommandBufferInheritanceRenderingInfoKHR inheritanceRenderingInfo
2251 VK_STRUCTURE_TYPE_COMMAND_BUFFER_INHERITANCE_RENDERING_INFO_KHR, // VkStructureType sType;
2252 DE_NULL, // const void* pNext;
2253 renderingFlags, // VkRenderingFlagsKHR flags;
2254 m_data.multiView ? 0x3 : 0u, // uint32_t viewMask;
2255 1u, // uint32_t colorAttachmentCount;
2256 &cbFormat, // const VkFormat* pColorAttachmentFormats;
2257 dsFormat, // VkFormat depthAttachmentFormat;
2258 dsFormat, // VkFormat stencilAttachmentFormat;
2259 m_data.samples, // VkSampleCountFlagBits rasterizationSamples;
2261 const VkCommandBufferInheritanceInfo bufferInheritanceInfo = initVulkanStructure(&inheritanceRenderingInfo);
2263 VkCommandBufferUsageFlags usageFlags = VK_COMMAND_BUFFER_USAGE_ONE_TIME_SUBMIT_BIT;
2264 if (!m_data.groupParams->secondaryCmdBufferCompletelyContainsDynamicRenderpass)
2265 usageFlags |= VK_COMMAND_BUFFER_USAGE_RENDER_PASS_CONTINUE_BIT;
2267 const VkCommandBufferBeginInfo commandBufBeginParams
2269 VK_STRUCTURE_TYPE_COMMAND_BUFFER_BEGIN_INFO, // VkStructureType sType;
2270 DE_NULL, // const void* pNext;
2271 usageFlags, // VkCommandBufferUsageFlags flags;
2272 &bufferInheritanceInfo
2275 const DeviceInterface& vk = m_context.getDeviceInterface();
2276 VK_CHECK(vk.beginCommandBuffer(cmdBuffer, &commandBufBeginParams));
2279 void FSRTestInstance::preRenderCommands(VkCommandBuffer cmdBuffer, ImageWithMemory* cbImage, ImageWithMemory* dsImage,
2280 ImageWithMemory* derivImage, deUint32 derivNumLevels,
2281 ImageWithMemory* srImage, VkImageLayout srLayout, BufferWithMemory* srFillBuffer,
2282 deUint32 numSRLayers, deUint32 srWidth, deUint32 srHeight, deUint32 srFillBpp,
2283 const VkClearValue& clearColor, const VkClearValue& clearDepthStencil)
2285 const DeviceInterface& vk = m_context.getDeviceInterface();
2286 const VkDevice device = m_context.getDevice();
2288 VkFlags allPipelineStages = VK_PIPELINE_STAGE_VERTEX_SHADER_BIT |
2289 VK_PIPELINE_STAGE_FRAGMENT_SHADER_BIT |
2290 VK_PIPELINE_STAGE_COLOR_ATTACHMENT_OUTPUT_BIT |
2291 VK_PIPELINE_STAGE_EARLY_FRAGMENT_TESTS_BIT |
2292 VK_PIPELINE_STAGE_LATE_FRAGMENT_TESTS_BIT |
2293 VK_PIPELINE_STAGE_COMPUTE_SHADER_BIT |
2294 VK_PIPELINE_STAGE_SHADING_RATE_IMAGE_BIT_NV;
2296 if (m_data.geometryShader)
2297 allPipelineStages |= VK_PIPELINE_STAGE_GEOMETRY_SHADER_BIT;
2299 VkImageMemoryBarrier imageBarrier
2301 VK_STRUCTURE_TYPE_IMAGE_MEMORY_BARRIER, // VkStructureType sType
2302 DE_NULL, // const void* pNext
2303 0u, // VkAccessFlags srcAccessMask
2304 VK_ACCESS_TRANSFER_WRITE_BIT, // VkAccessFlags dstAccessMask
2305 VK_IMAGE_LAYOUT_UNDEFINED, // VkImageLayout oldLayout
2306 VK_IMAGE_LAYOUT_GENERAL, // VkImageLayout newLayout
2307 VK_QUEUE_FAMILY_IGNORED, // uint32_t srcQueueFamilyIndex
2308 VK_QUEUE_FAMILY_IGNORED, // uint32_t dstQueueFamilyIndex
2309 cbImage->get(), // VkImage image
2311 VK_IMAGE_ASPECT_COLOR_BIT, // VkImageAspectFlags aspectMask
2312 0u, // uint32_t baseMipLevel
2313 VK_REMAINING_MIP_LEVELS, // uint32_t mipLevels,
2314 0u, // uint32_t baseArray
2315 VK_REMAINING_ARRAY_LAYERS, // uint32_t arraySize
2319 vk.cmdPipelineBarrier(cmdBuffer, VK_PIPELINE_STAGE_TOP_OF_PIPE_BIT, VK_PIPELINE_STAGE_TRANSFER_BIT,
2320 (VkDependencyFlags)0,
2321 0, (const VkMemoryBarrier*)DE_NULL,
2322 0, (const VkBufferMemoryBarrier*)DE_NULL,
2325 imageBarrier.image = derivImage->get();
2326 imageBarrier.newLayout = VK_IMAGE_LAYOUT_GENERAL;
2328 vk.cmdPipelineBarrier(cmdBuffer, VK_PIPELINE_STAGE_TOP_OF_PIPE_BIT, VK_PIPELINE_STAGE_TRANSFER_BIT,
2329 (VkDependencyFlags)0,
2330 0, (const VkMemoryBarrier*)DE_NULL,
2331 0, (const VkBufferMemoryBarrier*)DE_NULL,
2334 // Clear level to 1<<level
2335 for (deUint32 i = 0; i < derivNumLevels; ++i)
2337 VkImageSubresourceRange range = makeImageSubresourceRange(VK_IMAGE_ASPECT_COLOR_BIT, i, 1u, 0u, 1u);
2338 VkClearValue clearLevelColor = makeClearValueColorU32(1<<i,0,0,0);
2339 vk.cmdClearColorImage(cmdBuffer, derivImage->get(), VK_IMAGE_LAYOUT_GENERAL, &clearLevelColor.color, 1, &range);
2342 // Clear color buffer to transparent black
2344 VkImageSubresourceRange range = makeImageSubresourceRange(VK_IMAGE_ASPECT_COLOR_BIT, 0u, 1u, 0u, VK_REMAINING_ARRAY_LAYERS);
2345 vk.cmdClearColorImage(cmdBuffer, cbImage->get(), VK_IMAGE_LAYOUT_GENERAL, &clearColor.color, 1, &range);
2348 // Clear depth and stencil
2349 if (m_data.useDepthStencil)
2351 VkImageSubresourceRange range = makeImageSubresourceRange(VK_IMAGE_ASPECT_DEPTH_BIT | VK_IMAGE_ASPECT_STENCIL_BIT, 0u, 1u, 0u, VK_REMAINING_ARRAY_LAYERS);
2352 VkImageMemoryBarrier dsBarrier = imageBarrier;
2353 dsBarrier.image = dsImage->get();
2354 dsBarrier.newLayout = VK_IMAGE_LAYOUT_GENERAL;
2355 dsBarrier.subresourceRange = range;
2356 vk.cmdPipelineBarrier(cmdBuffer, VK_PIPELINE_STAGE_TOP_OF_PIPE_BIT, VK_PIPELINE_STAGE_TRANSFER_BIT,
2357 0u, // dependencyFlags
2361 vk.cmdClearDepthStencilImage(cmdBuffer, dsImage->get(), VK_IMAGE_LAYOUT_GENERAL, &clearDepthStencil.depthStencil, 1, &range);
2364 // Initialize shading rate image with varying values
2365 if (m_data.useAttachment())
2367 imageBarrier.image = srImage->get();
2368 imageBarrier.newLayout = VK_IMAGE_LAYOUT_GENERAL;
2370 vk.cmdPipelineBarrier(cmdBuffer, VK_PIPELINE_STAGE_BOTTOM_OF_PIPE_BIT, VK_PIPELINE_STAGE_TRANSFER_BIT,
2371 (VkDependencyFlags)0,
2372 0, (const VkMemoryBarrier*)DE_NULL,
2373 0, (const VkBufferMemoryBarrier*)DE_NULL,
2376 deUint8 *fillPtr = (deUint8 *)srFillBuffer->getAllocation().getHostPtr();
2377 for (deUint32 layer = 0; layer < numSRLayers; ++layer)
2379 for (deUint32 x = 0; x < srWidth; ++x)
2381 for (deUint32 y = 0; y < srHeight; ++y)
2383 deUint32 idx = (layer*srHeight + y)*srWidth + x;
2384 deUint8 val = (deUint8)SanitizeRate(idx & 0xF);
2385 // actual shading rate is always in the LSBs of the first byte of a texel
2386 fillPtr[srFillBpp*idx] = val;
2390 flushAlloc(vk, device, srFillBuffer->getAllocation());
2392 const VkBufferImageCopy copyRegion
2394 0u, // VkDeviceSize bufferOffset;
2395 0u, // deUint32 bufferRowLength;
2396 0u, // deUint32 bufferImageHeight;
2398 VK_IMAGE_ASPECT_COLOR_BIT, // VkImageAspectFlags aspect;
2399 0u, // deUint32 mipLevel;
2400 0u, // deUint32 baseArrayLayer;
2401 numSRLayers, // deUint32 layerCount;
2402 }, // VkImageSubresourceLayers imageSubresource;
2403 { 0, 0, 0 }, // VkOffset3D imageOffset;
2404 { srWidth, srHeight, 1 }, // VkExtent3D imageExtent;
2407 vk.cmdCopyBufferToImage(cmdBuffer, srFillBuffer->get(), srImage->get(), VK_IMAGE_LAYOUT_GENERAL, 1, ©Region);
2409 imageBarrier.oldLayout = VK_IMAGE_LAYOUT_GENERAL;
2410 imageBarrier.newLayout = srLayout;
2412 vk.cmdPipelineBarrier(cmdBuffer, VK_PIPELINE_STAGE_BOTTOM_OF_PIPE_BIT, VK_PIPELINE_STAGE_TRANSFER_BIT,
2413 (VkDependencyFlags)0,
2414 0, (const VkMemoryBarrier*)DE_NULL,
2415 0, (const VkBufferMemoryBarrier*)DE_NULL,
2419 VkMemoryBarrier memBarrier
2421 VK_STRUCTURE_TYPE_MEMORY_BARRIER, // sType
2423 0u, // srcAccessMask
2424 0u, // dstAccessMask
2427 memBarrier.srcAccessMask = VK_ACCESS_TRANSFER_WRITE_BIT;
2428 memBarrier.dstAccessMask = VK_ACCESS_SHADER_READ_BIT | VK_ACCESS_SHADER_WRITE_BIT | VK_ACCESS_FRAGMENT_SHADING_RATE_ATTACHMENT_READ_BIT_KHR;
2429 vk.cmdPipelineBarrier(cmdBuffer, VK_PIPELINE_STAGE_TRANSFER_BIT, allPipelineStages,
2430 0, 1, &memBarrier, 0, DE_NULL, 0, DE_NULL);
2433 void FSRTestInstance::beginRender(VkCommandBuffer cmdBuffer, VkRenderPass renderPass, VkFramebuffer framebuffer,
2434 VkImageView srImageView, VkImageLayout srImageLayout, const VkExtent2D& srTexelSize,
2435 VkImageView cbImageView, VkImageView dsImageView, bool imagelessFB,
2436 const VkClearValue& clearColor, const VkClearValue& clearDepthStencil,
2437 VkRenderingFlagsKHR renderingFlags) const
2439 const DeviceInterface& vk = m_context.getDeviceInterface();
2440 VkRect2D renderArea = makeRect2D(m_data.framebufferDim.width, m_data.framebufferDim.height);
2442 if (m_data.groupParams->useDynamicRendering)
2444 VkRenderingFragmentShadingRateAttachmentInfoKHR shadingRateAttachmentInfo
2446 VK_STRUCTURE_TYPE_RENDERING_FRAGMENT_SHADING_RATE_ATTACHMENT_INFO_KHR, // VkStructureType sType;
2447 DE_NULL, // const void* pNext;
2448 srImageView, // VkImageView imageView;
2449 srImageLayout, // VkImageLayout imageLayout;
2450 srTexelSize // VkExtent2D shadingRateAttachmentTexelSize;
2453 VkRenderingAttachmentInfoKHR colorAttachment
2455 vk::VK_STRUCTURE_TYPE_RENDERING_ATTACHMENT_INFO_KHR, // VkStructureType sType;
2456 DE_NULL, // const void* pNext;
2457 cbImageView, // VkImageView imageView;
2458 VK_IMAGE_LAYOUT_GENERAL, // VkImageLayout imageLayout;
2459 VK_RESOLVE_MODE_NONE, // VkResolveModeFlagBits resolveMode;
2460 DE_NULL, // VkImageView resolveImageView;
2461 VK_IMAGE_LAYOUT_UNDEFINED, // VkImageLayout resolveImageLayout;
2462 VK_ATTACHMENT_LOAD_OP_LOAD, // VkAttachmentLoadOp loadOp;
2463 VK_ATTACHMENT_STORE_OP_STORE, // VkAttachmentStoreOp storeOp;
2464 clearColor // VkClearValue clearValue;
2467 std::vector<VkRenderingAttachmentInfoKHR> depthStencilAttachments(2,
2469 VK_STRUCTURE_TYPE_RENDERING_ATTACHMENT_INFO_KHR, // VkStructureType sType;
2470 DE_NULL, // const void* pNext;
2471 dsImageView, // VkImageView imageView;
2472 VK_IMAGE_LAYOUT_GENERAL, // VkImageLayout imageLayout;
2473 VK_RESOLVE_MODE_NONE, // VkResolveModeFlagBits resolveMode;
2474 DE_NULL, // VkImageView resolveImageView;
2475 VK_IMAGE_LAYOUT_UNDEFINED, // VkImageLayout resolveImageLayout;
2476 VK_ATTACHMENT_LOAD_OP_LOAD, // VkAttachmentLoadOp loadOp;
2477 VK_ATTACHMENT_STORE_OP_STORE, // VkAttachmentStoreOp storeOp;
2478 clearDepthStencil // VkClearValue clearValue;
2481 vk::VkRenderingInfoKHR renderingInfo
2483 vk::VK_STRUCTURE_TYPE_RENDERING_INFO_KHR,
2484 m_data.useAttachment() ? &shadingRateAttachmentInfo : DE_NULL,
2485 renderingFlags, // VkRenderingFlagsKHR flags;
2486 renderArea, // VkRect2D renderArea;
2487 m_data.multiView ? 1 : m_data.numColorLayers, // deUint32 layerCount;
2488 m_data.multiView ? 0x3 : 0u, // deUint32 viewMask;
2489 1u, // deUint32 colorAttachmentCount;
2490 &colorAttachment, // const VkRenderingAttachmentInfoKHR* pColorAttachments;
2491 m_data.useDepthStencil ? &depthStencilAttachments[0] : DE_NULL, // const VkRenderingAttachmentInfoKHR* pDepthAttachment;
2492 m_data.useDepthStencil ? &depthStencilAttachments[1] : DE_NULL, // const VkRenderingAttachmentInfoKHR* pStencilAttachment;
2495 vk.cmdBeginRendering(cmdBuffer, &renderingInfo);
2499 std::vector<VkImageView> attachments = { cbImageView };
2500 if (m_data.useAttachment())
2501 attachments.push_back(srImageView);
2502 if (m_data.useDepthStencil)
2503 attachments.push_back(dsImageView);
2505 const VkRenderPassAttachmentBeginInfo renderPassAttachmentBeginInfo
2507 VK_STRUCTURE_TYPE_RENDER_PASS_ATTACHMENT_BEGIN_INFO, // VkStructureType sType;
2508 DE_NULL, // const void* pNext;
2509 (deUint32)attachments.size(), // deUint32 attachmentCount;
2510 &attachments[0] // const VkImageView* pAttachments;
2513 beginRenderPass(vk, cmdBuffer, renderPass, framebuffer, renderArea,
2514 0, DE_NULL, VK_SUBPASS_CONTENTS_INLINE, imagelessFB ? &renderPassAttachmentBeginInfo : DE_NULL);
2518 void FSRTestInstance::drawCommands(VkCommandBuffer cmdBuffer,
2519 std::vector<GraphicsPipelineWrapper>& pipelines,
2520 const std::vector<VkViewport>& viewports,
2521 const std::vector<VkRect2D>& scissors,
2522 const VkPipelineLayout pipelineLayout,
2523 const VkRenderPass renderPass,
2524 const VkPipelineVertexInputStateCreateInfo* vertexInputState,
2525 const VkPipelineDynamicStateCreateInfo* dynamicState,
2526 const VkPipelineRasterizationStateCreateInfo* rasterizationState,
2527 const VkPipelineDepthStencilStateCreateInfo* depthStencilState,
2528 const VkPipelineMultisampleStateCreateInfo* multisampleState,
2529 VkPipelineFragmentShadingRateStateCreateInfoKHR* shadingRateState,
2530 VkPipelineRenderingCreateInfoKHR* dynamicRendering,
2531 const VkShaderModule vertShader,
2532 const VkShaderModule geomShader,
2533 const VkShaderModule fragShader,
2534 VkDescriptorSet descriptorSet,
2535 VkBuffer vertexBuffer)
2537 const DeviceInterface& vk = m_context.getDeviceInterface();
2538 const VkDevice device = m_context.getDevice();
2540 VkFlags allShaderStages = VK_SHADER_STAGE_VERTEX_BIT | VK_SHADER_STAGE_FRAGMENT_BIT | VK_SHADER_STAGE_COMPUTE_BIT;
2541 if (m_data.geometryShader)
2542 allShaderStages |= VK_SHADER_STAGE_GEOMETRY_BIT;
2544 VkPipelineCreateFlags pipelineCreateFlags = (VkPipelineCreateFlags)0;
2545 if (m_data.groupParams->useDynamicRendering)
2546 pipelineCreateFlags |= VK_PIPELINE_CREATE_RENDERING_FRAGMENT_SHADING_RATE_ATTACHMENT_BIT_KHR;
2548 vk.cmdBindDescriptorSets(cmdBuffer, VK_PIPELINE_BIND_POINT_GRAPHICS, pipelineLayout, 0, 1, &descriptorSet, 0, DE_NULL);
2550 // If using dynamic state, create a single graphics pipeline and bind it
2551 if (m_data.useDynamicState)
2553 pipelines.emplace_back(vk, device, m_data.groupParams->pipelineConstructionType, pipelineCreateFlags);
2555 .setDefaultColorBlendState()
2556 .setDynamicState(dynamicState)
2557 .setupVertexInputStete(vertexInputState)
2558 .setupPreRasterizationShaderState(viewports,
2570 .setupFragmentShaderState(pipelineLayout,
2577 .setupFragmentOutputState(renderPass, 0u, DE_NULL, multisampleState)
2578 .setMonolithicPipelineLayout(pipelineLayout)
2581 vk.cmdBindPipeline(cmdBuffer, VK_PIPELINE_BIND_POINT_GRAPHICS, pipelines.back().getPipeline());
2584 for (deInt32 i = 0; i < NUM_TRIANGLES; ++i)
2586 // Bind vertex attributes pointing to the next triangle
2587 VkDeviceSize vertexBufferOffset = i * 3 * 2 * sizeof(float);
2588 vk.cmdBindVertexBuffers(cmdBuffer, 0, 1, &vertexBuffer, &vertexBufferOffset);
2590 // Put primitive shading rate in a push constant
2591 deInt32 shadingRatePC = PrimIDToPrimitiveShadingRate(i);
2592 vk.cmdPushConstants(cmdBuffer, pipelineLayout, allShaderStages, 0, sizeof(shadingRatePC), &shadingRatePC);
2594 if (m_data.useDynamicState)
2596 VkExtent2D fragmentSize = ShadingRateEnumToExtent(PrimIDToPipelineShadingRate(i));
2597 vk.cmdSetFragmentShadingRateKHR(cmdBuffer, &fragmentSize, m_data.combinerOp);
2601 // Create a new pipeline with the desired pipeline shading rate
2602 shadingRateState->fragmentSize = ShadingRateEnumToExtent(PrimIDToPipelineShadingRate(i));
2604 pipelines.emplace_back(vk, device, m_data.groupParams->pipelineConstructionType, pipelineCreateFlags);
2606 .setDefaultColorBlendState()
2607 .setDynamicState(dynamicState)
2608 .setupVertexInputStete(vertexInputState)
2609 .setupPreRasterizationShaderState(viewports,
2621 .setupFragmentShaderState(pipelineLayout,
2628 .setupFragmentOutputState(renderPass, 0u, DE_NULL, multisampleState)
2629 .setMonolithicPipelineLayout(pipelineLayout)
2632 vk.cmdBindPipeline(cmdBuffer, VK_PIPELINE_BIND_POINT_GRAPHICS, pipelines.back().getPipeline());
2635 // Draw one triangle, with "primitive ID" in gl_InstanceIndex
2636 vk.cmdDraw(cmdBuffer, 3u, 1, 0u, i);
2640 void FSRTestInstance::endRender(VkCommandBuffer cmdBuffer) const
2642 const DeviceInterface& vk = m_context.getDeviceInterface();
2643 if (m_data.groupParams->useDynamicRendering)
2644 endRendering(vk, cmdBuffer);
2646 endRenderPass(vk, cmdBuffer);
2651 void createBasicTests (tcu::TestContext& testCtx, tcu::TestCaseGroup* parentGroup, SharedGroupParams groupParams)
2657 const char* description;
2664 const char* description;
2669 AttachmentUsage usage;
2671 const char* description;
2672 } TestGroupUsageCase;
2674 TestGroupCase groupCases[] =
2676 { 0, "basic", "basic tests" },
2677 { 1, "apisamplemask", "use pSampleMask" },
2678 { 2, "samplemaskin", "use gl_SampleMaskIn" },
2679 { 3, "conservativeunder", "conservative underestimation" },
2680 { 4, "conservativeover", "conservative overestimation" },
2681 { 5, "fragdepth", "depth shader output" },
2682 { 6, "fragstencil", "stencil shader output" },
2683 { 7, "multiviewport", "multiple viewports and gl_ViewportIndex" },
2684 { 8, "colorlayered", "multiple layer color, single layer shading rate" },
2685 { 9, "srlayered", "multiple layer color, multiple layers shading rate" },
2686 { 10, "multiview", "multiview" },
2687 { 11, "multiviewsrlayered", "multiview and multilayer shading rate" },
2688 { 12, "multiviewcorrelation", "multiview with correlation mask" },
2689 { 13, "interlock", "fragment shader interlock" },
2690 { 14, "samplelocations", "custom sample locations" },
2691 { 15, "sampleshadingenable", "enable sample shading in createinfo" },
2692 { 16, "sampleshadinginput", "enable sample shading by using gl_SampleID" },
2695 TestGroupCase dynCases[] =
2697 { 1, "dynamic", "uses dynamic shading rate state" },
2698 { 0, "static", "uses static shading rate state" },
2701 TestGroupUsageCase attCases[] =
2703 { AttachmentUsage::NO_ATTACHMENT, "noattachment", "no shading rate attachment" },
2704 { AttachmentUsage::WITH_ATTACHMENT, "attachment", "has shading rate attachment" },
2705 { AttachmentUsage::NO_ATTACHMENT_PTR, "noattachmentptr", "no shading rate attachment pointer" },
2708 TestGroupCase shdCases[] =
2710 { 0, "noshaderrate", "shader doesn't write rate" },
2711 { 1, "shaderrate", "shader writes rate" },
2714 TestGroupCase combCases[] =
2716 { VK_FRAGMENT_SHADING_RATE_COMBINER_OP_KEEP_KHR, "keep", "keep" },
2717 { VK_FRAGMENT_SHADING_RATE_COMBINER_OP_REPLACE_KHR, "replace", "replace" },
2718 { VK_FRAGMENT_SHADING_RATE_COMBINER_OP_MIN_KHR, "min", "min" },
2719 { VK_FRAGMENT_SHADING_RATE_COMBINER_OP_MAX_KHR, "max", "max" },
2720 { VK_FRAGMENT_SHADING_RATE_COMBINER_OP_MUL_KHR, "mul", "mul" },
2723 TestGroupCase2D extentCases[] =
2725 { {1, 1}, "1x1", "1x1" },
2726 { {4, 4}, "4x4", "4x4" },
2727 { {33, 35}, "33x35", "33x35" },
2728 { {151, 431}, "151x431", "151x431" },
2729 { {256, 256}, "256x256", "256x256" },
2732 TestGroupCase sampCases[] =
2734 { VK_SAMPLE_COUNT_1_BIT, "samples1", "1 raster sample" },
2735 { VK_SAMPLE_COUNT_2_BIT, "samples2", "2 raster samples" },
2736 { VK_SAMPLE_COUNT_4_BIT, "samples4", "4 raster samples" },
2737 { VK_SAMPLE_COUNT_8_BIT, "samples8", "8 raster samples" },
2738 { VK_SAMPLE_COUNT_16_BIT, "samples16", "16 raster samples" },
2741 TestGroupCase geomCases[] =
2743 { 0, "vs", "vertex shader only" },
2744 { 1, "gs", "vertex and geometry shader" },
2749 for (int groupNdx = 0; groupNdx < DE_LENGTH_OF_ARRAY(groupCases); groupNdx++)
2751 if (groupParams->useDynamicRendering && groupNdx == 12)
2754 if (groupParams->pipelineConstructionType != PIPELINE_CONSTRUCTION_TYPE_MONOLITHIC)
2756 // for graphics pipeline library we need to repeat only selected groups
2757 if (std::set<int> { 2, 3, 4, 10, 11, 12, 13, 14, 15 }.count(groupNdx) == 0)
2761 de::MovePtr<tcu::TestCaseGroup> group(new tcu::TestCaseGroup(testCtx, groupCases[groupNdx].name, groupCases[groupNdx].description));
2762 for (int dynNdx = 0; dynNdx < DE_LENGTH_OF_ARRAY(dynCases); dynNdx++)
2764 // reduce number of tests for dynamic rendering cases where secondary command buffer is used
2765 if (groupParams->useSecondaryCmdBuffer && (dynNdx != 0))
2768 de::MovePtr<tcu::TestCaseGroup> dynGroup(new tcu::TestCaseGroup(testCtx, dynCases[dynNdx].name, dynCases[dynNdx].description));
2769 for (int attNdx = 0; attNdx < DE_LENGTH_OF_ARRAY(attCases); attNdx++)
2771 if (groupParams->useDynamicRendering && attCases[attNdx].usage == AttachmentUsage::NO_ATTACHMENT_PTR)
2774 de::MovePtr<tcu::TestCaseGroup> attGroup(new tcu::TestCaseGroup(testCtx, attCases[attNdx].name, attCases[attNdx].description));
2775 for (int shdNdx = 0; shdNdx < DE_LENGTH_OF_ARRAY(shdCases); shdNdx++)
2777 de::MovePtr<tcu::TestCaseGroup> shdGroup(new tcu::TestCaseGroup(testCtx, shdCases[shdNdx].name, shdCases[shdNdx].description));
2778 for (int cmb0Ndx = 0; cmb0Ndx < DE_LENGTH_OF_ARRAY(combCases); cmb0Ndx++)
2780 de::MovePtr<tcu::TestCaseGroup> cmb0Group(new tcu::TestCaseGroup(testCtx, combCases[cmb0Ndx].name, combCases[cmb0Ndx].description));
2781 for (int cmb1Ndx = 0; cmb1Ndx < DE_LENGTH_OF_ARRAY(combCases); cmb1Ndx++)
2783 de::MovePtr<tcu::TestCaseGroup> cmb1Group(new tcu::TestCaseGroup(testCtx, combCases[cmb1Ndx].name, combCases[cmb1Ndx].description));
2784 for (int extNdx = 0; extNdx < DE_LENGTH_OF_ARRAY(extentCases); extNdx++)
2786 // reduce number of cases repeat every other extent case for graphics pipeline library
2787 if ((groupParams->pipelineConstructionType != PIPELINE_CONSTRUCTION_TYPE_MONOLITHIC) && ((extNdx % 2) == 1))
2790 // reduce number of tests for dynamic rendering cases where secondary command buffer is used
2791 if (groupParams->useSecondaryCmdBuffer && (extNdx != 1))
2794 de::MovePtr<tcu::TestCaseGroup> extGroup(new tcu::TestCaseGroup(testCtx, extentCases[extNdx].name, extentCases[extNdx].description));
2795 for (int sampNdx = 0; sampNdx < DE_LENGTH_OF_ARRAY(sampCases); sampNdx++)
2797 // reduce number of tests for dynamic rendering cases where secondary command buffer is used
2798 if (groupParams->useSecondaryCmdBuffer && (sampNdx != 1))
2801 de::MovePtr<tcu::TestCaseGroup> sampGroup(new tcu::TestCaseGroup(testCtx, sampCases[sampNdx].name, sampCases[sampNdx].description));
2802 for (int geomNdx = 0; geomNdx < DE_LENGTH_OF_ARRAY(geomCases); geomNdx++)
2804 // reduce number of tests for dynamic rendering cases where secondary command buffer is used
2805 if (groupParams->useSecondaryCmdBuffer && (geomNdx != 0))
2808 bool useApiSampleMask = groupNdx == 1;
2809 bool useSampleMaskIn = groupNdx == 2;
2810 bool consRast = groupNdx == 3 || groupNdx == 4;
2811 bool fragDepth = groupNdx == 5;
2812 bool fragStencil = groupNdx == 6;
2813 bool multiViewport = groupNdx == 7;
2814 bool colorLayered = groupNdx == 8 || groupNdx == 9;
2815 bool srLayered = groupNdx == 9 || groupNdx == 11;
2816 bool multiView = groupNdx == 10 || groupNdx == 11 || groupNdx == 12;
2817 bool correlationMask = groupNdx == 12;
2818 bool interlock = groupNdx == 13;
2819 bool sampleLocations = groupNdx == 14;
2820 bool sampleShadingEnable = groupNdx == 15;
2821 bool sampleShadingInput = groupNdx == 16;
2822 VkConservativeRasterizationModeEXT conservativeMode = (groupNdx == 3) ? VK_CONSERVATIVE_RASTERIZATION_MODE_UNDERESTIMATE_EXT : VK_CONSERVATIVE_RASTERIZATION_MODE_OVERESTIMATE_EXT;
2823 deUint32 numColorLayers = (colorLayered || multiView) ? 2u : 1u;
2825 // Don't bother with geometry shader if we're not testing shader writes
2826 if (geomCases[geomNdx].count && !shdCases[shdNdx].count)
2829 // reduce number of tests
2830 if ((groupNdx != 0) &&
2831 (!dynCases[dynNdx].count ||
2832 !(combCases[cmb0Ndx].count == VK_FRAGMENT_SHADING_RATE_COMBINER_OP_KEEP_KHR || combCases[cmb0Ndx].count == VK_FRAGMENT_SHADING_RATE_COMBINER_OP_REPLACE_KHR) ||
2833 !(combCases[cmb1Ndx].count == VK_FRAGMENT_SHADING_RATE_COMBINER_OP_KEEP_KHR || combCases[cmb1Ndx].count == VK_FRAGMENT_SHADING_RATE_COMBINER_OP_REPLACE_KHR)))
2836 // Don't bother with geometry shader if we're testing conservative raster, sample mask, depth/stencil
2837 if (geomCases[geomNdx].count && (useApiSampleMask || useSampleMaskIn || consRast || fragDepth || fragStencil))
2840 // Don't bother with geometry shader if we're testing non-dynamic state
2841 if (geomCases[geomNdx].count && !dynCases[dynNdx].count)
2844 // Only test multiViewport/layered with shaderWritesRate
2845 if ((multiViewport || colorLayered) && !shdCases[shdNdx].count)
2848 // Can't test layered shading rate attachment without an attachment
2849 if (srLayered && attCases[attNdx].usage != AttachmentUsage::WITH_ATTACHMENT)
2854 groupParams, // SharedGroupParams groupParams;
2855 seed++, // deInt32 seed;
2856 extentCases[extNdx].count, // VkExtent2D framebufferDim;
2857 (VkSampleCountFlagBits)sampCases[sampNdx].count, // VkSampleCountFlagBits samples;
2859 (VkFragmentShadingRateCombinerOpKHR)combCases[cmb0Ndx].count,
2860 (VkFragmentShadingRateCombinerOpKHR)combCases[cmb1Ndx].count
2861 }, // VkFragmentShadingRateCombinerOpKHR combinerOp[2];
2862 attCases[attNdx].usage, // AttachmentUsage attachmentUsage;
2863 (bool)shdCases[shdNdx].count, // bool shaderWritesRate;
2864 (bool)geomCases[geomNdx].count, // bool geometryShader;
2865 (bool)dynCases[dynNdx].count, // bool useDynamicState;
2866 useApiSampleMask, // bool useApiSampleMask;
2867 useSampleMaskIn, // bool useSampleMaskIn;
2868 consRast, // bool conservativeEnable;
2869 conservativeMode, // VkConservativeRasterizationModeEXT conservativeMode;
2870 fragDepth || fragStencil, // bool useDepthStencil;
2871 fragDepth, // bool fragDepth;
2872 fragStencil, // bool fragStencil;
2873 multiViewport, // bool multiViewport;
2874 colorLayered, // bool colorLayered;
2875 srLayered, // bool srLayered;
2876 numColorLayers, // deUint32 numColorLayers;
2877 multiView, // bool multiView;
2878 correlationMask, // bool correlationMask;
2879 interlock, // bool interlock;
2880 sampleLocations, // bool sampleLocations;
2881 sampleShadingEnable, // bool sampleShadingEnable;
2882 sampleShadingInput, // bool sampleShadingInput;
2883 false, // bool sampleMaskTest;
2886 sampGroup->addChild(new FSRTestCase(testCtx, geomCases[geomNdx].name, geomCases[geomNdx].description, c));
2888 extGroup->addChild(sampGroup.release());
2890 cmb1Group->addChild(extGroup.release());
2892 cmb0Group->addChild(cmb1Group.release());
2894 shdGroup->addChild(cmb0Group.release());
2896 attGroup->addChild(shdGroup.release());
2898 dynGroup->addChild(attGroup.release());
2900 group->addChild(dynGroup.release());
2902 parentGroup->addChild(group.release());
2905 if (!groupParams->useSecondaryCmdBuffer)
2907 de::MovePtr<tcu::TestCaseGroup> group(new tcu::TestCaseGroup(testCtx, "misc_tests", "Single tests that don't need to be part of above test matrix"));
2908 group->addChild(new FSRTestCase(testCtx, "sample_mask_test", "", {
2909 groupParams, // SharedGroupParams groupParams;
2910 123, // deInt32 seed;
2911 {32, 33}, // VkExtent2D framebufferDim;
2912 VK_SAMPLE_COUNT_4_BIT, // VkSampleCountFlagBits samples;
2914 VK_FRAGMENT_SHADING_RATE_COMBINER_OP_KEEP_KHR,
2915 VK_FRAGMENT_SHADING_RATE_COMBINER_OP_KEEP_KHR
2916 }, // VkFragmentShadingRateCombinerOpKHR combinerOp[2];
2917 AttachmentUsage::NO_ATTACHMENT, // AttachmentUsage attachmentUsage;
2918 true, // bool shaderWritesRate;
2919 false, // bool geometryShader;
2920 false, // bool useDynamicState;
2921 true, // bool useApiSampleMask;
2922 false, // bool useSampleMaskIn;
2923 false, // bool conservativeEnable;
2924 VK_CONSERVATIVE_RASTERIZATION_MODE_UNDERESTIMATE_EXT, // VkConservativeRasterizationModeEXT conservativeMode;
2925 false, // bool useDepthStencil;
2926 false, // bool fragDepth;
2927 false, // bool fragStencil;
2928 false, // bool multiViewport;
2929 false, // bool colorLayered;
2930 false, // bool srLayered;
2931 1u, // deUint32 numColorLayers;
2932 false, // bool multiView;
2933 false, // bool correlationMask;
2934 false, // bool interlock;
2935 false, // bool sampleLocations;
2936 false, // bool sampleShadingEnable;
2937 false, // bool sampleShadingInput;
2938 true, // bool sampleMaskTest;
2941 parentGroup->addChild(group.release());
2945 } // FragmentShadingRage