1 /*------------------------------------------------------------------------
2 * Vulkan Conformance Tests
3 * ------------------------
4 *
5 * Copyright (c) 2016 The Khronos Group Inc.
6 * Copyright (c) 2016 The Android Open Source Project
7 *
8 * Licensed under the Apache License, Version 2.0 (the "License");
9 * you may not use this file except in compliance with the License.
10 * You may obtain a copy of the License at
11 *
12 * http://www.apache.org/licenses/LICENSE-2.0
13 *
14 * Unless required by applicable law or agreed to in writing, software
15 * distributed under the License is distributed on an "AS IS" BASIS,
16 * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
17 * See the License for the specific language governing permissions and
18 * limitations under the License.
19 *
20 *//*!
21 * \file
22 * \brief Multisampled image load/store Tests
23 *//*--------------------------------------------------------------------*/
24
25 #include "vktImageMultisampleLoadStoreTests.hpp"
26 #include "vktTestCaseUtil.hpp"
27 #include "vktImageTestsUtil.hpp"
28 #include "vktImageLoadStoreUtil.hpp"
29 #include "vktImageTexture.hpp"
30
31 #include "vkDefs.hpp"
32 #include "vkRef.hpp"
33 #include "vkRefUtil.hpp"
34 #include "vkPlatform.hpp"
35 #include "vkPrograms.hpp"
36 #include "vkMemUtil.hpp"
37 #include "vkBarrierUtil.hpp"
38 #include "vkBuilderUtil.hpp"
39 #include "vkQueryUtil.hpp"
40 #include "vkImageUtil.hpp"
41 #include "vkCmdUtil.hpp"
42
43 #include "deUniquePtr.hpp"
44
45 #include "tcuTextureUtil.hpp"
46 #include "tcuTestLog.hpp"
47
48 #include <string>
49 #include <vector>
50
51 namespace vkt
52 {
53 namespace image
54 {
55 namespace
56 {
57 using namespace vk;
58 using de::MovePtr;
59 using de::UniquePtr;
60 using tcu::IVec3;
61
62 static const VkFormat CHECKSUM_IMAGE_FORMAT = VK_FORMAT_R32_SINT;
63
64 struct CaseDef
65 {
66 Texture texture;
67 VkFormat format;
68 VkSampleCountFlagBits numSamples;
69 bool singleLayerBind;
70 };
71
72 // Multisampled storage image test.
73 //
74 // Pass 1: Write a slightly different color pattern per-sample to the whole image.
75 // Pass 2: Read samples of the same image and check if color values are in the expected range.
76 // Write back results as a checksum image and verify them on the host.
77 // Each checksum image pixel should contain an integer equal to the number of samples.
78
initPrograms(SourceCollections & programCollection,const CaseDef caseDef)79 void initPrograms (SourceCollections& programCollection, const CaseDef caseDef)
80 {
81 const int dimension = (caseDef.singleLayerBind ? caseDef.texture.layerDimension() : caseDef.texture.dimension());
82 const std::string texelCoordStr = (dimension == 1 ? "gx" : dimension == 2 ? "ivec2(gx, gy)" : dimension == 3 ? "ivec3(gx, gy, gz)" : "");
83
84 const ImageType usedImageType = (caseDef.singleLayerBind ? getImageTypeForSingleLayer(caseDef.texture.type()) : caseDef.texture.type());
85 const std::string formatQualifierStr = getShaderImageFormatQualifier(mapVkFormat(caseDef.format));
86 const std::string msImageTypeStr = getShaderImageType(mapVkFormat(caseDef.format), usedImageType, (caseDef.texture.numSamples() > 1));
87
88 const std::string xMax = de::toString(caseDef.texture.size().x() - 1);
89 const std::string yMax = de::toString(caseDef.texture.size().y() - 1);
90 const std::string signednessPrefix = isUintFormat(caseDef.format) ? "u" : isIntFormat(caseDef.format) ? "i" : "";
91 const std::string gvec4Expr = signednessPrefix + "vec4";
92 const int numColorComponents = tcu::getNumUsedChannels(mapVkFormat(caseDef.format).order);
93
94 const float storeColorScale = computeStoreColorScale(caseDef.format, caseDef.texture.size());
95 const float storeColorBias = computeStoreColorBias(caseDef.format);
96 DE_ASSERT(colorScaleAndBiasAreValid(caseDef.format, storeColorScale, storeColorBias));
97
98 const std::string colorScaleExpr = (storeColorScale == 1.0f ? "" : "*" + de::toString(storeColorScale))
99 + (storeColorBias == 0.0f ? "" : " + float(" + de::toString(storeColorBias) + ")");
100 const std::string colorExpr =
101 gvec4Expr + "("
102 + "gx^gy^gz^(sampleNdx >> 5)^(sampleNdx & 31), " // we "split" sampleNdx to keep this value in [0, 31] range for numSamples = 64 case
103 + (numColorComponents > 1 ? "(" + xMax + "-gx)^gy^gz, " : "0, ")
104 + (numColorComponents > 2 ? "gx^(" + yMax + "-gy)^gz, " : "0, ")
105 + (numColorComponents > 3 ? "(" + xMax + "-gx)^(" + yMax + "-gy)^gz" : "1")
106 + ")" + colorScaleExpr;
107
108 // Store shader
109 {
110 std::ostringstream src;
111 src << glu::getGLSLVersionDeclaration(glu::GLSL_VERSION_450) << "\n"
112 << "\n"
113 << "layout(local_size_x = 1) in;\n"
114 << "layout(set = 0, binding = 1, " << formatQualifierStr << ") writeonly uniform " << msImageTypeStr << " u_msImage;\n";
115
116 if (caseDef.singleLayerBind)
117 src << "layout(set = 0, binding = 0) readonly uniform Constants {\n"
118 << " int u_layerNdx;\n"
119 << "};\n";
120
121 src << "\n"
122 << "void main (void)\n"
123 << "{\n"
124 << " int gx = int(gl_GlobalInvocationID.x);\n"
125 << " int gy = int(gl_GlobalInvocationID.y);\n"
126 << " int gz = " << (caseDef.singleLayerBind ? "u_layerNdx" : "int(gl_GlobalInvocationID.z)") << ";\n"
127 << "\n"
128 << " for (int sampleNdx = 0; sampleNdx < " << caseDef.texture.numSamples() <<"; ++sampleNdx) {\n"
129 << " imageStore(u_msImage, " << texelCoordStr << ", sampleNdx, " << colorExpr << ");\n"
130 << " }\n"
131 << "}\n";
132
133 programCollection.glslSources.add("comp_store") << glu::ComputeSource(src.str());
134 }
135
136 // Load shader
137 {
138 const tcu::TextureFormat checksumFormat = mapVkFormat(CHECKSUM_IMAGE_FORMAT);
139 const std::string checksumImageTypeStr = getShaderImageType(checksumFormat, usedImageType);
140 const bool useExactCompare = isIntegerFormat(caseDef.format);
141
142 std::ostringstream src;
143 src << glu::getGLSLVersionDeclaration(glu::GLSL_VERSION_450) << "\n"
144 << "\n"
145 << "layout(local_size_x = 1) in;\n"
146 << "layout(set = 0, binding = 1, " << formatQualifierStr << ") readonly uniform " << msImageTypeStr << " u_msImage;\n"
147 << "layout(set = 0, binding = 2, " << getShaderImageFormatQualifier(checksumFormat) << ") writeonly uniform " << checksumImageTypeStr << " u_checksumImage;\n";
148
149 if (caseDef.singleLayerBind)
150 src << "layout(set = 0, binding = 0) readonly uniform Constants {\n"
151 << " int u_layerNdx;\n"
152 << "};\n";
153
154 src << "\n"
155 << "void main (void)\n"
156 << "{\n"
157 << " int gx = int(gl_GlobalInvocationID.x);\n"
158 << " int gy = int(gl_GlobalInvocationID.y);\n"
159 << " int gz = " << (caseDef.singleLayerBind ? "u_layerNdx" : "int(gl_GlobalInvocationID.z)") << ";\n"
160 << "\n"
161 << " int checksum = 0;\n"
162 << " for (int sampleNdx = 0; sampleNdx < " << caseDef.texture.numSamples() <<"; ++sampleNdx) {\n"
163 << " " << gvec4Expr << " color = imageLoad(u_msImage, " << texelCoordStr << ", sampleNdx);\n";
164
165 if (useExactCompare)
166 src << " if (color == " << colorExpr << ")\n"
167 << " ++checksum;\n";
168 else
169 src << " " << gvec4Expr << " diff = abs(abs(color) - abs(" << colorExpr << "));\n"
170 << " if (all(lessThan(diff, " << gvec4Expr << "(0.02))))\n"
171 << " ++checksum;\n";
172
173 src << " }\n"
174 << "\n"
175 << " imageStore(u_checksumImage, " << texelCoordStr << ", ivec4(checksum));\n"
176 << "}\n";
177
178 programCollection.glslSources.add("comp_load") << glu::ComputeSource(src.str());
179 }
180 }
181
checkRequirements(const InstanceInterface & vki,const VkPhysicalDevice physDevice,const CaseDef & caseDef)182 void checkRequirements (const InstanceInterface& vki, const VkPhysicalDevice physDevice, const CaseDef& caseDef)
183 {
184 VkPhysicalDeviceFeatures features;
185 vki.getPhysicalDeviceFeatures(physDevice, &features);
186
187 if (!features.shaderStorageImageMultisample)
188 TCU_THROW(NotSupportedError, "Multisampled storage images are not supported");
189
190 VkImageFormatProperties imageFormatProperties;
191 const VkResult imageFormatResult = vki.getPhysicalDeviceImageFormatProperties(
192 physDevice, caseDef.format, VK_IMAGE_TYPE_2D, VK_IMAGE_TILING_OPTIMAL, VK_IMAGE_USAGE_STORAGE_BIT, (VkImageCreateFlags)0, &imageFormatProperties);
193
194 if (imageFormatResult == VK_ERROR_FORMAT_NOT_SUPPORTED)
195 TCU_THROW(NotSupportedError, "Format is not supported");
196
197 if ((imageFormatProperties.sampleCounts & caseDef.numSamples) != caseDef.numSamples)
198 TCU_THROW(NotSupportedError, "Requested sample count is not supported");
199 }
200
201 //! Helper function to deal with per-layer resources.
insertImageViews(const DeviceInterface & vk,const VkDevice device,const CaseDef & caseDef,const VkFormat format,const VkImage image,std::vector<SharedVkImageView> * const pOutImageViews)202 void insertImageViews (const DeviceInterface& vk, const VkDevice device, const CaseDef& caseDef, const VkFormat format, const VkImage image, std::vector<SharedVkImageView>* const pOutImageViews)
203 {
204 if (caseDef.singleLayerBind)
205 {
206 pOutImageViews->clear();
207 pOutImageViews->resize(caseDef.texture.numLayers());
208 for (int layerNdx = 0; layerNdx < caseDef.texture.numLayers(); ++layerNdx)
209 {
210 (*pOutImageViews)[layerNdx] = makeVkSharedPtr(makeImageView(
211 vk, device, image, mapImageViewType(getImageTypeForSingleLayer(caseDef.texture.type())), format,
212 makeImageSubresourceRange(VK_IMAGE_ASPECT_COLOR_BIT, 0u, 1u, layerNdx, 1u)));
213 }
214 }
215 else // bind all layers at once
216 {
217 pOutImageViews->clear();
218 pOutImageViews->resize(1);
219 (*pOutImageViews)[0] = makeVkSharedPtr(makeImageView(
220 vk, device, image, mapImageViewType(caseDef.texture.type()), format,
221 makeImageSubresourceRange(VK_IMAGE_ASPECT_COLOR_BIT, 0u, 1u, 0u, caseDef.texture.numLayers())));
222 }
223 }
224
225 //! Helper function to deal with per-layer resources.
insertDescriptorSets(const DeviceInterface & vk,const VkDevice device,const CaseDef & caseDef,const VkDescriptorPool descriptorPool,const VkDescriptorSetLayout descriptorSetLayout,std::vector<SharedVkDescriptorSet> * const pOutDescriptorSets)226 void insertDescriptorSets (const DeviceInterface& vk, const VkDevice device, const CaseDef& caseDef, const VkDescriptorPool descriptorPool, const VkDescriptorSetLayout descriptorSetLayout, std::vector<SharedVkDescriptorSet>* const pOutDescriptorSets)
227 {
228 if (caseDef.singleLayerBind)
229 {
230 pOutDescriptorSets->clear();
231 pOutDescriptorSets->resize(caseDef.texture.numLayers());
232 for (int layerNdx = 0; layerNdx < caseDef.texture.numLayers(); ++layerNdx)
233 (*pOutDescriptorSets)[layerNdx] = makeVkSharedPtr(makeDescriptorSet(vk, device, descriptorPool, descriptorSetLayout));
234 }
235 else // bind all layers at once
236 {
237 pOutDescriptorSets->clear();
238 pOutDescriptorSets->resize(1);
239 (*pOutDescriptorSets)[0] = makeVkSharedPtr(makeDescriptorSet(vk, device, descriptorPool, descriptorSetLayout));
240 }
241 }
242
test(Context & context,const CaseDef caseDef)243 tcu::TestStatus test (Context& context, const CaseDef caseDef)
244 {
245 const InstanceInterface& vki = context.getInstanceInterface();
246 const VkPhysicalDevice physDevice = context.getPhysicalDevice();
247 const DeviceInterface& vk = context.getDeviceInterface();
248 const VkDevice device = context.getDevice();
249 const VkQueue queue = context.getUniversalQueue();
250 const deUint32 queueFamilyIndex = context.getUniversalQueueFamilyIndex();
251 Allocator& allocator = context.getDefaultAllocator();
252
253 checkRequirements(vki, physDevice, caseDef);
254
255 // Images
256
257 const UniquePtr<Image> msImage(new Image(
258 vk, device, allocator, makeImageCreateInfo(caseDef.texture, caseDef.format, VK_IMAGE_USAGE_STORAGE_BIT, 0u), MemoryRequirement::Any));
259
260 const UniquePtr<Image> checksumImage(new Image(
261 vk, device, allocator,
262 makeImageCreateInfo(Texture(caseDef.texture, 1), CHECKSUM_IMAGE_FORMAT, VK_IMAGE_USAGE_STORAGE_BIT | VK_IMAGE_USAGE_TRANSFER_SRC_BIT, 0u),
263 MemoryRequirement::Any));
264
265 // Buffer used to pass constants to the shader.
266
267 const int numLayers = caseDef.texture.numLayers();
268 const VkDeviceSize bufferChunkSize = getOptimalUniformBufferChunkSize(vki, physDevice, sizeof(deInt32));
269 const VkDeviceSize constantsBufferSizeBytes = numLayers * bufferChunkSize;
270 UniquePtr<Buffer> constantsBuffer (new Buffer(vk, device, allocator, makeBufferCreateInfo(constantsBufferSizeBytes, VK_BUFFER_USAGE_UNIFORM_BUFFER_BIT),
271 MemoryRequirement::HostVisible));
272
273 {
274 const Allocation& alloc = constantsBuffer->getAllocation();
275 deUint8* const basePtr = static_cast<deUint8*>(alloc.getHostPtr());
276
277 deMemset(alloc.getHostPtr(), 0, static_cast<size_t>(constantsBufferSizeBytes));
278
279 for (int layerNdx = 0; layerNdx < numLayers; ++layerNdx)
280 {
281 deInt32* const valuePtr = reinterpret_cast<deInt32*>(basePtr + layerNdx * bufferChunkSize);
282 *valuePtr = layerNdx;
283 }
284
285 flushAlloc(vk, device, alloc);
286 }
287
288 const VkDeviceSize resultBufferSizeBytes = getImageSizeBytes(caseDef.texture.size(), CHECKSUM_IMAGE_FORMAT);
289 UniquePtr<Buffer> resultBuffer (new Buffer(vk, device, allocator, makeBufferCreateInfo(resultBufferSizeBytes, VK_BUFFER_USAGE_TRANSFER_DST_BIT),
290 MemoryRequirement::HostVisible));
291
292 {
293 const Allocation& alloc = resultBuffer->getAllocation();
294 deMemset(alloc.getHostPtr(), 0, static_cast<size_t>(resultBufferSizeBytes));
295 flushAlloc(vk, device, alloc);
296 }
297
298 // Descriptors
299
300 Unique<VkDescriptorSetLayout> descriptorSetLayout(DescriptorSetLayoutBuilder()
301 .addSingleBinding(VK_DESCRIPTOR_TYPE_UNIFORM_BUFFER, VK_SHADER_STAGE_COMPUTE_BIT)
302 .addSingleBinding(VK_DESCRIPTOR_TYPE_STORAGE_IMAGE, VK_SHADER_STAGE_COMPUTE_BIT)
303 .addSingleBinding(VK_DESCRIPTOR_TYPE_STORAGE_IMAGE, VK_SHADER_STAGE_COMPUTE_BIT)
304 .build(vk, device));
305
306 Unique<VkDescriptorPool> descriptorPool(DescriptorPoolBuilder()
307 .addType(VK_DESCRIPTOR_TYPE_UNIFORM_BUFFER, numLayers)
308 .addType(VK_DESCRIPTOR_TYPE_STORAGE_IMAGE, numLayers)
309 .addType(VK_DESCRIPTOR_TYPE_STORAGE_IMAGE, numLayers)
310 .build(vk, device, VK_DESCRIPTOR_POOL_CREATE_FREE_DESCRIPTOR_SET_BIT, numLayers));
311
312 std::vector<SharedVkDescriptorSet> allDescriptorSets;
313 std::vector<SharedVkImageView> allMultisampledImageViews;
314 std::vector<SharedVkImageView> allChecksumImageViews;
315
316 insertDescriptorSets(vk, device, caseDef, *descriptorPool, *descriptorSetLayout, &allDescriptorSets);
317 insertImageViews (vk, device, caseDef, caseDef.format, **msImage, &allMultisampledImageViews);
318 insertImageViews (vk, device, caseDef, CHECKSUM_IMAGE_FORMAT, **checksumImage, &allChecksumImageViews);
319
320 // Prepare commands
321
322 const Unique<VkPipelineLayout> pipelineLayout (makePipelineLayout(vk, device, *descriptorSetLayout));
323 const Unique<VkCommandPool> cmdPool (createCommandPool(vk, device, VK_COMMAND_POOL_CREATE_RESET_COMMAND_BUFFER_BIT, queueFamilyIndex));
324 const Unique<VkCommandBuffer> cmdBuffer (allocateCommandBuffer(vk, device, *cmdPool, VK_COMMAND_BUFFER_LEVEL_PRIMARY));
325
326 const tcu::IVec3 workSize = (caseDef.singleLayerBind ? caseDef.texture.layerSize() : caseDef.texture.size());
327 const int loopNumLayers = (caseDef.singleLayerBind ? numLayers : 1);
328 const VkImageSubresourceRange subresourceAllLayers = makeImageSubresourceRange(VK_IMAGE_ASPECT_COLOR_BIT, 0u, 1u, 0u, caseDef.texture.numLayers());
329
330 // Pass 1: Write MS image
331 {
332 const Unique<VkShaderModule> shaderModule (createShaderModule (vk, device, context.getBinaryCollection().get("comp_store"), 0));
333 const Unique<VkPipeline> pipeline (makeComputePipeline(vk, device, *pipelineLayout, *shaderModule));
334
335 beginCommandBuffer(vk, *cmdBuffer);
336 vk.cmdBindPipeline(*cmdBuffer, VK_PIPELINE_BIND_POINT_COMPUTE, *pipeline);
337
338 {
339 const VkImageMemoryBarrier barriers[] =
340 {
341 makeImageMemoryBarrier((VkAccessFlags)0, VK_ACCESS_SHADER_WRITE_BIT, VK_IMAGE_LAYOUT_UNDEFINED, VK_IMAGE_LAYOUT_GENERAL, **msImage, subresourceAllLayers),
342 makeImageMemoryBarrier((VkAccessFlags)0, VK_ACCESS_SHADER_WRITE_BIT, VK_IMAGE_LAYOUT_UNDEFINED, VK_IMAGE_LAYOUT_GENERAL, **checksumImage, subresourceAllLayers),
343 };
344
345 vk.cmdPipelineBarrier(*cmdBuffer, VK_PIPELINE_STAGE_TOP_OF_PIPE_BIT, VK_PIPELINE_STAGE_COMPUTE_SHADER_BIT, (VkDependencyFlags)0,
346 0u, DE_NULL, 0u, DE_NULL, DE_LENGTH_OF_ARRAY(barriers), barriers);
347 }
348
349 for (int layerNdx = 0; layerNdx < loopNumLayers; ++layerNdx)
350 {
351 const VkDescriptorSet descriptorSet = **allDescriptorSets[layerNdx];
352 const VkDescriptorImageInfo descriptorMultiImageInfo = makeDescriptorImageInfo(DE_NULL, **allMultisampledImageViews[layerNdx], VK_IMAGE_LAYOUT_GENERAL);
353 const VkDescriptorBufferInfo descriptorConstantsBufferInfo = makeDescriptorBufferInfo(constantsBuffer->get(), layerNdx*bufferChunkSize, bufferChunkSize);
354
355 DescriptorSetUpdateBuilder()
356 .writeSingle(descriptorSet, DescriptorSetUpdateBuilder::Location::binding(0u), VK_DESCRIPTOR_TYPE_UNIFORM_BUFFER, &descriptorConstantsBufferInfo)
357 .writeSingle(descriptorSet, DescriptorSetUpdateBuilder::Location::binding(1u), VK_DESCRIPTOR_TYPE_STORAGE_IMAGE, &descriptorMultiImageInfo)
358 .update(vk, device);
359
360 vk.cmdBindDescriptorSets(*cmdBuffer, VK_PIPELINE_BIND_POINT_COMPUTE, *pipelineLayout, 0u, 1u, &descriptorSet, 0u, DE_NULL);
361 vk.cmdDispatch(*cmdBuffer, workSize.x(), workSize.y(), workSize.z());
362 }
363
364 endCommandBuffer(vk, *cmdBuffer);
365 submitCommandsAndWait(vk, device, queue, *cmdBuffer);
366 }
367
368 // Pass 2: "Resolve" MS image in compute shader
369 {
370 const Unique<VkShaderModule> shaderModule (createShaderModule (vk, device, context.getBinaryCollection().get("comp_load"), 0));
371 const Unique<VkPipeline> pipeline (makeComputePipeline(vk, device, *pipelineLayout, *shaderModule));
372
373 beginCommandBuffer(vk, *cmdBuffer);
374 vk.cmdBindPipeline(*cmdBuffer, VK_PIPELINE_BIND_POINT_COMPUTE, *pipeline);
375
376 {
377 const VkImageMemoryBarrier barriers[] =
378 {
379 makeImageMemoryBarrier(VK_ACCESS_SHADER_WRITE_BIT, VK_ACCESS_SHADER_READ_BIT, VK_IMAGE_LAYOUT_GENERAL, VK_IMAGE_LAYOUT_GENERAL, **msImage, subresourceAllLayers),
380 };
381
382 vk.cmdPipelineBarrier(*cmdBuffer, VK_PIPELINE_STAGE_COMPUTE_SHADER_BIT, VK_PIPELINE_STAGE_COMPUTE_SHADER_BIT, (VkDependencyFlags)0,
383 0u, DE_NULL, 0u, DE_NULL, DE_LENGTH_OF_ARRAY(barriers), barriers);
384 }
385
386 for (int layerNdx = 0; layerNdx < loopNumLayers; ++layerNdx)
387 {
388 const VkDescriptorSet descriptorSet = **allDescriptorSets[layerNdx];
389 const VkDescriptorImageInfo descriptorMultiImageInfo = makeDescriptorImageInfo(DE_NULL, **allMultisampledImageViews[layerNdx], VK_IMAGE_LAYOUT_GENERAL);
390 const VkDescriptorImageInfo descriptorChecksumImageInfo = makeDescriptorImageInfo(DE_NULL, **allChecksumImageViews[layerNdx], VK_IMAGE_LAYOUT_GENERAL);
391 const VkDescriptorBufferInfo descriptorConstantsBufferInfo = makeDescriptorBufferInfo(constantsBuffer->get(), layerNdx*bufferChunkSize, bufferChunkSize);
392
393 DescriptorSetUpdateBuilder()
394 .writeSingle(descriptorSet, DescriptorSetUpdateBuilder::Location::binding(0u), VK_DESCRIPTOR_TYPE_UNIFORM_BUFFER, &descriptorConstantsBufferInfo)
395 .writeSingle(descriptorSet, DescriptorSetUpdateBuilder::Location::binding(1u), VK_DESCRIPTOR_TYPE_STORAGE_IMAGE, &descriptorMultiImageInfo)
396 .writeSingle(descriptorSet, DescriptorSetUpdateBuilder::Location::binding(2u), VK_DESCRIPTOR_TYPE_STORAGE_IMAGE, &descriptorChecksumImageInfo)
397 .update(vk, device);
398
399 vk.cmdBindDescriptorSets(*cmdBuffer, VK_PIPELINE_BIND_POINT_COMPUTE, *pipelineLayout, 0u, 1u, &descriptorSet, 0u, DE_NULL);
400 vk.cmdDispatch(*cmdBuffer, workSize.x(), workSize.y(), workSize.z());
401 }
402
403 endCommandBuffer(vk, *cmdBuffer);
404 submitCommandsAndWait(vk, device, queue, *cmdBuffer);
405 }
406
407 // Retrieve result
408 {
409 beginCommandBuffer(vk, *cmdBuffer);
410
411 {
412 const VkImageMemoryBarrier barriers[] =
413 {
414 makeImageMemoryBarrier(VK_ACCESS_SHADER_WRITE_BIT, VK_ACCESS_TRANSFER_READ_BIT, VK_IMAGE_LAYOUT_GENERAL, VK_IMAGE_LAYOUT_TRANSFER_SRC_OPTIMAL, **checksumImage, subresourceAllLayers),
415 };
416 vk.cmdPipelineBarrier(*cmdBuffer, VK_PIPELINE_STAGE_COMPUTE_SHADER_BIT, VK_PIPELINE_STAGE_TRANSFER_BIT, (VkDependencyFlags)0,
417 0u, DE_NULL, 0u, DE_NULL, DE_LENGTH_OF_ARRAY(barriers), barriers);
418 }
419 {
420 const VkBufferImageCopy copyRegion = makeBufferImageCopy(makeExtent3D(caseDef.texture.layerSize()), caseDef.texture.numLayers());
421 vk.cmdCopyImageToBuffer(*cmdBuffer, **checksumImage, VK_IMAGE_LAYOUT_TRANSFER_SRC_OPTIMAL, **resultBuffer, 1u, ©Region);
422 }
423 {
424 const VkBufferMemoryBarrier barriers[] =
425 {
426 makeBufferMemoryBarrier(VK_ACCESS_TRANSFER_WRITE_BIT, VK_ACCESS_HOST_READ_BIT, **resultBuffer, 0ull, resultBufferSizeBytes),
427 };
428 vk.cmdPipelineBarrier(*cmdBuffer, VK_PIPELINE_STAGE_TRANSFER_BIT, VK_PIPELINE_STAGE_HOST_BIT, (VkDependencyFlags)0,
429 0u, DE_NULL, DE_LENGTH_OF_ARRAY(barriers), barriers, 0u, DE_NULL);
430 }
431
432 endCommandBuffer(vk, *cmdBuffer);
433 submitCommandsAndWait(vk, device, queue, *cmdBuffer);
434 }
435
436 // Verify
437 {
438 const Allocation& alloc = resultBuffer->getAllocation();
439 invalidateAlloc(vk, device, alloc);
440
441 const IVec3 imageSize = caseDef.texture.size();
442 const deInt32* pDataPtr = static_cast<deInt32*>(alloc.getHostPtr());
443 const deInt32 expectedChecksum = caseDef.texture.numSamples();
444
445 for (int layer = 0; layer < imageSize.z(); ++layer)
446 for (int y = 0; y < imageSize.y(); ++y)
447 for (int x = 0; x < imageSize.x(); ++x)
448 {
449 if (*pDataPtr != expectedChecksum)
450 {
451 context.getTestContext().getLog()
452 << tcu::TestLog::Message << "Some sample colors were incorrect at (x, y, layer) = (" << x << ", " << y << ", " << layer << ")" << tcu::TestLog::EndMessage
453 << tcu::TestLog::Message << "Checksum value is " << *pDataPtr << " but expected " << expectedChecksum << tcu::TestLog::EndMessage;
454
455 return tcu::TestStatus::fail("Some sample colors were incorrect");
456 }
457 ++pDataPtr;
458 }
459
460 return tcu::TestStatus::pass("OK");
461 }
462 }
463
464 } // anonymous ns
465
createImageMultisampleLoadStoreTests(tcu::TestContext & testCtx)466 tcu::TestCaseGroup* createImageMultisampleLoadStoreTests (tcu::TestContext& testCtx)
467 {
468 const Texture textures[] =
469 {
470 // \note Shader code is tweaked to work with image size of 32, take a look if this needs to be modified.
471 Texture(IMAGE_TYPE_2D, tcu::IVec3(32, 32, 1), 1),
472 Texture(IMAGE_TYPE_2D_ARRAY, tcu::IVec3(32, 32, 1), 4),
473 };
474
475 static const VkFormat formats[] =
476 {
477 VK_FORMAT_R32G32B32A32_SFLOAT,
478 VK_FORMAT_R16G16B16A16_SFLOAT,
479 VK_FORMAT_R32_SFLOAT,
480
481 VK_FORMAT_R32G32B32A32_UINT,
482 VK_FORMAT_R16G16B16A16_UINT,
483 VK_FORMAT_R8G8B8A8_UINT,
484 VK_FORMAT_R32_UINT,
485
486 VK_FORMAT_R32G32B32A32_SINT,
487 VK_FORMAT_R16G16B16A16_SINT,
488 VK_FORMAT_R8G8B8A8_SINT,
489 VK_FORMAT_R32_SINT,
490
491 VK_FORMAT_R8G8B8A8_UNORM,
492
493 VK_FORMAT_R8G8B8A8_SNORM,
494 };
495
496 static const VkSampleCountFlagBits samples[] =
497 {
498 VK_SAMPLE_COUNT_2_BIT,
499 VK_SAMPLE_COUNT_4_BIT,
500 VK_SAMPLE_COUNT_8_BIT,
501 VK_SAMPLE_COUNT_16_BIT,
502 VK_SAMPLE_COUNT_32_BIT,
503 VK_SAMPLE_COUNT_64_BIT,
504 };
505
506 MovePtr<tcu::TestCaseGroup> testGroup(new tcu::TestCaseGroup(testCtx, "load_store_multisample", "Multisampled image store and load"));
507
508 for (int baseTextureNdx = 0; baseTextureNdx < DE_LENGTH_OF_ARRAY(textures); ++baseTextureNdx)
509 {
510 const Texture& baseTexture = textures[baseTextureNdx];
511 MovePtr<tcu::TestCaseGroup> imageViewGroup (new tcu::TestCaseGroup(testCtx, getImageTypeName(baseTexture.type()).c_str(), ""));
512 const int numLayerBindModes = (baseTexture.numLayers() == 1 ? 1 : 2);
513
514 for (int formatNdx = 0; formatNdx < DE_LENGTH_OF_ARRAY(formats); ++formatNdx)
515 for (int layerBindMode = 0; layerBindMode < numLayerBindModes; ++layerBindMode)
516 {
517 const bool singleLayerBind = (layerBindMode != 0);
518 const std::string formatGroupName = getFormatShortString(formats[formatNdx]) + (singleLayerBind ? "_single_layer" : "");
519 MovePtr<tcu::TestCaseGroup> formatGroup (new tcu::TestCaseGroup(testCtx, formatGroupName.c_str(), ""));
520
521 for (int samplesNdx = 0; samplesNdx < DE_LENGTH_OF_ARRAY(samples); ++samplesNdx)
522 {
523 const std::string samplesCaseName = "samples_" + de::toString(samples[samplesNdx]);
524
525 const CaseDef caseDef =
526 {
527 Texture(baseTexture, samples[samplesNdx]),
528 formats[formatNdx],
529 samples[samplesNdx],
530 singleLayerBind,
531 };
532
533 addFunctionCaseWithPrograms(formatGroup.get(), samplesCaseName, "", initPrograms, test, caseDef);
534 }
535 imageViewGroup->addChild(formatGroup.release());
536 }
537 testGroup->addChild(imageViewGroup.release());
538 }
539
540 return testGroup.release();
541 }
542
543 } // image
544 } // vkt
545