1 /*
2 * Copyright 2015 Google Inc.
3 *
4 * Use of this source code is governed by a BSD-style license that can be
5 * found in the LICENSE file.
6 */
7
8 #include "GrVkCaps.h"
9 #include "GrRenderTarget.h"
10 #include "GrShaderCaps.h"
11 #include "GrVkUtil.h"
12 #include "vk/GrVkBackendContext.h"
13 #include "vk/GrVkInterface.h"
14
GrVkCaps(const GrContextOptions & contextOptions,const GrVkInterface * vkInterface,VkPhysicalDevice physDev,uint32_t featureFlags,uint32_t extensionFlags)15 GrVkCaps::GrVkCaps(const GrContextOptions& contextOptions, const GrVkInterface* vkInterface,
16 VkPhysicalDevice physDev, uint32_t featureFlags, uint32_t extensionFlags)
17 : INHERITED(contextOptions) {
18 fCanUseGLSLForShaderModule = false;
19 fMustDoCopiesFromOrigin = false;
20 fSupportsCopiesAsDraws = false;
21 fMustSubmitCommandsBeforeCopyOp = false;
22 fMustSleepOnTearDown = false;
23 fNewSecondaryCBOnPipelineChange = false;
24
25 /**************************************************************************
26 * GrDrawTargetCaps fields
27 **************************************************************************/
28 fMipMapSupport = true; // always available in Vulkan
29 fSRGBSupport = true; // always available in Vulkan
30 fNPOTTextureTileSupport = true; // always available in Vulkan
31 fTwoSidedStencilSupport = true; // always available in Vulkan
32 fStencilWrapOpsSupport = true; // always available in Vulkan
33 fDiscardRenderTargetSupport = true;
34 fReuseScratchTextures = true; //TODO: figure this out
35 fGpuTracingSupport = false; //TODO: figure this out
36 fCompressedTexSubImageSupport = false; //TODO: figure this out
37 fOversizedStencilSupport = false; //TODO: figure this out
38
39 fUseDrawInsteadOfClear = false;
40 fFenceSyncSupport = true; // always available in Vulkan
41 fCrossContextTextureSupport = false; // TODO: Add thread-safe memory pools so we can enable this
42
43 fMapBufferFlags = kNone_MapFlags; //TODO: figure this out
44 fBufferMapThreshold = SK_MaxS32; //TODO: figure this out
45
46 fMaxRenderTargetSize = 4096; // minimum required by spec
47 fMaxTextureSize = 4096; // minimum required by spec
48 fMaxColorSampleCount = 4; // minimum required by spec
49 fMaxStencilSampleCount = 4; // minimum required by spec
50
51 fShaderCaps.reset(new GrShaderCaps(contextOptions));
52
53 this->init(contextOptions, vkInterface, physDev, featureFlags, extensionFlags);
54 }
55
initDescForDstCopy(const GrRenderTarget * src,GrSurfaceDesc * desc) const56 bool GrVkCaps::initDescForDstCopy(const GrRenderTarget* src, GrSurfaceDesc* desc) const {
57 // We can always succeed here with either a CopyImage (none msaa src) or ResolveImage (msaa).
58 // For CopyImage we can make a simple texture, for ResolveImage we require the dst to be a
59 // render target as well.
60 desc->fOrigin = src->origin();
61 desc->fConfig = src->config();
62 if (src->numColorSamples() > 1 || (src->asTexture() && this->supportsCopiesAsDraws())) {
63 desc->fFlags = kRenderTarget_GrSurfaceFlag;
64 } else {
65 // Just going to use CopyImage here
66 desc->fFlags = kNone_GrSurfaceFlags;
67 }
68
69 return true;
70 }
71
init(const GrContextOptions & contextOptions,const GrVkInterface * vkInterface,VkPhysicalDevice physDev,uint32_t featureFlags,uint32_t extensionFlags)72 void GrVkCaps::init(const GrContextOptions& contextOptions, const GrVkInterface* vkInterface,
73 VkPhysicalDevice physDev, uint32_t featureFlags, uint32_t extensionFlags) {
74
75 VkPhysicalDeviceProperties properties;
76 GR_VK_CALL(vkInterface, GetPhysicalDeviceProperties(physDev, &properties));
77
78 VkPhysicalDeviceMemoryProperties memoryProperties;
79 GR_VK_CALL(vkInterface, GetPhysicalDeviceMemoryProperties(physDev, &memoryProperties));
80
81 this->initGrCaps(properties, memoryProperties, featureFlags);
82 this->initShaderCaps(properties, featureFlags);
83 this->initConfigTable(vkInterface, physDev);
84 this->initStencilFormat(vkInterface, physDev);
85
86 if (SkToBool(extensionFlags & kNV_glsl_shader_GrVkExtensionFlag)) {
87 // Currently disabling this feature since it does not play well with validation layers which
88 // expect a SPIR-V shader
89 // fCanUseGLSLForShaderModule = true;
90 }
91
92 if (kQualcomm_VkVendor == properties.vendorID) {
93 fMustDoCopiesFromOrigin = true;
94 }
95
96 if (kNvidia_VkVendor == properties.vendorID) {
97 fSupportsCopiesAsDraws = true;
98 fMustSubmitCommandsBeforeCopyOp = true;
99 }
100
101 #if defined(SK_BUILD_FOR_WIN)
102 if (kNvidia_VkVendor == properties.vendorID) {
103 fMustSleepOnTearDown = true;
104 }
105 #elif defined(SK_BUILD_FOR_ANDROID)
106 if (kImagination_VkVendor == properties.vendorID) {
107 fMustSleepOnTearDown = true;
108 }
109 #endif
110
111 this->applyOptionsOverrides(contextOptions);
112 fShaderCaps->applyOptionsOverrides(contextOptions);
113 }
114
get_max_sample_count(VkSampleCountFlags flags)115 int get_max_sample_count(VkSampleCountFlags flags) {
116 SkASSERT(flags & VK_SAMPLE_COUNT_1_BIT);
117 if (!(flags & VK_SAMPLE_COUNT_2_BIT)) {
118 return 0;
119 }
120 if (!(flags & VK_SAMPLE_COUNT_4_BIT)) {
121 return 2;
122 }
123 if (!(flags & VK_SAMPLE_COUNT_8_BIT)) {
124 return 4;
125 }
126 if (!(flags & VK_SAMPLE_COUNT_16_BIT)) {
127 return 8;
128 }
129 if (!(flags & VK_SAMPLE_COUNT_32_BIT)) {
130 return 16;
131 }
132 if (!(flags & VK_SAMPLE_COUNT_64_BIT)) {
133 return 32;
134 }
135 return 64;
136 }
137
initSampleCount(const VkPhysicalDeviceProperties & properties)138 void GrVkCaps::initSampleCount(const VkPhysicalDeviceProperties& properties) {
139 VkSampleCountFlags colorSamples = properties.limits.framebufferColorSampleCounts;
140 VkSampleCountFlags stencilSamples = properties.limits.framebufferStencilSampleCounts;
141
142 fMaxColorSampleCount = get_max_sample_count(colorSamples);
143 fMaxStencilSampleCount = get_max_sample_count(stencilSamples);
144 }
145
initGrCaps(const VkPhysicalDeviceProperties & properties,const VkPhysicalDeviceMemoryProperties & memoryProperties,uint32_t featureFlags)146 void GrVkCaps::initGrCaps(const VkPhysicalDeviceProperties& properties,
147 const VkPhysicalDeviceMemoryProperties& memoryProperties,
148 uint32_t featureFlags) {
149 // So GPUs, like AMD, are reporting MAX_INT support vertex attributes. In general, there is no
150 // need for us ever to support that amount, and it makes tests which tests all the vertex
151 // attribs timeout looping over that many. For now, we'll cap this at 64 max and can raise it if
152 // we ever find that need.
153 static const uint32_t kMaxVertexAttributes = 64;
154 fMaxVertexAttributes = SkTMin(properties.limits.maxVertexInputAttributes, kMaxVertexAttributes);
155 // AMD advertises support for MAX_UINT vertex input attributes, but in reality only supports 32.
156 if (kAMD_VkVendor == properties.vendorID) {
157 fMaxVertexAttributes = SkTMin(fMaxVertexAttributes, 32);
158 }
159
160 // We could actually query and get a max size for each config, however maxImageDimension2D will
161 // give the minimum max size across all configs. So for simplicity we will use that for now.
162 fMaxRenderTargetSize = SkTMin(properties.limits.maxImageDimension2D, (uint32_t)INT_MAX);
163 fMaxTextureSize = SkTMin(properties.limits.maxImageDimension2D, (uint32_t)INT_MAX);
164
165 this->initSampleCount(properties);
166
167 // Assuming since we will always map in the end to upload the data we might as well just map
168 // from the get go. There is no hard data to suggest this is faster or slower.
169 fBufferMapThreshold = 0;
170
171 fMapBufferFlags = kCanMap_MapFlag | kSubset_MapFlag;
172
173 fStencilWrapOpsSupport = true;
174 fOversizedStencilSupport = true;
175 fSampleShadingSupport = SkToBool(featureFlags & kSampleRateShading_GrVkFeatureFlag);
176
177 // AMD seems to have issues binding new VkPipelines inside a secondary command buffer.
178 // Current workaround is to use a different secondary command buffer for each new VkPipeline.
179 if (kAMD_VkVendor == properties.vendorID) {
180 fNewSecondaryCBOnPipelineChange = true;
181 }
182 }
183
initShaderCaps(const VkPhysicalDeviceProperties & properties,uint32_t featureFlags)184 void GrVkCaps::initShaderCaps(const VkPhysicalDeviceProperties& properties, uint32_t featureFlags) {
185 GrShaderCaps* shaderCaps = fShaderCaps.get();
186 shaderCaps->fVersionDeclString = "#version 330\n";
187
188
189 // fConfigOutputSwizzle will default to RGBA so we only need to set it for alpha only config.
190 for (int i = 0; i < kGrPixelConfigCnt; ++i) {
191 GrPixelConfig config = static_cast<GrPixelConfig>(i);
192 if (GrPixelConfigIsAlphaOnly(config)) {
193 shaderCaps->fConfigTextureSwizzle[i] = GrSwizzle::RRRR();
194 shaderCaps->fConfigOutputSwizzle[i] = GrSwizzle::AAAA();
195 } else {
196 if (kGray_8_GrPixelConfig == config) {
197 shaderCaps->fConfigTextureSwizzle[i] = GrSwizzle::RRRA();
198 } else if (kRGBA_4444_GrPixelConfig == config) {
199 // The vulkan spec does not require R4G4B4A4 to be supported for texturing so we
200 // store the data in a B4G4R4A4 texture and then swizzle it when doing texture reads
201 // or writing to outputs. Since we're not actually changing the data at all, the
202 // only extra work is the swizzle in the shader for all operations.
203 shaderCaps->fConfigTextureSwizzle[i] = GrSwizzle::BGRA();
204 shaderCaps->fConfigOutputSwizzle[i] = GrSwizzle::BGRA();
205 } else {
206 shaderCaps->fConfigTextureSwizzle[i] = GrSwizzle::RGBA();
207 }
208 }
209 }
210
211 if (kImagination_VkVendor == properties.vendorID) {
212 shaderCaps->fAtan2ImplementedAsAtanYOverX = true;
213 }
214
215 // Vulkan is based off ES 3.0 so the following should all be supported
216 shaderCaps->fUsesPrecisionModifiers = true;
217 shaderCaps->fFlatInterpolationSupport = true;
218
219 // GrShaderCaps
220
221 shaderCaps->fShaderDerivativeSupport = true;
222 shaderCaps->fGeometryShaderSupport = SkToBool(featureFlags & kGeometryShader_GrVkFeatureFlag);
223
224 shaderCaps->fDualSourceBlendingSupport = SkToBool(featureFlags & kDualSrcBlend_GrVkFeatureFlag);
225 if (kAMD_VkVendor == properties.vendorID) {
226 // Currently DualSourceBlending is not working on AMD. vkCreateGraphicsPipeline fails when
227 // using a draw with dual source. Looking into whether it is driver bug or issue with our
228 // SPIR-V. Bug skia:6405
229 shaderCaps->fDualSourceBlendingSupport = false;
230 }
231
232 shaderCaps->fIntegerSupport = true;
233
234 // Assume the minimum precisions mandated by the SPIR-V spec.
235 shaderCaps->fShaderPrecisionVaries = true;
236 for (int s = 0; s < kGrShaderTypeCount; ++s) {
237 auto& highp = shaderCaps->fFloatPrecisions[s][kHigh_GrSLPrecision];
238 highp.fLogRangeLow = highp.fLogRangeHigh = 127;
239 highp.fBits = 23;
240
241 auto& mediump = shaderCaps->fFloatPrecisions[s][kMedium_GrSLPrecision];
242 mediump.fLogRangeLow = mediump.fLogRangeHigh = 14;
243 mediump.fBits = 10;
244
245 shaderCaps->fFloatPrecisions[s][kLow_GrSLPrecision] = mediump;
246 }
247 shaderCaps->initSamplerPrecisionTable();
248
249 shaderCaps->fMaxVertexSamplers =
250 shaderCaps->fMaxGeometrySamplers =
251 shaderCaps->fMaxFragmentSamplers = SkTMin(
252 SkTMin(properties.limits.maxPerStageDescriptorSampledImages,
253 properties.limits.maxPerStageDescriptorSamplers),
254 (uint32_t)INT_MAX);
255 shaderCaps->fMaxCombinedSamplers = SkTMin(
256 SkTMin(properties.limits.maxDescriptorSetSampledImages,
257 properties.limits.maxDescriptorSetSamplers),
258 (uint32_t)INT_MAX);
259 }
260
stencil_format_supported(const GrVkInterface * interface,VkPhysicalDevice physDev,VkFormat format)261 bool stencil_format_supported(const GrVkInterface* interface,
262 VkPhysicalDevice physDev,
263 VkFormat format) {
264 VkFormatProperties props;
265 memset(&props, 0, sizeof(VkFormatProperties));
266 GR_VK_CALL(interface, GetPhysicalDeviceFormatProperties(physDev, format, &props));
267 return SkToBool(VK_FORMAT_FEATURE_DEPTH_STENCIL_ATTACHMENT_BIT & props.optimalTilingFeatures);
268 }
269
initStencilFormat(const GrVkInterface * interface,VkPhysicalDevice physDev)270 void GrVkCaps::initStencilFormat(const GrVkInterface* interface, VkPhysicalDevice physDev) {
271 // List of legal stencil formats (though perhaps not supported on
272 // the particular gpu/driver) from most preferred to least. We are guaranteed to have either
273 // VK_FORMAT_D24_UNORM_S8_UINT or VK_FORMAT_D32_SFLOAT_S8_UINT. VK_FORMAT_D32_SFLOAT_S8_UINT
274 // can optionally have 24 unused bits at the end so we assume the total bits is 64.
275 static const StencilFormat
276 // internal Format stencil bits total bits packed?
277 gS8 = { VK_FORMAT_S8_UINT, 8, 8, false },
278 gD24S8 = { VK_FORMAT_D24_UNORM_S8_UINT, 8, 32, true },
279 gD32S8 = { VK_FORMAT_D32_SFLOAT_S8_UINT, 8, 64, true };
280
281 if (stencil_format_supported(interface, physDev, VK_FORMAT_S8_UINT)) {
282 fPreferedStencilFormat = gS8;
283 } else if (stencil_format_supported(interface, physDev, VK_FORMAT_D24_UNORM_S8_UINT)) {
284 fPreferedStencilFormat = gD24S8;
285 } else {
286 SkASSERT(stencil_format_supported(interface, physDev, VK_FORMAT_D32_SFLOAT_S8_UINT));
287 fPreferedStencilFormat = gD32S8;
288 }
289 }
290
initConfigTable(const GrVkInterface * interface,VkPhysicalDevice physDev)291 void GrVkCaps::initConfigTable(const GrVkInterface* interface, VkPhysicalDevice physDev) {
292 for (int i = 0; i < kGrPixelConfigCnt; ++i) {
293 VkFormat format;
294 if (GrPixelConfigToVkFormat(static_cast<GrPixelConfig>(i), &format)) {
295 fConfigTable[i].init(interface, physDev, format);
296 }
297 }
298
299 // We currently do not support compressed textures in Vulkan
300 const uint16_t kFlagsToRemove = ConfigInfo::kTextureable_Flag|ConfigInfo::kRenderable_Flag;
301 fConfigTable[kETC1_GrPixelConfig].fOptimalFlags &= ~kFlagsToRemove;
302 fConfigTable[kETC1_GrPixelConfig].fLinearFlags &= ~kFlagsToRemove;
303 }
304
InitConfigFlags(VkFormatFeatureFlags vkFlags,uint16_t * flags)305 void GrVkCaps::ConfigInfo::InitConfigFlags(VkFormatFeatureFlags vkFlags, uint16_t* flags) {
306 if (SkToBool(VK_FORMAT_FEATURE_SAMPLED_IMAGE_BIT & vkFlags) &&
307 SkToBool(VK_FORMAT_FEATURE_SAMPLED_IMAGE_FILTER_LINEAR_BIT & vkFlags)) {
308 *flags = *flags | kTextureable_Flag;
309 }
310
311 if (SkToBool(VK_FORMAT_FEATURE_COLOR_ATTACHMENT_BLEND_BIT & vkFlags)) {
312 *flags = *flags | kRenderable_Flag;
313 }
314
315 if (SkToBool(VK_FORMAT_FEATURE_BLIT_SRC_BIT & vkFlags)) {
316 *flags = *flags | kBlitSrc_Flag;
317 }
318
319 if (SkToBool(VK_FORMAT_FEATURE_BLIT_DST_BIT & vkFlags)) {
320 *flags = *flags | kBlitDst_Flag;
321 }
322 }
323
init(const GrVkInterface * interface,VkPhysicalDevice physDev,VkFormat format)324 void GrVkCaps::ConfigInfo::init(const GrVkInterface* interface,
325 VkPhysicalDevice physDev,
326 VkFormat format) {
327 VkFormatProperties props;
328 memset(&props, 0, sizeof(VkFormatProperties));
329 GR_VK_CALL(interface, GetPhysicalDeviceFormatProperties(physDev, format, &props));
330 InitConfigFlags(props.linearTilingFeatures, &fLinearFlags);
331 InitConfigFlags(props.optimalTilingFeatures, &fOptimalFlags);
332 }
333