• Home
  • Line#
  • Scopes#
  • Navigate#
  • Raw
  • Download
1 /*
2  * Copyright 2015 Google Inc.
3  *
4  * Use of this source code is governed by a BSD-style license that can be
5  * found in the LICENSE file.
6  */
7 
8 #ifndef GrVkCaps_DEFINED
9 #define GrVkCaps_DEFINED
10 
11 #include "include/gpu/vk/GrVkTypes.h"
12 #include "src/gpu/GrCaps.h"
13 
14 class GrShaderCaps;
15 class GrVkExtensions;
16 struct GrVkInterface;
17 class GrVkRenderTarget;
18 
19 /**
20  * Stores some capabilities of a Vk backend.
21  */
22 class GrVkCaps : public GrCaps {
23 public:
24     /**
25      * Creates a GrVkCaps that is set such that nothing is supported. The init function should
26      * be called to fill out the caps.
27      */
28     GrVkCaps(const GrContextOptions& contextOptions,
29              const GrVkInterface* vkInterface,
30              VkPhysicalDevice device,
31              const VkPhysicalDeviceFeatures2& features,
32              uint32_t instanceVersion,
33              uint32_t physicalDeviceVersion,
34              const GrVkExtensions& extensions,
35              GrProtected isProtected = GrProtected::kNo);
36 
37     bool isFormatSRGB(const GrBackendFormat&) const override;
38 
39     bool isFormatTexturable(const GrBackendFormat&, GrTextureType) const override;
40     bool isVkFormatTexturable(VkFormat) const;
41 
isFormatCopyable(const GrBackendFormat &)42     bool isFormatCopyable(const GrBackendFormat&) const override { return true; }
43 
44     bool isFormatAsColorTypeRenderable(GrColorType ct,
45                                        const GrBackendFormat& format,
46                                        int sampleCount = 1) const override;
47     bool isFormatRenderable(const GrBackendFormat& format, int sampleCount) const override;
48     bool isFormatRenderable(VkFormat, int sampleCount) const;
49 
50     int getRenderTargetSampleCount(int requestedCount, const GrBackendFormat&) const override;
51     int getRenderTargetSampleCount(int requestedCount, VkFormat) const;
52 
53     int maxRenderTargetSampleCount(const GrBackendFormat&) const override;
54     int maxRenderTargetSampleCount(VkFormat format) const;
55 
56     SupportedWrite supportedWritePixelsColorType(GrColorType surfaceColorType,
57                                                  const GrBackendFormat& surfaceFormat,
58                                                  GrColorType srcColorType) const override;
59 
60     SurfaceReadPixelsSupport surfaceSupportsReadPixels(const GrSurface*) const override;
61 
isVkFormatTexturableLinearly(VkFormat format)62     bool isVkFormatTexturableLinearly(VkFormat format) const {
63         return SkToBool(FormatInfo::kTexturable_Flag & this->getFormatInfo(format).fLinearFlags);
64     }
65 
formatCanBeDstofBlit(VkFormat format,bool linearTiled)66     bool formatCanBeDstofBlit(VkFormat format, bool linearTiled) const {
67         const FormatInfo& info = this->getFormatInfo(format);
68         const uint16_t& flags = linearTiled ? info.fLinearFlags : info.fOptimalFlags;
69         return SkToBool(FormatInfo::kBlitDst_Flag & flags);
70     }
71 
formatCanBeSrcofBlit(VkFormat format,bool linearTiled)72     bool formatCanBeSrcofBlit(VkFormat format, bool linearTiled) const {
73         const FormatInfo& info = this->getFormatInfo(format);
74         const uint16_t& flags = linearTiled ? info.fLinearFlags : info.fOptimalFlags;
75         return SkToBool(FormatInfo::kBlitSrc_Flag & flags);
76     }
77 
78     // Gets the GrColorType that should be used to transfer data in/out of a transfer buffer to
79     // write/read data when using a VkFormat with a specified color type.
80     GrColorType transferColorType(VkFormat, GrColorType surfaceColorType) const;
81 
82     // On some GPUs (Windows Nvidia and Imagination) calls to QueueWaitIdle return before actually
83     // signalling the fences on the command buffers even though they have completed. This causes
84     // issues when then deleting the command buffers. Therefore we additionally will call
85     // vkWaitForFences on each outstanding command buffer to make sure the driver signals the fence.
mustSyncCommandBuffersWithQueue()86     bool mustSyncCommandBuffersWithQueue() const { return fMustSyncCommandBuffersWithQueue; }
87 
88     // Returns true if we should always make dedicated allocations for VkImages.
shouldAlwaysUseDedicatedImageMemory()89     bool shouldAlwaysUseDedicatedImageMemory() const {
90         return fShouldAlwaysUseDedicatedImageMemory;
91     }
92 
93     // Always use a transfer buffer instead of vkCmdUpdateBuffer to upload data to a VkBuffer.
avoidUpdateBuffers()94     bool avoidUpdateBuffers() const { return fAvoidUpdateBuffers; }
95 
96     /**
97      * Returns both a supported and most preferred stencil format to use in draws.
98      */
preferredStencilFormat()99     VkFormat preferredStencilFormat() const { return fPreferredStencilFormat; }
100 
101     // Returns total number of bits used by stencil + depth + padding
GetStencilFormatTotalBitCount(VkFormat format)102     static int GetStencilFormatTotalBitCount(VkFormat format) {
103         switch (format) {
104             case VK_FORMAT_S8_UINT:
105                 return 8;
106             case VK_FORMAT_D24_UNORM_S8_UINT:
107                 return 32;
108             case VK_FORMAT_D32_SFLOAT_S8_UINT:
109                 // can optionally have 24 unused bits at the end so we assume the total bits is 64.
110                 return 64;
111             default:
112                 SkASSERT(false);
113                 return 0;
114         }
115     }
116 
117     // Returns whether the device supports VK_KHR_Swapchain. Internally Skia never uses any of the
118     // swapchain functions, but we may need to transition to and from the
119     // VK_IMAGE_LAYOUT_PRESENT_SRC_KHR image layout, so we must know whether that layout is
120     // supported.
supportsSwapchain()121     bool supportsSwapchain() const { return fSupportsSwapchain; }
122 
123     // Returns whether the device supports the ability to extend VkPhysicalDeviceProperties struct.
supportsPhysicalDeviceProperties2()124     bool supportsPhysicalDeviceProperties2() const { return fSupportsPhysicalDeviceProperties2; }
125     // Returns whether the device supports the ability to extend VkMemoryRequirements struct.
supportsMemoryRequirements2()126     bool supportsMemoryRequirements2() const { return fSupportsMemoryRequirements2; }
127 
128     // Returns whether the device supports the ability to extend the vkBindMemory call.
supportsBindMemory2()129     bool supportsBindMemory2() const { return fSupportsBindMemory2; }
130 
131     // Returns whether or not the device suports the various API maintenance fixes to Vulkan 1.0. In
132     // Vulkan 1.1 all these maintenance are part of the core spec.
supportsMaintenance1()133     bool supportsMaintenance1() const { return fSupportsMaintenance1; }
supportsMaintenance2()134     bool supportsMaintenance2() const { return fSupportsMaintenance2; }
supportsMaintenance3()135     bool supportsMaintenance3() const { return fSupportsMaintenance3; }
136 
137     // Returns true if the device supports passing in a flag to say we are using dedicated GPU when
138     // allocating memory. For some devices this allows them to return more optimized memory knowning
139     // they will never need to suballocate amonst multiple objects.
supportsDedicatedAllocation()140     bool supportsDedicatedAllocation() const { return fSupportsDedicatedAllocation; }
141 
142     // Returns true if the device supports importing of external memory into Vulkan memory.
supportsExternalMemory()143     bool supportsExternalMemory() const { return fSupportsExternalMemory; }
144     // Returns true if the device supports importing Android hardware buffers into Vulkan memory.
supportsAndroidHWBExternalMemory()145     bool supportsAndroidHWBExternalMemory() const { return fSupportsAndroidHWBExternalMemory; }
146 
147     // Returns true if it supports ycbcr conversion for samplers
supportsYcbcrConversion()148     bool supportsYcbcrConversion() const { return fSupportsYcbcrConversion; }
149 
150     // Returns the number of descriptor slots used by immutable ycbcr VkImages.
151     //
152     // TODO: We should update this to return a count for a specific format or external format. We
153     // can use vkGetPhysicalDeviceImageFormatProperties2 with a
154     // VkSamplerYcbcrConversionImageFormatProperties to query this. However, right now that call
155     // does not support external android formats which is where the majority of ycbcr images are
156     // coming from. So for now we stay safe and always return 3 here which is the max value that the
157     // count could be for any format.
ycbcrCombinedImageSamplerDescriptorCount()158     uint32_t ycbcrCombinedImageSamplerDescriptorCount() const {
159         return 3;
160     }
161 
162     // Returns true if the device supports protected memory.
supportsProtectedMemory()163     bool supportsProtectedMemory() const { return fSupportsProtectedMemory; }
164 
165     // Returns true if the VK_EXT_image_drm_format_modifier is enabled.
supportsDRMFormatModifiers()166     bool supportsDRMFormatModifiers() const { return fSupportsDRMFormatModifiers; }
167 
168     // Returns whether we prefer to record draws directly into a primary command buffer.
preferPrimaryOverSecondaryCommandBuffers()169     bool preferPrimaryOverSecondaryCommandBuffers() const {
170         return fPreferPrimaryOverSecondaryCommandBuffers;
171     }
172 
maxPerPoolCachedSecondaryCommandBuffers()173     int maxPerPoolCachedSecondaryCommandBuffers() const {
174         return fMaxPerPoolCachedSecondaryCommandBuffers;
175     }
176 
maxInputAttachmentDescriptors()177     uint32_t maxInputAttachmentDescriptors() const { return fMaxInputAttachmentDescriptors; }
178 
mustInvalidatePrimaryCmdBufferStateAfterClearAttachments()179     bool mustInvalidatePrimaryCmdBufferStateAfterClearAttachments() const {
180         return fMustInvalidatePrimaryCmdBufferStateAfterClearAttachments;
181     }
182 
183     // For host visible allocations, this returns true if we require that they are coherent. This
184     // is used to work around bugs for devices that don't handle non-coherent memory correctly.
mustUseCoherentHostVisibleMemory()185     bool mustUseCoherentHostVisibleMemory() const { return fMustUseCoherentHostVisibleMemory; }
186 
187     // Returns whether a pure GPU accessible buffer is more performant to read than a buffer that is
188     // also host visible. If so then in some cases we may prefer the cost of doing a copy to the
189     // buffer. This typically would only be the case for buffers that are written once and read
190     // many times on the gpu.
gpuOnlyBuffersMorePerformant()191     bool gpuOnlyBuffersMorePerformant() const { return fGpuOnlyBuffersMorePerformant; }
192 
193     // For our CPU write and GPU read buffers (vertex, uniform, etc.), should we keep these buffers
194     // persistently mapped. In general the answer will be yes. The main case we don't do this is
195     // when using special memory that is DEVICE_LOCAL and HOST_VISIBLE on discrete GPUs.
shouldPersistentlyMapCpuToGpuBuffers()196     bool shouldPersistentlyMapCpuToGpuBuffers() const {
197         return fShouldPersistentlyMapCpuToGpuBuffers;
198     }
199 
200     // The max draw count that can be passed into indirect draw calls.
maxDrawIndirectDrawCount()201     uint32_t  maxDrawIndirectDrawCount() const { return fMaxDrawIndirectDrawCount; }
202 
203     /**
204      * Helpers used by canCopySurface. In all cases if the SampleCnt parameter is zero that means
205      * the surface is not a render target, otherwise it is the number of samples in the render
206      * target.
207      */
208     bool canCopyImage(VkFormat dstFormat,
209                       int dstSampleCnt,
210                       bool dstHasYcbcr,
211                       VkFormat srcFormat,
212                       int srcSamplecnt,
213                       bool srcHasYcbcr) const;
214 
215     bool canCopyAsBlit(VkFormat dstConfig,
216                        int dstSampleCnt,
217                        bool dstIsLinear,
218                        bool dstHasYcbcr,
219                        VkFormat srcConfig,
220                        int srcSampleCnt,
221                        bool srcIsLinear,
222                        bool srcHasYcbcr) const;
223 
224     bool canCopyAsResolve(VkFormat dstConfig,
225                           int dstSampleCnt,
226                           bool dstHasYcbcr,
227                           VkFormat srcConfig,
228                           int srcSamplecnt,
229                           bool srcHasYcbcr) const;
230 
231     GrBackendFormat getBackendFormatFromCompressionType(SkImage::CompressionType) const override;
232 
getFormatFromColorType(GrColorType colorType)233     VkFormat getFormatFromColorType(GrColorType colorType) const {
234         int idx = static_cast<int>(colorType);
235         return fColorTypeToFormatTable[idx];
236     }
237 
238     GrSwizzle getWriteSwizzle(const GrBackendFormat&, GrColorType) const override;
239 
240     uint64_t computeFormatKey(const GrBackendFormat&) const override;
241 
242     int getFragmentUniformBinding() const;
243     int getFragmentUniformSet() const;
244 
245     void addExtraSamplerKey(GrProcessorKeyBuilder*,
246                             GrSamplerState,
247                             const GrBackendFormat&) const override;
248 
249     GrProgramDesc makeDesc(GrRenderTarget*,
250                            const GrProgramInfo&,
251                            ProgramDescOverrideFlags) const override;
252 
253     GrInternalSurfaceFlags getExtraSurfaceFlagsForDeferredRT() const override;
254 
255     VkShaderStageFlags getPushConstantStageFlags() const;
256 
257     // If true then when doing MSAA draws, we will prefer to discard the msaa attachment on load
258     // and stores. The use of this feature for specific draws depends on the render target having a
259     // resolve attachment, and if we need to load previous data the resolve attachment must be
260     // usable as an input attachment. Otherwise we will just write out and store the msaa attachment
261     // like normal.
262     // This flag is similar to enabling gl render to texture for msaa rendering.
preferDiscardableMSAAAttachment()263     bool preferDiscardableMSAAAttachment() const { return fPreferDiscardableMSAAAttachment; }
mustLoadFullImageWithDiscardableMSAA()264     bool mustLoadFullImageWithDiscardableMSAA() const {
265         return fMustLoadFullImageWithDiscardableMSAA;
266     }
supportsDiscardableMSAAForDMSAA()267     bool supportsDiscardableMSAAForDMSAA() const { return fSupportsDiscardableMSAAForDMSAA; }
268     bool renderTargetSupportsDiscardableMSAA(const GrVkRenderTarget*) const;
269     bool programInfoWillUseDiscardableMSAA(const GrProgramInfo&) const;
270 
dmsaaResolveCanBeUsedAsTextureInSameRenderPass()271     bool dmsaaResolveCanBeUsedAsTextureInSameRenderPass() const override { return false; }
272 
supportsMemorylessAttachments()273     bool supportsMemorylessAttachments() const { return fSupportsMemorylessAttachments; }
274 
275     bool supportsHpsBlur(const GrSurfaceProxyView* proxyViewPtr) const override;
276 
277 #if GR_TEST_UTILS
278     std::vector<TestFormatColorTypeCombination> getTestingCombinations() const override;
279 #endif
280 
281 private:
282     enum VkVendor {
283         kAMD_VkVendor = 4098,
284         kARM_VkVendor = 5045,
285         kHisi_VkVendor = 6629,
286         kImagination_VkVendor = 4112,
287         kIntel_VkVendor = 32902,
288         kNvidia_VkVendor = 4318,
289         kQualcomm_VkVendor = 20803,
290     };
291 
292     void init(const GrContextOptions& contextOptions, const GrVkInterface* vkInterface,
293               VkPhysicalDevice device, const VkPhysicalDeviceFeatures2&,
294               uint32_t physicalDeviceVersion, const GrVkExtensions&, GrProtected isProtected);
295     void initGrCaps(const GrVkInterface* vkInterface,
296                     VkPhysicalDevice physDev,
297                     const VkPhysicalDeviceProperties&,
298                     const VkPhysicalDeviceMemoryProperties&,
299                     const VkPhysicalDeviceFeatures2&,
300                     const GrVkExtensions&);
301     void initShaderCaps(const VkPhysicalDeviceProperties&, const VkPhysicalDeviceFeatures2&);
302 
303     void initFormatTable(const GrVkInterface*, VkPhysicalDevice, const VkPhysicalDeviceProperties&);
304     void initStencilFormat(const GrVkInterface* iface, VkPhysicalDevice physDev);
305 
306     void applyDriverCorrectnessWorkarounds(const VkPhysicalDeviceProperties&);
307 
308     bool onSurfaceSupportsWritePixels(const GrSurface*) const override;
309     bool onCanCopySurface(const GrSurfaceProxy* dst, const GrSurfaceProxy* src,
310                           const SkIRect& srcRect, const SkIPoint& dstPoint) const override;
311     GrBackendFormat onGetDefaultBackendFormat(GrColorType) const override;
312 
313     bool onAreColorTypeAndFormatCompatible(GrColorType, const GrBackendFormat&) const override;
314 
315     SupportedRead onSupportedReadPixelsColorType(GrColorType, const GrBackendFormat&,
316                                                  GrColorType) const override;
317 
318     GrSwizzle onGetReadSwizzle(const GrBackendFormat&, GrColorType) const override;
319 
320     GrDstSampleFlags onGetDstSampleFlagsForProxy(const GrRenderTargetProxy*) const override;
321 
322     bool onSupportsDynamicMSAA(const GrRenderTargetProxy*) const override;
323 
324     // ColorTypeInfo for a specific format
325     struct ColorTypeInfo {
326         GrColorType fColorType = GrColorType::kUnknown;
327         GrColorType fTransferColorType = GrColorType::kUnknown;
328         enum {
329             kUploadData_Flag = 0x1,
330             // Does Ganesh itself support rendering to this colorType & format pair. Renderability
331             // still additionally depends on if the format itself is renderable.
332             kRenderable_Flag = 0x2,
333             // Indicates that this colorType is supported only if we are wrapping a texture with
334             // the given format and colorType. We do not allow creation with this pair.
335             kWrappedOnly_Flag = 0x4,
336         };
337         uint32_t fFlags = 0;
338 
339         GrSwizzle fReadSwizzle;
340         GrSwizzle fWriteSwizzle;
341     };
342 
343     struct FormatInfo {
colorTypeFlagsFormatInfo344         uint32_t colorTypeFlags(GrColorType colorType) const {
345             for (int i = 0; i < fColorTypeInfoCount; ++i) {
346                 if (fColorTypeInfos[i].fColorType == colorType) {
347                     return fColorTypeInfos[i].fFlags;
348                 }
349             }
350             return 0;
351         }
352 
353         void init(const GrVkInterface*, VkPhysicalDevice, const VkPhysicalDeviceProperties&,
354                   VkFormat);
355         static void InitFormatFlags(VkFormatFeatureFlags, uint16_t* flags);
356         void initSampleCounts(const GrVkInterface*, VkPhysicalDevice,
357                               const VkPhysicalDeviceProperties&, VkFormat);
358 
359         enum {
360             kTexturable_Flag = 0x1,
361             kRenderable_Flag = 0x2,
362             kBlitSrc_Flag    = 0x4,
363             kBlitDst_Flag    = 0x8,
364         };
365 
366         uint16_t fOptimalFlags = 0;
367         uint16_t fLinearFlags = 0;
368 
369         SkTDArray<int> fColorSampleCounts;
370 
371         std::unique_ptr<ColorTypeInfo[]> fColorTypeInfos;
372         int fColorTypeInfoCount = 0;
373     };
374     static const size_t kNumVkFormats = 25;
375     FormatInfo fFormatTable[kNumVkFormats];
376 
377     FormatInfo& getFormatInfo(VkFormat);
378     const FormatInfo& getFormatInfo(VkFormat) const;
379 
380     VkFormat fColorTypeToFormatTable[kGrColorTypeCnt];
381     void setColorType(GrColorType, std::initializer_list<VkFormat> formats);
382 
383     VkFormat fPreferredStencilFormat;
384 
385     SkSTArray<1, GrVkYcbcrConversionInfo> fYcbcrInfos;
386 
387     bool fMustSyncCommandBuffersWithQueue = false;
388     bool fShouldAlwaysUseDedicatedImageMemory = false;
389 
390     bool fAvoidUpdateBuffers = false;
391 
392     bool fSupportsSwapchain = false;
393 
394     bool fSupportsPhysicalDeviceProperties2 = false;
395     bool fSupportsMemoryRequirements2 = false;
396     bool fSupportsBindMemory2 = false;
397     bool fSupportsMaintenance1 = false;
398     bool fSupportsMaintenance2 = false;
399     bool fSupportsMaintenance3 = false;
400 
401     bool fSupportsDedicatedAllocation = false;
402     bool fSupportsExternalMemory = false;
403     bool fSupportsAndroidHWBExternalMemory = false;
404 
405     bool fSupportsYcbcrConversion = false;
406 
407     bool fSupportsProtectedMemory = false;
408 
409     bool fSupportsDRMFormatModifiers = false;
410 
411     bool fPreferPrimaryOverSecondaryCommandBuffers = true;
412     bool fMustInvalidatePrimaryCmdBufferStateAfterClearAttachments = false;
413 
414     bool fMustUseCoherentHostVisibleMemory = false;
415     bool fGpuOnlyBuffersMorePerformant = false;
416     bool fShouldPersistentlyMapCpuToGpuBuffers = true;
417 
418     // We default this to 100 since we already cap the max render tasks at 100 before doing a
419     // submission in the GrDrawingManager, so we shouldn't be going over 100 secondary command
420     // buffers per primary anyways.
421     int fMaxPerPoolCachedSecondaryCommandBuffers = 100;
422 
423     uint32_t fMaxInputAttachmentDescriptors = 0;
424 
425     bool fPreferDiscardableMSAAAttachment = false;
426     bool fMustLoadFullImageWithDiscardableMSAA = false;
427     bool fSupportsDiscardableMSAAForDMSAA = true;
428     bool fSupportsMemorylessAttachments = false;
429 
430     bool fSupportHpsBlur = false;
431 
432     uint32_t fMaxDrawIndirectDrawCount = 0;
433 
434     using INHERITED = GrCaps;
435 };
436 
437 #endif
438