• Home
  • Line#
  • Scopes#
  • Navigate#
  • Raw
  • Download
1 /*
2  * Copyright 2014 Google Inc.
3  *
4  * Use of this source code is governed by a BSD-style license that can be
5  * found in the LICENSE file.
6  */
#include "src/gpu/effects/GrMatrixConvolutionEffect.h"

#include "include/private/SkHalf.h"
#include "src/gpu/GrDirectContextPriv.h"
#include "src/gpu/GrProxyProvider.h"
#include "src/gpu/GrRecordingContextPriv.h"
#include "src/gpu/GrTexture.h"
#include "src/gpu/GrTextureProxy.h"
#include "src/gpu/GrThreadSafeCache.h"
#include "src/gpu/SkGr.h"
#include "src/gpu/effects/GrTextureEffect.h"
#include "src/gpu/glsl/GrGLSLFragmentShaderBuilder.h"
#include "src/gpu/glsl/GrGLSLProgramDataManager.h"
#include "src/gpu/glsl/GrGLSLUniformHandler.h"

#include <cstring>
21 
22 class GrMatrixConvolutionEffect::Impl : public ProgramImpl {
23 public:
24     void emitCode(EmitArgs&) override;
25 
26 private:
27     void onSetData(const GrGLSLProgramDataManager&, const GrFragmentProcessor&) override;
28 
29     typedef GrGLSLProgramDataManager::UniformHandle UniformHandle;
30 
31     void emitKernelBlock(EmitArgs&, SkIPoint);
32 
33     UniformHandle               fKernelUni;
34     UniformHandle               fKernelOffsetUni;
35     UniformHandle               fGainUni;
36     UniformHandle               fBiasUni;
37     UniformHandle               fKernelBiasUni;
38 
39     using INHERITED = ProgramImpl;
40 };
41 
42 GrMatrixConvolutionEffect::KernelWrapper::MakeResult
Make(GrRecordingContext * rContext,SkISize size,const GrCaps & caps,const SkScalar * values)43 GrMatrixConvolutionEffect::KernelWrapper::Make(GrRecordingContext* rContext,
44                                                SkISize size,
45                                                const GrCaps& caps,
46                                                const SkScalar* values) {
47     if (!rContext || !values || size.isEmpty()) {
48         return {};
49     }
50 
51     const int length = size.area();
52     // Small kernel -> just fill the array.
53     KernelWrapper result(size);
54     if (length <= kMaxUniformSize) {
55         for (int i = 0; i < length; i++) {
56             result.fArray[i] = SkScalarToFloat(values[i]);
57         }
58         return {result, nullptr};
59     }
60 
61     BiasAndGain& scalableSampler = result.fBiasAndGain;
62     bool useA16 =
63         rContext->defaultBackendFormat(kA16_float_SkColorType, GrRenderable::kNo).isValid();
64     SkScalar min = values[0];
65     if (!useA16) {
66         // Determine min and max values to figure out inner gain & bias.
67         SkScalar max = values[0];
68         for (int i = 1; i < length; i++) {
69             if (values[i] < min) {
70                 min = values[i];
71             }
72             if (values[i] > max) {
73                 max = values[i];
74             }
75         }
76         // Treat near-0 gain (i.e. box blur) as 1, and let the kernelBias
77         // move everything up to the final value.
78         const SkScalar computedGain = max - min;
79         scalableSampler.fGain =
80             SkScalarNearlyZero(computedGain) ? 1.0f : SkScalarToFloat(computedGain);
81         // Inner bias is pre-inner-gain so we divide that out.
82         scalableSampler.fBias = SkScalarToFloat(min) / scalableSampler.fGain;
83     }
84 
85     // TODO: Pick cache or dont-cache based on observed perf.
86     static constexpr bool kCacheKernelTexture = true;
87 
88     GrUniqueKey key;
89     if (kCacheKernelTexture) {
90         static const GrUniqueKey::Domain kDomain = GrUniqueKey::GenerateDomain();
91         GrUniqueKey::Builder builder(&key, kDomain, length, "Matrix Convolution Kernel");
92         // Texture cache key is the exact content of the kernel.
93         static_assert(sizeof(float) == 4);
94         for (int i = 0; i < length; i++) {
95             builder[i] = *(const uint32_t*)&values[i];
96         }
97         builder.finish();
98     }
99 
100     // Find or create a texture.
101     auto threadSafeCache = rContext->priv().threadSafeCache();
102 
103     SkColorType colorType = useA16 ? kA16_float_SkColorType : kAlpha_8_SkColorType;
104 
105     GrSurfaceProxyView view;
106     if (kCacheKernelTexture && (view = threadSafeCache->find(key))) {
107         SkASSERT(view.origin() == kTopLeft_GrSurfaceOrigin);
108         auto kernelFP = GrTextureEffect::Make(std::move(view), kUnknown_SkAlphaType);
109         return {result, std::move(kernelFP)};
110     }
111 
112     SkBitmap bm;
113     auto info = SkImageInfo::Make({length, 1}, colorType, kPremul_SkAlphaType, nullptr);
114     if (!bm.tryAllocPixels(info)) {
115         return {};
116     }
117     for (int i = 0; i < length; i++) {
118         if (useA16) {
119             *bm.getAddr16(i, 0) = SkFloatToHalf(values[i]);
120         } else {
121             *bm.getAddr8(i, 0) =
122                 SkScalarRoundToInt((values[i] - min) / scalableSampler.fGain * 255);
123         }
124     }
125     bm.setImmutable();
126 
127     view = std::get<0>(GrMakeUncachedBitmapProxyView(rContext, bm));
128     if (!view) {
129         return {};
130     }
131 
132     if (kCacheKernelTexture) {
133         view = threadSafeCache->add(key, view);
134     }
135 
136     SkASSERT(view.origin() == kTopLeft_GrSurfaceOrigin);
137     auto kernelFP = GrTextureEffect::Make(std::move(view), kUnknown_SkAlphaType);
138     return {result, std::move(kernelFP)};
139 }
140 
operator ==(const KernelWrapper & k) const141 bool GrMatrixConvolutionEffect::KernelWrapper::operator==(const KernelWrapper& k) const {
142     if (fSize != k.fSize) {
143         return false;
144     } else if (this->isSampled()) {
145         return fBiasAndGain == k.fBiasAndGain;
146     } else {
147         return std::equal(fArray.begin(), fArray.begin() + fSize.area(), k.fArray.begin());
148     }
149 }
150 
operator ==(const BiasAndGain & k) const151 bool GrMatrixConvolutionEffect::KernelWrapper::BiasAndGain::operator==(
152                                                                 const BiasAndGain& k) const {
153     return fGain == k.fGain && fBias == k.fBias;
154 }
155 
156 // For sampled kernels, emit a for loop that does all the kernel accumulation.
157 // For uniform kernels, emit a single iteration. Function is called repeatedly in a for loop.
158 // loc is ignored for sampled kernels.
emitKernelBlock(EmitArgs & args,SkIPoint loc)159 void GrMatrixConvolutionEffect::Impl::emitKernelBlock(EmitArgs& args, SkIPoint loc) {
160     const GrMatrixConvolutionEffect& mce = args.fFp.cast<GrMatrixConvolutionEffect>();
161     GrGLSLFPFragmentBuilder* fragBuilder = args.fFragBuilder;
162     GrGLSLUniformHandler* uniformHandler = args.fUniformHandler;
163     int kernelWidth = mce.fKernel.size().width();
164     int kernelHeight = mce.fKernel.size().height();
165     int kernelArea = kernelWidth * kernelHeight;
166 
167     if (mce.fKernel.isSampled()) {
168         fragBuilder->codeAppendf("for (int i = 0; i < %d; ++i)", (int)kernelArea);
169     }
170 
171     GrGLSLShaderBuilder::ShaderBlock block(fragBuilder);
172 
173     fragBuilder->codeAppend("half k;");
174     fragBuilder->codeAppend("half2 sourceOffset;");
175     if (mce.fKernel.isSampled()) {
176         const char* kernelBias = uniformHandler->getUniformCStr(fKernelBiasUni);
177         SkString kernelSample = this->invokeChild(1, args, "float2(float(i) + 0.5, 0.5)");
178         fragBuilder->codeAppendf("k = %s.w + %s;", kernelSample.c_str(), kernelBias);
179         fragBuilder->codeAppendf("sourceOffset.y = floor(half(i) / %d);", kernelWidth);
180         fragBuilder->codeAppendf("sourceOffset.x = half(i) - sourceOffset.y * %d;", kernelWidth);
181     } else {
182         fragBuilder->codeAppendf("sourceOffset = half2(%d, %d);", loc.x(), loc.y());
183         int offset = loc.y() * kernelWidth + loc.x();
184         const char* kernel = uniformHandler->getUniformCStr(fKernelUni);
185         fragBuilder->codeAppendf("k = %s[%d][%d];", kernel, offset / 4, offset & 0x3);
186     }
187 
188     auto sample = this->invokeChild(0, args, "coord + sourceOffset");
189     fragBuilder->codeAppendf("half4 c = %s;", sample.c_str());
190     if (!mce.fConvolveAlpha) {
191         fragBuilder->codeAppend("c = unpremul(c);");
192         fragBuilder->codeAppend("c.rgb = saturate(c.rgb);");
193     }
194     fragBuilder->codeAppend("sum += c * k;");
195 }
196 
emitCode(EmitArgs & args)197 void GrMatrixConvolutionEffect::Impl::emitCode(EmitArgs& args) {
198     const GrMatrixConvolutionEffect& mce = args.fFp.cast<GrMatrixConvolutionEffect>();
199 
200     int kernelWidth = mce.fKernel.size().width();
201     int kernelHeight = mce.fKernel.size().height();
202 
203     int arrayCount = (kernelWidth * kernelHeight + 3) / 4;
204     SkASSERT(4 * arrayCount >= kernelWidth * kernelHeight);
205 
206     GrGLSLUniformHandler* uniformHandler = args.fUniformHandler;
207     if (mce.fKernel.isSampled()) {
208         fKernelBiasUni = uniformHandler->addUniform(&mce, kFragment_GrShaderFlag,
209                                                     kHalf_GrSLType, "KernelBias");
210     } else {
211         fKernelUni = uniformHandler->addUniformArray(&mce, kFragment_GrShaderFlag,
212                                                      kHalf4_GrSLType, "Kernel", arrayCount);
213     }
214     fKernelOffsetUni = uniformHandler->addUniform(&mce, kFragment_GrShaderFlag, kHalf2_GrSLType,
215                                                   "KernelOffset");
216     fGainUni = uniformHandler->addUniform(&mce, kFragment_GrShaderFlag, kHalf_GrSLType, "Gain");
217     fBiasUni = uniformHandler->addUniform(&mce, kFragment_GrShaderFlag, kHalf_GrSLType, "Bias");
218 
219     const char* kernelOffset = uniformHandler->getUniformCStr(fKernelOffsetUni);
220     const char* gain = uniformHandler->getUniformCStr(fGainUni);
221     const char* bias = uniformHandler->getUniformCStr(fBiasUni);
222 
223     GrGLSLFPFragmentBuilder* fragBuilder = args.fFragBuilder;
224     fragBuilder->codeAppend("half4 sum = half4(0);");
225     fragBuilder->codeAppendf("float2 coord = %s - %s;", args.fSampleCoord, kernelOffset);
226 
227     if (mce.fKernel.isSampled()) {
228         this->emitKernelBlock(args, {});
229     } else {
230         for (int x = 0; x < kernelWidth; ++x) {
231             for (int y = 0; y < kernelHeight; ++y) {
232                 this->emitKernelBlock(args, SkIPoint::Make(x, y));
233             }
234         }
235     }
236 
237     fragBuilder->codeAppendf("half4 color;");
238     if (mce.fConvolveAlpha) {
239         fragBuilder->codeAppendf("color = sum * %s + %s;", gain, bias);
240         fragBuilder->codeAppendf("color.a = saturate(color.a);");
241         fragBuilder->codeAppendf("color.rgb = clamp(color.rgb, 0.0, color.a);");
242     } else {
243         auto sample = this->invokeChild(0, args);
244         fragBuilder->codeAppendf("half4 c = %s;", sample.c_str());
245         fragBuilder->codeAppendf("color.a = c.a;");
246         fragBuilder->codeAppendf("color.rgb = saturate(sum.rgb * %s + %s);", gain, bias);
247         fragBuilder->codeAppendf("color.rgb *= color.a;");
248     }
249     fragBuilder->codeAppendf("return color;");
250 }
251 
onSetData(const GrGLSLProgramDataManager & pdman,const GrFragmentProcessor & processor)252 void GrMatrixConvolutionEffect::Impl::onSetData(const GrGLSLProgramDataManager& pdman,
253                                                 const GrFragmentProcessor& processor) {
254     const GrMatrixConvolutionEffect& conv = processor.cast<GrMatrixConvolutionEffect>();
255     pdman.set2f(fKernelOffsetUni, conv.fKernelOffset.fX, conv.fKernelOffset.fY);
256     float totalGain = conv.fGain;
257     if (conv.fKernel.isSampled()) {
258         totalGain *= conv.fKernel.biasAndGain().fGain;
259         pdman.set1f(fKernelBiasUni, conv.fKernel.biasAndGain().fBias);
260     } else {
261         int kernelCount = conv.fKernel.size().area();
262         int arrayCount = (kernelCount + 3) / 4;
263         SkASSERT(4 * arrayCount >= kernelCount);
264         pdman.set4fv(fKernelUni, arrayCount, conv.fKernel.array().data());
265     }
266     pdman.set1f(fBiasUni, conv.fBias);
267     pdman.set1f(fGainUni, totalGain);
268 }
269 
GrMatrixConvolutionEffect(std::unique_ptr<GrFragmentProcessor> child,const KernelWrapper & kernel,std::unique_ptr<GrFragmentProcessor> kernelFP,SkScalar gain,SkScalar bias,const SkIPoint & kernelOffset,bool convolveAlpha)270 GrMatrixConvolutionEffect::GrMatrixConvolutionEffect(std::unique_ptr<GrFragmentProcessor> child,
271                                                      const KernelWrapper& kernel,
272                                                      std::unique_ptr<GrFragmentProcessor> kernelFP,
273                                                      SkScalar gain,
274                                                      SkScalar bias,
275                                                      const SkIPoint& kernelOffset,
276                                                      bool convolveAlpha)
277         // To advertise either the modulation or opaqueness optimizations we'd have to examine the
278         // parameters.
279         : INHERITED(kGrMatrixConvolutionEffect_ClassID, kNone_OptimizationFlags)
280         , fKernel(kernel)
281         , fGain(SkScalarToFloat(gain))
282         , fBias(SkScalarToFloat(bias) / 255.0f)
283         , fConvolveAlpha(convolveAlpha) {
284     this->registerChild(std::move(child), SkSL::SampleUsage::Explicit());
285     this->registerChild(std::move(kernelFP), SkSL::SampleUsage::Explicit());
286     fKernelOffset = {static_cast<float>(kernelOffset.x()),
287                      static_cast<float>(kernelOffset.y())};
288     this->setUsesSampleCoordsDirectly();
289 }
290 
// Copy constructor used by clone(): the base class is copy-constructed from `that` and every
// member of this class is copied.
GrMatrixConvolutionEffect::GrMatrixConvolutionEffect(const GrMatrixConvolutionEffect& that)
        : INHERITED(that)
        , fKernel(that.fKernel)
        , fGain(that.fGain)
        , fBias(that.fBias)
        , fKernelOffset(that.fKernelOffset)
        , fConvolveAlpha(that.fConvolveAlpha) {
}
298 
clone() const299 std::unique_ptr<GrFragmentProcessor> GrMatrixConvolutionEffect::clone() const {
300     return std::unique_ptr<GrFragmentProcessor>(new GrMatrixConvolutionEffect(*this));
301 }
302 
onAddToKey(const GrShaderCaps & caps,GrProcessorKeyBuilder * b) const303 void GrMatrixConvolutionEffect::onAddToKey(const GrShaderCaps& caps,
304                                            GrProcessorKeyBuilder* b) const {
305     SkASSERT(this->fKernel.size().width() <= 0x7FFF && this->fKernel.size().height() <= 0xFFFF);
306     uint32_t key = this->fKernel.size().width() << 16 | this->fKernel.size().height();
307     key |= fConvolveAlpha ? 1U << 31 : 0;
308     b->add32(key);
309 }
310 
311 std::unique_ptr<GrFragmentProcessor::ProgramImpl>
onMakeProgramImpl() const312 GrMatrixConvolutionEffect::onMakeProgramImpl() const {
313     return std::make_unique<Impl>();
314 }
315 
onIsEqual(const GrFragmentProcessor & sBase) const316 bool GrMatrixConvolutionEffect::onIsEqual(const GrFragmentProcessor& sBase) const {
317     const GrMatrixConvolutionEffect& s = sBase.cast<GrMatrixConvolutionEffect>();
318     return fKernel == s.fKernel             &&
319            fGain == s.fGain                 &&
320            fBias == s.fBias                 &&
321            fKernelOffset == s.fKernelOffset &&
322            fConvolveAlpha == s.fConvolveAlpha;
323 }
324 
Make(GrRecordingContext * context,GrSurfaceProxyView srcView,const SkIRect & srcBounds,const SkISize & kernelSize,const SkScalar * kernel,SkScalar gain,SkScalar bias,const SkIPoint & kernelOffset,GrSamplerState::WrapMode wm,bool convolveAlpha,const GrCaps & caps)325 std::unique_ptr<GrFragmentProcessor> GrMatrixConvolutionEffect::Make(GrRecordingContext* context,
326                                                                      GrSurfaceProxyView srcView,
327                                                                      const SkIRect& srcBounds,
328                                                                      const SkISize& kernelSize,
329                                                                      const SkScalar* kernel,
330                                                                      SkScalar gain,
331                                                                      SkScalar bias,
332                                                                      const SkIPoint& kernelOffset,
333                                                                      GrSamplerState::WrapMode wm,
334                                                                      bool convolveAlpha,
335                                                                      const GrCaps& caps) {
336     auto [kernelWrapper, kernelFP] = KernelWrapper::Make(context, kernelSize, caps, kernel);
337     if (!kernelWrapper.isValid()) {
338         return nullptr;
339     }
340     GrSamplerState sampler(wm, GrSamplerState::Filter::kNearest);
341     auto child = GrTextureEffect::MakeSubset(std::move(srcView), kPremul_SkAlphaType, SkMatrix::I(),
342                                              sampler, SkRect::Make(srcBounds), caps);
343     return std::unique_ptr<GrFragmentProcessor>(
344             new GrMatrixConvolutionEffect(std::move(child), kernelWrapper, std::move(kernelFP),
345                                           gain, bias, kernelOffset, convolveAlpha));
346 }
347 
348 GR_DEFINE_FRAGMENT_PROCESSOR_TEST(GrMatrixConvolutionEffect);
349 
350 #if GR_TEST_UTILS
TestCreate(GrProcessorTestData * d)351 std::unique_ptr<GrFragmentProcessor> GrMatrixConvolutionEffect::TestCreate(GrProcessorTestData* d) {
352     auto [view, ct, at] = d->randomView();
353 
354     static constexpr size_t kMaxTestKernelSize = 2 * kMaxUniformSize;
355     int width = d->fRandom->nextRangeU(1, kMaxTestKernelSize);
356     int height = d->fRandom->nextRangeU(1, kMaxTestKernelSize / width);
357     SkISize kernelSize = SkISize::Make(width, height);
358     std::unique_ptr<SkScalar[]> kernel(new SkScalar[width * height]);
359     for (int i = 0; i < width * height; i++) {
360         kernel.get()[i] = d->fRandom->nextSScalar1();
361     }
362     SkScalar gain = d->fRandom->nextSScalar1();
363     SkScalar bias = d->fRandom->nextSScalar1();
364 
365     uint32_t kernalOffsetX = d->fRandom->nextRangeU(0, kernelSize.width());
366     uint32_t kernalOffsetY = d->fRandom->nextRangeU(0, kernelSize.height());
367     SkIPoint kernelOffset = SkIPoint::Make(kernalOffsetX, kernalOffsetY);
368 
369     uint32_t boundsX = d->fRandom->nextRangeU(0, view.width());
370     uint32_t boundsY = d->fRandom->nextRangeU(0, view.height());
371     uint32_t boundsW = d->fRandom->nextRangeU(0, view.width());
372     uint32_t boundsH = d->fRandom->nextRangeU(0, view.height());
373     SkIRect bounds = SkIRect::MakeXYWH(boundsX, boundsY, boundsW, boundsH);
374 
375     auto wm = static_cast<GrSamplerState::WrapMode>(
376             d->fRandom->nextULessThan(GrSamplerState::kWrapModeCount));
377     bool convolveAlpha = d->fRandom->nextBool();
378     return GrMatrixConvolutionEffect::Make(d->context(),
379                                            std::move(view),
380                                            bounds,
381                                            kernelSize,
382                                            kernel.get(),
383                                            gain,
384                                            bias,
385                                            kernelOffset,
386                                            wm,
387                                            convolveAlpha,
388                                            *d->caps());
389 }
390 #endif
391