blob: 91301ff9ac914622c02ba167a1629839f44eb8d6 [file] [log] [blame]
/*
 * Copyright 2012 Google Inc.
 *
 * Use of this source code is governed by a BSD-style license that can be
 * found in the LICENSE file.
 */
7
Brian Salomonaee504b2017-01-24 12:29:36 -05008#include "GrGaussianConvolutionFragmentProcessor.h"
9#include "../private/GrGLSL.h"
egdaniel64c47282015-11-13 06:54:19 -080010#include "glsl/GrGLSLFragmentProcessor.h"
egdaniel2d721d32015-11-11 13:06:05 -080011#include "glsl/GrGLSLFragmentShaderBuilder.h"
egdaniel018fb622015-10-28 07:26:40 -070012#include "glsl/GrGLSLProgramDataManager.h"
egdaniel7ea439b2015-12-03 09:20:44 -080013#include "glsl/GrGLSLUniformHandler.h"
tomhudson@google.comd8f856c2012-05-10 12:13:36 +000014
bsalomon@google.comdbbc4e22012-07-25 17:48:39 +000015// For brevity
egdaniel018fb622015-10-28 07:26:40 -070016typedef GrGLSLProgramDataManager::UniformHandle UniformHandle;
bsalomon@google.com032b2212012-07-16 13:36:18 +000017
egdaniel64c47282015-11-13 06:54:19 -080018class GrGLConvolutionEffect : public GrGLSLFragmentProcessor {
tomhudson@google.comd8f856c2012-05-10 12:13:36 +000019public:
robertphillips9cdb9922016-02-03 12:25:40 -080020 void emitCode(EmitArgs&) override;
ericrk7a787b42015-07-21 14:06:16 -070021
Brian Salomon94efbf52016-11-29 13:43:05 -050022 static inline void GenKey(const GrProcessor&, const GrShaderCaps&, GrProcessorKeyBuilder*);
tomhudson@google.comd8f856c2012-05-10 12:13:36 +000023
wangyixb1daa862015-08-18 11:29:31 -070024protected:
egdaniel018fb622015-10-28 07:26:40 -070025 void onSetData(const GrGLSLProgramDataManager& pdman, const GrProcessor&) override;
wangyixb1daa862015-08-18 11:29:31 -070026
ericrk0f386122015-07-21 13:15:47 -070027private:
Brian Salomonaee504b2017-01-24 12:29:36 -050028 UniformHandle fKernelUni;
29 UniformHandle fImageIncrementUni;
30 UniformHandle fBoundsUni;
tomhudson@google.comd8f856c2012-05-10 12:13:36 +000031
egdaniel64c47282015-11-13 06:54:19 -080032 typedef GrGLSLFragmentProcessor INHERITED;
tomhudson@google.comd8f856c2012-05-10 12:13:36 +000033};
34
wangyix7c157a92015-07-22 15:08:53 -070035void GrGLConvolutionEffect::emitCode(EmitArgs& args) {
Brian Salomonaee504b2017-01-24 12:29:36 -050036 const GrGaussianConvolutionFragmentProcessor& ce =
37 args.fFp.cast<GrGaussianConvolutionFragmentProcessor>();
robertphillipsbf536af2016-02-04 06:11:53 -080038
egdaniel7ea439b2015-12-03 09:20:44 -080039 GrGLSLUniformHandler* uniformHandler = args.fUniformHandler;
Brian Salomonaee504b2017-01-24 12:29:36 -050040 fImageIncrementUni = uniformHandler->addUniform(kFragment_GrShaderFlag, kVec2f_GrSLType,
41 kDefault_GrSLPrecision, "ImageIncrement");
robertphillipsbf536af2016-02-04 06:11:53 -080042 if (ce.useBounds()) {
Brian Salomonaee504b2017-01-24 12:29:36 -050043 fBoundsUni = uniformHandler->addUniform(kFragment_GrShaderFlag, kVec2f_GrSLType,
44 kDefault_GrSLPrecision, "Bounds");
ericrk7a787b42015-07-21 14:06:16 -070045 }
robertphillipsbf536af2016-02-04 06:11:53 -080046
47 int width = Gr1DKernelEffect::WidthFromRadius(ce.radius());
48
jvanverth78d6eb02016-03-02 13:21:16 -080049 int arrayCount = (width + 3) / 4;
50 SkASSERT(4 * arrayCount >= width);
51
Brian Salomonaee504b2017-01-24 12:29:36 -050052 fKernelUni = uniformHandler->addUniformArray(kFragment_GrShaderFlag, kVec4f_GrSLType,
53 kDefault_GrSLPrecision, "Kernel", arrayCount);
ericrk7a787b42015-07-21 14:06:16 -070054
cdalton85285412016-02-18 12:37:07 -080055 GrGLSLFPFragmentBuilder* fragBuilder = args.fFragBuilder;
bsalomon1a1aa932016-09-12 09:30:36 -070056 SkString coords2D = fragBuilder->ensureCoords2D(args.fTransformedCoords[0]);
ericrk7a787b42015-07-21 14:06:16 -070057
robertphillipsbf536af2016-02-04 06:11:53 -080058 fragBuilder->codeAppendf("%s = vec4(0, 0, 0, 0);", args.fOutputColor);
ericrk7a787b42015-07-21 14:06:16 -070059
Brian Salomon99938a82016-11-21 13:41:08 -050060 const GrShaderVar& kernel = uniformHandler->getUniformVariable(fKernelUni);
egdaniel7ea439b2015-12-03 09:20:44 -080061 const char* imgInc = uniformHandler->getUniformCStr(fImageIncrementUni);
ericrk7a787b42015-07-21 14:06:16 -070062
robertphillipsbf536af2016-02-04 06:11:53 -080063 fragBuilder->codeAppendf("vec2 coord = %s - %d.0 * %s;", coords2D.c_str(), ce.radius(), imgInc);
ericrk7a787b42015-07-21 14:06:16 -070064
65 // Manually unroll loop because some drivers don't; yields 20-30% speedup.
Brian Salomonaee504b2017-01-24 12:29:36 -050066 const char* kVecSuffix[4] = {".x", ".y", ".z", ".w"};
ericrk7a787b42015-07-21 14:06:16 -070067 for (int i = 0; i < width; i++) {
68 SkString index;
69 SkString kernelIndex;
Brian Salomonaee504b2017-01-24 12:29:36 -050070 index.appendS32(i / 4);
ericrk7a787b42015-07-21 14:06:16 -070071 kernel.appendArrayAccess(index.c_str(), &kernelIndex);
jvanverth78d6eb02016-03-02 13:21:16 -080072 kernelIndex.append(kVecSuffix[i & 0x3]);
ericrk7a787b42015-07-21 14:06:16 -070073
robertphillipsbf536af2016-02-04 06:11:53 -080074 if (ce.useBounds()) {
ericrk7a787b42015-07-21 14:06:16 -070075 // We used to compute a bool indicating whether we're in bounds or not, cast it to a
76 // float, and then mul weight*texture_sample by the float. However, the Adreno 430 seems
77 // to have a bug that caused corruption.
egdaniel7ea439b2015-12-03 09:20:44 -080078 const char* bounds = uniformHandler->getUniformCStr(fBoundsUni);
robertphillipsbf536af2016-02-04 06:11:53 -080079 const char* component = ce.direction() == Gr1DKernelEffect::kY_Direction ? "y" : "x";
Brian Salomonaee504b2017-01-24 12:29:36 -050080 fragBuilder->codeAppendf("if (coord.%s >= %s.x && coord.%s <= %s.y) {", component,
81 bounds, component, bounds);
ericrk7a787b42015-07-21 14:06:16 -070082 }
Brian Salomonaee504b2017-01-24 12:29:36 -050083 fragBuilder->codeAppendf("%s += ", args.fOutputColor);
cdalton3f6f76f2016-04-11 12:18:09 -070084 fragBuilder->appendTextureLookup(args.fTexSamplers[0], "coord");
egdaniel4ca2e602015-11-18 08:01:26 -080085 fragBuilder->codeAppendf(" * %s;\n", kernelIndex.c_str());
robertphillipsbf536af2016-02-04 06:11:53 -080086 if (ce.useBounds()) {
egdaniel4ca2e602015-11-18 08:01:26 -080087 fragBuilder->codeAppend("}");
ericrk7a787b42015-07-21 14:06:16 -070088 }
Brian Salomonaee504b2017-01-24 12:29:36 -050089 fragBuilder->codeAppendf("coord += %s;\n", imgInc);
ericrk7a787b42015-07-21 14:06:16 -070090 }
91
92 SkString modulate;
wangyix7c157a92015-07-22 15:08:53 -070093 GrGLSLMulVarBy4f(&modulate, args.fOutputColor, args.fInputColor);
egdaniel4ca2e602015-11-18 08:01:26 -080094 fragBuilder->codeAppend(modulate.c_str());
ericrk7a787b42015-07-21 14:06:16 -070095}
96
egdaniel018fb622015-10-28 07:26:40 -070097void GrGLConvolutionEffect::onSetData(const GrGLSLProgramDataManager& pdman,
98 const GrProcessor& processor) {
Brian Salomonaee504b2017-01-24 12:29:36 -050099 const GrGaussianConvolutionFragmentProcessor& conv =
100 processor.cast<GrGaussianConvolutionFragmentProcessor>();
Brian Salomondb4183d2016-11-17 12:48:40 -0500101 GrTexture& texture = *conv.textureSampler(0).texture();
robertphillipsbf536af2016-02-04 06:11:53 -0800102
Brian Salomonaee504b2017-01-24 12:29:36 -0500103 float imageIncrement[2] = {0};
ericrk7a787b42015-07-21 14:06:16 -0700104 float ySign = texture.origin() != kTopLeft_GrSurfaceOrigin ? 1.0f : -1.0f;
105 switch (conv.direction()) {
106 case Gr1DKernelEffect::kX_Direction:
107 imageIncrement[0] = 1.0f / texture.width();
108 break;
109 case Gr1DKernelEffect::kY_Direction:
110 imageIncrement[1] = ySign / texture.height();
111 break;
112 default:
113 SkFAIL("Unknown filter direction.");
114 }
115 pdman.set2fv(fImageIncrementUni, 1, imageIncrement);
116 if (conv.useBounds()) {
117 const float* bounds = conv.bounds();
118 if (Gr1DKernelEffect::kY_Direction == conv.direction() &&
119 texture.origin() != kTopLeft_GrSurfaceOrigin) {
120 pdman.set2f(fBoundsUni, 1.0f - bounds[1], 1.0f - bounds[0]);
121 } else {
122 pdman.set2f(fBoundsUni, bounds[0], bounds[1]);
123 }
124 }
robertphillipsbf536af2016-02-04 06:11:53 -0800125 int width = Gr1DKernelEffect::WidthFromRadius(conv.radius());
126
jvanverth78d6eb02016-03-02 13:21:16 -0800127 int arrayCount = (width + 3) / 4;
128 SkASSERT(4 * arrayCount >= width);
129 pdman.set4fv(fKernelUni, arrayCount, conv.kernel());
ericrk7a787b42015-07-21 14:06:16 -0700130}
131
Brian Salomon94efbf52016-11-29 13:43:05 -0500132void GrGLConvolutionEffect::GenKey(const GrProcessor& processor, const GrShaderCaps&,
joshualittb0a8a372014-09-23 09:50:21 -0700133 GrProcessorKeyBuilder* b) {
Brian Salomonaee504b2017-01-24 12:29:36 -0500134 const GrGaussianConvolutionFragmentProcessor& conv =
135 processor.cast<GrGaussianConvolutionFragmentProcessor>();
bsalomon63e99f72014-07-21 08:03:14 -0700136 uint32_t key = conv.radius();
senorblanco@chromium.orge8232bc2013-07-29 18:45:44 +0000137 key <<= 2;
138 if (conv.useBounds()) {
139 key |= 0x2;
Brian Salomonaee504b2017-01-24 12:29:36 -0500140 key |= GrGaussianConvolutionFragmentProcessor::kY_Direction == conv.direction() ? 0x1 : 0x0;
senorblanco@chromium.orge8232bc2013-07-29 18:45:44 +0000141 }
bsalomon63e99f72014-07-21 08:03:14 -0700142 b->add32(key);
tomhudson@google.comd8f856c2012-05-10 12:13:36 +0000143}
144
bsalomon@google.comb505a122012-05-31 18:40:36 +0000145///////////////////////////////////////////////////////////////////////////////
tomhudson@google.comd8f856c2012-05-10 12:13:36 +0000146
Brian Salomonaee504b2017-01-24 12:29:36 -0500147GrGaussianConvolutionFragmentProcessor::GrGaussianConvolutionFragmentProcessor(GrTexture* texture,
148 Direction direction,
149 int radius,
150 float gaussianSigma,
151 bool useBounds,
152 float bounds[2])
153 : INHERITED(texture, direction, radius), fUseBounds(useBounds) {
154 this->initClassID<GrGaussianConvolutionFragmentProcessor>();
tfarina@chromium.orgf6de4752013-08-17 00:02:59 +0000155 SkASSERT(radius <= kMaxKernelRadius);
tomhudson@google.comfde2c0a2012-07-16 12:23:32 +0000156 int width = this->width();
157
158 float sum = 0.0f;
159 float denom = 1.0f / (2.0f * gaussianSigma * gaussianSigma);
160 for (int i = 0; i < width; ++i) {
161 float x = static_cast<float>(i - this->radius());
162 // Note that the constant term (1/(sqrt(2*pi*sigma^2)) of the Gaussian
163 // is dropped here, since we renormalize the kernel below.
Brian Salomonaee504b2017-01-24 12:29:36 -0500164 fKernel[i] = sk_float_exp(-x * x * denom);
tomhudson@google.comfde2c0a2012-07-16 12:23:32 +0000165 sum += fKernel[i];
166 }
167 // Normalize the kernel
168 float scale = 1.0f / sum;
169 for (int i = 0; i < width; ++i) {
170 fKernel[i] *= scale;
171 }
senorblanco@chromium.orge8232bc2013-07-29 18:45:44 +0000172 memcpy(fBounds, bounds, sizeof(fBounds));
tomhudson@google.comfde2c0a2012-07-16 12:23:32 +0000173}
174
Brian Salomonaee504b2017-01-24 12:29:36 -0500175GrGaussianConvolutionFragmentProcessor::~GrGaussianConvolutionFragmentProcessor() {}
tomhudson@google.comd8f856c2012-05-10 12:13:36 +0000176
Brian Salomonaee504b2017-01-24 12:29:36 -0500177void GrGaussianConvolutionFragmentProcessor::onGetGLSLProcessorKey(const GrShaderCaps& caps,
178 GrProcessorKeyBuilder* b) const {
joshualitteb2a6762014-12-04 11:35:33 -0800179 GrGLConvolutionEffect::GenKey(*this, caps, b);
180}
181
Brian Salomonaee504b2017-01-24 12:29:36 -0500182GrGLSLFragmentProcessor* GrGaussianConvolutionFragmentProcessor::onCreateGLSLInstance() const {
robertphillipsbf536af2016-02-04 06:11:53 -0800183 return new GrGLConvolutionEffect;
tomhudson@google.comd8f856c2012-05-10 12:13:36 +0000184}
185
Brian Salomonaee504b2017-01-24 12:29:36 -0500186bool GrGaussianConvolutionFragmentProcessor::onIsEqual(const GrFragmentProcessor& sBase) const {
187 const GrGaussianConvolutionFragmentProcessor& s =
188 sBase.cast<GrGaussianConvolutionFragmentProcessor>();
189 return (this->radius() == s.radius() && this->direction() == s.direction() &&
senorblanco@chromium.orge8232bc2013-07-29 18:45:44 +0000190 this->useBounds() == s.useBounds() &&
191 0 == memcmp(fBounds, s.fBounds, sizeof(fBounds)) &&
tomhudson@google.comd0c1a062012-07-12 17:23:52 +0000192 0 == memcmp(fKernel, s.fKernel, this->width() * sizeof(float)));
tomhudson@google.comd8f856c2012-05-10 12:13:36 +0000193}
bsalomon@google.com0a7672f2012-08-03 18:12:20 +0000194
195///////////////////////////////////////////////////////////////////////////////
196
Brian Salomonaee504b2017-01-24 12:29:36 -0500197GR_DEFINE_FRAGMENT_PROCESSOR_TEST(GrGaussianConvolutionFragmentProcessor);
bsalomon@google.com0a7672f2012-08-03 18:12:20 +0000198
Brian Salomonaee504b2017-01-24 12:29:36 -0500199sk_sp<GrFragmentProcessor> GrGaussianConvolutionFragmentProcessor::TestCreate(
200 GrProcessorTestData* d) {
201 int texIdx = d->fRandom->nextBool() ? GrProcessorUnitTest::kSkiaPMTextureIdx
202 : GrProcessorUnitTest::kAlphaTextureIdx;
joshualitt0067ff52015-07-08 14:26:19 -0700203 Direction dir = d->fRandom->nextBool() ? kX_Direction : kY_Direction;
204 int radius = d->fRandom->nextRangeU(1, kMaxKernelRadius);
Brian Salomonaee504b2017-01-24 12:29:36 -0500205
206 bool useBounds = d->fRandom->nextBool();
senorblanco@chromium.orge8232bc2013-07-29 18:45:44 +0000207 float bounds[2];
bungeman@google.com43486632013-08-20 15:20:34 +0000208 for (size_t i = 0; i < SK_ARRAY_COUNT(bounds); ++i) {
joshualitt0067ff52015-07-08 14:26:19 -0700209 bounds[i] = d->fRandom->nextF();
senorblanco@chromium.org194d7752013-07-24 22:19:24 +0000210 }
bsalomon@google.com0a7672f2012-08-03 18:12:20 +0000211
Brian Salomonaee504b2017-01-24 12:29:36 -0500212 float sigma = radius / 3.f;
213 return GrGaussianConvolutionFragmentProcessor::Make(
214 d->fTextures[texIdx], dir, radius, sigma, useBounds, bounds);
bsalomon@google.com0a7672f2012-08-03 18:12:20 +0000215}