joshualitt | ac97792 | 2014-07-22 09:52:11 -0700 | [diff] [blame] | 1 | /* |
| 2 | * Copyright 2014 Google Inc. |
| 3 | * |
| 4 | * Use of this source code is governed by a BSD-style license that can be |
| 5 | * found in the LICENSE file. |
| 6 | */ |
#include "src/gpu/effects/GrMatrixConvolutionEffect.h"

#include "include/private/SkHalf.h"
#include "src/gpu/GrBitmapTextureMaker.h"
#include "src/gpu/GrContextPriv.h"
#include "src/gpu/GrProxyProvider.h"
#include "src/gpu/GrRecordingContextPriv.h"
#include "src/gpu/GrTexture.h"
#include "src/gpu/GrTextureProxy.h"
#include "src/gpu/effects/GrTextureEffect.h"
#include "src/gpu/glsl/GrGLSLFragmentProcessor.h"
#include "src/gpu/glsl/GrGLSLFragmentShaderBuilder.h"
#include "src/gpu/glsl/GrGLSLProgramDataManager.h"
#include "src/gpu/glsl/GrGLSLUniformHandler.h"

#include <cstring>
joshualitt | ac97792 | 2014-07-22 09:52:11 -0700 | [diff] [blame] | 21 | |
egdaniel | 64c4728 | 2015-11-13 06:54:19 -0800 | [diff] [blame] | 22 | class GrGLMatrixConvolutionEffect : public GrGLSLFragmentProcessor { |
joshualitt | ac97792 | 2014-07-22 09:52:11 -0700 | [diff] [blame] | 23 | public: |
robertphillips | 9cdb992 | 2016-02-03 12:25:40 -0800 | [diff] [blame] | 24 | void emitCode(EmitArgs&) override; |
joshualitt | ac97792 | 2014-07-22 09:52:11 -0700 | [diff] [blame] | 25 | |
Brian Salomon | 94efbf5 | 2016-11-29 13:43:05 -0500 | [diff] [blame] | 26 | static inline void GenKey(const GrProcessor&, const GrShaderCaps&, GrProcessorKeyBuilder*); |
joshualitt | ac97792 | 2014-07-22 09:52:11 -0700 | [diff] [blame] | 27 | |
wangyix | b1daa86 | 2015-08-18 11:29:31 -0700 | [diff] [blame] | 28 | protected: |
Brian Salomon | ab015ef | 2017-04-04 10:15:51 -0400 | [diff] [blame] | 29 | void onSetData(const GrGLSLProgramDataManager&, const GrFragmentProcessor&) override; |
joshualitt | ac97792 | 2014-07-22 09:52:11 -0700 | [diff] [blame] | 30 | |
| 31 | private: |
egdaniel | 018fb62 | 2015-10-28 07:26:40 -0700 | [diff] [blame] | 32 | typedef GrGLSLProgramDataManager::UniformHandle UniformHandle; |
joshualitt | ac97792 | 2014-07-22 09:52:11 -0700 | [diff] [blame] | 33 | |
Adlai Holler | 00ddb00 | 2020-05-11 19:25:52 -0400 | [diff] [blame] | 34 | void emitKernelBlock(EmitArgs&, SkIPoint); |
| 35 | |
joshualitt | 5ae5fc5 | 2014-07-29 12:59:27 -0700 | [diff] [blame] | 36 | UniformHandle fKernelUni; |
joshualitt | 5ae5fc5 | 2014-07-29 12:59:27 -0700 | [diff] [blame] | 37 | UniformHandle fKernelOffsetUni; |
| 38 | UniformHandle fGainUni; |
| 39 | UniformHandle fBiasUni; |
Adlai Holler | 00ddb00 | 2020-05-11 19:25:52 -0400 | [diff] [blame] | 40 | UniformHandle fKernelBiasUni; |
joshualitt | ac97792 | 2014-07-22 09:52:11 -0700 | [diff] [blame] | 41 | |
egdaniel | 64c4728 | 2015-11-13 06:54:19 -0800 | [diff] [blame] | 42 | typedef GrGLSLFragmentProcessor INHERITED; |
joshualitt | ac97792 | 2014-07-22 09:52:11 -0700 | [diff] [blame] | 43 | }; |
| 44 | |
Adlai Holler | 00ddb00 | 2020-05-11 19:25:52 -0400 | [diff] [blame] | 45 | GrMatrixConvolutionEffect::KernelWrapper GrMatrixConvolutionEffect::KernelWrapper::Make( |
| 46 | GrRecordingContext* context, SkISize size, const GrCaps& caps, const SkScalar* values) { |
| 47 | if (nullptr == context || nullptr == values || size.isEmpty()) { |
| 48 | return {}; |
| 49 | } |
| 50 | const int length = size.area(); |
| 51 | // Small kernel -> just fill the array. |
| 52 | KernelWrapper result(size); |
| 53 | if (length <= kMaxUniformSize) { |
| 54 | for (int i = 0; i < length; i++) { |
| 55 | result.fArray[i] = SkScalarToFloat(values[i]); |
| 56 | } |
| 57 | return result; |
| 58 | } |
| 59 | |
| 60 | ScalableSampler& scalableSampler = result.fScalableSampler; |
| 61 | bool useA16 = |
| 62 | context->defaultBackendFormat(kA16_float_SkColorType, GrRenderable::kNo).isValid(); |
| 63 | SkScalar min = values[0]; |
| 64 | if (!useA16) { |
| 65 | // Determine min and max values to figure out inner gain & bias. |
| 66 | SkScalar max = values[0]; |
| 67 | for (int i = 1; i < length; i++) { |
| 68 | if (values[i] < min) { |
| 69 | min = values[i]; |
| 70 | } |
| 71 | if (values[i] > max) { |
| 72 | max = values[i]; |
| 73 | } |
| 74 | } |
| 75 | // Treat near-0 gain (i.e. box blur) as 1, and let the kernelBias |
| 76 | // move everything up to the final value. |
| 77 | const SkScalar computedGain = max - min; |
| 78 | scalableSampler.fGain = |
| 79 | SkScalarNearlyZero(computedGain) ? 1.0f : SkScalarToFloat(computedGain); |
| 80 | // Inner bias is pre-inner-gain so we divide that out. |
| 81 | scalableSampler.fBias = SkScalarToFloat(min) / scalableSampler.fGain; |
| 82 | } |
| 83 | |
Adlai Holler | dcfb233 | 2020-05-13 15:02:28 -0400 | [diff] [blame^] | 84 | // TODO: Pick cache or dont-cache based on observed perf. |
| 85 | static constexpr bool kCacheKernelTexture = true; |
Adlai Holler | 00ddb00 | 2020-05-11 19:25:52 -0400 | [diff] [blame] | 86 | |
| 87 | GrUniqueKey key; |
| 88 | if (kCacheKernelTexture) { |
| 89 | static const GrUniqueKey::Domain kDomain = GrUniqueKey::GenerateDomain(); |
| 90 | GrUniqueKey::Builder builder(&key, kDomain, length, "Matrix Convolution Kernel"); |
| 91 | // Texture cache key is the exact content of the kernel. |
| 92 | static_assert(sizeof(float) == 4); |
| 93 | for (int i = 0; i < length; i++) { |
| 94 | builder[i] = *(const uint32_t*)&values[i]; |
| 95 | } |
| 96 | builder.finish(); |
| 97 | } |
| 98 | |
| 99 | // Find or create a texture. |
| 100 | GrProxyProvider* proxyProvider = context->priv().proxyProvider(); |
| 101 | GrSurfaceProxyView view; |
| 102 | SkColorType colorType = useA16 ? kA16_float_SkColorType : kAlpha_8_SkColorType; |
| 103 | sk_sp<GrTextureProxy> cachedKernel; |
| 104 | if (kCacheKernelTexture && (cachedKernel = proxyProvider->findOrCreateProxyByUniqueKey(key))) { |
| 105 | GrSwizzle swizzle = |
| 106 | context->priv().caps()->getReadSwizzle(cachedKernel->backendFormat(), |
| 107 | SkColorTypeToGrColorType(colorType)); |
| 108 | view = {std::move(cachedKernel), kTopLeft_GrSurfaceOrigin, swizzle}; |
| 109 | } else { |
| 110 | SkBitmap bm; |
| 111 | auto info = SkImageInfo::Make({(int)GrNextPow2(length), 1}, colorType, |
| 112 | kPremul_SkAlphaType, nullptr); |
| 113 | if (!bm.tryAllocPixels(info)) { |
| 114 | return {}; |
| 115 | } |
| 116 | for (int i = 0; i < length; i++) { |
| 117 | if (useA16) { |
| 118 | *bm.getAddr16(i, 0) = SkFloatToHalf(values[i]); |
| 119 | } else { |
| 120 | *bm.getAddr8(i, 0) = |
| 121 | SkScalarRoundToInt((values[i] - min) / scalableSampler.fGain * 255); |
| 122 | } |
| 123 | } |
| 124 | bm.setImmutable(); |
| 125 | GrBitmapTextureMaker maker(context, bm, GrImageTexGenPolicy::kNew_Uncached_Budgeted); |
| 126 | view = maker.view(GrMipMapped::kNo); |
| 127 | if (!view) { |
| 128 | return {}; |
| 129 | } |
| 130 | if (kCacheKernelTexture) { |
| 131 | proxyProvider->assignUniqueKeyToProxy(key, view.asTextureProxy()); |
| 132 | } |
| 133 | } |
| 134 | scalableSampler.fSampler = { std::move(view) }; |
| 135 | return result; |
| 136 | } |
| 137 | |
| 138 | bool GrMatrixConvolutionEffect::KernelWrapper::operator==(const KernelWrapper& k) const { |
| 139 | if (fSize != k.fSize) { |
| 140 | return false; |
| 141 | } else if (this->isSampled()) { |
| 142 | return fScalableSampler == k.fScalableSampler; |
| 143 | } else { |
| 144 | return std::equal(fArray.begin(), fArray.begin() + fSize.area(), k.fArray.begin()); |
| 145 | } |
| 146 | } |
| 147 | |
| 148 | bool GrMatrixConvolutionEffect::KernelWrapper::ScalableSampler::operator==( |
| 149 | const ScalableSampler& k) const { |
| 150 | return fSampler == k.fSampler && fGain == k.fGain && fBias == k.fBias; |
| 151 | } |
| 152 | |
| 153 | // For sampled kernels, emit a for loop that does all the kernel accumulation. |
| 154 | // For uniform kernels, emit a single iteration. Function is called repeatedly in a for loop. |
| 155 | // loc is ignored for sampled kernels. |
| 156 | void GrGLMatrixConvolutionEffect::emitKernelBlock(EmitArgs& args, SkIPoint loc) { |
| 157 | const GrMatrixConvolutionEffect& mce = args.fFp.cast<GrMatrixConvolutionEffect>(); |
| 158 | GrGLSLFPFragmentBuilder* fragBuilder = args.fFragBuilder; |
| 159 | GrGLSLUniformHandler* uniformHandler = args.fUniformHandler; |
| 160 | int kernelWidth = mce.kernelSize().width(); |
| 161 | int kernelHeight = mce.kernelSize().height(); |
| 162 | int kernelArea = kernelWidth * kernelHeight; |
| 163 | |
| 164 | if (mce.kernelIsSampled()) { |
| 165 | fragBuilder->codeAppendf("half2 kernelCoord = half2(0, 0);"); |
| 166 | fragBuilder->codeAppendf("for (int i = 0; i < %d; ++i)", (int)kernelArea); |
| 167 | } |
| 168 | |
| 169 | GrGLSLShaderBuilder::ShaderBlock block(fragBuilder); |
| 170 | |
| 171 | fragBuilder->codeAppend("half k;"); |
| 172 | fragBuilder->codeAppend("half2 sourceOffset;"); |
| 173 | if (mce.kernelIsSampled()) { |
| 174 | const char* kernelBias = uniformHandler->getUniformCStr(fKernelBiasUni); |
| 175 | fragBuilder->codeAppend("k = "); |
| 176 | fragBuilder->appendTextureLookup(args.fTexSamplers[0], "kernelCoord"); |
| 177 | fragBuilder->codeAppendf(".w + %s;", kernelBias); |
| 178 | fragBuilder->codeAppendf("sourceOffset.y = floor(i / %d);", kernelWidth); |
| 179 | fragBuilder->codeAppendf("sourceOffset.x = i - sourceOffset.y * %d;", kernelWidth); |
| 180 | float kernelStride = 1.0f / (float)GrNextPow2(kernelArea); |
| 181 | fragBuilder->codeAppendf("kernelCoord.x += %f;", kernelStride); |
| 182 | } else { |
| 183 | fragBuilder->codeAppendf("sourceOffset = half2(%d, %d);", loc.x(), loc.y()); |
| 184 | int offset = loc.y() * kernelWidth + loc.x(); |
| 185 | static constexpr const char kVecSuffix[][4] = { ".x", ".y", ".z", ".w" }; |
| 186 | const char* kernel = uniformHandler->getUniformCStr(fKernelUni); |
| 187 | fragBuilder->codeAppendf("k = %s[%d]%s;", kernel, offset / 4, |
| 188 | kVecSuffix[offset & 0x3]); |
| 189 | } |
| 190 | |
| 191 | auto sample = this->invokeChild(0, args, "coord + sourceOffset"); |
| 192 | fragBuilder->codeAppendf("half4 c = %s;", sample.c_str()); |
| 193 | if (!mce.convolveAlpha()) { |
| 194 | fragBuilder->codeAppend("c.rgb /= max(c.a, 0.0001);"); |
| 195 | fragBuilder->codeAppend("c.rgb = saturate(c.rgb);"); |
| 196 | } |
| 197 | fragBuilder->codeAppend("sum += c * k;"); |
| 198 | } |
| 199 | |
wangyix | 7c157a9 | 2015-07-22 15:08:53 -0700 | [diff] [blame] | 200 | void GrGLMatrixConvolutionEffect::emitCode(EmitArgs& args) { |
robertphillips | bf536af | 2016-02-04 06:11:53 -0800 | [diff] [blame] | 201 | const GrMatrixConvolutionEffect& mce = args.fFp.cast<GrMatrixConvolutionEffect>(); |
robertphillips | bf536af | 2016-02-04 06:11:53 -0800 | [diff] [blame] | 202 | |
Adlai Holler | 00ddb00 | 2020-05-11 19:25:52 -0400 | [diff] [blame] | 203 | int kernelWidth = mce.kernelSize().width(); |
| 204 | int kernelHeight = mce.kernelSize().height(); |
robertphillips | bf536af | 2016-02-04 06:11:53 -0800 | [diff] [blame] | 205 | |
Adlai Holler | 00ddb00 | 2020-05-11 19:25:52 -0400 | [diff] [blame] | 206 | int arrayCount = (kernelWidth * kernelHeight + 3) / 4; |
| 207 | SkASSERT(4 * arrayCount >= kernelWidth * kernelHeight); |
jvanverth | 78d6eb0 | 2016-03-02 13:21:16 -0800 | [diff] [blame] | 208 | |
egdaniel | 7ea439b | 2015-12-03 09:20:44 -0800 | [diff] [blame] | 209 | GrGLSLUniformHandler* uniformHandler = args.fUniformHandler; |
Adlai Holler | 00ddb00 | 2020-05-11 19:25:52 -0400 | [diff] [blame] | 210 | if (mce.kernelIsSampled()) { |
| 211 | fKernelBiasUni = uniformHandler->addUniform(&mce, kFragment_GrShaderFlag, |
| 212 | kHalf_GrSLType, "KernelBias"); |
| 213 | } else { |
| 214 | fKernelUni = uniformHandler->addUniformArray(&mce, kFragment_GrShaderFlag, |
| 215 | kHalf4_GrSLType, "Kernel", arrayCount); |
| 216 | } |
Ethan Nicholas | 16464c3 | 2020-04-06 13:53:05 -0400 | [diff] [blame] | 217 | fKernelOffsetUni = uniformHandler->addUniform(&mce, kFragment_GrShaderFlag, kHalf2_GrSLType, |
egdaniel | 7ea439b | 2015-12-03 09:20:44 -0800 | [diff] [blame] | 218 | "KernelOffset"); |
Brian Salomon | 41e377d | 2020-05-05 01:27:57 +0000 | [diff] [blame] | 219 | fGainUni = uniformHandler->addUniform(&mce, kFragment_GrShaderFlag, kHalf_GrSLType, "Gain"); |
| 220 | fBiasUni = uniformHandler->addUniform(&mce, kFragment_GrShaderFlag, kHalf_GrSLType, "Bias"); |
joshualitt | ac97792 | 2014-07-22 09:52:11 -0700 | [diff] [blame] | 221 | |
egdaniel | 7ea439b | 2015-12-03 09:20:44 -0800 | [diff] [blame] | 222 | const char* kernelOffset = uniformHandler->getUniformCStr(fKernelOffsetUni); |
egdaniel | 7ea439b | 2015-12-03 09:20:44 -0800 | [diff] [blame] | 223 | const char* gain = uniformHandler->getUniformCStr(fGainUni); |
| 224 | const char* bias = uniformHandler->getUniformCStr(fBiasUni); |
joshualitt | ac97792 | 2014-07-22 09:52:11 -0700 | [diff] [blame] | 225 | |
cdalton | 8528541 | 2016-02-18 12:37:07 -0800 | [diff] [blame] | 226 | GrGLSLFPFragmentBuilder* fragBuilder = args.fFragBuilder; |
Ethan Nicholas | 5843012 | 2020-04-14 09:54:02 -0400 | [diff] [blame] | 227 | SkString coords2D = fragBuilder->ensureCoords2D(args.fTransformedCoords[0].fVaryingPoint, |
| 228 | mce.sampleMatrix()); |
Brian Salomon | 41e377d | 2020-05-05 01:27:57 +0000 | [diff] [blame] | 229 | fragBuilder->codeAppend("half4 sum = half4(0, 0, 0, 0);"); |
Brian Salomon | 694ec49 | 2020-04-14 13:39:31 -0400 | [diff] [blame] | 230 | fragBuilder->codeAppendf("float2 coord = %s - %s;", coords2D.c_str(), kernelOffset); |
joshualitt | 5ae5fc5 | 2014-07-29 12:59:27 -0700 | [diff] [blame] | 231 | |
Adlai Holler | 00ddb00 | 2020-05-11 19:25:52 -0400 | [diff] [blame] | 232 | if (mce.kernelIsSampled()) { |
| 233 | this->emitKernelBlock(args, {}); |
| 234 | } else { |
| 235 | for (int x = 0; x < kernelWidth; ++x) { |
| 236 | for (int y = 0; y < kernelHeight; ++y) { |
| 237 | this->emitKernelBlock(args, SkIPoint::Make(x, y)); |
joshualitt | 5ae5fc5 | 2014-07-29 12:59:27 -0700 | [diff] [blame] | 238 | } |
joshualitt | 5ae5fc5 | 2014-07-29 12:59:27 -0700 | [diff] [blame] | 239 | } |
joshualitt | ac97792 | 2014-07-22 09:52:11 -0700 | [diff] [blame] | 240 | } |
Adlai Holler | 00ddb00 | 2020-05-11 19:25:52 -0400 | [diff] [blame] | 241 | |
robertphillips | bf536af | 2016-02-04 06:11:53 -0800 | [diff] [blame] | 242 | if (mce.convolveAlpha()) { |
Brian Salomon | 41e377d | 2020-05-05 01:27:57 +0000 | [diff] [blame] | 243 | fragBuilder->codeAppendf("%s = sum * %s + %s;", args.fOutputColor, gain, bias); |
Ethan Nicholas | 12fb9cf | 2018-08-03 16:16:57 -0400 | [diff] [blame] | 244 | fragBuilder->codeAppendf("%s.a = saturate(%s.a);", args.fOutputColor, args.fOutputColor); |
egdaniel | 4ca2e60 | 2015-11-18 08:01:26 -0800 | [diff] [blame] | 245 | fragBuilder->codeAppendf("%s.rgb = clamp(%s.rgb, 0.0, %s.a);", |
| 246 | args.fOutputColor, args.fOutputColor, args.fOutputColor); |
joshualitt | ac97792 | 2014-07-22 09:52:11 -0700 | [diff] [blame] | 247 | } else { |
Brian Salomon | 694ec49 | 2020-04-14 13:39:31 -0400 | [diff] [blame] | 248 | auto sample = this->invokeChild(0, args, coords2D.c_str()); |
Adlai Holler | 00ddb00 | 2020-05-11 19:25:52 -0400 | [diff] [blame] | 249 | fragBuilder->codeAppendf("half4 c = %s;", sample.c_str()); |
Brian Salomon | 41e377d | 2020-05-05 01:27:57 +0000 | [diff] [blame] | 250 | fragBuilder->codeAppendf("%s.a = c.a;", args.fOutputColor); |
| 251 | fragBuilder->codeAppendf("%s.rgb = saturate(sum.rgb * %s + %s);", args.fOutputColor, gain, bias); |
egdaniel | 4ca2e60 | 2015-11-18 08:01:26 -0800 | [diff] [blame] | 252 | fragBuilder->codeAppendf("%s.rgb *= %s.a;", args.fOutputColor, args.fOutputColor); |
joshualitt | ac97792 | 2014-07-22 09:52:11 -0700 | [diff] [blame] | 253 | } |
Ethan Nicholas | 2983f40 | 2017-05-08 09:36:08 -0400 | [diff] [blame] | 254 | fragBuilder->codeAppendf("%s *= %s;\n", args.fOutputColor, args.fInputColor); |
joshualitt | ac97792 | 2014-07-22 09:52:11 -0700 | [diff] [blame] | 255 | } |
| 256 | |
joshualitt | b0a8a37 | 2014-09-23 09:50:21 -0700 | [diff] [blame] | 257 | void GrGLMatrixConvolutionEffect::GenKey(const GrProcessor& processor, |
Brian Salomon | 94efbf5 | 2016-11-29 13:43:05 -0500 | [diff] [blame] | 258 | const GrShaderCaps&, GrProcessorKeyBuilder* b) { |
joshualitt | b0a8a37 | 2014-09-23 09:50:21 -0700 | [diff] [blame] | 259 | const GrMatrixConvolutionEffect& m = processor.cast<GrMatrixConvolutionEffect>(); |
joshualitt | 5ae5fc5 | 2014-07-29 12:59:27 -0700 | [diff] [blame] | 260 | SkASSERT(m.kernelSize().width() <= 0x7FFF && m.kernelSize().height() <= 0xFFFF); |
| 261 | uint32_t key = m.kernelSize().width() << 16 | m.kernelSize().height(); |
caryclark | 952538e | 2016-02-26 05:01:42 -0800 | [diff] [blame] | 262 | key |= m.convolveAlpha() ? 1U << 31 : 0; |
joshualitt | ac97792 | 2014-07-22 09:52:11 -0700 | [diff] [blame] | 263 | b->add32(key); |
| 264 | } |
| 265 | |
egdaniel | 018fb62 | 2015-10-28 07:26:40 -0700 | [diff] [blame] | 266 | void GrGLMatrixConvolutionEffect::onSetData(const GrGLSLProgramDataManager& pdman, |
Brian Salomon | ab015ef | 2017-04-04 10:15:51 -0400 | [diff] [blame] | 267 | const GrFragmentProcessor& processor) { |
joshualitt | b0a8a37 | 2014-09-23 09:50:21 -0700 | [diff] [blame] | 268 | const GrMatrixConvolutionEffect& conv = processor.cast<GrMatrixConvolutionEffect>(); |
Brian Salomon | 694ec49 | 2020-04-14 13:39:31 -0400 | [diff] [blame] | 269 | pdman.set2fv(fKernelOffsetUni, 1, conv.kernelOffset().ptr()); |
Adlai Holler | 00ddb00 | 2020-05-11 19:25:52 -0400 | [diff] [blame] | 270 | float totalGain = conv.gain(); |
| 271 | if (conv.kernelIsSampled()) { |
| 272 | totalGain *= conv.kernelSampleGain(); |
| 273 | pdman.set1f(fKernelBiasUni, conv.kernelSampleBias()); |
| 274 | } else { |
| 275 | int kernelCount = conv.kernelSize().area(); |
| 276 | int arrayCount = (kernelCount + 3) / 4; |
| 277 | SkASSERT(4 * arrayCount >= kernelCount); |
| 278 | pdman.set4fv(fKernelUni, arrayCount, conv.kernel()); |
| 279 | } |
kkinnunen | 7510b22 | 2014-07-30 00:04:16 -0700 | [diff] [blame] | 280 | pdman.set1f(fBiasUni, conv.bias()); |
Adlai Holler | 00ddb00 | 2020-05-11 19:25:52 -0400 | [diff] [blame] | 281 | pdman.set1f(fGainUni, totalGain); |
joshualitt | ac97792 | 2014-07-22 09:52:11 -0700 | [diff] [blame] | 282 | } |
| 283 | |
Brian Salomon | 694ec49 | 2020-04-14 13:39:31 -0400 | [diff] [blame] | 284 | GrMatrixConvolutionEffect::GrMatrixConvolutionEffect(std::unique_ptr<GrFragmentProcessor> child, |
Adlai Holler | 00ddb00 | 2020-05-11 19:25:52 -0400 | [diff] [blame] | 285 | KernelWrapper kernel, |
Robert Phillips | 40fd7c9 | 2017-01-30 08:06:27 -0500 | [diff] [blame] | 286 | SkScalar gain, |
| 287 | SkScalar bias, |
| 288 | const SkIPoint& kernelOffset, |
Robert Phillips | 40fd7c9 | 2017-01-30 08:06:27 -0500 | [diff] [blame] | 289 | bool convolveAlpha) |
Brian Salomon | 6cd51b5 | 2017-07-26 19:07:15 -0400 | [diff] [blame] | 290 | // To advertise either the modulation or opaqueness optimizations we'd have to examine the |
| 291 | // parameters. |
Ethan Nicholas | abff956 | 2017-10-09 10:54:08 -0400 | [diff] [blame] | 292 | : INHERITED(kGrMatrixConvolutionEffect_ClassID, kNone_OptimizationFlags) |
Adlai Holler | 00ddb00 | 2020-05-11 19:25:52 -0400 | [diff] [blame] | 293 | , fKernel(std::move(kernel)) |
Brian Salomon | 6cd51b5 | 2017-07-26 19:07:15 -0400 | [diff] [blame] | 294 | , fGain(SkScalarToFloat(gain)) |
| 295 | , fBias(SkScalarToFloat(bias) / 255.0f) |
| 296 | , fConvolveAlpha(convolveAlpha) { |
Brian Salomon | 694ec49 | 2020-04-14 13:39:31 -0400 | [diff] [blame] | 297 | child->setSampledWithExplicitCoords(); |
| 298 | this->registerChildProcessor(std::move(child)); |
Adlai Holler | 00ddb00 | 2020-05-11 19:25:52 -0400 | [diff] [blame] | 299 | if (fKernel.isSampled()) { |
| 300 | this->setTextureSamplerCnt(1); |
Robert Phillips | 40fd7c9 | 2017-01-30 08:06:27 -0500 | [diff] [blame] | 301 | } |
Brian Salomon | 694ec49 | 2020-04-14 13:39:31 -0400 | [diff] [blame] | 302 | fKernelOffset = {static_cast<float>(kernelOffset.x()), |
| 303 | static_cast<float>(kernelOffset.y())}; |
| 304 | this->addCoordTransform(&fCoordTransform); |
Robert Phillips | 40fd7c9 | 2017-01-30 08:06:27 -0500 | [diff] [blame] | 305 | } |
| 306 | |
Brian Salomon | 3f6f965 | 2017-07-28 07:34:05 -0400 | [diff] [blame] | 307 | GrMatrixConvolutionEffect::GrMatrixConvolutionEffect(const GrMatrixConvolutionEffect& that) |
Ethan Nicholas | abff956 | 2017-10-09 10:54:08 -0400 | [diff] [blame] | 308 | : INHERITED(kGrMatrixConvolutionEffect_ClassID, kNone_OptimizationFlags) |
Adlai Holler | 00ddb00 | 2020-05-11 19:25:52 -0400 | [diff] [blame] | 309 | , fKernel(that.fKernel) |
Brian Salomon | 3f6f965 | 2017-07-28 07:34:05 -0400 | [diff] [blame] | 310 | , fGain(that.fGain) |
| 311 | , fBias(that.fBias) |
Brian Salomon | 694ec49 | 2020-04-14 13:39:31 -0400 | [diff] [blame] | 312 | , fKernelOffset(that.fKernelOffset) |
Brian Salomon | 3f6f965 | 2017-07-28 07:34:05 -0400 | [diff] [blame] | 313 | , fConvolveAlpha(that.fConvolveAlpha) { |
Brian Salomon | 694ec49 | 2020-04-14 13:39:31 -0400 | [diff] [blame] | 314 | auto child = that.childProcessor(0).clone(); |
| 315 | child->setSampledWithExplicitCoords(); |
| 316 | this->registerChildProcessor(std::move(child)); |
Adlai Holler | 00ddb00 | 2020-05-11 19:25:52 -0400 | [diff] [blame] | 317 | if (fKernel.isSampled()) { |
| 318 | this->setTextureSamplerCnt(1); |
| 319 | } |
Brian Salomon | 3f6f965 | 2017-07-28 07:34:05 -0400 | [diff] [blame] | 320 | this->addCoordTransform(&fCoordTransform); |
Brian Salomon | 3f6f965 | 2017-07-28 07:34:05 -0400 | [diff] [blame] | 321 | } |
| 322 | |
Brian Salomon | aff329b | 2017-08-11 09:40:37 -0400 | [diff] [blame] | 323 | std::unique_ptr<GrFragmentProcessor> GrMatrixConvolutionEffect::clone() const { |
| 324 | return std::unique_ptr<GrFragmentProcessor>(new GrMatrixConvolutionEffect(*this)); |
Brian Salomon | 3f6f965 | 2017-07-28 07:34:05 -0400 | [diff] [blame] | 325 | } |
| 326 | |
Brian Salomon | 94efbf5 | 2016-11-29 13:43:05 -0500 | [diff] [blame] | 327 | void GrMatrixConvolutionEffect::onGetGLSLProcessorKey(const GrShaderCaps& caps, |
egdaniel | 57d3b03 | 2015-11-13 11:57:27 -0800 | [diff] [blame] | 328 | GrProcessorKeyBuilder* b) const { |
joshualitt | eb2a676 | 2014-12-04 11:35:33 -0800 | [diff] [blame] | 329 | GrGLMatrixConvolutionEffect::GenKey(*this, caps, b); |
| 330 | } |
| 331 | |
egdaniel | 57d3b03 | 2015-11-13 11:57:27 -0800 | [diff] [blame] | 332 | GrGLSLFragmentProcessor* GrMatrixConvolutionEffect::onCreateGLSLInstance() const { |
robertphillips | bf536af | 2016-02-04 06:11:53 -0800 | [diff] [blame] | 333 | return new GrGLMatrixConvolutionEffect; |
joshualitt | ac97792 | 2014-07-22 09:52:11 -0700 | [diff] [blame] | 334 | } |
| 335 | |
bsalomon | 0e08fc1 | 2014-10-15 08:19:04 -0700 | [diff] [blame] | 336 | bool GrMatrixConvolutionEffect::onIsEqual(const GrFragmentProcessor& sBase) const { |
joshualitt | 49586be | 2014-09-16 08:21:41 -0700 | [diff] [blame] | 337 | const GrMatrixConvolutionEffect& s = sBase.cast<GrMatrixConvolutionEffect>(); |
Adlai Holler | 00ddb00 | 2020-05-11 19:25:52 -0400 | [diff] [blame] | 338 | return fKernel == s.fKernel && |
joshualitt | ac97792 | 2014-07-22 09:52:11 -0700 | [diff] [blame] | 339 | fGain == s.gain() && |
| 340 | fBias == s.bias() && |
Brian Salomon | 694ec49 | 2020-04-14 13:39:31 -0400 | [diff] [blame] | 341 | fKernelOffset == s.kernelOffset() && |
| 342 | fConvolveAlpha == s.convolveAlpha(); |
joshualitt | ac97792 | 2014-07-22 09:52:11 -0700 | [diff] [blame] | 343 | } |
| 344 | |
Adlai Holler | 00ddb00 | 2020-05-11 19:25:52 -0400 | [diff] [blame] | 345 | const GrFragmentProcessor::TextureSampler& GrMatrixConvolutionEffect::onTextureSampler( |
| 346 | int index) const { |
| 347 | return IthTextureSampler(index, fKernel.scalableSampler().fSampler); |
| 348 | } |
| 349 | |
Robert Phillips | 4e962c6 | 2018-06-20 07:46:19 -0400 | [diff] [blame] | 350 | static void fill_in_1D_gaussian_kernel_with_stride(float* kernel, int size, int stride, |
| 351 | float twoSigmaSqrd) { |
| 352 | SkASSERT(!SkScalarNearlyZero(twoSigmaSqrd, SK_ScalarNearlyZero)); |
| 353 | |
| 354 | const float sigmaDenom = 1.0f / twoSigmaSqrd; |
| 355 | const int radius = size / 2; |
| 356 | |
| 357 | float sum = 0.0f; |
| 358 | for (int i = 0; i < size; ++i) { |
| 359 | float term = static_cast<float>(i - radius); |
| 360 | // Note that the constant term (1/(sqrt(2*pi*sigma^2)) of the Gaussian |
| 361 | // is dropped here, since we renormalize the kernel below. |
| 362 | kernel[i * stride] = sk_float_exp(-term * term * sigmaDenom); |
| 363 | sum += kernel[i * stride]; |
| 364 | } |
| 365 | // Normalize the kernel |
| 366 | float scale = 1.0f / sum; |
| 367 | for (int i = 0; i < size; ++i) { |
| 368 | kernel[i * stride] *= scale; |
| 369 | } |
| 370 | } |
| 371 | |
Robert Phillips | 40fd7c9 | 2017-01-30 08:06:27 -0500 | [diff] [blame] | 372 | static void fill_in_2D_gaussian_kernel(float* kernel, int width, int height, |
| 373 | SkScalar sigmaX, SkScalar sigmaY) { |
Greg Daniel | 4eda8d9 | 2018-04-03 14:03:15 -0400 | [diff] [blame] | 374 | const float twoSigmaSqrdX = 2.0f * SkScalarToFloat(SkScalarSquare(sigmaX)); |
| 375 | const float twoSigmaSqrdY = 2.0f * SkScalarToFloat(SkScalarSquare(sigmaY)); |
| 376 | |
Robert Phillips | 4e962c6 | 2018-06-20 07:46:19 -0400 | [diff] [blame] | 377 | // TODO: in all of these degenerate cases we're uploading (and using) a whole lot of zeros. |
Greg Daniel | 4eda8d9 | 2018-04-03 14:03:15 -0400 | [diff] [blame] | 378 | if (SkScalarNearlyZero(twoSigmaSqrdX, SK_ScalarNearlyZero) || |
| 379 | SkScalarNearlyZero(twoSigmaSqrdY, SK_ScalarNearlyZero)) { |
Robert Phillips | 4e962c6 | 2018-06-20 07:46:19 -0400 | [diff] [blame] | 380 | // In this case the 2D Gaussian degenerates to a 1D Gaussian (in X or Y) or a point |
| 381 | SkASSERT(3 == width || 3 == height); |
Brian Salomon | 694ec49 | 2020-04-14 13:39:31 -0400 | [diff] [blame] | 382 | std::fill_n(kernel, width*height, 0); |
Robert Phillips | 4e962c6 | 2018-06-20 07:46:19 -0400 | [diff] [blame] | 383 | |
| 384 | if (SkScalarNearlyZero(twoSigmaSqrdX, SK_ScalarNearlyZero) && |
| 385 | SkScalarNearlyZero(twoSigmaSqrdY, SK_ScalarNearlyZero)) { |
| 386 | // A point |
| 387 | SkASSERT(3 == width && 3 == height); |
| 388 | kernel[4] = 1.0f; |
| 389 | } else if (SkScalarNearlyZero(twoSigmaSqrdX, SK_ScalarNearlyZero)) { |
| 390 | // A 1D Gaussian in Y |
| 391 | SkASSERT(3 == width); |
| 392 | // Down the middle column of the kernel with a stride of width |
| 393 | fill_in_1D_gaussian_kernel_with_stride(&kernel[1], height, width, twoSigmaSqrdY); |
| 394 | } else { |
| 395 | // A 1D Gaussian in X |
| 396 | SkASSERT(SkScalarNearlyZero(twoSigmaSqrdY, SK_ScalarNearlyZero)); |
| 397 | SkASSERT(3 == height); |
| 398 | // Down the middle row of the kernel with a stride of 1 |
| 399 | fill_in_1D_gaussian_kernel_with_stride(&kernel[width], width, 1, twoSigmaSqrdX); |
Greg Daniel | 4eda8d9 | 2018-04-03 14:03:15 -0400 | [diff] [blame] | 400 | } |
| 401 | return; |
| 402 | } |
| 403 | |
| 404 | const float sigmaXDenom = 1.0f / twoSigmaSqrdX; |
| 405 | const float sigmaYDenom = 1.0f / twoSigmaSqrdY; |
Robert Phillips | 40fd7c9 | 2017-01-30 08:06:27 -0500 | [diff] [blame] | 406 | const int xRadius = width / 2; |
| 407 | const int yRadius = height / 2; |
| 408 | |
joshualitt | 5acfea7 | 2014-08-11 13:55:34 -0700 | [diff] [blame] | 409 | float sum = 0.0f; |
joshualitt | 5acfea7 | 2014-08-11 13:55:34 -0700 | [diff] [blame] | 410 | for (int x = 0; x < width; x++) { |
Robert Phillips | 40fd7c9 | 2017-01-30 08:06:27 -0500 | [diff] [blame] | 411 | float xTerm = static_cast<float>(x - xRadius); |
| 412 | xTerm = xTerm * xTerm * sigmaXDenom; |
| 413 | for (int y = 0; y < height; y++) { |
| 414 | float yTerm = static_cast<float>(y - yRadius); |
| 415 | float xyTerm = sk_float_exp(-(xTerm + yTerm * yTerm * sigmaYDenom)); |
| 416 | // Note that the constant term (1/(sqrt(2*pi*sigma^2)) of the Gaussian |
| 417 | // is dropped here, since we renormalize the kernel below. |
| 418 | kernel[y * width + x] = xyTerm; |
| 419 | sum += xyTerm; |
| 420 | } |
joshualitt | 5acfea7 | 2014-08-11 13:55:34 -0700 | [diff] [blame] | 421 | } |
| 422 | // Normalize the kernel |
| 423 | float scale = 1.0f / sum; |
| 424 | for (int i = 0; i < width * height; ++i) { |
| 425 | kernel[i] *= scale; |
| 426 | } |
Robert Phillips | 40fd7c9 | 2017-01-30 08:06:27 -0500 | [diff] [blame] | 427 | } |
| 428 | |
Adlai Holler | 00ddb00 | 2020-05-11 19:25:52 -0400 | [diff] [blame] | 429 | std::unique_ptr<GrFragmentProcessor> GrMatrixConvolutionEffect::Make(GrRecordingContext* context, |
| 430 | GrSurfaceProxyView srcView, |
Brian Salomon | 694ec49 | 2020-04-14 13:39:31 -0400 | [diff] [blame] | 431 | const SkIRect& srcBounds, |
| 432 | const SkISize& kernelSize, |
| 433 | const SkScalar* kernel, |
| 434 | SkScalar gain, |
| 435 | SkScalar bias, |
| 436 | const SkIPoint& kernelOffset, |
| 437 | GrSamplerState::WrapMode wm, |
| 438 | bool convolveAlpha, |
| 439 | const GrCaps& caps) { |
Adlai Holler | 00ddb00 | 2020-05-11 19:25:52 -0400 | [diff] [blame] | 440 | auto kw = KernelWrapper::Make(context, kernelSize, caps, kernel); |
| 441 | if (!kw.isValid()) { |
| 442 | return nullptr; |
| 443 | } |
Brian Salomon | 694ec49 | 2020-04-14 13:39:31 -0400 | [diff] [blame] | 444 | GrSamplerState sampler(wm, GrSamplerState::Filter::kNearest); |
| 445 | auto child = GrTextureEffect::MakeSubset(std::move(srcView), kPremul_SkAlphaType, SkMatrix::I(), |
| 446 | sampler, SkRect::Make(srcBounds), caps); |
| 447 | return std::unique_ptr<GrFragmentProcessor>(new GrMatrixConvolutionEffect( |
Adlai Holler | 00ddb00 | 2020-05-11 19:25:52 -0400 | [diff] [blame] | 448 | std::move(child), std::move(kw), gain, bias, kernelOffset, convolveAlpha)); |
Brian Salomon | 694ec49 | 2020-04-14 13:39:31 -0400 | [diff] [blame] | 449 | } |
| 450 | |
Brian Salomon | aff329b | 2017-08-11 09:40:37 -0400 | [diff] [blame] | 451 | std::unique_ptr<GrFragmentProcessor> GrMatrixConvolutionEffect::MakeGaussian( |
Adlai Holler | 00ddb00 | 2020-05-11 19:25:52 -0400 | [diff] [blame] | 452 | GrRecordingContext* context, |
Greg Daniel | 5c08249 | 2020-01-29 15:06:49 -0500 | [diff] [blame] | 453 | GrSurfaceProxyView srcView, |
Robert Phillips | 5140f9a | 2018-05-11 16:11:45 -0400 | [diff] [blame] | 454 | const SkIRect& srcBounds, |
Brian Salomon | aff329b | 2017-08-11 09:40:37 -0400 | [diff] [blame] | 455 | const SkISize& kernelSize, |
| 456 | SkScalar gain, |
| 457 | SkScalar bias, |
| 458 | const SkIPoint& kernelOffset, |
Brian Salomon | 694ec49 | 2020-04-14 13:39:31 -0400 | [diff] [blame] | 459 | GrSamplerState::WrapMode wm, |
Brian Salomon | aff329b | 2017-08-11 09:40:37 -0400 | [diff] [blame] | 460 | bool convolveAlpha, |
| 461 | SkScalar sigmaX, |
Brian Salomon | 694ec49 | 2020-04-14 13:39:31 -0400 | [diff] [blame] | 462 | SkScalar sigmaY, |
| 463 | const GrCaps& caps) { |
Adlai Holler | 00ddb00 | 2020-05-11 19:25:52 -0400 | [diff] [blame] | 464 | SkAutoSTMalloc<32, float> kernel(kernelSize.area()); |
| 465 | fill_in_2D_gaussian_kernel(kernel.get(), kernelSize.width(), kernelSize.height(), |
| 466 | sigmaX, sigmaY); |
| 467 | return Make(context, std::move(srcView), srcBounds, kernelSize, kernel.get(), |
| 468 | gain, bias, kernelOffset, wm, convolveAlpha, caps); |
Robert Phillips | 40fd7c9 | 2017-01-30 08:06:27 -0500 | [diff] [blame] | 469 | } |
| 470 | |
joshualitt | b0a8a37 | 2014-09-23 09:50:21 -0700 | [diff] [blame] | 471 | GR_DEFINE_FRAGMENT_PROCESSOR_TEST(GrMatrixConvolutionEffect); |
joshualitt | ac97792 | 2014-07-22 09:52:11 -0700 | [diff] [blame] | 472 | |
Hal Canary | 6f6961e | 2017-01-31 13:50:44 -0500 | [diff] [blame] | 473 | #if GR_TEST_UTILS |
Brian Salomon | aff329b | 2017-08-11 09:40:37 -0400 | [diff] [blame] | 474 | std::unique_ptr<GrFragmentProcessor> GrMatrixConvolutionEffect::TestCreate(GrProcessorTestData* d) { |
Greg Daniel | 026a60c | 2020-02-12 10:53:51 -0500 | [diff] [blame] | 475 | auto [view, ct, at] = d->randomView(); |
Robert Phillips | dbc8eeb | 2017-02-21 10:04:31 -0500 | [diff] [blame] | 476 | |
Adlai Holler | 00ddb00 | 2020-05-11 19:25:52 -0400 | [diff] [blame] | 477 | static constexpr size_t kMaxTestKernelSize = 2 * kMaxUniformSize; |
| 478 | int width = d->fRandom->nextRangeU(1, kMaxTestKernelSize); |
| 479 | int height = d->fRandom->nextRangeU(1, kMaxTestKernelSize / width); |
joshualitt | ac97792 | 2014-07-22 09:52:11 -0700 | [diff] [blame] | 480 | SkISize kernelSize = SkISize::Make(width, height); |
Ben Wagner | 7ecc596 | 2016-11-02 17:07:33 -0400 | [diff] [blame] | 481 | std::unique_ptr<SkScalar[]> kernel(new SkScalar[width * height]); |
joshualitt | ac97792 | 2014-07-22 09:52:11 -0700 | [diff] [blame] | 482 | for (int i = 0; i < width * height; i++) { |
joshualitt | 0067ff5 | 2015-07-08 14:26:19 -0700 | [diff] [blame] | 483 | kernel.get()[i] = d->fRandom->nextSScalar1(); |
joshualitt | ac97792 | 2014-07-22 09:52:11 -0700 | [diff] [blame] | 484 | } |
joshualitt | 0067ff5 | 2015-07-08 14:26:19 -0700 | [diff] [blame] | 485 | SkScalar gain = d->fRandom->nextSScalar1(); |
| 486 | SkScalar bias = d->fRandom->nextSScalar1(); |
Greg Daniel | 026a60c | 2020-02-12 10:53:51 -0500 | [diff] [blame] | 487 | |
| 488 | uint32_t kernalOffsetX = d->fRandom->nextRangeU(0, kernelSize.width()); |
| 489 | uint32_t kernalOffsetY = d->fRandom->nextRangeU(0, kernelSize.height()); |
| 490 | SkIPoint kernelOffset = SkIPoint::Make(kernalOffsetX, kernalOffsetY); |
| 491 | |
| 492 | uint32_t boundsX = d->fRandom->nextRangeU(0, view.width()); |
| 493 | uint32_t boundsY = d->fRandom->nextRangeU(0, view.height()); |
| 494 | uint32_t boundsW = d->fRandom->nextRangeU(0, view.width()); |
| 495 | uint32_t boundsH = d->fRandom->nextRangeU(0, view.height()); |
| 496 | SkIRect bounds = SkIRect::MakeXYWH(boundsX, boundsY, boundsW, boundsH); |
| 497 | |
Brian Salomon | 694ec49 | 2020-04-14 13:39:31 -0400 | [diff] [blame] | 498 | auto wm = static_cast<GrSamplerState::WrapMode>( |
| 499 | d->fRandom->nextULessThan(GrSamplerState::kWrapModeCount)); |
joshualitt | 0067ff5 | 2015-07-08 14:26:19 -0700 | [diff] [blame] | 500 | bool convolveAlpha = d->fRandom->nextBool(); |
Adlai Holler | 00ddb00 | 2020-05-11 19:25:52 -0400 | [diff] [blame] | 501 | return GrMatrixConvolutionEffect::Make(d->context()->priv().asRecordingContext(), |
| 502 | std::move(view), |
bungeman | 06ca8ec | 2016-06-09 08:01:03 -0700 | [diff] [blame] | 503 | bounds, |
| 504 | kernelSize, |
| 505 | kernel.get(), |
| 506 | gain, |
| 507 | bias, |
| 508 | kernelOffset, |
Brian Salomon | 694ec49 | 2020-04-14 13:39:31 -0400 | [diff] [blame] | 509 | wm, |
| 510 | convolveAlpha, |
| 511 | *d->caps()); |
joshualitt | ac97792 | 2014-07-22 09:52:11 -0700 | [diff] [blame] | 512 | } |
Hal Canary | 6f6961e | 2017-01-31 13:50:44 -0500 | [diff] [blame] | 513 | #endif |