blob: 5c3ff493c27ebae1eee6ed1c301e7280b8dd8a63 [file] [log] [blame]
senorblanco@chromium.org60014ca2011-11-09 16:05:58 +00001/*
2 * Copyright 2011 The Android Open Source Project
3 *
4 * Use of this source code is governed by a BSD-style license that can be
5 * found in the LICENSE file.
6 */
7
djsollen@google.com64a0ec32012-06-12 15:17:27 +00008#include "SkBitmap.h"
senorblanco@chromium.org60014ca2011-11-09 16:05:58 +00009#include "SkBlurImageFilter.h"
senorblanco@chromium.orgae814c72011-12-20 20:02:19 +000010#include "SkColorPriv.h"
commit-bot@chromium.org8b0e8ac2014-01-30 18:58:24 +000011#include "SkReadBuffer.h"
12#include "SkWriteBuffer.h"
robertphillips@google.com736dd032013-07-15 15:06:54 +000013#include "SkGpuBlurUtils.h"
senorblanco@chromium.org27eec462013-11-08 20:49:04 +000014#include "SkBlurImage_opts.h"
bsalomon@google.comcf8fb1f2012-08-02 14:03:32 +000015#if SK_SUPPORT_GPU
senorblanco@chromium.org302cffb2012-08-01 20:16:34 +000016#include "GrContext.h"
bsalomon@google.comcf8fb1f2012-08-02 14:03:32 +000017#endif
senorblanco@chromium.org60014ca2011-11-09 16:05:58 +000018
senorblanco@chromium.org09843fd2014-03-24 20:50:59 +000019// This rather arbitrary-looking value results in a maximum box blur kernel size
20// of 1000 pixels on the raster path, which matches the WebKit and Firefox
21// implementations. Since the GPU path does not compute a box blur, putting
22// the limit on sigma ensures consistent behaviour between the GPU and
23// raster paths.
24#define MAX_SIGMA SkIntToScalar(532)
25
commit-bot@chromium.org8b0e8ac2014-01-30 18:58:24 +000026SkBlurImageFilter::SkBlurImageFilter(SkReadBuffer& buffer)
commit-bot@chromium.orgce33d602013-11-25 21:46:31 +000027 : INHERITED(1, buffer) {
senorblanco@chromium.org54e01b22011-11-16 18:20:47 +000028 fSigma.fWidth = buffer.readScalar();
29 fSigma.fHeight = buffer.readScalar();
commit-bot@chromium.orgc0b7e102013-10-23 17:06:21 +000030 buffer.validate(SkScalarIsFinite(fSigma.fWidth) &&
31 SkScalarIsFinite(fSigma.fHeight) &&
32 (fSigma.fWidth >= 0) &&
33 (fSigma.fHeight >= 0));
senorblanco@chromium.org54e01b22011-11-16 18:20:47 +000034}
35
senorblanco@chromium.org194d7752013-07-24 22:19:24 +000036SkBlurImageFilter::SkBlurImageFilter(SkScalar sigmaX,
37 SkScalar sigmaY,
38 SkImageFilter* input,
senorblanco@chromium.orgb295fb62013-10-10 13:51:19 +000039 const CropRect* cropRect)
senorblanco9ea3d572014-07-08 09:16:22 -070040 : INHERITED(1, &input, cropRect), fSigma(SkSize::Make(sigmaX, sigmaY)) {
senorblanco@chromium.org60014ca2011-11-09 16:05:58 +000041 SkASSERT(sigmaX >= 0 && sigmaY >= 0);
42}
43
commit-bot@chromium.org8b0e8ac2014-01-30 18:58:24 +000044void SkBlurImageFilter::flatten(SkWriteBuffer& buffer) const {
senorblanco@chromium.org54e01b22011-11-16 18:20:47 +000045 this->INHERITED::flatten(buffer);
46 buffer.writeScalar(fSigma.fWidth);
47 buffer.writeScalar(fSigma.fHeight);
48}
49
// Axis selector used as a compile-time template argument of boxBlur() to
// choose how the source is walked and how the destination is written.
enum BlurDirection {
    kX,   // step along a row (unit stride)
    kY    // step along a column (row stride)
};
53
/**
 *
 *  In order to make memory accesses cache-friendly, we reorder the passes to
 *  use contiguous memory reads wherever possible.
 *
 *  For example, the 6 passes of the X-and-Y blur case are rewritten as
 *  follows. Instead of 3 passes in X and 3 passes in Y, we perform
 *  2 passes in X, 1 pass in X transposed to Y on write, 2 passes in X,
 *  then 1 pass in X transposed to Y on write.
 *
 *  +----+       +----+       +----+        +---+       +---+       +---+        +----+
 *  | AB | ----> | AB | ----> | AB | -----> | A | ----> | A | ----> | A | -----> | AB |
 *  +----+ blurX +----+ blurX +----+ blurXY | B | blurX | B | blurX | B | blurXY +----+
 *                                          +---+       +---+       +---+
 *
 *  In this way, two of the y-blurs become x-blurs applied to transposed
 *  images, and all memory reads are contiguous.
 */
72
73template<BlurDirection srcDirection, BlurDirection dstDirection>
74static void boxBlur(const SkPMColor* src, int srcStride, SkPMColor* dst, int kernelSize,
75 int leftOffset, int rightOffset, int width, int height)
senorblanco@chromium.orgae814c72011-12-20 20:02:19 +000076{
senorblanco@chromium.orgae814c72011-12-20 20:02:19 +000077 int rightBorder = SkMin32(rightOffset + 1, width);
senorblanco@chromium.org0cc00c22013-11-07 18:35:12 +000078 int srcStrideX = srcDirection == kX ? 1 : srcStride;
79 int dstStrideX = dstDirection == kX ? 1 : height;
80 int srcStrideY = srcDirection == kX ? srcStride : 1;
81 int dstStrideY = dstDirection == kX ? width : 1;
senorblanco@chromium.orgfe2faa82013-11-04 16:07:33 +000082 uint32_t scale = (1 << 24) / kernelSize;
83 uint32_t half = 1 << 23;
senorblanco@chromium.orgae814c72011-12-20 20:02:19 +000084 for (int y = 0; y < height; ++y) {
85 int sumA = 0, sumR = 0, sumG = 0, sumB = 0;
senorblanco@chromium.org0cc00c22013-11-07 18:35:12 +000086 const SkPMColor* p = src;
senorblanco@chromium.orgae814c72011-12-20 20:02:19 +000087 for (int i = 0; i < rightBorder; ++i) {
88 sumA += SkGetPackedA32(*p);
89 sumR += SkGetPackedR32(*p);
90 sumG += SkGetPackedG32(*p);
91 sumB += SkGetPackedB32(*p);
senorblanco@chromium.org0cc00c22013-11-07 18:35:12 +000092 p += srcStrideX;
senorblanco@chromium.orgae814c72011-12-20 20:02:19 +000093 }
94
senorblanco@chromium.org0cc00c22013-11-07 18:35:12 +000095 const SkPMColor* sptr = src;
96 SkColor* dptr = dst;
senorblanco@chromium.orgae814c72011-12-20 20:02:19 +000097 for (int x = 0; x < width; ++x) {
senorblanco@chromium.orgfe2faa82013-11-04 16:07:33 +000098 *dptr = SkPackARGB32((sumA * scale + half) >> 24,
99 (sumR * scale + half) >> 24,
100 (sumG * scale + half) >> 24,
101 (sumB * scale + half) >> 24);
senorblanco@chromium.orgae814c72011-12-20 20:02:19 +0000102 if (x >= leftOffset) {
senorblanco@chromium.org0cc00c22013-11-07 18:35:12 +0000103 SkColor l = *(sptr - leftOffset * srcStrideX);
senorblanco@chromium.orgae814c72011-12-20 20:02:19 +0000104 sumA -= SkGetPackedA32(l);
105 sumR -= SkGetPackedR32(l);
106 sumG -= SkGetPackedG32(l);
107 sumB -= SkGetPackedB32(l);
108 }
109 if (x + rightOffset + 1 < width) {
senorblanco@chromium.org0cc00c22013-11-07 18:35:12 +0000110 SkColor r = *(sptr + (rightOffset + 1) * srcStrideX);
senorblanco@chromium.orgae814c72011-12-20 20:02:19 +0000111 sumA += SkGetPackedA32(r);
112 sumR += SkGetPackedR32(r);
113 sumG += SkGetPackedG32(r);
114 sumB += SkGetPackedB32(r);
115 }
senorblanco@chromium.org0cc00c22013-11-07 18:35:12 +0000116 sptr += srcStrideX;
117 if (srcDirection == kY) {
118 SK_PREFETCH(sptr + (rightOffset + 1) * srcStrideX);
119 }
120 dptr += dstStrideX;
senorblanco@chromium.orgae814c72011-12-20 20:02:19 +0000121 }
senorblanco@chromium.org0cc00c22013-11-07 18:35:12 +0000122 src += srcStrideY;
123 dst += dstStrideY;
senorblanco@chromium.orgae814c72011-12-20 20:02:19 +0000124 }
125}
126
commit-bot@chromium.org7b320702013-07-10 21:22:18 +0000127static void getBox3Params(SkScalar s, int *kernelSize, int* kernelSize3, int *lowOffset,
128 int *highOffset)
senorblanco@chromium.orgae814c72011-12-20 20:02:19 +0000129{
schenney@chromium.org73f3ded2011-12-20 22:31:40 +0000130 float pi = SkScalarToFloat(SK_ScalarPI);
131 int d = static_cast<int>(floorf(SkScalarToFloat(s) * 3.0f * sqrtf(2.0f * pi) / 4.0f + 0.5f));
senorblanco@chromium.orgae814c72011-12-20 20:02:19 +0000132 *kernelSize = d;
133 if (d % 2 == 1) {
134 *lowOffset = *highOffset = (d - 1) / 2;
135 *kernelSize3 = d;
136 } else {
137 *highOffset = d / 2;
138 *lowOffset = *highOffset - 1;
139 *kernelSize3 = d + 1;
140 }
141}
142
senorblanco@chromium.orgf1369ce2012-08-20 14:53:21 +0000143bool SkBlurImageFilter::onFilterImage(Proxy* proxy,
senorblanco@chromium.org4cb543d2014-03-14 15:44:01 +0000144 const SkBitmap& source, const Context& ctx,
commit-bot@chromium.orgae761f72014-02-05 22:32:02 +0000145 SkBitmap* dst, SkIPoint* offset) const {
senorblanco@chromium.org68400762013-05-24 15:04:07 +0000146 SkBitmap src = source;
senorblanco@chromium.org6776b822014-01-03 21:48:22 +0000147 SkIPoint srcOffset = SkIPoint::Make(0, 0);
senorblanco@chromium.org4cb543d2014-03-14 15:44:01 +0000148 if (getInput(0) && !getInput(0)->filterImage(proxy, source, ctx, &src, &srcOffset)) {
senorblanco@chromium.org68400762013-05-24 15:04:07 +0000149 return false;
150 }
151
commit-bot@chromium.org28fcae22014-04-11 17:15:40 +0000152 if (src.colorType() != kN32_SkColorType) {
senorblanco@chromium.orgae814c72011-12-20 20:02:19 +0000153 return false;
154 }
155
senorblanco@chromium.org11825292014-03-14 17:44:41 +0000156 SkIRect srcBounds, dstBounds;
157 if (!this->applyCropRect(ctx, proxy, src, &srcOffset, &srcBounds, &src)) {
reed@google.com76dd2772012-01-05 21:15:07 +0000158 return false;
159 }
160
senorblanco@chromium.org11825292014-03-14 17:44:41 +0000161 SkAutoLockPixels alp(src);
162 if (!src.getPixels()) {
senorblanco@chromium.org194d7752013-07-24 22:19:24 +0000163 return false;
164 }
165
reedc77392e2014-06-02 13:07:26 -0700166 if (!dst->allocPixels(src.info().makeWH(srcBounds.width(), srcBounds.height()))) {
commit-bot@chromium.orgcd3b15c2013-12-04 17:06:49 +0000167 return false;
168 }
reedc77392e2014-06-02 13:07:26 -0700169 dst->getBounds(&dstBounds);
commit-bot@chromium.orgcd3b15c2013-12-04 17:06:49 +0000170
senorblanco@chromium.orgba31f1d2014-05-07 20:56:08 +0000171 SkVector sigma = SkVector::Make(fSigma.width(), fSigma.height());
172 ctx.ctm().mapVectors(&sigma, 1);
senorblanco@chromium.org09843fd2014-03-24 20:50:59 +0000173 sigma.fX = SkMinScalar(sigma.fX, MAX_SIGMA);
174 sigma.fY = SkMinScalar(sigma.fY, MAX_SIGMA);
senorblanco@chromium.org2bfe36b2014-01-20 19:58:28 +0000175
senorblanco@chromium.orgae814c72011-12-20 20:02:19 +0000176 int kernelSizeX, kernelSizeX3, lowOffsetX, highOffsetX;
177 int kernelSizeY, kernelSizeY3, lowOffsetY, highOffsetY;
senorblanco@chromium.org2bfe36b2014-01-20 19:58:28 +0000178 getBox3Params(sigma.x(), &kernelSizeX, &kernelSizeX3, &lowOffsetX, &highOffsetX);
179 getBox3Params(sigma.y(), &kernelSizeY, &kernelSizeY3, &lowOffsetY, &highOffsetY);
senorblanco@chromium.orgae814c72011-12-20 20:02:19 +0000180
181 if (kernelSizeX < 0 || kernelSizeY < 0) {
182 return false;
183 }
184
185 if (kernelSizeX == 0 && kernelSizeY == 0) {
commit-bot@chromium.org8a2ad3c2014-02-23 03:59:35 +0000186 src.copyTo(dst, dst->colorType());
senorblanco@chromium.org6776b822014-01-03 21:48:22 +0000187 offset->fX = srcBounds.fLeft;
188 offset->fY = srcBounds.fTop;
senorblanco@chromium.orgae814c72011-12-20 20:02:19 +0000189 return true;
190 }
191
192 SkBitmap temp;
reedc77392e2014-06-02 13:07:26 -0700193 if (!temp.allocPixels(dst->info())) {
senorblanco@chromium.orgae814c72011-12-20 20:02:19 +0000194 return false;
195 }
196
senorblanco@chromium.org6776b822014-01-03 21:48:22 +0000197 offset->fX = srcBounds.fLeft;
198 offset->fY = srcBounds.fTop;
199 srcBounds.offset(-srcOffset);
senorblanco@chromium.org0cc00c22013-11-07 18:35:12 +0000200 const SkPMColor* s = src.getAddr32(srcBounds.left(), srcBounds.top());
201 SkPMColor* t = temp.getAddr32(0, 0);
202 SkPMColor* d = dst->getAddr32(0, 0);
203 int w = dstBounds.width(), h = dstBounds.height();
204 int sw = src.rowBytesAsPixels();
senorblanco@chromium.org05edd022013-11-11 20:12:34 +0000205 SkBoxBlurProc boxBlurX, boxBlurY, boxBlurXY, boxBlurYX;
206 if (!SkBoxBlurGetPlatformProcs(&boxBlurX, &boxBlurY, &boxBlurXY, &boxBlurYX)) {
senorblanco@chromium.org27eec462013-11-08 20:49:04 +0000207 boxBlurX = boxBlur<kX, kX>;
208 boxBlurY = boxBlur<kY, kY>;
209 boxBlurXY = boxBlur<kX, kY>;
senorblanco@chromium.org05edd022013-11-11 20:12:34 +0000210 boxBlurYX = boxBlur<kY, kX>;
senorblanco@chromium.org27eec462013-11-08 20:49:04 +0000211 }
212
senorblanco@chromium.orgae814c72011-12-20 20:02:19 +0000213 if (kernelSizeX > 0 && kernelSizeY > 0) {
senorblanco@chromium.org0cc00c22013-11-07 18:35:12 +0000214 boxBlurX(s, sw, t, kernelSizeX, lowOffsetX, highOffsetX, w, h);
215 boxBlurX(t, w, d, kernelSizeX, highOffsetX, lowOffsetX, w, h);
216 boxBlurXY(d, w, t, kernelSizeX3, highOffsetX, highOffsetX, w, h);
217 boxBlurX(t, h, d, kernelSizeY, lowOffsetY, highOffsetY, h, w);
218 boxBlurX(d, h, t, kernelSizeY, highOffsetY, lowOffsetY, h, w);
219 boxBlurXY(t, h, d, kernelSizeY3, highOffsetY, highOffsetY, h, w);
senorblanco@chromium.orgae814c72011-12-20 20:02:19 +0000220 } else if (kernelSizeX > 0) {
senorblanco@chromium.org0cc00c22013-11-07 18:35:12 +0000221 boxBlurX(s, sw, d, kernelSizeX, lowOffsetX, highOffsetX, w, h);
222 boxBlurX(d, w, t, kernelSizeX, highOffsetX, lowOffsetX, w, h);
223 boxBlurX(t, w, d, kernelSizeX3, highOffsetX, highOffsetX, w, h);
senorblanco@chromium.orgae814c72011-12-20 20:02:19 +0000224 } else if (kernelSizeY > 0) {
senorblanco@chromium.org05edd022013-11-11 20:12:34 +0000225 boxBlurYX(s, sw, d, kernelSizeY, lowOffsetY, highOffsetY, h, w);
226 boxBlurX(d, h, t, kernelSizeY, highOffsetY, lowOffsetY, h, w);
227 boxBlurXY(t, h, d, kernelSizeY3, highOffsetY, highOffsetY, h, w);
senorblanco@chromium.orgae814c72011-12-20 20:02:19 +0000228 }
229 return true;
230}
231
senorblanco@chromium.org336d1d72014-01-27 21:03:17 +0000232
233void SkBlurImageFilter::computeFastBounds(const SkRect& src, SkRect* dst) const {
234 if (getInput(0)) {
235 getInput(0)->computeFastBounds(src, dst);
236 } else {
237 *dst = src;
238 }
239
240 dst->outset(SkScalarMul(fSigma.width(), SkIntToScalar(3)),
241 SkScalarMul(fSigma.height(), SkIntToScalar(3)));
242}
senorblanco@chromium.orgc4b12f12014-02-05 17:51:22 +0000243
244bool SkBlurImageFilter::onFilterBounds(const SkIRect& src, const SkMatrix& ctm,
245 SkIRect* dst) const {
246 SkIRect bounds = src;
247 if (getInput(0) && !getInput(0)->filterBounds(src, ctm, &bounds)) {
248 return false;
249 }
senorblanco@chromium.orgba31f1d2014-05-07 20:56:08 +0000250 SkVector sigma = SkVector::Make(fSigma.width(), fSigma.height());
251 ctm.mapVectors(&sigma, 1);
senorblanco@chromium.orgc4b12f12014-02-05 17:51:22 +0000252 bounds.outset(SkScalarCeilToInt(SkScalarMul(sigma.x(), SkIntToScalar(3))),
253 SkScalarCeilToInt(SkScalarMul(sigma.y(), SkIntToScalar(3))));
254 *dst = bounds;
255 return true;
256}
257
senorblanco@chromium.org4cb543d2014-03-14 15:44:01 +0000258bool SkBlurImageFilter::filterImageGPU(Proxy* proxy, const SkBitmap& src, const Context& ctx,
commit-bot@chromium.orgae761f72014-02-05 22:32:02 +0000259 SkBitmap* result, SkIPoint* offset) const {
bsalomon@google.comcf8fb1f2012-08-02 14:03:32 +0000260#if SK_SUPPORT_GPU
senorblanco@chromium.org6aa6fec2014-03-03 22:13:56 +0000261 SkBitmap input = src;
senorblanco@chromium.orgaba651c2014-02-03 22:22:16 +0000262 SkIPoint srcOffset = SkIPoint::Make(0, 0);
senorblanco@chromium.org4cb543d2014-03-14 15:44:01 +0000263 if (getInput(0) && !getInput(0)->getInputResultGPU(proxy, src, ctx, &input, &srcOffset)) {
senorblanco@chromium.orgc2594f42013-01-30 19:08:47 +0000264 return false;
265 }
senorblanco@chromium.org194d7752013-07-24 22:19:24 +0000266 SkIRect rect;
senorblanco@chromium.org11825292014-03-14 17:44:41 +0000267 if (!this->applyCropRect(ctx, proxy, input, &srcOffset, &rect, &input)) {
senorblanco@chromium.org194d7752013-07-24 22:19:24 +0000268 return false;
269 }
senorblanco@chromium.org11825292014-03-14 17:44:41 +0000270 GrTexture* source = input.getTexture();
senorblanco@chromium.orgba31f1d2014-05-07 20:56:08 +0000271 SkVector sigma = SkVector::Make(fSigma.width(), fSigma.height());
272 ctx.ctm().mapVectors(&sigma, 1);
senorblanco@chromium.org09843fd2014-03-24 20:50:59 +0000273 sigma.fX = SkMinScalar(sigma.fX, MAX_SIGMA);
274 sigma.fY = SkMinScalar(sigma.fY, MAX_SIGMA);
senorblanco@chromium.orgaba651c2014-02-03 22:22:16 +0000275 offset->fX = rect.fLeft;
276 offset->fY = rect.fTop;
277 rect.offset(-srcOffset);
skia.committer@gmail.com6ae63832013-07-23 07:01:05 +0000278 SkAutoTUnref<GrTexture> tex(SkGpuBlurUtils::GaussianBlur(source->getContext(),
senorblanco@chromium.org194d7752013-07-24 22:19:24 +0000279 source,
280 false,
281 SkRect::Make(rect),
282 true,
senorblanco@chromium.org2bfe36b2014-01-20 19:58:28 +0000283 sigma.x(),
284 sigma.y()));
senorblanco@chromium.org6aa6fec2014-03-03 22:13:56 +0000285 WrapTexture(tex, rect.width(), rect.height(), result);
286 return true;
bsalomon@google.comcf8fb1f2012-08-02 14:03:32 +0000287#else
288 SkDEBUGFAIL("Should not call in GPU-less build");
senorblanco@chromium.orgc2594f42013-01-30 19:08:47 +0000289 return false;
bsalomon@google.comcf8fb1f2012-08-02 14:03:32 +0000290#endif
senorblanco@chromium.org302cffb2012-08-01 20:16:34 +0000291}