src/effects/gradients/Sk4fLinearGradient.cpp - platform/external/skia - Gitiles

 /*
  * Copyright 2016 Google Inc.
  *
  * Use of this source code is governed by a BSD-style license that can be
  * found in the LICENSE file.
  */

 #include "Sk4fLinearGradient.h"
 #include "Sk4x4f.h"

 #include <cmath>

 namespace {

 template<DstType dstType, ApplyPremul premul>
 void ramp(const Sk4f& c, const Sk4f& dc, typename DstTraits<dstType, premul>::Type dst[], int n) {
     SkASSERT(n > 0);

     const Sk4f dc2 = dc + dc;
     const Sk4f dc4 = dc2 + dc2;

     Sk4f c0 = c ;
     Sk4f c1 = c + dc;
     Sk4f c2 = c0 + dc2;
     Sk4f c3 = c1 + dc2;

     while (n >= 4) {
         DstTraits<dstType, premul>::store4x(c0, c1, c2, c3, dst);
         dst += 4;

         c0 = c0 + dc4;
         c1 = c1 + dc4;
         c2 = c2 + dc4;
         c3 = c3 + dc4;
         n -= 4;
     }
     if (n & 2) {
         DstTraits<dstType, premul>::store(c0, dst++);
         DstTraits<dstType, premul>::store(c1, dst++);
         c0 = c0 + dc2;
     }
     if (n & 1) {
         DstTraits<dstType, premul>::store(c0, dst);
     }
 }

 // Planar version of ramp (S32 no-premul only).
 template<>
 void ramp<DstType::S32, ApplyPremul::False>(const Sk4f& c, const Sk4f& dc, SkPMColor dst[], int n) {
     SkASSERT(n > 0);

     const Sk4f    dc4 = dc * 4;
     const Sk4x4f dc4x = { Sk4f(dc4[0]), Sk4f(dc4[1]), Sk4f(dc4[2]), Sk4f(dc4[3]) };
     Sk4x4f        c4x = Sk4x4f::Transpose(c, c + dc, c + dc * 2, c + dc * 3);

     while (n >= 4) {
         ( sk_linear_to_srgb(c4x.r) <<  0
         | sk_linear_to_srgb(c4x.g) <<  8
         | sk_linear_to_srgb(c4x.b) << 16
         | Sk4f_round(255.0f*c4x.a) << 24).store(dst);

         c4x.r += dc4x.r;
         c4x.g += dc4x.g;
         c4x.b += dc4x.b;
         c4x.a += dc4x.a;

         dst += 4;
         n   -= 4;
     }

     if (n & 2) {
         DstTraits<DstType::S32, ApplyPremul::False>
             ::store(Sk4f(c4x.r[0], c4x.g[0], c4x.b[0], c4x.a[0]), dst++);
         DstTraits<DstType::S32, ApplyPremul::False>
             ::store(Sk4f(c4x.r[1], c4x.g[1], c4x.b[1], c4x.a[1]), dst++);
     }

     if (n & 1) {
         DstTraits<DstType::S32, ApplyPremul::False>
             ::store(Sk4f(c4x.r[n & 2], c4x.g[n & 2], c4x.b[n & 2], c4x.a[n & 2]), dst);
     }
 }

 template<SkShader::TileMode>
 SkScalar pinFx(SkScalar);

 template<>
 SkScalar pinFx<SkShader::kClamp_TileMode>(SkScalar fx) {
     return fx;
 }

 template<>
 SkScalar pinFx<SkShader::kRepeat_TileMode>(SkScalar fx) {
     SkScalar f = SkScalarFraction(fx);
     if (f < 0) {
         f = SkTMin(f + 1, nextafterf(1, 0));
     }
     SkASSERT(f >= 0);
     SkASSERT(f < 1.0f);
     return f;
 }

 template<>
 SkScalar pinFx<SkShader::kMirror_TileMode>(SkScalar fx) {
     SkScalar f = SkScalarMod(fx, 2.0f);
     if (f < 0) {
         f = SkTMin(f + 2, nextafterf(2, 0));
     }
     SkASSERT(f >= 0);
     SkASSERT(f < 2.0f);
     return f;
 }

 // true when x is in [k1,k2], or [k2, k1] when the interval is reversed.
 // TODO(fmalita): hoist the reversed interval check out of this helper.
 bool in_range(SkScalar x, SkScalar k1, SkScalar k2) {
     SkASSERT(k1 != k2);
     return (k1 < k2)
         ? (x >= k1 && x <= k2)
         : (x >= k2 && x <= k1);
 }

 } // anonymous namespace

 SkLinearGradient::
 LinearGradient4fContext::LinearGradient4fContext(const SkLinearGradient& shader,
                                                  const ContextRec& rec)
     : INHERITED(shader, rec) {

     // Our fast path expects interval points to be monotonically increasing in x.
     const bool reverseIntervals = this->isFast() && std::signbit(fDstToPos.getScaleX());
     fIntervals.init(shader.fOrigColors, shader.fOrigPos, shader.fColorCount, shader.fTileMode,
                     fColorsArePremul, rec.fPaint->getAlpha() * (1.0f / 255), reverseIntervals);

     SkASSERT(fIntervals->count() > 0);
     fCachedInterval = fIntervals->begin();
 }

 const Sk4fGradientInterval*
 SkLinearGradient::LinearGradient4fContext::findInterval(SkScalar fx) const {
     SkASSERT(in_range(fx, fIntervals->front().fT0, fIntervals->back().fT1));

     if (1) {
         // Linear search, using the last scanline interval as a starting point.
         SkASSERT(fCachedInterval >= fIntervals->begin());
         SkASSERT(fCachedInterval < fIntervals->end());
         const int search_dir = fDstToPos.getScaleX() >= 0 ? 1 : -1;
         while (!in_range(fx, fCachedInterval->fT0, fCachedInterval->fT1)) {
             fCachedInterval += search_dir;
             if (fCachedInterval >= fIntervals->end()) {
                 fCachedInterval = fIntervals->begin();
             } else if (fCachedInterval < fIntervals->begin()) {
                 fCachedInterval = fIntervals->end() - 1;
             }
         }
         return fCachedInterval;
     } else {
         // Binary search.  Seems less effective than linear + caching.
         const auto* i0 = fIntervals->begin();
         const auto* i1 = fIntervals->end() - 1;

         while (i0 != i1) {
             SkASSERT(i0 < i1);
             SkASSERT(in_range(fx, i0->fT0, i1->fT1));

             const auto* i = i0 + ((i1 - i0) >> 1);

             if (in_range(fx, i0->fT0, i->fT1)) {
                 i1 = i;
             } else {
                 SkASSERT(in_range(fx, i->fT1, i1->fT1));
                 i0 = i + 1;
             }
         }

         SkASSERT(in_range(fx, i0->fT0, i0->fT1));
         return i0;
     }
 }

 void SkLinearGradient::
 LinearGradient4fContext::shadeSpan(int x, int y, SkPMColor dst[], int count) {
     if (!this->isFast()) {
         this->INHERITED::shadeSpan(x, y, dst, count);
         return;
     }

     // TODO: plumb dithering
     SkASSERT(count > 0);
     if (fColorsArePremul) {
         this->shadePremulSpan<DstType::L32,
                               ApplyPremul::False>(x, y, dst, count);
     } else {
         this->shadePremulSpan<DstType::L32,
                               ApplyPremul::True>(x, y, dst, count);
     }
 }

 void SkLinearGradient::
 LinearGradient4fContext::shadeSpan4f(int x, int y, SkPM4f dst[], int count) {
     if (!this->isFast()) {
         this->INHERITED::shadeSpan4f(x, y, dst, count);
         return;
     }

     // TONOTDO: plumb dithering
     SkASSERT(count > 0);
     if (fColorsArePremul) {
         this->shadePremulSpan<DstType::F32,
                               ApplyPremul::False>(x, y, dst, count);
     } else {
         this->shadePremulSpan<DstType::F32,
                               ApplyPremul::True>(x, y, dst, count);
     }
 }

 template<DstType dstType, ApplyPremul premul>
 void SkLinearGradient::
 LinearGradient4fContext::shadePremulSpan(int x, int y,
                                          typename DstTraits<dstType, premul>::Type dst[],
                                          int count) const {
     const SkLinearGradient& shader =
         static_cast<const SkLinearGradient&>(fShader);
     switch (shader.fTileMode) {
     case kClamp_TileMode:
         this->shadeSpanInternal<dstType,
                                 premul,
                                 kClamp_TileMode>(x, y, dst, count);
         break;
     case kRepeat_TileMode:
         this->shadeSpanInternal<dstType,
                                 premul,
                                 kRepeat_TileMode>(x, y, dst, count);
         break;
     case kMirror_TileMode:
         this->shadeSpanInternal<dstType,
                                 premul,
                                 kMirror_TileMode>(x, y, dst, count);
         break;
     }
 }

 template<DstType dstType, ApplyPremul premul, SkShader::TileMode tileMode>
 void SkLinearGradient::
 LinearGradient4fContext::shadeSpanInternal(int x, int y,
                                            typename DstTraits<dstType, premul>::Type dst[],
                                            int count) const {
     SkPoint pt;
     fDstToPosProc(fDstToPos,
                   x + SK_ScalarHalf,
                   y + SK_ScalarHalf,
                   &pt);
     const SkScalar fx = pinFx<tileMode>(pt.x());
     const SkScalar dx = fDstToPos.getScaleX();
     LinearIntervalProcessor<dstType, premul, tileMode> proc(fIntervals->begin(),
                                                             fIntervals->end() - 1,
                                                             this->findInterval(fx),
                                                             fx,
                                                             dx,
                                                             SkScalarNearlyZero(dx * count));
     while (count > 0) {
         // What we really want here is SkTPin(advance, 1, count)
         // but that's a significant perf hit for >> stops; investigate.
         const int n = SkScalarTruncToInt(
             SkTMin<SkScalar>(proc.currentAdvance() + 1, SkIntToScalar(count)));

         // The current interval advance can be +inf (e.g. when reaching
         // the clamp mode end intervals) - when that happens, we expect to
         //   a) consume all remaining count in one swoop
         //   b) return a zero color gradient
         SkASSERT(SkScalarIsFinite(proc.currentAdvance())
             || (n == count && proc.currentRampIsZero()));

         if (proc.currentRampIsZero()) {
             DstTraits<dstType, premul>::store(proc.currentColor(),
                                               dst, n);
         } else {
             ramp<dstType, premul>(proc.currentColor(),
                                   proc.currentColorGrad(),
                                   dst, n);
         }

         proc.advance(SkIntToScalar(n));
         count -= n;
         dst   += n;
     }
 }

 template<DstType dstType, ApplyPremul premul, SkShader::TileMode tileMode>
 class SkLinearGradient::
 LinearGradient4fContext::LinearIntervalProcessor {
 public:
     LinearIntervalProcessor(const Sk4fGradientInterval* firstInterval,
                             const Sk4fGradientInterval* lastInterval,
                             const Sk4fGradientInterval* i,
                             SkScalar fx,
                             SkScalar dx,
                             bool is_vertical)
         : fAdvX(is_vertical ? SK_ScalarInfinity : (i->fT1 - fx) / dx)
         , fFirstInterval(firstInterval)
         , fLastInterval(lastInterval)
         , fInterval(i)
         , fDx(dx)
         , fIsVertical(is_vertical)
     {
         SkASSERT(fAdvX >= 0);
         SkASSERT(firstInterval <= lastInterval);

         if (tileMode != kClamp_TileMode && !is_vertical) {
             const auto spanX = (lastInterval->fT1 - firstInterval->fT0) / dx;
             SkASSERT(spanX >= 0);

             // If we're in a repeating tile mode and the whole gradient is compressed into a
             // fraction of a pixel, we just use the average color in zero-ramp mode.
             // This also avoids cases where we make no progress due to interval advances being
             // close to zero.
             static constexpr SkScalar kMinSpanX = .25f;
             if (spanX < kMinSpanX) {
                 this->init_average_props();
                 return;
             }
         }

         this->compute_interval_props(fx);
     }

     SkScalar currentAdvance() const {
         SkASSERT(fAdvX >= 0);
         SkASSERT(fAdvX <= (fInterval->fT1 - fInterval->fT0) / fDx || !std::isfinite(fAdvX));
         return fAdvX;
     }

     bool currentRampIsZero() const { return fZeroRamp; }
     const Sk4f& currentColor() const { return fCc; }
     const Sk4f& currentColorGrad() const { return fDcDx; }

     void advance(SkScalar advX) {
         SkASSERT(advX > 0);
         SkASSERT(fAdvX >= 0);

         if (advX >= fAdvX) {
             advX = this->advance_interval(advX);
         }
         SkASSERT(advX < fAdvX);

         fCc = fCc + fDcDx * Sk4f(advX);
         fAdvX -= advX;
     }

 private:
     void compute_interval_props(SkScalar t) {
         SkASSERT(in_range(t, fInterval->fT0, fInterval->fT1));

         const Sk4f dc = DstTraits<dstType, premul>::load(fInterval->fCg);
                   fCc = DstTraits<dstType, premul>::load(fInterval->fCb) + dc * Sk4f(t);
                 fDcDx = dc * fDx;
             fZeroRamp = fIsVertical || (dc == 0).allTrue();
     }

     void init_average_props() {
         fAdvX     = SK_ScalarInfinity;
         fZeroRamp = true;
         fDcDx     = 0;
         fCc       = Sk4f(0);

         // TODO: precompute the average at interval setup time?
         for (const auto* i = fFirstInterval; i <= fLastInterval; ++i) {
             // Each interval contributes its average color to the total/weighted average:
             //
             //   C = (c0 + c1) / 2 = (Cb + Cg * t0 + Cb + Cg * t1) / 2 = Cb + Cg *(t0 + t1) / 2
             //
             //   Avg += C * (t1 - t0)
             //
             const auto c = DstTraits<dstType, premul>::load(i->fCb)
                          + DstTraits<dstType, premul>::load(i->fCg) * (i->fT0 + i->fT1) * 0.5f;
             fCc = fCc + c * (i->fT1 - i->fT0);
         }
     }

     const Sk4fGradientInterval* next_interval(const Sk4fGradientInterval* i) const {
         SkASSERT(i >= fFirstInterval);
         SkASSERT(i <= fLastInterval);
         i++;

         if (tileMode == kClamp_TileMode) {
             SkASSERT(i <= fLastInterval);
             return i;
         }

         return (i <= fLastInterval) ? i : fFirstInterval;
     }

     SkScalar advance_interval(SkScalar advX) {
         SkASSERT(advX >= fAdvX);

         do {
             advX -= fAdvX;
             fInterval = this->next_interval(fInterval);
             fAdvX = (fInterval->fT1 - fInterval->fT0) / fDx;
             SkASSERT(fAdvX > 0);
         } while (advX >= fAdvX);

         compute_interval_props(fInterval->fT0);

         SkASSERT(advX >= 0);
         return advX;
     }

     // Current interval properties.
     Sk4f            fDcDx;      // dst color gradient (dc/dx)
     Sk4f            fCc;        // current color, interpolated in dst
     SkScalar        fAdvX;      // remaining interval advance in dst
     bool            fZeroRamp;  // current interval color grad is 0

     const Sk4fGradientInterval* fFirstInterval;
     const Sk4fGradientInterval* fLastInterval;
     const Sk4fGradientInterval* fInterval;  // current interval
     const SkScalar              fDx;        // 'dx' for consistency with other impls; actually dt/dx
     const bool                  fIsVertical;
 };

 void SkLinearGradient::
 LinearGradient4fContext::mapTs(int x, int y, SkScalar ts[], int count) const {
     SkASSERT(count > 0);
     SkASSERT(fDstToPosClass != kLinear_MatrixClass);

     SkScalar sx = x + SK_ScalarHalf;
     const SkScalar sy = y + SK_ScalarHalf;
     SkPoint pt;

     if (fDstToPosClass != kPerspective_MatrixClass) {
         // kLinear_MatrixClass, kFixedStepInX_MatrixClass => fixed dt per scanline
         const SkScalar dtdx = fDstToPos.fixedStepInX(sy).x();
         fDstToPosProc(fDstToPos, sx, sy, &pt);

         const Sk4f dtdx4 = Sk4f(4 * dtdx);
         Sk4f t4 = Sk4f(pt.x() + 0 * dtdx,
                        pt.x() + 1 * dtdx,
                        pt.x() + 2 * dtdx,
                        pt.x() + 3 * dtdx);

         while (count >= 4) {
             t4.store(ts);
             t4 = t4 + dtdx4;
             ts += 4;
             count -= 4;
         }

         if (count & 2) {
             *ts++ = t4[0];
             *ts++ = t4[1];
             t4 = SkNx_shuffle<2, 0, 1, 3>(t4);
         }

         if (count & 1) {
             *ts++ = t4[0];
         }
     } else {
         for (int i = 0; i < count; ++i) {
             fDstToPosProc(fDstToPos, sx, sy, &pt);
             // Perspective may yield NaN values.
             // Short of a better idea, drop to 0.
             ts[i] = SkScalarIsNaN(pt.x()) ? 0 : pt.x();
             sx += SK_Scalar1;
         }
     }
 }

 bool SkLinearGradient::LinearGradient4fContext::onChooseBlitProcs(const SkImageInfo& info,
                                                                   BlitState* state) {
     if (state->fMode != SkBlendMode::kSrc &&
         !(state->fMode == SkBlendMode::kSrcOver && (fFlags & kOpaqueAlpha_Flag))) {
         return false;
     }

     switch (info.colorType()) {
         case kN32_SkColorType:
             state->fBlitBW = D32_BlitBW;
             return true;
         case kRGBA_F16_SkColorType:
             state->fBlitBW = D64_BlitBW;
             return true;
         default:
             return false;
     }
 }

 void SkLinearGradient::
 LinearGradient4fContext::D32_BlitBW(BlitState* state, int x, int y, const SkPixmap& dst,
                                     int count) {
     // FIXME: ignoring coverage for now
     const LinearGradient4fContext* ctx =
         static_cast<const LinearGradient4fContext*>(state->fCtx);

     if (!dst.info().gammaCloseToSRGB()) {
         if (ctx->fColorsArePremul) {
             ctx->shadePremulSpan<DstType::L32, ApplyPremul::False>(
                 x, y, dst.writable_addr32(x, y), count);
         } else {
             ctx->shadePremulSpan<DstType::L32, ApplyPremul::True>(
                 x, y, dst.writable_addr32(x, y), count);
         }
     } else {
         if (ctx->fColorsArePremul) {
             ctx->shadePremulSpan<DstType::S32, ApplyPremul::False>(
                 x, y, dst.writable_addr32(x, y), count);
         } else {
             ctx->shadePremulSpan<DstType::S32, ApplyPremul::True>(
                 x, y, dst.writable_addr32(x, y), count);
         }
     }
 }

 void SkLinearGradient::
 LinearGradient4fContext::D64_BlitBW(BlitState* state, int x, int y, const SkPixmap& dst,
                                     int count) {
     // FIXME: ignoring coverage for now
     const LinearGradient4fContext* ctx =
         static_cast<const LinearGradient4fContext*>(state->fCtx);

     if (ctx->fColorsArePremul) {
         ctx->shadePremulSpan<DstType::F16, ApplyPremul::False>(
             x, y, dst.writable_addr64(x, y), count);
     } else {
         ctx->shadePremulSpan<DstType::F16, ApplyPremul::True>(
             x, y, dst.writable_addr64(x, y), count);
     }
 }
	/*
	* Copyright 2016 Google Inc.
	*
	* Use of this source code is governed by a BSD-style license that can be
	* found in the LICENSE file.
	*/

	#include "Sk4fLinearGradient.h"
	#include "Sk4x4f.h"

	#include <cmath>

	namespace {

	template<DstType dstType, ApplyPremul premul>
	void ramp(const Sk4f& c, const Sk4f& dc, typename DstTraits<dstType, premul>::Type dst[], int n) {
	SkASSERT(n > 0);

	const Sk4f dc2 = dc + dc;
	const Sk4f dc4 = dc2 + dc2;

	Sk4f c0 = c ;
	Sk4f c1 = c + dc;
	Sk4f c2 = c0 + dc2;
	Sk4f c3 = c1 + dc2;

	while (n >= 4) {
	DstTraits<dstType, premul>::store4x(c0, c1, c2, c3, dst);
	dst += 4;

	c0 = c0 + dc4;
	c1 = c1 + dc4;
	c2 = c2 + dc4;
	c3 = c3 + dc4;
	n -= 4;
	}
	if (n & 2) {
	DstTraits<dstType, premul>::store(c0, dst++);
	DstTraits<dstType, premul>::store(c1, dst++);
	c0 = c0 + dc2;
	}
	if (n & 1) {
	DstTraits<dstType, premul>::store(c0, dst);
	}
	}

	// Planar version of ramp (S32 no-premul only).
	template<>
	void ramp<DstType::S32, ApplyPremul::False>(const Sk4f& c, const Sk4f& dc, SkPMColor dst[], int n) {
	SkASSERT(n > 0);

	const Sk4f dc4 = dc * 4;
	const Sk4x4f dc4x = { Sk4f(dc4[0]), Sk4f(dc4[1]), Sk4f(dc4[2]), Sk4f(dc4[3]) };
	Sk4x4f c4x = Sk4x4f::Transpose(c, c + dc, c + dc * 2, c + dc * 3);

	while (n >= 4) {
	( sk_linear_to_srgb(c4x.r) << 0
	\| sk_linear_to_srgb(c4x.g) << 8
	\| sk_linear_to_srgb(c4x.b) << 16
	\| Sk4f_round(255.0f*c4x.a) << 24).store(dst);

	c4x.r += dc4x.r;
	c4x.g += dc4x.g;
	c4x.b += dc4x.b;
	c4x.a += dc4x.a;

	dst += 4;
	n -= 4;
	}

	if (n & 2) {
	DstTraits<DstType::S32, ApplyPremul::False>
	::store(Sk4f(c4x.r[0], c4x.g[0], c4x.b[0], c4x.a[0]), dst++);
	DstTraits<DstType::S32, ApplyPremul::False>
	::store(Sk4f(c4x.r[1], c4x.g[1], c4x.b[1], c4x.a[1]), dst++);
	}

	if (n & 1) {
	DstTraits<DstType::S32, ApplyPremul::False>
	::store(Sk4f(c4x.r[n & 2], c4x.g[n & 2], c4x.b[n & 2], c4x.a[n & 2]), dst);
	}
	}

	template<SkShader::TileMode>
	SkScalar pinFx(SkScalar);

	template<>
	SkScalar pinFx<SkShader::kClamp_TileMode>(SkScalar fx) {
	return fx;
	}

	template<>
	SkScalar pinFx<SkShader::kRepeat_TileMode>(SkScalar fx) {
	SkScalar f = SkScalarFraction(fx);
	if (f < 0) {
	f = SkTMin(f + 1, nextafterf(1, 0));
	}
	SkASSERT(f >= 0);
	SkASSERT(f < 1.0f);
	return f;
	}

	template<>
	SkScalar pinFx<SkShader::kMirror_TileMode>(SkScalar fx) {
	SkScalar f = SkScalarMod(fx, 2.0f);
	if (f < 0) {
	f = SkTMin(f + 2, nextafterf(2, 0));
	}
	SkASSERT(f >= 0);
	SkASSERT(f < 2.0f);
	return f;
	}

	// true when x is in [k1,k2], or [k2, k1] when the interval is reversed.
	// TODO(fmalita): hoist the reversed interval check out of this helper.
	bool in_range(SkScalar x, SkScalar k1, SkScalar k2) {
	SkASSERT(k1 != k2);
	return (k1 < k2)
	? (x >= k1 && x <= k2)
	: (x >= k2 && x <= k1);
	}

	} // anonymous namespace

	SkLinearGradient::
	LinearGradient4fContext::LinearGradient4fContext(const SkLinearGradient& shader,
	const ContextRec& rec)
	: INHERITED(shader, rec) {

	// Our fast path expects interval points to be monotonically increasing in x.
	const bool reverseIntervals = this->isFast() && std::signbit(fDstToPos.getScaleX());
	fIntervals.init(shader.fOrigColors, shader.fOrigPos, shader.fColorCount, shader.fTileMode,
	fColorsArePremul, rec.fPaint->getAlpha() * (1.0f / 255), reverseIntervals);

	SkASSERT(fIntervals->count() > 0);
	fCachedInterval = fIntervals->begin();
	}

	const Sk4fGradientInterval*
	SkLinearGradient::LinearGradient4fContext::findInterval(SkScalar fx) const {
	SkASSERT(in_range(fx, fIntervals->front().fT0, fIntervals->back().fT1));

	if (1) {
	// Linear search, using the last scanline interval as a starting point.
	SkASSERT(fCachedInterval >= fIntervals->begin());
	SkASSERT(fCachedInterval < fIntervals->end());
	const int search_dir = fDstToPos.getScaleX() >= 0 ? 1 : -1;
	while (!in_range(fx, fCachedInterval->fT0, fCachedInterval->fT1)) {
	fCachedInterval += search_dir;
	if (fCachedInterval >= fIntervals->end()) {
	fCachedInterval = fIntervals->begin();
	} else if (fCachedInterval < fIntervals->begin()) {
	fCachedInterval = fIntervals->end() - 1;
	}
	}
	return fCachedInterval;
	} else {
	// Binary search. Seems less effective than linear + caching.
	const auto* i0 = fIntervals->begin();
	const auto* i1 = fIntervals->end() - 1;

	while (i0 != i1) {
	SkASSERT(i0 < i1);
	SkASSERT(in_range(fx, i0->fT0, i1->fT1));

	const auto* i = i0 + ((i1 - i0) >> 1);

	if (in_range(fx, i0->fT0, i->fT1)) {
	i1 = i;
	} else {
	SkASSERT(in_range(fx, i->fT1, i1->fT1));
	i0 = i + 1;
	}
	}

	SkASSERT(in_range(fx, i0->fT0, i0->fT1));
	return i0;
	}
	}

	void SkLinearGradient::
	LinearGradient4fContext::shadeSpan(int x, int y, SkPMColor dst[], int count) {
	if (!this->isFast()) {
	this->INHERITED::shadeSpan(x, y, dst, count);
	return;
	}

	// TODO: plumb dithering
	SkASSERT(count > 0);
	if (fColorsArePremul) {
	this->shadePremulSpan<DstType::L32,
	ApplyPremul::False>(x, y, dst, count);
	} else {
	this->shadePremulSpan<DstType::L32,
	ApplyPremul::True>(x, y, dst, count);
	}
	}

	void SkLinearGradient::
	LinearGradient4fContext::shadeSpan4f(int x, int y, SkPM4f dst[], int count) {
	if (!this->isFast()) {
	this->INHERITED::shadeSpan4f(x, y, dst, count);
	return;
	}

	// TONOTDO: plumb dithering
	SkASSERT(count > 0);
	if (fColorsArePremul) {
	this->shadePremulSpan<DstType::F32,
	ApplyPremul::False>(x, y, dst, count);
	} else {
	this->shadePremulSpan<DstType::F32,
	ApplyPremul::True>(x, y, dst, count);
	}
	}

	template<DstType dstType, ApplyPremul premul>
	void SkLinearGradient::
	LinearGradient4fContext::shadePremulSpan(int x, int y,
	typename DstTraits<dstType, premul>::Type dst[],
	int count) const {
	const SkLinearGradient& shader =
	static_cast<const SkLinearGradient&>(fShader);
	switch (shader.fTileMode) {
	case kClamp_TileMode:
	this->shadeSpanInternal<dstType,
	premul,
	kClamp_TileMode>(x, y, dst, count);
	break;
	case kRepeat_TileMode:
	this->shadeSpanInternal<dstType,
	premul,
	kRepeat_TileMode>(x, y, dst, count);
	break;
	case kMirror_TileMode:
	this->shadeSpanInternal<dstType,
	premul,
	kMirror_TileMode>(x, y, dst, count);
	break;
	}
	}

	template<DstType dstType, ApplyPremul premul, SkShader::TileMode tileMode>
	void SkLinearGradient::
	LinearGradient4fContext::shadeSpanInternal(int x, int y,
	typename DstTraits<dstType, premul>::Type dst[],
	int count) const {
	SkPoint pt;
	fDstToPosProc(fDstToPos,
	x + SK_ScalarHalf,
	y + SK_ScalarHalf,
	&pt);
	const SkScalar fx = pinFx<tileMode>(pt.x());
	const SkScalar dx = fDstToPos.getScaleX();
	LinearIntervalProcessor<dstType, premul, tileMode> proc(fIntervals->begin(),
	fIntervals->end() - 1,
	this->findInterval(fx),
	fx,
	dx,
	SkScalarNearlyZero(dx * count));
	while (count > 0) {
	// What we really want here is SkTPin(advance, 1, count)
	// but that's a significant perf hit for >> stops; investigate.
	const int n = SkScalarTruncToInt(
	SkTMin<SkScalar>(proc.currentAdvance() + 1, SkIntToScalar(count)));

	// The current interval advance can be +inf (e.g. when reaching
	// the clamp mode end intervals) - when that happens, we expect to
	// a) consume all remaining count in one swoop
	// b) return a zero color gradient
	SkASSERT(SkScalarIsFinite(proc.currentAdvance())
	\|\| (n == count && proc.currentRampIsZero()));

	if (proc.currentRampIsZero()) {
	DstTraits<dstType, premul>::store(proc.currentColor(),
	dst, n);
	} else {
	ramp<dstType, premul>(proc.currentColor(),
	proc.currentColorGrad(),
	dst, n);
	}

	proc.advance(SkIntToScalar(n));
	count -= n;
	dst += n;
	}
	}

	template<DstType dstType, ApplyPremul premul, SkShader::TileMode tileMode>
	class SkLinearGradient::
	LinearGradient4fContext::LinearIntervalProcessor {
	public:
	LinearIntervalProcessor(const Sk4fGradientInterval* firstInterval,
	const Sk4fGradientInterval* lastInterval,
	const Sk4fGradientInterval* i,
	SkScalar fx,
	SkScalar dx,
	bool is_vertical)
	: fAdvX(is_vertical ? SK_ScalarInfinity : (i->fT1 - fx) / dx)
	, fFirstInterval(firstInterval)
	, fLastInterval(lastInterval)
	, fInterval(i)
	, fDx(dx)
	, fIsVertical(is_vertical)
	{
	SkASSERT(fAdvX >= 0);
	SkASSERT(firstInterval <= lastInterval);

	if (tileMode != kClamp_TileMode && !is_vertical) {
	const auto spanX = (lastInterval->fT1 - firstInterval->fT0) / dx;
	SkASSERT(spanX >= 0);

	// If we're in a repeating tile mode and the whole gradient is compressed into a
	// fraction of a pixel, we just use the average color in zero-ramp mode.
	// This also avoids cases where we make no progress due to interval advances being
	// close to zero.
	static constexpr SkScalar kMinSpanX = .25f;
	if (spanX < kMinSpanX) {
	this->init_average_props();
	return;
	}
	}

	this->compute_interval_props(fx);
	}

	SkScalar currentAdvance() const {
	SkASSERT(fAdvX >= 0);
	SkASSERT(fAdvX <= (fInterval->fT1 - fInterval->fT0) / fDx \|\| !std::isfinite(fAdvX));
	return fAdvX;
	}

	bool currentRampIsZero() const { return fZeroRamp; }
	const Sk4f& currentColor() const { return fCc; }
	const Sk4f& currentColorGrad() const { return fDcDx; }

	void advance(SkScalar advX) {
	SkASSERT(advX > 0);
	SkASSERT(fAdvX >= 0);

	if (advX >= fAdvX) {
	advX = this->advance_interval(advX);
	}
	SkASSERT(advX < fAdvX);

	fCc = fCc + fDcDx * Sk4f(advX);
	fAdvX -= advX;
	}

	private:
	void compute_interval_props(SkScalar t) {
	SkASSERT(in_range(t, fInterval->fT0, fInterval->fT1));

	const Sk4f dc = DstTraits<dstType, premul>::load(fInterval->fCg);
	fCc = DstTraits<dstType, premul>::load(fInterval->fCb) + dc * Sk4f(t);
	fDcDx = dc * fDx;
	fZeroRamp = fIsVertical \|\| (dc == 0).allTrue();
	}

	void init_average_props() {
	fAdvX = SK_ScalarInfinity;
	fZeroRamp = true;
	fDcDx = 0;
	fCc = Sk4f(0);

	// TODO: precompute the average at interval setup time?
	for (const auto* i = fFirstInterval; i <= fLastInterval; ++i) {
	// Each interval contributes its average color to the total/weighted average:
	//
	// C = (c0 + c1) / 2 = (Cb + Cg * t0 + Cb + Cg * t1) / 2 = Cb + Cg *(t0 + t1) / 2
	//
	// Avg += C * (t1 - t0)
	//
	const auto c = DstTraits<dstType, premul>::load(i->fCb)
	+ DstTraits<dstType, premul>::load(i->fCg) * (i->fT0 + i->fT1) * 0.5f;
	fCc = fCc + c * (i->fT1 - i->fT0);
	}
	}

	const Sk4fGradientInterval* next_interval(const Sk4fGradientInterval* i) const {
	SkASSERT(i >= fFirstInterval);
	SkASSERT(i <= fLastInterval);
	i++;

	if (tileMode == kClamp_TileMode) {
	SkASSERT(i <= fLastInterval);
	return i;
	}

	return (i <= fLastInterval) ? i : fFirstInterval;
	}

	SkScalar advance_interval(SkScalar advX) {
	SkASSERT(advX >= fAdvX);

	do {
	advX -= fAdvX;
	fInterval = this->next_interval(fInterval);
	fAdvX = (fInterval->fT1 - fInterval->fT0) / fDx;
	SkASSERT(fAdvX > 0);
	} while (advX >= fAdvX);

	compute_interval_props(fInterval->fT0);

	SkASSERT(advX >= 0);
	return advX;
	}

	// Current interval properties.
	Sk4f fDcDx; // dst color gradient (dc/dx)
	Sk4f fCc; // current color, interpolated in dst
	SkScalar fAdvX; // remaining interval advance in dst
	bool fZeroRamp; // current interval color grad is 0

	const Sk4fGradientInterval* fFirstInterval;
	const Sk4fGradientInterval* fLastInterval;
	const Sk4fGradientInterval* fInterval; // current interval
	const SkScalar fDx; // 'dx' for consistency with other impls; actually dt/dx
	const bool fIsVertical;
	};

	void SkLinearGradient::
	LinearGradient4fContext::mapTs(int x, int y, SkScalar ts[], int count) const {
	SkASSERT(count > 0);
	SkASSERT(fDstToPosClass != kLinear_MatrixClass);

	SkScalar sx = x + SK_ScalarHalf;
	const SkScalar sy = y + SK_ScalarHalf;
	SkPoint pt;

	if (fDstToPosClass != kPerspective_MatrixClass) {
	// kLinear_MatrixClass, kFixedStepInX_MatrixClass => fixed dt per scanline
	const SkScalar dtdx = fDstToPos.fixedStepInX(sy).x();
	fDstToPosProc(fDstToPos, sx, sy, &pt);

	const Sk4f dtdx4 = Sk4f(4 * dtdx);
	Sk4f t4 = Sk4f(pt.x() + 0 * dtdx,
	pt.x() + 1 * dtdx,
	pt.x() + 2 * dtdx,
	pt.x() + 3 * dtdx);

	while (count >= 4) {
	t4.store(ts);
	t4 = t4 + dtdx4;
	ts += 4;
	count -= 4;
	}

	if (count & 2) {
	*ts++ = t4[0];
	*ts++ = t4[1];
	t4 = SkNx_shuffle<2, 0, 1, 3>(t4);
	}

	if (count & 1) {
	*ts++ = t4[0];
	}
	} else {
	for (int i = 0; i < count; ++i) {
	fDstToPosProc(fDstToPos, sx, sy, &pt);
	// Perspective may yield NaN values.
	// Short of a better idea, drop to 0.
	ts[i] = SkScalarIsNaN(pt.x()) ? 0 : pt.x();
	sx += SK_Scalar1;
	}
	}
	}

	bool SkLinearGradient::LinearGradient4fContext::onChooseBlitProcs(const SkImageInfo& info,
	BlitState* state) {
	if (state->fMode != SkBlendMode::kSrc &&
	!(state->fMode == SkBlendMode::kSrcOver && (fFlags & kOpaqueAlpha_Flag))) {
	return false;
	}

	switch (info.colorType()) {
	case kN32_SkColorType:
	state->fBlitBW = D32_BlitBW;
	return true;
	case kRGBA_F16_SkColorType:
	state->fBlitBW = D64_BlitBW;
	return true;
	default:
	return false;
	}
	}

	void SkLinearGradient::
	LinearGradient4fContext::D32_BlitBW(BlitState* state, int x, int y, const SkPixmap& dst,
	int count) {
	// FIXME: ignoring coverage for now
	const LinearGradient4fContext* ctx =
	static_cast<const LinearGradient4fContext*>(state->fCtx);

	if (!dst.info().gammaCloseToSRGB()) {
	if (ctx->fColorsArePremul) {
	ctx->shadePremulSpan<DstType::L32, ApplyPremul::False>(
	x, y, dst.writable_addr32(x, y), count);
	} else {
	ctx->shadePremulSpan<DstType::L32, ApplyPremul::True>(
	x, y, dst.writable_addr32(x, y), count);
	}
	} else {
	if (ctx->fColorsArePremul) {
	ctx->shadePremulSpan<DstType::S32, ApplyPremul::False>(
	x, y, dst.writable_addr32(x, y), count);
	} else {
	ctx->shadePremulSpan<DstType::S32, ApplyPremul::True>(
	x, y, dst.writable_addr32(x, y), count);
	}
	}
	}

	void SkLinearGradient::
	LinearGradient4fContext::D64_BlitBW(BlitState* state, int x, int y, const SkPixmap& dst,
	int count) {
	// FIXME: ignoring coverage for now
	const LinearGradient4fContext* ctx =
	static_cast<const LinearGradient4fContext*>(state->fCtx);

	if (ctx->fColorsArePremul) {
	ctx->shadePremulSpan<DstType::F16, ApplyPremul::False>(
	x, y, dst.writable_addr64(x, y), count);
	} else {
	ctx->shadePremulSpan<DstType::F16, ApplyPremul::True>(
	x, y, dst.writable_addr64(x, y), count);
	}
	}