blob: 184e93335e3f907dac915425fea921e48ee3fb6b [file] [log] [blame]
herbcc49e592016-05-17 09:57:34 -07001/*
2 * Copyright 2016 Google Inc.
3 *
4 * Use of this source code is governed by a BSD-style license that can be
5 * found in the LICENSE file.
6 */
7
8#include <tuple>
9
10#include "Benchmark.h"
11#include "Resources.h"
12#include "SkCpu.h"
13#include "SkImage.h"
14#include "SkImage_Base.h"
15#include "SkNx.h"
16#include "SkOpts.h"
herb2edf0c62016-07-12 15:00:46 -070017#include "SkPM4fPriv.h"
herbcc49e592016-05-17 09:57:34 -070018#include "SkString.h"
19
20#define INNER_LOOPS 10
21
mtklein0c902472016-07-20 18:10:07 -070022static inline void brute_srcover_srgb_srgb_1(uint32_t* dst, uint32_t src) {
23 auto d = Sk4f_fromS32(*dst),
24 s = Sk4f_fromS32( src);
25 *dst = Sk4f_toS32(s + d * (1.0f - s[3]));
26}
27
28static inline void srcover_srgb_srgb_1(uint32_t* dst, uint32_t src) {
29 if (src >= 0xFF000000) {
30 *dst = src;
31 return;
32 }
33 brute_srcover_srgb_srgb_1(dst, src);
34}
35
herb2edf0c62016-07-12 15:00:46 -070036static void brute_force_srcover_srgb_srgb(
37 uint32_t* dst, const uint32_t* const src, int ndst, const int nsrc) {
38 while (ndst > 0) {
39 int n = SkTMin(ndst, nsrc);
40
41 for (int i = 0; i < n; i++) {
mtklein0c902472016-07-20 18:10:07 -070042 brute_srcover_srgb_srgb_1(dst++, src[i]);
43 }
44 ndst -= n;
45 }
46}
47
48static void trivial_srcover_srgb_srgb(
49 uint32_t* dst, const uint32_t* const src, int ndst, const int nsrc) {
50 while (ndst > 0) {
51 int n = SkTMin(ndst, nsrc);
52
53 for (int i = 0; i < n; i++) {
54 srcover_srgb_srgb_1(dst++, src[i]);
herb2edf0c62016-07-12 15:00:46 -070055 }
56 ndst -= n;
57 }
58}
59
60static void best_non_simd_srcover_srgb_srgb(
61 uint32_t* dst, const uint32_t* const src, int ndst, const int nsrc) {
62 uint64_t* ddst = reinterpret_cast<uint64_t*>(dst);
63
64 auto srcover_srgb_srgb_2 = [](uint32_t* dst, const uint32_t* src) {
mtklein0c902472016-07-20 18:10:07 -070065 srcover_srgb_srgb_1(dst++, *src++);
66 srcover_srgb_srgb_1(dst, *src);
herb2edf0c62016-07-12 15:00:46 -070067 };
68
69 while (ndst >0) {
70 int count = SkTMin(ndst, nsrc);
71 ndst -= count;
72 const uint64_t* dsrc = reinterpret_cast<const uint64_t*>(src);
73 const uint64_t* end = dsrc + (count >> 1);
74 do {
75 if ((~*dsrc & 0xFF000000FF000000) == 0) {
76 do {
77 *ddst++ = *dsrc++;
78 } while (dsrc < end && (~*dsrc & 0xFF000000FF000000) == 0);
79 } else if ((*dsrc & 0xFF000000FF000000) == 0) {
80 do {
81 dsrc++;
82 ddst++;
83 } while (dsrc < end && (*dsrc & 0xFF000000FF000000) == 0);
84 } else {
85 srcover_srgb_srgb_2(reinterpret_cast<uint32_t*>(ddst++),
86 reinterpret_cast<const uint32_t*>(dsrc++));
87 }
88 } while (dsrc < end);
89
90 if ((count & 1) != 0) {
mtklein0c902472016-07-20 18:10:07 -070091 srcover_srgb_srgb_1(reinterpret_cast<uint32_t*>(ddst),
92 *reinterpret_cast<const uint32_t*>(dsrc));
herb2edf0c62016-07-12 15:00:46 -070093 }
94 }
95}
96
herbcc49e592016-05-17 09:57:34 -070097class SrcOverVSkOptsBruteForce {
98public:
99 static SkString Name() { return SkString{"VSkOptsBruteForce"}; }
herb2edf0c62016-07-12 15:00:46 -0700100 static void BlendN(uint32_t* dst, const uint32_t* src, int count) {
101 brute_force_srcover_srgb_srgb(dst, src, count, count);
herbcc49e592016-05-17 09:57:34 -0700102 }
103};
104
herbcc49e592016-05-17 09:57:34 -0700105class SrcOverVSkOptsTrivial {
106public:
107 static SkString Name() { return SkString{"VSkOptsTrivial"}; }
herb2edf0c62016-07-12 15:00:46 -0700108 static void BlendN(uint32_t* dst, const uint32_t* src, int count) {
109 trivial_srcover_srgb_srgb(dst, src, count, count);
herbcc49e592016-05-17 09:57:34 -0700110 }
111};
112
herbcc49e592016-05-17 09:57:34 -0700113class SrcOverVSkOptsNonSimdCore {
114public:
115 static SkString Name() { return SkString{"VSkOptsNonSimdCore"}; }
herb2edf0c62016-07-12 15:00:46 -0700116 static void BlendN(uint32_t* dst, const uint32_t* src, int count) {
117 best_non_simd_srcover_srgb_srgb(dst, src, count, count);
herbcc49e592016-05-17 09:57:34 -0700118 }
119};
120
herbcc49e592016-05-17 09:57:34 -0700121class SrcOverVSkOptsDefault {
122public:
123 static SkString Name() { return SkString{"VSkOptsDefault"}; }
herb2edf0c62016-07-12 15:00:46 -0700124 static void BlendN(uint32_t* dst, const uint32_t* src, int count) {
mtklein0358a6a2016-07-13 08:02:20 -0700125 SkOpts::srcover_srgb_srgb(dst, src, count, count);
herbcc49e592016-05-17 09:57:34 -0700126 }
127};
128
129///////////////////////////////////////////////////////////////////////////////////////////////////
130
131template <typename Blender>
132class LinearSrcOverBench : public Benchmark {
133public:
bsalomon809f2582016-05-20 08:54:23 -0700134 LinearSrcOverBench(const char* fileName) : fFileName(fileName) {
herb2edf0c62016-07-12 15:00:46 -0700135 fName = "LinearSrcOver_";
herbcc49e592016-05-17 09:57:34 -0700136 fName.append(fileName);
137 fName.append(Blender::Name());
herbcc49e592016-05-17 09:57:34 -0700138 }
139
140protected:
mtklein0358a6a2016-07-13 08:02:20 -0700141 bool isSuitableFor(Backend backend) override { return backend == kNonRendering_Backend; }
herbcc49e592016-05-17 09:57:34 -0700142 const char* onGetName() override { return fName.c_str(); }
bsalomon809f2582016-05-20 08:54:23 -0700143
144 void onPreDraw(SkCanvas*) override {
145 if (!fPixmap.addr()) {
146 sk_sp<SkImage> image = GetResourceAsImage(fFileName.c_str());
147 SkBitmap bm;
148 if (!as_IB(image)->getROPixels(&bm)) {
149 SkFAIL("Could not read resource");
150 }
151 bm.peekPixels(&fPixmap);
152 fCount = fPixmap.rowBytesAsPixels();
153 fDst.reset(fCount);
herb2edf0c62016-07-12 15:00:46 -0700154 sk_bzero(fDst.get(), fPixmap.rowBytes());
bsalomon809f2582016-05-20 08:54:23 -0700155 }
156 }
157
herbcc49e592016-05-17 09:57:34 -0700158 void onDraw(int loops, SkCanvas*) override {
159 SkASSERT(fPixmap.colorType() == kN32_SkColorType);
160
161 const int width = fPixmap.rowBytesAsPixels();
162
163 for (int i = 0; i < loops * INNER_LOOPS; ++i) {
164 const uint32_t* src = fPixmap.addr32();
165 for (int y = 0; y < fPixmap.height(); y++) {
herb2edf0c62016-07-12 15:00:46 -0700166 Blender::BlendN(fDst.get(), src, width);
herbcc49e592016-05-17 09:57:34 -0700167 src += width;
168 }
169 }
170 }
171
172 void onPostDraw(SkCanvas*) override {
173 // Make sure the compiler does not optimize away the operation.
174 volatile uint32_t v = 0;
175 for (int i = 0; i < fCount; i++) {
176 v ^= fDst[i];
177 }
178 }
179
180private:
181 int fCount;
182 SkAutoTArray<uint32_t> fDst;
bsalomon809f2582016-05-20 08:54:23 -0700183 SkString fFileName;
herbcc49e592016-05-17 09:57:34 -0700184 SkString fName;
185 SkPixmap fPixmap;
186
187 typedef Benchmark INHERITED;
188};
189
mtklein0358a6a2016-07-13 08:02:20 -0700190#define BENCHES(fileName) \
191 DEF_BENCH( return new LinearSrcOverBench<SrcOverVSkOptsBruteForce>(fileName); ) \
192 DEF_BENCH( return new LinearSrcOverBench<SrcOverVSkOptsTrivial>(fileName); ) \
193 DEF_BENCH( return new LinearSrcOverBench<SrcOverVSkOptsNonSimdCore>(fileName); ) \
194 DEF_BENCH( return new LinearSrcOverBench<SrcOverVSkOptsDefault>(fileName); )
herbcc49e592016-05-17 09:57:34 -0700195
196BENCHES("yellow_rose.png")
197BENCHES("baby_tux.png")
198BENCHES("plane.png")
199BENCHES("mandrill_512.png")
200BENCHES("iconstrip.png")