mtklein | 15391ee | 2015-03-25 13:43:34 -0700 | [diff] [blame^] | 1 | /* |
| 2 | * Copyright 2015 Google Inc. |
| 3 | * |
| 4 | * Use of this source code is governed by a BSD-style license that can be |
| 5 | * found in the LICENSE file. |
| 6 | */ |
| 7 | |
mtklein | a2f4be7 | 2015-02-23 10:04:34 -0800 | [diff] [blame] | 8 | #include "Benchmark.h" |
| 9 | #include "SkPMFloat.h" |
mtklein | 60ff458 | 2015-03-03 08:03:27 -0800 | [diff] [blame] | 10 | |
| 11 | // Used to prevent the compiler from optimizing away the whole loop. |
| 12 | volatile uint32_t blackhole = 0; |
| 13 | |
| 14 | // Not a great random number generator, but it's very fast. |
| 15 | // The code we're measuring is quite fast, so low overhead is essential. |
| 16 | static uint32_t lcg_rand(uint32_t* seed) { |
| 17 | *seed *= 1664525; |
| 18 | *seed += 1013904223; |
| 19 | return *seed; |
| 20 | } |
mtklein | a2f4be7 | 2015-02-23 10:04:34 -0800 | [diff] [blame] | 21 | |
mtklein | 548bf38 | 2015-03-05 11:31:59 -0800 | [diff] [blame] | 22 | // I'm having better luck getting these to constant-propagate away as template parameters. |
| 23 | template <bool kClamp, bool kWide> |
mtklein | a2f4be7 | 2015-02-23 10:04:34 -0800 | [diff] [blame] | 24 | struct PMFloatBench : public Benchmark { |
mtklein | 548bf38 | 2015-03-05 11:31:59 -0800 | [diff] [blame] | 25 | PMFloatBench() {} |
mtklein | a2f4be7 | 2015-02-23 10:04:34 -0800 | [diff] [blame] | 26 | |
mtklein | 548bf38 | 2015-03-05 11:31:59 -0800 | [diff] [blame] | 27 | const char* onGetName() SK_OVERRIDE { |
| 28 | switch (kClamp << 1 | kWide) { |
| 29 | case 0: return "SkPMFloat_get_1x"; |
| 30 | case 1: return "SkPMFloat_get_4x"; |
| 31 | case 2: return "SkPMFloat_clamp_1x"; |
| 32 | case 3: return "SkPMFloat_clamp_4x"; |
| 33 | } |
| 34 | SkFAIL("unreachable"); |
| 35 | return "oh bother"; |
| 36 | } |
mtklein | a2f4be7 | 2015-02-23 10:04:34 -0800 | [diff] [blame] | 37 | bool isSuitableFor(Backend backend) SK_OVERRIDE { return backend == kNonRendering_Backend; } |
| 38 | |
| 39 | void onDraw(const int loops, SkCanvas* canvas) SK_OVERRIDE { |
mtklein | 60ff458 | 2015-03-03 08:03:27 -0800 | [diff] [blame] | 40 | // Unlike blackhole, junk can and probably will be a register. |
| 41 | uint32_t junk = 0; |
| 42 | uint32_t seed = 0; |
mtklein | a2f4be7 | 2015-02-23 10:04:34 -0800 | [diff] [blame] | 43 | for (int i = 0; i < loops; i++) { |
mtklein | 548bf38 | 2015-03-05 11:31:59 -0800 | [diff] [blame] | 44 | SkPMColor colors[4]; |
mtklein | 60ff458 | 2015-03-03 08:03:27 -0800 | [diff] [blame] | 45 | #ifdef SK_DEBUG |
mtklein | 548bf38 | 2015-03-05 11:31:59 -0800 | [diff] [blame] | 46 | for (int i = 0; i < 4; i++) { |
| 47 | // Our SkASSERTs will remind us that it's technically required that we premultiply. |
| 48 | colors[i] = SkPreMultiplyColor(lcg_rand(&seed)); |
| 49 | } |
mtklein | 60ff458 | 2015-03-03 08:03:27 -0800 | [diff] [blame] | 50 | #else |
| 51 | // But it's a lot faster not to, and this code won't really mind the non-PM colors. |
mtklein | 548bf38 | 2015-03-05 11:31:59 -0800 | [diff] [blame] | 52 | (void)lcg_rand(&seed); |
| 53 | colors[0] = seed + 0; |
| 54 | colors[1] = seed + 1; |
| 55 | colors[2] = seed + 2; |
| 56 | colors[3] = seed + 3; |
mtklein | 60ff458 | 2015-03-03 08:03:27 -0800 | [diff] [blame] | 57 | #endif |
mtklein | 548bf38 | 2015-03-05 11:31:59 -0800 | [diff] [blame] | 58 | |
mtklein | 15391ee | 2015-03-25 13:43:34 -0700 | [diff] [blame^] | 59 | SkPMFloat fa,fb,fc,fd; |
mtklein | 548bf38 | 2015-03-05 11:31:59 -0800 | [diff] [blame] | 60 | if (kWide) { |
mtklein | 15391ee | 2015-03-25 13:43:34 -0700 | [diff] [blame^] | 61 | SkPMFloat::From4PMColors(colors, &fa, &fb, &fc, &fd); |
mtklein | 548bf38 | 2015-03-05 11:31:59 -0800 | [diff] [blame] | 62 | } else { |
mtklein | 15391ee | 2015-03-25 13:43:34 -0700 | [diff] [blame^] | 63 | fa = SkPMFloat::FromPMColor(colors[0]); |
| 64 | fb = SkPMFloat::FromPMColor(colors[1]); |
| 65 | fc = SkPMFloat::FromPMColor(colors[2]); |
| 66 | fd = SkPMFloat::FromPMColor(colors[3]); |
mtklein | 548bf38 | 2015-03-05 11:31:59 -0800 | [diff] [blame] | 67 | } |
| 68 | |
| 69 | SkPMColor back[4]; |
| 70 | switch (kClamp << 1 | kWide) { |
mtklein | 15391ee | 2015-03-25 13:43:34 -0700 | [diff] [blame^] | 71 | case 0: { |
| 72 | back[0] = fa.get(); |
| 73 | back[1] = fb.get(); |
| 74 | back[2] = fc.get(); |
| 75 | back[3] = fd.get(); |
| 76 | } break; |
| 77 | case 1: SkPMFloat::To4PMColors(fa, fb, fc, fd, back); break; |
| 78 | case 2: { |
| 79 | back[0] = fa.clamped(); |
| 80 | back[1] = fb.clamped(); |
| 81 | back[2] = fc.clamped(); |
| 82 | back[3] = fd.clamped(); |
| 83 | } break; |
| 84 | case 3: SkPMFloat::ClampTo4PMColors(fa, fb, fc, fd, back); break; |
mtklein | 548bf38 | 2015-03-05 11:31:59 -0800 | [diff] [blame] | 85 | } |
| 86 | for (int i = 0; i < 4; i++) { |
| 87 | junk ^= back[i]; |
| 88 | } |
mtklein | a2f4be7 | 2015-02-23 10:04:34 -0800 | [diff] [blame] | 89 | } |
mtklein | 60ff458 | 2015-03-03 08:03:27 -0800 | [diff] [blame] | 90 | blackhole ^= junk; |
mtklein | a2f4be7 | 2015-02-23 10:04:34 -0800 | [diff] [blame] | 91 | } |
mtklein | a2f4be7 | 2015-02-23 10:04:34 -0800 | [diff] [blame] | 92 | }; |
mtklein | 548bf38 | 2015-03-05 11:31:59 -0800 | [diff] [blame] | 93 | |
| 94 | // Extra () help DEF_BENCH not get confused by the comma inside the <>. |
| 95 | DEF_BENCH(return (new PMFloatBench< true, true>);) |
| 96 | DEF_BENCH(return (new PMFloatBench<false, true>);) |
| 97 | DEF_BENCH(return (new PMFloatBench< true, false>);) |
| 98 | DEF_BENCH(return (new PMFloatBench<false, false>);) |