mtklein | a2f4be7 | 2015-02-23 10:04:34 -0800 | [diff] [blame] | 1 | #include "Benchmark.h" |
| 2 | #include "SkPMFloat.h" |
mtklein | 60ff458 | 2015-03-03 08:03:27 -0800 | [diff] [blame] | 3 | |
// Global sink for benchmark results.  Being volatile, the write to it cannot
// be elided, which keeps the compiler from optimizing away the whole loop.
volatile uint32_t blackhole = 0;
| 6 | |
// Tiny linear congruential generator: advances *seed in place and returns the
// new value.  It is not a great random number generator, but it is very fast,
// and the code being measured is quick enough that low overhead is essential.
static uint32_t lcg_rand(uint32_t* seed) {
    const uint32_t next = *seed * 1664525u + 1013904223u;
    *seed = next;
    return next;
}
mtklein | a2f4be7 | 2015-02-23 10:04:34 -0800 | [diff] [blame] | 14 | |
mtklein | 548bf38 | 2015-03-05 11:31:59 -0800 | [diff] [blame^] | 15 | // I'm having better luck getting these to constant-propagate away as template parameters. |
| 16 | template <bool kClamp, bool kWide> |
mtklein | a2f4be7 | 2015-02-23 10:04:34 -0800 | [diff] [blame] | 17 | struct PMFloatBench : public Benchmark { |
mtklein | 548bf38 | 2015-03-05 11:31:59 -0800 | [diff] [blame^] | 18 | PMFloatBench() {} |
mtklein | a2f4be7 | 2015-02-23 10:04:34 -0800 | [diff] [blame] | 19 | |
mtklein | 548bf38 | 2015-03-05 11:31:59 -0800 | [diff] [blame^] | 20 | const char* onGetName() SK_OVERRIDE { |
| 21 | switch (kClamp << 1 | kWide) { |
| 22 | case 0: return "SkPMFloat_get_1x"; |
| 23 | case 1: return "SkPMFloat_get_4x"; |
| 24 | case 2: return "SkPMFloat_clamp_1x"; |
| 25 | case 3: return "SkPMFloat_clamp_4x"; |
| 26 | } |
| 27 | SkFAIL("unreachable"); |
| 28 | return "oh bother"; |
| 29 | } |
mtklein | a2f4be7 | 2015-02-23 10:04:34 -0800 | [diff] [blame] | 30 | bool isSuitableFor(Backend backend) SK_OVERRIDE { return backend == kNonRendering_Backend; } |
| 31 | |
| 32 | void onDraw(const int loops, SkCanvas* canvas) SK_OVERRIDE { |
mtklein | 60ff458 | 2015-03-03 08:03:27 -0800 | [diff] [blame] | 33 | // Unlike blackhole, junk can and probably will be a register. |
| 34 | uint32_t junk = 0; |
| 35 | uint32_t seed = 0; |
mtklein | a2f4be7 | 2015-02-23 10:04:34 -0800 | [diff] [blame] | 36 | for (int i = 0; i < loops; i++) { |
mtklein | 548bf38 | 2015-03-05 11:31:59 -0800 | [diff] [blame^] | 37 | SkPMColor colors[4]; |
mtklein | 60ff458 | 2015-03-03 08:03:27 -0800 | [diff] [blame] | 38 | #ifdef SK_DEBUG |
mtklein | 548bf38 | 2015-03-05 11:31:59 -0800 | [diff] [blame^] | 39 | for (int i = 0; i < 4; i++) { |
| 40 | // Our SkASSERTs will remind us that it's technically required that we premultiply. |
| 41 | colors[i] = SkPreMultiplyColor(lcg_rand(&seed)); |
| 42 | } |
mtklein | 60ff458 | 2015-03-03 08:03:27 -0800 | [diff] [blame] | 43 | #else |
| 44 | // But it's a lot faster not to, and this code won't really mind the non-PM colors. |
mtklein | 548bf38 | 2015-03-05 11:31:59 -0800 | [diff] [blame^] | 45 | (void)lcg_rand(&seed); |
| 46 | colors[0] = seed + 0; |
| 47 | colors[1] = seed + 1; |
| 48 | colors[2] = seed + 2; |
| 49 | colors[3] = seed + 3; |
mtklein | 60ff458 | 2015-03-03 08:03:27 -0800 | [diff] [blame] | 50 | #endif |
mtklein | 548bf38 | 2015-03-05 11:31:59 -0800 | [diff] [blame^] | 51 | |
| 52 | SkPMFloat floats[4]; |
| 53 | if (kWide) { |
| 54 | SkPMFloat::From4PMColors(floats, colors); |
| 55 | } else { |
| 56 | for (int i = 0; i < 4; i++) { |
| 57 | floats[i] = SkPMFloat::FromPMColor(colors[i]); |
| 58 | } |
| 59 | } |
| 60 | |
| 61 | SkPMColor back[4]; |
| 62 | switch (kClamp << 1 | kWide) { |
| 63 | case 0: for (int i = 0; i < 4; i++) { back[i] = floats[i].get(); } break; |
| 64 | case 1: SkPMFloat::To4PMColors(back, floats); break; |
| 65 | case 2: for (int i = 0; i < 4; i++) { back[i] = floats[i].clamped(); } break; |
| 66 | case 3: SkPMFloat::ClampTo4PMColors(back, floats); break; |
| 67 | } |
| 68 | for (int i = 0; i < 4; i++) { |
| 69 | junk ^= back[i]; |
| 70 | } |
mtklein | a2f4be7 | 2015-02-23 10:04:34 -0800 | [diff] [blame] | 71 | } |
mtklein | 60ff458 | 2015-03-03 08:03:27 -0800 | [diff] [blame] | 72 | blackhole ^= junk; |
mtklein | a2f4be7 | 2015-02-23 10:04:34 -0800 | [diff] [blame] | 73 | } |
mtklein | a2f4be7 | 2015-02-23 10:04:34 -0800 | [diff] [blame] | 74 | }; |
mtklein | 548bf38 | 2015-03-05 11:31:59 -0800 | [diff] [blame^] | 75 | |
| 76 | // Extra () help DEF_BENCH not get confused by the comma inside the <>. |
| 77 | DEF_BENCH(return (new PMFloatBench< true, true>);) |
| 78 | DEF_BENCH(return (new PMFloatBench<false, true>);) |
| 79 | DEF_BENCH(return (new PMFloatBench< true, false>);) |
| 80 | DEF_BENCH(return (new PMFloatBench<false, false>);) |