blob: b5b7f81bbfc5feea2c252c1e103353e92b159efe [file] [log] [blame]
/*
* Copyright 2016 Google Inc.
*
* Use of this source code is governed by a BSD-style license that can be
* found in the LICENSE file.
*/
#ifndef SkColorXform_opts_DEFINED
#define SkColorXform_opts_DEFINED
#include "SkNx.h"
#include "SkColorPriv.h"
#include "SkHalf.h"
#include "SkSRGB.h"
#include "SkTemplates.h"
namespace SK_OPTS_NS {
// Strange that we need a wrapper on SkNx_cast to use as a function ptr.
static Sk4i Sk4f_trunc(const Sk4f& x) {
return SkNx_cast<int>(x);
}
static Sk4f linear_to_2dot2(const Sk4f& x) {
// x^(29/64) is a very good approximation of the true value, x^(1/2.2).
auto x2 = x.rsqrt(), // x^(-1/2)
x32 = x2.rsqrt().rsqrt().rsqrt().rsqrt(), // x^(-1/32)
x64 = x32.rsqrt(); // x^(+1/64)
// 29 = 32 - 2 - 1
return 255.0f * x2.invert() * x32 * x64.invert();
}
enum DstGamma {
// 8888
kSRGB_DstGamma,
k2Dot2_DstGamma,
kTable_DstGamma,
// F16
kLinear_DstGamma,
};
template <DstGamma kDstGamma>
static void color_xform_RGB1(void* dst, const uint32_t* src, int len,
const float* const srcTables[3], const float matrix[16],
const uint8_t* const dstTables[3]) {
Sk4f rXgXbX = Sk4f::Load(matrix + 0),
rYgYbY = Sk4f::Load(matrix + 4),
rZgZbZ = Sk4f::Load(matrix + 8),
rTgTbT = Sk4f::Load(matrix + 12);
if (len >= 4) {
Sk4f reds, greens, blues;
auto load_next_4 = [&reds, &greens, &blues, &src, &len, &srcTables] {
reds = Sk4f{srcTables[0][(src[0] >> 0) & 0xFF],
srcTables[0][(src[1] >> 0) & 0xFF],
srcTables[0][(src[2] >> 0) & 0xFF],
srcTables[0][(src[3] >> 0) & 0xFF]};
greens = Sk4f{srcTables[1][(src[0] >> 8) & 0xFF],
srcTables[1][(src[1] >> 8) & 0xFF],
srcTables[1][(src[2] >> 8) & 0xFF],
srcTables[1][(src[3] >> 8) & 0xFF]};
blues = Sk4f{srcTables[2][(src[0] >> 16) & 0xFF],
srcTables[2][(src[1] >> 16) & 0xFF],
srcTables[2][(src[2] >> 16) & 0xFF],
srcTables[2][(src[3] >> 16) & 0xFF]};
src += 4;
len -= 4;
};
Sk4f dstReds, dstGreens, dstBlues;
auto transform_4 = [&reds, &greens, &blues, &dstReds, &dstGreens, &dstBlues, &rXgXbX,
&rYgYbY, &rZgZbZ, &rTgTbT] {
dstReds = rXgXbX[0]*reds + rYgYbY[0]*greens + rZgZbZ[0]*blues + rTgTbT[0];
dstGreens = rXgXbX[1]*reds + rYgYbY[1]*greens + rZgZbZ[1]*blues + rTgTbT[1];
dstBlues = rXgXbX[2]*reds + rYgYbY[2]*greens + rZgZbZ[2]*blues + rTgTbT[2];
};
auto store_4 = [&dstReds, &dstGreens, &dstBlues, &dst, &dstTables] {
if (kSRGB_DstGamma == kDstGamma || k2Dot2_DstGamma == kDstGamma) {
Sk4f (*linear_to_curve)(const Sk4f&) = (kSRGB_DstGamma == kDstGamma) ?
sk_linear_to_srgb_needs_trunc : linear_to_2dot2;
Sk4i (*float_to_int)(const Sk4f&) = (kSRGB_DstGamma == kDstGamma) ?
Sk4f_trunc : Sk4f_round;
dstReds = linear_to_curve(dstReds);
dstGreens = linear_to_curve(dstGreens);
dstBlues = linear_to_curve(dstBlues);
dstReds = sk_clamp_0_255(dstReds);
dstGreens = sk_clamp_0_255(dstGreens);
dstBlues = sk_clamp_0_255(dstBlues);
auto rgba = (float_to_int(dstReds) << SK_R32_SHIFT)
| (float_to_int(dstGreens) << SK_G32_SHIFT)
| (float_to_int(dstBlues) << SK_B32_SHIFT)
| (Sk4i{0xFF} << SK_A32_SHIFT);
rgba.store((uint32_t*) dst);
dst = SkTAddOffset<void>(dst, 4 * sizeof(uint32_t));
} else if (kTable_DstGamma == kDstGamma) {
Sk4f scaledReds = Sk4f::Min(Sk4f::Max(1023.0f * dstReds, 0.0f), 1023.0f);
Sk4f scaledGreens = Sk4f::Min(Sk4f::Max(1023.0f * dstGreens, 0.0f), 1023.0f);
Sk4f scaledBlues = Sk4f::Min(Sk4f::Max(1023.0f * dstBlues, 0.0f), 1023.0f);
Sk4i indicesReds = Sk4f_round(scaledReds);
Sk4i indicesGreens = Sk4f_round(scaledGreens);
Sk4i indicesBlues = Sk4f_round(scaledBlues);
uint32_t* dst32 = (uint32_t*) dst;
dst32[0] = dstTables[0][indicesReds [0]] << SK_R32_SHIFT
| dstTables[1][indicesGreens[0]] << SK_G32_SHIFT
| dstTables[2][indicesBlues [0]] << SK_B32_SHIFT
| 0xFF << SK_A32_SHIFT;
dst32[1] = dstTables[0][indicesReds [1]] << SK_R32_SHIFT
| dstTables[1][indicesGreens[1]] << SK_G32_SHIFT
| dstTables[2][indicesBlues [1]] << SK_B32_SHIFT
| 0xFF << SK_A32_SHIFT;
dst32[2] = dstTables[0][indicesReds [2]] << SK_R32_SHIFT
| dstTables[1][indicesGreens[2]] << SK_G32_SHIFT
| dstTables[2][indicesBlues [2]] << SK_B32_SHIFT
| 0xFF << SK_A32_SHIFT;
dst32[3] = dstTables[0][indicesReds [3]] << SK_R32_SHIFT
| dstTables[1][indicesGreens[3]] << SK_G32_SHIFT
| dstTables[2][indicesBlues [3]] << SK_B32_SHIFT
| 0xFF << SK_A32_SHIFT;
dst = SkTAddOffset<void>(dst, 4 * sizeof(uint32_t));
} else {
Sk4h_store4(dst, SkFloatToHalf_finite(dstReds),
SkFloatToHalf_finite(dstGreens),
SkFloatToHalf_finite(dstBlues),
SK_Half1);
dst = SkTAddOffset<void>(dst, 4 * sizeof(uint64_t));
}
};
load_next_4();
while (len >= 4) {
transform_4();
load_next_4();
store_4();
}
transform_4();
store_4();
}
while (len > 0) {
// Splat r,g,b across a register each.
auto r = Sk4f{srcTables[0][(*src >> 0) & 0xFF]},
g = Sk4f{srcTables[1][(*src >> 8) & 0xFF]},
b = Sk4f{srcTables[2][(*src >> 16) & 0xFF]};
auto dstPixel = rXgXbX*r + rYgYbY*g + rZgZbZ*b + rTgTbT;
if (kSRGB_DstGamma == kDstGamma || k2Dot2_DstGamma == kDstGamma) {
Sk4f (*linear_to_curve)(const Sk4f&) = (kSRGB_DstGamma == kDstGamma) ?
sk_linear_to_srgb_needs_trunc : linear_to_2dot2;
Sk4i (*float_to_int)(const Sk4f&) = (kSRGB_DstGamma == kDstGamma) ?
Sk4f_trunc : Sk4f_round;
dstPixel = sk_clamp_0_255(linear_to_curve(dstPixel));
uint32_t rgba;
SkNx_cast<uint8_t>(float_to_int(dstPixel)).store(&rgba);
rgba |= 0xFF000000;
*((uint32_t*) dst) = SkSwizzle_RGBA_to_PMColor(rgba);
dst = SkTAddOffset<void>(dst, sizeof(uint32_t));
} else if (kTable_DstGamma == kDstGamma) {
Sk4f scaledPixel = Sk4f::Min(Sk4f::Max(1023.0f * dstPixel, 0.0f), 1023.0f);
Sk4i indices = Sk4f_round(scaledPixel);
*((uint32_t*) dst) = dstTables[0][indices[0]] << SK_R32_SHIFT
| dstTables[1][indices[1]] << SK_G32_SHIFT
| dstTables[2][indices[2]] << SK_B32_SHIFT
| 0xFF << SK_A32_SHIFT;
dst = SkTAddOffset<void>(dst, sizeof(uint32_t));
} else {
uint64_t rgba;
SkFloatToHalf_finite(dstPixel).store(&rgba);
rgba |= static_cast<uint64_t>(SK_Half1) << 48;
*((uint64_t*) dst) = rgba;
dst = SkTAddOffset<void>(dst, sizeof(uint64_t));
}
src += 1;
len -= 1;
}
}
static void color_xform_RGB1_to_2dot2(uint32_t* dst, const uint32_t* src, int len,
const float* const srcTables[3], const float matrix[16]) {
color_xform_RGB1<k2Dot2_DstGamma>(dst, src, len, srcTables, matrix, nullptr);
}
static void color_xform_RGB1_to_srgb(uint32_t* dst, const uint32_t* src, int len,
const float* const srcTables[3], const float matrix[16]) {
color_xform_RGB1<kSRGB_DstGamma>(dst, src, len, srcTables, matrix, nullptr);
}
static void color_xform_RGB1_to_table(uint32_t* dst, const uint32_t* src, int len,
const float* const srcTables[3], const float matrix[16],
const uint8_t* const dstTables[3]) {
color_xform_RGB1<kTable_DstGamma>(dst, src, len, srcTables, matrix, dstTables);
}
static void color_xform_RGB1_to_linear(uint64_t* dst, const uint32_t* src, int len,
const float* const srcTables[3], const float matrix[16]) {
color_xform_RGB1<kLinear_DstGamma>(dst, src, len, srcTables, matrix, nullptr);
}
} // namespace SK_OPTS_NS
#endif // SkColorXform_opts_DEFINED