Index: src/opts/SkColorXform_opts.h |
diff --git a/src/opts/SkColorXform_opts.h b/src/opts/SkColorXform_opts.h |
index b4eb9a2552b556563e1fd34f87a69d91a9a93750..b3da55c1fdd758d2b3b7d74ea41b050b5918eb18 100644 |
--- a/src/opts/SkColorXform_opts.h |
+++ b/src/opts/SkColorXform_opts.h |
@@ -16,14 +16,19 @@ |
namespace SK_OPTS_NS { |
-static Sk4i linear_to_2dot2(const Sk4f& x) { |
+// Wraps SkNx_cast<int> (Sk4f -> Sk4i) in a named function so it can be used as a function ptr. |
+static Sk4i Sk4f_trunc(const Sk4f& x) { |
+ return SkNx_cast<int>(x); |
+} |
+ |
// Returns 255 * x^(29/64) as floats; color_xform_RGB1 applies sk_clamp_0_255 and the |
// float-to-int conversion to the result itself. |
+static Sk4f linear_to_2dot2(const Sk4f& x) { |
// x^(29/64) is a very good approximation of the true value, x^(1/2.2). |
// Each rsqrt() halves the exponent and flips its sign; invert() only flips the sign. |
auto x2 = x.rsqrt(), // x^(-1/2) |
x32 = x2.rsqrt().rsqrt().rsqrt().rsqrt(), // x^(-1/32) |
x64 = x32.rsqrt(); // x^(+1/64) |
// 29 = 32 - 2 - 1, i.e. x^(32/64) * x^(-2/64) * x^(-1/64). |
- return Sk4f_round(sk_clamp_0_255(255.0f * x2.invert() * x32 * x64.invert())); |
+ return 255.0f * x2.invert() * x32 * x64.invert(); |
} |
enum DstGamma { |
@@ -36,13 +41,23 @@ enum DstGamma { |
kLinear_DstGamma, |
}; |
-template <DstGamma kDstGamma> |
+template <DstGamma kDstGamma, bool kSwapRB> |
static void color_xform_RGB1(void* dst, const uint32_t* src, int len, |
const float* const srcTables[3], const float matrix[16], |
const uint8_t* const dstTables[3]) { |
- Sk4f rXgXbX = Sk4f::Load(matrix + 0), |
- rYgYbY = Sk4f::Load(matrix + 4), |
- rZgZbZ = Sk4f::Load(matrix + 8); |
+ int kRShift = 0; |
+ int kGShift = 8; |
+ int kBShift = 16; |
+ int kAShift = 24; |
+ if (kSwapRB) { |
+ kBShift = 0; |
+ kRShift = 16; |
+ } |
+ |
+ Sk4f rXgXbX = Sk4f::Load(matrix + 0), |
+ rYgYbY = Sk4f::Load(matrix + 4), |
+ rZgZbZ = Sk4f::Load(matrix + 8), |
+ rTgTbT = Sk4f::Load(matrix + 12); |
if (len >= 4) { |
Sk4f reds, greens, blues; |
@@ -65,25 +80,32 @@ static void color_xform_RGB1(void* dst, const uint32_t* src, int len, |
Sk4f dstReds, dstGreens, dstBlues; |
auto transform_4 = [&reds, &greens, &blues, &dstReds, &dstGreens, &dstBlues, &rXgXbX, |
- &rYgYbY, &rZgZbZ] { |
- dstReds = rXgXbX[0]*reds + rYgYbY[0]*greens + rZgZbZ[0]*blues; |
- dstGreens = rXgXbX[1]*reds + rYgYbY[1]*greens + rZgZbZ[1]*blues; |
- dstBlues = rXgXbX[2]*reds + rYgYbY[2]*greens + rZgZbZ[2]*blues; |
+ &rYgYbY, &rZgZbZ, &rTgTbT] { |
+ dstReds = rXgXbX[0]*reds + rYgYbY[0]*greens + rZgZbZ[0]*blues + rTgTbT[0]; |
+ dstGreens = rXgXbX[1]*reds + rYgYbY[1]*greens + rZgZbZ[1]*blues + rTgTbT[1]; |
+ dstBlues = rXgXbX[2]*reds + rYgYbY[2]*greens + rZgZbZ[2]*blues + rTgTbT[2]; |
}; |
- auto store_4 = [&dstReds, &dstGreens, &dstBlues, &dst, &dstTables] { |
+ auto store_4 = [&dstReds, &dstGreens, &dstBlues, &dst, &dstTables, kRShift, kGShift, |
+ kBShift, kAShift] { |
if (kSRGB_DstGamma == kDstGamma || k2Dot2_DstGamma == kDstGamma) { |
- Sk4i (*linear_to_curve)(const Sk4f&) = |
- (kSRGB_DstGamma == kDstGamma) ? sk_linear_to_srgb : linear_to_2dot2; |
- |
- auto reds = linear_to_curve(dstReds); |
- auto greens = linear_to_curve(dstGreens); |
- auto blues = linear_to_curve(dstBlues); |
- |
- auto rgba = (reds << SK_R32_SHIFT) |
- | (greens << SK_G32_SHIFT) |
- | (blues << SK_B32_SHIFT) |
- | (Sk4i{0xFF} << SK_A32_SHIFT); |
+ Sk4f (*linear_to_curve)(const Sk4f&) = (kSRGB_DstGamma == kDstGamma) ? |
+ sk_linear_to_srgb_needs_trunc : linear_to_2dot2; |
+ Sk4i (*float_to_int)(const Sk4f&) = (kSRGB_DstGamma == kDstGamma) ? |
+ Sk4f_trunc : Sk4f_round; |
+ |
+ dstReds = linear_to_curve(dstReds); |
+ dstGreens = linear_to_curve(dstGreens); |
+ dstBlues = linear_to_curve(dstBlues); |
+ |
+ dstReds = sk_clamp_0_255(dstReds); |
+ dstGreens = sk_clamp_0_255(dstGreens); |
+ dstBlues = sk_clamp_0_255(dstBlues); |
+ |
+ auto rgba = (float_to_int(dstReds) << kRShift) |
+ | (float_to_int(dstGreens) << kGShift) |
+ | (float_to_int(dstBlues) << kBShift) |
+ | (Sk4i{0xFF} << kAShift); |
rgba.store((uint32_t*) dst); |
dst = SkTAddOffset<void>(dst, 4 * sizeof(uint32_t)); |
@@ -97,22 +119,22 @@ static void color_xform_RGB1(void* dst, const uint32_t* src, int len, |
Sk4i indicesBlues = Sk4f_round(scaledBlues); |
uint32_t* dst32 = (uint32_t*) dst; |
- dst32[0] = dstTables[0][indicesReds [0]] << SK_R32_SHIFT |
- | dstTables[1][indicesGreens[0]] << SK_G32_SHIFT |
- | dstTables[2][indicesBlues [0]] << SK_B32_SHIFT |
- | 0xFF << SK_A32_SHIFT; |
- dst32[1] = dstTables[0][indicesReds [1]] << SK_R32_SHIFT |
- | dstTables[1][indicesGreens[1]] << SK_G32_SHIFT |
- | dstTables[2][indicesBlues [1]] << SK_B32_SHIFT |
- | 0xFF << SK_A32_SHIFT; |
- dst32[2] = dstTables[0][indicesReds [2]] << SK_R32_SHIFT |
- | dstTables[1][indicesGreens[2]] << SK_G32_SHIFT |
- | dstTables[2][indicesBlues [2]] << SK_B32_SHIFT |
- | 0xFF << SK_A32_SHIFT; |
- dst32[3] = dstTables[0][indicesReds [3]] << SK_R32_SHIFT |
- | dstTables[1][indicesGreens[3]] << SK_G32_SHIFT |
- | dstTables[2][indicesBlues [3]] << SK_B32_SHIFT |
- | 0xFF << SK_A32_SHIFT; |
+ dst32[0] = dstTables[0][indicesReds [0]] << kRShift |
+ | dstTables[1][indicesGreens[0]] << kGShift |
+ | dstTables[2][indicesBlues [0]] << kBShift |
+ | 0xFF << kAShift; |
+ dst32[1] = dstTables[0][indicesReds [1]] << kRShift |
+ | dstTables[1][indicesGreens[1]] << kGShift |
+ | dstTables[2][indicesBlues [1]] << kBShift |
+ | 0xFF << kAShift; |
+ dst32[2] = dstTables[0][indicesReds [2]] << kRShift |
+ | dstTables[1][indicesGreens[2]] << kGShift |
+ | dstTables[2][indicesBlues [2]] << kBShift |
+ | 0xFF << kAShift; |
+ dst32[3] = dstTables[0][indicesReds [3]] << kRShift |
+ | dstTables[1][indicesGreens[3]] << kGShift |
+ | dstTables[2][indicesBlues [3]] << kBShift |
+ | 0xFF << kAShift; |
dst = SkTAddOffset<void>(dst, 4 * sizeof(uint32_t)); |
} else { |
@@ -142,28 +164,34 @@ static void color_xform_RGB1(void* dst, const uint32_t* src, int len, |
g = Sk4f{srcTables[1][(*src >> 8) & 0xFF]}, |
b = Sk4f{srcTables[2][(*src >> 16) & 0xFF]}; |
- auto dstPixel = rXgXbX*r + rYgYbY*g + rZgZbZ*b; |
+ auto dstPixel = rXgXbX*r + rYgYbY*g + rZgZbZ*b + rTgTbT; |
if (kSRGB_DstGamma == kDstGamma || k2Dot2_DstGamma == kDstGamma) { |
- Sk4i (*linear_to_curve)(const Sk4f&) = |
- (kSRGB_DstGamma == kDstGamma) ? sk_linear_to_srgb : linear_to_2dot2; |
+ Sk4f (*linear_to_curve)(const Sk4f&) = (kSRGB_DstGamma == kDstGamma) ? |
+ sk_linear_to_srgb_needs_trunc : linear_to_2dot2; |
+ Sk4i (*float_to_int)(const Sk4f&) = (kSRGB_DstGamma == kDstGamma) ? |
+ Sk4f_trunc : Sk4f_round; |
- auto pixel = linear_to_curve(dstPixel); |
+ dstPixel = sk_clamp_0_255(linear_to_curve(dstPixel)); |
uint32_t rgba; |
- SkNx_cast<uint8_t>(pixel).store(&rgba); |
+ SkNx_cast<uint8_t>(float_to_int(dstPixel)).store(&rgba); |
rgba |= 0xFF000000; |
- *((uint32_t*) dst) = SkSwizzle_RGBA_to_PMColor(rgba); |
+ if (kSwapRB) { |
+ *((uint32_t*) dst) = SkSwizzle_RB(rgba); |
+ } else { |
+ *((uint32_t*) dst) = rgba; |
+ } |
dst = SkTAddOffset<void>(dst, sizeof(uint32_t)); |
} else if (kTable_DstGamma == kDstGamma) { |
Sk4f scaledPixel = Sk4f::Min(Sk4f::Max(1023.0f * dstPixel, 0.0f), 1023.0f); |
Sk4i indices = Sk4f_round(scaledPixel); |
- *((uint32_t*) dst) = dstTables[0][indices[0]] << SK_R32_SHIFT |
- | dstTables[1][indices[1]] << SK_G32_SHIFT |
- | dstTables[2][indices[2]] << SK_B32_SHIFT |
- | 0xFF << SK_A32_SHIFT; |
+ *((uint32_t*) dst) = dstTables[0][indices[0]] << kRShift |
+ | dstTables[1][indices[1]] << kGShift |
+ | dstTables[2][indices[2]] << kBShift |
+ | 0xFF << kAShift; |
dst = SkTAddOffset<void>(dst, sizeof(uint32_t)); |
} else { |
@@ -181,23 +209,42 @@ static void color_xform_RGB1(void* dst, const uint32_t* src, int len, |
// Runs color_xform_RGB1 with k2Dot2_DstGamma; dstTables is passed as nullptr. |
// kSwapRB is false, so kRShift stays 0 and kBShift stays 16. |
static void color_xform_RGB1_to_2dot2(uint32_t* dst, const uint32_t* src, int len, |
const float* const srcTables[3], const float matrix[16]) { |
- color_xform_RGB1<k2Dot2_DstGamma>(dst, src, len, srcTables, matrix, nullptr); |
+ color_xform_RGB1<k2Dot2_DstGamma, false>(dst, src, len, srcTables, matrix, nullptr); |
} |
// Runs color_xform_RGB1 with kSRGB_DstGamma; dstTables is passed as nullptr. |
// kSwapRB is false, so kRShift stays 0 and kBShift stays 16. |
static void color_xform_RGB1_to_srgb(uint32_t* dst, const uint32_t* src, int len, |
const float* const srcTables[3], const float matrix[16]) { |
- color_xform_RGB1<kSRGB_DstGamma>(dst, src, len, srcTables, matrix, nullptr); |
+ color_xform_RGB1<kSRGB_DstGamma, false>(dst, src, len, srcTables, matrix, nullptr); |
} |
// Runs color_xform_RGB1 with kTable_DstGamma, forwarding dstTables, which that function |
// indexes per channel ([0] red, [1] green, [2] blue) to produce the output bytes. |
// kSwapRB is false, so kRShift stays 0 and kBShift stays 16. |
static void color_xform_RGB1_to_table(uint32_t* dst, const uint32_t* src, int len, |
const float* const srcTables[3], const float matrix[16], |
const uint8_t* const dstTables[3]) { |
- color_xform_RGB1<kTable_DstGamma>(dst, src, len, srcTables, matrix, dstTables); |
+ color_xform_RGB1<kTable_DstGamma, false>(dst, src, len, srcTables, matrix, dstTables); |
} |
// Runs color_xform_RGB1 with kLinear_DstGamma into a uint64_t destination; dstTables is |
// passed as nullptr and kSwapRB is false. |
static void color_xform_RGB1_to_linear(uint64_t* dst, const uint32_t* src, int len, |
const float* const srcTables[3], const float matrix[16]) { |
- color_xform_RGB1<kLinear_DstGamma>(dst, src, len, srcTables, matrix, nullptr); |
+ color_xform_RGB1<kLinear_DstGamma, false>(dst, src, len, srcTables, matrix, nullptr); |
+} |
+ |
// Same call as color_xform_RGB1_to_2dot2 but with kSwapRB = true, which makes |
// color_xform_RGB1 use kRShift = 16 and kBShift = 0. |
+static void color_xform_RGB1_to_2dot2_swaprb(uint32_t* dst, const uint32_t* src, int len, |
+ const float* const srcTables[3], |
+ const float matrix[16]) { |
+ color_xform_RGB1<k2Dot2_DstGamma, true>(dst, src, len, srcTables, matrix, nullptr); |
+} |
+ |
// Same call as color_xform_RGB1_to_srgb but with kSwapRB = true, which makes |
// color_xform_RGB1 use kRShift = 16 and kBShift = 0. |
+static void color_xform_RGB1_to_srgb_swaprb(uint32_t* dst, const uint32_t* src, int len, |
+ const float* const srcTables[3], |
+ const float matrix[16]) { |
+ color_xform_RGB1<kSRGB_DstGamma, true>(dst, src, len, srcTables, matrix, nullptr); |
+} |
+ |
// Same call as color_xform_RGB1_to_table but with kSwapRB = true, which makes |
// color_xform_RGB1 use kRShift = 16 and kBShift = 0; dstTables is forwarded unchanged. |
+static void color_xform_RGB1_to_table_swaprb(uint32_t* dst, const uint32_t* src, int len, |
+ const float* const srcTables[3], |
+ const float matrix[16], |
+ const uint8_t* const dstTables[3]) { |
+ color_xform_RGB1<kTable_DstGamma, true>(dst, src, len, srcTables, matrix, dstTables); |
} |
} // namespace SK_OPTS_NS |