OLD | NEW |
1 /* | 1 /* |
2 * Copyright 2016 Google Inc. | 2 * Copyright 2016 Google Inc. |
3 * | 3 * |
4 * Use of this source code is governed by a BSD-style license that can be | 4 * Use of this source code is governed by a BSD-style license that can be |
5 * found in the LICENSE file. | 5 * found in the LICENSE file. |
6 */ | 6 */ |
7 | 7 |
8 #ifndef SkColorXform_opts_DEFINED | 8 #ifndef SkColorXform_opts_DEFINED |
9 #define SkColorXform_opts_DEFINED | 9 #define SkColorXform_opts_DEFINED |
10 | 10 |
11 #include "SkNx.h" | 11 #include "SkNx.h" |
12 #include "SkColorPriv.h" | 12 #include "SkColorPriv.h" |
13 #include "SkHalf.h" | 13 #include "SkHalf.h" |
14 #include "SkSRGB.h" | 14 #include "SkSRGB.h" |
15 #include "SkTemplates.h" | 15 #include "SkTemplates.h" |
16 | 16 |
17 namespace SK_OPTS_NS { | 17 namespace SK_OPTS_NS { |
18 | 18 |
19 static Sk4f linear_to_2dot2(const Sk4f& x) { | 19 static Sk4f clamp_0_1(const Sk4f& x) { |
| 20 // The order of the arguments is important here. We want to make sure that
NaN |
| 21 // clamps to zero. Note that max(NaN, 0) = 0, while max(0, NaN) = NaN. |
| 22 return Sk4f::Min(Sk4f::Max(x, 0.0f), 1.0f); |
| 23 } |
| 24 |
| 25 static Sk4i linear_to_2dot2(const Sk4f& x) { |
20 // x^(29/64) is a very good approximation of the true value, x^(1/2.2). | 26 // x^(29/64) is a very good approximation of the true value, x^(1/2.2). |
21 auto x2 = x.rsqrt(), // x^(-1/2) | 27 auto x2 = x.rsqrt(), // x^(-1/2) |
22 x32 = x2.rsqrt().rsqrt().rsqrt().rsqrt(), // x^(-1/32) | 28 x32 = x2.rsqrt().rsqrt().rsqrt().rsqrt(), // x^(-1/32) |
23 x64 = x32.rsqrt(); // x^(+1/64) | 29 x64 = x32.rsqrt(); // x^(+1/64) |
24 | 30 |
25 // 29 = 32 - 2 - 1 | 31 // 29 = 32 - 2 - 1 |
26 return 255.0f * x2.invert() * x32 * x64.invert(); | 32 return Sk4f_round(255.0f * x2.invert() * x32 * x64.invert()); |
27 } | |
28 | |
29 static Sk4f clamp_0_to_255(const Sk4f& x) { | |
30 // The order of the arguments is important here. We want to make sure that
NaN | |
31 // clamps to zero. Note that max(NaN, 0) = 0, while max(0, NaN) = NaN. | |
32 return Sk4f::Min(Sk4f::Max(x, 0.0f), 255.0f); | |
33 } | 33 } |
34 | 34 |
35 enum DstGamma { | 35 enum DstGamma { |
36 // 8888 | 36 // 8888 |
37 kSRGB_DstGamma, | 37 kSRGB_DstGamma, |
38 k2Dot2_DstGamma, | 38 k2Dot2_DstGamma, |
39 kTable_DstGamma, | 39 kTable_DstGamma, |
40 | 40 |
41 // F16 | 41 // F16 |
42 kLinear_DstGamma, | 42 kLinear_DstGamma, |
(...skipping 29 matching lines...) Expand all Loading... |
72 Sk4f dstReds, dstGreens, dstBlues; | 72 Sk4f dstReds, dstGreens, dstBlues; |
73 auto transform_4 = [&reds, &greens, &blues, &dstReds, &dstGreens, &dstBl
ues, &rXgXbX, | 73 auto transform_4 = [&reds, &greens, &blues, &dstReds, &dstGreens, &dstBl
ues, &rXgXbX, |
74 &rYgYbY, &rZgZbZ] { | 74 &rYgYbY, &rZgZbZ] { |
75 dstReds = rXgXbX[0]*reds + rYgYbY[0]*greens + rZgZbZ[0]*blues; | 75 dstReds = rXgXbX[0]*reds + rYgYbY[0]*greens + rZgZbZ[0]*blues; |
76 dstGreens = rXgXbX[1]*reds + rYgYbY[1]*greens + rZgZbZ[1]*blues; | 76 dstGreens = rXgXbX[1]*reds + rYgYbY[1]*greens + rZgZbZ[1]*blues; |
77 dstBlues = rXgXbX[2]*reds + rYgYbY[2]*greens + rZgZbZ[2]*blues; | 77 dstBlues = rXgXbX[2]*reds + rYgYbY[2]*greens + rZgZbZ[2]*blues; |
78 }; | 78 }; |
79 | 79 |
80 auto store_4 = [&dstReds, &dstGreens, &dstBlues, &dst, &dstTables] { | 80 auto store_4 = [&dstReds, &dstGreens, &dstBlues, &dst, &dstTables] { |
81 if (kSRGB_DstGamma == kDstGamma || k2Dot2_DstGamma == kDstGamma) { | 81 if (kSRGB_DstGamma == kDstGamma || k2Dot2_DstGamma == kDstGamma) { |
82 Sk4f (*linear_to_curve)(const Sk4f&) = | 82 Sk4i (*linear_to_curve)(const Sk4f&) = |
83 (kSRGB_DstGamma == kDstGamma) ? sk_linear_to_srgb : line
ar_to_2dot2; | 83 (kSRGB_DstGamma == kDstGamma) ? sk_linear_to_srgb : line
ar_to_2dot2; |
84 | 84 |
85 dstReds = linear_to_curve(dstReds); | 85 auto reds = linear_to_curve(clamp_0_1(dstReds)); |
86 dstGreens = linear_to_curve(dstGreens); | 86 auto greens = linear_to_curve(clamp_0_1(dstGreens)); |
87 dstBlues = linear_to_curve(dstBlues); | 87 auto blues = linear_to_curve(clamp_0_1(dstBlues)); |
88 | 88 |
89 dstReds = clamp_0_to_255(dstReds); | |
90 dstGreens = clamp_0_to_255(dstGreens); | |
91 dstBlues = clamp_0_to_255(dstBlues); | |
92 | 89 |
93 auto rgba = (Sk4f_round(dstReds) << SK_R32_SHIFT) | 90 auto rgba = (reds << SK_R32_SHIFT) |
94 | (Sk4f_round(dstGreens) << SK_G32_SHIFT) | 91 | (greens << SK_G32_SHIFT) |
95 | (Sk4f_round(dstBlues) << SK_B32_SHIFT) | 92 | (blues << SK_B32_SHIFT) |
96 | (Sk4i{ 0xFF << SK_A32_SHIFT}); | 93 | (Sk4i{0xFF} << SK_A32_SHIFT); |
97 rgba.store((uint32_t*) dst); | 94 rgba.store((uint32_t*) dst); |
98 | 95 |
99 dst = SkTAddOffset<void>(dst, 4 * sizeof(uint32_t)); | 96 dst = SkTAddOffset<void>(dst, 4 * sizeof(uint32_t)); |
100 } else if (kTable_DstGamma == kDstGamma) { | 97 } else if (kTable_DstGamma == kDstGamma) { |
101 Sk4f scaledReds = Sk4f::Min(Sk4f::Max(1023.0f * dstReds, 0.0
f), 1023.0f); | 98 Sk4f scaledReds = Sk4f::Min(Sk4f::Max(1023.0f * dstReds, 0.0
f), 1023.0f); |
102 Sk4f scaledGreens = Sk4f::Min(Sk4f::Max(1023.0f * dstGreens, 0.0
f), 1023.0f); | 99 Sk4f scaledGreens = Sk4f::Min(Sk4f::Max(1023.0f * dstGreens, 0.0
f), 1023.0f); |
103 Sk4f scaledBlues = Sk4f::Min(Sk4f::Max(1023.0f * dstBlues, 0.0
f), 1023.0f); | 100 Sk4f scaledBlues = Sk4f::Min(Sk4f::Max(1023.0f * dstBlues, 0.0
f), 1023.0f); |
104 | 101 |
105 Sk4i indicesReds = Sk4f_round(scaledReds); | 102 Sk4i indicesReds = Sk4f_round(scaledReds); |
106 Sk4i indicesGreens = Sk4f_round(scaledGreens); | 103 Sk4i indicesGreens = Sk4f_round(scaledGreens); |
(...skipping 41 matching lines...) Expand 10 before | Expand all | Expand 10 after Loading... |
148 | 145 |
149 while (len > 0) { | 146 while (len > 0) { |
150 // Splat r,g,b across a register each. | 147 // Splat r,g,b across a register each. |
151 auto r = Sk4f{srcTables[0][(*src >> 0) & 0xFF]}, | 148 auto r = Sk4f{srcTables[0][(*src >> 0) & 0xFF]}, |
152 g = Sk4f{srcTables[1][(*src >> 8) & 0xFF]}, | 149 g = Sk4f{srcTables[1][(*src >> 8) & 0xFF]}, |
153 b = Sk4f{srcTables[2][(*src >> 16) & 0xFF]}; | 150 b = Sk4f{srcTables[2][(*src >> 16) & 0xFF]}; |
154 | 151 |
155 auto dstPixel = rXgXbX*r + rYgYbY*g + rZgZbZ*b; | 152 auto dstPixel = rXgXbX*r + rYgYbY*g + rZgZbZ*b; |
156 | 153 |
157 if (kSRGB_DstGamma == kDstGamma || k2Dot2_DstGamma == kDstGamma) { | 154 if (kSRGB_DstGamma == kDstGamma || k2Dot2_DstGamma == kDstGamma) { |
158 Sk4f (*linear_to_curve)(const Sk4f&) = | 155 Sk4i (*linear_to_curve)(const Sk4f&) = |
159 (kSRGB_DstGamma == kDstGamma) ? sk_linear_to_srgb : linear_t
o_2dot2; | 156 (kSRGB_DstGamma == kDstGamma) ? sk_linear_to_srgb : linear_t
o_2dot2; |
160 | 157 |
161 dstPixel = linear_to_curve(dstPixel); | 158 auto pixel = linear_to_curve(clamp_0_1(dstPixel)); |
162 | |
163 dstPixel = clamp_0_to_255(dstPixel); | |
164 | 159 |
165 uint32_t rgba; | 160 uint32_t rgba; |
166 SkNx_cast<uint8_t>(Sk4f_round(dstPixel)).store(&rgba); | 161 SkNx_cast<uint8_t>(pixel).store(&rgba); |
167 rgba |= 0xFF000000; | 162 rgba |= 0xFF000000; |
168 *((uint32_t*) dst) = SkSwizzle_RGBA_to_PMColor(rgba); | 163 *((uint32_t*) dst) = SkSwizzle_RGBA_to_PMColor(rgba); |
169 dst = SkTAddOffset<void>(dst, sizeof(uint32_t)); | 164 dst = SkTAddOffset<void>(dst, sizeof(uint32_t)); |
170 } else if (kTable_DstGamma == kDstGamma) { | 165 } else if (kTable_DstGamma == kDstGamma) { |
171 Sk4f scaledPixel = Sk4f::Min(Sk4f::Max(1023.0f * dstPixel, 0.0f), 10
23.0f); | 166 Sk4f scaledPixel = Sk4f::Min(Sk4f::Max(1023.0f * dstPixel, 0.0f), 10
23.0f); |
172 | 167 |
173 Sk4i indices = Sk4f_round(scaledPixel); | 168 Sk4i indices = Sk4f_round(scaledPixel); |
174 | 169 |
175 *((uint32_t*) dst) = dstTables[0][indices[0]] << SK_R32_SHIFT | 170 *((uint32_t*) dst) = dstTables[0][indices[0]] << SK_R32_SHIFT |
176 | dstTables[1][indices[1]] << SK_G32_SHIFT | 171 | dstTables[1][indices[1]] << SK_G32_SHIFT |
(...skipping 31 matching lines...) Expand 10 before | Expand all | Expand 10 after Loading... |
208 } | 203 } |
209 | 204 |
210 static void color_xform_RGB1_to_linear(uint64_t* dst, const uint32_t* src, int l
en, | 205 static void color_xform_RGB1_to_linear(uint64_t* dst, const uint32_t* src, int l
en, |
211 const float* const srcTables[3], const fl
oat matrix[12]) { | 206 const float* const srcTables[3], const fl
oat matrix[12]) { |
212 color_xform_RGB1<kLinear_DstGamma>(dst, src, len, srcTables, matrix, nullptr
); | 207 color_xform_RGB1<kLinear_DstGamma>(dst, src, len, srcTables, matrix, nullptr
); |
213 } | 208 } |
214 | 209 |
215 } // namespace SK_OPTS_NS | 210 } // namespace SK_OPTS_NS |
216 | 211 |
217 #endif // SkColorXform_opts_DEFINED | 212 #endif // SkColorXform_opts_DEFINED |
OLD | NEW |