Chromium Code Reviews
chromiumcodereview-hr@appspot.gserviceaccount.com (chromiumcodereview-hr) | Please choose your nickname with Settings | Help | Chromium Project | Gerrit Changes | Sign out
(12)

Side by Side Diff: src/core/SkXfermode.cpp

Issue 1043413002: experimental speedup some xfermodes with Sk4f (Closed) Base URL: https://skia.googlesource.com/skia.git@master
Patch Set: Created 5 years, 8 months ago
Use n/p to move between diff chunks; N/P to move between comments. Draft comments are only viewable by you.
Jump to:
View unified diff | Download patch
« no previous file with comments | « bench/XfermodeBench.cpp ('k') | no next file » | no next file with comments »
Toggle Intra-line Diffs ('i') | Expand Comments ('e') | Collapse Comments ('c') | Show Comments Hide Comments ('s')
OLDNEW
1 1
2 /* 2 /*
3 * Copyright 2006 The Android Open Source Project 3 * Copyright 2006 The Android Open Source Project
4 * 4 *
5 * Use of this source code is governed by a BSD-style license that can be 5 * Use of this source code is governed by a BSD-style license that can be
6 * found in the LICENSE file. 6 * found in the LICENSE file.
7 */ 7 */
8 8
9 #include "SkXfermode.h" 9 #include "SkXfermode.h"
10 #include "SkXfermode_opts_SSE2.h" 10 #include "SkXfermode_opts_SSE2.h"
11 #include "SkXfermode_proccoeff.h" 11 #include "SkXfermode_proccoeff.h"
12 #include "SkColorPriv.h" 12 #include "SkColorPriv.h"
13 #include "SkLazyPtr.h" 13 #include "SkLazyPtr.h"
14 #include "SkMathPriv.h" 14 #include "SkMathPriv.h"
15 #include "SkPMFloat.h"
15 #include "SkReadBuffer.h" 16 #include "SkReadBuffer.h"
16 #include "SkString.h" 17 #include "SkString.h"
17 #include "SkUtilsArm.h" 18 #include "SkUtilsArm.h"
18 #include "SkWriteBuffer.h" 19 #include "SkWriteBuffer.h"
19 20
21 //#define SK_SUPPORT_LEGACY_SCALAR_XFERMODES
22
20 #if !SK_ARM_NEON_IS_NONE 23 #if !SK_ARM_NEON_IS_NONE
21 #include "SkXfermode_opts_arm_neon.h" 24 #include "SkXfermode_opts_arm_neon.h"
22 #endif 25 #endif
23 26
24 #define SkAlphaMulAlpha(a, b) SkMulDiv255Round(a, b) 27 #define SkAlphaMulAlpha(a, b) SkMulDiv255Round(a, b)
25 28
26 #if 0
27 // idea for higher precision blends in xfer procs (and slightly faster)
28 // see DstATop as a probable caller
29 static U8CPU mulmuldiv255round(U8CPU a, U8CPU b, U8CPU c, U8CPU d) {
30 SkASSERT(a <= 255);
31 SkASSERT(b <= 255);
32 SkASSERT(c <= 255);
33 SkASSERT(d <= 255);
34 unsigned prod = SkMulS16(a, b) + SkMulS16(c, d) + 128;
35 unsigned result = (prod + (prod >> 8)) >> 8;
36 SkASSERT(result <= 255);
37 return result;
38 }
39 #endif
40
41 static inline unsigned saturated_add(unsigned a, unsigned b) { 29 static inline unsigned saturated_add(unsigned a, unsigned b) {
42 SkASSERT(a <= 255); 30 SkASSERT(a <= 255);
43 SkASSERT(b <= 255); 31 SkASSERT(b <= 255);
44 unsigned sum = a + b; 32 unsigned sum = a + b;
45 if (sum > 255) { 33 if (sum > 255) {
46 sum = 255; 34 sum = 255;
47 } 35 }
48 return sum; 36 return sum;
49 } 37 }
50 38
(...skipping 1128 matching lines...) Expand 10 before | Expand all | Expand 10 after
1179 } 1167 }
1180 1168
1181 #ifndef SK_IGNORE_TO_STRING 1169 #ifndef SK_IGNORE_TO_STRING
1182 void SkDstInXfermode::toString(SkString* str) const { 1170 void SkDstInXfermode::toString(SkString* str) const {
1183 this->INHERITED::toString(str); 1171 this->INHERITED::toString(str);
1184 } 1172 }
1185 #endif 1173 #endif
1186 1174
1187 /////////////////////////////////////////////////////////////////////////////// 1175 ///////////////////////////////////////////////////////////////////////////////
1188 1176
1177 /* These modes can merge coverage into src-alpha
1178 *
1179 { dst_modeproc, SkXfermode::kZero_Coeff, SkXfermode::kOne_Coeff },
1180 { srcover_modeproc, SkXfermode::kOne_Coeff, SkXfermode::kISA_Coeff },
1181 { dstover_modeproc, SkXfermode::kIDA_Coeff, SkXfermode::kOne_Coeff },
1182 { dstout_modeproc, SkXfermode::kZero_Coeff, SkXfermode::kISA_Coeff },
1183 { srcatop_modeproc, SkXfermode::kDA_Coeff, SkXfermode::kISA_Coeff },
1184 { xor_modeproc, SkXfermode::kIDA_Coeff, SkXfermode::kISA_Coeff },
1185 { plus_modeproc, SkXfermode::kOne_Coeff, SkXfermode::kOne_Coeff },
1186 { screen_modeproc, SkXfermode::kOne_Coeff, SkXfermode::kISC_Coeff },
1187 */
1188
1189 #ifndef SK_SUPPORT_LEGACY_SCALAR_XFERMODES
1190 static const float gInv255 = 0.0039215683f; // (1.0f / 255) - ULP == SkBits2Float(0x3B808080)
1191
1192 static Sk4f ramp(const Sk4f& v0, const Sk4f& v1, const Sk4f& t) {
1193 return v0 + (v1 - v0) * t;
1194 }
1195
1196 static Sk4f clamp_255(const Sk4f& value) {
1197 return Sk4f::Min(value, Sk4f(255));
1198 }
1199
1200 static inline SkPMFloat check_as_pmfloat(const Sk4f& value) {
1201 SkPMFloat pm = value;
1202 SkASSERT(pm.isValid());
1203 return pm;
1204 }
1205
1206 // kSrcATop_Mode, //!< [Da, Sc * Da + (1 - Sa) * Dc]
1207 struct SrcATop4f {
1208 static SkPMFloat Xfer(const SkPMFloat& src, const SkPMFloat& dst) {
1209 const Sk4f inv255(gInv255);
1210 Sk4f s4 = src;
1211 Sk4f d4 = dst;
1212 return check_as_pmfloat(d4 + (s4 * Sk4f(dst.a()) - d4 * Sk4f(src.a())) * inv255);
1213 }
1214 static const bool kFoldCoverageIntoSrcAlpha = true;
1215 static const SkXfermode::Mode kMode = SkXfermode::kSrcATop_Mode;
1216 };
1217
1218 // kDstATop_Mode, //!< [Sa, Sa * Dc + Sc * (1 - Da)]
1219 struct DstATop4f {
1220 static SkPMFloat Xfer(const SkPMFloat& src, const SkPMFloat& dst) {
1221 const Sk4f inv255(gInv255);
1222 Sk4f s4 = src;
1223 Sk4f d4 = dst;
1224 return check_as_pmfloat(s4 + (d4 * Sk4f(src.a()) - s4 * Sk4f(dst.a())) * inv255);
1225 }
1226 static const bool kFoldCoverageIntoSrcAlpha = false;
1227 static const SkXfermode::Mode kMode = SkXfermode::kDstATop_Mode;
1228 };
1229
1230 // kXor_Mode [Sa + Da - 2 * Sa * Da, Sc * (1 - Da) + (1 - Sa) * Dc]
1231 struct Xor4f {
1232 static SkPMFloat Xfer(const SkPMFloat& src, const SkPMFloat& dst) {
1233 const Sk4f inv255(gInv255);
1234 Sk4f s4 = src;
1235 Sk4f d4 = dst;
1236 return check_as_pmfloat(s4 + d4 - (s4 * Sk4f(dst.a()) + d4 * Sk4f(src.a())) * inv255);
1237 }
1238 static const bool kFoldCoverageIntoSrcAlpha = true;
1239 static const SkXfermode::Mode kMode = SkXfermode::kXor_Mode;
1240 };
1241
1242 // kPlus_Mode [Sa + Da, Sc + Dc]
1243 struct Plus4f {
1244 static SkPMFloat Xfer(const SkPMFloat& src, const SkPMFloat& dst) {
1245 Sk4f s4 = src;
1246 Sk4f d4 = dst;
1247 return check_as_pmfloat(clamp_255(s4 + d4));
1248 }
1249 static const bool kFoldCoverageIntoSrcAlpha = true;
1250 static const SkXfermode::Mode kMode = SkXfermode::kPlus_Mode;
1251 };
1252
1253 // kModulate_Mode [Sa * Da, Sc * Dc]
1254 struct Modulate4f {
1255 static SkPMFloat Xfer(const SkPMFloat& src, const SkPMFloat& dst) {
1256 const Sk4f inv255(gInv255);
1257 Sk4f s4 = src;
1258 Sk4f d4 = dst;
1259 return check_as_pmfloat(s4 * d4 * inv255);
1260 }
1261 static const bool kFoldCoverageIntoSrcAlpha = false;
1262 static const SkXfermode::Mode kMode = SkXfermode::kModulate_Mode;
1263 };
1264
1265 // kScreen_Mode [S + D - S * D]
1266 struct Screen4f {
1267 static SkPMFloat Xfer(const SkPMFloat& src, const SkPMFloat& dst) {
1268 const Sk4f inv255(gInv255);
1269 Sk4f s4 = src;
1270 Sk4f d4 = dst;
1271 return check_as_pmfloat(clamp_255(s4 + d4 - s4 * d4 * inv255));
1272 }
1273 static const bool kFoldCoverageIntoSrcAlpha = true;
1274 static const SkXfermode::Mode kMode = SkXfermode::kScreen_Mode;
1275 };
1276
1277 template <typename ProcType>
1278 class SkT4fXfermode : public SkProcCoeffXfermode {
1279 public:
1280 static SkXfermode* Create(const ProcCoeff& rec) {
1281 return SkNEW_ARGS(SkT4fXfermode, (rec));
1282 }
1283
1284 void xfer32(SkPMColor dst[], const SkPMColor src[], int n, const SkAlpha aa[]) const override {
1285 if (NULL == aa) {
1286 while (n & 3) {
1287 *dst = ProcType::Xfer(SkPMFloat(*src++), SkPMFloat(*dst)).get();
1288 dst++;
1289 n -= 1;
1290 }
1291 n >>= 2;
1292 for (int i = 0; i < n; ++i) {
1293 SkPMFloat s0, s1, s2, s3;
1294 SkPMFloat::From4PMColors(src, &s0, &s1, &s2, &s3);
1295 SkPMFloat d0, d1, d2, d3;
1296 SkPMFloat::From4PMColors(dst, &d0, &d1, &d2, &d3);
1297 SkPMFloat::To4PMColors(ProcType::Xfer(s0, d0), ProcType::Xfer(s1, d1),
1298 ProcType::Xfer(s2, d2), ProcType::Xfer(s3, d3), dst);
1299 src += 4;
1300 dst += 4;
1301 }
1302 } else {
1303 for (int i = 0; i < n; ++i) {
1304 const Sk4f aa4 = Sk4f(aa[i] * gInv255);
1305 SkPMFloat dstF(dst[i]);
1306 SkPMFloat srcF(src[i]);
1307 Sk4f res;
1308 if (ProcType::kFoldCoverageIntoSrcAlpha && false) {
mtklein 2015/04/02 17:18:00 ? Something about this still TODO?
reed2 2015/04/02 17:27:40 Needed some Min() checks in Screen and Xor... done
1309 Sk4f src4 = srcF;
1310 res = ProcType::Xfer(src4 * aa4, dstF);
1311 } else {
1312 res = ramp(dstF, ProcType::Xfer(srcF, dstF), aa4);
1313 }
1314 dst[i] = SkPMFloat(res).get();
1315 }
1316 }
1317 }
1318
1319 private:
1320 SkT4fXfermode(const ProcCoeff& rec) : SkProcCoeffXfermode(rec, ProcType::kMode) {}
1321
1322 typedef SkProcCoeffXfermode INHERITED;
1323 };
1324 #endif
1325
1326 ///////////////////////////////////////////////////////////////////////////////
1327
1189 class SkDstOutXfermode : public SkProcCoeffXfermode { 1328 class SkDstOutXfermode : public SkProcCoeffXfermode {
1190 public: 1329 public:
1191 static SkDstOutXfermode* Create(const ProcCoeff& rec) { 1330 static SkDstOutXfermode* Create(const ProcCoeff& rec) {
1192 return SkNEW_ARGS(SkDstOutXfermode, (rec)); 1331 return SkNEW_ARGS(SkDstOutXfermode, (rec));
1193 } 1332 }
1194 1333
1195 void xfer32(SkPMColor*, const SkPMColor*, int, const SkAlpha*) const override; 1334 void xfer32(SkPMColor*, const SkPMColor*, int, const SkAlpha*) const override;
1196 1335
1197 SK_TO_STRING_OVERRIDE() 1336 SK_TO_STRING_OVERRIDE()
1198 1337
(...skipping 39 matching lines...) Expand 10 before | Expand all | Expand 10 after
1238 SkXfermode* create_mode(int iMode) { 1377 SkXfermode* create_mode(int iMode) {
1239 SkXfermode::Mode mode = (SkXfermode::Mode)iMode; 1378 SkXfermode::Mode mode = (SkXfermode::Mode)iMode;
1240 1379
1241 ProcCoeff rec = gProcCoeffs[mode]; 1380 ProcCoeff rec = gProcCoeffs[mode];
1242 SkXfermodeProc pp = SkPlatformXfermodeProcFactory(mode); 1381 SkXfermodeProc pp = SkPlatformXfermodeProcFactory(mode);
1243 if (pp != NULL) { 1382 if (pp != NULL) {
1244 rec.fProc = pp; 1383 rec.fProc = pp;
1245 } 1384 }
1246 1385
1247 SkXfermode* xfer = NULL; 1386 SkXfermode* xfer = NULL;
1387
1388 #ifndef SK_SUPPORT_LEGACY_SCALAR_XFERMODES
1389 switch (mode) {
1390 case SkXfermode::kSrcATop_Mode:
1391 xfer = SkT4fXfermode<SrcATop4f>::Create(rec);
1392 break;
1393 case SkXfermode::kDstATop_Mode:
1394 xfer = SkT4fXfermode<DstATop4f>::Create(rec);
1395 break;
1396 case SkXfermode::kXor_Mode:
1397 xfer = SkT4fXfermode<Xor4f>::Create(rec);
1398 break;
1399 case SkXfermode::kPlus_Mode:
1400 xfer = SkT4fXfermode<Plus4f>::Create(rec);
1401 break;
1402 case SkXfermode::kModulate_Mode:
1403 xfer = SkT4fXfermode<Modulate4f>::Create(rec);
1404 break;
1405 case SkXfermode::kScreen_Mode:
1406 xfer = SkT4fXfermode<Screen4f>::Create(rec);
1407 break;
1408 default:
1409 break;
1410 }
1411 if (xfer) {
1412 return xfer;
1413 }
1414 #endif
1415
1248 // check if we have a platform optim for that 1416 // check if we have a platform optim for that
1249 SkProcCoeffXfermode* xfm = SkPlatformXfermodeFactory(rec, mode); 1417 SkProcCoeffXfermode* xfm = SkPlatformXfermodeFactory(rec, mode);
1250 if (xfm != NULL) { 1418 if (xfm != NULL) {
1251 xfer = xfm; 1419 xfer = xfm;
1252 } else { 1420 } else {
1253 // All modes can in theory be represented by the ProcCoeff rec, since 1421 // All modes can in theory be represented by the ProcCoeff rec, since
1254 // it contains function ptrs. However, a few modes are both simple and 1422 // it contains function ptrs. However, a few modes are both simple and
1255 // commonly used, so we call those out for their own subclasses here. 1423 // commonly used, so we call those out for their own subclasses here.
1256 switch (mode) { 1424 switch (mode) {
1257 case SkXfermode::kClear_Mode: 1425 case SkXfermode::kClear_Mode:
(...skipping 278 matching lines...) Expand 10 before | Expand all | Expand 10 after
1536 } else { 1704 } else {
1537 proc16 = rec.fProc16_General; 1705 proc16 = rec.fProc16_General;
1538 } 1706 }
1539 } 1707 }
1540 return proc16; 1708 return proc16;
1541 } 1709 }
1542 1710
1543 SK_DEFINE_FLATTENABLE_REGISTRAR_GROUP_START(SkXfermode) 1711 SK_DEFINE_FLATTENABLE_REGISTRAR_GROUP_START(SkXfermode)
1544 SK_DEFINE_FLATTENABLE_REGISTRAR_ENTRY(SkProcCoeffXfermode) 1712 SK_DEFINE_FLATTENABLE_REGISTRAR_ENTRY(SkProcCoeffXfermode)
1545 SK_DEFINE_FLATTENABLE_REGISTRAR_GROUP_END 1713 SK_DEFINE_FLATTENABLE_REGISTRAR_GROUP_END
OLDNEW
« no previous file with comments | « bench/XfermodeBench.cpp ('k') | no next file » | no next file with comments »

Powered by Google App Engine
This is Rietveld 408576698