src/opts/SkXfermode_opts_arm_neon.cpp - Issue 104883004: ARM Skia NEON patches - 32 - Xfermode: 1-pixel NEON modeprocs

Unified Diff: src/opts/SkXfermode_opts_arm_neon.cpp

Issue 104883004: ARM Skia NEON patches - 32 - Xfermode: 1-pixel NEON modeprocs (Closed) Base URL: https://skia.googlecode.com/svn/trunk

Patch Set: Created 7 years ago

Use n/p to move between diff chunks; N/P to move between comments. Draft comments are only viewable by you.

Jump to:

View side-by-side diff with in-line comments

Download patch

Index: src/opts/SkXfermode_opts_arm_neon.cpp

diff --git a/src/opts/SkXfermode_opts_arm_neon.cpp b/src/opts/SkXfermode_opts_arm_neon.cpp

index 7435dd44de102af82ac3af028fb57da1be8ac7a4..c920e537b1e551f87d093dbdfcdc7f84d155f04b 100644

--- a/src/opts/SkXfermode_opts_arm_neon.cpp

+++ b/src/opts/SkXfermode_opts_arm_neon.cpp

@@ -93,6 +93,133 @@ static inline uint8x8_t clamp_div255round_simd8_32(int32x4_t val1, int32x4_t val

}

////////////////////////////////////////////////////////////////////////////////

+// 1 pixel modeprocs

+////////////////////////////////////////////////////////////////////////////////

+// kSrcATop_Mode, //!< [Da, Sc * Da + (1 - Sa) * Dc]

+SkPMColor srcatop_modeproc_neon(SkPMColor src, SkPMColor dst) {

+ unsigned sa = SkGetPackedA32(src);

+ unsigned da = SkGetPackedA32(dst);

+ unsigned isa = 255 - sa;

+ uint8x8_t vda, visa, vsrc, vdst;

+ vda = vdup_n_u8(da);

+ visa = vdup_n_u8(isa);

+ uint16x8_t vsrc_wide, vdst_wide;

+ vsrc_wide = vmull_u8(vda, vreinterpret_u8_u32(vdup_n_u32(src)));

+ vdst_wide = vmull_u8(visa, vreinterpret_u8_u32(vdup_n_u32(dst)));

+ vsrc_wide += vdupq_n_u16(128);

+ vsrc_wide += vshrq_n_u16(vsrc_wide, 8);

+ vdst_wide += vdupq_n_u16(128);

+ vdst_wide += vshrq_n_u16(vdst_wide, 8);

+ vsrc = vshrn_n_u16(vsrc_wide, 8);

+ vdst = vshrn_n_u16(vdst_wide, 8);

+ vsrc += vdst;

+ vsrc = vset_lane_u8(da, vsrc, 3);

+ return vget_lane_u32(vreinterpret_u32_u8(vsrc), 0);

+// kDstATop_Mode, //!< [Sa, Sa * Dc + Sc * (1 - Da)]

+SkPMColor dstatop_modeproc_neon(SkPMColor src, SkPMColor dst) {

+ unsigned sa = SkGetPackedA32(src);

+ unsigned da = SkGetPackedA32(dst);

+ unsigned ida = 255 - da;

+ uint8x8_t vsa, vida, vsrc, vdst;

+ vsa = vdup_n_u8(sa);

+ vida = vdup_n_u8(ida);

+ uint16x8_t vsrc_wide, vdst_wide;

+ vsrc_wide = vmull_u8(vida, vreinterpret_u8_u32(vdup_n_u32(src)));

+ vdst_wide = vmull_u8(vsa, vreinterpret_u8_u32(vdup_n_u32(dst)));

+ vsrc_wide += vdupq_n_u16(128);

+ vsrc_wide += vshrq_n_u16(vsrc_wide, 8);

+ vdst_wide += vdupq_n_u16(128);

+ vdst_wide += vshrq_n_u16(vdst_wide, 8);

+ vsrc = vshrn_n_u16(vsrc_wide, 8);

+ vdst = vshrn_n_u16(vdst_wide, 8);

+ vsrc += vdst;

+ vsrc = vset_lane_u8(sa, vsrc, 3);

+ return vget_lane_u32(vreinterpret_u32_u8(vsrc), 0);

+// kXor_Mode [Sa + Da - 2 * Sa * Da, Sc * (1 - Da) + (1 - Sa) * Dc]

+SkPMColor xor_modeproc_neon(SkPMColor src, SkPMColor dst) {

+ unsigned sa = SkGetPackedA32(src);

+ unsigned da = SkGetPackedA32(dst);

+ unsigned ret_alpha = sa + da - (SkAlphaMulAlpha(sa, da) << 1);

+ unsigned isa = 255 - sa;

+ unsigned ida = 255 - da;

+ uint8x8_t vsrc, vdst, visa, vida;

+ uint16x8_t vsrc_wide, vdst_wide;

+ visa = vdup_n_u8(isa);

+ vida = vdup_n_u8(ida);

+ vsrc = vreinterpret_u8_u32(vdup_n_u32(src));

+ vdst = vreinterpret_u8_u32(vdup_n_u32(dst));

+ vsrc_wide = vmull_u8(vsrc, vida);

+ vdst_wide = vmull_u8(vdst, visa);

+ vsrc_wide += vdupq_n_u16(128);

+ vsrc_wide += vshrq_n_u16(vsrc_wide, 8);

+ vdst_wide += vdupq_n_u16(128);

+ vdst_wide += vshrq_n_u16(vdst_wide, 8);

+ vsrc = vshrn_n_u16(vsrc_wide, 8);

+ vdst = vshrn_n_u16(vdst_wide, 8);

+ vsrc += vdst;

+ vsrc = vset_lane_u8(ret_alpha, vsrc, 3);

+ return vget_lane_u32(vreinterpret_u32_u8(vsrc), 0);

+// kPlus_Mode

+SkPMColor plus_modeproc_neon(SkPMColor src, SkPMColor dst) {

+ uint8x8_t vsrc, vdst;

+ vsrc = vreinterpret_u8_u32(vdup_n_u32(src));

+ vdst = vreinterpret_u8_u32(vdup_n_u32(dst));

+ vsrc = vqadd_u8(vsrc, vdst);

+ return vget_lane_u32(vreinterpret_u32_u8(vsrc), 0);

+// kModulate_Mode

+SkPMColor modulate_modeproc_neon(SkPMColor src, SkPMColor dst) {

+ uint8x8_t vsrc, vdst, vres;

+ uint16x8_t vres_wide;

+ vsrc = vreinterpret_u8_u32(vdup_n_u32(src));

+ vdst = vreinterpret_u8_u32(vdup_n_u32(dst));

+ vres_wide = vmull_u8(vsrc, vdst);

+ vres_wide += vdupq_n_u16(128);

+ vres_wide += vshrq_n_u16(vres_wide, 8);

+ vres = vshrn_n_u16(vres_wide, 8);

+ return vget_lane_u32(vreinterpret_u32_u8(vres), 0);

+////////////////////////////////////////////////////////////////////////////////

// 8 pixels modeprocs

////////////////////////////////////////////////////////////////////////////////

« src/core/SkXfermode.cpp ('K') | « src/opts/SkXfermode_opts_arm_neon.h ('k') | no next file » | no next file with comments »