| OLD | NEW |
| 1 #include "SkColorPriv.h" | 1 #include "SkColorPriv.h" |
| 2 #include <arm_neon.h> | 2 #include <arm_neon.h> |
| 3 | 3 |
| 4 // For set(), we widen our 8 bit components (fix8) to 8-bit components in 16 bit
s (fix8_16), | 4 // For SkPMFloat(SkPMColor), we widen our 8 bit components (fix8) to 8-bit comp
onents in 16 bits |
| 5 // then widen those to 8-bit-in-32-bits (fix8_32), and finally convert those to
floats. | 5 // (fix8_16), then widen those to 8-bit-in-32-bits (fix8_32), and finally conver
t those to floats. |
| 6 | 6 |
| 7 // get() and clamped() do the opposite, working from floats to 8-bit-in-32-bit, | 7 // get() and clamped() do the opposite, working from floats to 8-bit-in-32-bit, |
| 8 // to 8-bit-in-16-bit, back down to 8-bit components. | 8 // to 8-bit-in-16-bit, back down to 8-bit components. |
| 9 // clamped() uses vqmovn to clamp while narrowing instead of just narrowing with
vmovn. | 9 // clamped() uses vqmovn to clamp while narrowing instead of just narrowing with
vmovn. |
| 10 | 10 |
| 11 inline void SkPMFloat::set(SkPMColor c) { | 11 inline SkPMFloat::SkPMFloat(SkPMColor c) { |
| 12 SkPMColorAssert(c); | 12 SkPMColorAssert(c); |
| 13 uint8x8_t fix8 = (uint8x8_t)vdup_n_u32(c); | 13 uint8x8_t fix8 = (uint8x8_t)vdup_n_u32(c); |
| 14 uint16x8_t fix8_16 = vmovl_u8(fix8); | 14 uint16x8_t fix8_16 = vmovl_u8(fix8); |
| 15 uint32x4_t fix8_32 = vmovl_u16(vget_low_u16(fix8_16)); | 15 uint32x4_t fix8_32 = vmovl_u16(vget_low_u16(fix8_16)); |
| 16 vst1q_f32(fColor, vcvtq_f32_u32(fix8_32)); | 16 vst1q_f32(fColor, vcvtq_f32_u32(fix8_32)); |
| 17 SkASSERT(this->isValid()); | 17 SkASSERT(this->isValid()); |
| 18 } | 18 } |
| 19 | 19 |
| 20 inline SkPMColor SkPMFloat::get() const { | 20 inline SkPMColor SkPMFloat::get() const { |
| 21 SkASSERT(this->isValid()); | 21 SkASSERT(this->isValid()); |
| 22 float32x4_t add_half = vaddq_f32(vld1q_f32(fColor), vdupq_n_f32(0.5f)); | 22 float32x4_t add_half = vaddq_f32(vld1q_f32(fColor), vdupq_n_f32(0.5f)); |
| 23 uint32x4_t fix8_32 = vcvtq_u32_f32(add_half); // vcvtq_u32_f32 truncates,
so round manually | 23 uint32x4_t fix8_32 = vcvtq_u32_f32(add_half); // vcvtq_u32_f32 truncates,
so round manually |
| 24 uint16x4_t fix8_16 = vmovn_u32(fix8_32); | 24 uint16x4_t fix8_16 = vmovn_u32(fix8_32); |
| 25 uint8x8_t fix8 = vmovn_u16(vcombine_u16(fix8_16, vdup_n_u16(0))); | 25 uint8x8_t fix8 = vmovn_u16(vcombine_u16(fix8_16, vdup_n_u16(0))); |
| 26 SkPMColor c = vget_lane_u32((uint32x2_t)fix8, 0); | 26 SkPMColor c = vget_lane_u32((uint32x2_t)fix8, 0); |
| 27 SkPMColorAssert(c); | 27 SkPMColorAssert(c); |
| 28 return c; | 28 return c; |
| 29 } | 29 } |
| 30 | 30 |
| 31 inline SkPMColor SkPMFloat::clamped() const { | 31 inline SkPMColor SkPMFloat::clamped() const { |
| 32 float32x4_t add_half = vaddq_f32(vld1q_f32(fColor), vdupq_n_f32(0.5f)); | 32 float32x4_t add_half = vaddq_f32(vld1q_f32(fColor), vdupq_n_f32(0.5f)); |
| 33 uint32x4_t fix8_32 = vcvtq_u32_f32(add_half); // vcvtq_u32_f32 truncates,
so round manually | 33 uint32x4_t fix8_32 = vcvtq_u32_f32(add_half); // vcvtq_u32_f32 truncates,
so round manually |
| 34 uint16x4_t fix8_16 = vqmovn_u32(fix8_32); | 34 uint16x4_t fix8_16 = vqmovn_u32(fix8_32); |
| 35 uint8x8_t fix8 = vqmovn_u16(vcombine_u16(fix8_16, vdup_n_u16(0))); | 35 uint8x8_t fix8 = vqmovn_u16(vcombine_u16(fix8_16, vdup_n_u16(0))); |
| 36 SkPMColor c = vget_lane_u32((uint32x2_t)fix8, 0); | 36 SkPMColor c = vget_lane_u32((uint32x2_t)fix8, 0); |
| 37 SkPMColorAssert(c); | 37 SkPMColorAssert(c); |
| 38 return c; | 38 return c; |
| 39 } | 39 } |
| OLD | NEW |