OLD | NEW |
1 #ifndef Sk4x_DEFINED | 1 #ifndef Sk4x_DEFINED |
2 #define Sk4x_DEFINED | 2 #define Sk4x_DEFINED |
3 | 3 |
4 #include "SkTypes.h" | 4 #include "SkTypes.h" |
5 | 5 |
6 #define SK4X_PREAMBLE 1 | 6 #define SK4X_PREAMBLE 1 |
7 #if SK_CPU_SSE_LEVEL >= SK_CPU_SSE_LEVEL_SSE2 | 7 #include "Sk4x_portable.h" |
8 #include "Sk4x_sse.h" | |
9 #else | |
10 #include "Sk4x_portable.h" | |
11 #endif | |
12 #undef SK4X_PREAMBLE | 8 #undef SK4X_PREAMBLE |
13 | 9 |
14 template <typename T> class Sk4x; | 10 template <typename T> class Sk4x; |
15 typedef Sk4x<float> Sk4f; | 11 typedef Sk4x<float> Sk4f; |
16 typedef Sk4x<int32_t> Sk4i; | 12 typedef Sk4x<int32_t> Sk4i; |
17 | 13 |
18 // Some Sk4x methods are implemented only for Sk4f or Sk4i. | |
19 // They might be unavailable, really slow, or just a bad idea. | |
20 // Talk to mtklein if you find yourself unable to link and | |
21 // really need one of those methods. | |
22 | |
23 template <typename T> class Sk4x { | 14 template <typename T> class Sk4x { |
24 public: | 15 public: |
25 Sk4x(); // Uninitialized; use Sk4x(0,0,0,0) for zero. | 16 Sk4x(); // Uninitialized; use Sk4x(0,0,0,0) for zero. |
26 Sk4x(T, T, T, T); | 17 Sk4x(T, T, T, T); |
27 | 18 |
28 Sk4x(const Sk4x&); | 19 Sk4x(const Sk4x&); |
29 Sk4x& operator=(const Sk4x&); | 20 Sk4x& operator=(const Sk4x&); |
30 | 21 |
31 static Sk4x Load (const T[4]); | 22 static Sk4x Load (const T[4]); |
32 static Sk4x LoadAligned(const T[4]); | 23 static Sk4x LoadAligned(const T[4]); |
33 | 24 |
34 void store (T[4]) const; | 25 void store (T[4]) const; |
35 void storeAligned(T[4]) const; | 26 void storeAligned(T[4]) const; |
36 | 27 |
37 template <typename Dst> Dst reinterpret() const; | 28 template <typename Dst> Dst reinterpret() const; |
38 template <typename Dst> Dst cast() const; | 29 template <typename Dst> Dst cast() const; |
39 | 30 |
40 bool allTrue() const; | 31 bool allTrue() const; |
41 bool anyTrue() const; | 32 bool anyTrue() const; |
42 | 33 |
43 Sk4x bitNot() const; | 34 Sk4x bitNot() const; |
44 Sk4x bitAnd(const Sk4x&) const; | 35 Sk4x bitAnd(const Sk4x&) const; |
45 Sk4x bitOr(const Sk4x&) const; | 36 Sk4x bitOr(const Sk4x&) const; |
46 // TODO: Sk4x bitAndNot(const Sk4x&) const; is efficient in SSE. | |
47 Sk4x add(const Sk4x&) const; | 37 Sk4x add(const Sk4x&) const; |
48 Sk4x subtract(const Sk4x&) const; | 38 Sk4x subtract(const Sk4x&) const; |
49 Sk4x multiply(const Sk4x&) const; | 39 Sk4x multiply(const Sk4x&) const; |
50 Sk4x divide(const Sk4x&) const; | 40 Sk4x divide(const Sk4x&) const; |
51 | 41 |
52 Sk4i equal(const Sk4x&) const; | 42 Sk4i equal(const Sk4x&) const; |
53 Sk4i notEqual(const Sk4x&) const; | 43 Sk4i notEqual(const Sk4x&) const; |
54 Sk4i lessThan(const Sk4x&) const; | 44 Sk4i lessThan(const Sk4x&) const; |
55 Sk4i greaterThan(const Sk4x&) const; | 45 Sk4i greaterThan(const Sk4x&) const; |
56 Sk4i lessThanEqual(const Sk4x&) const; | 46 Sk4i lessThanEqual(const Sk4x&) const; |
57 Sk4i greaterThanEqual(const Sk4x&) const; | 47 Sk4i greaterThanEqual(const Sk4x&) const; |
58 | 48 |
59 static Sk4x Min(const Sk4x& a, const Sk4x& b); | 49 static Sk4x Min(const Sk4x& a, const Sk4x& b); |
60 static Sk4x Max(const Sk4x& a, const Sk4x& b); | 50 static Sk4x Max(const Sk4x& a, const Sk4x& b); |
61 | 51 |
62 // Swizzles follow OpenCL xyzw convention. | 52 // Swizzles follow OpenCL xyzw convention. |
63 Sk4x zwxy() const; | 53 Sk4x zwxy() const; |
64 | 54 |
65 // When there's a second argument, it's abcd. | 55 // When there's a second argument, it's abcd. |
66 static Sk4x XYAB(const Sk4x& xyzw, const Sk4x& abcd); | 56 static Sk4x XYAB(const Sk4x& xyzw, const Sk4x& abcd); |
67 static Sk4x ZWCD(const Sk4x& xyzw, const Sk4x& abcd); | 57 static Sk4x ZWCD(const Sk4x& xyzw, const Sk4x& abcd); |
68 | 58 |
69 // TODO: these are particularly efficient in SSE. Useful? Also efficient i
n NEON? | |
70 // static Sk4x XAYB(const Sk4x& xyzw, const Sk4x& abcd); | |
71 // static Sk4x ZCWD(const Sk4x& xyzw, const Sk4x& abcd); | |
72 | |
73 private: | 59 private: |
74 // It's handy to have Sk4f and Sk4i be mutual friends. | 60 // It's handy to have Sk4f and Sk4i be mutual friends. |
75 template <typename S> friend class Sk4x; | 61 template <typename S> friend class Sk4x; |
76 | 62 |
77 #define SK4X_PRIVATE 1 | 63 #define SK4X_PRIVATE 1 |
78 #if SK_CPU_SSE_LEVEL >= SK_CPU_SSE_LEVEL_SSE2 | 64 #include "Sk4x_portable.h" |
79 #include "Sk4x_sse.h" | |
80 #else | |
81 #include "Sk4x_portable.h" | |
82 #endif | |
83 #undef SK4X_PRIVATE | 65 #undef SK4X_PRIVATE |
84 }; | 66 }; |
85 | 67 |
86 #if SK_CPU_SSE_LEVEL >= SK_CPU_SSE_LEVEL_SSE2 | 68 #include "Sk4x_portable.h" |
87 #include "Sk4x_sse.h" | |
88 #else | |
89 #include "Sk4x_portable.h" | |
90 #endif | |
91 | 69 |
92 #endif//Sk4x_DEFINED | 70 #endif//Sk4x_DEFINED |
OLD | NEW |