third_party/WebKit/Source/platform/cpu/mips/CommonMacrosMSA.h - Issue 2392443003: Add MSA (MIPS SIMD Arch) optimized color conversion functions

Unified Diff: third_party/WebKit/Source/platform/cpu/mips/CommonMacrosMSA.h

Issue 2392443003: Add MSA (MIPS SIMD Arch) optimized color conversion functions (Closed)

Patch Set: Created 4 years, 2 months ago

Use n/p to move between diff chunks; N/P to move between comments. Draft comments are only viewable by you.

Jump to:

View side-by-side diff with in-line comments

Index: third_party/WebKit/Source/platform/cpu/mips/CommonMacrosMSA.h

diff --git a/third_party/WebKit/Source/platform/cpu/mips/CommonMacrosMSA.h b/third_party/WebKit/Source/platform/cpu/mips/CommonMacrosMSA.h

index e20cfca38a9e8201ab46ee507f1894b38feefa13..5f3d3326c2e69dc54cead1d1054b4c4c9e550448 100644

--- a/third_party/WebKit/Source/platform/cpu/mips/CommonMacrosMSA.h

+++ b/third_party/WebKit/Source/platform/cpu/mips/CommonMacrosMSA.h

@@ -142,6 +142,14 @@ MSA_STORE_FUNC(uint32_t, usw, msa_usw);

#define LD_UH4(...) LD_V4(v8u16, __VA_ARGS__)

#define LD_SP4(...) LD_V4(v4f32, __VA_ARGS__)

+#define LD_V5(RTYPE, psrc, stride, out0, out1, out2, out3, out4) \

+ { \

+ LD_V4(RTYPE, psrc, stride, out0, out1, out2, out3); \

+ out4 = LD_V(RTYPE, psrc); \

+ psrc += stride; \

+ }

+#define LD_UB5(...) LD_V5(v16u8, __VA_ARGS__)

#define LD_V6(RTYPE, psrc, stride, out0, out1, out2, out3, out4, out5) \

{ \

LD_V4(RTYPE, psrc, stride, out0, out1, out2, out3); \

@@ -151,6 +159,13 @@ MSA_STORE_FUNC(uint32_t, usw, msa_usw);

#define LD_UH6(...) LD_V6(v8u16, __VA_ARGS__)

#define LD_SP6(...) LD_V6(v4f32, __VA_ARGS__)

+#define LD_V7(RTYPE, psrc, stride, out0, out1, out2, out3, out4, out5, out6) \

+ { \

+ LD_V5(RTYPE, psrc, stride, out0, out1, out2, out3, out4); \

+ LD_V2(RTYPE, psrc, stride, out5, out6); \

+ }

+#define LD_UB7(...) LD_V7(v16u8, __VA_ARGS__)

#define LD_V8(RTYPE, psrc, stride, out0, out1, out2, out3, out4, out5, out6, \

out7) \

{ \

@@ -212,6 +227,17 @@ MSA_STORE_FUNC(uint32_t, usw, msa_usw);

#define ST_UB8(...) ST_V8(v16u8, __VA_ARGS__)

#define ST_SP8(...) ST_V8(v4f32, __VA_ARGS__)

+/* Description : Store 8x1 byte block to destination memory from input vector

+ Arguments : Inputs - in, pdst

+ Details : Index 0 double word element from 'in' vector is copied to the

+ GP register and stored to (pdst)

+*/

+#define ST8x1_UB(in, pdst) \

+ { \

+ const uint64_t out0m = __msa_copy_s_d((v2i64)in, 0); \

+ SD(out0m, pdst); \

+ }

/* Description : Logical and in0 and in1.

Arguments : Inputs - in0, in1, in2, in3,

Outputs - out0, out1, out2, out3

@@ -297,6 +323,14 @@ MSA_STORE_FUNC(uint32_t, usw, msa_usw);

#define SHF_B2_UB(...) SHF_B2(v16u8, __VA_ARGS__)

#define SHF_B2_UH(...) SHF_B2(v8u16, __VA_ARGS__)

+#define SHF_B3(RTYPE, in0, in1, in2, shf_val) \

+ { \

+ SHF_B2(RTYPE, in0, in1, shf_val); \

+ in2 = (RTYPE)__msa_shf_b((v16i8)in2, shf_val); \

+ }

+#define SHF_B3_UB(...) SHF_B3(v16u8, __VA_ARGS__)

+#define SHF_B3_UH(...) SHF_B3(v8u16, __VA_ARGS__)

#define SHF_B4(RTYPE, in0, in1, in2, in3, shf_val) \

{ \

SHF_B2(RTYPE, in0, in1, shf_val); \

@@ -305,6 +339,17 @@ MSA_STORE_FUNC(uint32_t, usw, msa_usw);

#define SHF_B4_UB(...) SHF_B4(v16u8, __VA_ARGS__)

#define SHF_B4_UH(...) SHF_B4(v8u16, __VA_ARGS__)

+/* Description : Shuffle byte vector elements as per mask vector

+ Arguments : Inputs - in0, in1, in2, in3, mask0, mask1

+ Outputs - out0, out1

+ Return Type - as per RTYPE

+ Details : Byte elements from 'in0' & 'in1' are copied selectively to

+ 'out0' as per control vector 'mask0'

+*/

+#define VSHF_B(RTYPE, in0, in1, mask) \

+ (RTYPE) __msa_vshf_b((v16i8)mask, (v16i8)in1, (v16i8)in0);

+#define VSHF_UB(...) VSHF_B(v16u8, __VA_ARGS__)

/* Description : Interleave even byte elements from vectors

Arguments : Inputs - in0, in1, in2, in3

Outputs - out0, out1

@@ -341,6 +386,35 @@ MSA_STORE_FUNC(uint32_t, usw, msa_usw);

}

#define ILVEV_H2_UB(...) ILVEV_H2(v16u8, __VA_ARGS__)

+/* Description : Interleave right half of double word elements from vectors

+ * Arguments : Inputs - in0, in1, in2, in3

+ * Outputs - out0, out1

+ * Return Type - as per RTYPE

+ * Details : Right half of double word elements of 'in0' and 'in1' are

+ * interleaved and written to 'out0'.

+ */

+#define ILVR_D2(RTYPE, in0, in1, in2, in3, out0, out1) \

+ { \

+ out0 = (RTYPE)__msa_ilvr_d((v2i64)in0, (v2i64)in1); \

+ out1 = (RTYPE)__msa_ilvr_d((v2i64)in2, (v2i64)in3); \

+ }

+#define ILVR_D2_UB(...) ILVR_D2(v16u8, __VA_ARGS__)

+#define ILVR_D3(RTYPE, in0, in1, in2, in3, in4, in5, out0, out1, out2) \

+ { \

+ ILVR_D2(RTYPE, in0, in1, in2, in3, out0, out1); \

+ out2 = (RTYPE)__msa_ilvr_d((v2i64)in4, (v2i64)in5); \

+ }

+#define ILVR_D3_UB(...) ILVR_D3(v16u8, __VA_ARGS__)

+#define ILVR_D4(RTYPE, in0, in1, in2, in3, in4, in5, in6, in7, out0, out1, \

+ out2, out3) \

+ { \

+ ILVR_D2(RTYPE, in0, in1, in2, in3, out0, out1); \

+ ILVR_D2(RTYPE, in4, in5, in6, in7, out2, out3); \

+ }

+#define ILVR_D4_UB(...) ILVR_D4(v16u8, __VA_ARGS__)

/* Description : Interleave both left and right half of input vectors

Arguments : Inputs - in0, in1

Outputs - out0, out1

@@ -376,6 +450,37 @@ MSA_STORE_FUNC(uint32_t, usw, msa_usw);

}

#define ILVODEV_B2_UB(...) ILVODEV_B2(v16u8, __VA_ARGS__)

+/* Description : Pack even byte elements of vector pairs

+ * Arguments : Inputs - in0, in1, in2, in3

+ * Outputs - out0, out1

+ * Return Type - as per RTYPE

+ * Details : Even byte elements of 'in0' are copied to the left half of

+ * 'out0' & even byte elements of 'in1' are copied to the right

+ * half of 'out0'.

+ */

+#define PCKEV_B2(RTYPE, in0, in1, in2, in3, out0, out1) \

+ { \

+ out0 = (RTYPE)__msa_pckev_b((v16i8)in0, (v16i8)in1); \

+ out1 = (RTYPE)__msa_pckev_b((v16i8)in2, (v16i8)in3); \

+ }

+#define PCKEV_B2_UB(...) PCKEV_B2(v16u8, __VA_ARGS__)

+#define PCKEV_B2_UH(...) PCKEV_B2(v8u16, __VA_ARGS__)

+#define PCKEV_B3(RTYPE, in0, in1, in2, in3, in4, in5, out0, out1, out2) \

+ { \

+ PCKEV_B2(RTYPE, in0, in1, in2, in3, out0, out1); \

+ out2 = (RTYPE)__msa_pckev_b((v16i8)in4, (v16i8)in5); \

+ }

+#define PCKEV_B3_UH(...) PCKEV_B3(v8u16, __VA_ARGS__)

+#define PCKEV_B4(RTYPE, in0, in1, in2, in3, in4, in5, in6, in7, out0, out1, \

+ out2, out3) \

+ { \

+ PCKEV_B2(RTYPE, in0, in1, in2, in3, out0, out1); \

+ PCKEV_B2(RTYPE, in4, in5, in6, in7, out2, out3); \

+ }

+#define PCKEV_B4_UH(...) PCKEV_B4(v8u16, __VA_ARGS__)

/* Description : Pack even halfword elements of vector pairs

Arguments : Inputs - in0, in1, in2, in3

Outputs - out0, out1

@@ -464,6 +569,43 @@ MSA_STORE_FUNC(uint32_t, usw, msa_usw);

}

#define SRLI_B4_UB(...) SRLI_B4(v16u8, __VA_ARGS__)

+/* Description : Logical shift right all elements of vector (immediate)

+ Arguments : Inputs - in0, in1, in2, in3, shift

+ Outputs - out0, out1, out2, out3

+ Return Type - as per RTYPE

+ Details : Each element of vector 'in0' is right shifted by 'shift' and

+ the result is written in 'out0'. 'shift' is an immediate value.

+*/

+#define SRLI_H2(RTYPE, in0, in1, out0, out1, shift) \

+ { \

+ out0 = (RTYPE)SRLI_H((v8i16)in0, shift); \

+ out1 = (RTYPE)SRLI_H((v8i16)in1, shift); \

+ }

+#define SRLI_H2_UB(...) SRLI_H2(v16u8, __VA_ARGS__)

+#define SRLI_H4(RTYPE, in0, in1, in2, in3, out0, out1, out2, out3, shift) \

+ { \

+ SRLI_H2(RTYPE, in0, in1, out0, out1, shift); \

+ SRLI_H2(RTYPE, in2, in3, out2, out3, shift); \

+ }

+#define SRLI_H4_UB(...) SRLI_H4(v16u8, __VA_ARGS__)

+/* Description : Immediate Bit Insert Left (immediate)

+ Arguments : Inputs - in0, in1, in2, in3, shift

+ Outputs - out0, out1

+ Return Type - as per RTYPE

+ Details : Copy most significant (left) bits in each element of vector

+ 'in1' to elements in vector in0 while preserving the least

+ significant (right) bits. The number of bits to copy is given

+ by the immediate 'shift + 1'.

+*/

+#define BINSLI_B2(RTYPE, in0, in1, in2, in3, out0, out1, shift) \

+ { \

+ out0 = (RTYPE)__msa_binsli_b((v16u8)in0, (v16u8)in1, shift); \

+ out1 = (RTYPE)__msa_binsli_b((v16u8)in2, (v16u8)in3, shift); \

+ }

+#define BINSLI_B2_UB(...) BINSLI_B2(v16u8, __VA_ARGS__)

/* Description : Immediate Bit Insert Right (immediate)

Arguments : Inputs - in0, in1, in2, in3, shift

Outputs - out0, out1

« no previous file with comments | « no previous file | third_party/WebKit/Source/platform/graphics/cpu/mips/WebGLImageConversionMSA.h » ('j') | no next file with comments »