Chromium Code Reviews| Index: tests_lit/llvm2ice_tests/vector-ops.ll |
| diff --git a/tests_lit/llvm2ice_tests/vector-ops.ll b/tests_lit/llvm2ice_tests/vector-ops.ll |
| index 86647db26b822136b40c8f58f92028e01545885d..c730d7315cd981518200e359df0fc1c47e9e3a05 100644 |
| --- a/tests_lit/llvm2ice_tests/vector-ops.ll |
| +++ b/tests_lit/llvm2ice_tests/vector-ops.ll |
| @@ -1,10 +1,19 @@ |
| ; This checks support for insertelement and extractelement. |
| -; RUN: %llvm2ice --verbose inst %s | FileCheck %s |
| +; RUN: %llvm2ice -O2 --verbose none %s | FileCheck %s |
| +; RUN: %llvm2ice -Om1 --verbose none %s | FileCheck %s |
| +; RUN: %llvm2ice -O2 -mattr=sse4.1 --verbose none %s \ |
| +; RUN: | FileCheck %s --check-prefix=SSE41 |
| +; RUN: %llvm2ice -Om1 -mattr=sse4.1 --verbose none %s \ |
| +; RUN: | FileCheck %s --check-prefix=SSE41 |
| ; RUN: %llvm2ice -O2 --verbose none %s \ |
| ; RUN: | llvm-mc -arch=x86 -x86-asm-syntax=intel -filetype=obj |
| ; RUN: %llvm2ice -Om1 --verbose none %s \ |
| ; RUN: | llvm-mc -arch=x86 -x86-asm-syntax=intel -filetype=obj |
| +; RUN: %llvm2ice -O2 -mattr=sse4.1 --verbose none %s \ |
| +; RUN: | llvm-mc -arch=x86 -x86-asm-syntax=intel -filetype=obj |
| +; RUN: %llvm2ice -Om1 -mattr=sse4.1 --verbose none %s \ |
| +; RUN: | llvm-mc -arch=x86 -x86-asm-syntax=intel -filetype=obj |
| ; RUN: %llvm2ice --verbose none %s | FileCheck --check-prefix=ERRORS %s |
| ; RUN: %llvm2iceinsts %s | %szdiff %s | FileCheck --check-prefix=DUMP %s |
| ; RUN: %llvm2iceinsts --pnacl %s | %szdiff %s \ |
| @@ -18,6 +27,9 @@ entry: |
| ret <4 x float> %res |
| ; CHECK-LABEL: insertelement_v4f32_0: |
| ; CHECK: movss |
| + |
| +; SSE41-LABEL: insertelement_v4f32_0: |
| +; SSE41: insertps {{.*}}, {{.*}}, 0 |
| } |
| define <4 x i32> @insertelement_v4i32_0(<4 x i32> %vec, i32 %elt) { |
| @@ -26,6 +38,9 @@ entry: |
| ret <4 x i32> %res |
| ; CHECK-LABEL: insertelement_v4i32_0: |
| ; CHECK: movss |
| + |
| +; SSE41-LABEL: insertelement_v4i32_0: |
| +; SSE41: pinsrd {{.*}}, {{.*}}, 0 |
| } |
| @@ -36,6 +51,9 @@ entry: |
| ; CHECK-LABEL: insertelement_v4f32_1: |
| ; CHECK: shufps |
| ; CHECK: shufps |
| + |
| +; SSE41-LABEL: insertelement_v4f32_1: |
| +; SSE41: insertps {{.*}}, {{.*}}, 16 |
| } |
| define <4 x i32> @insertelement_v4i32_1(<4 x i32> %vec, i32 %elt) { |
| @@ -45,6 +63,9 @@ entry: |
| ; CHECK-LABEL: insertelement_v4i32_1: |
| ; CHECK: shufps |
| ; CHECK: shufps |
| + |
| +; SSE41-LABEL: insertelement_v4i32_1: |
| +; SSE41: pinsrd {{.*}}, {{.*}}, 1 |
| } |
| define <8 x i16> @insertelement_v8i16(<8 x i16> %vec, i32 %elt.arg) { |
| @@ -52,8 +73,11 @@ entry: |
| %elt = trunc i32 %elt.arg to i16 |
| %res = insertelement <8 x i16> %vec, i16 %elt, i32 1 |
| ret <8 x i16> %res |
| -; CHECK-LABEL: insertelement_v8i16 |
| +; CHECK-LABEL: insertelement_v8i16: |
| ; CHECK: pinsrw |
| + |
| +; SSE41-LABEL: insertelement_v8i16: |
| +; SSE41: pinsrw |
| } |
| define <16 x i8> @insertelement_v16i8(<16 x i8> %vec, i32 %elt.arg) { |
| @@ -65,6 +89,9 @@ entry: |
| ; CHECK: movups |
| ; CHECK: lea |
| ; CHECK: mov |
| + |
| +; SSE41-LABEL: insertelement_v16i8: |
| +; SSE41: pinsrb |
| } |
| define <4 x i1> @insertelement_v4i1_0(<4 x i1> %vec, i32 %elt.arg) { |
| @@ -74,6 +101,9 @@ entry: |
| ret <4 x i1> %res |
| ; CHECK-LABEL: insertelement_v4i1_0: |
| ; CHECK: movss |
| + |
| +; SSE41-LABEL: insertelement_v4i1_0: |
| +; SSE41: pinsrd {{.*}}, {{.*}}, 0 |
| } |
| define <4 x i1> @insertelement_v4i1_1(<4 x i1> %vec, i32 %elt.arg) { |
| @@ -84,6 +114,9 @@ entry: |
| ; CHECK-LABEL: insertelement_v4i1_1: |
| ; CHECK: shufps |
| ; CHECK: shufps |
| + |
| +; SSE41-LABEL: insertelement_v4i1_1: |
| +; SSE41: pinsrd {{.*}}, {{.*}}, 1 |
| } |
| define <8 x i1> @insertelement_v8i1(<8 x i1> %vec, i32 %elt.arg) { |
| @@ -93,6 +126,9 @@ entry: |
| ret <8 x i1> %res |
| ; CHECK-LABEL: insertelement_v8i1: |
| ; CHECK: pinsrw |
| + |
| +; SSE41-LABEL: insertelement_v8i1: |
| +; SSE41: pinsrw |
| } |
| define <16 x i1> @insertelement_v16i1(<16 x i1> %vec, i32 %elt.arg) { |
| @@ -104,6 +140,9 @@ entry: |
| ; CHECK: movups |
| ; CHECK: lea |
| ; CHECK: mov |
| + |
| +; SSE41-LABEL: insertelement_v16i1: |
| +; SSE41: pinsrb |
| } |
| ; extractelement operations |
| @@ -114,6 +153,9 @@ entry: |
| ret float %res |
| ; CHECK-LABEL: extractelement_v4f32: |
| ; CHECK: pshufd |
| + |
| +; SSE41-LABEL: extractelement_v4f32: |
| +; SSE41: pshufd |
|
jvoung (off chromium)
2014/07/30 04:30:11
Is the plan to use extractps later?
wala
2014/07/30 18:11:55
No. I now think we should not be using extractps t
|
| } |
| define i32 @extractelement_v4i32(<4 x i32> %vec) { |
| @@ -122,6 +164,9 @@ entry: |
| ret i32 %res |
| ; CHECK-LABEL: extractelement_v4i32: |
| ; CHECK: pshufd |
| + |
| +; SSE41-LABEL: extractelement_v4i32: |
| +; SSE41: pextrd |
| } |
| define i32 @extractelement_v8i16(<8 x i16> %vec) { |
| @@ -131,6 +176,9 @@ entry: |
| ret i32 %res.ext |
| ; CHECK-LABEL: extractelement_v8i16: |
| ; CHECK: pextrw |
| + |
| +; SSE41-LABEL: extractelement_v8i16: |
| +; SSE41: pextrw |
| } |
| define i32 @extractelement_v16i8(<16 x i8> %vec) { |
| @@ -142,6 +190,9 @@ entry: |
| ; CHECK: movups |
| ; CHECK: lea |
| ; CHECK: mov |
| + |
| +; SSE41-LABEL: extractelement_v16i8: |
| +; SSE41: pextrb |
| } |
| define i32 @extractelement_v4i1(<4 x i1> %vec) { |
| @@ -151,6 +202,9 @@ entry: |
| ret i32 %res.ext |
| ; CHECK-LABEL: extractelement_v4i1: |
| ; CHECK: pshufd |
| + |
| +; SSE41-LABEL: extractelement_v4i1: |
| +; SSE41: pextrd |
| } |
| define i32 @extractelement_v8i1(<8 x i1> %vec) { |
| @@ -160,6 +214,9 @@ entry: |
| ret i32 %res.ext |
| ; CHECK-LABEL: extractelement_v8i1: |
| ; CHECK: pextrw |
| + |
| +; SSE41-LABEL: extractelement_v8i1: |
| +; SSE41: pextrw |
| } |
| define i32 @extractelement_v16i1(<16 x i1> %vec) { |
| @@ -171,6 +228,9 @@ entry: |
| ; CHECK: movups |
| ; CHECK: lea |
| ; CHECK: mov |
| + |
| +; SSE41-LABEL: extractelement_v16i1: |
| +; SSE41: pextrb |
| } |
| ; ERRORS-NOT: ICE translation error |