Index: tests_lit/llvm2ice_tests/vector-ops.ll |
diff --git a/tests_lit/llvm2ice_tests/vector-ops.ll b/tests_lit/llvm2ice_tests/vector-ops.ll |
index 86647db26b822136b40c8f58f92028e01545885d..c730d7315cd981518200e359df0fc1c47e9e3a05 100644 |
--- a/tests_lit/llvm2ice_tests/vector-ops.ll |
+++ b/tests_lit/llvm2ice_tests/vector-ops.ll |
@@ -1,10 +1,19 @@ |
; This checks support for insertelement and extractelement. |
-; RUN: %llvm2ice --verbose inst %s | FileCheck %s |
+; RUN: %llvm2ice -O2 --verbose none %s | FileCheck %s |
+; RUN: %llvm2ice -Om1 --verbose none %s | FileCheck %s |
+; RUN: %llvm2ice -O2 -mattr=sse4.1 --verbose none %s \ |
+; RUN: | FileCheck %s --check-prefix=SSE41 |
+; RUN: %llvm2ice -Om1 -mattr=sse4.1 --verbose none %s \ |
+; RUN: | FileCheck %s --check-prefix=SSE41 |
; RUN: %llvm2ice -O2 --verbose none %s \ |
; RUN: | llvm-mc -arch=x86 -x86-asm-syntax=intel -filetype=obj |
; RUN: %llvm2ice -Om1 --verbose none %s \ |
; RUN: | llvm-mc -arch=x86 -x86-asm-syntax=intel -filetype=obj |
+; RUN: %llvm2ice -O2 -mattr=sse4.1 --verbose none %s \ |
+; RUN: | llvm-mc -arch=x86 -x86-asm-syntax=intel -filetype=obj |
+; RUN: %llvm2ice -Om1 -mattr=sse4.1 --verbose none %s \ |
+; RUN: | llvm-mc -arch=x86 -x86-asm-syntax=intel -filetype=obj |
; RUN: %llvm2ice --verbose none %s | FileCheck --check-prefix=ERRORS %s |
; RUN: %llvm2iceinsts %s | %szdiff %s | FileCheck --check-prefix=DUMP %s |
; RUN: %llvm2iceinsts --pnacl %s | %szdiff %s \ |
@@ -18,6 +27,9 @@ entry: |
ret <4 x float> %res |
; CHECK-LABEL: insertelement_v4f32_0: |
; CHECK: movss |
+ |
+; SSE41-LABEL: insertelement_v4f32_0: |
+; SSE41: insertps {{.*}}, {{.*}}, 0 |
} |
define <4 x i32> @insertelement_v4i32_0(<4 x i32> %vec, i32 %elt) { |
@@ -26,6 +38,9 @@ entry: |
ret <4 x i32> %res |
; CHECK-LABEL: insertelement_v4i32_0: |
; CHECK: movss |
+ |
+; SSE41-LABEL: insertelement_v4i32_0: |
+; SSE41: pinsrd {{.*}}, {{.*}}, 0 |
} |
@@ -36,6 +51,9 @@ entry: |
; CHECK-LABEL: insertelement_v4f32_1: |
; CHECK: shufps |
; CHECK: shufps |
+ |
+; SSE41-LABEL: insertelement_v4f32_1: |
+; SSE41: insertps {{.*}}, {{.*}}, 16 |
} |
define <4 x i32> @insertelement_v4i32_1(<4 x i32> %vec, i32 %elt) { |
@@ -45,6 +63,9 @@ entry: |
; CHECK-LABEL: insertelement_v4i32_1: |
; CHECK: shufps |
; CHECK: shufps |
+ |
+; SSE41-LABEL: insertelement_v4i32_1: |
+; SSE41: pinsrd {{.*}}, {{.*}}, 1 |
} |
define <8 x i16> @insertelement_v8i16(<8 x i16> %vec, i32 %elt.arg) { |
@@ -52,8 +73,11 @@ entry: |
%elt = trunc i32 %elt.arg to i16 |
%res = insertelement <8 x i16> %vec, i16 %elt, i32 1 |
ret <8 x i16> %res |
-; CHECK-LABEL: insertelement_v8i16 |
+; CHECK-LABEL: insertelement_v8i16: |
; CHECK: pinsrw |
+ |
+; SSE41-LABEL: insertelement_v8i16: |
+; SSE41: pinsrw |
} |
define <16 x i8> @insertelement_v16i8(<16 x i8> %vec, i32 %elt.arg) { |
@@ -65,6 +89,9 @@ entry: |
; CHECK: movups |
; CHECK: lea |
; CHECK: mov |
+ |
+; SSE41-LABEL: insertelement_v16i8: |
+; SSE41: pinsrb |
} |
define <4 x i1> @insertelement_v4i1_0(<4 x i1> %vec, i32 %elt.arg) { |
@@ -74,6 +101,9 @@ entry: |
ret <4 x i1> %res |
; CHECK-LABEL: insertelement_v4i1_0: |
; CHECK: movss |
+ |
+; SSE41-LABEL: insertelement_v4i1_0: |
+; SSE41: pinsrd {{.*}}, {{.*}}, 0 |
} |
define <4 x i1> @insertelement_v4i1_1(<4 x i1> %vec, i32 %elt.arg) { |
@@ -84,6 +114,9 @@ entry: |
; CHECK-LABEL: insertelement_v4i1_1: |
; CHECK: shufps |
; CHECK: shufps |
+ |
+; SSE41-LABEL: insertelement_v4i1_1: |
+; SSE41: pinsrd {{.*}}, {{.*}}, 1 |
} |
define <8 x i1> @insertelement_v8i1(<8 x i1> %vec, i32 %elt.arg) { |
@@ -93,6 +126,9 @@ entry: |
ret <8 x i1> %res |
; CHECK-LABEL: insertelement_v8i1: |
; CHECK: pinsrw |
+ |
+; SSE41-LABEL: insertelement_v8i1: |
+; SSE41: pinsrw |
} |
define <16 x i1> @insertelement_v16i1(<16 x i1> %vec, i32 %elt.arg) { |
@@ -104,6 +140,9 @@ entry: |
; CHECK: movups |
; CHECK: lea |
; CHECK: mov |
+ |
+; SSE41-LABEL: insertelement_v16i1: |
+; SSE41: pinsrb |
} |
; extractelement operations |
@@ -114,6 +153,9 @@ entry: |
ret float %res |
; CHECK-LABEL: extractelement_v4f32: |
; CHECK: pshufd |
+ |
+; SSE41-LABEL: extractelement_v4f32: |
+; SSE41: pshufd |
} |
define i32 @extractelement_v4i32(<4 x i32> %vec) { |
@@ -122,6 +164,9 @@ entry: |
ret i32 %res |
; CHECK-LABEL: extractelement_v4i32: |
; CHECK: pshufd |
+ |
+; SSE41-LABEL: extractelement_v4i32: |
+; SSE41: pextrd |
} |
define i32 @extractelement_v8i16(<8 x i16> %vec) { |
@@ -131,6 +176,9 @@ entry: |
ret i32 %res.ext |
; CHECK-LABEL: extractelement_v8i16: |
; CHECK: pextrw |
+ |
+; SSE41-LABEL: extractelement_v8i16: |
+; SSE41: pextrw |
} |
define i32 @extractelement_v16i8(<16 x i8> %vec) { |
@@ -142,6 +190,9 @@ entry: |
; CHECK: movups |
; CHECK: lea |
; CHECK: mov |
+ |
+; SSE41-LABEL: extractelement_v16i8: |
+; SSE41: pextrb |
} |
define i32 @extractelement_v4i1(<4 x i1> %vec) { |
@@ -151,6 +202,9 @@ entry: |
ret i32 %res.ext |
; CHECK-LABEL: extractelement_v4i1: |
; CHECK: pshufd |
+ |
+; SSE41-LABEL: extractelement_v4i1: |
+; SSE41: pextrd |
} |
define i32 @extractelement_v8i1(<8 x i1> %vec) { |
@@ -160,6 +214,9 @@ entry: |
ret i32 %res.ext |
; CHECK-LABEL: extractelement_v8i1: |
; CHECK: pextrw |
+ |
+; SSE41-LABEL: extractelement_v8i1: |
+; SSE41: pextrw |
} |
define i32 @extractelement_v16i1(<16 x i1> %vec) { |
@@ -171,6 +228,9 @@ entry: |
; CHECK: movups |
; CHECK: lea |
; CHECK: mov |
+ |
+; SSE41-LABEL: extractelement_v16i1: |
+; SSE41: pextrb |
} |
; ERRORS-NOT: ICE translation error |