| Index: tests_lit/llvm2ice_tests/vector-fcmp.ll
|
| diff --git a/tests_lit/llvm2ice_tests/vector-fcmp.ll b/tests_lit/llvm2ice_tests/vector-fcmp.ll
|
| new file mode 100644
|
| index 0000000000000000000000000000000000000000..7fb717a282830a879d1c4802710d1706eb8fa711
|
| --- /dev/null
|
| +++ b/tests_lit/llvm2ice_tests/vector-fcmp.ll
|
| @@ -0,0 +1,178 @@
|
| +; This file checks support for comparing vector values with the fcmp
|
| +; instruction.
|
| +
|
| +; RUN: %llvm2ice -O2 --verbose none %s | FileCheck %s
|
| +; RUN: %llvm2ice -Om1 --verbose none %s | FileCheck %s
|
| +; RUN: %llvm2ice -O2 --verbose none %s \
|
| +; RUN: | llvm-mc -arch=x86 -x86-asm-syntax=intel -filetype=obj
|
| +; RUN: %llvm2ice -Om1 --verbose none %s \
|
| +; RUN: | llvm-mc -arch=x86 -x86-asm-syntax=intel -filetype=obj
|
| +; RUN: %llvm2ice --verbose none %s | FileCheck --check-prefix=ERRORS %s
|
| +; RUN: %llvm2iceinsts %s | %szdiff %s | FileCheck --check-prefix=DUMP %s
|
| +; RUN: %llvm2iceinsts --pnacl %s | %szdiff %s \
|
| +; RUN: | FileCheck --check-prefix=DUMP %s
|
| +
|
| +; Check that sext elimination occurs when the result of the comparison
|
| +; instruction is alrady sign extended. Sign extension to 4 x i32 uses
|
| +; the pslld instruction.
|
| +define <4 x i32> @sextElimination(<4 x float> %a, <4 x float> %b) {
|
| +entry:
|
| + %res.trunc = fcmp oeq <4 x float> %a, %b
|
| + %res = sext <4 x i1> %res.trunc to <4 x i32>
|
| + ret <4 x i32> %res
|
| +; CHECK-LABEL: sextElimination:
|
| +; CHECK: cmpeqps
|
| +; CHECK-NOT: pslld
|
| +}
|
| +
|
| +define <4 x i32> @fcmpFalseVector(<4 x float> %a, <4 x float> %b) {
|
| +entry:
|
| + %res.trunc = fcmp false <4 x float> %a, %b
|
| + %res = sext <4 x i1> %res.trunc to <4 x i32>
|
| + ret <4 x i32> %res
|
| +; CHECK-LABEL: fcmpFalseVector:
|
| +; CHECK: pxor
|
| +}
|
| +
|
| +define <4 x i32> @fcmpOeqVector(<4 x float> %a, <4 x float> %b) {
|
| +entry:
|
| + %res.trunc = fcmp oeq <4 x float> %a, %b
|
| + %res = sext <4 x i1> %res.trunc to <4 x i32>
|
| + ret <4 x i32> %res
|
| +; CHECK-LABEL: fcmpOeqVector:
|
| +; CHECK: cmpeqps
|
| +}
|
| +
|
| +define <4 x i32> @fcmpOgeVector(<4 x float> %a, <4 x float> %b) {
|
| +entry:
|
| + %res.trunc = fcmp oge <4 x float> %a, %b
|
| + %res = sext <4 x i1> %res.trunc to <4 x i32>
|
| + ret <4 x i32> %res
|
| +; CHECK-LABEL: fcmpOgeVector:
|
| +; CHECK: cmpleps
|
| +}
|
| +
|
| +define <4 x i32> @fcmpOgtVector(<4 x float> %a, <4 x float> %b) {
|
| +entry:
|
| + %res.trunc = fcmp ogt <4 x float> %a, %b
|
| + %res = sext <4 x i1> %res.trunc to <4 x i32>
|
| + ret <4 x i32> %res
|
| +; CHECK-LABEL: fcmpOgtVector:
|
| +; CHECK: cmpltps
|
| +}
|
| +
|
| +define <4 x i32> @fcmpOleVector(<4 x float> %a, <4 x float> %b) {
|
| +entry:
|
| + %res.trunc = fcmp ole <4 x float> %a, %b
|
| + %res = sext <4 x i1> %res.trunc to <4 x i32>
|
| + ret <4 x i32> %res
|
| +; CHECK-LABEL: fcmpOleVector:
|
| +; CHECK: cmpleps
|
| +}
|
| +
|
| +define <4 x i32> @fcmpOltVector(<4 x float> %a, <4 x float> %b) {
|
| +entry:
|
| + %res.trunc = fcmp olt <4 x float> %a, %b
|
| + %res = sext <4 x i1> %res.trunc to <4 x i32>
|
| + ret <4 x i32> %res
|
| +; CHECK-LABEL: fcmpOltVector:
|
| +; CHECK: cmpltps
|
| +}
|
| +
|
| +define <4 x i32> @fcmpOneVector(<4 x float> %a, <4 x float> %b) {
|
| +entry:
|
| + %res.trunc = fcmp one <4 x float> %a, %b
|
| + %res = sext <4 x i1> %res.trunc to <4 x i32>
|
| + ret <4 x i32> %res
|
| +; CHECK-LABEL: fcmpOneVector:
|
| +; CHECK: cmpneqps
|
| +; CHECK: cmpordps
|
| +; CHECK: pand
|
| +}
|
| +
|
| +define <4 x i32> @fcmpOrdVector(<4 x float> %a, <4 x float> %b) {
|
| +entry:
|
| + %res.trunc = fcmp ord <4 x float> %a, %b
|
| + %res = sext <4 x i1> %res.trunc to <4 x i32>
|
| + ret <4 x i32> %res
|
| +; CHECK-LABEL: fcmpOrdVector:
|
| +; CHECK: cmpordps
|
| +}
|
| +
|
| +define <4 x i32> @fcmpTrueVector(<4 x float> %a, <4 x float> %b) {
|
| +entry:
|
| + %res.trunc = fcmp true <4 x float> %a, %b
|
| + %res = sext <4 x i1> %res.trunc to <4 x i32>
|
| + ret <4 x i32> %res
|
| +; CHECK-LABEL: fcmpTrueVector:
|
| +; CHECK: pcmpeqd
|
| +}
|
| +
|
| +define <4 x i32> @fcmpUeqVector(<4 x float> %a, <4 x float> %b) {
|
| +entry:
|
| + %res.trunc = fcmp ueq <4 x float> %a, %b
|
| + %res = sext <4 x i1> %res.trunc to <4 x i32>
|
| + ret <4 x i32> %res
|
| +; CHECK-LABEL: fcmpUeqVector:
|
| +; CHECK: cmpeqps
|
| +; CHECK: cmpunordps
|
| +; CHECK: por
|
| +}
|
| +
|
| +define <4 x i32> @fcmpUgeVector(<4 x float> %a, <4 x float> %b) {
|
| +entry:
|
| + %res.trunc = fcmp uge <4 x float> %a, %b
|
| + %res = sext <4 x i1> %res.trunc to <4 x i32>
|
| + ret <4 x i32> %res
|
| +; CHECK-LABEL: fcmpUgeVector:
|
| +; CHECK: cmpnltps
|
| +}
|
| +
|
| +define <4 x i32> @fcmpUgtVector(<4 x float> %a, <4 x float> %b) {
|
| +entry:
|
| + %res.trunc = fcmp ugt <4 x float> %a, %b
|
| + %res = sext <4 x i1> %res.trunc to <4 x i32>
|
| + ret <4 x i32> %res
|
| +; CHECK-LABEL: fcmpUgtVector:
|
| +; CHECK: cmpnleps
|
| +}
|
| +
|
| +define <4 x i32> @fcmpUleVector(<4 x float> %a, <4 x float> %b) {
|
| +entry:
|
| + %res.trunc = fcmp ule <4 x float> %a, %b
|
| + %res = sext <4 x i1> %res.trunc to <4 x i32>
|
| + ret <4 x i32> %res
|
| +; CHECK-LABEL: fcmpUleVector:
|
| +; CHECK: cmpnltps
|
| +}
|
| +
|
| +define <4 x i32> @fcmpUltVector(<4 x float> %a, <4 x float> %b) {
|
| +entry:
|
| + %res.trunc = fcmp ult <4 x float> %a, %b
|
| + %res = sext <4 x i1> %res.trunc to <4 x i32>
|
| + ret <4 x i32> %res
|
| +; CHECK-LABEL: fcmpUltVector:
|
| +; CHECK: cmpnleps
|
| +}
|
| +
|
| +define <4 x i32> @fcmpUneVector(<4 x float> %a, <4 x float> %b) {
|
| +entry:
|
| + %res.trunc = fcmp une <4 x float> %a, %b
|
| + %res = sext <4 x i1> %res.trunc to <4 x i32>
|
| + ret <4 x i32> %res
|
| +; CHECK-LABEL: fcmpUneVector:
|
| +; CHECK: cmpneqps
|
| +}
|
| +
|
| +define <4 x i32> @fcmpUnoVector(<4 x float> %a, <4 x float> %b) {
|
| +entry:
|
| + %res.trunc = fcmp uno <4 x float> %a, %b
|
| + %res = sext <4 x i1> %res.trunc to <4 x i32>
|
| + ret <4 x i32> %res
|
| +; CHECK-LABEL: fcmpUnoVector:
|
| +; CHECK: cmpunordps
|
| +}
|
| +
|
| +; ERRORS-NOT: ICE translation error
|
| +; DUMP-NOT: SZ
|
| +
|
|
|