| Index: tests_lit/llvm2ice_tests/nop-insertion.ll
|
| diff --git a/tests_lit/llvm2ice_tests/nop-insertion.ll b/tests_lit/llvm2ice_tests/nop-insertion.ll
|
| index 160d9336214a50e0acab40f8c987651e2d90e457..785ef486ab887b20b3536dabef8b1f7e57f876e0 100644
|
| --- a/tests_lit/llvm2ice_tests/nop-insertion.ll
|
| +++ b/tests_lit/llvm2ice_tests/nop-insertion.ll
|
| @@ -25,106 +25,112 @@ entry:
|
| ret <4 x i32> %res
|
|
|
| ; PROB50-LABEL: mul_v4i32
|
| -; PROB50: nop # variant = 4
|
| +; PROB50: nop # variant = 1
|
| ; PROB50: subl $60, %esp
|
| +; PROB50: nop # variant = 3
|
| ; PROB50: movups %xmm0, 32(%esp)
|
| -; PROB50: nop # variant = 0
|
| ; PROB50: movups %xmm1, 16(%esp)
|
| -; PROB50: nop # variant = 4
|
| ; PROB50: movups 32(%esp), %xmm0
|
| +; PROB50: nop # variant = 1
|
| ; PROB50: pshufd $49, 32(%esp), %xmm1
|
| +; PROB50: nop # variant = 4
|
| ; PROB50: pshufd $49, 16(%esp), %xmm2
|
| +; PROB50: nop # variant = 1
|
| ; PROB50: pmuludq 16(%esp), %xmm0
|
| -; PROB50: nop # variant = 0
|
| ; PROB50: pmuludq %xmm2, %xmm1
|
| +; PROB50: nop # variant = 0
|
| ; PROB50: shufps $136, %xmm1, %xmm0
|
| -; PROB50: nop # variant = 2
|
| +; PROB50: nop # variant = 3
|
| ; PROB50: pshufd $216, %xmm0, %xmm0
|
| +; PROB50: nop # variant = 1
|
| ; PROB50: movups %xmm0, (%esp)
|
| ; PROB50: movups (%esp), %xmm0
|
| -; PROB50: nop # variant = 0
|
| ; PROB50: addl $60, %esp
|
| -; PROB50: nop # variant = 3
|
| ; PROB50: ret
|
|
|
| ; PROB90-LABEL: mul_v4i32
|
| -; PROB90: nop # variant = 4
|
| +; PROB90: nop # variant = 1
|
| ; PROB90: subl $60, %esp
|
| ; PROB90: nop # variant = 3
|
| ; PROB90: movups %xmm0, 32(%esp)
|
| -; PROB90: nop # variant = 2
|
| +; PROB90: nop # variant = 4
|
| ; PROB90: movups %xmm1, 16(%esp)
|
| -; PROB90: nop # variant = 3
|
| +; PROB90: nop # variant = 1
|
| ; PROB90: movups 32(%esp), %xmm0
|
| ; PROB90: nop # variant = 4
|
| ; PROB90: pshufd $49, 32(%esp), %xmm1
|
| -; PROB90: nop # variant = 0
|
| +; PROB90: nop # variant = 1
|
| ; PROB90: pshufd $49, 16(%esp), %xmm2
|
| -; PROB90: nop # variant = 2
|
| +; PROB90: nop # variant = 4
|
| ; PROB90: pmuludq 16(%esp), %xmm0
|
| -; PROB90: nop # variant = 3
|
| +; PROB90: nop # variant = 2
|
| ; PROB90: pmuludq %xmm2, %xmm1
|
| -; PROB90: nop # variant = 4
|
| ; PROB90: shufps $136, %xmm1, %xmm0
|
| -; PROB90: nop # variant = 2
|
| +; PROB90: nop # variant = 1
|
| ; PROB90: pshufd $216, %xmm0, %xmm0
|
| -; PROB90: nop # variant = 4
|
| ; PROB90: movups %xmm0, (%esp)
|
| -; PROB90: nop # variant = 2
|
| +; PROB90: nop # variant = 1
|
| ; PROB90: movups (%esp), %xmm0
|
| -; PROB90: nop # variant = 3
|
| +; PROB90: nop # variant = 0
|
| ; PROB90: addl $60, %esp
|
| -; PROB90: nop # variant = 3
|
| +; PROB90: nop # variant = 0
|
| ; PROB90: ret
|
| +; PROB90: nop # variant = 4
|
|
|
| ; MAXNOPS2-LABEL: mul_v4i32
|
| -; MAXNOPS2: nop # variant = 4
|
| +; MAXNOPS2: nop # variant = 1
|
| +; MAXNOPS2: nop # variant = 3
|
| ; MAXNOPS2: subl $60, %esp
|
| -; MAXNOPS2: nop # variant = 0
|
| -; MAXNOPS2: nop # variant = 4
|
| ; MAXNOPS2: movups %xmm0, 32(%esp)
|
| +; MAXNOPS2: nop # variant = 1
|
| +; MAXNOPS2: nop # variant = 4
|
| ; MAXNOPS2: movups %xmm1, 16(%esp)
|
| -; MAXNOPS2: nop # variant = 0
|
| +; MAXNOPS2: nop # variant = 1
|
| ; MAXNOPS2: movups 32(%esp), %xmm0
|
| -; MAXNOPS2: nop # variant = 2
|
| -; MAXNOPS2: pshufd $49, 32(%esp), %xmm1
|
| -; MAXNOPS2: pshufd $49, 16(%esp), %xmm2
|
| ; MAXNOPS2: nop # variant = 0
|
| ; MAXNOPS2: nop # variant = 3
|
| +; MAXNOPS2: pshufd $49, 32(%esp), %xmm1
|
| +; MAXNOPS2: nop # variant = 1
|
| +; MAXNOPS2: pshufd $49, 16(%esp), %xmm2
|
| ; MAXNOPS2: pmuludq 16(%esp), %xmm0
|
| ; MAXNOPS2: pmuludq %xmm2, %xmm1
|
| +; MAXNOPS2: nop # variant = 0
|
| ; MAXNOPS2: shufps $136, %xmm1, %xmm0
|
| -; MAXNOPS2: nop # variant = 3
|
| -; MAXNOPS2: pshufd $216, %xmm0, %xmm0
|
| ; MAXNOPS2: nop # variant = 0
|
| +; MAXNOPS2: nop # variant = 0
|
| +; MAXNOPS2: pshufd $216, %xmm0, %xmm0
|
| +; MAXNOPS2: nop # variant = 1
|
| +; MAXNOPS2: nop # variant = 3
|
| ; MAXNOPS2: movups %xmm0, (%esp)
|
| -; MAXNOPS2: nop # variant = 2
|
| +; MAXNOPS2: nop # variant = 3
|
| ; MAXNOPS2: movups (%esp), %xmm0
|
| -; MAXNOPS2: nop # variant = 4
|
| ; MAXNOPS2: addl $60, %esp
|
| +; MAXNOPS2: nop # variant = 3
|
| ; MAXNOPS2: ret
|
|
|
| +
|
| ; SANDBOX50-LABEL: mul_v4i32
|
| -; SANDBOX50: nop # variant = 4
|
| +; SANDBOX50: nop # variant = 1
|
| ; SANDBOX50: subl $60, %esp
|
| +; SANDBOX50: nop # variant = 3
|
| ; SANDBOX50: movups %xmm0, 32(%esp)
|
| -; SANDBOX50: nop # variant = 0
|
| ; SANDBOX50: movups %xmm1, 16(%esp)
|
| -; SANDBOX50: nop # variant = 4
|
| ; SANDBOX50: movups 32(%esp), %xmm0
|
| +; SANDBOX50: nop # variant = 1
|
| ; SANDBOX50: pshufd $49, 32(%esp), %xmm1
|
| +; SANDBOX50: nop # variant = 4
|
| ; SANDBOX50: pshufd $49, 16(%esp), %xmm2
|
| +; SANDBOX50: nop # variant = 1
|
| ; SANDBOX50: pmuludq 16(%esp), %xmm0
|
| -; SANDBOX50: nop # variant = 0
|
| ; SANDBOX50: pmuludq %xmm2, %xmm1
|
| +; SANDBOX50: nop # variant = 0
|
| ; SANDBOX50: shufps $136, %xmm1, %xmm0
|
| -; SANDBOX50: nop # variant = 2
|
| +; SANDBOX50: nop # variant = 3
|
| ; SANDBOX50: pshufd $216, %xmm0, %xmm0
|
| +; SANDBOX50: nop # variant = 1
|
| ; SANDBOX50: movups %xmm0, (%esp)
|
| ; SANDBOX50: movups (%esp), %xmm0
|
| -; SANDBOX50: nop # variant = 0
|
| ; SANDBOX50: addl $60, %esp
|
| -; SANDBOX50: nop # variant = 3
|
| ; SANDBOX50: pop %ecx
|
| ; SANDBOX50: .bundle_lock
|
| ; SANDBOX50: andl $-32, %ecx
|
|
|