OLD | NEW |
1 ; This file checks support for address mode optimization. | 1 ; This file checks support for address mode optimization. |
2 | 2 |
3 ; RUN: %p2i -i %s --args -O2 --verbose none \ | 3 ; RUN: %p2i --assemble --disassemble -i %s --args -O2 --verbose none \ |
4 ; RUN: | llvm-mc -triple=i686-none-nacl -filetype=obj \ | 4 ; RUN: | FileCheck %s |
5 ; RUN: | llvm-objdump -d --symbolize -x86-asm-syntax=intel - | FileCheck %s | 5 ; RUN: %p2i --assemble --disassemble -i %s --args -O2 -mattr=sse4.1 \ |
6 ; RUN: %p2i -i %s --args -O2 -mattr=sse4.1 --verbose none \ | 6 ; RUN: --verbose none | FileCheck --check-prefix=SSE41 %s |
7 ; RUN: | llvm-mc -triple=i686-none-nacl -filetype=obj \ | |
8 ; RUN: | llvm-objdump -d --symbolize -x86-asm-syntax=intel - \ | |
9 ; RUN: | FileCheck --check-prefix=SSE41 %s | |
10 | 7 |
11 define float @load_arg_plus_200000(float* %arg) { | 8 define float @load_arg_plus_200000(float* %arg) { |
12 entry: | 9 entry: |
13 %arg.int = ptrtoint float* %arg to i32 | 10 %arg.int = ptrtoint float* %arg to i32 |
14 %addr.int = add i32 %arg.int, 200000 | 11 %addr.int = add i32 %arg.int, 200000 |
15 %addr.ptr = inttoptr i32 %addr.int to float* | 12 %addr.ptr = inttoptr i32 %addr.int to float* |
16 %addr.load = load float* %addr.ptr, align 4 | 13 %addr.load = load float* %addr.ptr, align 4 |
17 ret float %addr.load | 14 ret float %addr.load |
18 ; CHECK-LABEL: load_arg_plus_200000: | 15 ; CHECK-LABEL: load_arg_plus_200000 |
19 ; CHECK: movss xmm0, dword ptr [eax + 200000] | 16 ; CHECK: movss xmm0,DWORD ptr [eax+200000] |
20 } | 17 } |
21 | 18 |
22 define float @load_200000_plus_arg(float* %arg) { | 19 define float @load_200000_plus_arg(float* %arg) { |
23 entry: | 20 entry: |
24 %arg.int = ptrtoint float* %arg to i32 | 21 %arg.int = ptrtoint float* %arg to i32 |
25 %addr.int = add i32 200000, %arg.int | 22 %addr.int = add i32 200000, %arg.int |
26 %addr.ptr = inttoptr i32 %addr.int to float* | 23 %addr.ptr = inttoptr i32 %addr.int to float* |
27 %addr.load = load float* %addr.ptr, align 4 | 24 %addr.load = load float* %addr.ptr, align 4 |
28 ret float %addr.load | 25 ret float %addr.load |
29 ; CHECK-LABEL: load_200000_plus_arg: | 26 ; CHECK-LABEL: load_200000_plus_arg |
30 ; CHECK: movss xmm0, dword ptr [eax + 200000] | 27 ; CHECK: movss xmm0,DWORD ptr [eax+200000] |
31 } | 28 } |
32 | 29 |
33 define float @load_arg_minus_200000(float* %arg) { | 30 define float @load_arg_minus_200000(float* %arg) { |
34 entry: | 31 entry: |
35 %arg.int = ptrtoint float* %arg to i32 | 32 %arg.int = ptrtoint float* %arg to i32 |
36 %addr.int = sub i32 %arg.int, 200000 | 33 %addr.int = sub i32 %arg.int, 200000 |
37 %addr.ptr = inttoptr i32 %addr.int to float* | 34 %addr.ptr = inttoptr i32 %addr.int to float* |
38 %addr.load = load float* %addr.ptr, align 4 | 35 %addr.load = load float* %addr.ptr, align 4 |
39 ret float %addr.load | 36 ret float %addr.load |
40 ; CHECK-LABEL: load_arg_minus_200000: | 37 ; CHECK-LABEL: load_arg_minus_200000 |
41 ; CHECK: movss xmm0, dword ptr [eax - 200000] | 38 ; CHECK: movss xmm0,DWORD ptr [eax-200000] |
42 } | 39 } |
43 | 40 |
44 define float @load_200000_minus_arg(float* %arg) { | 41 define float @load_200000_minus_arg(float* %arg) { |
45 entry: | 42 entry: |
46 %arg.int = ptrtoint float* %arg to i32 | 43 %arg.int = ptrtoint float* %arg to i32 |
47 %addr.int = sub i32 200000, %arg.int | 44 %addr.int = sub i32 200000, %arg.int |
48 %addr.ptr = inttoptr i32 %addr.int to float* | 45 %addr.ptr = inttoptr i32 %addr.int to float* |
49 %addr.load = load float* %addr.ptr, align 4 | 46 %addr.load = load float* %addr.ptr, align 4 |
50 ret float %addr.load | 47 ret float %addr.load |
51 ; CHECK-LABEL: load_200000_minus_arg: | 48 ; CHECK-LABEL: load_200000_minus_arg |
52 ; CHECK: movss xmm0, dword ptr [e{{..}}] | 49 ; CHECK: movss xmm0,DWORD ptr [e{{..}}] |
53 } | 50 } |
54 | 51 |
55 define <8 x i16> @load_mul_v8i16_mem(<8 x i16> %arg0, i32 %arg1_iptr) { | 52 define <8 x i16> @load_mul_v8i16_mem(<8 x i16> %arg0, i32 %arg1_iptr) { |
56 entry: | 53 entry: |
57 %addr_sub = sub i32 %arg1_iptr, 200000 | 54 %addr_sub = sub i32 %arg1_iptr, 200000 |
58 %addr_ptr = inttoptr i32 %addr_sub to <8 x i16>* | 55 %addr_ptr = inttoptr i32 %addr_sub to <8 x i16>* |
59 %arg1 = load <8 x i16>* %addr_ptr, align 2 | 56 %arg1 = load <8 x i16>* %addr_ptr, align 2 |
60 %res_vec = mul <8 x i16> %arg0, %arg1 | 57 %res_vec = mul <8 x i16> %arg0, %arg1 |
61 ret <8 x i16> %res_vec | 58 ret <8 x i16> %res_vec |
62 ; CHECK-LABEL: load_mul_v8i16_mem: | 59 ; CHECK-LABEL: load_mul_v8i16_mem |
63 ; CHECK: pmullw xmm{{.*}}, xmmword ptr [e{{.*}} - 200000] | 60 ; CHECK: pmullw xmm{{.*}}, XMMWORD PTR [e{{.*}}-200000] |
64 } | 61 } |
65 | 62 |
66 define <4 x i32> @load_mul_v4i32_mem(<4 x i32> %arg0, i32 %arg1_iptr) { | 63 define <4 x i32> @load_mul_v4i32_mem(<4 x i32> %arg0, i32 %arg1_iptr) { |
67 entry: | 64 entry: |
68 %addr_sub = sub i32 %arg1_iptr, 200000 | 65 %addr_sub = sub i32 %arg1_iptr, 200000 |
69 %addr_ptr = inttoptr i32 %addr_sub to <4 x i32>* | 66 %addr_ptr = inttoptr i32 %addr_sub to <4 x i32>* |
70 %arg1 = load <4 x i32>* %addr_ptr, align 4 | 67 %arg1 = load <4 x i32>* %addr_ptr, align 4 |
71 %res = mul <4 x i32> %arg0, %arg1 | 68 %res = mul <4 x i32> %arg0, %arg1 |
72 ret <4 x i32> %res | 69 ret <4 x i32> %res |
73 ; CHECK-LABEL: load_mul_v4i32_mem: | 70 ; CHECK-LABEL: load_mul_v4i32_mem |
74 ; CHECK: pmuludq xmm{{.*}}, xmmword ptr [e{{.*}} - 200000] | 71 ; CHECK: pmuludq xmm{{.*}}, XMMWORD PTR [e{{.*}}-200000] |
75 ; CHECK: pmuludq | 72 ; CHECK: pmuludq |
76 ; | 73 ; |
77 ; SSE41-LABEL: load_mul_v4i32_mem: | 74 ; SSE41-LABEL: load_mul_v4i32_mem |
78 ; SSE41: pmulld xmm{{.*}}, xmmword ptr [e{{.*}} - 200000] | 75 ; SSE41: pmulld xmm{{.*}}, XMMWORD PTR [e{{.*}} - 200000] |
79 } | 76 } |
80 | 77 |
81 define float @address_mode_opt_chaining(float* %arg) { | 78 define float @address_mode_opt_chaining(float* %arg) { |
82 entry: | 79 entry: |
83 %arg.int = ptrtoint float* %arg to i32 | 80 %arg.int = ptrtoint float* %arg to i32 |
84 %addr1.int = add i32 12, %arg.int | 81 %addr1.int = add i32 12, %arg.int |
85 %addr2.int = sub i32 %addr1.int, 4 | 82 %addr2.int = sub i32 %addr1.int, 4 |
86 %addr2.ptr = inttoptr i32 %addr2.int to float* | 83 %addr2.ptr = inttoptr i32 %addr2.int to float* |
87 %addr2.load = load float* %addr2.ptr, align 4 | 84 %addr2.load = load float* %addr2.ptr, align 4 |
88 ret float %addr2.load | 85 ret float %addr2.load |
89 ; CHECK-LABEL: address_mode_opt_chaining: | 86 ; CHECK-LABEL: address_mode_opt_chaining |
90 ; CHECK: movss xmm0, dword ptr [eax + 8] | 87 ; CHECK: movss xmm0,DWORD ptr [eax+8] |
91 } | 88 } |
92 | 89 |
93 define float @address_mode_opt_chaining_overflow(float* %arg) { | 90 define float @address_mode_opt_chaining_overflow(float* %arg) { |
94 entry: | 91 entry: |
95 %arg.int = ptrtoint float* %arg to i32 | 92 %arg.int = ptrtoint float* %arg to i32 |
96 %addr1.int = add i32 2147483640, %arg.int | 93 %addr1.int = add i32 2147483640, %arg.int |
97 %addr2.int = add i32 %addr1.int, 2147483643 | 94 %addr2.int = add i32 %addr1.int, 2147483643 |
98 %addr2.ptr = inttoptr i32 %addr2.int to float* | 95 %addr2.ptr = inttoptr i32 %addr2.int to float* |
99 %addr2.load = load float* %addr2.ptr, align 4 | 96 %addr2.load = load float* %addr2.ptr, align 4 |
100 ret float %addr2.load | 97 ret float %addr2.load |
101 ; CHECK-LABEL: address_mode_opt_chaining_overflow: | 98 ; CHECK-LABEL: address_mode_opt_chaining_overflow |
102 ; CHECK: 2147483640 | 99 ; CHECK: 2147483640 |
103 ; CHECK: movss xmm0, dword ptr [{{.*}} + 2147483643] | 100 ; CHECK: movss xmm0,DWORD ptr [{{.*}}+2147483643] |
104 } | 101 } |
105 | 102 |
106 define float @address_mode_opt_chaining_overflow_sub(float* %arg) { | 103 define float @address_mode_opt_chaining_overflow_sub(float* %arg) { |
107 entry: | 104 entry: |
108 %arg.int = ptrtoint float* %arg to i32 | 105 %arg.int = ptrtoint float* %arg to i32 |
109 %addr1.int = sub i32 %arg.int, 2147483640 | 106 %addr1.int = sub i32 %arg.int, 2147483640 |
110 %addr2.int = sub i32 %addr1.int, 2147483643 | 107 %addr2.int = sub i32 %addr1.int, 2147483643 |
111 %addr2.ptr = inttoptr i32 %addr2.int to float* | 108 %addr2.ptr = inttoptr i32 %addr2.int to float* |
112 %addr2.load = load float* %addr2.ptr, align 4 | 109 %addr2.load = load float* %addr2.ptr, align 4 |
113 ret float %addr2.load | 110 ret float %addr2.load |
114 ; CHECK-LABEL: address_mode_opt_chaining_overflow_sub: | 111 ; CHECK-LABEL: address_mode_opt_chaining_overflow_sub |
115 ; CHECK: 2147483640 | 112 ; CHECK: 2147483640 |
116 ; CHECK: movss xmm0, dword ptr [{{.*}} - 2147483643] | 113 ; CHECK: movss xmm0,DWORD ptr [{{.*}}-2147483643] |
117 } | 114 } |
118 | 115 |
119 define float @address_mode_opt_chaining_no_overflow(float* %arg) { | 116 define float @address_mode_opt_chaining_no_overflow(float* %arg) { |
120 entry: | 117 entry: |
121 %arg.int = ptrtoint float* %arg to i32 | 118 %arg.int = ptrtoint float* %arg to i32 |
122 %addr1.int = sub i32 %arg.int, 2147483640 | 119 %addr1.int = sub i32 %arg.int, 2147483640 |
123 %addr2.int = add i32 %addr1.int, 2147483643 | 120 %addr2.int = add i32 %addr1.int, 2147483643 |
124 %addr2.ptr = inttoptr i32 %addr2.int to float* | 121 %addr2.ptr = inttoptr i32 %addr2.int to float* |
125 %addr2.load = load float* %addr2.ptr, align 4 | 122 %addr2.load = load float* %addr2.ptr, align 4 |
126 ret float %addr2.load | 123 ret float %addr2.load |
127 ; CHECK-LABEL: address_mode_opt_chaining_no_overflow: | 124 ; CHECK-LABEL: address_mode_opt_chaining_no_overflow |
128 ; CHECK: movss xmm0, dword ptr [{{.*}} + 3] | 125 ; CHECK: movss xmm0,DWORD ptr [{{.*}}+3] |
129 } | 126 } |
130 | 127 |
131 define float @address_mode_opt_add_pos_min_int(float* %arg) { | 128 define float @address_mode_opt_add_pos_min_int(float* %arg) { |
132 entry: | 129 entry: |
133 %arg.int = ptrtoint float* %arg to i32 | 130 %arg.int = ptrtoint float* %arg to i32 |
134 %addr1.int = add i32 %arg.int, 2147483648 | 131 %addr1.int = add i32 %arg.int, 2147483648 |
135 %addr1.ptr = inttoptr i32 %addr1.int to float* | 132 %addr1.ptr = inttoptr i32 %addr1.int to float* |
136 %addr1.load = load float* %addr1.ptr, align 4 | 133 %addr1.load = load float* %addr1.ptr, align 4 |
137 ret float %addr1.load | 134 ret float %addr1.load |
138 ; CHECK-LABEL: address_mode_opt_add_pos_min_int: | 135 ; CHECK-LABEL: address_mode_opt_add_pos_min_int |
139 ; CHECK: movss xmm0, dword ptr [{{.*}} - 2147483648] | 136 ; CHECK: movss xmm0,DWORD ptr [{{.*}}-2147483648] |
140 } | 137 } |
141 | 138 |
142 define float @address_mode_opt_sub_min_int(float* %arg) { | 139 define float @address_mode_opt_sub_min_int(float* %arg) { |
143 entry: | 140 entry: |
144 %arg.int = ptrtoint float* %arg to i32 | 141 %arg.int = ptrtoint float* %arg to i32 |
145 %addr1.int = sub i32 %arg.int, 2147483648 | 142 %addr1.int = sub i32 %arg.int, 2147483648 |
146 %addr1.ptr = inttoptr i32 %addr1.int to float* | 143 %addr1.ptr = inttoptr i32 %addr1.int to float* |
147 %addr1.load = load float* %addr1.ptr, align 4 | 144 %addr1.load = load float* %addr1.ptr, align 4 |
148 ret float %addr1.load | 145 ret float %addr1.load |
149 ; CHECK-LABEL: address_mode_opt_sub_min_int: | 146 ; CHECK-LABEL: address_mode_opt_sub_min_int |
150 ; CHECK: movss xmm0, dword ptr [{{.*}} - 2147483648] | 147 ; CHECK: movss xmm0,DWORD ptr [{{.*}}-2147483648] |
151 } | 148 } |
OLD | NEW |