| OLD | NEW |
| 1 ; This file checks support for address mode optimization. | 1 ; This file checks support for address mode optimization. |
| 2 | 2 |
| 3 ; RUN: %p2i -i %s --args -O2 --verbose none \ | 3 ; RUN: %p2i --assemble --disassemble -i %s --args -O2 --verbose none \ |
| 4 ; RUN: | llvm-mc -triple=i686-none-nacl -filetype=obj \ | 4 ; RUN: | FileCheck %s |
| 5 ; RUN: | llvm-objdump -d --symbolize -x86-asm-syntax=intel - | FileCheck %s | 5 ; RUN: %p2i --assemble --disassemble -i %s --args -O2 -mattr=sse4.1 \ |
| 6 ; RUN: %p2i -i %s --args -O2 -mattr=sse4.1 --verbose none \ | 6 ; RUN: --verbose none | FileCheck --check-prefix=SSE41 %s |
| 7 ; RUN: | llvm-mc -triple=i686-none-nacl -filetype=obj \ | |
| 8 ; RUN: | llvm-objdump -d --symbolize -x86-asm-syntax=intel - \ | |
| 9 ; RUN: | FileCheck --check-prefix=SSE41 %s | |
| 10 | 7 |
| 11 define float @load_arg_plus_200000(float* %arg) { | 8 define float @load_arg_plus_200000(float* %arg) { |
| 12 entry: | 9 entry: |
| 13 %arg.int = ptrtoint float* %arg to i32 | 10 %arg.int = ptrtoint float* %arg to i32 |
| 14 %addr.int = add i32 %arg.int, 200000 | 11 %addr.int = add i32 %arg.int, 200000 |
| 15 %addr.ptr = inttoptr i32 %addr.int to float* | 12 %addr.ptr = inttoptr i32 %addr.int to float* |
| 16 %addr.load = load float* %addr.ptr, align 4 | 13 %addr.load = load float* %addr.ptr, align 4 |
| 17 ret float %addr.load | 14 ret float %addr.load |
| 18 ; CHECK-LABEL: load_arg_plus_200000: | 15 ; CHECK-LABEL: load_arg_plus_200000 |
| 19 ; CHECK: movss xmm0, dword ptr [eax + 200000] | 16 ; CHECK: movss xmm0,DWORD ptr [eax+200000] |
| 20 } | 17 } |
| 21 | 18 |
| 22 define float @load_200000_plus_arg(float* %arg) { | 19 define float @load_200000_plus_arg(float* %arg) { |
| 23 entry: | 20 entry: |
| 24 %arg.int = ptrtoint float* %arg to i32 | 21 %arg.int = ptrtoint float* %arg to i32 |
| 25 %addr.int = add i32 200000, %arg.int | 22 %addr.int = add i32 200000, %arg.int |
| 26 %addr.ptr = inttoptr i32 %addr.int to float* | 23 %addr.ptr = inttoptr i32 %addr.int to float* |
| 27 %addr.load = load float* %addr.ptr, align 4 | 24 %addr.load = load float* %addr.ptr, align 4 |
| 28 ret float %addr.load | 25 ret float %addr.load |
| 29 ; CHECK-LABEL: load_200000_plus_arg: | 26 ; CHECK-LABEL: load_200000_plus_arg |
| 30 ; CHECK: movss xmm0, dword ptr [eax + 200000] | 27 ; CHECK: movss xmm0,DWORD ptr [eax+200000] |
| 31 } | 28 } |
| 32 | 29 |
| 33 define float @load_arg_minus_200000(float* %arg) { | 30 define float @load_arg_minus_200000(float* %arg) { |
| 34 entry: | 31 entry: |
| 35 %arg.int = ptrtoint float* %arg to i32 | 32 %arg.int = ptrtoint float* %arg to i32 |
| 36 %addr.int = sub i32 %arg.int, 200000 | 33 %addr.int = sub i32 %arg.int, 200000 |
| 37 %addr.ptr = inttoptr i32 %addr.int to float* | 34 %addr.ptr = inttoptr i32 %addr.int to float* |
| 38 %addr.load = load float* %addr.ptr, align 4 | 35 %addr.load = load float* %addr.ptr, align 4 |
| 39 ret float %addr.load | 36 ret float %addr.load |
| 40 ; CHECK-LABEL: load_arg_minus_200000: | 37 ; CHECK-LABEL: load_arg_minus_200000 |
| 41 ; CHECK: movss xmm0, dword ptr [eax - 200000] | 38 ; CHECK: movss xmm0,DWORD ptr [eax-200000] |
| 42 } | 39 } |
| 43 | 40 |
| 44 define float @load_200000_minus_arg(float* %arg) { | 41 define float @load_200000_minus_arg(float* %arg) { |
| 45 entry: | 42 entry: |
| 46 %arg.int = ptrtoint float* %arg to i32 | 43 %arg.int = ptrtoint float* %arg to i32 |
| 47 %addr.int = sub i32 200000, %arg.int | 44 %addr.int = sub i32 200000, %arg.int |
| 48 %addr.ptr = inttoptr i32 %addr.int to float* | 45 %addr.ptr = inttoptr i32 %addr.int to float* |
| 49 %addr.load = load float* %addr.ptr, align 4 | 46 %addr.load = load float* %addr.ptr, align 4 |
| 50 ret float %addr.load | 47 ret float %addr.load |
| 51 ; CHECK-LABEL: load_200000_minus_arg: | 48 ; CHECK-LABEL: load_200000_minus_arg |
| 52 ; CHECK: movss xmm0, dword ptr [e{{..}}] | 49 ; CHECK: movss xmm0,DWORD ptr [e{{..}}] |
| 53 } | 50 } |
| 54 | 51 |
| 55 define <8 x i16> @load_mul_v8i16_mem(<8 x i16> %arg0, i32 %arg1_iptr) { | 52 define <8 x i16> @load_mul_v8i16_mem(<8 x i16> %arg0, i32 %arg1_iptr) { |
| 56 entry: | 53 entry: |
| 57 %addr_sub = sub i32 %arg1_iptr, 200000 | 54 %addr_sub = sub i32 %arg1_iptr, 200000 |
| 58 %addr_ptr = inttoptr i32 %addr_sub to <8 x i16>* | 55 %addr_ptr = inttoptr i32 %addr_sub to <8 x i16>* |
| 59 %arg1 = load <8 x i16>* %addr_ptr, align 2 | 56 %arg1 = load <8 x i16>* %addr_ptr, align 2 |
| 60 %res_vec = mul <8 x i16> %arg0, %arg1 | 57 %res_vec = mul <8 x i16> %arg0, %arg1 |
| 61 ret <8 x i16> %res_vec | 58 ret <8 x i16> %res_vec |
| 62 ; CHECK-LABEL: load_mul_v8i16_mem: | 59 ; CHECK-LABEL: load_mul_v8i16_mem |
| 63 ; CHECK: pmullw xmm{{.*}}, xmmword ptr [e{{.*}} - 200000] | 60 ; CHECK: pmullw xmm{{.*}}, XMMWORD PTR [e{{.*}}-200000] |
| 64 } | 61 } |
| 65 | 62 |
| 66 define <4 x i32> @load_mul_v4i32_mem(<4 x i32> %arg0, i32 %arg1_iptr) { | 63 define <4 x i32> @load_mul_v4i32_mem(<4 x i32> %arg0, i32 %arg1_iptr) { |
| 67 entry: | 64 entry: |
| 68 %addr_sub = sub i32 %arg1_iptr, 200000 | 65 %addr_sub = sub i32 %arg1_iptr, 200000 |
| 69 %addr_ptr = inttoptr i32 %addr_sub to <4 x i32>* | 66 %addr_ptr = inttoptr i32 %addr_sub to <4 x i32>* |
| 70 %arg1 = load <4 x i32>* %addr_ptr, align 4 | 67 %arg1 = load <4 x i32>* %addr_ptr, align 4 |
| 71 %res = mul <4 x i32> %arg0, %arg1 | 68 %res = mul <4 x i32> %arg0, %arg1 |
| 72 ret <4 x i32> %res | 69 ret <4 x i32> %res |
| 73 ; CHECK-LABEL: load_mul_v4i32_mem: | 70 ; CHECK-LABEL: load_mul_v4i32_mem |
| 74 ; CHECK: pmuludq xmm{{.*}}, xmmword ptr [e{{.*}} - 200000] | 71 ; CHECK: pmuludq xmm{{.*}}, XMMWORD PTR [e{{.*}}-200000] |
| 75 ; CHECK: pmuludq | 72 ; CHECK: pmuludq |
| 76 ; | 73 ; |
| 77 ; SSE41-LABEL: load_mul_v4i32_mem: | 74 ; SSE41-LABEL: load_mul_v4i32_mem |
| 78 ; SSE41: pmulld xmm{{.*}}, xmmword ptr [e{{.*}} - 200000] | 75 ; SSE41: pmulld xmm{{.*}}, XMMWORD PTR [e{{.*}} - 200000] |
| 79 } | 76 } |
| 80 | 77 |
| 81 define float @address_mode_opt_chaining(float* %arg) { | 78 define float @address_mode_opt_chaining(float* %arg) { |
| 82 entry: | 79 entry: |
| 83 %arg.int = ptrtoint float* %arg to i32 | 80 %arg.int = ptrtoint float* %arg to i32 |
| 84 %addr1.int = add i32 12, %arg.int | 81 %addr1.int = add i32 12, %arg.int |
| 85 %addr2.int = sub i32 %addr1.int, 4 | 82 %addr2.int = sub i32 %addr1.int, 4 |
| 86 %addr2.ptr = inttoptr i32 %addr2.int to float* | 83 %addr2.ptr = inttoptr i32 %addr2.int to float* |
| 87 %addr2.load = load float* %addr2.ptr, align 4 | 84 %addr2.load = load float* %addr2.ptr, align 4 |
| 88 ret float %addr2.load | 85 ret float %addr2.load |
| 89 ; CHECK-LABEL: address_mode_opt_chaining: | 86 ; CHECK-LABEL: address_mode_opt_chaining |
| 90 ; CHECK: movss xmm0, dword ptr [eax + 8] | 87 ; CHECK: movss xmm0,DWORD ptr [eax+8] |
| 91 } | 88 } |
| 92 | 89 |
| 93 define float @address_mode_opt_chaining_overflow(float* %arg) { | 90 define float @address_mode_opt_chaining_overflow(float* %arg) { |
| 94 entry: | 91 entry: |
| 95 %arg.int = ptrtoint float* %arg to i32 | 92 %arg.int = ptrtoint float* %arg to i32 |
| 96 %addr1.int = add i32 2147483640, %arg.int | 93 %addr1.int = add i32 2147483640, %arg.int |
| 97 %addr2.int = add i32 %addr1.int, 2147483643 | 94 %addr2.int = add i32 %addr1.int, 2147483643 |
| 98 %addr2.ptr = inttoptr i32 %addr2.int to float* | 95 %addr2.ptr = inttoptr i32 %addr2.int to float* |
| 99 %addr2.load = load float* %addr2.ptr, align 4 | 96 %addr2.load = load float* %addr2.ptr, align 4 |
| 100 ret float %addr2.load | 97 ret float %addr2.load |
| 101 ; CHECK-LABEL: address_mode_opt_chaining_overflow: | 98 ; CHECK-LABEL: address_mode_opt_chaining_overflow |
| 102 ; CHECK: 2147483640 | 99 ; CHECK: 2147483640 |
| 103 ; CHECK: movss xmm0, dword ptr [{{.*}} + 2147483643] | 100 ; CHECK: movss xmm0,DWORD ptr [{{.*}}+2147483643] |
| 104 } | 101 } |
| 105 | 102 |
| 106 define float @address_mode_opt_chaining_overflow_sub(float* %arg) { | 103 define float @address_mode_opt_chaining_overflow_sub(float* %arg) { |
| 107 entry: | 104 entry: |
| 108 %arg.int = ptrtoint float* %arg to i32 | 105 %arg.int = ptrtoint float* %arg to i32 |
| 109 %addr1.int = sub i32 %arg.int, 2147483640 | 106 %addr1.int = sub i32 %arg.int, 2147483640 |
| 110 %addr2.int = sub i32 %addr1.int, 2147483643 | 107 %addr2.int = sub i32 %addr1.int, 2147483643 |
| 111 %addr2.ptr = inttoptr i32 %addr2.int to float* | 108 %addr2.ptr = inttoptr i32 %addr2.int to float* |
| 112 %addr2.load = load float* %addr2.ptr, align 4 | 109 %addr2.load = load float* %addr2.ptr, align 4 |
| 113 ret float %addr2.load | 110 ret float %addr2.load |
| 114 ; CHECK-LABEL: address_mode_opt_chaining_overflow_sub: | 111 ; CHECK-LABEL: address_mode_opt_chaining_overflow_sub |
| 115 ; CHECK: 2147483640 | 112 ; CHECK: 2147483640 |
| 116 ; CHECK: movss xmm0, dword ptr [{{.*}} - 2147483643] | 113 ; CHECK: movss xmm0,DWORD ptr [{{.*}}-2147483643] |
| 117 } | 114 } |
| 118 | 115 |
| 119 define float @address_mode_opt_chaining_no_overflow(float* %arg) { | 116 define float @address_mode_opt_chaining_no_overflow(float* %arg) { |
| 120 entry: | 117 entry: |
| 121 %arg.int = ptrtoint float* %arg to i32 | 118 %arg.int = ptrtoint float* %arg to i32 |
| 122 %addr1.int = sub i32 %arg.int, 2147483640 | 119 %addr1.int = sub i32 %arg.int, 2147483640 |
| 123 %addr2.int = add i32 %addr1.int, 2147483643 | 120 %addr2.int = add i32 %addr1.int, 2147483643 |
| 124 %addr2.ptr = inttoptr i32 %addr2.int to float* | 121 %addr2.ptr = inttoptr i32 %addr2.int to float* |
| 125 %addr2.load = load float* %addr2.ptr, align 4 | 122 %addr2.load = load float* %addr2.ptr, align 4 |
| 126 ret float %addr2.load | 123 ret float %addr2.load |
| 127 ; CHECK-LABEL: address_mode_opt_chaining_no_overflow: | 124 ; CHECK-LABEL: address_mode_opt_chaining_no_overflow |
| 128 ; CHECK: movss xmm0, dword ptr [{{.*}} + 3] | 125 ; CHECK: movss xmm0,DWORD ptr [{{.*}}+3] |
| 129 } | 126 } |
| 130 | 127 |
| 131 define float @address_mode_opt_add_pos_min_int(float* %arg) { | 128 define float @address_mode_opt_add_pos_min_int(float* %arg) { |
| 132 entry: | 129 entry: |
| 133 %arg.int = ptrtoint float* %arg to i32 | 130 %arg.int = ptrtoint float* %arg to i32 |
| 134 %addr1.int = add i32 %arg.int, 2147483648 | 131 %addr1.int = add i32 %arg.int, 2147483648 |
| 135 %addr1.ptr = inttoptr i32 %addr1.int to float* | 132 %addr1.ptr = inttoptr i32 %addr1.int to float* |
| 136 %addr1.load = load float* %addr1.ptr, align 4 | 133 %addr1.load = load float* %addr1.ptr, align 4 |
| 137 ret float %addr1.load | 134 ret float %addr1.load |
| 138 ; CHECK-LABEL: address_mode_opt_add_pos_min_int: | 135 ; CHECK-LABEL: address_mode_opt_add_pos_min_int |
| 139 ; CHECK: movss xmm0, dword ptr [{{.*}} - 2147483648] | 136 ; CHECK: movss xmm0,DWORD ptr [{{.*}}-2147483648] |
| 140 } | 137 } |
| 141 | 138 |
| 142 define float @address_mode_opt_sub_min_int(float* %arg) { | 139 define float @address_mode_opt_sub_min_int(float* %arg) { |
| 143 entry: | 140 entry: |
| 144 %arg.int = ptrtoint float* %arg to i32 | 141 %arg.int = ptrtoint float* %arg to i32 |
| 145 %addr1.int = sub i32 %arg.int, 2147483648 | 142 %addr1.int = sub i32 %arg.int, 2147483648 |
| 146 %addr1.ptr = inttoptr i32 %addr1.int to float* | 143 %addr1.ptr = inttoptr i32 %addr1.int to float* |
| 147 %addr1.load = load float* %addr1.ptr, align 4 | 144 %addr1.load = load float* %addr1.ptr, align 4 |
| 148 ret float %addr1.load | 145 ret float %addr1.load |
| 149 ; CHECK-LABEL: address_mode_opt_sub_min_int: | 146 ; CHECK-LABEL: address_mode_opt_sub_min_int |
| 150 ; CHECK: movss xmm0, dword ptr [{{.*}} - 2147483648] | 147 ; CHECK: movss xmm0,DWORD ptr [{{.*}}-2147483648] |
| 151 } | 148 } |
| OLD | NEW |