| OLD | NEW |
| 1 ; This file checks support for address mode optimization. | 1 ; This file checks support for address mode optimization. |
| 2 | 2 |
| 3 ; RUN: %p2i --filetype=obj --disassemble -i %s --args -O2 \ | 3 ; RUN: %p2i --filetype=obj --disassemble -i %s --args -O2 \ |
| 4 ; RUN: | FileCheck %s | 4 ; RUN: | FileCheck %s |
| 5 ; RUN: %p2i --filetype=obj --disassemble -i %s --args -O2 -mattr=sse4.1 \ | 5 ; RUN: %p2i --filetype=obj --disassemble -i %s --args -O2 -mattr=sse4.1 \ |
| 6 ; RUN: | FileCheck --check-prefix=SSE41 %s | 6 ; RUN: | FileCheck --check-prefix=SSE41 %s |
| 7 | 7 |
| 8 define float @load_arg_plus_200000(float* %arg) { | 8 define float @load_arg_plus_200000(float* %arg) { |
| 9 entry: | 9 entry: |
| 10 %arg.int = ptrtoint float* %arg to i32 | 10 %arg.int = ptrtoint float* %arg to i32 |
| 11 %addr.int = add i32 %arg.int, 200000 | 11 %addr.int = add i32 %arg.int, 200000 |
| 12 %addr.ptr = inttoptr i32 %addr.int to float* | 12 %addr.ptr = inttoptr i32 %addr.int to float* |
| 13 %addr.load = load float* %addr.ptr, align 4 | 13 %addr.load = load float, float* %addr.ptr, align 4 |
| 14 ret float %addr.load | 14 ret float %addr.load |
| 15 ; CHECK-LABEL: load_arg_plus_200000 | 15 ; CHECK-LABEL: load_arg_plus_200000 |
| 16 ; CHECK: movss xmm0,DWORD PTR [eax+0x30d40] | 16 ; CHECK: movss xmm0,DWORD PTR [eax+0x30d40] |
| 17 } | 17 } |
| 18 | 18 |
| 19 define float @load_200000_plus_arg(float* %arg) { | 19 define float @load_200000_plus_arg(float* %arg) { |
| 20 entry: | 20 entry: |
| 21 %arg.int = ptrtoint float* %arg to i32 | 21 %arg.int = ptrtoint float* %arg to i32 |
| 22 %addr.int = add i32 200000, %arg.int | 22 %addr.int = add i32 200000, %arg.int |
| 23 %addr.ptr = inttoptr i32 %addr.int to float* | 23 %addr.ptr = inttoptr i32 %addr.int to float* |
| 24 %addr.load = load float* %addr.ptr, align 4 | 24 %addr.load = load float, float* %addr.ptr, align 4 |
| 25 ret float %addr.load | 25 ret float %addr.load |
| 26 ; CHECK-LABEL: load_200000_plus_arg | 26 ; CHECK-LABEL: load_200000_plus_arg |
| 27 ; CHECK: movss xmm0,DWORD PTR [eax+0x30d40] | 27 ; CHECK: movss xmm0,DWORD PTR [eax+0x30d40] |
| 28 } | 28 } |
| 29 | 29 |
| 30 define float @load_arg_minus_200000(float* %arg) { | 30 define float @load_arg_minus_200000(float* %arg) { |
| 31 entry: | 31 entry: |
| 32 %arg.int = ptrtoint float* %arg to i32 | 32 %arg.int = ptrtoint float* %arg to i32 |
| 33 %addr.int = sub i32 %arg.int, 200000 | 33 %addr.int = sub i32 %arg.int, 200000 |
| 34 %addr.ptr = inttoptr i32 %addr.int to float* | 34 %addr.ptr = inttoptr i32 %addr.int to float* |
| 35 %addr.load = load float* %addr.ptr, align 4 | 35 %addr.load = load float, float* %addr.ptr, align 4 |
| 36 ret float %addr.load | 36 ret float %addr.load |
| 37 ; CHECK-LABEL: load_arg_minus_200000 | 37 ; CHECK-LABEL: load_arg_minus_200000 |
| 38 ; CHECK: movss xmm0,DWORD PTR [eax-0x30d40] | 38 ; CHECK: movss xmm0,DWORD PTR [eax-0x30d40] |
| 39 } | 39 } |
| 40 | 40 |
| 41 define float @load_200000_minus_arg(float* %arg) { | 41 define float @load_200000_minus_arg(float* %arg) { |
| 42 entry: | 42 entry: |
| 43 %arg.int = ptrtoint float* %arg to i32 | 43 %arg.int = ptrtoint float* %arg to i32 |
| 44 %addr.int = sub i32 200000, %arg.int | 44 %addr.int = sub i32 200000, %arg.int |
| 45 %addr.ptr = inttoptr i32 %addr.int to float* | 45 %addr.ptr = inttoptr i32 %addr.int to float* |
| 46 %addr.load = load float* %addr.ptr, align 4 | 46 %addr.load = load float, float* %addr.ptr, align 4 |
| 47 ret float %addr.load | 47 ret float %addr.load |
| 48 ; CHECK-LABEL: load_200000_minus_arg | 48 ; CHECK-LABEL: load_200000_minus_arg |
| 49 ; CHECK: movss xmm0,DWORD PTR [e{{..}}] | 49 ; CHECK: movss xmm0,DWORD PTR [e{{..}}] |
| 50 } | 50 } |
| 51 | 51 |
| 52 define <8 x i16> @load_mul_v8i16_mem(<8 x i16> %arg0, i32 %arg1_iptr) { | 52 define <8 x i16> @load_mul_v8i16_mem(<8 x i16> %arg0, i32 %arg1_iptr) { |
| 53 entry: | 53 entry: |
| 54 %addr_sub = sub i32 %arg1_iptr, 200000 | 54 %addr_sub = sub i32 %arg1_iptr, 200000 |
| 55 %addr_ptr = inttoptr i32 %addr_sub to <8 x i16>* | 55 %addr_ptr = inttoptr i32 %addr_sub to <8 x i16>* |
| 56 %arg1 = load <8 x i16>* %addr_ptr, align 2 | 56 %arg1 = load <8 x i16>, <8 x i16>* %addr_ptr, align 2 |
| 57 %res_vec = mul <8 x i16> %arg0, %arg1 | 57 %res_vec = mul <8 x i16> %arg0, %arg1 |
| 58 ret <8 x i16> %res_vec | 58 ret <8 x i16> %res_vec |
| 59 ; Address mode optimization is generally unsafe for SSE vector instructions. | 59 ; Address mode optimization is generally unsafe for SSE vector instructions. |
| 60 ; CHECK-LABEL: load_mul_v8i16_mem | 60 ; CHECK-LABEL: load_mul_v8i16_mem |
| 61 ; CHECK-NOT: pmullw xmm{{.*}},XMMWORD PTR [e{{..}}-0x30d40] | 61 ; CHECK-NOT: pmullw xmm{{.*}},XMMWORD PTR [e{{..}}-0x30d40] |
| 62 } | 62 } |
| 63 | 63 |
| 64 define <4 x i32> @load_mul_v4i32_mem(<4 x i32> %arg0, i32 %arg1_iptr) { | 64 define <4 x i32> @load_mul_v4i32_mem(<4 x i32> %arg0, i32 %arg1_iptr) { |
| 65 entry: | 65 entry: |
| 66 %addr_sub = sub i32 %arg1_iptr, 200000 | 66 %addr_sub = sub i32 %arg1_iptr, 200000 |
| 67 %addr_ptr = inttoptr i32 %addr_sub to <4 x i32>* | 67 %addr_ptr = inttoptr i32 %addr_sub to <4 x i32>* |
| 68 %arg1 = load <4 x i32>* %addr_ptr, align 4 | 68 %arg1 = load <4 x i32>, <4 x i32>* %addr_ptr, align 4 |
| 69 %res = mul <4 x i32> %arg0, %arg1 | 69 %res = mul <4 x i32> %arg0, %arg1 |
| 70 ret <4 x i32> %res | 70 ret <4 x i32> %res |
| 71 ; Address mode optimization is generally unsafe for SSE vector instructions. | 71 ; Address mode optimization is generally unsafe for SSE vector instructions. |
| 72 ; CHECK-LABEL: load_mul_v4i32_mem | 72 ; CHECK-LABEL: load_mul_v4i32_mem |
| 73 ; CHECK-NOT: pmuludq xmm{{.*}},XMMWORD PTR [e{{..}}-0x30d40] | 73 ; CHECK-NOT: pmuludq xmm{{.*}},XMMWORD PTR [e{{..}}-0x30d40] |
| 74 ; CHECK: pmuludq | 74 ; CHECK: pmuludq |
| 75 ; | 75 ; |
| 76 ; SSE41-LABEL: load_mul_v4i32_mem | 76 ; SSE41-LABEL: load_mul_v4i32_mem |
| 77 ; SSE41-NOT: pmulld xmm{{.*}},XMMWORD PTR [e{{..}}-0x30d40] | 77 ; SSE41-NOT: pmulld xmm{{.*}},XMMWORD PTR [e{{..}}-0x30d40] |
| 78 } | 78 } |
| 79 | 79 |
| 80 define float @address_mode_opt_chaining(float* %arg) { | 80 define float @address_mode_opt_chaining(float* %arg) { |
| 81 entry: | 81 entry: |
| 82 %arg.int = ptrtoint float* %arg to i32 | 82 %arg.int = ptrtoint float* %arg to i32 |
| 83 %addr1.int = add i32 12, %arg.int | 83 %addr1.int = add i32 12, %arg.int |
| 84 %addr2.int = sub i32 %addr1.int, 4 | 84 %addr2.int = sub i32 %addr1.int, 4 |
| 85 %addr2.ptr = inttoptr i32 %addr2.int to float* | 85 %addr2.ptr = inttoptr i32 %addr2.int to float* |
| 86 %addr2.load = load float* %addr2.ptr, align 4 | 86 %addr2.load = load float, float* %addr2.ptr, align 4 |
| 87 ret float %addr2.load | 87 ret float %addr2.load |
| 88 ; CHECK-LABEL: address_mode_opt_chaining | 88 ; CHECK-LABEL: address_mode_opt_chaining |
| 89 ; CHECK: movss xmm0,DWORD PTR [eax+0x8] | 89 ; CHECK: movss xmm0,DWORD PTR [eax+0x8] |
| 90 } | 90 } |
| 91 | 91 |
| 92 define float @address_mode_opt_chaining_overflow(float* %arg) { | 92 define float @address_mode_opt_chaining_overflow(float* %arg) { |
| 93 entry: | 93 entry: |
| 94 %arg.int = ptrtoint float* %arg to i32 | 94 %arg.int = ptrtoint float* %arg to i32 |
| 95 %addr1.int = add i32 2147483640, %arg.int | 95 %addr1.int = add i32 2147483640, %arg.int |
| 96 %addr2.int = add i32 %addr1.int, 2147483643 | 96 %addr2.int = add i32 %addr1.int, 2147483643 |
| 97 %addr2.ptr = inttoptr i32 %addr2.int to float* | 97 %addr2.ptr = inttoptr i32 %addr2.int to float* |
| 98 %addr2.load = load float* %addr2.ptr, align 4 | 98 %addr2.load = load float, float* %addr2.ptr, align 4 |
| 99 ret float %addr2.load | 99 ret float %addr2.load |
| 100 ; CHECK-LABEL: address_mode_opt_chaining_overflow | 100 ; CHECK-LABEL: address_mode_opt_chaining_overflow |
| 101 ; CHECK: 0x7ffffff8 | 101 ; CHECK: 0x7ffffff8 |
| 102 ; CHECK: movss xmm0,DWORD PTR [{{.*}}+0x7ffffffb] | 102 ; CHECK: movss xmm0,DWORD PTR [{{.*}}+0x7ffffffb] |
| 103 } | 103 } |
| 104 | 104 |
| 105 define float @address_mode_opt_chaining_overflow_sub(float* %arg) { | 105 define float @address_mode_opt_chaining_overflow_sub(float* %arg) { |
| 106 entry: | 106 entry: |
| 107 %arg.int = ptrtoint float* %arg to i32 | 107 %arg.int = ptrtoint float* %arg to i32 |
| 108 %addr1.int = sub i32 %arg.int, 2147483640 | 108 %addr1.int = sub i32 %arg.int, 2147483640 |
| 109 %addr2.int = sub i32 %addr1.int, 2147483643 | 109 %addr2.int = sub i32 %addr1.int, 2147483643 |
| 110 %addr2.ptr = inttoptr i32 %addr2.int to float* | 110 %addr2.ptr = inttoptr i32 %addr2.int to float* |
| 111 %addr2.load = load float* %addr2.ptr, align 4 | 111 %addr2.load = load float, float* %addr2.ptr, align 4 |
| 112 ret float %addr2.load | 112 ret float %addr2.load |
| 113 ; CHECK-LABEL: address_mode_opt_chaining_overflow_sub | 113 ; CHECK-LABEL: address_mode_opt_chaining_overflow_sub |
| 114 ; CHECK: 0x7ffffff8 | 114 ; CHECK: 0x7ffffff8 |
| 115 ; CHECK: movss xmm0,DWORD PTR [{{.*}}-0x7ffffffb] | 115 ; CHECK: movss xmm0,DWORD PTR [{{.*}}-0x7ffffffb] |
| 116 } | 116 } |
| 117 | 117 |
| 118 define float @address_mode_opt_chaining_no_overflow(float* %arg) { | 118 define float @address_mode_opt_chaining_no_overflow(float* %arg) { |
| 119 entry: | 119 entry: |
| 120 %arg.int = ptrtoint float* %arg to i32 | 120 %arg.int = ptrtoint float* %arg to i32 |
| 121 %addr1.int = sub i32 %arg.int, 2147483640 | 121 %addr1.int = sub i32 %arg.int, 2147483640 |
| 122 %addr2.int = add i32 %addr1.int, 2147483643 | 122 %addr2.int = add i32 %addr1.int, 2147483643 |
| 123 %addr2.ptr = inttoptr i32 %addr2.int to float* | 123 %addr2.ptr = inttoptr i32 %addr2.int to float* |
| 124 %addr2.load = load float* %addr2.ptr, align 4 | 124 %addr2.load = load float, float* %addr2.ptr, align 4 |
| 125 ret float %addr2.load | 125 ret float %addr2.load |
| 126 ; CHECK-LABEL: address_mode_opt_chaining_no_overflow | 126 ; CHECK-LABEL: address_mode_opt_chaining_no_overflow |
| 127 ; CHECK: movss xmm0,DWORD PTR [{{.*}}+0x3] | 127 ; CHECK: movss xmm0,DWORD PTR [{{.*}}+0x3] |
| 128 } | 128 } |
| 129 | 129 |
| 130 define float @address_mode_opt_add_pos_min_int(float* %arg) { | 130 define float @address_mode_opt_add_pos_min_int(float* %arg) { |
| 131 entry: | 131 entry: |
| 132 %arg.int = ptrtoint float* %arg to i32 | 132 %arg.int = ptrtoint float* %arg to i32 |
| 133 %addr1.int = add i32 %arg.int, 2147483648 | 133 %addr1.int = add i32 %arg.int, 2147483648 |
| 134 %addr1.ptr = inttoptr i32 %addr1.int to float* | 134 %addr1.ptr = inttoptr i32 %addr1.int to float* |
| 135 %addr1.load = load float* %addr1.ptr, align 4 | 135 %addr1.load = load float, float* %addr1.ptr, align 4 |
| 136 ret float %addr1.load | 136 ret float %addr1.load |
| 137 ; CHECK-LABEL: address_mode_opt_add_pos_min_int | 137 ; CHECK-LABEL: address_mode_opt_add_pos_min_int |
| 138 ; CHECK: movss xmm0,DWORD PTR [{{.*}}-0x80000000] | 138 ; CHECK: movss xmm0,DWORD PTR [{{.*}}-0x80000000] |
| 139 } | 139 } |
| 140 | 140 |
| 141 define float @address_mode_opt_sub_min_int(float* %arg) { | 141 define float @address_mode_opt_sub_min_int(float* %arg) { |
| 142 entry: | 142 entry: |
| 143 %arg.int = ptrtoint float* %arg to i32 | 143 %arg.int = ptrtoint float* %arg to i32 |
| 144 %addr1.int = sub i32 %arg.int, 2147483648 | 144 %addr1.int = sub i32 %arg.int, 2147483648 |
| 145 %addr1.ptr = inttoptr i32 %addr1.int to float* | 145 %addr1.ptr = inttoptr i32 %addr1.int to float* |
| 146 %addr1.load = load float* %addr1.ptr, align 4 | 146 %addr1.load = load float, float* %addr1.ptr, align 4 |
| 147 ret float %addr1.load | 147 ret float %addr1.load |
| 148 ; CHECK-LABEL: address_mode_opt_sub_min_int | 148 ; CHECK-LABEL: address_mode_opt_sub_min_int |
| 149 ; CHECK: movss xmm0,DWORD PTR [{{.*}}-0x80000000] | 149 ; CHECK: movss xmm0,DWORD PTR [{{.*}}-0x80000000] |
| 150 } | 150 } |
| OLD | NEW |