Chromium Code Reviews
chromiumcodereview-hr@appspot.gserviceaccount.com (chromiumcodereview-hr) | Please choose your nickname with Settings | Help | Chromium Project | Gerrit Changes | Sign out
(189)

Side by Side Diff: tests_lit/llvm2ice_tests/nacl-mem-intrinsics.ll

Issue 1278173009: Inline memove for small constant sizes and refactor memcpy and memset. (Closed) Base URL: https://chromium.googlesource.com/native_client/pnacl-subzero.git@master
Patch Set: Simplify xtests and add flags for memory intrinsic optimization. Created 5 years, 4 months ago
Use n/p to move between diff chunks; N/P to move between comments. Draft comments are only viewable by you.
Jump to:
View unified diff | Download patch
OLDNEW
1 ; This tests the NaCl intrinsics memset, memcpy and memmove. 1 ; This tests the NaCl intrinsics memset, memcpy and memmove.
2 2
3 ; RUN: %if --need=target_X8632 --command %p2i --filetype=obj --disassemble \ 3 ; RUN: %if --need=target_X8632 --command %p2i --filetype=obj --disassemble \
4 ; RUN: --target x8632 -i %s --args -O2 -sandbox \ 4 ; RUN: --target x8632 -i %s --args -O2 -sandbox \
5 ; RUN: | %if --need=target_X8632 --command FileCheck %s 5 ; RUN: | %if --need=target_X8632 --command FileCheck %s
6 ; RUN: %if --need=target_X8632 --command %p2i --filetype=obj --disassemble \ 6 ; RUN: %if --need=target_X8632 --command %p2i --filetype=obj --disassemble \
7 ; RUN: --target x8632 -i %s --args -Om1 -sandbox \ 7 ; RUN: --target x8632 -i %s --args -Om1 --fmem-intrin-opt -sandbox \
Jim Stichnoth 2015/08/18 17:11:28 I think you should have one more RUN configuration
ascull 2015/08/18 18:38:01 Done.
8 ; RUN: | %if --need=target_X8632 --command FileCheck %s 8 ; RUN: | %if --need=target_X8632 --command FileCheck %s
9 9
10 ; RUN: %if --need=target_ARM32 --need=allow_dump \ 10 ; RUN: %if --need=target_ARM32 --need=allow_dump \
11 ; RUN: --command %p2i --filetype=asm --assemble --disassemble --target arm32 \ 11 ; RUN: --command %p2i --filetype=asm --assemble --disassemble --target arm32 \
12 ; RUN: -i %s --args -O2 --skip-unimplemented \ 12 ; RUN: -i %s --args -O2 --skip-unimplemented \
13 ; RUN: | %if --need=target_ARM32 --need=allow_dump \ 13 ; RUN: | %if --need=target_ARM32 --need=allow_dump \
14 ; RUN: --command FileCheck --check-prefix ARM32 %s 14 ; RUN: --command FileCheck --check-prefix ARM32 %s
15 15
16 declare void @llvm.memcpy.p0i8.p0i8.i32(i8*, i8*, i32, i32, i1) 16 declare void @llvm.memcpy.p0i8.p0i8.i32(i8*, i8*, i32, i32, i1)
17 declare void @llvm.memmove.p0i8.p0i8.i32(i8*, i8*, i32, i32, i1) 17 declare void @llvm.memmove.p0i8.p0i8.i32(i8*, i8*, i32, i32, i1)
(...skipping 120 matching lines...) Expand 10 before | Expand all | Expand 10 after
138 ; CHECK: movups [[REG:xmm[0-9]+]],XMMWORD PTR [{{.*}}+0x10] 138 ; CHECK: movups [[REG:xmm[0-9]+]],XMMWORD PTR [{{.*}}+0x10]
139 ; CHECK-NEXT: movups XMMWORD PTR [{{.*}}+0x10],[[REG]] 139 ; CHECK-NEXT: movups XMMWORD PTR [{{.*}}+0x10],[[REG]]
140 ; CHECK-NEXT: movups [[REG:xmm[0-9]+]],XMMWORD PTR [{{.*}}] 140 ; CHECK-NEXT: movups [[REG:xmm[0-9]+]],XMMWORD PTR [{{.*}}]
141 ; CHECK-NEXT: movups XMMWORD PTR [{{.*}}],[[REG]] 141 ; CHECK-NEXT: movups XMMWORD PTR [{{.*}}],[[REG]]
142 ; CHECK-NEXT: mov [[REG:[^,]*]],BYTE PTR [{{.*}}+0x20] 142 ; CHECK-NEXT: mov [[REG:[^,]*]],BYTE PTR [{{.*}}+0x20]
143 ; CHECK-NEXT: mov BYTE PTR [{{.*}}+0x20],[[REG]] 143 ; CHECK-NEXT: mov BYTE PTR [{{.*}}+0x20],[[REG]]
144 ; CHECK-NOT: mov 144 ; CHECK-NOT: mov
145 ; ARM32-LABEL: test_memcpy_large_const_len 145 ; ARM32-LABEL: test_memcpy_large_const_len
146 ; ARM32: bl {{.*}} memcpy 146 ; ARM32: bl {{.*}} memcpy
147 147
148 ; TODO(jvoung) -- if we want to be clever, we can do memset without a function
149 ; call similar to memcpy.
150 define void @test_memmove(i32 %iptr_dst, i32 %iptr_src, i32 %len) { 148 define void @test_memmove(i32 %iptr_dst, i32 %iptr_src, i32 %len) {
151 entry: 149 entry:
152 %dst = inttoptr i32 %iptr_dst to i8* 150 %dst = inttoptr i32 %iptr_dst to i8*
153 %src = inttoptr i32 %iptr_src to i8* 151 %src = inttoptr i32 %iptr_src to i8*
154 call void @llvm.memmove.p0i8.p0i8.i32(i8* %dst, i8* %src, 152 call void @llvm.memmove.p0i8.p0i8.i32(i8* %dst, i8* %src,
155 i32 %len, i32 1, i1 false) 153 i32 %len, i32 1, i1 false)
156 ret void 154 ret void
157 } 155 }
158 ; CHECK-LABEL: test_memmove 156 ; CHECK-LABEL: test_memmove
159 ; CHECK: call {{.*}} R_{{.*}} memmove 157 ; CHECK: call {{.*}} R_{{.*}} memmove
160 ; ARM32-LABEL: test_memmove 158 ; ARM32-LABEL: test_memmove
161 ; ARM32: bl {{.*}} memmove 159 ; ARM32: bl {{.*}} memmove
162 160
163 define void @test_memmove_const_len_align(i32 %iptr_dst, i32 %iptr_src) { 161 define void @test_memmove_long_const_len(i32 %iptr_dst, i32 %iptr_src) {
164 entry: 162 entry:
165 %dst = inttoptr i32 %iptr_dst to i8* 163 %dst = inttoptr i32 %iptr_dst to i8*
166 %src = inttoptr i32 %iptr_src to i8* 164 %src = inttoptr i32 %iptr_src to i8*
167 call void @llvm.memmove.p0i8.p0i8.i32(i8* %dst, i8* %src, 165 call void @llvm.memmove.p0i8.p0i8.i32(i8* %dst, i8* %src,
168 i32 32, i32 1, i1 false) 166 i32 4876, i32 1, i1 false)
169 ret void 167 ret void
170 } 168 }
171 ; CHECK-LABEL: test_memmove_const_len_align 169 ; CHECK-LABEL: test_memmove_long_const_len
172 ; CHECK: call {{.*}} R_{{.*}} memmove 170 ; CHECK: call {{.*}} R_{{.*}} memmove
173 ; ARM32-LABEL: test_memmove_const_len_align 171 ; ARM32-LABEL: test_memmove_long_const_len
172 ; ARM32: bl {{.*}} memmove
173
174 define void @test_memmove_very_small_const_len(i32 %iptr_dst, i32 %iptr_src) {
175 entry:
176 %dst = inttoptr i32 %iptr_dst to i8*
177 %src = inttoptr i32 %iptr_src to i8*
178 call void @llvm.memmove.p0i8.p0i8.i32(i8* %dst, i8* %src,
179 i32 2, i32 1, i1 false)
180 ret void
181 }
182 ; CHECK-LABEL: test_memmove_very_small_const_len
183 ; CHECK: mov [[REG:[^,]*]],WORD PTR [{{.*}}]
184 ; CHECK-NEXT: mov WORD PTR [{{.*}}],[[REG]]
185 ; CHECK-NOT: mov
186 ; ARM32-LABEL: test_memmove_very_small_const_len
187 ; ARM32: bl {{.*}} memmove
188
189 define void @test_memmove_const_len_3(i32 %iptr_dst, i32 %iptr_src) {
190 entry:
191 %dst = inttoptr i32 %iptr_dst to i8*
192 %src = inttoptr i32 %iptr_src to i8*
193 call void @llvm.memmove.p0i8.p0i8.i32(i8* %dst, i8* %src,
194 i32 3, i32 1, i1 false)
195 ret void
196 }
197 ; CHECK-LABEL: test_memmove_const_len_3
198 ; CHECK: mov [[REG0:[^,]*]],WORD PTR [{{.*}}]
199 ; CHECK-NEXT: mov [[REG1:[^,]*]],BYTE PTR [{{.*}}+0x2]
200 ; CHECK-NEXT: mov WORD PTR [{{.*}}],[[REG0]]
201 ; CHECK-NEXT: mov BYTE PTR [{{.*}}+0x2],[[REG1]]
202 ; CHECK-NOT: mov
203 ; ARM32-LABEL: test_memmove_const_len_3
204 ; ARM32: bl {{.*}} memmove
205
206 define void @test_memmove_mid_const_len(i32 %iptr_dst, i32 %iptr_src) {
207 entry:
208 %dst = inttoptr i32 %iptr_dst to i8*
209 %src = inttoptr i32 %iptr_src to i8*
210 call void @llvm.memmove.p0i8.p0i8.i32(i8* %dst, i8* %src,
211 i32 9, i32 1, i1 false)
212 ret void
213 }
214 ; CHECK-LABEL: test_memmove_mid_const_len
215 ; CHECK: movq [[REG0:xmm[0-9]+]],QWORD PTR [{{.*}}]
216 ; CHECK-NEXT: mov [[REG1:[^,]*]],BYTE PTR [{{.*}}+0x8]
217 ; CHECK-NEXT: movq QWORD PTR [{{.*}}],[[REG0]]
218 ; CHECK-NEXT: mov BYTE PTR [{{.*}}+0x8],[[REG1]]
219 ; CHECK-NOT: mov
220 ; ARM32-LABEL: test_memmove_mid_const_len
221 ; ARM32: bl {{.*}} memmove
222
223 define void @test_memmove_mid_const_len_overlap(i32 %iptr_dst, i32 %iptr_src) {
224 entry:
225 %dst = inttoptr i32 %iptr_dst to i8*
226 %src = inttoptr i32 %iptr_src to i8*
227 call void @llvm.memmove.p0i8.p0i8.i32(i8* %dst, i8* %src,
228 i32 15, i32 1, i1 false)
229 ret void
230 }
231 ; CHECK-LABEL: test_memmove_mid_const_len_overlap
232 ; CHECK: movq [[REG0:xmm[0-9]+]],QWORD PTR [{{.*}}]
233 ; CHECK-NEXT: movq [[REG1:xmm[0-9]+]],QWORD PTR [{{.*}}+0x7]
234 ; CHECK-NEXT: movq QWORD PTR [{{.*}}],[[REG0]]
235 ; CHECK-NEXT: movq QWORD PTR [{{.*}}+0x7],[[REG1]]
236 ; CHECK-NOT: mov
237 ; ARM32-LABEL: test_memmove_mid_const_len_overlap
238 ; ARM32: bl {{.*}} memmove
239
240 define void @test_memmove_large_const_len_overlap(i32 %iptr_dst, i32 %iptr_src) {
241 entry:
242 %dst = inttoptr i32 %iptr_dst to i8*
243 %src = inttoptr i32 %iptr_src to i8*
244 call void @llvm.memmove.p0i8.p0i8.i32(i8* %dst, i8* %src,
245 i32 30, i32 1, i1 false)
246 ret void
247 }
248 ; CHECK-LABEL: test_memmove_large_const_len_overlap
249 ; CHECK: movups [[REG0:xmm[0-9]+]],XMMWORD PTR [{{.*}}]
250 ; CHECK-NEXT: movups [[REG1:xmm[0-9]+]],XMMWORD PTR [{{.*}}+0xe]
251 ; CHECK-NEXT: movups XMMWORD PTR [{{.*}}],[[REG0]]
252 ; CHECK-NEXT: movups XMMWORD PTR [{{.*}}+0xe],[[REG1]]
253 ; CHECK-NOT: mov
254 ; ARM32-LABEL: test_memmove_large_const_len_overlap
255 ; ARM32: bl {{.*}} memmove
256
257 define void @test_memmove_large_const_len(i32 %iptr_dst, i32 %iptr_src) {
258 entry:
259 %dst = inttoptr i32 %iptr_dst to i8*
260 %src = inttoptr i32 %iptr_src to i8*
261 call void @llvm.memmove.p0i8.p0i8.i32(i8* %dst, i8* %src,
262 i32 33, i32 1, i1 false)
263 ret void
264 }
265 ; CHECK-LABEL: test_memmove_large_const_len
266 ; CHECK: movups [[REG0:xmm[0-9]+]],XMMWORD PTR [{{.*}}+0x10]
267 ; CHECK-NEXT: movups [[REG1:xmm[0-9]+]],XMMWORD PTR [{{.*}}]
268 ; CHECK-NEXT: mov [[REG2:[^,]*]],BYTE PTR [{{.*}}+0x20]
269 ; CHECK-NEXT: movups XMMWORD PTR [{{.*}}+0x10],[[REG0]]
270 ; CHECK-NEXT: movups XMMWORD PTR [{{.*}}],[[REG1]]
271 ; CHECK-NEXT: mov BYTE PTR [{{.*}}+0x20],[[REG2]]
272 ; CHECK-NOT: mov
273 ; ARM32-LABEL: test_memmove_large_const_len
174 ; ARM32: bl {{.*}} memmove 274 ; ARM32: bl {{.*}} memmove
175 275
176 define void @test_memset(i32 %iptr_dst, i32 %wide_val, i32 %len) { 276 define void @test_memset(i32 %iptr_dst, i32 %wide_val, i32 %len) {
177 entry: 277 entry:
178 %val = trunc i32 %wide_val to i8 278 %val = trunc i32 %wide_val to i8
179 %dst = inttoptr i32 %iptr_dst to i8* 279 %dst = inttoptr i32 %iptr_dst to i8*
180 call void @llvm.memset.p0i8.i32(i8* %dst, i8 %val, 280 call void @llvm.memset.p0i8.i32(i8* %dst, i8 %val,
181 i32 %len, i32 1, i1 false) 281 i32 %len, i32 1, i1 false)
182 ret void 282 ret void
183 } 283 }
(...skipping 140 matching lines...) Expand 10 before | Expand all | Expand 10 after
324 } 424 }
325 ; CHECK-LABEL: test_memset_zero_const_len_large 425 ; CHECK-LABEL: test_memset_zero_const_len_large
326 ; CHECK: pxor [[ZERO:xmm[0-9]+]],[[ZERO]] 426 ; CHECK: pxor [[ZERO:xmm[0-9]+]],[[ZERO]]
327 ; CHECK-NEXT: movups XMMWORD PTR [{{.*}}+0x10],[[ZERO]] 427 ; CHECK-NEXT: movups XMMWORD PTR [{{.*}}+0x10],[[ZERO]]
328 ; CHECK-NEXT: movups XMMWORD PTR [{{.*}}],[[ZERO]] 428 ; CHECK-NEXT: movups XMMWORD PTR [{{.*}}],[[ZERO]]
329 ; CHECK-NEXT: mov BYTE PTR [{{.*}}+0x20],0x0 429 ; CHECK-NEXT: mov BYTE PTR [{{.*}}+0x20],0x0
330 ; CHECK-NOT: mov 430 ; CHECK-NOT: mov
331 ; ARM32-LABEL: test_memset_zero_const_len_large 431 ; ARM32-LABEL: test_memset_zero_const_len_large
332 ; ARM32: uxtb 432 ; ARM32: uxtb
333 ; ARM32: bl {{.*}} memset 433 ; ARM32: bl {{.*}} memset
OLDNEW

Powered by Google App Engine
This is Rietveld 408576698