Chromium Code Reviews
chromiumcodereview-hr@appspot.gserviceaccount.com (chromiumcodereview-hr) | Please choose your nickname with Settings | Help | Chromium Project | Gerrit Changes | Sign out
(970)

Unified Diff: tests_lit/llvm2ice_tests/nacl-mem-intrinsics.ll

Issue 1278173009: Inline memove for small constant sizes and refactor memcpy and memset. (Closed) Base URL: https://chromium.googlesource.com/native_client/pnacl-subzero.git@master
Patch Set: Created 5 years, 4 months ago
Use n/p to move between diff chunks; N/P to move between comments. Draft comments are only viewable by you.
Jump to:
View side-by-side diff with in-line comments
Download patch
« src/IceTargetLoweringX86BaseImpl.h ('K') | « src/IceTargetLoweringX86BaseImpl.h ('k') | no next file » | no next file with comments »
Expand Comments ('e') | Collapse Comments ('c') | Show Comments Hide Comments ('s')
Index: tests_lit/llvm2ice_tests/nacl-mem-intrinsics.ll
diff --git a/tests_lit/llvm2ice_tests/nacl-mem-intrinsics.ll b/tests_lit/llvm2ice_tests/nacl-mem-intrinsics.ll
index 8175eab856947136bd127f0831b37340a98caa6a..00354e6212c3f11cb0284b47f5779827fe816612 100644
--- a/tests_lit/llvm2ice_tests/nacl-mem-intrinsics.ll
+++ b/tests_lit/llvm2ice_tests/nacl-mem-intrinsics.ll
@@ -145,8 +145,6 @@ entry:
; ARM32-LABEL: test_memcpy_large_const_len
; ARM32: bl {{.*}} memcpy
-; TODO(jvoung) -- if we want to be clever, we can do memset without a function
-; call similar to memcpy.
define void @test_memmove(i32 %iptr_dst, i32 %iptr_src, i32 %len) {
entry:
%dst = inttoptr i32 %iptr_dst to i8*
@@ -160,17 +158,145 @@ entry:
; ARM32-LABEL: test_memmove
; ARM32: bl {{.*}} memmove
-define void @test_memmove_const_len_align(i32 %iptr_dst, i32 %iptr_src) {
+define void @test_memmove_long_const_len(i32 %iptr_dst, i32 %iptr_src) {
entry:
%dst = inttoptr i32 %iptr_dst to i8*
%src = inttoptr i32 %iptr_src to i8*
call void @llvm.memmove.p0i8.p0i8.i32(i8* %dst, i8* %src,
- i32 32, i32 1, i1 false)
+ i32 4876, i32 1, i1 false)
ret void
}
-; CHECK-LABEL: test_memmove_const_len_align
+; CHECK-LABEL: test_memmove_long_const_len
; CHECK: call {{.*}} R_{{.*}} memmove
-; ARM32-LABEL: test_memmove_const_len_align
+; ARM32-LABEL: test_memmove_long_const_len
+; ARM32: bl {{.*}} memmove
+
+define void @test_memmove_very_small_const_len(i32 %iptr_dst, i32 %iptr_src) {
+entry:
+ %dst = inttoptr i32 %iptr_dst to i8*
+ %src = inttoptr i32 %iptr_src to i8*
+ call void @llvm.memmove.p0i8.p0i8.i32(i8* %dst, i8* %src,
+ i32 2, i32 1, i1 false)
+ ret void
+}
+; CHECK-LABEL: test_memmove_very_small_const_len
+; CHECK: cmp {{.*}},{{.*}}
+; CHECK-NEXT: jb
+; CHECK-NEXT: xchg {{.*}},{{.*}}
+; CHECK-NEXT: mov [[REG:[^,]*]],WORD PTR [{{.*}}]
+; CHECK-NEXT: mov WORD PTR [{{.*}}],[[REG]]
+; CHECK-NOT: mov
+; ARM32-LABEL: test_memmove_very_small_const_len
+; ARM32: bl {{.*}} memmove
+
+define void @test_memmove_const_len_3(i32 %iptr_dst, i32 %iptr_src) {
+entry:
+ %dst = inttoptr i32 %iptr_dst to i8*
+ %src = inttoptr i32 %iptr_src to i8*
+ call void @llvm.memmove.p0i8.p0i8.i32(i8* %dst, i8* %src,
+ i32 3, i32 1, i1 false)
+ ret void
+}
+; CHECK-LABEL: test_memmove_const_len_3
+; CHECK: cmp {{.*}},{{.*}}
+; CHECK-NEXT: jb
+; CHECK-NEXT: xchg {{.*}},{{.*}}
+; CHECK-NEXT: mov [[REG:[^,]*]],WORD PTR [{{.*}}]
+; CHECK-NEXT: mov WORD PTR [{{.*}}],[[REG]]
+; CHECK-NEXT: mov [[REG:[^,]*]],BYTE PTR [{{.*}}+0x2]
+; CHECK-NEXT: mov BYTE PTR [{{.*}}+0x2],[[REG]]
+; CHECK-NOT: mov
+; ARM32-LABEL: test_memmove_const_len_3
+; ARM32: bl {{.*}} memmove
+
+define void @test_memmove_mid_const_len(i32 %iptr_dst, i32 %iptr_src) {
+entry:
+ %dst = inttoptr i32 %iptr_dst to i8*
+ %src = inttoptr i32 %iptr_src to i8*
+ call void @llvm.memmove.p0i8.p0i8.i32(i8* %dst, i8* %src,
+ i32 9, i32 1, i1 false)
+ ret void
+}
+; CHECK-LABEL: test_memmove_mid_const_len
+; CHECK: cmp {{.*}},{{.*}}
+; CHECK-NEXT: jb
+; CHECK-NEXT: xchg {{.*}},{{.*}}
+; CHECK-NEXT: movq [[REG:xmm[0-9]+]],QWORD PTR [{{.*}}]
+; CHECK-NEXT: movq QWORD PTR [{{.*}}],[[REG]]
+; CHECK-NEXT: mov [[REG:[^,]*]],BYTE PTR [{{.*}}+0x8]
+; CHECK-NEXT: mov BYTE PTR [{{.*}}+0x8],[[REG]]
+; CHECK-NOT: mov
+; ARM32-LABEL: test_memmove_mid_const_len
+; ARM32: bl {{.*}} memmove
+
+define void @test_memmove_mid_const_len_no_overlap(i32 %iptr_dst, i32 %iptr_src) {
+entry:
+ %dst = inttoptr i32 %iptr_dst to i8*
+ %src = inttoptr i32 %iptr_src to i8*
+ call void @llvm.memmove.p0i8.p0i8.i32(i8* %dst, i8* %src,
+ i32 15, i32 1, i1 false)
+ ret void
+}
+; CHECK-LABEL: test_memmove_mid_const_len_no_overlap
+; CHECK: cmp {{.*}},{{.*}}
+; CHECK-NEXT: jb
+; CHECK-NEXT: xchg {{.*}},{{.*}}
+; CHECK-NEXT: movq [[REG:xmm[0-9]+]],QWORD PTR [{{.*}}]
+; CHECK-NEXT: movq QWORD PTR [{{.*}}],[[REG]]
+; CHECK-NEXT: mov [[REG:[^,]*]],DWORD PTR [{{.*}}+0x8]
+; CHECK-NEXT: mov DWORD PTR [{{.*}}+0x8],[[REG]]
+; CHECK-NEXT: mov [[REG:[^,]*]],WORD PTR [{{.*}}+0xc]
+; CHECK: mov WORD PTR [{{.*}}+0xc],[[REG]]
Jim Stichnoth 2015/08/12 13:41:47 Is this a CHECK instead of CHECK-NEXT because sand
ascull 2015/08/17 22:18:53 With the new (and correct) implementation on memmo
+; CHECK-NEXT: mov [[REG:[^,]*]],BYTE PTR [{{.*}}+0xe]
+; CHECK-NEXT: mov BYTE PTR [{{.*}}+0xe],[[REG]]
+; CHECK-NOT: mov
+; ARM32-LABEL: test_memmove_mid_const_len_no_overlap
+; ARM32: bl {{.*}} memmove
+
+define void @test_memmove_big_const_len_no_overlap(i32 %iptr_dst, i32 %iptr_src) {
+entry:
+ %dst = inttoptr i32 %iptr_dst to i8*
+ %src = inttoptr i32 %iptr_src to i8*
+ call void @llvm.memmove.p0i8.p0i8.i32(i8* %dst, i8* %src,
+ i32 30, i32 1, i1 false)
+ ret void
+}
+; CHECK-LABEL: test_memmove_big_const_len_no_overlap
+; CHECK: cmp {{.*}},{{.*}}
+; CHECK-NEXT: jb
+; CHECK-NEXT: xchg {{.*}},{{.*}}
+; CHECK-NEXT: movups [[REG:xmm[0-9]+]],XMMWORD PTR [{{.*}}]
+; CHECK-NEXT: movups XMMWORD PTR [{{.*}}],[[REG]]
+; CHECK-NEXT: movq [[REG:xmm[0-9]+]],QWORD PTR [{{.*}}+0x10]
+; CHECK-NEXT: movq QWORD PTR [{{.*}}+0x10],[[REG]]
+; CHECK-NEXT: mov [[REG:[^,]*]],DWORD PTR [{{.*}}+0x18]
+; CHECK-NEXT: mov DWORD PTR [{{.*}}+0x18],[[REG]]
+; CHECK-NEXT: mov [[REG:[^,]*]],WORD PTR [{{.*}}+0x1c]
+; CHECK-NEXT: mov WORD PTR [{{.*}}+0x1c],[[REG]]
+; CHECK-NOT: mov
+; ARM32-LABEL: test_memmove_big_const_len_no_overlap
+; ARM32: bl {{.*}} memmove
+
+define void @test_memmove_large_const_len(i32 %iptr_dst, i32 %iptr_src) {
+entry:
+ %dst = inttoptr i32 %iptr_dst to i8*
+ %src = inttoptr i32 %iptr_src to i8*
+ call void @llvm.memmove.p0i8.p0i8.i32(i8* %dst, i8* %src,
+ i32 33, i32 1, i1 false)
+ ret void
+}
+; CHECK-LABEL: test_memmove_large_const_len
+; CHECK: cmp {{.*}},{{.*}}
+; CHECK-NEXT: jb
+; CHECK-NEXT: xchg {{.*}},{{.*}}
+; CHECK-NEXT: movups [[REG:xmm[0-9]+]],XMMWORD PTR [{{.*}}]
+; CHECK-NEXT: movups XMMWORD PTR [{{.*}}],[[REG]]
+; CHECK-NEXT: movups [[REG:xmm[0-9]+]],XMMWORD PTR [{{.*}}+0x10]
+; CHECK-NEXT: movups XMMWORD PTR [{{.*}}+0x10],[[REG]]
+; CHECK-NEXT: mov [[REG:[^,]*]],BYTE PTR [{{.*}}+0x20]
+; CHECK: mov BYTE PTR [{{.*}}+0x20],[[REG]]
+; CHECK-NOT: mov
+; ARM32-LABEL: test_memmove_large_const_len
; ARM32: bl {{.*}} memmove
define void @test_memset(i32 %iptr_dst, i32 %wide_val, i32 %len) {
« src/IceTargetLoweringX86BaseImpl.h ('K') | « src/IceTargetLoweringX86BaseImpl.h ('k') | no next file » | no next file with comments »

Powered by Google App Engine
This is Rietveld 408576698