OLD | NEW |
---|---|
(Empty) | |
1 ; Show that we know how to translate vector urem, srem and frem. | |
2 | |
3 ; NOTE: We use -O2 to get rid of memory stores. | |
4 | |
5 ; REQUIRES: allow_dump | |
6 | |
7 ; Compile using standalone assembler. | |
8 ; RUN: %p2i --filetype=asm -i %s --target=arm32 --args -O2 -mattr=hwdiv-arm \ | |
9 ; RUN: | FileCheck %s --check-prefix=ASM | |
10 | |
11 define internal <4 x i32> @Urem4i32(<4 x i32> %a, <4 x i32> %b) { | |
12 ; ASM-LABEL:Urem4i32: | |
13 | |
14 entry: | |
15 ; ASM-NEXT:.LUrem4i32$entry: | |
16 | |
17 %v = urem <4 x i32> %a, %b | |
18 | |
19 ; ASM-LABEL:.LUrem4i32$local$__0: | |
20 ; ASM-NEXT: udiv r2, r0, r1 | |
21 ; ASM-NEXT: mls r2, r2, r1, r0 | |
22 ; ASM-NEXT: vmov.32 d4[0], r2 | |
23 | |
24 ; ASM-LABEL:.LUrem4i32$local$__1: | |
25 ; ASM-NEXT: udiv r2, r0, r1 | |
26 ; ASM-NEXT: mls r2, r2, r1, r0 | |
27 ; ASM-NEXT: vmov.32 d4[1], r2 | |
28 | |
29 ; ASM-LABEL:.LUrem4i32$local$__2: | |
30 ; ASM-NEXT: udiv r2, r0, r1 | |
31 ; ASM-NEXT: mls r2, r2, r1, r0 | |
32 ; ASM-NEXT: vmov.32 d5[0], r2 | |
33 | |
34 ; ASM-LABEL:.LUrem4i32$local$__3: | |
35 ; ASM-NEXT: udiv r2, r0, r1 | |
36 ; ASM-NEXT: mls r2, r2, r1, r0 | |
37 ; ASM-NEXT: vmov.32 d5[1], r2 | |
38 | |
39 ret <4 x i32> %v | |
40 } | |
41 | |
42 define internal <4 x i32> @Srem4i32(<4 x i32> %a, <4 x i32> %b) { | |
43 ; ASM-LABEL:Srem4i32: | |
44 | |
45 entry: | |
46 ; ASM-NEXT:.LSrem4i32$entry: | |
47 | |
48 %v = srem <4 x i32> %a, %b | |
49 | |
50 ; ASM-LABEL:.LSrem4i32$local$__0: | |
51 ; ASM-NEXT: sdiv r2, r0, r1 | |
52 ; ASM-NEXT: mls r2, r2, r1, r0 | |
53 ; ASM-NEXT: vmov.32 d4[0], r2 | |
54 | |
55 ; ASM-LABEL:.LSrem4i32$local$__1: | |
56 ; ASM-NEXT: sdiv r2, r0, r1 | |
57 ; ASM-NEXT: mls r2, r2, r1, r0 | |
58 ; ASM-NEXT: vmov.32 d4[1], r2 | |
59 | |
60 ; ASM-LABEL:.LSrem4i32$local$__2: | |
61 ; ASM-NEXT: sdiv r2, r0, r1 | |
62 ; ASM-NEXT: mls r2, r2, r1, r0 | |
63 ; ASM-NEXT: vmov.32 d5[0], r2 | |
64 | |
65 ; ASM-LABEL:.LSrem4i32$local$__3: | |
66 ; ASM-NEXT: sdiv r2, r0, r1 | |
67 ; ASM-NEXT: mls r2, r2, r1, r0 | |
68 ; ASM-NEXT: vmov.32 d5[1], r2 | |
69 | |
70 ret <4 x i32> %v | |
71 } | |
72 | |
73 define internal <4 x float> @Frem4float(<4 x float> %a, <4 x float> %b) { | |
74 ; ASM-LABEL:Frem4float: | |
75 | |
76 entry: | |
77 ; ASM-NEXT:.LFrem4float$entry: | |
78 | |
79 %v = frem <4 x float> %a, %b | |
80 | |
81 ; ASM: vmov.f32 s0, s16 | |
82 ; ASM-NEXT: vmov.f32 s1, s20 | |
83 ; ASM-NEXT: movw r0, #:lower16:fmodf | |
84 ; ASM-NEXT: movt r0, #:upper16:fmodf | |
85 ; ASM-NEXT: blx r0 | |
86 | |
87 ; ASM: vmov.f32 s0, s17 | |
88 ; ASM-NEXT: vmov.f32 s1, s21 | |
89 ; ASM-NEXT: movw r0, #:lower16:fmodf | |
90 ; ASM-NEXT: movt r0, #:upper16:fmodf | |
91 ; ASM-NEXT: blx r0 | |
92 | |
93 ; ASM: vmov.f32 s0, s18 | |
94 ; ASM-NEXT: vmov.f32 s1, s22 | |
95 ; ASM-NEXT: movw r0, #:lower16:fmodf | |
96 ; ASM-NEXT: movt r0, #:upper16:fmodf | |
97 ; ASM-NEXT: blx r0 | |
98 | |
99 ; ASM: vmov.f32 s16, s19 | |
100 ; ASM-NEXT: vmov.f32 s20, s23 | |
101 ; ASM-NEXT: movw r0, #:lower16:fmodf | |
102 ; ASM-NEXT: movt r0, #:upper16:fmodf | |
103 ; ASM: blx r0 | |
104 | |
105 ret <4 x float> %v | |
106 } | |
107 | |
Jim Stichnoth
2016/02/17 04:15:44
trailing blank line
| |
OLD | NEW |