OLD | NEW |
1 ; Show that we know how to translate vector urem, srem and frem. | 1 ; Show that we know how to translate vector urem, srem and frem. |
2 | 2 |
3 ; NOTE: We use -O2 to get rid of memory stores. | 3 ; NOTE: We use -O2 to get rid of memory stores. |
4 | 4 |
5 ; REQUIRES: allow_dump | 5 ; REQUIRES: allow_dump |
6 | 6 |
7 ; Compile using standalone assembler. | 7 ; Compile using standalone assembler. |
8 ; RUN: %p2i --filetype=asm -i %s --target=arm32 --args -O2 -mattr=hwdiv-arm \ | 8 ; RUN: %p2i --filetype=asm -i %s --target=arm32 --args -O2 -mattr=hwdiv-arm \ |
9 ; RUN: | FileCheck %s --check-prefix=ASM | 9 ; RUN: | FileCheck %s --check-prefix=ASM |
10 | 10 |
11 define internal <4 x i32> @Urem4i32(<4 x i32> %a, <4 x i32> %b) { | 11 define internal <4 x i32> @Urem4i32(<4 x i32> %a, <4 x i32> %b) { |
12 ; ASM-LABEL:Urem4i32: | 12 ; ASM-LABEL:Urem4i32: |
13 | 13 |
14 entry: | 14 entry: |
15 ; ASM-NEXT:.LUrem4i32$entry: | 15 ; ASM-NEXT:.LUrem4i32$entry: |
16 | 16 |
17 %v = urem <4 x i32> %a, %b | 17 %v = urem <4 x i32> %a, %b |
18 | 18 |
19 ; ASM-LABEL:.LUrem4i32$local$__0: | 19 ; ASM-LABEL:.LUrem4i32$local$__0: |
20 ; ASM-NEXT:» udiv» r2, r0, r1 | 20 ; ASM-NEXT: udiv r2, r0, r1 |
21 ; ASM-NEXT:» mls» r2, r2, r1, r0 | 21 ; ASM-NEXT: mls r2, r2, r1, r0 |
22 ; ASM-NEXT:» vmov.32»d4[0], r2 | 22 ; ASM-NEXT: vmov.32 d4[0], r2 |
23 | 23 |
24 ; ASM-LABEL:.LUrem4i32$local$__1: | 24 ; ASM-LABEL:.LUrem4i32$local$__1: |
25 ; ASM-NEXT:» udiv» r2, r0, r1 | 25 ; ASM-NEXT: udiv r2, r0, r1 |
26 ; ASM-NEXT:» mls» r2, r2, r1, r0 | 26 ; ASM-NEXT: mls r2, r2, r1, r0 |
27 ; ASM-NEXT:» vmov.32»d4[1], r2 | 27 ; ASM-NEXT: vmov.32 d4[1], r2 |
28 | 28 |
29 ; ASM-LABEL:.LUrem4i32$local$__2: | 29 ; ASM-LABEL:.LUrem4i32$local$__2: |
30 ; ASM-NEXT:» udiv» r2, r0, r1 | 30 ; ASM-NEXT: udiv r2, r0, r1 |
31 ; ASM-NEXT:» mls» r2, r2, r1, r0 | 31 ; ASM-NEXT: mls r2, r2, r1, r0 |
32 ; ASM-NEXT:» vmov.32»d5[0], r2 | 32 ; ASM-NEXT: vmov.32 d5[0], r2 |
33 | 33 |
34 ; ASM-LABEL:.LUrem4i32$local$__3: | 34 ; ASM-LABEL:.LUrem4i32$local$__3: |
35 ; ASM-NEXT:» udiv» r2, r0, r1 | 35 ; ASM-NEXT: udiv r2, r0, r1 |
36 ; ASM-NEXT:» mls» r2, r2, r1, r0 | 36 ; ASM-NEXT: mls r2, r2, r1, r0 |
37 ; ASM-NEXT:» vmov.32»d5[1], r2 | 37 ; ASM-NEXT: vmov.32 d5[1], r2 |
38 | 38 |
39 ret <4 x i32> %v | 39 ret <4 x i32> %v |
40 } | 40 } |
41 | 41 |
42 define internal <4 x i32> @Srem4i32(<4 x i32> %a, <4 x i32> %b) { | 42 define internal <4 x i32> @Srem4i32(<4 x i32> %a, <4 x i32> %b) { |
43 ; ASM-LABEL:Srem4i32: | 43 ; ASM-LABEL:Srem4i32: |
44 | 44 |
45 entry: | 45 entry: |
46 ; ASM-NEXT:.LSrem4i32$entry: | 46 ; ASM-NEXT:.LSrem4i32$entry: |
47 | 47 |
48 %v = srem <4 x i32> %a, %b | 48 %v = srem <4 x i32> %a, %b |
49 | 49 |
50 ; ASM-LABEL:.LSrem4i32$local$__0: | 50 ; ASM-LABEL:.LSrem4i32$local$__0: |
51 ; ASM-NEXT:» sdiv» r2, r0, r1 | 51 ; ASM-NEXT: sdiv r2, r0, r1 |
52 ; ASM-NEXT:» mls» r2, r2, r1, r0 | 52 ; ASM-NEXT: mls r2, r2, r1, r0 |
53 ; ASM-NEXT:» vmov.32»d4[0], r2 | 53 ; ASM-NEXT: vmov.32 d4[0], r2 |
54 | 54 |
55 ; ASM-LABEL:.LSrem4i32$local$__1: | 55 ; ASM-LABEL:.LSrem4i32$local$__1: |
56 ; ASM-NEXT:» sdiv» r2, r0, r1 | 56 ; ASM-NEXT: sdiv r2, r0, r1 |
57 ; ASM-NEXT:» mls» r2, r2, r1, r0 | 57 ; ASM-NEXT: mls r2, r2, r1, r0 |
58 ; ASM-NEXT:» vmov.32»d4[1], r2 | 58 ; ASM-NEXT: vmov.32 d4[1], r2 |
59 | 59 |
60 ; ASM-LABEL:.LSrem4i32$local$__2: | 60 ; ASM-LABEL:.LSrem4i32$local$__2: |
61 ; ASM-NEXT:» sdiv» r2, r0, r1 | 61 ; ASM-NEXT: sdiv r2, r0, r1 |
62 ; ASM-NEXT:» mls» r2, r2, r1, r0 | 62 ; ASM-NEXT: mls r2, r2, r1, r0 |
63 ; ASM-NEXT:» vmov.32»d5[0], r2 | 63 ; ASM-NEXT: vmov.32 d5[0], r2 |
64 | 64 |
65 ; ASM-LABEL:.LSrem4i32$local$__3: | 65 ; ASM-LABEL:.LSrem4i32$local$__3: |
66 ; ASM-NEXT:» sdiv» r2, r0, r1 | 66 ; ASM-NEXT: sdiv r2, r0, r1 |
67 ; ASM-NEXT:» mls» r2, r2, r1, r0 | 67 ; ASM-NEXT: mls r2, r2, r1, r0 |
68 ; ASM-NEXT:» vmov.32»d5[1], r2 | 68 ; ASM-NEXT: vmov.32 d5[1], r2 |
69 | 69 |
70 ret <4 x i32> %v | 70 ret <4 x i32> %v |
71 } | 71 } |
72 | 72 |
73 define internal <4 x float> @Frem4float(<4 x float> %a, <4 x float> %b) { | 73 define internal <4 x float> @Frem4float(<4 x float> %a, <4 x float> %b) { |
74 ; ASM-LABEL:Frem4float: | 74 ; ASM-LABEL:Frem4float: |
75 | 75 |
76 entry: | 76 entry: |
77 ; ASM-NEXT:.LFrem4float$entry: | 77 ; ASM-NEXT:.LFrem4float$entry: |
78 | 78 |
79 %v = frem <4 x float> %a, %b | 79 %v = frem <4 x float> %a, %b |
80 | 80 |
81 ; ASM:» »vmov.f32» s0, s16 | 81 ; ASM: vmov.f32 s0, s16 |
82 ; ASM-NEXT:» vmov.f32» s1, s20 | 82 ; ASM-NEXT: vmov.f32 s1, s20 |
83 ; ASM-NEXT:» movw» r0, #:lower16:fmodf | 83 ; ASM-NEXT: bl fmodf |
84 ; ASM-NEXT:» movt» r0, #:upper16:fmodf | |
85 ; ASM-NEXT:» blx» r0 | |
86 | 84 |
87 ; ASM:» » vmov.f32» s0, s17 | 85 ; ASM: vmov.f32 s0, s17 |
88 ; ASM-NEXT:» vmov.f32» s1, s21 | 86 ; ASM-NEXT: vmov.f32 s1, s21 |
89 ; ASM-NEXT:» movw» r0, #:lower16:fmodf | 87 ; ASM-NEXT: bl fmodf |
90 ; ASM-NEXT:» movt» r0, #:upper16:fmodf | |
91 ; ASM-NEXT:» blx» r0 | |
92 | 88 |
93 ; ASM:» » vmov.f32» s0, s18 | 89 ; ASM: vmov.f32 s0, s18 |
94 ; ASM-NEXT:» vmov.f32» s1, s22 | 90 ; ASM-NEXT: vmov.f32 s1, s22 |
95 ; ASM-NEXT:» movw» r0, #:lower16:fmodf | 91 ; ASM-NEXT: bl fmodf |
96 ; ASM-NEXT:» movt» r0, #:upper16:fmodf | |
97 ; ASM-NEXT:» blx» r0 | |
98 | 92 |
99 ; ASM:» » vmov.f32» s16, s19 | 93 ; ASM: vmov.f32 s16, s19 |
100 ; ASM-NEXT:» vmov.f32» s20, s23 | 94 ; ASM-NEXT: vmov.f32 s20, s23 |
101 ; ASM-NEXT:» movw» r0, #:lower16:fmodf | 95 ; ASM: bl fmodf |
102 ; ASM-NEXT:» movt» r0, #:upper16:fmodf | |
103 ; ASM:» blx» r0 | |
104 | 96 |
105 ret <4 x float> %v | 97 ret <4 x float> %v |
106 } | 98 } |
OLD | NEW |