Chromium Code Reviews| OLD | NEW |
|---|---|
| (Empty) | |
| 1 ; Show that we know how to translate vector urem, srem and frem. | |
| 2 | |
| 3 ; NOTE: We use -O2 to get rid of memory stores. | |
| 4 | |
| 5 ; REQUIRES: allow_dump | |
| 6 | |
| 7 ; Compile using standalone assembler. | |
| 8 ; RUN: %p2i --filetype=asm -i %s --target=arm32 --args -O2 -mattr=hwdiv-arm \ | |
| 9 ; RUN: | FileCheck %s --check-prefix=ASM | |
| 10 | |
| 11 define internal <4 x i32> @Urem4i32(<4 x i32> %a, <4 x i32> %b) { | |
| 12 ; ASM-LABEL:Urem4i32: | |
| 13 | |
| 14 entry: | |
| 15 ; ASM-NEXT:.LUrem4i32$entry: | |
| 16 | |
| 17 %v = urem <4 x i32> %a, %b | |
| 18 | |
| 19 ; ASM-LABEL:.LUrem4i32$local$__0: | |
| 20 ; ASM-NEXT: udiv r2, r0, r1 | |
| 21 ; ASM-NEXT: mls r2, r2, r1, r0 | |
| 22 ; ASM-NEXT: vmov.32 d4[0], r2 | |
| 23 | |
| 24 ; ASM-LABEL:.LUrem4i32$local$__1: | |
| 25 ; ASM-NEXT: udiv r2, r0, r1 | |
| 26 ; ASM-NEXT: mls r2, r2, r1, r0 | |
| 27 ; ASM-NEXT: vmov.32 d4[1], r2 | |
| 28 | |
| 29 ; ASM-LABEL:.LUrem4i32$local$__2: | |
| 30 ; ASM-NEXT: udiv r2, r0, r1 | |
| 31 ; ASM-NEXT: mls r2, r2, r1, r0 | |
| 32 ; ASM-NEXT: vmov.32 d5[0], r2 | |
| 33 | |
| 34 ; ASM-LABEL:.LUrem4i32$local$__3: | |
| 35 ; ASM-NEXT: udiv r2, r0, r1 | |
| 36 ; ASM-NEXT: mls r2, r2, r1, r0 | |
| 37 ; ASM-NEXT: vmov.32 d5[1], r2 | |
| 38 | |
| 39 ret <4 x i32> %v | |
| 40 } | |
| 41 | |
| 42 define internal <4 x i32> @Srem4i32(<4 x i32> %a, <4 x i32> %b) { | |
| 43 ; ASM-LABEL:Srem4i32: | |
| 44 | |
| 45 entry: | |
| 46 ; ASM-NEXT:.LSrem4i32$entry: | |
| 47 | |
| 48 %v = srem <4 x i32> %a, %b | |
| 49 | |
| 50 ; ASM-LABEL:.LSrem4i32$local$__0: | |
| 51 ; ASM-NEXT: sdiv r2, r0, r1 | |
| 52 ; ASM-NEXT: mls r2, r2, r1, r0 | |
| 53 ; ASM-NEXT: vmov.32 d4[0], r2 | |
| 54 | |
| 55 ; ASM-LABEL:.LSrem4i32$local$__1: | |
| 56 ; ASM-NEXT: sdiv r2, r0, r1 | |
| 57 ; ASM-NEXT: mls r2, r2, r1, r0 | |
| 58 ; ASM-NEXT: vmov.32 d4[1], r2 | |
| 59 | |
| 60 ; ASM-LABEL:.LSrem4i32$local$__2: | |
| 61 ; ASM-NEXT: sdiv r2, r0, r1 | |
| 62 ; ASM-NEXT: mls r2, r2, r1, r0 | |
| 63 ; ASM-NEXT: vmov.32 d5[0], r2 | |
| 64 | |
| 65 ; ASM-LABEL:.LSrem4i32$local$__3: | |
| 66 ; ASM-NEXT: sdiv r2, r0, r1 | |
| 67 ; ASM-NEXT: mls r2, r2, r1, r0 | |
| 68 ; ASM-NEXT: vmov.32 d5[1], r2 | |
| 69 | |
| 70 ret <4 x i32> %v | |
| 71 } | |
| 72 | |
| 73 define internal <4 x float> @Frem4float(<4 x float> %a, <4 x float> %b) { | |
| 74 ; ASM-LABEL:Frem4float: | |
| 75 | |
| 76 entry: | |
| 77 ; ASM-NEXT:.LFrem4float$entry: | |
| 78 | |
| 79 %v = frem <4 x float> %a, %b | |
| 80 | |
| 81 ; ASM: vmov.f32 s0, s16 | |
| 82 ; ASM-NEXT: vmov.f32 s1, s20 | |
| 83 ; ASM-NEXT: movw r0, #:lower16:fmodf | |
| 84 ; ASM-NEXT: movt r0, #:upper16:fmodf | |
| 85 ; ASM-NEXT: blx r0 | |
| 86 | |
| 87 ; ASM: vmov.f32 s0, s17 | |
| 88 ; ASM-NEXT: vmov.f32 s1, s21 | |
| 89 ; ASM-NEXT: movw r0, #:lower16:fmodf | |
| 90 ; ASM-NEXT: movt r0, #:upper16:fmodf | |
| 91 ; ASM-NEXT: blx r0 | |
| 92 | |
| 93 ; ASM: vmov.f32 s0, s18 | |
| 94 ; ASM-NEXT: vmov.f32 s1, s22 | |
| 95 ; ASM-NEXT: movw r0, #:lower16:fmodf | |
| 96 ; ASM-NEXT: movt r0, #:upper16:fmodf | |
| 97 ; ASM-NEXT: blx r0 | |
| 98 | |
| 99 ; ASM: vmov.f32 s16, s19 | |
| 100 ; ASM-NEXT: vmov.f32 s20, s23 | |
| 101 ; ASM-NEXT: movw r0, #:lower16:fmodf | |
| 102 ; ASM-NEXT: movt r0, #:upper16:fmodf | |
| 103 ; ASM: blx r0 | |
| 104 | |
| 105 ret <4 x float> %v | |
| 106 } | |
| 107 | |
|
Jim Stichnoth
2016/02/17 20:59:51
remove trailing blank line
Eric Holk
2016/02/17 22:31:56
Done.
| |
| OLD | NEW |