| Index: celt/arm/celt_pitch_xcorr_arm.s
|
| diff --git a/celt/arm/celt_pitch_xcorr_arm.s b/celt/arm/celt_pitch_xcorr_arm.s
|
| index 598e45be36bf2700b26c4a36db3f42631b913300..f96e0a88bbe609ed638b1a44b67e9038a3ed3447 100644
|
| --- a/celt/arm/celt_pitch_xcorr_arm.s
|
| +++ b/celt/arm/celt_pitch_xcorr_arm.s
|
| @@ -42,6 +42,7 @@ IF OPUS_ARM_MAY_HAVE_NEON
|
|
|
| ; Compute sum[k]=sum(x[j]*y[j+k],j=0...len-1), k=0...3
|
| xcorr_kernel_neon PROC
|
| +xcorr_kernel_neon_start
|
| ; input:
|
| ; r3 = int len
|
| ; r4 = opus_val16 *x
|
| @@ -181,7 +182,7 @@ celt_pitch_xcorr_neon_process4
|
| VEOR q0, q0, q0
|
| ; xcorr_kernel_neon only modifies r4, r5, r12, and q0...q3.
|
| ; So we don't save/restore any other registers.
|
| - BL xcorr_kernel_neon
|
| + BL xcorr_kernel_neon_start
|
| SUBS r6, r6, #4
|
| VST1.32 {q0}, [r2]!
|
| ; _y += 4
|
| @@ -257,6 +258,7 @@ IF OPUS_ARM_MAY_HAVE_EDSP
|
| ; This will get used on ARMv7 devices without NEON, so it has been optimized
|
| ; to take advantage of dual-issuing where possible.
|
| xcorr_kernel_edsp PROC
|
| +xcorr_kernel_edsp_start
|
| ; input:
|
| ; r3 = int len
|
| ; r4 = opus_val16 *_x (must be 32-bit aligned)
|
| @@ -416,7 +418,7 @@ celt_pitch_xcorr_edsp_process4
|
| MOV r7, #0
|
| MOV r8, #0
|
| MOV r9, #0
|
| - BL xcorr_kernel_edsp ; xcorr_kernel_edsp(_x, _y+i, xcorr+i, len)
|
| + BL xcorr_kernel_edsp_start ; xcorr_kernel_edsp(_x, _y+i, xcorr+i, len)
|
| ; maxcorr = max(maxcorr, sum0, sum1, sum2, sum3)
|
| CMP r0, r6
|
| ; _y+=4
|
|
|