OLD | NEW |
1 /* | 1 /* |
2 * Copyright (c) 2014 The WebM project authors. All Rights Reserved. | 2 * Copyright (c) 2014 The WebM project authors. All Rights Reserved. |
3 * | 3 * |
4 * Use of this source code is governed by a BSD-style license | 4 * Use of this source code is governed by a BSD-style license |
5 * that can be found in the LICENSE file in the root of the source | 5 * that can be found in the LICENSE file in the root of the source |
6 * tree. An additional intellectual property rights grant can be found | 6 * tree. An additional intellectual property rights grant can be found |
7 * in the file PATENTS. All contributing project authors may | 7 * in the file PATENTS. All contributing project authors may |
8 * be found in the AUTHORS file in the root of the source tree. | 8 * be found in the AUTHORS file in the root of the source tree. |
9 */ | 9 */ |
10 | 10 |
11 #include <arm_neon.h> | 11 #include <arm_neon.h> |
12 | 12 |
13 #include "vpx_dsp/inv_txfm.h" | 13 #include "vpx_dsp/inv_txfm.h" |
14 #include "vpx_ports/mem.h" | 14 #include "vpx_ports/mem.h" |
15 | 15 |
16 void vp9_idct16x16_1_add_neon( | 16 void vpx_idct16x16_1_add_neon( |
17 int16_t *input, | 17 int16_t *input, |
18 uint8_t *dest, | 18 uint8_t *dest, |
19 int dest_stride) { | 19 int dest_stride) { |
20 uint8x8_t d2u8, d3u8, d30u8, d31u8; | 20 uint8x8_t d2u8, d3u8, d30u8, d31u8; |
21 uint64x1_t d2u64, d3u64, d4u64, d5u64; | 21 uint64x1_t d2u64, d3u64, d4u64, d5u64; |
22 uint16x8_t q0u16, q9u16, q10u16, q11u16, q12u16; | 22 uint16x8_t q0u16, q9u16, q10u16, q11u16, q12u16; |
23 int16x8_t q0s16; | 23 int16x8_t q0s16; |
24 uint8_t *d1, *d2; | 24 uint8_t *d1, *d2; |
25 int16_t i, j, a1, cospi_16_64 = 11585; | 25 int16_t i, j, a1, cospi_16_64 = 11585; |
26 int16_t out = dct_const_round_shift(input[0] * cospi_16_64); | 26 int16_t out = dct_const_round_shift(input[0] * cospi_16_64); |
(...skipping 25 matching lines...) Expand all Loading... |
52 vst1_u64((uint64_t *)d2, vreinterpret_u64_u8(d2u8)); | 52 vst1_u64((uint64_t *)d2, vreinterpret_u64_u8(d2u8)); |
53 vst1_u64((uint64_t *)(d2 + 8), vreinterpret_u64_u8(d3u8)); | 53 vst1_u64((uint64_t *)(d2 + 8), vreinterpret_u64_u8(d3u8)); |
54 d2 += dest_stride; | 54 d2 += dest_stride; |
55 vst1_u64((uint64_t *)d2, vreinterpret_u64_u8(d30u8)); | 55 vst1_u64((uint64_t *)d2, vreinterpret_u64_u8(d30u8)); |
56 vst1_u64((uint64_t *)(d2 + 8), vreinterpret_u64_u8(d31u8)); | 56 vst1_u64((uint64_t *)(d2 + 8), vreinterpret_u64_u8(d31u8)); |
57 d2 += dest_stride; | 57 d2 += dest_stride; |
58 } | 58 } |
59 } | 59 } |
60 return; | 60 return; |
61 } | 61 } |
OLD | NEW |