source/libvpx/vp9/encoder/x86/vp9_dct_sse2.c - Issue 1162573005: libvpx: Pull from upstream

Unified Diff: source/libvpx/vp9/encoder/x86/vp9_dct_sse2.c

Issue 1162573005: libvpx: Pull from upstream (Closed) Base URL: https://chromium.googlesource.com/chromium/deps/libvpx.git@master

Patch Set: Created 5 years, 7 months ago

Use n/p to move between diff chunks; N/P to move between comments. Draft comments are only viewable by you.

Jump to:

View side-by-side diff with in-line comments

Download patch

Index: source/libvpx/vp9/encoder/x86/vp9_dct_sse2.c

diff --git a/source/libvpx/vp9/encoder/x86/vp9_dct_sse2.c b/source/libvpx/vp9/encoder/x86/vp9_dct_sse2.c

index 564b7955e5b9b54c2c803e653b234351bd642a3a..cff4fcbdce0a6ba61229495594da70042ccfc0ac 100644

--- a/source/libvpx/vp9/encoder/x86/vp9_dct_sse2.c

+++ b/source/libvpx/vp9/encoder/x86/vp9_dct_sse2.c

@@ -10,6 +10,8 @@

#include <assert.h>

#include <emmintrin.h> // SSE2

+#include "./vp9_rtcd.h"

#include "vp9/common/vp9_idct.h" // for cospi constants

#include "vp9/encoder/vp9_dct.h"

#include "vp9/encoder/x86/vp9_dct_sse2.h"

@@ -96,7 +98,7 @@ static INLINE void transpose_4x4(__m128i *res) {

res[3] = _mm_unpackhi_epi64(res[2], res[2]);

}

-void fdct4_sse2(__m128i *in) {

+static void fdct4_sse2(__m128i *in) {

const __m128i k__cospi_p16_p16 = _mm_set1_epi16((int16_t)cospi_16_64);

const __m128i k__cospi_p16_m16 = pair_set_epi16(cospi_16_64, -cospi_16_64);

const __m128i k__cospi_p08_p24 = pair_set_epi16(cospi_8_64, cospi_24_64);

@@ -129,7 +131,7 @@ void fdct4_sse2(__m128i *in) {

transpose_4x4(in);

}

-void fadst4_sse2(__m128i *in) {

+static void fadst4_sse2(__m128i *in) {

const __m128i k__sinpi_p01_p02 = pair_set_epi16(sinpi_1_9, sinpi_2_9);

const __m128i k__sinpi_p04_m01 = pair_set_epi16(sinpi_4_9, -sinpi_1_9);

const __m128i k__sinpi_p03_p04 = pair_set_epi16(sinpi_3_9, sinpi_4_9);

@@ -831,7 +833,7 @@ static INLINE void array_transpose_8x8(__m128i *in, __m128i *res) {

// 07 17 27 37 47 57 67 77

}

-void fdct8_sse2(__m128i *in) {

+static void fdct8_sse2(__m128i *in) {

// constants

const __m128i k__cospi_p16_p16 = _mm_set1_epi16((int16_t)cospi_16_64);

const __m128i k__cospi_p16_m16 = pair_set_epi16(cospi_16_64, -cospi_16_64);

@@ -971,7 +973,7 @@ void fdct8_sse2(__m128i *in) {

array_transpose_8x8(in, in);

}

-void fadst8_sse2(__m128i *in) {

+static void fadst8_sse2(__m128i *in) {

// Constants

const __m128i k__cospi_p02_p30 = pair_set_epi16(cospi_2_64, cospi_30_64);

const __m128i k__cospi_p30_m02 = pair_set_epi16(cospi_30_64, -cospi_2_64);

@@ -1353,7 +1355,7 @@ static INLINE void right_shift_16x16(__m128i *res0, __m128i *res1) {

right_shift_8x8(res1 + 8, 2);

}

-void fdct16_8col(__m128i *in) {

+static void fdct16_8col(__m128i *in) {

// perform 16x16 1-D DCT for 8 columns

__m128i i[8], s[8], p[8], t[8], u[16], v[16];

const __m128i k__cospi_p16_p16 = _mm_set1_epi16((int16_t)cospi_16_64);

@@ -1675,7 +1677,7 @@ void fdct16_8col(__m128i *in) {

in[15] = _mm_packs_epi32(v[14], v[15]);

}

-void fadst16_8col(__m128i *in) {

+static void fadst16_8col(__m128i *in) {

// perform 16x16 1-D ADST for 8 columns

__m128i s[16], x[16], u[32], v[32];

const __m128i k__cospi_p01_p31 = pair_set_epi16(cospi_1_64, cospi_31_64);

@@ -2145,13 +2147,13 @@ void fadst16_8col(__m128i *in) {

in[15] = _mm_sub_epi16(kZero, s[1]);

}

-void fdct16_sse2(__m128i *in0, __m128i *in1) {

+static void fdct16_sse2(__m128i *in0, __m128i *in1) {

fdct16_8col(in0);

fdct16_8col(in1);

array_transpose_16x16(in0, in1);

}

-void fadst16_sse2(__m128i *in0, __m128i *in1) {

+static void fadst16_sse2(__m128i *in0, __m128i *in1) {

fadst16_8col(in0);

fadst16_8col(in1);

array_transpose_16x16(in0, in1);

@@ -2334,7 +2336,7 @@ void vp9_highbd_fht8x8_sse2(const int16_t *input, tran_low_t *output,

}

-void vp9_highbd_fht16x16_sse2(int16_t *input, tran_low_t *output,

+void vp9_highbd_fht16x16_sse2(const int16_t *input, tran_low_t *output,

int stride, int tx_type) {

if (tx_type == DCT_DCT) {

vp9_highbd_fdct16x16_sse2(input, output, stride);

@@ -2368,8 +2370,8 @@ void vp9_highbd_fht16x16_sse2(int16_t *input, tran_low_t *output,

* The DCTnxn functions are defined using the macros below. The main code for

- * them is in separate files (vp9/encoder/x86/vp9_dct_impl_sse2.c &

- * vp9/encoder/x86/vp9_dct32x32_sse2.c) which are used by both the 8 bit code

+ * them is in separate files (vp9/encoder/x86/vp9_dct_sse2_impl.h &

+ * vp9/encoder/x86/vp9_dct32x32_sse2_impl.h) which are used by both the 8 bit code

* and the high bit depth code.

@@ -2378,20 +2380,20 @@ void vp9_highbd_fht16x16_sse2(int16_t *input, tran_low_t *output,

#define FDCT4x4_2D vp9_fdct4x4_sse2

#define FDCT8x8_2D vp9_fdct8x8_sse2

#define FDCT16x16_2D vp9_fdct16x16_sse2

-#include "vp9/encoder/x86/vp9_dct_impl_sse2.c"

+#include "vp9/encoder/x86/vp9_dct_sse2_impl.h"

#undef FDCT4x4_2D

#undef FDCT8x8_2D

#undef FDCT16x16_2D

#define FDCT32x32_2D vp9_fdct32x32_rd_sse2

#define FDCT32x32_HIGH_PRECISION 0

-#include "vp9/encoder/x86/vp9_dct32x32_sse2.c"

+#include "vp9/encoder/x86/vp9_dct32x32_sse2_impl.h"

#undef FDCT32x32_2D

#undef FDCT32x32_HIGH_PRECISION

#define FDCT32x32_2D vp9_fdct32x32_sse2

#define FDCT32x32_HIGH_PRECISION 1

-#include "vp9/encoder/x86/vp9_dct32x32_sse2.c" // NOLINT

+#include "vp9/encoder/x86/vp9_dct32x32_sse2_impl.h" // NOLINT

#undef FDCT32x32_2D

#undef FDCT32x32_HIGH_PRECISION

@@ -2405,20 +2407,20 @@ void vp9_highbd_fht16x16_sse2(int16_t *input, tran_low_t *output,

#define FDCT4x4_2D vp9_highbd_fdct4x4_sse2

#define FDCT8x8_2D vp9_highbd_fdct8x8_sse2

#define FDCT16x16_2D vp9_highbd_fdct16x16_sse2

-#include "vp9/encoder/x86/vp9_dct_impl_sse2.c" // NOLINT

+#include "vp9/encoder/x86/vp9_dct_sse2_impl.h" // NOLINT

#undef FDCT4x4_2D

#undef FDCT8x8_2D

#undef FDCT16x16_2D

#define FDCT32x32_2D vp9_highbd_fdct32x32_rd_sse2

#define FDCT32x32_HIGH_PRECISION 0

-#include "vp9/encoder/x86/vp9_dct32x32_sse2.c" // NOLINT

+#include "vp9/encoder/x86/vp9_dct32x32_sse2_impl.h" // NOLINT

#undef FDCT32x32_2D

#undef FDCT32x32_HIGH_PRECISION

#define FDCT32x32_2D vp9_highbd_fdct32x32_sse2

#define FDCT32x32_HIGH_PRECISION 1

-#include "vp9/encoder/x86/vp9_dct32x32_sse2.c" // NOLINT

+#include "vp9/encoder/x86/vp9_dct32x32_sse2_impl.h" // NOLINT

#undef FDCT32x32_2D

#undef FDCT32x32_HIGH_PRECISION

« no previous file with comments | « source/libvpx/vp9/encoder/x86/vp9_dct_impl_sse2.c ('k') | source/libvpx/vp9/encoder/x86/vp9_dct_sse2_impl.h » ('j') | no next file with comments »