Index: source/patched-ffmpeg-mt/libavcodec/x86/dsputil_mmx.c
===================================================================
--- source/patched-ffmpeg-mt/libavcodec/x86/dsputil_mmx.c (revision 59334)
+++ source/patched-ffmpeg-mt/libavcodec/x86/dsputil_mmx.c (working copy)
@@ -22,23 +22,18 @@
  * MMX optimization by Nick Kurshev <nickols_k@mail.ru>
  */

+#include "libavutil/cpu.h"
 #include "libavutil/x86_cpu.h"
 #include "libavcodec/dsputil.h"
 #include "libavcodec/h264dsp.h"
 #include "libavcodec/mpegvideo.h"
 #include "libavcodec/simple_idct.h"
 #include "dsputil_mmx.h"
-#include "vp3dsp_mmx.h"
-#include "vp3dsp_sse2.h"
-#include "vp6dsp_mmx.h"
-#include "vp6dsp_sse2.h"
 #include "idct_xvid.h"

 //#undef NDEBUG
 //#include <assert.h>

-int mm_flags; /* multimedia extension flags */
-
 /* pixel operations */
 DECLARE_ALIGNED(8, const uint64_t, ff_bone) = 0x0101010101010101ULL;
 DECLARE_ALIGNED(8, const uint64_t, ff_wtwo) = 0x0002000200020002ULL;
@@ -66,6 +61,7 @@
 DECLARE_ALIGNED(8,  const uint64_t, ff_pw_128) = 0x0080008000800080ULL;
 DECLARE_ALIGNED(8,  const uint64_t, ff_pw_255) = 0x00ff00ff00ff00ffULL;

+DECLARE_ALIGNED(16, const xmm_reg,  ff_pb_0  ) = {0x0000000000000000ULL, 0x0000000000000000ULL};
 DECLARE_ALIGNED(16, const xmm_reg,  ff_pb_1  ) = {0x0101010101010101ULL, 0x0101010101010101ULL};
 DECLARE_ALIGNED(16, const xmm_reg,  ff_pb_3  ) = {0x0303030303030303ULL, 0x0303030303030303ULL};
 DECLARE_ALIGNED(16, const xmm_reg,  ff_pb_4  ) = {0x0404040404040404ULL, 0x0404040404040404ULL};
@@ -74,7 +70,7 @@
 DECLARE_ALIGNED(8,  const uint64_t, ff_pb_3F ) = 0x3F3F3F3F3F3F3F3FULL;
 DECLARE_ALIGNED(16, const xmm_reg,  ff_pb_80 ) = {0x8080808080808080ULL, 0x8080808080808080ULL};
 DECLARE_ALIGNED(8,  const uint64_t, ff_pb_81 ) = 0x8181818181818181ULL;
-DECLARE_ALIGNED(8,  const uint64_t, ff_pb_A1 ) = 0xA1A1A1A1A1A1A1A1ULL;
+DECLARE_ALIGNED(16, const xmm_reg,  ff_pb_A1 ) = {0xA1A1A1A1A1A1A1A1ULL, 0xA1A1A1A1A1A1A1A1ULL};
 DECLARE_ALIGNED(16, const xmm_reg,  ff_pb_F8 ) = {0xF8F8F8F8F8F8F8F8ULL, 0xF8F8F8F8F8F8F8F8ULL};
 DECLARE_ALIGNED(8,  const uint64_t, ff_pb_FC ) = 0xFCFCFCFCFCFCFCFCULL;
 DECLARE_ALIGNED(16, const xmm_reg,  ff_pb_FE ) = {0xFEFEFEFEFEFEFEFEULL, 0xFEFEFEFEFEFEFEFEULL};
@@ -232,7 +228,7 @@
 /***********************************/
 /* standard MMX */

-void put_pixels_clamped_mmx(const DCTELEM *block, uint8_t *pixels, int line_size)
+void ff_put_pixels_clamped_mmx(const DCTELEM *block, uint8_t *pixels, int line_size)
 {
     const DCTELEM *p;
     uint8_t *pix;
@@ -308,7 +304,7 @@
     "movq %%mm3, (%0, %3, 2)            \n\t"\
     "movq %%mm4, (%0, %1)               \n\t"

-void put_signed_pixels_clamped_mmx(const DCTELEM *block, uint8_t *pixels, int line_size)
+void ff_put_signed_pixels_clamped_mmx(const DCTELEM *block, uint8_t *pixels, int line_size)
 {
     x86_reg line_skip = line_size;
     x86_reg line_skip3;
@@ -324,7 +320,7 @@
         :"memory");
 }

-void add_pixels_clamped_mmx(const DCTELEM *block, uint8_t *pixels, int line_size)
+void ff_add_pixels_clamped_mmx(const DCTELEM *block, uint8_t *pixels, int line_size)
 {
     const DCTELEM *p;
     uint8_t *pix;
@@ -732,35 +728,6 @@
     }
 }

-static inline void transpose4x4(uint8_t *dst, uint8_t *src, int dst_stride, int src_stride){
-    __asm__ volatile( //FIXME could save 1 instruction if done as 8x4 ...
-        "movd %4, %%mm0                 \n\t"
-        "movd %5, %%mm1                 \n\t"
-        "movd %6, %%mm2                 \n\t"
-        "movd %7, %%mm3                 \n\t"
-        "punpcklbw %%mm1, %%mm0         \n\t"
-        "punpcklbw %%mm3, %%mm2         \n\t"
-        "movq %%mm0, %%mm1              \n\t"
-        "punpcklwd %%mm2, %%mm0         \n\t"
-        "punpckhwd %%mm2, %%mm1         \n\t"
-        "movd %%mm0, %0                 \n\t"
-        "punpckhdq %%mm0, %%mm0         \n\t"
-        "movd %%mm0, %1                 \n\t"
-        "movd %%mm1, %2                 \n\t"
-        "punpckhdq %%mm1, %%mm1         \n\t"
-        "movd %%mm1, %3                 \n\t"
-
-        : "=m" (*(uint32_t*)(dst + 0*dst_stride)),
-          "=m" (*(uint32_t*)(dst + 1*dst_stride)),
-          "=m" (*(uint32_t*)(dst + 2*dst_stride)),
-          "=m" (*(uint32_t*)(dst + 3*dst_stride))
-        :  "m" (*(uint32_t*)(src + 0*src_stride)),
-           "m" (*(uint32_t*)(src + 1*src_stride)),
-           "m" (*(uint32_t*)(src + 2*src_stride)),
-           "m" (*(uint32_t*)(src + 3*src_stride))
-    );
-}
-
 static void h263_h_loop_filter_mmx(uint8_t *src, int stride, int qscale){
     if(CONFIG_H263_DECODER || CONFIG_H263_ENCODER) {
         const int strength= ff_h263_loop_filter_strength[qscale];
@@ -1829,9 +1796,60 @@
 PREFETCH(prefetch_3dnow, prefetch)
 #undef PREFETCH

-#include "h264dsp_mmx.c"
-#include "rv40dsp_mmx.c"
+#include "h264_qpel_mmx.c"

+void ff_put_h264_chroma_mc8_mmx_rnd   (uint8_t *dst, uint8_t *src,
+                                       int stride, int h, int x, int y);
+void ff_put_vc1_chroma_mc8_mmx_nornd  (uint8_t *dst, uint8_t *src,
+                                       int stride, int h, int x, int y);
+void ff_put_rv40_chroma_mc8_mmx       (uint8_t *dst, uint8_t *src,
+                                       int stride, int h, int x, int y);
+void ff_avg_h264_chroma_mc8_mmx2_rnd  (uint8_t *dst, uint8_t *src,
+                                       int stride, int h, int x, int y);
+void ff_avg_vc1_chroma_mc8_mmx2_nornd (uint8_t *dst, uint8_t *src,
+                                       int stride, int h, int x, int y);
+void ff_avg_rv40_chroma_mc8_mmx2      (uint8_t *dst, uint8_t *src,
+                                       int stride, int h, int x, int y);
+void ff_avg_h264_chroma_mc8_3dnow_rnd (uint8_t *dst, uint8_t *src,
+                                       int stride, int h, int x, int y);
+void ff_avg_vc1_chroma_mc8_3dnow_nornd(uint8_t *dst, uint8_t *src,
+                                       int stride, int h, int x, int y);
+void ff_avg_rv40_chroma_mc8_3dnow     (uint8_t *dst, uint8_t *src,
+                                       int stride, int h, int x, int y);
+
+void ff_put_h264_chroma_mc4_mmx       (uint8_t *dst, uint8_t *src,
+                                       int stride, int h, int x, int y);
+void ff_put_rv40_chroma_mc4_mmx       (uint8_t *dst, uint8_t *src,
+                                       int stride, int h, int x, int y);
+void ff_avg_h264_chroma_mc4_mmx2      (uint8_t *dst, uint8_t *src,
+                                       int stride, int h, int x, int y);
+void ff_avg_rv40_chroma_mc4_mmx2      (uint8_t *dst, uint8_t *src,
+                                       int stride, int h, int x, int y);
+void ff_avg_h264_chroma_mc4_3dnow     (uint8_t *dst, uint8_t *src,
+                                       int stride, int h, int x, int y);
+void ff_avg_rv40_chroma_mc4_3dnow     (uint8_t *dst, uint8_t *src,
+                                       int stride, int h, int x, int y);
+
+void ff_put_h264_chroma_mc2_mmx2      (uint8_t *dst, uint8_t *src,
+                                       int stride, int h, int x, int y);
+void ff_avg_h264_chroma_mc2_mmx2      (uint8_t *dst, uint8_t *src,
+                                       int stride, int h, int x, int y);
+
+void ff_put_h264_chroma_mc8_ssse3_rnd (uint8_t *dst, uint8_t *src,
+                                       int stride, int h, int x, int y);
+void ff_put_vc1_chroma_mc8_ssse3_nornd(uint8_t *dst, uint8_t *src,
+                                       int stride, int h, int x, int y);
+void ff_put_h264_chroma_mc4_ssse3     (uint8_t *dst, uint8_t *src,
+                                       int stride, int h, int x, int y);
+
+void ff_avg_h264_chroma_mc8_ssse3_rnd (uint8_t *dst, uint8_t *src,
+                                       int stride, int h, int x, int y);
+void ff_avg_vc1_chroma_mc8_ssse3_nornd(uint8_t *dst, uint8_t *src,
+                                       int stride, int h, int x, int y);
+void ff_avg_h264_chroma_mc4_ssse3     (uint8_t *dst, uint8_t *src,
+                                       int stride, int h, int x, int y);
+
+
 /* CAVS specific */
 void ff_put_cavs_qpel8_mc00_mmx2(uint8_t *dst, uint8_t *src, int stride) {
     put_pixels8_mmx(dst, src, stride, 8);
@@ -1860,43 +1878,43 @@
 static void ff_libmpeg2mmx_idct_put(uint8_t *dest, int line_size, DCTELEM *block)
 {
     ff_mmx_idct (block);
-    put_pixels_clamped_mmx(block, dest, line_size);
+    ff_put_pixels_clamped_mmx(block, dest, line_size);
 }
 static void ff_libmpeg2mmx_idct_add(uint8_t *dest, int line_size, DCTELEM *block)
 {
     ff_mmx_idct (block);
-    add_pixels_clamped_mmx(block, dest, line_size);
+    ff_add_pixels_clamped_mmx(block, dest, line_size);
 }
 static void ff_libmpeg2mmx2_idct_put(uint8_t *dest, int line_size, DCTELEM *block)
 {
     ff_mmxext_idct (block);
-    put_pixels_clamped_mmx(block, dest, line_size);
+    ff_put_pixels_clamped_mmx(block, dest, line_size);
 }
 static void ff_libmpeg2mmx2_idct_add(uint8_t *dest, int line_size, DCTELEM *block)
 {
     ff_mmxext_idct (block);
-    add_pixels_clamped_mmx(block, dest, line_size);
+    ff_add_pixels_clamped_mmx(block, dest, line_size);
 }
 #endif
 static void ff_idct_xvid_mmx_put(uint8_t *dest, int line_size, DCTELEM *block)
 {
     ff_idct_xvid_mmx (block);
-    put_pixels_clamped_mmx(block, dest, line_size);
+    ff_put_pixels_clamped_mmx(block, dest, line_size);
 }
 static void ff_idct_xvid_mmx_add(uint8_t *dest, int line_size, DCTELEM *block)
 {
     ff_idct_xvid_mmx (block);
-    add_pixels_clamped_mmx(block, dest, line_size);
+    ff_add_pixels_clamped_mmx(block, dest, line_size);
 }
 static void ff_idct_xvid_mmx2_put(uint8_t *dest, int line_size, DCTELEM *block)
 {
     ff_idct_xvid_mmx2 (block);
-    put_pixels_clamped_mmx(block, dest, line_size);
+    ff_put_pixels_clamped_mmx(block, dest, line_size);
 }
 static void ff_idct_xvid_mmx2_add(uint8_t *dest, int line_size, DCTELEM *block)
 {
     ff_idct_xvid_mmx2 (block);
-    add_pixels_clamped_mmx(block, dest, line_size);
+    ff_add_pixels_clamped_mmx(block, dest, line_size);
 }

 static void vorbis_inverse_coupling_3dnow(float *mag, float *ang, int blocksize)
@@ -2385,6 +2403,19 @@
     );
 }

+void ff_vp3_idct_mmx(int16_t *input_data);
+void ff_vp3_idct_put_mmx(uint8_t *dest, int line_size, DCTELEM *block);
+void ff_vp3_idct_add_mmx(uint8_t *dest, int line_size, DCTELEM *block);
+
+void ff_vp3_idct_dc_add_mmx2(uint8_t *dest, int line_size, const DCTELEM *block);
+
+void ff_vp3_v_loop_filter_mmx2(uint8_t *src, int stride, int *bounding_values);
+void ff_vp3_h_loop_filter_mmx2(uint8_t *src, int stride, int *bounding_values);
+
+void ff_vp3_idct_sse2(int16_t *input_data);
+void ff_vp3_idct_put_sse2(uint8_t *dest, int line_size, DCTELEM *block);
+void ff_vp3_idct_add_sse2(uint8_t *dest, int line_size, DCTELEM *block);
+
 void ff_float_to_int16_interleave6_sse(int16_t *dst, const float **src, int len);
 void ff_float_to_int16_interleave6_3dnow(int16_t *dst, const float **src, int len);
 void ff_float_to_int16_interleave6_3dn2(int16_t *dst, const float **src, int len);
@@ -2396,20 +2427,8 @@
 void ff_add_hfyu_median_prediction_mmx2(uint8_t *dst, const uint8_t *top, const uint8_t *diff, int w, int *left, int *left_top);
 int  ff_add_hfyu_left_prediction_ssse3(uint8_t *dst, const uint8_t *src, int w, int left);
 int  ff_add_hfyu_left_prediction_sse4(uint8_t *dst, const uint8_t *src, int w, int left);
-void ff_x264_deblock_v_luma_sse2(uint8_t *pix, int stride, int alpha, int beta, int8_t *tc0);
-void ff_x264_deblock_h_luma_sse2(uint8_t *pix, int stride, int alpha, int beta, int8_t *tc0);
-void ff_x264_deblock_h_luma_intra_mmxext(uint8_t *pix, int stride, int alpha, int beta);
-void ff_x264_deblock_v_luma_intra_sse2(uint8_t *pix, int stride, int alpha, int beta);
-void ff_x264_deblock_h_luma_intra_sse2(uint8_t *pix, int stride, int alpha, int beta);

-#if HAVE_YASM && ARCH_X86_32
-void ff_x264_deblock_v8_luma_intra_mmxext(uint8_t *pix, int stride, int alpha, int beta);
-static void ff_x264_deblock_v_luma_intra_mmxext(uint8_t *pix, int stride, int alpha, int beta)
-{
-    ff_x264_deblock_v8_luma_intra_mmxext(pix+0, stride, alpha, beta);
-    ff_x264_deblock_v8_luma_intra_mmxext(pix+8, stride, alpha, beta);
-}
-#elif !HAVE_YASM
+#if !HAVE_YASM
 #define ff_float_to_int16_interleave6_sse(a,b,c)   float_to_int16_interleave_misc_sse(a,b,c,6)
 #define ff_float_to_int16_interleave6_3dnow(a,b,c) float_to_int16_interleave_misc_3dnow(a,b,c,6)
 #define ff_float_to_int16_interleave6_3dn2(a,b,c)  float_to_int16_interleave_misc_3dnow(a,b,c,6)
@@ -2509,10 +2528,10 @@

 void dsputil_init_mmx(DSPContext* c, AVCodecContext *avctx)
 {
-    mm_flags = mm_support();
+    int mm_flags = av_get_cpu_flags();

     if (avctx->dsp_mask) {
-        if (avctx->dsp_mask & FF_MM_FORCE)
+        if (avctx->dsp_mask & AV_CPU_FLAG_FORCE)
             mm_flags |= (avctx->dsp_mask & 0xffff);
         else
             mm_flags &= ~(avctx->dsp_mask & 0xffff);
@@ -2520,20 +2539,20 @@

 #if 0
     av_log(avctx, AV_LOG_INFO, "libavcodec: CPU flags:");
-    if (mm_flags & FF_MM_MMX)
+    if (mm_flags & AV_CPU_FLAG_MMX)
         av_log(avctx, AV_LOG_INFO, " mmx");
-    if (mm_flags & FF_MM_MMX2)
+    if (mm_flags & AV_CPU_FLAG_MMX2)
         av_log(avctx, AV_LOG_INFO, " mmx2");
-    if (mm_flags & FF_MM_3DNOW)
+    if (mm_flags & AV_CPU_FLAG_3DNOW)
         av_log(avctx, AV_LOG_INFO, " 3dnow");
-    if (mm_flags & FF_MM_SSE)
+    if (mm_flags & AV_CPU_FLAG_SSE)
         av_log(avctx, AV_LOG_INFO, " sse");
-    if (mm_flags & FF_MM_SSE2)
+    if (mm_flags & AV_CPU_FLAG_SSE2)
         av_log(avctx, AV_LOG_INFO, " sse2");
     av_log(avctx, AV_LOG_INFO, "\n");
 #endif

-    if (mm_flags & FF_MM_MMX) {
+    if (mm_flags & AV_CPU_FLAG_MMX) {
         const int idct_algo= avctx->idct_algo;

         if(avctx->lowres==0){
@@ -2544,7 +2563,7 @@
                 c->idct_permutation_type= FF_SIMPLE_IDCT_PERM;
 #if CONFIG_GPL
             }else if(idct_algo==FF_IDCT_LIBMPEG2MMX){
-                if(mm_flags & FF_MM_MMX2){
+                if(mm_flags & AV_CPU_FLAG_MMX2){
                     c->idct_put= ff_libmpeg2mmx2_idct_put;
                     c->idct_add= ff_libmpeg2mmx2_idct_add;
                     c->idct    = ff_mmxext_idct;
@@ -2556,8 +2575,8 @@
                 c->idct_permutation_type= FF_LIBMPEG2_IDCT_PERM;
 #endif
             }else if((CONFIG_VP3_DECODER || CONFIG_VP5_DECODER || CONFIG_VP6_DECODER) &&
-                     idct_algo==FF_IDCT_VP3){
-                if(mm_flags & FF_MM_SSE2){
+                     idct_algo==FF_IDCT_VP3 && HAVE_YASM){
+                if(mm_flags & AV_CPU_FLAG_SSE2){
                     c->idct_put= ff_vp3_idct_put_sse2;
                     c->idct_add= ff_vp3_idct_add_sse2;
                     c->idct    = ff_vp3_idct_sse2;
@@ -2571,12 +2590,12 @@
             }else if(idct_algo==FF_IDCT_CAVS){
                 c->idct_permutation_type= FF_TRANSPOSE_IDCT_PERM;
             }else if(idct_algo==FF_IDCT_XVIDMMX){
-                if(mm_flags & FF_MM_SSE2){
+                if(mm_flags & AV_CPU_FLAG_SSE2){
                     c->idct_put= ff_idct_xvid_sse2_put;
                     c->idct_add= ff_idct_xvid_sse2_add;
                     c->idct    = ff_idct_xvid_sse2;
                     c->idct_permutation_type= FF_SSE2_IDCT_PERM;
-                }else if(mm_flags & FF_MM_MMX2){
+                }else if(mm_flags & AV_CPU_FLAG_MMX2){
                     c->idct_put= ff_idct_xvid_mmx2_put;
                     c->idct_add= ff_idct_xvid_mmx2_add;
                     c->idct    = ff_idct_xvid_mmx2;
@@ -2588,12 +2607,12 @@
             }
         }

-        c->put_pixels_clamped = put_pixels_clamped_mmx;
-        c->put_signed_pixels_clamped = put_signed_pixels_clamped_mmx;
-        c->add_pixels_clamped = add_pixels_clamped_mmx;
+        c->put_pixels_clamped = ff_put_pixels_clamped_mmx;
+        c->put_signed_pixels_clamped = ff_put_signed_pixels_clamped_mmx;
+        c->add_pixels_clamped = ff_add_pixels_clamped_mmx;
         c->clear_block  = clear_block_mmx;
         c->clear_blocks = clear_blocks_mmx;
-        if ((mm_flags & FF_MM_SSE) &&
+        if ((mm_flags & AV_CPU_FLAG_SSE) &&
             !(CONFIG_MPEG_XVMC_DECODER && avctx->xvmc_acceleration > 1)){
             /* XvMCCreateBlocks() may not allocate 16-byte aligned blocks */
             c->clear_block  = clear_block_sse;
@@ -2626,18 +2645,17 @@
             c->h263_v_loop_filter= h263_v_loop_filter_mmx;
             c->h263_h_loop_filter= h263_h_loop_filter_mmx;
         }
-        c->put_h264_chroma_pixels_tab[0]= put_h264_chroma_mc8_mmx_rnd;
-        c->put_h264_chroma_pixels_tab[1]= put_h264_chroma_mc4_mmx;
-        c->put_no_rnd_vc1_chroma_pixels_tab[0]= put_vc1_chroma_mc8_mmx_nornd;

-        c->put_rv40_chroma_pixels_tab[0]= put_rv40_chroma_mc8_mmx;
-        c->put_rv40_chroma_pixels_tab[1]= put_rv40_chroma_mc4_mmx;
+#if HAVE_YASM
+        c->put_h264_chroma_pixels_tab[0]= ff_put_h264_chroma_mc8_mmx_rnd;
+        c->put_h264_chroma_pixels_tab[1]= ff_put_h264_chroma_mc4_mmx;
+        c->put_no_rnd_vc1_chroma_pixels_tab[0]= ff_put_vc1_chroma_mc8_mmx_nornd;

-        if (CONFIG_VP6_DECODER) {
-            c->vp6_filter_diag4 = ff_vp6_filter_diag4_mmx;
-        }
+        c->put_rv40_chroma_pixels_tab[0]= ff_put_rv40_chroma_mc8_mmx;
+        c->put_rv40_chroma_pixels_tab[1]= ff_put_rv40_chroma_mc4_mmx;
+#endif

-        if (mm_flags & FF_MM_MMX2) {
+        if (mm_flags & AV_CPU_FLAG_MMX2) {
             c->prefetch = prefetch_mmx2;

             c->put_pixels_tab[0][1] = put_pixels16_x2_mmx2;
@@ -2662,12 +2680,12 @@
                 c->avg_pixels_tab[0][3] = avg_pixels16_xy2_mmx2;
                 c->avg_pixels_tab[1][3] = avg_pixels8_xy2_mmx2;

-                if (CONFIG_VP3_DECODER) {
+                if (CONFIG_VP3_DECODER && HAVE_YASM) {
                     c->vp3_v_loop_filter= ff_vp3_v_loop_filter_mmx2;
                     c->vp3_h_loop_filter= ff_vp3_h_loop_filter_mmx2;
                 }
             }
-            if (CONFIG_VP3_DECODER) {
+            if (CONFIG_VP3_DECODER && HAVE_YASM) {
                 c->vp3_idct_dc_add = ff_vp3_idct_dc_add_mmx2;
             }

@@ -2714,21 +2732,21 @@
             SET_QPEL_FUNCS(avg_2tap_qpel, 0, 16, mmx2);
             SET_QPEL_FUNCS(avg_2tap_qpel, 1, 8, mmx2);

-            c->avg_rv40_chroma_pixels_tab[0]= avg_rv40_chroma_mc8_mmx2;
-            c->avg_rv40_chroma_pixels_tab[1]= avg_rv40_chroma_mc4_mmx2;
+#if HAVE_YASM
+            c->avg_rv40_chroma_pixels_tab[0]= ff_avg_rv40_chroma_mc8_mmx2;
+            c->avg_rv40_chroma_pixels_tab[1]= ff_avg_rv40_chroma_mc4_mmx2;

-            c->avg_no_rnd_vc1_chroma_pixels_tab[0]= avg_vc1_chroma_mc8_mmx2_nornd;
+            c->avg_no_rnd_vc1_chroma_pixels_tab[0]= ff_avg_vc1_chroma_mc8_mmx2_nornd;

-            c->avg_h264_chroma_pixels_tab[0]= avg_h264_chroma_mc8_mmx2_rnd;
-            c->avg_h264_chroma_pixels_tab[1]= avg_h264_chroma_mc4_mmx2;
-            c->avg_h264_chroma_pixels_tab[2]= avg_h264_chroma_mc2_mmx2;
-            c->put_h264_chroma_pixels_tab[2]= put_h264_chroma_mc2_mmx2;
+            c->avg_h264_chroma_pixels_tab[0]= ff_avg_h264_chroma_mc8_mmx2_rnd;
+            c->avg_h264_chroma_pixels_tab[1]= ff_avg_h264_chroma_mc4_mmx2;
+            c->avg_h264_chroma_pixels_tab[2]= ff_avg_h264_chroma_mc2_mmx2;
+            c->put_h264_chroma_pixels_tab[2]= ff_put_h264_chroma_mc2_mmx2;

-#if HAVE_YASM
             c->add_hfyu_median_prediction = ff_add_hfyu_median_prediction_mmx2;
 #endif
 #if HAVE_7REGS && HAVE_TEN_OPERANDS
-            if( mm_flags&FF_MM_3DNOW )
+            if( mm_flags&AV_CPU_FLAG_3DNOW )
                 c->add_hfyu_median_prediction = add_hfyu_median_prediction_cmov;
 #endif

@@ -2736,7 +2754,7 @@
                 ff_vc1dsp_init_mmx(c, avctx);

             c->add_png_paeth_prediction= add_png_paeth_prediction_mmx2;
-        } else if (mm_flags & FF_MM_3DNOW) {
+        } else if (mm_flags & AV_CPU_FLAG_3DNOW) {
             c->prefetch = prefetch_3dnow;

             c->put_pixels_tab[0][1] = put_pixels16_x2_3dnow;
@@ -2787,11 +2805,15 @@
             SET_QPEL_FUNCS(avg_2tap_qpel, 0, 16, 3dnow);
             SET_QPEL_FUNCS(avg_2tap_qpel, 1, 8, 3dnow);

-            c->avg_h264_chroma_pixels_tab[0]= avg_h264_chroma_mc8_3dnow_rnd;
-            c->avg_h264_chroma_pixels_tab[1]= avg_h264_chroma_mc4_3dnow;
+#if HAVE_YASM
+            c->avg_h264_chroma_pixels_tab[0]= ff_avg_h264_chroma_mc8_3dnow_rnd;
+            c->avg_h264_chroma_pixels_tab[1]= ff_avg_h264_chroma_mc4_3dnow;

-            c->avg_rv40_chroma_pixels_tab[0]= avg_rv40_chroma_mc8_3dnow;
-            c->avg_rv40_chroma_pixels_tab[1]= avg_rv40_chroma_mc4_3dnow;
+            c->avg_no_rnd_vc1_chroma_pixels_tab[0]= ff_avg_vc1_chroma_mc8_3dnow_nornd;
+
+            c->avg_rv40_chroma_pixels_tab[0]= ff_avg_rv40_chroma_mc8_3dnow;
+            c->avg_rv40_chroma_pixels_tab[1]= ff_avg_rv40_chroma_mc4_3dnow;
+#endif
         }


@@ -2800,13 +2822,13 @@
             c->put_h264_qpel_pixels_tab[1][x+y*4] = put_h264_qpel8_mc##x##y##_##CPU;\
             c->avg_h264_qpel_pixels_tab[0][x+y*4] = avg_h264_qpel16_mc##x##y##_##CPU;\
             c->avg_h264_qpel_pixels_tab[1][x+y*4] = avg_h264_qpel8_mc##x##y##_##CPU;
-        if((mm_flags & FF_MM_SSE2) && !(mm_flags & FF_MM_3DNOW)){
+        if((mm_flags & AV_CPU_FLAG_SSE2) && !(mm_flags & AV_CPU_FLAG_3DNOW)){
             // these functions are slower than mmx on AMD, but faster on Intel
             c->put_pixels_tab[0][0] = put_pixels16_sse2;
             c->avg_pixels_tab[0][0] = avg_pixels16_sse2;
             H264_QPEL_FUNCS(0, 0, sse2);
         }
-        if(mm_flags & FF_MM_SSE2){
+        if(mm_flags & AV_CPU_FLAG_SSE2){
             H264_QPEL_FUNCS(0, 1, sse2);
             H264_QPEL_FUNCS(0, 2, sse2);
             H264_QPEL_FUNCS(0, 3, sse2);
@@ -2819,13 +2841,9 @@
             H264_QPEL_FUNCS(3, 1, sse2);
             H264_QPEL_FUNCS(3, 2, sse2);
             H264_QPEL_FUNCS(3, 3, sse2);
-
-            if (CONFIG_VP6_DECODER) {
-                c->vp6_filter_diag4 = ff_vp6_filter_diag4_sse2;
-            }
         }
 #if HAVE_SSSE3
-        if(mm_flags & FF_MM_SSSE3){
+        if(mm_flags & AV_CPU_FLAG_SSSE3){
             H264_QPEL_FUNCS(1, 0, ssse3);
             H264_QPEL_FUNCS(1, 1, ssse3);
             H264_QPEL_FUNCS(1, 2, ssse3);
@@ -2838,22 +2856,22 @@
             H264_QPEL_FUNCS(3, 1, ssse3);
             H264_QPEL_FUNCS(3, 2, ssse3);
             H264_QPEL_FUNCS(3, 3, ssse3);
-            c->put_no_rnd_vc1_chroma_pixels_tab[0]= put_vc1_chroma_mc8_ssse3_nornd;
-            c->avg_no_rnd_vc1_chroma_pixels_tab[0]= avg_vc1_chroma_mc8_ssse3_nornd;
-            c->put_h264_chroma_pixels_tab[0]= put_h264_chroma_mc8_ssse3_rnd;
-            c->avg_h264_chroma_pixels_tab[0]= avg_h264_chroma_mc8_ssse3_rnd;
-            c->put_h264_chroma_pixels_tab[1]= put_h264_chroma_mc4_ssse3;
-            c->avg_h264_chroma_pixels_tab[1]= avg_h264_chroma_mc4_ssse3;
             c->add_png_paeth_prediction= add_png_paeth_prediction_ssse3;
 #if HAVE_YASM
+            c->put_no_rnd_vc1_chroma_pixels_tab[0]= ff_put_vc1_chroma_mc8_ssse3_nornd;
+            c->avg_no_rnd_vc1_chroma_pixels_tab[0]= ff_avg_vc1_chroma_mc8_ssse3_nornd;
+            c->put_h264_chroma_pixels_tab[0]= ff_put_h264_chroma_mc8_ssse3_rnd;
+            c->avg_h264_chroma_pixels_tab[0]= ff_avg_h264_chroma_mc8_ssse3_rnd;
+            c->put_h264_chroma_pixels_tab[1]= ff_put_h264_chroma_mc4_ssse3;
+            c->avg_h264_chroma_pixels_tab[1]= ff_avg_h264_chroma_mc4_ssse3;
             c->add_hfyu_left_prediction = ff_add_hfyu_left_prediction_ssse3;
-            if (mm_flags & FF_MM_SSE4) // not really sse4, just slow on Conroe
+            if (mm_flags & AV_CPU_FLAG_SSE4) // not really sse4, just slow on Conroe
                 c->add_hfyu_left_prediction = ff_add_hfyu_left_prediction_sse4;
 #endif
         }
 #endif

-        if(mm_flags & FF_MM_3DNOW){
+        if(mm_flags & AV_CPU_FLAG_3DNOW){
             c->vorbis_inverse_coupling = vorbis_inverse_coupling_3dnow;
             c->vector_fmul = vector_fmul_3dnow;
             if(!(avctx->flags & CODEC_FLAG_BITEXACT)){
@@ -2861,20 +2879,20 @@
                 c->float_to_int16_interleave = float_to_int16_interleave_3dnow;
             }
         }
-        if(mm_flags & FF_MM_3DNOWEXT){
+        if(mm_flags & AV_CPU_FLAG_3DNOWEXT){
             c->vector_fmul_reverse = vector_fmul_reverse_3dnow2;
             c->vector_fmul_window = vector_fmul_window_3dnow2;
             if(!(avctx->flags & CODEC_FLAG_BITEXACT)){
                 c->float_to_int16_interleave = float_to_int16_interleave_3dn2;
             }
         }
-        if(mm_flags & FF_MM_MMX2){
+        if(mm_flags & AV_CPU_FLAG_MMX2){
 #if HAVE_YASM
             c->scalarproduct_int16 = ff_scalarproduct_int16_mmx2;
             c->scalarproduct_and_madd_int16 = ff_scalarproduct_and_madd_int16_mmx2;
 #endif
         }
-        if(mm_flags & FF_MM_SSE){
+        if(mm_flags & AV_CPU_FLAG_SSE){
             c->vorbis_inverse_coupling = vorbis_inverse_coupling_sse;
             c->ac3_downmix = ac3_downmix_sse;
             c->vector_fmul = vector_fmul_sse;
@@ -2889,9 +2907,9 @@
             c->scalarproduct_float = ff_scalarproduct_float_sse;
 #endif
         }
-        if(mm_flags & FF_MM_3DNOW)
+        if(mm_flags & AV_CPU_FLAG_3DNOW)
             c->vector_fmul_add = vector_fmul_add_3dnow; // faster than sse
-        if(mm_flags & FF_MM_SSE2){
+        if(mm_flags & AV_CPU_FLAG_SSE2){
             c->int32_to_float_fmul_scalar = int32_to_float_fmul_scalar_sse2;
             c->float_to_int16 = float_to_int16_sse2;
             c->float_to_int16_interleave = float_to_int16_interleave_sse2;
@@ -2900,7 +2918,7 @@
             c->scalarproduct_and_madd_int16 = ff_scalarproduct_and_madd_int16_sse2;
 #endif
         }
-        if((mm_flags & FF_MM_SSSE3) && !(mm_flags & (FF_MM_SSE42|FF_MM_3DNOW)) && HAVE_YASM) // cachesplit
+        if((mm_flags & AV_CPU_FLAG_SSSE3) && !(mm_flags & (AV_CPU_FLAG_SSE42|AV_CPU_FLAG_3DNOW)) && HAVE_YASM) // cachesplit
             c->scalarproduct_and_madd_int16 = ff_scalarproduct_and_madd_int16_ssse3;
     }

@@ -2942,89 +2960,3 @@
     //ff_idct = just_return;
 #endif
 }
-
-#if CONFIG_H264DSP
-void ff_h264dsp_init_x86(H264DSPContext *c)
-{
-    mm_flags = mm_support();
-
-    if (mm_flags & FF_MM_MMX) {
-        c->h264_idct_dc_add=
-        c->h264_idct_add= ff_h264_idct_add_mmx;
-        c->h264_idct8_dc_add=
-        c->h264_idct8_add= ff_h264_idct8_add_mmx;
-
-        c->h264_idct_add16     = ff_h264_idct_add16_mmx;
-        c->h264_idct8_add4     = ff_h264_idct8_add4_mmx;
-        c->h264_idct_add8      = ff_h264_idct_add8_mmx;
-        c->h264_idct_add16intra= ff_h264_idct_add16intra_mmx;
-
-        if (mm_flags & FF_MM_MMX2) {
-            c->h264_idct_dc_add= ff_h264_idct_dc_add_mmx2;
-            c->h264_idct8_dc_add= ff_h264_idct8_dc_add_mmx2;
-            c->h264_idct_add16 = ff_h264_idct_add16_mmx2;
-            c->h264_idct8_add4 = ff_h264_idct8_add4_mmx2;
-            c->h264_idct_add8  = ff_h264_idct_add8_mmx2;
-            c->h264_idct_add16intra= ff_h264_idct_add16intra_mmx2;
-
-            c->h264_v_loop_filter_luma= h264_v_loop_filter_luma_mmx2;
-            c->h264_h_loop_filter_luma= h264_h_loop_filter_luma_mmx2;
-            c->h264_v_loop_filter_chroma= h264_v_loop_filter_chroma_mmx2;
-            c->h264_h_loop_filter_chroma= h264_h_loop_filter_chroma_mmx2;
-            c->h264_v_loop_filter_chroma_intra= h264_v_loop_filter_chroma_intra_mmx2;
-            c->h264_h_loop_filter_chroma_intra= h264_h_loop_filter_chroma_intra_mmx2;
-            c->h264_loop_filter_strength= h264_loop_filter_strength_mmx2;
-
-            c->weight_h264_pixels_tab[0]= ff_h264_weight_16x16_mmx2;
-            c->weight_h264_pixels_tab[1]= ff_h264_weight_16x8_mmx2;
-            c->weight_h264_pixels_tab[2]= ff_h264_weight_8x16_mmx2;
-            c->weight_h264_pixels_tab[3]= ff_h264_weight_8x8_mmx2;
-            c->weight_h264_pixels_tab[4]= ff_h264_weight_8x4_mmx2;
-            c->weight_h264_pixels_tab[5]= ff_h264_weight_4x8_mmx2;
-            c->weight_h264_pixels_tab[6]= ff_h264_weight_4x4_mmx2;
-            c->weight_h264_pixels_tab[7]= ff_h264_weight_4x2_mmx2;
-
-            c->biweight_h264_pixels_tab[0]= ff_h264_biweight_16x16_mmx2;
-            c->biweight_h264_pixels_tab[1]= ff_h264_biweight_16x8_mmx2;
-            c->biweight_h264_pixels_tab[2]= ff_h264_biweight_8x16_mmx2;
-            c->biweight_h264_pixels_tab[3]= ff_h264_biweight_8x8_mmx2;
-            c->biweight_h264_pixels_tab[4]= ff_h264_biweight_8x4_mmx2;
-            c->biweight_h264_pixels_tab[5]= ff_h264_biweight_4x8_mmx2;
-            c->biweight_h264_pixels_tab[6]= ff_h264_biweight_4x4_mmx2;
-            c->biweight_h264_pixels_tab[7]= ff_h264_biweight_4x2_mmx2;
-        }
-        if(mm_flags & FF_MM_SSE2){
-            c->h264_idct8_add = ff_h264_idct8_add_sse2;
-            c->h264_idct8_add4= ff_h264_idct8_add4_sse2;
-        }
-
-#if HAVE_YASM
-        if (mm_flags & FF_MM_MMX2){
-#if ARCH_X86_32
-            c->h264_v_loop_filter_luma_intra = ff_x264_deblock_v_luma_intra_mmxext;
-            c->h264_h_loop_filter_luma_intra = ff_x264_deblock_h_luma_intra_mmxext;
-#endif
-            if( mm_flags&FF_MM_SSE2 ){
-                c->biweight_h264_pixels_tab[0]= ff_h264_biweight_16x16_sse2;
-                c->biweight_h264_pixels_tab[3]= ff_h264_biweight_8x8_sse2;
-#if ARCH_X86_64 || !defined(__ICC) || __ICC > 1110
-                c->h264_v_loop_filter_luma = ff_x264_deblock_v_luma_sse2;
-                c->h264_h_loop_filter_luma = ff_x264_deblock_h_luma_sse2;
-                c->h264_v_loop_filter_luma_intra = ff_x264_deblock_v_luma_intra_sse2;
-                c->h264_h_loop_filter_luma_intra = ff_x264_deblock_h_luma_intra_sse2;
-#endif
-#if CONFIG_GPL
-                c->h264_idct_add16 = ff_h264_idct_add16_sse2;
-                c->h264_idct_add8  = ff_h264_idct_add8_sse2;
-                c->h264_idct_add16intra = ff_h264_idct_add16intra_sse2;
-#endif
-            }
-            if ( mm_flags&FF_MM_SSSE3 ){
-                c->biweight_h264_pixels_tab[0]= ff_h264_biweight_16x16_ssse3;
-                c->biweight_h264_pixels_tab[3]= ff_h264_biweight_8x8_ssse3;
-            }
-        }
-#endif
-    }
-}
-#endif /* CONFIG_H264DSP */