source/row_neon.cc - Issue 1535833003: avx2 interpolate use 8 bit

Keyboard Shortcuts

	File
u :	up to issue
j / k :	jump to file after / before current file
J / K :	jump to next file with a comment after / before current file
	Side-by-side diff
i :	toggle intra-line diffs
e :	expand all comments
c :	collapse all comments
s :	toggle showing all comments
n / p :	next / previous diff chunk or comment
N / P :	next / previous comment
<Up> / <Down> :	next / previous line

	Issue
u :	up to list of issues
j / k :	jump to patch after / before current patch
o / <Enter> :	open current patch in side-by-side view
i :	open current patch in unified diff view

	Issue List
j / k :	jump to issue after / before current issue
o / <Enter> :	open current issue

Unified Diff: source/row_neon.cc

Issue 1535833003: avx2 interpolate use 8 bit (Closed) Base URL: https://chromium.googlesource.com/libyuv/libyuv@master

Patch Set: gcc version of interpolate Created 5 years ago

Use n/p to move between diff chunks; N/P to move between comments. Draft comments are only viewable by you.

Jump to:

Index: source/row_neon.cc

diff --git a/source/row_neon.cc b/source/row_neon.cc

index 2522d501ae3ffc36836db7796cf6284cccd35929..5b4ff3b5a889977e031a78f593daed9e59721ff3 100644

--- a/source/row_neon.cc

+++ b/source/row_neon.cc

@@ -2259,16 +2259,16 @@ void RAWToYRow_NEON(const uint8* src_raw, uint8* dst_y, int width) {

void InterpolateRow_NEON(uint8* dst_ptr,

const uint8* src_ptr, ptrdiff_t src_stride,

int dst_width, int source_y_fraction) {

- int y1_fraction = source_y_fraction >> 1;

+ int y1_fraction = source_y_fraction;

asm volatile (

"cmp %4, #0 \n"

"beq 100f \n"

"add %2, %1 \n"

- "cmp %4, #64 \n"

+ "cmp %4, #128 \n"

"beq 50f \n"

"vdup.8 d5, %4 \n"

- "rsb %4, #128 \n"

+ "rsb %4, #256 \n"

"vdup.8 d4, %4 \n"

// General purpose row blend.

"1: \n"

@@ -2281,8 +2281,8 @@ void InterpolateRow_NEON(uint8* dst_ptr,

"vmull.u8 q14, d1, d4 \n"

"vmlal.u8 q13, d2, d5 \n"

"vmlal.u8 q14, d3, d5 \n"

- "vrshrn.u16 d0, q13, #7 \n"

- "vrshrn.u16 d1, q14, #7 \n"

+ "vrshrn.u16 d0, q13, #8 \n"

+ "vrshrn.u16 d1, q14, #8 \n"

MEMACCESS(0)

"vst1.8 {q0}, [%0]! \n"

"bgt 1b \n"

« no previous file with comments | « source/row_gcc.cc ('k') | source/row_neon64.cc » ('j') | no next file with comments »