media/base/sinc_resampler.cc - Issue 18566009: Optimize loop condition for SincResampler.

Unified Diff: media/base/sinc_resampler.cc

Issue 18566009: Optimize loop condition for SincResampler. (Closed) Base URL: svn://svn.chromium.org/chrome/trunk/src

Patch Set: Comments. const! Created 7 years, 5 months ago

Use n/p to move between diff chunks; N/P to move between comments. Draft comments are only viewable by you.

Jump to:

View side-by-side diff with in-line comments

Download patch

Index: media/base/sinc_resampler.cc

diff --git a/media/base/sinc_resampler.cc b/media/base/sinc_resampler.cc

index 1df8d4d08f894201a823c15c2066ca3ad43904ec..a2918c3f0d2e590c2eedc48ed29aa92a3e015343 100644

--- a/media/base/sinc_resampler.cc

+++ b/media/base/sinc_resampler.cc

@@ -138,7 +138,7 @@ void SincResampler::InitializeCPUSpecificFeatures() {}

#endif

SincResampler::SincResampler(double io_sample_rate_ratio,

- size_t request_frames,

+ int request_frames,

const ReadCB& read_cb)

: io_sample_rate_ratio_(io_sample_rate_ratio),

read_cb_(read_cb),

@@ -155,8 +155,9 @@ SincResampler::SincResampler(double io_sample_rate_ratio,

base::AlignedAlloc(sizeof(float) * input_buffer_size_, 16))),

r1_(input_buffer_.get()),

r2_(input_buffer_.get() + kKernelSize / 2) {

+ CHECK_GT(request_frames_, 0);

Flush();

- CHECK_GT(block_size_, static_cast<size_t>(kKernelSize))

+ CHECK_GT(block_size_, kKernelSize)

<< "block_size must be greater than kKernelSize!";

memset(kernel_storage_.get(), 0,

@@ -255,14 +256,25 @@ void SincResampler::Resample(int frames, float* destination) {

int remaining_frames = frames;

// Step (1) -- Prime the input buffer at the start of the input stream.

- if (!buffer_primed_) {

+ if (!buffer_primed_ && remaining_frames) {

read_cb_.Run(request_frames_, r0_);

buffer_primed_ = true;

}

- // Step (2) -- Resample!

+ // Step (2) -- Resample! const what we can outside of the loop for speed. It

+ // actually has an impact on ARM performance. See inner loop comment below.

+ const double current_io_ratio = io_sample_rate_ratio_;

+ const float* const kernel_ptr = kernel_storage_.get();

while (remaining_frames) {

- while (virtual_source_idx_ < block_size_) {

+ // |i| may be negative if the last Resample() call ended on an iteration

+ // that put |virtual_source_idx_| over the limit.

+ //

+ // Note: The loop construct here can severely impact performance on ARM

+ // or when built with clang. See https://codereview.chromium.org/18566009/

+ for (int i = ceil((block_size_ - virtual_source_idx_) / current_io_ratio);

+ i > 0; --i) {

+ DCHECK_LT(virtual_source_idx_, block_size_);

// |virtual_source_idx_| lies in between two kernel offsets so figure out

// what they are.

const int source_idx = virtual_source_idx_;

@@ -274,8 +286,8 @@ void SincResampler::Resample(int frames, float* destination) {

// We'll compute "convolutions" for the two kernels which straddle

// |virtual_source_idx_|.

- const float* k1 = kernel_storage_.get() + offset_idx * kKernelSize;

- const float* k2 = k1 + kKernelSize;

+ const float* const k1 = kernel_ptr + offset_idx * kKernelSize;

+ const float* const k2 = k1 + kKernelSize;

// Ensure |k1|, |k2| are 16-byte aligned for SIMD usage. Should always be

// true so long as kKernelSize is a multiple of 16.

@@ -283,7 +295,7 @@ void SincResampler::Resample(int frames, float* destination) {

DCHECK_EQ(0u, reinterpret_cast<uintptr_t>(k2) & 0x0F);

// Initialize input pointer based on quantized |virtual_source_idx_|.

- const float* input_ptr = r1_ + source_idx;

+ const float* const input_ptr = r1_ + source_idx;

// Figure out how much to weight each kernel's "convolution".

const double kernel_interpolation_factor =

@@ -292,7 +304,7 @@ void SincResampler::Resample(int frames, float* destination) {

input_ptr, k1, k2, kernel_interpolation_factor);

// Advance the virtual index.

- virtual_source_idx_ += io_sample_rate_ratio_;

+ virtual_source_idx_ += current_io_ratio;

if (!--remaining_frames)

return;

« no previous file with comments | « media/base/sinc_resampler.h ('k') | no next file » | no next file with comments »