| Index: media/base/sinc_resampler.cc
|
| diff --git a/media/base/sinc_resampler.cc b/media/base/sinc_resampler.cc
|
| index 6bce67a3e7e85252240fad089711a2f769be6d14..c253b8355bfa72c5fafa5d9a5b3a2b9d9be54785 100644
|
| --- a/media/base/sinc_resampler.cc
|
| +++ b/media/base/sinc_resampler.cc
|
| @@ -2,31 +2,73 @@
|
| // Use of this source code is governed by a BSD-style license that can be
|
| // found in the LICENSE file.
|
| //
|
| -// Input buffer layout, dividing the total buffer into regions (r0_ - r5_):
|
| +// Initial input buffer layout, dividing into regions r0_ to r4_ (note: r0_, r3_
|
| +// and r4_ will move after the first load):
|
| //
|
| // |----------------|-----------------------------------------|----------------|
|
| //
|
| -// kBlockSize + kKernelSize / 2
|
| +// request_frames_
|
| // <--------------------------------------------------------->
|
| -// r0_
|
| +// r0_ (during first load)
|
| //
|
| // kKernelSize / 2 kKernelSize / 2 kKernelSize / 2 kKernelSize / 2
|
| // <---------------> <---------------> <---------------> <--------------->
|
| // r1_ r2_ r3_ r4_
|
| //
|
| -// kBlockSize
|
| -// <--------------------------------------->
|
| -// r5_
|
| +// block_size_ == r4_ - r2_
|
| +// <--------------------------------------->
|
| +//
|
| +// request_frames_
|
| +// <------------------ ... ----------------->
|
| +// r0_ (during second load)
|
| +//
|
| +// On the second request r0_ slides to the right by kKernelSize / 2 and r3_, r4_
|
| +// and block_size_ are reinitialized via step (3) in the algorithm below.
|
| +//
|
| +// These new regions remain constant until a Flush() occurs. While complicated,
|
| +// this allows us to reduce jitter by always requesting the same amount from the
|
| +// provided callback.
|
| //
|
| // The algorithm:
|
| //
|
| -// 1) Consume input frames into r0_ (r1_ is zero-initialized).
|
| -// 2) Position kernel centered at start of r0_ (r2_) and generate output frames
|
| -// until kernel is centered at start of r4_ or we've finished generating all
|
| -// the output frames.
|
| -// 3) Copy r3_ to r1_ and r4_ to r2_.
|
| -// 4) Consume input frames into r5_ (zero-pad if we run out of input).
|
| -// 5) Goto (2) until all of input is consumed.
|
| +// 1) Allocate input_buffer of size: request_frames_ + kKernelSize; this ensures
|
| +// there's enough room to read request_frames_ from the callback into region
|
| +// r0_ (which will move between the first and subsequent passes).
|
| +//
|
| +// 2) Let r1_, r2_ each represent half the kernel centered around r0_:
|
| +//
|
| +// r0_ = input_buffer_ + kKernelSize / 2
|
| +// r1_ = input_buffer_
|
| +// r2_ = r0_
|
| +//
|
| +// r0_ is always request_frames_ in size. r1_, r2_ are kKernelSize / 2 in
|
| +// size. r1_ must be zero initialized to avoid convolution with garbage (see
|
| +// step (5) for why).
|
| +//
|
| +// 3) Let r3_, r4_ each represent half the kernel right aligned with the end of
|
| +// r0_ and choose block_size_ as the distance in frames between r4_ and r2_:
|
| +//
|
| +// r3_ = r0_ + request_frames_ - kKernelSize
|
| +// r4_ = r0_ + request_frames_ - kKernelSize / 2
|
| +// block_size_ = r4_ - r2_ = request_frames_ - kKernelSize / 2
|
| +//
|
| +// 4) Consume request_frames_ frames into r0_.
|
| +//
|
| +// 5) Position kernel centered at start of r2_ and generate output frames until
|
| +// the kernel is centered at the start of r4_ or we've finished generating
|
| +// all the output frames.
|
| +//
|
| +// 6) Wrap left over data from the r3_ to r1_ and r4_ to r2_.
|
| +//
|
| +// 7) If we're on the second load, in order to avoid overwriting the frames we
|
| +// just wrapped from r4_ we need to slide r0_ to the right by the size of
|
| +// r4_, which is kKernelSize / 2:
|
| +//
|
| +// r0_ = r0_ + kKernelSize / 2 = input_buffer_ + kKernelSize
|
| +//
|
| +// r3_, r4_, and block_size_ then need to be reinitialized, so goto (3).
|
| +//
|
| +// 8) Else, if we're not on the second load, goto (4).
|
| //
|
| // Note: we're glossing over how the sub-sample handling works with
|
| // |virtual_source_idx_|, etc.
|
| @@ -64,11 +106,13 @@ static double SincScaleFactor(double io_ratio) {
|
| return sinc_scale_factor;
|
| }
|
|
|
| -SincResampler::SincResampler(double io_sample_rate_ratio, const ReadCB& read_cb)
|
| +SincResampler::SincResampler(double io_sample_rate_ratio,
|
| + size_t request_frames,
|
| + const ReadCB& read_cb)
|
| : io_sample_rate_ratio_(io_sample_rate_ratio),
|
| - virtual_source_idx_(0),
|
| - buffer_primed_(false),
|
| read_cb_(read_cb),
|
| + request_frames_(request_frames),
|
| + input_buffer_size_(request_frames_ + kKernelSize),
|
| // Create input buffers with a 16-byte alignment for SSE optimizations.
|
| kernel_storage_(static_cast<float*>(
|
| base::AlignedAlloc(sizeof(float) * kKernelStorageSize, 16))),
|
| @@ -77,36 +121,15 @@ SincResampler::SincResampler(double io_sample_rate_ratio, const ReadCB& read_cb)
|
| kernel_window_storage_(static_cast<float*>(
|
| base::AlignedAlloc(sizeof(float) * kKernelStorageSize, 16))),
|
| input_buffer_(static_cast<float*>(
|
| - base::AlignedAlloc(sizeof(float) * kBufferSize, 16))),
|
| + base::AlignedAlloc(sizeof(float) * input_buffer_size_, 16))),
|
| #if defined(ARCH_CPU_X86_FAMILY) && !defined(__SSE__)
|
| convolve_proc_(base::CPU().has_sse() ? Convolve_SSE : Convolve_C),
|
| #endif
|
| - // Setup various region pointers in the buffer (see diagram above).
|
| - r0_(input_buffer_.get() + kKernelSize / 2),
|
| r1_(input_buffer_.get()),
|
| - r2_(r0_),
|
| - r3_(r0_ + kBlockSize - kKernelSize / 2),
|
| - r4_(r0_ + kBlockSize),
|
| - r5_(r0_ + kKernelSize / 2) {
|
| - // Ensure kKernelSize is a multiple of 32 for easy SSE optimizations; causes
|
| - // r0_ and r5_ (used for input) to always be 16-byte aligned by virtue of
|
| - // input_buffer_ being 16-byte aligned.
|
| - DCHECK_EQ(kKernelSize % 32, 0) << "kKernelSize must be a multiple of 32!";
|
| - DCHECK_GT(kBlockSize, kKernelSize)
|
| - << "kBlockSize must be greater than kKernelSize!";
|
| - // Basic sanity checks to ensure buffer regions are laid out correctly:
|
| - // r0_ and r2_ should always be the same position.
|
| - DCHECK_EQ(r0_, r2_);
|
| - // r1_ at the beginning of the buffer.
|
| - DCHECK_EQ(r1_, input_buffer_.get());
|
| - // r1_ left of r2_, r2_ left of r5_ and r1_, r2_ size correct.
|
| - DCHECK_EQ(r2_ - r1_, r5_ - r2_);
|
| - // r3_ left of r4_, r5_ left of r0_ and r3_ size correct.
|
| - DCHECK_EQ(r4_ - r3_, r5_ - r0_);
|
| - // r3_, r4_ size correct and r4_ at the end of the buffer.
|
| - DCHECK_EQ(r4_ + (r4_ - r3_), r1_ + kBufferSize);
|
| - // r5_ size correct and at the end of the buffer.
|
| - DCHECK_EQ(r5_ + kBlockSize, r1_ + kBufferSize);
|
| + r2_(input_buffer_.get() + kKernelSize / 2) {
|
| + Flush();
|
| + CHECK_GT(block_size_, static_cast<size_t>(kKernelSize))
|
| + << "block_size must be greater than kKernelSize!";
|
|
|
| memset(kernel_storage_.get(), 0,
|
| sizeof(*kernel_storage_.get()) * kKernelStorageSize);
|
| @@ -114,13 +137,28 @@ SincResampler::SincResampler(double io_sample_rate_ratio, const ReadCB& read_cb)
|
| sizeof(*kernel_pre_sinc_storage_.get()) * kKernelStorageSize);
|
| memset(kernel_window_storage_.get(), 0,
|
| sizeof(*kernel_window_storage_.get()) * kKernelStorageSize);
|
| - memset(input_buffer_.get(), 0, sizeof(*input_buffer_.get()) * kBufferSize);
|
|
|
| InitializeKernel();
|
| }
|
|
|
| SincResampler::~SincResampler() {}
|
|
|
| +void SincResampler::UpdateRegions(bool second_load) {
|
| + // Setup various region pointers in the buffer (see diagram above). If we're
|
| + // on the second load we need to slide r0_ to the right by kKernelSize / 2.
|
| + r0_ = input_buffer_.get() + (second_load ? kKernelSize : kKernelSize / 2);
|
| + r3_ = r0_ + request_frames_ - kKernelSize;
|
| + r4_ = r0_ + request_frames_ - kKernelSize / 2;
|
| + block_size_ = r4_ - r2_;
|
| +
|
| + // r1_ at the beginning of the buffer.
|
| + CHECK_EQ(r1_, input_buffer_.get());
|
| + // r1_ left of r2_, r4_ left of r3_ and size correct.
|
| + CHECK_EQ(r2_ - r1_, r4_ - r3_);
|
| + // r2_ left of r3.
|
| + CHECK_LT(r2_, r3_);
|
| +}
|
| +
|
| void SincResampler::InitializeKernel() {
|
| // Blackman window parameters.
|
| static const double kAlpha = 0.16;
|
| @@ -201,30 +239,31 @@ void SincResampler::SetRatio(double io_sample_rate_ratio) {
|
| #define CONVOLVE_FUNC Convolve_C
|
| #endif
|
|
|
| -void SincResampler::Resample(float* destination, int frames) {
|
| +void SincResampler::Resample(int frames, float* destination) {
|
| int remaining_frames = frames;
|
|
|
| // Step (1) -- Prime the input buffer at the start of the input stream.
|
| if (!buffer_primed_) {
|
| - read_cb_.Run(r0_, kBlockSize + kKernelSize / 2);
|
| + read_cb_.Run(request_frames_, r0_);
|
| buffer_primed_ = true;
|
| }
|
|
|
| // Step (2) -- Resample!
|
| while (remaining_frames) {
|
| - while (virtual_source_idx_ < kBlockSize) {
|
| + while (virtual_source_idx_ < block_size_) {
|
| // |virtual_source_idx_| lies in between two kernel offsets so figure out
|
| // what they are.
|
| - int source_idx = static_cast<int>(virtual_source_idx_);
|
| - double subsample_remainder = virtual_source_idx_ - source_idx;
|
| + const int source_idx = virtual_source_idx_;
|
| + const double subsample_remainder = virtual_source_idx_ - source_idx;
|
|
|
| - double virtual_offset_idx = subsample_remainder * kKernelOffsetCount;
|
| - int offset_idx = static_cast<int>(virtual_offset_idx);
|
| + const double virtual_offset_idx =
|
| + subsample_remainder * kKernelOffsetCount;
|
| + const int offset_idx = virtual_offset_idx;
|
|
|
| // We'll compute "convolutions" for the two kernels which straddle
|
| // |virtual_source_idx_|.
|
| - float* k1 = kernel_storage_.get() + offset_idx * kKernelSize;
|
| - float* k2 = k1 + kKernelSize;
|
| + const float* k1 = kernel_storage_.get() + offset_idx * kKernelSize;
|
| + const float* k2 = k1 + kKernelSize;
|
|
|
| // Ensure |k1|, |k2| are 16-byte aligned for SIMD usage. Should always be
|
| // true so long as kKernelSize is a multiple of 16.
|
| @@ -232,10 +271,11 @@ void SincResampler::Resample(float* destination, int frames) {
|
| DCHECK_EQ(0u, reinterpret_cast<uintptr_t>(k2) & 0x0F);
|
|
|
| // Initialize input pointer based on quantized |virtual_source_idx_|.
|
| - float* input_ptr = r1_ + source_idx;
|
| + const float* input_ptr = r1_ + source_idx;
|
|
|
| // Figure out how much to weight each kernel's "convolution".
|
| - double kernel_interpolation_factor = virtual_offset_idx - offset_idx;
|
| + const double kernel_interpolation_factor =
|
| + virtual_offset_idx - offset_idx;
|
| *destination++ = CONVOLVE_FUNC(
|
| input_ptr, k1, k2, kernel_interpolation_factor);
|
|
|
| @@ -247,29 +287,33 @@ void SincResampler::Resample(float* destination, int frames) {
|
| }
|
|
|
| // Wrap back around to the start.
|
| - virtual_source_idx_ -= kBlockSize;
|
| + virtual_source_idx_ -= block_size_;
|
|
|
| - // Step (3) Copy r3_ to r1_ and r4_ to r2_.
|
| + // Step (3) -- Copy r3_, r4_ to r1_, r2_.
|
| // This wraps the last input frames back to the start of the buffer.
|
| - memcpy(r1_, r3_, sizeof(*input_buffer_.get()) * (kKernelSize / 2));
|
| - memcpy(r2_, r4_, sizeof(*input_buffer_.get()) * (kKernelSize / 2));
|
| + memcpy(r1_, r3_, sizeof(*input_buffer_.get()) * kKernelSize);
|
| +
|
| + // Step (4) -- Reinitialize regions if necessary.
|
| + if (r0_ == r2_)
|
| + UpdateRegions(true);
|
|
|
| - // Step (4)
|
| - // Refresh the buffer with more input.
|
| - read_cb_.Run(r5_, kBlockSize);
|
| + // Step (5) -- Refresh the buffer with more input.
|
| + read_cb_.Run(request_frames_, r0_);
|
| }
|
| }
|
|
|
| #undef CONVOLVE_FUNC
|
|
|
| int SincResampler::ChunkSize() const {
|
| - return kBlockSize / io_sample_rate_ratio_;
|
| + return block_size_ / io_sample_rate_ratio_;
|
| }
|
|
|
| void SincResampler::Flush() {
|
| virtual_source_idx_ = 0;
|
| buffer_primed_ = false;
|
| - memset(input_buffer_.get(), 0, sizeof(*input_buffer_.get()) * kBufferSize);
|
| + memset(input_buffer_.get(), 0,
|
| + sizeof(*input_buffer_.get()) * input_buffer_size_);
|
| + UpdateRegions(false);
|
| }
|
|
|
| float SincResampler::Convolve_C(const float* input_ptr, const float* k1,
|
|
|