media/filters/audio_renderer_algorithm.cc - Issue 19111004: Upgrade AudioRendererAlgorithm to use WSOLA,

Side by Side Diff: media/filters/audio_renderer_algorithm.cc

Issue 19111004: Upgrade AudioRendererAlgorithm to use WSOLA, (Closed) Base URL: svn://svn.chromium.org/chrome/trunk/src

Patch Set: Comments addressed, AudioRendererAlgorithmTest::WsolaTest modified. Created 7 years, 4 months ago

Use n/p to move between diff chunks; N/P to move between comments. Draft comments are only viewable by you.

Jump to:

View unified diff | Download patch | Annotate | Revision Log

OLD	NEW
1 // Copyright (c) 2012 The Chromium Authors. All rights reserved.	1 // Copyright (c) 2012 The Chromium Authors. All rights reserved.

2 // Use of this source code is governed by a BSD-style license that can be	2 // Use of this source code is governed by a BSD-style license that can be

3 // found in the LICENSE file.	3 // found in the LICENSE file.

4	4

5 #include "media/filters/audio_renderer_algorithm.h"	5 #include "media/filters/audio_renderer_algorithm.h"

6	6

7 #include <algorithm>	7 #include <algorithm>

8 #include <cmath>	8 #include <cmath>

9	9

10 #include "base/logging.h"	10 #include "base/logging.h"

11 #include "base/memory/scoped_ptr.h"	11 #include "base/memory/scoped_ptr.h"

12 #include "media/audio/audio_util.h"	12 #include "media/audio/audio_util.h"

13 #include "media/base/audio_buffer.h"	13 #include "media/base/audio_buffer.h"

14 #include "media/base/audio_bus.h"	14 #include "media/base/audio_bus.h"

	15 #include "media/filters/wsola_internals.h"

15	16

16 namespace media {	17 namespace media {

17	18

18 // The starting size in frames for \|audio_buffer_\|. Previous usage maintained a	19

19 // queue of 16 AudioBuffers, each of 512 frames. This worked well, so we	20 // Waveform Similarity Overlap-and-add (WSOLA).

20 // maintain this number of frames.	21 //

21 static const int kStartingBufferSizeInFrames = 16 * 512;	22 // One WSOLA iteration

	23 //

	24 // 1) Extract \|target_block_\| as input frames at indices

	25 // [\|target_block_index_\|, \|target_block_index_\| + \|ola_window_size_\|).

	26 // Note that \|target_block_\| is the "natural" continuation of the output.

	27 //

	28 // 2) Extract \|search_block_\| as input frames at indices

	29 // [\|search_block_index_\|,

	30 // \|search_block_index_\| + \|num_candidate_blocks_\| + \|ola_window_size_\|).

	31 //

	32 // 3) Find a block within the \|search_block_\| that is most similar

	33 // to \|target_block_\|. Let \|optimal_index\| be the index of such block and

	34 // write it to \|optimal_block_\|.

	35 //

	36 // 4) Update:

	37 // \|optimal_block_\| = \|transition_window_\| * \|target_block_\| +

	38 // (1 - \|transition_window_\|) * \|optimal_block_\|.

	39 //

	40 // 5) Overlap-and-add \|optimal_block_\| to the \|wsola_output_\|.

	41 //

	42 // 6) Update:

	43 // \|target_block_\| = \|optimal_index\| + \|ola_window_size_\| / 2.

	44 // \|output_index_\| = \|output_index_\| + \|ola_window_size_\| / 2,

	45 // \|search_block_center_offset_\| = \|output_index_\| * \|playback_rate_\|, and

	46 // \|search_block_index_\| = \|search_block_center_offset_\| -

	47 // \|search_block_center_offset_\|.

22	48

23 // The maximum size in frames for the \|audio_buffer_\|. Arbitrarily determined.	49 // The maximum size in frames for the \|audio_buffer_\|. Arbitrarily determined.

24 // This number represents 3 seconds of 96kHz/16 bit 7.1 surround sound.	50 // This number represents 3 seconds of 96kHz/16 bit 7.1 surround sound.

25 static const int kMaxBufferSizeInFrames = 3 * 96000;	51 static const int kMaxBufferSizeInFrames = 3 * 96000;

26	52

27 // Duration of audio segments used for crossfading (in seconds).

28 static const double kWindowDuration = 0.08;

29

30 // Duration of crossfade between audio segments (in seconds).

31 static const double kCrossfadeDuration = 0.008;

32

33 // Max/min supported playback rates for fast/slow audio. Audio outside of these	53 // Max/min supported playback rates for fast/slow audio. Audio outside of these

34 // ranges are muted.	54 // ranges are muted.

35 // Audio at these speeds would sound better under a frequency domain algorithm.	55 // Audio at these speeds would sound better under a frequency domain algorithm.

36 static const float kMinPlaybackRate = 0.5f;	56 static const float kMinPlaybackRate = 0.5f;

37 static const float kMaxPlaybackRate = 4.0f;	57 static const float kMaxPlaybackRate = 4.0f;

38	58

	59 // Overlap-and-add window size in milliseconds.

	60 static const int kOlaWindowSizeMs = 20;

	61

	62 // Size of search interval in milliseconds. The search interval is

	63 // [-delta delta] around \|output_index_\| * \|playback_rate_\|. So the search

	64 // interval is 2 * delta.

	65 static const int kWsolaSearchIntervalMs = 30;

	66

	67 // The starting size in frames for \|audio_buffer_\|. Previous usage maintained a

	68 // queue of 16 AudioBuffers, each of 512 frames. This worked well, so we

	69 // maintain this number of frames.

	70 static const int kStartingBufferSizeInFrames = 16 * 512;

	71

39 AudioRendererAlgorithm::AudioRendererAlgorithm()	72 AudioRendererAlgorithm::AudioRendererAlgorithm()

40 : channels_(0),	73 : channels_(0),

41 samples_per_second_(0),	74 samples_per_second_(0),

42 playback_rate_(0),	75 playback_rate_(0),

43 frames_in_crossfade_(0),

44 index_into_window_(0),

45 crossfade_frame_number_(0),

46 muted_(false),	76 muted_(false),

47 muted_partial_frame_(0),	77 muted_partial_frame_(0),

48 window_size_(0),	78 capacity_(kStartingBufferSizeInFrames),

49 capacity_(kStartingBufferSizeInFrames) {	79 output_time_(0),

	80 search_block_center_offset_(0),

	81 search_block_index_(0),

	82 num_candidate_blocks_(0),

	83 target_block_index_(0),

	84 ola_window_size_(0),

	85 ola_hop_size_(0),

	86 num_complete_frames_(0) {

50 }	87 }

51	88

52 AudioRendererAlgorithm::~AudioRendererAlgorithm() {}	89 AudioRendererAlgorithm::~AudioRendererAlgorithm() {}

53	90

54 void AudioRendererAlgorithm::Initialize(float initial_playback_rate,	91 void AudioRendererAlgorithm::Initialize(float initial_playback_rate,

55 const AudioParameters& params) {	92 const AudioParameters& params) {

56 CHECK(params.IsValid());	93 CHECK(params.IsValid());

57	94

58 channels_ = params.channels();	95 channels_ = params.channels();

59 samples_per_second_ = params.sample_rate();	96 samples_per_second_ = params.sample_rate();

60 SetPlaybackRate(initial_playback_rate);	97 SetPlaybackRate(initial_playback_rate);

	98 num_candidate_blocks_ = (kWsolaSearchIntervalMs * samples_per_second_) / 1000;

	99 ola_window_size_ = kOlaWindowSizeMs * samples_per_second_ / 1000;

61	100

62 window_size_ = samples_per_second_ * kWindowDuration;	101 // Make sure window size in an even number.

63 frames_in_crossfade_ = samples_per_second_ * kCrossfadeDuration;	102 ola_window_size_ += ola_window_size_ & 1;

64 crossfade_buffer_ = AudioBus::Create(channels_, frames_in_crossfade_);	103 ola_hop_size_ = ola_window_size_ / 2;

	104

	105 // \|num_candidate_blocks_\| / 2 is the offset of the center of the search

	106 // block to the center of the first (left most) candidate block. The offset

	107 // of the center of a candidate block to its left most point is

	108 // \|ola_window_size_\| / 2 - 1. Note that \|ola_window_size_\| is even and in

	109 // our convention the center belongs to the left half, so we need to subtract

	110 // one frame to get the correct offset.

	111 //

	112 // Search Block

	113 // <------------------------------------------->

	114 //

	115 // \|ola_window_size_\| / 2 - 1

	116 // <----

	117 //

	118 // \|num_candidate_blocks_\| / 2

	119 // <----------------

	120 // center

	121 // X----X----------------X---------------X-----X

	122 // <----------> <---------->

	123 // Candidate ... Candidate

	124 // 1, ... \|num_candidate_blocks_\|

	125 search_block_center_offset_ = num_candidate_blocks_ / 2 +

	126 (ola_window_size_ / 2 - 1);

	127

	128 ola_window_.reset(new float[ola_window_size_]);

	129 internal::GetSymmetricHanningWindow(ola_window_size_, ola_window_.get());

	130

	131 transition_window_.reset(new float[ola_window_size_ * 2]);

	132 internal::GetSymmetricHanningWindow(2 * ola_window_size_,

	133 transition_window_.get());

	134

	135 wsola_output_ = AudioBus::Create(channels_, ola_window_size_ + ola_hop_size_);

	136

	137 // Auxiliary containers.

	138 optimal_block_ = AudioBus::Create(channels_, ola_window_size_);

	139 search_block_ = AudioBus::Create(

	140 channels_, num_candidate_blocks_ + (ola_window_size_ - 1));

	141 target_block_ = AudioBus::Create(channels_, ola_window_size_);

65 }	142 }

66	143

67 int AudioRendererAlgorithm::FillBuffer(AudioBus* dest, int requested_frames) {	144 int AudioRendererAlgorithm::FillBuffer(AudioBus* dest, int requested_frames) {

68 if (playback_rate_ == 0)	145 if (playback_rate_ == 0)

69 return 0;	146 return 0;

70	147

	148 DCHECK_EQ(channels_, dest->channels());

	149

71 // Optimize the \|muted_\| case to issue a single clear instead of performing	150 // Optimize the \|muted_\| case to issue a single clear instead of performing

72 // the full crossfade and clearing each crossfaded frame.	151 // the full crossfade and clearing each crossfaded frame.

73 if (muted_) {	152 if (muted_) {

74 int frames_to_render =	153 int frames_to_render =

75 std::min(static_cast<int>(audio_buffer_.frames() / playback_rate_),	154 std::min(static_cast<int>(audio_buffer_.frames() / playback_rate_),

76 requested_frames);	155 requested_frames);

77	156

78 // Compute accurate number of frames to actually skip in the source data.	157 // Compute accurate number of frames to actually skip in the source data.

79 // Includes the leftover partial frame from last request. However, we can	158 // Includes the leftover partial frame from last request. However, we can

80 // only skip over complete frames, so a partial frame may remain for next	159 // only skip over complete frames, so a partial frame may remain for next

81 // time.	160 // time.

82 muted_partial_frame_ += frames_to_render * playback_rate_;	161 muted_partial_frame_ += frames_to_render * playback_rate_;

83 int seek_frames = static_cast<int>(muted_partial_frame_);	162 int seek_frames = static_cast<int>(muted_partial_frame_);

84 dest->ZeroFrames(frames_to_render);	163 dest->ZeroFrames(frames_to_render);

85 audio_buffer_.SeekFrames(seek_frames);	164 audio_buffer_.SeekFrames(seek_frames);

86	165

87 // Determine the partial frame that remains to be skipped for next call. If	166 // Determine the partial frame that remains to be skipped for next call. If

88 // the user switches back to playing, it may be off time by this partial	167 // the user switches back to playing, it may be off time by this partial

89 // frame, which would be undetectable. If they subsequently switch to	168 // frame, which would be undetectable. If they subsequently switch to

90 // another playback rate that mutes, the code will attempt to line up the	169 // another playback rate that mutes, the code will attempt to line up the

91 // frames again.	170 // frames again.

92 muted_partial_frame_ -= seek_frames;	171 muted_partial_frame_ -= seek_frames;

93 return frames_to_render;	172 return frames_to_render;

94 }	173 }

95	174

96 int slower_step = ceil(window_size_ * playback_rate_);	175 int slower_step = ceil(ola_window_size_ * playback_rate_);

97 int faster_step = ceil(window_size_ / playback_rate_);	176 int faster_step = ceil(ola_window_size_ / playback_rate_);

98	177

99 // Optimize the most common \|playback_rate_\| ~= 1 case to use a single copy	178 // Optimize the most common \|playback_rate_\| ~= 1 case to use a single copy

100 // instead of copying frame by frame.	179 // instead of copying frame by frame.

101 if (window_size_ <= faster_step && slower_step >= window_size_) {	180 if (ola_window_size_ <= faster_step && slower_step >= ola_window_size_) {

102 const int frames_to_copy =	181 const int frames_to_copy =

103 std::min(audio_buffer_.frames(), requested_frames);	182 std::min(audio_buffer_.frames(), requested_frames);

104 const int frames_read = audio_buffer_.ReadFrames(frames_to_copy, 0, dest);	183 const int frames_read = audio_buffer_.ReadFrames(frames_to_copy, 0, dest);

105 DCHECK_EQ(frames_read, frames_to_copy);	184 DCHECK_EQ(frames_read, frames_to_copy);

106 return frames_read;	185 return frames_read;

107 }	186 }

108	187

109 int total_frames_rendered = 0;	188 int rendered_frames = 0;

110 while (total_frames_rendered < requested_frames) {	189 do {

111 if (index_into_window_ >= window_size_)	190 rendered_frames += WriteCompletedFramesTo(

112 ResetWindow();	191 requested_frames - rendered_frames, rendered_frames, dest);

113	192 } while (rendered_frames < requested_frames && RunOneWsolaIteration());

114 int rendered_frames = 0;	193 return rendered_frames;

115 if (window_size_ > faster_step) {

116 rendered_frames =

117 OutputFasterPlayback(dest,

118 total_frames_rendered,

119 requested_frames - total_frames_rendered,

120 window_size_,

121 faster_step);

122 } else if (slower_step < window_size_) {

123 rendered_frames =

124 OutputSlowerPlayback(dest,

125 total_frames_rendered,

126 requested_frames - total_frames_rendered,

127 slower_step,

128 window_size_);

129 } else {

130 NOTREACHED();

131 }

132

133 if (rendered_frames == 0)

134 break;

135

136 total_frames_rendered += rendered_frames;

137 }

138 return total_frames_rendered;

139 }

140

141 void AudioRendererAlgorithm::ResetWindow() {

142 DCHECK_LE(index_into_window_, window_size_);

143 index_into_window_ = 0;

144 crossfade_frame_number_ = 0;

145 }

146

147 int AudioRendererAlgorithm::OutputFasterPlayback(AudioBus* dest,

148 int dest_offset,

149 int requested_frames,

150 int input_step,

151 int output_step) {

152 // Ensure we don't run into OOB read/write situation.

153 CHECK_GT(input_step, output_step);

154 DCHECK_LT(index_into_window_, window_size_);

155 DCHECK_GT(playback_rate_, 1.0);

156 DCHECK(!muted_);

157

158 if (audio_buffer_.frames() < 1)

159 return 0;

160

161 // The audio data is output in a series of windows. For sped-up playback,

162 // the window is comprised of the following phases:

163 //

164 // a) Output raw data.

165 // b) Save bytes for crossfade in \|crossfade_buffer_\|.

166 // c) Drop data.

167 // d) Output crossfaded audio leading up to the next window.

168 //

169 // The duration of each phase is computed below based on the \|window_size_\|

170 // and \|playback_rate_\|.

171 DCHECK_LE(frames_in_crossfade_, output_step);

172

173 // This is the index of the end of phase a, beginning of phase b.

174 int outtro_crossfade_begin = output_step - frames_in_crossfade_;

175

176 // This is the index of the end of phase b, beginning of phase c.

177 int outtro_crossfade_end = output_step;

178

179 // This is the index of the end of phase c, beginning of phase d.

180 // This phase continues until \|index_into_window_\| reaches \|window_size_\|, at

181 // which point the window restarts.

182 int intro_crossfade_begin = input_step - frames_in_crossfade_;

183

184 // a) Output raw frames if we haven't reached the crossfade section.

185 if (index_into_window_ < outtro_crossfade_begin) {

186 // Read as many frames as we can and return the count. If it's not enough,

187 // we will get called again.

188 const int frames_to_copy =

189 std::min(requested_frames, outtro_crossfade_begin - index_into_window_);

190 int copied = audio_buffer_.ReadFrames(frames_to_copy, dest_offset, dest);

191 index_into_window_ += copied;

192 return copied;

193 }

194

195 // b) Save outtro crossfade frames into intermediate buffer, but do not output

196 // anything to \|dest\|.

197 if (index_into_window_ < outtro_crossfade_end) {

198 // This phase only applies if there are bytes to crossfade.

199 DCHECK_GT(frames_in_crossfade_, 0);

200 int crossfade_start = index_into_window_ - outtro_crossfade_begin;

201 int crossfade_count = outtro_crossfade_end - index_into_window_;

202 int copied = audio_buffer_.ReadFrames(

203 crossfade_count, crossfade_start, crossfade_buffer_.get());

204 index_into_window_ += copied;

205

206 // Did we get all the frames we need? If not, return and let subsequent

207 // calls try to get the rest.

208 if (copied != crossfade_count)

209 return 0;

210 }

211

212 // c) Drop frames until we reach the intro crossfade section.

213 if (index_into_window_ < intro_crossfade_begin) {

214 // Check if there is enough data to skip all the frames needed. If not,

215 // return 0 and let subsequent calls try to skip it all.

216 int seek_frames = intro_crossfade_begin - index_into_window_;

217 if (audio_buffer_.frames() < seek_frames)

218 return 0;

219 audio_buffer_.SeekFrames(seek_frames);

220

221 // We've dropped all the frames that need to be dropped.

222 index_into_window_ += seek_frames;

223 }

224

225 // d) Crossfade and output a frame, as long as we have data.

226 if (audio_buffer_.frames() < 1)

227 return 0;

228 DCHECK_GT(frames_in_crossfade_, 0);

229 DCHECK_LT(index_into_window_, window_size_);

230

231 int offset_into_buffer = index_into_window_ - intro_crossfade_begin;

232 int copied = audio_buffer_.ReadFrames(1, dest_offset, dest);

233 DCHECK_EQ(copied, 1);

234 CrossfadeFrame(crossfade_buffer_.get(),

235 offset_into_buffer,

236 dest,

237 dest_offset,

238 offset_into_buffer);

239 index_into_window_ += copied;

240 return copied;

241 }

242

243 int AudioRendererAlgorithm::OutputSlowerPlayback(AudioBus* dest,

244 int dest_offset,

245 int requested_frames,

246 int input_step,

247 int output_step) {

248 // Ensure we don't run into OOB read/write situation.

249 CHECK_LT(input_step, output_step);

250 DCHECK_LT(index_into_window_, window_size_);

251 DCHECK_LT(playback_rate_, 1.0);

252 DCHECK_NE(playback_rate_, 0);

253 DCHECK(!muted_);

254

255 if (audio_buffer_.frames() < 1)

256 return 0;

257

258 // The audio data is output in a series of windows. For slowed down playback,

259 // the window is comprised of the following phases:

260 //

261 // a) Output raw data.

262 // b) Output and save bytes for crossfade in \|crossfade_buffer_\|.

263 // c) Output* raw data.

264 // d) Output* crossfaded audio leading up to the next window.

265 //

266 // * Phases c) and d) do not progress \|audio_buffer_\|'s cursor so that the

267 // \|audio_buffer_\|'s cursor is in the correct place for the next window.

268 //

269 // The duration of each phase is computed below based on the \|window_size_\|

270 // and \|playback_rate_\|.

271 DCHECK_LE(frames_in_crossfade_, input_step);

272

273 // This is the index of the end of phase a, beginning of phase b.

274 int intro_crossfade_begin = input_step - frames_in_crossfade_;

275

276 // This is the index of the end of phase b, beginning of phase c.

277 int intro_crossfade_end = input_step;

278

279 // This is the index of the end of phase c, beginning of phase d.

280 // This phase continues until \|index_into_window_\| reaches \|window_size_\|, at

281 // which point the window restarts.

282 int outtro_crossfade_begin = output_step - frames_in_crossfade_;

283

284 // a) Output raw frames.

285 if (index_into_window_ < intro_crossfade_begin) {

286 // Read as many frames as we can and return the count. If it's not enough,

287 // we will get called again.

288 const int frames_to_copy =

289 std::min(requested_frames, intro_crossfade_begin - index_into_window_);

290 int copied = audio_buffer_.ReadFrames(frames_to_copy, dest_offset, dest);

291 index_into_window_ += copied;

292 return copied;

293 }

294

295 // b) Save the raw frames for the intro crossfade section, then copy the

296 // same frames to \|dest\|.

297 if (index_into_window_ < intro_crossfade_end) {

298 const int frames_to_copy =

299 std::min(requested_frames, intro_crossfade_end - index_into_window_);

300 int offset = index_into_window_ - intro_crossfade_begin;

301 int copied = audio_buffer_.ReadFrames(

302 frames_to_copy, offset, crossfade_buffer_.get());

303 crossfade_buffer_->CopyPartialFramesTo(offset, copied, dest_offset, dest);

304 index_into_window_ += copied;

305 return copied;

306 }

307

308 // c) Output a raw frame into \|dest\| without advancing the \|audio_buffer_\|

309 // cursor.

310 int audio_buffer_offset = index_into_window_ - intro_crossfade_end;

311 DCHECK_GE(audio_buffer_offset, 0);

312 if (audio_buffer_.frames() <= audio_buffer_offset)

313 return 0;

314 int copied =

315 audio_buffer_.PeekFrames(1, audio_buffer_offset, dest_offset, dest);

316 DCHECK_EQ(1, copied);

317

318 // d) Crossfade the next frame of \|crossfade_buffer_\| into \|dest\| if we've

319 // reached the outtro crossfade section of the window.

320 if (index_into_window_ >= outtro_crossfade_begin) {

321 int offset_into_crossfade_buffer =

322 index_into_window_ - outtro_crossfade_begin;

323 CrossfadeFrame(dest,

324 dest_offset,

325 crossfade_buffer_.get(),

326 offset_into_crossfade_buffer,

327 offset_into_crossfade_buffer);

328 }

329

330 index_into_window_ += copied;

331 return copied;

332 }

333

334 void AudioRendererAlgorithm::CrossfadeFrame(AudioBus* intro,

335 int intro_offset,

336 AudioBus* outtro,

337 int outtro_offset,

338 int fade_offset) {

339 float crossfade_ratio =

340 static_cast<float>(fade_offset) / frames_in_crossfade_;

341 for (int channel = 0; channel < channels_; ++channel) {

342 outtro->channel(channel)[outtro_offset] =

343 (1.0f - crossfade_ratio) * intro->channel(channel)[intro_offset] +

344 (crossfade_ratio) * outtro->channel(channel)[outtro_offset];

345 }

346 }	194 }

347	195

348 void AudioRendererAlgorithm::SetPlaybackRate(float new_rate) {	196 void AudioRendererAlgorithm::SetPlaybackRate(float new_rate) {

349 DCHECK_GE(new_rate, 0);	197 DCHECK_GE(new_rate, 0);

350 playback_rate_ = new_rate;	198 playback_rate_ = new_rate;

351 muted_ =	199 muted_ =

352 playback_rate_ < kMinPlaybackRate \|\| playback_rate_ > kMaxPlaybackRate;	200 playback_rate_ < kMinPlaybackRate \|\| playback_rate_ > kMaxPlaybackRate;

353

354 ResetWindow();

355 }	201 }

356	202

357 void AudioRendererAlgorithm::FlushBuffers() {	203 void AudioRendererAlgorithm::FlushBuffers() {

358 ResetWindow();

359

360 // Clear the queue of decoded packets (releasing the buffers).	204 // Clear the queue of decoded packets (releasing the buffers).

361 audio_buffer_.Clear();	205 audio_buffer_.Clear();

	206 output_time_ = 0;

	207 search_block_index_ = 0;

	208 target_block_index_ = 0;

	209 wsola_output_->Zero();

	210 num_complete_frames_ = 0;

362 }	211 }

363	212

364 base::TimeDelta AudioRendererAlgorithm::GetTime() {	213 base::TimeDelta AudioRendererAlgorithm::GetTime() {

365 return audio_buffer_.current_time();	214 return audio_buffer_.current_time();

366 }	215 }

367	216

368 void AudioRendererAlgorithm::EnqueueBuffer(	217 void AudioRendererAlgorithm::EnqueueBuffer(

369 const scoped_refptr<AudioBuffer>& buffer_in) {	218 const scoped_refptr<AudioBuffer>& buffer_in) {

370 DCHECK(!buffer_in->end_of_stream());	219 DCHECK(!buffer_in->end_of_stream());

371 audio_buffer_.Append(buffer_in);	220 audio_buffer_.Append(buffer_in);

372 }	221 }

373	222

374 bool AudioRendererAlgorithm::IsQueueFull() {	223 bool AudioRendererAlgorithm::IsQueueFull() {

375 return audio_buffer_.frames() >= capacity_;	224 return audio_buffer_.frames() >= capacity_;

376 }	225 }

377	226

378 void AudioRendererAlgorithm::IncreaseQueueCapacity() {	227 void AudioRendererAlgorithm::IncreaseQueueCapacity() {

379 capacity_ = std::min(2 * capacity_, kMaxBufferSizeInFrames);	228 capacity_ = std::min(2 * capacity_, kMaxBufferSizeInFrames);

380 }	229 }

381	230

	231 bool AudioRendererAlgorithm::CanPerformWsola() const {

	232 const int search_block_size = num_candidate_blocks_ + (ola_window_size_ - 1);

	233 const int frames = audio_buffer_.frames();

	234 return target_block_index_ + ola_window_size_ <= frames &&

	235 search_block_index_ + search_block_size <= frames;

	236 }

	237

	238 bool AudioRendererAlgorithm::RunOneWsolaIteration() {

	239 if (!CanPerformWsola())

	240 return false;

	241

	242 GetOptimalBlock();

	243

	244 // Overlap-and-add.

	245 for (int k = 0; k < channels_; ++k) {

	246 const float* const ch_opt_frame = optimal_block_->channel(k);

	247 float* ch_output = wsola_output_->channel(k) + num_complete_frames_;

	248 for (int n = 0; n < ola_hop_size_; ++n) {

	249 ch_output[n] = ch_output[n] * ola_window_[ola_hop_size_ + n] +

	250 ch_opt_frame[n] * ola_window_[n];

	251 }

	252

	253 // Copy the second half to the output.

	254 memcpy(&ch_output[ola_hop_size_], &ch_opt_frame[ola_hop_size_],

	255 sizeof(ch_opt_frame) ola_hop_size_);

	256 }

	257

	258 num_complete_frames_ += ola_hop_size_;

	259 UpdateOutputTime(ola_hop_size_);

	260 RemoveOldInputFrames();

	261 return true;

	262 }

	263

	264 void AudioRendererAlgorithm::UpdateOutputTime(float time_change) {

	265 output_time_ += time_change;

	266 // Center of the search region, in frames.

	267 const int search_block_center_index = static_cast<int>(

	268 output_time_ * playback_rate_ + 0.5f);

	269 search_block_index_ = search_block_center_index - search_block_center_offset_;

	270 }

	271

	272 void AudioRendererAlgorithm::RemoveOldInputFrames() {

	273 const int earliest_used_index = std::min(target_block_index_,

	274 search_block_index_);

	275 if (earliest_used_index <= 0)

	276 return; // Nothing to remove.

	277

	278 // Remove frames from input and adjust indices accordingly.

	279 audio_buffer_.SeekFrames(earliest_used_index);

	280 target_block_index_ -= earliest_used_index;

	281

	282 // Adjust output index.

	283 float output_time_change = earliest_used_index / playback_rate_;

	284 CHECK_GE(output_time_, output_time_change);

	285 UpdateOutputTime(-output_time_change);

	286 }

	287

	288 int AudioRendererAlgorithm::WriteCompletedFramesTo(

	289 int requested_frames, int dest_offset, AudioBus* dest) {

	290 int rendered_frames = std::min(num_complete_frames_, requested_frames);

	291

	292 if (rendered_frames == 0)

	293 return 0; // There is nothing to read from \|wsola_output_\|, return.

	294

	295 wsola_output_->CopyPartialFramesTo(0, rendered_frames, dest_offset, dest);

	296

	297 // Remove the frames which are read.

	298 int frames_to_move = wsola_output_->frames() - rendered_frames;

	299 for (int k = 0; k < channels_; ++k) {

	300 float* ch = wsola_output_->channel(k);

	301 memmove(ch, &ch[rendered_frames], sizeof(ch) frames_to_move);

	302 }

	303 num_complete_frames_ -= rendered_frames;

	304 return rendered_frames;

	305 }

	306

	307 bool AudioRendererAlgorithm::TargetIsWithinSearchRegion() const {

	308 const int search_block_size = num_candidate_blocks_ + (ola_window_size_ - 1);

	309

	310 return target_block_index_ >= search_block_index_ &&

	311 target_block_index_ + ola_window_size_ <=

	312 search_block_index_ + search_block_size;

	313 }

	314

	315 void AudioRendererAlgorithm::GetOptimalBlock() {

	316 int optimal_index = 0;

	317

	318 // An interval around last optimal block which is excluded from the search.

	319 // This is to reduce the buzzy sound. The number 160 is rather arbitrary and

	320 // derived heuristically.

	321 const int kExcludeIntervalLengthFrames = 160;

	322 if (TargetIsWithinSearchRegion()) {

	323 optimal_index = target_block_index_;

	324 PeekAudioWithZeroPrepend(optimal_index, optimal_block_.get());

	325 } else {

	326 PeekAudioWithZeroPrepend(target_block_index_, target_block_.get());

	327 PeekAudioWithZeroPrepend(search_block_index_, search_block_.get());

	328 int last_optimal = target_block_index_ - ola_hop_size_ -

	329 search_block_index_;

	330 internal::Interval exclude_iterval = std::make_pair(

	331 last_optimal - kExcludeIntervalLengthFrames / 2,

	332 last_optimal + kExcludeIntervalLengthFrames / 2);

	333

	334 // \|optimal_index\| is in frames and it is relative to the beginning of the

	335 // \|search_block_\|.

	336 optimal_index = internal::OptimalIndex(

	337 search_block_.get(), target_block_.get(), exclude_iterval);

	338

	339 // Translate \|index\| w.r.t. the beginning of \|audio_buffer_\| and extract the

	340 // optimal block.

	341 optimal_index += search_block_index_;

	342 PeekAudioWithZeroPrepend(optimal_index, optimal_block_.get());

	343

	344 // Make a transition from target block to the optimal block if different.

	345 // Target block has the best continuation to the current output.

	346 // Optimal block is the most similar block to the target, however, it might

	347 // introduce some discontinuity when over-lap-added. Therefore, we combine

	348 // them for a smoother transition. The length of transition window is twice

	349 // as that of the optimal-block which makes it like a weighting function

	350 // where target-block has higher weight close to zero (weight of 1 at index

	351 // 0) and lower weight close the end.

	352 for (int k = 0; k < channels_; ++k) {

	353 float* ch_opt = optimal_block_->channel(k);

	354 const float* const ch_target = target_block_->channel(k);

	355 for (int n = 0; n < ola_window_size_; ++n) {

	356 ch_opt[n] = ch_opt[n] * transition_window_[n] + ch_target[n] *

	357 transition_window_[ola_window_size_ + n];

	358 }

	359 }

	360 }

	361

	362 // Next target is one hop ahead of the current optimal.

	363 target_block_index_ = optimal_index + ola_hop_size_;

	364 }

	365

	366 void AudioRendererAlgorithm::PeekAudioWithZeroPrepend(

	367 int read_offset_frames, AudioBus* dest) {

	368 CHECK_LE(read_offset_frames + dest->frames(), audio_buffer_.frames());

	369

	370 int write_offset = 0;

	371 int num_frames_to_read = dest->frames();

	372 if (read_offset_frames < 0) {

	373 int num_zero_frames_appended = std::min(-read_offset_frames,

	374 num_frames_to_read);

	375 read_offset_frames = 0;

	376 num_frames_to_read -= num_zero_frames_appended;

	377 write_offset = num_zero_frames_appended;

	378 dest->ZeroFrames(num_zero_frames_appended);

	379 }

	380 audio_buffer_.PeekFrames(num_frames_to_read, read_offset_frames,

	381 write_offset, dest);

	382 }

	383

382 } // namespace media	384 } // namespace media

OLD	NEW

« no previous file with comments | « media/filters/audio_renderer_algorithm.h ('k') | media/filters/audio_renderer_algorithm_unittest.cc » ('j') | media/filters/wsola_internals.h » ('J')