media/filters/ffmpeg_audio_decoder.cc - Issue 259453003: Introduce AudioDiscardHelper. Refactor audio decoders to use it.

Side by Side Diff: media/filters/ffmpeg_audio_decoder.cc

Issue 259453003: Introduce AudioDiscardHelper. Refactor audio decoders to use it. (Closed) Base URL: svn://svn.chromium.org/chrome/trunk/src

Patch Set: Comments. Created 6 years, 7 months ago

Use n/p to move between diff chunks; N/P to move between comments. Draft comments are only viewable by you.

Jump to:

View unified diff | Download patch | Annotate | Revision Log

OLD	NEW
1 // Copyright (c) 2012 The Chromium Authors. All rights reserved.	1 // Copyright (c) 2012 The Chromium Authors. All rights reserved.

2 // Use of this source code is governed by a BSD-style license that can be	2 // Use of this source code is governed by a BSD-style license that can be

3 // found in the LICENSE file.	3 // found in the LICENSE file.

4	4

5 #include "media/filters/ffmpeg_audio_decoder.h"	5 #include "media/filters/ffmpeg_audio_decoder.h"

6	6

7 #include "base/callback_helpers.h"	7 #include "base/callback_helpers.h"

8 #include "base/single_thread_task_runner.h"	8 #include "base/single_thread_task_runner.h"

9 #include "media/base/audio_buffer.h"	9 #include "media/base/audio_buffer.h"

10 #include "media/base/audio_bus.h"	10 #include "media/base/audio_bus.h"

11 #include "media/base/audio_decoder_config.h"	11 #include "media/base/audio_decoder_config.h"

12 #include "media/base/audio_timestamp_helper.h"	12 #include "media/base/audio_discard_helper.h"

13 #include "media/base/bind_to_current_loop.h"	13 #include "media/base/bind_to_current_loop.h"

14 #include "media/base/decoder_buffer.h"	14 #include "media/base/decoder_buffer.h"

15 #include "media/base/limits.h"	15 #include "media/base/limits.h"

16 #include "media/base/sample_format.h"	16 #include "media/base/sample_format.h"

17 #include "media/ffmpeg/ffmpeg_common.h"	17 #include "media/ffmpeg/ffmpeg_common.h"

18 #include "media/filters/ffmpeg_glue.h"	18 #include "media/filters/ffmpeg_glue.h"

19	19

20 namespace media {	20 namespace media {

21	21

22 // Returns true if the decode result was end of stream.	22 // Returns true if the decode result was end of stream.

(...skipping 97 matching lines...) Expand 10 before | Expand all | Expand 10 after Loading...
120 // reference to the AudioBuffer object.	120 // reference to the AudioBuffer object.

121 void* opaque = NULL;	121 void* opaque = NULL;

122 buffer.swap(reinterpret_cast<AudioBuffer**>(&opaque));	122 buffer.swap(reinterpret_cast<AudioBuffer**>(&opaque));

123 frame->buf[0] = av_buffer_create(	123 frame->buf[0] = av_buffer_create(

124 frame->data[0], buffer_size_in_bytes, ReleaseAudioBufferImpl, opaque, 0);	124 frame->data[0], buffer_size_in_bytes, ReleaseAudioBufferImpl, opaque, 0);

125 return 0;	125 return 0;

126 }	126 }

127	127

128 FFmpegAudioDecoder::FFmpegAudioDecoder(	128 FFmpegAudioDecoder::FFmpegAudioDecoder(

129 const scoped_refptr<base::SingleThreadTaskRunner>& task_runner)	129 const scoped_refptr<base::SingleThreadTaskRunner>& task_runner)

130 : task_runner_(task_runner),	130 : task_runner_(task_runner), state_(kUninitialized), av_sample_format_(0) {

131 state_(kUninitialized),	131 }

132 av_sample_format_(0),

133 last_input_timestamp_(kNoTimestamp()),

134 output_frames_to_drop_(0) {}

135	132

136 FFmpegAudioDecoder::~FFmpegAudioDecoder() {	133 FFmpegAudioDecoder::~FFmpegAudioDecoder() {

137 DCHECK_EQ(state_, kUninitialized);	134 DCHECK_EQ(state_, kUninitialized);

138 DCHECK(!codec_context_);	135 DCHECK(!codec_context_);

139 DCHECK(!av_frame_);	136 DCHECK(!av_frame_);

140 }	137 }

141	138

142 void FFmpegAudioDecoder::Initialize(const AudioDecoderConfig& config,	139 void FFmpegAudioDecoder::Initialize(const AudioDecoderConfig& config,

143 const PipelineStatusCB& status_cb) {	140 const PipelineStatusCB& status_cb) {

144 DCHECK(task_runner_->BelongsToCurrentThread());	141 DCHECK(task_runner_->BelongsToCurrentThread());

(...skipping 102 matching lines...) Expand 10 before | Expand all | Expand 10 after Loading...
247 // A decoding error occurs and decoding needs to stop.	244 // A decoding error occurs and decoding needs to stop.

248 // kFlushCodec -> kDecodeFinished:	245 // kFlushCodec -> kDecodeFinished:

249 // When avcodec_decode_audio4() returns 0 data.	246 // When avcodec_decode_audio4() returns 0 data.

250 // kFlushCodec -> kError:	247 // kFlushCodec -> kError:

251 // When avcodec_decode_audio4() errors out.	248 // When avcodec_decode_audio4() errors out.

252 // (any state) -> kNormal:	249 // (any state) -> kNormal:

253 // Any time Reset() is called.	250 // Any time Reset() is called.

254	251

255 // Make sure we are notified if http://crbug.com/49709 returns. Issue also	252 // Make sure we are notified if http://crbug.com/49709 returns. Issue also

256 // occurs with some damaged files.	253 // occurs with some damaged files.

257 if (!buffer->end_of_stream() && buffer->timestamp() == kNoTimestamp() &&	254 if (!buffer->end_of_stream() && buffer->timestamp() == kNoTimestamp()) {

258 output_timestamp_helper_->base_timestamp() == kNoTimestamp()) {

259 DVLOG(1) << "Received a buffer without timestamps!";	255 DVLOG(1) << "Received a buffer without timestamps!";

260 decode_cb.Run(kDecodeError, NULL);	256 decode_cb.Run(kDecodeError, NULL);

261 return;	257 return;

262 }	258 }

263	259

264 if (!buffer->end_of_stream()) {	260 if (!buffer->end_of_stream() && !discard_helper_->initialized() &&

265 DCHECK(buffer->timestamp() != kNoTimestamp());	261 codec_context_->codec_id == AV_CODEC_ID_VORBIS &&

266 const bool first_buffer =	262 buffer->timestamp() < base::TimeDelta()) {

267 last_input_timestamp_ == kNoTimestamp() &&	263 // Dropping frames for negative timestamps as outlined in section A.2

268 output_timestamp_helper_->base_timestamp() == kNoTimestamp();	264 // in the Vorbis spec. http://xiph.org/vorbis/doc/Vorbis_I_spec.html

269 if (first_buffer && codec_context_->codec_id == AV_CODEC_ID_VORBIS &&	265 const int discard_frames =

270 buffer->timestamp() < base::TimeDelta()) {	266 discard_helper_->TimeDeltaToFrames(-buffer->timestamp());

271 // Dropping frames for negative timestamps as outlined in section A.2	267 discard_helper_->Reset(discard_frames);

272 // in the Vorbis spec. http://xiph.org/vorbis/doc/Vorbis_I_spec.html

273 DCHECK_EQ(output_frames_to_drop_, 0);

274 output_frames_to_drop_ =

275 0.5 +

276 -buffer->timestamp().InSecondsF() * config_.samples_per_second();

277

278 // If we are dropping samples for Vorbis, the timeline always starts at 0.

279 output_timestamp_helper_->SetBaseTimestamp(base::TimeDelta());

280 } else {

281 if (first_buffer) {

282 output_timestamp_helper_->SetBaseTimestamp(buffer->timestamp());

283 } else if (buffer->timestamp() < last_input_timestamp_) {

284 const base::TimeDelta diff =

285 buffer->timestamp() - last_input_timestamp_;

286 DLOG(WARNING) << "Input timestamps are not monotonically increasing! "

287 << " ts " << buffer->timestamp().InMicroseconds() << " us"

288 << " diff " << diff.InMicroseconds() << " us";

289 }

290

291 last_input_timestamp_ = buffer->timestamp();

292 }

293 }	268 }

294	269

295 // Transition to kFlushCodec on the first end of stream buffer.	270 // Transition to kFlushCodec on the first end of stream buffer.

296 if (state_ == kNormal && buffer->end_of_stream()) {	271 if (state_ == kNormal && buffer->end_of_stream()) {

297 state_ = kFlushCodec;	272 state_ = kFlushCodec;

298 }	273 }

299	274

300 if (!FFmpegDecode(buffer)) {	275 if (!FFmpegDecode(buffer)) {

301 state_ = kError;	276 state_ = kError;

302 decode_cb.Run(kDecodeError, NULL);	277 decode_cb.Run(kDecodeError, NULL);

(...skipping 11 matching lines...) Expand all Loading...
314 decode_cb.Run(kNotEnoughData, NULL);	289 decode_cb.Run(kNotEnoughData, NULL);

315 return;	290 return;

316 }	291 }

317	292

318 decode_cb.Run(kOk, queued_audio_.front());	293 decode_cb.Run(kOk, queued_audio_.front());

319 queued_audio_.pop_front();	294 queued_audio_.pop_front();

320 }	295 }

321	296

322 bool FFmpegAudioDecoder::FFmpegDecode(	297 bool FFmpegAudioDecoder::FFmpegDecode(

323 const scoped_refptr<DecoderBuffer>& buffer) {	298 const scoped_refptr<DecoderBuffer>& buffer) {

324

325 DCHECK(queued_audio_.empty());	299 DCHECK(queued_audio_.empty());

326	300

327 AVPacket packet;	301 AVPacket packet;

328 av_init_packet(&packet);	302 av_init_packet(&packet);

329 if (buffer->end_of_stream()) {	303 if (buffer->end_of_stream()) {

330 packet.data = NULL;	304 packet.data = NULL;

331 packet.size = 0;	305 packet.size = 0;

332 } else {	306 } else {

333 packet.data = const_cast<uint8*>(buffer->data());	307 packet.data = const_cast<uint8*>(buffer->data());

334 packet.size = buffer->data_size();	308 packet.size = buffer->data_size();

335 }	309 }

336	310

337 // Each audio packet may contain several frames, so we must call the decoder	311 // Each audio packet may contain several frames, so we must call the decoder

338 // until we've exhausted the packet. Regardless of the packet size we always	312 // until we've exhausted the packet. Regardless of the packet size we always

339 // want to hand it to the decoder at least once, otherwise we would end up	313 // want to hand it to the decoder at least once, otherwise we would end up

340 // skipping end of stream packets since they have a size of zero.	314 // skipping end of stream packets since they have a size of zero.

341 do {	315 do {

342 int frame_decoded = 0;	316 int frame_decoded = 0;

343 int result = avcodec_decode_audio4(	317 const int result = avcodec_decode_audio4(

344 codec_context_.get(), av_frame_.get(), &frame_decoded, &packet);	318 codec_context_.get(), av_frame_.get(), &frame_decoded, &packet);

345	319

346 if (result < 0) {	320 if (result < 0) {

347 DCHECK(!buffer->end_of_stream())	321 DCHECK(!buffer->end_of_stream())

348 << "End of stream buffer produced an error! "	322 << "End of stream buffer produced an error! "

349 << "This is quite possibly a bug in the audio decoder not handling "	323 << "This is quite possibly a bug in the audio decoder not handling "

350 << "end of stream AVPackets correctly.";	324 << "end of stream AVPackets correctly.";

351	325

352 DLOG(WARNING)	326 DLOG(WARNING)

353 << "Failed to decode an audio frame with timestamp: "	327 << "Failed to decode an audio frame with timestamp: "

354 << buffer->timestamp().InMicroseconds() << " us, duration: "	328 << buffer->timestamp().InMicroseconds() << " us, duration: "

355 << buffer->duration().InMicroseconds() << " us, packet size: "	329 << buffer->duration().InMicroseconds() << " us, packet size: "

356 << buffer->data_size() << " bytes";	330 << buffer->data_size() << " bytes";

357	331

358 break;	332 break;

359 }	333 }

360	334

361 // Update packet size and data pointer in case we need to call the decoder	335 // Update packet size and data pointer in case we need to call the decoder

362 // with the remaining bytes from this packet.	336 // with the remaining bytes from this packet.

363 packet.size -= result;	337 packet.size -= result;

364 packet.data += result;	338 packet.data += result;

365	339

366 scoped_refptr<AudioBuffer> output;	340 scoped_refptr<AudioBuffer> output;

367 int decoded_frames = 0;	341 const int channels = DetermineChannels(av_frame_.get());

368 int original_frames = 0;

369 int channels = DetermineChannels(av_frame_.get());

370 if (frame_decoded) {	342 if (frame_decoded) {

371 if (av_frame_->sample_rate != config_.samples_per_second() ||	343 if (av_frame_->sample_rate != config_.samples_per_second() ||

372 channels != ChannelLayoutToChannelCount(config_.channel_layout()) ||	344 channels != ChannelLayoutToChannelCount(config_.channel_layout()) ||

373 av_frame_->format != av_sample_format_) {	345 av_frame_->format != av_sample_format_) {

374 DLOG(ERROR) << "Unsupported midstream configuration change!"	346 DLOG(ERROR) << "Unsupported midstream configuration change!"

375 << " Sample Rate: " << av_frame_->sample_rate << " vs "	347 << " Sample Rate: " << av_frame_->sample_rate << " vs "

376 << config_.samples_per_second()	348 << config_.samples_per_second()

377 << ", Channels: " << channels << " vs "	349 << ", Channels: " << channels << " vs "

378 << ChannelLayoutToChannelCount(config_.channel_layout())	350 << ChannelLayoutToChannelCount(config_.channel_layout())

379 << ", Sample Format: " << av_frame_->format << " vs "	351 << ", Sample Format: " << av_frame_->format << " vs "

380 << av_sample_format_;	352 << av_sample_format_;

381	353

382 // This is an unrecoverable error, so bail out.	354 // This is an unrecoverable error, so bail out.

383 queued_audio_.clear();	355 queued_audio_.clear();

384 av_frame_unref(av_frame_.get());	356 av_frame_unref(av_frame_.get());

385 return false;	357 return false;

386 }	358 }

387	359

388 // Get the AudioBuffer that the data was decoded into. Adjust the number	360 // Get the AudioBuffer that the data was decoded into. Adjust the number

389 // of frames, in case fewer than requested were actually decoded.	361 // of frames, in case fewer than requested were actually decoded.

390 output = reinterpret_cast<AudioBuffer*>(	362 output = reinterpret_cast<AudioBuffer*>(

391 av_buffer_get_opaque(av_frame_->buf[0]));	363 av_buffer_get_opaque(av_frame_->buf[0]));

392	364

393 DCHECK_EQ(ChannelLayoutToChannelCount(config_.channel_layout()),	365 DCHECK_EQ(ChannelLayoutToChannelCount(config_.channel_layout()),

394 output->channel_count());	366 output->channel_count());

395 original_frames = av_frame_->nb_samples;	367 const int unread_frames = output->frame_count() - av_frame_->nb_samples;

396 int unread_frames = output->frame_count() - original_frames;

397 DCHECK_GE(unread_frames, 0);	368 DCHECK_GE(unread_frames, 0);

398 if (unread_frames > 0)	369 if (unread_frames > 0)

399 output->TrimEnd(unread_frames);	370 output->TrimEnd(unread_frames);

400	371

401 // If there are frames to drop, get rid of as many as we can.

402 if (output_frames_to_drop_ > 0) {

403 int drop = std::min(output->frame_count(), output_frames_to_drop_);

404 output->TrimStart(drop);

405 output_frames_to_drop_ -= drop;

406 }

407

408 decoded_frames = output->frame_count();

409 av_frame_unref(av_frame_.get());	372 av_frame_unref(av_frame_.get());

410 }	373 }

411	374

412 // WARNING: |av_frame_| no longer has valid data at this point.	375 // WARNING: |av_frame_| no longer has valid data at this point.

413	376 const int decoded_frames = frame_decoded ? output->frame_count() : 0;

414 if (decoded_frames > 0) {	377 if (IsEndOfStream(result, decoded_frames, buffer)) {

415 // Set the timestamp/duration once all the extra frames have been

416 // discarded.

417 output->set_timestamp(output_timestamp_helper_->GetTimestamp());

418 output->set_duration(

419 output_timestamp_helper_->GetFrameDuration(decoded_frames));

420 output_timestamp_helper_->AddFrames(decoded_frames);

421 } else if (IsEndOfStream(result, original_frames, buffer)) {

422 DCHECK_EQ(packet.size, 0);	378 DCHECK_EQ(packet.size, 0);

423 output = AudioBuffer::CreateEOSBuffer();	379 queued_audio_.push_back(AudioBuffer::CreateEOSBuffer());

424 } else {	380 } else if (discard_helper_->ProcessBuffers(buffer, output)) {

425 // In case all the frames in the buffer were dropped.	381 queued_audio_.push_back(output);

426 output = NULL;

427 }	382 }

428

429 if (output.get())

430 queued_audio_.push_back(output);

431

432 } while (packet.size > 0);	383 } while (packet.size > 0);

433	384

434 return true;	385 return true;

435 }	386 }

436	387

437 void FFmpegAudioDecoder::ReleaseFFmpegResources() {	388 void FFmpegAudioDecoder::ReleaseFFmpegResources() {

438 codec_context_.reset();	389 codec_context_.reset();

439 av_frame_.reset();	390 av_frame_.reset();

440 }	391 }

441	392

(...skipping 27 matching lines...) Expand all Loading...
469 if (!codec || avcodec_open2(codec_context_.get(), codec, NULL) < 0) {	420 if (!codec || avcodec_open2(codec_context_.get(), codec, NULL) < 0) {

470 DLOG(ERROR) << "Could not initialize audio decoder: "	421 DLOG(ERROR) << "Could not initialize audio decoder: "

471 << codec_context_->codec_id;	422 << codec_context_->codec_id;

472 ReleaseFFmpegResources();	423 ReleaseFFmpegResources();

473 state_ = kUninitialized;	424 state_ = kUninitialized;

474 return false;	425 return false;

475 }	426 }

476	427

477 // Success!	428 // Success!

478 av_frame_.reset(av_frame_alloc());	429 av_frame_.reset(av_frame_alloc());

479 output_timestamp_helper_.reset(	430 discard_helper_.reset(new AudioDiscardHelper(config_.samples_per_second()));

480 new AudioTimestampHelper(config_.samples_per_second()));

481 ResetTimestampState();

482

483 av_sample_format_ = codec_context_->sample_fmt;	431 av_sample_format_ = codec_context_->sample_fmt;

484	432

485 if (codec_context_->channels !=	433 if (codec_context_->channels !=

486 ChannelLayoutToChannelCount(config_.channel_layout())) {	434 ChannelLayoutToChannelCount(config_.channel_layout())) {

487 DLOG(ERROR) << "Audio configuration specified "	435 DLOG(ERROR) << "Audio configuration specified "

488 << ChannelLayoutToChannelCount(config_.channel_layout())	436 << ChannelLayoutToChannelCount(config_.channel_layout())

489 << " channels, but FFmpeg thinks the file contains "	437 << " channels, but FFmpeg thinks the file contains "

490 << codec_context_->channels << " channels";	438 << codec_context_->channels << " channels";

491 ReleaseFFmpegResources();	439 ReleaseFFmpegResources();

492 state_ = kUninitialized;	440 state_ = kUninitialized;

493 return false;	441 return false;

494 }	442 }

495	443

496 output_frames_to_drop_ = config_.codec_delay();	444 ResetTimestampState();

497 return true;	445 return true;

498 }	446 }

499	447

500 void FFmpegAudioDecoder::ResetTimestampState() {	448 void FFmpegAudioDecoder::ResetTimestampState() {

501 output_timestamp_helper_->SetBaseTimestamp(kNoTimestamp());	449 discard_helper_->Reset(config_.codec_delay());

502 last_input_timestamp_ = kNoTimestamp();

503 output_frames_to_drop_ = 0;

504 }	450 }

505	451

506 } // namespace media	452 } // namespace media

OLD	NEW

« media/filters/ffmpeg_audio_decoder.h ('K') | « media/filters/ffmpeg_audio_decoder.h ('k') | media/filters/opus_audio_decoder.h » ('j') | media/filters/opus_audio_decoder.cc » ('J')