| OLD | NEW |
| 1 // Copyright (c) 2012 The Chromium Authors. All rights reserved. | 1 // Copyright (c) 2012 The Chromium Authors. All rights reserved. |
| 2 // Use of this source code is governed by a BSD-style license that can be | 2 // Use of this source code is governed by a BSD-style license that can be |
| 3 // found in the LICENSE file. | 3 // found in the LICENSE file. |
| 4 | 4 |
| 5 #include "media/filters/ffmpeg_audio_decoder.h" | 5 #include "media/filters/ffmpeg_audio_decoder.h" |
| 6 | 6 |
| 7 #include "base/bind.h" | 7 #include "base/bind.h" |
| 8 #include "base/callback_helpers.h" | 8 #include "base/callback_helpers.h" |
| 9 #include "base/location.h" | 9 #include "base/location.h" |
| 10 #include "base/single_thread_task_runner.h" | 10 #include "base/single_thread_task_runner.h" |
| (...skipping 55 matching lines...) Expand 10 before | Expand all | Expand 10 after Loading... |
| 66 // AudioBuffer allocated, so unref it. | 66 // AudioBuffer allocated, so unref it. |
| 67 static void ReleaseAudioBufferImpl(void* opaque, uint8* data) { | 67 static void ReleaseAudioBufferImpl(void* opaque, uint8* data) { |
| 68 scoped_refptr<AudioBuffer> buffer; | 68 scoped_refptr<AudioBuffer> buffer; |
| 69 buffer.swap(reinterpret_cast<AudioBuffer**>(&opaque)); | 69 buffer.swap(reinterpret_cast<AudioBuffer**>(&opaque)); |
| 70 } | 70 } |
| 71 | 71 |
| 72 FFmpegAudioDecoder::FFmpegAudioDecoder( | 72 FFmpegAudioDecoder::FFmpegAudioDecoder( |
| 73 const scoped_refptr<base::SingleThreadTaskRunner>& task_runner) | 73 const scoped_refptr<base::SingleThreadTaskRunner>& task_runner) |
| 74 : task_runner_(task_runner), | 74 : task_runner_(task_runner), |
| 75 weak_factory_(this), | 75 weak_factory_(this), |
| 76 demuxer_stream_(NULL), | 76 state_(kUninitialized), |
| 77 bytes_per_channel_(0), | 77 bytes_per_channel_(0), |
| 78 channel_layout_(CHANNEL_LAYOUT_NONE), | 78 channel_layout_(CHANNEL_LAYOUT_NONE), |
| 79 channels_(0), | 79 channels_(0), |
| 80 samples_per_second_(0), | 80 samples_per_second_(0), |
| 81 av_sample_format_(0), | 81 av_sample_format_(0), |
| 82 last_input_timestamp_(kNoTimestamp()), | 82 last_input_timestamp_(kNoTimestamp()), |
| 83 output_frames_to_drop_(0) { | 83 output_frames_to_drop_(0) {} |
| 84 |
| 85 FFmpegAudioDecoder::~FFmpegAudioDecoder() { |
| 86 DCHECK_EQ(state_, kUninitialized); |
| 87 DCHECK(!codec_context_); |
| 88 DCHECK(!av_frame_); |
| 84 } | 89 } |
| 85 | 90 |
| 86 void FFmpegAudioDecoder::Initialize( | 91 void FFmpegAudioDecoder::Initialize(const AudioDecoderConfig& config, |
| 87 DemuxerStream* stream, | 92 const PipelineStatusCB& status_cb) { |
| 88 const PipelineStatusCB& status_cb, | |
| 89 const StatisticsCB& statistics_cb) { | |
| 90 DCHECK(task_runner_->BelongsToCurrentThread()); | 93 DCHECK(task_runner_->BelongsToCurrentThread()); |
| 94 DCHECK(decode_cb_.is_null()); |
| 95 DCHECK(reset_cb_.is_null()); |
| 96 DCHECK(!config.is_encrypted()); |
| 97 |
| 98 FFmpegGlue::InitializeFFmpeg(); |
| 99 weak_this_ = weak_factory_.GetWeakPtr(); |
| 100 |
| 101 config_ = config; |
| 91 PipelineStatusCB initialize_cb = BindToCurrentLoop(status_cb); | 102 PipelineStatusCB initialize_cb = BindToCurrentLoop(status_cb); |
| 92 | 103 |
| 93 FFmpegGlue::InitializeFFmpeg(); | 104 if (!config.IsValidConfig() || !ConfigureDecoder()) { |
| 94 | 105 initialize_cb.Run(DECODER_ERROR_NOT_SUPPORTED); |
| 95 if (demuxer_stream_) { | |
| 96 // TODO(scherkus): initialization currently happens more than once in | |
| 97 // PipelineIntegrationTest.BasicPlayback. | |
| 98 LOG(ERROR) << "Initialize has already been called."; | |
| 99 CHECK(false); | |
| 100 } | |
| 101 | |
| 102 weak_this_ = weak_factory_.GetWeakPtr(); | |
| 103 demuxer_stream_ = stream; | |
| 104 | |
| 105 if (!ConfigureDecoder()) { | |
| 106 status_cb.Run(DECODER_ERROR_NOT_SUPPORTED); | |
| 107 return; | 106 return; |
| 108 } | 107 } |
| 109 | 108 |
| 110 statistics_cb_ = statistics_cb; | 109 // Success! |
| 110 state_ = kNormal; |
| 111 initialize_cb.Run(PIPELINE_OK); | 111 initialize_cb.Run(PIPELINE_OK); |
| 112 } | 112 } |
| 113 | 113 |
| 114 void FFmpegAudioDecoder::Read(const ReadCB& read_cb) { | 114 void FFmpegAudioDecoder::Decode(const scoped_refptr<DecoderBuffer>& buffer, |
| 115 const DecodeCB& decode_cb) { |
| 115 DCHECK(task_runner_->BelongsToCurrentThread()); | 116 DCHECK(task_runner_->BelongsToCurrentThread()); |
| 116 DCHECK(!read_cb.is_null()); | 117 DCHECK(!decode_cb.is_null()); |
| 117 CHECK(read_cb_.is_null()) << "Overlapping decodes are not supported."; | 118 CHECK_NE(state_, kUninitialized); |
| 118 DCHECK(reset_cb_.is_null()); | 119 CHECK(decode_cb_.is_null()) << "Overlapping decodes are not supported."; |
| 119 DCHECK(stop_cb_.is_null()); | 120 decode_cb_ = BindToCurrentLoop(decode_cb); |
| 120 | 121 |
| 121 read_cb_ = BindToCurrentLoop(read_cb); | 122 if (state_ == kError) { |
| 122 | 123 base::ResetAndReturn(&decode_cb_).Run(kDecodeError, NULL); |
| 123 // If we don't have any queued audio from the last packet we decoded, ask for | |
| 124 // more data from the demuxer to satisfy this read. | |
| 125 if (queued_audio_.empty()) { | |
| 126 ReadFromDemuxerStream(); | |
| 127 return; | 124 return; |
| 128 } | 125 } |
| 129 | 126 |
| 130 base::ResetAndReturn(&read_cb_).Run( | 127 // Return empty frames if decoding has finished. |
| 131 queued_audio_.front().status, queued_audio_.front().buffer); | 128 if (state_ == kDecodeFinished) { |
| 129 base::ResetAndReturn(&decode_cb_).Run(kOk, AudioBuffer::CreateEOSBuffer()); |
| 130 return; |
| 131 } |
| 132 |
| 133 DecodeBuffer(buffer); |
| 134 } |
| 135 |
| 136 scoped_refptr<AudioBuffer> FFmpegAudioDecoder::GetAudioBuffer( |
| 137 AudioDecoder::Status* status) { |
| 138 DCHECK(status); |
| 139 if (queued_audio_.empty()) { |
| 140 return NULL; |
| 141 } |
| 142 *status = queued_audio_.front().status; |
| 143 scoped_refptr<AudioBuffer> out = queued_audio_.front().buffer; |
| 132 queued_audio_.pop_front(); | 144 queued_audio_.pop_front(); |
| 145 return out; |
| 133 } | 146 } |
| 134 | 147 |
| 135 int FFmpegAudioDecoder::bits_per_channel() { | 148 int FFmpegAudioDecoder::bits_per_channel() { |
| 136 DCHECK(task_runner_->BelongsToCurrentThread()); | |
| 137 return bytes_per_channel_ * 8; | 149 return bytes_per_channel_ * 8; |
| 138 } | 150 } |
| 139 | 151 |
| 140 ChannelLayout FFmpegAudioDecoder::channel_layout() { | 152 ChannelLayout FFmpegAudioDecoder::channel_layout() { |
| 141 DCHECK(task_runner_->BelongsToCurrentThread()); | |
| 142 return channel_layout_; | 153 return channel_layout_; |
| 143 } | 154 } |
| 144 | 155 |
| 145 int FFmpegAudioDecoder::samples_per_second() { | 156 int FFmpegAudioDecoder::samples_per_second() { |
| 146 DCHECK(task_runner_->BelongsToCurrentThread()); | |
| 147 return samples_per_second_; | 157 return samples_per_second_; |
| 148 } | 158 } |
| 149 | 159 |
| 150 void FFmpegAudioDecoder::Reset(const base::Closure& closure) { | 160 void FFmpegAudioDecoder::Reset(const base::Closure& closure) { |
| 151 DCHECK(task_runner_->BelongsToCurrentThread()); | 161 DCHECK(task_runner_->BelongsToCurrentThread()); |
| 162 DCHECK(reset_cb_.is_null()); |
| 152 reset_cb_ = BindToCurrentLoop(closure); | 163 reset_cb_ = BindToCurrentLoop(closure); |
| 153 | 164 |
| 154 // A demuxer read is pending, we'll wait until it finishes. | 165 // Defer the reset if a decode is pending. |
| 155 if (!read_cb_.is_null()) | 166 if (!decode_cb_.is_null()) |
| 156 return; | 167 return; |
| 157 | 168 |
| 158 DoReset(); | 169 DoReset(); |
| 159 } | 170 } |
| 160 | 171 |
| 161 void FFmpegAudioDecoder::Stop(const base::Closure& closure) { | 172 void FFmpegAudioDecoder::Stop(const base::Closure& closure) { |
| 162 DCHECK(task_runner_->BelongsToCurrentThread()); | 173 DCHECK(task_runner_->BelongsToCurrentThread()); |
| 163 stop_cb_ = BindToCurrentLoop(closure); | 174 base::ScopedClosureRunner runner(BindToCurrentLoop(closure)); |
| 164 | 175 |
| 165 // A demuxer read is pending, we'll wait until it finishes. | 176 if (state_ == kUninitialized) |
| 166 if (!read_cb_.is_null()) | |
| 167 return; | 177 return; |
| 168 | 178 |
| 169 if (!reset_cb_.is_null()) { | 179 if (!decode_cb_.is_null()) { |
| 170 DoReset(); | 180 base::ResetAndReturn(&decode_cb_).Run(kAborted, NULL); |
| 171 return; | 181 // Reset is pending only when decode is pending. |
| 182 if (!reset_cb_.is_null()) |
| 183 base::ResetAndReturn(&reset_cb_).Run(); |
| 172 } | 184 } |
| 173 | 185 |
| 174 DoStop(); | 186 ReleaseFFmpegResources(); |
| 187 ResetTimestampState(); |
| 188 state_ = kUninitialized; |
| 175 } | 189 } |
| 176 | 190 |
| 177 FFmpegAudioDecoder::~FFmpegAudioDecoder() {} | 191 // Callback called from within FFmpeg to allocate a buffer based on |
| 178 | 192 // the dimensions of |codec_context|. See AVCodecContext.get_buffer2 |
| 193 // documentation inside FFmpeg. |
| 179 int FFmpegAudioDecoder::GetAudioBuffer(AVCodecContext* codec, | 194 int FFmpegAudioDecoder::GetAudioBuffer(AVCodecContext* codec, |
| 180 AVFrame* frame, | 195 AVFrame* frame, |
| 181 int flags) { | 196 int flags) { |
| 182 // Since this routine is called by FFmpeg when a buffer is required for audio | 197 // Since this routine is called by FFmpeg when a buffer is required for audio |
| 183 // data, use the values supplied by FFmpeg (ignoring the current settings). | 198 // data, use the values supplied by FFmpeg (ignoring the current settings). |
| 184 // RunDecodeLoop() gets to determine if the buffer is useable or not. | 199 // FFmpegDecode() gets to determine if the buffer is useable or not. |
| 185 AVSampleFormat format = static_cast<AVSampleFormat>(frame->format); | 200 AVSampleFormat format = static_cast<AVSampleFormat>(frame->format); |
| 186 SampleFormat sample_format = AVSampleFormatToSampleFormat(format); | 201 SampleFormat sample_format = AVSampleFormatToSampleFormat(format); |
| 187 int channels = DetermineChannels(frame); | 202 int channels = DetermineChannels(frame); |
| 188 if ((channels <= 0) || (channels >= limits::kMaxChannels)) { | 203 if ((channels <= 0) || (channels >= limits::kMaxChannels)) { |
| 189 DLOG(ERROR) << "Requested number of channels (" << channels | 204 DLOG(ERROR) << "Requested number of channels (" << channels |
| 190 << ") exceeds limit."; | 205 << ") exceeds limit."; |
| 191 return AVERROR(EINVAL); | 206 return AVERROR(EINVAL); |
| 192 } | 207 } |
| 193 | 208 |
| 194 int bytes_per_channel = SampleFormatToBytesPerChannel(sample_format); | 209 int bytes_per_channel = SampleFormatToBytesPerChannel(sample_format); |
| (...skipping 39 matching lines...) Expand 10 before | Expand all | Expand 10 after Loading... |
| 234 | 249 |
| 235 // Now create an AVBufferRef for the data just allocated. It will own the | 250 // Now create an AVBufferRef for the data just allocated. It will own the |
| 236 // reference to the AudioBuffer object. | 251 // reference to the AudioBuffer object. |
| 237 void* opaque = NULL; | 252 void* opaque = NULL; |
| 238 buffer.swap(reinterpret_cast<AudioBuffer**>(&opaque)); | 253 buffer.swap(reinterpret_cast<AudioBuffer**>(&opaque)); |
| 239 frame->buf[0] = av_buffer_create( | 254 frame->buf[0] = av_buffer_create( |
| 240 frame->data[0], buffer_size_in_bytes, ReleaseAudioBufferImpl, opaque, 0); | 255 frame->data[0], buffer_size_in_bytes, ReleaseAudioBufferImpl, opaque, 0); |
| 241 return 0; | 256 return 0; |
| 242 } | 257 } |
| 243 | 258 |
| 244 void FFmpegAudioDecoder::DoStop() { | 259 void FFmpegAudioDecoder::DoReset() { |
| 245 DCHECK(task_runner_->BelongsToCurrentThread()); | 260 DCHECK(decode_cb_.is_null()); |
| 246 DCHECK(!stop_cb_.is_null()); | 261 DCHECK(!reset_cb_.is_null()); |
| 247 DCHECK(read_cb_.is_null()); | |
| 248 DCHECK(reset_cb_.is_null()); | |
| 249 | 262 |
| 263 avcodec_flush_buffers(codec_context_.get()); |
| 264 state_ = kNormal; |
| 250 ResetTimestampState(); | 265 ResetTimestampState(); |
| 251 queued_audio_.clear(); | 266 base::ResetAndReturn(&reset_cb_).Run(); |
| 252 ReleaseFFmpegResources(); | |
| 253 base::ResetAndReturn(&stop_cb_).Run(); | |
| 254 } | 267 } |
| 255 | 268 |
| 256 void FFmpegAudioDecoder::DoReset() { | 269 void FFmpegAudioDecoder::DecodeBuffer( |
| 270 const scoped_refptr<DecoderBuffer>& buffer) { |
| 257 DCHECK(task_runner_->BelongsToCurrentThread()); | 271 DCHECK(task_runner_->BelongsToCurrentThread()); |
| 258 DCHECK(!reset_cb_.is_null()); | 272 DCHECK_NE(state_, kUninitialized); |
| 259 DCHECK(read_cb_.is_null()); | 273 DCHECK_NE(state_, kDecodeFinished); |
| 274 DCHECK_NE(state_, kError); |
| 275 DCHECK(reset_cb_.is_null()); |
| 276 DCHECK(!decode_cb_.is_null()); |
| 260 | 277 |
| 261 avcodec_flush_buffers(codec_context_.get()); | 278 DCHECK(buffer && queued_audio_.empty()); |
| 262 ResetTimestampState(); | |
| 263 queued_audio_.clear(); | |
| 264 base::ResetAndReturn(&reset_cb_).Run(); | |
| 265 | 279 |
| 266 if (!stop_cb_.is_null()) | 280 // During decode, because reads are issued asynchronously, it is possible to |
| 267 DoStop(); | 281 // receive multiple end of stream buffers since each decode is acked. When the |
| 268 } | 282 // first end of stream buffer is read, FFmpeg may still have frames queued |
| 283 // up in the decoder so we need to go through the decode loop until it stops |
| 284 // giving sensible data. After that, the decoder should output empty |
| 285 // frames. There are three states the decoder can be in: |
| 286 // |
| 287 // kNormal: This is the starting state. Buffers are decoded. Decode errors |
| 288 // are discarded. |
| 289 // kFlushCodec: There isn't any more input data. Call avcodec_decode_audio4 |
| 290 // until no more data is returned to flush out remaining |
| 291 // frames. The input buffer is ignored at this point. |
| 292 // kDecodeFinished: All calls return empty frames. |
| 293 // kError: Unexpected error happened. |
| 294 // |
| 295 // These are the possible state transitions. |
| 296 // |
| 297 // kNormal -> kFlushCodec: |
| 298 // When buffer->end_of_stream() is first true. |
| 299 // kNormal -> kError: |
| 300 // A decoding error occurs and decoding needs to stop. |
| 301 // kFlushCodec -> kDecodeFinished: |
| 302 // When avcodec_decode_audio4() returns 0 data. |
| 303 // kFlushCodec -> kError: |
| 304 // When avcodec_decode_audio4() errors out. |
| 305 // (any state) -> kNormal: |
| 306 // Any time Reset() is called. |
| 269 | 307 |
| 270 void FFmpegAudioDecoder::ReadFromDemuxerStream() { | 308 // Make sure we are notified if http://crbug.com/49709 returns. Issue also |
| 271 DCHECK(!read_cb_.is_null()); | 309 // occurs with some damaged files. |
| 272 demuxer_stream_->Read(base::Bind( | 310 if (!buffer->end_of_stream() && buffer->timestamp() == kNoTimestamp() && |
| 273 &FFmpegAudioDecoder::BufferReady, weak_this_)); | 311 output_timestamp_helper_->base_timestamp() == kNoTimestamp()) { |
| 274 } | 312 DVLOG(1) << "Received a buffer without timestamps!"; |
| 275 | 313 base::ResetAndReturn(&decode_cb_).Run(kDecodeError, NULL); |
| 276 void FFmpegAudioDecoder::BufferReady( | |
| 277 DemuxerStream::Status status, | |
| 278 const scoped_refptr<DecoderBuffer>& input) { | |
| 279 DCHECK(task_runner_->BelongsToCurrentThread()); | |
| 280 DCHECK(!read_cb_.is_null()); | |
| 281 DCHECK(queued_audio_.empty()); | |
| 282 DCHECK_EQ(status != DemuxerStream::kOk, !input.get()) << status; | |
| 283 | |
| 284 // Pending Reset: ignore the buffer we just got, send kAborted to |read_cb_| | |
| 285 // and carry out the Reset(). | |
| 286 // If there happens to also be a pending Stop(), that will be handled at | |
| 287 // the end of DoReset(). | |
| 288 if (!reset_cb_.is_null()) { | |
| 289 base::ResetAndReturn(&read_cb_).Run(kAborted, NULL); | |
| 290 DoReset(); | |
| 291 return; | 314 return; |
| 292 } | 315 } |
| 293 | 316 |
| 294 // Pending Stop: ignore the buffer we just got, send kAborted to |read_cb_| | 317 if (!buffer->end_of_stream()) { |
| 295 // and carry out the Stop(). | 318 if (last_input_timestamp_ == kNoTimestamp() && |
| 296 if (!stop_cb_.is_null()) { | 319 codec_context_->codec_id == AV_CODEC_ID_VORBIS && |
| 297 base::ResetAndReturn(&read_cb_).Run(kAborted, NULL); | 320 buffer->timestamp() < base::TimeDelta()) { |
| 298 DoStop(); | 321 // Dropping frames for negative timestamps as outlined in section A.2 |
| 322 // in the Vorbis spec. http://xiph.org/vorbis/doc/Vorbis_I_spec.html |
| 323 output_frames_to_drop_ = floor( |
| 324 0.5 + -buffer->timestamp().InSecondsF() * samples_per_second_); |
| 325 } else { |
| 326 if (last_input_timestamp_ != kNoTimestamp() && |
| 327 buffer->timestamp() < last_input_timestamp_) { |
| 328 const base::TimeDelta diff = |
| 329 buffer->timestamp() - last_input_timestamp_; |
| 330 DLOG(WARNING) |
| 331 << "Input timestamps are not monotonically increasing! " |
| 332 << " ts " << buffer->timestamp().InMicroseconds() << " us" |
| 333 << " diff " << diff.InMicroseconds() << " us"; |
| 334 } |
| 335 |
| 336 last_input_timestamp_ = buffer->timestamp(); |
| 337 } |
| 338 } |
| 339 |
| 340 // Transition to kFlushCodec on the first end of stream buffer. |
| 341 if (state_ == kNormal && buffer->end_of_stream()) { |
| 342 state_ = kFlushCodec; |
| 343 } |
| 344 |
| 345 scoped_refptr<AudioBuffer> audio_buffer; |
| 346 if (!FFmpegDecode(buffer)) { |
| 347 state_ = kError; |
| 348 base::ResetAndReturn(&decode_cb_).Run(kDecodeError, NULL); |
| 299 return; | 349 return; |
| 300 } | 350 } |
| 301 | 351 |
| 302 if (status == DemuxerStream::kAborted) { | 352 if (queued_audio_.empty()) { |
| 303 DCHECK(!input.get()); | 353 if (state_ == kFlushCodec) { |
| 304 base::ResetAndReturn(&read_cb_).Run(kAborted, NULL); | 354 DCHECK(buffer->end_of_stream()); |
| 355 state_ = kDecodeFinished; |
| 356 base::ResetAndReturn(&decode_cb_) |
| 357 .Run(kOk, AudioBuffer::CreateEOSBuffer()); |
| 358 return; |
| 359 } |
| 360 |
| 361 base::ResetAndReturn(&decode_cb_).Run(kNotEnoughData, NULL); |
| 305 return; | 362 return; |
| 306 } | 363 } |
| 307 | 364 |
| 308 if (status == DemuxerStream::kConfigChanged) { | 365 base::ResetAndReturn(&decode_cb_) |
| 309 DCHECK(!input.get()); | 366 .Run(queued_audio_.front().status, queued_audio_.front().buffer); |
| 310 | |
| 311 // Send a "end of stream" buffer to the decode loop | |
| 312 // to output any remaining data still in the decoder. | |
| 313 RunDecodeLoop(DecoderBuffer::CreateEOSBuffer(), true); | |
| 314 | |
| 315 DVLOG(1) << "Config changed."; | |
| 316 | |
| 317 if (!ConfigureDecoder()) { | |
| 318 base::ResetAndReturn(&read_cb_).Run(kDecodeError, NULL); | |
| 319 return; | |
| 320 } | |
| 321 | |
| 322 ResetTimestampState(); | |
| 323 | |
| 324 if (queued_audio_.empty()) { | |
| 325 ReadFromDemuxerStream(); | |
| 326 return; | |
| 327 } | |
| 328 | |
| 329 base::ResetAndReturn(&read_cb_).Run( | |
| 330 queued_audio_.front().status, queued_audio_.front().buffer); | |
| 331 queued_audio_.pop_front(); | |
| 332 return; | |
| 333 } | |
| 334 | |
| 335 DCHECK_EQ(status, DemuxerStream::kOk); | |
| 336 DCHECK(input.get()); | |
| 337 | |
| 338 // Make sure we are notified if http://crbug.com/49709 returns. Issue also | |
| 339 // occurs with some damaged files. | |
| 340 if (!input->end_of_stream() && input->timestamp() == kNoTimestamp() && | |
| 341 output_timestamp_helper_->base_timestamp() == kNoTimestamp()) { | |
| 342 DVLOG(1) << "Received a buffer without timestamps!"; | |
| 343 base::ResetAndReturn(&read_cb_).Run(kDecodeError, NULL); | |
| 344 return; | |
| 345 } | |
| 346 | |
| 347 if (!input->end_of_stream()) { | |
| 348 if (last_input_timestamp_ == kNoTimestamp() && | |
| 349 codec_context_->codec_id == AV_CODEC_ID_VORBIS && | |
| 350 input->timestamp() < base::TimeDelta()) { | |
| 351 // Dropping frames for negative timestamps as outlined in section A.2 | |
| 352 // in the Vorbis spec. http://xiph.org/vorbis/doc/Vorbis_I_spec.html | |
| 353 output_frames_to_drop_ = floor( | |
| 354 0.5 + -input->timestamp().InSecondsF() * samples_per_second_); | |
| 355 } else { | |
| 356 if (last_input_timestamp_ != kNoTimestamp() && | |
| 357 input->timestamp() < last_input_timestamp_) { | |
| 358 const base::TimeDelta diff = input->timestamp() - last_input_timestamp_; | |
| 359 DLOG(WARNING) | |
| 360 << "Input timestamps are not monotonically increasing! " | |
| 361 << " ts " << input->timestamp().InMicroseconds() << " us" | |
| 362 << " diff " << diff.InMicroseconds() << " us"; | |
| 363 } | |
| 364 | |
| 365 last_input_timestamp_ = input->timestamp(); | |
| 366 } | |
| 367 } | |
| 368 | |
| 369 RunDecodeLoop(input, false); | |
| 370 | |
| 371 // We exhausted the provided packet, but it wasn't enough for a frame. Ask | |
| 372 // for more data in order to fulfill this read. | |
| 373 if (queued_audio_.empty()) { | |
| 374 ReadFromDemuxerStream(); | |
| 375 return; | |
| 376 } | |
| 377 | |
| 378 // Execute callback to return the first frame we decoded. | |
| 379 base::ResetAndReturn(&read_cb_).Run( | |
| 380 queued_audio_.front().status, queued_audio_.front().buffer); | |
| 381 queued_audio_.pop_front(); | 367 queued_audio_.pop_front(); |
| 382 } | 368 } |
| 383 | 369 |
| 384 bool FFmpegAudioDecoder::ConfigureDecoder() { | 370 bool FFmpegAudioDecoder::FFmpegDecode( |
| 385 const AudioDecoderConfig& config = demuxer_stream_->audio_decoder_config(); | 371 const scoped_refptr<DecoderBuffer>& buffer) { |
| 386 | 372 |
| 387 if (!config.IsValidConfig()) { | 373 DCHECK(queued_audio_.empty()); |
| 388 DLOG(ERROR) << "Invalid audio stream -" | |
| 389 << " codec: " << config.codec() | |
| 390 << " channel layout: " << config.channel_layout() | |
| 391 << " bits per channel: " << config.bits_per_channel() | |
| 392 << " samples per second: " << config.samples_per_second(); | |
| 393 return false; | |
| 394 } | |
| 395 | 374 |
| 396 if (config.is_encrypted()) { | |
| 397 DLOG(ERROR) << "Encrypted audio stream not supported"; | |
| 398 return false; | |
| 399 } | |
| 400 | |
| 401 if (codec_context_.get() && | |
| 402 (bytes_per_channel_ != config.bytes_per_channel() || | |
| 403 channel_layout_ != config.channel_layout() || | |
| 404 samples_per_second_ != config.samples_per_second())) { | |
| 405 DVLOG(1) << "Unsupported config change :"; | |
| 406 DVLOG(1) << "\tbytes_per_channel : " << bytes_per_channel_ | |
| 407 << " -> " << config.bytes_per_channel(); | |
| 408 DVLOG(1) << "\tchannel_layout : " << channel_layout_ | |
| 409 << " -> " << config.channel_layout(); | |
| 410 DVLOG(1) << "\tsample_rate : " << samples_per_second_ | |
| 411 << " -> " << config.samples_per_second(); | |
| 412 return false; | |
| 413 } | |
| 414 | |
| 415 // Release existing decoder resources if necessary. | |
| 416 ReleaseFFmpegResources(); | |
| 417 | |
| 418 // Initialize AVCodecContext structure. | |
| 419 codec_context_.reset(avcodec_alloc_context3(NULL)); | |
| 420 AudioDecoderConfigToAVCodecContext(config, codec_context_.get()); | |
| 421 | |
| 422 codec_context_->opaque = this; | |
| 423 codec_context_->get_buffer2 = GetAudioBufferImpl; | |
| 424 codec_context_->refcounted_frames = 1; | |
| 425 | |
| 426 AVCodec* codec = avcodec_find_decoder(codec_context_->codec_id); | |
| 427 if (!codec || avcodec_open2(codec_context_.get(), codec, NULL) < 0) { | |
| 428 DLOG(ERROR) << "Could not initialize audio decoder: " | |
| 429 << codec_context_->codec_id; | |
| 430 return false; | |
| 431 } | |
| 432 | |
| 433 // Success! | |
| 434 av_frame_.reset(av_frame_alloc()); | |
| 435 channel_layout_ = config.channel_layout(); | |
| 436 samples_per_second_ = config.samples_per_second(); | |
| 437 output_timestamp_helper_.reset( | |
| 438 new AudioTimestampHelper(config.samples_per_second())); | |
| 439 | |
| 440 // Store initial values to guard against midstream configuration changes. | |
| 441 channels_ = codec_context_->channels; | |
| 442 if (channels_ != ChannelLayoutToChannelCount(channel_layout_)) { | |
| 443 DLOG(ERROR) << "Audio configuration specified " | |
| 444 << ChannelLayoutToChannelCount(channel_layout_) | |
| 445 << " channels, but FFmpeg thinks the file contains " | |
| 446 << channels_ << " channels"; | |
| 447 return false; | |
| 448 } | |
| 449 av_sample_format_ = codec_context_->sample_fmt; | |
| 450 sample_format_ = AVSampleFormatToSampleFormat( | |
| 451 static_cast<AVSampleFormat>(av_sample_format_)); | |
| 452 bytes_per_channel_ = SampleFormatToBytesPerChannel(sample_format_); | |
| 453 | |
| 454 return true; | |
| 455 } | |
| 456 | |
| 457 void FFmpegAudioDecoder::ReleaseFFmpegResources() { | |
| 458 codec_context_.reset(); | |
| 459 av_frame_.reset(); | |
| 460 } | |
| 461 | |
| 462 void FFmpegAudioDecoder::ResetTimestampState() { | |
| 463 output_timestamp_helper_->SetBaseTimestamp(kNoTimestamp()); | |
| 464 last_input_timestamp_ = kNoTimestamp(); | |
| 465 output_frames_to_drop_ = 0; | |
| 466 } | |
| 467 | |
| 468 void FFmpegAudioDecoder::RunDecodeLoop( | |
| 469 const scoped_refptr<DecoderBuffer>& input, | |
| 470 bool skip_eos_append) { | |
| 471 AVPacket packet; | 375 AVPacket packet; |
| 472 av_init_packet(&packet); | 376 av_init_packet(&packet); |
| 473 if (input->end_of_stream()) { | 377 if (buffer->end_of_stream()) { |
| 474 packet.data = NULL; | 378 packet.data = NULL; |
| 475 packet.size = 0; | 379 packet.size = 0; |
| 476 } else { | 380 } else { |
| 477 packet.data = const_cast<uint8*>(input->data()); | 381 packet.data = const_cast<uint8*>(buffer->data()); |
| 478 packet.size = input->data_size(); | 382 packet.size = buffer->data_size(); |
| 479 } | 383 } |
| 480 | 384 |
| 481 // Each audio packet may contain several frames, so we must call the decoder | 385 // Each audio packet may contain several frames, so we must call the decoder |
| 482 // until we've exhausted the packet. Regardless of the packet size we always | 386 // until we've exhausted the packet. Regardless of the packet size we always |
| 483 // want to hand it to the decoder at least once, otherwise we would end up | 387 // want to hand it to the decoder at least once, otherwise we would end up |
| 484 // skipping end of stream packets since they have a size of zero. | 388 // skipping end of stream packets since they have a size of zero. |
| 485 do { | 389 do { |
| 486 int frame_decoded = 0; | 390 int frame_decoded = 0; |
| 487 int result = avcodec_decode_audio4( | 391 int result = avcodec_decode_audio4( |
| 488 codec_context_.get(), av_frame_.get(), &frame_decoded, &packet); | 392 codec_context_.get(), av_frame_.get(), &frame_decoded, &packet); |
| 489 | 393 |
| 490 if (result < 0) { | 394 if (result < 0) { |
| 491 DCHECK(!input->end_of_stream()) | 395 DCHECK(!buffer->end_of_stream()) |
| 492 << "End of stream buffer produced an error! " | 396 << "End of stream buffer produced an error! " |
| 493 << "This is quite possibly a bug in the audio decoder not handling " | 397 << "This is quite possibly a bug in the audio decoder not handling " |
| 494 << "end of stream AVPackets correctly."; | 398 << "end of stream AVPackets correctly."; |
| 495 | 399 |
| 496 DLOG(WARNING) | 400 DLOG(WARNING) |
| 497 << "Failed to decode an audio frame with timestamp: " | 401 << "Failed to decode an audio frame with timestamp: " |
| 498 << input->timestamp().InMicroseconds() << " us, duration: " | 402 << buffer->timestamp().InMicroseconds() << " us, duration: " |
| 499 << input->duration().InMicroseconds() << " us, packet size: " | 403 << buffer->duration().InMicroseconds() << " us, packet size: " |
| 500 << input->data_size() << " bytes"; | 404 << buffer->data_size() << " bytes"; |
| 501 | 405 |
| 502 break; | 406 break; |
| 503 } | 407 } |
| 504 | 408 |
| 505 // Update packet size and data pointer in case we need to call the decoder | 409 // Update packet size and data pointer in case we need to call the decoder |
| 506 // with the remaining bytes from this packet. | 410 // with the remaining bytes from this packet. |
| 507 packet.size -= result; | 411 packet.size -= result; |
| 508 packet.data += result; | 412 packet.data += result; |
| 509 | 413 |
| 510 if (output_timestamp_helper_->base_timestamp() == kNoTimestamp() && | 414 if (output_timestamp_helper_->base_timestamp() == kNoTimestamp() && |
| 511 !input->end_of_stream()) { | 415 !buffer->end_of_stream()) { |
| 512 DCHECK(input->timestamp() != kNoTimestamp()); | 416 DCHECK(buffer->timestamp() != kNoTimestamp()); |
| 513 if (output_frames_to_drop_ > 0) { | 417 if (output_frames_to_drop_ > 0) { |
| 514 // Currently Vorbis is the only codec that causes us to drop samples. | 418 // Currently Vorbis is the only codec that causes us to drop samples. |
| 515 // If we have to drop samples it always means the timeline starts at 0. | 419 // If we have to drop samples it always means the timeline starts at 0. |
| 516 DCHECK_EQ(codec_context_->codec_id, AV_CODEC_ID_VORBIS); | 420 DCHECK_EQ(codec_context_->codec_id, AV_CODEC_ID_VORBIS); |
| 517 output_timestamp_helper_->SetBaseTimestamp(base::TimeDelta()); | 421 output_timestamp_helper_->SetBaseTimestamp(base::TimeDelta()); |
| 518 } else { | 422 } else { |
| 519 output_timestamp_helper_->SetBaseTimestamp(input->timestamp()); | 423 output_timestamp_helper_->SetBaseTimestamp(buffer->timestamp()); |
| 520 } | 424 } |
| 521 } | 425 } |
| 522 | 426 |
| 523 scoped_refptr<AudioBuffer> output; | 427 scoped_refptr<AudioBuffer> output; |
| 524 int decoded_frames = 0; | 428 int decoded_frames = 0; |
| 525 int original_frames = 0; | 429 int original_frames = 0; |
| 526 int channels = DetermineChannels(av_frame_.get()); | 430 int channels = DetermineChannels(av_frame_.get()); |
| 527 if (frame_decoded) { | 431 if (frame_decoded) { |
| 528 if (av_frame_->sample_rate != samples_per_second_ || | 432 |
| 433 // TODO(rileya) Remove this check once we properly support midstream audio |
| 434 // config changes. |
| 435 if (av_frame_->sample_rate != config_.samples_per_second() || |
| 529 channels != channels_ || | 436 channels != channels_ || |
| 530 av_frame_->format != av_sample_format_) { | 437 av_frame_->format != av_sample_format_) { |
| 531 DLOG(ERROR) << "Unsupported midstream configuration change!" | 438 DLOG(ERROR) << "Unsupported midstream configuration change!" |
| 532 << " Sample Rate: " << av_frame_->sample_rate << " vs " | 439 << " Sample Rate: " << av_frame_->sample_rate << " vs " |
| 533 << samples_per_second_ | 440 << samples_per_second_ |
| 534 << ", Channels: " << channels << " vs " | 441 << ", Channels: " << channels << " vs " |
| 535 << channels_ | 442 << channels_ |
| 536 << ", Sample Format: " << av_frame_->format << " vs " | 443 << ", Sample Format: " << av_frame_->format << " vs " |
| 537 << av_sample_format_; | 444 << av_sample_format_; |
| 538 | 445 |
| 539 // This is an unrecoverable error, so bail out. | 446 // This is an unrecoverable error, so bail out. |
| 540 QueuedAudioBuffer queue_entry = { kDecodeError, NULL }; | 447 QueuedAudioBuffer queue_entry = { kDecodeError, NULL }; |
| 541 queued_audio_.push_back(queue_entry); | 448 queued_audio_.push_back(queue_entry); |
| 542 av_frame_unref(av_frame_.get()); | 449 av_frame_unref(av_frame_.get()); |
| 543 break; | 450 break; |
| 544 } | 451 } |
| 545 | 452 |
| 546 // Get the AudioBuffer that the data was decoded into. Adjust the number | 453 // Get the AudioBuffer that the data was decoded into. Adjust the number |
| 547 // of frames, in case fewer than requested were actually decoded. | 454 // of frames, in case fewer than requested were actually decoded. |
| 548 output = reinterpret_cast<AudioBuffer*>( | 455 output = reinterpret_cast<AudioBuffer*>( |
| 549 av_buffer_get_opaque(av_frame_->buf[0])); | 456 av_buffer_get_opaque(av_frame_->buf[0])); |
| 457 |
| 550 DCHECK_EQ(channels_, output->channel_count()); | 458 DCHECK_EQ(channels_, output->channel_count()); |
| 551 original_frames = av_frame_->nb_samples; | 459 original_frames = av_frame_->nb_samples; |
| 552 int unread_frames = output->frame_count() - original_frames; | 460 int unread_frames = output->frame_count() - original_frames; |
| 553 DCHECK_GE(unread_frames, 0); | 461 DCHECK_GE(unread_frames, 0); |
| 554 if (unread_frames > 0) | 462 if (unread_frames > 0) |
| 555 output->TrimEnd(unread_frames); | 463 output->TrimEnd(unread_frames); |
| 556 | 464 |
| 557 // If there are frames to drop, get rid of as many as we can. | 465 // If there are frames to drop, get rid of as many as we can. |
| 558 if (output_frames_to_drop_ > 0) { | 466 if (output_frames_to_drop_ > 0) { |
| 559 int drop = std::min(output->frame_count(), output_frames_to_drop_); | 467 int drop = std::min(output->frame_count(), output_frames_to_drop_); |
| 560 output->TrimStart(drop); | 468 output->TrimStart(drop); |
| 561 output_frames_to_drop_ -= drop; | 469 output_frames_to_drop_ -= drop; |
| 562 } | 470 } |
| 563 | 471 |
| 564 decoded_frames = output->frame_count(); | 472 decoded_frames = output->frame_count(); |
| 565 av_frame_unref(av_frame_.get()); | 473 av_frame_unref(av_frame_.get()); |
| 566 } | 474 } |
| 567 | 475 |
| 568 // WARNING: |av_frame_| no longer has valid data at this point. | 476 // WARNING: |av_frame_| no longer has valid data at this point. |
| 569 | 477 |
| 570 if (decoded_frames > 0) { | 478 if (decoded_frames > 0) { |
| 571 // Set the timestamp/duration once all the extra frames have been | 479 // Set the timestamp/duration once all the extra frames have been |
| 572 // discarded. | 480 // discarded. |
| 573 output->set_timestamp(output_timestamp_helper_->GetTimestamp()); | 481 output->set_timestamp(output_timestamp_helper_->GetTimestamp()); |
| 574 output->set_duration( | 482 output->set_duration( |
| 575 output_timestamp_helper_->GetFrameDuration(decoded_frames)); | 483 output_timestamp_helper_->GetFrameDuration(decoded_frames)); |
| 576 output_timestamp_helper_->AddFrames(decoded_frames); | 484 output_timestamp_helper_->AddFrames(decoded_frames); |
| 577 } else if (IsEndOfStream(result, original_frames, input) && | 485 } else if (IsEndOfStream(result, original_frames, buffer)) { |
| 578 !skip_eos_append) { | |
| 579 DCHECK_EQ(packet.size, 0); | 486 DCHECK_EQ(packet.size, 0); |
| 580 output = AudioBuffer::CreateEOSBuffer(); | 487 output = AudioBuffer::CreateEOSBuffer(); |
| 581 } else { | 488 } else { |
| 582 // In case all the frames in the buffer were dropped. | 489 // In case all the frames in the buffer were dropped. |
| 583 output = NULL; | 490 output = NULL; |
| 584 } | 491 } |
| 585 | 492 |
| 586 if (output.get()) { | 493 if (output.get()) { |
| 587 QueuedAudioBuffer queue_entry = { kOk, output }; | 494 QueuedAudioBuffer queue_entry = { kOk, output }; |
| 588 queued_audio_.push_back(queue_entry); | 495 queued_audio_.push_back(queue_entry); |
| 589 } | 496 } |
| 497 } while (packet.size > 0); |
| 590 | 498 |
| 591 // Decoding finished successfully, update statistics. | 499 return true; |
| 592 if (result > 0) { | 500 } |
| 593 PipelineStatistics statistics; | 501 |
| 594 statistics.audio_bytes_decoded = result; | 502 void FFmpegAudioDecoder::ReleaseFFmpegResources() { |
| 595 statistics_cb_.Run(statistics); | 503 codec_context_.reset(); |
| 596 } | 504 av_frame_.reset(); |
| 597 } while (packet.size > 0); | 505 } |
| 506 |
| 507 bool FFmpegAudioDecoder::ConfigureDecoder() { |
| 508 if (!config_.IsValidConfig()) { |
| 509 DLOG(ERROR) << "Invalid audio stream -" |
| 510 << " codec: " << config_.codec() |
| 511 << " channel layout: " << config_.channel_layout() |
| 512 << " bits per channel: " << config_.bits_per_channel() |
| 513 << " samples per second: " << config_.samples_per_second(); |
| 514 return false; |
| 515 } |
| 516 |
| 517 if (config_.is_encrypted()) { |
| 518 DLOG(ERROR) << "Encrypted audio stream not supported"; |
| 519 return false; |
| 520 } |
| 521 |
| 522 // TODO(rileya) Remove this check once we properly support midstream audio |
| 523 // config changes. |
| 524 if (codec_context_.get() && |
| 525 (bytes_per_channel_ != config_.bytes_per_channel() || |
| 526 channel_layout_ != config_.channel_layout() || |
| 527 samples_per_second_ != config_.samples_per_second())) { |
| 528 DVLOG(1) << "Unsupported config change :"; |
| 529 DVLOG(1) << "\tbytes_per_channel : " << bytes_per_channel_ |
| 530 << " -> " << config_.bytes_per_channel(); |
| 531 DVLOG(1) << "\tchannel_layout : " << channel_layout_ |
| 532 << " -> " << config_.channel_layout(); |
| 533 DVLOG(1) << "\tsample_rate : " << samples_per_second_ |
| 534 << " -> " << config_.samples_per_second(); |
| 535 return false; |
| 536 } |
| 537 |
| 538 // Release existing decoder resources if necessary. |
| 539 ReleaseFFmpegResources(); |
| 540 |
| 541 // Initialize AVCodecContext structure. |
| 542 codec_context_.reset(avcodec_alloc_context3(NULL)); |
| 543 AudioDecoderConfigToAVCodecContext(config_, codec_context_.get()); |
| 544 |
| 545 codec_context_->opaque = this; |
| 546 codec_context_->get_buffer2 = GetAudioBufferImpl; |
| 547 codec_context_->refcounted_frames = 1; |
| 548 |
| 549 AVCodec* codec = avcodec_find_decoder(codec_context_->codec_id); |
| 550 if (!codec || avcodec_open2(codec_context_.get(), codec, NULL) < 0) { |
| 551 DLOG(ERROR) << "Could not initialize audio decoder: " |
| 552 << codec_context_->codec_id; |
| 553 ReleaseFFmpegResources(); |
| 554 state_ = kUninitialized; |
| 555 return false; |
| 556 } |
| 557 |
| 558 // Success! |
| 559 av_frame_.reset(av_frame_alloc()); |
| 560 channel_layout_ = config_.channel_layout(); |
| 561 samples_per_second_ = config_.samples_per_second(); |
| 562 output_timestamp_helper_.reset( |
| 563 new AudioTimestampHelper(config_.samples_per_second())); |
| 564 |
| 565 // Store initial values to guard against midstream configuration changes. |
| 566 channels_ = codec_context_->channels; |
| 567 if (channels_ != ChannelLayoutToChannelCount(channel_layout_)) { |
| 568 DLOG(ERROR) << "Audio configuration specified " |
| 569 << ChannelLayoutToChannelCount(channel_layout_) |
| 570 << " channels, but FFmpeg thinks the file contains " |
| 571 << channels_ << " channels"; |
| 572 return false; |
| 573 } |
| 574 av_sample_format_ = codec_context_->sample_fmt; |
| 575 sample_format_ = AVSampleFormatToSampleFormat( |
| 576 static_cast<AVSampleFormat>(av_sample_format_)); |
| 577 bytes_per_channel_ = SampleFormatToBytesPerChannel(sample_format_); |
| 578 |
| 579 return true; |
| 580 } |
| 581 |
| 582 void FFmpegAudioDecoder::ResetTimestampState() { |
| 583 output_timestamp_helper_->SetBaseTimestamp(kNoTimestamp()); |
| 584 last_input_timestamp_ = kNoTimestamp(); |
| 585 output_frames_to_drop_ = 0; |
| 598 } | 586 } |
| 599 | 587 |
| 600 } // namespace media | 588 } // namespace media |
| OLD | NEW |