media/mp2t/es_parser_adts.cc - Issue 23566013: Mpeg2 TS stream parser for media source.

Side by Side Diff: media/mp2t/es_parser_adts.cc

Issue 23566013: Mpeg2 TS stream parser for media source. (Closed) Base URL: https://chromium.googlesource.com/chromium/src.git@master

Patch Set: Cleanup - address comments from patch set #8 Created 7 years, 3 months ago

Use n/p to move between diff chunks; N/P to move between comments. Draft comments are only viewable by you.

Jump to:

View unified diff | Download patch

OLD	NEW
(Empty)
	1 // Copyright (c) 2013 The Chromium Authors. All rights reserved.

	2 // Use of this source code is governed by a BSD-style license that can be

	3 // found in the LICENSE file.

	4

	5 #include "media/mp2t/es_parser_adts.h"

	6

	7 #include <list>

	8

	9 #include "base/basictypes.h"

	10 #include "base/logging.h"

	11 #include "base/strings/string_number_conversions.h"

	12 #include "media/base/audio_decoder_config.h"
	acolwell GONE FROM CHROMIUM 2013/09/16 06:19:30 nit: Shouldn't need this now since it is in the he nit: Shouldn't need this now since it is in the header. damienv1 2013/09/17 02:58:22 Done. Show quoted text On 2013/09/16 06:19:30, acolwell wrote: > nit: Shouldn't need this now since it is in the header. Done.
	13 #include "media/base/audio_timestamp_helper.h"

	14 #include "media/base/bit_reader.h"

	15 #include "media/base/buffers.h"

	16 #include "media/base/channel_layout.h"

	17 #include "media/base/stream_parser_buffer.h"

	18 #include "media/mp2t/mp2t_common.h"

	19

	20 // Adts header is at least 7 bytes (can be 9 bytes).

	21 static const int kAdtsHeaderMinSize = 7;

	22

	23 static const int adts_frequency_table[16] = {

	24 96000,

	25 88200,

	26 64000,

	27 48000,

	28 44100,

	29 32000,

	30 24000,

	31 22050,

	32 16000,

	33 12000,

	34 11025,

	35 8000,

	36 7350,

	37 0,

	38 0,

	39 0,

	40 };

	41 static const int kMaxSupportedFrequencyIndex = 12;

	42

	43 static media::ChannelLayout adts_channel_layout[8] = {

	44 media::CHANNEL_LAYOUT_NONE,

	45 media::CHANNEL_LAYOUT_MONO,

	46 media::CHANNEL_LAYOUT_STEREO,

	47 media::CHANNEL_LAYOUT_SURROUND,

	48 media::CHANNEL_LAYOUT_4_0,

	49 media::CHANNEL_LAYOUT_5_0_BACK,

	50 media::CHANNEL_LAYOUT_5_1_BACK,

	51 media::CHANNEL_LAYOUT_7_1,

	52 };

	53

	54 // Number of samples per frame.

	55 static const int kNumberSamplesPerAACFrame = 1024;

	56

	57 static int ExtractAdtsFrameSize(const uint8* adts_header) {

	58 return ((static_cast<int>(adts_header[5]) >> 5) \|

	59 (static_cast<int>(adts_header[4]) << 3) \|

	60 ((static_cast<int>(adts_header[3]) & 0x3) << 11));

	61 }

	62

	63 static int ExtractAdtsFrequencyIndex(const uint8* adts_header) {

	64 return ((adts_header[2] >> 2) & 0xf);

	65 }

	66

	67 static int ExtractAdtsChannelConfig(const uint8* adts_header) {

	68 return (((adts_header[3] >> 6) & 0x3) \|

	69 ((adts_header[2] & 0x1) << 2));

	70 }

	71

	72 // Look for an ADTS syncword.

	73 // \|new_pos\| returns

	74 // - either the byte position of the ADTS frame (if found)

	75 // - or the byte position of 1st byte that was not processed (if not found).

	76 // \|frame_sz\| returns the size of the ADTS frame (if found).

	77 // Return whether a syncword was found.

	78 static bool LookForSyncWord(const uint8* raw_es, int raw_es_size,

	79 int pos,

	80 int* new_pos, int* frame_sz) {

	81 int max_offset = raw_es_size - kAdtsHeaderMinSize;
	acolwell GONE FROM CHROMIUM 2013/09/16 06:19:30 nit: DCHECK_GE(pos, 0); DCHECK_LT(pos, raw_es_siz nit: DCHECK_GE(pos, 0); DCHECK_LT(pos, raw_es_size); damienv1 2013/09/17 02:58:22 Done. Except that this should be DCHECK_LE(pos, ra Show quoted text On 2013/09/16 06:19:30, acolwell wrote: > nit: > DCHECK_GE(pos, 0); > DCHECK_LT(pos, raw_es_size); Done. Except that this should be DCHECK_LE(pos, raw_es_size); As \|pos\| can point to the 1st byte that was not processed yet. So if the last byte of the buffer was processed, pos is pointing to \|raw_es_size\|.
	82 if (max_offset < 0)

	83 max_offset = 0;
	acolwell GONE FROM CHROMIUM 2013/09/16 06:19:30 nit: I think it might be clearer if you just set * nit: I think it might be clearer if you just set new_pos and early return here. Also I think there might be a bug in the existing code if pos > 0 && max_offset < 0. new_pos should always be == to pos in this case right? damienv1 2013/09/17 02:58:22 Yes, the new position should remain unchanged if m Show quoted text On 2013/09/16 06:19:30, acolwell wrote: > nit: I think it might be clearer if you just set new_pos and early return here. > > Also I think there might be a bug in the existing code if pos > 0 && max_offset > < 0. new_pos should always be == to pos in this case right? Yes, the new position should remain unchanged if max_offset < 0. I updated the behavior.
	84

	85 for (int offset = pos; offset < max_offset; offset++) {

	86 const uint8* cur_buf = &raw_es[offset];

	87

	88 if ((cur_buf[0] != 0xff) \|\| ((cur_buf[1] & 0xf6) != 0xf0))

	89 // The first 12 bits must be 1.

	90 // The layer field (2 bits) must be set to 0.

	91 continue;

	92

	93 int frame_size = ExtractAdtsFrameSize(cur_buf);

	94 if (frame_size < kAdtsHeaderMinSize)

	95 // Too short to be an ADTS frame.

	96 continue;

	97

	98 // Check whether there is another frame

	99 // \|size\| apart from the current one.

	100 int remaining_size = raw_es_size - offset;

	101 if (remaining_size >= frame_size + 2) {

	102 if ((cur_buf[frame_size] != 0xff) \|\|
	acolwell GONE FROM CHROMIUM 2013/09/16 06:19:30 nit: Replace this and the check above w/ isSyncWor nit: Replace this and the check above w/ isSyncWord() helper call just to make the code a little clearer? damienv1 2013/09/17 02:58:22 Done. Show quoted text On 2013/09/16 06:19:30, acolwell wrote: > nit: Replace this and the check above w/ isSyncWord() helper call just to make > the code a little clearer? Done.
	103 (cur_buf[frame_size + 1] & 0xf6) != 0xf0)

	104 continue;

	105 }

	106

	107 *new_pos = offset;

	108 *frame_sz = frame_size;

	109 return true;

	110 }

	111

	112 *new_pos = max_offset;

	113 return false;

	114 }

	115

	116 namespace media {

	117 namespace mp2t {

	118

	119 EsParserAdts::EsParserAdts(

	120 NewAudioConfigCB new_audio_config_cb,

	121 EmitBufferCB emit_buffer_cb)

	122 : new_audio_config_cb_(new_audio_config_cb),

	123 emit_buffer_cb_(emit_buffer_cb) {

	124 }

	125

	126 EsParserAdts::~EsParserAdts() {

	127 }

	128

	129 bool EsParserAdts::Parse(const uint8* buf, int size,

	130 base::TimeDelta pts,

	131 base::TimeDelta dts) {

	132 int raw_es_size = 0;

	133 const uint8* raw_es = NULL;
	acolwell GONE FROM CHROMIUM 2013/09/16 06:19:30 nit: var init isn't needed here. nit: var init isn't needed here. damienv1 2013/09/17 02:58:22 Done. Show quoted text On 2013/09/16 06:19:30, acolwell wrote: > nit: var init isn't needed here. Done.
	134

	135 // The incoming PTS applies to the access unit that comes just after

	136 // the beginning of \|buf\|.

	137 if (pts != kNoTimestamp()) {

	138 es_byte_queue_.Peek(&raw_es, &raw_es_size);

	139 pts_list_.push_back(EsPts(raw_es_size, pts));

	140 }

	141

	142 // Copy the input data to the ES buffer.

	143 es_byte_queue_.Push(buf, size);

	144 es_byte_queue_.Peek(&raw_es, &raw_es_size);

	145

	146 // Look for every ADTS frame in the ES buffer starting at offset = 0

	147 int es_position = 0;

	148 int frame_size;

	149 while (LookForSyncWord(raw_es, raw_es_size, es_position,

	150 &es_position, &frame_size)) {

	151 DVLOG(LOG_LEVEL_ES) << "ADTS syncword @ pos=" << es_position

	152 << " frame_size=" << frame_size;

	153 DVLOG(LOG_LEVEL_ES) << "ADTS header: "

	154 << base::HexEncode(&raw_es[es_position], 7);

	155

	156 // Do not process the frame if this one is a partial frame.

	157 int remaining_size = raw_es_size - es_position;

	158 if (frame_size > remaining_size)

	159 break;

	160

	161 // Update the audio configuration if needed.

	162 DCHECK_GE(frame_size, kAdtsHeaderMinSize);

	163 if (!UpdateAudioConfiguration(&raw_es[es_position]))

	164 return false;

	165

	166 // Get the PTS & the duration of this access unit.

	167 DCHECK(audio_timestamp_helper_);
	acolwell GONE FROM CHROMIUM 2013/09/16 06:19:30 nit: No need for DCHECK here since the code will c nit: No need for DCHECK here since the code will crash in 4 or 7 lines later. Usually in these types of situations we just let the code crash instead of putting a DCHECK. We tend to use NULL DCHECKs only for method param verification. damienv1 2013/09/17 02:58:22 Done. Show quoted text On 2013/09/16 06:19:30, acolwell wrote: > nit: No need for DCHECK here since the code will crash in 4 or 7 lines later. > Usually in these types of situations we just let the code crash instead of > putting a DCHECK. We tend to use NULL DCHECKs only for method param > verification. Done.
	168 while (!pts_list_.empty() &&

	169 pts_list_.front().first <= es_position) {

	170 audio_timestamp_helper_->SetBaseTimestamp(pts_list_.front().second);
	acolwell GONE FROM CHROMIUM 2013/09/16 06:19:30 Is this here to compensate for gaps in the audio? Is this here to compensate for gaps in the audio? You shouldn't need to do this otherwise since the accumulation of samples should be more accurate and ensures that gaps/overlaps aren't created. I think you should only reset the base if the timestamp is more than a few samples different. damienv1 2013/09/17 02:58:22 1) The timestamp helper has a resolution of 1 samp Show quoted text On 2013/09/16 06:19:30, acolwell wrote: > Is this here to compensate for gaps in the audio? You shouldn't need to do this > otherwise since the accumulation of samples should be more accurate and ensures > that gaps/overlaps aren't created. I think you should only reset the base if the > timestamp is more than a few samples different. 1) The timestamp helper has a resolution of 1 sample. The Mpeg2 TS timestamps have a resolution of 90kHz which in case of AAC is less than a sample (except for 96kHz where it's slightly more). 2) The Mpeg2 TS timestamp should be the one to use as there might be some GAP in the audio as well. I think the ADTS parser should not be the one to decide which PTS to use when there is one coming from the stream.
	171 pts_list_.pop_front();

	172 }

	173

	174 base::TimeDelta current_pts = audio_timestamp_helper_->GetTimestamp();

	175 base::TimeDelta frame_duration =

	176 audio_timestamp_helper_->GetFrameDuration(kNumberSamplesPerAACFrame);

	177

	178 // Emit an audio frame.

	179 bool is_key_frame = true;

	180 scoped_refptr<StreamParserBuffer> stream_parser_buffer =

	181 StreamParserBuffer::CopyFrom(

	182 &raw_es[es_position],

	183 frame_size,

	184 is_key_frame);

	185 stream_parser_buffer->SetDecodeTimestamp(current_pts);

	186 stream_parser_buffer->set_timestamp(current_pts);

	187 stream_parser_buffer->set_duration(frame_duration);

	188 emit_buffer_cb_.Run(stream_parser_buffer);

	189

	190 // Update the PTS of the next frame.

	191 audio_timestamp_helper_->AddFrames(kNumberSamplesPerAACFrame);

	192

	193 // Skip the current frame.

	194 es_position += frame_size;

	195 }

	196

	197 // Discard all the bytes that have been processed.

	198 DiscardEs(es_position);

	199

	200 return true;

	201 }

	202

	203 void EsParserAdts::Flush() {

	204 // All the complete frames have been emitted,

	205 // so just clear the ES buffer.

	206 es_byte_queue_.Reset();

	207 pts_list_.clear();
	acolwell GONE FROM CHROMIUM 2013/09/16 06:19:30 This doesn't seem consistent w/ the description in This doesn't seem consistent w/ the description in es_parser.h. I'd expect this function to be a noop, but it looks like it is effecting the parser state. Am I misunderstanding something here? damienv1 2013/09/17 02:58:22 I made it a noop to match the description. It does Show quoted text On 2013/09/16 06:19:30, acolwell wrote: > This doesn't seem consistent w/ the description in es_parser.h. I'd expect this > function to be a noop, but it looks like it is effecting the parser state. Am I > misunderstanding something here? I made it a noop to match the description. It does not impact the behavior since a Flush is always followed by a Reset in practice.
	208 }

	209

	210 void EsParserAdts::Reset() {

	211 es_byte_queue_.Reset();

	212 pts_list_.clear();

	213 last_audio_decoder_config_ = AudioDecoderConfig();

	214 }

	215

	216 bool EsParserAdts::UpdateAudioConfiguration(const uint8* adts_header) {

	217 int frequency_index = ExtractAdtsFrequencyIndex(adts_header);

	218 if (frequency_index > kMaxSupportedFrequencyIndex) {

	219 // Frequency index 13 & 14 are reserved

	220 // while 15 means that the frequency is explicitly written

	221 // (not supported).

	222 return false;

	223 }

	224

	225 // TODO(damienv): support HE-AAC frequency doubling (SBR)

	226 // based on the incoming ADTS profile.

	227 int samples_per_second = adts_frequency_table[frequency_index];

	228 int channel_configuration = ExtractAdtsChannelConfig(adts_header);

	229 int adts_profile = (adts_header[2] >> 6) & 0x3;

	230
	acolwell GONE FROM CHROMIUM 2013/09/16 06:19:30 I think you need the following since I don't belie I think you need the following since I don't believe we support inband-channel layout. // TODO: Add support for inband channel configurations. if (channel_configuration == 0) return false; damienv1 2013/09/17 02:58:22 Done. Show quoted text On 2013/09/16 06:19:30, acolwell wrote: > I think you need the following since I don't believe we support inband-channel > layout. > > // TODO: Add support for inband channel configurations. > if (channel_configuration == 0) > return false; Done.
	231 AudioDecoderConfig audio_decoder_config(

	232 kCodecAAC,

	233 kSampleFormatS16,

	234 adts_channel_layout[channel_configuration],

	235 samples_per_second,

	236 NULL, 0,

	237 false);

	238

	239 if (!audio_decoder_config.Matches(last_audio_decoder_config_)) {

	240 DVLOG(1) << "Sampling frequency: " << samples_per_second;

	241 DVLOG(1) << "Channel config: " << channel_configuration;

	242 DVLOG(1) << "Adts profile: " << adts_profile;

	243 // Reset the timestamp helper to use a new time scale.

	244 if (audio_timestamp_helper_) {

	245 base::TimeDelta base_timestamp = audio_timestamp_helper_->GetTimestamp();

	246 audio_timestamp_helper_.reset(

	247 new AudioTimestampHelper(samples_per_second));

	248 audio_timestamp_helper_->SetBaseTimestamp(base_timestamp);

	249 } else {

	250 audio_timestamp_helper_.reset(

	251 new AudioTimestampHelper(samples_per_second));

	252 }

	253 // Audio config notification.

	254 last_audio_decoder_config_ = audio_decoder_config;

	255 new_audio_config_cb_.Run(audio_decoder_config);

	256 }

	257

	258 return true;

	259 }

	260

	261 void EsParserAdts::DiscardEs(int nbytes) {

	262 DCHECK_GE(nbytes, 0);

	263 if (nbytes <= 0)

	264 return;

	265

	266 // Adjust the ES position of each PTS.

	267 for (EsPtsList::iterator it = pts_list_.begin(); it != pts_list_.end(); ++it)

	268 it->first -= nbytes;
	acolwell GONE FROM CHROMIUM 2013/09/16 06:19:30 How big is this list likely to be? It might be mor How big is this list likely to be? It might be more efficient to keep a bytes_consumed_ count and then just add the offset when you insert the elements & subract it off when you are popping them off. damienv1 2013/09/17 02:58:22 In the general case, the size of the list will be Show quoted text On 2013/09/16 06:19:30, acolwell wrote: > How big is this list likely to be? It might be more efficient to keep a > bytes_consumed_ count and then just add the offset when you insert the elements > & subract it off when you are popping them off. In the general case, the size of the list will be 0 at this time or possibly 1 (if there is no full ADTS frame in the last reassembled PES). "List size > 1" is very unlikely since this would mean: - an ADTS frame spreads over multiple reassembled PES - or no ADTS header was found over the last couple of reassembled PES At any time in this code, the PTS list size should be between 0 and 2 included. Any other value (> 2) is very unlikely (though not impossible).
	269

	270 // Discard \|nbytes\| of ES.

	271 es_byte_queue_.Pop(nbytes);

	272 }

	273

	274 } // namespace mp2t

	275 } // namespace media

	276

OLD	NEW

« media/mp2t/es_parser_adts.h ('K') | « media/mp2t/es_parser_adts.h ('k') | media/mp2t/es_parser_h264.h » ('j') | media/mp2t/es_parser_h264.cc » ('J')