media/mp3/mp3_stream_parser.cc - Issue 23454006: Implement experimental MP3 support for Media Source API.

Side by Side Diff: media/mp3/mp3_stream_parser.cc

Issue 23454006: Implement experimental MP3 support for Media Source API. (Closed) Base URL: svn://svn.chromium.org/chrome/trunk/src

Patch Set: Rebase Created 7 years, 3 months ago

Use n/p to move between diff chunks; N/P to move between comments. Draft comments are only viewable by you.

Jump to:

View unified diff | Download patch | Annotate | Revision Log

OLD	NEW
(Empty)
	1 // Copyright (c) 2013 The Chromium Authors. All rights reserved.

	2 // Use of this source code is governed by a BSD-style license that can be

	3 // found in the LICENSE file.

	4

	5 #include "media/mp3/mp3_stream_parser.h"

	6

	7 #include "base/bind.h"

	8 #include "base/callback_helpers.h"

	9 #include "base/message_loop/message_loop.h"

	10 #include "media/base/bit_reader.h"

	11 #include "media/base/buffers.h"

	12 #include "media/base/stream_parser_buffer.h"

	13 #include "media/base/video_decoder_config.h"

	14 #include "net/http/http_util.h"

	15

	16 namespace media {

	17

	18 static const uint32 kMP3StartCodeMask = 0xffe00000;

	19 static const uint32 kICYStartCode = 0x49435920; // 'ICY '

	20

	21 // Arbitrary upper bound on the size of an IceCast header before it

	22 // triggers an error.

	23 static const int kMaxIcecastHeaderSize = 4096;

	24

	25 static const uint32 kID3StartCodeMask = 0xffffff00;

	26 static const uint32 kID3v1StartCode = 0x54414700; // 'TAG\0'

	27 static const int kID3v1Size = 128;

	28 static const int kID3v1ExtendedSize = 227;

	29 static const uint32 kID3v2StartCode = 0x49443300; // 'ID3\0'

	30

	// Map that determines which bitrate_index & channel_mode combinations
	// are allowed. Indexed as kIsAllowed[bitrate_index][channel_mode].
	// Derived from: http://mpgedit.org/mpgedit/mpeg_format/MP3Format.html
	//
	// bitrate_index is a 4-bit header field, so exactly 16 rows are needed. (The
	// table used to be declared with 17 rows, leaving a silently zero-filled row
	// that no index can reach.)
	//
	// NOTE(review): the low bitrates only allow column 0 and the high bitrates
	// only forbid column 0, while the frame header encodes channel_mode as
	// 0 = stereo ... 3 = single channel. Please confirm the column order against
	// the referenced table before relying on this check.
	static const bool kIsAllowed[16][4] = {
	  { true, true, true, true },      // free
	  { true, false, false, false },   // 32
	  { true, false, false, false },   // 48
	  { true, false, false, false },   // 56
	  { true, true, true, true },      // 64
	  { true, false, false, false },   // 80
	  { true, true, true, true },      // 96
	  { true, true, true, true },      // 112
	  { true, true, true, true },      // 128
	  { true, true, true, true },      // 160
	  { true, true, true, true },      // 192
	  { false, true, true, true },     // 224
	  { false, true, true, true },     // 256
	  { false, true, true, true },     // 320
	  { false, true, true, true },     // 384
	  { false, false, false, false }   // bad
	};

	52

	// Translates the (version, layer) fields of a frame header into a column
	// index for |kBitrateMap|. Indexed as kVersionLayerMap[version][layer].
	// Derived from: http://mpgedit.org/mpgedit/mpeg_format/MP3Format.html
	//
	// Column order within each row: { reserved, L3, L2, L1 }.
	// Index 5 selects the all-zero "reserved" column of |kBitrateMap|.
	static const int kVersionLayerMap[4][4] = {
	  /* MPEG 2.5 */ { 5, 4, 4, 3 },
	  /* reserved */ { 5, 5, 5, 5 },
	  /* MPEG 2   */ { 5, 4, 4, 3 },
	  /* MPEG 1   */ { 5, 2, 1, 0 }
	};

	63

	// Frame bitrate lookup, indexed as
	// kBitrateMap[bitrate_index][kVersionLayerMap[version][layer]].
	// A value of 0 marks a combination that has no usable bitrate.
	// Derived from: http://mpgedit.org/mpgedit/mpeg_format/MP3Format.html
	static const int kBitrateMap[16][6] = {
	  //  V1L1  V1L2  V1L3  V2L1  V2L2&V2L3  reserved
	  {     0,    0,    0,    0,    0,       0 },
	  {    32,   32,   32,   32,    8,       0 },
	  {    64,   48,   40,   48,   16,       0 },
	  {    96,   56,   48,   56,   24,       0 },
	  {   128,   64,   56,   64,   32,       0 },
	  {   160,   80,   64,   80,   40,       0 },
	  {   192,   96,   80,   96,   48,       0 },
	  {   224,  112,   96,  112,   56,       0 },
	  {   256,  128,  112,  128,   64,       0 },
	  {   288,  160,  128,  144,   80,       0 },
	  {   320,  192,  160,  160,   96,       0 },
	  {   352,  224,  192,  176,  112,       0 },
	  {   384,  256,  224,  192,  128,       0 },
	  {   416,  320,  256,  224,  144,       0 },
	  {   448,  384,  320,  256,  160,       0 },
	  {     0,    0,    0,    0,    0,       0 }
	};

	86

	// Sample rate lookup, indexed as kSampleRateMap[sample_rate_index][version]
	// using the raw frame header fields. A value of 0 marks a combination with
	// no valid sample rate.
	// Derived from: http://mpgedit.org/mpgedit/mpeg_format/MP3Format.html
	static const int kSampleRateMap[4][4] = {
	  //  V2.5  reserved     V2     V1
	  {  11025,       0,  22050,  44100 },
	  {  12000,       0,  24000,  48000 },
	  {   8000,       0,  16000,  32000 },
	  {      0,       0,      0,      0 }
	};

	97

	// Raw values of individual frame header fields, as compared against the
	// fields read in ParseFrameHeader().

	// 2-bit version field.
	static const int kVersion2_5 = 0;
	static const int kVersionReserved = 1;
	static const int kVersion2 = 2;
	static const int kVersion1 = 3;

	// 2-bit layer field.
	static const int kLayerReserved = 0;
	static const int kLayer3 = 1;
	static const int kLayer2 = 2;
	static const int kLayer1 = 3;

	// 4-bit bitrate index field: the two values that are rejected outright.
	static const int kBitrateFree = 0;
	static const int kBitrateBad = 0xf;

	// 2-bit sample rate index field: the value that is rejected outright.
	static const int kSampleRateReserved = 3;

	110

	111 MP3StreamParser::MP3StreamParser()

	112 : state_(UNINITIALIZED),

	113 in_media_segment_(false) {

	114 }

	115

	116 MP3StreamParser::~MP3StreamParser() {}

	117

	118 void MP3StreamParser::Init(const InitCB& init_cb,

	119 const NewConfigCB& config_cb,

	120 const NewBuffersCB& new_buffers_cb,

	121 const NewTextBuffersCB& text_cb,

	122 const NeedKeyCB& need_key_cb,

	123 const AddTextTrackCB& add_text_track_cb,

	124 const NewMediaSegmentCB& new_segment_cb,

	125 const base::Closure& end_of_segment_cb,

	126 const LogCB& log_cb) {

	127 DVLOG(1) << __FUNCTION__;

	128 DCHECK_EQ(state_, UNINITIALIZED);

	129 init_cb_ = init_cb;

	130 config_cb_ = config_cb;

	131 new_buffers_cb_ = new_buffers_cb;

	132 new_segment_cb_ = new_segment_cb;

	133 end_of_segment_cb_ = end_of_segment_cb;

	134 log_cb_ = log_cb;

	135

	136 ChangeState(INITIALIZED);

	137 }

	138

	139 void MP3StreamParser::Flush() {

	140 DVLOG(1) << __FUNCTION__;

	141 DCHECK_NE(state_, UNINITIALIZED);

	142 queue_.Reset();

	143 timestamp_helper_->SetBaseTimestamp(base::TimeDelta());

	144 in_media_segment_ = false;

	145 }

	146

	147 bool MP3StreamParser::Parse(const uint8* buf, int size) {

	148 DVLOG(1) << __FUNCTION__ << "(" << size << ")";

	149 DCHECK(buf);

	150 DCHECK_GT(size, 0);

	151 DCHECK_NE(state_, UNINITIALIZED);

	152

	153 if (state_ == PARSE_ERROR)

	154 return false;

	155

	156 DCHECK_EQ(state_, INITIALIZED);

	157

	158 queue_.Push(buf, size);

	159

	160 for (;;) {

	161 const uint8* data;

	162 int data_size;

	163 queue_.Peek(&data, &data_size);

	164

	165 if (size < 4)

	166 return true;

	167

	168 uint32 start_code = data[0] << 24 \| data[1] << 16 \| data[2] << 8 \| data[3];

	169 int bytes_read = 0;

	170 if ((start_code & kMP3StartCodeMask) == kMP3StartCodeMask) {

	171 bytes_read = ParseMP3Frame(data, data_size);

	172 } else if (start_code == kICYStartCode) {

	173 bytes_read = ParseIcecastHeader(data, data_size);

	174 } else if ((start_code & kID3StartCodeMask) == kID3v1StartCode) {

	175 bytes_read = ParseID3v1(data, data_size);

	176 } else if ((start_code & kID3StartCodeMask) == kID3v2StartCode) {

	177 bytes_read = ParseID3v2(data, data_size);

	178 } else {

	179 bytes_read = FindNextValidStartCode(data, data_size);

	180

	181 if (bytes_read > 0) {

	182 DVLOG(1) << "Unexpected start code 0x" << std::hex << start_code;

	183 DVLOG(1) << "SKIPPING " << bytes_read << " bytes of garbage.";

	184 }

	185 }

	186

	187 CHECK_LE(bytes_read, data_size);

	188

	189 if (bytes_read < 0) {

	190 ChangeState(PARSE_ERROR);

	191 return false;

	192 } else if (bytes_read == 0) {

	193 // Need more data.

	194 return true;

	195 }

	196

	197 queue_.Pop(bytes_read);

	198 }

	199

	200 return true;

	201 }

	202

	203 void MP3StreamParser::ChangeState(State state) {

	204 DVLOG(1) << __FUNCTION__ << "() : " << state_ << " -> " << state;

	205 state_ = state;

	206 }

	207

	208 int MP3StreamParser::ParseFrameHeader(const uint8* data, int size,

	209 int* frame_size,

	210 int* sample_rate,

	211 ChannelLayout* channel_layout,

	212 int* sample_count) const {

	213 DCHECK(data);

	214 DCHECK_GE(size, 0);

	215 DCHECK(frame_size);

	216

	217 if (size < 4)

	218 return 0;

	219

	220 BitReader reader(data, size);

	221 int sync;

	222 int version;

	223 int layer;

	224 int is_protected;

	225 int bitrate_index;

	226 int sample_rate_index;

	227 int has_padding;

	228 int is_private;

	229 int channel_mode;

	230 int other_flags;

	231

	232 if (!reader.ReadBits(11, &sync) \|\|

	233 !reader.ReadBits(2, &version) \|\|

	234 !reader.ReadBits(2, &layer) \|\|

	235 !reader.ReadBits(1, &is_protected) \|\|

	236 !reader.ReadBits(4, &bitrate_index) \|\|

	237 !reader.ReadBits(2, &sample_rate_index) \|\|

	238 !reader.ReadBits(1, &has_padding) \|\|

	239 !reader.ReadBits(1, &is_private) \|\|

	240 !reader.ReadBits(2, &channel_mode) \|\|

	241 !reader.ReadBits(6, &other_flags)) {

	242 return -1;

	243 }

	244

	245 DVLOG(2) << "Header data :" << std::hex

	246 << " sync 0x" << sync

	247 << " version 0x" << version

	248 << " layer 0x" << layer

	249 << " bitrate_index 0x" << bitrate_index

	250 << " sample_rate_index 0x" << sample_rate_index

	251 << " channel_mode 0x" << channel_mode;

	252

	253 if (sync != 0x7ff \|\|

	254 version == kVersionReserved \|\|

	255 layer == kLayerReserved \|\|

	256 bitrate_index == kBitrateFree \|\| bitrate_index == kBitrateBad \|\|

	257 sample_rate_index == kSampleRateReserved) {

	258 MEDIA_LOG(log_cb_) << "Invalid header data :" << std::hex

	259 << " sync 0x" << sync

	260 << " version 0x" << version

	261 << " layer 0x" << layer

	262 << " bitrate_index 0x" << bitrate_index

	263 << " sample_rate_index 0x" << sample_rate_index

	264 << " channel_mode 0x" << channel_mode;

	265 return -1;

	266 }

	267

	268 if (layer == kLayer2 && kIsAllowed[bitrate_index][channel_mode]) {

	269 MEDIA_LOG(log_cb_) << "Invalid (bitrate_index, channel_mode) combination :"

	270 << std::hex

	271 << " bitrate_index " << bitrate_index

	272 << " channel_mode " << channel_mode;

	273 return -1;

	274 }

	275

	276 int bitrate = kBitrateMap[bitrate_index][kVersionLayerMap[version][layer]];

	277

	278 if (bitrate == 0) {

	279 MEDIA_LOG(log_cb_) << "Invalid bitrate :" << std::hex

	280 << " version " << version

	281 << " layer " << layer

	282 << " bitrate_index " << bitrate_index;

	283 return -1;

	284 }

	285

	286 DVLOG(2) << " bitrate " << bitrate;

	287

	288 int frame_sample_rate = kSampleRateMap[sample_rate_index][version];

	289 if (frame_sample_rate == 0) {

	290 MEDIA_LOG(log_cb_) << "Invalid sample rate :" << std::hex

	291 << " version " << version

	292 << " sample_rate_index " << sample_rate_index;

	293 return -1;

	294 }

	295

	296 if (sample_rate)

	297 *sample_rate = frame_sample_rate;

	298

	299 // http://teslabs.com/openplayer/docs/docs/specs/mp3_structure2.pdf

	300 // Table 2.1.5

	301 int samples_per_frame;

	302 switch (layer) {

	303 case kLayer1:

	304 samples_per_frame = 384;

	305 break;

	306

	307 case kLayer2:

	308 samples_per_frame = 1152;

	309 break;

	310

	311 case kLayer3:

	312 if (version == kVersion2 \|\| version == kVersion2_5)

	313 samples_per_frame = 576;

	314 else

	315 samples_per_frame = 1152;

	316 break;

	317

	318 default:

	319 return -1;

	320 }

	321

	322 if (sample_count)

	323 *sample_count = samples_per_frame;

	324

	325 // http://teslabs.com/openplayer/docs/docs/specs/mp3_structure2.pdf

	326 // Text just below Table 2.1.5.

	327 if (layer == kLayer1) {

	328 // This formulation is a slight variation on the equation below,

	329 // but has slightly different truncation characteristics to deal

	330 // with the fact that Layer 1 has 4 byte "slots" instead of single

	331 // byte ones.

	332 frame_size = 4 (12 * bitrate * 1000 / frame_sample_rate);

	333 } else {

	334 *frame_size =

	335 ((samples_per_frame / 8) * bitrate * 1000) / frame_sample_rate;

	336 }

	337

	338 if (has_padding)

	339 *frame_size += (layer == kLayer1) ? 4 : 1;

	340

	341 if (channel_layout) {

	342 // Map Stereo(0), Joint Stereo(1), and Dual Channel (2) to

	343 // CHANNEL_LAYOUT_STEREO and Single Channel (3) to CHANNEL_LAYOUT_MONO.

	344 *channel_layout =

	345 (channel_mode == 3) ? CHANNEL_LAYOUT_MONO : CHANNEL_LAYOUT_STEREO;

	346 }

	347

	348 return 4;

	349 }

	350

	351 int MP3StreamParser::ParseMP3Frame(const uint8* data, int size) {

	352 DVLOG(2) << __FUNCTION__ << "(" << size << ")";

	353

	354 int sample_rate;

	355 ChannelLayout channel_layout;

	356 int frame_size;

	357 int sample_count;

	358 int bytes_read = ParseFrameHeader(

	359 data, size, &frame_size, &sample_rate, &channel_layout, &sample_count);

	360

	361 if (bytes_read <= 0)

	362 return bytes_read;

	363

	364 // Make sure data contains the entire frame.

	365 if (size < frame_size)

	366 return 0;

	367

	368 DVLOG(2) << " sample_rate " << sample_rate

	369 << " channel_layout " << channel_layout

	370 << " frame_size " << frame_size;

	371

	372 if (config_.IsValidConfig() &&

	373 (config_.samples_per_second() != sample_rate \|\|

	374 config_.channel_layout() != channel_layout)) {

	375 // Clear config data so that a config change is initiated.

	376 config_ = AudioDecoderConfig();

	377 }

	378

	379 if (!config_.IsValidConfig()) {

	380 config_.Initialize(kCodecMP3, kSampleFormatF32, channel_layout,

	381 sample_rate, NULL, 0, false, false);

	382

	383 base::TimeDelta base_timestamp;

	384 if (timestamp_helper_)

	385 base_timestamp = timestamp_helper_->GetTimestamp();

	386

	387 timestamp_helper_.reset(new AudioTimestampHelper(sample_rate));

	388 timestamp_helper_->SetBaseTimestamp(base_timestamp);

	389

	390 VideoDecoderConfig video_config;

	391 bool success = config_cb_.Run(config_, video_config);

	392

	393 if (!init_cb_.is_null())

	394 base::ResetAndReturn(&init_cb_).Run(success, kInfiniteDuration());

	395

	396 if (!success)

	397 return -1;

	398 }

	399

	400 if (!in_media_segment_) {

	401 in_media_segment_ = true;

	402 new_segment_cb_.Run();

	403 }

	404

	405 BufferQueue audio_buffers;

	406 BufferQueue video_buffers;

	407

	408 // TODO(acolwell): Change this code to parse as many frames as

	409 // possible before calling \|new_buffers_cb_\|.

	410 scoped_refptr<StreamParserBuffer> buffer =

	411 StreamParserBuffer::CopyFrom(data, frame_size, true);

	412 audio_buffers.push_back(buffer);

	413

	414 if (!new_buffers_cb_.Run(audio_buffers, video_buffers))

	415 return -1;

	416

	417 timestamp_helper_->AddFrames(sample_count);

	418

	419 return frame_size;

	420 }

	421

	422 int MP3StreamParser::ParseIcecastHeader(const uint8* data, int size) {

	423 DVLOG(1) << __FUNCTION__ << "(" << size << ")";

	424

	425 if (size < 4)

	426 return 0;

	427

	428 if (memcmp("ICY ", data, 4))

	429 return -1;

	430

	431 int locate_size = std::min(size, kMaxIcecastHeaderSize);

	432 int offset = net::HttpUtil::LocateEndOfHeaders(

	433 reinterpret_cast<const char*>(data), locate_size, 4);

	434 if (offset < 0) {

	435 if (locate_size == kMaxIcecastHeaderSize) {

	436 MEDIA_LOG(log_cb_) << "Icecast header is too large.";

	437 return -1;

	438 }

	439

	440 return 0;

	441 }

	442

	443 return offset;

	444 }

	445

	446 int MP3StreamParser::ParseID3v1(const uint8* data, int size) {

	447 DVLOG(1) << __FUNCTION__ << "(" << size << ")";

	448

	449 if (size < kID3v1Size)

	450 return 0;

	451

	452 // TODO(acolwell): Add code to actually validate ID3v1 data and

	453 // expose it as a metadata text track.

	454 return !memcmp(data, "TAG+", 4) ? kID3v1ExtendedSize : kID3v1Size;

	455 }

	456

	457 int MP3StreamParser::ParseID3v2(const uint8* data, int size) {

	458 DVLOG(1) << __FUNCTION__ << "(" << size << ")";

	459

	460 if (size < 10)

	461 return 0;

	462

	463 BitReader reader(data, size);

	464 int32 id;

	465 int version;

	466 uint8 flags;

	467 int32 id3_size;

	468

	469 if (!reader.ReadBits(24, &id) \|\|

	470 !reader.ReadBits(16, &version) \|\|

	471 !reader.ReadBits(8, &flags) \|\|

	472 !ParseSyncSafeInt(&reader, &id3_size)) {

	473 return -1;

	474 }

	475

	476 int32 actual_tag_size = 10 + id3_size;

	477

	478 // Increment size if 'Footer present' flag is set.

	479 if (flags & 0x10)

	480 actual_tag_size += 10;

	481

	482 // Make sure we have the entire tag.

	483 if (size < actual_tag_size)

	484 return 0;

	485

	486 // TODO(acolwell): Add code to actually validate ID3v2 data and

	487 // expose it as a metadata text track.

	488 return actual_tag_size;

	489 }

	490

	491 bool MP3StreamParser::ParseSyncSafeInt(BitReader* reader, int32* value) {

	492 *value = 0;

	493 for (int i = 0; i < 4; ++i) {

	494 uint8 tmp;

	495 if (!reader->ReadBits(1, &tmp) \|\| tmp != 0) {

	496 MEDIA_LOG(log_cb_) << "ID3 syncsafe integer byte MSb is not 0!";

	497 return false;

	498 }

	499

	500 if (!reader->ReadBits(7, &tmp))

	501 return false;

	502

	503 *value <<= 7;

	504 *value += tmp;

	505 }

	506

	507 return true;

	508 }

	509

	510 int MP3StreamParser::FindNextValidStartCode(const uint8* data, int size) const {

	511 const uint8* start = data;

	512 const uint8* end = data + size;

	513

	514 while (start < end) {

	515 int bytes_left = end - start;

	516 const uint8* candidate_start_code =

	517 static_cast<const uint8*>(memchr(start, 0xff, bytes_left));

	518

	519 if (!candidate_start_code)

	520 return 0;

	521

	522 bool parse_header_failed = false;

	523 const uint8* sync = candidate_start_code;

	524 // Try to find 3 valid frames in a row. 3 was selected to decrease

	525 // the probability of false positives.

	526 for (int i = 0; i < 3; ++i) {

	527 int sync_size = end - sync;

	528 int frame_size;

	529 int sync_bytes = ParseFrameHeader(

	530 sync, sync_size, &frame_size, NULL, NULL, NULL);

	531

	532 if (sync_bytes == 0)

	533 return 0;

	534

	535 if (sync_bytes > 0) {

	536 DCHECK_LT(sync_bytes, sync_size);

	537

	538 // Skip over this frame so we can check the next one.

	539 sync += frame_size;

	540

	541 // Make sure the next frame starts inside the buffer.

	542 if (sync >= end)

	543 return 0;

	544 } else {

	545 DVLOG(1) << "ParseFrameHeader() " << i << " failed @" << (sync - data);

	546 parse_header_failed = true;

	547 break;

	548 }

	549 }

	550

	551 if (parse_header_failed) {

	552 // One of the frame header parses failed so \|candidate_start_code\|

	553 // did not point to the start of a real frame. Move \|start\| forward

	554 // so we can find the next candidate.

	555 start = candidate_start_code + 1;

	556 continue;

	557 }

	558

	559 return candidate_start_code - data;

	560 }

	561

	562 return 0;

	563 }

	564

	565 } // namespace media

OLD	NEW

« no previous file with comments | « media/mp3/mp3_stream_parser.h ('k') | tools/metrics/histograms/histograms.xml » ('j') | no next file with comments »