OLD | NEW |
(Empty) | |
| 1 // Copyright (c) 2013 The Chromium Authors. All rights reserved. |
| 2 // Use of this source code is governed by a BSD-style license that can be |
| 3 // found in the LICENSE file. |
| 4 |
| 5 #include "media/mp3/mp3_stream_parser.h" |
| 6 |
| 7 #include "base/bind.h" |
| 8 #include "base/callback_helpers.h" |
| 9 #include "base/message_loop/message_loop.h" |
| 10 #include "media/base/bit_reader.h" |
| 11 #include "media/base/buffers.h" |
| 12 #include "media/base/stream_parser_buffer.h" |
| 13 #include "media/base/video_decoder_config.h" |
| 14 #include "net/http/http_util.h" |
| 15 |
| 16 namespace media { |
| 17 |
| 18 static const uint32 kMP3StartCodeMask = 0xffe00000; |
| 19 static const uint32 kICYStartCode = 0x49435920; // 'ICY ' |
| 20 |
| 21 // Arbitrary upper bound on the size of an IceCast header before it |
| 22 // triggers an error. |
| 23 static const int kMaxIcecastHeaderSize = 4096; |
| 24 |
| 25 static const uint32 kID3StartCodeMask = 0xffffff00; |
| 26 static const uint32 kID3v1StartCode = 0x54414700; // 'TAG\0' |
| 27 static const int kID3v1Size = 128; |
| 28 static const int kID3v1ExtendedSize = 227; |
| 29 static const uint32 kID3v2StartCode = 0x49443300; // 'ID3\0' |
| 30 |
// Map that determines which bitrate_index & channel_mode combinations
// are allowed. Indexed as kIsAllowed[bitrate_index][channel_mode]; there is
// one row for each of the 16 values of the 4-bit bitrate index.
// Derived from: http://mpgedit.org/mpgedit/mpeg_format/MP3Format.html
//
// NOTE(review): ParseFrameHeader() indexes the second dimension with the raw
// channel_mode header field, where 3 means single channel. The rows below
// look as if column 0 were the single channel column -- confirm the column
// order against the reference table.
static const bool kIsAllowed[16][4] = {
  { true, true, true, true },      // free
  { true, false, false, false },   // 32
  { true, false, false, false },   // 48
  { true, false, false, false },   // 56
  { true, true, true, true },      // 64
  { true, false, false, false },   // 80
  { true, true, true, true },      // 96
  { true, true, true, true },      // 112
  { true, true, true, true },      // 128
  { true, true, true, true },      // 160
  { true, true, true, true },      // 192
  { false, true, true, true },     // 224
  { false, true, true, true },     // 256
  { false, true, true, true },     // 320
  { false, true, true, true },     // 384
  { false, false, false, false }   // bad
};
| 52 |
// Translates the (version, layer) header fields into a column index of
// |kBitrateMap|. Indexed as kVersionLayerMap[version][layer]; the value 5
// selects the all-zero "reserved" column of |kBitrateMap|.
// Derived from: http://mpgedit.org/mpgedit/mpeg_format/MP3Format.html
static const int kVersionLayerMap[4][4] = {
  // reserved, L3, L2, L1
  {  5,        4,  4,  3 },  // MPEG 2.5
  {  5,        5,  5,  5 },  // reserved
  {  5,        4,  4,  3 },  // MPEG 2
  {  5,        2,  1,  0 }   // MPEG 1
};
| 63 |
// Maps the bitrate index field in the header and an index
// from |kVersionLayerMap| to a frame bitrate. Indexed as
// kBitrateMap[bitrate_index][kVersionLayerMap[version][layer]]. A value of 0
// marks a combination that ParseFrameHeader() rejects.
// Derived from: http://mpgedit.org/mpgedit/mpeg_format/MP3Format.html
static const int kBitrateMap[16][6] = {
  // { V1L1, V1L2, V1L3, V2L1, V2L2 & V2L3, reserved }
  { 0,   0,   0,   0,   0,   0 },
  { 32,  32,  32,  32,  8,   0 },
  { 64,  48,  40,  48,  16,  0 },
  { 96,  56,  48,  56,  24,  0 },
  { 128, 64,  56,  64,  32,  0 },
  { 160, 80,  64,  80,  40,  0 },
  { 192, 96,  80,  96,  48,  0 },
  { 224, 112, 96,  112, 56,  0 },
  { 256, 128, 112, 128, 64,  0 },
  { 288, 160, 128, 144, 80,  0 },
  { 320, 192, 160, 160, 96,  0 },
  { 352, 224, 192, 176, 112, 0 },
  { 384, 256, 224, 192, 128, 0 },
  { 416, 320, 256, 224, 144, 0 },
  { 448, 384, 320, 256, 160, 0 },
  // Every row spells out all six columns, including this all-zero one.
  { 0,   0,   0,   0,   0,   0 }
};
| 86 |
// Looks up the sample rate, in Hz, for a frame. Indexed as
// kSampleRateMap[sample_rate_index][version]; a value of 0 marks a
// combination that ParseFrameHeader() rejects.
// Derived from: http://mpgedit.org/mpgedit/mpeg_format/MP3Format.html
static const int kSampleRateMap[4][4] = {
  // V2.5, reserved, V2,    V1
  { 11025, 0,        22050, 44100 },
  { 12000, 0,        24000, 48000 },
  { 8000,  0,        16000, 32000 },
  { 0,     0,        0,     0 }
};
| 97 |
// Raw values of individual frame header fields, grouped by field.

// 2-bit version field.
static const int kVersion2_5 = 0;
static const int kVersionReserved = 1;
static const int kVersion2 = 2;
static const int kVersion1 = 3;

// 2-bit layer field.
static const int kLayerReserved = 0;
static const int kLayer3 = 1;
static const int kLayer2 = 2;
static const int kLayer1 = 3;

// 4-bit bitrate index field: the two values ParseFrameHeader() refuses.
static const int kBitrateFree = 0;
static const int kBitrateBad = 0xf;

// 2-bit sample rate index field.
static const int kSampleRateReserved = 3;
| 110 |
| 111 MP3StreamParser::MP3StreamParser() |
| 112 : state_(UNINITIALIZED), |
| 113 in_media_segment_(false) { |
| 114 } |
| 115 |
| 116 MP3StreamParser::~MP3StreamParser() {} |
| 117 |
| 118 void MP3StreamParser::Init(const InitCB& init_cb, |
| 119 const NewConfigCB& config_cb, |
| 120 const NewBuffersCB& new_buffers_cb, |
| 121 const NewTextBuffersCB& text_cb, |
| 122 const NeedKeyCB& need_key_cb, |
| 123 const AddTextTrackCB& add_text_track_cb, |
| 124 const NewMediaSegmentCB& new_segment_cb, |
| 125 const base::Closure& end_of_segment_cb, |
| 126 const LogCB& log_cb) { |
| 127 DVLOG(1) << __FUNCTION__; |
| 128 DCHECK_EQ(state_, UNINITIALIZED); |
| 129 init_cb_ = init_cb; |
| 130 config_cb_ = config_cb; |
| 131 new_buffers_cb_ = new_buffers_cb; |
| 132 new_segment_cb_ = new_segment_cb; |
| 133 end_of_segment_cb_ = end_of_segment_cb; |
| 134 log_cb_ = log_cb; |
| 135 |
| 136 ChangeState(INITIALIZED); |
| 137 } |
| 138 |
| 139 void MP3StreamParser::Flush() { |
| 140 DVLOG(1) << __FUNCTION__; |
| 141 DCHECK_NE(state_, UNINITIALIZED); |
| 142 queue_.Reset(); |
| 143 timestamp_helper_->SetBaseTimestamp(base::TimeDelta()); |
| 144 in_media_segment_ = false; |
| 145 } |
| 146 |
| 147 bool MP3StreamParser::Parse(const uint8* buf, int size) { |
| 148 DVLOG(1) << __FUNCTION__ << "(" << size << ")"; |
| 149 DCHECK(buf); |
| 150 DCHECK_GT(size, 0); |
| 151 DCHECK_NE(state_, UNINITIALIZED); |
| 152 |
| 153 if (state_ == PARSE_ERROR) |
| 154 return false; |
| 155 |
| 156 DCHECK_EQ(state_, INITIALIZED); |
| 157 |
| 158 queue_.Push(buf, size); |
| 159 |
| 160 for (;;) { |
| 161 const uint8* data; |
| 162 int data_size; |
| 163 queue_.Peek(&data, &data_size); |
| 164 |
| 165 if (size < 4) |
| 166 return true; |
| 167 |
| 168 uint32 start_code = data[0] << 24 | data[1] << 16 | data[2] << 8 | data[3]; |
| 169 int bytes_read = 0; |
| 170 if ((start_code & kMP3StartCodeMask) == kMP3StartCodeMask) { |
| 171 bytes_read = ParseMP3Frame(data, data_size); |
| 172 } else if (start_code == kICYStartCode) { |
| 173 bytes_read = ParseIcecastHeader(data, data_size); |
| 174 } else if ((start_code & kID3StartCodeMask) == kID3v1StartCode) { |
| 175 bytes_read = ParseID3v1(data, data_size); |
| 176 } else if ((start_code & kID3StartCodeMask) == kID3v2StartCode) { |
| 177 bytes_read = ParseID3v2(data, data_size); |
| 178 } else { |
| 179 bytes_read = FindNextValidStartCode(data, data_size); |
| 180 |
| 181 if (bytes_read > 0) { |
| 182 DVLOG(1) << "Unexpected start code 0x" << std::hex << start_code; |
| 183 DVLOG(1) << "SKIPPING " << bytes_read << " bytes of garbage."; |
| 184 } |
| 185 } |
| 186 |
| 187 CHECK_LE(bytes_read, data_size); |
| 188 |
| 189 if (bytes_read < 0) { |
| 190 ChangeState(PARSE_ERROR); |
| 191 return false; |
| 192 } else if (bytes_read == 0) { |
| 193 // Need more data. |
| 194 return true; |
| 195 } |
| 196 |
| 197 queue_.Pop(bytes_read); |
| 198 } |
| 199 |
| 200 return true; |
| 201 } |
| 202 |
| 203 void MP3StreamParser::ChangeState(State state) { |
| 204 DVLOG(1) << __FUNCTION__ << "() : " << state_ << " -> " << state; |
| 205 state_ = state; |
| 206 } |
| 207 |
| 208 int MP3StreamParser::ParseFrameHeader(const uint8* data, int size, |
| 209 int* frame_size, |
| 210 int* sample_rate, |
| 211 ChannelLayout* channel_layout, |
| 212 int* sample_count) const { |
| 213 DCHECK(data); |
| 214 DCHECK_GE(size, 0); |
| 215 DCHECK(frame_size); |
| 216 |
| 217 if (size < 4) |
| 218 return 0; |
| 219 |
| 220 BitReader reader(data, size); |
| 221 int sync; |
| 222 int version; |
| 223 int layer; |
| 224 int is_protected; |
| 225 int bitrate_index; |
| 226 int sample_rate_index; |
| 227 int has_padding; |
| 228 int is_private; |
| 229 int channel_mode; |
| 230 int other_flags; |
| 231 |
| 232 if (!reader.ReadBits(11, &sync) || |
| 233 !reader.ReadBits(2, &version) || |
| 234 !reader.ReadBits(2, &layer) || |
| 235 !reader.ReadBits(1, &is_protected) || |
| 236 !reader.ReadBits(4, &bitrate_index) || |
| 237 !reader.ReadBits(2, &sample_rate_index) || |
| 238 !reader.ReadBits(1, &has_padding) || |
| 239 !reader.ReadBits(1, &is_private) || |
| 240 !reader.ReadBits(2, &channel_mode) || |
| 241 !reader.ReadBits(6, &other_flags)) { |
| 242 return -1; |
| 243 } |
| 244 |
| 245 DVLOG(2) << "Header data :" << std::hex |
| 246 << " sync 0x" << sync |
| 247 << " version 0x" << version |
| 248 << " layer 0x" << layer |
| 249 << " bitrate_index 0x" << bitrate_index |
| 250 << " sample_rate_index 0x" << sample_rate_index |
| 251 << " channel_mode 0x" << channel_mode; |
| 252 |
| 253 if (sync != 0x7ff || |
| 254 version == kVersionReserved || |
| 255 layer == kLayerReserved || |
| 256 bitrate_index == kBitrateFree || bitrate_index == kBitrateBad || |
| 257 sample_rate_index == kSampleRateReserved) { |
| 258 MEDIA_LOG(log_cb_) << "Invalid header data :" << std::hex |
| 259 << " sync 0x" << sync |
| 260 << " version 0x" << version |
| 261 << " layer 0x" << layer |
| 262 << " bitrate_index 0x" << bitrate_index |
| 263 << " sample_rate_index 0x" << sample_rate_index |
| 264 << " channel_mode 0x" << channel_mode; |
| 265 return -1; |
| 266 } |
| 267 |
| 268 if (layer == kLayer2 && kIsAllowed[bitrate_index][channel_mode]) { |
| 269 MEDIA_LOG(log_cb_) << "Invalid (bitrate_index, channel_mode) combination :" |
| 270 << std::hex |
| 271 << " bitrate_index " << bitrate_index |
| 272 << " channel_mode " << channel_mode; |
| 273 return -1; |
| 274 } |
| 275 |
| 276 int bitrate = kBitrateMap[bitrate_index][kVersionLayerMap[version][layer]]; |
| 277 |
| 278 if (bitrate == 0) { |
| 279 MEDIA_LOG(log_cb_) << "Invalid bitrate :" << std::hex |
| 280 << " version " << version |
| 281 << " layer " << layer |
| 282 << " bitrate_index " << bitrate_index; |
| 283 return -1; |
| 284 } |
| 285 |
| 286 DVLOG(2) << " bitrate " << bitrate; |
| 287 |
| 288 int frame_sample_rate = kSampleRateMap[sample_rate_index][version]; |
| 289 if (frame_sample_rate == 0) { |
| 290 MEDIA_LOG(log_cb_) << "Invalid sample rate :" << std::hex |
| 291 << " version " << version |
| 292 << " sample_rate_index " << sample_rate_index; |
| 293 return -1; |
| 294 } |
| 295 |
| 296 if (sample_rate) |
| 297 *sample_rate = frame_sample_rate; |
| 298 |
| 299 // http://teslabs.com/openplayer/docs/docs/specs/mp3_structure2.pdf |
| 300 // Table 2.1.5 |
| 301 int samples_per_frame; |
| 302 switch (layer) { |
| 303 case kLayer1: |
| 304 samples_per_frame = 384; |
| 305 break; |
| 306 |
| 307 case kLayer2: |
| 308 samples_per_frame = 1152; |
| 309 break; |
| 310 |
| 311 case kLayer3: |
| 312 if (version == kVersion2 || version == kVersion2_5) |
| 313 samples_per_frame = 576; |
| 314 else |
| 315 samples_per_frame = 1152; |
| 316 break; |
| 317 |
| 318 default: |
| 319 return -1; |
| 320 } |
| 321 |
| 322 if (sample_count) |
| 323 *sample_count = samples_per_frame; |
| 324 |
| 325 // http://teslabs.com/openplayer/docs/docs/specs/mp3_structure2.pdf |
| 326 // Text just below Table 2.1.5. |
| 327 if (layer == kLayer1) { |
| 328 // This formulation is a slight variation on the equation below, |
| 329 // but has slightly different truncation characteristics to deal |
| 330 // with the fact that Layer 1 has 4 byte "slots" instead of single |
| 331 // byte ones. |
| 332 *frame_size = 4 * (12 * bitrate * 1000 / frame_sample_rate); |
| 333 } else { |
| 334 *frame_size = |
| 335 ((samples_per_frame / 8) * bitrate * 1000) / frame_sample_rate; |
| 336 } |
| 337 |
| 338 if (has_padding) |
| 339 *frame_size += (layer == kLayer1) ? 4 : 1; |
| 340 |
| 341 if (channel_layout) { |
| 342 // Map Stereo(0), Joint Stereo(1), and Dual Channel (2) to |
| 343 // CHANNEL_LAYOUT_STEREO and Single Channel (3) to CHANNEL_LAYOUT_MONO. |
| 344 *channel_layout = |
| 345 (channel_mode == 3) ? CHANNEL_LAYOUT_MONO : CHANNEL_LAYOUT_STEREO; |
| 346 } |
| 347 |
| 348 return 4; |
| 349 } |
| 350 |
| 351 int MP3StreamParser::ParseMP3Frame(const uint8* data, int size) { |
| 352 DVLOG(2) << __FUNCTION__ << "(" << size << ")"; |
| 353 |
| 354 int sample_rate; |
| 355 ChannelLayout channel_layout; |
| 356 int frame_size; |
| 357 int sample_count; |
| 358 int bytes_read = ParseFrameHeader( |
| 359 data, size, &frame_size, &sample_rate, &channel_layout, &sample_count); |
| 360 |
| 361 if (bytes_read <= 0) |
| 362 return bytes_read; |
| 363 |
| 364 // Make sure data contains the entire frame. |
| 365 if (size < frame_size) |
| 366 return 0; |
| 367 |
| 368 DVLOG(2) << " sample_rate " << sample_rate |
| 369 << " channel_layout " << channel_layout |
| 370 << " frame_size " << frame_size; |
| 371 |
| 372 if (config_.IsValidConfig() && |
| 373 (config_.samples_per_second() != sample_rate || |
| 374 config_.channel_layout() != channel_layout)) { |
| 375 // Clear config data so that a config change is initiated. |
| 376 config_ = AudioDecoderConfig(); |
| 377 } |
| 378 |
| 379 if (!config_.IsValidConfig()) { |
| 380 config_.Initialize(kCodecMP3, kSampleFormatF32, channel_layout, |
| 381 sample_rate, NULL, 0, false, false); |
| 382 |
| 383 base::TimeDelta base_timestamp; |
| 384 if (timestamp_helper_) |
| 385 base_timestamp = timestamp_helper_->GetTimestamp(); |
| 386 |
| 387 timestamp_helper_.reset(new AudioTimestampHelper(sample_rate)); |
| 388 timestamp_helper_->SetBaseTimestamp(base_timestamp); |
| 389 |
| 390 VideoDecoderConfig video_config; |
| 391 bool success = config_cb_.Run(config_, video_config); |
| 392 |
| 393 if (!init_cb_.is_null()) |
| 394 base::ResetAndReturn(&init_cb_).Run(success, kInfiniteDuration()); |
| 395 |
| 396 if (!success) |
| 397 return -1; |
| 398 } |
| 399 |
| 400 if (!in_media_segment_) { |
| 401 in_media_segment_ = true; |
| 402 new_segment_cb_.Run(); |
| 403 } |
| 404 |
| 405 BufferQueue audio_buffers; |
| 406 BufferQueue video_buffers; |
| 407 |
| 408 // TODO(acolwell): Change this code to parse as many frames as |
| 409 // possible before calling |new_buffers_cb_|. |
| 410 scoped_refptr<StreamParserBuffer> buffer = |
| 411 StreamParserBuffer::CopyFrom(data, frame_size, true); |
| 412 audio_buffers.push_back(buffer); |
| 413 |
| 414 if (!new_buffers_cb_.Run(audio_buffers, video_buffers)) |
| 415 return -1; |
| 416 |
| 417 timestamp_helper_->AddFrames(sample_count); |
| 418 |
| 419 return frame_size; |
| 420 } |
| 421 |
| 422 int MP3StreamParser::ParseIcecastHeader(const uint8* data, int size) { |
| 423 DVLOG(1) << __FUNCTION__ << "(" << size << ")"; |
| 424 |
| 425 if (size < 4) |
| 426 return 0; |
| 427 |
| 428 if (memcmp("ICY ", data, 4)) |
| 429 return -1; |
| 430 |
| 431 int locate_size = std::min(size, kMaxIcecastHeaderSize); |
| 432 int offset = net::HttpUtil::LocateEndOfHeaders( |
| 433 reinterpret_cast<const char*>(data), locate_size, 4); |
| 434 if (offset < 0) { |
| 435 if (locate_size == kMaxIcecastHeaderSize) { |
| 436 MEDIA_LOG(log_cb_) << "Icecast header is too large."; |
| 437 return -1; |
| 438 } |
| 439 |
| 440 return 0; |
| 441 } |
| 442 |
| 443 return offset; |
| 444 } |
| 445 |
| 446 int MP3StreamParser::ParseID3v1(const uint8* data, int size) { |
| 447 DVLOG(1) << __FUNCTION__ << "(" << size << ")"; |
| 448 |
| 449 if (size < kID3v1Size) |
| 450 return 0; |
| 451 |
| 452 // TODO(acolwell): Add code to actually validate ID3v1 data and |
| 453 // expose it as a metadata text track. |
| 454 return !memcmp(data, "TAG+", 4) ? kID3v1ExtendedSize : kID3v1Size; |
| 455 } |
| 456 |
| 457 int MP3StreamParser::ParseID3v2(const uint8* data, int size) { |
| 458 DVLOG(1) << __FUNCTION__ << "(" << size << ")"; |
| 459 |
| 460 if (size < 10) |
| 461 return 0; |
| 462 |
| 463 BitReader reader(data, size); |
| 464 int32 id; |
| 465 int version; |
| 466 uint8 flags; |
| 467 int32 id3_size; |
| 468 |
| 469 if (!reader.ReadBits(24, &id) || |
| 470 !reader.ReadBits(16, &version) || |
| 471 !reader.ReadBits(8, &flags) || |
| 472 !ParseSyncSafeInt(&reader, &id3_size)) { |
| 473 return -1; |
| 474 } |
| 475 |
| 476 int32 actual_tag_size = 10 + id3_size; |
| 477 |
| 478 // Increment size if 'Footer present' flag is set. |
| 479 if (flags & 0x10) |
| 480 actual_tag_size += 10; |
| 481 |
| 482 // Make sure we have the entire tag. |
| 483 if (size < actual_tag_size) |
| 484 return 0; |
| 485 |
| 486 // TODO(acolwell): Add code to actually validate ID3v2 data and |
| 487 // expose it as a metadata text track. |
| 488 return actual_tag_size; |
| 489 } |
| 490 |
| 491 bool MP3StreamParser::ParseSyncSafeInt(BitReader* reader, int32* value) { |
| 492 *value = 0; |
| 493 for (int i = 0; i < 4; ++i) { |
| 494 uint8 tmp; |
| 495 if (!reader->ReadBits(1, &tmp) || tmp != 0) { |
| 496 MEDIA_LOG(log_cb_) << "ID3 syncsafe integer byte MSb is not 0!"; |
| 497 return false; |
| 498 } |
| 499 |
| 500 if (!reader->ReadBits(7, &tmp)) |
| 501 return false; |
| 502 |
| 503 *value <<= 7; |
| 504 *value += tmp; |
| 505 } |
| 506 |
| 507 return true; |
| 508 } |
| 509 |
| 510 int MP3StreamParser::FindNextValidStartCode(const uint8* data, int size) const { |
| 511 const uint8* start = data; |
| 512 const uint8* end = data + size; |
| 513 |
| 514 while (start < end) { |
| 515 int bytes_left = end - start; |
| 516 const uint8* candidate_start_code = |
| 517 static_cast<const uint8*>(memchr(start, 0xff, bytes_left)); |
| 518 |
| 519 if (!candidate_start_code) |
| 520 return 0; |
| 521 |
| 522 bool parse_header_failed = false; |
| 523 const uint8* sync = candidate_start_code; |
| 524 // Try to find 3 valid frames in a row. 3 was selected to decrease |
| 525 // the probability of false positives. |
| 526 for (int i = 0; i < 3; ++i) { |
| 527 int sync_size = end - sync; |
| 528 int frame_size; |
| 529 int sync_bytes = ParseFrameHeader( |
| 530 sync, sync_size, &frame_size, NULL, NULL, NULL); |
| 531 |
| 532 if (sync_bytes == 0) |
| 533 return 0; |
| 534 |
| 535 if (sync_bytes > 0) { |
| 536 DCHECK_LT(sync_bytes, sync_size); |
| 537 |
| 538 // Skip over this frame so we can check the next one. |
| 539 sync += frame_size; |
| 540 |
| 541 // Make sure the next frame starts inside the buffer. |
| 542 if (sync >= end) |
| 543 return 0; |
| 544 } else { |
| 545 DVLOG(1) << "ParseFrameHeader() " << i << " failed @" << (sync - data); |
| 546 parse_header_failed = true; |
| 547 break; |
| 548 } |
| 549 } |
| 550 |
| 551 if (parse_header_failed) { |
| 552 // One of the frame header parses failed so |candidate_start_code| |
| 553 // did not point to the start of a real frame. Move |start| forward |
| 554 // so we can find the next candidate. |
| 555 start = candidate_start_code + 1; |
| 556 continue; |
| 557 } |
| 558 |
| 559 return candidate_start_code - data; |
| 560 } |
| 561 |
| 562 return 0; |
| 563 } |
| 564 |
| 565 } // namespace media |
OLD | NEW |