5 #include "packager/media/formats/wvm/wvm_media_parser.h"
11 #include "packager/base/stl_util.h"
12 #include "packager/base/strings/string_number_conversions.h"
13 #include "packager/media/base/aes_encryptor.h"
14 #include "packager/media/base/audio_stream_info.h"
15 #include "packager/media/base/key_source.h"
16 #include "packager/media/base/media_sample.h"
17 #include "packager/media/base/status.h"
18 #include "packager/media/base/video_stream_info.h"
19 #include "packager/media/filters/avc_decoder_configuration.h"
20 #include "packager/media/formats/mp2t/adts_header.h"
21 #include "packager/media/formats/mp4/aac_audio_specific_config.h"
22 #include "packager/media/formats/mp4/es_descriptor.h"
24 #define HAS_HEADER_EXTENSION(x) ((x != 0xBC) && (x != 0xBE) && (x != 0xBF) \
25 && (x != 0xF0) && (x != 0xF2) && (x != 0xF8) \
29 const uint32_t kMpeg2ClockRate = 90000;
30 const uint32_t kPesOptPts = 0x80;
31 const uint32_t kPesOptDts = 0x40;
32 const uint32_t kPesOptAlign = 0x04;
33 const uint32_t kPsmStreamId = 0xBC;
34 const uint32_t kPaddingStreamId = 0xBE;
35 const uint32_t kIndexMagic = 0x49444d69;
36 const uint32_t kIndexStreamId = 0xBF;
37 const uint32_t kIndexVersion4HeaderSize = 12;
38 const uint32_t kEcmStreamId = 0xF0;
39 const uint32_t kV2MetadataStreamId = 0xF1;
40 const uint32_t kScramblingBitsMask = 0x30;
41 const uint32_t kStartCode1 = 0x00;
42 const uint32_t kStartCode2 = 0x00;
43 const uint32_t kStartCode3 = 0x01;
44 const uint32_t kStartCode4Pack = 0xBA;
45 const uint32_t kStartCode4System = 0xBB;
46 const uint32_t kStartCode4ProgramEnd = 0xB9;
47 const uint32_t kPesStreamIdVideoMask = 0xF0;
48 const uint32_t kPesStreamIdVideo = 0xE0;
49 const uint32_t kPesStreamIdAudioMask = 0xE0;
50 const uint32_t kPesStreamIdAudio = 0xC0;
51 const uint32_t kVersion4 = 4;
52 const int kAdtsHeaderMinSize = 7;
53 const uint8_t kAacSampleSizeBits = 16;
55 const uint8_t kNaluLengthSize = 4;
58 const uint32_t kDefaultSamplingFrequency = 100;
59 const uint16_t kEcmSizeBytes = 80;
60 const uint32_t kInitializationVectorSizeBytes = 16;
62 const uint32_t kEcmContentKeySizeBytes = 16;
63 const uint32_t kEcmDCPFlagsSizeBytes = 3;
64 const uint32_t kEcmCCIFlagsSizeBytes = 1;
65 const uint32_t kEcmFlagsSizeBytes =
66 kEcmCCIFlagsSizeBytes + kEcmDCPFlagsSizeBytes;
67 const uint32_t kEcmPaddingSizeBytes = 12;
68 const uint32_t kAssetKeySizeBytes = 16;
70 const uint8_t kDefaultAudioStreamId = kPesStreamIdAudio;
71 const uint8_t kDefaultVideoStreamId = kPesStreamIdVideo;
88 namespace edash_packager {
92 WvmMediaParser::WvmMediaParser()
93 : is_initialized_(false),
94 parse_state_(StartCode1),
97 metadata_is_complete_(false),
98 current_program_id_(0),
100 prev_pes_stream_id_(0),
101 pes_packet_bytes_(0),
104 prev_pes_flags_1_(0),
105 pes_header_data_bytes_(0),
109 index_program_id_(0),
111 crypto_unit_start_pos_(0),
113 decryption_key_source_(NULL) {
116 WvmMediaParser::~WvmMediaParser() {}
118 void WvmMediaParser::Init(
const InitCB& init_cb,
119 const NewSampleCB& new_sample_cb,
121 DCHECK(!is_initialized_);
122 DCHECK(!init_cb.is_null());
123 DCHECK(!new_sample_cb.is_null());
124 decryption_key_source_ = decryption_key_source;
126 new_sample_cb_ = new_sample_cb;
129 bool WvmMediaParser::Parse(
const uint8_t* buf,
int size) {
130 uint32_t num_bytes, prev_size;
131 num_bytes = prev_size = 0;
132 const uint8_t* read_ptr = buf;
133 const uint8_t* end = read_ptr + size;
135 while (read_ptr < end) {
136 switch (parse_state_) {
138 if (*read_ptr == kStartCode1) {
139 parse_state_ = StartCode2;
143 if (*read_ptr == kStartCode2) {
144 parse_state_ = StartCode3;
146 parse_state_ = StartCode1;
150 if (*read_ptr == kStartCode3) {
151 parse_state_ = StartCode4;
153 parse_state_ = StartCode1;
158 case kStartCode4Pack:
159 parse_state_ = PackHeader1;
161 case kStartCode4System:
162 parse_state_ = SystemHeader1;
164 case kStartCode4ProgramEnd:
165 parse_state_ = ProgramEnd;
168 parse_state_ = PesStreamId;
173 parse_state_ = PackHeader2;
176 parse_state_ = PackHeader3;
179 parse_state_ = PackHeader4;
182 parse_state_ = PackHeader5;
185 parse_state_ = PackHeader6;
188 parse_state_ = PackHeader7;
191 parse_state_ = PackHeader8;
194 parse_state_ = PackHeader9;
197 parse_state_ = PackHeader10;
200 skip_bytes_ = *read_ptr & 0x07;
201 parse_state_ = PackHeaderStuffingSkip;
204 skip_bytes_ = *read_ptr;
206 parse_state_ = SystemHeader2;
209 skip_bytes_ |= *read_ptr;
210 parse_state_ = SystemHeaderSkip;
212 case PackHeaderStuffingSkip:
213 if ((end - read_ptr) >= (int32_t)skip_bytes_) {
214 read_ptr += skip_bytes_;
216 parse_state_ = StartCode1;
218 skip_bytes_ -= (end - read_ptr);
222 case SystemHeaderSkip:
223 if ((end - read_ptr) >= (int32_t)skip_bytes_) {
224 read_ptr += skip_bytes_;
226 parse_state_ = StartCode1;
228 uint32_t remaining_size = end - read_ptr;
229 skip_bytes_ -= remaining_size;
234 pes_stream_id_ = *read_ptr;
235 if (!metadata_is_complete_ &&
236 (pes_stream_id_ != kPsmStreamId) &&
237 (pes_stream_id_ != kIndexStreamId) &&
238 (pes_stream_id_ != kEcmStreamId) &&
239 (pes_stream_id_ != kV2MetadataStreamId) &&
240 (pes_stream_id_ != kPaddingStreamId)) {
241 metadata_is_complete_ =
true;
243 parse_state_ = PesPacketLength1;
245 case PesPacketLength1:
246 pes_packet_bytes_ = *read_ptr;
247 pes_packet_bytes_ <<= 8;
248 parse_state_ = PesPacketLength2;
250 case PesPacketLength2:
251 pes_packet_bytes_ |= *read_ptr;
252 if (HAS_HEADER_EXTENSION(pes_stream_id_)) {
253 parse_state_ = PesExtension1;
255 pes_flags_1_ = pes_flags_2_ = 0;
256 pes_header_data_bytes_ = 0;
257 parse_state_ = PesPayload;
261 prev_pes_flags_1_ = pes_flags_1_;
262 pes_flags_1_ = *read_ptr;
264 parse_state_ = PesExtension2;
267 pes_flags_2_ = *read_ptr;
269 parse_state_ = PesExtension3;
272 pes_header_data_bytes_ = *read_ptr;
274 if (pes_flags_2_ & kPesOptPts) {
277 parse_state_ = PesHeaderData;
281 timestamp_ = (*read_ptr & 0x0E);
282 --pes_header_data_bytes_;
288 timestamp_ |= *read_ptr;
289 --pes_header_data_bytes_;
295 timestamp_ |= *read_ptr >> 1;
296 --pes_header_data_bytes_;
302 timestamp_ |= *read_ptr;
303 --pes_header_data_bytes_;
309 timestamp_ |= *read_ptr >> 1;
311 --pes_header_data_bytes_;
313 if (pes_flags_2_ & kPesOptDts) {
317 parse_state_ = PesHeaderData;
321 timestamp_ = (*read_ptr & 0x0E);
322 --pes_header_data_bytes_;
328 timestamp_ |= *read_ptr;
329 --pes_header_data_bytes_;
335 timestamp_ |= *read_ptr >> 1;
336 --pes_header_data_bytes_;
342 timestamp_ |= *read_ptr;
343 --pes_header_data_bytes_;
349 timestamp_ |= *read_ptr >> 1;
351 --pes_header_data_bytes_;
353 parse_state_ = PesHeaderData;
356 num_bytes = end - read_ptr;
357 if (num_bytes >= pes_header_data_bytes_) {
358 num_bytes = pes_header_data_bytes_;
359 parse_state_ = PesPayload;
361 pes_header_data_bytes_ -= num_bytes;
362 pes_packet_bytes_ -= num_bytes;
363 read_ptr += num_bytes;
366 switch (pes_stream_id_) {
369 parse_state_ = PsmPayload;
371 case kPaddingStreamId:
372 parse_state_ = Padding;
376 parse_state_ = EcmPayload;
379 parse_state_ = IndexPayload;
382 if (!DemuxNextPes(
false)) {
385 parse_state_ = EsPayload;
389 num_bytes = end - read_ptr;
390 if (num_bytes >= pes_packet_bytes_) {
391 num_bytes = pes_packet_bytes_;
392 parse_state_ = StartCode1;
395 pes_packet_bytes_ -= num_bytes;
396 prev_size = psm_data_.size();
397 psm_data_.resize(prev_size + num_bytes);
398 memcpy(&psm_data_[prev_size], read_ptr, num_bytes);
400 read_ptr += num_bytes;
403 num_bytes = end - read_ptr;
404 if (num_bytes >= pes_packet_bytes_) {
405 num_bytes = pes_packet_bytes_;
406 parse_state_ = StartCode1;
409 pes_packet_bytes_ -= num_bytes;
410 prev_size = ecm_.size();
411 ecm_.resize(prev_size + num_bytes);
412 memcpy(&ecm_[prev_size], read_ptr, num_bytes);
414 if ((pes_packet_bytes_ == 0) && !ecm_.empty()) {
419 read_ptr += num_bytes;
422 num_bytes = end - read_ptr;
423 if (num_bytes >= pes_packet_bytes_) {
424 num_bytes = pes_packet_bytes_;
425 parse_state_ = StartCode1;
428 pes_packet_bytes_ -= num_bytes;
429 prev_size = index_data_.size();
430 index_data_.resize(prev_size + num_bytes);
431 memcpy(&index_data_[prev_size], read_ptr, num_bytes);
433 if (pes_packet_bytes_ == 0 && !index_data_.empty()) {
434 if (!metadata_is_complete_) {
435 if (!ParseIndexEntry()) {
440 read_ptr += num_bytes;
443 num_bytes = end - read_ptr;
444 if (num_bytes >= pes_packet_bytes_) {
445 num_bytes = pes_packet_bytes_;
446 parse_state_ = StartCode1;
448 pes_packet_bytes_ -= num_bytes;
449 if (pes_stream_id_ != kV2MetadataStreamId) {
450 sample_data_.resize(sample_data_.size() + num_bytes);
451 memcpy(&sample_data_[sample_data_.size() - num_bytes], read_ptr,
454 prev_pes_stream_id_ = pes_stream_id_;
455 read_ptr += num_bytes;
458 num_bytes = end - read_ptr;
459 if (num_bytes >= pes_packet_bytes_) {
460 num_bytes = pes_packet_bytes_;
461 parse_state_ = StartCode1;
463 pes_packet_bytes_ -= num_bytes;
464 read_ptr += num_bytes;
467 parse_state_ = StartCode1;
468 metadata_is_complete_ =
true;
469 if (!DemuxNextPes(
true)) {
477 parse_state_ = StartCode1;
478 prev_media_sample_data_.Reset();
479 current_program_id_++;
492 bool WvmMediaParser::EmitLastSample(uint32_t stream_id,
493 scoped_refptr<MediaSample>& new_sample) {
494 std::string key = base::UintToString(current_program_id_)
496 .append(base::UintToString(stream_id));
497 std::map<std::string, uint32_t>::iterator it =
498 program_demux_stream_map_.find(key);
499 if (it == program_demux_stream_map_.end())
501 return EmitSample(stream_id, (*it).second, new_sample,
true);
504 bool WvmMediaParser::EmitPendingSamples() {
506 while (!media_sample_queue_.empty()) {
507 DemuxStreamIdMediaSample& demux_stream_media_sample =
508 media_sample_queue_.front();
509 if (!EmitSample(demux_stream_media_sample.parsed_audio_or_video_stream_id,
510 demux_stream_media_sample.demux_stream_id,
511 demux_stream_media_sample.media_sample,
515 media_sample_queue_.pop_front();
520 bool WvmMediaParser::Flush() {
523 if (prev_media_sample_data_.audio_sample != NULL) {
524 if (!EmitLastSample(prev_pes_stream_id_,
525 prev_media_sample_data_.audio_sample)) {
526 LOG(ERROR) <<
"Did not emit last sample for audio stream with ID = "
527 << prev_pes_stream_id_;
531 if (prev_media_sample_data_.video_sample != NULL) {
532 if (!EmitLastSample(prev_pes_stream_id_,
533 prev_media_sample_data_.video_sample)) {
534 LOG(ERROR) <<
"Did not emit last sample for video stream with ID = "
535 << prev_pes_stream_id_;
542 bool WvmMediaParser::ParseIndexEntry() {
545 if (current_program_id_ > 0) {
548 uint32_t index_size = 0;
549 if (index_data_.size() < kIndexVersion4HeaderSize) {
553 const uint8_t* read_ptr = vector_as_array(&index_data_);
554 if (ntohlFromBuffer(read_ptr) != kIndexMagic) {
560 uint32_t version = ntohlFromBuffer(read_ptr);
562 if (version == kVersion4) {
563 index_size = kIndexVersion4HeaderSize + ntohlFromBuffer(read_ptr);
564 if (index_data_.size() < index_size) {
568 read_ptr +=
sizeof(uint32_t);
571 uint32_t index_metadata_max_size = index_size - kIndexVersion4HeaderSize;
572 if (index_metadata_max_size <
sizeof(uint8_t)) {
577 uint64_t track_duration = 0;
578 int16_t trick_play_rate = 0;
579 uint32_t sampling_frequency = kDefaultSamplingFrequency;
580 uint32_t time_scale = kMpeg2ClockRate;
581 uint16_t video_width = 0;
582 uint16_t video_height = 0;
583 uint32_t pixel_width = 0;
584 uint32_t pixel_height = 0;
585 uint8_t nalu_length_size = kNaluLengthSize;
586 uint8_t num_channels = 0;
587 int audio_pes_stream_id = 0;
588 int video_pes_stream_id = 0;
589 bool has_video =
false;
590 bool has_audio =
false;
591 std::vector<uint8_t> audio_codec_config;
592 std::vector<uint8_t> video_codec_config;
593 uint8_t num_index_entries = *read_ptr;
595 --index_metadata_max_size;
597 for (uint8_t idx = 0; idx < num_index_entries; ++idx) {
598 if (index_metadata_max_size < (2 *
sizeof(uint8_t)) +
sizeof(uint32_t)) {
601 uint8_t tag = *read_ptr;
603 uint8_t type = *read_ptr;
605 uint32_t length = ntohlFromBuffer(read_ptr);
606 read_ptr +=
sizeof(uint32_t);
607 index_metadata_max_size -= (2 *
sizeof(uint8_t)) +
sizeof(uint32_t);
608 if (index_metadata_max_size < length) {
613 std::vector<uint8_t> binary_data;
614 switch (Type(type)) {
616 if (length ==
sizeof(uint8_t)) {
617 tagtype = GetTag(tag, length, read_ptr, &value);
623 if (length ==
sizeof(int8_t)) {
624 tagtype = GetTag(tag, length, read_ptr, &value);
630 if (length ==
sizeof(uint16_t)) {
631 tagtype = GetTag(tag, length, read_ptr, &value);
637 if (length ==
sizeof(int16_t)) {
638 tagtype = GetTag(tag, length, read_ptr, &value);
644 if (length ==
sizeof(uint32_t)) {
645 tagtype = GetTag(tag, length, read_ptr, &value);
651 if (length ==
sizeof(int32_t)) {
652 tagtype = GetTag(tag, length, read_ptr, &value);
658 if (length ==
sizeof(uint64_t)) {
659 tagtype = GetTag(tag, length, read_ptr, &value);
665 if (length ==
sizeof(int64_t)) {
666 tagtype = GetTag(tag, length, read_ptr, &value);
672 case Type_BinaryData:
673 binary_data.assign(read_ptr, read_ptr + length);
682 track_duration = value;
684 case TrackTrickPlayRate:
685 trick_play_rate = value;
688 video_pes_stream_id = value;
691 audio_pes_stream_id = value;
694 video_width = (uint16_t)value;
697 video_height = (uint16_t)value;
699 case AudioNumChannels:
700 num_channels = (uint8_t)value;
708 case VideoPixelWidth:
709 pixel_width =
static_cast<uint32_t
>(value);
711 case VideoPixelHeight:
712 pixel_height =
static_cast<uint32_t
>(value);
714 case Audio_EsDescriptor: {
715 mp4::ESDescriptor descriptor;
716 if (!descriptor.Parse(binary_data)) {
718 "Could not extract AudioSpecificConfig from ES_Descriptor";
721 audio_codec_config = descriptor.decoder_specific_info();
724 case Audio_EC3SpecificData:
725 case Audio_DtsSpecificData:
726 case Audio_AC3SpecificData:
727 LOG(ERROR) <<
"Audio type not supported.";
729 case AVCDecoderConfigurationRecord:
730 video_codec_config = binary_data;
737 index_metadata_max_size -= length;
740 index_size = read_ptr - vector_as_array(&index_data_);
743 VideoCodec video_codec = kCodecH264;
744 stream_infos_.push_back(
new VideoStreamInfo(
745 stream_id_count_, time_scale, track_duration, video_codec,
746 std::string(), std::string(), video_width, video_height,
747 pixel_width, pixel_height, trick_play_rate, nalu_length_size,
748 vector_as_array(&video_codec_config), video_codec_config.size(),
750 program_demux_stream_map_[base::UintToString(index_program_id_) +
":" +
751 base::UintToString(video_pes_stream_id ?
752 video_pes_stream_id :
753 kDefaultVideoStreamId)] =
757 AudioCodec audio_codec = kCodecAAC;
759 stream_infos_.push_back(
new AudioStreamInfo(
760 stream_id_count_, time_scale, track_duration, audio_codec,
761 std::string(), std::string(), kAacSampleSizeBits, num_channels,
762 sampling_frequency, 0, 0, vector_as_array(&audio_codec_config),
763 audio_codec_config.size(),
true));
764 program_demux_stream_map_[base::UintToString(index_program_id_) +
":" +
765 base::UintToString(audio_pes_stream_id ?
766 audio_pes_stream_id :
767 kDefaultAudioStreamId)] =
777 bool WvmMediaParser::DemuxNextPes(
bool is_program_end) {
778 bool output_encrypted_sample =
false;
779 if (!sample_data_.empty() && (prev_pes_flags_1_ & kScramblingBitsMask)) {
781 if (!content_decryptor_) {
782 output_encrypted_sample =
true;
784 content_decryptor_->Decrypt(&sample_data_[crypto_unit_start_pos_],
785 sample_data_.size() - crypto_unit_start_pos_,
786 &sample_data_[crypto_unit_start_pos_]);
791 if ((pes_flags_2_ & kPesOptPts) || is_program_end) {
792 if (!sample_data_.empty()) {
793 if (!Output(output_encrypted_sample)) {
797 StartMediaSampleDemux();
800 crypto_unit_start_pos_ = sample_data_.size();
804 void WvmMediaParser::StartMediaSampleDemux() {
805 bool is_key_frame = ((pes_flags_1_ & kPesOptAlign) != 0);
807 media_sample_->set_dts(dts_);
808 media_sample_->set_pts(pts_);
809 media_sample_->set_is_key_frame(is_key_frame);
811 sample_data_.clear();
814 bool WvmMediaParser::Output(
bool output_encrypted_sample) {
815 if (output_encrypted_sample) {
816 media_sample_->set_data(vector_as_array(&sample_data_),
817 sample_data_.size());
818 media_sample_->set_is_encrypted(
true);
820 if ((prev_pes_stream_id_ & kPesStreamIdVideoMask) == kPesStreamIdVideo) {
822 std::vector<uint8_t> nal_unit_stream;
823 if (!byte_to_unit_stream_converter_.ConvertByteStreamToNalUnitStream(
824 vector_as_array(&sample_data_), sample_data_.size(),
826 LOG(ERROR) <<
"Could not convert h.264 byte stream sample";
829 media_sample_->set_data(nal_unit_stream.data(), nal_unit_stream.size());
830 if (!is_initialized_) {
833 std::vector<uint8_t> decoder_config_record;
834 byte_to_unit_stream_converter_.GetAVCDecoderConfigurationRecord(
835 &decoder_config_record);
836 for (uint32_t i = 0; i < stream_infos_.size(); i++) {
837 if (stream_infos_[i]->stream_type() == media::kStreamVideo &&
838 stream_infos_[i]->codec_string().empty()) {
839 const std::vector<uint8_t>* stream_config;
840 if (stream_infos_[i]->extra_data().empty()) {
843 stream_infos_[i]->set_extra_data(decoder_config_record);
844 stream_config = &decoder_config_record;
847 stream_config = &stream_infos_[i]->extra_data();
849 DCHECK(stream_config);
851 VideoStreamInfo* video_stream_info =
852 reinterpret_cast<VideoStreamInfo*
>(stream_infos_[i].get());
853 AVCDecoderConfiguration avc_config;
854 if (!avc_config.Parse(*stream_config)) {
855 LOG(WARNING) <<
"Failed to parse AVCDecoderConfigurationRecord. "
856 "Using computed configuration record instead.";
857 video_stream_info->set_extra_data(decoder_config_record);
858 if (!avc_config.Parse(decoder_config_record)) {
859 LOG(ERROR) <<
"Failed to parse AVCDecoderConfigurationRecord.";
863 video_stream_info->set_codec_string(avc_config.GetCodecString());
865 if (avc_config.pixel_width() != video_stream_info->pixel_width() ||
866 avc_config.pixel_height() !=
867 video_stream_info->pixel_height()) {
868 LOG_IF(WARNING, video_stream_info->pixel_width() != 0 ||
869 video_stream_info->pixel_height() != 0)
870 <<
"Pixel aspect ratio in WVM metadata ("
871 << video_stream_info->pixel_width() <<
","
872 << video_stream_info->pixel_height()
873 <<
") does not match with SAR in "
874 "AVCDecoderConfigurationRecord ("
875 << avc_config.pixel_width() <<
","
876 << avc_config.pixel_height()
877 <<
"). Use AVCDecoderConfigurationRecord.";
878 video_stream_info->set_pixel_width(avc_config.pixel_width());
879 video_stream_info->set_pixel_height(avc_config.pixel_height());
881 if (avc_config.coded_width() != video_stream_info->width() ||
882 avc_config.coded_height() != video_stream_info->height()) {
883 LOG(WARNING) <<
"Resolution in WVM metadata ("
884 << video_stream_info->width() <<
","
885 << video_stream_info->height()
886 <<
") does not match with resolution in "
887 "AVCDecoderConfigurationRecord ("
888 << avc_config.coded_width() <<
","
889 << avc_config.coded_height()
890 <<
"). Use AVCDecoderConfigurationRecord.";
891 video_stream_info->set_width(avc_config.coded_width());
892 video_stream_info->set_height(avc_config.coded_height());
897 }
else if ((prev_pes_stream_id_ & kPesStreamIdAudioMask) ==
901 vector_as_array(&sample_data_), kAdtsHeaderMinSize);
902 media::mp2t::AdtsHeader adts_header;
903 const uint8_t* frame_ptr = vector_as_array(&sample_data_);
904 if (!adts_header.Parse(frame_ptr, frame_size)) {
905 LOG(ERROR) <<
"Could not parse ADTS header";
908 size_t header_size = adts_header.GetAdtsHeaderSize(frame_ptr,
910 media_sample_->set_data(frame_ptr + header_size,
911 frame_size - header_size);
912 if (!is_initialized_) {
913 for (uint32_t i = 0; i < stream_infos_.size(); i++) {
914 if (stream_infos_[i]->stream_type() == media::kStreamAudio &&
915 stream_infos_[i]->codec_string().empty()) {
916 AudioStreamInfo* audio_stream_info =
917 reinterpret_cast<AudioStreamInfo*
>(stream_infos_[i].get());
918 if (audio_stream_info->extra_data().empty()) {
921 audio_stream_info->set_sampling_frequency(
922 adts_header.GetSamplingFrequency());
923 std::vector<uint8_t> audio_specific_config;
924 if (!adts_header.GetAudioSpecificConfig(&audio_specific_config)) {
925 LOG(ERROR) <<
"Could not compute AACaudiospecificconfig";
928 audio_stream_info->set_extra_data(audio_specific_config);
929 audio_stream_info->set_codec_string(
931 kCodecAAC, adts_header.GetObjectType()));
935 mp4::AACAudioSpecificConfig aac_config;
936 if (!aac_config.Parse(stream_infos_[i]->extra_data())) {
937 LOG(ERROR) <<
"Could not parse AACAudioSpecificconfig";
940 audio_stream_info->set_sampling_frequency(aac_config.frequency());
941 audio_stream_info->set_codec_string(
943 kCodecAAC, aac_config.audio_object_type()));
951 if (!is_initialized_) {
952 bool all_streams_have_config =
true;
954 for (uint32_t i = 0; i < stream_infos_.size(); i++) {
955 if (stream_infos_[i]->codec_string().empty()) {
956 all_streams_have_config =
false;
960 if (all_streams_have_config) {
961 init_cb_.Run(stream_infos_);
962 is_initialized_ =
true;
966 DCHECK_GT(media_sample_->data_size(), 0UL);
967 std::string key = base::UintToString(current_program_id_).append(
":")
968 .append(base::UintToString(prev_pes_stream_id_));
969 std::map<std::string, uint32_t>::iterator it =
970 program_demux_stream_map_.find(key);
971 if (it == program_demux_stream_map_.end()) {
976 DemuxStreamIdMediaSample demux_stream_media_sample;
977 demux_stream_media_sample.parsed_audio_or_video_stream_id =
979 demux_stream_media_sample.demux_stream_id = (*it).second;
980 demux_stream_media_sample.media_sample = media_sample_;
982 if (!is_initialized_) {
983 media_sample_queue_.push_back(demux_stream_media_sample);
986 while (!media_sample_queue_.empty()) {
987 if (!EmitPendingSamples())
991 if (!EmitSample(prev_pes_stream_id_, (*it).second, media_sample_,
false))
997 bool WvmMediaParser::EmitSample(uint32_t parsed_audio_or_video_stream_id,
999 scoped_refptr<MediaSample>& new_sample,
1000 bool isLastSample) {
1003 if ((parsed_audio_or_video_stream_id & kPesStreamIdVideoMask) ==
1004 kPesStreamIdVideo) {
1005 new_sample->set_duration(prev_media_sample_data_.video_sample_duration);
1006 }
else if ((parsed_audio_or_video_stream_id & kPesStreamIdAudioMask) ==
1007 kPesStreamIdAudio) {
1008 new_sample->set_duration(prev_media_sample_data_.audio_sample_duration);
1010 if (!new_sample_cb_.Run(stream_id, new_sample)) {
1011 LOG(ERROR) <<
"Failed to process the last sample.";
1019 if ((parsed_audio_or_video_stream_id & kPesStreamIdVideoMask) ==
1020 kPesStreamIdVideo) {
1021 if (prev_media_sample_data_.video_sample == NULL) {
1022 prev_media_sample_data_.video_sample = new_sample;
1023 prev_media_sample_data_.video_stream_id = stream_id;
1026 prev_media_sample_data_.video_sample->set_duration(
1027 new_sample->dts() - prev_media_sample_data_.video_sample->dts());
1028 prev_media_sample_data_.video_sample_duration =
1029 prev_media_sample_data_.video_sample->duration();
1030 if (!new_sample_cb_.Run(prev_media_sample_data_.video_stream_id,
1031 prev_media_sample_data_.video_sample)) {
1032 LOG(ERROR) <<
"Failed to process the video sample.";
1035 prev_media_sample_data_.video_sample = new_sample;
1036 prev_media_sample_data_.video_stream_id = stream_id;
1037 }
else if ((parsed_audio_or_video_stream_id & kPesStreamIdAudioMask) ==
1038 kPesStreamIdAudio) {
1039 if (prev_media_sample_data_.audio_sample == NULL) {
1040 prev_media_sample_data_.audio_sample = new_sample;
1041 prev_media_sample_data_.audio_stream_id = stream_id;
1044 prev_media_sample_data_.audio_sample->set_duration(
1045 new_sample->dts() - prev_media_sample_data_.audio_sample->dts());
1046 prev_media_sample_data_.audio_sample_duration =
1047 prev_media_sample_data_.audio_sample->duration();
1048 if (!new_sample_cb_.Run(prev_media_sample_data_.audio_stream_id,
1049 prev_media_sample_data_.audio_sample)) {
1050 LOG(ERROR) <<
"Failed to process the audio sample.";
1053 prev_media_sample_data_.audio_sample = new_sample;
1054 prev_media_sample_data_.audio_stream_id = stream_id;
1059 bool WvmMediaParser::GetAssetKey(
const uint32_t asset_id,
1060 EncryptionKey* encryption_key) {
1061 DCHECK(decryption_key_source_);
1062 Status status = decryption_key_source_->FetchKeys(asset_id);
1064 LOG(ERROR) <<
"Fetch Key(s) failed for AssetID = " << asset_id
1065 <<
", error = " << status;
1069 status = decryption_key_source_->GetKey(KeySource::TRACK_TYPE_HD,
1072 LOG(ERROR) <<
"Fetch Key(s) failed for AssetID = " << asset_id
1073 <<
", error = " << status;
1080 bool WvmMediaParser::ProcessEcm() {
1082 if (!decryption_key_source_)
1085 if (current_program_id_ > 0) {
1088 if (ecm_.size() != kEcmSizeBytes) {
1089 LOG(ERROR) <<
"Unexpected ECM size = " << ecm_.size()
1090 <<
", expected size = " << kEcmSizeBytes;
1093 const uint8_t* ecm_data = ecm_.data();
1095 ecm_data +=
sizeof(uint32_t);
1096 ecm_data +=
sizeof(uint32_t);
1097 ecm_data +=
sizeof(uint32_t);
1098 uint32_t asset_id = ntohlFromBuffer(ecm_data);
1099 if (asset_id == 0) {
1100 LOG(ERROR) <<
"AssetID in ECM is not valid.";
1103 ecm_data +=
sizeof(uint32_t);
1104 EncryptionKey encryption_key;
1105 if (!GetAssetKey(asset_id, &encryption_key)) {
1108 if (encryption_key.key.size() < kAssetKeySizeBytes) {
1109 LOG(ERROR) <<
"Asset Key size of " << encryption_key.key.size()
1110 <<
" for AssetID = " << asset_id
1111 <<
" is less than minimum asset key size.";
1117 std::vector<uint8_t> asset_key(
1118 encryption_key.key.begin(),
1119 encryption_key.key.begin() + kAssetKeySizeBytes);
1120 std::vector<uint8_t> iv(kInitializationVectorSizeBytes);
1121 AesCbcCtsDecryptor asset_decryptor;
1122 if (!asset_decryptor.InitializeWithIv(asset_key, iv)) {
1123 LOG(ERROR) <<
"Failed to initialize asset_decryptor.";
1127 const size_t content_key_buffer_size =
1128 kEcmFlagsSizeBytes + kEcmContentKeySizeBytes +
1129 kEcmPaddingSizeBytes;
1130 std::vector<uint8_t> content_key_buffer(content_key_buffer_size);
1131 asset_decryptor.Decrypt(
1132 ecm_data, content_key_buffer_size, vector_as_array(&content_key_buffer));
1134 std::vector<uint8_t> decrypted_content_key_vec(
1135 content_key_buffer.begin() + 4,
1136 content_key_buffer.begin() + 20);
1137 scoped_ptr<AesCbcCtsDecryptor> content_decryptor(
new AesCbcCtsDecryptor);
1138 if (!content_decryptor->InitializeWithIv(decrypted_content_key_vec, iv)) {
1139 LOG(ERROR) <<
"Failed to initialize content decryptor.";
1143 content_decryptor_ = content_decryptor.Pass();
1147 DemuxStreamIdMediaSample::DemuxStreamIdMediaSample() :
1149 parsed_audio_or_video_stream_id(0) {}
1151 DemuxStreamIdMediaSample::~DemuxStreamIdMediaSample() {}
1153 PrevSampleData::PrevSampleData() {
1157 PrevSampleData::~PrevSampleData() {}
1159 void PrevSampleData::Reset() {
1160 audio_sample = NULL;
1161 video_sample = NULL;
1162 audio_stream_id = 0;
1163 video_stream_id = 0;
1164 audio_sample_duration = 0;
1165 video_sample_duration = 0;