Shaka Packager SDK
segmenter.cc
1 // Copyright 2014 Google Inc. All rights reserved.
2 //
3 // Use of this source code is governed by a BSD-style
4 // license that can be found in the LICENSE file or at
5 // https://developers.google.com/open-source/licenses/bsd
6 
7 #include "packager/media/formats/mp4/segmenter.h"
8 
9 #include <algorithm>
10 
11 #include "packager/base/logging.h"
12 #include "packager/media/base/buffer_writer.h"
13 #include "packager/media/base/id3_tag.h"
14 #include "packager/media/base/media_sample.h"
15 #include "packager/media/base/muxer_options.h"
16 #include "packager/media/base/muxer_util.h"
17 #include "packager/media/base/stream_info.h"
18 #include "packager/media/chunking/chunking_handler.h"
19 #include "packager/media/event/progress_listener.h"
20 #include "packager/media/formats/mp4/box_definitions.h"
21 #include "packager/media/formats/mp4/fragmenter.h"
22 #include "packager/media/formats/mp4/key_frame_info.h"
23 #include "packager/version/version.h"
24 
25 namespace shaka {
26 namespace media {
27 namespace mp4 {
28 
29 namespace {
30 
// Converts |time_in_old_scale|, expressed in units of |old_scale|, into the
// equivalent value in units of |new_scale|.
//
// The result is floor(time_in_old_scale * new_scale / old_scale), computed
// with integer arithmetic only. Going through double (as this helper used to)
// loses exactness: e.g. 57 / 100 * 100 evaluates to 56.99999999999999 and was
// truncated to 56, and inputs above 2^53 were silently rounded.
//
// Returns 0 when |old_scale| is 0, since the conversion is undefined there.
uint64_t Rescale(uint64_t time_in_old_scale,
                 uint32_t old_scale,
                 uint32_t new_scale) {
  if (old_scale == 0)
    return 0;

  // Split the input so that the intermediate products stay within 64 bits:
  //   t = whole * old_scale + remainder, with remainder < old_scale < 2^32.
  const uint64_t whole = time_in_old_scale / old_scale;
  const uint64_t remainder = time_in_old_scale % old_scale;

  // |remainder| and |new_scale| are both below 2^32, so their product cannot
  // overflow a uint64_t.
  return whole * new_scale + remainder * new_scale / old_scale;
}
36 
37 } // namespace
38 
39 Segmenter::Segmenter(const MuxerOptions& options,
40  std::unique_ptr<FileType> ftyp,
41  std::unique_ptr<Movie> moov)
42  : options_(options),
43  ftyp_(std::move(ftyp)),
44  moov_(std::move(moov)),
45  moof_(new MovieFragment()),
46  fragment_buffer_(new BufferWriter()),
47  sidx_(new SegmentIndex()) {}
48 
49 Segmenter::~Segmenter() {}
50 
52  const std::vector<std::shared_ptr<const StreamInfo>>& streams,
53  MuxerListener* muxer_listener,
54  ProgressListener* progress_listener) {
55  DCHECK_LT(0u, streams.size());
56  muxer_listener_ = muxer_listener;
57  progress_listener_ = progress_listener;
58  moof_->header.sequence_number = 0;
59 
60  moof_->tracks.resize(streams.size());
61  fragmenters_.resize(streams.size());
62  stream_durations_.resize(streams.size());
63 
64  for (uint32_t i = 0; i < streams.size(); ++i) {
65  moof_->tracks[i].header.track_id = i + 1;
66  if (streams[i]->stream_type() == kStreamVideo) {
67  // Use the first video stream as the reference stream (which is 1-based).
68  if (sidx_->reference_id == 0)
69  sidx_->reference_id = i + 1;
70  }
71  fragmenters_[i].reset(new Fragmenter(streams[i], &moof_->tracks[i]));
72  }
73 
74  if (options_.mp4_params.use_decoding_timestamp_in_timeline) {
75  for (uint32_t i = 0; i < streams.size(); ++i)
76  fragmenters_[i]->set_use_decoding_timestamp_in_timeline(true);
77  }
78 
79  // Choose the first stream if there is no VIDEO.
80  if (sidx_->reference_id == 0)
81  sidx_->reference_id = 1;
82  sidx_->timescale = streams[GetReferenceStreamId()]->time_scale();
83 
84  // Use media duration as progress target.
85  progress_target_ = streams[GetReferenceStreamId()]->duration();
86 
87  // Use the reference stream's time scale as movie time scale.
88  moov_->header.timescale = sidx_->timescale;
89  moof_->header.sequence_number = 1;
90 
91  // Fill in version information.
92  const std::string version = GetPackagerVersion();
93  if (!version.empty()) {
94  moov_->metadata.handler.handler_type = FOURCC_ID32;
95  moov_->metadata.id3v2.language.code = "eng";
96 
97  Id3Tag id3_tag;
98  id3_tag.AddPrivateFrame(GetPackagerProjectUrl(), version);
99  CHECK(id3_tag.WriteToVector(&moov_->metadata.id3v2.id3v2_data));
100  }
101  return DoInitialize();
102 }
103 
105  // Set movie duration. Note that the duration in mvhd, tkhd, mdhd should not
106  // be touched, i.e. kept at 0. The updated moov box will be written to output
107  // file for VOD and static live case only.
108  moov_->extends.header.fragment_duration = 0;
109  for (size_t i = 0; i < stream_durations_.size(); ++i) {
110  uint64_t duration =
111  Rescale(stream_durations_[i], moov_->tracks[i].media.header.timescale,
112  moov_->header.timescale);
113  if (duration > moov_->extends.header.fragment_duration)
114  moov_->extends.header.fragment_duration = duration;
115  }
116  return DoFinalize();
117 }
118 
119 Status Segmenter::AddSample(size_t stream_id, const MediaSample& sample) {
120  // Set default sample duration if it has not been set yet.
121  if (moov_->extends.tracks[stream_id].default_sample_duration == 0) {
122  moov_->extends.tracks[stream_id].default_sample_duration =
123  sample.duration();
124  }
125 
126  DCHECK_LT(stream_id, fragmenters_.size());
127  Fragmenter* fragmenter = fragmenters_[stream_id].get();
128  if (fragmenter->fragment_finalized()) {
129  return Status(error::FRAGMENT_FINALIZED,
130  "Current fragment is finalized already.");
131  }
132 
133  Status status = fragmenter->AddSample(sample);
134  if (!status.ok())
135  return status;
136 
137  if (sample_duration_ == 0)
138  sample_duration_ = sample.duration();
139  stream_durations_[stream_id] += sample.duration();
140  return Status::OK;
141 }
142 
144  const SegmentInfo& segment_info) {
145  if (segment_info.key_rotation_encryption_config) {
146  FinalizeFragmentForKeyRotation(
147  stream_id, segment_info.is_encrypted,
148  *segment_info.key_rotation_encryption_config);
149  }
150 
151  DCHECK_LT(stream_id, fragmenters_.size());
152  Fragmenter* fragmenter = fragmenters_[stream_id].get();
153  DCHECK(fragmenter);
154  Status status = fragmenter->FinalizeFragment();
155  if (!status.ok())
156  return status;
157 
158  // Check if all tracks are ready for fragmentation.
159  for (const std::unique_ptr<Fragmenter>& fragmenter : fragmenters_) {
160  if (!fragmenter->fragment_finalized())
161  return Status::OK;
162  }
163 
164  MediaData mdat;
165  // Data offset relative to 'moof': moof size + mdat header size.
166  // The code will also update box sizes for moof_ and its child boxes.
167  uint64_t data_offset = moof_->ComputeSize() + mdat.HeaderSize();
168  // 'traf' should follow 'mfhd' moof header box.
169  uint64_t next_traf_position = moof_->HeaderSize() + moof_->header.box_size();
170  for (size_t i = 0; i < moof_->tracks.size(); ++i) {
171  TrackFragment& traf = moof_->tracks[i];
172  if (traf.auxiliary_offset.offsets.size() > 0) {
173  DCHECK_EQ(traf.auxiliary_offset.offsets.size(), 1u);
174  DCHECK(!traf.sample_encryption.sample_encryption_entries.empty());
175 
176  next_traf_position += traf.box_size();
177  // SampleEncryption 'senc' box should be the last box in 'traf'.
178  // |auxiliary_offset| should point to the data of SampleEncryption.
179  traf.auxiliary_offset.offsets[0] =
180  next_traf_position - traf.sample_encryption.box_size() +
181  traf.sample_encryption.HeaderSize() +
182  sizeof(uint32_t); // for sample count field in 'senc'
183  }
184  traf.runs[0].data_offset = data_offset + mdat.data_size;
185  mdat.data_size += static_cast<uint32_t>(fragmenters_[i]->data()->Size());
186  }
187 
188  // Generate segment reference.
189  sidx_->references.resize(sidx_->references.size() + 1);
190  fragmenters_[GetReferenceStreamId()]->GenerateSegmentReference(
191  &sidx_->references[sidx_->references.size() - 1]);
192  sidx_->references[sidx_->references.size() - 1].referenced_size =
193  data_offset + mdat.data_size;
194 
195  const uint64_t moof_start_offset = fragment_buffer_->Size();
196 
197  // Write the fragment to buffer.
198  moof_->Write(fragment_buffer_.get());
199  mdat.WriteHeader(fragment_buffer_.get());
200 
201  bool first_key_frame = true;
202  for (const std::unique_ptr<Fragmenter>& fragmenter : fragmenters_) {
203  // https://goo.gl/xcFus6 6. Trick play requirements
204  // 6.10. If using fMP4, I-frame segments must include the 'moof' header
205  // associated with the I-frame. It also implies that only the first key
206  // frame can be included.
207  if (!fragmenter->key_frame_infos().empty() && first_key_frame) {
208  const KeyFrameInfo& key_frame_info =
209  fragmenter->key_frame_infos().front();
210  first_key_frame = false;
211  key_frame_infos_.push_back(
212  {key_frame_info.timestamp, moof_start_offset,
213  fragment_buffer_->Size() - moof_start_offset + key_frame_info.size});
214  }
215  fragment_buffer_->AppendBuffer(*fragmenter->data());
216  }
217 
218  // Increase sequence_number for next fragment.
219  ++moof_->header.sequence_number;
220 
221  for (std::unique_ptr<Fragmenter>& fragmenter : fragmenters_)
222  fragmenter->ClearFragmentFinalized();
223  if (!segment_info.is_subsegment) {
224  Status status = DoFinalizeSegment();
225  // Reset segment information to initial state.
226  sidx_->references.clear();
227  key_frame_infos_.clear();
228  return status;
229  }
230  return Status::OK;
231 }
232 
233 uint32_t Segmenter::GetReferenceTimeScale() const {
234  return moov_->header.timescale;
235 }
236 
237 double Segmenter::GetDuration() const {
238  uint64_t duration = moov_->extends.header.fragment_duration;
239  if (duration == 0) {
240  // Handling the case where this is not properly initialized.
241  return 0.0;
242  }
243  return static_cast<double>(duration) / moov_->header.timescale;
244 }
245 
246 void Segmenter::UpdateProgress(uint64_t progress) {
247  accumulated_progress_ += progress;
248 
249  if (!progress_listener_) return;
250  if (progress_target_ == 0) return;
251  // It might happen that accumulated progress exceeds progress_target due to
252  // computation errors, e.g. rounding error. Cap it so it never reports > 100%
253  // progress.
254  if (accumulated_progress_ >= progress_target_) {
255  progress_listener_->OnProgress(1.0);
256  } else {
257  progress_listener_->OnProgress(static_cast<double>(accumulated_progress_) /
258  progress_target_);
259  }
260 }
261 
262 void Segmenter::SetComplete() {
263  if (!progress_listener_) return;
264  progress_listener_->OnProgress(1.0);
265 }
266 
267 uint32_t Segmenter::GetReferenceStreamId() {
268  DCHECK(sidx_);
269  return sidx_->reference_id - 1;
270 }
271 
272 void Segmenter::FinalizeFragmentForKeyRotation(
273  size_t stream_id,
274  bool fragment_encrypted,
275  const EncryptionConfig& encryption_config) {
276  if (options_.mp4_params.include_pssh_in_stream) {
277  const std::vector<ProtectionSystemSpecificInfo>& system_info =
278  encryption_config.key_system_info;
279  moof_->pssh.resize(system_info.size());
280  for (size_t i = 0; i < system_info.size(); i++)
281  moof_->pssh[i].raw_box = system_info[i].psshs;
282  } else {
283  LOG(WARNING)
284  << "Key rotation and no pssh in stream may not work well together.";
285  }
286 
287  // Skip the following steps if the current fragment is not going to be
288  // encrypted. 'pssh' box needs to be included in the fragment, which is
289  // performed above, regardless of whether the fragment is encrypted. This is
290  // necessary for two reasons: 1) Requesting keys before reaching encrypted
291  // content avoids playback delay due to license requests; 2) In Chrome, CDM
292  // must be initialized before starting the playback and CDM can only be
293  // initialized with a valid 'pssh'.
294  if (!fragment_encrypted)
295  return;
296 
297  DCHECK_LT(stream_id, moof_->tracks.size());
298  TrackFragment& traf = moof_->tracks[stream_id];
299  traf.sample_group_descriptions.resize(traf.sample_group_descriptions.size() +
300  1);
301  SampleGroupDescription& sample_group_description =
302  traf.sample_group_descriptions.back();
303  sample_group_description.grouping_type = FOURCC_seig;
304 
305  sample_group_description.cenc_sample_encryption_info_entries.resize(1);
306  CencSampleEncryptionInfoEntry& sample_group_entry =
307  sample_group_description.cenc_sample_encryption_info_entries.back();
308  sample_group_entry.is_protected = 1;
309  sample_group_entry.per_sample_iv_size = encryption_config.per_sample_iv_size;
310  sample_group_entry.constant_iv = encryption_config.constant_iv;
311  sample_group_entry.crypt_byte_block = encryption_config.crypt_byte_block;
312  sample_group_entry.skip_byte_block = encryption_config.skip_byte_block;
313  sample_group_entry.key_id = encryption_config.key_id;
314 }
315 
316 } // namespace mp4
317 } // namespace media
318 } // namespace shaka
uint32_t HeaderSize() const final
Definition: box.cc:75
virtual bool WriteToVector(std::vector< uint8_t > *output)
Definition: id3_tag.cc:67
STL namespace.
virtual void AddPrivateFrame(const std::string &owner, const std::string &data)
Definition: id3_tag.cc:49
All the methods that are virtual are virtual for mocking.
Status AddSample(const MediaSample &sample)
Definition: segmenter.cc:159
virtual Status FinalizeSegment(uint64_t start_timestamp, uint64_t duration_timestamp, bool is_subsegment)=0
Finalize the (sub)segment.
Definition: segmenter.cc:195
uint32_t ComputeSize()
Definition: box.cc:50
This class listens to progress updates events.
Status Initialize(const StreamInfo &info, ProgressListener *progress_listener, MuxerListener *muxer_listener)
Definition: segmenter.cc:78
Tracks key frame information.
uint32_t box_size()
Definition: box.h:55
virtual uint32_t HeaderSize() const
Definition: box.cc:55
Class to hold a media sample.
Definition: media_sample.h:22
void UpdateProgress(uint64_t progress)
Update segmentation progress using ProgressListener.
Definition: segmenter.cc:270
void WriteHeader(BufferWriter *writer)
Definition: box.cc:38