shaka-packager/packager/media/formats/mp4/webvtt_fragmenter.h

// Copyright 2015 Google Inc. All rights reserved.
//
// Use of this source code is governed by a BSD-style
// license that can be found in the LICENSE file or at
// https://developers.google.com/open-source/licenses/bsd

#ifndef PACKAGER_MEDIA_FORMATS_MP4_FRAGMENTER_H_
#define PACKAGER_MEDIA_FORMATS_MP4_FRAGMENTER_H_

#include <stdint.h>
#include <list>

#include "packager/media/base/status.h"
#include "packager/media/formats/mp4/box_definitions.h"
#include "packager/media/formats/webvtt/webvtt_media_parser.h"

namespace shaka {
namespace media {
namespace mp4 {

/// Appends box to vector.
/// @param box is the box to be serialized.
/// @param output_vector is where the data is appended.
void AppendBoxToVector(Box* box, std::vector<uint8_t>* output_vector);

/// According to the spec, when cues overlap, samples must be created.\n
/// The example below has 2 WebVTT cues:\n
/// 00:01:00.000 --> 00:02:00.000\n
/// hello\n
///\n
/// 00:01:15.000 --> 00:02:15.000\n
/// how are you?\n
///\n
/// These are added (AddSample()) as 2 samples but must be split into 3 samples
/// and 4 cues ('vttc' boxes).\n
/// First sample:\n
///  start_time: 00:01:00.000\n
///  duration: 15 seconds\n
///  cue payload: hello\n
///\n
/// Second sample:\n
///  start_time: 00:01:15.000\n
///  duration: 45 seconds\n
///  cue payload: hello\n
///  cue payload: how are you?\n
///\n
/// Third sample:\n
///  start_time: 00:02:00.000\n
///  duration: 15 seconds\n
///  cue payload: how are you?\n
///\n
/// This class buffers the samples that are passed to AddSample() and creates
/// more samples as necessary.
// TODO(rkuroiwa): Rename this to WebVttSampleConverter, and put this in
// webvtt parser.
// For now, the output (from PopSample()) should still be in ISO-BMFF box form;
// and also to signal that, should have different types for TextStreamInfo. e.g.
// TextStreamInfo::type() returns kIsoBmffStreamText.
class WebVttFragmenter {
 public:
  WebVttFragmenter();
  ~WebVttFragmenter();

  /// Add a sample.
  /// @param sample is the sample to be added. It should contain one VTT cue.
  void PushSample(std::shared_ptr<MediaSample> sample);

  /// Process all the buffered samples.
  /// This finalizes the object and further calls to PushSample() may result in
  /// an undefined behavior.
  void Flush();

  /// @return The number of samples that are processed and ready to be popped.
  size_t ReadySamplesSize();

  /// Returns a MediaSample that is non-overlapping with the previous samples
  /// that it has output. The data in the sample is one or more ISO-BMFF boxes
  /// for the duration of the sample.
  /// @return The first sample that is ready to be processed.
  std::shared_ptr<MediaSample> PopSample();

 private:
  // Handle |cues_| except the last item, and create samples from them.
  // All cues that overlap with the latest cue are not processed.
  // Usually the last cue (and cues that overlap with it) should not be
  // processed right away because the following cues may overlap with the latest
  // cue or the existing cues.
  // If a cue has been proceessed, then this returns true.
  bool HandleAllCuesButLatest();

  // Same as HandleAllCuesButLatest() but it also includes the latest cue.
  // If a cue has been processed, then this returns true.
  bool HandleAllCues();

  // Sweep line algorithm that handles the cues in |cues_|.
  // This does not erase |cues_|.
  // If a cue has been processed, this returns true.
  // |sweep_line| is the start time and |sweep_stop_time| is when the sweep
  // should stop.
  bool SweepCues(uint64_t sweep_line, uint64_t sweep_stop_time);

  // This is going to be in 'mdat' box. Keep this around until a sample is
  // ready.
  std::list<Cue> cues_;

  // For comment samples.
  std::list<VTTAdditionalTextBox> additional_texts_;

  // Samples that are ready to be processed.
  std::list<std::shared_ptr<MediaSample>> ready_samples_;

  // This keeps track of the max end time of the processed cues which is the
  // start time of the next cue. Used to check if cue_current_time has to be set
  // or an empty cue (gap) has to be added.
  uint64_t next_cue_start_time_;

  DISALLOW_COPY_AND_ASSIGN(WebVttFragmenter);
};

}  // namespace shaka
}  // namespace media
}  // namespace edash_packager

#endif  // PACKAGER_MEDIA_FORMATS_MP4_FRAGMENTER_H_