// This file defines the protocol between Muxer and classes for generating MPD
// files.
// This schema relies on proto2 features: the messages below use explicit
// [default = ...] field options, which proto3 does not support.
syntax = "proto2";

package shaka;
// A [begin, end] pair of unsigned 64-bit positions. MediaInfo uses this type
// for its |init_range| and |index_range| fields.
// NOTE(review): presumably these are byte offsets into the media file; whether
// |end| is inclusive is not visible from this file -- confirm with the users
// of this message.
message Range {
  // Start position of the range.
  optional uint64 begin = 1;
  // End position of the range.
  optional uint64 end = 2;
}
// Media description exchanged between the Muxer and the classes that generate
// MPD files.
//
// Field numbers are wire identifiers. They are deliberately left untouched
// even where they do not follow declaration order (e.g. 13, 14 and 15 below);
// do not renumber them.
message MediaInfo {
  // Container format of the media. CONTAINER_UNKNOWN is the default.
  enum ContainerType {
    CONTAINER_UNKNOWN = 0;
    CONTAINER_MP4 = 1;
    CONTAINER_MPEG2_TS = 2;
    CONTAINER_WEBM = 3;
    CONTAINER_TEXT = 4;
  }

  // Properties of a video stream.
  message VideoInfo {
    // Codec of the video stream, as a string.
    optional string codec = 1;

    // The width and height in actual pixels. These differ from the visual
    // width and height when the sample aspect ratio (sar) is not 1:1.
    optional uint32 width = 2;
    optional uint32 height = 3;

    optional uint32 time_scale = 4;
    // Relative to |time_scale|. IOW |time_scale| / |frame_duration| is the
    // framerate.
    optional uint64 frame_duration = 5;
    optional bytes decoder_config = 6;

    // pixel_width:pixel_height is the sample aspect ratio (sar) of the video.
    // Note that (pixel_width * width):(pixel_height * height) is the picture
    // aspect ratio, or the @par attribute set on AdaptationSet element.
    optional uint32 pixel_width = 7;
    optional uint32 pixel_height = 8;

    // trick_play_rate: sample rate of the key frame from the original stream.
    // e.g., 1 means every key frame, 2 means every two key frames.
    optional uint32 trick_play_rate = 9;
    // playback_rate: the playout capability (e.g., 4x, 8x, 16x fast forward)
    // of the trick play stream.
    optional uint32 playback_rate = 10;
  }

  // Properties of an audio stream.
  message AudioInfo {
    // Codec of the audio stream, as a string.
    optional string codec = 1;
    // NOTE(review): presumably in Hz -- the unit is not stated in this file.
    optional uint32 sampling_frequency = 2;
    optional uint32 time_scale = 3;
    optional uint32 num_channels = 4;
    optional string language = 5;
    optional bytes decoder_config = 6;
    // Extra data that only applies to particular codecs; see
    // AudioCodecSpecificData.
    optional AudioCodecSpecificData codec_specific_data = 7;
  }

  // Codec-dependent audio parameters referenced from AudioInfo.
  message AudioCodecSpecificData {
    // EC3 Channel map bit fields, encoded based on ETSI TS 102 366 V1.3.1
    // Digital Audio Compression (AC-3, Enhanced AC-3) Standard E.1.3.1.8.
    optional uint32 ec3_channel_map = 1;
  }

  // Properties of a text stream.
  message TextInfo {
    // Kind of text track. UNKNOWN is the zero value.
    enum TextType {
      UNKNOWN = 0;
      CAPTION = 1;
      SUBTITLE = 2;
    }
    optional string format = 1;
    optional string language = 2;
    optional TextType type = 3;
  }

  // Encryption details for protected (encrypted) content.
  message ProtectedContent {
    // One DRM system's protection data.
    message ContentProtectionEntry {
      // Human readable UUID of the DRM.
      optional string uuid = 1;
      // Human readable DRM name and version string.
      // e.g. "My Content Protection v1.0"
      optional string name_version = 2;
      // The raw 'pssh' box for the media.
      optional bytes pssh = 3;
    }

    // The default key ID for the encrypted media.
    optional bytes default_key_id = 1;
    repeated ContentProtectionEntry content_protection_entry = 2;
    // Specifies the protection scheme: 'cenc', 'cens', 'cbc1', 'cbcs'.
    // "cbca" is also valid which is a place holder for SAMPLE-AES encryption.
    // Defaults to "cenc" when unset.
    optional string protection_scheme = 3 [default = "cenc"];
  }

  // TODO(rkuroiwa): Remove this. <ContentProtection> element that must be
  // added should be done by directly using the MpdBuilder interface.
  // Use this to specify ContentProtection elements that should be set in
  // the MPD, if ContentProtectionEntry is not sufficient.
  message ContentProtectionXml {
    // A single name/value pair for an XML attribute.
    message AttributeNameValuePair {
      optional string name = 1;
      optional string value = 2;
    }

    // An XML element with attributes and child elements. The message is
    // self-recursive through |subelements|, so nesting depth is limited only
    // by the protobuf parser's recursion limit.
    message Element {
      optional string name = 1;
      repeated AttributeNameValuePair attributes = 2;
      repeated Element subelements = 3;
    }

    // These two string fields are specified by the MPD spec. Just for
    // clarification, the string set in |value| is the rhs of the 'value'
    // field in <ContentProtection>.
    optional string scheme_id_uri = 1;
    optional string value = 2;
    repeated AttributeNameValuePair attributes = 3;
    repeated Element subelements = 4;
  }

  // NOTE(review): presumably maps to the MPD @bandwidth attribute (bits per
  // second) -- the unit is not stated in this file; confirm.
  optional uint32 bandwidth = 1;

  // Note that DASH IOP v3.0 explicitly mentions that a segment should only
  // have one {video, audio, text} track.
  optional VideoInfo video_info = 2;
  optional AudioInfo audio_info = 3;
  optional TextInfo text_info = 4;
  repeated ContentProtectionXml content_protections = 5;

  // This is set if the content is protected with a content protection,
  // i.e. encrypted.
  optional ProtectedContent protected_content = 15;

  // This is the reference time scale if there are multiple VideoInfo and/or
  // AudioInfo.
  optional uint32 reference_time_scale = 13;
  optional ContainerType container_type = 14 [default = CONTAINER_UNKNOWN];

  // VOD only.
  optional Range init_range = 6;
  optional Range index_range = 7;
  optional string media_file_name = 8;
  // END VOD only.

  // VOD and static LIVE.
  optional float media_duration_seconds = 9;

  // LIVE only.
  optional string init_segment_name = 10;
  optional string segment_template = 11;
  // This value is the user input "segment duration".
  // This value is not necessarily the same as the value passed to
  // MpdNotifier::NotifyNewSegment().
  optional float segment_duration_seconds = 12;
  // END LIVE only.
}