DASH Media Packaging SDK
 All Classes Namespaces Functions Variables Typedefs Enumerator
nalu_reader.h
1 // Copyright 2016 Google Inc. All rights reserved.
2 //
3 // Use of this source code is governed by a BSD-style
4 // license that can be found in the LICENSE file or at
5 // https://developers.google.com/open-source/licenses/bsd
6 
7 #ifndef MEDIA_FILTERS_NALU_READER_H_
8 #define MEDIA_FILTERS_NALU_READER_H_
9 
10 #include <stdint.h>
11 #include <stdlib.h>
12 
13 #include "packager/base/compiler_specific.h"
14 #include "packager/base/macros.h"
15 
16 namespace edash_packager {
17 namespace media {
18 
19 // Used as the |nal_length_size| argument to NaluReader to indicate to use
20 // AnnexB byte streams. An AnnexB byte stream starts with 3 or 4 byte start
21 // codes instead of a fixed size NAL unit length.
22 const uint8_t kIsAnnexbByteStream = 0;
23 
// Describes a single NAL unit (NALU): a non-owning pointer to its bytes, the
// sizes of its header and payload, and a few header-derived fields exposed
// through the accessors below. Instances are copyable by design (see the note
// at the end of the class).
26 class Nalu {
27  public:
    // NAL unit types for H.264.
    // NOTE(review): the values appear to follow nal_unit_type in the H.264
    // specification; the list is not exhaustive (e.g. 2-4 and 11 are absent)
    // -- confirm against the spec before relying on a missing value.
28  enum H264NaluType {
29  H264_Unspecified = 0,
30  H264_NonIDRSlice = 1,
31  H264_IDRSlice = 5,
32  H264_SEIMessage = 6,
33  H264_SPS = 7,
34  H264_PPS = 8,
35  H264_AUD = 9,
36  H264_EOSeq = 10,
37  H264_FillerData = 12,
38  H264_SPSExtension = 13,
39  H264_SubsetSPS = 15,
40  H264_Reserved17 = 17,
41  H264_Reserved18 = 18,
42  H264_CodedSliceExtension = 20,
43  H264_Reserved22 = 22,
44  };
    // NAL unit types for H.265.
    // NOTE(review): the values appear to follow nal_unit_type in the H.265
    // specification; only a subset is listed, and the RSV_* entries presumably
    // mark the ends of reserved ranges -- confirm against the spec.
45  enum H265NaluType {
46  H265_TRAIL_N = 0,
47  H265_TSA_N = 2,
48  H265_TSA_R = 3,
49  H265_STSA_N = 4,
50  H265_STSA_R = 5,
51  H265_RASL_R = 9,
52 
53  H265_RSV_VCL_N10 = 10,
54  H265_RSV_VCL_R15 = 15,
55 
56  H265_BLA_W_LP = 16,
57  H265_IDR_W_RADL = 19,
58  H265_IDR_N_LP = 20,
59  H265_CRA_NUT = 21,
60 
61  H265_RSV_IRAP_VCL22 = 22,
62  H265_RSV_IRAP_VCL23 = 23,
63  H265_RSV_VCL31 = 31,
64 
65  H265_VPS = 32,
66  H265_SPS = 33,
67  H265_PPS = 34,
68  H265_AUD = 35,
69 
70  H265_EOS = 36,
71  H265_EOB = 37,
72 
73  H265_RSV_NVCL41 = 41,
74  };
    // The codec whose NAL unit syntax applies. Passed to Initialize() and to
    // the NaluReader constructor.
75  enum CodecType {
76  kH264,
77  kH265,
78  };
79 
80  Nalu();
81 
    // Sets up this Nalu from |size| bytes starting at |data|, interpreted
    // according to |type|. The result must not be ignored (WARN_UNUSED_RESULT).
    // NOTE(review): presumably dispatches to InitializeFromH264() or
    // InitializeFromH265(), keeps |data| in |data_| without copying, and
    // returns false when the header cannot be parsed -- confirm in the .cc.
82  bool Initialize(CodecType type,
83  const uint8_t* data,
84  uint64_t size) WARN_UNUSED_RESULT;
85 
    // Pointer to the start of the NALU (its header); not owned by this object.
86  const uint8_t* data() const { return data_; }
    // Size of the NALU header, excluding any header extension data.
87  uint64_t header_size() const { return header_size_; }
    // Size of the data that follows the header.
88  uint64_t payload_size() const { return payload_size_; }
89 
90  // H.264 Specific:
91  int ref_idc() const { return ref_idc_; }
92 
93  // H.265 Specific:
94  int nuh_layer_id() const { return nuh_layer_id_; }
95  int nuh_temporal_id() const { return nuh_temporal_id_; }
96 
    // The NALU type as a plain int.
    // NOTE(review): presumably a value from H264NaluType or H265NaluType,
    // depending on the codec passed to Initialize() -- confirm.
97  int type() const { return type_; }
98  bool is_video_slice() const { return is_video_slice_; }
99 
100  private:
    // Codec-specific initialization helpers; defined outside this header.
101  bool InitializeFromH264(const uint8_t* data, uint64_t size);
102  bool InitializeFromH265(const uint8_t* data, uint64_t size);
103 
104  // A pointer to the NALU (i.e. points to the header). This pointer is not
105  // owned by this instance.
106  const uint8_t* data_;
107  // NALU header size (e.g. 1 byte for H.264). Note that it does not include
108  // header extension data in some NAL units.
109  uint64_t header_size_;
110  // Size of data after the header.
111  uint64_t payload_size_;
112 
    // Backing fields for the accessors of the same name above.
113  int ref_idc_;
114  int nuh_layer_id_;
115  int nuh_temporal_id_;
116  int type_;
117  bool is_video_slice_;
118 
119  // Don't use DISALLOW_COPY_AND_ASSIGN since it is just numbers and a pointer
120  // it does not own. This allows Nalus to be stored in a vector.
121 };
122 
// Reads NAL units one at a time from a byte buffer. The buffer is either an
// AnnexB byte stream (NALUs separated by 3 or 4 byte start codes) or a NAL
// unit stream (each NALU preceded by a fixed-size length); see Format below.
// Copying is disabled via DISALLOW_COPY_AND_ASSIGN.
126 class NaluReader {
127  public:
     // Outcome reported by Advance().
128  enum Result {
129  kOk,
130  kInvalidStream, // error in stream
131  kEOStream, // end of stream
132  };
133 
     // |type| is the codec of the stream. |nal_length_size| is the size in
     // bytes of the length that precedes each NALU, or kIsAnnexbByteStream to
     // read an AnnexB byte stream. |stream| and |stream_size| describe the
     // buffer to read.
     // NOTE(review): the buffer is presumably referenced rather than copied,
     // so it would have to outlive the reader -- confirm in nalu_reader.cc.
137  NaluReader(Nalu::CodecType type,
138  uint8_t nal_length_size,
139  const uint8_t* stream,
140  uint64_t stream_size);
141  ~NaluReader();
142 
143  // Find offset from start of data to next NALU start code
144  // and size of found start code (3 or 4 bytes).
145  // If no start code is found, offset is pointing to the first unprocessed byte
146  // (i.e. the first byte that was not considered as a possible start of a start
147  // code) and |*start_code_size| is set to 0.
148  // Postconditions:
149  // - |*offset| is between 0 and |data_size| included.
150  // It is strictly less than |data_size| if |data_size| > 0.
151  // - |*start_code_size| is either 0, 3 or 4.
     // NOTE(review): the return value is presumably true when a start code was
     // found and false otherwise -- confirm in nalu_reader.cc.
152  static bool FindStartCode(const uint8_t* data,
153  uint64_t data_size,
154  uint64_t* offset,
155  uint8_t* start_code_size);
156 
     // NOTE(review): presumably reads the next NALU from the stream into
     // |*nalu| and moves past it, returning kOk on success, kEOStream when no
     // data remains and kInvalidStream on a malformed stream -- confirm in
     // nalu_reader.cc.
162  Result Advance(Nalu* nalu);
163 
     // NOTE(review): presumably reports whether the remaining stream begins
     // with an AnnexB start code -- confirm in nalu_reader.cc.
165  bool StartsWithStartCode();
166 
167  private:
     // How NALU boundaries are marked in the stream: by start codes
     // (kAnnexbByteStreamFormat) or by a length before each NALU
     // (kNalUnitStreamFormat).
168  enum Format {
169  kAnnexbByteStreamFormat,
170  kNalUnitStreamFormat
171  };
172 
173  // Move the stream pointer to the beginning of the next NALU,
174  // i.e. pointing at the next start code.
175  // Return true if a NALU has been found.
176  // If a NALU is found:
177  // - its size in bytes is returned in |*nalu_size| and includes
178  // the start code as well as the trailing zero bits.
179  // - the size in bytes of the start code is returned in |*start_code_size|.
180  bool LocateNaluByStartCode(uint64_t* nalu_size, uint8_t* start_code_size);
181 
182  // Pointer to the current NALU in the stream.
183  const uint8_t* stream_;
184  // The remaining size of the stream.
185  uint64_t stream_size_;
186  // The codec (Nalu::CodecType) of the NALUs being read.
187  Nalu::CodecType nalu_type_;
188  // The size in bytes of each NALU's length prefix; only valid if format is
189  // kNalUnitStreamFormat.
190  uint8_t nalu_length_size_;
191  // The format of the stream.
192  Format format_;
193 
194  DISALLOW_COPY_AND_ASSIGN(NaluReader);
195 };
196 
197 } // namespace media
198 } // namespace edash_packager
199 
200 #endif // MEDIA_FILTERS_NALU_READER_H_
NaluReader(Nalu::CodecType type, uint8_t nal_length_size, const uint8_t *stream, uint64_t stream_size)
Definition: nalu_reader.cc:156