shaka-packager/packager/media/codecs/aac_audio_specific_config.h

// Copyright (c) 2012 The Chromium Authors. All rights reserved.
// Use of this source code is governed by a BSD-style license that can be
// found in the LICENSE file.

#ifndef PACKAGER_MEDIA_CODECS_AAC_AUDIO_SPECIFIC_CONFIG_H_
#define PACKAGER_MEDIA_CODECS_AAC_AUDIO_SPECIFIC_CONFIG_H_

#include <stddef.h>
#include <stdint.h>

#include <vector>

namespace shaka {
namespace media {

class BitReader;

// Methods are virtual for mocking.
/// This class parses the AAC information from decoder specific information
/// embedded in the @b esds box in an ISO BMFF file.
/// Please refer to ISO 14496 Part 3 Table 1.13 - Syntax of AudioSpecificConfig
/// for more details.
///
/// All member functions are only declared in this header; their definitions
/// live in the corresponding source file.
class AACAudioSpecificConfig {
 public:
  // Audio Object Types specified in ISO 14496-3 (2005), Table 1.3
  // The numeric values are spelled out explicitly. Note that 10, 11 and 18
  // have no enumerator here (presumably reserved in the specification --
  // TODO confirm against the standard).
  enum AudioObjectType {
    AOT_NULL             = 0,
    AOT_AAC_MAIN         = 1,   // Main
    AOT_AAC_LC           = 2,   // Low Complexity
    AOT_AAC_SSR          = 3,   // Scalable Sample Rate
    AOT_AAC_LTP          = 4,   // Long Term Prediction
    AOT_SBR              = 5,   // Spectral Band Replication
    AOT_AAC_SCALABLE     = 6,   // Scalable
    AOT_TWINVQ           = 7,   // Twin Vector Quantizer
    AOT_CELP             = 8,   // Code Excited Linear Prediction
    AOT_HVXC             = 9,   // Harmonic Vector eXcitation Coding
    AOT_TTSI             = 12,  // Text-To-Speech Interface
    AOT_MAINSYNTH        = 13,  // Main Synthesis
    AOT_WAVESYNTH        = 14,  // Wavetable Synthesis
    AOT_MIDI             = 15,  // General MIDI
    AOT_SAFX             = 16,  // Algorithmic Synthesis and Audio Effects
    AOT_ER_AAC_LC        = 17,  // Error Resilient Low Complexity
    AOT_ER_AAC_LTP       = 19,  // Error Resilient Long Term Prediction
    AOT_ER_AAC_SCALABLE  = 20,  // Error Resilient Scalable
    AOT_ER_TWINVQ        = 21,  // Error Resilient Twin Vector Quantizer
    AOT_ER_BSAC          = 22,  // Error Resilient Bit-Sliced Arithmetic Coding
    AOT_ER_AAC_LD        = 23,  // Error Resilient Low Delay
    AOT_ER_CELP          = 24,  // Error Resilient Code Excited Linear
                                // Prediction
    AOT_ER_HVXC          = 25,  // Error Resilient Harmonic Vector eXcitation
                                // Coding
    AOT_ER_HILN          = 26,  // Error Resilient Harmonic and Individual Lines
                                // plus Noise
    AOT_ER_PARAM         = 27,  // Error Resilient Parametric
    AOT_SSC              = 28,  // SinuSoidal Coding
    AOT_PS               = 29,  // Parametric Stereo
    AOT_SURROUND         = 30,  // MPEG Surround
    AOT_ESCAPE           = 31,  // Escape Value
    AOT_L1               = 32,  // Layer 1
    AOT_L2               = 33,  // Layer 2
    AOT_L3               = 34,  // Layer 3
    AOT_DST              = 35,  // Direct Stream Transfer
    AOT_ALS              = 36,  // Audio LosslesS
    AOT_SLS              = 37,  // Scalable LosslesS
    AOT_SLS_NON_CORE     = 38,  // Scalable LosslesS (non core)
    AOT_ER_AAC_ELD       = 39,  // Error Resilient Enhanced Low Delay
    AOT_SMR_SIMPLE       = 40,  // Symbolic Music Representation Simple
    AOT_SMR_MAIN         = 41,  // Symbolic Music Representation Main
    AOT_USAC_NOSBR       = 42,  // Unified Speech and Audio Coding (no SBR)
    AOT_SAOC             = 43,  // Spatial Audio Object Coding
    AOT_LD_SURROUND      = 44,  // Low Delay MPEG Surround
    AOT_USAC             = 45,  // Unified Speech and Audio Coding
  };

  // Every data member has an in-class default initializer (see the private
  // section), so a freshly constructed object starts with AOT_NULL, zeroed
  // numeric fields and both presence flags cleared unless the constructor
  // definition overrides them.
  AACAudioSpecificConfig();
  // Virtual because the class is meant to be subclassed by mocks.
  virtual ~AACAudioSpecificConfig();

  /// Parse the AAC config from decoder specific information embedded in an @b
  /// esds box. The function will parse the data and get the
  /// ElementaryStreamDescriptor, then it will parse the
  /// ElementaryStreamDescriptor to get audio stream configurations.
  /// @param data contains decoder specific information from an @b esds box.
  /// @return true if successful, false otherwise.
  virtual bool Parse(const std::vector<uint8_t>& data);

  /// Convert a raw AAC frame into an AAC frame with an ADTS header.
  /// @param[in,out] buffer contains the raw AAC frame on input, and the
  ///                converted frame on output if successful; it is untouched
  ///                on failure.
  /// @return true on success, false otherwise.
  virtual bool ConvertToADTS(std::vector<uint8_t>* buffer) const;

  /// @return The audio object type for this AAC config, with possible extension
  ///         considered.
  AudioObjectType GetAudioObjectType() const;

  /// @return Sample rate for the AAC stream, with possible extensions
  ///         considered.
  uint32_t GetSamplesPerSecond() const;

  /// @return Number of channels for the AAC stream, with possible extensions
  ///         considered.
  uint8_t GetNumChannels() const;

  /// Size in bytes of the ADTS header added by ConvertToADTS().
  static const size_t kADTSHeaderSize = 7;

  /// @return whether Spectral Band Replication (SBR) is present in the stream.
  bool sbr_present() const { return sbr_present_; }
  /// Indicate whether SBR is present in the stream.
  /// @param sbr_present is the new value stored in the SBR flag.
  void set_sbr_present(bool sbr_present) { sbr_present_ = sbr_present; }

 private:
  // Parsing helpers. Their definitions are not visible in this header; judging
  // by the names they advance past the corresponding configuration sections
  // without storing their contents -- TODO confirm in the source file.
  // Note that SkipErrorSpecificConfig() takes no BitReader, unlike the others.
  bool SkipDecoderGASpecificConfig(BitReader* bit_reader) const;
  bool SkipErrorSpecificConfig() const;
  bool SkipGASpecificConfig(BitReader* bit_reader) const;

  // The following variables store the AAC specific configuration information
  // that are used to generate the ADTS header.
  AudioObjectType audio_object_type_ = AOT_NULL;
  // Presumably the sampling frequency index as coded in the config, not a rate
  // in Hz -- TODO confirm.
  uint8_t frequency_index_ = 0;
  // Presumably the channel configuration code as coded in the config, which
  // may differ from the actual channel count -- TODO confirm.
  uint8_t channel_config_ = 0;
  // Is Spectral Band Replication (SBR) available?
  // Readable and writable from outside via sbr_present()/set_sbr_present().
  bool sbr_present_ = false;
  // Is Parametric Stereo available?
  // No public accessor for this flag is declared in this header.
  bool ps_present_ = false;

  // The following variables store audio configuration information.
  // They are based on the AAC specific configuration but can be overridden
  // by extensions in elementary stream descriptor.
  uint32_t frequency_ = 0;
  uint32_t extension_frequency_ = 0;
  uint8_t num_channels_ = 0;
};

}  // namespace media
}  // namespace shaka

#endif  // PACKAGER_MEDIA_CODECS_AAC_AUDIO_SPECIFIC_CONFIG_H_
Start with media/mp4, media/webm and base codes from Chromium. 2013-09-24 01:35:40 +00:00			`// Copyright (c) 2012 The Chromium Authors. All rights reserved.`
			`// Use of this source code is governed by a BSD-style license that can be`
			`// found in the LICENSE file.`

Clean up #ifndef in packager/media. (#310) 2017-12-20 00:56:36 +00:00			`#ifndef PACKAGER_MEDIA_CODECS_AAC_AUDIO_SPECIFIC_CONFIG_H_`
			`#define PACKAGER_MEDIA_CODECS_AAC_AUDIO_SPECIFIC_CONFIG_H_`
Start with media/mp4, media/webm and base codes from Chromium. 2013-09-24 01:35:40 +00:00
Clean up include files for int8_t,...int64_t Use <stdint.h> rather than "base/basictypes.h". This is a follow up to previous CL. Also get rid of ku?intxx(min\|max) and use std::numeric_limits as per base/basictypes.h, it is DEPRECATED too. The change was made using the below commands with some adjustments like include order etc: > find {media,app,mpd} -type f -exec sed -r -i 's/"base\/basictypes.h"/<stdint.h>/' {} \; > find {media,app,mpd} -type f -exec sed -r -i 's/k(u?int[0-9]+)(min\|max)/std::numeric_limits<\1_t>::\2\(\)/g' {} \; Change-Id: I6347723989c3d66e64ffcc54123b5c182b8c71b7 2014-09-30 23:52:58 +00:00			`#include <stddef.h>`
			`#include <stdint.h>`
Start with media/mp4, media/webm and base codes from Chromium. 2013-09-24 01:35:40 +00:00
Clean up include files for int8_t,...int64_t Use <stdint.h> rather than "base/basictypes.h". This is a follow up to previous CL. Also get rid of ku?intxx(min\|max) and use std::numeric_limits as per base/basictypes.h, it is DEPRECATED too. The change was made using the below commands with some adjustments like include order etc: > find {media,app,mpd} -type f -exec sed -r -i 's/"base\/basictypes.h"/<stdint.h>/' {} \; > find {media,app,mpd} -type f -exec sed -r -i 's/k(u?int[0-9]+)(min\|max)/std::numeric_limits<\1_t>::\2\(\)/g' {} \; Change-Id: I6347723989c3d66e64ffcc54123b5c182b8c71b7 2014-09-30 23:52:58 +00:00			`#include <vector>`
Start with media/mp4, media/webm and base codes from Chromium. 2013-09-24 01:35:40 +00:00
Rename top level namespace to shaka Issue #103 Change-Id: I67945c8ec6d2c178494d3b5400e5ec0170e9d115 2016-05-20 21:19:33 +00:00			`namespace shaka {`
Start with media/mp4, media/webm and base codes from Chromium. 2013-09-24 01:35:40 +00:00			`namespace media {`

			`class BitReader;`

Add PES packet related classes - Define PesPacket class. - PesPacketGenerator creates PesPackets from samples. Change-Id: Icfd3656b498e0075f83ff3c789f95658f98c6144 2016-03-16 19:10:12 +00:00			`// Methods are virtual for mocking.`
First draft doxygen documentation for media/mp4. Change-Id: I13a28245168724a237a4653e298d6b835c24f17b 2014-01-23 22:34:39 +00:00			`/// This class parses the AAC information from decoder specific information`
			`/// embedded in the @b esds box in an ISO BMFF file.`
			`/// Please refer to ISO 14496 Part 3 Table 1.13 - Syntax of AudioSpecificConfig`
			`/// for more details.`
Rename AAC to AACAudioSpecificConfig. Change-Id: Idda2db1f2cdde6c2c220830c2681bef209ad4ce2 2014-01-10 00:21:06 +00:00			`class AACAudioSpecificConfig {`
Start with media/mp4, media/webm and base codes from Chromium. 2013-09-24 01:35:40 +00:00			`public:`
Fix AAC-HE not correctly signaled in codec string - Also fixed a bug with dts audio in esds. Closes #225 Change-Id: I50ca731ac81bedfec37b0e2d577c51d643b7a839 2017-04-10 20:20:45 +00:00			`// Audio Object Types specified in ISO 14496-3 (2005), Table 1.3`
			`enum AudioObjectType {`
			`AOT_NULL = 0,`
			`AOT_AAC_MAIN = 1, // Main`
			`AOT_AAC_LC = 2, // Low Complexity`
			`AOT_AAC_SSR = 3, // Scalable Sample Rate`
			`AOT_AAC_LTP = 4, // Long Term Prediction`
			`AOT_SBR = 5, // Spectral Band Replication`
			`AOT_AAC_SCALABLE = 6, // Scalable`
			`AOT_TWINVQ = 7, // Twin Vector Quantizer`
			`AOT_CELP = 8, // Code Excited Linear Prediction`
			`AOT_HVXC = 9, // Harmonic Vector eXcitation Coding`
			`AOT_TTSI = 12, // Text-To-Speech Interface`
			`AOT_MAINSYNTH = 13, // Main Synthesis`
			`AOT_WAVESYNTH = 14, // Wavetable Synthesis`
			`AOT_MIDI = 15, // General MIDI`
			`AOT_SAFX = 16, // Algorithmic Synthesis and Audio Effects`
			`AOT_ER_AAC_LC = 17, // Error Resilient Low Complexity`
			`AOT_ER_AAC_LTP = 19, // Error Resilient Long Term Prediction`
			`AOT_ER_AAC_SCALABLE = 20, // Error Resilient Scalable`
			`AOT_ER_TWINVQ = 21, // Error Resilient Twin Vector Quantizer`
			`AOT_ER_BSAC = 22, // Error Resilient Bit-Sliced Arithmetic Coding`
			`AOT_ER_AAC_LD = 23, // Error Resilient Low Delay`
			`AOT_ER_CELP = 24, // Error Resilient Code Excited Linear`
			`// Prediction`
			`AOT_ER_HVXC = 25, // Error Resilient Harmonic Vector eXcitation`
			`// Coding`
			`AOT_ER_HILN = 26, // Error Resilient Harmonic and Individual Lines`
			`// plus Noise`
			`AOT_ER_PARAM = 27, // Error Resilient Parametric`
			`AOT_SSC = 28, // SinuSoidal Coding`
			`AOT_PS = 29, // Parametric Stereo`
			`AOT_SURROUND = 30, // MPEG Surround`
			`AOT_ESCAPE = 31, // Escape Value`
			`AOT_L1 = 32, // Layer 1`
			`AOT_L2 = 33, // Layer 2`
			`AOT_L3 = 34, // Layer 3`
			`AOT_DST = 35, // Direct Stream Transfer`
			`AOT_ALS = 36, // Audio LosslesS`
			`AOT_SLS = 37, // Scalable LosslesS`
			`AOT_SLS_NON_CORE = 38, // Scalable LosslesS (non core)`
			`AOT_ER_AAC_ELD = 39, // Error Resilient Enhanced Low Delay`
			`AOT_SMR_SIMPLE = 40, // Symbolic Music Representation Simple`
			`AOT_SMR_MAIN = 41, // Symbolic Music Representation Main`
			`AOT_USAC_NOSBR = 42, // Unified Speech and Audio Coding (no SBR)`
			`AOT_SAOC = 43, // Spatial Audio Object Coding`
			`AOT_LD_SURROUND = 44, // Low Delay MPEG Surround`
			`AOT_USAC = 45, // Unified Speech and Audio Coding`
			`};`

Rename AAC to AACAudioSpecificConfig. Change-Id: Idda2db1f2cdde6c2c220830c2681bef209ad4ce2 2014-01-10 00:21:06 +00:00			`AACAudioSpecificConfig();`
Add PES packet related classes - Define PesPacket class. - PesPacketGenerator creates PesPackets from samples. Change-Id: Icfd3656b498e0075f83ff3c789f95658f98c6144 2016-03-16 19:10:12 +00:00			`virtual ~AACAudioSpecificConfig();`
Start with media/mp4, media/webm and base codes from Chromium. 2013-09-24 01:35:40 +00:00
First draft doxygen documentation for media/mp4. Change-Id: I13a28245168724a237a4653e298d6b835c24f17b 2014-01-23 22:34:39 +00:00			`/// Parse the AAC config from decoder specific information embedded in an @b`
			`/// esds box. The function will parse the data and get the`
			`/// ElementaryStreamDescriptor, then it will parse the`
			`/// ElementaryStreamDescriptor to get audio stream configurations.`
			`/// @param data contains decoder specific information from an @b esds box.`
			`/// @return true if successful, false otherwise.`
Add PES packet related classes - Define PesPacket class. - PesPacketGenerator creates PesPackets from samples. Change-Id: Icfd3656b498e0075f83ff3c789f95658f98c6144 2016-03-16 19:10:12 +00:00			`virtual bool Parse(const std::vector<uint8_t>& data);`

			`/// Convert a raw AAC frame into an AAC frame with an ADTS header.`
			`/// @param[in,out] buffer contains the raw AAC frame on input, and the`
			`/// converted frame on output if successful; it is untouched`
			`/// on failure.`
			`/// @return true on success, false otherwise.`
			`virtual bool ConvertToADTS(std::vector<uint8_t>* buffer) const;`
Start with media/mp4, media/webm and base codes from Chromium. 2013-09-24 01:35:40 +00:00
Fix AAC-HE not correctly signaled in codec string - Also fixed a bug with dts audio in esds. Closes #225 Change-Id: I50ca731ac81bedfec37b0e2d577c51d643b7a839 2017-04-10 20:20:45 +00:00			`/// @return The audio object type for this AAC config, with possible extension`
			`/// considered.`
			`AudioObjectType GetAudioObjectType() const;`
Start with media/mp4, media/webm and base codes from Chromium. 2013-09-24 01:35:40 +00:00
Fix AAC-HE not correctly signaled in codec string - Also fixed a bug with dts audio in esds. Closes #225 Change-Id: I50ca731ac81bedfec37b0e2d577c51d643b7a839 2017-04-10 20:20:45 +00:00			`/// @return Sample rate for the AAC stream, with possible extensions`
			`/// considered.`
			`uint32_t GetSamplesPerSecond() const;`
Add duration, language, codec data to stream info. Change-Id: I83d221fd36adb53ccf5629c80b137ba0ec730d55 2013-10-14 20:55:48 +00:00
Fix AAC-HE not correctly signaled in codec string - Also fixed a bug with dts audio in esds. Closes #225 Change-Id: I50ca731ac81bedfec37b0e2d577c51d643b7a839 2017-04-10 20:20:45 +00:00			`/// @return Number of channels for the AAC stream, with possible extensions`
			`/// considered.`
			`uint8_t GetNumChannels() const;`
Add duration, language, codec data to stream info. Change-Id: I83d221fd36adb53ccf5629c80b137ba0ec730d55 2013-10-14 20:55:48 +00:00
First draft doxygen documentation for media/mp4. Change-Id: I13a28245168724a237a4653e298d6b835c24f17b 2014-01-23 22:34:39 +00:00			`/// Size in bytes of the ADTS header added by ConvertEsdsToADTS().`
Start with media/mp4, media/webm and base codes from Chromium. 2013-09-24 01:35:40 +00:00			`static const size_t kADTSHeaderSize = 7;`

Fix AAC-HE not correctly signaled in codec string - Also fixed a bug with dts audio in esds. Closes #225 Change-Id: I50ca731ac81bedfec37b0e2d577c51d643b7a839 2017-04-10 20:20:45 +00:00			`/// @return whether Spectral Band Replication (SBR) is present in the stream.`
			`bool sbr_present() const { return sbr_present_; }`
			`/// Indicate whether SBR is present in the stream.`
			`void set_sbr_present(bool sbr_present) { sbr_present_ = sbr_present; }`

Start with media/mp4, media/webm and base codes from Chromium. 2013-09-24 01:35:40 +00:00			`private:`
			`bool SkipDecoderGASpecificConfig(BitReader* bit_reader) const;`
			`bool SkipErrorSpecificConfig() const;`
			`bool SkipGASpecificConfig(BitReader* bit_reader) const;`

			`// The following variables store the AAC specific configuration information`
			`// that are used to generate the ADTS header.`
Fix AAC-HE not correctly signaled in codec string - Also fixed a bug with dts audio in esds. Closes #225 Change-Id: I50ca731ac81bedfec37b0e2d577c51d643b7a839 2017-04-10 20:20:45 +00:00			`AudioObjectType audio_object_type_ = AOT_NULL;`
			`uint8_t frequency_index_ = 0;`
			`uint8_t channel_config_ = 0;`
			`// Is Spectral Band Replication (SBR) available?`
			`bool sbr_present_ = false;`
			`// Is Parametric Stereo available?`
			`bool ps_present_ = false;`
Start with media/mp4, media/webm and base codes from Chromium. 2013-09-24 01:35:40 +00:00
Create MP4MediaParser and its dependents. Create new classes: StreamInfo, AudioStreamInfo, VideoStreamInfo, MediaParser, MediaSample, MP4MediaParser. Change-Id: I19c2fc73964d9f8fc90acaddd1783f4e6ff87d07 2013-09-24 04:17:12 +00:00			`// The following variables store audio configuration information.`
			`// They are based on the AAC specific configuration but can be overridden`
			`// by extensions in elementary stream descriptor.`
Fix AAC-HE not correctly signaled in codec string - Also fixed a bug with dts audio in esds. Closes #225 Change-Id: I50ca731ac81bedfec37b0e2d577c51d643b7a839 2017-04-10 20:20:45 +00:00			`uint32_t frequency_ = 0;`
			`uint32_t extension_frequency_ = 0;`
			`uint8_t num_channels_ = 0;`
Start with media/mp4, media/webm and base codes from Chromium. 2013-09-24 01:35:40 +00:00			`};`

			`} // namespace media`
Rename top level namespace to shaka Issue #103 Change-Id: I67945c8ec6d2c178494d3b5400e5ec0170e9d115 2016-05-20 21:19:33 +00:00			`} // namespace shaka`
Start with media/mp4, media/webm and base codes from Chromium. 2013-09-24 01:35:40 +00:00
Clean up #ifndef in packager/media. (#310) 2017-12-20 00:56:36 +00:00			`#endif // PACKAGER_MEDIA_CODECS_AAC_AUDIO_SPECIFIC_CONFIG_H_`