Home | History | Annotate | Download | only in include
      1 /* -----------------------------------------------------------------------------
      2 Software License for The Fraunhofer FDK AAC Codec Library for Android
      3 
      4 © Copyright  1995 - 2018 Fraunhofer-Gesellschaft zur Förderung der angewandten
      5 Forschung e.V. All rights reserved.
      6 
      7  1.    INTRODUCTION
      8 The Fraunhofer FDK AAC Codec Library for Android ("FDK AAC Codec") is software
      9 that implements the MPEG Advanced Audio Coding ("AAC") encoding and decoding
     10 scheme for digital audio. This FDK AAC Codec software is intended to be used on
     11 a wide variety of Android devices.
     12 
     13 AAC's HE-AAC and HE-AAC v2 versions are regarded as today's most efficient
     14 general perceptual audio codecs. AAC-ELD is considered the best-performing
     15 full-bandwidth communications codec by independent studies and is widely
     16 deployed. AAC has been standardized by ISO and IEC as part of the MPEG
     17 specifications.
     18 
     19 Patent licenses for necessary patent claims for the FDK AAC Codec (including
     20 those of Fraunhofer) may be obtained through Via Licensing
     21 (www.vialicensing.com) or through the respective patent owners individually for
     22 the purpose of encoding or decoding bit streams in products that are compliant
     23 with the ISO/IEC MPEG audio standards. Please note that most manufacturers of
     24 Android devices already license these patent claims through Via Licensing or
     25 directly from the patent owners, and therefore FDK AAC Codec software may
     26 already be covered under those patent licenses when it is used for those
     27 licensed purposes only.
     28 
     29 Commercially-licensed AAC software libraries, including floating-point versions
     30 with enhanced sound quality, are also available from Fraunhofer. Users are
     31 encouraged to check the Fraunhofer website for additional applications
     32 information and documentation.
     33 
     34 2.    COPYRIGHT LICENSE
     35 
     36 Redistribution and use in source and binary forms, with or without modification,
     37 are permitted without payment of copyright license fees provided that you
     38 satisfy the following conditions:
     39 
     40 You must retain the complete text of this software license in redistributions of
     41 the FDK AAC Codec or your modifications thereto in source code form.
     42 
     43 You must retain the complete text of this software license in the documentation
     44 and/or other materials provided with redistributions of the FDK AAC Codec or
     45 your modifications thereto in binary form. You must make available free of
     46 charge copies of the complete source code of the FDK AAC Codec and your
     47 modifications thereto to recipients of copies in binary form.
     48 
     49 The name of Fraunhofer may not be used to endorse or promote products derived
     50 from this library without prior written permission.
     51 
     52 You may not charge copyright license fees for anyone to use, copy or distribute
     53 the FDK AAC Codec software or your modifications thereto.
     54 
     55 Your modified versions of the FDK AAC Codec must carry prominent notices stating
     56 that you changed the software and the date of any change. For modified versions
     57 of the FDK AAC Codec, the term "Fraunhofer FDK AAC Codec Library for Android"
     58 must be replaced by the term "Third-Party Modified Version of the Fraunhofer FDK
     59 AAC Codec Library for Android."
     60 
     61 3.    NO PATENT LICENSE
     62 
     63 NO EXPRESS OR IMPLIED LICENSES TO ANY PATENT CLAIMS, including without
     64 limitation the patents of Fraunhofer, ARE GRANTED BY THIS SOFTWARE LICENSE.
     65 Fraunhofer provides no warranty of patent non-infringement with respect to this
     66 software.
     67 
     68 You may use this FDK AAC Codec software or modifications thereto only for
     69 purposes that are authorized by appropriate patent licenses.
     70 
     71 4.    DISCLAIMER
     72 
     73 This FDK AAC Codec software is provided by Fraunhofer on behalf of the copyright
     74 holders and contributors "AS IS" and WITHOUT ANY EXPRESS OR IMPLIED WARRANTIES,
     75 including but not limited to the implied warranties of merchantability and
     76 fitness for a particular purpose. IN NO EVENT SHALL THE COPYRIGHT HOLDER OR
     77 CONTRIBUTORS BE LIABLE for any direct, indirect, incidental, special, exemplary,
     78 or consequential damages, including but not limited to procurement of substitute
     79 goods or services; loss of use, data, or profits, or business interruption,
     80 however caused and on any theory of liability, whether in contract, strict
     81 liability, or tort (including negligence), arising in any way out of the use of
     82 this software, even if advised of the possibility of such damage.
     83 
     84 5.    CONTACT INFORMATION
     85 
     86 Fraunhofer Institute for Integrated Circuits IIS
     87 Attention: Audio and Multimedia Departments - FDK AAC LL
     88 Am Wolfsmantel 33
     89 91058 Erlangen, Germany
     90 
     91 www.iis.fraunhofer.de/amm
     92 amm-info (at) iis.fraunhofer.de
     93 ----------------------------------------------------------------------------- */
     94 
     95 /************************* System integration library **************************
     96 
     97    Author(s):   Manuel Jander
     98 
     99    Description:
    100 
    101 *******************************************************************************/
    102 
    103 /** \file   FDK_audio.h
    104  *  \brief  Global audio struct and constant definitions.
    105  */
    106 
    107 #ifndef FDK_AUDIO_H
    108 #define FDK_AUDIO_H
    109 
    110 #include "machine_type.h"
    111 #include "genericStds.h"
    112 #include "syslib_channelMapDescr.h"
    113 
    114 #ifdef __cplusplus
    115 extern "C" {
    116 #endif
    117 
    118 /**
    119  * File format identifiers.
    120  */
    121 typedef enum {
    122   FF_UNKNOWN = -1, /**< Unknown format.        */
    123   FF_RAW = 0,      /**< No container, bit stream data conveyed "as is". */
    124 
    125   FF_MP4_3GPP = 3, /**< 3GPP file format.      */
    126   FF_MP4_MP4F = 4, /**< MPEG-4 File format.     */
    127 
    128   FF_RAWPACKETS = 5 /**< Proprietary raw packet file. */
    129 
    130 } FILE_FORMAT;
    131 
    132 /**
    133  * Transport type identifiers.
    134  */
    135 typedef enum {
    136   TT_UNKNOWN = -1, /**< Unknown format.            */
    137   TT_MP4_RAW = 0,  /**< "as is" access units (packet based since there is
    138                       obviously no sync layer) */
    139   TT_MP4_ADIF = 1, /**< ADIF bitstream format.     */
    140   TT_MP4_ADTS = 2, /**< ADTS bitstream format.     */
    141 
    142   TT_MP4_LATM_MCP1 = 6, /**< Audio Mux Elements with muxConfigPresent = 1 */
    143   TT_MP4_LATM_MCP0 = 7, /**< Audio Mux Elements with muxConfigPresent = 0, out
    144                            of band StreamMuxConfig */
    145 
    146   TT_MP4_LOAS = 10, /**< Audio Sync Stream.         */
    147 
    148   TT_DRM = 12 /**< Digital Radio Mondial (DRM30/DRM+) bitstream format. */
    149 
    150 } TRANSPORT_TYPE;
    151 
    152 #define TT_IS_PACKET(x)                                                   \
    153   (((x) == TT_MP4_RAW) || ((x) == TT_DRM) || ((x) == TT_MP4_LATM_MCP0) || \
    154    ((x) == TT_MP4_LATM_MCP1))
    155 
    156 /**
    157  * Audio Object Type definitions.
    158  */
    159 typedef enum {
    160   AOT_NONE = -1,
    161   AOT_NULL_OBJECT = 0,
    162   AOT_AAC_MAIN = 1, /**< Main profile                              */
    163   AOT_AAC_LC = 2,   /**< Low Complexity object                     */
    164   AOT_AAC_SSR = 3,
    165   AOT_AAC_LTP = 4,
    166   AOT_SBR = 5,
    167   AOT_AAC_SCAL = 6,
    168   AOT_TWIN_VQ = 7,
    169   AOT_CELP = 8,
    170   AOT_HVXC = 9,
    171   AOT_RSVD_10 = 10,          /**< (reserved)                                */
    172   AOT_RSVD_11 = 11,          /**< (reserved)                                */
    173   AOT_TTSI = 12,             /**< TTSI Object                               */
    174   AOT_MAIN_SYNTH = 13,       /**< Main Synthetic object                     */
    175   AOT_WAV_TAB_SYNTH = 14,    /**< Wavetable Synthesis object                */
    176   AOT_GEN_MIDI = 15,         /**< General MIDI object                       */
    177   AOT_ALG_SYNTH_AUD_FX = 16, /**< Algorithmic Synthesis and Audio FX object */
    178   AOT_ER_AAC_LC = 17,        /**< Error Resilient(ER) AAC Low Complexity    */
    179   AOT_RSVD_18 = 18,          /**< (reserved)                                */
    180   AOT_ER_AAC_LTP = 19,       /**< Error Resilient(ER) AAC LTP object        */
    181   AOT_ER_AAC_SCAL = 20,      /**< Error Resilient(ER) AAC Scalable object   */
    182   AOT_ER_TWIN_VQ = 21,       /**< Error Resilient(ER) TwinVQ object         */
    183   AOT_ER_BSAC = 22,          /**< Error Resilient(ER) BSAC object           */
    184   AOT_ER_AAC_LD = 23,        /**< Error Resilient(ER) AAC LowDelay object   */
    185   AOT_ER_CELP = 24,          /**< Error Resilient(ER) CELP object           */
    186   AOT_ER_HVXC = 25,          /**< Error Resilient(ER) HVXC object           */
    187   AOT_ER_HILN = 26,          /**< Error Resilient(ER) HILN object           */
    188   AOT_ER_PARA = 27,          /**< Error Resilient(ER) Parametric object     */
    189   AOT_RSVD_28 = 28,          /**< might become SSC                          */
    190   AOT_PS = 29,               /**< PS, Parametric Stereo (includes SBR)      */
    191   AOT_MPEGS = 30,            /**< MPEG Surround                             */
    192 
    193   AOT_ESCAPE = 31, /**< Signal AOT uses more than 5 bits          */
    194 
    195   AOT_MP3ONMP4_L1 = 32, /**< MPEG-Layer1 in mp4                        */
    196   AOT_MP3ONMP4_L2 = 33, /**< MPEG-Layer2 in mp4                        */
    197   AOT_MP3ONMP4_L3 = 34, /**< MPEG-Layer3 in mp4                        */
    198   AOT_RSVD_35 = 35,     /**< might become DST                          */
    199   AOT_RSVD_36 = 36,     /**< might become ALS                          */
    200   AOT_AAC_SLS = 37,     /**< AAC + SLS                                 */
    201   AOT_SLS = 38,         /**< SLS                                       */
    202   AOT_ER_AAC_ELD = 39,  /**< AAC Enhanced Low Delay                    */
    203 
    204   AOT_USAC = 42,     /**< USAC                                      */
    205   AOT_SAOC = 43,     /**< SAOC                                      */
    206   AOT_LD_MPEGS = 44, /**< Low Delay MPEG Surround                   */
    207 
    208   /* Pseudo AOTs */
    209   AOT_MP2_AAC_LC = 129, /**< Virtual AOT MP2 Low Complexity profile */
    210   AOT_MP2_SBR = 132, /**< Virtual AOT MP2 Low Complexity Profile with SBR    */
    211 
    212   AOT_DRM_AAC = 143, /**< Virtual AOT for DRM (ER-AAC-SCAL without SBR) */
    213   AOT_DRM_SBR = 144, /**< Virtual AOT for DRM (ER-AAC-SCAL with SBR) */
    214   AOT_DRM_MPEG_PS =
    215       145, /**< Virtual AOT for DRM (ER-AAC-SCAL with SBR and MPEG-PS) */
    216   AOT_DRM_SURROUND =
    217       146, /**< Virtual AOT for DRM Surround (ER-AAC-SCAL (+SBR) +MPS) */
    218   AOT_DRM_USAC = 147 /**< Virtual AOT for DRM with USAC */
    219 
    220 } AUDIO_OBJECT_TYPE;
    221 
    222 #define CAN_DO_PS(aot)                                           \
    223   ((aot) == AOT_AAC_LC || (aot) == AOT_SBR || (aot) == AOT_PS || \
    224    (aot) == AOT_ER_BSAC || (aot) == AOT_DRM_AAC)
    225 
    226 #define IS_USAC(aot) ((aot) == AOT_USAC)
    227 
    228 #define IS_LOWDELAY(aot) ((aot) == AOT_ER_AAC_LD || (aot) == AOT_ER_AAC_ELD)
    229 
    230 /** Channel Mode ( 1-7 equals MPEG channel configurations, others are
    231  * arbitrary). */
    232 typedef enum {
    233   MODE_INVALID = -1,
    234   MODE_UNKNOWN = 0,
    235   MODE_1 = 1,         /**< C */
    236   MODE_2 = 2,         /**< L+R */
    237   MODE_1_2 = 3,       /**< C, L+R */
    238   MODE_1_2_1 = 4,     /**< C, L+R, Rear */
    239   MODE_1_2_2 = 5,     /**< C, L+R, LS+RS */
    240   MODE_1_2_2_1 = 6,   /**< C, L+R, LS+RS, LFE */
    241   MODE_1_2_2_2_1 = 7, /**< C, LC+RC, L+R, LS+RS, LFE */
    242 
    243   MODE_6_1 = 11,           /**< C, L+R, LS+RS, Crear, LFE */
    244   MODE_7_1_BACK = 12,      /**< C, L+R, LS+RS, Lrear+Rrear, LFE */
    245   MODE_7_1_TOP_FRONT = 14, /**< C, L+R, LS+RS, LFE, Ltop+Rtop */
    246 
    247   MODE_7_1_REAR_SURROUND = 33, /**< C, L+R, LS+RS, Lrear+Rrear, LFE */
    248   MODE_7_1_FRONT_CENTER = 34,  /**< C, LC+RC, L+R, LS+RS, LFE */
    249 
    250   MODE_212 = 128 /**< 212 configuration, used in ELDv2 */
    251 
    252 } CHANNEL_MODE;
    253 
    254 /**
    255  * Speaker description tags.
    256  * Do not change the enumeration values unless it keeps the following
    257  * segmentation:
    258  * - Bit 0-3: Horizontal postion (0: none, 1: front, 2: side, 3: back, 4: lfe)
    259  * - Bit 4-7: Vertical position (0: normal, 1: top, 2: bottom)
    260  */
    261 typedef enum {
    262   ACT_NONE = 0x00,
    263   ACT_FRONT = 0x01, /*!< Front speaker position (at normal height) */
    264   ACT_SIDE = 0x02,  /*!< Side speaker position (at normal height) */
    265   ACT_BACK = 0x03,  /*!< Back speaker position (at normal height) */
    266   ACT_LFE = 0x04,   /*!< Low frequency effect speaker postion (front) */
    267 
    268   ACT_TOP =
    269       0x10, /*!< Top speaker area (for combination with speaker positions) */
    270   ACT_FRONT_TOP = 0x11, /*!< Top front speaker = (ACT_FRONT|ACT_TOP) */
    271   ACT_SIDE_TOP = 0x12,  /*!< Top side speaker  = (ACT_SIDE |ACT_TOP) */
    272   ACT_BACK_TOP = 0x13,  /*!< Top back speaker  = (ACT_BACK |ACT_TOP) */
    273 
    274   ACT_BOTTOM =
    275       0x20, /*!< Bottom speaker area (for combination with speaker positions) */
    276   ACT_FRONT_BOTTOM = 0x21, /*!< Bottom front speaker = (ACT_FRONT|ACT_BOTTOM) */
    277   ACT_SIDE_BOTTOM = 0x22,  /*!< Bottom side speaker  = (ACT_SIDE |ACT_BOTTOM) */
    278   ACT_BACK_BOTTOM = 0x23   /*!< Bottom back speaker  = (ACT_BACK |ACT_BOTTOM) */
    279 
    280 } AUDIO_CHANNEL_TYPE;
    281 
    282 typedef enum {
    283   SIG_UNKNOWN = -1,
    284   SIG_IMPLICIT = 0,
    285   SIG_EXPLICIT_BW_COMPATIBLE = 1,
    286   SIG_EXPLICIT_HIERARCHICAL = 2
    287 
    288 } SBR_PS_SIGNALING;
    289 
    290 /**
    291  * Audio Codec flags.
    292  */
    293 #define AC_ER_VCB11                                                           \
    294   0x000001 /*!< aacSectionDataResilienceFlag     flag (from ASC): 1 means use \
    295               virtual codebooks  */
    296 #define AC_ER_RVLC                                                             \
    297   0x000002 /*!< aacSpectralDataResilienceFlag     flag (from ASC): 1 means use \
    298               huffman codeword reordering */
    299 #define AC_ER_HCR                                                             \
    300   0x000004 /*!< aacSectionDataResilienceFlag     flag (from ASC): 1 means use \
    301               virtual codebooks  */
    302 #define AC_SCALABLE 0x000008    /*!< AAC Scalable*/
    303 #define AC_ELD 0x000010         /*!< AAC-ELD */
    304 #define AC_LD 0x000020          /*!< AAC-LD */
    305 #define AC_ER 0x000040          /*!< ER syntax */
    306 #define AC_BSAC 0x000080        /*!< BSAC */
    307 #define AC_USAC 0x000100        /*!< USAC */
    308 #define AC_RSV603DA 0x000200    /*!< RSVD60 3D audio */
    309 #define AC_HDAAC 0x000400       /*!< HD-AAC */
    310 #define AC_RSVD50 0x004000      /*!< Rsvd50 */
    311 #define AC_SBR_PRESENT 0x008000 /*!< SBR present flag (from ASC) */
    312 #define AC_SBRCRC \
    313   0x010000 /*!< SBR CRC present flag. Only relevant for AAC-ELD for now. */
    314 #define AC_PS_PRESENT 0x020000 /*!< PS present flag (from ASC or implicit)  */
    315 #define AC_MPS_PRESENT                                                     \
    316   0x040000                    /*!< MPS present flag (from ASC or implicit) \
    317                                */
    318 #define AC_DRM 0x080000       /*!< DRM bit stream syntax */
    319 #define AC_INDEP 0x100000     /*!< Independency flag */
    320 #define AC_MPEGD_RES 0x200000 /*!< MPEG-D residual individual channel data. */
    321 #define AC_SAOC_PRESENT 0x400000   /*!< SAOC Present Flag */
    322 #define AC_DAB 0x800000            /*!< DAB bit stream syntax */
    323 #define AC_ELD_DOWNSCALE 0x1000000 /*!< ELD Downscaled playout */
    324 #define AC_LD_MPS 0x2000000        /*!< Low Delay MPS. */
    325 #define AC_DRC_PRESENT                                   \
    326   0x4000000 /*!< Dynamic Range Control (DRC) data found. \
    327              */
    328 #define AC_USAC_SCFGI3 \
    329   0x8000000 /*!< USAC flag: If stereoConfigIndex is 3 the flag is set. */
    330 /**
    331  * Audio Codec flags (reconfiguration).
    332  */
    333 #define AC_CM_DET_CFG_CHANGE                                                 \
    334   0x000001 /*!< Config mode signalizes the callback to work in config change \
    335               detection mode */
    336 #define AC_CM_ALLOC_MEM                                               \
    337   0x000002 /*!< Config mode signalizes the callback to work in memory \
    338               allocation mode */
    339 
    340 /**
    341  * Audio Codec flags (element specific).
    342  */
    343 #define AC_EL_USAC_TW 0x000001    /*!< USAC time warped filter bank is active */
    344 #define AC_EL_USAC_NOISE 0x000002 /*!< USAC noise filling is active */
    345 #define AC_EL_USAC_ITES 0x000004  /*!< USAC SBR inter-TES tool is active */
    346 #define AC_EL_USAC_PVC \
    347   0x000008 /*!< USAC SBR predictive vector coding tool is active */
    348 #define AC_EL_USAC_MPS212 0x000010 /*!< USAC MPS212 tool is active */
    349 #define AC_EL_USAC_LFE 0x000020    /*!< USAC element is LFE */
    350 #define AC_EL_USAC_CP_POSSIBLE                                                 \
    351   0x000040 /*!< USAC may use Complex Stereo Prediction in this channel element \
    352             */
    353 #define AC_EL_ENHANCED_NOISE 0x000080   /*!< Enhanced noise filling*/
    354 #define AC_EL_IGF_AFTER_TNS 0x000100    /*!< IGF after TNS */
    355 #define AC_EL_IGF_INDEP_TILING 0x000200 /*!< IGF independent tiling */
    356 #define AC_EL_IGF_USE_ENF 0x000400      /*!< IGF use enhanced noise filling */
    357 #define AC_EL_FULLBANDLPD 0x000800      /*!< enable fullband LPD tools */
    358 #define AC_EL_LPDSTEREOIDX 0x001000     /*!< LPD-stereo-tool stereo index */
    359 #define AC_EL_LFE 0x002000              /*!< The element is of type LFE. */
    360 
    361 /* CODER_CONFIG::flags */
    362 #define CC_MPEG_ID 0x00100000
    363 #define CC_IS_BASELAYER 0x00200000
    364 #define CC_PROTECTION 0x00400000
    365 #define CC_SBR 0x00800000
    366 #define CC_SBRCRC 0x00010000
    367 #define CC_SAC 0x00020000
    368 #define CC_RVLC 0x01000000
    369 #define CC_VCB11 0x02000000
    370 #define CC_HCR 0x04000000
    371 #define CC_PSEUDO_SURROUND 0x08000000
    372 #define CC_USAC_NOISE 0x10000000
    373 #define CC_USAC_TW 0x20000000
    374 #define CC_USAC_HBE 0x40000000
    375 
    376 /** Generic audio coder configuration structure. */
    377 typedef struct {
    378   AUDIO_OBJECT_TYPE aot;     /**< Audio Object Type (AOT).           */
    379   AUDIO_OBJECT_TYPE extAOT;  /**< Extension Audio Object Type (SBR). */
    380   CHANNEL_MODE channelMode;  /**< Channel mode.                      */
    381   UCHAR channelConfigZero;   /**< Use channel config zero + pce although a
    382                                 standard channel config could be signaled. */
    383   INT samplingRate;          /**< Sampling rate.                     */
    384   INT extSamplingRate;       /**< Extended samplerate (SBR).         */
    385   INT downscaleSamplingRate; /**< Downscale sampling rate (ELD downscaled mode)
    386                               */
    387   INT bitRate;               /**< Average bitrate.                   */
    388   int samplesPerFrame; /**< Number of PCM samples per codec frame and audio
    389                           channel. */
    390   int noChannels;      /**< Number of audio channels.          */
    391   int bitsFrame;
    392   int nSubFrames; /**< Amount of encoder subframes. 1 means no subframing. */
    393   int BSACnumOfSubFrame; /**< The number of the sub-frames which are grouped and
    394                             transmitted in a super-frame (BSAC). */
    395   int BSAClayerLength; /**< The average length of the large-step layers in bytes
    396                           (BSAC).                            */
    397   UINT flags;          /**< flags */
    398   UCHAR matrixMixdownA; /**< Matrix mixdown index to put into PCE. Default value
    399                            0 means no mixdown coefficient, valid values are 1-4
    400                            which correspond to matrix_mixdown_idx 0-3. */
    401   UCHAR headerPeriod;   /**< Frame period for sending in band configuration
    402                            buffers in the transport layer. */
    403 
    404   UCHAR stereoConfigIndex;       /**< USAC MPS stereo mode */
    405   UCHAR sbrMode;                 /**< USAC SBR mode */
    406   SBR_PS_SIGNALING sbrSignaling; /**< 0: implicit signaling, 1: backwards
    407                                     compatible explicit signaling, 2:
    408                                     hierarcical explicit signaling */
    409 
    410   UCHAR rawConfig[64]; /**< raw codec specific config as bit stream */
    411   int rawConfigBits;   /**< Size of rawConfig in bits */
    412 
    413   UCHAR sbrPresent;
    414   UCHAR psPresent;
    415 } CODER_CONFIG;
    416 
    417 #define USAC_ID_BIT 16 /** USAC element IDs start at USAC_ID_BIT */
    418 
    419 /** MP4 Element IDs. */
    420 typedef enum {
    421   /* mp4 element IDs */
    422   ID_NONE = -1, /**< Invalid Element helper ID.             */
    423   ID_SCE = 0,   /**< Single Channel Element.                */
    424   ID_CPE = 1,   /**< Channel Pair Element.                  */
    425   ID_CCE = 2,   /**< Coupling Channel Element.              */
    426   ID_LFE = 3,   /**< LFE Channel Element.                   */
    427   ID_DSE = 4,   /**< Currently one Data Stream Element for ancillary data is
    428                    supported. */
    429   ID_PCE = 5,   /**< Program Config Element.                */
    430   ID_FIL = 6,   /**< Fill Element.                          */
    431   ID_END = 7,   /**< Arnie (End Element = Terminator).      */
    432   ID_EXT = 8,   /**< Extension Payload (ER only).           */
    433   ID_SCAL = 9,  /**< AAC scalable element (ER only).        */
    434   /* USAC element IDs */
    435   ID_USAC_SCE = 0 + USAC_ID_BIT, /**< Single Channel Element.                */
    436   ID_USAC_CPE = 1 + USAC_ID_BIT, /**< Channel Pair Element.                  */
    437   ID_USAC_LFE = 2 + USAC_ID_BIT, /**< LFE Channel Element.                   */
    438   ID_USAC_EXT = 3 + USAC_ID_BIT, /**< Extension Element.                     */
    439   ID_USAC_END = 4 + USAC_ID_BIT, /**< Arnie (End Element = Terminator).      */
    440   ID_LAST
    441 } MP4_ELEMENT_ID;
    442 
    443 /* usacConfigExtType q.v. ISO/IEC DIS 23008-3 Table 52  and  ISO/IEC FDIS
    444  * 23003-3:2011(E) Table 74*/
    445 typedef enum {
    446   /* USAC and RSVD60 3DA */
    447   ID_CONFIG_EXT_FILL = 0,
    448   /* RSVD60 3DA */
    449   ID_CONFIG_EXT_DOWNMIX = 1,
    450   ID_CONFIG_EXT_LOUDNESS_INFO = 2,
    451   ID_CONFIG_EXT_AUDIOSCENE_INFO = 3,
    452   ID_CONFIG_EXT_HOA_MATRIX = 4,
    453   ID_CONFIG_EXT_SIG_GROUP_INFO = 6
    454   /* 5-127 => reserved for ISO use */
    455   /* > 128 => reserved for use outside of ISO scope */
    456 } CONFIG_EXT_ID;
    457 
    458 #define IS_CHANNEL_ELEMENT(elementId)                                         \
    459   ((elementId) == ID_SCE || (elementId) == ID_CPE || (elementId) == ID_LFE || \
    460    (elementId) == ID_USAC_SCE || (elementId) == ID_USAC_CPE ||                \
    461    (elementId) == ID_USAC_LFE)
    462 
    463 #define IS_MP4_CHANNEL_ELEMENT(elementId) \
    464   ((elementId) == ID_SCE || (elementId) == ID_CPE || (elementId) == ID_LFE)
    465 
    466 #define EXT_ID_BITS 4 /**< Size in bits of extension payload type tags. */
    467 
    468 /** Extension payload types. */
    469 typedef enum {
    470   EXT_FIL = 0x00,
    471   EXT_FILL_DATA = 0x01,
    472   EXT_DATA_ELEMENT = 0x02,
    473   EXT_DATA_LENGTH = 0x03,
    474   EXT_UNI_DRC = 0x04,
    475   EXT_LDSAC_DATA = 0x09,
    476   EXT_SAOC_DATA = 0x0a,
    477   EXT_DYNAMIC_RANGE = 0x0b,
    478   EXT_SAC_DATA = 0x0c,
    479   EXT_SBR_DATA = 0x0d,
    480   EXT_SBR_DATA_CRC = 0x0e
    481 } EXT_PAYLOAD_TYPE;
    482 
    483 #define IS_USAC_CHANNEL_ELEMENT(elementId)                     \
    484   ((elementId) == ID_USAC_SCE || (elementId) == ID_USAC_CPE || \
    485    (elementId) == ID_USAC_LFE)
    486 
    487 /** MPEG-D USAC & RSVD60 3D audio Extension Element Types. */
    488 typedef enum {
    489   /* usac */
    490   ID_EXT_ELE_FILL = 0x00,
    491   ID_EXT_ELE_MPEGS = 0x01,
    492   ID_EXT_ELE_SAOC = 0x02,
    493   ID_EXT_ELE_AUDIOPREROLL = 0x03,
    494   ID_EXT_ELE_UNI_DRC = 0x04,
    495   /* rsv603da */
    496   ID_EXT_ELE_OBJ_METADATA = 0x05,
    497   ID_EXT_ELE_SAOC_3D = 0x06,
    498   ID_EXT_ELE_HOA = 0x07,
    499   ID_EXT_ELE_FMT_CNVRTR = 0x08,
    500   ID_EXT_ELE_MCT = 0x09,
    501   ID_EXT_ELE_ENHANCED_OBJ_METADATA = 0x0d,
    502   /* reserved for use outside of ISO scope */
    503   ID_EXT_ELE_VR_METADATA = 0x81,
    504   ID_EXT_ELE_UNKNOWN = 0xFF
    505 } USAC_EXT_ELEMENT_TYPE;
    506 
    507 /**
    508  * Proprietary raw packet file configuration data type identifier.
    509  */
    510 typedef enum {
    511   TC_NOTHING = 0,  /* No configuration available -> in-band configuration.   */
    512   TC_RAW_ADTS = 2, /* Transfer type is ADTS. */
    513   TC_RAW_LATM_MCP1 = 6, /* Transfer type is LATM with SMC present.    */
    514   TC_RAW_SDC = 21       /* Configuration data field is Drm SDC.             */
    515 
    516 } TP_CONFIG_TYPE;
    517 
    518 /*
    519  * ##############################################################################################
    520  * Library identification and error handling
    521  * ##############################################################################################
    522  */
    523 /* \cond */
    524 
    525 typedef enum {
    526   FDK_NONE = 0,
    527   FDK_TOOLS = 1,
    528   FDK_SYSLIB = 2,
    529   FDK_AACDEC = 3,
    530   FDK_AACENC = 4,
    531   FDK_SBRDEC = 5,
    532   FDK_SBRENC = 6,
    533   FDK_TPDEC = 7,
    534   FDK_TPENC = 8,
    535   FDK_MPSDEC = 9,
    536   FDK_MPEGFILEREAD = 10,
    537   FDK_MPEGFILEWRITE = 11,
    538   FDK_PCMDMX = 31,
    539   FDK_MPSENC = 34,
    540   FDK_TDLIMIT = 35,
    541   FDK_UNIDRCDEC = 38,
    542 
    543   FDK_MODULE_LAST
    544 
    545 } FDK_MODULE_ID;
    546 
    547 /* AAC capability flags */
    548 #define CAPF_AAC_LC 0x00000001 /**< Support flag for AAC Low Complexity. */
    549 #define CAPF_ER_AAC_LD                                                        \
    550   0x00000002 /**< Support flag for AAC Low Delay with Error Resilience tools. \
    551               */
    552 #define CAPF_ER_AAC_SCAL 0x00000004 /**< Support flag for AAC Scalable. */
    553 #define CAPF_ER_AAC_LC                                                      \
    554   0x00000008 /**< Support flag for AAC Low Complexity with Error Resilience \
    555                 tools. */
    556 #define CAPF_AAC_480 \
    557   0x00000010 /**< Support flag for AAC with 480 framelength.  */
    558 #define CAPF_AAC_512 \
    559   0x00000020 /**< Support flag for AAC with 512 framelength.  */
    560 #define CAPF_AAC_960 \
    561   0x00000040 /**< Support flag for AAC with 960 framelength.  */
    562 #define CAPF_AAC_1024 \
    563   0x00000080 /**< Support flag for AAC with 1024 framelength. */
    564 #define CAPF_AAC_HCR \
    565   0x00000100 /**< Support flag for AAC with Huffman Codeword Reordering.    */
    566 #define CAPF_AAC_VCB11 \
    567   0x00000200 /**< Support flag for AAC Virtual Codebook 11.    */
    568 #define CAPF_AAC_RVLC \
    569   0x00000400 /**< Support flag for AAC Reversible Variable Length Coding.   */
    570 #define CAPF_AAC_MPEG4 0x00000800 /**< Support flag for MPEG file format. */
    571 #define CAPF_AAC_DRC \
    572   0x00001000 /**< Support flag for AAC Dynamic Range Control. */
    573 #define CAPF_AAC_CONCEALMENT \
    574   0x00002000 /**< Support flag for AAC concealment.           */
    575 #define CAPF_AAC_DRM_BSFORMAT \
    576   0x00004000 /**< Support flag for AAC DRM bistream format. */
    577 #define CAPF_ER_AAC_ELD                                              \
    578   0x00008000 /**< Support flag for AAC Enhanced Low Delay with Error \
    579                 Resilience tools.  */
    580 #define CAPF_ER_AAC_BSAC \
    581   0x00010000 /**< Support flag for AAC BSAC.                           */
    582 #define CAPF_AAC_ELD_DOWNSCALE \
    583   0x00040000 /**< Support flag for AAC-ELD Downscaling           */
    584 #define CAPF_AAC_USAC_LP \
    585   0x00100000 /**< Support flag for USAC low power mode. */
    586 #define CAPF_AAC_USAC \
    587   0x00200000 /**< Support flag for Unified Speech and Audio Coding (USAC). */
    588 #define CAPF_ER_AAC_ELDV2 \
    589   0x00800000 /**< Support flag for AAC Enhanced Low Delay with MPS 212.  */
    590 #define CAPF_AAC_UNIDRC \
    591   0x01000000 /**< Support flag for MPEG-D Dynamic Range Control (uniDrc). */
    592 
    593 /* Transport capability flags */
    594 #define CAPF_ADTS \
    595   0x00000001 /**< Support flag for ADTS transport format.        */
    596 #define CAPF_ADIF \
    597   0x00000002 /**< Support flag for ADIF transport format.        */
    598 #define CAPF_LATM \
    599   0x00000004 /**< Support flag for LATM transport format.        */
    600 #define CAPF_LOAS \
    601   0x00000008 /**< Support flag for LOAS transport format.        */
    602 #define CAPF_RAWPACKETS \
    603   0x00000010 /**< Support flag for RAW PACKETS transport format. */
    604 #define CAPF_DRM \
    605   0x00000020 /**< Support flag for DRM/DRM+ transport format.    */
    606 #define CAPF_RSVD50 \
    607   0x00000040 /**< Support flag for RSVD50 transport format       */
    608 
    609 /* SBR capability flags */
    610 #define CAPF_SBR_LP \
    611   0x00000001 /**< Support flag for SBR Low Power mode.           */
    612 #define CAPF_SBR_HQ \
    613   0x00000002 /**< Support flag for SBR High Quality mode.        */
    614 #define CAPF_SBR_DRM_BS \
    615   0x00000004 /**< Support flag for                               */
    616 #define CAPF_SBR_CONCEALMENT \
    617   0x00000008 /**< Support flag for SBR concealment.              */
    618 #define CAPF_SBR_DRC \
    619   0x00000010 /**< Support flag for SBR Dynamic Range Control.    */
    620 #define CAPF_SBR_PS_MPEG \
    621   0x00000020 /**< Support flag for MPEG Parametric Stereo.       */
    622 #define CAPF_SBR_PS_DRM \
    623   0x00000040 /**< Support flag for DRM Parametric Stereo.        */
    624 #define CAPF_SBR_ELD_DOWNSCALE \
    625   0x00000080 /**< Support flag for ELD reduced delay mode        */
    626 #define CAPF_SBR_HBEHQ \
    627   0x00000100 /**< Support flag for HQ HBE                        */
    628 
    629 /* PCM utils capability flags */
    630 #define CAPF_DMX_BLIND \
    631   0x00000001 /**< Support flag for blind downmixing.             */
    632 #define CAPF_DMX_PCE                                                      \
    633   0x00000002 /**< Support flag for guided downmix with data from MPEG-2/4 \
    634                 Program Config Elements (PCE). */
    635 #define CAPF_DMX_ARIB                                                         \
    636   0x00000004 /**< Support flag for PCE guided downmix with slightly different \
    637                 equations and levels to fulfill ARIB standard. */
    638 #define CAPF_DMX_DVB                                                           \
    639   0x00000008 /**< Support flag for guided downmix with data from DVB ancillary \
    640                 data fields. */
    641 #define CAPF_DMX_CH_EXP                                                       \
    642   0x00000010 /**< Support flag for simple upmixing by dublicating channels or \
    643                 adding zero channels. */
    644 #define CAPF_DMX_6_CH                                                   \
    645   0x00000020 /**< Support flag for 5.1 channel configuration (input and \
    646                 output). */
    647 #define CAPF_DMX_8_CH                                                          \
    648   0x00000040 /**< Support flag for 6 and 7.1 channel configurations (input and \
    649                 output). */
    650 #define CAPF_DMX_24_CH                                                   \
    651   0x00000080 /**< Support flag for 22.2 channel configuration (input and \
    652                 output). */
    653 #define CAPF_LIMITER                                      \
    654   0x00002000 /**< Support flag for signal level limiting. \
    655               */
    656 
    657 /* MPEG Surround capability flags */
    658 #define CAPF_MPS_STD \
    659   0x00000001 /**< Support flag for MPEG Surround.           */
    660 #define CAPF_MPS_LD                                         \
    661   0x00000002 /**< Support flag for Low Delay MPEG Surround. \
    662               */
    663 #define CAPF_MPS_USAC \
    664   0x00000004 /**< Support flag for USAC MPEG Surround.      */
    665 #define CAPF_MPS_HQ                                                     \
    666   0x00000010 /**< Support flag indicating if high quality processing is \
    667                 supported */
    668 #define CAPF_MPS_LP                                                        \
    669   0x00000020 /**< Support flag indicating if partially complex (low power) \
    670                 processing is supported */
    671 #define CAPF_MPS_BLIND \
    672   0x00000040 /**< Support flag indicating if blind processing is supported */
    673 #define CAPF_MPS_BINAURAL \
    674   0x00000080 /**< Support flag indicating if binaural output is possible */
    675 #define CAPF_MPS_2CH_OUT \
    676   0x00000100 /**< Support flag indicating if 2ch output is possible      */
    677 #define CAPF_MPS_6CH_OUT \
    678   0x00000200 /**< Support flag indicating if 6ch output is possible      */
    679 #define CAPF_MPS_8CH_OUT \
    680   0x00000400 /**< Support flag indicating if 8ch output is possible      */
    681 #define CAPF_MPS_1CH_IN \
    682   0x00001000 /**< Support flag indicating if 1ch dmx input is possible   */
    683 #define CAPF_MPS_2CH_IN \
    684   0x00002000 /**< Support flag indicating if 2ch dmx input is possible   */
    685 #define CAPF_MPS_6CH_IN \
    686   0x00004000 /**< Support flag indicating if 5ch dmx input is possible   */
    687 
    688 /* \endcond */
    689 
    690 /*
    691  * ##############################################################################################
    692  * Library versioning
    693  * ##############################################################################################
    694  */
    695 
    696 /**
    697  * Convert each member of version numbers to one single numeric version
    698  * representation.
    699  * \param lev0  1st level of version number.
    700  * \param lev1  2nd level of version number.
    701  * \param lev2  3rd level of version number.
    702  */
    703 #define LIB_VERSION(lev0, lev1, lev2)                      \
    704   ((lev0 << 24 & 0xff000000) | (lev1 << 16 & 0x00ff0000) | \
    705    (lev2 << 8 & 0x0000ff00))
    706 
    707 /**
    708  *  Build text string of version.
    709  */
    710 #define LIB_VERSION_STRING(info)                                               \
    711   FDKsprintf((info)->versionStr, "%d.%d.%d", (((info)->version >> 24) & 0xff), \
    712              (((info)->version >> 16) & 0xff),                                 \
    713              (((info)->version >> 8) & 0xff))
    714 
    715 /**
    716  *  Library information.
    717  */
    718 typedef struct LIB_INFO {
    719   const char* title;
    720   const char* build_date;
    721   const char* build_time;
    722   FDK_MODULE_ID module_id;
    723   INT version;
    724   UINT flags;
    725   char versionStr[32];
    726 } LIB_INFO;
    727 
    728 #ifdef __cplusplus
    729 #define FDK_AUDIO_INLINE inline
    730 #else
    731 #define FDK_AUDIO_INLINE
    732 #endif
    733 
    734 /** Initialize library info. */
    735 static FDK_AUDIO_INLINE void FDKinitLibInfo(LIB_INFO* info) {
    736   int i;
    737 
    738   for (i = 0; i < FDK_MODULE_LAST; i++) {
    739     info[i].module_id = FDK_NONE;
    740   }
    741 }
    742 
    743 /** Aquire supported features of library. */
    744 static FDK_AUDIO_INLINE UINT
    745 FDKlibInfo_getCapabilities(const LIB_INFO* info, FDK_MODULE_ID module_id) {
    746   int i;
    747 
    748   for (i = 0; i < FDK_MODULE_LAST; i++) {
    749     if (info[i].module_id == module_id) {
    750       return info[i].flags;
    751     }
    752   }
    753   return 0;
    754 }
    755 
    756 /** Search for next free tab. */
    757 static FDK_AUDIO_INLINE INT FDKlibInfo_lookup(const LIB_INFO* info,
    758                                               FDK_MODULE_ID module_id) {
    759   int i = -1;
    760 
    761   for (i = 0; i < FDK_MODULE_LAST; i++) {
    762     if (info[i].module_id == module_id) return -1;
    763     if (info[i].module_id == FDK_NONE) break;
    764   }
    765   if (i == FDK_MODULE_LAST) return -1;
    766 
    767   return i;
    768 }
    769 
    770 /*
    771  * ##############################################################################################
    772  * Buffer description
    773  * ##############################################################################################
    774  */
    775 
    776 /**
    777  *  I/O buffer descriptor.
    778  */
    779 typedef struct FDK_bufDescr {
    780   void** ppBase;  /*!< Pointer to an array containing buffer base addresses.
    781                        Set to NULL for buffer requirement info. */
    782   UINT* pBufSize; /*!< Pointer to an array containing the number of elements
    783                      that can be placed in the specific buffer. */
    784   UINT* pEleSize; /*!< Pointer to an array containing the element size for each
    785                      buffer in bytes. That is mostly the number returned by the
    786                      sizeof() operator for the data type used for the specific
    787                      buffer. */
    788   UINT*
    789       pBufType; /*!< Pointer to an array of bit fields containing a description
    790                      for each buffer. See XXX below for more details.  */
    791   UINT numBufs; /*!< Total number of buffers. */
    792 
    793 } FDK_bufDescr;
    794 
    795 /**
    796  * Buffer type description field.
    797  */
    798 #define FDK_BUF_TYPE_MASK_IO ((UINT)0x03 << 30)
    799 #define FDK_BUF_TYPE_MASK_DESCR ((UINT)0x3F << 16)
    800 #define FDK_BUF_TYPE_MASK_ID ((UINT)0xFF)
    801 
    802 #define FDK_BUF_TYPE_INPUT ((UINT)0x1 << 30)
    803 #define FDK_BUF_TYPE_OUTPUT ((UINT)0x2 << 30)
    804 
    805 #define FDK_BUF_TYPE_PCM_DATA ((UINT)0x1 << 16)
    806 #define FDK_BUF_TYPE_ANC_DATA ((UINT)0x2 << 16)
    807 #define FDK_BUF_TYPE_BS_DATA ((UINT)0x4 << 16)
    808 
    809 #ifdef __cplusplus
    810 }
    811 #endif
    812 
    813 #endif /* FDK_AUDIO_H */
    814