/*
 * Mirror of https://github.com/mstorsjo/fdk-aac.git
 * (synced 2025-01-08 13:52:40 +01:00), commit 5c54fa5387.
 *
 * Test: atest DecoderTestXheAac ; atest DecoderTestAacDrc
 * Change-Id: Ic106c4371c5ac17cb832c7d9db042bcc9d1e7a09
 *
 * 467 lines, 17 KiB, C
 */
/* -----------------------------------------------------------------------------
|
|
Software License for The Fraunhofer FDK AAC Codec Library for Android
|
|
|
|
© Copyright 1995 - 2018 Fraunhofer-Gesellschaft zur Förderung der angewandten
|
|
Forschung e.V. All rights reserved.
|
|
|
|
1. INTRODUCTION
|
|
The Fraunhofer FDK AAC Codec Library for Android ("FDK AAC Codec") is software
|
|
that implements the MPEG Advanced Audio Coding ("AAC") encoding and decoding
|
|
scheme for digital audio. This FDK AAC Codec software is intended to be used on
|
|
a wide variety of Android devices.
|
|
|
|
AAC's HE-AAC and HE-AAC v2 versions are regarded as today's most efficient
|
|
general perceptual audio codecs. AAC-ELD is considered the best-performing
|
|
full-bandwidth communications codec by independent studies and is widely
|
|
deployed. AAC has been standardized by ISO and IEC as part of the MPEG
|
|
specifications.
|
|
|
|
Patent licenses for necessary patent claims for the FDK AAC Codec (including
|
|
those of Fraunhofer) may be obtained through Via Licensing
|
|
(www.vialicensing.com) or through the respective patent owners individually for
|
|
the purpose of encoding or decoding bit streams in products that are compliant
|
|
with the ISO/IEC MPEG audio standards. Please note that most manufacturers of
|
|
Android devices already license these patent claims through Via Licensing or
|
|
directly from the patent owners, and therefore FDK AAC Codec software may
|
|
already be covered under those patent licenses when it is used for those
|
|
licensed purposes only.
|
|
|
|
Commercially-licensed AAC software libraries, including floating-point versions
|
|
with enhanced sound quality, are also available from Fraunhofer. Users are
|
|
encouraged to check the Fraunhofer website for additional applications
|
|
information and documentation.
|
|
|
|
2. COPYRIGHT LICENSE
|
|
|
|
Redistribution and use in source and binary forms, with or without modification,
|
|
are permitted without payment of copyright license fees provided that you
|
|
satisfy the following conditions:
|
|
|
|
You must retain the complete text of this software license in redistributions of
|
|
the FDK AAC Codec or your modifications thereto in source code form.
|
|
|
|
You must retain the complete text of this software license in the documentation
|
|
and/or other materials provided with redistributions of the FDK AAC Codec or
|
|
your modifications thereto in binary form. You must make available free of
|
|
charge copies of the complete source code of the FDK AAC Codec and your
|
|
modifications thereto to recipients of copies in binary form.
|
|
|
|
The name of Fraunhofer may not be used to endorse or promote products derived
|
|
from this library without prior written permission.
|
|
|
|
You may not charge copyright license fees for anyone to use, copy or distribute
|
|
the FDK AAC Codec software or your modifications thereto.
|
|
|
|
Your modified versions of the FDK AAC Codec must carry prominent notices stating
|
|
that you changed the software and the date of any change. For modified versions
|
|
of the FDK AAC Codec, the term "Fraunhofer FDK AAC Codec Library for Android"
|
|
must be replaced by the term "Third-Party Modified Version of the Fraunhofer FDK
|
|
AAC Codec Library for Android."
|
|
|
|
3. NO PATENT LICENSE
|
|
|
|
NO EXPRESS OR IMPLIED LICENSES TO ANY PATENT CLAIMS, including without
|
|
limitation the patents of Fraunhofer, ARE GRANTED BY THIS SOFTWARE LICENSE.
|
|
Fraunhofer provides no warranty of patent non-infringement with respect to this
|
|
software.
|
|
|
|
You may use this FDK AAC Codec software or modifications thereto only for
|
|
purposes that are authorized by appropriate patent licenses.
|
|
|
|
4. DISCLAIMER
|
|
|
|
This FDK AAC Codec software is provided by Fraunhofer on behalf of the copyright
|
|
holders and contributors "AS IS" and WITHOUT ANY EXPRESS OR IMPLIED WARRANTIES,
|
|
including but not limited to the implied warranties of merchantability and
|
|
fitness for a particular purpose. IN NO EVENT SHALL THE COPYRIGHT HOLDER OR
|
|
CONTRIBUTORS BE LIABLE for any direct, indirect, incidental, special, exemplary,
|
|
or consequential damages, including but not limited to procurement of substitute
|
|
goods or services; loss of use, data, or profits, or business interruption,
|
|
however caused and on any theory of liability, whether in contract, strict
|
|
liability, or tort (including negligence), arising in any way out of the use of
|
|
this software, even if advised of the possibility of such damage.
|
|
|
|
5. CONTACT INFORMATION
|
|
|
|
Fraunhofer Institute for Integrated Circuits IIS
|
|
Attention: Audio and Multimedia Departments - FDK AAC LL
|
|
Am Wolfsmantel 33
|
|
91058 Erlangen, Germany
|
|
|
|
www.iis.fraunhofer.de/amm
|
|
amm-info@iis.fraunhofer.de
|
|
----------------------------------------------------------------------------- */

/******************* MPEG transport format encoder library *********************

   Author(s):   Manuel Jander

   Description: MPEG Transport data tables

*******************************************************************************/

#ifndef TP_DATA_H
#define TP_DATA_H

#include "machine_type.h"
#include "FDK_audio.h"
#include "FDK_bitstream.h"

/*
 * Configuration
 */

#define TP_USAC_MAX_SPEAKERS (24)

#define TP_USAC_MAX_EXT_ELEMENTS ((24))

#define TP_USAC_MAX_ELEMENTS ((24) + TP_USAC_MAX_EXT_ELEMENTS)

/* next power of two of maximum of escapedValue(hBs, 4, 4, 8) in
   AudioPreRoll() (285) */
#define TP_USAC_MAX_CONFIG_LEN (512)

/* Number of frames for config change in USAC */
#define TPDEC_USAC_NUM_CONFIG_CHANGE_FRAMES (1)

/* Flush mode constants.
   NOTE(review): presumably the values carried in CCtrlCFGChange::flushStatus -
   confirm against the code that sets that field. */
enum {
  TPDEC_FLUSH_OFF = 0,
  TPDEC_RSV60_CFG_CHANGE_ATSC_FLUSH_ON = 1,
  TPDEC_RSV60_DASH_IPF_ATSC_FLUSH_ON = 2,
  TPDEC_USAC_DASH_IPF_FLUSH_ON = 3
};

/* Build-up mode constants.
   NOTE(review): presumably the values carried in
   CCtrlCFGChange::buildUpStatus - confirm against the code that sets that
   field. */
enum {
  TPDEC_BUILD_UP_OFF = 0,
  TPDEC_RSV60_BUILD_UP_ON = 1,
  TPDEC_RSV60_BUILD_UP_ON_IN_BAND = 2,
  TPDEC_USAC_BUILD_UP_ON = 3,
  TPDEC_RSV60_BUILD_UP_IDLE = 4,
  TPDEC_RSV60_BUILD_UP_IDLE_IN_BAND = 5
};

/**
 * ProgramConfig struct.
 *
 * The PC_* constants below are the array dimensions used by the struct.
 */
/* ISO/IEC 14496-3 4.4.1.1 Table 4.2 Program config element */
#define PC_FSB_CHANNELS_MAX 16 /* Front/Side/Back channels */
#define PC_LFE_CHANNELS_MAX 4
#define PC_ASSOCDATA_MAX 8
#define PC_CCEL_MAX 16 /* CC elements */
#define PC_COMMENTLENGTH 256
#define PC_NUM_HEIGHT_LAYER 3

typedef struct {
|
|
/* PCE bitstream elements: */
|
|
UCHAR ElementInstanceTag;
|
|
UCHAR Profile;
|
|
UCHAR SamplingFrequencyIndex;
|
|
UCHAR NumFrontChannelElements;
|
|
UCHAR NumSideChannelElements;
|
|
UCHAR NumBackChannelElements;
|
|
UCHAR NumLfeChannelElements;
|
|
UCHAR NumAssocDataElements;
|
|
UCHAR NumValidCcElements;
|
|
|
|
UCHAR MonoMixdownPresent;
|
|
UCHAR MonoMixdownElementNumber;
|
|
|
|
UCHAR StereoMixdownPresent;
|
|
UCHAR StereoMixdownElementNumber;
|
|
|
|
UCHAR MatrixMixdownIndexPresent;
|
|
UCHAR MatrixMixdownIndex;
|
|
UCHAR PseudoSurroundEnable;
|
|
|
|
UCHAR FrontElementIsCpe[PC_FSB_CHANNELS_MAX];
|
|
UCHAR FrontElementTagSelect[PC_FSB_CHANNELS_MAX];
|
|
UCHAR FrontElementHeightInfo[PC_FSB_CHANNELS_MAX];
|
|
|
|
UCHAR SideElementIsCpe[PC_FSB_CHANNELS_MAX];
|
|
UCHAR SideElementTagSelect[PC_FSB_CHANNELS_MAX];
|
|
UCHAR SideElementHeightInfo[PC_FSB_CHANNELS_MAX];
|
|
|
|
UCHAR BackElementIsCpe[PC_FSB_CHANNELS_MAX];
|
|
UCHAR BackElementTagSelect[PC_FSB_CHANNELS_MAX];
|
|
UCHAR BackElementHeightInfo[PC_FSB_CHANNELS_MAX];
|
|
|
|
UCHAR LfeElementTagSelect[PC_LFE_CHANNELS_MAX];
|
|
|
|
UCHAR AssocDataElementTagSelect[PC_ASSOCDATA_MAX];
|
|
|
|
UCHAR CcElementIsIndSw[PC_CCEL_MAX];
|
|
UCHAR ValidCcElementTagSelect[PC_CCEL_MAX];
|
|
|
|
UCHAR CommentFieldBytes;
|
|
UCHAR Comment[PC_COMMENTLENGTH];
|
|
|
|
/* Helper variables for administration: */
|
|
UCHAR isValid; /*!< Flag showing if PCE has been read successfully. */
|
|
UCHAR
|
|
NumChannels; /*!< Amount of audio channels summing all channel elements
|
|
including LFEs */
|
|
UCHAR NumEffectiveChannels; /*!< Amount of audio channels summing only SCEs
|
|
and CPEs */
|
|
UCHAR elCounter;
|
|
|
|
} CProgramConfig;
|
|
|
|
/**
 * Extension identifiers used with the audio specific config.
 *
 * The spelling ASCEXT_UNKOWN is kept as is because the name is part of the
 * public interface.
 */
typedef enum {
  ASCEXT_UNKOWN = -1,
  ASCEXT_SBR = 0x2b7,
  ASCEXT_PS = 0x548,
  ASCEXT_MPS = 0x76a,
  ASCEXT_SAOC = 0x7cb,
  ASCEXT_LDMPS = 0x7cc

} TP_ASC_EXTENSION_ID;

/**
|
|
* GaSpecificConfig struct
|
|
*/
|
|
typedef struct {
|
|
UINT m_frameLengthFlag;
|
|
UINT m_dependsOnCoreCoder;
|
|
UINT m_coreCoderDelay;
|
|
|
|
UINT m_extensionFlag;
|
|
UINT m_extensionFlag3;
|
|
|
|
UINT m_layer;
|
|
UINT m_numOfSubFrame;
|
|
UINT m_layerLength;
|
|
|
|
} CSGaSpecificConfig;
|
|
|
|
/**
 * ELD extension type tags.
 */
typedef enum {
  ELDEXT_TERM = 0x0,         /* Termination tag */
  ELDEXT_SAOC = 0x1,         /* SAOC config */
  ELDEXT_LDSAC = 0x2,        /* LD MPEG Surround config */
  ELDEXT_DOWNSCALEINFO = 0x3 /* ELD sample rate adaptation */
  /* reserved */
} ASC_ELD_EXT_TYPE;

typedef struct {
|
|
UCHAR m_frameLengthFlag;
|
|
|
|
UCHAR m_sbrPresentFlag;
|
|
UCHAR
|
|
m_useLdQmfTimeAlign; /* Use LD-MPS QMF in SBR to achive time alignment */
|
|
UCHAR m_sbrSamplingRate;
|
|
UCHAR m_sbrCrcFlag;
|
|
UINT m_downscaledSamplingFrequency;
|
|
|
|
} CSEldSpecificConfig;
|
|
|
|
typedef struct {
|
|
USAC_EXT_ELEMENT_TYPE usacExtElementType;
|
|
USHORT usacExtElementConfigLength;
|
|
USHORT usacExtElementDefaultLength;
|
|
UCHAR usacExtElementPayloadFrag;
|
|
UCHAR usacExtElementHasAudioPreRoll;
|
|
} CSUsacExtElementConfig;
|
|
|
|
typedef struct {
|
|
MP4_ELEMENT_ID usacElementType;
|
|
UCHAR m_noiseFilling;
|
|
UCHAR m_harmonicSBR;
|
|
UCHAR m_interTes;
|
|
UCHAR m_pvc;
|
|
UCHAR m_stereoConfigIndex;
|
|
CSUsacExtElementConfig extElement;
|
|
} CSUsacElementConfig;
|
|
|
|
typedef struct {
|
|
UCHAR m_frameLengthFlag;
|
|
UCHAR m_coreSbrFrameLengthIndex;
|
|
UCHAR m_sbrRatioIndex;
|
|
UCHAR m_nUsacChannels; /* number of audio channels signaled in
|
|
UsacDecoderConfig() / rsv603daDecoderConfig() via
|
|
numElements and usacElementType */
|
|
UCHAR m_channelConfigurationIndex;
|
|
UINT m_usacNumElements;
|
|
CSUsacElementConfig element[TP_USAC_MAX_ELEMENTS];
|
|
|
|
UCHAR numAudioChannels;
|
|
UCHAR m_usacConfigExtensionPresent;
|
|
UCHAR elementLengthPresent;
|
|
UCHAR UsacConfig[TP_USAC_MAX_CONFIG_LEN];
|
|
USHORT UsacConfigBits;
|
|
} CSUsacConfig;
|
|
|
|
/**
|
|
* Audio configuration struct, suitable for encoder and decoder configuration.
|
|
*/
|
|
typedef struct {
|
|
/* XYZ Specific Data */
|
|
union {
|
|
CSGaSpecificConfig
|
|
m_gaSpecificConfig; /**< General audio specific configuration. */
|
|
CSEldSpecificConfig m_eldSpecificConfig; /**< ELD specific configuration. */
|
|
CSUsacConfig m_usacConfig; /**< USAC specific configuration */
|
|
} m_sc;
|
|
|
|
/* Common ASC parameters */
|
|
CProgramConfig m_progrConfigElement; /**< Program configuration. */
|
|
|
|
AUDIO_OBJECT_TYPE m_aot; /**< Audio Object Type. */
|
|
UINT m_samplingFrequency; /**< Samplerate. */
|
|
UINT m_samplesPerFrame; /**< Amount of samples per frame. */
|
|
UINT m_directMapping; /**< Document this please !! */
|
|
|
|
AUDIO_OBJECT_TYPE m_extensionAudioObjectType; /**< Audio object type */
|
|
UINT m_extensionSamplingFrequency; /**< Samplerate */
|
|
|
|
SCHAR m_channelConfiguration; /**< Channel configuration index */
|
|
|
|
SCHAR m_epConfig; /**< Error protection index */
|
|
SCHAR m_vcb11Flag; /**< aacSectionDataResilienceFlag */
|
|
SCHAR m_rvlcFlag; /**< aacScalefactorDataResilienceFlag */
|
|
SCHAR m_hcrFlag; /**< aacSpectralDataResilienceFlag */
|
|
|
|
SCHAR m_sbrPresentFlag; /**< Flag indicating the presence of SBR data in the
|
|
bitstream */
|
|
SCHAR
|
|
m_psPresentFlag; /**< Flag indicating the presence of parametric stereo
|
|
data in the bitstream */
|
|
UCHAR m_samplingFrequencyIndex; /**< Samplerate index */
|
|
UCHAR m_extensionSamplingFrequencyIndex; /**< Samplerate index */
|
|
SCHAR m_extensionChannelConfiguration; /**< Channel configuration index */
|
|
|
|
UCHAR
|
|
configMode; /**< The flag indicates if the callback shall work in memory
|
|
allocation mode or in config change detection mode */
|
|
UCHAR AacConfigChanged; /**< The flag will be set if at least one aac config
|
|
parameter has changed that requires a memory
|
|
reconfiguration, otherwise it will be cleared */
|
|
UCHAR SbrConfigChanged; /**< The flag will be set if at least one sbr config
|
|
parameter has changed that requires a memory
|
|
reconfiguration, otherwise it will be cleared */
|
|
UCHAR SacConfigChanged; /**< The flag will be set if at least one sac config
|
|
parameter has changed that requires a memory
|
|
reconfiguration, otherwise it will be cleared */
|
|
|
|
UCHAR
|
|
config[TP_USAC_MAX_CONFIG_LEN]; /**< Configuration stored as bitstream */
|
|
UINT configBits; /**< Configuration length in bits */
|
|
|
|
} CSAudioSpecificConfig;
|
|
|
|
typedef struct {
|
|
SCHAR flushCnt; /**< Flush frame counter */
|
|
UCHAR flushStatus; /**< Flag indicates flush mode: on|off */
|
|
SCHAR buildUpCnt; /**< Build up frame counter */
|
|
UCHAR buildUpStatus; /**< Flag indicates build up mode: on|off */
|
|
UCHAR cfgChanged; /**< Flag indicates that the config changed and the decoder
|
|
needs to be initialized again via callback. Make sure
|
|
that memory is freed before initialization. */
|
|
UCHAR contentChanged; /**< Flag indicates that the content changed i.e. a
|
|
right truncation occured before */
|
|
UCHAR forceCfgChange; /**< Flag indicates if config change has to be forced
|
|
even if new config is the same */
|
|
} CCtrlCFGChange;
|
|
|
|
/** Config change notify callback type (see CSTpCallBacks::cbUpdateConfig).
    The first argument is an opaque pointer; CSTpCallBacks pairs each callback
    with a matching user data pointer. */
typedef INT (*cbUpdateConfig_t)(void *, const CSAudioSpecificConfig *,
                                const UCHAR configMode, UCHAR *configChanged);

/** Free memory callback type (see CSTpCallBacks::cbFreeMem). */
typedef INT (*cbFreeMem_t)(void *, const CSAudioSpecificConfig *);

/** Config change control callback type (see CSTpCallBacks::cbCtrlCFGChange). */
typedef INT (*cbCtrlCFGChange_t)(void *, const CCtrlCFGChange *);

/** SSC parser callback type (see CSTpCallBacks::cbSsc). */
typedef INT (*cbSsc_t)(void *, HANDLE_FDK_BITSTREAM,
                       const AUDIO_OBJECT_TYPE coreCodec,
                       const INT samplingRate, const INT frameSize,
                       const INT stereoConfigIndex,
                       const INT coreSbrFrameLengthIndex, const INT configBytes,
                       const UCHAR configMode, UCHAR *configChanged);

/** SBR header parser callback type (see CSTpCallBacks::cbSbr). */
typedef INT (*cbSbr_t)(void *self, HANDLE_FDK_BITSTREAM hBs,
                       const INT sampleRateIn, const INT sampleRateOut,
                       const INT samplesPerFrame,
                       const AUDIO_OBJECT_TYPE coreCodec,
                       const MP4_ELEMENT_ID elementID, const INT elementIndex,
                       const UCHAR harmonicSbr, const UCHAR stereoConfigIndex,
                       const UCHAR configMode, UCHAR *configChanged,
                       const INT downscaleFactor);

/** Callback type stored in CSTpCallBacks::cbUsac; it receives a bitstream
    handle. */
typedef INT (*cbUsac_t)(void *self, HANDLE_FDK_BITSTREAM hBs);

/** uniDrcConfig and loudnessInfoSet parser callback type (see
    CSTpCallBacks::cbUniDrc). */
typedef INT (*cbUniDrc_t)(void *self, HANDLE_FDK_BITSTREAM hBs,
                          const INT fullPayloadLength, const INT payloadType,
                          const INT subStreamIndex, const INT payloadStart,
                          const AUDIO_OBJECT_TYPE);

typedef struct {
|
|
cbUpdateConfig_t cbUpdateConfig; /*!< Function pointer for Config change
|
|
notify callback. */
|
|
void *cbUpdateConfigData; /*!< User data pointer for Config change notify
|
|
callback. */
|
|
cbFreeMem_t cbFreeMem; /*!< Function pointer for free memory callback. */
|
|
void *cbFreeMemData; /*!< User data pointer for free memory callback. */
|
|
cbCtrlCFGChange_t cbCtrlCFGChange; /*!< Function pointer for config change
|
|
control callback. */
|
|
void *cbCtrlCFGChangeData; /*!< User data pointer for config change control
|
|
callback. */
|
|
cbSsc_t cbSsc; /*!< Function pointer for SSC parser callback. */
|
|
void *cbSscData; /*!< User data pointer for SSC parser callback. */
|
|
cbSbr_t cbSbr; /*!< Function pointer for SBR header parser callback. */
|
|
void *cbSbrData; /*!< User data pointer for SBR header parser callback. */
|
|
cbUsac_t cbUsac;
|
|
void *cbUsacData;
|
|
cbUniDrc_t cbUniDrc; /*!< Function pointer for uniDrcConfig and
|
|
loudnessInfoSet parser callback. */
|
|
void *cbUniDrcData; /*!< User data pointer for uniDrcConfig and
|
|
loudnessInfoSet parser callback. */
|
|
} CSTpCallBacks;
|
|
|
|
/* Sampling rates in Hz, addressed by sampling rate index (32 entries).
   Entries 13, 14 and 28..31 are 0. */
static const UINT SamplingRateTable[] = {
    96000, 88200, 64000, 48000, 44100, 32000, 24000, 22050, 16000, 12000, 11025,
    8000,  7350,  0,     0,     57600, 51200, 40000, 38400, 34150, 28800, 25600,
    20000, 19200, 17075, 14400, 12800, 9600,  0,     0,     0,     0};

/**
 * \brief  Look up the index of a sampling rate in SamplingRateTable.
 *
 * Only the first (1 << nBits) - 1 table entries are searched, so the all-ones
 * index of an nBits wide field is never returned as a match. That all-ones
 * value is what gets returned when no entry matches.
 * NOTE(review): presumably this is the escape index of the sampling frequency
 * index field - confirm against the callers.
 *
 * The search never runs past the end of the table, whatever nBits is.
 * A samplingRate of 0 matches the zero-valued table entries (the first one is
 * at index 13, if it lies inside the searched range).
 *
 * \param samplingRate  Sampling rate to look up.
 * \param nBits         Width in bits of the index field.
 * \return  Index of the first matching entry, or (1 << nBits) - 1 if there
 *          is none.
 */
static inline int getSamplingRateIndex(UINT samplingRate, UINT nBits) {
  const UINT numEntries =
      (UINT)(sizeof(SamplingRateTable) / sizeof(SamplingRateTable[0]));
  /* Guard the shift: shifting by the type width or more is undefined. */
  const UINT notFoundIndex = (nBits < 31) ? ((1u << nBits) - 1u) : 0x7FFFFFFFu;
  /* Never search beyond the table, even for an oversized nBits. */
  const UINT searchEnd = (notFoundIndex < numEntries) ? notFoundIndex
                                                      : numEntries;
  UINT sf_index;

  for (sf_index = 0; sf_index < searchEnd; sf_index++) {
    if (SamplingRateTable[sf_index] == samplingRate) {
      return (int)sf_index;
    }
  }

  return (int)notFoundIndex;
}

/*
 * Get Channel count from channel configuration
 */
/**
 * \brief  Map a channel configuration index to its total channel count.
 *
 * Configurations 1..6 map to the same number of channels; 7, 12 and 14 map
 * to 8, 11 maps to 7 and 13 maps to 24.
 *
 * \param channelConfig  Channel configuration index.
 * \return  Number of channels, or 0 for any other index.
 */
static inline int getNumberOfTotalChannels(int channelConfig) {
  switch (channelConfig) {
    case 1:
    case 2:
    case 3:
    case 4:
    case 5:
    case 6:
      return channelConfig;
    case 7:
    case 12:
    case 14:
      return 8;
    case 11:
      return 7;
    case 13:
      return 24;
    default:
      return 0;
  }
}

/**
 * \brief  Map a channel configuration index to its effective channel count.
 *
 * NOTE(review): "effective" presumably means the count without LFE channels,
 * as for CProgramConfig::NumEffectiveChannels - confirm.
 *
 * \param channelConfig  Channel configuration index; the table covers 0..15.
 * \return  Table value for indices 0..15, or 0 for an index outside that
 *          range (which would otherwise read outside the table).
 */
static inline int getNumberOfEffectiveChannels(const int channelConfig) {
  /* index:               0  1  2  3  4  5  6  7  8  9 10 11 12  13 14 15 */
  static const int n[] = {0, 1, 2, 3, 4, 5, 5, 7, 0, 0, 0, 6, 7, 22, 7, 0};
  const int numEntries = (int)(sizeof(n) / sizeof(n[0]));

  if (channelConfig < 0 || channelConfig >= numEntries) {
    return 0;
  }
  return n[channelConfig];
}

#endif /* TP_DATA_H */