blob: df9e99691ff4d56f6148a1fa46caeb0fea6e7744 [file] [log] [blame]
/* -----------------------------------------------------------------------------
Software License for The Fraunhofer FDK AAC Codec Library for Android
© Copyright 1995 - 2018 Fraunhofer-Gesellschaft zur Förderung der angewandten
Forschung e.V. All rights reserved.
1. INTRODUCTION
The Fraunhofer FDK AAC Codec Library for Android ("FDK AAC Codec") is software
that implements the MPEG Advanced Audio Coding ("AAC") encoding and decoding
scheme for digital audio. This FDK AAC Codec software is intended to be used on
a wide variety of Android devices.
AAC's HE-AAC and HE-AAC v2 versions are regarded as today's most efficient
general perceptual audio codecs. AAC-ELD is considered the best-performing
full-bandwidth communications codec by independent studies and is widely
deployed. AAC has been standardized by ISO and IEC as part of the MPEG
specifications.
Patent licenses for necessary patent claims for the FDK AAC Codec (including
those of Fraunhofer) may be obtained through Via Licensing
(www.vialicensing.com) or through the respective patent owners individually for
the purpose of encoding or decoding bit streams in products that are compliant
with the ISO/IEC MPEG audio standards. Please note that most manufacturers of
Android devices already license these patent claims through Via Licensing or
directly from the patent owners, and therefore FDK AAC Codec software may
already be covered under those patent licenses when it is used for those
licensed purposes only.
Commercially-licensed AAC software libraries, including floating-point versions
with enhanced sound quality, are also available from Fraunhofer. Users are
encouraged to check the Fraunhofer website for additional applications
information and documentation.
2. COPYRIGHT LICENSE
Redistribution and use in source and binary forms, with or without modification,
are permitted without payment of copyright license fees provided that you
satisfy the following conditions:
You must retain the complete text of this software license in redistributions of
the FDK AAC Codec or your modifications thereto in source code form.
You must retain the complete text of this software license in the documentation
and/or other materials provided with redistributions of the FDK AAC Codec or
your modifications thereto in binary form. You must make available free of
charge copies of the complete source code of the FDK AAC Codec and your
modifications thereto to recipients of copies in binary form.
The name of Fraunhofer may not be used to endorse or promote products derived
from this library without prior written permission.
You may not charge copyright license fees for anyone to use, copy or distribute
the FDK AAC Codec software or your modifications thereto.
Your modified versions of the FDK AAC Codec must carry prominent notices stating
that you changed the software and the date of any change. For modified versions
of the FDK AAC Codec, the term "Fraunhofer FDK AAC Codec Library for Android"
must be replaced by the term "Third-Party Modified Version of the Fraunhofer FDK
AAC Codec Library for Android."
3. NO PATENT LICENSE
NO EXPRESS OR IMPLIED LICENSES TO ANY PATENT CLAIMS, including without
limitation the patents of Fraunhofer, ARE GRANTED BY THIS SOFTWARE LICENSE.
Fraunhofer provides no warranty of patent non-infringement with respect to this
software.
You may use this FDK AAC Codec software or modifications thereto only for
purposes that are authorized by appropriate patent licenses.
4. DISCLAIMER
This FDK AAC Codec software is provided by Fraunhofer on behalf of the copyright
holders and contributors "AS IS" and WITHOUT ANY EXPRESS OR IMPLIED WARRANTIES,
including but not limited to the implied warranties of merchantability and
fitness for a particular purpose. IN NO EVENT SHALL THE COPYRIGHT HOLDER OR
CONTRIBUTORS BE LIABLE for any direct, indirect, incidental, special, exemplary,
or consequential damages, including but not limited to procurement of substitute
goods or services; loss of use, data, or profits, or business interruption,
however caused and on any theory of liability, whether in contract, strict
liability, or tort (including negligence), arising in any way out of the use of
this software, even if advised of the possibility of such damage.
5. CONTACT INFORMATION
Fraunhofer Institute for Integrated Circuits IIS
Attention: Audio and Multimedia Departments - FDK AAC LL
Am Wolfsmantel 33
91058 Erlangen, Germany
www.iis.fraunhofer.de/amm
amm-info@iis.fraunhofer.de
----------------------------------------------------------------------------- */
/**************************** SBR encoder library ******************************
Author(s): Andreas Ehret, Tobias Chalupka
Description: SBR encoder top level processing.
*******************************************************************************/
#include "sbr_encoder.h"
#include "sbrenc_ram.h"
#include "sbrenc_rom.h"
#include "sbrenc_freq_sca.h"
#include "env_bit.h"
#include "cmondata.h"
#include "sbr_misc.h"
#include "sbr.h"
#include "qmf.h"
#include "ps_main.h"
#define SBRENCODER_LIB_VL0 4
#define SBRENCODER_LIB_VL1 0
#define SBRENCODER_LIB_VL2 0
/***************************************************************************/
/*
* SBR Delay balancing definitions.
*/
/*
input buffer (1ch)
|------------ 1537 -------------|-----|---------- 2048 -------------|
(core2sbr delay ) ds (read, core and ds area)
*/
#define SFB(dwnsmp) \
(32 << (dwnsmp - \
1)) /* SBR Frequency bands: 64 for dual-rate, 32 for single-rate */
#define STS(fl) \
(((fl) == 1024) ? 32 \
: 30) /* SBR Time Slots: 32 for core frame length 1024, 30 \
for core frame length 960 */
#define DELAY_QMF_ANA(dwnsmp) \
((320 << ((dwnsmp)-1)) - (32 << ((dwnsmp)-1))) /* Full bandwidth */
#define DELAY_HYB_ANA (10 * 64) /* + 0.5 */ /* */
#define DELAY_HYB_SYN (6 * 64 - 32) /* */
#define DELAY_QMF_POSTPROC(dwnsmp) \
(32 * (dwnsmp)) /* QMF postprocessing delay */
#define DELAY_DEC_QMF(dwnsmp) (6 * SFB(dwnsmp)) /* Decoder QMF overlap */
#define DELAY_QMF_SYN(dwnsmp) \
(1 << (dwnsmp - \
1)) /* QMF_NO_POLY/2=2.5, rounded down to 2, half for single-rate */
#define DELAY_QMF_DS (32) /* QMF synthesis for downsampled time signal */
/* Delay in QMF paths */
#define DELAY_SBR(fl, dwnsmp) \
(DELAY_QMF_ANA(dwnsmp) + (SFB(dwnsmp) * STS(fl) - 1) + DELAY_QMF_SYN(dwnsmp))
#define DELAY_PS(fl, dwnsmp) \
(DELAY_QMF_ANA(dwnsmp) + DELAY_HYB_ANA + DELAY_DEC_QMF(dwnsmp) + \
(SFB(dwnsmp) * STS(fl) - 1) + DELAY_HYB_SYN + DELAY_QMF_SYN(dwnsmp))
#define DELAY_ELDSBR(fl, dwnsmp) \
((((fl) / 2) * (dwnsmp)) - 1 + DELAY_QMF_POSTPROC(dwnsmp))
#define DELAY_ELDv2SBR(fl, dwnsmp) \
((((fl) / 2) * (dwnsmp)) - 1 + 80 * (dwnsmp)) /* 80 is the delay caused \
by the sum of the CLD \
analysis and the MPSLD \
synthesis filterbank */
/* Delay in core path (core and downsampler not taken into account) */
#define DELAY_COREPATH_SBR(fl, dwnsmp) \
((DELAY_QMF_ANA(dwnsmp) + DELAY_DEC_QMF(dwnsmp) + DELAY_QMF_SYN(dwnsmp)))
#define DELAY_COREPATH_ELDSBR(fl, dwnsmp) ((DELAY_QMF_POSTPROC(dwnsmp)))
#define DELAY_COREPATH_ELDv2SBR(fl, dwnsmp) (128 * (dwnsmp)) /* 4 slots */
#define DELAY_COREPATH_PS(fl, dwnsmp) \
((DELAY_QMF_ANA(dwnsmp) + DELAY_QMF_DS + \
/*(DELAY_AAC(fl)*2) + */ DELAY_QMF_ANA(dwnsmp) + DELAY_DEC_QMF(dwnsmp) + \
DELAY_HYB_SYN + DELAY_QMF_SYN(dwnsmp))) /* 2048 - 463*2 */
/* Delay differences between SBR- and downsampled path for SBR and SBR+PS */
#define DELAY_AAC2SBR(fl, dwnsmp) \
((DELAY_COREPATH_SBR(fl, dwnsmp)) - DELAY_SBR((fl), (dwnsmp)))
#define DELAY_ELD2SBR(fl, dwnsmp) \
((DELAY_COREPATH_ELDSBR(fl, dwnsmp)) - DELAY_ELDSBR(fl, dwnsmp))
#define DELAY_AAC2PS(fl, dwnsmp) \
((DELAY_COREPATH_PS(fl, dwnsmp)) - DELAY_PS(fl, dwnsmp)) /* 2048 - 463*2 */
/* Assumption: The sample delay resulting of of DELAY_AAC2PS is always smaller
* than the sample delay implied by DELAY_AAC2SBR */
#define MAX_DS_FILTER_DELAY \
(5) /* the additional max downsampler filter delay (source fs) */
#define MAX_SAMPLE_DELAY \
(DELAY_AAC2SBR(1024, 2) + MAX_DS_FILTER_DELAY) /* maximum delay: frame \
length of 1024 and \
dual-rate sbr */
/***************************************************************************/
/*************** Delay parameters for sbrEncoder_Init_delay() **************/
typedef struct {
int dsDelay; /* the delay of the (time-domain) downsampler itself */
int delay; /* overall delay / samples */
int sbrDecDelay; /* SBR decoder's delay */
int corePathOffset; /* core path offset / samples; added by
sbrEncoder_Init_delay() */
int sbrPathOffset; /* SBR path offset / samples; added by
sbrEncoder_Init_delay() */
int bitstrDelay; /* bitstream delay / frames; added by sbrEncoder_Init_delay()
*/
int delayInput2Core; /* delay of the input to the core / samples */
} DELAY_PARAM;
/***************************************************************************/
#define INVALID_TABLE_IDX -1
/***************************************************************************/
/*!
\brief Selects the SBR tuning settings to use dependent on number of
channels, bitrate, sample rate and core coder
\return Index to the appropriate table
****************************************************************************/
#define DISTANCE_CEIL_VALUE 5000000
static INT getSbrTuningTableIndex(
UINT bitrate, /*! the total bitrate in bits/sec */
UINT numChannels, /*! the number of channels for the core coder */
UINT sampleRate, /*! the sampling rate of the core coder */
AUDIO_OBJECT_TYPE core, UINT *pBitRateClosest) {
int i, bitRateClosestLowerIndex = -1, bitRateClosestUpperIndex = -1,
found = 0;
UINT bitRateClosestUpper = 0, bitRateClosestLower = DISTANCE_CEIL_VALUE;
#define isForThisCore(i) \
((sbrTuningTable[i].coreCoder == CODEC_AACLD && core == AOT_ER_AAC_ELD) || \
(sbrTuningTable[i].coreCoder == CODEC_AAC && core != AOT_ER_AAC_ELD))
for (i = 0; i < sbrTuningTableSize; i++) {
if (isForThisCore(i)) /* tuning table is for this core codec */
{
if (numChannels == sbrTuningTable[i].numChannels &&
sampleRate == sbrTuningTable[i].sampleRate) {
found = 1;
if ((bitrate >= sbrTuningTable[i].bitrateFrom) &&
(bitrate < sbrTuningTable[i].bitrateTo)) {
return i;
} else {
if (sbrTuningTable[i].bitrateFrom > bitrate) {
if (sbrTuningTable[i].bitrateFrom < bitRateClosestLower) {
bitRateClosestLower = sbrTuningTable[i].bitrateFrom;
bitRateClosestLowerIndex = i;
}
}
if (sbrTuningTable[i].bitrateTo <= bitrate) {
if (sbrTuningTable[i].bitrateTo > bitRateClosestUpper) {
bitRateClosestUpper = sbrTuningTable[i].bitrateTo - 1;
bitRateClosestUpperIndex = i;
}
}
}
}
}
}
if (bitRateClosestUpperIndex >= 0) {
return bitRateClosestUpperIndex;
}
if (pBitRateClosest != NULL) {
/* If there was at least one matching tuning entry pick the least distance
* bit rate */
if (found) {
int distanceUpper = DISTANCE_CEIL_VALUE,
distanceLower = DISTANCE_CEIL_VALUE;
if (bitRateClosestLowerIndex >= 0) {
distanceLower =
sbrTuningTable[bitRateClosestLowerIndex].bitrateFrom - bitrate;
}
if (bitRateClosestUpperIndex >= 0) {
distanceUpper =
bitrate - sbrTuningTable[bitRateClosestUpperIndex].bitrateTo;
}
if (distanceUpper < distanceLower) {
*pBitRateClosest = bitRateClosestUpper;
} else {
*pBitRateClosest = bitRateClosestLower;
}
} else {
*pBitRateClosest = 0;
}
}
return INVALID_TABLE_IDX;
}
/***************************************************************************/
/*!
\brief Selects the PS tuning settings to use dependent on bitrate
and core coder
\return Index to the appropriate table
****************************************************************************/
static INT getPsTuningTableIndex(UINT bitrate, UINT *pBitRateClosest) {
INT i, paramSets = sizeof(psTuningTable) / sizeof(psTuningTable[0]);
int bitRateClosestLowerIndex = -1, bitRateClosestUpperIndex = -1;
UINT bitRateClosestUpper = 0, bitRateClosestLower = DISTANCE_CEIL_VALUE;
for (i = 0; i < paramSets; i++) {
if ((bitrate >= psTuningTable[i].bitrateFrom) &&
(bitrate < psTuningTable[i].bitrateTo)) {
return i;
} else {
if (psTuningTable[i].bitrateFrom > bitrate) {
if (psTuningTable[i].bitrateFrom < bitRateClosestLower) {
bitRateClosestLower = psTuningTable[i].bitrateFrom;
bitRateClosestLowerIndex = i;
}
}
if (psTuningTable[i].bitrateTo <= bitrate) {
if (psTuningTable[i].bitrateTo > bitRateClosestUpper) {
bitRateClosestUpper = psTuningTable[i].bitrateTo - 1;
bitRateClosestUpperIndex = i;
}
}
}
}
if (bitRateClosestUpperIndex >= 0) {
return bitRateClosestUpperIndex;
}
if (pBitRateClosest != NULL) {
int distanceUpper = DISTANCE_CEIL_VALUE,
distanceLower = DISTANCE_CEIL_VALUE;
if (bitRateClosestLowerIndex >= 0) {
distanceLower =
sbrTuningTable[bitRateClosestLowerIndex].bitrateFrom - bitrate;
}
if (bitRateClosestUpperIndex >= 0) {
distanceUpper =
bitrate - sbrTuningTable[bitRateClosestUpperIndex].bitrateTo;
}
if (distanceUpper < distanceLower) {
*pBitRateClosest = bitRateClosestUpper;
} else {
*pBitRateClosest = bitRateClosestLower;
}
}
return INVALID_TABLE_IDX;
}
/***************************************************************************/
/*!
\brief In case of downsampled SBR we may need to lower the stop freq
of a tuning setting to fit into the lower half of the
spectrum ( which is sampleRate/4 )
\return the adapted stop frequency index (-1 -> error)
\ingroup SbrEncCfg
****************************************************************************/
static INT FDKsbrEnc_GetDownsampledStopFreq(const INT sampleRateCore,
const INT startFreq, INT stopFreq,
const INT downSampleFactor) {
INT maxStopFreqRaw = sampleRateCore / 2;
INT startBand, stopBand;
HANDLE_ERROR_INFO err;
while (stopFreq > 0 && FDKsbrEnc_getSbrStopFreqRAW(stopFreq, sampleRateCore) >
maxStopFreqRaw) {
stopFreq--;
}
if (FDKsbrEnc_getSbrStopFreqRAW(stopFreq, sampleRateCore) > maxStopFreqRaw)
return -1;
err = FDKsbrEnc_FindStartAndStopBand(
sampleRateCore << (downSampleFactor - 1), sampleRateCore,
32 << (downSampleFactor - 1), startFreq, stopFreq, &startBand, &stopBand);
if (err) return -1;
return stopFreq;
}
/***************************************************************************/
/*!
\brief tells us, if for the given coreCoder, bitrate, number of channels
and input sampling rate an SBR setting is available. If yes, it
tells us also the core sampling rate we would need to run with
\return a flag indicating success: yes (1) or no (0)
****************************************************************************/
static UINT FDKsbrEnc_IsSbrSettingAvail(
UINT bitrate, /*! the total bitrate in bits/sec */
UINT vbrMode, /*! the vbr paramter, 0 means constant bitrate */
UINT numOutputChannels, /*! the number of channels for the core coder */
UINT sampleRateInput, /*! the input sample rate [in Hz] */
UINT sampleRateCore, /*! the core's sampling rate */
AUDIO_OBJECT_TYPE core) {
INT idx = INVALID_TABLE_IDX;
if (sampleRateInput < 16000) return 0;
if (bitrate == 0) {
/* map vbr quality to bitrate */
if (vbrMode < 30)
bitrate = 24000;
else if (vbrMode < 40)
bitrate = 28000;
else if (vbrMode < 60)
bitrate = 32000;
else if (vbrMode < 75)
bitrate = 40000;
else
bitrate = 48000;
bitrate *= numOutputChannels;
}
idx = getSbrTuningTableIndex(bitrate, numOutputChannels, sampleRateCore, core,
NULL);
return (idx == INVALID_TABLE_IDX ? 0 : 1);
}
/***************************************************************************/
/*!
\brief Adjusts the SBR settings according to the chosen core coder
settings which are accessible via config->codecSettings
\return A flag indicating success: yes (1) or no (0)
****************************************************************************/
static UINT FDKsbrEnc_AdjustSbrSettings(
const sbrConfigurationPtr config, /*! output, modified */
UINT bitRate, /*! the total bitrate in bits/sec */
UINT numChannels, /*! the core coder number of channels */
UINT sampleRateCore, /*! the core coder sampling rate in Hz */
UINT sampleRateSbr, /*! the sbr coder sampling rate in Hz */
UINT transFac, /*! the short block to long block ratio */
UINT standardBitrate, /*! the standard bitrate per channel in bits/sec */
UINT vbrMode, /*! the vbr paramter, 0 poor quality .. 100 high quality*/
UINT useSpeechConfig, /*!< adapt tuning parameters for speech ? */
UINT lcsMode, /*! the low complexity stereo mode */
UINT bParametricStereo, /*!< use parametric stereo */
AUDIO_OBJECT_TYPE core) /* Core audio codec object type */
{
INT idx = INVALID_TABLE_IDX;
/* set the core codec settings */
config->codecSettings.bitRate = bitRate;
config->codecSettings.nChannels = numChannels;
config->codecSettings.sampleFreq = sampleRateCore;
config->codecSettings.transFac = transFac;
config->codecSettings.standardBitrate = standardBitrate;
if (bitRate < 28000) {
config->threshold_AmpRes_FF_m = (FIXP_DBL)MAXVAL_DBL;
config->threshold_AmpRes_FF_e = 7;
} else if (bitRate >= 28000 && bitRate <= 48000) {
/* The float threshold is 75
0.524288f is fractional part of RELAXATION, the quotaMatrix and therefore
tonality are scaled by this 2/3 is because the original implementation
divides the tonality values by 3, here it's divided by 2 128 compensates
the necessary shiftfactor of 7 */
config->threshold_AmpRes_FF_m =
FL2FXCONST_DBL(75.0f * 0.524288f / (2.0f / 3.0f) / 128.0f);
config->threshold_AmpRes_FF_e = 7;
} else if (bitRate > 48000) {
config->threshold_AmpRes_FF_m = FL2FXCONST_DBL(0);
config->threshold_AmpRes_FF_e = 0;
}
if (bitRate == 0) {
/* map vbr quality to bitrate */
if (vbrMode < 30)
bitRate = 24000;
else if (vbrMode < 40)
bitRate = 28000;
else if (vbrMode < 60)
bitRate = 32000;
else if (vbrMode < 75)
bitRate = 40000;
else
bitRate = 48000;
bitRate *= numChannels;
/* fix to enable mono vbrMode<40 @ 44.1 of 48kHz */
if (numChannels == 1) {
if (sampleRateSbr == 44100 || sampleRateSbr == 48000) {
if (vbrMode < 40) bitRate = 32000;
}
}
}
idx =
getSbrTuningTableIndex(bitRate, numChannels, sampleRateCore, core, NULL);
if (idx != INVALID_TABLE_IDX) {
config->startFreq = sbrTuningTable[idx].startFreq;
config->stopFreq = sbrTuningTable[idx].stopFreq;
if (useSpeechConfig) {
config->startFreq = sbrTuningTable[idx].startFreqSpeech;
config->stopFreq = sbrTuningTable[idx].stopFreqSpeech;
}
/* Adapt stop frequency in case of downsampled SBR - only 32 bands then */
if (1 == config->downSampleFactor) {
INT dsStopFreq = FDKsbrEnc_GetDownsampledStopFreq(
sampleRateCore, config->startFreq, config->stopFreq,
config->downSampleFactor);
if (dsStopFreq < 0) {
return 0;
}
config->stopFreq = dsStopFreq;
}
config->sbr_noise_bands = sbrTuningTable[idx].numNoiseBands;
if (core == AOT_ER_AAC_ELD) config->init_amp_res_FF = SBR_AMP_RES_1_5;
config->noiseFloorOffset = sbrTuningTable[idx].noiseFloorOffset;
config->ana_max_level = sbrTuningTable[idx].noiseMaxLevel;
config->stereoMode = sbrTuningTable[idx].stereoMode;
config->freqScale = sbrTuningTable[idx].freqScale;
if (numChannels == 1) {
/* stereo case */
switch (core) {
case AOT_AAC_LC:
if (bitRate <= (useSpeechConfig ? 24000U : 20000U)) {
config->freq_res_fixfix[0] = FREQ_RES_LOW; /* set low frequency
resolution for
non-split frames */
config->freq_res_fixfix[1] = FREQ_RES_LOW; /* set low frequency
resolution for split
frames */
}
break;
case AOT_ER_AAC_ELD:
if (bitRate < 36000)
config->freq_res_fixfix[1] = FREQ_RES_LOW; /* set low frequency
resolution for split
frames */
if (bitRate < 26000) {
config->freq_res_fixfix[0] = FREQ_RES_LOW; /* set low frequency
resolution for
non-split frames */
config->fResTransIsLow =
1; /* for transient frames, set low frequency resolution */
}
break;
default:
break;
}
} else {
/* stereo case */
switch (core) {
case AOT_AAC_LC:
if (bitRate <= 28000) {
config->freq_res_fixfix[0] = FREQ_RES_LOW; /* set low frequency
resolution for
non-split frames */
config->freq_res_fixfix[1] = FREQ_RES_LOW; /* set low frequency
resolution for split
frames */
}
break;
case AOT_ER_AAC_ELD:
if (bitRate < 72000) {
config->freq_res_fixfix[1] = FREQ_RES_LOW; /* set low frequency
resolution for split
frames */
}
if (bitRate < 52000) {
config->freq_res_fixfix[0] = FREQ_RES_LOW; /* set low frequency
resolution for
non-split frames */
config->fResTransIsLow =
1; /* for transient frames, set low frequency resolution */
}
break;
default:
break;
}
if (bitRate <= 28000) {
/*
additionally restrict frequency resolution in FIXFIX frames
to further reduce SBR payload size */
config->freq_res_fixfix[0] = FREQ_RES_LOW;
config->freq_res_fixfix[1] = FREQ_RES_LOW;
}
}
/* adjust usage of parametric coding dependent on bitrate and speech config
* flag */
if (useSpeechConfig) config->parametricCoding = 0;
if (core == AOT_ER_AAC_ELD) {
if (bitRate < 28000) config->init_amp_res_FF = SBR_AMP_RES_3_0;
config->SendHeaderDataTime = -1;
}
if (numChannels == 1) {
if (bitRate < 16000) {
config->parametricCoding = 0;
}
} else {
if (bitRate < 20000) {
config->parametricCoding = 0;
}
}
config->useSpeechConfig = useSpeechConfig;
/* PS settings */
config->bParametricStereo = bParametricStereo;
return 1;
} else {
return 0;
}
}
/*****************************************************************************
functionname: FDKsbrEnc_InitializeSbrDefaults
description: initializes the SBR configuration
returns: error status
input: - core codec type,
- factor of SBR to core frame length,
- core frame length
output: initialized SBR configuration
*****************************************************************************/
static UINT FDKsbrEnc_InitializeSbrDefaults(sbrConfigurationPtr config,
INT downSampleFactor,
UINT codecGranuleLen,
const INT isLowDelay) {
if ((downSampleFactor < 1 || downSampleFactor > 2) ||
(codecGranuleLen * downSampleFactor > 64 * 32))
return (0); /* error */
config->SendHeaderDataTime = 1000;
config->useWaveCoding = 0;
config->crcSbr = 0;
config->dynBwSupported = 1;
if (isLowDelay)
config->tran_thr = 6000;
else
config->tran_thr = 13000;
config->parametricCoding = 1;
config->sbrFrameSize = codecGranuleLen * downSampleFactor;
config->downSampleFactor = downSampleFactor;
/* sbr default parameters */
config->sbr_data_extra = 0;
config->amp_res = SBR_AMP_RES_3_0;
config->tran_fc = 0;
config->tran_det_mode = 1;
config->spread = 1;
config->stat = 0;
config->e = 1;
config->deltaTAcrossFrames = 1;
config->dF_edge_1stEnv = FL2FXCONST_DBL(0.3f);
config->dF_edge_incr = FL2FXCONST_DBL(0.3f);
config->sbr_invf_mode = INVF_SWITCHED;
config->sbr_xpos_mode = XPOS_LC;
config->sbr_xpos_ctrl = SBR_XPOS_CTRL_DEFAULT;
config->sbr_xpos_level = 0;
config->useSaPan = 0;
config->dynBwEnabled = 0;
/* the following parameters are overwritten by the
FDKsbrEnc_AdjustSbrSettings() function since they are included in the
tuning table */
config->stereoMode = SBR_SWITCH_LRC;
config->ana_max_level = 6;
config->noiseFloorOffset = 0;
config->startFreq = 5; /* 5.9 respectively 6.0 kHz at fs = 44.1/48 kHz */
config->stopFreq = 9; /* 16.2 respectively 16.8 kHz at fs = 44.1/48 kHz */
config->freq_res_fixfix[0] = FREQ_RES_HIGH; /* non-split case */
config->freq_res_fixfix[1] = FREQ_RES_HIGH; /* split case */
config->fResTransIsLow = 0; /* for transient frames, set variable frequency
resolution according to freqResTable */
/* header_extra_1 */
config->freqScale = SBR_FREQ_SCALE_DEFAULT;
config->alterScale = SBR_ALTER_SCALE_DEFAULT;
config->sbr_noise_bands = SBR_NOISE_BANDS_DEFAULT;
/* header_extra_2 */
config->sbr_limiter_bands = SBR_LIMITER_BANDS_DEFAULT;
config->sbr_limiter_gains = SBR_LIMITER_GAINS_DEFAULT;
config->sbr_interpol_freq = SBR_INTERPOL_FREQ_DEFAULT;
config->sbr_smoothing_length = SBR_SMOOTHING_LENGTH_DEFAULT;
return 1;
}
/*****************************************************************************
functionname: DeleteEnvChannel
description: frees memory of one SBR channel
returns: -
input: handle of channel
output: released handle
*****************************************************************************/
static void deleteEnvChannel(HANDLE_ENV_CHANNEL hEnvCut) {
if (hEnvCut) {
FDKsbrEnc_DeleteTonCorrParamExtr(&hEnvCut->TonCorr);
FDKsbrEnc_deleteExtractSbrEnvelope(&hEnvCut->sbrExtractEnvelope);
}
}
/*****************************************************************************
functionname: sbrEncoder_ChannelClose
description: close the channel coding handle
returns:
input: phSbrChannel
output:
*****************************************************************************/
static void sbrEncoder_ChannelClose(HANDLE_SBR_CHANNEL hSbrChannel) {
if (hSbrChannel != NULL) {
deleteEnvChannel(&hSbrChannel->hEnvChannel);
}
}
/*****************************************************************************
functionname: sbrEncoder_ElementClose
description: close the channel coding handle
returns:
input: phSbrChannel
output:
*****************************************************************************/
static void sbrEncoder_ElementClose(HANDLE_SBR_ELEMENT *phSbrElement) {
HANDLE_SBR_ELEMENT hSbrElement = *phSbrElement;
if (hSbrElement != NULL) {
if (hSbrElement->sbrConfigData.v_k_master)
FreeRam_Sbr_v_k_master(&hSbrElement->sbrConfigData.v_k_master);
if (hSbrElement->sbrConfigData.freqBandTable[LO])
FreeRam_Sbr_freqBandTableLO(
&hSbrElement->sbrConfigData.freqBandTable[LO]);
if (hSbrElement->sbrConfigData.freqBandTable[HI])
FreeRam_Sbr_freqBandTableHI(
&hSbrElement->sbrConfigData.freqBandTable[HI]);
FreeRam_SbrElement(phSbrElement);
}
return;
}
void sbrEncoder_Close(HANDLE_SBR_ENCODER *phSbrEncoder) {
HANDLE_SBR_ENCODER hSbrEncoder = *phSbrEncoder;
if (hSbrEncoder != NULL) {
int el, ch;
for (el = 0; el < (8); el++) {
if (hSbrEncoder->sbrElement[el] != NULL) {
sbrEncoder_ElementClose(&hSbrEncoder->sbrElement[el]);
}
}
/* Close sbr Channels */
for (ch = 0; ch < (8); ch++) {
if (hSbrEncoder->pSbrChannel[ch]) {
sbrEncoder_ChannelClose(hSbrEncoder->pSbrChannel[ch]);
FreeRam_SbrChannel(&hSbrEncoder->pSbrChannel[ch]);
}
if (hSbrEncoder->QmfAnalysis[ch].FilterStates)
FreeRam_Sbr_QmfStatesAnalysis(
(FIXP_QAS **)&hSbrEncoder->QmfAnalysis[ch].FilterStates);
}
if (hSbrEncoder->hParametricStereo)
PSEnc_Destroy(&hSbrEncoder->hParametricStereo);
if (hSbrEncoder->qmfSynthesisPS.FilterStates)
FreeRam_PsQmfStatesSynthesis(
(FIXP_DBL **)&hSbrEncoder->qmfSynthesisPS.FilterStates);
/* Release Overlay */
if (hSbrEncoder->pSBRdynamic_RAM)
FreeRam_SbrDynamic_RAM((FIXP_DBL **)&hSbrEncoder->pSBRdynamic_RAM);
FreeRam_SbrEncoder(phSbrEncoder);
}
}
/*****************************************************************************
functionname: updateFreqBandTable
description: updates vk_master
returns: -
input: config handle
output: error info
*****************************************************************************/
static INT updateFreqBandTable(HANDLE_SBR_CONFIG_DATA sbrConfigData,
HANDLE_SBR_HEADER_DATA sbrHeaderData,
const INT downSampleFactor) {
INT k0, k2;
if (FDKsbrEnc_FindStartAndStopBand(
sbrConfigData->sampleFreq,
sbrConfigData->sampleFreq >> (downSampleFactor - 1),
sbrConfigData->noQmfBands, sbrHeaderData->sbr_start_frequency,
sbrHeaderData->sbr_stop_frequency, &k0, &k2))
return (1);
if (FDKsbrEnc_UpdateFreqScale(
sbrConfigData->v_k_master, &sbrConfigData->num_Master, k0, k2,
sbrHeaderData->freqScale, sbrHeaderData->alterScale))
return (1);
sbrHeaderData->sbr_xover_band = 0;
if (FDKsbrEnc_UpdateHiRes(sbrConfigData->freqBandTable[HI],
&sbrConfigData->nSfb[HI], sbrConfigData->v_k_master,
sbrConfigData->num_Master,
&sbrHeaderData->sbr_xover_band))
return (1);
FDKsbrEnc_UpdateLoRes(
sbrConfigData->freqBandTable[LO], &sbrConfigData->nSfb[LO],
sbrConfigData->freqBandTable[HI], sbrConfigData->nSfb[HI]);
sbrConfigData->xOverFreq =
(sbrConfigData->freqBandTable[LOW_RES][0] * sbrConfigData->sampleFreq /
sbrConfigData->noQmfBands +
1) >>
1;
return (0);
}
/*****************************************************************************
functionname: resetEnvChannel
description: resets parameters and allocates memory
returns: error status
input:
output: hEnv
*****************************************************************************/
static INT resetEnvChannel(HANDLE_SBR_CONFIG_DATA sbrConfigData,
HANDLE_SBR_HEADER_DATA sbrHeaderData,
HANDLE_ENV_CHANNEL hEnv) {
/* note !!! hEnv->encEnvData.noOfnoisebands will be updated later in function
* FDKsbrEnc_extractSbrEnvelope !!!*/
hEnv->TonCorr.sbrNoiseFloorEstimate.noiseBands =
sbrHeaderData->sbr_noise_bands;
if (FDKsbrEnc_ResetTonCorrParamExtr(
&hEnv->TonCorr, sbrConfigData->xposCtrlSwitch,
sbrConfigData->freqBandTable[HI][0], sbrConfigData->v_k_master,
sbrConfigData->num_Master, sbrConfigData->sampleFreq,
sbrConfigData->freqBandTable, sbrConfigData->nSfb,
sbrConfigData->noQmfBands))
return (1);
hEnv->sbrCodeNoiseFloor.nSfb[LO] =
hEnv->TonCorr.sbrNoiseFloorEstimate.noNoiseBands;
hEnv->sbrCodeNoiseFloor.nSfb[HI] =
hEnv->TonCorr.sbrNoiseFloorEstimate.noNoiseBands;
hEnv->sbrCodeEnvelope.nSfb[LO] = sbrConfigData->nSfb[LO];
hEnv->sbrCodeEnvelope.nSfb[HI] = sbrConfigData->nSfb[HI];
hEnv->encEnvData.noHarmonics = sbrConfigData->nSfb[HI];
hEnv->sbrCodeEnvelope.upDate = 0;
hEnv->sbrCodeNoiseFloor.upDate = 0;
return (0);
}
/* ****************************** FDKsbrEnc_SbrGetXOverFreq
* ******************************/
/**
* @fn
* @brief calculates the closest possible crossover frequency
* @return the crossover frequency SBR accepts
*
*/
static INT FDKsbrEnc_SbrGetXOverFreq(
HANDLE_SBR_ELEMENT hEnv, /*!< handle to SBR encoder instance */
INT xoverFreq) /*!< from core coder suggested crossover frequency */
{
INT band;
INT lastDiff, newDiff;
INT cutoffSb;
UCHAR *RESTRICT pVKMaster = hEnv->sbrConfigData.v_k_master;
/* Check if there is a matching cutoff frequency in the master table */
cutoffSb = (4 * xoverFreq * hEnv->sbrConfigData.noQmfBands /
hEnv->sbrConfigData.sampleFreq +
1) >>
1;
lastDiff = cutoffSb;
for (band = 0; band < hEnv->sbrConfigData.num_Master; band++) {
newDiff = fixp_abs((INT)pVKMaster[band] - cutoffSb);
if (newDiff >= lastDiff) {
band--;
break;
}
lastDiff = newDiff;
}
return ((pVKMaster[band] * hEnv->sbrConfigData.sampleFreq /
hEnv->sbrConfigData.noQmfBands +
1) >>
1);
}
/*****************************************************************************
functionname: FDKsbrEnc_EnvEncodeFrame
description: performs the sbr envelope calculation for one element
returns:
input:
output:
*****************************************************************************/
INT FDKsbrEnc_EnvEncodeFrame(
HANDLE_SBR_ENCODER hEnvEncoder, int iElement,
INT_PCM *samples, /*!< time samples, always deinterleaved */
UINT samplesBufSize, /*!< time buffer channel stride */
UINT *sbrDataBits, /*!< Size of SBR payload */
UCHAR *sbrData, /*!< SBR payload */
int clearOutput /*!< Do not consider any input signal */
) {
HANDLE_SBR_ELEMENT hSbrElement = NULL;
FDK_CRCINFO crcInfo;
INT crcReg;
INT ch;
INT band;
INT cutoffSb;
INT newXOver;
if (hEnvEncoder == NULL) return -1;
hSbrElement = hEnvEncoder->sbrElement[iElement];
if (hSbrElement == NULL) return -1;
/* header bitstream handling */
HANDLE_SBR_BITSTREAM_DATA sbrBitstreamData = &hSbrElement->sbrBitstreamData;
INT psHeaderActive = 0;
sbrBitstreamData->HeaderActive = 0;
/* Anticipate PS header because of internal PS bitstream delay in order to be
* in sync with SBR header. */
if (sbrBitstreamData->CountSendHeaderData ==
(sbrBitstreamData->NrSendHeaderData - 1)) {
psHeaderActive = 1;
}
/* Signal SBR header to be written into bitstream */
if (sbrBitstreamData->CountSendHeaderData == 0) {
sbrBitstreamData->HeaderActive = 1;
}
/* Increment header interval counter */
if (sbrBitstreamData->NrSendHeaderData == 0) {
sbrBitstreamData->CountSendHeaderData = 1;
} else {
if (sbrBitstreamData->CountSendHeaderData >= 0) {
sbrBitstreamData->CountSendHeaderData++;
sbrBitstreamData->CountSendHeaderData %=
sbrBitstreamData->NrSendHeaderData;
}
}
if (hSbrElement->CmonData.dynBwEnabled) {
INT i;
for (i = 4; i > 0; i--)
hSbrElement->dynXOverFreqDelay[i] = hSbrElement->dynXOverFreqDelay[i - 1];
hSbrElement->dynXOverFreqDelay[0] = hSbrElement->CmonData.dynXOverFreqEnc;
if (hSbrElement->dynXOverFreqDelay[1] > hSbrElement->dynXOverFreqDelay[2])
newXOver = hSbrElement->dynXOverFreqDelay[2];
else
newXOver = hSbrElement->dynXOverFreqDelay[1];
/* has the crossover frequency changed? */
if (hSbrElement->sbrConfigData.dynXOverFreq != newXOver) {
/* get corresponding master band */
cutoffSb = ((4 * newXOver * hSbrElement->sbrConfigData.noQmfBands /
hSbrElement->sbrConfigData.sampleFreq) +
1) >>
1;
for (band = 0; band < hSbrElement->sbrConfigData.num_Master; band++) {
if (cutoffSb == hSbrElement->sbrConfigData.v_k_master[band]) break;
}
FDK_ASSERT(band < hSbrElement->sbrConfigData.num_Master);
hSbrElement->sbrConfigData.dynXOverFreq = newXOver;
hSbrElement->sbrHeaderData.sbr_xover_band = band;
hSbrElement->sbrBitstreamData.HeaderActive = 1;
psHeaderActive = 1; /* ps header is one frame delayed */
/*
update vk_master table
*/
if (updateFreqBandTable(&hSbrElement->sbrConfigData,
&hSbrElement->sbrHeaderData,
hEnvEncoder->downSampleFactor))
return (1);
/* reset SBR channels */
INT nEnvCh = hSbrElement->sbrConfigData.nChannels;
for (ch = 0; ch < nEnvCh; ch++) {
if (resetEnvChannel(&hSbrElement->sbrConfigData,
&hSbrElement->sbrHeaderData,
&hSbrElement->sbrChannel[ch]->hEnvChannel))
return (1);
}
}
}
/*
allocate space for dummy header and crc
*/
crcReg = FDKsbrEnc_InitSbrBitstream(
&hSbrElement->CmonData,
hSbrElement->payloadDelayLine[hEnvEncoder->nBitstrDelay],
MAX_PAYLOAD_SIZE * sizeof(UCHAR), &crcInfo,
hSbrElement->sbrConfigData.sbrSyntaxFlags);
/* Temporal Envelope Data */
SBR_FRAME_TEMP_DATA _fData;
SBR_FRAME_TEMP_DATA *fData = &_fData;
SBR_ENV_TEMP_DATA eData[MAX_NUM_CHANNELS];
/* Init Temporal Envelope Data */
{
int i;
FDKmemclear(&eData[0], sizeof(SBR_ENV_TEMP_DATA));
FDKmemclear(&eData[1], sizeof(SBR_ENV_TEMP_DATA));
FDKmemclear(fData, sizeof(SBR_FRAME_TEMP_DATA));
for (i = 0; i < MAX_NUM_NOISE_VALUES; i++) fData->res[i] = FREQ_RES_HIGH;
}
if (!clearOutput) {
/*
* Transform audio data into QMF domain
*/
for (ch = 0; ch < hSbrElement->sbrConfigData.nChannels; ch++) {
HANDLE_ENV_CHANNEL h_envChan = &hSbrElement->sbrChannel[ch]->hEnvChannel;
HANDLE_SBR_EXTRACT_ENVELOPE sbrExtrEnv = &h_envChan->sbrExtractEnvelope;
if (hSbrElement->elInfo.fParametricStereo == 0) {
QMF_SCALE_FACTOR tmpScale;
FIXP_DBL **pQmfReal, **pQmfImag;
C_AALLOC_SCRATCH_START(qmfWorkBuffer, FIXP_DBL, 64 * 2)
/* Obtain pointers to QMF buffers. */
pQmfReal = sbrExtrEnv->rBuffer;
pQmfImag = sbrExtrEnv->iBuffer;
qmfAnalysisFiltering(
hSbrElement->hQmfAnalysis[ch], pQmfReal, pQmfImag, &tmpScale,
samples + hSbrElement->elInfo.ChannelIndex[ch] * samplesBufSize, 0,
1, qmfWorkBuffer);
h_envChan->qmfScale = tmpScale.lb_scale + 7;
C_AALLOC_SCRATCH_END(qmfWorkBuffer, FIXP_DBL, 64 * 2)
} /* fParametricStereo == 0 */
/*
Parametric Stereo processing
*/
if (hSbrElement->elInfo.fParametricStereo) {
INT error = noError;
/* Limit Parametric Stereo to one instance */
FDK_ASSERT(ch == 0);
if (error == noError) {
/* parametric stereo processing:
- input:
o left and right time domain samples
- processing:
o stereo qmf analysis
o stereo hybrid analysis
o ps parameter extraction
o downmix + hybrid synthesis
- output:
o downmixed qmf data is written to sbrExtrEnv->rBuffer and
sbrExtrEnv->iBuffer
*/
SCHAR qmfScale;
INT_PCM *pSamples[2] = {
samples + hSbrElement->elInfo.ChannelIndex[0] * samplesBufSize,
samples + hSbrElement->elInfo.ChannelIndex[1] * samplesBufSize};
error = FDKsbrEnc_PSEnc_ParametricStereoProcessing(
hEnvEncoder->hParametricStereo, pSamples, samplesBufSize,
hSbrElement->hQmfAnalysis, sbrExtrEnv->rBuffer,
sbrExtrEnv->iBuffer,
samples + hSbrElement->elInfo.ChannelIndex[ch] * samplesBufSize,
&hEnvEncoder->qmfSynthesisPS, &qmfScale, psHeaderActive);
h_envChan->qmfScale = (int)qmfScale;
}
} /* if (hEnvEncoder->hParametricStereo) */
/*
Extract Envelope relevant things from QMF data
*/
FDKsbrEnc_extractSbrEnvelope1(&hSbrElement->sbrConfigData,
&hSbrElement->sbrHeaderData,
&hSbrElement->sbrBitstreamData, h_envChan,
&hSbrElement->CmonData, &eData[ch], fData);
} /* hEnvEncoder->sbrConfigData.nChannels */
}
/*
Process Envelope relevant things and calculate envelope data and write
payload
*/
FDKsbrEnc_extractSbrEnvelope2(
&hSbrElement->sbrConfigData, &hSbrElement->sbrHeaderData,
(hSbrElement->elInfo.fParametricStereo) ? hEnvEncoder->hParametricStereo
: NULL,
&hSbrElement->sbrBitstreamData, &hSbrElement->sbrChannel[0]->hEnvChannel,
(hSbrElement->sbrConfigData.stereoMode != SBR_MONO)
? &hSbrElement->sbrChannel[1]->hEnvChannel
: NULL,
&hSbrElement->CmonData, eData, fData, clearOutput);
hSbrElement->sbrBitstreamData.rightBorderFIX = 0;
/*
format payload, calculate crc
*/
FDKsbrEnc_AssembleSbrBitstream(&hSbrElement->CmonData, &crcInfo, crcReg,
hSbrElement->sbrConfigData.sbrSyntaxFlags);
/*
save new payload, set to zero length if greater than MAX_PAYLOAD_SIZE
*/
hSbrElement->payloadDelayLineSize[hEnvEncoder->nBitstrDelay] =
FDKgetValidBits(&hSbrElement->CmonData.sbrBitbuf);
if (hSbrElement->payloadDelayLineSize[hEnvEncoder->nBitstrDelay] >
(MAX_PAYLOAD_SIZE << 3))
hSbrElement->payloadDelayLineSize[hEnvEncoder->nBitstrDelay] = 0;
/* While filling the Delay lines, sbrData is NULL */
if (sbrData) {
*sbrDataBits = hSbrElement->payloadDelayLineSize[0];
FDKmemcpy(sbrData, hSbrElement->payloadDelayLine[0],
(hSbrElement->payloadDelayLineSize[0] + 7) >> 3);
}
/* delay header active flag */
if (hSbrElement->sbrBitstreamData.HeaderActive == 1) {
hSbrElement->sbrBitstreamData.HeaderActiveDelay =
1 + hEnvEncoder->nBitstrDelay;
} else {
if (hSbrElement->sbrBitstreamData.HeaderActiveDelay > 0) {
hSbrElement->sbrBitstreamData.HeaderActiveDelay--;
}
}
return (0);
}
/*****************************************************************************
functionname: FDKsbrEnc_Downsample
description: performs downsampling and delay compensation of the core path
returns:
input:
output:
*****************************************************************************/
INT FDKsbrEnc_Downsample(
HANDLE_SBR_ENCODER hSbrEncoder,
INT_PCM *samples, /*!< time samples, always deinterleaved */
UINT samplesBufSize, /*!< time buffer size per channel */
UINT numChannels, /*!< number of channels */
UINT *sbrDataBits, /*!< Size of SBR payload */
UCHAR *sbrData, /*!< SBR payload */
int clearOutput /*!< Do not consider any input signal */
) {
HANDLE_SBR_ELEMENT hSbrElement = NULL;
INT nOutSamples;
int el;
if (hSbrEncoder->downSampleFactor > 1) {
/* Do downsampling */
/* Loop over elements (LFE is handled later) */
for (el = 0; el < hSbrEncoder->noElements; el++) {
hSbrElement = hSbrEncoder->sbrElement[el];
if (hSbrEncoder->sbrElement[el] != NULL) {
if (hSbrEncoder->downsamplingMethod == SBRENC_DS_TIME) {
int ch;
int nChannels = hSbrElement->sbrConfigData.nChannels;
for (ch = 0; ch < nChannels; ch++) {
FDKaacEnc_Downsample(
&hSbrElement->sbrChannel[ch]->downSampler,
samples +
hSbrElement->elInfo.ChannelIndex[ch] * samplesBufSize +
hSbrEncoder->bufferOffset / numChannels,
hSbrElement->sbrConfigData.frameSize,
samples + hSbrElement->elInfo.ChannelIndex[ch] * samplesBufSize,
&nOutSamples);
}
}
}
}
/* Handle LFE (if existing) */
if (hSbrEncoder->lfeChIdx != -1) { /* lfe downsampler */
FDKaacEnc_Downsample(&hSbrEncoder->lfeDownSampler,
samples + hSbrEncoder->lfeChIdx * samplesBufSize +
hSbrEncoder->bufferOffset / numChannels,
hSbrEncoder->frameSize,
samples + hSbrEncoder->lfeChIdx * samplesBufSize,
&nOutSamples);
}
} else {
/* No downsampling. Still, some buffer shifting for correct delay */
int samples2Copy = hSbrEncoder->frameSize;
if (hSbrEncoder->bufferOffset / (int)numChannels < samples2Copy) {
for (int c = 0; c < (int)numChannels; c++) {
/* Do memmove while taking care of overlapping memory areas. (memcpy
does not necessarily take care) Distinguish between oeverlapping and
non overlapping version due to reasons of complexity. */
FDKmemmove(samples + c * samplesBufSize,
samples + c * samplesBufSize +
hSbrEncoder->bufferOffset / numChannels,
samples2Copy * sizeof(INT_PCM));
}
} else {
for (int c = 0; c < (int)numChannels; c++) {
/* Simple memcpy since the memory areas are not overlapping */
FDKmemcpy(samples + c * samplesBufSize,
samples + c * samplesBufSize +
hSbrEncoder->bufferOffset / numChannels,
samples2Copy * sizeof(INT_PCM));
}
}
}
return 0;
}
/*****************************************************************************
functionname: createEnvChannel
description: initializes parameters and allocates memory
returns: error status
input:
output: hEnv
*****************************************************************************/
static INT createEnvChannel(HANDLE_ENV_CHANNEL hEnv, INT channel,
UCHAR *dynamic_RAM) {
FDKmemclear(hEnv, sizeof(struct ENV_CHANNEL));
if (FDKsbrEnc_CreateTonCorrParamExtr(&hEnv->TonCorr, channel)) {
return (1);
}
if (FDKsbrEnc_CreateExtractSbrEnvelope(&hEnv->sbrExtractEnvelope, channel,
/*chan*/ 0, dynamic_RAM)) {
return (1);
}
return 0;
}
/*****************************************************************************
functionname: initEnvChannel
description: initializes parameters
returns: error status
input:
output:
*****************************************************************************/
static INT initEnvChannel(HANDLE_SBR_CONFIG_DATA sbrConfigData,
HANDLE_SBR_HEADER_DATA sbrHeaderData,
HANDLE_ENV_CHANNEL hEnv, sbrConfigurationPtr params,
ULONG statesInitFlag, INT chanInEl,
UCHAR *dynamic_RAM) {
int frameShift, tran_off = 0;
INT e;
INT tran_fc;
INT timeSlots, timeStep, startIndex;
INT noiseBands[2] = {3, 3};
e = 1 << params->e;
FDK_ASSERT(params->e >= 0);
hEnv->encEnvData.freq_res_fixfix[0] = params->freq_res_fixfix[0];
hEnv->encEnvData.freq_res_fixfix[1] = params->freq_res_fixfix[1];
hEnv->encEnvData.fResTransIsLow = params->fResTransIsLow;
hEnv->fLevelProtect = 0;
hEnv->encEnvData.ldGrid =
(sbrConfigData->sbrSyntaxFlags & SBR_SYNTAX_LOW_DELAY) ? 1 : 0;
hEnv->encEnvData.sbr_xpos_mode = (XPOS_MODE)params->sbr_xpos_mode;
if (hEnv->encEnvData.sbr_xpos_mode == XPOS_SWITCHED) {
/*
no other type than XPOS_MDCT or XPOS_SPEECH allowed,
but enable switching
*/
sbrConfigData->switchTransposers = TRUE;
hEnv->encEnvData.sbr_xpos_mode = XPOS_MDCT;
} else {
sbrConfigData->switchTransposers = FALSE;
}
hEnv->encEnvData.sbr_xpos_ctrl = params->sbr_xpos_ctrl;
/* extended data */
if (params->parametricCoding) {
hEnv->encEnvData.extended_data = 1;
} else {
hEnv->encEnvData.extended_data = 0;
}
hEnv->encEnvData.extension_size = 0;
startIndex = QMF_FILTER_PROTOTYPE_SIZE - sbrConfigData->noQmfBands;
switch (params->sbrFrameSize) {
case 2304:
timeSlots = 18;
break;
case 2048:
case 1024:
case 512:
timeSlots = 16;
break;
case 1920:
case 960:
case 480:
timeSlots = 15;
break;
case 1152:
timeSlots = 9;
break;
default:
return (1); /* Illegal frame size */
}
timeStep = sbrConfigData->noQmfSlots / timeSlots;
if (FDKsbrEnc_InitTonCorrParamExtr(
params->sbrFrameSize, &hEnv->TonCorr, sbrConfigData, timeSlots,
params->sbr_xpos_ctrl, params->ana_max_level,
sbrHeaderData->sbr_noise_bands, params->noiseFloorOffset,
params->useSpeechConfig))
return (1);
hEnv->encEnvData.noOfnoisebands =
hEnv->TonCorr.sbrNoiseFloorEstimate.noNoiseBands;
noiseBands[0] = hEnv->encEnvData.noOfnoisebands;
noiseBands[1] = hEnv->encEnvData.noOfnoisebands;
hEnv->encEnvData.sbr_invf_mode = (INVF_MODE)params->sbr_invf_mode;
if (hEnv->encEnvData.sbr_invf_mode == INVF_SWITCHED) {
hEnv->encEnvData.sbr_invf_mode = INVF_MID_LEVEL;
hEnv->TonCorr.switchInverseFilt = TRUE;
} else {
hEnv->TonCorr.switchInverseFilt = FALSE;
}
tran_fc = params->tran_fc;
if (tran_fc == 0) {
tran_fc = fixMin(
5000, FDKsbrEnc_getSbrStartFreqRAW(sbrHeaderData->sbr_start_frequency,
params->codecSettings.sampleFreq));
}
tran_fc =
(tran_fc * 4 * sbrConfigData->noQmfBands / sbrConfigData->sampleFreq +
1) >>
1;
if (sbrConfigData->sbrSyntaxFlags & SBR_SYNTAX_LOW_DELAY) {
frameShift = LD_PRETRAN_OFF;
tran_off = LD_PRETRAN_OFF + FRAME_MIDDLE_SLOT_512LD * timeStep;
} else {
frameShift = 0;
switch (timeSlots) {
/* The factor of 2 is by definition. */
case NUMBER_TIME_SLOTS_2048:
tran_off = 8 + FRAME_MIDDLE_SLOT_2048 * timeStep;
break;
case NUMBER_TIME_SLOTS_1920:
tran_off = 7 + FRAME_MIDDLE_SLOT_1920 * timeStep;
break;
default:
return 1;
}
}
if (FDKsbrEnc_InitExtractSbrEnvelope(
&hEnv->sbrExtractEnvelope, sbrConfigData->noQmfSlots,
sbrConfigData->noQmfBands, startIndex, timeSlots, timeStep, tran_off,
statesInitFlag, chanInEl, dynamic_RAM, sbrConfigData->sbrSyntaxFlags))
return (1);
if (FDKsbrEnc_InitSbrCodeEnvelope(&hEnv->sbrCodeEnvelope, sbrConfigData->nSfb,
params->deltaTAcrossFrames,
params->dF_edge_1stEnv,
params->dF_edge_incr))
return (1);
if (FDKsbrEnc_InitSbrCodeEnvelope(&hEnv->sbrCodeNoiseFloor, noiseBands,
params->deltaTAcrossFrames, 0, 0))
return (1);
sbrConfigData->initAmpResFF = params->init_amp_res_FF;
if (FDKsbrEnc_InitSbrHuffmanTables(&hEnv->encEnvData, &hEnv->sbrCodeEnvelope,
&hEnv->sbrCodeNoiseFloor,
sbrHeaderData->sbr_amp_res))
return (1);
FDKsbrEnc_initFrameInfoGenerator(
&hEnv->SbrEnvFrame, params->spread, e, params->stat, timeSlots,
hEnv->encEnvData.freq_res_fixfix, hEnv->encEnvData.fResTransIsLow,
hEnv->encEnvData.ldGrid);
if (sbrConfigData->sbrSyntaxFlags & SBR_SYNTAX_LOW_DELAY)
{
INT bandwidth_qmf_slot =
(sbrConfigData->sampleFreq >> 1) / (sbrConfigData->noQmfBands);
if (FDKsbrEnc_InitSbrFastTransientDetector(
&hEnv->sbrFastTransientDetector, sbrConfigData->noQmfSlots,
bandwidth_qmf_slot, sbrConfigData->noQmfBands,
sbrConfigData->freqBandTable[0][0]))
return (1);
}
/* The transient detector has to be initialized also if the fast transient
detector was active, because the values from the transient detector
structure are used. */
if (FDKsbrEnc_InitSbrTransientDetector(
&hEnv->sbrTransientDetector, sbrConfigData->sbrSyntaxFlags,
sbrConfigData->frameSize, sbrConfigData->sampleFreq, params, tran_fc,
sbrConfigData->noQmfSlots, sbrConfigData->noQmfBands,
hEnv->sbrExtractEnvelope.YBufferWriteOffset,
hEnv->sbrExtractEnvelope.YBufferSzShift, frameShift, tran_off))
return (1);
sbrConfigData->xposCtrlSwitch = params->sbr_xpos_ctrl;
hEnv->encEnvData.noHarmonics = sbrConfigData->nSfb[HI];
hEnv->encEnvData.addHarmonicFlag = 0;
return (0);
}
INT sbrEncoder_Open(HANDLE_SBR_ENCODER *phSbrEncoder, INT nElements,
INT nChannels, INT supportPS) {
INT i;
INT errorStatus = 1;
HANDLE_SBR_ENCODER hSbrEncoder = NULL;
if (phSbrEncoder == NULL) {
goto bail;
}
hSbrEncoder = GetRam_SbrEncoder();
if (hSbrEncoder == NULL) {
goto bail;
}
FDKmemclear(hSbrEncoder, sizeof(SBR_ENCODER));
if (NULL ==
(hSbrEncoder->pSBRdynamic_RAM = (UCHAR *)GetRam_SbrDynamic_RAM())) {
goto bail;
}
hSbrEncoder->dynamicRam = hSbrEncoder->pSBRdynamic_RAM;
/* Create SBR elements */
for (i = 0; i < nElements; i++) {
hSbrEncoder->sbrElement[i] = GetRam_SbrElement(i);
if (hSbrEncoder->sbrElement[i] == NULL) {
goto bail;
}
FDKmemclear(hSbrEncoder->sbrElement[i], sizeof(SBR_ELEMENT));
hSbrEncoder->sbrElement[i]->sbrConfigData.freqBandTable[LO] =
GetRam_Sbr_freqBandTableLO(i);
hSbrEncoder->sbrElement[i]->sbrConfigData.freqBandTable[HI] =
GetRam_Sbr_freqBandTableHI(i);
hSbrEncoder->sbrElement[i]->sbrConfigData.v_k_master =
GetRam_Sbr_v_k_master(i);
if ((hSbrEncoder->sbrElement[i]->sbrConfigData.freqBandTable[LO] == NULL) ||
(hSbrEncoder->sbrElement[i]->sbrConfigData.freqBandTable[HI] == NULL) ||
(hSbrEncoder->sbrElement[i]->sbrConfigData.v_k_master == NULL)) {
goto bail;
}
}
/* Create SBR channels */
for (i = 0; i < nChannels; i++) {
hSbrEncoder->pSbrChannel[i] = GetRam_SbrChannel(i);
if (hSbrEncoder->pSbrChannel[i] == NULL) {
goto bail;
}
if (createEnvChannel(&hSbrEncoder->pSbrChannel[i]->hEnvChannel, i,
hSbrEncoder->dynamicRam)) {
goto bail;
}
}
/* Create QMF States */
for (i = 0; i < fixMax(nChannels, (supportPS) ? 2 : 0); i++) {
hSbrEncoder->QmfAnalysis[i].FilterStates = GetRam_Sbr_QmfStatesAnalysis(i);
if (hSbrEncoder->QmfAnalysis[i].FilterStates == NULL) {
goto bail;
}
}
/* Create Parametric Stereo handle */
if (supportPS) {
if (PSEnc_Create(&hSbrEncoder->hParametricStereo)) {
goto bail;
}
hSbrEncoder->qmfSynthesisPS.FilterStates = GetRam_PsQmfStatesSynthesis();
if (hSbrEncoder->qmfSynthesisPS.FilterStates == NULL) {
goto bail;
}
} /* supportPS */
*phSbrEncoder = hSbrEncoder;
errorStatus = 0;
return errorStatus;
bail:
/* Close SBR encoder instance */
sbrEncoder_Close(&hSbrEncoder);
return errorStatus;
}
static INT FDKsbrEnc_Reallocate(HANDLE_SBR_ENCODER hSbrEncoder,
SBR_ELEMENT_INFO elInfo[(8)],
const INT noElements) {
INT totalCh = 0;
INT totalQmf = 0;
INT coreEl;
INT el = -1;
hSbrEncoder->lfeChIdx = -1; /* default value, until lfe found */
for (coreEl = 0; coreEl < noElements; coreEl++) {
/* SBR only handles SCE and CPE's */
if (elInfo[coreEl].elType == ID_SCE || elInfo[coreEl].elType == ID_CPE) {
el++;
} else {
if (elInfo[coreEl].elType == ID_LFE) {
hSbrEncoder->lfeChIdx = elInfo[coreEl].ChannelIndex[0];
}
continue;
}
SBR_ELEMENT_INFO *pelInfo = &elInfo[coreEl];
HANDLE_SBR_ELEMENT hSbrElement = hSbrEncoder->sbrElement[el];
int ch;
for (ch = 0; ch < pelInfo->nChannelsInEl; ch++) {
hSbrElement->sbrChannel[ch] = hSbrEncoder->pSbrChannel[totalCh];
totalCh++;
}
/* analysis QMF */
for (ch = 0;
ch < ((pelInfo->fParametricStereo) ? 2 : pelInfo->nChannelsInEl);
ch++) {
hSbrElement->elInfo.ChannelIndex[ch] = pelInfo->ChannelIndex[ch];
hSbrElement->hQmfAnalysis[ch] = &hSbrEncoder->QmfAnalysis[totalQmf++];
}
/* Copy Element info */
hSbrElement->elInfo.elType = pelInfo->elType;
hSbrElement->elInfo.instanceTag = pelInfo->instanceTag;
hSbrElement->elInfo.nChannelsInEl = pelInfo->nChannelsInEl;
hSbrElement->elInfo.fParametricStereo = pelInfo->fParametricStereo;
hSbrElement->elInfo.fDualMono = pelInfo->fDualMono;
} /* coreEl */
return 0;
}
/*****************************************************************************
functionname: FDKsbrEnc_bsBufInit
description: initializes bitstream buffer
returns: initialized bitstream buffer in env encoder
input:
output: hEnv
*****************************************************************************/
static INT FDKsbrEnc_bsBufInit(HANDLE_SBR_ELEMENT hSbrElement,
int nBitstrDelay) {
UCHAR *bitstreamBuffer;
/* initialize the bitstream buffer */
bitstreamBuffer = hSbrElement->payloadDelayLine[nBitstrDelay];
FDKinitBitStream(&hSbrElement->CmonData.sbrBitbuf, bitstreamBuffer,
MAX_PAYLOAD_SIZE * sizeof(UCHAR), 0, BS_WRITER);
return (0);
}
/*****************************************************************************
functionname: FDKsbrEnc_EnvInit
description: initializes parameters
returns: error status
input:
output: hEnv
*****************************************************************************/
static INT FDKsbrEnc_EnvInit(HANDLE_SBR_ELEMENT hSbrElement,
sbrConfigurationPtr params, INT *coreBandWith,
AUDIO_OBJECT_TYPE aot, int nElement,
const int headerPeriod, ULONG statesInitFlag,
const SBRENC_DS_TYPE downsamplingMethod,
UCHAR *dynamic_RAM) {
int ch, i;
if ((params->codecSettings.nChannels < 1) ||
(params->codecSettings.nChannels > MAX_NUM_CHANNELS)) {
return (1);
}
/* init and set syntax flags */
hSbrElement->sbrConfigData.sbrSyntaxFlags = 0;
switch (aot) {
case AOT_ER_AAC_ELD:
hSbrElement->sbrConfigData.sbrSyntaxFlags |= SBR_SYNTAX_LOW_DELAY;
break;
default:
break;
}
if (params->crcSbr) {
hSbrElement->sbrConfigData.sbrSyntaxFlags |= SBR_SYNTAX_CRC;
}
hSbrElement->sbrConfigData.noQmfBands = 64 >> (2 - params->downSampleFactor);
switch (hSbrElement->sbrConfigData.noQmfBands) {
case 64:
hSbrElement->sbrConfigData.noQmfSlots = params->sbrFrameSize >> 6;
break;
case 32:
hSbrElement->sbrConfigData.noQmfSlots = params->sbrFrameSize >> 5;
break;
default:
hSbrElement->sbrConfigData.noQmfSlots = params->sbrFrameSize >> 6;
return (2);
}
/*
now initialize sbrConfigData, sbrHeaderData and sbrBitstreamData,
*/
hSbrElement->sbrConfigData.nChannels = params->codecSettings.nChannels;
if (params->codecSettings.nChannels == 2) {
if ((hSbrElement->elInfo.elType == ID_CPE) &&
((hSbrElement->elInfo.fDualMono == 1))) {
hSbrElement->sbrConfigData.stereoMode = SBR_LEFT_RIGHT;
} else {
hSbrElement->sbrConfigData.stereoMode = params->stereoMode;
}
} else {
hSbrElement->sbrConfigData.stereoMode = SBR_MONO;
}
hSbrElement->sbrConfigData.frameSize = params->sbrFrameSize;
hSbrElement->sbrConfigData.sampleFreq =
params->downSampleFactor * params->codecSettings.sampleFreq;
hSbrElement->sbrBitstreamData.CountSendHeaderData = 0;
if (params->SendHeaderDataTime > 0) {
if (headerPeriod == -1) {
hSbrElement->sbrBitstreamData.NrSendHeaderData = (INT)(
params->SendHeaderDataTime * hSbrElement->sbrConfigData.sampleFreq /
(1000 * hSbrElement->sbrConfigData.frameSize));
hSbrElement->sbrBitstreamData.NrSendHeaderData =
fixMax(hSbrElement->sbrBitstreamData.NrSendHeaderData, 1);
} else {
/* assure header period at least once per second */
hSbrElement->sbrBitstreamData.NrSendHeaderData = fixMin(
fixMax(headerPeriod, 1), (hSbrElement->sbrConfigData.sampleFreq /
hSbrElement->sbrConfigData.frameSize));
}
} else {
hSbrElement->sbrBitstreamData.NrSendHeaderData = 0;
}
hSbrElement->sbrHeaderData.sbr_data_extra = params->sbr_data_extra;
hSbrElement->sbrBitstreamData.HeaderActive = 0;
hSbrElement->sbrBitstreamData.rightBorderFIX = 0;
hSbrElement->sbrHeaderData.sbr_start_frequency = params->startFreq;
hSbrElement->sbrHeaderData.sbr_stop_frequency = params->stopFreq;
hSbrElement->sbrHeaderData.sbr_xover_band = 0;
hSbrElement->sbrHeaderData.sbr_lc_stereo_mode = 0;
/* data_extra */
if (params->sbr_xpos_ctrl != SBR_XPOS_CTRL_DEFAULT)
hSbrElement->sbrHeaderData.sbr_data_extra = 1;
hSbrElement->sbrHeaderData.sbr_amp_res = (AMP_RES)params->amp_res;
/* header_extra_1 */
hSbrElement->sbrHeaderData.freqScale = params->freqScale;
hSbrElement->sbrHeaderData.alterScale = params->alterScale;
hSbrElement->sbrHeaderData.sbr_noise_bands = params->sbr_noise_bands;
hSbrElement->sbrHeaderData.header_extra_1 = 0;
if ((params->freqScale != SBR_FREQ_SCALE_DEFAULT) ||
(params->alterScale != SBR_ALTER_SCALE_DEFAULT) ||
(params->sbr_noise_bands != SBR_NOISE_BANDS_DEFAULT)) {
hSbrElement->sbrHeaderData.header_extra_1 = 1;
}
/* header_extra_2 */
hSbrElement->sbrHeaderData.sbr_limiter_bands = params->sbr_limiter_bands;
hSbrElement->sbrHeaderData.sbr_limiter_gains = params->sbr_limiter_gains;
if ((hSbrElement->sbrConfigData.sampleFreq > 48000) &&
(hSbrElement->sbrHeaderData.sbr_start_frequency >= 9)) {
hSbrElement->sbrHeaderData.sbr_limiter_gains = SBR_LIMITER_GAINS_INFINITE;
}
hSbrElement->sbrHeaderData.sbr_interpol_freq = params->sbr_interpol_freq;
hSbrElement->sbrHeaderData.sbr_smoothing_length =
params->sbr_smoothing_length;
hSbrElement->sbrHeaderData.header_extra_2 = 0;
if ((params->sbr_limiter_bands != SBR_LIMITER_BANDS_DEFAULT) ||
(params->sbr_limiter_gains != SBR_LIMITER_GAINS_DEFAULT) ||
(params->sbr_interpol_freq != SBR_INTERPOL_FREQ_DEFAULT) ||
(params->sbr_smoothing_length != SBR_SMOOTHING_LENGTH_DEFAULT)) {
hSbrElement->sbrHeaderData.header_extra_2 = 1;
}
/* other switches */
hSbrElement->sbrConfigData.useWaveCoding = params->useWaveCoding;
hSbrElement->sbrConfigData.useParametricCoding = params->parametricCoding;
hSbrElement->sbrConfigData.thresholdAmpResFF_m =
params->threshold_AmpRes_FF_m;
hSbrElement->sbrConfigData.thresholdAmpResFF_e =
params->threshold_AmpRes_FF_e;
/* init freq band table */
if (updateFreqBandTable(&hSbrElement->sbrConfigData,
&hSbrElement->sbrHeaderData,
params->downSampleFactor)) {
return (1);
}
/* now create envelope ext and QMF for each available channel */
for (ch = 0; ch < hSbrElement->sbrConfigData.nChannels; ch++) {
if (initEnvChannel(&hSbrElement->sbrConfigData, &hSbrElement->sbrHeaderData,
&hSbrElement->sbrChannel[ch]->hEnvChannel, params,
statesInitFlag, ch, dynamic_RAM)) {
return (1);
}
} /* nChannels */
/* reset and intialize analysis qmf */
for (ch = 0; ch < ((hSbrElement->elInfo.fParametricStereo)
? 2
: hSbrElement->sbrConfigData.nChannels);
ch++) {
int err;
UINT qmfFlags =
(hSbrElement->sbrConfigData.sbrSyntaxFlags & SBR_SYNTAX_LOW_DELAY)
? QMF_FLAG_CLDFB
: 0;
if (statesInitFlag)
qmfFlags &= ~QMF_FLAG_KEEP_STATES;
else
qmfFlags |= QMF_FLAG_KEEP_STATES;
err = qmfInitAnalysisFilterBank(
hSbrElement->hQmfAnalysis[ch],
(FIXP_QAS *)hSbrElement->hQmfAnalysis[ch]->FilterStates,
hSbrElement->sbrConfigData.noQmfSlots,
hSbrElement->sbrConfigData.noQmfBands,
hSbrElement->sbrConfigData.noQmfBands,
hSbrElement->sbrConfigData.noQmfBands, qmfFlags);
if (0 != err) {
return err;
}
}
/* */
hSbrElement->CmonData.xOverFreq = hSbrElement->sbrConfigData.xOverFreq;
hSbrElement->CmonData.dynBwEnabled =
(params->dynBwSupported && params->dynBwEnabled);
hSbrElement->CmonData.dynXOverFreqEnc =
FDKsbrEnc_SbrGetXOverFreq(hSbrElement, hSbrElement->CmonData.xOverFreq);
for (i = 0; i < 5; i++)
hSbrElement->dynXOverFreqDelay[i] = hSbrElement->CmonData.dynXOverFreqEnc;
hSbrElement->CmonData.sbrNumChannels = hSbrElement->sbrConfigData.nChannels;
hSbrElement->sbrConfigData.dynXOverFreq = hSbrElement->CmonData.xOverFreq;
/* Update Bandwith to be passed to the core encoder */
*coreBandWith = hSbrElement->CmonData.xOverFreq;
return (0);
}
INT sbrEncoder_GetInBufferSize(int noChannels) {
INT temp;
temp = (2048);
temp += 1024 + MAX_SAMPLE_DELAY;
temp *= noChannels;
temp *= sizeof(INT_PCM);
return temp;
}
/*
* Encode Dummy SBR payload frames to fill the delay lines.
*/
static INT FDKsbrEnc_DelayCompensation(HANDLE_SBR_ENCODER hEnvEnc,
INT_PCM *timeBuffer,
UINT timeBufferBufSize) {
int n, el;
for (n = hEnvEnc->nBitstrDelay; n > 0; n--) {
for (el = 0; el < hEnvEnc->noElements; el++) {
if (FDKsbrEnc_EnvEncodeFrame(
hEnvEnc, el,
timeBuffer + hEnvEnc->downsampledOffset / hEnvEnc->nChannels,
timeBufferBufSize, NULL, NULL, 1))
return -1;
}
sbrEncoder_UpdateBuffers(hEnvEnc, timeBuffer, timeBufferBufSize);
}
return 0;
}
UINT sbrEncoder_LimitBitRate(UINT bitRate, UINT numChannels,
UINT coreSampleRate, AUDIO_OBJECT_TYPE aot) {
UINT newBitRate = bitRate;
INT index;
FDK_ASSERT(numChannels > 0 && numChannels <= 2);
if (aot == AOT_PS) {
if (numChannels == 1) {
index = getPsTuningTableIndex(bitRate, &newBitRate);
if (index == INVALID_TABLE_IDX) {
bitRate = newBitRate;
}
} else {
return 0;
}
}
index = getSbrTuningTableIndex(bitRate, numChannels, coreSampleRate, aot,
&newBitRate);
if (index != INVALID_TABLE_IDX) {
newBitRate = bitRate;
}
return newBitRate;
}
UINT sbrEncoder_IsSingleRatePossible(AUDIO_OBJECT_TYPE aot) {
UINT isPossible = (AOT_PS == aot) ? 0 : 1;
return isPossible;
}
/*****************************************************************************/
/* */
/*functionname: sbrEncoder_Init_delay */
/*description: Determine Delay balancing and new encoder delay */
/* */
/*returns: - error status */
/*input: - frame length of the core (i.e. e.g. AAC) */
/* - number of channels */
/* - downsample factor (1 for downsampled, 2 for dual-rate SBR) */
/* - low delay presence */
/* - ps presence */
/* - downsampling method: QMF-, time domain or no downsampling */
/* - various delay values (see DELAY_PARAM struct description) */
/* */
/*Example: Delay balancing for a HE-AACv1 encoder (time-domain downsampling) */
/*========================================================================== */
/* */
/* +--------+ +--------+ +--------+ +--------+ +--------+ */
/* |core | |ds 2:1 | |AAC | |QMF | |QMF | */
/* +-+path +------------+ +-+core +-+analysis+-+overlap +-+ */
/* | |offset | | | | | |32 bands| | | | */
/* | +--------+ +--------+ +--------+ +--------+ +--------+ | */
/* | core path +-------++ */
/* | |QMF | */
/*->+ +synth. +-> */
/* | |64 bands| */
/* | +-------++ */
/* | +--------+ +--------+ +--------+ +--------+ | */
/* | |SBR path| |QMF | |subband | |bs delay| | */
/* +-+offset +-+analysis+-+sample +-+(full +-----------------------+ */
/* | | |64 bands| |buffer | | frames)| */
/* +--------+ +--------+ +--------+ +--------+ */
/* SBR path */
/* */
/*****************************************************************************/
static INT sbrEncoder_Init_delay(
const int coreFrameLength, /* input */
const int numChannels, /* input */
const int downSampleFactor, /* input */
const int lowDelay, /* input */
const int usePs, /* input */
const int is212, /* input */
const SBRENC_DS_TYPE downsamplingMethod, /* input */
DELAY_PARAM *hDelayParam /* input/output */
) {
int delayCorePath = 0; /* delay in core path */
int delaySbrPath = 0; /* delay difference in QMF aka SBR path */
int delayInput2Core = 0; /* delay from the input to the core */
int delaySbrDec = 0; /* delay of the decoder's SBR module */
int delayCore = hDelayParam->delay; /* delay of the core */
/* Added delay by the SBR delay initialization */
int corePathOffset = 0; /* core path */
int sbrPathOffset = 0; /* sbr path */
int bitstreamDelay = 0; /* sbr path, framewise */
int flCore = coreFrameLength; /* core frame length */
int returnValue = 0; /* return value - 0 means: no error */
/* 1) Calculate actual delay for core and SBR path */
if (is212) {
delayCorePath = DELAY_COREPATH_ELDv2SBR(flCore, downSampleFactor);
delaySbrPath = DELAY_ELDv2SBR(flCore, downSampleFactor);
delaySbrDec = ((flCore) / 2) * (downSampleFactor);
} else if (lowDelay) {
delayCorePath = DELAY_COREPATH_ELDSBR(flCore, downSampleFactor);
delaySbrPath = DELAY_ELDSBR(flCore, downSampleFactor);
delaySbrDec = DELAY_QMF_POSTPROC(downSampleFactor);
} else if (usePs) {
delayCorePath = DELAY_COREPATH_PS(flCore, downSampleFactor);
delaySbrPath = DELAY_PS(flCore, downSampleFactor);
delaySbrDec = DELAY_COREPATH_SBR(flCore, downSampleFactor);
} else {
delayCorePath = DELAY_COREPATH_SBR(flCore, downSampleFactor);
delaySbrPath = DELAY_SBR(flCore, downSampleFactor);
delaySbrDec = DELAY_COREPATH_SBR(flCore, downSampleFactor);
}
delayCorePath += delayCore * downSampleFactor;
delayCorePath +=
(downsamplingMethod == SBRENC_DS_TIME) ? hDelayParam->dsDelay : 0;
/* 2) Manage coupling of paths */
if (downsamplingMethod == SBRENC_DS_QMF && delayCorePath > delaySbrPath) {
/* In case of QMF downsampling, both paths are coupled, i.e. the SBR path
offset would be added to both the SBR path and to the core path
as well, thus making it impossible to achieve delay balancing.
To overcome that problem, a framewise delay is added to the SBR path
first, until the overall delay of the core path is shorter than
the delay of the SBR path. When this is achieved, the missing delay
difference can be added as downsampled offset to the core path.
*/
while (delayCorePath > delaySbrPath) {
/* Add one frame delay to SBR path */
delaySbrPath += flCore * downSampleFactor;
bitstreamDelay += 1;
}
}
/* 3) Calculate necessary additional delay to balance the paths */
if (delayCorePath > delaySbrPath) {
/* Delay QMF input */
while (delayCorePath > delaySbrPath + (int)flCore * (int)downSampleFactor) {
/* Do bitstream frame-wise delay balancing if there are
more than SBR framelength samples delay difference */
delaySbrPath += flCore * downSampleFactor;
bitstreamDelay += 1;
}
/* Multiply input offset by input channels */
corePathOffset = 0;
sbrPathOffset = (delayCorePath - delaySbrPath) * numChannels;
} else {
/* Delay AAC data */
/* Multiply downsampled offset by AAC core channels. Divide by 2 because of
half samplerate of downsampled data. */
corePathOffset = ((delaySbrPath - delayCorePath) * numChannels) >>
(downSampleFactor - 1);
sbrPathOffset = 0;
}
/* 4) Calculate delay from input to core */
if (usePs) {
delayInput2Core =
(DELAY_QMF_ANA(downSampleFactor) + DELAY_QMF_DS + DELAY_HYB_SYN) +
(downSampleFactor * corePathOffset) + 1;
} else if (downsamplingMethod == SBRENC_DS_TIME) {
delayInput2Core = corePathOffset + hDelayParam->dsDelay;
} else {
delayInput2Core = corePathOffset;
}
/* 6) Set output parameters */
hDelayParam->delay = FDKmax(delayCorePath, delaySbrPath); /* overall delay */
hDelayParam->sbrDecDelay = delaySbrDec; /* SBR decoder delay */
hDelayParam->delayInput2Core = delayInput2Core; /* delay input - core */
hDelayParam->bitstrDelay = bitstreamDelay; /* bitstream delay, in frames */
hDelayParam->corePathOffset = corePathOffset; /* offset added to core path */
hDelayParam->sbrPathOffset = sbrPathOffset; /* offset added to SBR path */
return returnValue;
}
/*****************************************************************************
functionname: sbrEncoder_Init
description: initializes the SBR encoder
returns: error status
*****************************************************************************/
INT sbrEncoder_Init(HANDLE_SBR_ENCODER hSbrEncoder,
SBR_ELEMENT_INFO elInfo[(8)], int noElements,
INT_PCM *inputBuffer, UINT inputBufferBufSize,
INT *coreBandwidth, INT *inputBufferOffset,
INT *numChannels, const UINT syntaxFlags,
INT *coreSampleRate, UINT *downSampleFactor,
INT *frameLength, AUDIO_OBJECT_TYPE aot, int *delay,
int transformFactor, const int headerPeriod,
ULONG statesInitFlag) {
HANDLE_ERROR_INFO errorInfo = noError;
sbrConfiguration sbrConfig[(8)];
INT error = 0;
INT lowestBandwidth;
/* Save input parameters */
INT inputSampleRate = *coreSampleRate;
int coreFrameLength = *frameLength;
int inputBandWidth = *coreBandwidth;
int inputChannels = *numChannels;
SBRENC_DS_TYPE downsamplingMethod = SBRENC_DS_NONE;
int highestSbrStartFreq, highestSbrStopFreq;
int lowDelay = 0;
int usePs = 0;
int is212 = 0;
DELAY_PARAM delayParam;
/* check whether SBR setting is available for the current encoder
* configuration (bitrate, samplerate) */
if (!sbrEncoder_IsSingleRatePossible(aot)) {
*downSampleFactor = 2;
}
if (aot == AOT_PS) {
usePs = 1;
}
if (aot == AOT_ER_AAC_ELD) {
lowDelay = 1;
} else if (aot == AOT_ER_AAC_LD) {
error = 1;
goto bail;
}
/* Parametric Stereo */
if (usePs) {
if (*numChannels == 2 && noElements == 1) {
/* Override Element type in case of Parametric stereo */
elInfo[0].elType = ID_SCE;
elInfo[0].fParametricStereo = 1;
elInfo[0].nChannelsInEl = 1;
/* core encoder gets downmixed mono signal */
*numChannels = 1;
} else {
error = 1;
goto bail;
}
} /* usePs */
/* set the core's sample rate */
switch (*downSampleFactor) {
case 1:
*coreSampleRate = inputSampleRate;
downsamplingMethod = SBRENC_DS_NONE;
break;
case 2:
*coreSampleRate = inputSampleRate >> 1;
downsamplingMethod = usePs ? SBRENC_DS_QMF : SBRENC_DS_TIME;
break;
default:
*coreSampleRate = inputSampleRate >> 1;
return 0; /* return error */
}
/* check whether SBR setting is available for the current encoder
* configuration (bitrate, coreSampleRate) */
{
int el, coreEl;
/* Check if every element config is feasible */
for (coreEl = 0; coreEl < noElements; coreEl++) {
/* SBR only handles SCE and CPE's */
if (elInfo[coreEl].elType != ID_SCE && elInfo[coreEl].elType != ID_CPE) {
continue;
}
/* check if desired configuration is available */
if (!FDKsbrEnc_IsSbrSettingAvail(elInfo[coreEl].bitRate, 0,
elInfo[coreEl].nChannelsInEl,
inputSampleRate, *coreSampleRate, aot)) {
error = 1;
goto bail;
}
}
hSbrEncoder->nChannels = *numChannels;
hSbrEncoder->frameSize = coreFrameLength * *downSampleFactor;
hSbrEncoder->downsamplingMethod = downsamplingMethod;
hSbrEncoder->downSampleFactor = *downSampleFactor;
hSbrEncoder->estimateBitrate = 0;
hSbrEncoder->inputDataDelay = 0;
is212 = ((aot == AOT_ER_AAC_ELD) && (syntaxFlags & AC_LD_MPS)) ? 1 : 0;
/* Open SBR elements */
el = -1;
highestSbrStartFreq = highestSbrStopFreq = 0;
lowestBandwidth = 99999;
/* Loop through each core encoder element and get a matching SBR element
* config */
for (coreEl = 0; coreEl < noElements; coreEl++) {
/* SBR only handles SCE and CPE's */
if (elInfo[coreEl].elType == ID_SCE || elInfo[coreEl].elType == ID_CPE) {
el++;
} else {
continue;
}
/* Set parametric Stereo Flag. */
if (usePs) {
elInfo[coreEl].fParametricStereo = 1;
} else {
elInfo[coreEl].fParametricStereo = 0;
}
/*
* Init sbrConfig structure
*/
if (!FDKsbrEnc_InitializeSbrDefaults(&sbrConfig[el], *downSampleFactor,
coreFrameLength, IS_LOWDELAY(aot))) {
error = 1;
goto bail;
}
/*
* Modify sbrConfig structure according to Element parameters
*/
if (!FDKsbrEnc_AdjustSbrSettings(
&sbrConfig[el], elInfo[coreEl].bitRate,
elInfo[coreEl].nChannelsInEl, *coreSampleRate, inputSampleRate,
transformFactor, 24000, 0, 0, /* useSpeechConfig */
0, /* lcsMode */
usePs, /* bParametricStereo */
aot)) {
error = 1;
goto bail;
}
/* Find common frequency border for all SBR elements */
highestSbrStartFreq =
fixMax(highestSbrStartFreq, sbrConfig[el].startFreq);
highestSbrStopFreq = fixMax(highestSbrStopFreq, sbrConfig[el].stopFreq);
} /* first element loop */
/* Set element count (can be less than core encoder element count) */
hSbrEncoder->noElements = el + 1;
FDKsbrEnc_Reallocate(hSbrEncoder, elInfo, noElements);
for (el = 0; el < hSbrEncoder->noElements; el++) {
int bandwidth = *coreBandwidth;
/* Use lowest common bandwidth */
sbrConfig[el].startFreq = highestSbrStartFreq;
sbrConfig[el].stopFreq = highestSbrStopFreq;
/* initialize SBR element, and get core bandwidth */
error = FDKsbrEnc_EnvInit(hSbrEncoder->sbrElement[el], &sbrConfig[el],
&bandwidth, aot, el, headerPeriod,
statesInitFlag, hSbrEncoder->downsamplingMethod,
hSbrEncoder->dynamicRam);
if (error != 0) {
error = 2;
goto bail;
}
/* Get lowest core encoder bandwidth to be returned later. */
lowestBandwidth = fixMin(lowestBandwidth, bandwidth);
} /* second element loop */
/* Initialize a downsampler for each channel in each SBR element */
if (hSbrEncoder->downsamplingMethod == SBRENC_DS_TIME) {
for (el = 0; el < hSbrEncoder->noElements; el++) {
HANDLE_SBR_ELEMENT hSbrEl = hSbrEncoder->sbrElement[el];
INT Wc, ch;
Wc = 500; /* Cutoff frequency with full bandwidth */
for (ch = 0; ch < hSbrEl->elInfo.nChannelsInEl; ch++) {
FDKaacEnc_InitDownsampler(&hSbrEl->sbrChannel[ch]->downSampler, Wc,
*downSampleFactor);
FDK_ASSERT(hSbrEl->sbrChannel[ch]->downSampler.delay <=
MAX_DS_FILTER_DELAY);
}
} /* third element loop */
/* lfe */
FDKaacEnc_InitDownsampler(&hSbrEncoder->lfeDownSampler, 0,
*downSampleFactor);
}
/* Get delay information */
delayParam.dsDelay =
hSbrEncoder->sbrElement[0]->sbrChannel[0]->downSampler.delay;
delayParam.delay = *delay;
error = sbrEncoder_Init_delay(coreFrameLength, *numChannels,
*downSampleFactor, lowDelay, usePs, is212,
downsamplingMethod, &delayParam);
if (error != 0) {
error = 3;
goto bail;
}
hSbrEncoder->nBitstrDelay = delayParam.bitstrDelay;
hSbrEncoder->sbrDecDelay = delayParam.sbrDecDelay;
hSbrEncoder->inputDataDelay = delayParam.delayInput2Core;
/* Assign core encoder Bandwidth */
*coreBandwidth = lowestBandwidth;
/* Estimate sbr bitrate, 2.5 kBit/s per sbr channel */
hSbrEncoder->estimateBitrate += 2500 * (*numChannels);
/* Initialize bitstream buffer for each element */
for (el = 0; el < hSbrEncoder->noElements; el++) {
FDKsbrEnc_bsBufInit(hSbrEncoder->sbrElement[el], delayParam.bitstrDelay);
}
/* initialize parametric stereo */
if (usePs) {
PSENC_CONFIG psEncConfig;
FDK_ASSERT(hSbrEncoder->noElements == 1);
INT psTuningTableIdx = getPsTuningTableIndex(elInfo[0].bitRate, NULL);
psEncConfig.frameSize = coreFrameLength; // sbrConfig.sbrFrameSize;
psEncConfig.qmfFilterMode = 0;
psEncConfig.sbrPsDelay = 0;
/* tuning parameters */
if (psTuningTableIdx != INVALID_TABLE_IDX) {
psEncConfig.nStereoBands = psTuningTable[psTuningTableIdx].nStereoBands;
psEncConfig.maxEnvelopes = psTuningTable[psTuningTableIdx].nEnvelopes;
psEncConfig.iidQuantErrorThreshold =
(FIXP_DBL)psTuningTable[psTuningTableIdx].iidQuantErrorThreshold;
/* calculation is not quite linear, increased number of envelopes causes
* more bits */
/* assume avg. 50 bits per frame for 10 stereo bands / 1 envelope
* configuration */
hSbrEncoder->estimateBitrate +=
((((*coreSampleRate) * 5 * psEncConfig.nStereoBands *
psEncConfig.maxEnvelopes) /
hSbrEncoder->frameSize));
} else {
error = ERROR(CDI, "Invalid ps tuning table index.");
goto bail;
}
qmfInitSynthesisFilterBank(
&hSbrEncoder->qmfSynthesisPS,
(FIXP_DBL *)hSbrEncoder->qmfSynthesisPS.FilterStates,
hSbrEncoder->sbrElement[0]->sbrConfigData.noQmfSlots,
hSbrEncoder->sbrElement[0]->sbrConfigData.noQmfBands >> 1,
hSbrEncoder->sbrElement[0]->sbrConfigData.noQmfBands >> 1,
hSbrEncoder->sbrElement[0]->sbrConfigData.noQmfBands >> 1,
(statesInitFlag) ? 0 : QMF_FLAG_KEEP_STATES);
if (errorInfo == noError) {
/* update delay */
psEncConfig.sbrPsDelay =
FDKsbrEnc_GetEnvEstDelay(&hSbrEncoder->sbrElement[0]
->sbrChannel[0]
->hEnvChannel.sbrExtractEnvelope);
errorInfo =
PSEnc_Init(hSbrEncoder->hParametricStereo, &psEncConfig,
hSbrEncoder->sbrElement[0]->sbrConfigData.noQmfSlots,
hSbrEncoder->sbrElement[0]->sbrConfigData.noQmfBands,
hSbrEncoder->dynamicRam);
}
}
hSbrEncoder->downsampledOffset = delayParam.corePathOffset;
hSbrEncoder->bufferOffset = delayParam.sbrPathOffset;
*delay = delayParam.delay;
{ hSbrEncoder->downmixSize = coreFrameLength * (*numChannels); }
/* Delay Compensation: fill bitstream delay buffer with zero input signal */
if (hSbrEncoder->nBitstrDelay > 0) {
error = FDKsbrEnc_DelayCompensation(hSbrEncoder, inputBuffer,
inputBufferBufSize);
if (error != 0) goto bail;
}
/* Set Output frame length */
*frameLength = coreFrameLength * *downSampleFactor;
/* Input buffer offset */
*inputBufferOffset =
fixMax(delayParam.sbrPathOffset, delayParam.corePathOffset);
}
return error;
bail:
/* Restore input settings */
*coreSampleRate = inputSampleRate;
*frameLength = coreFrameLength;
*numChannels = inputChannels;
*coreBandwidth = inputBandWidth;
return error;
}
INT sbrEncoder_EncodeFrame(HANDLE_SBR_ENCODER hSbrEncoder, INT_PCM *samples,
UINT samplesBufSize, UINT sbrDataBits[(8)],
UCHAR sbrData[(8)][MAX_PAYLOAD_SIZE]) {
INT error;
int el;
for (el = 0; el < hSbrEncoder->noElements; el++) {
if (hSbrEncoder->sbrElement[el] != NULL) {
error = FDKsbrEnc_EnvEncodeFrame(
hSbrEncoder, el,
samples + hSbrEncoder->downsampledOffset / hSbrEncoder->nChannels,
samplesBufSize, &sbrDataBits[el], sbrData[el], 0);
if (error) return error;
}
}
error = FDKsbrEnc_Downsample(
hSbrEncoder,
samples + hSbrEncoder->downsampledOffset / hSbrEncoder->nChannels,
samplesBufSize, hSbrEncoder->nChannels, &sbrDataBits[el], sbrData[el], 0);
if (error) return error;
return 0;
}
INT sbrEncoder_UpdateBuffers(HANDLE_SBR_ENCODER hSbrEncoder,
INT_PCM *timeBuffer, UINT timeBufferBufSize) {
if (hSbrEncoder->downsampledOffset > 0) {
int c;
int nd = hSbrEncoder->downmixSize / hSbrEncoder->nChannels;
for (c = 0; c < hSbrEncoder->nChannels; c++) {
/* Move delayed downsampled data */
FDKmemcpy(timeBuffer + timeBufferBufSize * c,
timeBuffer + timeBufferBufSize * c + nd,
sizeof(INT_PCM) *
(hSbrEncoder->downsampledOffset / hSbrEncoder->nChannels));
}
} else {
int c;
for (c = 0; c < hSbrEncoder->nChannels; c++) {
/* Move delayed input data */
FDKmemcpy(
timeBuffer + timeBufferBufSize * c,
timeBuffer + timeBufferBufSize * c + hSbrEncoder->frameSize,
sizeof(INT_PCM) * hSbrEncoder->bufferOffset / hSbrEncoder->nChannels);
}
}
if (hSbrEncoder->nBitstrDelay > 0) {
int el;
for (el = 0; el < hSbrEncoder->noElements; el++) {
FDKmemmove(
hSbrEncoder->sbrElement[el]->payloadDelayLine[0],
hSbrEncoder->sbrElement[el]->payloadDelayLine[1],
sizeof(UCHAR) * (hSbrEncoder->nBitstrDelay * MAX_PAYLOAD_SIZE));
FDKmemmove(&hSbrEncoder->sbrElement[el]->payloadDelayLineSize[0],
&hSbrEncoder->sbrElement[el]->payloadDelayLineSize[1],
sizeof(UINT) * (hSbrEncoder->nBitstrDelay));
}
}
return 0;
}
INT sbrEncoder_SendHeader(HANDLE_SBR_ENCODER hSbrEncoder) {
INT error = -1;
if (hSbrEncoder) {
int el;
for (el = 0; el < hSbrEncoder->noElements; el++) {
if ((hSbrEncoder->noElements == 1) &&
(hSbrEncoder->sbrElement[0]->elInfo.fParametricStereo == 1)) {
hSbrEncoder->sbrElement[el]->sbrBitstreamData.CountSendHeaderData =
hSbrEncoder->sbrElement[el]->sbrBitstreamData.NrSendHeaderData - 1;
} else {
hSbrEncoder->sbrElement[el]->sbrBitstreamData.CountSendHeaderData = 0;
}
}
error = 0;
}
return error;
}
INT sbrEncoder_ContainsHeader(HANDLE_SBR_ENCODER hSbrEncoder) {
INT sbrHeader = 1;
if (hSbrEncoder) {
int el;
for (el = 0; el < hSbrEncoder->noElements; el++) {
sbrHeader &=
(hSbrEncoder->sbrElement[el]->sbrBitstreamData.HeaderActiveDelay == 1)
? 1
: 0;
}
}
return sbrHeader;
}
INT sbrEncoder_GetHeaderDelay(HANDLE_SBR_ENCODER hSbrEncoder) {
INT delay = -1;
if (hSbrEncoder) {
if ((hSbrEncoder->noElements == 1) &&
(hSbrEncoder->sbrElement[0]->elInfo.fParametricStereo == 1)) {
delay = hSbrEncoder->nBitstrDelay + 1;
} else {
delay = hSbrEncoder->nBitstrDelay;
}
}
return delay;
}
INT sbrEncoder_GetBsDelay(HANDLE_SBR_ENCODER hSbrEncoder) {
INT delay = -1;
if (hSbrEncoder) {
delay = hSbrEncoder->nBitstrDelay;
}
return delay;
}
INT sbrEncoder_SAPPrepare(HANDLE_SBR_ENCODER hSbrEncoder) {
INT error = -1;
if (hSbrEncoder) {
int el;
for (el = 0; el < hSbrEncoder->noElements; el++) {
hSbrEncoder->sbrElement[el]->sbrBitstreamData.rightBorderFIX = 1;
}
error = 0;
}
return error;
}
INT sbrEncoder_GetEstimateBitrate(HANDLE_SBR_ENCODER hSbrEncoder) {
INT estimateBitrate = 0;
if (hSbrEncoder) {
estimateBitrate += hSbrEncoder->estimateBitrate;
}
return estimateBitrate;
}
INT sbrEncoder_GetInputDataDelay(HANDLE_SBR_ENCODER hSbrEncoder) {
INT delay = -1;
if (hSbrEncoder) {
delay = hSbrEncoder->inputDataDelay;
}
return delay;
}
INT sbrEncoder_GetSbrDecDelay(HANDLE_SBR_ENCODER hSbrEncoder) {
INT delay = -1;
if (hSbrEncoder) {
delay = hSbrEncoder->sbrDecDelay;
}
return delay;
}
INT sbrEncoder_GetLibInfo(LIB_INFO *info) {
int i;
if (info == NULL) {
return -1;
}
/* search for next free tab */
for (i = 0; i < FDK_MODULE_LAST; i++) {
if (info[i].module_id == FDK_NONE) break;
}
if (i == FDK_MODULE_LAST) {
return -1;
}
info += i;
info->module_id = FDK_SBRENC;
info->version =
LIB_VERSION(SBRENCODER_LIB_VL0, SBRENCODER_LIB_VL1, SBRENCODER_LIB_VL2);
LIB_VERSION_STRING(info);
#ifdef __ANDROID__
info->build_date = "";
info->build_time = "";
#else
info->build_date = __DATE__;
info->build_time = __TIME__;
#endif
info->title = "SBR Encoder";
/* Set flags */
info->flags = 0 | CAPF_SBR_HQ | CAPF_SBR_PS_MPEG;
/* End of flags */
return 0;
}