Documents/api/aac_8h_source.html

 /*
  * AAC definitions and structures
  * Copyright (c) 2005-2006 Oded Shimon ( ods15 ods15 dyndns org )
  * Copyright (c) 2006-2007 Maxim Gavrilov ( maxim.gavrilov gmail com )
  *
  * This file is part of FFmpeg.
  *
  * FFmpeg is free software; you can redistribute it and/or
  * modify it under the terms of the GNU Lesser General Public
  * License as published by the Free Software Foundation; either
  * version 2.1 of the License, or (at your option) any later version.
  *
  * FFmpeg is distributed in the hope that it will be useful,
  * but WITHOUT ANY WARRANTY; without even the implied warranty of
  * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the GNU
  * Lesser General Public License for more details.
  *
  * You should have received a copy of the GNU Lesser General Public
  * License along with FFmpeg; if not, write to the Free Software
  * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
  */

 /**
  * @file
  * AAC definitions and structures
  * @author Oded Shimon  ( ods15 ods15 dyndns org )
  * @author Maxim Gavrilov ( maxim.gavrilov gmail com )
  */

 #ifndef AVCODEC_AAC_H
 #define AVCODEC_AAC_H


 #include "aac_defines.h"
 #include "libavutil/float_dsp.h"
 #include "libavutil/fixed_dsp.h"
 #include "avcodec.h"
 #if !USE_FIXED
 #include "mdct15.h"
 #endif
 #include "fft.h"
 #include "mpeg4audio.h"
 #include "sbr.h"

 #include <stdint.h>

 #define MAX_CHANNELS 64 ///< size of AACContext::output_element and DynamicRangeControl::exclude_mask
 #define MAX_ELEM_ID 16 ///< second dimension of the AACContext::che and tag_che_map tables

 #define TNS_MAX_ORDER 20 ///< number of coefficient slots per filter in TemporalNoiseShaping
 #define MAX_LTP_LONG_SFB 40 ///< size of LongTermPrediction::used

 #define CLIP_AVOIDANCE_FACTOR 0.95f ///< NOTE(review): presumably related to IndividualChannelStream::clip_avoidance_factor - confirm at the use site

 /**
  * Element type tags, numbered consecutively from 0 (TYPE_SCE) to 7 (TYPE_END).
  *
  * NOTE(review): the suffixes follow the AAC syntactic element names
  * (SCE = single channel element, LFE, CCE = coupling element, PCE, ...);
  * confirm the remaining expansions against ISO/IEC 14496-3.
  */
 enum RawDataBlockType {
     TYPE_SCE = 0,
     TYPE_CPE = 1,
     TYPE_CCE = 2,
     TYPE_LFE = 3,
     TYPE_DSE = 4,
     TYPE_PCE = 5,
     TYPE_FIL = 6,
     TYPE_END = 7,
 };

 /**
  * Extension payload identifiers.
  *
  * The first three identifiers occupy 0..2; the remaining ones have
  * non-contiguous values (0xb, 0xd, 0xe).
  */
 enum ExtensionPayloadID {
     EXT_FILL          = 0x0,
     EXT_FILL_DATA     = 0x1,
     EXT_DATA_ELEMENT  = 0x2,
     EXT_DYNAMIC_RANGE = 0xb,
     EXT_SBR_DATA      = 0xd,
     EXT_SBR_DATA_CRC  = 0xe,
 };

 /**
  * Window sequence types, numbered 0..3 in declaration order.
  */
 enum WindowSequence {
     ONLY_LONG_SEQUENCE   = 0,
     LONG_START_SEQUENCE  = 1,
     EIGHT_SHORT_SEQUENCE = 2,
     LONG_STOP_SEQUENCE   = 3,
 };

 /**
  * Band types.
  *
  * Only the values with a special meaning are named; the values in between
  * (1-4 and 6-10) have no enumerator here.
  */
 enum BandType {
     /** Scalefactors and spectral data are all zero. */
     ZERO_BT = 0,
     /** This and later band types encode two values (rather than four) with one code word. */
     FIRST_PAIR_BT = 5,
     /** Spectral data are coded with an escape sequence. */
     ESC_BT = 11,
     /** Band types following are encoded differently from others. */
     RESERVED_BT = 12,
     /** Spectral data are scaled white noise not coded in the bitstream. */
     NOISE_BT = 13,
     /** Scalefactor data are intensity stereo positions (out of phase). */
     INTENSITY_BT2 = 14,
     /** Scalefactor data are intensity stereo positions (in phase). */
     INTENSITY_BT = 15,
 };

 /**
  * Test whether codebook index x is an unsigned codebook.
  *
  * Evaluates to (x - 1) masked with 0xA (bits 1 and 3): the result is nonzero
  * for x = 3, 4 and 7..11 and zero for x = 1, 2, 5 and 6. The result is a bit
  * mask, not a normalized 0/1 value.
  */
 #define IS_CODEBOOK_UNSIGNED(x) (((x) - 1) & 0xA)

 /**
  * Channel position classes; 0 means the channel is off.
  *
  * NOTE(review): CC presumably stands for "coupling channel" - confirm.
  */
 enum ChannelPosition {
     AAC_CHANNEL_OFF = 0,
     AAC_CHANNEL_FRONT = 1,
     AAC_CHANNEL_SIDE = 2,
     AAC_CHANNEL_BACK = 3,
     AAC_CHANNEL_LFE = 4,
     AAC_CHANNEL_CC = 5,
 };

 /**
  * Stage of the decoding chain at which channel coupling is applied.
  *
  * The value 2 has no enumerator: AFTER_IMDCT is explicitly 3.
  */
 enum CouplingPoint {
     BEFORE_TNS            = 0,
     BETWEEN_TNS_AND_IMDCT = 1,
     AFTER_IMDCT           = 3,
 };

 /**
  * Status of the output configuration, numbered 0..4 in declaration order.
  */
 enum OCStatus {
     /** Output unconfigured */
     OC_NONE = 0,
     /** Output configuration under trial specified by an inband PCE */
     OC_TRIAL_PCE = 1,
     /** Output configuration under trial specified by a frame header */
     OC_TRIAL_FRAME = 2,
     /** Output configuration set in a global header but not yet locked */
     OC_GLOBAL_HDR = 3,
     /** Output configuration locked in place */
     OC_LOCKED = 4,
 };

 /**
  * Output configuration: audio config, element layout map, channel
  * count/layout and the status of the configuration.
  */
 typedef struct OutputConfiguration {
     MPEG4AudioConfig m4ac;
     uint8_t layout_map[MAX_ELEM_ID*4][3]; ///< MAX_ELEM_ID*4 entries of 3 bytes each; NOTE(review): per-entry byte meaning is not visible here - confirm in the decoder
     int layout_map_tags;                  ///< presumably the number of layout_map entries in use - TODO confirm
     int channels;
     uint64_t channel_layout;
     enum OCStatus status;                 ///< how firmly this configuration is established
 } OutputConfiguration;

 /**
  * Predictor State
  *
  * One entry of SingleChannelElement::predictor_state (MAX_PREDICTORS
  * entries per channel). All fields are AAC_FLOAT.
  * NOTE(review): the names suggest correlations (cor*), variances (var*),
  * and a predicted value (x_est) - confirm against the prediction code
  * before relying on this.
  */
 typedef struct PredictorState {
     AAC_FLOAT cor0;
     AAC_FLOAT cor1;
     AAC_FLOAT var0;
     AAC_FLOAT var1;
     AAC_FLOAT r0;
     AAC_FLOAT r1;
     AAC_FLOAT k1;
     AAC_FLOAT x_est;
 } PredictorState;

 #define MAX_PREDICTORS 672     ///< number of entries in SingleChannelElement::predictor_state

 #define SCALE_DIV_512    36    ///< scalefactor difference that corresponds to a 512-fold difference in scale
 #define SCALE_ONE_POS   140    ///< scalefactor index that corresponds to scale=1.0
 #define SCALE_MAX_POS   255    ///< maximum scalefactor index
 #define SCALE_MAX_DIFF   60    ///< maximum scalefactor difference allowed by the standard
 #define SCALE_DIFF_ZERO  60    ///< codebook index corresponding to a scalefactor index difference of zero

 #define POW_SF2_ZERO    200    ///< ff_aac_pow2sf_tab index corresponding to pow(2, 0)

 #define NOISE_PRE       256    ///< preamble for NOISE_BT, put in bitstream with the first noise band
 #define NOISE_PRE_BITS    9    ///< length of the preamble in bits
 #define NOISE_OFFSET     90    ///< subtracted from global gain, used as offset for the preamble

 /**
  * Long Term Prediction
  *
  * LTP parameters embedded in IndividualChannelStream.
  */
 typedef struct LongTermPrediction {
     int8_t present;
     int16_t lag;
     int coef_idx;                   ///< NOTE(review): presumably the coded index from which coef is derived - confirm
     INTFLOAT coef;
     int8_t used[MAX_LTP_LONG_SFB];  ///< MAX_LTP_LONG_SFB flags; presumably one per scalefactor band - TODO confirm
 } LongTermPrediction;

 /**
  * Individual Channel Stream
  *
  * Per-channel window, grouping, scalefactor-band and prediction side
  * information.
  * NOTE(review): the two-element arrays (window_sequence, use_kb_window)
  * presumably hold the current and previous frame's values - confirm.
  */
 typedef struct IndividualChannelStream {
     uint8_t max_sfb;            ///< number of scalefactor bands per group
     enum WindowSequence window_sequence[2];
     uint8_t use_kb_window[2];   ///< If set, use Kaiser-Bessel window, otherwise use a sine window.
     int num_window_groups;
     uint8_t group_len[8];
     LongTermPrediction ltp;
     const uint16_t *swb_offset; ///< table of offsets to the lowest spectral coefficient of a scalefactor band, sfb, for a particular window
     const uint8_t *swb_sizes;   ///< table of scalefactor band sizes for a particular window
     int num_swb;                ///< number of scalefactor window bands
     int num_windows;
     int tns_max_bands;
     int predictor_present;
     int predictor_initialized;
     int predictor_reset_group;
     int predictor_reset_count[31];  ///< used by encoder to count prediction resets
     uint8_t prediction_used[41];
     uint8_t window_clipping[8]; ///< set if a certain window is near clipping
     float clip_avoidance_factor; ///< set, if any window is near clipping, to the attenuation factor necessary to avoid it
 } IndividualChannelStream;

 /**
  * Temporal Noise Shaping
  *
  * Filter parameters are stored in [8][4] tables, with TNS_MAX_ORDER
  * coefficient slots per filter.
  * NOTE(review): the indices are presumably [window][filter][coefficient],
  * with n_filt[w] giving the number of filters for window w - confirm.
  */
 typedef struct TemporalNoiseShaping {
     int present;
     int n_filt[8];
     int length[8][4];
     int direction[8][4];
     int order[8][4];
     int coef_idx[8][4][TNS_MAX_ORDER];
     INTFLOAT coef[8][4][TNS_MAX_ORDER];
 } TemporalNoiseShaping;

 /**
  * Dynamic Range Control - decoded from the bitstream but not processed further.
  *
  * The per-band arrays (dyn_rng_sgn, dyn_rng_ctl, band_top) hold 17 entries
  * each; exclude_mask holds one entry per channel (MAX_CHANNELS).
  */
 typedef struct DynamicRangeControl {
     int pce_instance_tag;                           ///< Indicates with which program the DRC info is associated.
     int dyn_rng_sgn[17];                            ///< DRC sign information; 0 - positive, 1 - negative
     int dyn_rng_ctl[17];                            ///< DRC magnitude information
     int exclude_mask[MAX_CHANNELS];                 ///< Channels to be excluded from DRC processing.
     int band_incr;                                  ///< Number of DRC bands greater than 1 having DRC info.
     int interpolation_scheme;                       ///< Indicates the interpolation scheme used in the SBR QMF domain.
     int band_top[17];                               ///< Indicates the top of the i-th DRC band in units of 4 spectral lines.
     int prog_ref_level;                             /**< A reference level for the long-term program audio level for all
                                                      *   channels combined.
                                                      */
 } DynamicRangeControl;

 /**
  * Pulse data; room for four entries in pos and amp.
  * NOTE(review): presumably num_pulse is the number of valid pos/amp
  * entries - confirm at the use site.
  */
 typedef struct Pulse {
     int num_pulse;
     int start;
     int pos[4];
     int amp[4];
 } Pulse;

 /**
  * coupling parameters
  *
  * The per-target arrays (type, id_select, ch_select) have room for 8
  * coupled target elements; num_coupled gives the number of targets.
  */
 typedef struct ChannelCoupling {
     enum CouplingPoint coupling_point;  ///< The point during decoding at which coupling is applied.
     int num_coupled;       ///< number of target elements
     enum RawDataBlockType type[8];   ///< Type of channel element to be coupled - SCE or CPE.
     int id_select[8];      ///< element id
     int ch_select[8];      /**< [0] shared list of gains; [1] list of gains for right channel;
                             *   [2] list of gains for left channel; [3] lists of gains for both channels
                             */
     INTFLOAT gain[16][120]; ///< coupling gains; NOTE(review): presumably [gain list][scalefactor band] - confirm
 } ChannelCoupling;

 /**
  * Single Channel Element - used for both SCE and LFE elements.
  *
  * Bundles the channel's stream info, TNS and pulse data, per-band tables
  * and the aligned coefficient/sample buffers. Note that the per-band
  * tables are not all the same length: band_type_run_end and sf hold 120
  * entries, the others 128.
  */
 typedef struct SingleChannelElement {
     IndividualChannelStream ics;
     TemporalNoiseShaping tns;
     Pulse pulse;
     enum BandType band_type[128];                   ///< band types
     enum BandType band_alt[128];                    ///< alternative band type (used by encoder)
     int band_type_run_end[120];                     ///< band type run end points
     INTFLOAT sf[120];                               ///< scalefactors
     int sf_idx[128];                                ///< scalefactor indices (used by encoder)
     uint8_t zeroes[128];                            ///< band is not coded (used by encoder)
     uint8_t can_pns[128];                           ///< band is allowed to PNS (informative)
     float  is_ener[128];                            ///< Intensity stereo pos (used by encoder)
     float pns_ener[128];                            ///< Noise energy values (used by encoder)
     DECLARE_ALIGNED(32, INTFLOAT, pcoeffs)[1024];   ///< coefficients for IMDCT, pristine
     DECLARE_ALIGNED(32, INTFLOAT, coeffs)[1024];    ///< coefficients for IMDCT, maybe processed
     DECLARE_ALIGNED(32, INTFLOAT, saved)[1536];     ///< overlap
     DECLARE_ALIGNED(32, INTFLOAT, ret_buf)[2048];   ///< PCM output buffer
     DECLARE_ALIGNED(16, INTFLOAT, ltp_state)[3072]; ///< time signal for LTP
     DECLARE_ALIGNED(32, AAC_FLOAT, lcoeffs)[1024];  ///< MDCT of LTP coefficients (used by encoder)
     DECLARE_ALIGNED(32, AAC_FLOAT, prcoeffs)[1024]; ///< Main prediction coefs (used by encoder)
     PredictorState predictor_state[MAX_PREDICTORS]; ///< one PredictorState per predictor
     INTFLOAT *ret;                                  ///< PCM output
 } SingleChannelElement;

 /**
  * channel element - generic struct for SCE/CPE/CCE/LFE
  *
  * Contains two SingleChannelElement slots plus the fields that are only
  * meaningful for channel pairs (CPE) or coupling elements (CCE).
  */
 typedef struct ChannelElement {
     int present;
     // CPE specific
     int common_window;        ///< Set if channels share a common 'IndividualChannelStream' in bitstream.
     int     ms_mode;          ///< Signals mid/side stereo flags coding mode (used by encoder)
     uint8_t is_mode;          ///< Set if any bands have been encoded using intensity stereo (used by encoder)
     uint8_t ms_mask[128];     ///< Set if mid/side stereo is used for each scalefactor window band
     uint8_t is_mask[128];     ///< Set if intensity stereo is used (used by encoder)
     // shared
     SingleChannelElement ch[2];
     // CCE specific
     ChannelCoupling coup;
     SpectralBandReplication sbr; ///< spectral band replication state (see sbr.h)
 } ChannelElement;

 /**
  * main AAC context
  *
  * Holds the codec/frame handles, the channel element tables, the
  * transform contexts set up at initialization, the output configuration
  * and a table of function pointers for the core decoding steps.
  */
 struct AACContext {
     AVClass        *class;
     AVCodecContext *avctx;
     AVFrame *frame;

     int is_saved;                 ///< Set if elements have stored overlap from previous frame.
     DynamicRangeControl che_drc;

     /**
      * @name Channel element related data
      * NOTE(review): the first index (size 4) presumably is the element type
      * TYPE_SCE..TYPE_LFE (values 0..3) and the second the element id - confirm.
      * @{
      */
     ChannelElement          *che[4][MAX_ELEM_ID];
     ChannelElement  *tag_che_map[4][MAX_ELEM_ID];
     int tags_mapped;
     int warned_remapping_once;
     /** @} */

     /**
      * @name Aligned temporary buffers
      * (We do not want to have these on the stack.)
      * @{
      */
     DECLARE_ALIGNED(32, INTFLOAT, buf_mdct)[1024];
     /** @} */

     /**
      * @name Computed / set up during initialization
      * The fixed-point build has only a fixed-point DSP context; the
      * floating-point build additionally has three MDCT15 contexts.
      * @{
      */
     FFTContext mdct;
     FFTContext mdct_small;
     FFTContext mdct_ld;
     FFTContext mdct_ltp;
 #if USE_FIXED
     AVFixedDSPContext *fdsp;
 #else
     MDCT15Context *mdct120;
     MDCT15Context *mdct480;
     MDCT15Context *mdct960;
     AVFloatDSPContext *fdsp;
 #endif /* USE_FIXED */
     int random_state;
     /** @} */

     /**
      * @name Members used for output
      * @{
      */
     SingleChannelElement *output_element[MAX_CHANNELS]; ///< Points to each SingleChannelElement
     /** @} */


     /**
      * @name Japanese DTV specific extension
      * @{
      */
     int force_dmono_mode;///< 0->not dmono, 1->use first channel, 2->use second channel
     int dmono_mode;      ///< 0->not dmono, 1->use first channel, 2->use second channel
     /** @} */

     DECLARE_ALIGNED(32, INTFLOAT, temp)[128];

     OutputConfiguration oc[2];
     int warned_num_aac_frames;
     int warned_960_sbr;

     int warned_gain_control;

     /* aacdec function pointers */
     /** Conduct IMDCT and windowing. */
     void (*imdct_and_windowing)(AACContext *ac, SingleChannelElement *sce);
     /** Apply the long term prediction. */
     void (*apply_ltp)(AACContext *ac, SingleChannelElement *sce);
     /** Decode Temporal Noise Shaping filter coefficients and apply all-pole filters. */
     void (*apply_tns)(INTFLOAT coef[1024], TemporalNoiseShaping *tns,
                       IndividualChannelStream *ics, int decode);
     /** Apply windowing and MDCT to obtain the spectral coefficients from the samples predicted by LTP. */
     void (*windowing_and_mdct_ltp)(AACContext *ac, INTFLOAT *out,
                                    INTFLOAT *in, IndividualChannelStream *ics);
     /** Update the LTP buffer for next frame. */
     void (*update_ltp)(AACContext *ac, SingleChannelElement *sce);
     /* The two pointers below operate on int data; their implementations live in aacdec_fixed.c. */
     void (*vector_pow43)(int *coefs, int len);
     void (*subband_scale)(int *dst, int *src, int scale, int offset, int len);

 };

 /**
  * MIPS-specific initialization of an AAC context (defined in aacdec_mips.c).
  * NOTE(review): presumably installs MIPS-optimized implementations into the
  * AACContext function pointers - confirm in aacdec_mips.c.
  *
  * @param c AAC context to initialize
  */
 void ff_aacdec_init_mips(AACContext *c);

 #endif /* AVCODEC_AAC_H */
IndividualChannelStream::predictor_initialized
int predictor_initialized
Definition: aac.h:187

AACContext::fdsp
AVFloatDSPContext * fdsp
Definition: aac.h:333

LongTermPrediction::coef_idx
int coef_idx
Definition: aac.h:166

imdct_and_windowing
static void imdct_and_windowing(AACContext *ac, SingleChannelElement *sce)
Conduct IMDCT and windowing.
Definition: aacdec_template.c:2639

apply_ltp
static void apply_ltp(AACContext *ac, SingleChannelElement *sce)
Apply the long term prediction.
Definition: aacdec_template.c:2569

RESERVED_BT
Band types following are encoded differently from others.
Definition: aac.h:86

TYPE_DSE
Definition: aac.h:60

AVFrame
This structure describes decoded (raw) audio or video data.
Definition: frame.h:218

OutputConfiguration::channels
int channels
Definition: aac.h:127

LONG_STOP_SEQUENCE
Definition: aac.h:79

AACContext::avctx
AVCodecContext * avctx
Definition: aac.h:295

Pulse
Definition: aac.h:224

AVFixedDSPContext
Definition: fixed_dsp.h:56

temp
else temp
Definition: vf_mcdeint.c:256

TYPE_END
Definition: aac.h:63

TYPE_SCE
Definition: aac.h:56

TYPE_CPE
Definition: aac.h:57

mpeg4audio.h

float_dsp.h

ch
uint8_t pi<< 24) CONV_FUNC(AV_SAMPLE_FMT_S64, int64_t, AV_SAMPLE_FMT_U8,(uint64_t)((*(const uint8_t *) pi - 0x80U))<< 56) CONV_FUNC(AV_SAMPLE_FMT_FLT, float, AV_SAMPLE_FMT_U8,(*(const uint8_t *) pi - 0x80) *(1.0f/(1<< 7))) CONV_FUNC(AV_SAMPLE_FMT_DBL, double, AV_SAMPLE_FMT_U8,(*(const uint8_t *) pi - 0x80) *(1.0/(1<< 7))) CONV_FUNC(AV_SAMPLE_FMT_U8, uint8_t, AV_SAMPLE_FMT_S16,(*(const int16_t *) pi >>8)+0x80) CONV_FUNC(AV_SAMPLE_FMT_S64, int64_t, AV_SAMPLE_FMT_S16,(uint64_t)(*(const int16_t *) pi)<< 48) CONV_FUNC(AV_SAMPLE_FMT_FLT, float, AV_SAMPLE_FMT_S16, *(const int16_t *) pi *(1.0f/(1<< 15))) CONV_FUNC(AV_SAMPLE_FMT_DBL, double, AV_SAMPLE_FMT_S16, *(const int16_t *) pi *(1.0/(1<< 15))) CONV_FUNC(AV_SAMPLE_FMT_U8, uint8_t, AV_SAMPLE_FMT_S32,(*(const int32_t *) pi >>24)+0x80) CONV_FUNC(AV_SAMPLE_FMT_S64, int64_t, AV_SAMPLE_FMT_S32,(uint64_t)(*(const int32_t *) pi)<< 32) CONV_FUNC(AV_SAMPLE_FMT_FLT, float, AV_SAMPLE_FMT_S32, *(const int32_t *) pi *(1.0f/(1U<< 31))) CONV_FUNC(AV_SAMPLE_FMT_DBL, double, AV_SAMPLE_FMT_S32, *(const int32_t *) pi *(1.0/(1U<< 31))) CONV_FUNC(AV_SAMPLE_FMT_U8, uint8_t, AV_SAMPLE_FMT_S64,(*(const int64_t *) pi >>56)+0x80) CONV_FUNC(AV_SAMPLE_FMT_FLT, float, AV_SAMPLE_FMT_S64, *(const int64_t *) pi *(1.0f/(INT64_C(1)<< 63))) CONV_FUNC(AV_SAMPLE_FMT_DBL, double, AV_SAMPLE_FMT_S64, *(const int64_t *) pi *(1.0/(INT64_C(1)<< 63))) CONV_FUNC(AV_SAMPLE_FMT_U8, uint8_t, AV_SAMPLE_FMT_FLT, av_clip_uint8(lrintf(*(const float *) pi *(1<< 7))+0x80)) CONV_FUNC(AV_SAMPLE_FMT_S16, int16_t, AV_SAMPLE_FMT_FLT, av_clip_int16(lrintf(*(const float *) pi *(1<< 15)))) CONV_FUNC(AV_SAMPLE_FMT_S32, int32_t, AV_SAMPLE_FMT_FLT, av_clipl_int32(llrintf(*(const float *) pi *(1U<< 31)))) CONV_FUNC(AV_SAMPLE_FMT_S64, int64_t, AV_SAMPLE_FMT_FLT, llrintf(*(const float *) pi *(INT64_C(1)<< 63))) CONV_FUNC(AV_SAMPLE_FMT_U8, uint8_t, AV_SAMPLE_FMT_DBL, av_clip_uint8(lrint(*(const double *) pi *(1<< 7))+0x80)) CONV_FUNC(AV_SAMPLE_FMT_S16, int16_t, AV_SAMPLE_FMT_DBL, 
av_clip_int16(lrint(*(const double *) pi *(1<< 15)))) CONV_FUNC(AV_SAMPLE_FMT_S32, int32_t, AV_SAMPLE_FMT_DBL, av_clipl_int32(llrint(*(const double *) pi *(1U<< 31)))) CONV_FUNC(AV_SAMPLE_FMT_S64, int64_t, AV_SAMPLE_FMT_DBL, llrint(*(const double *) pi *(INT64_C(1)<< 63))) #define FMT_PAIR_FUNC(out, in) static conv_func_type *const fmt_pair_to_conv_functions[AV_SAMPLE_FMT_NB *AV_SAMPLE_FMT_NB]={ FMT_PAIR_FUNC(AV_SAMPLE_FMT_U8, AV_SAMPLE_FMT_U8), FMT_PAIR_FUNC(AV_SAMPLE_FMT_S16, AV_SAMPLE_FMT_U8), FMT_PAIR_FUNC(AV_SAMPLE_FMT_S32, AV_SAMPLE_FMT_U8), FMT_PAIR_FUNC(AV_SAMPLE_FMT_FLT, AV_SAMPLE_FMT_U8), FMT_PAIR_FUNC(AV_SAMPLE_FMT_DBL, AV_SAMPLE_FMT_U8), FMT_PAIR_FUNC(AV_SAMPLE_FMT_S64, AV_SAMPLE_FMT_U8), FMT_PAIR_FUNC(AV_SAMPLE_FMT_U8, AV_SAMPLE_FMT_S16), FMT_PAIR_FUNC(AV_SAMPLE_FMT_S16, AV_SAMPLE_FMT_S16), FMT_PAIR_FUNC(AV_SAMPLE_FMT_S32, AV_SAMPLE_FMT_S16), FMT_PAIR_FUNC(AV_SAMPLE_FMT_FLT, AV_SAMPLE_FMT_S16), FMT_PAIR_FUNC(AV_SAMPLE_FMT_DBL, AV_SAMPLE_FMT_S16), FMT_PAIR_FUNC(AV_SAMPLE_FMT_S64, AV_SAMPLE_FMT_S16), FMT_PAIR_FUNC(AV_SAMPLE_FMT_U8, AV_SAMPLE_FMT_S32), FMT_PAIR_FUNC(AV_SAMPLE_FMT_S16, AV_SAMPLE_FMT_S32), FMT_PAIR_FUNC(AV_SAMPLE_FMT_S32, AV_SAMPLE_FMT_S32), FMT_PAIR_FUNC(AV_SAMPLE_FMT_FLT, AV_SAMPLE_FMT_S32), FMT_PAIR_FUNC(AV_SAMPLE_FMT_DBL, AV_SAMPLE_FMT_S32), FMT_PAIR_FUNC(AV_SAMPLE_FMT_S64, AV_SAMPLE_FMT_S32), FMT_PAIR_FUNC(AV_SAMPLE_FMT_U8, AV_SAMPLE_FMT_FLT), FMT_PAIR_FUNC(AV_SAMPLE_FMT_S16, AV_SAMPLE_FMT_FLT), FMT_PAIR_FUNC(AV_SAMPLE_FMT_S32, AV_SAMPLE_FMT_FLT), FMT_PAIR_FUNC(AV_SAMPLE_FMT_FLT, AV_SAMPLE_FMT_FLT), FMT_PAIR_FUNC(AV_SAMPLE_FMT_DBL, AV_SAMPLE_FMT_FLT), FMT_PAIR_FUNC(AV_SAMPLE_FMT_S64, AV_SAMPLE_FMT_FLT), FMT_PAIR_FUNC(AV_SAMPLE_FMT_U8, AV_SAMPLE_FMT_DBL), FMT_PAIR_FUNC(AV_SAMPLE_FMT_S16, AV_SAMPLE_FMT_DBL), FMT_PAIR_FUNC(AV_SAMPLE_FMT_S32, AV_SAMPLE_FMT_DBL), FMT_PAIR_FUNC(AV_SAMPLE_FMT_FLT, AV_SAMPLE_FMT_DBL), FMT_PAIR_FUNC(AV_SAMPLE_FMT_DBL, AV_SAMPLE_FMT_DBL), FMT_PAIR_FUNC(AV_SAMPLE_FMT_S64, AV_SAMPLE_FMT_DBL), 
FMT_PAIR_FUNC(AV_SAMPLE_FMT_U8, AV_SAMPLE_FMT_S64), FMT_PAIR_FUNC(AV_SAMPLE_FMT_S16, AV_SAMPLE_FMT_S64), FMT_PAIR_FUNC(AV_SAMPLE_FMT_S32, AV_SAMPLE_FMT_S64), FMT_PAIR_FUNC(AV_SAMPLE_FMT_FLT, AV_SAMPLE_FMT_S64), FMT_PAIR_FUNC(AV_SAMPLE_FMT_DBL, AV_SAMPLE_FMT_S64), FMT_PAIR_FUNC(AV_SAMPLE_FMT_S64, AV_SAMPLE_FMT_S64), };static void cpy1(uint8_t **dst, const uint8_t **src, int len){ memcpy(*dst, *src, len);} static void cpy2(uint8_t **dst, const uint8_t **src, int len){ memcpy(*dst, *src, 2 *len);} static void cpy4(uint8_t **dst, const uint8_t **src, int len){ memcpy(*dst, *src, 4 *len);} static void cpy8(uint8_t **dst, const uint8_t **src, int len){ memcpy(*dst, *src, 8 *len);} AudioConvert *swri_audio_convert_alloc(enum AVSampleFormat out_fmt, enum AVSampleFormat in_fmt, int channels, const int *ch_map, int flags) { AudioConvert *ctx;conv_func_type *f=fmt_pair_to_conv_functions[av_get_packed_sample_fmt(out_fmt)+AV_SAMPLE_FMT_NB *av_get_packed_sample_fmt(in_fmt)];if(!f) return NULL;ctx=av_mallocz(sizeof(*ctx));if(!ctx) return NULL;if(channels==1){ in_fmt=av_get_planar_sample_fmt(in_fmt);out_fmt=av_get_planar_sample_fmt(out_fmt);} ctx->channels=channels;ctx->conv_f=f;ctx->ch_map=ch_map;if(in_fmt==AV_SAMPLE_FMT_U8||in_fmt==AV_SAMPLE_FMT_U8P) memset(ctx->silence, 0x80, sizeof(ctx->silence));if(out_fmt==in_fmt &&!ch_map) { switch(av_get_bytes_per_sample(in_fmt)){ case 1:ctx->simd_f=cpy1;break;case 2:ctx->simd_f=cpy2;break;case 4:ctx->simd_f=cpy4;break;case 8:ctx->simd_f=cpy8;break;} } if(HAVE_X86ASM &&HAVE_MMX) swri_audio_convert_init_x86(ctx, out_fmt, in_fmt, channels);if(ARCH_ARM) swri_audio_convert_init_arm(ctx, out_fmt, in_fmt, channels);if(ARCH_AARCH64) swri_audio_convert_init_aarch64(ctx, out_fmt, in_fmt, channels);return ctx;} void swri_audio_convert_free(AudioConvert **ctx) { av_freep(ctx);} int swri_audio_convert(AudioConvert *ctx, AudioData *out, AudioData *in, int len) { int ch;int off=0;const int os=(out->planar ? 
1 :out->ch_count) *out->bps;unsigned misaligned=0;av_assert0(ctx->channels==out->ch_count);if(ctx->in_simd_align_mask) { int planes=in->planar ? in->ch_count :1;unsigned m=0;for(ch=0;ch< planes;ch++) m|=(intptr_t) in->ch[ch];misaligned|=m &ctx->in_simd_align_mask;} if(ctx->out_simd_align_mask) { int planes=out->planar ? out->ch_count :1;unsigned m=0;for(ch=0;ch< planes;ch++) m|=(intptr_t) out->ch[ch];misaligned|=m &ctx->out_simd_align_mask;} if(ctx->simd_f &&!ctx->ch_map &&!misaligned){ off=len &~15;av_assert1(off >=0);av_assert1(off<=len);av_assert2(ctx->channels==SWR_CH_MAX||!in->ch[ctx->channels]);if(off >0){ if(out->planar==in->planar){ int planes=out->planar ? out->ch_count :1;for(ch=0;ch< planes;ch++){ ctx->simd_f(out-> ch ch
Definition: audioconvert.c:56

IndividualChannelStream::tns_max_bands
int tns_max_bands
Definition: aac.h:185

SingleChannelElement::ret
INTFLOAT * ret
PCM output.
Definition: aac.h:269

ChannelElement::present
int present
Definition: aac.h:276

ChannelElement::common_window
int common_window
Set if channels share a common 'IndividualChannelStream' in bitstream.
Definition: aac.h:278

update_ltp
static void update_ltp(AACContext *ac, SingleChannelElement *sce)
Update the LTP buffer for next frame.
Definition: aacdec_template.c:2601

vector_pow43
static void vector_pow43(int *coefs, int len)
Definition: aacdec_fixed.c:151

OutputConfiguration::channel_layout
uint64_t channel_layout
Definition: aac.h:128

subband_scale
static void subband_scale(int *dst, int *src, int scale, int offset, int len)
Definition: aacdec_fixed.c:165

MAX_LTP_LONG_SFB
#define MAX_LTP_LONG_SFB
Definition: aac.h:51

DynamicRangeControl
Dynamic Range Control - decoded from the bitstream but not processed further.
Definition: aac.h:211

src
#define src
Definition: vp8dsp.c:254

ChannelPosition
ChannelPosition
Definition: aac.h:94

OutputConfiguration
Definition: aac.h:123

decode
static void decode(AVCodecContext *dec_ctx, AVPacket *pkt, AVFrame *frame, FILE *outfile)
Definition: decode_audio.c:42

NOISE_BT
Spectral data are scaled white noise not coded in the bitstream.
Definition: aac.h:87

TYPE_CCE
Definition: aac.h:58

fixed_dsp.h

AAC_CHANNEL_OFF
Definition: aac.h:95

mdct15.h

DynamicRangeControl::band_incr
int band_incr
Number of DRC bands greater than 1 having DRC info.
Definition: aac.h:216

AACContext::dmono_mode
int dmono_mode
0->not dmono, 1->use first channel, 2->use second channel
Definition: aac.h:351

IndividualChannelStream::swb_offset
const uint16_t * swb_offset
table of offsets to the lowest spectral coefficient of a scalefactor band, sfb, for a particular wind...
Definition: aac.h:181

INTFLOAT
float INTFLOAT
Definition: aac_defines.h:86

EXT_FILL
Definition: aac.h:67

PredictorState::cor0
AAC_FLOAT cor0
Definition: aac.h:136

BandType
BandType
Definition: aac.h:82

uint8_t
uint8_t
Definition: audio_convert.c:194

EIGHT_SHORT_SEQUENCE
Definition: aac.h:78

OutputConfiguration::layout_map
uint8_t layout_map[MAX_ELEM_ID *4][3]
Definition: aac.h:125

PredictorState::var1
AAC_FLOAT var1
Definition: aac.h:139

OC_TRIAL_PCE
Output configuration under trial specified by an inband PCE.
Definition: aac.h:117

AACContext::warned_960_sbr
int warned_960_sbr
Definition: aac.h:358

TYPE_LFE
Definition: aac.h:59

IndividualChannelStream::num_window_groups
int num_window_groups
Definition: aac.h:178

SingleChannelElement::tns
TemporalNoiseShaping tns
Definition: aac.h:250

CouplingPoint
CouplingPoint
The point during decoding at which channel coupling is applied.
Definition: aac.h:106

ChannelCoupling::num_coupled
int num_coupled
number of target elements
Definition: aac.h:236

EXT_FILL_DATA
Definition: aac.h:68

AACContext::mdct_ltp
FFTContext mdct_ltp
Definition: aac.h:326

DECLARE_ALIGNED
#define DECLARE_ALIGNED(n, t, v)
Declare a variable that is aligned in memory.
Definition: mem.h:112

PredictorState::cor1
AAC_FLOAT cor1
Definition: aac.h:137

INTENSITY_BT
Scalefactor data are intensity stereo positions (in phase).
Definition: aac.h:89

OC_GLOBAL_HDR
Output configuration set in a global header but not yet locked.
Definition: aac.h:119

AAC_CHANNEL_LFE
Definition: aac.h:99

AACContext::random_state
int random_state
Definition: aac.h:335

AACContext::mdct480
MDCT15Context * mdct480
Definition: aac.h:331

OutputConfiguration::m4ac
MPEG4AudioConfig m4ac
Definition: aac.h:124

PredictorState::r1
AAC_FLOAT r1
Definition: aac.h:141

ChannelElement::sbr
SpectralBandReplication sbr
Definition: aac.h:287

AACContext::mdct_small
FFTContext mdct_small
Definition: aac.h:324

IndividualChannelStream::num_windows
int num_windows
Definition: aac.h:184

ExtensionPayloadID
ExtensionPayloadID
Definition: aac.h:66

PredictorState::r0
AAC_FLOAT r0
Definition: aac.h:140

EXT_DATA_ELEMENT
Definition: aac.h:69

sbr.h
Spectral Band Replication definitions and structures.

IndividualChannelStream::max_sfb
uint8_t max_sfb
number of scalefactor bands per group
Definition: aac.h:175

TYPE_FIL
Definition: aac.h:62

offset
static const uint8_t offset[127][2]
Definition: vf_spp.c:92

WindowSequence
WindowSequence
Definition: aac.h:75

IndividualChannelStream::num_swb
int num_swb
number of scalefactor window bands
Definition: aac.h:183

aac_defines.h

MPEG4AudioConfig
Definition: mpeg4audio.h:33

DynamicRangeControl::prog_ref_level
int prog_ref_level
A reference level for the long-term program audio level for all channels combined.
Definition: aac.h:219

OC_LOCKED
Output configuration locked in place.
Definition: aac.h:120

PredictorState
Predictor State.
Definition: aac.h:135

AACContext::warned_remapping_once
int warned_remapping_once
Definition: aac.h:308

PredictorState::x_est
AAC_FLOAT x_est
Definition: aac.h:143

FFTContext
Definition: fft.h:88

IndividualChannelStream::predictor_reset_group
int predictor_reset_group
Definition: aac.h:188

BETWEEN_TNS_AND_IMDCT
Definition: aac.h:108

AFTER_IMDCT
Definition: aac.h:109

AACContext::mdct120
MDCT15Context * mdct120
Definition: aac.h:330

AAC_FLOAT
float AAC_FLOAT
Definition: aac_defines.h:90

AACContext::mdct_ld
FFTContext mdct_ld
Definition: aac.h:325

ff_aacdec_init_mips
void ff_aacdec_init_mips(AACContext *c)
Definition: aacdec_mips.c:433

AVFloatDSPContext
Definition: float_dsp.h:24

DynamicRangeControl::pce_instance_tag
int pce_instance_tag
Indicates with which program the DRC info is associated.
Definition: aac.h:212

windowing_and_mdct_ltp
static void windowing_and_mdct_ltp(AACContext *ac, INTFLOAT *out, INTFLOAT *in, IndividualChannelStream *ics)
Apply windowing and MDCT to obtain the spectral coefficient from the predicted sample by LTP...
Definition: aacdec_template.c:2543

TemporalNoiseShaping::present
int present
Definition: aac.h:199

AAC_CHANNEL_SIDE
Definition: aac.h:97

DynamicRangeControl::interpolation_scheme
int interpolation_scheme
Indicates the interpolation scheme used in the SBR QMF domain.
Definition: aac.h:217

ChannelCoupling
coupling parameters
Definition: aac.h:234

EXT_SBR_DATA
Definition: aac.h:71

AACContext::tags_mapped
int tags_mapped
Definition: aac.h:307

AACContext::mdct960
MDCT15Context * mdct960
Definition: aac.h:332

AACContext::force_dmono_mode
int force_dmono_mode
0->not dmono, 1->use first channel, 2->use second channel
Definition: aac.h:350

AACContext::is_saved
int is_saved
Set if elements have stored overlap from previous frame.
Definition: aac.h:298

AACContext::warned_num_aac_frames
int warned_num_aac_frames
Definition: aac.h:357

EXT_DYNAMIC_RANGE
Definition: aac.h:70

avcodec.h
Libavcodec external API header.

void
typedef void(RENAME(mix_any_func_type))
Definition: rematrix_template.c:52

TemporalNoiseShaping
Temporal Noise Shaping.
Definition: aac.h:198

LONG_START_SEQUENCE
Definition: aac.h:77

IndividualChannelStream::predictor_present
int predictor_present
Definition: aac.h:186

LongTermPrediction
Long Term Prediction.
Definition: aac.h:163

apply_tns
static void apply_tns(INTFLOAT coef_param[1024], TemporalNoiseShaping *tns, IndividualChannelStream *ics, int decode)
Decode Temporal Noise Shaping filter coefficients and apply all-pole filters; reference: 4...
Definition: aacdec_template.c:2486

AVCodecContext
main external API structure.
Definition: avcodec.h:1518

SingleChannelElement::pulse
Pulse pulse
Definition: aac.h:251

SingleChannelElement::ics
IndividualChannelStream ics
Definition: aac.h:249

MAX_PREDICTORS
#define MAX_PREDICTORS
Definition: aac.h:146

in
uint8_t pi<< 24) CONV_FUNC_GROUP(AV_SAMPLE_FMT_FLT, float, AV_SAMPLE_FMT_U8, uint8_t,(*(const uint8_t *) pi - 0x80) *(1.0f/(1<< 7))) CONV_FUNC_GROUP(AV_SAMPLE_FMT_DBL, double, AV_SAMPLE_FMT_U8, uint8_t,(*(const uint8_t *) pi - 0x80) *(1.0/(1<< 7))) CONV_FUNC_GROUP(AV_SAMPLE_FMT_U8, uint8_t, AV_SAMPLE_FMT_S16, int16_t,(*(const int16_t *) pi >> 8)+0x80) CONV_FUNC_GROUP(AV_SAMPLE_FMT_FLT, float, AV_SAMPLE_FMT_S16, int16_t, *(const int16_t *) pi *(1.0f/(1<< 15))) CONV_FUNC_GROUP(AV_SAMPLE_FMT_DBL, double, AV_SAMPLE_FMT_S16, int16_t, *(const int16_t *) pi *(1.0/(1<< 15))) CONV_FUNC_GROUP(AV_SAMPLE_FMT_U8, uint8_t, AV_SAMPLE_FMT_S32, int32_t,(*(const int32_t *) pi >> 24)+0x80) CONV_FUNC_GROUP(AV_SAMPLE_FMT_FLT, float, AV_SAMPLE_FMT_S32, int32_t, *(const int32_t *) pi *(1.0f/(1U<< 31))) CONV_FUNC_GROUP(AV_SAMPLE_FMT_DBL, double, AV_SAMPLE_FMT_S32, int32_t, *(const int32_t *) pi *(1.0/(1U<< 31))) CONV_FUNC_GROUP(AV_SAMPLE_FMT_U8, uint8_t, AV_SAMPLE_FMT_FLT, float, av_clip_uint8(lrintf(*(const float *) pi *(1<< 7))+0x80)) CONV_FUNC_GROUP(AV_SAMPLE_FMT_S16, int16_t, AV_SAMPLE_FMT_FLT, float, av_clip_int16(lrintf(*(const float *) pi *(1<< 15)))) CONV_FUNC_GROUP(AV_SAMPLE_FMT_S32, int32_t, AV_SAMPLE_FMT_FLT, float, av_clipl_int32(llrintf(*(const float *) pi *(1U<< 31)))) CONV_FUNC_GROUP(AV_SAMPLE_FMT_U8, uint8_t, AV_SAMPLE_FMT_DBL, double, av_clip_uint8(lrint(*(const double *) pi *(1<< 7))+0x80)) CONV_FUNC_GROUP(AV_SAMPLE_FMT_S16, int16_t, AV_SAMPLE_FMT_DBL, double, av_clip_int16(lrint(*(const double *) pi *(1<< 15)))) CONV_FUNC_GROUP(AV_SAMPLE_FMT_S32, int32_t, AV_SAMPLE_FMT_DBL, double, av_clipl_int32(llrint(*(const double *) pi *(1U<< 31)))) #define SET_CONV_FUNC_GROUP(ofmt, ifmt) static void set_generic_function(AudioConvert *ac) { } void ff_audio_convert_free(AudioConvert **ac) { if(! 
*ac) return;ff_dither_free(&(*ac) ->dc);av_freep(ac);} AudioConvert *ff_audio_convert_alloc(AVAudioResampleContext *avr, enum AVSampleFormat out_fmt, enum AVSampleFormat in_fmt, int channels, int sample_rate, int apply_map) { AudioConvert *ac;int in_planar, out_planar;ac=av_mallocz(sizeof(*ac));if(!ac) return NULL;ac->avr=avr;ac->out_fmt=out_fmt;ac->in_fmt=in_fmt;ac->channels=channels;ac->apply_map=apply_map;if(avr->dither_method !=AV_RESAMPLE_DITHER_NONE &&av_get_packed_sample_fmt(out_fmt)==AV_SAMPLE_FMT_S16 &&av_get_bytes_per_sample(in_fmt) > 2) { ac->dc=ff_dither_alloc(avr, out_fmt, in_fmt, channels, sample_rate, apply_map);if(!ac->dc) { av_free(ac);return NULL;} return ac;} in_planar=ff_sample_fmt_is_planar(in_fmt, channels);out_planar=ff_sample_fmt_is_planar(out_fmt, channels);if(in_planar==out_planar) { ac->func_type=CONV_FUNC_TYPE_FLAT;ac->planes=in_planar ? ac->channels :1;} else if(in_planar) ac->func_type=CONV_FUNC_TYPE_INTERLEAVE;else ac->func_type=CONV_FUNC_TYPE_DEINTERLEAVE;set_generic_function(ac);if(ARCH_AARCH64) ff_audio_convert_init_aarch64(ac);if(ARCH_ARM) ff_audio_convert_init_arm(ac);if(ARCH_X86) ff_audio_convert_init_x86(ac);return ac;} int ff_audio_convert(AudioConvert *ac, AudioData *out, AudioData *in) { int use_generic=1;int len=in->nb_samples;int p;if(ac->dc) { av_log(ac->avr, AV_LOG_TRACE, "%d samples - audio_convert: %s to %s (dithered)\", len, av_get_sample_fmt_name(ac->in_fmt), av_get_sample_fmt_name(ac->out_fmt));return ff_convert_dither(ac-> in
Definition: audio_convert.c:194

MAX_ELEM_ID
#define MAX_ELEM_ID
Definition: aac.h:48

AVClass
Describe the class of an AVClass context structure.
Definition: log.h:67

ESC_BT
Spectral data are coded with an escape sequence.
Definition: aac.h:85

AAC_CHANNEL_BACK
Definition: aac.h:98

type
cl_device_type type
Definition: hwcontext_opencl.c:189

IndividualChannelStream::swb_sizes
const uint8_t * swb_sizes
table of scalefactor band sizes for a particular window
Definition: aac.h:182

OCStatus
OCStatus
Output configuration status.
Definition: aac.h:115

MAX_CHANNELS
#define MAX_CHANNELS
Definition: aac.h:47

AAC_CHANNEL_CC
Definition: aac.h:100

TNS_MAX_ORDER
#define TNS_MAX_ORDER
Definition: aac.h:50

AACContext
main AAC context
Definition: aac.h:293

IndividualChannelStream::ltp
LongTermPrediction ltp
Definition: aac.h:180

PredictorState::k1
AAC_FLOAT k1
Definition: aac.h:142

ChannelElement::coup
ChannelCoupling coup
Definition: aac.h:286

ChannelElement::ms_mode
int ms_mode
Signals mid/side stereo flags coding mode (used by encoder)
Definition: aac.h:279

OC_TRIAL_FRAME
Output configuration under trial specified by a frame header.
Definition: aac.h:118

AAC_CHANNEL_FRONT
Definition: aac.h:96

ChannelElement::is_mode
uint8_t is_mode
Set if any bands have been encoded using intensity stereo (used by encoder)
Definition: aac.h:280

OutputConfiguration::status
enum OCStatus status
Definition: aac.h:129

INTENSITY_BT2
Scalefactor data are intensity stereo positions (out of phase).
Definition: aac.h:88

LongTermPrediction::lag
int16_t lag
Definition: aac.h:165

AACContext::che_drc
DynamicRangeControl che_drc
Definition: aac.h:299

AACContext::frame
AVFrame * frame
Definition: aac.h:296

SingleChannelElement
Single Channel Element - used for both SCE and LFE elements.
Definition: aac.h:248

c
static double c[64]
Definition: vsrc_mptestsrc.c:87

TYPE_PCE
Definition: aac.h:61

IndividualChannelStream
Individual Channel Stream.
Definition: aac.h:174

IndividualChannelStream::clip_avoidance_factor
float clip_avoidance_factor
set if any window is near clipping to the necessary attenuation factor to avoid it ...
Definition: aac.h:192

LongTermPrediction::coef
INTFLOAT coef
Definition: aac.h:167

MDCT15Context
Definition: mdct15.h:28

ChannelElement
channel element - generic struct for SCE/CPE/CCE/LFE
Definition: aac.h:275

Pulse::start
int start
Definition: aac.h:226

AACContext::warned_gain_control
int warned_gain_control
Definition: aac.h:360

fft.h

coeffs
static const int16_t coeffs[]
Definition: simple_idct_mmi.c:40

len
int len
Definition: vorbis_enc_data.h:452

ZERO_BT
Scalefactors and spectral data are all zero.
Definition: aac.h:83

Pulse::num_pulse
int num_pulse
Definition: aac.h:225

ONLY_LONG_SEQUENCE
Definition: aac.h:76

out
FILE * out
Definition: movenc.c:54

AACContext::mdct
FFTContext mdct
Definition: aac.h:323

length
const char int length
Definition: avisynth_c.h:768

LongTermPrediction::present
int8_t present
Definition: aac.h:164

EXT_SBR_DATA_CRC
Definition: aac.h:72

BEFORE_TNS
Definition: aac.h:107

SpectralBandReplication
Spectral Band Replication.
Definition: sbr.h:139

OutputConfiguration::layout_map_tags
int layout_map_tags
Definition: aac.h:126

PredictorState::var0
AAC_FLOAT var0
Definition: aac.h:138

OC_NONE
Output unconfigured.
Definition: aac.h:116

FIRST_PAIR_BT
This and later band types encode two values (rather than four) with one code word.
Definition: aac.h:84

RawDataBlockType
RawDataBlockType
Definition: aac.h:55