@ -61,9 +61,7 @@
*/
typedef struct AacPsyBand {
float energy ; ///< band energy
float ffac ; ///< form factor
float thr ; ///< energy threshold
float min_snr ; ///< minimal SNR
float thr_quiet ; ///< threshold in quiet
} AacPsyBand ;
@ -88,17 +86,18 @@ typedef struct AacPsyChannel{
* psychoacoustic model frame type - dependent coefficients
*/
typedef struct AacPsyCoeffs {
float ath [ 64 ] ; ///< absolute threshold of hearing per bands
float barks [ 64 ] ; ///< Bark value for each spectral band in long frame
float spread_low [ 64 ] ; ///< spreading factor for low-to-high threshold spreading in long frame
float spread_hi [ 64 ] ; ///< spreading factor for high-to-low threshold spreading in long frame
float ath ; ///< absolute threshold of hearing per bands
float barks ; ///< Bark value for each spectral band in long frame
float spread_low [ 2 ] ; ///< spreading factor for low-to-high threshold spreading in long frame
float spread_hi [ 2 ] ; ///< spreading factor for high-to-low threshold spreading in long frame
float min_snr ; ///< minimal SNR
} AacPsyCoeffs ;
/**
* 3 GPP TS26 .403 - inspired psychoacoustic model specific data
*/
typedef struct AacPsyContext {
AacPsyCoeffs psy_coef [ 2 ] ;
AacPsyCoeffs psy_coef [ 2 ] [ 64 ] ;
AacPsyChannel * ch ;
} AacPsyContext ;
@ -243,27 +242,30 @@ static av_cold int psy_3gpp_init(FFPsyContext *ctx) {
minath = ath ( 3410 , ATH_ADD ) ;
for ( j = 0 ; j < 2 ; j + + ) {
AacPsyCoeffs * coeffs = & pctx - > psy_coef [ j ] ;
AacPsyCoeffs * coeffs = pctx - > psy_coef [ j ] ;
const uint8_t * band_sizes = ctx - > bands [ j ] ;
float line_to_frequency = ctx - > avctx - > sample_rate / ( j ? 256.f : 2048.0f ) ;
i = 0 ;
prev = 0.0 ;
for ( g = 0 ; g < ctx - > num_bands [ j ] ; g + + ) {
i + = ctx - > bands [ j ] [ g ] ;
i + = band_sizes [ g ] ;
bark = calc_bark ( ( i - 1 ) * line_to_frequency ) ;
coeffs - > barks [ g ] = ( bark + prev ) / 2.0 ;
coeffs [ g ] . barks = ( bark + prev ) / 2.0 ;
prev = bark ;
}
for ( g = 0 ; g < ctx - > num_bands [ j ] - 1 ; g + + ) {
coeffs - > spread_low [ g ] = pow ( 10.0 , - ( coeffs - > barks [ g + 1 ] - coeffs - > barks [ g ] ) * PSY_3GPP_SPREAD_LOW ) ;
coeffs - > spread_hi [ g ] = pow ( 10.0 , - ( coeffs - > barks [ g + 1 ] - coeffs - > barks [ g ] ) * PSY_3GPP_SPREAD_HI ) ;
AacPsyCoeffs * coeff = & coeffs [ g ] ;
float bark_width = coeffs [ g + 1 ] . barks - coeffs - > barks ;
coeff - > spread_low [ 0 ] = pow ( 10.0 , - bark_width * PSY_3GPP_SPREAD_LOW ) ;
coeff - > spread_hi [ 0 ] = pow ( 10.0 , - bark_width * PSY_3GPP_SPREAD_HI ) ;
}
start = 0 ;
for ( g = 0 ; g < ctx - > num_bands [ j ] ; g + + ) {
minscale = ath ( start * line_to_frequency , ATH_ADD ) ;
for ( i = 1 ; i < ctx - > bands [ j ] [ g ] ; i + + )
for ( i = 1 ; i < band_sizes [ g ] ; i + + )
minscale = FFMIN ( minscale , ath ( ( start + i ) * line_to_frequency , ATH_ADD ) ) ;
coeffs - > ath [ g ] = minscale - minath ;
start + = ctx - > bands [ j ] [ g ] ;
coeffs [ g ] . ath = minscale - minath ;
start + = band_sizes [ g ] ;
}
}
@ -406,24 +408,32 @@ static void psy_3gpp_analyze(FFPsyContext *ctx, int channel,
band - > energy + = coefs [ start + i ] * coefs [ start + i ] ;
band - > thr = band - > energy * 0.001258925f ;
start + = band_sizes [ g ] ;
ctx - > psy_bands [ channel * PSY_MAX_BANDS + w + g ] . energy = band - > energy ;
}
}
//modify thresholds - spread, threshold in quiet - 5.4.3 "Spreaded Energy Calculation"
for ( w = 0 ; w < wi - > num_windows * 16 ; w + = 16 ) {
AacPsyBand * band = & pch - > band [ w ] ;
AacPsyBand * bands = & pch - > band [ w ] ;
for ( g = 1 ; g < num_bands ; g + + )
band [ g ] . thr = FFMAX ( band [ g ] . thr , band [ g - 1 ] . thr * coeffs - > spread_hi [ g ] ) ;
bands [ g ] . thr = FFMAX ( bands [ g ] . thr , bands [ g - 1 ] . thr * coeffs [ g ] . spread_hi [ 0 ] ) ;
for ( g = num_bands - 2 ; g > = 0 ; g - - )
band [ g ] . thr = FFMAX ( band [ g ] . thr , band [ g + 1 ] . thr * coeffs - > spread_low [ g ] ) ;
bands [ g ] . thr = FFMAX ( bands [ g ] . thr , bands [ g + 1 ] . thr * coeffs [ g ] . spread_low [ 0 ] ) ;
for ( g = 0 ; g < num_bands ; g + + ) {
band [ g ] . thr_quiet = band [ g ] . thr = FFMAX ( band [ g ] . thr , coeffs - > ath [ g ] ) ;
AacPsyBand * band = & bands [ g ] ;
band - > thr_quiet = band - > thr = FFMAX ( band - > thr , coeffs [ g ] . ath ) ;
if ( ! ( wi - > window_type [ 0 ] = = LONG_STOP_SEQUENCE | | ( wi - > window_type [ 1 ] = = LONG_START_SEQUENCE & & ! w ) ) )
band [ g ] . thr = FFMAX ( PSY_3GPP_RPEMIN * band [ g ] . thr , FFMIN ( band [ g ] . thr ,
PSY_3GPP_RPELEV * pch - > prev_band [ w + g ] . thr_quiet ) ) ;
band - > thr = FFMAX ( PSY_3GPP_RPEMIN * band - > thr , FFMIN ( band - > thr ,
PSY_3GPP_RPELEV * pch - > prev_band [ w + g ] . thr_quiet ) ) ;
}
}
ctx - > psy_bands [ channel * PSY_MAX_BANDS + w + g ] . threshold = band [ g ] . thr ;
for ( w = 0 ; w < wi - > num_windows * 16 ; w + = 16 ) {
for ( g = 0 ; g < num_bands ; g + + ) {
AacPsyBand * band = & pch - > band [ w + g ] ;
FFPsyBand * psy_band = & ctx - > psy_bands [ channel * PSY_MAX_BANDS + w + g ] ;
psy_band - > threshold = band - > thr ;
psy_band - > energy = band - > energy ;
}
}
memcpy ( pch - > prev_band , pch - > band , sizeof ( pch - > band ) ) ;
@ -553,22 +563,9 @@ static FFPsyWindowInfo psy_lame_window(FFPsyContext *ctx,
if ( pch - > prev_attack = = 3 | | att_sum ) {
uselongblock = 0 ;
if ( attacks [ 1 ] & & attacks [ 0 ] )
attacks [ 1 ] = 0 ;
if ( attacks [ 2 ] & & attacks [ 1 ] )
attacks [ 2 ] = 0 ;
if ( attacks [ 3 ] & & attacks [ 2 ] )
attacks [ 3 ] = 0 ;
if ( attacks [ 4 ] & & attacks [ 3 ] )
attacks [ 4 ] = 0 ;
if ( attacks [ 5 ] & & attacks [ 4 ] )
attacks [ 5 ] = 0 ;
if ( attacks [ 6 ] & & attacks [ 5 ] )
attacks [ 6 ] = 0 ;
if ( attacks [ 7 ] & & attacks [ 6 ] )
attacks [ 7 ] = 0 ;
if ( attacks [ 8 ] & & attacks [ 7 ] )
attacks [ 8 ] = 0 ;
for ( i = 1 ; i < AAC_NUM_BLOCKS_SHORT + 1 ; i + + )
if ( attacks [ i ] & & attacks [ i - 1 ] )
attacks [ i ] = 0 ;
}
} else {
/* We have no lookahead info, so just use same type as the previous sequence. */