mirror of
https://github.com/FFmpeg/FFmpeg.git
synced 2025-01-24 13:56:33 +02:00
add support for spectral extension
Originally committed as revision 15812 to svn://svn.ffmpeg.org/ffmpeg/trunk
This commit is contained in:
parent
0c5d750df9
commit
0cc51734b2
@ -818,14 +818,86 @@ static int decode_audio_block(AC3DecodeContext *s, int blk)
|
||||
|
||||
/* spectral extension strategy */
|
||||
if (s->eac3 && (!blk || get_bits1(gbc))) {
|
||||
if (get_bits1(gbc)) {
|
||||
av_log_missing_feature(s->avctx, "Spectral extension", 1);
|
||||
return -1;
|
||||
s->spx_in_use[blk] = get_bits1(gbc);
|
||||
if (s->spx_in_use[blk]) {
|
||||
int begf, endf;
|
||||
int spx_end_subband;
|
||||
|
||||
/* determine which channels use spx */
|
||||
if (s->channel_mode == AC3_CHMODE_MONO) {
|
||||
s->channel_in_spx[1] = 1;
|
||||
s->spx_coords_exist[1] = 0;
|
||||
} else {
|
||||
for (ch = 1; ch <= fbw_channels; ch++) {
|
||||
s->channel_in_spx[ch] = get_bits1(gbc);
|
||||
s->spx_coords_exist[ch] = 0;
|
||||
}
|
||||
}
|
||||
|
||||
s->spx_copy_start_freq = get_bits(gbc, 2) * 12 + 25;
|
||||
begf = get_bits(gbc, 3);
|
||||
endf = get_bits(gbc, 3);
|
||||
s->spx_start_subband = begf < 6 ? begf+2 : 2*begf-3;
|
||||
spx_end_subband = endf < 4 ? endf+5 : 2*endf+3;
|
||||
s->num_spx_subbands = spx_end_subband - s->spx_start_subband;
|
||||
s->spx_start_freq = s->spx_start_subband * 12 + 25;
|
||||
s->spx_end_freq = spx_end_subband * 12 + 25;
|
||||
|
||||
decode_band_structure(gbc, blk, s->eac3, 0,
|
||||
s->spx_start_subband, spx_end_subband,
|
||||
ff_eac3_default_spx_band_struct,
|
||||
s->spx_band_struct, NULL, &s->num_spx_bands,
|
||||
s->spx_band_sizes);
|
||||
} else {
|
||||
for (ch = 1; ch <= fbw_channels; ch++) {
|
||||
s->channel_in_spx[ch] = 0;
|
||||
s->first_spx_coords[ch] = 1;
|
||||
}
|
||||
}
|
||||
/* TODO: parse spectral extension strategy info */
|
||||
} else {
|
||||
s->spx_in_use[blk] = blk ? s->spx_in_use[blk-1] : 0;
|
||||
}
|
||||
|
||||
/* TODO: spectral extension coordinates */
|
||||
/* spectral extension coordinates */
|
||||
if (s->spx_in_use[blk]) {
|
||||
for (ch = 1; ch <= fbw_channels; ch++) {
|
||||
if (s->channel_in_spx[ch]) {
|
||||
if (s->first_spx_coords[ch] || get_bits1(gbc)) {
|
||||
int bin, spx_blend;
|
||||
int master_spx_coord;
|
||||
s->first_spx_coords[ch] = 0;
|
||||
s->spx_coords_exist[ch] = 1;
|
||||
spx_blend = get_bits(gbc, 5) << 18;
|
||||
master_spx_coord = get_bits(gbc, 2) * 3;
|
||||
bin = s->spx_start_freq;
|
||||
for (bnd = 0; bnd < s->num_spx_bands; bnd++) {
|
||||
int spx_coord_exp, spx_coord_mant;
|
||||
|
||||
/* calculate blending factors */
|
||||
int bandsize = s->spx_band_sizes[bnd];
|
||||
int nratio = (((bin + (bandsize >> 1)) << 23) / s->spx_end_freq) - spx_blend;
|
||||
nratio = av_clip(nratio, 0, INT24_MAX);
|
||||
s->spx_noise_blend [ch][bnd] = ff_sqrt(( nratio) << 8) * M_SQRT_POW2_15;
|
||||
s->spx_signal_blend[ch][bnd] = ff_sqrt((INT24_MAX - nratio) << 8) * M_SQRT_POW2_15;
|
||||
bin += bandsize;
|
||||
|
||||
/* decode spx coordinates */
|
||||
spx_coord_exp = get_bits(gbc, 4);
|
||||
spx_coord_mant = get_bits(gbc, 2);
|
||||
if (spx_coord_exp == 15)
|
||||
s->spx_coords[ch][bnd] = spx_coord_mant << 26;
|
||||
else
|
||||
s->spx_coords[ch][bnd] = (spx_coord_mant + 4) << 25;
|
||||
s->spx_coords[ch][bnd] >>= (spx_coord_exp + master_spx_coord);
|
||||
}
|
||||
} else {
|
||||
s->spx_coords_exist[ch] = 0;
|
||||
}
|
||||
} else {
|
||||
s->first_spx_coords[ch] = 1;
|
||||
}
|
||||
}
|
||||
}
|
||||
|
||||
/* coupling strategy */
|
||||
if (s->eac3 ? s->cpl_strategy_exists[blk] : get_bits1(gbc)) {
|
||||
@ -862,9 +934,12 @@ static int decode_audio_block(AC3DecodeContext *s, int blk)
|
||||
s->phase_flags_in_use = get_bits1(gbc);
|
||||
|
||||
/* coupling frequency range */
|
||||
/* TODO: modify coupling end freq if spectral extension is used */
|
||||
cpl_start_subband = get_bits(gbc, 4);
|
||||
if (s->spx_in_use[blk]) {
|
||||
cpl_end_subband = s->spx_start_subband - 1;
|
||||
} else {
|
||||
cpl_end_subband = get_bits(gbc, 4) + 3;
|
||||
}
|
||||
s->num_cpl_subbands = cpl_end_subband - cpl_start_subband;
|
||||
if (s->num_cpl_subbands < 0) {
|
||||
av_log(s->avctx, AV_LOG_ERROR, "invalid coupling range (%d > %d)\n",
|
||||
@ -939,8 +1014,14 @@ static int decode_audio_block(AC3DecodeContext *s, int blk)
|
||||
if (channel_mode == AC3_CHMODE_STEREO) {
|
||||
if ((s->eac3 && !blk) || get_bits1(gbc)) {
|
||||
s->num_rematrixing_bands = 4;
|
||||
if(cpl_in_use && s->start_freq[CPL_CH] <= 61)
|
||||
if (cpl_in_use) {
|
||||
if (s->start_freq[CPL_CH] <= 61)
|
||||
s->num_rematrixing_bands -= 1 + (s->start_freq[CPL_CH] == 37);
|
||||
} else if (s->spx_in_use[blk]) {
|
||||
if (s->spx_start_freq <= 61)
|
||||
s->num_rematrixing_bands -= 1 + (s->spx_start_freq <= 37) +
|
||||
(s->spx_start_freq <= 25);
|
||||
}
|
||||
for(bnd=0; bnd<s->num_rematrixing_bands; bnd++)
|
||||
s->rematrixing_flags[bnd] = get_bits1(gbc);
|
||||
} else if (!blk) {
|
||||
@ -965,6 +1046,8 @@ static int decode_audio_block(AC3DecodeContext *s, int blk)
|
||||
int prev = s->end_freq[ch];
|
||||
if (s->channel_in_cpl[ch])
|
||||
s->end_freq[ch] = s->start_freq[CPL_CH];
|
||||
else if (s->channel_in_spx[ch])
|
||||
s->end_freq[ch] = s->spx_start_freq;
|
||||
else {
|
||||
int bandwidth_code = get_bits(gbc, 6);
|
||||
if (bandwidth_code > 60) {
|
||||
@ -1155,12 +1238,12 @@ static int decode_audio_block(AC3DecodeContext *s, int blk)
|
||||
|
||||
/* TODO: generate enhanced coupling coordinates and uncouple */
|
||||
|
||||
/* TODO: apply spectral extension */
|
||||
|
||||
/* recover coefficients if rematrixing is in use */
|
||||
if(s->channel_mode == AC3_CHMODE_STEREO)
|
||||
do_rematrixing(s);
|
||||
|
||||
ff_eac3_apply_spectral_extension(s);
|
||||
|
||||
/* apply scaling to coefficients (headroom, dynrng) */
|
||||
for(ch=1; ch<=s->channels; ch++) {
|
||||
float gain = s->mul_bias / 4194304.0f;
|
||||
|
@ -42,6 +42,11 @@
|
||||
#define AC3_MAX_COEFS 256
|
||||
#define AC3_BLOCK_SIZE 256
|
||||
#define MAX_BLOCKS 6
|
||||
#define SPX_MAX_BANDS 17
|
||||
|
||||
#define INT24_MIN -8388608
|
||||
#define INT24_MAX 8388607
|
||||
#define M_SQRT_POW2_15 181
|
||||
|
||||
typedef struct {
|
||||
AVCodecContext *avctx; ///< parent context
|
||||
@ -88,6 +93,26 @@ typedef struct {
|
||||
int cpl_coords[AC3_MAX_CHANNELS][18]; ///< coupling coordinates (cplco)
|
||||
///@}
|
||||
|
||||
///@defgroup spx spectral extension
|
||||
///@{
|
||||
int spx_in_use[MAX_BLOCKS]; ///< spectral extension in use (spxinu)
|
||||
int channel_in_spx[AC3_MAX_CHANNELS]; ///< channel in spectral extension (chinspx)
|
||||
int spx_atten_code[AC3_MAX_CHANNELS]; ///< spx attenuation code (spxattencod)
|
||||
int spx_coords_exist[AC3_MAX_CHANNELS]; ///< indicates if a channel has spx coords (spxcoe)
|
||||
int spx_start_subband; ///< spx beginning frequency band (spxbegf)
|
||||
int spx_start_freq; ///< spx start frequency bin
|
||||
int spx_end_freq; ///< spx end frequency bin
|
||||
int spx_copy_start_freq; ///< spx starting frequency for copying (copystartmant)
|
||||
int num_spx_subbands; ///< number of spectral extension subbands
|
||||
int num_spx_bands; ///< number of spectral extension bands (nspxbnds)
|
||||
uint8_t spx_band_struct[SPX_MAX_BANDS]; ///< spectral extension band structure (spxbndstrc)
|
||||
int spx_band_sizes[SPX_MAX_BANDS]; ///< number of bins in each band (spxbndsztab)
|
||||
int first_spx_coords[AC3_MAX_CHANNELS]; ///< first spx coordinates states (firstspxcos)
|
||||
int spx_noise_blend[AC3_MAX_CHANNELS][SPX_MAX_BANDS]; ///< spx noise blending factor (nblendfact)
|
||||
int spx_signal_blend[AC3_MAX_CHANNELS][SPX_MAX_BANDS]; ///< spx signal blending factor (sblendfact)
|
||||
int spx_coords[AC3_MAX_CHANNELS][SPX_MAX_BANDS]; ///< spectral extension coordinates (spxco)
|
||||
///@}
|
||||
|
||||
///@defgroup aht adaptive hybrid transform
|
||||
int channel_uses_aht[AC3_MAX_CHANNELS]; ///< channel AHT in use (chahtinu)
|
||||
int pre_mantissa[AC3_MAX_CHANNELS][AC3_MAX_COEFS][MAX_BLOCKS]; ///< pre-IDCT mantissas
|
||||
@ -179,4 +204,6 @@ int ff_eac3_parse_header(AC3DecodeContext *s);
|
||||
*/
|
||||
void ff_eac3_decode_transform_coeffs_aht_ch(AC3DecodeContext *s, int ch);
|
||||
|
||||
void ff_eac3_apply_spectral_extension(AC3DecodeContext *s);
|
||||
|
||||
#endif /* AVCODEC_AC3DEC_H */
|
||||
|
@ -1127,6 +1127,52 @@ const uint8_t ff_eac3_frm_expstr[32][6] = {
|
||||
const uint8_t ff_eac3_default_cpl_band_struct[18] =
|
||||
{ 0, 0, 0, 0, 0, 0, 0, 0, 1, 0, 1, 1, 0, 1, 1, 1, 1, 1 };
|
||||
|
||||
/**
|
||||
* Table E2.15 Default Spectral Extension Banding Structure
|
||||
*/
|
||||
const uint8_t ff_eac3_default_spx_band_struct[17] =
|
||||
{ 0, 0, 0, 0, 0, 0, 0, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1 };
|
||||
|
||||
/**
|
||||
* Table E.25: Spectral Extension Attenuation Table
|
||||
* 24-bit fixed-point version of the floating-point table in the specification.
|
||||
* ff_eac3_spx_atten_tab[code][bin]=lrint(pow(1<<(bin+1),(code+1)/-15.0)*(1<<23));
|
||||
*/
|
||||
const int32_t ff_eac3_spx_atten_tab[32][3] = {
|
||||
{ 8009792, 7648083, 7302707 },
|
||||
{ 7648083, 6972929, 6357376 },
|
||||
{ 7302707, 6357376, 5534417 },
|
||||
{ 6972929, 5796163, 4817990 },
|
||||
{ 6658043, 5284492, 4194304 },
|
||||
{ 6357376, 4817990, 3651354 },
|
||||
{ 6070287, 4392670, 3178688 },
|
||||
{ 5796163, 4004896, 2767209 },
|
||||
{ 5534417, 3651354, 2408995 },
|
||||
{ 5284492, 3329021, 2097152 },
|
||||
{ 5045853, 3035144, 1825677 },
|
||||
{ 4817990, 2767209, 1589344 },
|
||||
{ 4600417, 2522926, 1383604 },
|
||||
{ 4392670, 2300209, 1204498 },
|
||||
{ 4194304, 2097152, 1048576 },
|
||||
{ 4004896, 1912021, 912838 },
|
||||
{ 3824041, 1743232, 794672 },
|
||||
{ 3651354, 1589344, 691802 },
|
||||
{ 3486464, 1449041, 602249 },
|
||||
{ 3329021, 1321123, 524288 },
|
||||
{ 3178688, 1204498, 456419 },
|
||||
{ 3035144, 1098167, 397336 },
|
||||
{ 2898081, 1001224, 345901 },
|
||||
{ 2767209, 912838, 301124 },
|
||||
{ 2642246, 832255, 262144 },
|
||||
{ 2522926, 758786, 228210 },
|
||||
{ 2408995, 691802, 198668 },
|
||||
{ 2300209, 630732, 172951 },
|
||||
{ 2196335, 575052, 150562 },
|
||||
{ 2097152, 524288, 131072 },
|
||||
{ 2002448, 478005, 114105 },
|
||||
{ 1912021, 435808, 99334 }
|
||||
};
|
||||
|
||||
/**
|
||||
* Table of bin locations for rematrixing bands
|
||||
* reference: Section 7.5.2 Rematrixing : Frequency Band Definitions
|
||||
|
@ -34,6 +34,8 @@ extern const int8_t ff_eac3_gaq_remap_2_4_b[9][2];
|
||||
extern const int16_t (* const ff_eac3_mantissa_vq[8])[6];
|
||||
extern const uint8_t ff_eac3_frm_expstr[32][6];
|
||||
extern const uint8_t ff_eac3_default_cpl_band_struct[18];
|
||||
extern const uint8_t ff_eac3_default_spx_band_struct[17];
|
||||
extern const int32_t ff_eac3_spx_atten_tab[32][3];
|
||||
|
||||
extern const uint8_t ff_ac3_rematrix_band_tab[5];
|
||||
|
||||
|
@ -36,6 +36,104 @@ typedef enum {
|
||||
|
||||
#define EAC3_SR_CODE_REDUCED 3
|
||||
|
||||
|
||||
void ff_eac3_apply_spectral_extension(AC3DecodeContext *s)
|
||||
{
|
||||
int bin, bnd, ch, i;
|
||||
int wrapflag[SPX_MAX_BANDS]={0,}, num_copy_sections, copy_sizes[SPX_MAX_BANDS];
|
||||
int rms_energy[SPX_MAX_BANDS];
|
||||
|
||||
/* Set copy index mapping table. Set wrap flags to apply a notch filter at
|
||||
wrap points later on. */
|
||||
bin = s->spx_copy_start_freq;
|
||||
num_copy_sections = 0;
|
||||
for (bnd = 0; bnd < s->num_spx_bands; bnd++) {
|
||||
int bandsize = s->spx_band_sizes[bnd];
|
||||
if ((bin + bandsize) > s->spx_start_freq) {
|
||||
copy_sizes[num_copy_sections++] = bin - s->spx_copy_start_freq;
|
||||
bin = s->spx_copy_start_freq;
|
||||
wrapflag[bnd] = 1;
|
||||
}
|
||||
for (i = 0; i < bandsize; i++) {
|
||||
if (bin == s->spx_start_freq) {
|
||||
copy_sizes[num_copy_sections++] = bin - s->spx_copy_start_freq;
|
||||
bin = s->spx_copy_start_freq;
|
||||
}
|
||||
bin++;
|
||||
}
|
||||
}
|
||||
copy_sizes[num_copy_sections++] = bin - s->spx_copy_start_freq;
|
||||
|
||||
for (ch = 1; ch <= s->fbw_channels; ch++) {
|
||||
if (!s->channel_in_spx[ch])
|
||||
continue;
|
||||
|
||||
/* Copy coeffs from normal bands to extension bands */
|
||||
bin = s->spx_start_freq;
|
||||
for (bnd = 0; bnd < num_copy_sections; bnd++) {
|
||||
memcpy(&s->fixed_coeffs[ch][bin],
|
||||
&s->fixed_coeffs[ch][s->spx_copy_start_freq],
|
||||
copy_sizes[bnd]*sizeof(int));
|
||||
bin += copy_sizes[bnd];
|
||||
}
|
||||
|
||||
/* Calculate RMS energy for each SPX band. */
|
||||
bin = s->spx_start_freq;
|
||||
for (bnd = 0; bnd < s->num_spx_bands; bnd++) {
|
||||
int bandsize = s->spx_band_sizes[bnd];
|
||||
int64_t accum = 0;
|
||||
for (i = 0; i < bandsize; i++) {
|
||||
int64_t coeff = s->fixed_coeffs[ch][bin++];
|
||||
accum += coeff * coeff;
|
||||
}
|
||||
rms_energy[bnd] = ff_sqrt((accum >> 15) / bandsize) * M_SQRT_POW2_15;
|
||||
}
|
||||
|
||||
/* Apply a notch filter at transitions between normal and extension
|
||||
bands and at all wrap points. */
|
||||
if (s->spx_atten_code[ch] >= 0) {
|
||||
const int32_t *atten_tab = ff_eac3_spx_atten_tab[s->spx_atten_code[ch]];
|
||||
/* apply notch filter at baseband / extension region border */
|
||||
bin = s->spx_start_freq - 2;
|
||||
for (i = 0; i < 5; i++) {
|
||||
s->fixed_coeffs[ch][bin] = ((int64_t)atten_tab[2-abs(i-2)] *
|
||||
(int64_t)s->fixed_coeffs[ch][bin]) >> 23;
|
||||
bin++;
|
||||
}
|
||||
/* apply notch at all other wrap points */
|
||||
bin += s->spx_band_sizes[0];
|
||||
for (bnd = 1; bnd < s->num_spx_bands; bnd++) {
|
||||
if (wrapflag[bnd]) {
|
||||
bin -= 5;
|
||||
for (i = 0; i < 5; i++) {
|
||||
s->fixed_coeffs[ch][bin] = (atten_tab[2-abs(i-2)] *
|
||||
(int64_t)s->fixed_coeffs[ch][bin]) >> 23;
|
||||
bin++;
|
||||
}
|
||||
}
|
||||
bin += s->spx_band_sizes[bnd];
|
||||
}
|
||||
}
|
||||
|
||||
/* Apply noise-blended coefficient scaling based on previously
|
||||
calculated RMS energy, blending factors, and SPX coordinates for
|
||||
each band. */
|
||||
bin = s->spx_start_freq;
|
||||
for (bnd = 0; bnd < s->num_spx_bands; bnd++) {
|
||||
int64_t nscale, sscale, spxco;
|
||||
nscale = (s->spx_noise_blend [ch][bnd] * rms_energy[bnd]) >> 23;
|
||||
nscale = (nscale * 14529495) >> 23;
|
||||
sscale = s->spx_signal_blend[ch][bnd];
|
||||
spxco = s->spx_coords[ch][bnd];
|
||||
for (i = 0; i < s->spx_band_sizes[bnd]; i++) {
|
||||
int64_t noise = (nscale * (((int)av_lfg_get(&s->dith_state))>>8)) >> 23;
|
||||
int64_t signal = (sscale * s->fixed_coeffs[ch][bin]) >> 23;
|
||||
s->fixed_coeffs[ch][bin++] = ((noise + signal) * spxco) >> 23;
|
||||
}
|
||||
}
|
||||
}
|
||||
}
|
||||
|
||||
/** lrint(M_SQRT2*cos(2*M_PI/12)*(1<<23)) */
|
||||
#define COEFF_0 10273905LL
|
||||
|
||||
@ -459,14 +557,12 @@ int ff_eac3_parse_header(AC3DecodeContext *s)
|
||||
}
|
||||
|
||||
/* spectral extension attenuation data */
|
||||
if (parse_spx_atten_data) {
|
||||
av_log_missing_feature(s->avctx, "Spectral extension attenuation", 1);
|
||||
for (ch = 1; ch <= s->fbw_channels; ch++) {
|
||||
if (get_bits1(gbc)) { // channel has spx attenuation
|
||||
skip_bits(gbc, 5); // skip spx attenuation code
|
||||
}
|
||||
}
|
||||
}
|
||||
for (ch = 1; ch <= s->fbw_channels; ch++) {
|
||||
if (parse_spx_atten_data && get_bits1(gbc))
|
||||
s->spx_atten_code[ch] = get_bits(gbc, 5);
|
||||
else
|
||||
s->spx_atten_code[ch] = -1;
|
||||
}
|
||||
|
||||
/* block start information */
|
||||
if (s->num_blocks > 1 && get_bits1(gbc)) {
|
||||
@ -480,6 +576,7 @@ int ff_eac3_parse_header(AC3DecodeContext *s)
|
||||
|
||||
/* syntax state initialization */
|
||||
for (ch = 1; ch <= s->fbw_channels; ch++) {
|
||||
s->first_spx_coords[ch] = 1;
|
||||
s->first_cpl_coords[ch] = 1;
|
||||
}
|
||||
s->first_cpl_leak = 1;
|
||||
|
Loading…
x
Reference in New Issue
Block a user