mirror of
https://github.com/FFmpeg/FFmpeg.git
synced 2024-12-23 12:43:46 +02:00
245 lines
8.8 KiB
C
245 lines
8.8 KiB
C
/*
|
|
* AAC encoder utilities
|
|
* Copyright (C) 2015 Rostislav Pehlivanov
|
|
*
|
|
* This file is part of FFmpeg.
|
|
*
|
|
* FFmpeg is free software; you can redistribute it and/or
|
|
* modify it under the terms of the GNU Lesser General Public
|
|
* License as published by the Free Software Foundation; either
|
|
* version 2.1 of the License, or (at your option) any later version.
|
|
*
|
|
* FFmpeg is distributed in the hope that it will be useful,
|
|
* but WITHOUT ANY WARRANTY; without even the implied warranty of
|
|
* MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
|
|
* Lesser General Public License for more details.
|
|
*
|
|
* You should have received a copy of the GNU Lesser General Public
|
|
* License along with FFmpeg; if not, write to the Free Software
|
|
* Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
|
|
*/
|
|
|
|
/**
|
|
* @file
|
|
* AAC encoder utilities
|
|
* @author Rostislav Pehlivanov ( atomnuker gmail com )
|
|
*/
|
|
|
|
#ifndef AVCODEC_AACENC_UTILS_H
|
|
#define AVCODEC_AACENC_UTILS_H
|
|
|
|
#include "aac.h"
|
|
#include "aac_tablegen_decl.h"
|
|
#include "aacenctab.h"
|
|
|
|
#define ROUND_STANDARD 0.4054f
|
|
#define ROUND_TO_ZERO 0.1054f
|
|
#define C_QUANT 0.4054f
|
|
|
|
static inline void abs_pow34_v(float *out, const float *in, const int size)
|
|
{
|
|
int i;
|
|
for (i = 0; i < size; i++) {
|
|
float a = fabsf(in[i]);
|
|
out[i] = sqrtf(a * sqrtf(a));
|
|
}
|
|
}
|
|
|
|
/**
|
|
* Quantize one coefficient.
|
|
* @return absolute value of the quantized coefficient
|
|
* @see 3GPP TS26.403 5.6.2 "Scalefactor determination"
|
|
*/
|
|
static inline int quant(float coef, const float Q, const float rounding)
|
|
{
|
|
float a = coef * Q;
|
|
return sqrtf(a * sqrtf(a)) + rounding;
|
|
}
|
|
|
|
static inline void quantize_bands(int *out, const float *in, const float *scaled,
|
|
int size, float Q34, int is_signed, int maxval,
|
|
const float rounding)
|
|
{
|
|
int i;
|
|
double qc;
|
|
for (i = 0; i < size; i++) {
|
|
qc = scaled[i] * Q34;
|
|
out[i] = (int)FFMIN(qc + rounding, (double)maxval);
|
|
if (is_signed && in[i] < 0.0f) {
|
|
out[i] = -out[i];
|
|
}
|
|
}
|
|
}
|
|
|
|
static inline float find_max_val(int group_len, int swb_size, const float *scaled)
|
|
{
|
|
float maxval = 0.0f;
|
|
int w2, i;
|
|
for (w2 = 0; w2 < group_len; w2++) {
|
|
for (i = 0; i < swb_size; i++) {
|
|
maxval = FFMAX(maxval, scaled[w2*128+i]);
|
|
}
|
|
}
|
|
return maxval;
|
|
}
|
|
|
|
static inline int find_min_book(float maxval, int sf)
|
|
{
|
|
float Q = ff_aac_pow2sf_tab[POW_SF2_ZERO - sf + SCALE_ONE_POS - SCALE_DIV_512];
|
|
float Q34 = sqrtf(Q * sqrtf(Q));
|
|
int qmaxval, cb;
|
|
qmaxval = maxval * Q34 + C_QUANT;
|
|
if (qmaxval >= (FF_ARRAY_ELEMS(aac_maxval_cb)))
|
|
cb = 11;
|
|
else
|
|
cb = aac_maxval_cb[qmaxval];
|
|
return cb;
|
|
}
|
|
|
|
static inline float find_form_factor(int group_len, int swb_size, float thresh,
|
|
const float *scaled, float nzslope) {
|
|
const float iswb_size = 1.0f / swb_size;
|
|
const float iswb_sizem1 = 1.0f / (swb_size - 1);
|
|
const float ethresh = thresh;
|
|
float form = 0.0f, weight = 0.0f;
|
|
int w2, i;
|
|
for (w2 = 0; w2 < group_len; w2++) {
|
|
float e = 0.0f, e2 = 0.0f, var = 0.0f, maxval = 0.0f;
|
|
float nzl = 0;
|
|
for (i = 0; i < swb_size; i++) {
|
|
float s = fabsf(scaled[w2*128+i]);
|
|
maxval = FFMAX(maxval, s);
|
|
e += s;
|
|
e2 += s *= s;
|
|
/* We really don't want a hard non-zero-line count, since
|
|
* even below-threshold lines do add up towards band spectral power.
|
|
* So, fall steeply towards zero, but smoothly
|
|
*/
|
|
if (s >= ethresh) {
|
|
nzl += 1.0f;
|
|
} else {
|
|
nzl += powf(s / ethresh, nzslope);
|
|
}
|
|
}
|
|
if (e2 > thresh) {
|
|
float frm;
|
|
e *= iswb_size;
|
|
|
|
/** compute variance */
|
|
for (i = 0; i < swb_size; i++) {
|
|
float d = fabsf(scaled[w2*128+i]) - e;
|
|
var += d*d;
|
|
}
|
|
var = sqrtf(var * iswb_sizem1);
|
|
|
|
e2 *= iswb_size;
|
|
frm = e / FFMIN(e+4*var,maxval);
|
|
form += e2 * sqrtf(frm) / FFMAX(0.5f,nzl);
|
|
weight += e2;
|
|
}
|
|
}
|
|
if (weight > 0) {
|
|
return form / weight;
|
|
} else {
|
|
return 1.0f;
|
|
}
|
|
}
|
|
|
|
/** Return the minimum scalefactor where the quantized coef does not clip. */
|
|
static inline uint8_t coef2minsf(float coef)
|
|
{
|
|
return av_clip_uint8(log2f(coef)*4 - 69 + SCALE_ONE_POS - SCALE_DIV_512);
|
|
}
|
|
|
|
/** Return the maximum scalefactor where the quantized coef is not zero. */
|
|
static inline uint8_t coef2maxsf(float coef)
|
|
{
|
|
return av_clip_uint8(log2f(coef)*4 + 6 + SCALE_ONE_POS - SCALE_DIV_512);
|
|
}
|
|
|
|
/*
|
|
* Returns the closest possible index to an array of float values, given a value.
|
|
*/
|
|
static inline int quant_array_idx(const float val, const float *arr, const int num)
|
|
{
|
|
int i, index = 0;
|
|
float quant_min_err = INFINITY;
|
|
for (i = 0; i < num; i++) {
|
|
float error = (val - arr[i])*(val - arr[i]);
|
|
if (error < quant_min_err) {
|
|
quant_min_err = error;
|
|
index = i;
|
|
}
|
|
}
|
|
return index;
|
|
}
|
|
|
|
/**
|
|
* approximates exp10f(-3.0f*(0.5f + 0.5f * cosf(FFMIN(b,15.5f) / 15.5f)))
|
|
*/
|
|
static av_always_inline float bval2bmax(float b)
|
|
{
|
|
return 0.001f + 0.0035f * (b*b*b) / (15.5f*15.5f*15.5f);
|
|
}
|
|
|
|
/*
|
|
* linear congruential pseudorandom number generator, copied from the decoder
|
|
*/
|
|
static inline int lcg_random(unsigned previous_val)
|
|
{
|
|
union { unsigned u; int s; } v = { previous_val * 1664525u + 1013904223 };
|
|
return v.s;
|
|
}
|
|
|
|
#define ERROR_IF(cond, ...) \
|
|
if (cond) { \
|
|
av_log(avctx, AV_LOG_ERROR, __VA_ARGS__); \
|
|
return AVERROR(EINVAL); \
|
|
}
|
|
|
|
#define WARN_IF(cond, ...) \
|
|
if (cond) { \
|
|
av_log(avctx, AV_LOG_WARNING, __VA_ARGS__); \
|
|
}
|
|
|
|
#define AAC_OPT_SET(e_opt, p_opt, bypass, name) \
|
|
ERROR_IF ((e_opt)->name == 1 && (p_opt)->name == OPT_BANNED, \
|
|
"Profile %i does not allow %s\n", avctx->profile, #name); \
|
|
ERROR_IF ((e_opt)->name == 0 && (p_opt)->name == OPT_REQUIRED, \
|
|
"Option %s is a requirement for this profile (%i)\n", \
|
|
#name, avctx->profile); \
|
|
if ((e_opt)->name == 1 && (p_opt)->name == OPT_NEEDS_MAIN && \
|
|
avctx->profile == FF_PROFILE_AAC_LOW) { \
|
|
WARN_IF(1, "Profile %i does not allow for %s, setting profile to " \
|
|
"\"aac_main\"(%i)\n", avctx->profile, #name, \
|
|
FF_PROFILE_AAC_MAIN); \
|
|
avctx->profile = FF_PROFILE_AAC_MAIN; \
|
|
p_opt = &aacenc_profiles[FF_PROFILE_AAC_MAIN].opts; \
|
|
} \
|
|
if ((e_opt)->name == 1 && (p_opt)->name == OPT_NEEDS_LTP && \
|
|
avctx->profile == FF_PROFILE_AAC_LOW) { \
|
|
WARN_IF(1, "Profile %i does not allow for %s, setting profile to " \
|
|
"\"aac_ltp\"(%i)\n", avctx->profile, #name, \
|
|
FF_PROFILE_AAC_LTP); \
|
|
avctx->profile = FF_PROFILE_AAC_LTP; \
|
|
p_opt = &aacenc_profiles[FF_PROFILE_AAC_LTP].opts; \
|
|
} \
|
|
if ((e_opt)->name == OPT_AUTO) { \
|
|
if ((p_opt)->name == OPT_BANNED) { \
|
|
(e_opt)->name = 0; \
|
|
} else if ((p_opt)->name == OPT_NEEDS_LTP) { \
|
|
(e_opt)->name = 0; \
|
|
} else if ((p_opt)->name == OPT_NEEDS_MAIN) { \
|
|
(e_opt)->name = 0; \
|
|
} else if ((p_opt)->name == OPT_REQUIRED) { \
|
|
(e_opt)->name = 1; \
|
|
} else if (bypass) { \
|
|
(e_opt)->name = (e_opt)->name; \
|
|
} else { \
|
|
(e_opt)->name = (p_opt)->name; \
|
|
} \
|
|
} \
|
|
av_log(avctx, AV_LOG_VERBOSE, "Option %s set to %i\n", #name, (e_opt)->name);
|
|
|
|
#endif /* AVCODEC_AACENC_UTILS_H */
|