1
0
mirror of https://github.com/FFmpeg/FFmpeg.git synced 2025-07-11 14:30:22 +02:00

avfilter/af_afftfilt: extend filter functionality

This commit is contained in:
Paul B Mahol
2018-11-11 21:11:30 +01:00
parent 679ad31469
commit bdc66c50dd
2 changed files with 74 additions and 17 deletions

View File

@ -1082,7 +1082,7 @@ Set frequency domain imaginary expression for each separate channel
separated by '|'. If not set, @var{real} option is used. separated by '|'. If not set, @var{real} option is used.
Each expression in @var{real} and @var{imag} can contain the following Each expression in @var{real} and @var{imag} can contain the following
constants: constants and functions:
@table @option @table @option
@item sr @item sr
@ -1102,6 +1102,18 @@ number of channels
@item pts @item pts
current frame pts current frame pts
@item re
current real part of frequency bin
@item im
current imaginary part of frequency bin
@item real(b, ch)
Return the value of the real part of the frequency bin at location (@var{b},@var{ch})
@item imag(b, ch)
Return the value of the imaginary part of the frequency bin at location (@var{b},@var{ch})
@end table @end table
@item win_size @item win_size
@ -1139,7 +1151,7 @@ window function will be picked. Default is @code{0.75}.
@item @item
Leave almost only low frequencies in audio: Leave almost only low frequencies in audio:
@example @example
afftfilt="1-clip((b/nb)*b,0,1)" afftfilt="'real=re * (1-clip((b/nb)*b,0,1))':imag='im * (1-clip((b/nb)*b,0,1))'"
@end example @end example
@end itemize @end itemize

View File

@ -36,6 +36,7 @@ typedef struct AFFTFiltContext {
FFTContext *fft, *ifft; FFTContext *fft, *ifft;
FFTComplex **fft_data; FFTComplex **fft_data;
FFTComplex **fft_temp;
int nb_exprs; int nb_exprs;
int window_size; int window_size;
AVExpr **real; AVExpr **real;
@ -51,15 +52,15 @@ typedef struct AFFTFiltContext {
float *window_func_lut; float *window_func_lut;
} AFFTFiltContext; } AFFTFiltContext;
static const char *const var_names[] = { "sr", "b", "nb", "ch", "chs", "pts", NULL }; static const char *const var_names[] = { "sr", "b", "nb", "ch", "chs", "pts", "re", "im", NULL };
enum { VAR_SAMPLE_RATE, VAR_BIN, VAR_NBBINS, VAR_CHANNEL, VAR_CHANNELS, VAR_PTS, VAR_VARS_NB }; enum { VAR_SAMPLE_RATE, VAR_BIN, VAR_NBBINS, VAR_CHANNEL, VAR_CHANNELS, VAR_PTS, VAR_REAL, VAR_IMAG, VAR_VARS_NB };
#define OFFSET(x) offsetof(AFFTFiltContext, x) #define OFFSET(x) offsetof(AFFTFiltContext, x)
#define A AV_OPT_FLAG_AUDIO_PARAM|AV_OPT_FLAG_FILTERING_PARAM #define A AV_OPT_FLAG_AUDIO_PARAM|AV_OPT_FLAG_FILTERING_PARAM
static const AVOption afftfilt_options[] = { static const AVOption afftfilt_options[] = {
{ "real", "set channels real expressions", OFFSET(real_str), AV_OPT_TYPE_STRING, {.str = "1" }, 0, 0, A }, { "real", "set channels real expressions", OFFSET(real_str), AV_OPT_TYPE_STRING, {.str = "re" }, 0, 0, A },
{ "imag", "set channels imaginary expressions", OFFSET(img_str), AV_OPT_TYPE_STRING, {.str = NULL }, 0, 0, A }, { "imag", "set channels imaginary expressions", OFFSET(img_str), AV_OPT_TYPE_STRING, {.str = "im" }, 0, 0, A },
{ "win_size", "set window size", OFFSET(fft_bits), AV_OPT_TYPE_INT, {.i64=12}, 4, 17, A, "fft" }, { "win_size", "set window size", OFFSET(fft_bits), AV_OPT_TYPE_INT, {.i64=12}, 4, 17, A, "fft" },
{ "w16", 0, 0, AV_OPT_TYPE_CONST, {.i64=4}, 0, 0, A, "fft" }, { "w16", 0, 0, AV_OPT_TYPE_CONST, {.i64=4}, 0, 0, A, "fft" },
{ "w32", 0, 0, AV_OPT_TYPE_CONST, {.i64=5}, 0, 0, A, "fft" }, { "w32", 0, 0, AV_OPT_TYPE_CONST, {.i64=5}, 0, 0, A, "fft" },
@ -88,6 +89,34 @@ static const AVOption afftfilt_options[] = {
AVFILTER_DEFINE_CLASS(afftfilt); AVFILTER_DEFINE_CLASS(afftfilt);
/*
 * Fetch the real part of a stored FFT bin.
 *
 * priv : opaque pointer to the AFFTFiltContext
 * x    : requested bin index, clamped to [0, window_size / 2]
 * ch   : requested channel index, clamped to [0, nb_exprs - 1]
 *
 * Returns the .re field of s->fft_data[channel][bin].
 *
 * The indices arrive as doubles and are clamped while still in floating
 * point: converting a double that does not fit in an int (or a NaN) to int
 * is undefined behaviour in C. NaN and non-positive values map to index 0.
 */
static inline double getreal(void *priv, double x, double ch)
{
    AFFTFiltContext *s = priv;
    const int max_ch  = s->nb_exprs - 1;
    const int max_bin = s->window_size / 2;
    int ich, ix;

    /* !(v > 0) is true for NaN as well as for v <= 0. */
    ich = !(ch > 0) ? 0 : ch >= max_ch  ? max_ch  : (int)ch;
    ix  = !(x  > 0) ? 0 : x  >= max_bin ? max_bin : (int)x;

    return s->fft_data[ich][ix].re;
}
/*
 * Fetch the imaginary part of a stored FFT bin.
 *
 * priv : opaque pointer to the AFFTFiltContext
 * x    : requested bin index, clamped to [0, window_size / 2]
 * ch   : requested channel index, clamped to [0, nb_exprs - 1]
 *
 * Returns the .im field of s->fft_data[channel][bin].
 *
 * The indices arrive as doubles and are clamped while still in floating
 * point: converting a double that does not fit in an int (or a NaN) to int
 * is undefined behaviour in C. NaN and non-positive values map to index 0.
 */
static inline double getimag(void *priv, double x, double ch)
{
    AFFTFiltContext *s = priv;
    const int max_ch  = s->nb_exprs - 1;
    const int max_bin = s->window_size / 2;
    int ich, ix;

    /* !(v > 0) is true for NaN as well as for v <= 0. */
    ich = !(ch > 0) ? 0 : ch >= max_ch  ? max_ch  : (int)ch;
    ix  = !(x  > 0) ? 0 : x  >= max_bin ? max_bin : (int)x;

    return s->fft_data[ich][ix].im;
}
/* Non-inline entry point that forwards its arguments unchanged to getreal(). */
static double realf(void *priv, double x, double ch)
{
    return getreal(priv, x, ch);
}
/* Non-inline entry point that forwards its arguments unchanged to getimag(). */
static double imagf(void *priv, double x, double ch)
{
    return getimag(priv, x, ch);
}
/* Names of the two-argument functions; entry i is implemented by func2[i].
 * Both tables are NULL-terminated. */
static const char *const func2_names[] = { "real", "imag", NULL };
/* Kept file-local and read-only so that no mutable global symbol named
 * "func2" is exported from this translation unit. */
static double (*const func2[])(void *, double, double) = { realf, imagf, NULL };
static int config_input(AVFilterLink *inlink) static int config_input(AVFilterLink *inlink)
{ {
AVFilterContext *ctx = inlink->dst; AVFilterContext *ctx = inlink->dst;
@ -109,12 +138,22 @@ static int config_input(AVFilterLink *inlink)
if (!s->fft_data) if (!s->fft_data)
return AVERROR(ENOMEM); return AVERROR(ENOMEM);
s->fft_temp = av_calloc(inlink->channels, sizeof(*s->fft_temp));
if (!s->fft_temp)
return AVERROR(ENOMEM);
for (ch = 0; ch < inlink->channels; ch++) { for (ch = 0; ch < inlink->channels; ch++) {
s->fft_data[ch] = av_calloc(s->window_size, sizeof(**s->fft_data)); s->fft_data[ch] = av_calloc(s->window_size, sizeof(**s->fft_data));
if (!s->fft_data[ch]) if (!s->fft_data[ch])
return AVERROR(ENOMEM); return AVERROR(ENOMEM);
} }
for (ch = 0; ch < inlink->channels; ch++) {
s->fft_temp[ch] = av_calloc(s->window_size, sizeof(**s->fft_temp));
if (!s->fft_temp[ch])
return AVERROR(ENOMEM);
}
s->real = av_calloc(inlink->channels, sizeof(*s->real)); s->real = av_calloc(inlink->channels, sizeof(*s->real));
if (!s->real) if (!s->real)
return AVERROR(ENOMEM); return AVERROR(ENOMEM);
@ -131,7 +170,7 @@ static int config_input(AVFilterLink *inlink)
char *arg = av_strtok(ch == 0 ? args : NULL, "|", &saveptr); char *arg = av_strtok(ch == 0 ? args : NULL, "|", &saveptr);
ret = av_expr_parse(&s->real[ch], arg ? arg : last_expr, var_names, ret = av_expr_parse(&s->real[ch], arg ? arg : last_expr, var_names,
NULL, NULL, NULL, NULL, 0, ctx); NULL, NULL, func2_names, func2, 0, ctx);
if (ret < 0) if (ret < 0)
break; break;
if (arg) if (arg)
@ -149,7 +188,7 @@ static int config_input(AVFilterLink *inlink)
char *arg = av_strtok(ch == 0 ? args : NULL, "|", &saveptr); char *arg = av_strtok(ch == 0 ? args : NULL, "|", &saveptr);
ret = av_expr_parse(&s->imag[ch], arg ? arg : last_expr, var_names, ret = av_expr_parse(&s->imag[ch], arg ? arg : last_expr, var_names,
NULL, NULL, NULL, NULL, 0, ctx); NULL, NULL, func2_names, func2, 0, ctx);
if (ret < 0) if (ret < 0)
break; break;
if (arg) if (arg)
@ -235,6 +274,7 @@ static int filter_frame(AVFilterLink *inlink, AVFrame *frame)
for (ch = 0; ch < inlink->channels; ch++) { for (ch = 0; ch < inlink->channels; ch++) {
FFTComplex *fft_data = s->fft_data[ch]; FFTComplex *fft_data = s->fft_data[ch];
FFTComplex *fft_temp = s->fft_temp[ch];
float *buf = (float *)s->buffer->extended_data[ch]; float *buf = (float *)s->buffer->extended_data[ch];
int x; int x;
@ -243,35 +283,37 @@ static int filter_frame(AVFilterLink *inlink, AVFrame *frame)
av_fft_permute(s->fft, fft_data); av_fft_permute(s->fft, fft_data);
av_fft_calc(s->fft, fft_data); av_fft_calc(s->fft, fft_data);
for (n = 0; n < window_size / 2; n++) { for (n = 0; n <= window_size / 2; n++) {
float fr, fi; float fr, fi;
values[VAR_BIN] = n; values[VAR_BIN] = n;
values[VAR_REAL] = fft_data[n].re;
values[VAR_IMAG] = fft_data[n].im;
fr = av_expr_eval(s->real[ch], values, s); fr = av_expr_eval(s->real[ch], values, s);
fi = av_expr_eval(s->imag[ch], values, s); fi = av_expr_eval(s->imag[ch], values, s);
fft_data[n].re *= fr; fft_temp[n].re = fr;
fft_data[n].im *= fi; fft_temp[n].im = fi;
} }
for (n = window_size / 2 + 1, x = window_size / 2 - 1; n < window_size; n++, x--) { for (n = window_size / 2 + 1, x = window_size / 2 - 1; n < window_size; n++, x--) {
fft_data[n].re = fft_data[x].re; fft_temp[n].re = fft_temp[x].re;
fft_data[n].im = -fft_data[x].im; fft_temp[n].im = -fft_temp[x].im;
} }
av_fft_permute(s->ifft, fft_data); av_fft_permute(s->ifft, fft_temp);
av_fft_calc(s->ifft, fft_data); av_fft_calc(s->ifft, fft_temp);
start = s->start; start = s->start;
end = s->end; end = s->end;
k = end; k = end;
for (i = 0, j = start; j < k && i < window_size; i++, j++) { for (i = 0, j = start; j < k && i < window_size; i++, j++) {
buf[j] += s->fft_data[ch][i].re * f; buf[j] += s->fft_temp[ch][i].re * f;
} }
for (; i < window_size; i++, j++) { for (; i < window_size; i++, j++) {
buf[j] = s->fft_data[ch][i].re * f; buf[j] = s->fft_temp[ch][i].re * f;
} }
start += s->hop_size; start += s->hop_size;
@ -362,8 +404,11 @@ static av_cold void uninit(AVFilterContext *ctx)
for (i = 0; i < s->nb_exprs; i++) { for (i = 0; i < s->nb_exprs; i++) {
if (s->fft_data) if (s->fft_data)
av_freep(&s->fft_data[i]); av_freep(&s->fft_data[i]);
if (s->fft_temp)
av_freep(&s->fft_temp[i]);
} }
av_freep(&s->fft_data); av_freep(&s->fft_data);
av_freep(&s->fft_temp);
for (i = 0; i < s->nb_exprs; i++) { for (i = 0; i < s->nb_exprs; i++) {
av_expr_free(s->real[i]); av_expr_free(s->real[i]);