mirror of
https://github.com/FFmpeg/FFmpeg.git
synced 2025-01-24 13:56:33 +02:00
790f793844
There are lots of files that don't need it: The number of object files that actually need it went down from 2011 to 884 here. Keep it for external users in order to not cause breakages. Also improve the other headers a bit while just at it. Signed-off-by: Andreas Rheinhardt <andreas.rheinhardt@outlook.com>
1340 lines
47 KiB
C
1340 lines
47 KiB
C
/*
|
|
* Copyright (c) 2022 Paul B Mahol
|
|
*
|
|
* This file is part of FFmpeg.
|
|
*
|
|
* FFmpeg is free software; you can redistribute it and/or
|
|
* modify it under the terms of the GNU Lesser General Public
|
|
* License as published by the Free Software Foundation; either
|
|
* version 2.1 of the License, or (at your option) any later version.
|
|
*
|
|
* FFmpeg is distributed in the hope that it will be useful,
|
|
* but WITHOUT ANY WARRANTY; without even the implied warranty of
|
|
* MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
|
|
* Lesser General Public License for more details.
|
|
*
|
|
* You should have received a copy of the GNU Lesser General Public
|
|
* License along with FFmpeg; if not, write to the Free Software
|
|
* Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
|
|
*/
|
|
|
|
#include <float.h>
|
|
#include <math.h>
|
|
|
|
#include "libavutil/mem.h"
|
|
#include "libavutil/tx.h"
|
|
#include "libavutil/channel_layout.h"
|
|
#include "libavutil/float_dsp.h"
|
|
#include "libavutil/cpu.h"
|
|
#include "libavutil/opt.h"
|
|
#include "libavutil/parseutils.h"
|
|
#include "audio.h"
|
|
#include "formats.h"
|
|
#include "video.h"
|
|
#include "avfilter.h"
|
|
#include "filters.h"
|
|
#include "internal.h"
|
|
|
|
enum FrequencyScale {
|
|
FSCALE_LINEAR,
|
|
FSCALE_LOG,
|
|
FSCALE_BARK,
|
|
FSCALE_MEL,
|
|
FSCALE_ERBS,
|
|
FSCALE_SQRT,
|
|
FSCALE_CBRT,
|
|
FSCALE_QDRT,
|
|
FSCALE_FM,
|
|
NB_FSCALE
|
|
};
|
|
|
|
enum IntensityScale {
|
|
ISCALE_LOG,
|
|
ISCALE_LINEAR,
|
|
ISCALE_SQRT,
|
|
ISCALE_CBRT,
|
|
ISCALE_QDRT,
|
|
NB_ISCALE
|
|
};
|
|
|
|
enum DirectionMode {
|
|
DIRECTION_LR,
|
|
DIRECTION_RL,
|
|
DIRECTION_UD,
|
|
DIRECTION_DU,
|
|
NB_DIRECTION
|
|
};
|
|
|
|
enum SlideMode {
|
|
SLIDE_REPLACE,
|
|
SLIDE_SCROLL,
|
|
SLIDE_FRAME,
|
|
NB_SLIDE
|
|
};
|
|
|
|
typedef struct ShowCWTContext {
|
|
const AVClass *class;
|
|
int w, h;
|
|
int mode;
|
|
char *rate_str;
|
|
AVRational auto_frame_rate;
|
|
AVRational frame_rate;
|
|
AVTXContext **fft, **ifft;
|
|
av_tx_fn tx_fn, itx_fn;
|
|
int fft_size, ifft_size;
|
|
int pos;
|
|
int64_t in_pts;
|
|
int64_t old_pts;
|
|
int64_t eof_pts;
|
|
float *frequency_band;
|
|
AVComplexFloat **kernel;
|
|
unsigned *index;
|
|
int *kernel_start, *kernel_stop;
|
|
AVFrame *cache;
|
|
AVFrame *outpicref;
|
|
AVFrame *fft_in;
|
|
AVFrame *fft_out;
|
|
AVFrame *dst_x;
|
|
AVFrame *src_x;
|
|
AVFrame *ifft_in;
|
|
AVFrame *ifft_out;
|
|
AVFrame *ch_out;
|
|
AVFrame *over;
|
|
AVFrame *bh_out;
|
|
int nb_threads;
|
|
int nb_channels;
|
|
int nb_consumed_samples;
|
|
int pps;
|
|
int eof;
|
|
int slide;
|
|
int new_frame;
|
|
int direction;
|
|
int hop_size, ihop_size;
|
|
int hop_index, ihop_index;
|
|
int input_padding_size, output_padding_size;
|
|
int input_sample_count, output_sample_count;
|
|
int frequency_band_count;
|
|
float logarithmic_basis;
|
|
int intensity_scale;
|
|
int frequency_scale;
|
|
float minimum_frequency, maximum_frequency;
|
|
float minimum_intensity, maximum_intensity;
|
|
float deviation;
|
|
float bar_ratio;
|
|
int bar_size;
|
|
int sono_size;
|
|
float rotation;
|
|
|
|
AVFloatDSPContext *fdsp;
|
|
} ShowCWTContext;
|
|
|
|
#define OFFSET(x) offsetof(ShowCWTContext, x)
|
|
#define FLAGS AV_OPT_FLAG_FILTERING_PARAM|AV_OPT_FLAG_VIDEO_PARAM
|
|
|
|
static const AVOption showcwt_options[] = {
|
|
{ "size", "set video size", OFFSET(w), AV_OPT_TYPE_IMAGE_SIZE, {.str = "640x512"}, 0, 0, FLAGS },
|
|
{ "s", "set video size", OFFSET(w), AV_OPT_TYPE_IMAGE_SIZE, {.str = "640x512"}, 0, 0, FLAGS },
|
|
{ "rate", "set video rate", OFFSET(rate_str), AV_OPT_TYPE_STRING, {.str = "25"}, 0, 0, FLAGS },
|
|
{ "r", "set video rate", OFFSET(rate_str), AV_OPT_TYPE_STRING, {.str = "25"}, 0, 0, FLAGS },
|
|
{ "scale", "set frequency scale", OFFSET(frequency_scale), AV_OPT_TYPE_INT, {.i64=0}, 0, NB_FSCALE-1, FLAGS, .unit = "scale" },
|
|
{ "linear", "linear", 0, AV_OPT_TYPE_CONST,{.i64=FSCALE_LINEAR}, 0, 0, FLAGS, .unit = "scale" },
|
|
{ "log", "logarithmic", 0, AV_OPT_TYPE_CONST,{.i64=FSCALE_LOG}, 0, 0, FLAGS, .unit = "scale" },
|
|
{ "bark", "bark", 0, AV_OPT_TYPE_CONST,{.i64=FSCALE_BARK}, 0, 0, FLAGS, .unit = "scale" },
|
|
{ "mel", "mel", 0, AV_OPT_TYPE_CONST,{.i64=FSCALE_MEL}, 0, 0, FLAGS, .unit = "scale" },
|
|
{ "erbs", "erbs", 0, AV_OPT_TYPE_CONST,{.i64=FSCALE_ERBS}, 0, 0, FLAGS, .unit = "scale" },
|
|
{ "sqrt", "sqrt", 0, AV_OPT_TYPE_CONST,{.i64=FSCALE_SQRT}, 0, 0, FLAGS, .unit = "scale" },
|
|
{ "cbrt", "cbrt", 0, AV_OPT_TYPE_CONST,{.i64=FSCALE_CBRT}, 0, 0, FLAGS, .unit = "scale" },
|
|
{ "qdrt", "qdrt", 0, AV_OPT_TYPE_CONST,{.i64=FSCALE_QDRT}, 0, 0, FLAGS, .unit = "scale" },
|
|
{ "fm", "fm", 0, AV_OPT_TYPE_CONST,{.i64=FSCALE_FM}, 0, 0, FLAGS, .unit = "scale" },
|
|
{ "iscale", "set intensity scale", OFFSET(intensity_scale),AV_OPT_TYPE_INT, {.i64=0}, 0, NB_ISCALE-1, FLAGS, .unit = "iscale" },
|
|
{ "linear", "linear", 0, AV_OPT_TYPE_CONST,{.i64=ISCALE_LINEAR}, 0, 0, FLAGS, .unit = "iscale" },
|
|
{ "log", "logarithmic", 0, AV_OPT_TYPE_CONST,{.i64=ISCALE_LOG}, 0, 0, FLAGS, .unit = "iscale" },
|
|
{ "sqrt", "sqrt", 0, AV_OPT_TYPE_CONST,{.i64=ISCALE_SQRT}, 0, 0, FLAGS, .unit = "iscale" },
|
|
{ "cbrt", "cbrt", 0, AV_OPT_TYPE_CONST,{.i64=ISCALE_CBRT}, 0, 0, FLAGS, .unit = "iscale" },
|
|
{ "qdrt", "qdrt", 0, AV_OPT_TYPE_CONST,{.i64=ISCALE_QDRT}, 0, 0, FLAGS, .unit = "iscale" },
|
|
{ "min", "set minimum frequency", OFFSET(minimum_frequency), AV_OPT_TYPE_FLOAT, {.dbl = 20.}, 1, 192000, FLAGS },
|
|
{ "max", "set maximum frequency", OFFSET(maximum_frequency), AV_OPT_TYPE_FLOAT, {.dbl = 20000.}, 1, 192000, FLAGS },
|
|
{ "imin", "set minimum intensity", OFFSET(minimum_intensity), AV_OPT_TYPE_FLOAT, {.dbl = 0.}, 0, 1, FLAGS },
|
|
{ "imax", "set maximum intensity", OFFSET(maximum_intensity), AV_OPT_TYPE_FLOAT, {.dbl = 1.}, 0, 1, FLAGS },
|
|
{ "logb", "set logarithmic basis", OFFSET(logarithmic_basis), AV_OPT_TYPE_FLOAT, {.dbl = 0.0001}, 0, 1, FLAGS },
|
|
{ "deviation", "set frequency deviation", OFFSET(deviation), AV_OPT_TYPE_FLOAT, {.dbl = 1.}, 0, 100, FLAGS },
|
|
{ "pps", "set pixels per second", OFFSET(pps), AV_OPT_TYPE_INT, {.i64 = 64}, 1, 1024, FLAGS },
|
|
{ "mode", "set output mode", OFFSET(mode), AV_OPT_TYPE_INT, {.i64=0}, 0, 4, FLAGS, .unit = "mode" },
|
|
{ "magnitude", "magnitude", 0, AV_OPT_TYPE_CONST,{.i64=0}, 0, 0, FLAGS, .unit = "mode" },
|
|
{ "phase", "phase", 0, AV_OPT_TYPE_CONST,{.i64=1}, 0, 0, FLAGS, .unit = "mode" },
|
|
{ "magphase", "magnitude+phase", 0, AV_OPT_TYPE_CONST,{.i64=2}, 0, 0, FLAGS, .unit = "mode" },
|
|
{ "channel", "color per channel", 0, AV_OPT_TYPE_CONST,{.i64=3}, 0, 0, FLAGS, .unit = "mode" },
|
|
{ "stereo", "stereo difference", 0, AV_OPT_TYPE_CONST,{.i64=4}, 0, 0, FLAGS, .unit = "mode" },
|
|
{ "slide", "set slide mode", OFFSET(slide), AV_OPT_TYPE_INT, {.i64=0}, 0, NB_SLIDE-1, FLAGS, .unit = "slide" },
|
|
{ "replace", "replace", 0, AV_OPT_TYPE_CONST,{.i64=SLIDE_REPLACE},0, 0, FLAGS, .unit = "slide" },
|
|
{ "scroll", "scroll", 0, AV_OPT_TYPE_CONST,{.i64=SLIDE_SCROLL}, 0, 0, FLAGS, .unit = "slide" },
|
|
{ "frame", "frame", 0, AV_OPT_TYPE_CONST,{.i64=SLIDE_FRAME}, 0, 0, FLAGS, .unit = "slide" },
|
|
{ "direction", "set direction mode", OFFSET(direction), AV_OPT_TYPE_INT, {.i64=0}, 0, NB_DIRECTION-1, FLAGS, .unit = "direction" },
|
|
{ "lr", "left to right", 0, AV_OPT_TYPE_CONST,{.i64=DIRECTION_LR}, 0, 0, FLAGS, .unit = "direction" },
|
|
{ "rl", "right to left", 0, AV_OPT_TYPE_CONST,{.i64=DIRECTION_RL}, 0, 0, FLAGS, .unit = "direction" },
|
|
{ "ud", "up to down", 0, AV_OPT_TYPE_CONST,{.i64=DIRECTION_UD}, 0, 0, FLAGS, .unit = "direction" },
|
|
{ "du", "down to up", 0, AV_OPT_TYPE_CONST,{.i64=DIRECTION_DU}, 0, 0, FLAGS, .unit = "direction" },
|
|
{ "bar", "set bargraph ratio", OFFSET(bar_ratio), AV_OPT_TYPE_FLOAT, {.dbl = 0.}, 0, 1, FLAGS },
|
|
{ "rotation", "set color rotation", OFFSET(rotation), AV_OPT_TYPE_FLOAT, {.dbl = 0}, -1, 1, FLAGS },
|
|
{ NULL }
|
|
};
|
|
|
|
AVFILTER_DEFINE_CLASS(showcwt);
|
|
|
|
static av_cold void uninit(AVFilterContext *ctx)
|
|
{
|
|
ShowCWTContext *s = ctx->priv;
|
|
|
|
av_freep(&s->frequency_band);
|
|
av_freep(&s->kernel_start);
|
|
av_freep(&s->kernel_stop);
|
|
av_freep(&s->index);
|
|
|
|
av_frame_free(&s->cache);
|
|
av_frame_free(&s->outpicref);
|
|
av_frame_free(&s->fft_in);
|
|
av_frame_free(&s->fft_out);
|
|
av_frame_free(&s->dst_x);
|
|
av_frame_free(&s->src_x);
|
|
av_frame_free(&s->ifft_in);
|
|
av_frame_free(&s->ifft_out);
|
|
av_frame_free(&s->ch_out);
|
|
av_frame_free(&s->over);
|
|
av_frame_free(&s->bh_out);
|
|
|
|
if (s->fft) {
|
|
for (int n = 0; n < s->nb_threads; n++)
|
|
av_tx_uninit(&s->fft[n]);
|
|
av_freep(&s->fft);
|
|
}
|
|
|
|
if (s->ifft) {
|
|
for (int n = 0; n < s->nb_threads; n++)
|
|
av_tx_uninit(&s->ifft[n]);
|
|
av_freep(&s->ifft);
|
|
}
|
|
|
|
if (s->kernel) {
|
|
for (int n = 0; n < s->frequency_band_count; n++)
|
|
av_freep(&s->kernel[n]);
|
|
}
|
|
av_freep(&s->kernel);
|
|
|
|
av_freep(&s->fdsp);
|
|
}
|
|
|
|
static int query_formats(AVFilterContext *ctx)
|
|
{
|
|
AVFilterFormats *formats = NULL;
|
|
AVFilterChannelLayouts *layouts = NULL;
|
|
AVFilterLink *inlink = ctx->inputs[0];
|
|
AVFilterLink *outlink = ctx->outputs[0];
|
|
static const enum AVSampleFormat sample_fmts[] = { AV_SAMPLE_FMT_FLTP, AV_SAMPLE_FMT_NONE };
|
|
static const enum AVPixelFormat pix_fmts[] = { AV_PIX_FMT_YUV444P, AV_PIX_FMT_YUVJ444P, AV_PIX_FMT_YUVA444P, AV_PIX_FMT_NONE };
|
|
int ret;
|
|
|
|
formats = ff_make_format_list(sample_fmts);
|
|
if ((ret = ff_formats_ref(formats, &inlink->outcfg.formats)) < 0)
|
|
return ret;
|
|
|
|
layouts = ff_all_channel_counts();
|
|
if ((ret = ff_channel_layouts_ref(layouts, &inlink->outcfg.channel_layouts)) < 0)
|
|
return ret;
|
|
|
|
formats = ff_all_samplerates();
|
|
if ((ret = ff_formats_ref(formats, &inlink->outcfg.samplerates)) < 0)
|
|
return ret;
|
|
|
|
formats = ff_make_format_list(pix_fmts);
|
|
if ((ret = ff_formats_ref(formats, &outlink->incfg.formats)) < 0)
|
|
return ret;
|
|
|
|
return 0;
|
|
}
|
|
|
|
static float frequency_band(float *frequency_band,
|
|
int frequency_band_count,
|
|
float frequency_range,
|
|
float frequency_offset,
|
|
int frequency_scale, float deviation)
|
|
{
|
|
float ret = 0.f;
|
|
|
|
deviation = sqrtf(deviation / (4.f * M_PI)); // Heisenberg Gabor Limit
|
|
for (int y = 0; y < frequency_band_count; y++) {
|
|
float frequency = frequency_range * (1.f - (float)y / frequency_band_count) + frequency_offset;
|
|
float frequency_derivative = frequency_range / frequency_band_count;
|
|
|
|
switch (frequency_scale) {
|
|
case FSCALE_LOG:
|
|
frequency = powf(2.f, frequency);
|
|
frequency_derivative *= logf(2.f) * frequency;
|
|
break;
|
|
case FSCALE_BARK:
|
|
frequency = 600.f * sinhf(frequency / 6.f);
|
|
frequency_derivative *= sqrtf(frequency * frequency + 360000.f) / 6.f;
|
|
break;
|
|
case FSCALE_MEL:
|
|
frequency = 700.f * (powf(10.f, frequency / 2595.f) - 1.f);
|
|
frequency_derivative *= (frequency + 700.f) * logf(10.f) / 2595.f;
|
|
break;
|
|
case FSCALE_ERBS:
|
|
frequency = 676170.4f / (47.06538f - expf(frequency * 0.08950404f)) - 14678.49f;
|
|
frequency_derivative *= (frequency * frequency + 14990.4f * frequency + 4577850.f) / 160514.f;
|
|
break;
|
|
case FSCALE_SQRT:
|
|
frequency = frequency * frequency;
|
|
frequency_derivative *= 2.f * sqrtf(frequency);
|
|
break;
|
|
case FSCALE_CBRT:
|
|
frequency = frequency * frequency * frequency;
|
|
frequency_derivative *= 3.f * powf(frequency, 2.f / 3.f);
|
|
break;
|
|
case FSCALE_QDRT:
|
|
frequency = frequency * frequency * frequency * frequency;
|
|
frequency_derivative *= 4.f * powf(frequency, 3.f / 4.f);
|
|
break;
|
|
case FSCALE_FM:
|
|
frequency = 2.f * powf(frequency, 3.f / 2.f) / 3.f;
|
|
frequency_derivative *= sqrtf(frequency);
|
|
break;
|
|
}
|
|
|
|
frequency_band[y*2 ] = frequency;
|
|
frequency_band[y*2+1] = frequency_derivative * deviation;
|
|
|
|
ret = 1.f / (frequency_derivative * deviation);
|
|
}
|
|
|
|
return ret;
|
|
}
|
|
|
|
static float remap_log(ShowCWTContext *s, float value, int iscale, float log_factor)
|
|
{
|
|
const float max = s->maximum_intensity;
|
|
const float min = s->minimum_intensity;
|
|
float ret;
|
|
|
|
value += min;
|
|
|
|
switch (iscale) {
|
|
case ISCALE_LINEAR:
|
|
ret = max - expf(value / log_factor);
|
|
break;
|
|
case ISCALE_LOG:
|
|
value = logf(value) * log_factor;
|
|
ret = max - av_clipf(value, 0.f, 1.f);
|
|
break;
|
|
case ISCALE_SQRT:
|
|
value = max - expf(value / log_factor);
|
|
ret = sqrtf(value);
|
|
break;
|
|
case ISCALE_CBRT:
|
|
value = max - expf(value / log_factor);
|
|
ret = cbrtf(value);
|
|
break;
|
|
case ISCALE_QDRT:
|
|
value = max - expf(value / log_factor);
|
|
ret = powf(value, 0.25f);
|
|
break;
|
|
}
|
|
|
|
return av_clipf(ret, 0.f, 1.f);
|
|
}
|
|
|
|
static int run_channel_cwt_prepare(AVFilterContext *ctx, void *arg, int jobnr, int ch)
|
|
{
|
|
ShowCWTContext *s = ctx->priv;
|
|
const int hop_size = s->hop_size;
|
|
AVFrame *fin = arg;
|
|
float *cache = (float *)s->cache->extended_data[ch];
|
|
AVComplexFloat *src = (AVComplexFloat *)s->fft_in->extended_data[ch];
|
|
AVComplexFloat *dst = (AVComplexFloat *)s->fft_out->extended_data[ch];
|
|
const int offset = (s->input_padding_size - hop_size) >> 1;
|
|
|
|
if (fin) {
|
|
const float *input = (const float *)fin->extended_data[ch];
|
|
const int offset = s->hop_size - fin->nb_samples;
|
|
|
|
memmove(cache, &cache[fin->nb_samples], offset * sizeof(float));
|
|
memcpy(&cache[offset], input, fin->nb_samples * sizeof(float));
|
|
}
|
|
|
|
if (fin && s->hop_index + fin->nb_samples < hop_size)
|
|
return 0;
|
|
|
|
memset(src, 0, sizeof(float) * s->fft_size);
|
|
for (int n = 0; n < hop_size; n++)
|
|
src[n+offset].re = cache[n];
|
|
|
|
s->tx_fn(s->fft[jobnr], dst, src, sizeof(*src));
|
|
|
|
return 0;
|
|
}
|
|
|
|
#define DRAW_BAR_COLOR(x) \
|
|
do { \
|
|
if (Y <= ht) { \
|
|
dstY[x] = 0; \
|
|
dstU[x] = 128; \
|
|
dstV[x] = 128; \
|
|
} else { \
|
|
float mul = (Y - ht) * bh[0]; \
|
|
dstY[x] = av_clip_uint8(lrintf(Y * mul * 255.f)); \
|
|
dstU[x] = av_clip_uint8(lrintf((U-0.5f) * 128.f + 128)); \
|
|
dstV[x] = av_clip_uint8(lrintf((V-0.5f) * 128.f + 128)); \
|
|
} \
|
|
} while (0)
|
|
|
|
static void draw_bar(ShowCWTContext *s, int y,
|
|
float Y, float U, float V)
|
|
{
|
|
float *bh = ((float *)s->bh_out->extended_data[0]) + y;
|
|
const ptrdiff_t ylinesize = s->outpicref->linesize[0];
|
|
const ptrdiff_t ulinesize = s->outpicref->linesize[1];
|
|
const ptrdiff_t vlinesize = s->outpicref->linesize[2];
|
|
const int direction = s->direction;
|
|
const int sono_size = s->sono_size;
|
|
const int bar_size = s->bar_size;
|
|
const float rcp_bar_h = 1.f / bar_size;
|
|
uint8_t *dstY, *dstU, *dstV;
|
|
const int w = s->w;
|
|
|
|
bh[0] = 1.f / (Y + 0.0001f);
|
|
switch (direction) {
|
|
case DIRECTION_LR:
|
|
dstY = s->outpicref->data[0] + y * ylinesize;
|
|
dstU = s->outpicref->data[1] + y * ulinesize;
|
|
dstV = s->outpicref->data[2] + y * vlinesize;
|
|
for (int x = 0; x < bar_size; x++) {
|
|
float ht = (bar_size - x) * rcp_bar_h;
|
|
DRAW_BAR_COLOR(x);
|
|
}
|
|
break;
|
|
case DIRECTION_RL:
|
|
dstY = s->outpicref->data[0] + y * ylinesize;
|
|
dstU = s->outpicref->data[1] + y * ulinesize;
|
|
dstV = s->outpicref->data[2] + y * vlinesize;
|
|
for (int x = 0; x < bar_size; x++) {
|
|
float ht = x * rcp_bar_h;
|
|
DRAW_BAR_COLOR(w - bar_size + x);
|
|
}
|
|
break;
|
|
case DIRECTION_UD:
|
|
dstY = s->outpicref->data[0] + w - 1 - y;
|
|
dstU = s->outpicref->data[1] + w - 1 - y;
|
|
dstV = s->outpicref->data[2] + w - 1 - y;
|
|
for (int x = 0; x < bar_size; x++) {
|
|
float ht = (bar_size - x) * rcp_bar_h;
|
|
DRAW_BAR_COLOR(0);
|
|
dstY += ylinesize;
|
|
dstU += ulinesize;
|
|
dstV += vlinesize;
|
|
}
|
|
break;
|
|
case DIRECTION_DU:
|
|
dstY = s->outpicref->data[0] + w - 1 - y + ylinesize * sono_size;
|
|
dstU = s->outpicref->data[1] + w - 1 - y + ulinesize * sono_size;
|
|
dstV = s->outpicref->data[2] + w - 1 - y + vlinesize * sono_size;
|
|
for (int x = 0; x < bar_size; x++) {
|
|
float ht = x * rcp_bar_h;
|
|
DRAW_BAR_COLOR(0);
|
|
dstY += ylinesize;
|
|
dstU += ulinesize;
|
|
dstV += vlinesize;
|
|
}
|
|
break;
|
|
}
|
|
}
|
|
|
|
static int draw(AVFilterContext *ctx, void *arg, int jobnr, int nb_jobs)
|
|
{
|
|
ShowCWTContext *s = ctx->priv;
|
|
const ptrdiff_t ylinesize = s->outpicref->linesize[0];
|
|
const ptrdiff_t ulinesize = s->outpicref->linesize[1];
|
|
const ptrdiff_t vlinesize = s->outpicref->linesize[2];
|
|
const ptrdiff_t alinesize = s->outpicref->linesize[3];
|
|
const float log_factor = 1.f/logf(s->logarithmic_basis);
|
|
const int count = s->frequency_band_count;
|
|
const int start = (count * jobnr) / nb_jobs;
|
|
const int end = (count * (jobnr+1)) / nb_jobs;
|
|
const int nb_channels = s->nb_channels;
|
|
const int iscale = s->intensity_scale;
|
|
const int ihop_index = s->ihop_index;
|
|
const int ihop_size = s->ihop_size;
|
|
const float rotation = s->rotation;
|
|
const int direction = s->direction;
|
|
uint8_t *dstY, *dstU, *dstV, *dstA;
|
|
const int sono_size = s->sono_size;
|
|
const int bar_size = s->bar_size;
|
|
const int mode = s->mode;
|
|
const int w_1 = s->w - 1;
|
|
const int x = s->pos;
|
|
float Y, U, V;
|
|
|
|
for (int y = start; y < end; y++) {
|
|
const AVComplexFloat *src = ((const AVComplexFloat *)s->ch_out->extended_data[y]) +
|
|
0 * ihop_size + ihop_index;
|
|
|
|
if (sono_size <= 0)
|
|
goto skip;
|
|
|
|
switch (direction) {
|
|
case DIRECTION_LR:
|
|
case DIRECTION_RL:
|
|
dstY = s->outpicref->data[0] + y * ylinesize;
|
|
dstU = s->outpicref->data[1] + y * ulinesize;
|
|
dstV = s->outpicref->data[2] + y * vlinesize;
|
|
dstA = s->outpicref->data[3] ? s->outpicref->data[3] + y * alinesize : NULL;
|
|
break;
|
|
case DIRECTION_UD:
|
|
case DIRECTION_DU:
|
|
dstY = s->outpicref->data[0] + x * ylinesize + w_1 - y;
|
|
dstU = s->outpicref->data[1] + x * ulinesize + w_1 - y;
|
|
dstV = s->outpicref->data[2] + x * vlinesize + w_1 - y;
|
|
dstA = s->outpicref->data[3] ? s->outpicref->data[3] + x * alinesize + w_1 - y : NULL;
|
|
break;
|
|
}
|
|
|
|
switch (s->slide) {
|
|
case SLIDE_REPLACE:
|
|
case SLIDE_FRAME:
|
|
/* nothing to do here */
|
|
break;
|
|
case SLIDE_SCROLL:
|
|
switch (s->direction) {
|
|
case DIRECTION_RL:
|
|
memmove(dstY, dstY + 1, w_1);
|
|
memmove(dstU, dstU + 1, w_1);
|
|
memmove(dstV, dstV + 1, w_1);
|
|
if (dstA != NULL)
|
|
memmove(dstA, dstA + 1, w_1);
|
|
break;
|
|
case DIRECTION_LR:
|
|
memmove(dstY + 1, dstY, w_1);
|
|
memmove(dstU + 1, dstU, w_1);
|
|
memmove(dstV + 1, dstV, w_1);
|
|
if (dstA != NULL)
|
|
memmove(dstA + 1, dstA, w_1);
|
|
break;
|
|
}
|
|
break;
|
|
}
|
|
|
|
if (direction == DIRECTION_RL ||
|
|
direction == DIRECTION_LR) {
|
|
dstY += x;
|
|
dstU += x;
|
|
dstV += x;
|
|
if (dstA != NULL)
|
|
dstA += x;
|
|
}
|
|
skip:
|
|
|
|
switch (mode) {
|
|
case 4:
|
|
{
|
|
const AVComplexFloat *src2 = (nb_channels > 1) ? src + ihop_size: src;
|
|
float z, u, v;
|
|
|
|
z = hypotf(src[0].re + src2[0].re, src[0].im + src2[0].im);
|
|
u = hypotf(src[0].re, src[0].im);
|
|
v = hypotf(src2[0].re, src2[0].im);
|
|
|
|
z = remap_log(s, z, iscale, log_factor);
|
|
u = remap_log(s, u, iscale, log_factor);
|
|
v = remap_log(s, v, iscale, log_factor);
|
|
|
|
Y = z;
|
|
U = sinf((v - u) * M_PI_2);
|
|
V = sinf((u - v) * M_PI_2);
|
|
|
|
u = U * cosf(rotation * M_PI) - V * sinf(rotation * M_PI);
|
|
v = U * sinf(rotation * M_PI) + V * cosf(rotation * M_PI);
|
|
|
|
U = 0.5f + 0.5f * z * u;
|
|
V = 0.5f + 0.5f * z * v;
|
|
|
|
if (sono_size > 0) {
|
|
dstY[0] = av_clip_uint8(lrintf(Y * 255.f));
|
|
dstU[0] = av_clip_uint8(lrintf(U * 255.f));
|
|
dstV[0] = av_clip_uint8(lrintf(V * 255.f));
|
|
if (dstA)
|
|
dstA[0] = dstY[0];
|
|
}
|
|
|
|
if (bar_size > 0)
|
|
draw_bar(s, y, Y, U, V);
|
|
}
|
|
break;
|
|
case 3:
|
|
{
|
|
const int nb_channels = s->nb_channels;
|
|
const float yf = 1.f / nb_channels;
|
|
|
|
Y = 0.f;
|
|
U = V = 0.5f;
|
|
for (int ch = 0; ch < nb_channels; ch++) {
|
|
const AVComplexFloat *srcn = src + ihop_size * ch;
|
|
float z;
|
|
|
|
z = hypotf(srcn[0].re, srcn[0].im);
|
|
z = remap_log(s, z, iscale, log_factor);
|
|
|
|
Y += z * yf;
|
|
U += z * yf * sinf(2.f * M_PI * (ch * yf + rotation));
|
|
V += z * yf * cosf(2.f * M_PI * (ch * yf + rotation));
|
|
}
|
|
|
|
if (sono_size > 0) {
|
|
dstY[0] = av_clip_uint8(lrintf(Y * 255.f));
|
|
dstU[0] = av_clip_uint8(lrintf(U * 255.f));
|
|
dstV[0] = av_clip_uint8(lrintf(V * 255.f));
|
|
if (dstA)
|
|
dstA[0] = dstY[0];
|
|
}
|
|
|
|
if (bar_size > 0)
|
|
draw_bar(s, y, Y, U, V);
|
|
}
|
|
break;
|
|
case 2:
|
|
Y = hypotf(src[0].re, src[0].im);
|
|
Y = remap_log(s, Y, iscale, log_factor);
|
|
U = atan2f(src[0].im, src[0].re);
|
|
U = 0.5f + 0.5f * U * Y / M_PI;
|
|
V = 1.f - U;
|
|
|
|
if (sono_size > 0) {
|
|
dstY[0] = av_clip_uint8(lrintf(Y * 255.f));
|
|
dstU[0] = av_clip_uint8(lrintf(U * 255.f));
|
|
dstV[0] = av_clip_uint8(lrintf(V * 255.f));
|
|
if (dstA)
|
|
dstA[0] = dstY[0];
|
|
}
|
|
|
|
if (bar_size > 0)
|
|
draw_bar(s, y, Y, U, V);
|
|
break;
|
|
case 1:
|
|
Y = atan2f(src[0].im, src[0].re);
|
|
Y = 0.5f + 0.5f * Y / M_PI;
|
|
|
|
if (sono_size > 0) {
|
|
dstY[0] = av_clip_uint8(lrintf(Y * 255.f));
|
|
if (dstA)
|
|
dstA[0] = dstY[0];
|
|
}
|
|
|
|
if (bar_size > 0)
|
|
draw_bar(s, y, Y, 0.5f, 0.5f);
|
|
break;
|
|
case 0:
|
|
Y = hypotf(src[0].re, src[0].im);
|
|
Y = remap_log(s, Y, iscale, log_factor);
|
|
|
|
if (sono_size > 0) {
|
|
dstY[0] = av_clip_uint8(lrintf(Y * 255.f));
|
|
if (dstA)
|
|
dstA[0] = dstY[0];
|
|
}
|
|
|
|
if (bar_size > 0)
|
|
draw_bar(s, y, Y, 0.5f, 0.5f);
|
|
break;
|
|
}
|
|
}
|
|
|
|
return 0;
|
|
}
|
|
|
|
static int run_channel_cwt(AVFilterContext *ctx, void *arg, int jobnr, int nb_jobs)
|
|
{
|
|
ShowCWTContext *s = ctx->priv;
|
|
const int ch = *(int *)arg;
|
|
const AVComplexFloat *fft_out = (const AVComplexFloat *)s->fft_out->extended_data[ch];
|
|
AVComplexFloat *isrc = (AVComplexFloat *)s->ifft_in->extended_data[jobnr];
|
|
AVComplexFloat *idst = (AVComplexFloat *)s->ifft_out->extended_data[jobnr];
|
|
const int output_padding_size = s->output_padding_size;
|
|
const int input_padding_size = s->input_padding_size;
|
|
const float scale = 1.f / input_padding_size;
|
|
const int ihop_size = s->ihop_size;
|
|
const int count = s->frequency_band_count;
|
|
const int start = (count * jobnr) / nb_jobs;
|
|
const int end = (count * (jobnr+1)) / nb_jobs;
|
|
|
|
for (int y = start; y < end; y++) {
|
|
AVComplexFloat *chout = ((AVComplexFloat *)s->ch_out->extended_data[y]) + ch * ihop_size;
|
|
AVComplexFloat *over = ((AVComplexFloat *)s->over->extended_data[ch]) + y * ihop_size;
|
|
AVComplexFloat *dstx = (AVComplexFloat *)s->dst_x->extended_data[jobnr];
|
|
AVComplexFloat *srcx = (AVComplexFloat *)s->src_x->extended_data[jobnr];
|
|
const AVComplexFloat *kernel = s->kernel[y];
|
|
const unsigned *index = (const unsigned *)s->index;
|
|
const int kernel_start = s->kernel_start[y];
|
|
const int kernel_stop = s->kernel_stop[y];
|
|
const int kernel_range = kernel_stop - kernel_start + 1;
|
|
int offset;
|
|
|
|
if (kernel_start >= 0) {
|
|
offset = 0;
|
|
memcpy(srcx, fft_out + kernel_start, sizeof(*fft_out) * kernel_range);
|
|
} else {
|
|
offset = -kernel_start;
|
|
memcpy(srcx+offset, fft_out, sizeof(*fft_out) * (kernel_range-offset));
|
|
memcpy(srcx, fft_out+input_padding_size-offset, sizeof(*fft_out)*offset);
|
|
}
|
|
|
|
s->fdsp->vector_fmul_scalar((float *)srcx, (const float *)srcx, scale, FFALIGN(kernel_range * 2, 4));
|
|
s->fdsp->vector_fmul((float *)dstx, (const float *)srcx,
|
|
(const float *)kernel, FFALIGN(kernel_range * 2, 16));
|
|
|
|
memset(isrc, 0, sizeof(*isrc) * output_padding_size);
|
|
if (offset == 0) {
|
|
const unsigned *kindex = index + kernel_start;
|
|
for (int i = 0; i < kernel_range; i++) {
|
|
const unsigned n = kindex[i];
|
|
|
|
isrc[n].re += dstx[i].re;
|
|
isrc[n].im += dstx[i].im;
|
|
}
|
|
} else {
|
|
for (int i = 0; i < kernel_range; i++) {
|
|
const unsigned n = (i-kernel_start) & (output_padding_size-1);
|
|
|
|
isrc[n].re += dstx[i].re;
|
|
isrc[n].im += dstx[i].im;
|
|
}
|
|
}
|
|
|
|
s->itx_fn(s->ifft[jobnr], idst, isrc, sizeof(*isrc));
|
|
|
|
memcpy(chout, idst, sizeof(*chout) * ihop_size);
|
|
for (int n = 0; n < ihop_size; n++) {
|
|
chout[n].re += over[n].re;
|
|
chout[n].im += over[n].im;
|
|
}
|
|
memcpy(over, idst + ihop_size, sizeof(*over) * ihop_size);
|
|
}
|
|
|
|
return 0;
|
|
}
|
|
|
|
static int compute_kernel(AVFilterContext *ctx)
|
|
{
|
|
ShowCWTContext *s = ctx->priv;
|
|
const int size = s->input_padding_size;
|
|
const int output_sample_count = s->output_sample_count;
|
|
const int fsize = s->frequency_band_count;
|
|
int *kernel_start = s->kernel_start;
|
|
int *kernel_stop = s->kernel_stop;
|
|
unsigned *index = s->index;
|
|
int range_min = INT_MAX;
|
|
int range_max = 0, ret = 0;
|
|
float *tkernel;
|
|
|
|
tkernel = av_malloc_array(size, sizeof(*tkernel));
|
|
if (!tkernel)
|
|
return AVERROR(ENOMEM);
|
|
|
|
for (int y = 0; y < fsize; y++) {
|
|
AVComplexFloat *kernel = s->kernel[y];
|
|
int start = INT_MIN, stop = INT_MAX;
|
|
const float frequency = s->frequency_band[y*2];
|
|
const float deviation = 1.f / (s->frequency_band[y*2+1] *
|
|
output_sample_count);
|
|
const int a = FFMAX(frequency-12.f*sqrtf(1.f/deviation)-0.5f, -size);
|
|
const int b = FFMIN(frequency+12.f*sqrtf(1.f/deviation)-0.5f, size+a);
|
|
const int range = -a;
|
|
|
|
memset(tkernel, 0, size * sizeof(*tkernel));
|
|
for (int n = a; n < b; n++) {
|
|
float ff, f = n+0.5f-frequency;
|
|
|
|
ff = expf(-f*f*deviation);
|
|
tkernel[n+range] = ff;
|
|
}
|
|
|
|
for (int n = a; n < b; n++) {
|
|
if (tkernel[n+range] != 0.f) {
|
|
if (tkernel[n+range] > FLT_MIN)
|
|
av_log(ctx, AV_LOG_DEBUG, "out of range kernel %g\n", tkernel[n+range]);
|
|
start = n;
|
|
break;
|
|
}
|
|
}
|
|
|
|
for (int n = b; n >= a; n--) {
|
|
if (tkernel[n+range] != 0.f) {
|
|
if (tkernel[n+range] > FLT_MIN)
|
|
av_log(ctx, AV_LOG_DEBUG, "out of range kernel %g\n", tkernel[n+range]);
|
|
stop = n;
|
|
break;
|
|
}
|
|
}
|
|
|
|
if (start == INT_MIN || stop == INT_MAX) {
|
|
ret = AVERROR(EINVAL);
|
|
break;
|
|
}
|
|
|
|
kernel_start[y] = start;
|
|
kernel_stop[y] = stop;
|
|
|
|
kernel = av_calloc(FFALIGN(stop-start+1, 16), sizeof(*kernel));
|
|
if (!kernel) {
|
|
ret = AVERROR(ENOMEM);
|
|
break;
|
|
}
|
|
|
|
for (int n = 0; n <= stop - start; n++) {
|
|
kernel[n].re = tkernel[n+range+start];
|
|
kernel[n].im = tkernel[n+range+start];
|
|
}
|
|
|
|
range_min = FFMIN(range_min, stop+1-start);
|
|
range_max = FFMAX(range_max, stop+1-start);
|
|
|
|
s->kernel[y] = kernel;
|
|
}
|
|
|
|
for (int n = 0; n < size; n++)
|
|
index[n] = n & (s->output_padding_size - 1);
|
|
|
|
av_log(ctx, AV_LOG_DEBUG, "range_min: %d\n", range_min);
|
|
av_log(ctx, AV_LOG_DEBUG, "range_max: %d\n", range_max);
|
|
|
|
av_freep(&tkernel);
|
|
|
|
return ret;
|
|
}
|
|
|
|
static int config_output(AVFilterLink *outlink)
|
|
{
|
|
AVFilterContext *ctx = outlink->src;
|
|
AVFilterLink *inlink = ctx->inputs[0];
|
|
ShowCWTContext *s = ctx->priv;
|
|
const float limit_frequency = inlink->sample_rate * 0.5f;
|
|
float maximum_frequency = fminf(s->maximum_frequency, limit_frequency);
|
|
float minimum_frequency = s->minimum_frequency;
|
|
float scale = 1.f, factor;
|
|
int ret;
|
|
|
|
if (minimum_frequency >= maximum_frequency) {
|
|
av_log(ctx, AV_LOG_ERROR, "min frequency (%f) >= (%f) max frequency\n",
|
|
minimum_frequency, maximum_frequency);
|
|
return AVERROR(EINVAL);
|
|
}
|
|
|
|
uninit(ctx);
|
|
|
|
s->fdsp = avpriv_float_dsp_alloc(0);
|
|
if (!s->fdsp)
|
|
return AVERROR(ENOMEM);
|
|
|
|
switch (s->direction) {
|
|
case DIRECTION_LR:
|
|
case DIRECTION_RL:
|
|
s->bar_size = s->w * s->bar_ratio;
|
|
s->sono_size = s->w - s->bar_size;
|
|
s->frequency_band_count = s->h;
|
|
break;
|
|
case DIRECTION_UD:
|
|
case DIRECTION_DU:
|
|
s->bar_size = s->h * s->bar_ratio;
|
|
s->sono_size = s->h - s->bar_size;
|
|
s->frequency_band_count = s->w;
|
|
break;
|
|
}
|
|
|
|
switch (s->frequency_scale) {
|
|
case FSCALE_LOG:
|
|
minimum_frequency = logf(minimum_frequency) / logf(2.f);
|
|
maximum_frequency = logf(maximum_frequency) / logf(2.f);
|
|
break;
|
|
case FSCALE_BARK:
|
|
minimum_frequency = 6.f * asinhf(minimum_frequency / 600.f);
|
|
maximum_frequency = 6.f * asinhf(maximum_frequency / 600.f);
|
|
break;
|
|
case FSCALE_MEL:
|
|
minimum_frequency = 2595.f * log10f(1.f + minimum_frequency / 700.f);
|
|
maximum_frequency = 2595.f * log10f(1.f + maximum_frequency / 700.f);
|
|
break;
|
|
case FSCALE_ERBS:
|
|
minimum_frequency = 11.17268f * logf(1.f + (46.06538f * minimum_frequency) / (minimum_frequency + 14678.49f));
|
|
maximum_frequency = 11.17268f * logf(1.f + (46.06538f * maximum_frequency) / (maximum_frequency + 14678.49f));
|
|
break;
|
|
case FSCALE_SQRT:
|
|
minimum_frequency = sqrtf(minimum_frequency);
|
|
maximum_frequency = sqrtf(maximum_frequency);
|
|
break;
|
|
case FSCALE_CBRT:
|
|
minimum_frequency = cbrtf(minimum_frequency);
|
|
maximum_frequency = cbrtf(maximum_frequency);
|
|
break;
|
|
case FSCALE_QDRT:
|
|
minimum_frequency = powf(minimum_frequency, 0.25f);
|
|
maximum_frequency = powf(maximum_frequency, 0.25f);
|
|
break;
|
|
case FSCALE_FM:
|
|
minimum_frequency = powf(9.f * (minimum_frequency * minimum_frequency) / 4.f, 1.f / 3.f);
|
|
maximum_frequency = powf(9.f * (maximum_frequency * maximum_frequency) / 4.f, 1.f / 3.f);
|
|
break;
|
|
}
|
|
|
|
s->frequency_band = av_calloc(s->frequency_band_count,
|
|
sizeof(*s->frequency_band) * 2);
|
|
if (!s->frequency_band)
|
|
return AVERROR(ENOMEM);
|
|
|
|
s->nb_consumed_samples = inlink->sample_rate *
|
|
frequency_band(s->frequency_band,
|
|
s->frequency_band_count, maximum_frequency - minimum_frequency,
|
|
minimum_frequency, s->frequency_scale, s->deviation);
|
|
s->nb_consumed_samples = FFMIN(s->nb_consumed_samples, 65536);
|
|
|
|
s->nb_threads = FFMIN(s->frequency_band_count, ff_filter_get_nb_threads(ctx));
|
|
s->nb_channels = inlink->ch_layout.nb_channels;
|
|
s->old_pts = AV_NOPTS_VALUE;
|
|
s->eof_pts = AV_NOPTS_VALUE;
|
|
|
|
s->input_sample_count = 1 << (32 - ff_clz(s->nb_consumed_samples));
|
|
s->input_padding_size = 1 << (32 - ff_clz(s->input_sample_count));
|
|
s->output_sample_count = FFMAX(1, av_rescale(s->input_sample_count, s->pps, inlink->sample_rate));
|
|
s->output_padding_size = 1 << (32 - ff_clz(s->output_sample_count));
|
|
|
|
s->hop_size = s->input_sample_count;
|
|
s->ihop_size = s->output_padding_size >> 1;
|
|
|
|
outlink->w = s->w;
|
|
outlink->h = s->h;
|
|
outlink->sample_aspect_ratio = (AVRational){1,1};
|
|
|
|
s->fft_size = FFALIGN(s->input_padding_size, av_cpu_max_align());
|
|
s->ifft_size = FFALIGN(s->output_padding_size, av_cpu_max_align());
|
|
|
|
s->fft = av_calloc(s->nb_threads, sizeof(*s->fft));
|
|
if (!s->fft)
|
|
return AVERROR(ENOMEM);
|
|
|
|
for (int n = 0; n < s->nb_threads; n++) {
|
|
ret = av_tx_init(&s->fft[n], &s->tx_fn, AV_TX_FLOAT_FFT, 0, s->input_padding_size, &scale, 0);
|
|
if (ret < 0)
|
|
return ret;
|
|
}
|
|
|
|
s->ifft = av_calloc(s->nb_threads, sizeof(*s->ifft));
|
|
if (!s->ifft)
|
|
return AVERROR(ENOMEM);
|
|
|
|
for (int n = 0; n < s->nb_threads; n++) {
|
|
ret = av_tx_init(&s->ifft[n], &s->itx_fn, AV_TX_FLOAT_FFT, 1, s->output_padding_size, &scale, 0);
|
|
if (ret < 0)
|
|
return ret;
|
|
}
|
|
|
|
s->outpicref = ff_get_video_buffer(outlink, outlink->w, outlink->h);
|
|
s->fft_in = ff_get_audio_buffer(inlink, s->fft_size * 2);
|
|
s->fft_out = ff_get_audio_buffer(inlink, s->fft_size * 2);
|
|
s->dst_x = av_frame_alloc();
|
|
s->src_x = av_frame_alloc();
|
|
s->kernel = av_calloc(s->frequency_band_count, sizeof(*s->kernel));
|
|
s->cache = ff_get_audio_buffer(inlink, s->hop_size);
|
|
s->over = ff_get_audio_buffer(inlink, s->frequency_band_count * 2 * s->ihop_size);
|
|
s->bh_out = ff_get_audio_buffer(inlink, s->frequency_band_count);
|
|
s->ifft_in = av_frame_alloc();
|
|
s->ifft_out = av_frame_alloc();
|
|
s->ch_out = av_frame_alloc();
|
|
s->index = av_calloc(s->input_padding_size, sizeof(*s->index));
|
|
s->kernel_start = av_calloc(s->frequency_band_count, sizeof(*s->kernel_start));
|
|
s->kernel_stop = av_calloc(s->frequency_band_count, sizeof(*s->kernel_stop));
|
|
if (!s->outpicref || !s->fft_in || !s->fft_out || !s->src_x || !s->dst_x || !s->over ||
|
|
!s->ifft_in || !s->ifft_out || !s->kernel_start || !s->kernel_stop || !s->ch_out ||
|
|
!s->cache || !s->index || !s->bh_out || !s->kernel)
|
|
return AVERROR(ENOMEM);
|
|
|
|
s->ch_out->format = inlink->format;
|
|
s->ch_out->nb_samples = 2 * s->ihop_size * inlink->ch_layout.nb_channels;
|
|
s->ch_out->ch_layout.nb_channels = s->frequency_band_count;
|
|
ret = av_frame_get_buffer(s->ch_out, 0);
|
|
if (ret < 0)
|
|
return ret;
|
|
|
|
s->ifft_in->format = inlink->format;
|
|
s->ifft_in->nb_samples = s->ifft_size * 2;
|
|
s->ifft_in->ch_layout.nb_channels = s->nb_threads;
|
|
ret = av_frame_get_buffer(s->ifft_in, 0);
|
|
if (ret < 0)
|
|
return ret;
|
|
|
|
s->ifft_out->format = inlink->format;
|
|
s->ifft_out->nb_samples = s->ifft_size * 2;
|
|
s->ifft_out->ch_layout.nb_channels = s->nb_threads;
|
|
ret = av_frame_get_buffer(s->ifft_out, 0);
|
|
if (ret < 0)
|
|
return ret;
|
|
|
|
s->src_x->format = inlink->format;
|
|
s->src_x->nb_samples = s->fft_size * 2;
|
|
s->src_x->ch_layout.nb_channels = s->nb_threads;
|
|
ret = av_frame_get_buffer(s->src_x, 0);
|
|
if (ret < 0)
|
|
return ret;
|
|
|
|
s->dst_x->format = inlink->format;
|
|
s->dst_x->nb_samples = s->fft_size * 2;
|
|
s->dst_x->ch_layout.nb_channels = s->nb_threads;
|
|
ret = av_frame_get_buffer(s->dst_x, 0);
|
|
if (ret < 0)
|
|
return ret;
|
|
|
|
s->outpicref->sample_aspect_ratio = (AVRational){1,1};
|
|
|
|
for (int y = 0; y < outlink->h; y++) {
|
|
memset(s->outpicref->data[0] + y * s->outpicref->linesize[0], 0, outlink->w);
|
|
memset(s->outpicref->data[1] + y * s->outpicref->linesize[1], 128, outlink->w);
|
|
memset(s->outpicref->data[2] + y * s->outpicref->linesize[2], 128, outlink->w);
|
|
if (s->outpicref->data[3])
|
|
memset(s->outpicref->data[3] + y * s->outpicref->linesize[3], 0, outlink->w);
|
|
}
|
|
|
|
s->outpicref->color_range = AVCOL_RANGE_JPEG;
|
|
|
|
factor = s->input_padding_size / (float)inlink->sample_rate;
|
|
for (int n = 0; n < s->frequency_band_count; n++) {
|
|
s->frequency_band[2*n ] *= factor;
|
|
s->frequency_band[2*n+1] *= factor;
|
|
}
|
|
|
|
av_log(ctx, AV_LOG_DEBUG, "factor: %f\n", factor);
|
|
av_log(ctx, AV_LOG_DEBUG, "nb_consumed_samples: %d\n", s->nb_consumed_samples);
|
|
av_log(ctx, AV_LOG_DEBUG, "hop_size: %d\n", s->hop_size);
|
|
av_log(ctx, AV_LOG_DEBUG, "ihop_size: %d\n", s->ihop_size);
|
|
av_log(ctx, AV_LOG_DEBUG, "input_sample_count: %d\n", s->input_sample_count);
|
|
av_log(ctx, AV_LOG_DEBUG, "input_padding_size: %d\n", s->input_padding_size);
|
|
av_log(ctx, AV_LOG_DEBUG, "output_sample_count: %d\n", s->output_sample_count);
|
|
av_log(ctx, AV_LOG_DEBUG, "output_padding_size: %d\n", s->output_padding_size);
|
|
|
|
switch (s->direction) {
|
|
case DIRECTION_LR:
|
|
case DIRECTION_UD:
|
|
s->pos = s->bar_size;
|
|
break;
|
|
case DIRECTION_RL:
|
|
case DIRECTION_DU:
|
|
s->pos = s->sono_size;
|
|
break;
|
|
}
|
|
|
|
s->auto_frame_rate = av_make_q(inlink->sample_rate, s->hop_size);
|
|
if (strcmp(s->rate_str, "auto")) {
|
|
ret = av_parse_video_rate(&s->frame_rate, s->rate_str);
|
|
} else {
|
|
s->frame_rate = s->auto_frame_rate;
|
|
}
|
|
outlink->frame_rate = s->frame_rate;
|
|
outlink->time_base = av_inv_q(outlink->frame_rate);
|
|
|
|
ret = compute_kernel(ctx);
|
|
if (ret < 0)
|
|
return ret;
|
|
|
|
return 0;
|
|
}
|
|
|
|
static int output_frame(AVFilterContext *ctx)
|
|
{
|
|
AVFilterLink *outlink = ctx->outputs[0];
|
|
AVFilterLink *inlink = ctx->inputs[0];
|
|
ShowCWTContext *s = ctx->priv;
|
|
const int nb_planes = 3 + (s->outpicref->data[3] != NULL);
|
|
int ret;
|
|
|
|
switch (s->slide) {
|
|
case SLIDE_SCROLL:
|
|
switch (s->direction) {
|
|
case DIRECTION_UD:
|
|
for (int p = 0; p < nb_planes; p++) {
|
|
ptrdiff_t linesize = s->outpicref->linesize[p];
|
|
|
|
for (int y = s->h - 1; y > s->bar_size; y--) {
|
|
uint8_t *dst = s->outpicref->data[p] + y * linesize;
|
|
|
|
memmove(dst, dst - linesize, s->w);
|
|
}
|
|
}
|
|
break;
|
|
case DIRECTION_DU:
|
|
for (int p = 0; p < nb_planes; p++) {
|
|
ptrdiff_t linesize = s->outpicref->linesize[p];
|
|
|
|
for (int y = 0; y < s->sono_size; y++) {
|
|
uint8_t *dst = s->outpicref->data[p] + y * linesize;
|
|
|
|
memmove(dst, dst + linesize, s->w);
|
|
}
|
|
}
|
|
break;
|
|
}
|
|
break;
|
|
}
|
|
|
|
ff_filter_execute(ctx, draw, NULL, NULL, s->nb_threads);
|
|
|
|
switch (s->slide) {
|
|
case SLIDE_REPLACE:
|
|
case SLIDE_FRAME:
|
|
switch (s->direction) {
|
|
case DIRECTION_LR:
|
|
s->pos++;
|
|
if (s->pos >= s->w) {
|
|
s->pos = s->bar_size;
|
|
s->new_frame = 1;
|
|
}
|
|
break;
|
|
case DIRECTION_RL:
|
|
s->pos--;
|
|
if (s->pos < 0) {
|
|
s->pos = s->sono_size;
|
|
s->new_frame = 1;
|
|
}
|
|
break;
|
|
case DIRECTION_UD:
|
|
s->pos++;
|
|
if (s->pos >= s->h) {
|
|
s->pos = s->bar_size;
|
|
s->new_frame = 1;
|
|
}
|
|
break;
|
|
case DIRECTION_DU:
|
|
s->pos--;
|
|
if (s->pos < 0) {
|
|
s->pos = s->sono_size;
|
|
s->new_frame = 1;
|
|
}
|
|
break;
|
|
}
|
|
break;
|
|
case SLIDE_SCROLL:
|
|
switch (s->direction) {
|
|
case DIRECTION_UD:
|
|
case DIRECTION_LR:
|
|
s->pos = s->bar_size;
|
|
break;
|
|
case DIRECTION_RL:
|
|
case DIRECTION_DU:
|
|
s->pos = s->sono_size;
|
|
break;
|
|
}
|
|
break;
|
|
}
|
|
|
|
if (s->slide == SLIDE_FRAME && s->eof) {
|
|
switch (s->direction) {
|
|
case DIRECTION_LR:
|
|
for (int p = 0; p < nb_planes; p++) {
|
|
ptrdiff_t linesize = s->outpicref->linesize[p];
|
|
const int size = s->w - s->pos;
|
|
const int fill = p > 0 && p < 3 ? 128 : 0;
|
|
const int x = s->pos;
|
|
|
|
for (int y = 0; y < s->h; y++) {
|
|
uint8_t *dst = s->outpicref->data[p] + y * linesize + x;
|
|
|
|
memset(dst, fill, size);
|
|
}
|
|
}
|
|
break;
|
|
case DIRECTION_RL:
|
|
for (int p = 0; p < nb_planes; p++) {
|
|
ptrdiff_t linesize = s->outpicref->linesize[p];
|
|
const int size = s->w - s->pos;
|
|
const int fill = p > 0 && p < 3 ? 128 : 0;
|
|
|
|
for (int y = 0; y < s->h; y++) {
|
|
uint8_t *dst = s->outpicref->data[p] + y * linesize;
|
|
|
|
memset(dst, fill, size);
|
|
}
|
|
}
|
|
break;
|
|
case DIRECTION_UD:
|
|
for (int p = 0; p < nb_planes; p++) {
|
|
ptrdiff_t linesize = s->outpicref->linesize[p];
|
|
const int fill = p > 0 && p < 3 ? 128 : 0;
|
|
|
|
for (int y = s->pos; y < s->h; y++) {
|
|
uint8_t *dst = s->outpicref->data[p] + y * linesize;
|
|
|
|
memset(dst, fill, s->w);
|
|
}
|
|
}
|
|
break;
|
|
case DIRECTION_DU:
|
|
for (int p = 0; p < nb_planes; p++) {
|
|
ptrdiff_t linesize = s->outpicref->linesize[p];
|
|
const int fill = p > 0 && p < 3 ? 128 : 0;
|
|
|
|
for (int y = s->h - s->pos; y >= 0; y--) {
|
|
uint8_t *dst = s->outpicref->data[p] + y * linesize;
|
|
|
|
memset(dst, fill, s->w);
|
|
}
|
|
}
|
|
break;
|
|
}
|
|
}
|
|
|
|
s->new_frame = s->slide == SLIDE_FRAME && (s->new_frame || s->eof);
|
|
|
|
if (s->slide != SLIDE_FRAME || s->new_frame == 1) {
|
|
int64_t pts_offset = s->new_frame ? 0LL : av_rescale(s->ihop_index, s->hop_size, s->ihop_size);
|
|
const int offset = (s->input_padding_size - s->hop_size) >> 1;
|
|
|
|
pts_offset = av_rescale_q(pts_offset - offset, av_make_q(1, inlink->sample_rate), inlink->time_base);
|
|
s->outpicref->pts = av_rescale_q(s->in_pts + pts_offset, inlink->time_base, outlink->time_base);
|
|
s->outpicref->duration = 1;
|
|
}
|
|
|
|
s->ihop_index++;
|
|
if (s->ihop_index >= s->ihop_size)
|
|
s->ihop_index = s->hop_index = 0;
|
|
|
|
if (s->slide == SLIDE_FRAME && s->new_frame == 0)
|
|
return 1;
|
|
|
|
if (s->old_pts < s->outpicref->pts) {
|
|
AVFrame *out = ff_get_video_buffer(outlink, outlink->w, outlink->h);
|
|
if (!out)
|
|
return AVERROR(ENOMEM);
|
|
ret = av_frame_copy_props(out, s->outpicref);
|
|
if (ret < 0)
|
|
goto fail;
|
|
ret = av_frame_copy(out, s->outpicref);
|
|
if (ret < 0)
|
|
goto fail;
|
|
s->old_pts = s->outpicref->pts;
|
|
s->new_frame = 0;
|
|
ret = ff_filter_frame(outlink, out);
|
|
if (ret <= 0)
|
|
return ret;
|
|
fail:
|
|
av_frame_free(&out);
|
|
return ret;
|
|
}
|
|
|
|
return 1;
|
|
}
|
|
|
|
static int run_channels_cwt_prepare(AVFilterContext *ctx, void *arg, int jobnr, int nb_jobs)
|
|
{
|
|
ShowCWTContext *s = ctx->priv;
|
|
const int count = s->nb_channels;
|
|
const int start = (count * jobnr) / nb_jobs;
|
|
const int end = (count * (jobnr+1)) / nb_jobs;
|
|
|
|
for (int ch = start; ch < end; ch++)
|
|
run_channel_cwt_prepare(ctx, arg, jobnr, ch);
|
|
|
|
return 0;
|
|
}
|
|
|
|
static int activate(AVFilterContext *ctx)
|
|
{
|
|
AVFilterLink *inlink = ctx->inputs[0];
|
|
AVFilterLink *outlink = ctx->outputs[0];
|
|
ShowCWTContext *s = ctx->priv;
|
|
int ret = 0, status;
|
|
int64_t pts;
|
|
|
|
FF_FILTER_FORWARD_STATUS_BACK(outlink, inlink);
|
|
|
|
if (s->outpicref) {
|
|
AVFrame *fin = NULL;
|
|
|
|
if (s->hop_index < s->hop_size) {
|
|
if (!s->eof) {
|
|
ret = ff_inlink_consume_samples(inlink, 1, s->hop_size - s->hop_index, &fin);
|
|
if (ret < 0)
|
|
return ret;
|
|
}
|
|
|
|
if (ret > 0 || s->eof) {
|
|
ff_filter_execute(ctx, run_channels_cwt_prepare, fin, NULL,
|
|
FFMIN(s->nb_threads, s->nb_channels));
|
|
if (fin) {
|
|
if (s->hop_index == 0) {
|
|
s->in_pts = fin->pts;
|
|
if (s->old_pts == AV_NOPTS_VALUE)
|
|
s->old_pts = av_rescale_q(s->in_pts, inlink->time_base, outlink->time_base) - 1;
|
|
}
|
|
s->hop_index += fin->nb_samples;
|
|
av_frame_free(&fin);
|
|
} else {
|
|
s->hop_index = s->hop_size;
|
|
}
|
|
}
|
|
}
|
|
|
|
if (s->hop_index >= s->hop_size || s->ihop_index > 0) {
|
|
for (int ch = 0; ch < s->nb_channels && s->ihop_index == 0; ch++) {
|
|
ff_filter_execute(ctx, run_channel_cwt, (void *)&ch, NULL,
|
|
s->nb_threads);
|
|
}
|
|
|
|
ret = output_frame(ctx);
|
|
if (ret != 1)
|
|
return ret;
|
|
}
|
|
}
|
|
|
|
if (s->eof) {
|
|
if (s->slide == SLIDE_FRAME)
|
|
ret = output_frame(ctx);
|
|
ff_outlink_set_status(outlink, AVERROR_EOF, s->eof_pts);
|
|
return ret;
|
|
}
|
|
|
|
if (!s->eof && ff_inlink_acknowledge_status(inlink, &status, &pts)) {
|
|
if (status == AVERROR_EOF) {
|
|
s->eof = 1;
|
|
ff_filter_set_ready(ctx, 10);
|
|
s->eof_pts = av_rescale_q(pts, inlink->time_base, outlink->time_base);
|
|
return 0;
|
|
}
|
|
}
|
|
|
|
if (ff_inlink_queued_samples(inlink) > 0 || s->ihop_index ||
|
|
s->hop_index >= s->hop_size || s->eof) {
|
|
ff_filter_set_ready(ctx, 10);
|
|
return 0;
|
|
}
|
|
|
|
if (ff_outlink_frame_wanted(outlink)) {
|
|
ff_inlink_request_frame(inlink);
|
|
return 0;
|
|
}
|
|
|
|
return FFERROR_NOT_READY;
|
|
}
|
|
|
|
static const AVFilterPad showcwt_outputs[] = {
|
|
{
|
|
.name = "default",
|
|
.type = AVMEDIA_TYPE_VIDEO,
|
|
.config_props = config_output,
|
|
},
|
|
};
|
|
|
|
const AVFilter ff_avf_showcwt = {
|
|
.name = "showcwt",
|
|
.description = NULL_IF_CONFIG_SMALL("Convert input audio to a CWT (Continuous Wavelet Transform) spectrum video output."),
|
|
.uninit = uninit,
|
|
.priv_size = sizeof(ShowCWTContext),
|
|
FILTER_INPUTS(ff_audio_default_filterpad),
|
|
FILTER_OUTPUTS(showcwt_outputs),
|
|
FILTER_QUERY_FUNC(query_formats),
|
|
.activate = activate,
|
|
.priv_class = &showcwt_class,
|
|
.flags = AVFILTER_FLAG_SLICE_THREADS,
|
|
};
|