2012-05-21 21:27:59 -04:00
|
|
|
/*
|
|
|
|
* Audio Mix Filter
|
|
|
|
* Copyright (c) 2012 Justin Ruggles <justin.ruggles@gmail.com>
|
|
|
|
*
|
2013-08-15 23:12:51 +02:00
|
|
|
* This file is part of FFmpeg.
|
2012-05-21 21:27:59 -04:00
|
|
|
*
|
2013-08-15 23:12:51 +02:00
|
|
|
* FFmpeg is free software; you can redistribute it and/or
|
2012-05-21 21:27:59 -04:00
|
|
|
* modify it under the terms of the GNU Lesser General Public
|
|
|
|
* License as published by the Free Software Foundation; either
|
|
|
|
* version 2.1 of the License, or (at your option) any later version.
|
|
|
|
*
|
2013-08-15 23:12:51 +02:00
|
|
|
* FFmpeg is distributed in the hope that it will be useful,
|
2012-05-21 21:27:59 -04:00
|
|
|
* but WITHOUT ANY WARRANTY; without even the implied warranty of
|
|
|
|
* MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
|
|
|
|
* Lesser General Public License for more details.
|
|
|
|
*
|
|
|
|
* You should have received a copy of the GNU Lesser General Public
|
2013-08-15 23:12:51 +02:00
|
|
|
* License along with FFmpeg; if not, write to the Free Software
|
2012-05-21 21:27:59 -04:00
|
|
|
* Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
|
|
|
|
*/
|
|
|
|
|
|
|
|
/**
|
|
|
|
* @file
|
|
|
|
* Audio Mix Filter
|
|
|
|
*
|
|
|
|
* Mixes audio from multiple sources into a single output. The channel layout,
|
|
|
|
* sample rate, and sample format will be the same for all inputs and the
|
|
|
|
* output.
|
|
|
|
*/
|
|
|
|
|
2013-04-30 18:30:02 +02:00
|
|
|
#include "libavutil/attributes.h"
|
2012-05-21 21:27:59 -04:00
|
|
|
#include "libavutil/audio_fifo.h"
|
|
|
|
#include "libavutil/avassert.h"
|
|
|
|
#include "libavutil/avstring.h"
|
2012-11-10 10:00:00 -05:00
|
|
|
#include "libavutil/channel_layout.h"
|
2012-08-06 16:49:32 +03:00
|
|
|
#include "libavutil/common.h"
|
2020-04-14 12:38:47 +02:00
|
|
|
#include "libavutil/eval.h"
|
2012-06-08 22:34:30 -04:00
|
|
|
#include "libavutil/float_dsp.h"
|
2012-05-21 21:27:59 -04:00
|
|
|
#include "libavutil/mathematics.h"
|
|
|
|
#include "libavutil/opt.h"
|
|
|
|
#include "libavutil/samplefmt.h"
|
|
|
|
|
|
|
|
#include "audio.h"
|
|
|
|
#include "avfilter.h"
|
2017-08-26 17:47:56 +02:00
|
|
|
#include "filters.h"
|
2012-05-21 21:27:59 -04:00
|
|
|
#include "internal.h"
|
|
|
|
|
|
|
|
/* Bit flags stored per input in the input_state array. */
#define INPUT_ON  1 /**< input is active */
#define INPUT_EOF 2 /**< input has reached EOF (may still be active) */

/* Values of the "duration" option. */
#define DURATION_LONGEST  0
#define DURATION_SHORTEST 1
#define DURATION_FIRST    2
|
|
|
|
|
|
|
|
|
|
|
|
/**
 * Sample count and timestamp of one queued frame; node of a singly linked
 * list.
 */
typedef struct FrameInfo {
    int               nb_samples; /**< number of samples described by this node */
    int64_t           pts;        /**< timestamp associated with this node */
    struct FrameInfo *next;       /**< following node in the list */
} FrameInfo;
|
|
|
|
|
|
|
|
/**
|
|
|
|
* Linked list used to store timestamps and frame sizes of all frames in the
|
|
|
|
* FIFO for the first input.
|
|
|
|
*
|
|
|
|
* This is needed to keep timestamps synchronized for the case where multiple
|
|
|
|
* input frames are pushed to the filter for processing before a frame is
|
|
|
|
* requested by the output link.
|
|
|
|
*/
|
|
|
|
typedef struct FrameList {
|
|
|
|
int nb_frames;
|
|
|
|
int nb_samples;
|
|
|
|
FrameInfo *list;
|
|
|
|
FrameInfo *end;
|
|
|
|
} FrameList;
|
|
|
|
|
|
|
|
/**
 * Free every node of a frame list and reset its counters and pointers.
 *
 * @param frame_list list to empty; NULL is accepted and ignored
 */
static void frame_list_clear(FrameList *frame_list)
{
    FrameInfo *node, *following;

    if (!frame_list)
        return;

    for (node = frame_list->list; node; node = following) {
        following = node->next;
        av_free(node);
    }

    frame_list->list       = NULL;
    frame_list->end        = NULL;
    frame_list->nb_frames  = 0;
    frame_list->nb_samples = 0;
}
|
|
|
|
|
|
|
|
/**
 * @return the sample count of the oldest queued frame, or 0 when the list
 *         is empty
 */
static int frame_list_next_frame_size(FrameList *frame_list)
{
    const FrameInfo *head = frame_list->list;

    return head ? head->nb_samples : 0;
}
|
|
|
|
|
|
|
|
/**
 * @return the timestamp of the oldest queued frame, or AV_NOPTS_VALUE when
 *         the list is empty
 */
static int64_t frame_list_next_pts(FrameList *frame_list)
{
    const FrameInfo *head = frame_list->list;

    return head ? head->pts : AV_NOPTS_VALUE;
}
|
|
|
|
|
|
|
|
/**
 * Drop nb_samples samples from the front of the list.
 *
 * Whole nodes are freed while they fit into the amount to remove. A node
 * that is only partly consumed is shrunk and its pts is advanced by the
 * number of samples taken from it. Removing at least as many samples as the
 * list holds empties the list.
 */
static void frame_list_remove_samples(FrameList *frame_list, int nb_samples)
{
    int remaining = nb_samples;

    if (nb_samples >= frame_list->nb_samples) {
        frame_list_clear(frame_list);
        return;
    }

    while (remaining > 0) {
        FrameInfo *head = frame_list->list;

        av_assert0(head);

        if (head->nb_samples > remaining) {
            /* Only part of the head frame is consumed: trim it in place. */
            head->nb_samples       -= remaining;
            head->pts              += remaining;
            frame_list->nb_samples -= remaining;
            break;
        }

        /* The head frame is consumed entirely: unlink and free it. */
        remaining              -= head->nb_samples;
        frame_list->nb_samples -= head->nb_samples;
        frame_list->nb_frames--;
        frame_list->list = head->next;
        if (!frame_list->list)
            frame_list->end = NULL;
        av_free(head);
    }
}
|
|
|
|
|
|
|
|
/**
 * Append a node describing one frame to the tail of the list.
 *
 * @param frame_list list to extend
 * @param nb_samples sample count of the frame
 * @param pts        timestamp of the frame
 * @return 0 on success, AVERROR(ENOMEM) if the node cannot be allocated
 */
static int frame_list_add_frame(FrameList *frame_list, int nb_samples, int64_t pts)
{
    FrameInfo *node = av_malloc(sizeof(*node));

    if (!node)
        return AVERROR(ENOMEM);

    node->nb_samples = nb_samples;
    node->pts        = pts;
    node->next       = NULL;

    if (frame_list->list) {
        /* A non-empty list must have a tail to link from. */
        av_assert0(frame_list->end);
        frame_list->end->next = node;
    } else {
        frame_list->list = node;
    }
    frame_list->end = node;

    frame_list->nb_samples += nb_samples;
    frame_list->nb_frames++;

    return 0;
}
|
|
|
|
|
2017-08-26 17:47:56 +02:00
|
|
|
/* FIXME: use directly links fifo */
|
2012-05-21 21:27:59 -04:00
|
|
|
|
|
|
|
typedef struct MixContext {
|
|
|
|
const AVClass *class; /**< class for AVOptions */
|
2014-11-18 12:24:16 +01:00
|
|
|
AVFloatDSPContext *fdsp;
|
2012-05-21 21:27:59 -04:00
|
|
|
|
|
|
|
int nb_inputs; /**< number of inputs */
|
|
|
|
int active_inputs; /**< number of input currently active */
|
|
|
|
int duration_mode; /**< mode for determining duration */
|
|
|
|
float dropout_transition; /**< transition time when an input drops out */
|
2018-03-29 13:54:51 +02:00
|
|
|
char *weights_str; /**< string for custom weights for every input */
|
2021-02-12 22:58:13 +01:00
|
|
|
int normalize; /**< if inputs are scaled */
|
2012-05-21 21:27:59 -04:00
|
|
|
|
|
|
|
int nb_channels; /**< number of channels */
|
|
|
|
int sample_rate; /**< sample rate */
|
2012-06-08 23:59:04 -04:00
|
|
|
int planar;
|
2012-05-21 21:27:59 -04:00
|
|
|
AVAudioFifo **fifos; /**< audio fifo for each input */
|
|
|
|
uint8_t *input_state; /**< current state of each input */
|
|
|
|
float *input_scale; /**< mixing scale factor for each input */
|
2018-03-29 13:54:51 +02:00
|
|
|
float *weights; /**< custom weights for every input */
|
|
|
|
float weight_sum; /**< sum of custom weights for every input */
|
|
|
|
float *scale_norm; /**< normalization factor for every input */
|
2012-05-21 21:27:59 -04:00
|
|
|
int64_t next_pts; /**< calculated pts for next output frame */
|
|
|
|
FrameList *frame_list; /**< list of frame info for the first input */
|
|
|
|
} MixContext;
|
|
|
|
|
|
|
|
#define OFFSET(x) offsetof(MixContext, x)
|
|
|
|
#define A AV_OPT_FLAG_AUDIO_PARAM
|
2012-08-13 13:40:01 +02:00
|
|
|
#define F AV_OPT_FLAG_FILTERING_PARAM
|
2020-04-28 12:01:04 +02:00
|
|
|
#define T AV_OPT_FLAG_RUNTIME_PARAM
|
2012-06-22 14:33:09 +02:00
|
|
|
static const AVOption amix_options[] = {
|
2012-05-21 21:27:59 -04:00
|
|
|
{ "inputs", "Number of inputs.",
|
2020-01-06 21:48:38 +08:00
|
|
|
OFFSET(nb_inputs), AV_OPT_TYPE_INT, { .i64 = 2 }, 1, INT16_MAX, A|F },
|
2012-05-21 21:27:59 -04:00
|
|
|
{ "duration", "How to determine the end-of-stream.",
|
2024-02-11 15:41:05 +01:00
|
|
|
OFFSET(duration_mode), AV_OPT_TYPE_INT, { .i64 = DURATION_LONGEST }, 0, 2, A|F, .unit = "duration" },
|
|
|
|
{ "longest", "Duration of longest input.", 0, AV_OPT_TYPE_CONST, { .i64 = DURATION_LONGEST }, 0, 0, A|F, .unit = "duration" },
|
|
|
|
{ "shortest", "Duration of shortest input.", 0, AV_OPT_TYPE_CONST, { .i64 = DURATION_SHORTEST }, 0, 0, A|F, .unit = "duration" },
|
|
|
|
{ "first", "Duration of first input.", 0, AV_OPT_TYPE_CONST, { .i64 = DURATION_FIRST }, 0, 0, A|F, .unit = "duration" },
|
2012-05-21 21:27:59 -04:00
|
|
|
{ "dropout_transition", "Transition time, in seconds, for volume "
|
|
|
|
"renormalization when an input stream ends.",
|
2012-09-05 14:44:05 +02:00
|
|
|
OFFSET(dropout_transition), AV_OPT_TYPE_FLOAT, { .dbl = 2.0 }, 0, INT_MAX, A|F },
|
2018-03-29 13:54:51 +02:00
|
|
|
{ "weights", "Set weight for each input.",
|
2020-04-28 12:01:04 +02:00
|
|
|
OFFSET(weights_str), AV_OPT_TYPE_STRING, {.str="1 1"}, 0, 0, A|F|T },
|
2021-02-12 22:58:13 +01:00
|
|
|
{ "normalize", "Scale inputs",
|
|
|
|
OFFSET(normalize), AV_OPT_TYPE_BOOL, {.i64=1}, 0, 1, A|F|T },
|
2013-09-07 12:13:50 +00:00
|
|
|
{ NULL }
|
2012-05-21 21:27:59 -04:00
|
|
|
};
|
|
|
|
|
2012-06-22 14:33:09 +02:00
|
|
|
AVFILTER_DEFINE_CLASS(amix);
|
2012-05-21 21:27:59 -04:00
|
|
|
|
|
|
|
/**
|
|
|
|
* Update the scaling factors to apply to each input during mixing.
|
|
|
|
*
|
|
|
|
* This balances the full volume range between active inputs and handles
|
|
|
|
* volume transitions when EOF is encountered on an input but mixing continues
|
|
|
|
* with the remaining inputs.
|
|
|
|
*/
|
|
|
|
static void calculate_scales(MixContext *s, int nb_samples)
|
|
|
|
{
|
2018-03-29 13:54:51 +02:00
|
|
|
float weight_sum = 0.f;
|
2012-05-21 21:27:59 -04:00
|
|
|
int i;
|
|
|
|
|
2018-03-29 13:54:51 +02:00
|
|
|
for (i = 0; i < s->nb_inputs; i++)
|
|
|
|
if (s->input_state[i] & INPUT_ON)
|
2019-10-03 10:27:56 +02:00
|
|
|
weight_sum += FFABS(s->weights[i]);
|
2018-03-29 13:54:51 +02:00
|
|
|
|
|
|
|
for (i = 0; i < s->nb_inputs; i++) {
|
|
|
|
if (s->input_state[i] & INPUT_ON) {
|
2019-10-03 10:27:56 +02:00
|
|
|
if (s->scale_norm[i] > weight_sum / FFABS(s->weights[i])) {
|
|
|
|
s->scale_norm[i] -= ((s->weight_sum / FFABS(s->weights[i])) / s->nb_inputs) *
|
2018-03-29 13:54:51 +02:00
|
|
|
nb_samples / (s->dropout_transition * s->sample_rate);
|
2019-10-03 10:27:56 +02:00
|
|
|
s->scale_norm[i] = FFMAX(s->scale_norm[i], weight_sum / FFABS(s->weights[i]));
|
2018-03-29 13:54:51 +02:00
|
|
|
}
|
|
|
|
}
|
2012-05-21 21:27:59 -04:00
|
|
|
}
|
|
|
|
|
|
|
|
for (i = 0; i < s->nb_inputs; i++) {
|
2021-02-03 20:39:35 +01:00
|
|
|
if (s->input_state[i] & INPUT_ON) {
|
2021-02-12 22:58:13 +01:00
|
|
|
if (!s->normalize)
|
|
|
|
s->input_scale[i] = FFABS(s->weights[i]);
|
2021-02-03 20:39:35 +01:00
|
|
|
else
|
|
|
|
s->input_scale[i] = 1.0f / s->scale_norm[i] * FFSIGN(s->weights[i]);
|
|
|
|
} else {
|
2012-05-21 21:27:59 -04:00
|
|
|
s->input_scale[i] = 0.0f;
|
2021-02-03 20:39:35 +01:00
|
|
|
}
|
2012-05-21 21:27:59 -04:00
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
/**
 * Configure the output link and allocate all per-input working state.
 *
 * Sets the output time base to 1/sample_rate, allocates the frame list, one
 * audio FIFO per input, the state/scale arrays, marks every input as active
 * and computes the initial mixing scales.
 *
 * @return 0 on success, AVERROR(ENOMEM) if any allocation fails
 */
static int config_output(AVFilterLink *outlink)
{
    AVFilterContext *ctx = outlink->src;
    MixContext *s        = ctx->priv;
    char layout_desc[64];
    int idx;

    s->planar          = av_sample_fmt_is_planar(outlink->format);
    s->sample_rate     = outlink->sample_rate;
    outlink->time_base = (AVRational){ 1, outlink->sample_rate };
    s->next_pts        = AV_NOPTS_VALUE;

    s->frame_list = av_mallocz(sizeof(*s->frame_list));
    if (!s->frame_list)
        return AVERROR(ENOMEM);

    s->fifos = av_calloc(s->nb_inputs, sizeof(*s->fifos));
    if (!s->fifos)
        return AVERROR(ENOMEM);

    s->nb_channels = outlink->ch_layout.nb_channels;
    for (idx = 0; idx < s->nb_inputs; idx++) {
        AVAudioFifo *fifo = av_audio_fifo_alloc(outlink->format, s->nb_channels, 1024);

        s->fifos[idx] = fifo;
        if (!fifo)
            return AVERROR(ENOMEM);
    }

    s->input_state = av_malloc(s->nb_inputs);
    if (!s->input_state)
        return AVERROR(ENOMEM);
    /* Every input starts out active. */
    memset(s->input_state, INPUT_ON, s->nb_inputs);
    s->active_inputs = s->nb_inputs;

    s->input_scale = av_calloc(s->nb_inputs, sizeof(*s->input_scale));
    s->scale_norm  = av_calloc(s->nb_inputs, sizeof(*s->scale_norm));
    if (!(s->input_scale && s->scale_norm))
        return AVERROR(ENOMEM);

    /* Initial normalization: total weight relative to each input's weight. */
    for (idx = 0; idx < s->nb_inputs; idx++)
        s->scale_norm[idx] = s->weight_sum / FFABS(s->weights[idx]);
    calculate_scales(s, 0);

    av_channel_layout_describe(&outlink->ch_layout, layout_desc, sizeof(layout_desc));

    av_log(ctx, AV_LOG_VERBOSE,
           "inputs:%d fmt:%s srate:%d cl:%s\n", s->nb_inputs,
           av_get_sample_fmt_name(outlink->format), outlink->sample_rate, layout_desc);

    return 0;
}
|
|
|
|
|
|
|
|
/**
|
|
|
|
* Read samples from the input FIFOs, mix, and write to the output link.
|
|
|
|
*/
|
2017-08-26 17:47:56 +02:00
|
|
|
static int output_frame(AVFilterLink *outlink)
|
2012-05-21 21:27:59 -04:00
|
|
|
{
|
|
|
|
AVFilterContext *ctx = outlink->src;
|
|
|
|
MixContext *s = ctx->priv;
|
2012-11-28 08:41:07 +01:00
|
|
|
AVFrame *out_buf, *in_buf;
|
2017-08-26 17:47:56 +02:00
|
|
|
int nb_samples, ns, i;
|
2015-10-24 15:19:11 +02:00
|
|
|
|
|
|
|
if (s->input_state[0] & INPUT_ON) {
|
|
|
|
/* first input live: use the corresponding frame size */
|
|
|
|
nb_samples = frame_list_next_frame_size(s->frame_list);
|
|
|
|
for (i = 1; i < s->nb_inputs; i++) {
|
|
|
|
if (s->input_state[i] & INPUT_ON) {
|
|
|
|
ns = av_audio_fifo_size(s->fifos[i]);
|
|
|
|
if (ns < nb_samples) {
|
|
|
|
if (!(s->input_state[i] & INPUT_EOF))
|
|
|
|
/* unclosed input with not enough samples */
|
2017-08-26 17:47:56 +02:00
|
|
|
return 0;
|
2015-10-24 15:19:11 +02:00
|
|
|
/* closed input to drain */
|
|
|
|
nb_samples = ns;
|
|
|
|
}
|
|
|
|
}
|
|
|
|
}
|
2020-09-13 14:00:27 +02:00
|
|
|
|
|
|
|
s->next_pts = frame_list_next_pts(s->frame_list);
|
2015-10-24 15:19:11 +02:00
|
|
|
} else {
|
|
|
|
/* first input closed: use the available samples */
|
|
|
|
nb_samples = INT_MAX;
|
|
|
|
for (i = 1; i < s->nb_inputs; i++) {
|
|
|
|
if (s->input_state[i] & INPUT_ON) {
|
|
|
|
ns = av_audio_fifo_size(s->fifos[i]);
|
|
|
|
nb_samples = FFMIN(nb_samples, ns);
|
|
|
|
}
|
|
|
|
}
|
2017-08-26 17:47:56 +02:00
|
|
|
if (nb_samples == INT_MAX) {
|
|
|
|
ff_outlink_set_status(outlink, AVERROR_EOF, s->next_pts);
|
|
|
|
return 0;
|
|
|
|
}
|
2015-10-24 15:19:11 +02:00
|
|
|
}
|
|
|
|
|
|
|
|
frame_list_remove_samples(s->frame_list, nb_samples);
|
2012-05-21 21:27:59 -04:00
|
|
|
|
|
|
|
calculate_scales(s, nb_samples);
|
|
|
|
|
2016-04-28 20:49:13 +02:00
|
|
|
if (nb_samples == 0)
|
|
|
|
return 0;
|
|
|
|
|
2012-11-28 08:41:07 +01:00
|
|
|
out_buf = ff_get_audio_buffer(outlink, nb_samples);
|
2012-05-21 21:27:59 -04:00
|
|
|
if (!out_buf)
|
|
|
|
return AVERROR(ENOMEM);
|
|
|
|
|
2012-11-28 08:41:07 +01:00
|
|
|
in_buf = ff_get_audio_buffer(outlink, nb_samples);
|
2012-10-09 16:15:15 +02:00
|
|
|
if (!in_buf) {
|
2012-11-28 08:41:07 +01:00
|
|
|
av_frame_free(&out_buf);
|
2012-05-21 21:27:59 -04:00
|
|
|
return AVERROR(ENOMEM);
|
2012-10-09 16:15:15 +02:00
|
|
|
}
|
2012-05-21 21:27:59 -04:00
|
|
|
|
|
|
|
for (i = 0; i < s->nb_inputs; i++) {
|
2015-10-24 15:19:11 +02:00
|
|
|
if (s->input_state[i] & INPUT_ON) {
|
2012-06-08 23:59:04 -04:00
|
|
|
int planes, plane_size, p;
|
|
|
|
|
2012-05-21 21:27:59 -04:00
|
|
|
av_audio_fifo_read(s->fifos[i], (void **)in_buf->extended_data,
|
|
|
|
nb_samples);
|
2012-06-08 23:59:04 -04:00
|
|
|
|
|
|
|
planes = s->planar ? s->nb_channels : 1;
|
|
|
|
plane_size = nb_samples * (s->planar ? 1 : s->nb_channels);
|
|
|
|
plane_size = FFALIGN(plane_size, 16);
|
|
|
|
|
2017-04-09 22:10:14 +02:00
|
|
|
if (out_buf->format == AV_SAMPLE_FMT_FLT ||
|
|
|
|
out_buf->format == AV_SAMPLE_FMT_FLTP) {
|
|
|
|
for (p = 0; p < planes; p++) {
|
|
|
|
s->fdsp->vector_fmac_scalar((float *)out_buf->extended_data[p],
|
|
|
|
(float *) in_buf->extended_data[p],
|
|
|
|
s->input_scale[i], plane_size);
|
|
|
|
}
|
|
|
|
} else {
|
|
|
|
for (p = 0; p < planes; p++) {
|
|
|
|
s->fdsp->vector_dmac_scalar((double *)out_buf->extended_data[p],
|
|
|
|
(double *) in_buf->extended_data[p],
|
|
|
|
s->input_scale[i], plane_size);
|
|
|
|
}
|
2012-06-08 23:59:04 -04:00
|
|
|
}
|
2012-05-21 21:27:59 -04:00
|
|
|
}
|
|
|
|
}
|
2012-11-28 08:41:07 +01:00
|
|
|
av_frame_free(&in_buf);
|
2012-05-21 21:27:59 -04:00
|
|
|
|
|
|
|
out_buf->pts = s->next_pts;
|
2023-11-28 13:05:49 +01:00
|
|
|
out_buf->duration = av_rescale_q(out_buf->nb_samples, av_make_q(1, outlink->sample_rate),
|
|
|
|
outlink->time_base);
|
|
|
|
|
2012-05-21 21:27:59 -04:00
|
|
|
if (s->next_pts != AV_NOPTS_VALUE)
|
|
|
|
s->next_pts += nb_samples;
|
|
|
|
|
2012-11-28 13:53:48 +01:00
|
|
|
return ff_filter_frame(outlink, out_buf);
|
2012-05-21 21:27:59 -04:00
|
|
|
}
|
|
|
|
|
|
|
|
/**
|
|
|
|
* Requests a frame, if needed, from each input link other than the first.
|
|
|
|
*/
|
|
|
|
static int request_samples(AVFilterContext *ctx, int min_samples)
|
|
|
|
{
|
|
|
|
MixContext *s = ctx->priv;
|
2017-08-26 17:47:56 +02:00
|
|
|
int i;
|
2012-05-21 21:27:59 -04:00
|
|
|
|
|
|
|
av_assert0(s->nb_inputs > 1);
|
2023-10-28 13:41:01 +02:00
|
|
|
if (min_samples == 1 && s->duration_mode == DURATION_FIRST)
|
|
|
|
min_samples = av_audio_fifo_size(s->fifos[0]);
|
2012-05-21 21:27:59 -04:00
|
|
|
|
|
|
|
for (i = 1; i < s->nb_inputs; i++) {
|
2017-08-27 08:49:58 +02:00
|
|
|
if (!(s->input_state[i] & INPUT_ON) ||
|
|
|
|
(s->input_state[i] & INPUT_EOF))
|
2012-05-21 21:27:59 -04:00
|
|
|
continue;
|
2015-10-24 15:19:11 +02:00
|
|
|
if (av_audio_fifo_size(s->fifos[i]) >= min_samples)
|
|
|
|
continue;
|
2017-08-26 17:47:56 +02:00
|
|
|
ff_inlink_request_frame(ctx->inputs[i]);
|
2023-10-28 13:41:01 +02:00
|
|
|
return 0;
|
2012-05-21 21:27:59 -04:00
|
|
|
}
|
2017-08-26 17:47:56 +02:00
|
|
|
return output_frame(ctx->outputs[0]);
|
2012-05-21 21:27:59 -04:00
|
|
|
}
|
|
|
|
|
|
|
|
/**
|
|
|
|
* Calculates the number of active inputs and determines EOF based on the
|
|
|
|
* duration option.
|
|
|
|
*
|
|
|
|
* @return 0 if mixing should continue, or AVERROR_EOF if mixing should stop.
|
|
|
|
*/
|
|
|
|
static int calc_active_inputs(MixContext *s)
|
|
|
|
{
|
|
|
|
int i;
|
|
|
|
int active_inputs = 0;
|
|
|
|
for (i = 0; i < s->nb_inputs; i++)
|
2015-10-24 15:19:11 +02:00
|
|
|
active_inputs += !!(s->input_state[i] & INPUT_ON);
|
2012-05-21 21:27:59 -04:00
|
|
|
s->active_inputs = active_inputs;
|
|
|
|
|
|
|
|
if (!active_inputs ||
|
2015-10-24 15:19:11 +02:00
|
|
|
(s->duration_mode == DURATION_FIRST && !(s->input_state[0] & INPUT_ON)) ||
|
2012-05-21 21:27:59 -04:00
|
|
|
(s->duration_mode == DURATION_SHORTEST && active_inputs != s->nb_inputs))
|
|
|
|
return AVERROR_EOF;
|
|
|
|
return 0;
|
|
|
|
}
|
|
|
|
|
2017-08-26 17:47:56 +02:00
|
|
|
/**
 * Filter scheduling callback.
 *
 * Steps, in order:
 *  1. forward an output status back to all inputs (may return early);
 *  2. move every available input frame into its FIFO (recording size and
 *     rescaled pts for the first input) and try to output after each one;
 *  3. acknowledge input statuses, flagging EOF and switching off inputs
 *     whose FIFO is empty;
 *  4. signal EOF downstream when the duration mode says mixing is over;
 *  5. if the output wants a frame, request the data that is still missing.
 */
static int activate(AVFilterContext *ctx)
{
    AVFilterLink *outlink = ctx->outputs[0];
    MixContext *s         = ctx->priv;
    AVFrame *frame        = NULL;
    int idx, ret;

    FF_FILTER_FORWARD_STATUS_BACK_ALL(outlink, ctx);

    for (idx = 0; idx < s->nb_inputs; idx++) {
        AVFilterLink *inlink = ctx->inputs[idx];

        ret = ff_inlink_consume_frame(inlink, &frame);
        if (ret <= 0)
            continue;

        ret = 0;
        if (idx == 0) {
            /* Remember size and timestamp of first-input frames. */
            int64_t pts = av_rescale_q(frame->pts, inlink->time_base,
                                       outlink->time_base);
            ret = frame_list_add_frame(s->frame_list, frame->nb_samples, pts);
        }
        if (ret >= 0)
            ret = av_audio_fifo_write(s->fifos[idx], (void **)frame->extended_data,
                                      frame->nb_samples);

        /* The samples are copied (or lost on error); the frame is done. */
        av_frame_free(&frame);
        if (ret < 0)
            return ret;

        ret = output_frame(outlink);
        if (ret < 0)
            return ret;
    }

    for (idx = 0; idx < s->nb_inputs; idx++) {
        int64_t pts;
        int status;

        if (!ff_inlink_acknowledge_status(ctx->inputs[idx], &status, &pts))
            continue;
        if (status != AVERROR_EOF)
            continue;

        s->input_state[idx] |= INPUT_EOF;
        /* A closed input stays active until its FIFO has been drained. */
        if (av_audio_fifo_size(s->fifos[idx]) != 0)
            continue;

        s->input_state[idx] &= ~INPUT_ON;
        if (s->nb_inputs == 1) {
            ff_outlink_set_status(outlink, status, pts);
            return 0;
        }
    }

    if (calc_active_inputs(s)) {
        ff_outlink_set_status(outlink, AVERROR_EOF, s->next_pts);
        return 0;
    }

    if (!ff_outlink_frame_wanted(outlink))
        return 0;

    if (!(s->input_state[0] & INPUT_ON))
        return request_samples(ctx, 1);

    if (s->frame_list->nb_frames == 0) {
        ff_inlink_request_frame(ctx->inputs[0]);
        return 0;
    }
    av_assert0(s->frame_list->nb_frames > 0);

    return request_samples(ctx, frame_list_next_frame_size(s->frame_list));
}
|
|
|
|
|
2020-04-28 12:01:04 +02:00
|
|
|
/**
 * Parse the weights option string into the weights array and recompute
 * weight_sum as the sum of the absolute weights.
 *
 * Numbers are read one after another with a single separator character
 * skipped between them. If the string provides fewer values than there are
 * inputs, the last parsed value is reused for the remaining inputs.
 */
static void parse_weights(AVFilterContext *ctx)
{
    MixContext *s = ctx->priv;
    char *cursor  = s->weights_str;
    float weight  = 1.f;
    int idx       = 0;

    s->weight_sum = 0.f;

    while (idx < s->nb_inputs) {
        weight            = av_strtod(cursor, &cursor);
        s->weights[idx++] = weight;
        s->weight_sum    += FFABS(weight);

        /* Stop at the end of the string, otherwise skip one separator. */
        if (!cursor || !*cursor)
            break;
        cursor++;
    }

    /* Inputs without an explicit weight inherit the last one given. */
    while (idx < s->nb_inputs) {
        s->weights[idx++] = weight;
        s->weight_sum    += FFABS(weight);
    }
}
|
|
|
|
|
|
|
|
/**
 * Create one audio input pad per requested input ("input0", "input1", ...),
 * allocate the float DSP context and the weights array, then parse the
 * weights option.
 *
 * @return 0 on success, a negative AVERROR code on failure
 */
static av_cold int init(AVFilterContext *ctx)
{
    MixContext *s = ctx->priv;
    int ret;

    for (int idx = 0; idx < s->nb_inputs; idx++) {
        AVFilterPad pad = { 0 };

        pad.name = av_asprintf("input%d", idx);
        pad.type = AVMEDIA_TYPE_AUDIO;
        if (!pad.name)
            return AVERROR(ENOMEM);

        ret = ff_append_inpad_free_name(ctx, &pad);
        if (ret < 0)
            return ret;
    }

    s->fdsp = avpriv_float_dsp_alloc(0);
    if (!s->fdsp)
        return AVERROR(ENOMEM);

    s->weights = av_calloc(s->nb_inputs, sizeof(*s->weights));
    if (!s->weights)
        return AVERROR(ENOMEM);

    parse_weights(ctx);

    return 0;
}
|
|
|
|
|
2013-04-30 18:30:02 +02:00
|
|
|
/**
 * Release everything owned by the filter context: the per-input FIFOs, the
 * frame list and its nodes, the state/scale/weight arrays and the DSP
 * context.
 */
static av_cold void uninit(AVFilterContext *ctx)
{
    MixContext *s = ctx->priv;

    if (s->fifos) {
        for (int idx = 0; idx < s->nb_inputs; idx++)
            av_audio_fifo_free(s->fifos[idx]);
        av_freep(&s->fifos);
    }

    /* Free the nodes first, then the list header itself. */
    frame_list_clear(s->frame_list);
    av_freep(&s->frame_list);

    av_freep(&s->input_state);
    av_freep(&s->input_scale);
    av_freep(&s->scale_norm);
    av_freep(&s->weights);
    av_freep(&s->fdsp);
}
|
|
|
|
|
2020-04-28 12:01:04 +02:00
|
|
|
/**
 * Runtime command handler.
 *
 * Lets the generic handler apply the command, then re-parses the weights,
 * resets every normalization factor to weight_sum / |weight| and recomputes
 * the mixing scales.
 *
 * @return 0 on success, or the negative error code of the generic handler
 */
static int process_command(AVFilterContext *ctx, const char *cmd, const char *args,
                           char *res, int res_len, int flags)
{
    MixContext *s = ctx->priv;
    int idx;
    int ret = ff_filter_process_command(ctx, cmd, args, res, res_len, flags);

    if (ret < 0)
        return ret;

    parse_weights(ctx);

    idx = 0;
    while (idx < s->nb_inputs) {
        s->scale_norm[idx] = s->weight_sum / FFABS(s->weights[idx]);
        idx++;
    }
    calculate_scales(s, 0);

    return 0;
}
|
|
|
|
|
2012-07-24 14:14:01 +01:00
|
|
|
static const AVFilterPad avfilter_af_amix_outputs[] = {
|
|
|
|
{
|
|
|
|
.name = "default",
|
|
|
|
.type = AVMEDIA_TYPE_AUDIO,
|
|
|
|
.config_props = config_output,
|
|
|
|
},
|
|
|
|
};
|
|
|
|
|
2021-04-19 18:33:56 +02:00
|
|
|
const AVFilter ff_af_amix = {
|
2013-09-07 12:13:50 +00:00
|
|
|
.name = "amix",
|
|
|
|
.description = NULL_IF_CONFIG_SMALL("Audio mixing."),
|
|
|
|
.priv_size = sizeof(MixContext),
|
|
|
|
.priv_class = &amix_class,
|
2012-05-21 21:27:59 -04:00
|
|
|
.init = init,
|
|
|
|
.uninit = uninit,
|
2017-08-26 17:47:56 +02:00
|
|
|
.activate = activate,
|
2013-09-07 12:13:50 +00:00
|
|
|
.inputs = NULL,
|
2021-08-12 13:05:31 +02:00
|
|
|
FILTER_OUTPUTS(avfilter_af_amix_outputs),
|
2021-09-27 13:10:11 +02:00
|
|
|
FILTER_SAMPLEFMTS(AV_SAMPLE_FMT_FLT, AV_SAMPLE_FMT_FLTP,
|
|
|
|
AV_SAMPLE_FMT_DBL, AV_SAMPLE_FMT_DBLP),
|
2020-04-28 12:01:04 +02:00
|
|
|
.process_command = process_command,
|
2013-09-07 12:13:50 +00:00
|
|
|
.flags = AVFILTER_FLAG_DYNAMIC_INPUTS,
|
2012-05-21 21:27:59 -04:00
|
|
|
};
|