1
0
mirror of https://github.com/FFmpeg/FFmpeg.git synced 2025-11-23 21:54:53 +02:00
Files
FFmpeg/libavcodec/libmpeghdec.c
Andreas Rheinhardt 188440929d avcodec/libmpeghdec: Check channel layouts generically
Signed-off-by: Andreas Rheinhardt <andreas.rheinhardt@outlook.com>
2025-09-26 05:38:46 +02:00

232 lines
8.3 KiB
C

/*
* MPEG-H 3D Audio Decoder Wrapper
* Copyright (C) 2025 Fraunhofer Institute for Integrated Circuits IIS
*
* This file is part of FFmpeg.
*
* FFmpeg is free software; you can redistribute it and/or
* modify it under the terms of the GNU Lesser General Public
* License as published by the Free Software Foundation; either
* version 2.1 of the License, or (at your option) any later version.
*
* FFmpeg is distributed in the hope that it will be useful,
* but WITHOUT ANY WARRANTY; without even the implied warranty of
* MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
* Lesser General Public License for more details.
*
* You should have received a copy of the GNU Lesser General Public
* License along with FFmpeg; if not, write to the Free Software
* Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
*/
/*
* Please note that this FFmpeg Software is licensed under the LGPL-2.1
* but is combined with software that is licensed under different terms, namely
* the "Software License for The Fraunhofer FDK MPEG-H Software". Fraunhofer
* as the initial licensor does not interpret the LGPL-2.1 as requiring
* distribution of the MPEG-H Software under the LGPL-2.1 if being distributed
* together with this FFmpeg Software. Therefore, downstream distribution of
* FFmpeg Software does not imply any right to redistribute the MPEG-H Software
* under the LGPL-2.1.
*/
#include <string.h>
#include <mpeghdec/mpeghdecoder.h>
#include "libavutil/channel_layout.h"
#include "libavutil/frame.h"
#include "libavutil/mem.h"
#include "codec_internal.h"
#include "decode.h"
#define MAX_LOST_FRAMES 2
// max framesize * (max delay frames + 1)
#define PER_CHANNEL_OUTBUF_SIZE (3072 * (MAX_LOST_FRAMES + 1))
typedef struct MPEGH3DADecContext {
// pointer to the decoder
HANDLE_MPEGH_DECODER_CONTEXT decoder;
// Internal values
int32_t *decoder_buffer;
int decoder_buffer_size; ///< in samples
} MPEGH3DADecContext;
static av_cold int mpegh3dadec_close(AVCodecContext *avctx)
{
MPEGH3DADecContext *s = avctx->priv_data;
if (s->decoder)
mpeghdecoder_destroy(s->decoder);
s->decoder = NULL;
av_freep(&s->decoder_buffer);
return 0;
}
// Lookup CICP for FFmpeg channel layout, see:
// https://github.com/Fraunhofer-IIS/mpeghdec/wiki/MPEG-H-decoder-target-layouts
static av_cold int channel_layout_to_cicp(const AVChannelLayout *layout)
{
// different from AV_CH_LAYOUT_7POINT2POINT3
#define CH_LAYOUT_7POINT2POINT3 AV_CH_LAYOUT_5POINT1POINT2 | AV_CH_SIDE_SURROUND_LEFT | \
AV_CH_SIDE_SURROUND_RIGHT | AV_CH_TOP_BACK_CENTER | \
AV_CH_LOW_FREQUENCY_2
#define CH_LAYOUT_5POINT1POINT6 AV_CH_LAYOUT_5POINT1POINT4_BACK | \
AV_CH_TOP_FRONT_CENTER | AV_CH_TOP_CENTER
#define CH_LAYOUT_7POINT1POINT6 AV_CH_LAYOUT_7POINT1POINT4_BACK | \
AV_CH_TOP_FRONT_CENTER | AV_CH_TOP_CENTER
static const uint64_t channel_layout_masks[] = {
0,
AV_CH_LAYOUT_MONO, AV_CH_LAYOUT_STEREO,
AV_CH_LAYOUT_SURROUND, AV_CH_LAYOUT_4POINT0,
AV_CH_LAYOUT_5POINT0, AV_CH_LAYOUT_5POINT1,
AV_CH_LAYOUT_7POINT1_WIDE, 0,
AV_CH_LAYOUT_2_1, AV_CH_LAYOUT_2_2,
AV_CH_LAYOUT_6POINT1, AV_CH_LAYOUT_7POINT1,
AV_CH_LAYOUT_22POINT2, AV_CH_LAYOUT_5POINT1POINT2,
CH_LAYOUT_7POINT2POINT3, AV_CH_LAYOUT_5POINT1POINT4_BACK,
CH_LAYOUT_5POINT1POINT6, CH_LAYOUT_7POINT1POINT6,
AV_CH_LAYOUT_7POINT1POINT4_BACK,
};
for (size_t i = 0; i < FF_ARRAY_ELEMS(channel_layout_masks); ++i) {
if (channel_layout_masks[i]) {
AVChannelLayout ch_layout;
av_channel_layout_from_mask(&ch_layout, channel_layout_masks[i]);
if (!av_channel_layout_compare(layout, &ch_layout))
return i;
}
}
return 0;
}
static av_cold int mpegh3dadec_init(AVCodecContext *avctx)
{
int cicp;
MPEGH3DADecContext *s = avctx->priv_data;
if (avctx->ch_layout.nb_channels == 0) {
av_log(avctx, AV_LOG_ERROR, "Channel layout needs to be specified\n");
return AVERROR(EINVAL);
} else if ((cicp = channel_layout_to_cicp(&avctx->ch_layout)) <= 0) {
av_log(avctx, AV_LOG_ERROR, "Unsupported channel layout\n");
return AVERROR(EINVAL);
}
s->decoder = NULL;
avctx->delay = 0;
avctx->sample_fmt = AV_SAMPLE_FMT_S32;
avctx->sample_rate = 48000;
s->decoder_buffer_size = PER_CHANNEL_OUTBUF_SIZE * avctx->ch_layout.nb_channels;
s->decoder_buffer = av_malloc_array(s->decoder_buffer_size, sizeof(*s->decoder_buffer));
if (!s->decoder_buffer)
return AVERROR(ENOMEM);
// initialize the decoder
s->decoder = mpeghdecoder_init(cicp);
if (s->decoder == NULL) {
av_log(avctx, AV_LOG_ERROR, "MPEG-H decoder library init failed.\n");
return AVERROR_EXTERNAL;
}
if (avctx->extradata_size) {
if (mpeghdecoder_setMhaConfig(s->decoder, avctx->extradata,
avctx->extradata_size)) {
av_log(avctx, AV_LOG_ERROR, "Unable to set MHA configuration\n");
return AVERROR_INVALIDDATA;
}
}
return 0;
}
static int mpegh3dadec_decode_frame(AVCodecContext *avctx, AVFrame *frame,
int *got_frame_ptr, AVPacket *avpkt)
{
MPEGH3DADecContext *s = avctx->priv_data;
int ret;
MPEGH_DECODER_ERROR err;
MPEGH_DECODER_OUTPUT_INFO out_info;
if (!avctx->sample_rate) {
av_log(avctx, AV_LOG_ERROR, "Audio sample rate is not set");
return AVERROR_INVALIDDATA;
}
if (avpkt->data != NULL && avpkt->size > 0) {
if ((err = mpeghdecoder_processTimescale(s->decoder, avpkt->data,
avpkt->size, avpkt->pts,
avctx->sample_rate))) {
av_log(avctx, AV_LOG_ERROR, "mpeghdecoder_process() failed: %x\n",
err);
return AVERROR_INVALIDDATA;
}
} else {
// we are flushing
err = mpeghdecoder_flushAndGet(s->decoder);
if (err != MPEGH_DEC_OK && err != MPEGH_DEC_FEED_DATA)
av_log(avctx, AV_LOG_WARNING,
"mpeghdecoder_flushAndGet() failed: %d\n", err);
}
err = mpeghdecoder_getSamples(s->decoder, s->decoder_buffer,
s->decoder_buffer_size,
&out_info);
if (err == MPEGH_DEC_FEED_DATA) {
// no frames to produce at the moment
return avpkt->size;
} else if (err) {
av_log(avctx, AV_LOG_ERROR, "mpeghdecoder_getSamples() failed: %x\n",
err);
return AVERROR_UNKNOWN;
}
frame->nb_samples = out_info.numSamplesPerChannel;
frame->sample_rate = avctx->sample_rate = out_info.sampleRate;
frame->pts = out_info.ticks;
frame->time_base.num = 1;
frame->time_base.den = out_info.sampleRate;
if ((ret = ff_get_buffer(avctx, frame, 0)) < 0)
return ret;
memcpy(frame->extended_data[0], s->decoder_buffer,
avctx->ch_layout.nb_channels * frame->nb_samples *
sizeof(*s->decoder_buffer) /* only AV_SAMPLE_FMT_S32 is supported */);
*got_frame_ptr = 1;
return ret = avpkt->size;
}
static av_cold void mpegh3dadec_flush(AVCodecContext *avctx)
{
MPEGH_DECODER_ERROR err;
MPEGH3DADecContext *s = avctx->priv_data;
err = mpeghdecoder_flush(s->decoder);
if (err != MPEGH_DEC_OK && err != MPEGH_DEC_FEED_DATA)
av_log(avctx, AV_LOG_WARNING, "mpeghdecoder_flush failed: %d\n", err);
}
const FFCodec ff_libmpeghdec_decoder = {
.p.name = "libmpeghdec",
CODEC_LONG_NAME("libmpeghdec (MPEG-H 3D Audio)"),
.p.type = AVMEDIA_TYPE_AUDIO,
.p.id = AV_CODEC_ID_MPEGH_3D_AUDIO,
.p.capabilities = AV_CODEC_CAP_DR1 | AV_CODEC_CAP_DELAY |
AV_CODEC_CAP_CHANNEL_CONF,
.caps_internal = FF_CODEC_CAP_INIT_CLEANUP,
.priv_data_size = sizeof(MPEGH3DADecContext),
.init = mpegh3dadec_init,
FF_CODEC_DECODE_CB(mpegh3dadec_decode_frame),
.flush = mpegh3dadec_flush,
.close = mpegh3dadec_close,
.p.wrapper_name = "libmpeghdec",
};