mirror of
https://github.com/FFmpeg/FFmpeg.git
synced 2025-01-19 05:49:09 +02:00
43a188847c
If the relevant elements (the color description elements for AV1 and the VUI elements in general for H.264 (since 1156b507)) are absent, then their correct values (usually meaning unknown) have already been inferred by the reading process, so that it is unnecessary to initialize them again in the av1/h264_metadata filters even when they were initially absent. Signed-off-by: Andreas Rheinhardt <andreas.rheinhardt@gmail.com>
309 lines
9.9 KiB
C
309 lines
9.9 KiB
C
/*
|
|
* This file is part of FFmpeg.
|
|
*
|
|
* FFmpeg is free software; you can redistribute it and/or
|
|
* modify it under the terms of the GNU Lesser General Public
|
|
* License as published by the Free Software Foundation; either
|
|
* version 2.1 of the License, or (at your option) any later version.
|
|
*
|
|
* FFmpeg is distributed in the hope that it will be useful,
|
|
* but WITHOUT ANY WARRANTY; without even the implied warranty of
|
|
* MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
|
|
* Lesser General Public License for more details.
|
|
*
|
|
* You should have received a copy of the GNU Lesser General Public
|
|
* License along with FFmpeg; if not, write to the Free Software
|
|
* Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
|
|
*/
|
|
|
|
#include "libavutil/common.h"
|
|
#include "libavutil/opt.h"
|
|
|
|
#include "bsf.h"
|
|
#include "cbs.h"
|
|
#include "cbs_av1.h"
|
|
|
|
/*
 * Possible values of the "td" option, i.e. what to do with the
 * Temporal Delimiter OBU of each packet.
 */
enum {
    PASS   = 0, /* leave the packet's Temporal Delimiter situation as it is */
    INSERT = 1, /* add a Temporal Delimiter if the packet does not start with one */
    REMOVE = 2, /* drop a leading Temporal Delimiter */
};
|
|
|
|
typedef struct AV1MetadataContext {
|
|
const AVClass *class;
|
|
|
|
CodedBitstreamContext *cbc;
|
|
CodedBitstreamFragment access_unit;
|
|
|
|
int td;
|
|
|
|
int color_primaries;
|
|
int transfer_characteristics;
|
|
int matrix_coefficients;
|
|
|
|
int color_range;
|
|
int chroma_sample_position;
|
|
|
|
AVRational tick_rate;
|
|
int num_ticks_per_picture;
|
|
|
|
int delete_padding;
|
|
} AV1MetadataContext;
|
|
|
|
|
|
static int av1_metadata_update_sequence_header(AVBSFContext *bsf,
|
|
AV1RawSequenceHeader *seq)
|
|
{
|
|
AV1MetadataContext *ctx = bsf->priv_data;
|
|
AV1RawColorConfig *clc = &seq->color_config;
|
|
AV1RawTimingInfo *tim = &seq->timing_info;
|
|
|
|
if (ctx->color_primaries >= 0 ||
|
|
ctx->transfer_characteristics >= 0 ||
|
|
ctx->matrix_coefficients >= 0) {
|
|
clc->color_description_present_flag = 1;
|
|
|
|
if (ctx->color_primaries >= 0)
|
|
clc->color_primaries = ctx->color_primaries;
|
|
if (ctx->transfer_characteristics >= 0)
|
|
clc->transfer_characteristics = ctx->transfer_characteristics;
|
|
if (ctx->matrix_coefficients >= 0)
|
|
clc->matrix_coefficients = ctx->matrix_coefficients;
|
|
}
|
|
|
|
if (ctx->color_range >= 0) {
|
|
if (clc->color_primaries == AVCOL_PRI_BT709 &&
|
|
clc->transfer_characteristics == AVCOL_TRC_IEC61966_2_1 &&
|
|
clc->matrix_coefficients == AVCOL_SPC_RGB) {
|
|
av_log(bsf, AV_LOG_WARNING, "Warning: color_range cannot be set "
|
|
"on RGB streams encoded in BT.709 sRGB.\n");
|
|
} else {
|
|
clc->color_range = ctx->color_range;
|
|
}
|
|
}
|
|
|
|
if (ctx->chroma_sample_position >= 0) {
|
|
if (clc->mono_chrome || !clc->subsampling_x || !clc->subsampling_y) {
|
|
av_log(bsf, AV_LOG_WARNING, "Warning: chroma_sample_position "
|
|
"can only be set for 4:2:0 streams.\n");
|
|
} else {
|
|
clc->chroma_sample_position = ctx->chroma_sample_position;
|
|
}
|
|
}
|
|
|
|
if (ctx->tick_rate.num && ctx->tick_rate.den) {
|
|
int num, den;
|
|
|
|
av_reduce(&num, &den, ctx->tick_rate.num, ctx->tick_rate.den,
|
|
UINT32_MAX > INT_MAX ? UINT32_MAX : INT_MAX);
|
|
|
|
tim->time_scale = num;
|
|
tim->num_units_in_display_tick = den;
|
|
seq->timing_info_present_flag = 1;
|
|
|
|
if (ctx->num_ticks_per_picture > 0) {
|
|
tim->equal_picture_interval = 1;
|
|
tim->num_ticks_per_picture_minus_1 =
|
|
ctx->num_ticks_per_picture - 1;
|
|
}
|
|
}
|
|
|
|
return 0;
|
|
}
|
|
|
|
/**
 * Filter callback: fetch the next packet, apply the configured metadata
 * changes to it and write the result back into pkt.
 *
 * Steps, in order: update every sequence header OBU, insert or remove the
 * leading Temporal Delimiter according to the "td" option, optionally delete
 * all Padding OBUs, then reassemble the packet.
 *
 * @param bsf  filter context
 * @param pkt  receives the filtered packet; unreferenced again on failure
 * @return 0 on success, a negative error code otherwise
 */
static int av1_metadata_filter(AVBSFContext *bsf, AVPacket *pkt)
{
    AV1MetadataContext *s      = bsf->priv_data;
    CodedBitstreamFragment *au = &s->access_unit;
    /*
     * NOTE(review): deliberately declared at function scope. Its address is
     * handed to ff_cbs_insert_unit_content() without a buffer reference, so
     * the fragment presumably still points at it while the packet is
     * written -- confirm before narrowing its scope.
     */
    AV1RawOBU new_td;
    int ret, n;

    ret = ff_bsf_get_packet_ref(bsf, pkt);
    if (ret < 0)
        return ret;

    ret = ff_cbs_read_packet(s->cbc, au, pkt);
    if (ret < 0) {
        av_log(bsf, AV_LOG_ERROR, "Failed to read packet.\n");
        goto done;
    }

    /* The code below indexes units[0], so an empty fragment is rejected. */
    if (!au->nb_units) {
        av_log(bsf, AV_LOG_ERROR, "No OBU in packet.\n");
        ret = AVERROR_INVALIDDATA;
        goto done;
    }

    /* Rewrite every sequence header found in the packet. */
    for (n = 0; n < au->nb_units; n++) {
        AV1RawOBU *hdr_obu;

        if (au->units[n].type != AV1_OBU_SEQUENCE_HEADER)
            continue;

        hdr_obu = au->units[n].content;
        ret = av1_metadata_update_sequence_header(bsf, &hdr_obu->obu.sequence_header);
        if (ret < 0)
            goto done;
    }

    /* If a Temporal Delimiter is present, it must be the first OBU. */
    if (au->units[0].type != AV1_OBU_TEMPORAL_DELIMITER) {
        if (s->td == INSERT) {
            new_td = (AV1RawOBU) {
                .header.obu_type = AV1_OBU_TEMPORAL_DELIMITER,
            };

            ret = ff_cbs_insert_unit_content(s->cbc, au, 0, AV1_OBU_TEMPORAL_DELIMITER,
                                             &new_td, NULL);
            if (ret < 0) {
                av_log(bsf, AV_LOG_ERROR, "Failed to insert Temporal Delimiter.\n");
                goto done;
            }
        }
    } else if (s->td == REMOVE) {
        ff_cbs_delete_unit(s->cbc, au, 0);
    }

    /* Walk backwards so deleting a unit never disturbs indices still to visit. */
    if (s->delete_padding) {
        n = au->nb_units;
        while (n-- > 0) {
            if (au->units[n].type == AV1_OBU_PADDING)
                ff_cbs_delete_unit(s->cbc, au, n);
        }
    }

    ret = ff_cbs_write_packet(s->cbc, pkt, au);
    if (ret < 0) {
        av_log(bsf, AV_LOG_ERROR, "Failed to write packet.\n");
        goto done;
    }

    ret = 0;

done:
    /* Shared exit path for success and failure once a packet was obtained. */
    ff_cbs_fragment_reset(s->cbc, au);

    if (ret < 0)
        av_packet_unref(pkt);

    return ret;
}
|
|
|
|
/**
 * Init callback: create the coded bitstream context and, when the input
 * parameters carry extradata, apply the metadata overrides to the sequence
 * headers in it and write the result to the output parameters.
 *
 * @param bsf  filter context
 * @return 0 on success, a negative error code otherwise
 */
static int av1_metadata_init(AVBSFContext *bsf)
{
    AV1MetadataContext *s         = bsf->priv_data;
    CodedBitstreamFragment *extra = &s->access_unit;
    int ret, n;

    ret = ff_cbs_init(&s->cbc, AV_CODEC_ID_AV1, bsf);
    if (ret < 0)
        return ret;

    /* Nothing to rewrite without extradata. */
    if (!bsf->par_in->extradata) {
        ret = 0;
        goto end;
    }

    ret = ff_cbs_read_extradata(s->cbc, extra, bsf->par_in);
    if (ret < 0) {
        av_log(bsf, AV_LOG_ERROR, "Failed to read extradata.\n");
        goto end;
    }

    /* Rewrite every sequence header found in the extradata. */
    for (n = 0; n < extra->nb_units; n++) {
        AV1RawOBU *hdr_obu;

        if (extra->units[n].type != AV1_OBU_SEQUENCE_HEADER)
            continue;

        hdr_obu = extra->units[n].content;
        ret = av1_metadata_update_sequence_header(bsf, &hdr_obu->obu.sequence_header);
        if (ret < 0)
            goto end;
    }

    ret = ff_cbs_write_extradata(s->cbc, bsf->par_out, extra);
    if (ret < 0) {
        av_log(bsf, AV_LOG_ERROR, "Failed to write extradata.\n");
        goto end;
    }

    ret = 0;

end:
    /* Shared exit path: the scratch fragment is reset on success and failure. */
    ff_cbs_fragment_reset(s->cbc, extra);
    return ret;
}
|
|
|
|
/**
 * Close callback: free the scratch fragment and then close the coded
 * bitstream context it was used with.
 *
 * @param bsf  filter context
 */
static void av1_metadata_close(AVBSFContext *bsf)
{
    AV1MetadataContext *s = bsf->priv_data;

    /* The fragment is freed first because freeing it takes the context. */
    ff_cbs_fragment_free(s->cbc, &s->access_unit);
    ff_cbs_close(&s->cbc);
}
|
|
|
|
#define OFFSET(x) offsetof(AV1MetadataContext, x)
|
|
#define FLAGS (AV_OPT_FLAG_VIDEO_PARAM|AV_OPT_FLAG_BSF_PARAM)
|
|
static const AVOption av1_metadata_options[] = {
|
|
{ "td", "Temporal Delimiter OBU",
|
|
OFFSET(td), AV_OPT_TYPE_INT,
|
|
{ .i64 = PASS }, PASS, REMOVE, FLAGS, "td" },
|
|
{ "pass", NULL, 0, AV_OPT_TYPE_CONST,
|
|
{ .i64 = PASS }, .flags = FLAGS, .unit = "td" },
|
|
{ "insert", NULL, 0, AV_OPT_TYPE_CONST,
|
|
{ .i64 = INSERT }, .flags = FLAGS, .unit = "td" },
|
|
{ "remove", NULL, 0, AV_OPT_TYPE_CONST,
|
|
{ .i64 = REMOVE }, .flags = FLAGS, .unit = "td" },
|
|
|
|
{ "color_primaries", "Set color primaries (section 6.4.2)",
|
|
OFFSET(color_primaries), AV_OPT_TYPE_INT,
|
|
{ .i64 = -1 }, -1, 255, FLAGS },
|
|
{ "transfer_characteristics", "Set transfer characteristics (section 6.4.2)",
|
|
OFFSET(transfer_characteristics), AV_OPT_TYPE_INT,
|
|
{ .i64 = -1 }, -1, 255, FLAGS },
|
|
{ "matrix_coefficients", "Set matrix coefficients (section 6.4.2)",
|
|
OFFSET(matrix_coefficients), AV_OPT_TYPE_INT,
|
|
{ .i64 = -1 }, -1, 255, FLAGS },
|
|
|
|
{ "color_range", "Set color range flag (section 6.4.2)",
|
|
OFFSET(color_range), AV_OPT_TYPE_INT,
|
|
{ .i64 = -1 }, -1, 1, FLAGS, "cr" },
|
|
{ "tv", "TV (limited) range", 0, AV_OPT_TYPE_CONST,
|
|
{ .i64 = 0 }, .flags = FLAGS, .unit = "cr" },
|
|
{ "pc", "PC (full) range", 0, AV_OPT_TYPE_CONST,
|
|
{ .i64 = 1 }, .flags = FLAGS, .unit = "cr" },
|
|
|
|
{ "chroma_sample_position", "Set chroma sample position (section 6.4.2)",
|
|
OFFSET(chroma_sample_position), AV_OPT_TYPE_INT,
|
|
{ .i64 = -1 }, -1, 3, FLAGS, "csp" },
|
|
{ "unknown", "Unknown chroma sample position", 0, AV_OPT_TYPE_CONST,
|
|
{ .i64 = AV1_CSP_UNKNOWN }, .flags = FLAGS, .unit = "csp" },
|
|
{ "vertical", "Left chroma sample position", 0, AV_OPT_TYPE_CONST,
|
|
{ .i64 = AV1_CSP_VERTICAL }, .flags = FLAGS, .unit = "csp" },
|
|
{ "colocated", "Top-left chroma sample position", 0, AV_OPT_TYPE_CONST,
|
|
{ .i64 = AV1_CSP_COLOCATED }, .flags = FLAGS, .unit = "csp" },
|
|
|
|
{ "tick_rate", "Set display tick rate (num_units_in_display_tick / time_scale)",
|
|
OFFSET(tick_rate), AV_OPT_TYPE_RATIONAL,
|
|
{ .dbl = 0.0 }, 0, UINT_MAX, FLAGS },
|
|
{ "num_ticks_per_picture", "Set display ticks per picture for CFR streams",
|
|
OFFSET(num_ticks_per_picture), AV_OPT_TYPE_INT,
|
|
{ .i64 = -1 }, -1, INT_MAX, FLAGS },
|
|
|
|
{ "delete_padding", "Delete all Padding OBUs",
|
|
OFFSET(delete_padding), AV_OPT_TYPE_BOOL,
|
|
{ .i64 = 0 }, 0, 1, FLAGS},
|
|
|
|
{ NULL }
|
|
};
|
|
|
|
static const AVClass av1_metadata_class = {
|
|
.class_name = "av1_metadata_bsf",
|
|
.item_name = av_default_item_name,
|
|
.option = av1_metadata_options,
|
|
.version = LIBAVUTIL_VERSION_INT,
|
|
};
|
|
|
|
static const enum AVCodecID av1_metadata_codec_ids[] = {
|
|
AV_CODEC_ID_AV1, AV_CODEC_ID_NONE,
|
|
};
|
|
|
|
const AVBitStreamFilter ff_av1_metadata_bsf = {
|
|
.name = "av1_metadata",
|
|
.priv_data_size = sizeof(AV1MetadataContext),
|
|
.priv_class = &av1_metadata_class,
|
|
.init = &av1_metadata_init,
|
|
.close = &av1_metadata_close,
|
|
.filter = &av1_metadata_filter,
|
|
.codec_ids = av1_metadata_codec_ids,
|
|
};
|