mirror of
https://github.com/FFmpeg/FFmpeg.git
synced 2025-01-13 21:28:01 +02:00
e45ed15594
Some containers, like Matroska, may propagate key frames with no Sequence Header OBU since it's provided in extradata instead. With this change, the Sequence Header will be appended to the packet data before calling aom_codec_decode(). Signed-off-by: James Almer <jamrial@gmail.com>
237 lines
7.8 KiB
C
237 lines
7.8 KiB
C
/*
|
|
* Copyright (c) 2010, Google, Inc.
|
|
*
|
|
* This file is part of FFmpeg.
|
|
*
|
|
* FFmpeg is free software; you can redistribute it and/or
|
|
* modify it under the terms of the GNU Lesser General Public
|
|
* License as published by the Free Software Foundation; either
|
|
* version 2.1 of the License, or (at your option) any later version.
|
|
*
|
|
* FFmpeg is distributed in the hope that it will be useful,
|
|
* but WITHOUT ANY WARRANTY; without even the implied warranty of
|
|
* MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
|
|
* Lesser General Public License for more details.
|
|
*
|
|
* You should have received a copy of the GNU Lesser General Public
|
|
* License along with FFmpeg; if not, write to the Free Software
|
|
* Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
|
|
*/
|
|
|
|
/**
|
|
* @file
|
|
* AV1 decoder support via libaom
|
|
*/
|
|
|
|
#include <aom/aom_decoder.h>
|
|
#include <aom/aomdx.h>
|
|
|
|
#include "libavutil/common.h"
|
|
#include "libavutil/imgutils.h"
|
|
|
|
#include "avcodec.h"
|
|
#include "internal.h"
|
|
#include "profiles.h"
|
|
|
|
typedef struct AV1DecodeContext {
|
|
struct aom_codec_ctx decoder;
|
|
} AV1DecodeContext;
|
|
|
|
static av_cold int aom_init(AVCodecContext *avctx,
|
|
const struct aom_codec_iface *iface)
|
|
{
|
|
AV1DecodeContext *ctx = avctx->priv_data;
|
|
struct aom_codec_dec_cfg deccfg = {
|
|
/* token partitions+1 would be a decent choice */
|
|
.threads = FFMIN(avctx->thread_count, 16)
|
|
};
|
|
|
|
av_log(avctx, AV_LOG_INFO, "%s\n", aom_codec_version_str());
|
|
av_log(avctx, AV_LOG_VERBOSE, "%s\n", aom_codec_build_config());
|
|
|
|
if (aom_codec_dec_init(&ctx->decoder, iface, &deccfg, 0) != AOM_CODEC_OK) {
|
|
const char *error = aom_codec_error(&ctx->decoder);
|
|
av_log(avctx, AV_LOG_ERROR, "Failed to initialize decoder: %s\n",
|
|
error);
|
|
return AVERROR(EINVAL);
|
|
}
|
|
|
|
return 0;
|
|
}
|
|
|
|
static void image_copy_16_to_8(AVFrame *pic, struct aom_image *img)
|
|
{
|
|
const AVPixFmtDescriptor *desc = av_pix_fmt_desc_get(pic->format);
|
|
int i;
|
|
|
|
for (i = 0; i < desc->nb_components; i++) {
|
|
int w = img->d_w;
|
|
int h = img->d_h;
|
|
int x, y;
|
|
|
|
if (i) {
|
|
w = (w + img->x_chroma_shift) >> img->x_chroma_shift;
|
|
h = (h + img->y_chroma_shift) >> img->y_chroma_shift;
|
|
}
|
|
|
|
for (y = 0; y < h; y++) {
|
|
uint16_t *src = (uint16_t *)(img->planes[i] + y * img->stride[i]);
|
|
uint8_t *dst = pic->data[i] + y * pic->linesize[i];
|
|
for (x = 0; x < w; x++)
|
|
*dst++ = *src++;
|
|
}
|
|
}
|
|
}
|
|
|
|
// returns 0 on success, AVERROR_INVALIDDATA otherwise
|
|
static int set_pix_fmt(AVCodecContext *avctx, struct aom_image *img)
|
|
{
|
|
static const enum AVColorRange color_ranges[] = {
|
|
AVCOL_RANGE_MPEG, AVCOL_RANGE_JPEG
|
|
};
|
|
avctx->color_range = color_ranges[img->range];
|
|
avctx->color_primaries = img->cp;
|
|
avctx->colorspace = img->mc;
|
|
avctx->color_trc = img->tc;
|
|
|
|
switch (img->fmt) {
|
|
case AOM_IMG_FMT_I420:
|
|
case AOM_IMG_FMT_I42016:
|
|
if (img->bit_depth == 8) {
|
|
avctx->pix_fmt = img->monochrome ?
|
|
AV_PIX_FMT_GRAY8 : AV_PIX_FMT_YUV420P;
|
|
avctx->profile = FF_PROFILE_AV1_MAIN;
|
|
return 0;
|
|
} else if (img->bit_depth == 10) {
|
|
avctx->pix_fmt = img->monochrome ?
|
|
AV_PIX_FMT_GRAY10 : AV_PIX_FMT_YUV420P10;
|
|
avctx->profile = FF_PROFILE_AV1_MAIN;
|
|
return 0;
|
|
} else if (img->bit_depth == 12) {
|
|
avctx->pix_fmt = img->monochrome ?
|
|
AV_PIX_FMT_GRAY12 : AV_PIX_FMT_YUV420P12;
|
|
avctx->profile = FF_PROFILE_AV1_PROFESSIONAL;
|
|
return 0;
|
|
} else {
|
|
return AVERROR_INVALIDDATA;
|
|
}
|
|
case AOM_IMG_FMT_I422:
|
|
case AOM_IMG_FMT_I42216:
|
|
if (img->bit_depth == 8) {
|
|
avctx->pix_fmt = AV_PIX_FMT_YUV422P;
|
|
avctx->profile = FF_PROFILE_AV1_PROFESSIONAL;
|
|
return 0;
|
|
} else if (img->bit_depth == 10) {
|
|
avctx->pix_fmt = AV_PIX_FMT_YUV422P10;
|
|
avctx->profile = FF_PROFILE_AV1_PROFESSIONAL;
|
|
return 0;
|
|
} else if (img->bit_depth == 12) {
|
|
avctx->pix_fmt = AV_PIX_FMT_YUV422P12;
|
|
avctx->profile = FF_PROFILE_AV1_PROFESSIONAL;
|
|
return 0;
|
|
} else {
|
|
return AVERROR_INVALIDDATA;
|
|
}
|
|
case AOM_IMG_FMT_I444:
|
|
case AOM_IMG_FMT_I44416:
|
|
if (img->bit_depth == 8) {
|
|
avctx->pix_fmt = AV_PIX_FMT_YUV444P;
|
|
avctx->profile = FF_PROFILE_AV1_HIGH;
|
|
return 0;
|
|
} else if (img->bit_depth == 10) {
|
|
avctx->pix_fmt = AV_PIX_FMT_YUV444P10;
|
|
avctx->profile = FF_PROFILE_AV1_HIGH;
|
|
return 0;
|
|
} else if (img->bit_depth == 12) {
|
|
avctx->pix_fmt = AV_PIX_FMT_YUV444P12;
|
|
avctx->profile = FF_PROFILE_AV1_PROFESSIONAL;
|
|
return 0;
|
|
} else {
|
|
return AVERROR_INVALIDDATA;
|
|
}
|
|
|
|
default:
|
|
return AVERROR_INVALIDDATA;
|
|
}
|
|
}
|
|
|
|
static int aom_decode(AVCodecContext *avctx, void *data, int *got_frame,
|
|
AVPacket *avpkt)
|
|
{
|
|
AV1DecodeContext *ctx = avctx->priv_data;
|
|
AVFrame *picture = data;
|
|
const void *iter = NULL;
|
|
struct aom_image *img;
|
|
int ret;
|
|
|
|
if (aom_codec_decode(&ctx->decoder, avpkt->data, avpkt->size, NULL) !=
|
|
AOM_CODEC_OK) {
|
|
const char *error = aom_codec_error(&ctx->decoder);
|
|
const char *detail = aom_codec_error_detail(&ctx->decoder);
|
|
|
|
av_log(avctx, AV_LOG_ERROR, "Failed to decode frame: %s\n", error);
|
|
if (detail)
|
|
av_log(avctx, AV_LOG_ERROR, " Additional information: %s\n",
|
|
detail);
|
|
return AVERROR_INVALIDDATA;
|
|
}
|
|
|
|
if ((img = aom_codec_get_frame(&ctx->decoder, &iter))) {
|
|
if (img->d_w > img->w || img->d_h > img->h) {
|
|
av_log(avctx, AV_LOG_ERROR, "Display dimensions %dx%d exceed storage %dx%d\n",
|
|
img->d_w, img->d_h, img->w, img->h);
|
|
return AVERROR_EXTERNAL;
|
|
}
|
|
|
|
if ((ret = set_pix_fmt(avctx, img)) < 0) {
|
|
av_log(avctx, AV_LOG_ERROR, "Unsupported output colorspace (%d) / bit_depth (%d)\n",
|
|
img->fmt, img->bit_depth);
|
|
return ret;
|
|
}
|
|
|
|
if ((int)img->d_w != avctx->width || (int)img->d_h != avctx->height) {
|
|
av_log(avctx, AV_LOG_INFO, "dimension change! %dx%d -> %dx%d\n",
|
|
avctx->width, avctx->height, img->d_w, img->d_h);
|
|
ret = ff_set_dimensions(avctx, img->d_w, img->d_h);
|
|
if (ret < 0)
|
|
return ret;
|
|
}
|
|
if ((ret = ff_get_buffer(avctx, picture, 0)) < 0)
|
|
return ret;
|
|
if ((img->fmt & AOM_IMG_FMT_HIGHBITDEPTH) && img->bit_depth == 8)
|
|
image_copy_16_to_8(picture, img);
|
|
else
|
|
av_image_copy(picture->data, picture->linesize, (const uint8_t **)img->planes,
|
|
img->stride, avctx->pix_fmt, img->d_w, img->d_h);
|
|
*got_frame = 1;
|
|
}
|
|
return avpkt->size;
|
|
}
|
|
|
|
static av_cold int aom_free(AVCodecContext *avctx)
|
|
{
|
|
AV1DecodeContext *ctx = avctx->priv_data;
|
|
aom_codec_destroy(&ctx->decoder);
|
|
return 0;
|
|
}
|
|
|
|
static av_cold int av1_init(AVCodecContext *avctx)
|
|
{
|
|
return aom_init(avctx, &aom_codec_av1_dx_algo);
|
|
}
|
|
|
|
AVCodec ff_libaom_av1_decoder = {
|
|
.name = "libaom-av1",
|
|
.long_name = NULL_IF_CONFIG_SMALL("libaom AV1"),
|
|
.type = AVMEDIA_TYPE_VIDEO,
|
|
.id = AV_CODEC_ID_AV1,
|
|
.priv_data_size = sizeof(AV1DecodeContext),
|
|
.init = av1_init,
|
|
.close = aom_free,
|
|
.decode = aom_decode,
|
|
.capabilities = AV_CODEC_CAP_AUTO_THREADS | AV_CODEC_CAP_DR1,
|
|
.profiles = NULL_IF_CONFIG_SMALL(ff_av1_profiles),
|
|
.wrapper_name = "libaom",
|
|
.bsfs = "dump_extra",
|
|
};
|