mirror of
https://github.com/FFmpeg/FFmpeg.git
synced 2025-01-03 05:10:03 +02:00
92abc7266b
Up until now, the VAAPI encoder uses fake data with the AVBuffer-API: The data pointer does not point to real memory, but is instead just a VABufferID converted to a pointer. This has probably been copied from the VAAPI-hwcontext-API (which presumably does it to avoid allocations). This commit changes this without causing additional allocations by switching to the RefStruct-pool API. This also fixes an unchecked av_buffer_ref(). Signed-off-by: Andreas Rheinhardt <andreas.rheinhardt@outlook.com>
545 lines
18 KiB
C
545 lines
18 KiB
C
/*
|
|
* This file is part of FFmpeg.
|
|
*
|
|
* FFmpeg is free software; you can redistribute it and/or
|
|
* modify it under the terms of the GNU Lesser General Public
|
|
* License as published by the Free Software Foundation; either
|
|
* version 2.1 of the License, or (at your option) any later version.
|
|
*
|
|
* FFmpeg is distributed in the hope that it will be useful,
|
|
* but WITHOUT ANY WARRANTY; without even the implied warranty of
|
|
* MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
|
|
* Lesser General Public License for more details.
|
|
*
|
|
* You should have received a copy of the GNU Lesser General Public
|
|
* License along with FFmpeg; if not, write to the Free Software
|
|
* Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
|
|
*/
|
|
|
|
#ifndef AVCODEC_VAAPI_ENCODE_H
|
|
#define AVCODEC_VAAPI_ENCODE_H
|
|
|
|
#include <stdint.h>
|
|
|
|
#include <va/va.h>
|
|
|
|
#if VA_CHECK_VERSION(1, 0, 0)
|
|
#include <va/va_str.h>
|
|
#endif
|
|
|
|
#include "libavutil/hwcontext.h"
|
|
#include "libavutil/hwcontext_vaapi.h"
|
|
#include "libavutil/fifo.h"
|
|
|
|
#include "avcodec.h"
|
|
#include "hwconfig.h"
|
|
|
|
struct VAAPIEncodeType;
|
|
struct VAAPIEncodePicture;
|
|
|
|
enum {
|
|
MAX_CONFIG_ATTRIBUTES = 4,
|
|
MAX_GLOBAL_PARAMS = 4,
|
|
MAX_DPB_SIZE = 16,
|
|
MAX_PICTURE_REFERENCES = 2,
|
|
MAX_REORDER_DELAY = 16,
|
|
MAX_PARAM_BUFFER_SIZE = 1024,
|
|
// A.4.1: table A.6 allows at most 22 tile rows for any level.
|
|
MAX_TILE_ROWS = 22,
|
|
// A.4.1: table A.6 allows at most 20 tile columns for any level.
|
|
MAX_TILE_COLS = 20,
|
|
MAX_ASYNC_DEPTH = 64,
|
|
MAX_REFERENCE_LIST_NUM = 2,
|
|
};
|
|
|
|
extern const AVCodecHWConfigInternal *const ff_vaapi_encode_hw_configs[];
|
|
|
|
enum {
|
|
PICTURE_TYPE_IDR = 0,
|
|
PICTURE_TYPE_I = 1,
|
|
PICTURE_TYPE_P = 2,
|
|
PICTURE_TYPE_B = 3,
|
|
};
|
|
|
|
typedef struct VAAPIEncodeSlice {
|
|
int index;
|
|
int row_start;
|
|
int row_size;
|
|
int block_start;
|
|
int block_size;
|
|
void *codec_slice_params;
|
|
} VAAPIEncodeSlice;
|
|
|
|
typedef struct VAAPIEncodePicture {
|
|
struct VAAPIEncodePicture *next;
|
|
|
|
int64_t display_order;
|
|
int64_t encode_order;
|
|
int64_t pts;
|
|
int64_t duration;
|
|
int force_idr;
|
|
|
|
void *opaque;
|
|
AVBufferRef *opaque_ref;
|
|
|
|
#if VA_CHECK_VERSION(1, 0, 0)
|
|
// ROI regions.
|
|
VAEncROI *roi;
|
|
#else
|
|
void *roi;
|
|
#endif
|
|
|
|
int type;
|
|
int b_depth;
|
|
int encode_issued;
|
|
int encode_complete;
|
|
|
|
AVFrame *input_image;
|
|
VASurfaceID input_surface;
|
|
|
|
AVFrame *recon_image;
|
|
VASurfaceID recon_surface;
|
|
|
|
int nb_param_buffers;
|
|
VABufferID *param_buffers;
|
|
|
|
/* Refcounted via the refstruct-API */
|
|
VABufferID *output_buffer_ref;
|
|
VABufferID output_buffer;
|
|
|
|
void *priv_data;
|
|
void *codec_picture_params;
|
|
|
|
// Whether this picture is a reference picture.
|
|
int is_reference;
|
|
|
|
// The contents of the DPB after this picture has been decoded.
|
|
// This will contain the picture itself if it is a reference picture,
|
|
// but not if it isn't.
|
|
int nb_dpb_pics;
|
|
struct VAAPIEncodePicture *dpb[MAX_DPB_SIZE];
|
|
// The reference pictures used in decoding this picture. If they are
|
|
// used by later pictures they will also appear in the DPB. ref[0][] for
|
|
// previous reference frames. ref[1][] for future reference frames.
|
|
int nb_refs[MAX_REFERENCE_LIST_NUM];
|
|
struct VAAPIEncodePicture *refs[MAX_REFERENCE_LIST_NUM][MAX_PICTURE_REFERENCES];
|
|
// The previous reference picture in encode order. Must be in at least
|
|
// one of the reference list and DPB list.
|
|
struct VAAPIEncodePicture *prev;
|
|
// Reference count for other pictures referring to this one through
|
|
// the above pointers, directly from incomplete pictures and indirectly
|
|
// through completed pictures.
|
|
int ref_count[2];
|
|
int ref_removed[2];
|
|
|
|
int nb_slices;
|
|
VAAPIEncodeSlice *slices;
|
|
|
|
/**
|
|
* indicate if current frame is an independent frame that the coded data
|
|
* can be pushed to downstream directly. Coded of non-independent frame
|
|
* data will be concatenated into next independent frame.
|
|
*/
|
|
int non_independent_frame;
|
|
/** Tail data of current pic, used only for repeat header of AV1. */
|
|
char tail_data[MAX_PARAM_BUFFER_SIZE];
|
|
/** Byte length of tail_data. */
|
|
size_t tail_size;
|
|
} VAAPIEncodePicture;
|
|
|
|
typedef struct VAAPIEncodeProfile {
|
|
// lavc profile value (AV_PROFILE_*).
|
|
int av_profile;
|
|
// Supported bit depth.
|
|
int depth;
|
|
// Number of components.
|
|
int nb_components;
|
|
// Chroma subsampling in width dimension.
|
|
int log2_chroma_w;
|
|
// Chroma subsampling in height dimension.
|
|
int log2_chroma_h;
|
|
// VAAPI profile value.
|
|
VAProfile va_profile;
|
|
} VAAPIEncodeProfile;
|
|
|
|
enum {
|
|
RC_MODE_AUTO,
|
|
RC_MODE_CQP,
|
|
RC_MODE_CBR,
|
|
RC_MODE_VBR,
|
|
RC_MODE_ICQ,
|
|
RC_MODE_QVBR,
|
|
RC_MODE_AVBR,
|
|
RC_MODE_MAX = RC_MODE_AVBR,
|
|
};
|
|
|
|
typedef struct VAAPIEncodeRCMode {
|
|
// Mode from above enum (RC_MODE_*).
|
|
int mode;
|
|
// Name.
|
|
const char *name;
|
|
// Supported in the compile-time VAAPI version.
|
|
int supported;
|
|
// VA mode value (VA_RC_*).
|
|
uint32_t va_mode;
|
|
// Uses bitrate parameters.
|
|
int bitrate;
|
|
// Supports maxrate distinct from bitrate.
|
|
int maxrate;
|
|
// Uses quality value.
|
|
int quality;
|
|
// Supports HRD/VBV parameters.
|
|
int hrd;
|
|
} VAAPIEncodeRCMode;
|
|
|
|
typedef struct VAAPIEncodeContext {
|
|
const AVClass *class;
|
|
|
|
// Codec-specific hooks.
|
|
const struct VAAPIEncodeType *codec;
|
|
|
|
// Global options.
|
|
|
|
// Use low power encoding mode.
|
|
int low_power;
|
|
|
|
// Number of I frames between IDR frames.
|
|
int idr_interval;
|
|
|
|
// Desired B frame reference depth.
|
|
int desired_b_depth;
|
|
|
|
// Max Frame Size
|
|
int max_frame_size;
|
|
|
|
// Explicitly set RC mode (otherwise attempt to pick from
|
|
// available modes).
|
|
int explicit_rc_mode;
|
|
|
|
// Explicitly-set QP, for use with the "qp" options.
|
|
// (Forces CQP mode when set, overriding everything else.)
|
|
int explicit_qp;
|
|
|
|
// Desired packed headers.
|
|
unsigned int desired_packed_headers;
|
|
|
|
// The required size of surfaces. This is probably the input
|
|
// size (AVCodecContext.width|height) aligned up to whatever
|
|
// block size is required by the codec.
|
|
int surface_width;
|
|
int surface_height;
|
|
|
|
// The block size for slice calculations.
|
|
int slice_block_width;
|
|
int slice_block_height;
|
|
|
|
// Everything above this point must be set before calling
|
|
// ff_vaapi_encode_init().
|
|
|
|
// Chosen encoding profile details.
|
|
const VAAPIEncodeProfile *profile;
|
|
|
|
// Chosen rate control mode details.
|
|
const VAAPIEncodeRCMode *rc_mode;
|
|
// RC quality level - meaning depends on codec and RC mode.
|
|
// In CQP mode this sets the fixed quantiser value.
|
|
int rc_quality;
|
|
|
|
// Encoding profile (VAProfile*).
|
|
VAProfile va_profile;
|
|
// Encoding entrypoint (VAEntryoint*).
|
|
VAEntrypoint va_entrypoint;
|
|
// Rate control mode.
|
|
unsigned int va_rc_mode;
|
|
// Bitrate for codec-specific encoder parameters.
|
|
unsigned int va_bit_rate;
|
|
// Packed headers which will actually be sent.
|
|
unsigned int va_packed_headers;
|
|
|
|
// Configuration attributes to use when creating va_config.
|
|
VAConfigAttrib config_attributes[MAX_CONFIG_ATTRIBUTES];
|
|
int nb_config_attributes;
|
|
|
|
VAConfigID va_config;
|
|
VAContextID va_context;
|
|
|
|
AVBufferRef *device_ref;
|
|
AVHWDeviceContext *device;
|
|
AVVAAPIDeviceContext *hwctx;
|
|
|
|
// The hardware frame context containing the input frames.
|
|
AVBufferRef *input_frames_ref;
|
|
AVHWFramesContext *input_frames;
|
|
|
|
// The hardware frame context containing the reconstructed frames.
|
|
AVBufferRef *recon_frames_ref;
|
|
AVHWFramesContext *recon_frames;
|
|
|
|
// Pool of (reusable) bitstream output buffers.
|
|
struct FFRefStructPool *output_buffer_pool;
|
|
|
|
// Global parameters which will be applied at the start of the
|
|
// sequence (includes rate control parameters below).
|
|
int global_params_type[MAX_GLOBAL_PARAMS];
|
|
const void *global_params [MAX_GLOBAL_PARAMS];
|
|
size_t global_params_size[MAX_GLOBAL_PARAMS];
|
|
int nb_global_params;
|
|
|
|
// Rate control parameters.
|
|
VAEncMiscParameterRateControl rc_params;
|
|
VAEncMiscParameterHRD hrd_params;
|
|
VAEncMiscParameterFrameRate fr_params;
|
|
VAEncMiscParameterBufferMaxFrameSize mfs_params;
|
|
#if VA_CHECK_VERSION(0, 36, 0)
|
|
VAEncMiscParameterBufferQualityLevel quality_params;
|
|
#endif
|
|
|
|
// Per-sequence parameter structure (VAEncSequenceParameterBuffer*).
|
|
void *codec_sequence_params;
|
|
|
|
// Per-sequence parameters found in the per-picture parameter
|
|
// structure (VAEncPictureParameterBuffer*).
|
|
void *codec_picture_params;
|
|
|
|
// Current encoding window, in display (input) order.
|
|
VAAPIEncodePicture *pic_start, *pic_end;
|
|
// The next picture to use as the previous reference picture in
|
|
// encoding order. Order from small to large in encoding order.
|
|
VAAPIEncodePicture *next_prev[MAX_PICTURE_REFERENCES];
|
|
int nb_next_prev;
|
|
|
|
// Next input order index (display order).
|
|
int64_t input_order;
|
|
// Number of frames that output is behind input.
|
|
int64_t output_delay;
|
|
// Next encode order index.
|
|
int64_t encode_order;
|
|
// Number of frames decode output will need to be delayed.
|
|
int64_t decode_delay;
|
|
// Next output order index (in encode order).
|
|
int64_t output_order;
|
|
|
|
// Timestamp handling.
|
|
int64_t first_pts;
|
|
int64_t dts_pts_diff;
|
|
int64_t ts_ring[MAX_REORDER_DELAY * 3 +
|
|
MAX_ASYNC_DEPTH];
|
|
|
|
// Slice structure.
|
|
int slice_block_rows;
|
|
int slice_block_cols;
|
|
int nb_slices;
|
|
int slice_size;
|
|
|
|
// Tile encoding.
|
|
int tile_cols;
|
|
int tile_rows;
|
|
// Tile width of the i-th column.
|
|
int col_width[MAX_TILE_COLS];
|
|
// Tile height of i-th row.
|
|
int row_height[MAX_TILE_ROWS];
|
|
// Location of the i-th tile column boundary.
|
|
int col_bd[MAX_TILE_COLS + 1];
|
|
// Location of the i-th tile row boundary.
|
|
int row_bd[MAX_TILE_ROWS + 1];
|
|
|
|
// Frame type decision.
|
|
int gop_size;
|
|
int closed_gop;
|
|
int gop_per_idr;
|
|
int p_per_i;
|
|
int max_b_depth;
|
|
int b_per_p;
|
|
int force_idr;
|
|
int idr_counter;
|
|
int gop_counter;
|
|
int end_of_stream;
|
|
int p_to_gpb;
|
|
|
|
// Whether the driver supports ROI at all.
|
|
int roi_allowed;
|
|
// Maximum number of regions supported by the driver.
|
|
int roi_max_regions;
|
|
// Quantisation range for offset calculations. Set by codec-specific
|
|
// code, as it may change based on parameters.
|
|
int roi_quant_range;
|
|
|
|
// The encoder does not support cropping information, so warn about
|
|
// it the first time we encounter any nonzero crop fields.
|
|
int crop_warned;
|
|
// If the driver does not support ROI then warn the first time we
|
|
// encounter a frame with ROI side data.
|
|
int roi_warned;
|
|
|
|
AVFrame *frame;
|
|
|
|
// Whether the driver support vaSyncBuffer
|
|
int has_sync_buffer_func;
|
|
// Store buffered pic
|
|
AVFifo *encode_fifo;
|
|
// Max number of frame buffered in encoder.
|
|
int async_depth;
|
|
|
|
/** Head data for current output pkt, used only for AV1. */
|
|
//void *header_data;
|
|
//size_t header_data_size;
|
|
|
|
/**
|
|
* Buffered coded data of a pic if it is an non-independent frame.
|
|
* This is a RefStruct reference.
|
|
*/
|
|
VABufferID *coded_buffer_ref;
|
|
|
|
/** Tail data of a pic, now only used for av1 repeat frame header. */
|
|
AVPacket *tail_pkt;
|
|
} VAAPIEncodeContext;
|
|
|
|
enum {
|
|
// Codec supports controlling the subdivision of pictures into slices.
|
|
FLAG_SLICE_CONTROL = 1 << 0,
|
|
// Codec only supports constant quality (no rate control).
|
|
FLAG_CONSTANT_QUALITY_ONLY = 1 << 1,
|
|
// Codec is intra-only.
|
|
FLAG_INTRA_ONLY = 1 << 2,
|
|
// Codec supports B-pictures.
|
|
FLAG_B_PICTURES = 1 << 3,
|
|
// Codec supports referencing B-pictures.
|
|
FLAG_B_PICTURE_REFERENCES = 1 << 4,
|
|
// Codec supports non-IDR key pictures (that is, key pictures do
|
|
// not necessarily empty the DPB).
|
|
FLAG_NON_IDR_KEY_PICTURES = 1 << 5,
|
|
// Codec output packet without timestamp delay, which means the
|
|
// output packet has same PTS and DTS.
|
|
FLAG_TIMESTAMP_NO_DELAY = 1 << 6,
|
|
};
|
|
|
|
typedef struct VAAPIEncodeType {
|
|
// List of supported profiles and corresponding VAAPI profiles.
|
|
// (Must end with AV_PROFILE_UNKNOWN.)
|
|
const VAAPIEncodeProfile *profiles;
|
|
|
|
// Codec feature flags.
|
|
int flags;
|
|
|
|
// Default quality for this codec - used as quantiser or RC quality
|
|
// factor depending on RC mode.
|
|
int default_quality;
|
|
|
|
// Determine encode parameters like block sizes for surface alignment
|
|
// and slices. This may need to query the profile and entrypoint,
|
|
// which will be available when this function is called. If not set,
|
|
// assume that all blocks are 16x16 and that surfaces should be
|
|
// aligned to match this.
|
|
int (*get_encoder_caps)(AVCodecContext *avctx);
|
|
|
|
// Perform any extra codec-specific configuration after the
|
|
// codec context is initialised (set up the private data and
|
|
// add any necessary global parameters).
|
|
int (*configure)(AVCodecContext *avctx);
|
|
|
|
// The size of any private data structure associated with each
|
|
// picture (can be zero if not required).
|
|
size_t picture_priv_data_size;
|
|
|
|
// The size of the parameter structures:
|
|
// sizeof(VAEnc{type}ParameterBuffer{codec}).
|
|
size_t sequence_params_size;
|
|
size_t picture_params_size;
|
|
size_t slice_params_size;
|
|
|
|
// Fill the parameter structures.
|
|
int (*init_sequence_params)(AVCodecContext *avctx);
|
|
int (*init_picture_params)(AVCodecContext *avctx,
|
|
VAAPIEncodePicture *pic);
|
|
int (*init_slice_params)(AVCodecContext *avctx,
|
|
VAAPIEncodePicture *pic,
|
|
VAAPIEncodeSlice *slice);
|
|
|
|
// The type used by the packed header: this should look like
|
|
// VAEncPackedHeader{something}.
|
|
int sequence_header_type;
|
|
int picture_header_type;
|
|
int slice_header_type;
|
|
|
|
// Write the packed header data to the provided buffer.
|
|
// The sequence header is also used to fill the codec extradata
|
|
// when the encoder is starting.
|
|
int (*write_sequence_header)(AVCodecContext *avctx,
|
|
char *data, size_t *data_len);
|
|
int (*write_picture_header)(AVCodecContext *avctx,
|
|
VAAPIEncodePicture *pic,
|
|
char *data, size_t *data_len);
|
|
int (*write_slice_header)(AVCodecContext *avctx,
|
|
VAAPIEncodePicture *pic,
|
|
VAAPIEncodeSlice *slice,
|
|
char *data, size_t *data_len);
|
|
|
|
// Fill an extra parameter structure, which will then be
|
|
// passed to vaRenderPicture(). Will be called repeatedly
|
|
// with increasing index argument until AVERROR_EOF is
|
|
// returned.
|
|
int (*write_extra_buffer)(AVCodecContext *avctx,
|
|
VAAPIEncodePicture *pic,
|
|
int index, int *type,
|
|
char *data, size_t *data_len);
|
|
|
|
// Write an extra packed header. Will be called repeatedly
|
|
// with increasing index argument until AVERROR_EOF is
|
|
// returned.
|
|
int (*write_extra_header)(AVCodecContext *avctx,
|
|
VAAPIEncodePicture *pic,
|
|
int index, int *type,
|
|
char *data, size_t *data_len);
|
|
} VAAPIEncodeType;
|
|
|
|
|
|
int ff_vaapi_encode_receive_packet(AVCodecContext *avctx, AVPacket *pkt);
|
|
|
|
int ff_vaapi_encode_init(AVCodecContext *avctx);
|
|
int ff_vaapi_encode_close(AVCodecContext *avctx);
|
|
|
|
|
|
#define VAAPI_ENCODE_COMMON_OPTIONS \
|
|
{ "low_power", \
|
|
"Use low-power encoding mode (only available on some platforms; " \
|
|
"may not support all encoding features)", \
|
|
OFFSET(common.low_power), AV_OPT_TYPE_BOOL, \
|
|
{ .i64 = 0 }, 0, 1, FLAGS }, \
|
|
{ "idr_interval", \
|
|
"Distance (in I-frames) between IDR frames", \
|
|
OFFSET(common.idr_interval), AV_OPT_TYPE_INT, \
|
|
{ .i64 = 0 }, 0, INT_MAX, FLAGS }, \
|
|
{ "b_depth", \
|
|
"Maximum B-frame reference depth", \
|
|
OFFSET(common.desired_b_depth), AV_OPT_TYPE_INT, \
|
|
{ .i64 = 1 }, 1, INT_MAX, FLAGS }, \
|
|
{ "async_depth", "Maximum processing parallelism. " \
|
|
"Increase this to improve single channel performance. This option " \
|
|
"doesn't work if driver doesn't implement vaSyncBuffer function.", \
|
|
OFFSET(common.async_depth), AV_OPT_TYPE_INT, \
|
|
{ .i64 = 2 }, 1, MAX_ASYNC_DEPTH, FLAGS }, \
|
|
{ "max_frame_size", \
|
|
"Maximum frame size (in bytes)",\
|
|
OFFSET(common.max_frame_size), AV_OPT_TYPE_INT, \
|
|
{ .i64 = 0 }, 0, INT_MAX, FLAGS }
|
|
|
|
#define VAAPI_ENCODE_RC_MODE(name, desc) \
|
|
{ #name, desc, 0, AV_OPT_TYPE_CONST, { .i64 = RC_MODE_ ## name }, \
|
|
0, 0, FLAGS, "rc_mode" }
|
|
#define VAAPI_ENCODE_RC_OPTIONS \
|
|
{ "rc_mode",\
|
|
"Set rate control mode", \
|
|
OFFSET(common.explicit_rc_mode), AV_OPT_TYPE_INT, \
|
|
{ .i64 = RC_MODE_AUTO }, RC_MODE_AUTO, RC_MODE_MAX, FLAGS, "rc_mode" }, \
|
|
{ "auto", "Choose mode automatically based on other parameters", \
|
|
0, AV_OPT_TYPE_CONST, { .i64 = RC_MODE_AUTO }, 0, 0, FLAGS, "rc_mode" }, \
|
|
VAAPI_ENCODE_RC_MODE(CQP, "Constant-quality"), \
|
|
VAAPI_ENCODE_RC_MODE(CBR, "Constant-bitrate"), \
|
|
VAAPI_ENCODE_RC_MODE(VBR, "Variable-bitrate"), \
|
|
VAAPI_ENCODE_RC_MODE(ICQ, "Intelligent constant-quality"), \
|
|
VAAPI_ENCODE_RC_MODE(QVBR, "Quality-defined variable-bitrate"), \
|
|
VAAPI_ENCODE_RC_MODE(AVBR, "Average variable-bitrate")
|
|
|
|
|
|
#endif /* AVCODEC_VAAPI_ENCODE_H */
|