2012-06-28 16:46:24 +03:00
/*
* AAC encoder wrapper
* Copyright ( c ) 2012 Martin Storsjo
*
2012-07-13 00:53:48 +03:00
* This file is part of FFmpeg .
2012-06-28 16:46:24 +03:00
*
2014-06-06 10:48:27 +03:00
* Permission to use , copy , modify , and / or distribute this software for any
* purpose with or without fee is hereby granted , provided that the above
* copyright notice and this permission notice appear in all copies .
2012-06-28 16:46:24 +03:00
*
2014-06-06 10:48:27 +03:00
* THE SOFTWARE IS PROVIDED " AS IS " AND THE AUTHOR DISCLAIMS ALL WARRANTIES
* WITH REGARD TO THIS SOFTWARE INCLUDING ALL IMPLIED WARRANTIES OF
* MERCHANTABILITY AND FITNESS . IN NO EVENT SHALL THE AUTHOR BE LIABLE FOR
* ANY SPECIAL , DIRECT , INDIRECT , OR CONSEQUENTIAL DAMAGES OR ANY DAMAGES
* WHATSOEVER RESULTING FROM LOSS OF USE , DATA OR PROFITS , WHETHER IN AN
* ACTION OF CONTRACT , NEGLIGENCE OR OTHER TORTIOUS ACTION , ARISING OUT OF
* OR IN CONNECTION WITH THE USE OR PERFORMANCE OF THIS SOFTWARE .
2012-06-28 16:46:24 +03:00
*/
# include <fdk-aac/aacenc_lib.h>
2012-11-10 18:00:00 +03:00
# include "libavutil/channel_layout.h"
# include "libavutil/common.h"
2023-03-01 01:08:10 +02:00
# include "libavutil/intreadwrite.h"
2012-11-10 18:00:00 +03:00
# include "libavutil/opt.h"
2012-06-28 16:46:24 +03:00
# include "avcodec.h"
# include "audio_frame_queue.h"
2022-03-16 19:18:28 +02:00
# include "codec_internal.h"
2021-05-11 15:17:13 +02:00
# include "encode.h"
2020-05-10 20:38:11 +02:00
# include "profiles.h"
2012-06-28 16:46:24 +03:00
2018-09-12 22:03:12 +02:00
# ifdef AACENCODER_LIB_VL0
2018-08-31 13:25:30 +02:00
# define FDKENC_VER_AT_LEAST(vl0, vl1) \
2018-09-12 22:03:12 +02:00
( ( AACENCODER_LIB_VL0 > vl0 ) | | \
( AACENCODER_LIB_VL0 = = vl0 & & AACENCODER_LIB_VL1 > = vl1 ) )
# else
# define FDKENC_VER_AT_LEAST(vl0, vl1) 0
# endif
2018-08-31 13:25:30 +02:00
2012-06-28 16:46:24 +03:00
typedef struct AACContext {
const AVClass * class ;
HANDLE_AACENCODER handle ;
int afterburner ;
int eld_sbr ;
2018-09-04 10:45:35 +02:00
int eld_v2 ;
2012-06-28 16:46:24 +03:00
int signaling ;
2012-07-23 19:20:04 +03:00
int latm ;
int header_period ;
2012-09-25 08:37:21 +03:00
int vbr ;
2023-02-28 23:25:13 +02:00
int drc_profile ;
int drc_target_ref ;
int comp_profile ;
int comp_target_ref ;
int prog_ref ;
int metadata_mode ;
AACENC_MetaData metaDataSetup ;
2023-03-01 01:08:10 +02:00
int delay_sent ;
2023-03-30 14:27:41 +02:00
int frame_length ;
2012-06-28 16:46:24 +03:00
AudioFrameQueue afq ;
} AACContext ;
static const AVOption aac_enc_options [ ] = {
2012-08-31 13:22:31 +03:00
{ " afterburner " , " Afterburner (improved quality) " , offsetof ( AACContext , afterburner ) , AV_OPT_TYPE_INT , { . i64 = 1 } , 0 , 1 , AV_OPT_FLAG_AUDIO_PARAM | AV_OPT_FLAG_ENCODING_PARAM } ,
{ " eld_sbr " , " Enable SBR for ELD (for SBR in other configurations, use the -profile parameter) " , offsetof ( AACContext , eld_sbr ) , AV_OPT_TYPE_INT , { . i64 = 0 } , 0 , 1 , AV_OPT_FLAG_AUDIO_PARAM | AV_OPT_FLAG_ENCODING_PARAM } ,
2018-09-04 10:45:35 +02:00
# if FDKENC_VER_AT_LEAST(4, 0) // 4.0.0
{ " eld_v2 " , " Enable ELDv2 (LD-MPS extension for ELD stereo signals) " , offsetof ( AACContext , eld_v2 ) , AV_OPT_TYPE_INT , { . i64 = 0 } , 0 , 1 , AV_OPT_FLAG_AUDIO_PARAM | AV_OPT_FLAG_ENCODING_PARAM } ,
# endif
2012-08-31 13:22:31 +03:00
{ " signaling " , " SBR/PS signaling style " , offsetof ( AACContext , signaling ) , AV_OPT_TYPE_INT , { . i64 = - 1 } , - 1 , 2 , AV_OPT_FLAG_AUDIO_PARAM | AV_OPT_FLAG_ENCODING_PARAM , " signaling " } ,
2012-08-31 12:45:52 +03:00
{ " default " , " Choose signaling implicitly (explicit hierarchical by default, implicit if global header is disabled) " , 0 , AV_OPT_TYPE_CONST , { . i64 = - 1 } , 0 , 0 , AV_OPT_FLAG_AUDIO_PARAM | AV_OPT_FLAG_ENCODING_PARAM , " signaling " } ,
{ " implicit " , " Implicit backwards compatible signaling " , 0 , AV_OPT_TYPE_CONST , { . i64 = 0 } , 0 , 0 , AV_OPT_FLAG_AUDIO_PARAM | AV_OPT_FLAG_ENCODING_PARAM , " signaling " } ,
{ " explicit_sbr " , " Explicit SBR, implicit PS signaling " , 0 , AV_OPT_TYPE_CONST , { . i64 = 1 } , 0 , 0 , AV_OPT_FLAG_AUDIO_PARAM | AV_OPT_FLAG_ENCODING_PARAM , " signaling " } ,
{ " explicit_hierarchical " , " Explicit hierarchical signaling " , 0 , AV_OPT_TYPE_CONST , { . i64 = 2 } , 0 , 0 , AV_OPT_FLAG_AUDIO_PARAM | AV_OPT_FLAG_ENCODING_PARAM , " signaling " } ,
2012-08-31 13:22:31 +03:00
{ " latm " , " Output LATM/LOAS encapsulated data " , offsetof ( AACContext , latm ) , AV_OPT_TYPE_INT , { . i64 = 0 } , 0 , 1 , AV_OPT_FLAG_AUDIO_PARAM | AV_OPT_FLAG_ENCODING_PARAM } ,
{ " header_period " , " StreamMuxConfig and PCE repetition period (in frames) " , offsetof ( AACContext , header_period ) , AV_OPT_TYPE_INT , { . i64 = 0 } , 0 , 0xffff , AV_OPT_FLAG_AUDIO_PARAM | AV_OPT_FLAG_ENCODING_PARAM } ,
2012-09-25 08:37:21 +03:00
{ " vbr " , " VBR mode (1-5) " , offsetof ( AACContext , vbr ) , AV_OPT_TYPE_INT , { . i64 = 0 } , 0 , 5 , AV_OPT_FLAG_AUDIO_PARAM | AV_OPT_FLAG_ENCODING_PARAM } ,
2023-02-28 23:25:13 +02:00
{ " drc_profile " , " The desired compression profile for AAC DRC " , offsetof ( AACContext , drc_profile ) , AV_OPT_TYPE_INT , { . i64 = 0 } , 0 , 256 , AV_OPT_FLAG_AUDIO_PARAM | AV_OPT_FLAG_ENCODING_PARAM } ,
{ " drc_target_ref " , " Expected target reference level at decoder side in dB (for clipping prevention/limiter) " , offsetof ( AACContext , drc_target_ref ) , AV_OPT_TYPE_INT , { . i64 = 0.0 } , - 31.75 , 0 , AV_OPT_FLAG_AUDIO_PARAM | AV_OPT_FLAG_ENCODING_PARAM } ,
{ " comp_profile " , " The desired compression profile for AAC DRC " , offsetof ( AACContext , comp_profile ) , AV_OPT_TYPE_INT , { . i64 = 0 } , 0 , 256 , AV_OPT_FLAG_AUDIO_PARAM | AV_OPT_FLAG_ENCODING_PARAM } ,
{ " comp_target_ref " , " Expected target reference level at decoder side in dB (for clipping prevention/limiter) " , offsetof ( AACContext , comp_target_ref ) , AV_OPT_TYPE_INT , { . i64 = 0.0 } , - 31.75 , 0 , AV_OPT_FLAG_AUDIO_PARAM | AV_OPT_FLAG_ENCODING_PARAM } ,
{ " prog_ref " , " The program reference level or dialog level in dB " , offsetof ( AACContext , prog_ref ) , AV_OPT_TYPE_INT , { . i64 = 0.0 } , - 31.75 , 0 , AV_OPT_FLAG_AUDIO_PARAM | AV_OPT_FLAG_ENCODING_PARAM } ,
2023-03-30 14:27:41 +02:00
{ " frame_length " , " The desired frame length " , offsetof ( AACContext , frame_length ) , AV_OPT_TYPE_INT , { . i64 = - 1 } , - 1 , 1024 , AV_OPT_FLAG_AUDIO_PARAM | AV_OPT_FLAG_ENCODING_PARAM } ,
2020-05-10 20:38:11 +02:00
FF_AAC_PROFILE_OPTS
2012-06-28 16:46:24 +03:00
{ NULL }
} ;
static const AVClass aac_enc_class = {
2017-06-10 16:45:06 +02:00
. class_name = " libfdk_aac " ,
. item_name = av_default_item_name ,
. option = aac_enc_options ,
. version = LIBAVUTIL_VERSION_INT ,
2012-06-28 16:46:24 +03:00
} ;
static const char * aac_get_error ( AACENC_ERROR err )
{
switch ( err ) {
case AACENC_OK :
return " No error " ;
case AACENC_INVALID_HANDLE :
return " Invalid handle " ;
case AACENC_MEMORY_ERROR :
return " Memory allocation error " ;
case AACENC_UNSUPPORTED_PARAMETER :
return " Unsupported parameter " ;
case AACENC_INVALID_CONFIG :
return " Invalid config " ;
case AACENC_INIT_ERROR :
return " Initialization error " ;
case AACENC_INIT_AAC_ERROR :
return " AAC library initialization error " ;
case AACENC_INIT_SBR_ERROR :
return " SBR library initialization error " ;
case AACENC_INIT_TP_ERROR :
return " Transport library initialization error " ;
case AACENC_INIT_META_ERROR :
return " Metadata library initialization error " ;
case AACENC_ENCODE_ERROR :
return " Encoding error " ;
case AACENC_ENCODE_EOF :
return " End of file " ;
default :
return " Unknown error " ;
}
}
static int aac_encode_close ( AVCodecContext * avctx )
{
AACContext * s = avctx - > priv_data ;
if ( s - > handle )
aacEncClose ( & s - > handle ) ;
ff_af_queue_close ( & s - > afq ) ;
return 0 ;
}
2023-03-27 16:19:16 +02:00
static void aac_encode_flush ( AVCodecContext * avctx )
{
AACContext * s = avctx - > priv_data ;
AACENC_BufDesc in_buf = { 0 } , out_buf = { 0 } ;
AACENC_InArgs in_args = { 0 } ;
AACENC_OutArgs out_args ;
int64_t pts , duration ;
uint8_t dummy_in [ 1 ] , dummy_out [ 1 ] ;
int in_buffer_identifiers [ ] = { IN_AUDIO_DATA , IN_METADATA_SETUP } ;
int in_buffer_element_sizes [ ] = { 2 , sizeof ( AACENC_MetaData ) } ;
int in_buffer_sizes [ ] = { 0 , sizeof ( s - > metaDataSetup ) } ;
int out_buffer_identifier = OUT_BITSTREAM_DATA ;
int out_buffer_size = sizeof ( dummy_out ) , out_buffer_element_size = 1 ;
void * inBuffer [ ] = { dummy_in , & s - > metaDataSetup } ;
void * out_ptr = dummy_out ;
AACENC_ERROR err ;
ff_af_queue_remove ( & s - > afq , s - > afq . frame_count , & pts , & duration ) ;
in_buf . bufs = ( void * * ) inBuffer ;
in_buf . numBufs = s - > metadata_mode = = 0 ? 1 : 2 ;
in_buf . bufferIdentifiers = in_buffer_identifiers ;
in_buf . bufSizes = in_buffer_sizes ;
in_buf . bufElSizes = in_buffer_element_sizes ;
out_buf . numBufs = 1 ;
out_buf . bufs = & out_ptr ;
out_buf . bufferIdentifiers = & out_buffer_identifier ;
out_buf . bufSizes = & out_buffer_size ;
out_buf . bufElSizes = & out_buffer_element_size ;
err = aacEncEncode ( s - > handle , & in_buf , & out_buf , & in_args , & out_args ) ;
if ( err ! = AACENC_OK ) {
av_log ( avctx , AV_LOG_ERROR , " Unexpected error while flushing: %s \n " ,
aac_get_error ( err ) ) ;
}
}
2012-06-28 16:46:24 +03:00
static av_cold int aac_encode_init ( AVCodecContext * avctx )
{
AACContext * s = avctx - > priv_data ;
int ret = AVERROR ( EINVAL ) ;
AACENC_InfoStruct info = { 0 } ;
CHANNEL_MODE mode ;
AACENC_ERROR err ;
int aot = FF_PROFILE_AAC_LOW + 1 ;
int sce = 0 , cpe = 0 ;
2017-04-04 16:55:10 +02:00
if ( ( err = aacEncOpen ( & s - > handle , 0 , avctx - > ch_layout . nb_channels ) ) ! = AACENC_OK ) {
2012-06-28 16:46:24 +03:00
av_log ( avctx , AV_LOG_ERROR , " Unable to open the encoder: %s \n " ,
aac_get_error ( err ) ) ;
goto error ;
}
if ( avctx - > profile ! = FF_PROFILE_UNKNOWN )
aot = avctx - > profile + 1 ;
if ( ( err = aacEncoder_SetParam ( s - > handle , AACENC_AOT , aot ) ) ! = AACENC_OK ) {
av_log ( avctx , AV_LOG_ERROR , " Unable to set the AOT %d: %s \n " ,
aot , aac_get_error ( err ) ) ;
goto error ;
}
if ( aot = = FF_PROFILE_AAC_ELD + 1 & & s - > eld_sbr ) {
if ( ( err = aacEncoder_SetParam ( s - > handle , AACENC_SBR_MODE ,
1 ) ) ! = AACENC_OK ) {
av_log ( avctx , AV_LOG_ERROR , " Unable to enable SBR for ELD: %s \n " ,
aac_get_error ( err ) ) ;
goto error ;
}
}
2023-03-30 14:27:41 +02:00
if ( s - > frame_length > = 0 ) {
if ( ( err = aacEncoder_SetParam ( s - > handle , AACENC_GRANULE_LENGTH ,
s - > frame_length ) ) ! = AACENC_OK ) {
av_log ( avctx , AV_LOG_ERROR , " Unable to set granule length: %s \n " ,
aac_get_error ( err ) ) ;
goto error ;
}
}
2012-06-28 16:46:24 +03:00
if ( ( err = aacEncoder_SetParam ( s - > handle , AACENC_SAMPLERATE ,
avctx - > sample_rate ) ) ! = AACENC_OK ) {
av_log ( avctx , AV_LOG_ERROR , " Unable to set the sample rate %d: %s \n " ,
avctx - > sample_rate , aac_get_error ( err ) ) ;
goto error ;
}
2017-04-04 16:55:10 +02:00
switch ( avctx - > ch_layout . nb_channels ) {
2012-06-28 16:46:24 +03:00
case 1 : mode = MODE_1 ; sce = 1 ; cpe = 0 ; break ;
2018-09-04 10:45:35 +02:00
case 2 :
# if FDKENC_VER_AT_LEAST(4, 0) // 4.0.0
// (profile + 1) to map from profile range to AOT range
if ( aot = = FF_PROFILE_AAC_ELD + 1 & & s - > eld_v2 ) {
if ( ( err = aacEncoder_SetParam ( s - > handle , AACENC_CHANNELMODE ,
128 ) ) ! = AACENC_OK ) {
av_log ( avctx , AV_LOG_ERROR , " Unable to enable ELDv2: %s \n " ,
aac_get_error ( err ) ) ;
goto error ;
} else {
mode = MODE_212 ;
sce = 1 ;
cpe = 0 ;
}
} else
# endif
{
mode = MODE_2 ;
sce = 0 ;
cpe = 1 ;
}
break ;
2012-06-28 16:46:24 +03:00
case 3 : mode = MODE_1_2 ; sce = 1 ; cpe = 1 ; break ;
case 4 : mode = MODE_1_2_1 ; sce = 2 ; cpe = 1 ; break ;
case 5 : mode = MODE_1_2_2 ; sce = 1 ; cpe = 2 ; break ;
case 6 : mode = MODE_1_2_2_1 ; sce = 2 ; cpe = 2 ; break ;
2022-11-29 19:55:33 +02:00
# if FDKENC_VER_AT_LEAST(4, 0) // 4.0.0
case 7 : mode = MODE_6_1 ; sce = 3 ; cpe = 2 ; break ;
# endif
2014-02-06 03:08:00 +03:00
/* The version macro is introduced the same time as the 7.1 support, so this
should suffice . */
2018-09-04 10:29:37 +02:00
# if FDKENC_VER_AT_LEAST(3, 4) // 3.4.12
2014-01-26 03:31:53 +03:00
case 8 :
sce = 2 ;
cpe = 3 ;
2017-04-04 16:55:10 +02:00
if ( ! av_channel_layout_compare ( & avctx - > ch_layout , & ( AVChannelLayout ) AV_CHANNEL_LAYOUT_7POINT1 ) ) {
2014-01-26 03:31:53 +03:00
mode = MODE_7_1_REAR_SURROUND ;
2022-11-29 19:55:33 +02:00
# if FDKENC_VER_AT_LEAST(4, 0) // 4.0.0
2022-11-28 00:08:49 +02:00
} else if ( ! av_channel_layout_compare ( & avctx - > ch_layout , & ( AVChannelLayout ) AV_CHANNEL_LAYOUT_7POINT1_TOP_BACK ) ) {
mode = MODE_7_1_TOP_FRONT ;
2022-11-29 19:55:33 +02:00
# endif
2014-01-26 03:31:53 +03:00
} else {
// MODE_1_2_2_2_1 and MODE_7_1_FRONT_CENTER use the same channel layout
mode = MODE_7_1_FRONT_CENTER ;
}
break ;
2014-02-06 03:08:00 +03:00
# endif
2012-06-28 16:46:24 +03:00
default :
av_log ( avctx , AV_LOG_ERROR ,
2017-04-04 16:55:10 +02:00
" Unsupported number of channels %d \n " , avctx - > ch_layout . nb_channels ) ;
2012-06-28 16:46:24 +03:00
goto error ;
}
if ( ( err = aacEncoder_SetParam ( s - > handle , AACENC_CHANNELMODE ,
mode ) ) ! = AACENC_OK ) {
av_log ( avctx , AV_LOG_ERROR ,
" Unable to set channel mode %d: %s \n " , mode , aac_get_error ( err ) ) ;
goto error ;
}
if ( ( err = aacEncoder_SetParam ( s - > handle , AACENC_CHANNELORDER ,
1 ) ) ! = AACENC_OK ) {
av_log ( avctx , AV_LOG_ERROR ,
" Unable to set wav channel order %d: %s \n " ,
mode , aac_get_error ( err ) ) ;
goto error ;
}
2015-06-29 21:59:37 +02:00
if ( avctx - > flags & AV_CODEC_FLAG_QSCALE | | s - > vbr ) {
2012-09-25 08:37:21 +03:00
int mode = s - > vbr ? s - > vbr : avctx - > global_quality ;
2012-06-28 16:46:24 +03:00
if ( mode < 1 | | mode > 5 ) {
av_log ( avctx , AV_LOG_WARNING ,
" VBR quality %d out of range, should be 1-5 \n " , mode ) ;
mode = av_clip ( mode , 1 , 5 ) ;
}
2012-09-25 08:31:44 +03:00
av_log ( avctx , AV_LOG_WARNING ,
" Note, the VBR setting is unsupported and only works with "
" some parameter combinations \n " ) ;
2012-06-28 16:46:24 +03:00
if ( ( err = aacEncoder_SetParam ( s - > handle , AACENC_BITRATEMODE ,
mode ) ) ! = AACENC_OK ) {
av_log ( avctx , AV_LOG_ERROR , " Unable to set the VBR bitrate mode %d: %s \n " ,
mode , aac_get_error ( err ) ) ;
goto error ;
}
} else {
if ( avctx - > bit_rate < = 0 ) {
if ( avctx - > profile = = FF_PROFILE_AAC_HE_V2 ) {
sce = 1 ;
cpe = 0 ;
}
avctx - > bit_rate = ( 96 * sce + 128 * cpe ) * avctx - > sample_rate / 44 ;
if ( avctx - > profile = = FF_PROFILE_AAC_HE | |
avctx - > profile = = FF_PROFILE_AAC_HE_V2 | |
2013-06-22 18:16:11 +03:00
avctx - > profile = = FF_PROFILE_MPEG2_AAC_HE | |
2012-06-28 16:46:24 +03:00
s - > eld_sbr )
avctx - > bit_rate / = 2 ;
}
if ( ( err = aacEncoder_SetParam ( s - > handle , AACENC_BITRATE ,
avctx - > bit_rate ) ) ! = AACENC_OK ) {
2015-09-15 18:01:32 +02:00
av_log ( avctx , AV_LOG_ERROR , " Unable to set the bitrate % " PRId64 " : %s \n " ,
2017-09-22 01:33:22 +02:00
avctx - > bit_rate , aac_get_error ( err ) ) ;
2012-06-28 16:46:24 +03:00
goto error ;
}
}
/* Choose bitstream format - if global header is requested, use
* raw access units , otherwise use ADTS . */
if ( ( err = aacEncoder_SetParam ( s - > handle , AACENC_TRANSMUX ,
2018-07-05 22:05:02 +02:00
avctx - > flags & AV_CODEC_FLAG_GLOBAL_HEADER ? TT_MP4_RAW :
s - > latm ? TT_MP4_LOAS : TT_MP4_ADTS ) ) ! = AACENC_OK ) {
2012-06-28 16:46:24 +03:00
av_log ( avctx , AV_LOG_ERROR , " Unable to set the transmux format: %s \n " ,
aac_get_error ( err ) ) ;
goto error ;
}
2012-07-23 19:20:04 +03:00
if ( s - > latm & & s - > header_period ) {
if ( ( err = aacEncoder_SetParam ( s - > handle , AACENC_HEADER_PERIOD ,
s - > header_period ) ) ! = AACENC_OK ) {
av_log ( avctx , AV_LOG_ERROR , " Unable to set header period: %s \n " ,
aac_get_error ( err ) ) ;
goto error ;
}
}
2012-06-28 16:46:24 +03:00
/* If no signaling mode is chosen, use explicit hierarchical signaling
* if using mp4 mode ( raw access units , with global header ) and
* implicit signaling if using ADTS . */
if ( s - > signaling < 0 )
2015-06-29 21:59:37 +02:00
s - > signaling = avctx - > flags & AV_CODEC_FLAG_GLOBAL_HEADER ? 2 : 0 ;
2012-06-28 16:46:24 +03:00
if ( ( err = aacEncoder_SetParam ( s - > handle , AACENC_SIGNALING_MODE ,
s - > signaling ) ) ! = AACENC_OK ) {
av_log ( avctx , AV_LOG_ERROR , " Unable to set signaling mode %d: %s \n " ,
s - > signaling , aac_get_error ( err ) ) ;
goto error ;
}
if ( ( err = aacEncoder_SetParam ( s - > handle , AACENC_AFTERBURNER ,
s - > afterburner ) ) ! = AACENC_OK ) {
av_log ( avctx , AV_LOG_ERROR , " Unable to set afterburner to %d: %s \n " ,
s - > afterburner , aac_get_error ( err ) ) ;
goto error ;
}
2012-07-12 21:19:08 +03:00
if ( avctx - > cutoff > 0 ) {
2013-02-09 22:03:02 +03:00
if ( avctx - > cutoff < ( avctx - > sample_rate + 255 ) > > 8 | | avctx - > cutoff > 20000 ) {
2012-07-15 19:41:11 +03:00
av_log ( avctx , AV_LOG_ERROR , " cutoff valid range is %d-20000 \n " ,
( avctx - > sample_rate + 255 ) > > 8 ) ;
goto error ;
}
2012-07-12 21:19:08 +03:00
if ( ( err = aacEncoder_SetParam ( s - > handle , AACENC_BANDWIDTH ,
avctx - > cutoff ) ) ! = AACENC_OK ) {
2012-12-19 20:48:21 +03:00
av_log ( avctx , AV_LOG_ERROR , " Unable to set the encoder bandwidth to %d: %s \n " ,
2012-07-12 21:19:08 +03:00
avctx - > cutoff , aac_get_error ( err ) ) ;
goto error ;
}
}
2023-02-28 23:25:13 +02:00
s - > metadata_mode = 0 ;
if ( s - > prog_ref ) {
s - > metadata_mode = 1 ;
s - > metaDataSetup . prog_ref_level_present = 1 ;
s - > metaDataSetup . prog_ref_level = s - > prog_ref < < 16 ;
}
if ( s - > drc_profile ) {
s - > metadata_mode = 1 ;
s - > metaDataSetup . drc_profile = s - > drc_profile ;
s - > metaDataSetup . drc_TargetRefLevel = s - > drc_target_ref < < 16 ;
if ( s - > comp_profile ) {
/* Including the comp_profile means that we need to set the mode to ETSI */
s - > metadata_mode = 2 ;
s - > metaDataSetup . comp_profile = s - > comp_profile ;
s - > metaDataSetup . comp_TargetRefLevel = s - > comp_target_ref < < 16 ;
}
}
if ( ( err = aacEncoder_SetParam ( s - > handle , AACENC_METADATA_MODE , s - > metadata_mode ) ) ! = AACENC_OK ) {
av_log ( avctx , AV_LOG_ERROR , " Unable to set metadata mode to %d: %s \n " ,
s - > metadata_mode , aac_get_error ( err ) ) ;
goto error ;
}
2012-06-28 16:46:24 +03:00
if ( ( err = aacEncEncode ( s - > handle , NULL , NULL , NULL , NULL ) ) ! = AACENC_OK ) {
av_log ( avctx , AV_LOG_ERROR , " Unable to initialize the encoder: %s \n " ,
aac_get_error ( err ) ) ;
return AVERROR ( EINVAL ) ;
}
if ( ( err = aacEncInfo ( s - > handle , & info ) ) ! = AACENC_OK ) {
av_log ( avctx , AV_LOG_ERROR , " Unable to get encoder info: %s \n " ,
aac_get_error ( err ) ) ;
goto error ;
}
avctx - > frame_size = info . frameLength ;
2018-09-04 10:29:37 +02:00
# if FDKENC_VER_AT_LEAST(4, 0) // 4.0.0
2018-08-31 13:25:30 +02:00
avctx - > initial_padding = info . nDelay ;
# else
2014-08-23 15:40:50 +03:00
avctx - > initial_padding = info . encoderDelay ;
2018-08-31 13:25:30 +02:00
# endif
2012-06-28 16:46:24 +03:00
ff_af_queue_init ( avctx , & s - > afq ) ;
2015-06-29 21:59:37 +02:00
if ( avctx - > flags & AV_CODEC_FLAG_GLOBAL_HEADER ) {
2012-06-28 16:46:24 +03:00
avctx - > extradata_size = info . confSize ;
avctx - > extradata = av_mallocz ( avctx - > extradata_size +
2015-06-29 23:48:34 +02:00
AV_INPUT_BUFFER_PADDING_SIZE ) ;
2012-06-28 16:46:24 +03:00
if ( ! avctx - > extradata ) {
ret = AVERROR ( ENOMEM ) ;
goto error ;
}
memcpy ( avctx - > extradata , info . confBuf , info . confSize ) ;
}
return 0 ;
error :
aac_encode_close ( avctx ) ;
return ret ;
}
static int aac_encode_frame ( AVCodecContext * avctx , AVPacket * avpkt ,
const AVFrame * frame , int * got_packet_ptr )
{
AACContext * s = avctx - > priv_data ;
AACENC_BufDesc in_buf = { 0 } , out_buf = { 0 } ;
AACENC_InArgs in_args = { 0 } ;
AACENC_OutArgs out_args = { 0 } ;
2023-02-28 23:25:13 +02:00
void * inBuffer [ ] = { 0 , & s - > metaDataSetup } ;
int in_buffer_identifiers [ ] = { IN_AUDIO_DATA , IN_METADATA_SETUP } ;
int in_buffer_element_sizes [ ] = { 2 , sizeof ( AACENC_MetaData ) } ;
int in_buffer_sizes [ ] = { 0 , sizeof ( s - > metaDataSetup ) } ;
2012-06-28 16:46:24 +03:00
int out_buffer_identifier = OUT_BITSTREAM_DATA ;
int out_buffer_size , out_buffer_element_size ;
2023-02-28 23:25:13 +02:00
void * out_ptr ;
2023-03-01 01:08:10 +02:00
int ret , discard_padding ;
2018-08-31 13:25:30 +02:00
uint8_t dummy_buf [ 1 ] ;
2012-06-28 16:46:24 +03:00
AACENC_ERROR err ;
/* handle end-of-stream small frame and flushing */
if ( ! frame ) {
2018-08-31 13:25:30 +02:00
/* Must be a non-null pointer, even if it's a dummy. We could use
* the address of anything else on the stack as well . */
2023-02-28 23:25:13 +02:00
inBuffer [ 0 ] = dummy_buf ;
2018-08-31 13:25:30 +02:00
2012-06-28 16:46:24 +03:00
in_args . numInSamples = - 1 ;
} else {
2023-02-28 23:25:13 +02:00
inBuffer [ 0 ] = frame - > data [ 0 ] ;
in_buffer_sizes [ 0 ] = 2 * avctx - > ch_layout . nb_channels * frame - > nb_samples ;
2012-06-28 16:46:24 +03:00
2017-04-04 16:55:10 +02:00
in_args . numInSamples = avctx - > ch_layout . nb_channels * frame - > nb_samples ;
2012-06-28 16:46:24 +03:00
/* add current frame to the queue */
2013-01-14 02:03:23 +03:00
if ( ( ret = ff_af_queue_add ( & s - > afq , frame ) ) < 0 )
2012-06-28 16:46:24 +03:00
return ret ;
}
2023-02-28 23:25:13 +02:00
if ( s - > metadata_mode = = 0 ) {
in_buf . numBufs = 1 ;
} else {
in_buf . numBufs = 2 ;
}
in_buf . bufs = ( void * * ) inBuffer ;
in_buf . bufferIdentifiers = in_buffer_identifiers ;
in_buf . bufSizes = in_buffer_sizes ;
in_buf . bufElSizes = in_buffer_element_sizes ;
2018-08-31 13:25:30 +02:00
2012-06-28 16:46:24 +03:00
/* The maximum packet size is 6144 bits aka 768 bytes per channel. */
2017-04-04 16:55:10 +02:00
ret = ff_alloc_packet ( avctx , avpkt , FFMAX ( 8192 , 768 * avctx - > ch_layout . nb_channels ) ) ;
2021-05-11 15:17:13 +02:00
if ( ret < 0 )
2012-06-28 16:46:24 +03:00
return ret ;
out_ptr = avpkt - > data ;
out_buffer_size = avpkt - > size ;
out_buffer_element_size = 1 ;
out_buf . numBufs = 1 ;
out_buf . bufs = & out_ptr ;
out_buf . bufferIdentifiers = & out_buffer_identifier ;
out_buf . bufSizes = & out_buffer_size ;
out_buf . bufElSizes = & out_buffer_element_size ;
if ( ( err = aacEncEncode ( s - > handle , & in_buf , & out_buf , & in_args ,
& out_args ) ) ! = AACENC_OK ) {
if ( ! frame & & err = = AACENC_ENCODE_EOF )
return 0 ;
av_log ( avctx , AV_LOG_ERROR , " Unable to encode frame: %s \n " ,
aac_get_error ( err ) ) ;
return AVERROR ( EINVAL ) ;
}
if ( ! out_args . numOutBytes )
return 0 ;
/* Get the next frame pts & duration */
ff_af_queue_remove ( & s - > afq , avctx - > frame_size , & avpkt - > pts ,
& avpkt - > duration ) ;
2023-03-01 01:08:10 +02:00
discard_padding = avctx - > frame_size - avpkt - > duration ;
// Check if subtraction resulted in an overflow
if ( ( discard_padding < avctx - > frame_size ) ! = ( avpkt - > duration > 0 ) ) {
av_log ( avctx , AV_LOG_ERROR , " discard padding overflow \n " ) ;
return AVERROR ( EINVAL ) ;
}
if ( ( ! s - > delay_sent & & avctx - > initial_padding > 0 ) | | discard_padding > 0 ) {
uint8_t * side_data =
av_packet_new_side_data ( avpkt , AV_PKT_DATA_SKIP_SAMPLES , 10 ) ;
2023-03-13 06:03:52 +02:00
if ( ! side_data )
2023-03-01 01:08:10 +02:00
return AVERROR ( ENOMEM ) ;
if ( ! s - > delay_sent ) {
AV_WL32 ( side_data , avctx - > initial_padding ) ;
s - > delay_sent = 1 ;
}
AV_WL32 ( side_data + 4 , discard_padding ) ;
}
2012-06-28 16:46:24 +03:00
avpkt - > size = out_args . numOutBytes ;
* got_packet_ptr = 1 ;
return 0 ;
}
static const AVProfile profiles [ ] = {
{ FF_PROFILE_AAC_LOW , " LC " } ,
{ FF_PROFILE_AAC_HE , " HE-AAC " } ,
{ FF_PROFILE_AAC_HE_V2 , " HE-AACv2 " } ,
{ FF_PROFILE_AAC_LD , " LD " } ,
{ FF_PROFILE_AAC_ELD , " ELD " } ,
{ FF_PROFILE_UNKNOWN } ,
} ;
2022-03-16 22:26:11 +02:00
static const FFCodecDefault aac_encode_defaults [ ] = {
2012-06-28 16:46:24 +03:00
{ " b " , " 0 " } ,
{ NULL }
} ;
2017-04-04 16:55:10 +02:00
# if FF_API_OLD_CHANNEL_LAYOUT
2012-06-28 16:46:24 +03:00
static const uint64_t aac_channel_layout [ ] = {
AV_CH_LAYOUT_MONO ,
AV_CH_LAYOUT_STEREO ,
AV_CH_LAYOUT_SURROUND ,
AV_CH_LAYOUT_4POINT0 ,
AV_CH_LAYOUT_5POINT0_BACK ,
AV_CH_LAYOUT_5POINT1_BACK ,
2022-11-29 19:55:33 +02:00
# if FDKENC_VER_AT_LEAST(4, 0) // 4.0.0
2022-11-28 00:16:03 +02:00
AV_CH_LAYOUT_6POINT1_BACK ,
2022-11-29 19:55:33 +02:00
# endif
# if FDKENC_VER_AT_LEAST(3, 4) // 3.4.12
2014-01-26 16:46:11 +03:00
AV_CH_LAYOUT_7POINT1_WIDE_BACK ,
2014-01-26 16:44:27 +03:00
AV_CH_LAYOUT_7POINT1 ,
2022-11-29 19:55:33 +02:00
# endif
# if FDKENC_VER_AT_LEAST(4, 0) // 4.0.0
2022-11-28 00:08:49 +02:00
AV_CH_LAYOUT_7POINT1_TOP_BACK ,
2014-02-06 03:08:00 +03:00
# endif
2012-06-28 16:46:24 +03:00
0 ,
} ;
2017-04-04 16:55:10 +02:00
# endif /* FF_API_OLD_CHANNEL_LAYOUT */
static const AVChannelLayout aac_ch_layouts [ 16 ] = {
AV_CHANNEL_LAYOUT_MONO ,
AV_CHANNEL_LAYOUT_STEREO ,
AV_CHANNEL_LAYOUT_SURROUND ,
AV_CHANNEL_LAYOUT_4POINT0 ,
AV_CHANNEL_LAYOUT_5POINT0_BACK ,
AV_CHANNEL_LAYOUT_5POINT1_BACK ,
2022-11-29 19:55:33 +02:00
# if FDKENC_VER_AT_LEAST(4, 0) // 4.0.0
2022-11-28 00:16:03 +02:00
AV_CHANNEL_LAYOUT_6POINT1_BACK ,
2022-11-29 19:55:33 +02:00
# endif
# if FDKENC_VER_AT_LEAST(3, 4) // 3.4.12
2017-04-04 16:55:10 +02:00
AV_CHANNEL_LAYOUT_7POINT1_WIDE_BACK ,
AV_CHANNEL_LAYOUT_7POINT1 ,
2022-11-29 19:55:33 +02:00
# endif
# if FDKENC_VER_AT_LEAST(4, 0) // 4.0.0
2022-11-28 00:08:49 +02:00
AV_CHANNEL_LAYOUT_7POINT1_TOP_BACK ,
2017-04-04 16:55:10 +02:00
# endif
{ 0 } ,
} ;
2012-06-28 16:46:24 +03:00
2012-09-25 02:02:44 +03:00
static const int aac_sample_rates [ ] = {
96000 , 88200 , 64000 , 48000 , 44100 , 32000 ,
24000 , 22050 , 16000 , 12000 , 11025 , 8000 , 0
} ;
2022-03-16 22:09:54 +02:00
const FFCodec ff_libfdk_aac_encoder = {
. p . name = " libfdk_aac " ,
2022-08-29 13:38:02 +02:00
CODEC_LONG_NAME ( " Fraunhofer FDK AAC " ) ,
2022-03-16 22:09:54 +02:00
. p . type = AVMEDIA_TYPE_AUDIO ,
. p . id = AV_CODEC_ID_AAC ,
2021-05-11 20:52:13 +02:00
. p . capabilities = AV_CODEC_CAP_DR1 | AV_CODEC_CAP_DELAY |
2023-03-27 16:19:16 +02:00
AV_CODEC_CAP_ENCODER_FLUSH |
2021-05-11 20:52:13 +02:00
AV_CODEC_CAP_SMALL_LAST_FRAME ,
2022-07-09 22:25:41 +02:00
. caps_internal = FF_CODEC_CAP_NOT_INIT_THREADSAFE ,
2012-09-25 02:03:22 +03:00
. priv_data_size = sizeof ( AACContext ) ,
. init = aac_encode_init ,
2022-03-30 23:28:24 +02:00
FF_CODEC_ENCODE_CB ( aac_encode_frame ) ,
2023-03-27 16:19:16 +02:00
. flush = aac_encode_flush ,
2012-09-25 02:03:22 +03:00
. close = aac_encode_close ,
2022-03-16 22:09:54 +02:00
. p . sample_fmts = ( const enum AVSampleFormat [ ] ) { AV_SAMPLE_FMT_S16 ,
2012-09-25 02:03:22 +03:00
AV_SAMPLE_FMT_NONE } ,
2022-03-16 22:09:54 +02:00
. p . priv_class = & aac_enc_class ,
2012-09-25 02:03:22 +03:00
. defaults = aac_encode_defaults ,
2022-03-16 22:09:54 +02:00
. p . profiles = profiles ,
. p . supported_samplerates = aac_sample_rates ,
. p . wrapper_name = " libfdk " ,
2022-09-26 01:10:51 +02:00
CODEC_OLD_CHANNEL_LAYOUTS_ARRAY ( aac_channel_layout )
2022-03-16 22:09:54 +02:00
. p . ch_layouts = aac_ch_layouts ,
2012-06-28 16:46:24 +03:00
} ;