mirror of
https://github.com/FFmpeg/FFmpeg.git
synced 2025-01-13 21:28:01 +02:00
interlaced motion estimation
interlaced mpeg2 encoding P & B frames; rate distorted interlaced mb decision; alternate scantable support; 4mv encoding fixes (that's also why the regression tests change); passing height to most dsp functions; interlaced mpeg4 encoding (no direct mode MBs yet); various related cleanups; disabled old motion estimation algorithms (log, full, ...), they will either be fixed or removed. Originally committed as revision 2638 to svn://svn.ffmpeg.org/ffmpeg/trunk
This commit is contained in:
parent
b846b231b3
commit
bb198e198a
41
ffmpeg.c
41
ffmpeg.c
@ -119,8 +119,10 @@ static int use_obmc = 0;
|
|||||||
static int use_aic = 0;
|
static int use_aic = 0;
|
||||||
static int use_aiv = 0;
|
static int use_aiv = 0;
|
||||||
static int use_umv = 0;
|
static int use_umv = 0;
|
||||||
|
static int use_alt_scan = 0;
|
||||||
static int do_deinterlace = 0;
|
static int do_deinterlace = 0;
|
||||||
static int do_interlace = 0;
|
static int do_interlace_dct = 0;
|
||||||
|
static int do_interlace_me = 0;
|
||||||
static int workaround_bugs = FF_BUG_AUTODETECT;
|
static int workaround_bugs = FF_BUG_AUTODETECT;
|
||||||
static int error_resilience = 2;
|
static int error_resilience = 2;
|
||||||
static int error_concealment = 3;
|
static int error_concealment = 3;
|
||||||
@ -130,6 +132,8 @@ static int use_part = 0;
|
|||||||
static int packet_size = 0;
|
static int packet_size = 0;
|
||||||
static int error_rate = 0;
|
static int error_rate = 0;
|
||||||
static int strict = 0;
|
static int strict = 0;
|
||||||
|
static int top_field_first = -1;
|
||||||
|
static int noise_reduction = 0;
|
||||||
static int debug = 0;
|
static int debug = 0;
|
||||||
static int debug_mv = 0;
|
static int debug_mv = 0;
|
||||||
extern int loop_input; /* currently a hack */
|
extern int loop_input; /* currently a hack */
|
||||||
@ -635,7 +639,12 @@ static void do_video_out(AVFormatContext *s,
|
|||||||
/* better than nothing: use input picture interlaced
|
/* better than nothing: use input picture interlaced
|
||||||
settings */
|
settings */
|
||||||
big_picture.interlaced_frame = in_picture->interlaced_frame;
|
big_picture.interlaced_frame = in_picture->interlaced_frame;
|
||||||
big_picture.top_field_first = in_picture->top_field_first;
|
if(do_interlace_me || do_interlace_dct){
|
||||||
|
if(top_field_first == -1)
|
||||||
|
big_picture.top_field_first = in_picture->top_field_first;
|
||||||
|
else
|
||||||
|
big_picture.top_field_first = 1;
|
||||||
|
}
|
||||||
|
|
||||||
/* handles sameq here. This is not correct because it may
|
/* handles sameq here. This is not correct because it may
|
||||||
not be a global option */
|
not be a global option */
|
||||||
@ -1946,6 +1955,16 @@ static void opt_strict(const char *arg)
|
|||||||
strict= atoi(arg);
|
strict= atoi(arg);
|
||||||
}
|
}
|
||||||
|
|
||||||
|
static void opt_top_field_first(const char *arg)
|
||||||
|
{
|
||||||
|
top_field_first= atoi(arg);
|
||||||
|
}
|
||||||
|
|
||||||
|
static void opt_noise_reduction(const char *arg)
|
||||||
|
{
|
||||||
|
noise_reduction= atoi(arg);
|
||||||
|
}
|
||||||
|
|
||||||
static void opt_audio_bitrate(const char *arg)
|
static void opt_audio_bitrate(const char *arg)
|
||||||
{
|
{
|
||||||
audio_bit_rate = atoi(arg) * 1000;
|
audio_bit_rate = atoi(arg) * 1000;
|
||||||
@ -2373,14 +2392,20 @@ static void opt_output_file(const char *filename)
|
|||||||
if(use_part) {
|
if(use_part) {
|
||||||
video_enc->flags |= CODEC_FLAG_PART;
|
video_enc->flags |= CODEC_FLAG_PART;
|
||||||
}
|
}
|
||||||
|
if (use_alt_scan) {
|
||||||
|
video_enc->flags |= CODEC_FLAG_ALT_SCAN;
|
||||||
|
}
|
||||||
if (b_frames) {
|
if (b_frames) {
|
||||||
video_enc->max_b_frames = b_frames;
|
video_enc->max_b_frames = b_frames;
|
||||||
video_enc->b_frame_strategy = 0;
|
video_enc->b_frame_strategy = 0;
|
||||||
video_enc->b_quant_factor = 2.0;
|
video_enc->b_quant_factor = 2.0;
|
||||||
}
|
}
|
||||||
if (do_interlace) {
|
if (do_interlace_dct) {
|
||||||
video_enc->flags |= CODEC_FLAG_INTERLACED_DCT;
|
video_enc->flags |= CODEC_FLAG_INTERLACED_DCT;
|
||||||
}
|
}
|
||||||
|
if (do_interlace_me) {
|
||||||
|
video_enc->flags |= CODEC_FLAG_INTERLACED_ME;
|
||||||
|
}
|
||||||
video_enc->qmin = video_qmin;
|
video_enc->qmin = video_qmin;
|
||||||
video_enc->qmax = video_qmax;
|
video_enc->qmax = video_qmax;
|
||||||
video_enc->mb_qmin = video_mb_qmin;
|
video_enc->mb_qmin = video_mb_qmin;
|
||||||
@ -2430,6 +2455,7 @@ static void opt_output_file(const char *filename)
|
|||||||
video_enc->idct_algo = idct_algo;
|
video_enc->idct_algo = idct_algo;
|
||||||
video_enc->strict_std_compliance = strict;
|
video_enc->strict_std_compliance = strict;
|
||||||
video_enc->error_rate = error_rate;
|
video_enc->error_rate = error_rate;
|
||||||
|
video_enc->noise_reduction= noise_reduction;
|
||||||
if(packet_size){
|
if(packet_size){
|
||||||
video_enc->rtp_mode= 1;
|
video_enc->rtp_mode= 1;
|
||||||
video_enc->rtp_payload_size= packet_size;
|
video_enc->rtp_payload_size= packet_size;
|
||||||
@ -2992,16 +3018,21 @@ const OptionDef options[] = {
|
|||||||
{ "passlogfile", HAS_ARG | OPT_STRING | OPT_VIDEO, {(void*)&pass_logfilename}, "select two pass log file name", "file" },
|
{ "passlogfile", HAS_ARG | OPT_STRING | OPT_VIDEO, {(void*)&pass_logfilename}, "select two pass log file name", "file" },
|
||||||
{ "deinterlace", OPT_BOOL | OPT_EXPERT | OPT_VIDEO, {(void*)&do_deinterlace},
|
{ "deinterlace", OPT_BOOL | OPT_EXPERT | OPT_VIDEO, {(void*)&do_deinterlace},
|
||||||
"deinterlace pictures" },
|
"deinterlace pictures" },
|
||||||
{ "interlace", OPT_BOOL | OPT_EXPERT | OPT_VIDEO, {(void*)&do_interlace},
|
{ "ildct", OPT_BOOL | OPT_EXPERT | OPT_VIDEO, {(void*)&do_interlace_dct},
|
||||||
"force interlacing support in encoder (MPEG2/MPEG4)" },
|
"force interlaced dct support in encoder (MPEG2/MPEG4)" },
|
||||||
|
{ "ilme", OPT_BOOL | OPT_EXPERT | OPT_VIDEO, {(void*)&do_interlace_me},
|
||||||
|
"force interlacied me support in encoder MPEG2" },
|
||||||
{ "psnr", OPT_BOOL | OPT_EXPERT | OPT_VIDEO, {(void*)&do_psnr}, "calculate PSNR of compressed frames" },
|
{ "psnr", OPT_BOOL | OPT_EXPERT | OPT_VIDEO, {(void*)&do_psnr}, "calculate PSNR of compressed frames" },
|
||||||
{ "vstats", OPT_BOOL | OPT_EXPERT | OPT_VIDEO, {(void*)&do_vstats}, "dump video coding statistics to file" },
|
{ "vstats", OPT_BOOL | OPT_EXPERT | OPT_VIDEO, {(void*)&do_vstats}, "dump video coding statistics to file" },
|
||||||
{ "vhook", HAS_ARG | OPT_EXPERT | OPT_VIDEO, {(void*)add_frame_hooker}, "insert video processing module", "module" },
|
{ "vhook", HAS_ARG | OPT_EXPERT | OPT_VIDEO, {(void*)add_frame_hooker}, "insert video processing module", "module" },
|
||||||
{ "aic", OPT_BOOL | OPT_EXPERT | OPT_VIDEO, {(void*)&use_aic}, "enable Advanced intra coding (h263+)" },
|
{ "aic", OPT_BOOL | OPT_EXPERT | OPT_VIDEO, {(void*)&use_aic}, "enable Advanced intra coding (h263+)" },
|
||||||
{ "aiv", OPT_BOOL | OPT_EXPERT | OPT_VIDEO, {(void*)&use_aiv}, "enable Alternative inter vlc (h263+)" },
|
{ "aiv", OPT_BOOL | OPT_EXPERT | OPT_VIDEO, {(void*)&use_aiv}, "enable Alternative inter vlc (h263+)" },
|
||||||
{ "umv", OPT_BOOL | OPT_EXPERT | OPT_VIDEO, {(void*)&use_umv}, "enable Unlimited Motion Vector (h263+)" },
|
{ "umv", OPT_BOOL | OPT_EXPERT | OPT_VIDEO, {(void*)&use_umv}, "enable Unlimited Motion Vector (h263+)" },
|
||||||
|
{ "alt", OPT_BOOL | OPT_EXPERT | OPT_VIDEO, {(void*)&use_alt_scan}, "enable alternate scantable (mpeg2)" },
|
||||||
{ "intra_matrix", HAS_ARG | OPT_EXPERT | OPT_VIDEO, {(void*)opt_intra_matrix}, "specify intra matrix coeffs", "matrix" },
|
{ "intra_matrix", HAS_ARG | OPT_EXPERT | OPT_VIDEO, {(void*)opt_intra_matrix}, "specify intra matrix coeffs", "matrix" },
|
||||||
{ "inter_matrix", HAS_ARG | OPT_EXPERT | OPT_VIDEO, {(void*)opt_inter_matrix}, "specify inter matrix coeffs", "matrix" },
|
{ "inter_matrix", HAS_ARG | OPT_EXPERT | OPT_VIDEO, {(void*)opt_inter_matrix}, "specify inter matrix coeffs", "matrix" },
|
||||||
|
{ "top", HAS_ARG | OPT_EXPERT | OPT_VIDEO, {(void*)opt_top_field_first}, "top=1/bottom=0/auto=-1 field first", "" },
|
||||||
|
{ "nr", HAS_ARG | OPT_EXPERT | OPT_VIDEO, {(void*)opt_noise_reduction}, "noise reduction", "" },
|
||||||
|
|
||||||
/* audio options */
|
/* audio options */
|
||||||
{ "ab", HAS_ARG | OPT_AUDIO, {(void*)opt_audio_bitrate}, "set audio bitrate (in kbit/s)", "bitrate", },
|
{ "ab", HAS_ARG | OPT_AUDIO, {(void*)opt_audio_bitrate}, "set audio bitrate (in kbit/s)", "bitrate", },
|
||||||
|
@ -39,11 +39,11 @@ void get_pixels_mvi(DCTELEM *restrict block,
|
|||||||
const uint8_t *restrict pixels, int line_size);
|
const uint8_t *restrict pixels, int line_size);
|
||||||
void diff_pixels_mvi(DCTELEM *block, const uint8_t *s1, const uint8_t *s2,
|
void diff_pixels_mvi(DCTELEM *block, const uint8_t *s1, const uint8_t *s2,
|
||||||
int stride);
|
int stride);
|
||||||
int pix_abs8x8_mvi(uint8_t *pix1, uint8_t *pix2, int line_size);
|
int pix_abs8x8_mvi(void *v, uint8_t *pix1, uint8_t *pix2, int line_size, int h);
|
||||||
int pix_abs16x16_mvi_asm(uint8_t *pix1, uint8_t *pix2, int line_size);
|
int pix_abs16x16_mvi_asm(uint8_t *pix1, uint8_t *pix2, int line_size);
|
||||||
int pix_abs16x16_x2_mvi(uint8_t *pix1, uint8_t *pix2, int line_size);
|
int pix_abs16x16_x2_mvi(void *v, uint8_t *pix1, uint8_t *pix2, int line_size, int h);
|
||||||
int pix_abs16x16_y2_mvi(uint8_t *pix1, uint8_t *pix2, int line_size);
|
int pix_abs16x16_y2_mvi(void *v, uint8_t *pix1, uint8_t *pix2, int line_size, int h);
|
||||||
int pix_abs16x16_xy2_mvi(uint8_t *pix1, uint8_t *pix2, int line_size);
|
int pix_abs16x16_xy2_mvi(void *v, uint8_t *pix1, uint8_t *pix2, int line_size, int h);
|
||||||
|
|
||||||
#if 0
|
#if 0
|
||||||
/* These functions were the base for the optimized assembler routines,
|
/* These functions were the base for the optimized assembler routines,
|
||||||
@ -290,11 +290,6 @@ static int sad16x16_mvi(void *s, uint8_t *a, uint8_t *b, int stride)
|
|||||||
return pix_abs16x16_mvi_asm(a, b, stride);
|
return pix_abs16x16_mvi_asm(a, b, stride);
|
||||||
}
|
}
|
||||||
|
|
||||||
static int sad8x8_mvi(void *s, uint8_t *a, uint8_t *b, int stride)
|
|
||||||
{
|
|
||||||
return pix_abs8x8_mvi(a, b, stride);
|
|
||||||
}
|
|
||||||
|
|
||||||
void dsputil_init_alpha(DSPContext* c, AVCodecContext *avctx)
|
void dsputil_init_alpha(DSPContext* c, AVCodecContext *avctx)
|
||||||
{
|
{
|
||||||
c->put_pixels_tab[0][0] = put_pixels16_axp_asm;
|
c->put_pixels_tab[0][0] = put_pixels16_axp_asm;
|
||||||
@ -347,12 +342,13 @@ void dsputil_init_alpha(DSPContext* c, AVCodecContext *avctx)
|
|||||||
c->get_pixels = get_pixels_mvi;
|
c->get_pixels = get_pixels_mvi;
|
||||||
c->diff_pixels = diff_pixels_mvi;
|
c->diff_pixels = diff_pixels_mvi;
|
||||||
c->sad[0] = sad16x16_mvi;
|
c->sad[0] = sad16x16_mvi;
|
||||||
c->sad[1] = sad8x8_mvi;
|
c->sad[1] = pix_abs8x8_mvi;
|
||||||
c->pix_abs8x8 = pix_abs8x8_mvi;
|
// c->pix_abs[0][0] = pix_abs16x16_mvi_asm; //FIXME function arguments for the asm must be fixed
|
||||||
c->pix_abs16x16 = pix_abs16x16_mvi_asm;
|
c->pix_abs[0][0] = sad16x16_mvi;
|
||||||
c->pix_abs16x16_x2 = pix_abs16x16_x2_mvi;
|
c->pix_abs[1][0] = pix_abs8x8_mvi;
|
||||||
c->pix_abs16x16_y2 = pix_abs16x16_y2_mvi;
|
c->pix_abs[0][1] = pix_abs16x16_x2_mvi;
|
||||||
c->pix_abs16x16_xy2 = pix_abs16x16_xy2_mvi;
|
c->pix_abs[0][2] = pix_abs16x16_y2_mvi;
|
||||||
|
c->pix_abs[0][3] = pix_abs16x16_xy2_mvi;
|
||||||
}
|
}
|
||||||
|
|
||||||
put_pixels_clamped_axp_p = c->put_pixels_clamped;
|
put_pixels_clamped_axp_p = c->put_pixels_clamped;
|
||||||
|
@ -84,10 +84,9 @@ static inline uint64_t avg4(uint64_t l1, uint64_t l2, uint64_t l3, uint64_t l4)
|
|||||||
return r1 + r2;
|
return r1 + r2;
|
||||||
}
|
}
|
||||||
|
|
||||||
int pix_abs8x8_mvi(uint8_t *pix1, uint8_t *pix2, int line_size)
|
int pix_abs8x8_mvi(void *v, uint8_t *pix1, uint8_t *pix2, int line_size, int h)
|
||||||
{
|
{
|
||||||
int result = 0;
|
int result = 0;
|
||||||
int h = 8;
|
|
||||||
|
|
||||||
if ((size_t) pix2 & 0x7) {
|
if ((size_t) pix2 & 0x7) {
|
||||||
/* works only when pix2 is actually unaligned */
|
/* works only when pix2 is actually unaligned */
|
||||||
@ -160,10 +159,9 @@ int pix_abs16x16_mvi(uint8_t *pix1, uint8_t *pix2, int line_size)
|
|||||||
}
|
}
|
||||||
#endif
|
#endif
|
||||||
|
|
||||||
int pix_abs16x16_x2_mvi(uint8_t *pix1, uint8_t *pix2, int line_size)
|
int pix_abs16x16_x2_mvi(void *v, uint8_t *pix1, uint8_t *pix2, int line_size, int h)
|
||||||
{
|
{
|
||||||
int result = 0;
|
int result = 0;
|
||||||
int h = 16;
|
|
||||||
uint64_t disalign = (size_t) pix2 & 0x7;
|
uint64_t disalign = (size_t) pix2 & 0x7;
|
||||||
|
|
||||||
switch (disalign) {
|
switch (disalign) {
|
||||||
@ -234,10 +232,9 @@ int pix_abs16x16_x2_mvi(uint8_t *pix1, uint8_t *pix2, int line_size)
|
|||||||
return result;
|
return result;
|
||||||
}
|
}
|
||||||
|
|
||||||
int pix_abs16x16_y2_mvi(uint8_t *pix1, uint8_t *pix2, int line_size)
|
int pix_abs16x16_y2_mvi(void *v, uint8_t *pix1, uint8_t *pix2, int line_size, int h)
|
||||||
{
|
{
|
||||||
int result = 0;
|
int result = 0;
|
||||||
int h = 16;
|
|
||||||
|
|
||||||
if ((size_t) pix2 & 0x7) {
|
if ((size_t) pix2 & 0x7) {
|
||||||
uint64_t t, p2_l, p2_r;
|
uint64_t t, p2_l, p2_r;
|
||||||
@ -288,10 +285,9 @@ int pix_abs16x16_y2_mvi(uint8_t *pix1, uint8_t *pix2, int line_size)
|
|||||||
return result;
|
return result;
|
||||||
}
|
}
|
||||||
|
|
||||||
int pix_abs16x16_xy2_mvi(uint8_t *pix1, uint8_t *pix2, int line_size)
|
int pix_abs16x16_xy2_mvi(void *v, uint8_t *pix1, uint8_t *pix2, int line_size, int h)
|
||||||
{
|
{
|
||||||
int result = 0;
|
int result = 0;
|
||||||
int h = 16;
|
|
||||||
|
|
||||||
uint64_t p1_l, p1_r;
|
uint64_t p1_l, p1_r;
|
||||||
uint64_t p2_l, p2_r, p2_x;
|
uint64_t p2_l, p2_r, p2_x;
|
||||||
|
@ -17,7 +17,7 @@ extern "C" {
|
|||||||
|
|
||||||
#define FFMPEG_VERSION_INT 0x000408
|
#define FFMPEG_VERSION_INT 0x000408
|
||||||
#define FFMPEG_VERSION "0.4.8"
|
#define FFMPEG_VERSION "0.4.8"
|
||||||
#define LIBAVCODEC_BUILD 4697
|
#define LIBAVCODEC_BUILD 4698
|
||||||
|
|
||||||
#define LIBAVCODEC_VERSION_INT FFMPEG_VERSION_INT
|
#define LIBAVCODEC_VERSION_INT FFMPEG_VERSION_INT
|
||||||
#define LIBAVCODEC_VERSION FFMPEG_VERSION
|
#define LIBAVCODEC_VERSION FFMPEG_VERSION
|
||||||
@ -264,6 +264,7 @@ static const __attribute__((unused)) int Motion_Est_QTab[] =
|
|||||||
#define CODEC_FLAG_OBMC 0x00000001 ///< OBMC
|
#define CODEC_FLAG_OBMC 0x00000001 ///< OBMC
|
||||||
#define CODEC_FLAG_LOOP_FILTER 0x00000800 ///< loop filter
|
#define CODEC_FLAG_LOOP_FILTER 0x00000800 ///< loop filter
|
||||||
#define CODEC_FLAG_H263P_SLICE_STRUCT 0x10000000
|
#define CODEC_FLAG_H263P_SLICE_STRUCT 0x10000000
|
||||||
|
#define CODEC_FLAG_INTERLACED_ME 0x20000000 ///< interlaced motion estimation
|
||||||
/* Unsupported options :
|
/* Unsupported options :
|
||||||
* Syntax Arithmetic coding (SAC)
|
* Syntax Arithmetic coding (SAC)
|
||||||
* Reference Picture Selection
|
* Reference Picture Selection
|
||||||
|
@ -218,13 +218,13 @@ static void bswap_buf(uint32_t *dst, uint32_t *src, int w){
|
|||||||
}
|
}
|
||||||
}
|
}
|
||||||
|
|
||||||
static int sse8_c(void *v, uint8_t * pix1, uint8_t * pix2, int line_size)
|
static int sse8_c(void *v, uint8_t * pix1, uint8_t * pix2, int line_size, int h)
|
||||||
{
|
{
|
||||||
int s, i;
|
int s, i;
|
||||||
uint32_t *sq = squareTbl + 256;
|
uint32_t *sq = squareTbl + 256;
|
||||||
|
|
||||||
s = 0;
|
s = 0;
|
||||||
for (i = 0; i < 8; i++) {
|
for (i = 0; i < h; i++) {
|
||||||
s += sq[pix1[0] - pix2[0]];
|
s += sq[pix1[0] - pix2[0]];
|
||||||
s += sq[pix1[1] - pix2[1]];
|
s += sq[pix1[1] - pix2[1]];
|
||||||
s += sq[pix1[2] - pix2[2]];
|
s += sq[pix1[2] - pix2[2]];
|
||||||
@ -239,13 +239,13 @@ static int sse8_c(void *v, uint8_t * pix1, uint8_t * pix2, int line_size)
|
|||||||
return s;
|
return s;
|
||||||
}
|
}
|
||||||
|
|
||||||
static int sse16_c(void *v, uint8_t *pix1, uint8_t *pix2, int line_size)
|
static int sse16_c(void *v, uint8_t *pix1, uint8_t *pix2, int line_size, int h)
|
||||||
{
|
{
|
||||||
int s, i;
|
int s, i;
|
||||||
uint32_t *sq = squareTbl + 256;
|
uint32_t *sq = squareTbl + 256;
|
||||||
|
|
||||||
s = 0;
|
s = 0;
|
||||||
for (i = 0; i < 16; i++) {
|
for (i = 0; i < h; i++) {
|
||||||
s += sq[pix1[ 0] - pix2[ 0]];
|
s += sq[pix1[ 0] - pix2[ 0]];
|
||||||
s += sq[pix1[ 1] - pix2[ 1]];
|
s += sq[pix1[ 1] - pix2[ 1]];
|
||||||
s += sq[pix1[ 2] - pix2[ 2]];
|
s += sq[pix1[ 2] - pix2[ 2]];
|
||||||
@ -2331,12 +2331,12 @@ static void h263_h_loop_filter_c(uint8_t *src, int stride, int qscale){
|
|||||||
}
|
}
|
||||||
}
|
}
|
||||||
|
|
||||||
static inline int pix_abs16x16_c(uint8_t *pix1, uint8_t *pix2, int line_size)
|
static inline int pix_abs16_c(void *v, uint8_t *pix1, uint8_t *pix2, int line_size, int h)
|
||||||
{
|
{
|
||||||
int s, i;
|
int s, i;
|
||||||
|
|
||||||
s = 0;
|
s = 0;
|
||||||
for(i=0;i<16;i++) {
|
for(i=0;i<h;i++) {
|
||||||
s += abs(pix1[0] - pix2[0]);
|
s += abs(pix1[0] - pix2[0]);
|
||||||
s += abs(pix1[1] - pix2[1]);
|
s += abs(pix1[1] - pix2[1]);
|
||||||
s += abs(pix1[2] - pix2[2]);
|
s += abs(pix1[2] - pix2[2]);
|
||||||
@ -2359,12 +2359,12 @@ static inline int pix_abs16x16_c(uint8_t *pix1, uint8_t *pix2, int line_size)
|
|||||||
return s;
|
return s;
|
||||||
}
|
}
|
||||||
|
|
||||||
static int pix_abs16x16_x2_c(uint8_t *pix1, uint8_t *pix2, int line_size)
|
static int pix_abs16_x2_c(void *v, uint8_t *pix1, uint8_t *pix2, int line_size, int h)
|
||||||
{
|
{
|
||||||
int s, i;
|
int s, i;
|
||||||
|
|
||||||
s = 0;
|
s = 0;
|
||||||
for(i=0;i<16;i++) {
|
for(i=0;i<h;i++) {
|
||||||
s += abs(pix1[0] - avg2(pix2[0], pix2[1]));
|
s += abs(pix1[0] - avg2(pix2[0], pix2[1]));
|
||||||
s += abs(pix1[1] - avg2(pix2[1], pix2[2]));
|
s += abs(pix1[1] - avg2(pix2[1], pix2[2]));
|
||||||
s += abs(pix1[2] - avg2(pix2[2], pix2[3]));
|
s += abs(pix1[2] - avg2(pix2[2], pix2[3]));
|
||||||
@ -2387,13 +2387,13 @@ static int pix_abs16x16_x2_c(uint8_t *pix1, uint8_t *pix2, int line_size)
|
|||||||
return s;
|
return s;
|
||||||
}
|
}
|
||||||
|
|
||||||
static int pix_abs16x16_y2_c(uint8_t *pix1, uint8_t *pix2, int line_size)
|
static int pix_abs16_y2_c(void *v, uint8_t *pix1, uint8_t *pix2, int line_size, int h)
|
||||||
{
|
{
|
||||||
int s, i;
|
int s, i;
|
||||||
uint8_t *pix3 = pix2 + line_size;
|
uint8_t *pix3 = pix2 + line_size;
|
||||||
|
|
||||||
s = 0;
|
s = 0;
|
||||||
for(i=0;i<16;i++) {
|
for(i=0;i<h;i++) {
|
||||||
s += abs(pix1[0] - avg2(pix2[0], pix3[0]));
|
s += abs(pix1[0] - avg2(pix2[0], pix3[0]));
|
||||||
s += abs(pix1[1] - avg2(pix2[1], pix3[1]));
|
s += abs(pix1[1] - avg2(pix2[1], pix3[1]));
|
||||||
s += abs(pix1[2] - avg2(pix2[2], pix3[2]));
|
s += abs(pix1[2] - avg2(pix2[2], pix3[2]));
|
||||||
@ -2417,13 +2417,13 @@ static int pix_abs16x16_y2_c(uint8_t *pix1, uint8_t *pix2, int line_size)
|
|||||||
return s;
|
return s;
|
||||||
}
|
}
|
||||||
|
|
||||||
static int pix_abs16x16_xy2_c(uint8_t *pix1, uint8_t *pix2, int line_size)
|
static int pix_abs16_xy2_c(void *v, uint8_t *pix1, uint8_t *pix2, int line_size, int h)
|
||||||
{
|
{
|
||||||
int s, i;
|
int s, i;
|
||||||
uint8_t *pix3 = pix2 + line_size;
|
uint8_t *pix3 = pix2 + line_size;
|
||||||
|
|
||||||
s = 0;
|
s = 0;
|
||||||
for(i=0;i<16;i++) {
|
for(i=0;i<h;i++) {
|
||||||
s += abs(pix1[0] - avg4(pix2[0], pix2[1], pix3[0], pix3[1]));
|
s += abs(pix1[0] - avg4(pix2[0], pix2[1], pix3[0], pix3[1]));
|
||||||
s += abs(pix1[1] - avg4(pix2[1], pix2[2], pix3[1], pix3[2]));
|
s += abs(pix1[1] - avg4(pix2[1], pix2[2], pix3[1], pix3[2]));
|
||||||
s += abs(pix1[2] - avg4(pix2[2], pix2[3], pix3[2], pix3[3]));
|
s += abs(pix1[2] - avg4(pix2[2], pix2[3], pix3[2], pix3[3]));
|
||||||
@ -2447,12 +2447,12 @@ static int pix_abs16x16_xy2_c(uint8_t *pix1, uint8_t *pix2, int line_size)
|
|||||||
return s;
|
return s;
|
||||||
}
|
}
|
||||||
|
|
||||||
static inline int pix_abs8x8_c(uint8_t *pix1, uint8_t *pix2, int line_size)
|
static inline int pix_abs8_c(void *v, uint8_t *pix1, uint8_t *pix2, int line_size, int h)
|
||||||
{
|
{
|
||||||
int s, i;
|
int s, i;
|
||||||
|
|
||||||
s = 0;
|
s = 0;
|
||||||
for(i=0;i<8;i++) {
|
for(i=0;i<h;i++) {
|
||||||
s += abs(pix1[0] - pix2[0]);
|
s += abs(pix1[0] - pix2[0]);
|
||||||
s += abs(pix1[1] - pix2[1]);
|
s += abs(pix1[1] - pix2[1]);
|
||||||
s += abs(pix1[2] - pix2[2]);
|
s += abs(pix1[2] - pix2[2]);
|
||||||
@ -2467,12 +2467,12 @@ static inline int pix_abs8x8_c(uint8_t *pix1, uint8_t *pix2, int line_size)
|
|||||||
return s;
|
return s;
|
||||||
}
|
}
|
||||||
|
|
||||||
static int pix_abs8x8_x2_c(uint8_t *pix1, uint8_t *pix2, int line_size)
|
static int pix_abs8_x2_c(void *v, uint8_t *pix1, uint8_t *pix2, int line_size, int h)
|
||||||
{
|
{
|
||||||
int s, i;
|
int s, i;
|
||||||
|
|
||||||
s = 0;
|
s = 0;
|
||||||
for(i=0;i<8;i++) {
|
for(i=0;i<h;i++) {
|
||||||
s += abs(pix1[0] - avg2(pix2[0], pix2[1]));
|
s += abs(pix1[0] - avg2(pix2[0], pix2[1]));
|
||||||
s += abs(pix1[1] - avg2(pix2[1], pix2[2]));
|
s += abs(pix1[1] - avg2(pix2[1], pix2[2]));
|
||||||
s += abs(pix1[2] - avg2(pix2[2], pix2[3]));
|
s += abs(pix1[2] - avg2(pix2[2], pix2[3]));
|
||||||
@ -2487,13 +2487,13 @@ static int pix_abs8x8_x2_c(uint8_t *pix1, uint8_t *pix2, int line_size)
|
|||||||
return s;
|
return s;
|
||||||
}
|
}
|
||||||
|
|
||||||
static int pix_abs8x8_y2_c(uint8_t *pix1, uint8_t *pix2, int line_size)
|
static int pix_abs8_y2_c(void *v, uint8_t *pix1, uint8_t *pix2, int line_size, int h)
|
||||||
{
|
{
|
||||||
int s, i;
|
int s, i;
|
||||||
uint8_t *pix3 = pix2 + line_size;
|
uint8_t *pix3 = pix2 + line_size;
|
||||||
|
|
||||||
s = 0;
|
s = 0;
|
||||||
for(i=0;i<8;i++) {
|
for(i=0;i<h;i++) {
|
||||||
s += abs(pix1[0] - avg2(pix2[0], pix3[0]));
|
s += abs(pix1[0] - avg2(pix2[0], pix3[0]));
|
||||||
s += abs(pix1[1] - avg2(pix2[1], pix3[1]));
|
s += abs(pix1[1] - avg2(pix2[1], pix3[1]));
|
||||||
s += abs(pix1[2] - avg2(pix2[2], pix3[2]));
|
s += abs(pix1[2] - avg2(pix2[2], pix3[2]));
|
||||||
@ -2509,13 +2509,13 @@ static int pix_abs8x8_y2_c(uint8_t *pix1, uint8_t *pix2, int line_size)
|
|||||||
return s;
|
return s;
|
||||||
}
|
}
|
||||||
|
|
||||||
static int pix_abs8x8_xy2_c(uint8_t *pix1, uint8_t *pix2, int line_size)
|
static int pix_abs8_xy2_c(void *v, uint8_t *pix1, uint8_t *pix2, int line_size, int h)
|
||||||
{
|
{
|
||||||
int s, i;
|
int s, i;
|
||||||
uint8_t *pix3 = pix2 + line_size;
|
uint8_t *pix3 = pix2 + line_size;
|
||||||
|
|
||||||
s = 0;
|
s = 0;
|
||||||
for(i=0;i<8;i++) {
|
for(i=0;i<h;i++) {
|
||||||
s += abs(pix1[0] - avg4(pix2[0], pix2[1], pix3[0], pix3[1]));
|
s += abs(pix1[0] - avg4(pix2[0], pix2[1], pix3[0], pix3[1]));
|
||||||
s += abs(pix1[1] - avg4(pix2[1], pix2[2], pix3[1], pix3[2]));
|
s += abs(pix1[1] - avg4(pix2[1], pix2[2], pix3[1], pix3[2]));
|
||||||
s += abs(pix1[2] - avg4(pix2[2], pix2[3], pix3[2], pix3[3]));
|
s += abs(pix1[2] - avg4(pix2[2], pix2[3], pix3[2], pix3[3]));
|
||||||
@ -2531,14 +2531,6 @@ static int pix_abs8x8_xy2_c(uint8_t *pix1, uint8_t *pix2, int line_size)
|
|||||||
return s;
|
return s;
|
||||||
}
|
}
|
||||||
|
|
||||||
static int sad16x16_c(void *s, uint8_t *a, uint8_t *b, int stride){
|
|
||||||
return pix_abs16x16_c(a,b,stride);
|
|
||||||
}
|
|
||||||
|
|
||||||
static int sad8x8_c(void *s, uint8_t *a, uint8_t *b, int stride){
|
|
||||||
return pix_abs8x8_c(a,b,stride);
|
|
||||||
}
|
|
||||||
|
|
||||||
/**
|
/**
|
||||||
* permutes an 8x8 block.
|
* permutes an 8x8 block.
|
||||||
* @param block the block which will be permuted according to the given permutation vector
|
* @param block the block which will be permuted according to the given permutation vector
|
||||||
@ -2641,11 +2633,13 @@ o2= (i1)-(i2);
|
|||||||
|
|
||||||
#define BUTTERFLYA(x,y) (ABS((x)+(y)) + ABS((x)-(y)))
|
#define BUTTERFLYA(x,y) (ABS((x)+(y)) + ABS((x)-(y)))
|
||||||
|
|
||||||
static int hadamard8_diff_c(/*MpegEncContext*/ void *s, uint8_t *dst, uint8_t *src, int stride){
|
static int hadamard8_diff8x8_c(/*MpegEncContext*/ void *s, uint8_t *dst, uint8_t *src, int stride, int h){
|
||||||
int i;
|
int i;
|
||||||
int temp[64];
|
int temp[64];
|
||||||
int sum=0;
|
int sum=0;
|
||||||
|
|
||||||
|
assert(h==8);
|
||||||
|
|
||||||
for(i=0; i<8; i++){
|
for(i=0; i<8; i++){
|
||||||
//FIXME try pointer walks
|
//FIXME try pointer walks
|
||||||
BUTTERFLY2(temp[8*i+0], temp[8*i+1], src[stride*i+0]-dst[stride*i+0],src[stride*i+1]-dst[stride*i+1]);
|
BUTTERFLY2(temp[8*i+0], temp[8*i+1], src[stride*i+0]-dst[stride*i+0],src[stride*i+1]-dst[stride*i+1]);
|
||||||
@ -2735,12 +2729,14 @@ static int hadamard8_abs_c(uint8_t *src, int stride, int mean){
|
|||||||
return sum;
|
return sum;
|
||||||
}
|
}
|
||||||
|
|
||||||
static int dct_sad8x8_c(/*MpegEncContext*/ void *c, uint8_t *src1, uint8_t *src2, int stride){
|
static int dct_sad8x8_c(/*MpegEncContext*/ void *c, uint8_t *src1, uint8_t *src2, int stride, int h){
|
||||||
MpegEncContext * const s= (MpegEncContext *)c;
|
MpegEncContext * const s= (MpegEncContext *)c;
|
||||||
uint64_t __align8 aligned_temp[sizeof(DCTELEM)*64/8];
|
uint64_t __align8 aligned_temp[sizeof(DCTELEM)*64/8];
|
||||||
DCTELEM * const temp= (DCTELEM*)aligned_temp;
|
DCTELEM * const temp= (DCTELEM*)aligned_temp;
|
||||||
int sum=0, i;
|
int sum=0, i;
|
||||||
|
|
||||||
|
assert(h==8);
|
||||||
|
|
||||||
s->dsp.diff_pixels(temp, src1, src2, stride);
|
s->dsp.diff_pixels(temp, src1, src2, stride);
|
||||||
s->dsp.fdct(temp);
|
s->dsp.fdct(temp);
|
||||||
|
|
||||||
@ -2752,13 +2748,14 @@ static int dct_sad8x8_c(/*MpegEncContext*/ void *c, uint8_t *src1, uint8_t *src2
|
|||||||
|
|
||||||
void simple_idct(DCTELEM *block); //FIXME
|
void simple_idct(DCTELEM *block); //FIXME
|
||||||
|
|
||||||
static int quant_psnr8x8_c(/*MpegEncContext*/ void *c, uint8_t *src1, uint8_t *src2, int stride){
|
static int quant_psnr8x8_c(/*MpegEncContext*/ void *c, uint8_t *src1, uint8_t *src2, int stride, int h){
|
||||||
MpegEncContext * const s= (MpegEncContext *)c;
|
MpegEncContext * const s= (MpegEncContext *)c;
|
||||||
uint64_t __align8 aligned_temp[sizeof(DCTELEM)*64*2/8];
|
uint64_t __align8 aligned_temp[sizeof(DCTELEM)*64*2/8];
|
||||||
DCTELEM * const temp= (DCTELEM*)aligned_temp;
|
DCTELEM * const temp= (DCTELEM*)aligned_temp;
|
||||||
DCTELEM * const bak = ((DCTELEM*)aligned_temp)+64;
|
DCTELEM * const bak = ((DCTELEM*)aligned_temp)+64;
|
||||||
int sum=0, i;
|
int sum=0, i;
|
||||||
|
|
||||||
|
assert(h==8);
|
||||||
s->mb_intra=0;
|
s->mb_intra=0;
|
||||||
|
|
||||||
s->dsp.diff_pixels(temp, src1, src2, stride);
|
s->dsp.diff_pixels(temp, src1, src2, stride);
|
||||||
@ -2775,7 +2772,7 @@ static int quant_psnr8x8_c(/*MpegEncContext*/ void *c, uint8_t *src1, uint8_t *s
|
|||||||
return sum;
|
return sum;
|
||||||
}
|
}
|
||||||
|
|
||||||
static int rd8x8_c(/*MpegEncContext*/ void *c, uint8_t *src1, uint8_t *src2, int stride){
|
static int rd8x8_c(/*MpegEncContext*/ void *c, uint8_t *src1, uint8_t *src2, int stride, int h){
|
||||||
MpegEncContext * const s= (MpegEncContext *)c;
|
MpegEncContext * const s= (MpegEncContext *)c;
|
||||||
const uint8_t *scantable= s->intra_scantable.permutated;
|
const uint8_t *scantable= s->intra_scantable.permutated;
|
||||||
uint64_t __align8 aligned_temp[sizeof(DCTELEM)*64/8];
|
uint64_t __align8 aligned_temp[sizeof(DCTELEM)*64/8];
|
||||||
@ -2787,6 +2784,8 @@ static int rd8x8_c(/*MpegEncContext*/ void *c, uint8_t *src1, uint8_t *src2, int
|
|||||||
uint8_t * length;
|
uint8_t * length;
|
||||||
uint8_t * last_length;
|
uint8_t * last_length;
|
||||||
|
|
||||||
|
assert(h==8);
|
||||||
|
|
||||||
for(i=0; i<8; i++){
|
for(i=0; i<8; i++){
|
||||||
((uint32_t*)(bak + i*stride))[0]= ((uint32_t*)(src2 + i*stride))[0];
|
((uint32_t*)(bak + i*stride))[0]= ((uint32_t*)(src2 + i*stride))[0];
|
||||||
((uint32_t*)(bak + i*stride))[1]= ((uint32_t*)(src2 + i*stride))[1];
|
((uint32_t*)(bak + i*stride))[1]= ((uint32_t*)(src2 + i*stride))[1];
|
||||||
@ -2847,12 +2846,12 @@ static int rd8x8_c(/*MpegEncContext*/ void *c, uint8_t *src1, uint8_t *src2, int
|
|||||||
|
|
||||||
s->dsp.idct_add(bak, stride, temp);
|
s->dsp.idct_add(bak, stride, temp);
|
||||||
|
|
||||||
distoration= s->dsp.sse[1](NULL, bak, src1, stride);
|
distoration= s->dsp.sse[1](NULL, bak, src1, stride, 8);
|
||||||
|
|
||||||
return distoration + ((bits*s->qscale*s->qscale*109 + 64)>>7);
|
return distoration + ((bits*s->qscale*s->qscale*109 + 64)>>7);
|
||||||
}
|
}
|
||||||
|
|
||||||
static int bit8x8_c(/*MpegEncContext*/ void *c, uint8_t *src1, uint8_t *src2, int stride){
|
static int bit8x8_c(/*MpegEncContext*/ void *c, uint8_t *src1, uint8_t *src2, int stride, int h){
|
||||||
MpegEncContext * const s= (MpegEncContext *)c;
|
MpegEncContext * const s= (MpegEncContext *)c;
|
||||||
const uint8_t *scantable= s->intra_scantable.permutated;
|
const uint8_t *scantable= s->intra_scantable.permutated;
|
||||||
uint64_t __align8 aligned_temp[sizeof(DCTELEM)*64/8];
|
uint64_t __align8 aligned_temp[sizeof(DCTELEM)*64/8];
|
||||||
@ -2862,6 +2861,8 @@ static int bit8x8_c(/*MpegEncContext*/ void *c, uint8_t *src1, uint8_t *src2, in
|
|||||||
uint8_t * length;
|
uint8_t * length;
|
||||||
uint8_t * last_length;
|
uint8_t * last_length;
|
||||||
|
|
||||||
|
assert(h==8);
|
||||||
|
|
||||||
s->dsp.diff_pixels(temp, src1, src2, stride);
|
s->dsp.diff_pixels(temp, src1, src2, stride);
|
||||||
|
|
||||||
s->block_last_index[0/*FIXME*/]= last= s->fast_dct_quantize(s, temp, 0/*FIXME*/, s->qscale, &i);
|
s->block_last_index[0/*FIXME*/]= last= s->fast_dct_quantize(s, temp, 0/*FIXME*/, s->qscale, &i);
|
||||||
@ -2910,12 +2911,11 @@ static int bit8x8_c(/*MpegEncContext*/ void *c, uint8_t *src1, uint8_t *src2, in
|
|||||||
return bits;
|
return bits;
|
||||||
}
|
}
|
||||||
|
|
||||||
|
WARPER8_16_SQ(hadamard8_diff8x8_c, hadamard8_diff16_c)
|
||||||
WARPER88_1616(hadamard8_diff_c, hadamard8_diff16_c)
|
WARPER8_16_SQ(dct_sad8x8_c, dct_sad16_c)
|
||||||
WARPER88_1616(dct_sad8x8_c, dct_sad16x16_c)
|
WARPER8_16_SQ(quant_psnr8x8_c, quant_psnr16_c)
|
||||||
WARPER88_1616(quant_psnr8x8_c, quant_psnr16x16_c)
|
WARPER8_16_SQ(rd8x8_c, rd16_c)
|
||||||
WARPER88_1616(rd8x8_c, rd16x16_c)
|
WARPER8_16_SQ(bit8x8_c, bit16_c)
|
||||||
WARPER88_1616(bit8x8_c, bit16x16_c)
|
|
||||||
|
|
||||||
/* XXX: those functions should be suppressed ASAP when all IDCTs are
|
/* XXX: those functions should be suppressed ASAP when all IDCTs are
|
||||||
converted */
|
converted */
|
||||||
@ -2989,18 +2989,16 @@ void dsputil_init(DSPContext* c, AVCodecContext *avctx)
|
|||||||
c->clear_blocks = clear_blocks_c;
|
c->clear_blocks = clear_blocks_c;
|
||||||
c->pix_sum = pix_sum_c;
|
c->pix_sum = pix_sum_c;
|
||||||
c->pix_norm1 = pix_norm1_c;
|
c->pix_norm1 = pix_norm1_c;
|
||||||
c->sse[0]= sse16_c;
|
|
||||||
c->sse[1]= sse8_c;
|
|
||||||
|
|
||||||
/* TODO [0] 16 [1] 8 */
|
/* TODO [0] 16 [1] 8 */
|
||||||
c->pix_abs16x16 = pix_abs16x16_c;
|
c->pix_abs[0][0] = pix_abs16_c;
|
||||||
c->pix_abs16x16_x2 = pix_abs16x16_x2_c;
|
c->pix_abs[0][1] = pix_abs16_x2_c;
|
||||||
c->pix_abs16x16_y2 = pix_abs16x16_y2_c;
|
c->pix_abs[0][2] = pix_abs16_y2_c;
|
||||||
c->pix_abs16x16_xy2 = pix_abs16x16_xy2_c;
|
c->pix_abs[0][3] = pix_abs16_xy2_c;
|
||||||
c->pix_abs8x8 = pix_abs8x8_c;
|
c->pix_abs[1][0] = pix_abs8_c;
|
||||||
c->pix_abs8x8_x2 = pix_abs8x8_x2_c;
|
c->pix_abs[1][1] = pix_abs8_x2_c;
|
||||||
c->pix_abs8x8_y2 = pix_abs8x8_y2_c;
|
c->pix_abs[1][2] = pix_abs8_y2_c;
|
||||||
c->pix_abs8x8_xy2 = pix_abs8x8_xy2_c;
|
c->pix_abs[1][3] = pix_abs8_xy2_c;
|
||||||
|
|
||||||
#define dspfunc(PFX, IDX, NUM) \
|
#define dspfunc(PFX, IDX, NUM) \
|
||||||
c->PFX ## _pixels_tab[IDX][0] = PFX ## _pixels ## NUM ## _c; \
|
c->PFX ## _pixels_tab[IDX][0] = PFX ## _pixels ## NUM ## _c; \
|
||||||
@ -3097,24 +3095,21 @@ void dsputil_init(DSPContext* c, AVCodecContext *avctx)
|
|||||||
c->put_mspel_pixels_tab[6]= put_mspel8_mc22_c;
|
c->put_mspel_pixels_tab[6]= put_mspel8_mc22_c;
|
||||||
c->put_mspel_pixels_tab[7]= put_mspel8_mc32_c;
|
c->put_mspel_pixels_tab[7]= put_mspel8_mc32_c;
|
||||||
|
|
||||||
c->hadamard8_diff[0]= hadamard8_diff16_c;
|
|
||||||
c->hadamard8_diff[1]= hadamard8_diff_c;
|
|
||||||
c->hadamard8_abs = hadamard8_abs_c;
|
c->hadamard8_abs = hadamard8_abs_c;
|
||||||
|
|
||||||
c->dct_sad[0]= dct_sad16x16_c;
|
#define SET_CMP_FUNC(name) \
|
||||||
c->dct_sad[1]= dct_sad8x8_c;
|
c->name[0]= name ## 16_c;\
|
||||||
|
c->name[1]= name ## 8x8_c;
|
||||||
|
|
||||||
c->sad[0]= sad16x16_c;
|
SET_CMP_FUNC(hadamard8_diff)
|
||||||
c->sad[1]= sad8x8_c;
|
SET_CMP_FUNC(dct_sad)
|
||||||
|
c->sad[0]= pix_abs16_c;
|
||||||
c->quant_psnr[0]= quant_psnr16x16_c;
|
c->sad[1]= pix_abs8_c;
|
||||||
c->quant_psnr[1]= quant_psnr8x8_c;
|
c->sse[0]= sse16_c;
|
||||||
|
c->sse[1]= sse8_c;
|
||||||
c->rd[0]= rd16x16_c;
|
SET_CMP_FUNC(quant_psnr)
|
||||||
c->rd[1]= rd8x8_c;
|
SET_CMP_FUNC(rd)
|
||||||
|
SET_CMP_FUNC(bit)
|
||||||
c->bit[0]= bit16x16_c;
|
|
||||||
c->bit[1]= bit8x8_c;
|
|
||||||
|
|
||||||
c->add_bytes= add_bytes_c;
|
c->add_bytes= add_bytes_c;
|
||||||
c->diff_bytes= diff_bytes_c;
|
c->diff_bytes= diff_bytes_c;
|
||||||
|
@ -110,9 +110,7 @@ static void a(uint8_t *block, const uint8_t *pixels, int line_size, int h){\
|
|||||||
|
|
||||||
/* motion estimation */
|
/* motion estimation */
|
||||||
|
|
||||||
typedef int (*op_pixels_abs_func)(uint8_t *blk1/*align width (8 or 16)*/, uint8_t *blk2/*align 1*/, int line_size)/* __attribute__ ((const))*/;
|
typedef int (*me_cmp_func)(void /*MpegEncContext*/ *s, uint8_t *blk1/*align width (8 or 16)*/, uint8_t *blk2/*align 1*/, int line_size, int h)/* __attribute__ ((const))*/;
|
||||||
|
|
||||||
typedef int (*me_cmp_func)(void /*MpegEncContext*/ *s, uint8_t *blk1/*align width (8 or 16)*/, uint8_t *blk2/*align 1*/, int line_size)/* __attribute__ ((const))*/;
|
|
||||||
|
|
||||||
|
|
||||||
/**
|
/**
|
||||||
@ -136,19 +134,21 @@ typedef struct DSPContext {
|
|||||||
void (*clear_blocks)(DCTELEM *blocks/*align 16*/);
|
void (*clear_blocks)(DCTELEM *blocks/*align 16*/);
|
||||||
int (*pix_sum)(uint8_t * pix, int line_size);
|
int (*pix_sum)(uint8_t * pix, int line_size);
|
||||||
int (*pix_norm1)(uint8_t * pix, int line_size);
|
int (*pix_norm1)(uint8_t * pix, int line_size);
|
||||||
me_cmp_func sad[2]; /* identical to pix_absAxA except additional void * */
|
// 16x16 8x8 4x4 2x2 16x8 8x4 4x2 8x16 4x8 2x4
|
||||||
me_cmp_func sse[2];
|
|
||||||
me_cmp_func hadamard8_diff[2];
|
me_cmp_func sad[4]; /* identical to pix_absAxA except additional void * */
|
||||||
me_cmp_func dct_sad[2];
|
me_cmp_func sse[4];
|
||||||
me_cmp_func quant_psnr[2];
|
me_cmp_func hadamard8_diff[4];
|
||||||
me_cmp_func bit[2];
|
me_cmp_func dct_sad[4];
|
||||||
me_cmp_func rd[2];
|
me_cmp_func quant_psnr[4];
|
||||||
|
me_cmp_func bit[4];
|
||||||
|
me_cmp_func rd[4];
|
||||||
int (*hadamard8_abs )(uint8_t *src, int stride, int mean);
|
int (*hadamard8_abs )(uint8_t *src, int stride, int mean);
|
||||||
|
|
||||||
me_cmp_func me_pre_cmp[11];
|
me_cmp_func me_pre_cmp[5];
|
||||||
me_cmp_func me_cmp[11];
|
me_cmp_func me_cmp[5];
|
||||||
me_cmp_func me_sub_cmp[11];
|
me_cmp_func me_sub_cmp[5];
|
||||||
me_cmp_func mb_cmp[11];
|
me_cmp_func mb_cmp[5];
|
||||||
|
|
||||||
/* maybe create an array for 16/8/4/2 functions */
|
/* maybe create an array for 16/8/4/2 functions */
|
||||||
/**
|
/**
|
||||||
@ -226,14 +226,7 @@ typedef struct DSPContext {
|
|||||||
qpel_mc_func put_h264_qpel_pixels_tab[3][16];
|
qpel_mc_func put_h264_qpel_pixels_tab[3][16];
|
||||||
qpel_mc_func avg_h264_qpel_pixels_tab[3][16];
|
qpel_mc_func avg_h264_qpel_pixels_tab[3][16];
|
||||||
|
|
||||||
op_pixels_abs_func pix_abs16x16;
|
me_cmp_func pix_abs[2][4];
|
||||||
op_pixels_abs_func pix_abs16x16_x2;
|
|
||||||
op_pixels_abs_func pix_abs16x16_y2;
|
|
||||||
op_pixels_abs_func pix_abs16x16_xy2;
|
|
||||||
op_pixels_abs_func pix_abs8x8;
|
|
||||||
op_pixels_abs_func pix_abs8x8_x2;
|
|
||||||
op_pixels_abs_func pix_abs8x8_y2;
|
|
||||||
op_pixels_abs_func pix_abs8x8_xy2;
|
|
||||||
|
|
||||||
/* huffyuv specific */
|
/* huffyuv specific */
|
||||||
void (*add_bytes)(uint8_t *dst/*align 16*/, uint8_t *src/*align 16*/, int w);
|
void (*add_bytes)(uint8_t *dst/*align 16*/, uint8_t *src/*align 16*/, int w);
|
||||||
@ -484,12 +477,24 @@ void ff_mdct_calc(MDCTContext *s, FFTSample *out,
|
|||||||
const FFTSample *input, FFTSample *tmp);
|
const FFTSample *input, FFTSample *tmp);
|
||||||
void ff_mdct_end(MDCTContext *s);
|
void ff_mdct_end(MDCTContext *s);
|
||||||
|
|
||||||
#define WARPER88_1616(name8, name16)\
|
#define WARPER8_16(name8, name16)\
|
||||||
static int name16(void /*MpegEncContext*/ *s, uint8_t *dst, uint8_t *src, int stride){\
|
static int name16(void /*MpegEncContext*/ *s, uint8_t *dst, uint8_t *src, int stride, int h){\
|
||||||
return name8(s, dst , src , stride)\
|
return name8(s, dst , src , stride, h)\
|
||||||
+name8(s, dst+8 , src+8 , stride)\
|
+name8(s, dst+8 , src+8 , stride, h);\
|
||||||
+name8(s, dst +8*stride, src +8*stride, stride)\
|
}
|
||||||
+name8(s, dst+8+8*stride, src+8+8*stride, stride);\
|
|
||||||
|
#define WARPER8_16_SQ(name8, name16)\
|
||||||
|
static int name16(void /*MpegEncContext*/ *s, uint8_t *dst, uint8_t *src, int stride, int h){\
|
||||||
|
int score=0;\
|
||||||
|
score +=name8(s, dst , src , stride, 8);\
|
||||||
|
score +=name8(s, dst+8 , src+8 , stride, 8);\
|
||||||
|
if(h==16){\
|
||||||
|
dst += 8*stride;\
|
||||||
|
src += 8*stride;\
|
||||||
|
score +=name8(s, dst , src , stride, 8);\
|
||||||
|
score +=name8(s, dst+8 , src+8 , stride, 8);\
|
||||||
|
}\
|
||||||
|
return score;\
|
||||||
}
|
}
|
||||||
|
|
||||||
#ifndef HAVE_LRINTF
|
#ifndef HAVE_LRINTF
|
||||||
|
@ -582,8 +582,8 @@ static int is_intra_more_likely(MpegEncContext *s){
|
|||||||
uint8_t *mb_ptr = s->current_picture.data[0] + mb_x*16 + mb_y*16*s->linesize;
|
uint8_t *mb_ptr = s->current_picture.data[0] + mb_x*16 + mb_y*16*s->linesize;
|
||||||
uint8_t *last_mb_ptr= s->last_picture.data [0] + mb_x*16 + mb_y*16*s->linesize;
|
uint8_t *last_mb_ptr= s->last_picture.data [0] + mb_x*16 + mb_y*16*s->linesize;
|
||||||
|
|
||||||
is_intra_likely += s->dsp.pix_abs16x16(last_mb_ptr, mb_ptr , s->linesize);
|
is_intra_likely += s->dsp.sad[0](NULL, last_mb_ptr, mb_ptr , s->linesize, 16);
|
||||||
is_intra_likely -= s->dsp.pix_abs16x16(last_mb_ptr, last_mb_ptr+s->linesize*16, s->linesize);
|
is_intra_likely -= s->dsp.sad[0](NULL, last_mb_ptr, last_mb_ptr+s->linesize*16, s->linesize, 16);
|
||||||
}else{
|
}else{
|
||||||
if(IS_INTRA(s->current_picture.mb_type[mb_xy]))
|
if(IS_INTRA(s->current_picture.mb_type[mb_xy]))
|
||||||
is_intra_likely++;
|
is_intra_likely++;
|
||||||
|
@ -479,9 +479,9 @@ void ff_clean_mpeg4_qscales(MpegEncContext *s){
|
|||||||
for(i=1; i<s->mb_num; i++){
|
for(i=1; i<s->mb_num; i++){
|
||||||
int mb_xy= s->mb_index2xy[i];
|
int mb_xy= s->mb_index2xy[i];
|
||||||
|
|
||||||
if(qscale_table[mb_xy] != qscale_table[s->mb_index2xy[i-1]] && (s->mb_type[mb_xy]&MB_TYPE_INTER4V)){
|
if(qscale_table[mb_xy] != qscale_table[s->mb_index2xy[i-1]] && (s->mb_type[mb_xy]&CANDIDATE_MB_TYPE_INTER4V)){
|
||||||
s->mb_type[mb_xy]&= ~MB_TYPE_INTER4V;
|
s->mb_type[mb_xy]&= ~CANDIDATE_MB_TYPE_INTER4V;
|
||||||
s->mb_type[mb_xy]|= MB_TYPE_INTER;
|
s->mb_type[mb_xy]|= CANDIDATE_MB_TYPE_INTER;
|
||||||
}
|
}
|
||||||
}
|
}
|
||||||
|
|
||||||
@ -508,9 +508,9 @@ void ff_clean_mpeg4_qscales(MpegEncContext *s){
|
|||||||
|
|
||||||
for(i=1; i<s->mb_num; i++){
|
for(i=1; i<s->mb_num; i++){
|
||||||
int mb_xy= s->mb_index2xy[i];
|
int mb_xy= s->mb_index2xy[i];
|
||||||
if(qscale_table[mb_xy] != qscale_table[s->mb_index2xy[i-1]] && (s->mb_type[mb_xy]&MB_TYPE_DIRECT)){
|
if(qscale_table[mb_xy] != qscale_table[s->mb_index2xy[i-1]] && (s->mb_type[mb_xy]&CANDIDATE_MB_TYPE_DIRECT)){
|
||||||
s->mb_type[mb_xy]&= ~MB_TYPE_DIRECT;
|
s->mb_type[mb_xy]&= ~CANDIDATE_MB_TYPE_DIRECT;
|
||||||
s->mb_type[mb_xy]|= MB_TYPE_BIDIR;
|
s->mb_type[mb_xy]|= CANDIDATE_MB_TYPE_BIDIR;
|
||||||
}
|
}
|
||||||
}
|
}
|
||||||
}
|
}
|
||||||
@ -523,7 +523,7 @@ void ff_clean_mpeg4_qscales(MpegEncContext *s){
|
|||||||
*/
|
*/
|
||||||
int ff_mpeg4_set_direct_mv(MpegEncContext *s, int mx, int my){
|
int ff_mpeg4_set_direct_mv(MpegEncContext *s, int mx, int my){
|
||||||
const int mb_index= s->mb_x + s->mb_y*s->mb_stride;
|
const int mb_index= s->mb_x + s->mb_y*s->mb_stride;
|
||||||
const int colocated_mb_type= s->next_picture.mb_type[mb_index]; //FIXME or next?
|
const int colocated_mb_type= s->next_picture.mb_type[mb_index];
|
||||||
int xy= s->block_index[0];
|
int xy= s->block_index[0];
|
||||||
uint16_t time_pp= s->pp_time;
|
uint16_t time_pp= s->pp_time;
|
||||||
uint16_t time_pb= s->pb_time;
|
uint16_t time_pb= s->pb_time;
|
||||||
@ -547,18 +547,18 @@ int ff_mpeg4_set_direct_mv(MpegEncContext *s, int mx, int my){
|
|||||||
s->mv_type = MV_TYPE_FIELD;
|
s->mv_type = MV_TYPE_FIELD;
|
||||||
for(i=0; i<2; i++){
|
for(i=0; i<2; i++){
|
||||||
if(s->top_field_first){
|
if(s->top_field_first){
|
||||||
time_pp= s->pp_field_time - s->field_select_table[mb_index][i] + i;
|
time_pp= s->pp_field_time - s->p_field_select_table[i][mb_index] + i;
|
||||||
time_pb= s->pb_field_time - s->field_select_table[mb_index][i] + i;
|
time_pb= s->pb_field_time - s->p_field_select_table[i][mb_index] + i;
|
||||||
}else{
|
}else{
|
||||||
time_pp= s->pp_field_time + s->field_select_table[mb_index][i] - i;
|
time_pp= s->pp_field_time + s->p_field_select_table[i][mb_index] - i;
|
||||||
time_pb= s->pb_field_time + s->field_select_table[mb_index][i] - i;
|
time_pb= s->pb_field_time + s->p_field_select_table[i][mb_index] - i;
|
||||||
}
|
}
|
||||||
s->mv[0][i][0] = s->field_mv_table[mb_index][i][0]*time_pb/time_pp + mx;
|
s->mv[0][i][0] = s->p_field_mv_table[i][0][mb_index][0]*time_pb/time_pp + mx;
|
||||||
s->mv[0][i][1] = s->field_mv_table[mb_index][i][1]*time_pb/time_pp + my;
|
s->mv[0][i][1] = s->p_field_mv_table[i][0][mb_index][1]*time_pb/time_pp + my;
|
||||||
s->mv[1][i][0] = mx ? s->mv[0][i][0] - s->field_mv_table[mb_index][i][0]
|
s->mv[1][i][0] = mx ? s->mv[0][i][0] - s->p_field_mv_table[i][0][mb_index][0]
|
||||||
: s->field_mv_table[mb_index][i][0]*(time_pb - time_pp)/time_pp;
|
: s->p_field_mv_table[i][0][mb_index][0]*(time_pb - time_pp)/time_pp;
|
||||||
s->mv[1][i][1] = my ? s->mv[0][i][1] - s->field_mv_table[mb_index][i][1]
|
s->mv[1][i][1] = my ? s->mv[0][i][1] - s->p_field_mv_table[i][0][mb_index][1]
|
||||||
: s->field_mv_table[mb_index][i][1]*(time_pb - time_pp)/time_pp;
|
: s->p_field_mv_table[i][0][mb_index][1]*(time_pb - time_pp)/time_pp;
|
||||||
}
|
}
|
||||||
return MB_TYPE_DIRECT2 | MB_TYPE_16x8 | MB_TYPE_L0L1 | MB_TYPE_INTERLACED;
|
return MB_TYPE_DIRECT2 | MB_TYPE_16x8 | MB_TYPE_L0L1 | MB_TYPE_INTERLACED;
|
||||||
}else{
|
}else{
|
||||||
@ -598,9 +598,9 @@ void ff_h263_update_motion_val(MpegEncContext * s){
|
|||||||
motion_y = s->mv[0][0][1] + s->mv[0][1][1];
|
motion_y = s->mv[0][0][1] + s->mv[0][1][1];
|
||||||
motion_x = (motion_x>>1) | (motion_x&1);
|
motion_x = (motion_x>>1) | (motion_x&1);
|
||||||
for(i=0; i<2; i++){
|
for(i=0; i<2; i++){
|
||||||
s->field_mv_table[mb_xy][i][0]= s->mv[0][i][0];
|
s->p_field_mv_table[i][0][mb_xy][0]= s->mv[0][i][0];
|
||||||
s->field_mv_table[mb_xy][i][1]= s->mv[0][i][1];
|
s->p_field_mv_table[i][0][mb_xy][1]= s->mv[0][i][1];
|
||||||
s->field_select_table[mb_xy][i]= s->field_select[0][i];
|
s->p_field_select_table[i][mb_xy]= s->field_select[0][i];
|
||||||
}
|
}
|
||||||
}
|
}
|
||||||
|
|
||||||
@ -746,10 +746,12 @@ void mpeg4_encode_mb(MpegEncContext * s,
|
|||||||
int mb_type= mb_type_table[s->mv_dir];
|
int mb_type= mb_type_table[s->mv_dir];
|
||||||
|
|
||||||
if(s->mb_x==0){
|
if(s->mb_x==0){
|
||||||
s->last_mv[0][0][0]=
|
for(i=0; i<2; i++){
|
||||||
s->last_mv[0][0][1]=
|
s->last_mv[i][0][0]=
|
||||||
s->last_mv[1][0][0]=
|
s->last_mv[i][0][1]=
|
||||||
s->last_mv[1][0][1]= 0;
|
s->last_mv[i][1][0]=
|
||||||
|
s->last_mv[i][1][1]= 0;
|
||||||
|
}
|
||||||
}
|
}
|
||||||
|
|
||||||
assert(s->dquant>=-2 && s->dquant<=2);
|
assert(s->dquant>=-2 && s->dquant<=2);
|
||||||
@ -803,50 +805,64 @@ void mpeg4_encode_mb(MpegEncContext * s,
|
|||||||
if(cbp)
|
if(cbp)
|
||||||
put_bits(&s->pb, 1, s->interlaced_dct);
|
put_bits(&s->pb, 1, s->interlaced_dct);
|
||||||
if(mb_type) // not diect mode
|
if(mb_type) // not diect mode
|
||||||
put_bits(&s->pb, 1, 0); // no interlaced ME yet
|
put_bits(&s->pb, 1, s->mv_type == MV_TYPE_FIELD);
|
||||||
}
|
}
|
||||||
|
|
||||||
if(interleaved_stats){
|
if(interleaved_stats){
|
||||||
s->misc_bits+= get_bits_diff(s);
|
s->misc_bits+= get_bits_diff(s);
|
||||||
}
|
}
|
||||||
|
|
||||||
switch(mb_type)
|
if(mb_type == 0){
|
||||||
{
|
assert(s->mv_dir & MV_DIRECT);
|
||||||
case 0: /* direct */
|
|
||||||
h263_encode_motion(s, motion_x, 1);
|
h263_encode_motion(s, motion_x, 1);
|
||||||
h263_encode_motion(s, motion_y, 1);
|
h263_encode_motion(s, motion_y, 1);
|
||||||
s->b_count++;
|
s->b_count++;
|
||||||
s->f_count++;
|
s->f_count++;
|
||||||
break;
|
}else{
|
||||||
case 1: /* bidir */
|
assert(mb_type > 0 && mb_type < 4);
|
||||||
h263_encode_motion(s, s->mv[0][0][0] - s->last_mv[0][0][0], s->f_code);
|
if(s->mv_type != MV_TYPE_FIELD){
|
||||||
h263_encode_motion(s, s->mv[0][0][1] - s->last_mv[0][0][1], s->f_code);
|
if(s->mv_dir & MV_DIR_FORWARD){
|
||||||
h263_encode_motion(s, s->mv[1][0][0] - s->last_mv[1][0][0], s->b_code);
|
h263_encode_motion(s, s->mv[0][0][0] - s->last_mv[0][0][0], s->f_code);
|
||||||
h263_encode_motion(s, s->mv[1][0][1] - s->last_mv[1][0][1], s->b_code);
|
h263_encode_motion(s, s->mv[0][0][1] - s->last_mv[0][0][1], s->f_code);
|
||||||
s->last_mv[0][0][0]= s->mv[0][0][0];
|
s->last_mv[0][0][0]= s->last_mv[0][1][0]= s->mv[0][0][0];
|
||||||
s->last_mv[0][0][1]= s->mv[0][0][1];
|
s->last_mv[0][0][1]= s->last_mv[0][1][1]= s->mv[0][0][1];
|
||||||
s->last_mv[1][0][0]= s->mv[1][0][0];
|
s->f_count++;
|
||||||
s->last_mv[1][0][1]= s->mv[1][0][1];
|
}
|
||||||
s->b_count++;
|
if(s->mv_dir & MV_DIR_BACKWARD){
|
||||||
s->f_count++;
|
h263_encode_motion(s, s->mv[1][0][0] - s->last_mv[1][0][0], s->b_code);
|
||||||
break;
|
h263_encode_motion(s, s->mv[1][0][1] - s->last_mv[1][0][1], s->b_code);
|
||||||
case 2: /* backward */
|
s->last_mv[1][0][0]= s->last_mv[1][1][0]= s->mv[1][0][0];
|
||||||
h263_encode_motion(s, motion_x - s->last_mv[1][0][0], s->b_code);
|
s->last_mv[1][0][1]= s->last_mv[1][1][1]= s->mv[1][0][1];
|
||||||
h263_encode_motion(s, motion_y - s->last_mv[1][0][1], s->b_code);
|
s->b_count++;
|
||||||
s->last_mv[1][0][0]= motion_x;
|
}
|
||||||
s->last_mv[1][0][1]= motion_y;
|
}else{
|
||||||
s->b_count++;
|
if(s->mv_dir & MV_DIR_FORWARD){
|
||||||
break;
|
put_bits(&s->pb, 1, s->field_select[0][0]);
|
||||||
case 3: /* forward */
|
put_bits(&s->pb, 1, s->field_select[0][1]);
|
||||||
h263_encode_motion(s, motion_x - s->last_mv[0][0][0], s->f_code);
|
}
|
||||||
h263_encode_motion(s, motion_y - s->last_mv[0][0][1], s->f_code);
|
if(s->mv_dir & MV_DIR_BACKWARD){
|
||||||
s->last_mv[0][0][0]= motion_x;
|
put_bits(&s->pb, 1, s->field_select[1][0]);
|
||||||
s->last_mv[0][0][1]= motion_y;
|
put_bits(&s->pb, 1, s->field_select[1][1]);
|
||||||
s->f_count++;
|
}
|
||||||
break;
|
if(s->mv_dir & MV_DIR_FORWARD){
|
||||||
default:
|
for(i=0; i<2; i++){
|
||||||
av_log(s->avctx, AV_LOG_ERROR, "unknown mb type\n");
|
h263_encode_motion(s, s->mv[0][i][0] - s->last_mv[0][i][0] , s->f_code);
|
||||||
return;
|
h263_encode_motion(s, s->mv[0][i][1] - s->last_mv[0][i][1]/2, s->f_code);
|
||||||
|
s->last_mv[0][i][0]= s->mv[0][i][0];
|
||||||
|
s->last_mv[0][i][1]= s->mv[0][i][1]*2;
|
||||||
|
}
|
||||||
|
s->f_count++;
|
||||||
|
}
|
||||||
|
if(s->mv_dir & MV_DIR_BACKWARD){
|
||||||
|
for(i=0; i<2; i++){
|
||||||
|
h263_encode_motion(s, s->mv[1][i][0] - s->last_mv[1][i][0] , s->b_code);
|
||||||
|
h263_encode_motion(s, s->mv[1][i][1] - s->last_mv[1][i][1]/2, s->b_code);
|
||||||
|
s->last_mv[1][i][0]= s->mv[1][i][0];
|
||||||
|
s->last_mv[1][i][1]= s->mv[1][i][1]*2;
|
||||||
|
}
|
||||||
|
s->b_count++;
|
||||||
|
}
|
||||||
|
}
|
||||||
}
|
}
|
||||||
|
|
||||||
if(interleaved_stats){
|
if(interleaved_stats){
|
||||||
@ -861,6 +877,7 @@ void mpeg4_encode_mb(MpegEncContext * s,
|
|||||||
if(interleaved_stats){
|
if(interleaved_stats){
|
||||||
s->p_tex_bits+= get_bits_diff(s);
|
s->p_tex_bits+= get_bits_diff(s);
|
||||||
}
|
}
|
||||||
|
|
||||||
}else{ /* s->pict_type==B_TYPE */
|
}else{ /* s->pict_type==B_TYPE */
|
||||||
cbp= get_p_cbp(s, block, motion_x, motion_y);
|
cbp= get_p_cbp(s, block, motion_x, motion_y);
|
||||||
|
|
||||||
@ -889,7 +906,7 @@ void mpeg4_encode_mb(MpegEncContext * s,
|
|||||||
if(pic==NULL || pic->pict_type!=B_TYPE) break;
|
if(pic==NULL || pic->pict_type!=B_TYPE) break;
|
||||||
|
|
||||||
b_pic= pic->data[0] + offset + 16; //FIXME +16
|
b_pic= pic->data[0] + offset + 16; //FIXME +16
|
||||||
diff= s->dsp.pix_abs16x16(p_pic, b_pic, s->linesize);
|
diff= s->dsp.sad[0](NULL, p_pic, b_pic, s->linesize, 16);
|
||||||
if(diff>s->qscale*70){ //FIXME check that 70 is optimal
|
if(diff>s->qscale*70){ //FIXME check that 70 is optimal
|
||||||
s->mb_skiped=0;
|
s->mb_skiped=0;
|
||||||
break;
|
break;
|
||||||
@ -929,7 +946,7 @@ void mpeg4_encode_mb(MpegEncContext * s,
|
|||||||
if(!s->progressive_sequence){
|
if(!s->progressive_sequence){
|
||||||
if(cbp)
|
if(cbp)
|
||||||
put_bits(pb2, 1, s->interlaced_dct);
|
put_bits(pb2, 1, s->interlaced_dct);
|
||||||
put_bits(pb2, 1, 0); // no interlaced ME yet
|
put_bits(pb2, 1, 0);
|
||||||
}
|
}
|
||||||
|
|
||||||
if(interleaved_stats){
|
if(interleaved_stats){
|
||||||
@ -941,7 +958,38 @@ void mpeg4_encode_mb(MpegEncContext * s,
|
|||||||
|
|
||||||
h263_encode_motion(s, motion_x - pred_x, s->f_code);
|
h263_encode_motion(s, motion_x - pred_x, s->f_code);
|
||||||
h263_encode_motion(s, motion_y - pred_y, s->f_code);
|
h263_encode_motion(s, motion_y - pred_y, s->f_code);
|
||||||
|
}else if(s->mv_type==MV_TYPE_FIELD){
|
||||||
|
if(s->dquant) cbpc+= 8;
|
||||||
|
put_bits(&s->pb,
|
||||||
|
inter_MCBPC_bits[cbpc],
|
||||||
|
inter_MCBPC_code[cbpc]);
|
||||||
|
|
||||||
|
put_bits(pb2, cbpy_tab[cbpy][1], cbpy_tab[cbpy][0]);
|
||||||
|
if(s->dquant)
|
||||||
|
put_bits(pb2, 2, dquant_code[s->dquant+2]);
|
||||||
|
|
||||||
|
assert(!s->progressive_sequence);
|
||||||
|
if(cbp)
|
||||||
|
put_bits(pb2, 1, s->interlaced_dct);
|
||||||
|
put_bits(pb2, 1, 1);
|
||||||
|
|
||||||
|
if(interleaved_stats){
|
||||||
|
s->misc_bits+= get_bits_diff(s);
|
||||||
|
}
|
||||||
|
|
||||||
|
/* motion vectors: 16x8 interlaced mode */
|
||||||
|
h263_pred_motion(s, 0, &pred_x, &pred_y);
|
||||||
|
pred_y /=2;
|
||||||
|
|
||||||
|
put_bits(&s->pb, 1, s->field_select[0][0]);
|
||||||
|
put_bits(&s->pb, 1, s->field_select[0][1]);
|
||||||
|
|
||||||
|
h263_encode_motion(s, s->mv[0][0][0] - pred_x, s->f_code);
|
||||||
|
h263_encode_motion(s, s->mv[0][0][1] - pred_y, s->f_code);
|
||||||
|
h263_encode_motion(s, s->mv[0][1][0] - pred_x, s->f_code);
|
||||||
|
h263_encode_motion(s, s->mv[0][1][1] - pred_y, s->f_code);
|
||||||
}else{
|
}else{
|
||||||
|
assert(s->mv_type==MV_TYPE_8X8);
|
||||||
put_bits(&s->pb,
|
put_bits(&s->pb,
|
||||||
inter_MCBPC_bits[cbpc+16],
|
inter_MCBPC_bits[cbpc+16],
|
||||||
inter_MCBPC_code[cbpc+16]);
|
inter_MCBPC_code[cbpc+16]);
|
||||||
|
@ -61,8 +61,8 @@ static const int h263_mb_type_b_map[15]= {
|
|||||||
MB_TYPE_L0L1 | MB_TYPE_CBP | MB_TYPE_16x16,
|
MB_TYPE_L0L1 | MB_TYPE_CBP | MB_TYPE_16x16,
|
||||||
MB_TYPE_L0L1 | MB_TYPE_CBP | MB_TYPE_QUANT | MB_TYPE_16x16,
|
MB_TYPE_L0L1 | MB_TYPE_CBP | MB_TYPE_QUANT | MB_TYPE_16x16,
|
||||||
0, //stuffing
|
0, //stuffing
|
||||||
MB_TYPE_INTRA | MB_TYPE_CBP,
|
MB_TYPE_INTRA4x4 | MB_TYPE_CBP,
|
||||||
MB_TYPE_INTRA | MB_TYPE_CBP | MB_TYPE_QUANT,
|
MB_TYPE_INTRA4x4 | MB_TYPE_CBP | MB_TYPE_QUANT,
|
||||||
};
|
};
|
||||||
|
|
||||||
const uint8_t cbpc_b_tab[4][2] = {
|
const uint8_t cbpc_b_tab[4][2] = {
|
||||||
|
@ -687,10 +687,10 @@ static int pix_norm1_mmx(uint8_t *pix, int line_size) {
|
|||||||
return tmp;
|
return tmp;
|
||||||
}
|
}
|
||||||
|
|
||||||
static int sse16_mmx(void *v, uint8_t * pix1, uint8_t * pix2, int line_size) {
|
static int sse16_mmx(void *v, uint8_t * pix1, uint8_t * pix2, int line_size, int h) {
|
||||||
int tmp;
|
int tmp;
|
||||||
asm volatile (
|
asm volatile (
|
||||||
"movl $16,%%ecx\n"
|
"movl %4,%%ecx\n"
|
||||||
"pxor %%mm0,%%mm0\n" /* mm0 = 0 */
|
"pxor %%mm0,%%mm0\n" /* mm0 = 0 */
|
||||||
"pxor %%mm7,%%mm7\n" /* mm7 holds the sum */
|
"pxor %%mm7,%%mm7\n" /* mm7 holds the sum */
|
||||||
"1:\n"
|
"1:\n"
|
||||||
@ -741,7 +741,9 @@ static int sse16_mmx(void *v, uint8_t * pix1, uint8_t * pix2, int line_size) {
|
|||||||
"psrlq $32, %%mm7\n" /* shift hi dword to lo */
|
"psrlq $32, %%mm7\n" /* shift hi dword to lo */
|
||||||
"paddd %%mm7,%%mm1\n"
|
"paddd %%mm7,%%mm1\n"
|
||||||
"movd %%mm1,%2\n"
|
"movd %%mm1,%2\n"
|
||||||
: "+r" (pix1), "+r" (pix2), "=r"(tmp) : "r" (line_size) : "%ecx");
|
: "+r" (pix1), "+r" (pix2), "=r"(tmp)
|
||||||
|
: "r" (line_size) , "m" (h)
|
||||||
|
: "%ecx");
|
||||||
return tmp;
|
return tmp;
|
||||||
}
|
}
|
||||||
|
|
||||||
@ -866,10 +868,12 @@ static void sub_hfyu_median_prediction_mmx2(uint8_t *dst, uint8_t *src1, uint8_t
|
|||||||
"movq "#c", "#o"+32(%1) \n\t"\
|
"movq "#c", "#o"+32(%1) \n\t"\
|
||||||
"movq "#d", "#o"+48(%1) \n\t"\
|
"movq "#d", "#o"+48(%1) \n\t"\
|
||||||
|
|
||||||
static int hadamard8_diff_mmx(void *s, uint8_t *src1, uint8_t *src2, int stride){
|
static int hadamard8_diff_mmx(void *s, uint8_t *src1, uint8_t *src2, int stride, int h){
|
||||||
uint64_t temp[16] __align8;
|
uint64_t temp[16] __align8;
|
||||||
int sum=0;
|
int sum=0;
|
||||||
|
|
||||||
|
assert(h==8);
|
||||||
|
|
||||||
diff_pixels_mmx((DCTELEM*)temp, src1, src2, stride);
|
diff_pixels_mmx((DCTELEM*)temp, src1, src2, stride);
|
||||||
|
|
||||||
asm volatile(
|
asm volatile(
|
||||||
@ -951,10 +955,12 @@ static int hadamard8_diff_mmx(void *s, uint8_t *src1, uint8_t *src2, int stride)
|
|||||||
return sum&0xFFFF;
|
return sum&0xFFFF;
|
||||||
}
|
}
|
||||||
|
|
||||||
static int hadamard8_diff_mmx2(void *s, uint8_t *src1, uint8_t *src2, int stride){
|
static int hadamard8_diff_mmx2(void *s, uint8_t *src1, uint8_t *src2, int stride, int h){
|
||||||
uint64_t temp[16] __align8;
|
uint64_t temp[16] __align8;
|
||||||
int sum=0;
|
int sum=0;
|
||||||
|
|
||||||
|
assert(h==8);
|
||||||
|
|
||||||
diff_pixels_mmx((DCTELEM*)temp, src1, src2, stride);
|
diff_pixels_mmx((DCTELEM*)temp, src1, src2, stride);
|
||||||
|
|
||||||
asm volatile(
|
asm volatile(
|
||||||
@ -1037,8 +1043,8 @@ static int hadamard8_diff_mmx2(void *s, uint8_t *src1, uint8_t *src2, int stride
|
|||||||
}
|
}
|
||||||
|
|
||||||
|
|
||||||
WARPER88_1616(hadamard8_diff_mmx, hadamard8_diff16_mmx)
|
WARPER8_16_SQ(hadamard8_diff_mmx, hadamard8_diff16_mmx)
|
||||||
WARPER88_1616(hadamard8_diff_mmx2, hadamard8_diff16_mmx2)
|
WARPER8_16_SQ(hadamard8_diff_mmx2, hadamard8_diff16_mmx2)
|
||||||
#endif //CONFIG_ENCODERS
|
#endif //CONFIG_ENCODERS
|
||||||
|
|
||||||
#define put_no_rnd_pixels8_mmx(a,b,c,d) put_pixels8_mmx(a,b,c,d)
|
#define put_no_rnd_pixels8_mmx(a,b,c,d) put_pixels8_mmx(a,b,c,d)
|
||||||
|
@ -28,9 +28,9 @@ static const __attribute__ ((aligned(8))) uint64_t round_tab[3]={
|
|||||||
|
|
||||||
static __attribute__ ((aligned(8), unused)) uint64_t bone= 0x0101010101010101LL;
|
static __attribute__ ((aligned(8), unused)) uint64_t bone= 0x0101010101010101LL;
|
||||||
|
|
||||||
static inline void sad8_mmx(uint8_t *blk1, uint8_t *blk2, int stride, int h)
|
static inline void sad8_1_mmx(uint8_t *blk1, uint8_t *blk2, int stride, int h)
|
||||||
{
|
{
|
||||||
int len= -(stride<<h);
|
int len= -(stride*h);
|
||||||
asm volatile(
|
asm volatile(
|
||||||
".balign 16 \n\t"
|
".balign 16 \n\t"
|
||||||
"1: \n\t"
|
"1: \n\t"
|
||||||
@ -64,9 +64,9 @@ static inline void sad8_mmx(uint8_t *blk1, uint8_t *blk2, int stride, int h)
|
|||||||
);
|
);
|
||||||
}
|
}
|
||||||
|
|
||||||
static inline void sad8_mmx2(uint8_t *blk1, uint8_t *blk2, int stride, int h)
|
static inline void sad8_1_mmx2(uint8_t *blk1, uint8_t *blk2, int stride, int h)
|
||||||
{
|
{
|
||||||
int len= -(stride<<h);
|
int len= -(stride*h);
|
||||||
asm volatile(
|
asm volatile(
|
||||||
".balign 16 \n\t"
|
".balign 16 \n\t"
|
||||||
"1: \n\t"
|
"1: \n\t"
|
||||||
@ -88,7 +88,7 @@ static inline void sad8_mmx2(uint8_t *blk1, uint8_t *blk2, int stride, int h)
|
|||||||
|
|
||||||
static inline void sad8_2_mmx2(uint8_t *blk1a, uint8_t *blk1b, uint8_t *blk2, int stride, int h)
|
static inline void sad8_2_mmx2(uint8_t *blk1a, uint8_t *blk1b, uint8_t *blk2, int stride, int h)
|
||||||
{
|
{
|
||||||
int len= -(stride<<h);
|
int len= -(stride*h);
|
||||||
asm volatile(
|
asm volatile(
|
||||||
".balign 16 \n\t"
|
".balign 16 \n\t"
|
||||||
"1: \n\t"
|
"1: \n\t"
|
||||||
@ -114,7 +114,7 @@ static inline void sad8_2_mmx2(uint8_t *blk1a, uint8_t *blk1b, uint8_t *blk2, in
|
|||||||
|
|
||||||
static inline void sad8_4_mmx2(uint8_t *blk1, uint8_t *blk2, int stride, int h)
|
static inline void sad8_4_mmx2(uint8_t *blk1, uint8_t *blk2, int stride, int h)
|
||||||
{ //FIXME reuse src
|
{ //FIXME reuse src
|
||||||
int len= -(stride<<h);
|
int len= -(stride*h);
|
||||||
asm volatile(
|
asm volatile(
|
||||||
".balign 16 \n\t"
|
".balign 16 \n\t"
|
||||||
"movq "MANGLE(bone)", %%mm5 \n\t"
|
"movq "MANGLE(bone)", %%mm5 \n\t"
|
||||||
@ -151,7 +151,7 @@ static inline void sad8_4_mmx2(uint8_t *blk1, uint8_t *blk2, int stride, int h)
|
|||||||
|
|
||||||
static inline void sad8_2_mmx(uint8_t *blk1a, uint8_t *blk1b, uint8_t *blk2, int stride, int h)
|
static inline void sad8_2_mmx(uint8_t *blk1a, uint8_t *blk1b, uint8_t *blk2, int stride, int h)
|
||||||
{
|
{
|
||||||
int len= -(stride<<h);
|
int len= -(stride*h);
|
||||||
asm volatile(
|
asm volatile(
|
||||||
".balign 16 \n\t"
|
".balign 16 \n\t"
|
||||||
"1: \n\t"
|
"1: \n\t"
|
||||||
@ -189,7 +189,7 @@ static inline void sad8_2_mmx(uint8_t *blk1a, uint8_t *blk1b, uint8_t *blk2, int
|
|||||||
|
|
||||||
static inline void sad8_4_mmx(uint8_t *blk1, uint8_t *blk2, int stride, int h)
|
static inline void sad8_4_mmx(uint8_t *blk1, uint8_t *blk2, int stride, int h)
|
||||||
{
|
{
|
||||||
int len= -(stride<<h);
|
int len= -(stride*h);
|
||||||
asm volatile(
|
asm volatile(
|
||||||
".balign 16 \n\t"
|
".balign 16 \n\t"
|
||||||
"1: \n\t"
|
"1: \n\t"
|
||||||
@ -265,26 +265,69 @@ static inline int sum_mmx2(void)
|
|||||||
|
|
||||||
|
|
||||||
#define PIX_SAD(suf)\
|
#define PIX_SAD(suf)\
|
||||||
static int pix_abs8x8_ ## suf(uint8_t *blk2, uint8_t *blk1, int stride)\
|
static int sad8_ ## suf(void *v, uint8_t *blk2, uint8_t *blk1, int stride, int h)\
|
||||||
{\
|
{\
|
||||||
|
assert(h==8);\
|
||||||
asm volatile("pxor %%mm7, %%mm7 \n\t"\
|
asm volatile("pxor %%mm7, %%mm7 \n\t"\
|
||||||
"pxor %%mm6, %%mm6 \n\t":);\
|
"pxor %%mm6, %%mm6 \n\t":);\
|
||||||
\
|
\
|
||||||
sad8_ ## suf(blk1, blk2, stride, 3);\
|
sad8_1_ ## suf(blk1, blk2, stride, 8);\
|
||||||
\
|
\
|
||||||
return sum_ ## suf();\
|
return sum_ ## suf();\
|
||||||
}\
|
}\
|
||||||
static int sad8x8_ ## suf(void *s, uint8_t *blk2, uint8_t *blk1, int stride)\
|
static int sad8_x2_ ## suf(void *v, uint8_t *blk2, uint8_t *blk1, int stride, int h)\
|
||||||
{\
|
{\
|
||||||
|
assert(h==8);\
|
||||||
asm volatile("pxor %%mm7, %%mm7 \n\t"\
|
asm volatile("pxor %%mm7, %%mm7 \n\t"\
|
||||||
"pxor %%mm6, %%mm6 \n\t":);\
|
"pxor %%mm6, %%mm6 \n\t"\
|
||||||
|
"movq %0, %%mm5 \n\t"\
|
||||||
|
:: "m"(round_tab[1]) \
|
||||||
|
);\
|
||||||
\
|
\
|
||||||
sad8_ ## suf(blk1, blk2, stride, 3);\
|
sad8_2_ ## suf(blk1, blk1+1, blk2, stride, 8);\
|
||||||
\
|
\
|
||||||
return sum_ ## suf();\
|
return sum_ ## suf();\
|
||||||
}\
|
}\
|
||||||
\
|
\
|
||||||
static int pix_abs8x8_x2_ ## suf(uint8_t *blk2, uint8_t *blk1, int stride)\
|
static int sad8_y2_ ## suf(void *v, uint8_t *blk2, uint8_t *blk1, int stride, int h)\
|
||||||
|
{\
|
||||||
|
assert(h==8);\
|
||||||
|
asm volatile("pxor %%mm7, %%mm7 \n\t"\
|
||||||
|
"pxor %%mm6, %%mm6 \n\t"\
|
||||||
|
"movq %0, %%mm5 \n\t"\
|
||||||
|
:: "m"(round_tab[1]) \
|
||||||
|
);\
|
||||||
|
\
|
||||||
|
sad8_2_ ## suf(blk1, blk1+stride, blk2, stride, 8);\
|
||||||
|
\
|
||||||
|
return sum_ ## suf();\
|
||||||
|
}\
|
||||||
|
\
|
||||||
|
static int sad8_xy2_ ## suf(void *v, uint8_t *blk2, uint8_t *blk1, int stride, int h)\
|
||||||
|
{\
|
||||||
|
assert(h==8);\
|
||||||
|
asm volatile("pxor %%mm7, %%mm7 \n\t"\
|
||||||
|
"pxor %%mm6, %%mm6 \n\t"\
|
||||||
|
"movq %0, %%mm5 \n\t"\
|
||||||
|
:: "m"(round_tab[2]) \
|
||||||
|
);\
|
||||||
|
\
|
||||||
|
sad8_4_ ## suf(blk1, blk2, stride, 8);\
|
||||||
|
\
|
||||||
|
return sum_ ## suf();\
|
||||||
|
}\
|
||||||
|
\
|
||||||
|
static int sad16_ ## suf(void *v, uint8_t *blk2, uint8_t *blk1, int stride, int h)\
|
||||||
|
{\
|
||||||
|
asm volatile("pxor %%mm7, %%mm7 \n\t"\
|
||||||
|
"pxor %%mm6, %%mm6 \n\t":);\
|
||||||
|
\
|
||||||
|
sad8_1_ ## suf(blk1 , blk2 , stride, h);\
|
||||||
|
sad8_1_ ## suf(blk1+8, blk2+8, stride, h);\
|
||||||
|
\
|
||||||
|
return sum_ ## suf();\
|
||||||
|
}\
|
||||||
|
static int sad16_x2_ ## suf(void *v, uint8_t *blk2, uint8_t *blk1, int stride, int h)\
|
||||||
{\
|
{\
|
||||||
asm volatile("pxor %%mm7, %%mm7 \n\t"\
|
asm volatile("pxor %%mm7, %%mm7 \n\t"\
|
||||||
"pxor %%mm6, %%mm6 \n\t"\
|
"pxor %%mm6, %%mm6 \n\t"\
|
||||||
@ -292,12 +335,12 @@ static int pix_abs8x8_x2_ ## suf(uint8_t *blk2, uint8_t *blk1, int stride)\
|
|||||||
:: "m"(round_tab[1]) \
|
:: "m"(round_tab[1]) \
|
||||||
);\
|
);\
|
||||||
\
|
\
|
||||||
sad8_2_ ## suf(blk1, blk1+1, blk2, stride, 3);\
|
sad8_2_ ## suf(blk1 , blk1+1, blk2 , stride, h);\
|
||||||
|
sad8_2_ ## suf(blk1+8, blk1+9, blk2+8, stride, h);\
|
||||||
\
|
\
|
||||||
return sum_ ## suf();\
|
return sum_ ## suf();\
|
||||||
}\
|
}\
|
||||||
\
|
static int sad16_y2_ ## suf(void *v, uint8_t *blk2, uint8_t *blk1, int stride, int h)\
|
||||||
static int pix_abs8x8_y2_ ## suf(uint8_t *blk2, uint8_t *blk1, int stride)\
|
|
||||||
{\
|
{\
|
||||||
asm volatile("pxor %%mm7, %%mm7 \n\t"\
|
asm volatile("pxor %%mm7, %%mm7 \n\t"\
|
||||||
"pxor %%mm6, %%mm6 \n\t"\
|
"pxor %%mm6, %%mm6 \n\t"\
|
||||||
@ -305,12 +348,12 @@ static int pix_abs8x8_y2_ ## suf(uint8_t *blk2, uint8_t *blk1, int stride)\
|
|||||||
:: "m"(round_tab[1]) \
|
:: "m"(round_tab[1]) \
|
||||||
);\
|
);\
|
||||||
\
|
\
|
||||||
sad8_2_ ## suf(blk1, blk1+stride, blk2, stride, 3);\
|
sad8_2_ ## suf(blk1 , blk1+stride, blk2 , stride, h);\
|
||||||
|
sad8_2_ ## suf(blk1+8, blk1+stride+8,blk2+8, stride, h);\
|
||||||
\
|
\
|
||||||
return sum_ ## suf();\
|
return sum_ ## suf();\
|
||||||
}\
|
}\
|
||||||
\
|
static int sad16_xy2_ ## suf(void *v, uint8_t *blk2, uint8_t *blk1, int stride, int h)\
|
||||||
static int pix_abs8x8_xy2_ ## suf(uint8_t *blk2, uint8_t *blk1, int stride)\
|
|
||||||
{\
|
{\
|
||||||
asm volatile("pxor %%mm7, %%mm7 \n\t"\
|
asm volatile("pxor %%mm7, %%mm7 \n\t"\
|
||||||
"pxor %%mm6, %%mm6 \n\t"\
|
"pxor %%mm6, %%mm6 \n\t"\
|
||||||
@ -318,67 +361,8 @@ static int pix_abs8x8_xy2_ ## suf(uint8_t *blk2, uint8_t *blk1, int stride)\
|
|||||||
:: "m"(round_tab[2]) \
|
:: "m"(round_tab[2]) \
|
||||||
);\
|
);\
|
||||||
\
|
\
|
||||||
sad8_4_ ## suf(blk1, blk2, stride, 3);\
|
sad8_4_ ## suf(blk1 , blk2 , stride, h);\
|
||||||
\
|
sad8_4_ ## suf(blk1+8, blk2+8, stride, h);\
|
||||||
return sum_ ## suf();\
|
|
||||||
}\
|
|
||||||
\
|
|
||||||
static int pix_abs16x16_ ## suf(uint8_t *blk2, uint8_t *blk1, int stride)\
|
|
||||||
{\
|
|
||||||
asm volatile("pxor %%mm7, %%mm7 \n\t"\
|
|
||||||
"pxor %%mm6, %%mm6 \n\t":);\
|
|
||||||
\
|
|
||||||
sad8_ ## suf(blk1 , blk2 , stride, 4);\
|
|
||||||
sad8_ ## suf(blk1+8, blk2+8, stride, 4);\
|
|
||||||
\
|
|
||||||
return sum_ ## suf();\
|
|
||||||
}\
|
|
||||||
static int sad16x16_ ## suf(void *s, uint8_t *blk2, uint8_t *blk1, int stride)\
|
|
||||||
{\
|
|
||||||
asm volatile("pxor %%mm7, %%mm7 \n\t"\
|
|
||||||
"pxor %%mm6, %%mm6 \n\t":);\
|
|
||||||
\
|
|
||||||
sad8_ ## suf(blk1 , blk2 , stride, 4);\
|
|
||||||
sad8_ ## suf(blk1+8, blk2+8, stride, 4);\
|
|
||||||
\
|
|
||||||
return sum_ ## suf();\
|
|
||||||
}\
|
|
||||||
static int pix_abs16x16_x2_ ## suf(uint8_t *blk2, uint8_t *blk1, int stride)\
|
|
||||||
{\
|
|
||||||
asm volatile("pxor %%mm7, %%mm7 \n\t"\
|
|
||||||
"pxor %%mm6, %%mm6 \n\t"\
|
|
||||||
"movq %0, %%mm5 \n\t"\
|
|
||||||
:: "m"(round_tab[1]) \
|
|
||||||
);\
|
|
||||||
\
|
|
||||||
sad8_2_ ## suf(blk1 , blk1+1, blk2 , stride, 4);\
|
|
||||||
sad8_2_ ## suf(blk1+8, blk1+9, blk2+8, stride, 4);\
|
|
||||||
\
|
|
||||||
return sum_ ## suf();\
|
|
||||||
}\
|
|
||||||
static int pix_abs16x16_y2_ ## suf(uint8_t *blk2, uint8_t *blk1, int stride)\
|
|
||||||
{\
|
|
||||||
asm volatile("pxor %%mm7, %%mm7 \n\t"\
|
|
||||||
"pxor %%mm6, %%mm6 \n\t"\
|
|
||||||
"movq %0, %%mm5 \n\t"\
|
|
||||||
:: "m"(round_tab[1]) \
|
|
||||||
);\
|
|
||||||
\
|
|
||||||
sad8_2_ ## suf(blk1 , blk1+stride, blk2 , stride, 4);\
|
|
||||||
sad8_2_ ## suf(blk1+8, blk1+stride+8,blk2+8, stride, 4);\
|
|
||||||
\
|
|
||||||
return sum_ ## suf();\
|
|
||||||
}\
|
|
||||||
static int pix_abs16x16_xy2_ ## suf(uint8_t *blk2, uint8_t *blk1, int stride)\
|
|
||||||
{\
|
|
||||||
asm volatile("pxor %%mm7, %%mm7 \n\t"\
|
|
||||||
"pxor %%mm6, %%mm6 \n\t"\
|
|
||||||
"movq %0, %%mm5 \n\t"\
|
|
||||||
:: "m"(round_tab[2]) \
|
|
||||||
);\
|
|
||||||
\
|
|
||||||
sad8_4_ ## suf(blk1 , blk2 , stride, 4);\
|
|
||||||
sad8_4_ ## suf(blk1+8, blk2+8, stride, 4);\
|
|
||||||
\
|
\
|
||||||
return sum_ ## suf();\
|
return sum_ ## suf();\
|
||||||
}\
|
}\
|
||||||
@ -389,32 +373,32 @@ PIX_SAD(mmx2)
|
|||||||
void dsputil_init_pix_mmx(DSPContext* c, AVCodecContext *avctx)
|
void dsputil_init_pix_mmx(DSPContext* c, AVCodecContext *avctx)
|
||||||
{
|
{
|
||||||
if (mm_flags & MM_MMX) {
|
if (mm_flags & MM_MMX) {
|
||||||
c->pix_abs16x16 = pix_abs16x16_mmx;
|
c->pix_abs[0][0] = sad16_mmx;
|
||||||
c->pix_abs16x16_x2 = pix_abs16x16_x2_mmx;
|
c->pix_abs[0][1] = sad16_x2_mmx;
|
||||||
c->pix_abs16x16_y2 = pix_abs16x16_y2_mmx;
|
c->pix_abs[0][2] = sad16_y2_mmx;
|
||||||
c->pix_abs16x16_xy2 = pix_abs16x16_xy2_mmx;
|
c->pix_abs[0][3] = sad16_xy2_mmx;
|
||||||
c->pix_abs8x8 = pix_abs8x8_mmx;
|
c->pix_abs[1][0] = sad8_mmx;
|
||||||
c->pix_abs8x8_x2 = pix_abs8x8_x2_mmx;
|
c->pix_abs[1][1] = sad8_x2_mmx;
|
||||||
c->pix_abs8x8_y2 = pix_abs8x8_y2_mmx;
|
c->pix_abs[1][2] = sad8_y2_mmx;
|
||||||
c->pix_abs8x8_xy2 = pix_abs8x8_xy2_mmx;
|
c->pix_abs[1][3] = sad8_xy2_mmx;
|
||||||
|
|
||||||
c->sad[0]= sad16x16_mmx;
|
c->sad[0]= sad16_mmx;
|
||||||
c->sad[1]= sad8x8_mmx;
|
c->sad[1]= sad8_mmx;
|
||||||
}
|
}
|
||||||
if (mm_flags & MM_MMXEXT) {
|
if (mm_flags & MM_MMXEXT) {
|
||||||
c->pix_abs16x16 = pix_abs16x16_mmx2;
|
c->pix_abs[0][0] = sad16_mmx2;
|
||||||
c->pix_abs8x8 = pix_abs8x8_mmx2;
|
c->pix_abs[1][0] = sad8_mmx2;
|
||||||
|
|
||||||
c->sad[0]= sad16x16_mmx2;
|
c->sad[0]= sad16_mmx2;
|
||||||
c->sad[1]= sad8x8_mmx2;
|
c->sad[1]= sad8_mmx2;
|
||||||
|
|
||||||
if(!(avctx->flags & CODEC_FLAG_BITEXACT)){
|
if(!(avctx->flags & CODEC_FLAG_BITEXACT)){
|
||||||
c->pix_abs16x16_x2 = pix_abs16x16_x2_mmx2;
|
c->pix_abs[0][1] = sad16_x2_mmx2;
|
||||||
c->pix_abs16x16_y2 = pix_abs16x16_y2_mmx2;
|
c->pix_abs[0][2] = sad16_y2_mmx2;
|
||||||
c->pix_abs16x16_xy2 = pix_abs16x16_xy2_mmx2;
|
c->pix_abs[0][3] = sad16_xy2_mmx2;
|
||||||
c->pix_abs8x8_x2 = pix_abs8x8_x2_mmx2;
|
c->pix_abs[1][1] = sad8_x2_mmx2;
|
||||||
c->pix_abs8x8_y2 = pix_abs8x8_y2_mmx2;
|
c->pix_abs[1][2] = sad8_y2_mmx2;
|
||||||
c->pix_abs8x8_xy2 = pix_abs8x8_xy2_mmx2;
|
c->pix_abs[1][3] = sad8_xy2_mmx2;
|
||||||
}
|
}
|
||||||
}
|
}
|
||||||
}
|
}
|
||||||
|
File diff suppressed because it is too large
Load Diff
@ -22,29 +22,31 @@
|
|||||||
* @file motion_est_template.c
|
* @file motion_est_template.c
|
||||||
* Motion estimation template.
|
* Motion estimation template.
|
||||||
*/
|
*/
|
||||||
|
//FIXME ref2_y next_pic?
|
||||||
//lets hope gcc will remove the unused vars ...(gcc 3.2.2 seems to do it ...)
|
//lets hope gcc will remove the unused vars ...(gcc 3.2.2 seems to do it ...)
|
||||||
//Note, the last line is there to kill these ugly unused var warnings
|
//Note, the last line is there to kill these ugly unused var warnings
|
||||||
#define LOAD_COMMON(x, y)\
|
#define LOAD_COMMON\
|
||||||
uint32_t * const score_map= s->me.score_map;\
|
uint32_t * const score_map= s->me.score_map;\
|
||||||
const int stride= s->linesize;\
|
|
||||||
const int uvstride= s->uvlinesize;\
|
|
||||||
const int time_pp= s->pp_time;\
|
const int time_pp= s->pp_time;\
|
||||||
const int time_pb= s->pb_time;\
|
const int time_pb= s->pb_time;\
|
||||||
uint8_t * const src_y= s->new_picture.data[0] + ((y) * stride) + (x);\
|
const int xmin= s->me.xmin;\
|
||||||
uint8_t * const src_u= s->new_picture.data[1] + (((y)>>1) * uvstride) + ((x)>>1);\
|
const int ymin= s->me.ymin;\
|
||||||
uint8_t * const src_v= s->new_picture.data[2] + (((y)>>1) * uvstride) + ((x)>>1);\
|
const int xmax= s->me.xmax;\
|
||||||
uint8_t * const ref_y= ref_picture->data[0] + ((y) * stride) + (x);\
|
const int ymax= s->me.ymax;\
|
||||||
uint8_t * const ref_u= ref_picture->data[1] + (((y)>>1) * uvstride) + ((x)>>1);\
|
uint8_t * const src_y= src_data[0];\
|
||||||
uint8_t * const ref_v= ref_picture->data[2] + (((y)>>1) * uvstride) + ((x)>>1);\
|
uint8_t * const src_u= src_data[1];\
|
||||||
uint8_t * const ref2_y= s->next_picture.data[0] + ((y) * stride) + (x);\
|
uint8_t * const src_v= src_data[2];\
|
||||||
|
uint8_t * const ref_y= ref_data[0];\
|
||||||
|
uint8_t * const ref_u= ref_data[1];\
|
||||||
|
uint8_t * const ref_v= ref_data[2];\
|
||||||
op_pixels_func (*hpel_put)[4];\
|
op_pixels_func (*hpel_put)[4];\
|
||||||
op_pixels_func (*hpel_avg)[4]= &s->dsp.avg_pixels_tab[size];\
|
op_pixels_func (*hpel_avg)[4]= &s->dsp.avg_pixels_tab[size];\
|
||||||
op_pixels_func (*chroma_hpel_put)[4];\
|
op_pixels_func (*chroma_hpel_put)[4];\
|
||||||
qpel_mc_func (*qpel_put)[16];\
|
qpel_mc_func (*qpel_put)[16];\
|
||||||
qpel_mc_func (*qpel_avg)[16]= &s->dsp.avg_qpel_pixels_tab[size];\
|
qpel_mc_func (*qpel_avg)[16]= &s->dsp.avg_qpel_pixels_tab[size];\
|
||||||
const __attribute__((unused)) int unu= time_pp + time_pb + (size_t)src_u + (size_t)src_v + (size_t)ref_u + (size_t)ref_v\
|
const __attribute__((unused)) int unu= time_pp + time_pb + (size_t)src_u + (size_t)src_v + (size_t)ref_u + (size_t)ref_v\
|
||||||
+ (size_t)ref2_y + (size_t)hpel_avg + (size_t)qpel_avg + (size_t)score_map;\
|
+ (size_t)hpel_avg + (size_t)qpel_avg + (size_t)score_map\
|
||||||
|
+ xmin + xmax + ymin + ymax;\
|
||||||
if(s->no_rounding /*FIXME b_type*/){\
|
if(s->no_rounding /*FIXME b_type*/){\
|
||||||
hpel_put= &s->dsp.put_no_rnd_pixels_tab[size];\
|
hpel_put= &s->dsp.put_no_rnd_pixels_tab[size];\
|
||||||
chroma_hpel_put= &s->dsp.put_no_rnd_pixels_tab[size+1];\
|
chroma_hpel_put= &s->dsp.put_no_rnd_pixels_tab[size+1];\
|
||||||
@ -70,9 +72,8 @@
|
|||||||
#if 0
|
#if 0
|
||||||
static int RENAME(hpel_motion_search)(MpegEncContext * s,
|
static int RENAME(hpel_motion_search)(MpegEncContext * s,
|
||||||
int *mx_ptr, int *my_ptr, int dmin,
|
int *mx_ptr, int *my_ptr, int dmin,
|
||||||
int xmin, int ymin, int xmax, int ymax,
|
int pred_x, int pred_y, uint8_t *ref_data[3],
|
||||||
int pred_x, int pred_y, Picture *ref_picture,
|
int size, uint8_t * const mv_penalty)
|
||||||
int n, int size, uint8_t * const mv_penalty)
|
|
||||||
{
|
{
|
||||||
const int xx = 16 * s->mb_x + 8*(n&1);
|
const int xx = 16 * s->mb_x + 8*(n&1);
|
||||||
const int yy = 16 * s->mb_y + 8*(n>>1);
|
const int yy = 16 * s->mb_y + 8*(n>>1);
|
||||||
@ -80,7 +81,7 @@ static int RENAME(hpel_motion_search)(MpegEncContext * s,
|
|||||||
const int my = *my_ptr;
|
const int my = *my_ptr;
|
||||||
const int penalty_factor= s->me.sub_penalty_factor;
|
const int penalty_factor= s->me.sub_penalty_factor;
|
||||||
|
|
||||||
LOAD_COMMON(xx, yy);
|
LOAD_COMMON
|
||||||
|
|
||||||
// INIT;
|
// INIT;
|
||||||
//FIXME factorize
|
//FIXME factorize
|
||||||
@ -139,19 +140,17 @@ static int RENAME(hpel_motion_search)(MpegEncContext * s,
|
|||||||
#else
|
#else
|
||||||
static int RENAME(hpel_motion_search)(MpegEncContext * s,
|
static int RENAME(hpel_motion_search)(MpegEncContext * s,
|
||||||
int *mx_ptr, int *my_ptr, int dmin,
|
int *mx_ptr, int *my_ptr, int dmin,
|
||||||
int xmin, int ymin, int xmax, int ymax,
|
int pred_x, int pred_y, uint8_t *src_data[3],
|
||||||
int pred_x, int pred_y, Picture *ref_picture,
|
uint8_t *ref_data[3], int stride, int uvstride,
|
||||||
int n, int size, uint8_t * const mv_penalty)
|
int size, int h, uint8_t * const mv_penalty)
|
||||||
{
|
{
|
||||||
const int xx = 16 * s->mb_x + 8*(n&1);
|
|
||||||
const int yy = 16 * s->mb_y + 8*(n>>1);
|
|
||||||
const int mx = *mx_ptr;
|
const int mx = *mx_ptr;
|
||||||
const int my = *my_ptr;
|
const int my = *my_ptr;
|
||||||
const int penalty_factor= s->me.sub_penalty_factor;
|
const int penalty_factor= s->me.sub_penalty_factor;
|
||||||
me_cmp_func cmp_sub, chroma_cmp_sub;
|
me_cmp_func cmp_sub, chroma_cmp_sub;
|
||||||
int bx=2*mx, by=2*my;
|
int bx=2*mx, by=2*my;
|
||||||
|
|
||||||
LOAD_COMMON(xx, yy);
|
LOAD_COMMON
|
||||||
|
|
||||||
//FIXME factorize
|
//FIXME factorize
|
||||||
|
|
||||||
@ -247,20 +246,18 @@ static int RENAME(hpel_motion_search)(MpegEncContext * s,
|
|||||||
}
|
}
|
||||||
#endif
|
#endif
|
||||||
|
|
||||||
static int RENAME(hpel_get_mb_score)(MpegEncContext * s, int mx, int my, int pred_x, int pred_y, Picture *ref_picture,
|
static int RENAME(hpel_get_mb_score)(MpegEncContext * s, int mx, int my, int pred_x, int pred_y, uint8_t *src_data[3],
|
||||||
|
uint8_t *ref_data[3], int stride, int uvstride,
|
||||||
uint8_t * const mv_penalty)
|
uint8_t * const mv_penalty)
|
||||||
{
|
{
|
||||||
// const int check_luma= s->dsp.me_sub_cmp != s->dsp.mb_cmp;
|
// const int check_luma= s->dsp.me_sub_cmp != s->dsp.mb_cmp;
|
||||||
const int size= 0;
|
const int size= 0;
|
||||||
const int xx = 16 * s->mb_x;
|
const int h= 16;
|
||||||
const int yy = 16 * s->mb_y;
|
|
||||||
const int penalty_factor= s->me.mb_penalty_factor;
|
const int penalty_factor= s->me.mb_penalty_factor;
|
||||||
const int xmin= -256*256, ymin= -256*256, xmax= 256*256, ymax= 256*256; //assume that the caller checked these
|
|
||||||
const __attribute__((unused)) int unu2= xmin + xmax +ymin + ymax; //no unused warning shit
|
|
||||||
me_cmp_func cmp_sub, chroma_cmp_sub;
|
me_cmp_func cmp_sub, chroma_cmp_sub;
|
||||||
int d;
|
int d;
|
||||||
|
|
||||||
LOAD_COMMON(xx, yy);
|
LOAD_COMMON
|
||||||
|
|
||||||
//FIXME factorize
|
//FIXME factorize
|
||||||
|
|
||||||
@ -295,12 +292,10 @@ static int RENAME(hpel_get_mb_score)(MpegEncContext * s, int mx, int my, int pre
|
|||||||
|
|
||||||
static int RENAME(qpel_motion_search)(MpegEncContext * s,
|
static int RENAME(qpel_motion_search)(MpegEncContext * s,
|
||||||
int *mx_ptr, int *my_ptr, int dmin,
|
int *mx_ptr, int *my_ptr, int dmin,
|
||||||
int xmin, int ymin, int xmax, int ymax,
|
int pred_x, int pred_y, uint8_t *src_data[3],
|
||||||
int pred_x, int pred_y, Picture *ref_picture,
|
uint8_t *ref_data[3], int stride, int uvstride,
|
||||||
int n, int size, uint8_t * const mv_penalty)
|
int size, int h, uint8_t * const mv_penalty)
|
||||||
{
|
{
|
||||||
const int xx = 16 * s->mb_x + 8*(n&1);
|
|
||||||
const int yy = 16 * s->mb_y + 8*(n>>1);
|
|
||||||
const int mx = *mx_ptr;
|
const int mx = *mx_ptr;
|
||||||
const int my = *my_ptr;
|
const int my = *my_ptr;
|
||||||
const int penalty_factor= s->me.sub_penalty_factor;
|
const int penalty_factor= s->me.sub_penalty_factor;
|
||||||
@ -310,7 +305,7 @@ static int RENAME(qpel_motion_search)(MpegEncContext * s,
|
|||||||
me_cmp_func cmp, chroma_cmp;
|
me_cmp_func cmp, chroma_cmp;
|
||||||
me_cmp_func cmp_sub, chroma_cmp_sub;
|
me_cmp_func cmp_sub, chroma_cmp_sub;
|
||||||
|
|
||||||
LOAD_COMMON(xx, yy);
|
LOAD_COMMON
|
||||||
|
|
||||||
cmp= s->dsp.me_cmp[size];
|
cmp= s->dsp.me_cmp[size];
|
||||||
chroma_cmp= s->dsp.me_cmp[size+1]; //factorize FIXME
|
chroma_cmp= s->dsp.me_cmp[size+1]; //factorize FIXME
|
||||||
@ -514,19 +509,17 @@ static int RENAME(qpel_motion_search)(MpegEncContext * s,
|
|||||||
return dmin;
|
return dmin;
|
||||||
}
|
}
|
||||||
|
|
||||||
static int RENAME(qpel_get_mb_score)(MpegEncContext * s, int mx, int my, int pred_x, int pred_y, Picture *ref_picture,
|
static int RENAME(qpel_get_mb_score)(MpegEncContext * s, int mx, int my, int pred_x, int pred_y, uint8_t *src_data[3],
|
||||||
|
uint8_t *ref_data[3], int stride, int uvstride,
|
||||||
uint8_t * const mv_penalty)
|
uint8_t * const mv_penalty)
|
||||||
{
|
{
|
||||||
const int size= 0;
|
const int size= 0;
|
||||||
const int xx = 16 * s->mb_x;
|
const int h= 16;
|
||||||
const int yy = 16 * s->mb_y;
|
|
||||||
const int penalty_factor= s->me.mb_penalty_factor;
|
const int penalty_factor= s->me.mb_penalty_factor;
|
||||||
const int xmin= -256*256, ymin= -256*256, xmax= 256*256, ymax= 256*256; //assume that the caller checked these
|
|
||||||
const __attribute__((unused)) int unu2= xmin + xmax +ymin + ymax; //no unused warning shit
|
|
||||||
me_cmp_func cmp_sub, chroma_cmp_sub;
|
me_cmp_func cmp_sub, chroma_cmp_sub;
|
||||||
int d;
|
int d;
|
||||||
|
|
||||||
LOAD_COMMON(xx, yy);
|
LOAD_COMMON
|
||||||
|
|
||||||
//FIXME factorize
|
//FIXME factorize
|
||||||
|
|
||||||
@ -597,15 +590,16 @@ if( (y)>(ymax<<(S)) ) printf("%d %d %d %d %d ymax" #v, ymax, (x), (y), s->mb_x,
|
|||||||
|
|
||||||
|
|
||||||
static inline int RENAME(small_diamond_search)(MpegEncContext * s, int *best, int dmin,
|
static inline int RENAME(small_diamond_search)(MpegEncContext * s, int *best, int dmin,
|
||||||
Picture *ref_picture,
|
uint8_t *src_data[3],
|
||||||
|
uint8_t *ref_data[3], int stride, int uvstride,
|
||||||
int const pred_x, int const pred_y, int const penalty_factor,
|
int const pred_x, int const pred_y, int const penalty_factor,
|
||||||
int const xmin, int const ymin, int const xmax, int const ymax, int const shift,
|
int const shift,
|
||||||
uint32_t *map, int map_generation, int size, uint8_t * const mv_penalty
|
uint32_t *map, int map_generation, int size, int h, uint8_t * const mv_penalty
|
||||||
)
|
)
|
||||||
{
|
{
|
||||||
me_cmp_func cmp, chroma_cmp;
|
me_cmp_func cmp, chroma_cmp;
|
||||||
int next_dir=-1;
|
int next_dir=-1;
|
||||||
LOAD_COMMON(s->mb_x*16, s->mb_y*16);
|
LOAD_COMMON
|
||||||
|
|
||||||
cmp= s->dsp.me_cmp[size];
|
cmp= s->dsp.me_cmp[size];
|
||||||
chroma_cmp= s->dsp.me_cmp[size+1];
|
chroma_cmp= s->dsp.me_cmp[size+1];
|
||||||
@ -639,15 +633,16 @@ static inline int RENAME(small_diamond_search)(MpegEncContext * s, int *best, in
|
|||||||
}
|
}
|
||||||
|
|
||||||
static inline int RENAME(funny_diamond_search)(MpegEncContext * s, int *best, int dmin,
|
static inline int RENAME(funny_diamond_search)(MpegEncContext * s, int *best, int dmin,
|
||||||
Picture *ref_picture,
|
uint8_t *src_data[3],
|
||||||
|
uint8_t *ref_data[3], int stride, int uvstride,
|
||||||
int const pred_x, int const pred_y, int const penalty_factor,
|
int const pred_x, int const pred_y, int const penalty_factor,
|
||||||
int const xmin, int const ymin, int const xmax, int const ymax, int const shift,
|
int const shift,
|
||||||
uint32_t *map, int map_generation, int size, uint8_t * const mv_penalty
|
uint32_t *map, int map_generation, int size, int h, uint8_t * const mv_penalty
|
||||||
)
|
)
|
||||||
{
|
{
|
||||||
me_cmp_func cmp, chroma_cmp;
|
me_cmp_func cmp, chroma_cmp;
|
||||||
int dia_size;
|
int dia_size;
|
||||||
LOAD_COMMON(s->mb_x*16, s->mb_y*16);
|
LOAD_COMMON
|
||||||
|
|
||||||
cmp= s->dsp.me_cmp[size];
|
cmp= s->dsp.me_cmp[size];
|
||||||
chroma_cmp= s->dsp.me_cmp[size+1];
|
chroma_cmp= s->dsp.me_cmp[size+1];
|
||||||
@ -730,17 +725,18 @@ if(256*256*256*64 % (stats[0]+1)==0){
|
|||||||
|
|
||||||
#define MAX_SAB_SIZE 16
|
#define MAX_SAB_SIZE 16
|
||||||
static inline int RENAME(sab_diamond_search)(MpegEncContext * s, int *best, int dmin,
|
static inline int RENAME(sab_diamond_search)(MpegEncContext * s, int *best, int dmin,
|
||||||
Picture *ref_picture,
|
uint8_t *src_data[3],
|
||||||
|
uint8_t *ref_data[3], int stride, int uvstride,
|
||||||
int const pred_x, int const pred_y, int const penalty_factor,
|
int const pred_x, int const pred_y, int const penalty_factor,
|
||||||
int const xmin, int const ymin, int const xmax, int const ymax, int const shift,
|
int const shift,
|
||||||
uint32_t *map, int map_generation, int size, uint8_t * const mv_penalty
|
uint32_t *map, int map_generation, int size, int h, uint8_t * const mv_penalty
|
||||||
)
|
)
|
||||||
{
|
{
|
||||||
me_cmp_func cmp, chroma_cmp;
|
me_cmp_func cmp, chroma_cmp;
|
||||||
Minima minima[MAX_SAB_SIZE];
|
Minima minima[MAX_SAB_SIZE];
|
||||||
const int minima_count= ABS(s->me.dia_size);
|
const int minima_count= ABS(s->me.dia_size);
|
||||||
int i, j;
|
int i, j;
|
||||||
LOAD_COMMON(s->mb_x*16, s->mb_y*16);
|
LOAD_COMMON
|
||||||
|
|
||||||
cmp= s->dsp.me_cmp[size];
|
cmp= s->dsp.me_cmp[size];
|
||||||
chroma_cmp= s->dsp.me_cmp[size+1];
|
chroma_cmp= s->dsp.me_cmp[size+1];
|
||||||
@ -810,15 +806,16 @@ static inline int RENAME(sab_diamond_search)(MpegEncContext * s, int *best, int
|
|||||||
}
|
}
|
||||||
|
|
||||||
static inline int RENAME(var_diamond_search)(MpegEncContext * s, int *best, int dmin,
|
static inline int RENAME(var_diamond_search)(MpegEncContext * s, int *best, int dmin,
|
||||||
Picture *ref_picture,
|
uint8_t *src_data[3],
|
||||||
|
uint8_t *ref_data[3], int stride, int uvstride,
|
||||||
int const pred_x, int const pred_y, int const penalty_factor,
|
int const pred_x, int const pred_y, int const penalty_factor,
|
||||||
int const xmin, int const ymin, int const xmax, int const ymax, int const shift,
|
int const shift,
|
||||||
uint32_t *map, int map_generation, int size, uint8_t * const mv_penalty
|
uint32_t *map, int map_generation, int size, int h, uint8_t * const mv_penalty
|
||||||
)
|
)
|
||||||
{
|
{
|
||||||
me_cmp_func cmp, chroma_cmp;
|
me_cmp_func cmp, chroma_cmp;
|
||||||
int dia_size;
|
int dia_size;
|
||||||
LOAD_COMMON(s->mb_x*16, s->mb_y*16);
|
LOAD_COMMON
|
||||||
|
|
||||||
cmp= s->dsp.me_cmp[size];
|
cmp= s->dsp.me_cmp[size];
|
||||||
chroma_cmp= s->dsp.me_cmp[size+1];
|
chroma_cmp= s->dsp.me_cmp[size+1];
|
||||||
@ -886,10 +883,10 @@ if(256*256*256*64 % (stats[0]+1)==0){
|
|||||||
return dmin;
|
return dmin;
|
||||||
}
|
}
|
||||||
|
|
||||||
static int RENAME(epzs_motion_search)(MpegEncContext * s, int block,
|
static int RENAME(epzs_motion_search)(MpegEncContext * s,
|
||||||
int *mx_ptr, int *my_ptr,
|
int *mx_ptr, int *my_ptr,
|
||||||
int P[10][2], int pred_x, int pred_y,
|
int P[10][2], int pred_x, int pred_y, uint8_t *src_data[3],
|
||||||
int xmin, int ymin, int xmax, int ymax, Picture *ref_picture, int16_t (*last_mv)[2],
|
uint8_t *ref_data[3], int stride, int uvstride, int16_t (*last_mv)[2],
|
||||||
int ref_mv_scale, uint8_t * const mv_penalty)
|
int ref_mv_scale, uint8_t * const mv_penalty)
|
||||||
{
|
{
|
||||||
int best[2]={0, 0};
|
int best[2]={0, 0};
|
||||||
@ -899,10 +896,11 @@ static int RENAME(epzs_motion_search)(MpegEncContext * s, int block,
|
|||||||
int map_generation;
|
int map_generation;
|
||||||
const int penalty_factor= s->me.penalty_factor;
|
const int penalty_factor= s->me.penalty_factor;
|
||||||
const int size=0;
|
const int size=0;
|
||||||
const int ref_mv_stride= s->mb_stride;
|
const int h=16;
|
||||||
const int ref_mv_xy= s->mb_x + s->mb_y*ref_mv_stride;
|
const int ref_mv_stride= s->mb_stride; //pass as arg FIXME
|
||||||
|
const int ref_mv_xy= s->mb_x + s->mb_y*ref_mv_stride; //add to last_mv beforepassing FIXME
|
||||||
me_cmp_func cmp, chroma_cmp;
|
me_cmp_func cmp, chroma_cmp;
|
||||||
LOAD_COMMON(s->mb_x*16, s->mb_y*16);
|
LOAD_COMMON
|
||||||
|
|
||||||
cmp= s->dsp.me_cmp[size];
|
cmp= s->dsp.me_cmp[size];
|
||||||
chroma_cmp= s->dsp.me_cmp[size+1];
|
chroma_cmp= s->dsp.me_cmp[size+1];
|
||||||
@ -973,21 +971,21 @@ static int RENAME(epzs_motion_search)(MpegEncContext * s, int block,
|
|||||||
|
|
||||||
//check(best[0],best[1],0, b0)
|
//check(best[0],best[1],0, b0)
|
||||||
if(s->me.dia_size==-1)
|
if(s->me.dia_size==-1)
|
||||||
dmin= RENAME(funny_diamond_search)(s, best, dmin, ref_picture,
|
dmin= RENAME(funny_diamond_search)(s, best, dmin, src_data, ref_data, stride, uvstride,
|
||||||
pred_x, pred_y, penalty_factor, xmin, ymin, xmax, ymax,
|
pred_x, pred_y, penalty_factor,
|
||||||
shift, map, map_generation, size, mv_penalty);
|
shift, map, map_generation, size, h, mv_penalty);
|
||||||
else if(s->me.dia_size<-1)
|
else if(s->me.dia_size<-1)
|
||||||
dmin= RENAME(sab_diamond_search)(s, best, dmin, ref_picture,
|
dmin= RENAME(sab_diamond_search)(s, best, dmin, src_data, ref_data, stride, uvstride,
|
||||||
pred_x, pred_y, penalty_factor, xmin, ymin, xmax, ymax,
|
pred_x, pred_y, penalty_factor,
|
||||||
shift, map, map_generation, size, mv_penalty);
|
shift, map, map_generation, size, h, mv_penalty);
|
||||||
else if(s->me.dia_size<2)
|
else if(s->me.dia_size<2)
|
||||||
dmin= RENAME(small_diamond_search)(s, best, dmin, ref_picture,
|
dmin= RENAME(small_diamond_search)(s, best, dmin, src_data, ref_data, stride, uvstride,
|
||||||
pred_x, pred_y, penalty_factor, xmin, ymin, xmax, ymax,
|
pred_x, pred_y, penalty_factor,
|
||||||
shift, map, map_generation, size, mv_penalty);
|
shift, map, map_generation, size, h, mv_penalty);
|
||||||
else
|
else
|
||||||
dmin= RENAME(var_diamond_search)(s, best, dmin, ref_picture,
|
dmin= RENAME(var_diamond_search)(s, best, dmin, src_data, ref_data, stride, uvstride,
|
||||||
pred_x, pred_y, penalty_factor, xmin, ymin, xmax, ymax,
|
pred_x, pred_y, penalty_factor,
|
||||||
shift, map, map_generation, size, mv_penalty);
|
shift, map, map_generation, size, h, mv_penalty);
|
||||||
|
|
||||||
//check(best[0],best[1],0, b1)
|
//check(best[0],best[1],0, b1)
|
||||||
*mx_ptr= best[0];
|
*mx_ptr= best[0];
|
||||||
@ -998,10 +996,11 @@ static int RENAME(epzs_motion_search)(MpegEncContext * s, int block,
|
|||||||
}
|
}
|
||||||
|
|
||||||
#ifndef CMP_DIRECT /* no 4mv search needed in direct mode */
|
#ifndef CMP_DIRECT /* no 4mv search needed in direct mode */
|
||||||
static int RENAME(epzs_motion_search4)(MpegEncContext * s, int block,
|
static int RENAME(epzs_motion_search4)(MpegEncContext * s,
|
||||||
int *mx_ptr, int *my_ptr,
|
int *mx_ptr, int *my_ptr,
|
||||||
int P[10][2], int pred_x, int pred_y,
|
int P[10][2], int pred_x, int pred_y,
|
||||||
int xmin, int ymin, int xmax, int ymax, Picture *ref_picture, int16_t (*last_mv)[2],
|
uint8_t *src_data[3],
|
||||||
|
uint8_t *ref_data[3], int stride, int uvstride, int16_t (*last_mv)[2],
|
||||||
int ref_mv_scale, uint8_t * const mv_penalty)
|
int ref_mv_scale, uint8_t * const mv_penalty)
|
||||||
{
|
{
|
||||||
int best[2]={0, 0};
|
int best[2]={0, 0};
|
||||||
@ -1011,10 +1010,11 @@ static int RENAME(epzs_motion_search4)(MpegEncContext * s, int block,
|
|||||||
int map_generation;
|
int map_generation;
|
||||||
const int penalty_factor= s->me.penalty_factor;
|
const int penalty_factor= s->me.penalty_factor;
|
||||||
const int size=1;
|
const int size=1;
|
||||||
|
const int h=8;
|
||||||
const int ref_mv_stride= s->mb_stride;
|
const int ref_mv_stride= s->mb_stride;
|
||||||
const int ref_mv_xy= s->mb_x + s->mb_y *ref_mv_stride;
|
const int ref_mv_xy= s->mb_x + s->mb_y *ref_mv_stride;
|
||||||
me_cmp_func cmp, chroma_cmp;
|
me_cmp_func cmp, chroma_cmp;
|
||||||
LOAD_COMMON((s->mb_x*2 + (block&1))*8, (s->mb_y*2 + (block>>1))*8);
|
LOAD_COMMON
|
||||||
|
|
||||||
cmp= s->dsp.me_cmp[size];
|
cmp= s->dsp.me_cmp[size];
|
||||||
chroma_cmp= s->dsp.me_cmp[size+1];
|
chroma_cmp= s->dsp.me_cmp[size+1];
|
||||||
@ -1024,7 +1024,7 @@ static int RENAME(epzs_motion_search4)(MpegEncContext * s, int block,
|
|||||||
dmin = 1000000;
|
dmin = 1000000;
|
||||||
//printf("%d %d %d %d //",xmin, ymin, xmax, ymax);
|
//printf("%d %d %d %d //",xmin, ymin, xmax, ymax);
|
||||||
/* first line */
|
/* first line */
|
||||||
if (s->mb_y == 0 && block<2) {
|
if (s->mb_y == 0/* && block<2*/) {
|
||||||
CHECK_MV(P_LEFT[0]>>shift, P_LEFT[1]>>shift)
|
CHECK_MV(P_LEFT[0]>>shift, P_LEFT[1]>>shift)
|
||||||
CHECK_CLIPED_MV((last_mv[ref_mv_xy][0]*ref_mv_scale + (1<<15))>>16,
|
CHECK_CLIPED_MV((last_mv[ref_mv_xy][0]*ref_mv_scale + (1<<15))>>16,
|
||||||
(last_mv[ref_mv_xy][1]*ref_mv_scale + (1<<15))>>16)
|
(last_mv[ref_mv_xy][1]*ref_mv_scale + (1<<15))>>16)
|
||||||
@ -1049,21 +1049,100 @@ static int RENAME(epzs_motion_search4)(MpegEncContext * s, int block,
|
|||||||
}
|
}
|
||||||
|
|
||||||
if(s->me.dia_size==-1)
|
if(s->me.dia_size==-1)
|
||||||
dmin= RENAME(funny_diamond_search)(s, best, dmin, ref_picture,
|
dmin= RENAME(funny_diamond_search)(s, best, dmin, src_data, ref_data, stride, uvstride,
|
||||||
pred_x, pred_y, penalty_factor, xmin, ymin, xmax, ymax,
|
pred_x, pred_y, penalty_factor,
|
||||||
shift, map, map_generation, size, mv_penalty);
|
shift, map, map_generation, size, h, mv_penalty);
|
||||||
else if(s->me.dia_size<-1)
|
else if(s->me.dia_size<-1)
|
||||||
dmin= RENAME(sab_diamond_search)(s, best, dmin, ref_picture,
|
dmin= RENAME(sab_diamond_search)(s, best, dmin, src_data, ref_data, stride, uvstride,
|
||||||
pred_x, pred_y, penalty_factor, xmin, ymin, xmax, ymax,
|
pred_x, pred_y, penalty_factor,
|
||||||
shift, map, map_generation, size, mv_penalty);
|
shift, map, map_generation, size, h, mv_penalty);
|
||||||
else if(s->me.dia_size<2)
|
else if(s->me.dia_size<2)
|
||||||
dmin= RENAME(small_diamond_search)(s, best, dmin, ref_picture,
|
dmin= RENAME(small_diamond_search)(s, best, dmin, src_data, ref_data, stride, uvstride,
|
||||||
pred_x, pred_y, penalty_factor, xmin, ymin, xmax, ymax,
|
pred_x, pred_y, penalty_factor,
|
||||||
shift, map, map_generation, size, mv_penalty);
|
shift, map, map_generation, size, h, mv_penalty);
|
||||||
else
|
else
|
||||||
dmin= RENAME(var_diamond_search)(s, best, dmin, ref_picture,
|
dmin= RENAME(var_diamond_search)(s, best, dmin, src_data, ref_data, stride, uvstride,
|
||||||
pred_x, pred_y, penalty_factor, xmin, ymin, xmax, ymax,
|
pred_x, pred_y, penalty_factor,
|
||||||
shift, map, map_generation, size, mv_penalty);
|
shift, map, map_generation, size, h, mv_penalty);
|
||||||
|
|
||||||
|
|
||||||
|
*mx_ptr= best[0];
|
||||||
|
*my_ptr= best[1];
|
||||||
|
|
||||||
|
// printf("%d %d %d \n", best[0], best[1], dmin);
|
||||||
|
return dmin;
|
||||||
|
}
|
||||||
|
|
||||||
|
//try to merge with above FIXME (needs PSNR test)
|
||||||
|
static int RENAME(epzs_motion_search2)(MpegEncContext * s,
|
||||||
|
int *mx_ptr, int *my_ptr,
|
||||||
|
int P[10][2], int pred_x, int pred_y,
|
||||||
|
uint8_t *src_data[3],
|
||||||
|
uint8_t *ref_data[3], int stride, int uvstride, int16_t (*last_mv)[2],
|
||||||
|
int ref_mv_scale, uint8_t * const mv_penalty)
|
||||||
|
{
|
||||||
|
int best[2]={0, 0};
|
||||||
|
int d, dmin;
|
||||||
|
const int shift= 1+s->quarter_sample;
|
||||||
|
uint32_t *map= s->me.map;
|
||||||
|
int map_generation;
|
||||||
|
const int penalty_factor= s->me.penalty_factor;
|
||||||
|
const int size=0; //FIXME pass as arg
|
||||||
|
const int h=8;
|
||||||
|
const int ref_mv_stride= s->mb_stride;
|
||||||
|
const int ref_mv_xy= s->mb_x + s->mb_y *ref_mv_stride;
|
||||||
|
me_cmp_func cmp, chroma_cmp;
|
||||||
|
LOAD_COMMON
|
||||||
|
|
||||||
|
cmp= s->dsp.me_cmp[size];
|
||||||
|
chroma_cmp= s->dsp.me_cmp[size+1];
|
||||||
|
|
||||||
|
map_generation= update_map_generation(s);
|
||||||
|
|
||||||
|
dmin = 1000000;
|
||||||
|
//printf("%d %d %d %d //",xmin, ymin, xmax, ymax);
|
||||||
|
/* first line */
|
||||||
|
if (s->mb_y == 0) {
|
||||||
|
CHECK_MV(P_LEFT[0]>>shift, P_LEFT[1]>>shift)
|
||||||
|
CHECK_CLIPED_MV((last_mv[ref_mv_xy][0]*ref_mv_scale + (1<<15))>>16,
|
||||||
|
(last_mv[ref_mv_xy][1]*ref_mv_scale + (1<<15))>>16)
|
||||||
|
CHECK_MV(P_MV1[0]>>shift, P_MV1[1]>>shift)
|
||||||
|
}else{
|
||||||
|
CHECK_MV(P_MV1[0]>>shift, P_MV1[1]>>shift)
|
||||||
|
//FIXME try some early stop
|
||||||
|
if(dmin>64*2){
|
||||||
|
CHECK_MV(P_MEDIAN[0]>>shift, P_MEDIAN[1]>>shift)
|
||||||
|
CHECK_MV(P_LEFT[0]>>shift, P_LEFT[1]>>shift)
|
||||||
|
CHECK_MV(P_TOP[0]>>shift, P_TOP[1]>>shift)
|
||||||
|
CHECK_MV(P_TOPRIGHT[0]>>shift, P_TOPRIGHT[1]>>shift)
|
||||||
|
CHECK_CLIPED_MV((last_mv[ref_mv_xy][0]*ref_mv_scale + (1<<15))>>16,
|
||||||
|
(last_mv[ref_mv_xy][1]*ref_mv_scale + (1<<15))>>16)
|
||||||
|
}
|
||||||
|
}
|
||||||
|
if(dmin>64*4){
|
||||||
|
CHECK_CLIPED_MV((last_mv[ref_mv_xy+1][0]*ref_mv_scale + (1<<15))>>16,
|
||||||
|
(last_mv[ref_mv_xy+1][1]*ref_mv_scale + (1<<15))>>16)
|
||||||
|
CHECK_CLIPED_MV((last_mv[ref_mv_xy+ref_mv_stride][0]*ref_mv_scale + (1<<15))>>16,
|
||||||
|
(last_mv[ref_mv_xy+ref_mv_stride][1]*ref_mv_scale + (1<<15))>>16)
|
||||||
|
}
|
||||||
|
|
||||||
|
if(s->me.dia_size==-1)
|
||||||
|
dmin= RENAME(funny_diamond_search)(s, best, dmin, src_data, ref_data, stride, uvstride,
|
||||||
|
pred_x, pred_y, penalty_factor,
|
||||||
|
shift, map, map_generation, size, h, mv_penalty);
|
||||||
|
else if(s->me.dia_size<-1)
|
||||||
|
dmin= RENAME(sab_diamond_search)(s, best, dmin, src_data, ref_data, stride, uvstride,
|
||||||
|
pred_x, pred_y, penalty_factor,
|
||||||
|
shift, map, map_generation, size, h, mv_penalty);
|
||||||
|
else if(s->me.dia_size<2)
|
||||||
|
dmin= RENAME(small_diamond_search)(s, best, dmin, src_data, ref_data, stride, uvstride,
|
||||||
|
pred_x, pred_y, penalty_factor,
|
||||||
|
shift, map, map_generation, size, h, mv_penalty);
|
||||||
|
else
|
||||||
|
dmin= RENAME(var_diamond_search)(s, best, dmin, src_data, ref_data, stride, uvstride,
|
||||||
|
pred_x, pred_y, penalty_factor,
|
||||||
|
shift, map, map_generation, size, h, mv_penalty);
|
||||||
|
|
||||||
|
|
||||||
*mx_ptr= best[0];
|
*mx_ptr= best[0];
|
||||||
*my_ptr= best[1];
|
*my_ptr= best[1];
|
||||||
|
@ -29,6 +29,9 @@
|
|||||||
|
|
||||||
#include "mpeg12data.h"
|
#include "mpeg12data.h"
|
||||||
|
|
||||||
|
//#undef NDEBUG
|
||||||
|
//#include <assert.h>
|
||||||
|
|
||||||
|
|
||||||
/* Start codes. */
|
/* Start codes. */
|
||||||
#define SEQ_END_CODE 0x000001b7
|
#define SEQ_END_CODE 0x000001b7
|
||||||
@ -476,12 +479,12 @@ void mpeg1_encode_picture_header(MpegEncContext *s, int picture_number)
|
|||||||
}
|
}
|
||||||
|
|
||||||
static inline void put_mb_modes(MpegEncContext *s, int n, int bits,
|
static inline void put_mb_modes(MpegEncContext *s, int n, int bits,
|
||||||
int has_mv)
|
int has_mv, int field_motion)
|
||||||
{
|
{
|
||||||
put_bits(&s->pb, n, bits);
|
put_bits(&s->pb, n, bits);
|
||||||
if (!s->frame_pred_frame_dct) {
|
if (!s->frame_pred_frame_dct) {
|
||||||
if (has_mv)
|
if (has_mv)
|
||||||
put_bits(&s->pb, 2, 2); /* motion_type: frame */
|
put_bits(&s->pb, 2, 2 - field_motion); /* motion_type: frame/field */
|
||||||
put_bits(&s->pb, 1, s->interlaced_dct);
|
put_bits(&s->pb, 1, s->interlaced_dct);
|
||||||
}
|
}
|
||||||
}
|
}
|
||||||
@ -503,7 +506,7 @@ void mpeg1_encode_mb(MpegEncContext *s,
|
|||||||
}
|
}
|
||||||
|
|
||||||
if (cbp == 0 && !first_mb && (mb_x != s->mb_width - 1 || (mb_y != s->mb_height - 1 && s->codec_id == CODEC_ID_MPEG1VIDEO)) &&
|
if (cbp == 0 && !first_mb && (mb_x != s->mb_width - 1 || (mb_y != s->mb_height - 1 && s->codec_id == CODEC_ID_MPEG1VIDEO)) &&
|
||||||
((s->pict_type == P_TYPE && (motion_x | motion_y) == 0) ||
|
((s->pict_type == P_TYPE && s->mv_type == MV_TYPE_16X16 && (motion_x | motion_y) == 0) ||
|
||||||
(s->pict_type == B_TYPE && s->mv_dir == s->last_mv_dir && (((s->mv_dir & MV_DIR_FORWARD) ? ((s->mv[0][0][0] - s->last_mv[0][0][0])|(s->mv[0][0][1] - s->last_mv[0][0][1])) : 0) |
|
(s->pict_type == B_TYPE && s->mv_dir == s->last_mv_dir && (((s->mv_dir & MV_DIR_FORWARD) ? ((s->mv[0][0][0] - s->last_mv[0][0][0])|(s->mv[0][0][1] - s->last_mv[0][0][1])) : 0) |
|
||||||
((s->mv_dir & MV_DIR_BACKWARD) ? ((s->mv[1][0][0] - s->last_mv[1][0][0])|(s->mv[1][0][1] - s->last_mv[1][0][1])) : 0)) == 0))) {
|
((s->mv_dir & MV_DIR_BACKWARD) ? ((s->mv[1][0][0] - s->last_mv[1][0][0])|(s->mv[1][0][1] - s->last_mv[1][0][1])) : 0)) == 0))) {
|
||||||
s->mb_skip_run++;
|
s->mb_skip_run++;
|
||||||
@ -511,6 +514,10 @@ void mpeg1_encode_mb(MpegEncContext *s,
|
|||||||
s->skip_count++;
|
s->skip_count++;
|
||||||
s->misc_bits++;
|
s->misc_bits++;
|
||||||
s->last_bits++;
|
s->last_bits++;
|
||||||
|
if(s->pict_type == P_TYPE){
|
||||||
|
s->last_mv[0][1][0]= s->last_mv[0][0][0]=
|
||||||
|
s->last_mv[0][1][1]= s->last_mv[0][0][1]= 0;
|
||||||
|
}
|
||||||
} else {
|
} else {
|
||||||
if(first_mb){
|
if(first_mb){
|
||||||
assert(s->mb_skip_run == 0);
|
assert(s->mb_skip_run == 0);
|
||||||
@ -521,150 +528,167 @@ void mpeg1_encode_mb(MpegEncContext *s,
|
|||||||
|
|
||||||
if (s->pict_type == I_TYPE) {
|
if (s->pict_type == I_TYPE) {
|
||||||
if(s->dquant && cbp){
|
if(s->dquant && cbp){
|
||||||
put_mb_modes(s, 2, 1, 0); /* macroblock_type : macroblock_quant = 1 */
|
put_mb_modes(s, 2, 1, 0, 0); /* macroblock_type : macroblock_quant = 1 */
|
||||||
put_bits(&s->pb, 5, s->qscale);
|
put_bits(&s->pb, 5, s->qscale);
|
||||||
}else{
|
}else{
|
||||||
put_mb_modes(s, 1, 1, 0); /* macroblock_type : macroblock_quant = 0 */
|
put_mb_modes(s, 1, 1, 0, 0); /* macroblock_type : macroblock_quant = 0 */
|
||||||
s->qscale -= s->dquant;
|
s->qscale -= s->dquant;
|
||||||
}
|
}
|
||||||
s->misc_bits+= get_bits_diff(s);
|
s->misc_bits+= get_bits_diff(s);
|
||||||
s->i_count++;
|
s->i_count++;
|
||||||
} else if (s->mb_intra) {
|
} else if (s->mb_intra) {
|
||||||
if(s->dquant && cbp){
|
if(s->dquant && cbp){
|
||||||
put_mb_modes(s, 6, 0x01, 0);
|
put_mb_modes(s, 6, 0x01, 0, 0);
|
||||||
put_bits(&s->pb, 5, s->qscale);
|
put_bits(&s->pb, 5, s->qscale);
|
||||||
}else{
|
}else{
|
||||||
put_mb_modes(s, 5, 0x03, 0);
|
put_mb_modes(s, 5, 0x03, 0, 0);
|
||||||
s->qscale -= s->dquant;
|
s->qscale -= s->dquant;
|
||||||
}
|
}
|
||||||
s->misc_bits+= get_bits_diff(s);
|
s->misc_bits+= get_bits_diff(s);
|
||||||
s->i_count++;
|
s->i_count++;
|
||||||
s->last_mv[0][0][0] =
|
memset(s->last_mv, 0, sizeof(s->last_mv));
|
||||||
s->last_mv[0][0][1] = 0;
|
|
||||||
} else if (s->pict_type == P_TYPE) {
|
} else if (s->pict_type == P_TYPE) {
|
||||||
|
if(s->mv_type == MV_TYPE_16X16){
|
||||||
if (cbp != 0) {
|
if (cbp != 0) {
|
||||||
if (motion_x == 0 && motion_y == 0) {
|
if ((motion_x|motion_y) == 0) {
|
||||||
if(s->dquant){
|
if(s->dquant){
|
||||||
put_mb_modes(s, 5, 1, 0); /* macroblock_pattern & quant */
|
put_mb_modes(s, 5, 1, 0, 0); /* macroblock_pattern & quant */
|
||||||
put_bits(&s->pb, 5, s->qscale);
|
put_bits(&s->pb, 5, s->qscale);
|
||||||
}else{
|
}else{
|
||||||
put_mb_modes(s, 2, 1, 0); /* macroblock_pattern only */
|
put_mb_modes(s, 2, 1, 0, 0); /* macroblock_pattern only */
|
||||||
}
|
}
|
||||||
s->misc_bits+= get_bits_diff(s);
|
s->misc_bits+= get_bits_diff(s);
|
||||||
put_bits(&s->pb, mbPatTable[cbp - 1][1], mbPatTable[cbp - 1][0]);
|
|
||||||
} else {
|
} else {
|
||||||
if(s->dquant){
|
if(s->dquant){
|
||||||
put_mb_modes(s, 5, 2, 1); /* motion + cbp */
|
put_mb_modes(s, 5, 2, 1, 0); /* motion + cbp */
|
||||||
put_bits(&s->pb, 5, s->qscale);
|
put_bits(&s->pb, 5, s->qscale);
|
||||||
}else{
|
}else{
|
||||||
put_mb_modes(s, 1, 1, 1); /* motion + cbp */
|
put_mb_modes(s, 1, 1, 1, 0); /* motion + cbp */
|
||||||
}
|
}
|
||||||
s->misc_bits+= get_bits_diff(s);
|
s->misc_bits+= get_bits_diff(s);
|
||||||
mpeg1_encode_motion(s, motion_x - s->last_mv[0][0][0], s->f_code); // RAL: f_code parameter added
|
mpeg1_encode_motion(s, motion_x - s->last_mv[0][0][0], s->f_code); // RAL: f_code parameter added
|
||||||
mpeg1_encode_motion(s, motion_y - s->last_mv[0][0][1], s->f_code); // RAL: f_code parameter added
|
mpeg1_encode_motion(s, motion_y - s->last_mv[0][0][1], s->f_code); // RAL: f_code parameter added
|
||||||
s->mv_bits+= get_bits_diff(s);
|
s->mv_bits+= get_bits_diff(s);
|
||||||
put_bits(&s->pb, mbPatTable[cbp - 1][1], mbPatTable[cbp - 1][0]);
|
|
||||||
}
|
}
|
||||||
} else {
|
} else {
|
||||||
put_bits(&s->pb, 3, 1); /* motion only */
|
put_bits(&s->pb, 3, 1); /* motion only */
|
||||||
if (!s->frame_pred_frame_dct)
|
if (!s->frame_pred_frame_dct)
|
||||||
put_bits(&s->pb, 2, 2); /* motion_type: frame */
|
put_bits(&s->pb, 2, 2); /* motion_type: frame */
|
||||||
|
s->misc_bits+= get_bits_diff(s);
|
||||||
mpeg1_encode_motion(s, motion_x - s->last_mv[0][0][0], s->f_code); // RAL: f_code parameter added
|
mpeg1_encode_motion(s, motion_x - s->last_mv[0][0][0], s->f_code); // RAL: f_code parameter added
|
||||||
mpeg1_encode_motion(s, motion_y - s->last_mv[0][0][1], s->f_code); // RAL: f_code parameter added
|
mpeg1_encode_motion(s, motion_y - s->last_mv[0][0][1], s->f_code); // RAL: f_code parameter added
|
||||||
s->qscale -= s->dquant;
|
s->qscale -= s->dquant;
|
||||||
s->mv_bits+= get_bits_diff(s);
|
s->mv_bits+= get_bits_diff(s);
|
||||||
}
|
}
|
||||||
s->f_count++;
|
s->last_mv[0][1][0]= s->last_mv[0][0][0]= motion_x;
|
||||||
} else
|
s->last_mv[0][1][1]= s->last_mv[0][0][1]= motion_y;
|
||||||
{ // RAL: All the following bloc added for B frames:
|
}else{
|
||||||
if (cbp != 0)
|
assert(!s->frame_pred_frame_dct && s->mv_type == MV_TYPE_FIELD);
|
||||||
{ // With coded bloc pattern
|
|
||||||
if (s->mv_dir == (MV_DIR_FORWARD | MV_DIR_BACKWARD))
|
if (cbp) {
|
||||||
{ // Bi-directional motion
|
if(s->dquant){
|
||||||
if (s->dquant) {
|
put_mb_modes(s, 5, 2, 1, 1); /* motion + cbp */
|
||||||
put_mb_modes(s, 5, 2, 1);
|
put_bits(&s->pb, 5, s->qscale);
|
||||||
put_bits(&s->pb, 5, s->qscale);
|
}else{
|
||||||
} else {
|
put_mb_modes(s, 1, 1, 1, 1); /* motion + cbp */
|
||||||
put_mb_modes(s, 2, 3, 1);
|
|
||||||
}
|
|
||||||
s->misc_bits += get_bits_diff(s);
|
|
||||||
mpeg1_encode_motion(s, s->mv[0][0][0] - s->last_mv[0][0][0], s->f_code);
|
|
||||||
mpeg1_encode_motion(s, s->mv[0][0][1] - s->last_mv[0][0][1], s->f_code);
|
|
||||||
mpeg1_encode_motion(s, s->mv[1][0][0] - s->last_mv[1][0][0], s->b_code);
|
|
||||||
mpeg1_encode_motion(s, s->mv[1][0][1] - s->last_mv[1][0][1], s->b_code);
|
|
||||||
s->b_count++;
|
|
||||||
s->f_count++;
|
|
||||||
s->mv_bits += get_bits_diff(s);
|
|
||||||
put_bits(&s->pb, mbPatTable[cbp - 1][1], mbPatTable[cbp - 1][0]);
|
|
||||||
}
|
|
||||||
else if (s->mv_dir == MV_DIR_BACKWARD)
|
|
||||||
{ // Backward motion
|
|
||||||
if (s->dquant) {
|
|
||||||
put_mb_modes(s, 6, 2, 1);
|
|
||||||
put_bits(&s->pb, 5, s->qscale);
|
|
||||||
} else {
|
|
||||||
put_mb_modes(s, 3, 3, 1);
|
|
||||||
}
|
|
||||||
s->misc_bits += get_bits_diff(s);
|
|
||||||
mpeg1_encode_motion(s, motion_x - s->last_mv[1][0][0], s->b_code);
|
|
||||||
mpeg1_encode_motion(s, motion_y - s->last_mv[1][0][1], s->b_code);
|
|
||||||
s->b_count++;
|
|
||||||
s->mv_bits += get_bits_diff(s);
|
|
||||||
put_bits(&s->pb, mbPatTable[cbp - 1][1], mbPatTable[cbp - 1][0]);
|
|
||||||
}
|
|
||||||
else if (s->mv_dir == MV_DIR_FORWARD)
|
|
||||||
{ // Forward motion
|
|
||||||
if (s->dquant) {
|
|
||||||
put_mb_modes(s, 6, 3, 1);
|
|
||||||
put_bits(&s->pb, 5, s->qscale);
|
|
||||||
} else {
|
|
||||||
put_mb_modes(s, 4, 3, 1);
|
|
||||||
}
|
|
||||||
s->misc_bits += get_bits_diff(s);
|
|
||||||
mpeg1_encode_motion(s, motion_x - s->last_mv[0][0][0], s->f_code);
|
|
||||||
mpeg1_encode_motion(s, motion_y - s->last_mv[0][0][1], s->f_code);
|
|
||||||
s->f_count++;
|
|
||||||
s->mv_bits += get_bits_diff(s);
|
|
||||||
put_bits(&s->pb, mbPatTable[cbp - 1][1], mbPatTable[cbp - 1][0]);
|
|
||||||
}
|
|
||||||
}
|
}
|
||||||
else
|
} else {
|
||||||
{ // No coded bloc pattern
|
put_bits(&s->pb, 3, 1); /* motion only */
|
||||||
if (s->mv_dir == (MV_DIR_FORWARD | MV_DIR_BACKWARD))
|
put_bits(&s->pb, 2, 1); /* motion_type: field */
|
||||||
{ // Bi-directional motion
|
|
||||||
put_bits(&s->pb, 2, 2); /* backward & forward motion */
|
|
||||||
if (!s->frame_pred_frame_dct)
|
|
||||||
put_bits(&s->pb, 2, 2); /* motion_type: frame */
|
|
||||||
mpeg1_encode_motion(s, s->mv[0][0][0] - s->last_mv[0][0][0], s->f_code);
|
|
||||||
mpeg1_encode_motion(s, s->mv[0][0][1] - s->last_mv[0][0][1], s->f_code);
|
|
||||||
mpeg1_encode_motion(s, s->mv[1][0][0] - s->last_mv[1][0][0], s->b_code);
|
|
||||||
mpeg1_encode_motion(s, s->mv[1][0][1] - s->last_mv[1][0][1], s->b_code);
|
|
||||||
s->b_count++;
|
|
||||||
s->f_count++;
|
|
||||||
}
|
|
||||||
else if (s->mv_dir == MV_DIR_BACKWARD)
|
|
||||||
{ // Backward motion
|
|
||||||
put_bits(&s->pb, 3, 2); /* backward motion only */
|
|
||||||
if (!s->frame_pred_frame_dct)
|
|
||||||
put_bits(&s->pb, 2, 2); /* motion_type: frame */
|
|
||||||
mpeg1_encode_motion(s, motion_x - s->last_mv[1][0][0], s->b_code);
|
|
||||||
mpeg1_encode_motion(s, motion_y - s->last_mv[1][0][1], s->b_code);
|
|
||||||
s->b_count++;
|
|
||||||
}
|
|
||||||
else if (s->mv_dir == MV_DIR_FORWARD)
|
|
||||||
{ // Forward motion
|
|
||||||
put_bits(&s->pb, 4, 2); /* forward motion only */
|
|
||||||
if (!s->frame_pred_frame_dct)
|
|
||||||
put_bits(&s->pb, 2, 2); /* motion_type: frame */
|
|
||||||
mpeg1_encode_motion(s, motion_x - s->last_mv[0][0][0], s->f_code);
|
|
||||||
mpeg1_encode_motion(s, motion_y - s->last_mv[0][0][1], s->f_code);
|
|
||||||
s->f_count++;
|
|
||||||
}
|
|
||||||
s->qscale -= s->dquant;
|
s->qscale -= s->dquant;
|
||||||
s->mv_bits += get_bits_diff(s);
|
}
|
||||||
}
|
s->misc_bits+= get_bits_diff(s);
|
||||||
// End of bloc from RAL
|
for(i=0; i<2; i++){
|
||||||
|
put_bits(&s->pb, 1, s->field_select[0][i]);
|
||||||
|
mpeg1_encode_motion(s, s->mv[0][i][0] - s->last_mv[0][i][0] , s->f_code);
|
||||||
|
mpeg1_encode_motion(s, s->mv[0][i][1] - (s->last_mv[0][i][1]>>1), s->f_code);
|
||||||
|
s->last_mv[0][i][0]= s->mv[0][i][0];
|
||||||
|
s->last_mv[0][i][1]= 2*s->mv[0][i][1];
|
||||||
|
}
|
||||||
|
s->mv_bits+= get_bits_diff(s);
|
||||||
}
|
}
|
||||||
|
if(cbp)
|
||||||
|
put_bits(&s->pb, mbPatTable[cbp - 1][1], mbPatTable[cbp - 1][0]);
|
||||||
|
s->f_count++;
|
||||||
|
} else{
|
||||||
|
static const int mb_type_len[4]={0,3,4,2}; //bak,for,bi
|
||||||
|
|
||||||
|
if(s->mv_type == MV_TYPE_16X16){
|
||||||
|
if (cbp){ // With coded bloc pattern
|
||||||
|
if (s->dquant) {
|
||||||
|
if(s->mv_dir == MV_DIR_FORWARD)
|
||||||
|
put_mb_modes(s, 6, 3, 1, 0);
|
||||||
|
else
|
||||||
|
put_mb_modes(s, mb_type_len[s->mv_dir]+3, 2, 1, 0);
|
||||||
|
put_bits(&s->pb, 5, s->qscale);
|
||||||
|
} else {
|
||||||
|
put_mb_modes(s, mb_type_len[s->mv_dir], 3, 1, 0);
|
||||||
|
}
|
||||||
|
}else{ // No coded bloc pattern
|
||||||
|
put_bits(&s->pb, mb_type_len[s->mv_dir], 2);
|
||||||
|
if (!s->frame_pred_frame_dct)
|
||||||
|
put_bits(&s->pb, 2, 2); /* motion_type: frame */
|
||||||
|
s->qscale -= s->dquant;
|
||||||
|
}
|
||||||
|
s->misc_bits += get_bits_diff(s);
|
||||||
|
if (s->mv_dir&MV_DIR_FORWARD){
|
||||||
|
mpeg1_encode_motion(s, s->mv[0][0][0] - s->last_mv[0][0][0], s->f_code);
|
||||||
|
mpeg1_encode_motion(s, s->mv[0][0][1] - s->last_mv[0][0][1], s->f_code);
|
||||||
|
s->last_mv[0][0][0]=s->last_mv[0][1][0]= s->mv[0][0][0];
|
||||||
|
s->last_mv[0][0][1]=s->last_mv[0][1][1]= s->mv[0][0][1];
|
||||||
|
s->f_count++;
|
||||||
|
}
|
||||||
|
if (s->mv_dir&MV_DIR_BACKWARD){
|
||||||
|
mpeg1_encode_motion(s, s->mv[1][0][0] - s->last_mv[1][0][0], s->b_code);
|
||||||
|
mpeg1_encode_motion(s, s->mv[1][0][1] - s->last_mv[1][0][1], s->b_code);
|
||||||
|
s->last_mv[1][0][0]=s->last_mv[1][1][0]= s->mv[1][0][0];
|
||||||
|
s->last_mv[1][0][1]=s->last_mv[1][1][1]= s->mv[1][0][1];
|
||||||
|
s->b_count++;
|
||||||
|
}
|
||||||
|
}else{
|
||||||
|
assert(s->mv_type == MV_TYPE_FIELD);
|
||||||
|
assert(!s->frame_pred_frame_dct);
|
||||||
|
if (cbp){ // With coded bloc pattern
|
||||||
|
if (s->dquant) {
|
||||||
|
if(s->mv_dir == MV_DIR_FORWARD)
|
||||||
|
put_mb_modes(s, 6, 3, 1, 1);
|
||||||
|
else
|
||||||
|
put_mb_modes(s, mb_type_len[s->mv_dir]+3, 2, 1, 1);
|
||||||
|
put_bits(&s->pb, 5, s->qscale);
|
||||||
|
} else {
|
||||||
|
put_mb_modes(s, mb_type_len[s->mv_dir], 3, 1, 1);
|
||||||
|
}
|
||||||
|
}else{ // No coded bloc pattern
|
||||||
|
put_bits(&s->pb, mb_type_len[s->mv_dir], 2);
|
||||||
|
put_bits(&s->pb, 2, 1); /* motion_type: field */
|
||||||
|
s->qscale -= s->dquant;
|
||||||
|
}
|
||||||
|
s->misc_bits += get_bits_diff(s);
|
||||||
|
if (s->mv_dir&MV_DIR_FORWARD){
|
||||||
|
for(i=0; i<2; i++){
|
||||||
|
put_bits(&s->pb, 1, s->field_select[0][i]);
|
||||||
|
mpeg1_encode_motion(s, s->mv[0][i][0] - s->last_mv[0][i][0] , s->f_code);
|
||||||
|
mpeg1_encode_motion(s, s->mv[0][i][1] - (s->last_mv[0][i][1]>>1), s->f_code);
|
||||||
|
s->last_mv[0][i][0]= s->mv[0][i][0];
|
||||||
|
s->last_mv[0][i][1]= 2*s->mv[0][i][1];
|
||||||
|
}
|
||||||
|
s->f_count++;
|
||||||
|
}
|
||||||
|
if (s->mv_dir&MV_DIR_BACKWARD){
|
||||||
|
for(i=0; i<2; i++){
|
||||||
|
put_bits(&s->pb, 1, s->field_select[1][i]);
|
||||||
|
mpeg1_encode_motion(s, s->mv[1][i][0] - s->last_mv[1][i][0] , s->b_code);
|
||||||
|
mpeg1_encode_motion(s, s->mv[1][i][1] - (s->last_mv[1][i][1]>>1), s->b_code);
|
||||||
|
s->last_mv[1][i][0]= s->mv[1][i][0];
|
||||||
|
s->last_mv[1][i][1]= 2*s->mv[1][i][1];
|
||||||
|
}
|
||||||
|
s->b_count++;
|
||||||
|
}
|
||||||
|
}
|
||||||
|
s->mv_bits += get_bits_diff(s);
|
||||||
|
if(cbp)
|
||||||
|
put_bits(&s->pb, mbPatTable[cbp - 1][1], mbPatTable[cbp - 1][0]);
|
||||||
|
}
|
||||||
for(i=0;i<6;i++) {
|
for(i=0;i<6;i++) {
|
||||||
if (cbp & (1 << (5 - i))) {
|
if (cbp & (1 << (5 - i))) {
|
||||||
mpeg1_encode_block(s, block[i], i);
|
mpeg1_encode_block(s, block[i], i);
|
||||||
@ -676,18 +700,6 @@ void mpeg1_encode_mb(MpegEncContext *s,
|
|||||||
else
|
else
|
||||||
s->p_tex_bits+= get_bits_diff(s);
|
s->p_tex_bits+= get_bits_diff(s);
|
||||||
}
|
}
|
||||||
|
|
||||||
// RAL: By this:
|
|
||||||
if (s->mv_dir & MV_DIR_FORWARD)
|
|
||||||
{
|
|
||||||
s->last_mv[0][0][0]= s->mv[0][0][0];
|
|
||||||
s->last_mv[0][0][1]= s->mv[0][0][1];
|
|
||||||
}
|
|
||||||
if (s->mv_dir & MV_DIR_BACKWARD)
|
|
||||||
{
|
|
||||||
s->last_mv[1][0][0]= s->mv[1][0][0];
|
|
||||||
s->last_mv[1][0][1]= s->mv[1][0][1];
|
|
||||||
}
|
|
||||||
}
|
}
|
||||||
|
|
||||||
// RAL: Parameter added: f_or_b_code
|
// RAL: Parameter added: f_or_b_code
|
||||||
@ -1963,13 +1975,9 @@ static void mpeg_decode_picture_coding_extension(MpegEncContext *s)
|
|||||||
if(s->alternate_scan){
|
if(s->alternate_scan){
|
||||||
ff_init_scantable(s->dsp.idct_permutation, &s->inter_scantable , ff_alternate_vertical_scan);
|
ff_init_scantable(s->dsp.idct_permutation, &s->inter_scantable , ff_alternate_vertical_scan);
|
||||||
ff_init_scantable(s->dsp.idct_permutation, &s->intra_scantable , ff_alternate_vertical_scan);
|
ff_init_scantable(s->dsp.idct_permutation, &s->intra_scantable , ff_alternate_vertical_scan);
|
||||||
ff_init_scantable(s->dsp.idct_permutation, &s->intra_h_scantable, ff_alternate_vertical_scan);
|
|
||||||
ff_init_scantable(s->dsp.idct_permutation, &s->intra_v_scantable, ff_alternate_vertical_scan);
|
|
||||||
}else{
|
}else{
|
||||||
ff_init_scantable(s->dsp.idct_permutation, &s->inter_scantable , ff_zigzag_direct);
|
ff_init_scantable(s->dsp.idct_permutation, &s->inter_scantable , ff_zigzag_direct);
|
||||||
ff_init_scantable(s->dsp.idct_permutation, &s->intra_scantable , ff_zigzag_direct);
|
ff_init_scantable(s->dsp.idct_permutation, &s->intra_scantable , ff_zigzag_direct);
|
||||||
ff_init_scantable(s->dsp.idct_permutation, &s->intra_h_scantable, ff_alternate_horizontal_scan);
|
|
||||||
ff_init_scantable(s->dsp.idct_permutation, &s->intra_v_scantable, ff_alternate_vertical_scan);
|
|
||||||
}
|
}
|
||||||
|
|
||||||
/* composite display not parsed */
|
/* composite display not parsed */
|
||||||
@ -2103,10 +2111,10 @@ static int mpeg_decode_slice(AVCodecContext *avctx,
|
|||||||
s->qscale = get_qscale(s);
|
s->qscale = get_qscale(s);
|
||||||
if (s->first_slice && (s->first_field || s->picture_structure==PICT_FRAME)) {
|
if (s->first_slice && (s->first_field || s->picture_structure==PICT_FRAME)) {
|
||||||
if(s->avctx->debug&FF_DEBUG_PICT_INFO){
|
if(s->avctx->debug&FF_DEBUG_PICT_INFO){
|
||||||
av_log(s->avctx, AV_LOG_DEBUG, "qp:%d fc:%2d%2d%2d%2d %s %s %s %s dc:%d pstruct:%d fdct:%d cmv:%d qtype:%d ivlc:%d rff:%d %s\n",
|
av_log(s->avctx, AV_LOG_DEBUG, "qp:%d fc:%2d%2d%2d%2d %s %s %s %s %s dc:%d pstruct:%d fdct:%d cmv:%d qtype:%d ivlc:%d rff:%d %s\n",
|
||||||
s->qscale, s->mpeg_f_code[0][0],s->mpeg_f_code[0][1],s->mpeg_f_code[1][0],s->mpeg_f_code[1][1],
|
s->qscale, s->mpeg_f_code[0][0],s->mpeg_f_code[0][1],s->mpeg_f_code[1][0],s->mpeg_f_code[1][1],
|
||||||
s->pict_type == I_TYPE ? "I" : (s->pict_type == P_TYPE ? "P" : (s->pict_type == B_TYPE ? "B" : "S")),
|
s->pict_type == I_TYPE ? "I" : (s->pict_type == P_TYPE ? "P" : (s->pict_type == B_TYPE ? "B" : "S")),
|
||||||
s->progressive_sequence ? "pro" :"", s->alternate_scan ? "alt" :"", s->top_field_first ? "top" :"",
|
s->progressive_sequence ? "ps" :"", s->progressive_frame ? "pf" : "", s->alternate_scan ? "alt" :"", s->top_field_first ? "top" :"",
|
||||||
s->intra_dc_precision, s->picture_structure, s->frame_pred_frame_dct, s->concealment_motion_vectors,
|
s->intra_dc_precision, s->picture_structure, s->frame_pred_frame_dct, s->concealment_motion_vectors,
|
||||||
s->q_scale_type, s->intra_vlc_format, s->repeat_first_field, s->chroma_420_type ? "420" :"");
|
s->q_scale_type, s->intra_vlc_format, s->repeat_first_field, s->chroma_420_type ? "420" :"");
|
||||||
}
|
}
|
||||||
|
@ -252,8 +252,13 @@ int DCT_common_init(MpegEncContext *s)
|
|||||||
/* load & permutate scantables
|
/* load & permutate scantables
|
||||||
note: only wmv uses differnt ones
|
note: only wmv uses differnt ones
|
||||||
*/
|
*/
|
||||||
ff_init_scantable(s->dsp.idct_permutation, &s->inter_scantable , ff_zigzag_direct);
|
if(s->alternate_scan){
|
||||||
ff_init_scantable(s->dsp.idct_permutation, &s->intra_scantable , ff_zigzag_direct);
|
ff_init_scantable(s->dsp.idct_permutation, &s->inter_scantable , ff_alternate_vertical_scan);
|
||||||
|
ff_init_scantable(s->dsp.idct_permutation, &s->intra_scantable , ff_alternate_vertical_scan);
|
||||||
|
}else{
|
||||||
|
ff_init_scantable(s->dsp.idct_permutation, &s->inter_scantable , ff_zigzag_direct);
|
||||||
|
ff_init_scantable(s->dsp.idct_permutation, &s->intra_scantable , ff_zigzag_direct);
|
||||||
|
}
|
||||||
ff_init_scantable(s->dsp.idct_permutation, &s->intra_h_scantable, ff_alternate_horizontal_scan);
|
ff_init_scantable(s->dsp.idct_permutation, &s->intra_h_scantable, ff_alternate_horizontal_scan);
|
||||||
ff_init_scantable(s->dsp.idct_permutation, &s->intra_v_scantable, ff_alternate_vertical_scan);
|
ff_init_scantable(s->dsp.idct_permutation, &s->intra_v_scantable, ff_alternate_vertical_scan);
|
||||||
|
|
||||||
@ -394,7 +399,7 @@ static void free_picture(MpegEncContext *s, Picture *pic){
|
|||||||
/* init common structure for both encoder and decoder */
|
/* init common structure for both encoder and decoder */
|
||||||
int MPV_common_init(MpegEncContext *s)
|
int MPV_common_init(MpegEncContext *s)
|
||||||
{
|
{
|
||||||
int y_size, c_size, yc_size, i, mb_array_size, x, y;
|
int y_size, c_size, yc_size, i, mb_array_size, mv_table_size, x, y;
|
||||||
|
|
||||||
dsputil_init(&s->dsp, s->avctx);
|
dsputil_init(&s->dsp, s->avctx);
|
||||||
DCT_common_init(s);
|
DCT_common_init(s);
|
||||||
@ -407,6 +412,7 @@ int MPV_common_init(MpegEncContext *s)
|
|||||||
s->b8_stride = s->mb_width*2 + 1;
|
s->b8_stride = s->mb_width*2 + 1;
|
||||||
s->b4_stride = s->mb_width*4 + 1;
|
s->b4_stride = s->mb_width*4 + 1;
|
||||||
mb_array_size= s->mb_height * s->mb_stride;
|
mb_array_size= s->mb_height * s->mb_stride;
|
||||||
|
mv_table_size= (s->mb_height+2) * s->mb_stride + 1;
|
||||||
|
|
||||||
/* set default edge pos, will be overriden in decode_header if needed */
|
/* set default edge pos, will be overriden in decode_header if needed */
|
||||||
s->h_edge_pos= s->mb_width*16;
|
s->h_edge_pos= s->mb_width*16;
|
||||||
@ -458,8 +464,6 @@ int MPV_common_init(MpegEncContext *s)
|
|||||||
s->mb_index2xy[ s->mb_height*s->mb_width ] = (s->mb_height-1)*s->mb_stride + s->mb_width; //FIXME really needed?
|
s->mb_index2xy[ s->mb_height*s->mb_width ] = (s->mb_height-1)*s->mb_stride + s->mb_width; //FIXME really needed?
|
||||||
|
|
||||||
if (s->encoding) {
|
if (s->encoding) {
|
||||||
int mv_table_size= s->mb_stride * (s->mb_height+2) + 1;
|
|
||||||
|
|
||||||
/* Allocate MV tables */
|
/* Allocate MV tables */
|
||||||
CHECKED_ALLOCZ(s->p_mv_table_base , mv_table_size * 2 * sizeof(int16_t))
|
CHECKED_ALLOCZ(s->p_mv_table_base , mv_table_size * 2 * sizeof(int16_t))
|
||||||
CHECKED_ALLOCZ(s->b_forw_mv_table_base , mv_table_size * 2 * sizeof(int16_t))
|
CHECKED_ALLOCZ(s->b_forw_mv_table_base , mv_table_size * 2 * sizeof(int16_t))
|
||||||
@ -491,7 +495,7 @@ int MPV_common_init(MpegEncContext *s)
|
|||||||
CHECKED_ALLOCZ(s->avctx->stats_out, 256);
|
CHECKED_ALLOCZ(s->avctx->stats_out, 256);
|
||||||
|
|
||||||
/* Allocate MB type table */
|
/* Allocate MB type table */
|
||||||
CHECKED_ALLOCZ(s->mb_type , mb_array_size * sizeof(uint8_t)) //needed for encoding
|
CHECKED_ALLOCZ(s->mb_type , mb_array_size * sizeof(uint16_t)) //needed for encoding
|
||||||
|
|
||||||
CHECKED_ALLOCZ(s->lambda_table, mb_array_size * sizeof(int))
|
CHECKED_ALLOCZ(s->lambda_table, mb_array_size * sizeof(int))
|
||||||
|
|
||||||
@ -513,10 +517,21 @@ int MPV_common_init(MpegEncContext *s)
|
|||||||
|
|
||||||
CHECKED_ALLOCZ(s->error_status_table, mb_array_size*sizeof(uint8_t))
|
CHECKED_ALLOCZ(s->error_status_table, mb_array_size*sizeof(uint8_t))
|
||||||
|
|
||||||
if(s->codec_id==CODEC_ID_MPEG4){
|
if(s->codec_id==CODEC_ID_MPEG4 || (s->flags & CODEC_FLAG_INTERLACED_ME)){
|
||||||
/* interlaced direct mode decoding tables */
|
/* interlaced direct mode decoding tables */
|
||||||
CHECKED_ALLOCZ(s->field_mv_table, mb_array_size*2*2 * sizeof(int16_t))
|
for(i=0; i<2; i++){
|
||||||
CHECKED_ALLOCZ(s->field_select_table, mb_array_size*2* sizeof(int8_t))
|
int j, k;
|
||||||
|
for(j=0; j<2; j++){
|
||||||
|
for(k=0; k<2; k++){
|
||||||
|
CHECKED_ALLOCZ(s->b_field_mv_table_base[i][j][k] , mv_table_size * 2 * sizeof(int16_t))
|
||||||
|
s->b_field_mv_table[i][j][k] = s->b_field_mv_table_base[i][j][k] + s->mb_stride + 1;
|
||||||
|
}
|
||||||
|
CHECKED_ALLOCZ(s->b_field_select_table[i][j] , mb_array_size * 2 * sizeof(uint8_t))
|
||||||
|
CHECKED_ALLOCZ(s->p_field_mv_table_base[i][j] , mv_table_size * 2 * sizeof(int16_t))
|
||||||
|
s->p_field_mv_table[i][j] = s->p_field_mv_table_base[i][j] + s->mb_stride + 1;
|
||||||
|
}
|
||||||
|
CHECKED_ALLOCZ(s->p_field_select_table[i] , mb_array_size * 2 * sizeof(uint8_t))
|
||||||
|
}
|
||||||
}
|
}
|
||||||
if (s->out_format == FMT_H263) {
|
if (s->out_format == FMT_H263) {
|
||||||
/* ac values */
|
/* ac values */
|
||||||
@ -583,7 +598,7 @@ int MPV_common_init(MpegEncContext *s)
|
|||||||
/* init common structure for both encoder and decoder */
|
/* init common structure for both encoder and decoder */
|
||||||
void MPV_common_end(MpegEncContext *s)
|
void MPV_common_end(MpegEncContext *s)
|
||||||
{
|
{
|
||||||
int i;
|
int i, j, k;
|
||||||
|
|
||||||
av_freep(&s->parse_context.buffer);
|
av_freep(&s->parse_context.buffer);
|
||||||
s->parse_context.buffer_size=0;
|
s->parse_context.buffer_size=0;
|
||||||
@ -601,6 +616,18 @@ void MPV_common_end(MpegEncContext *s)
|
|||||||
s->b_bidir_forw_mv_table= NULL;
|
s->b_bidir_forw_mv_table= NULL;
|
||||||
s->b_bidir_back_mv_table= NULL;
|
s->b_bidir_back_mv_table= NULL;
|
||||||
s->b_direct_mv_table= NULL;
|
s->b_direct_mv_table= NULL;
|
||||||
|
for(i=0; i<2; i++){
|
||||||
|
for(j=0; j<2; j++){
|
||||||
|
for(k=0; k<2; k++){
|
||||||
|
av_freep(&s->b_field_mv_table_base[i][j][k]);
|
||||||
|
s->b_field_mv_table[i][j][k]=NULL;
|
||||||
|
}
|
||||||
|
av_freep(&s->b_field_select_table[i][j]);
|
||||||
|
av_freep(&s->p_field_mv_table_base[i][j]);
|
||||||
|
s->p_field_mv_table[i][j]=NULL;
|
||||||
|
}
|
||||||
|
av_freep(&s->p_field_select_table[i]);
|
||||||
|
}
|
||||||
|
|
||||||
av_freep(&s->dc_val[0]);
|
av_freep(&s->dc_val[0]);
|
||||||
av_freep(&s->ac_val[0]);
|
av_freep(&s->ac_val[0]);
|
||||||
@ -618,8 +645,6 @@ void MPV_common_end(MpegEncContext *s)
|
|||||||
av_freep(&s->tex_pb_buffer);
|
av_freep(&s->tex_pb_buffer);
|
||||||
av_freep(&s->pb2_buffer);
|
av_freep(&s->pb2_buffer);
|
||||||
av_freep(&s->allocated_edge_emu_buffer); s->edge_emu_buffer= NULL;
|
av_freep(&s->allocated_edge_emu_buffer); s->edge_emu_buffer= NULL;
|
||||||
av_freep(&s->field_mv_table);
|
|
||||||
av_freep(&s->field_select_table);
|
|
||||||
av_freep(&s->avctx->stats_out);
|
av_freep(&s->avctx->stats_out);
|
||||||
av_freep(&s->ac_stats);
|
av_freep(&s->ac_stats);
|
||||||
av_freep(&s->error_status_table);
|
av_freep(&s->error_status_table);
|
||||||
@ -692,7 +717,7 @@ int MPV_encode_init(AVCodecContext *avctx)
|
|||||||
s->me_method = avctx->me_method;
|
s->me_method = avctx->me_method;
|
||||||
|
|
||||||
/* Fixed QSCALE */
|
/* Fixed QSCALE */
|
||||||
s->fixed_qscale = (avctx->flags & CODEC_FLAG_QSCALE);
|
s->fixed_qscale = !!(avctx->flags & CODEC_FLAG_QSCALE);
|
||||||
|
|
||||||
s->adaptive_quant= ( s->avctx->lumi_masking
|
s->adaptive_quant= ( s->avctx->lumi_masking
|
||||||
|| s->avctx->dark_masking
|
|| s->avctx->dark_masking
|
||||||
@ -702,8 +727,9 @@ int MPV_encode_init(AVCodecContext *avctx)
|
|||||||
|| (s->flags&CODEC_FLAG_QP_RD))
|
|| (s->flags&CODEC_FLAG_QP_RD))
|
||||||
&& !s->fixed_qscale;
|
&& !s->fixed_qscale;
|
||||||
|
|
||||||
s->obmc= (s->flags & CODEC_FLAG_OBMC);
|
s->obmc= !!(s->flags & CODEC_FLAG_OBMC);
|
||||||
s->loop_filter= (s->flags & CODEC_FLAG_LOOP_FILTER);
|
s->loop_filter= !!(s->flags & CODEC_FLAG_LOOP_FILTER);
|
||||||
|
s->alternate_scan= !!(s->flags & CODEC_FLAG_ALT_SCAN);
|
||||||
|
|
||||||
if((s->flags & CODEC_FLAG_4MV) && s->codec_id != CODEC_ID_MPEG4
|
if((s->flags & CODEC_FLAG_4MV) && s->codec_id != CODEC_ID_MPEG4
|
||||||
&& s->codec_id != CODEC_ID_H263 && s->codec_id != CODEC_ID_H263P){
|
&& s->codec_id != CODEC_ID_H263 && s->codec_id != CODEC_ID_H263P){
|
||||||
@ -934,7 +960,7 @@ int MPV_encode_init(AVCodecContext *avctx)
|
|||||||
if(s->modified_quant)
|
if(s->modified_quant)
|
||||||
s->chroma_qscale_table= ff_h263_chroma_qscale_table;
|
s->chroma_qscale_table= ff_h263_chroma_qscale_table;
|
||||||
s->progressive_frame=
|
s->progressive_frame=
|
||||||
s->progressive_sequence= !(avctx->flags & CODEC_FLAG_INTERLACED_DCT);
|
s->progressive_sequence= !(avctx->flags & (CODEC_FLAG_INTERLACED_DCT|CODEC_FLAG_INTERLACED_ME));
|
||||||
|
|
||||||
ff_init_me(s);
|
ff_init_me(s);
|
||||||
|
|
||||||
@ -1610,7 +1636,7 @@ static int get_intra_count(MpegEncContext *s, uint8_t *src, uint8_t *ref, int st
|
|||||||
for(y=0; y<h; y+=16){
|
for(y=0; y<h; y+=16){
|
||||||
for(x=0; x<w; x+=16){
|
for(x=0; x<w; x+=16){
|
||||||
int offset= x + y*stride;
|
int offset= x + y*stride;
|
||||||
int sad = s->dsp.pix_abs16x16(src + offset, ref + offset, stride);
|
int sad = s->dsp.sad[0](NULL, src + offset, ref + offset, stride, 16);
|
||||||
int mean= (s->dsp.pix_sum(src + offset, stride) + 128)>>8;
|
int mean= (s->dsp.pix_sum(src + offset, stride) + 128)>>8;
|
||||||
int sae = get_sae(src + offset, mean, stride);
|
int sae = get_sae(src + offset, mean, stride);
|
||||||
|
|
||||||
@ -1906,7 +1932,7 @@ int MPV_encode_picture(AVCodecContext *avctx,
|
|||||||
if(s->avctx->rc_max_rate && s->avctx->rc_min_rate == s->avctx->rc_max_rate){
|
if(s->avctx->rc_max_rate && s->avctx->rc_min_rate == s->avctx->rc_max_rate){
|
||||||
int vbv_delay;
|
int vbv_delay;
|
||||||
|
|
||||||
assert(s->repeat_first_field==0 && s->avctx->repeat_pic==0);
|
assert(s->repeat_first_field==0);
|
||||||
|
|
||||||
vbv_delay= lrintf(90000 * s->rc_context.buffer_index / s->avctx->rc_max_rate);
|
vbv_delay= lrintf(90000 * s->rc_context.buffer_index / s->avctx->rc_max_rate);
|
||||||
assert(vbv_delay < 0xFFFF);
|
assert(vbv_delay < 0xFFFF);
|
||||||
@ -3417,12 +3443,12 @@ static void encode_mb(MpegEncContext *s, int motion_x, int motion_y)
|
|||||||
/* pre quantization */
|
/* pre quantization */
|
||||||
if(s->current_picture.mc_mb_var[s->mb_stride*mb_y+ mb_x]<2*s->qscale*s->qscale){
|
if(s->current_picture.mc_mb_var[s->mb_stride*mb_y+ mb_x]<2*s->qscale*s->qscale){
|
||||||
//FIXME optimize
|
//FIXME optimize
|
||||||
if(s->dsp.pix_abs8x8(ptr_y , dest_y , wrap_y) < 20*s->qscale) skip_dct[0]= 1;
|
if(s->dsp.sad[1](NULL, ptr_y , dest_y , wrap_y, 8) < 20*s->qscale) skip_dct[0]= 1;
|
||||||
if(s->dsp.pix_abs8x8(ptr_y + 8, dest_y + 8, wrap_y) < 20*s->qscale) skip_dct[1]= 1;
|
if(s->dsp.sad[1](NULL, ptr_y + 8, dest_y + 8, wrap_y, 8) < 20*s->qscale) skip_dct[1]= 1;
|
||||||
if(s->dsp.pix_abs8x8(ptr_y +dct_offset , dest_y +dct_offset , wrap_y) < 20*s->qscale) skip_dct[2]= 1;
|
if(s->dsp.sad[1](NULL, ptr_y +dct_offset , dest_y +dct_offset , wrap_y, 8) < 20*s->qscale) skip_dct[2]= 1;
|
||||||
if(s->dsp.pix_abs8x8(ptr_y +dct_offset+ 8, dest_y +dct_offset+ 8, wrap_y) < 20*s->qscale) skip_dct[3]= 1;
|
if(s->dsp.sad[1](NULL, ptr_y +dct_offset+ 8, dest_y +dct_offset+ 8, wrap_y, 8) < 20*s->qscale) skip_dct[3]= 1;
|
||||||
if(s->dsp.pix_abs8x8(ptr_cb , dest_cb , wrap_c) < 20*s->qscale) skip_dct[4]= 1;
|
if(s->dsp.sad[1](NULL, ptr_cb , dest_cb , wrap_c, 8) < 20*s->qscale) skip_dct[4]= 1;
|
||||||
if(s->dsp.pix_abs8x8(ptr_cr , dest_cr , wrap_c) < 20*s->qscale) skip_dct[5]= 1;
|
if(s->dsp.sad[1](NULL, ptr_cr , dest_cr , wrap_c, 8) < 20*s->qscale) skip_dct[5]= 1;
|
||||||
#if 0
|
#if 0
|
||||||
{
|
{
|
||||||
static int stat[7];
|
static int stat[7];
|
||||||
@ -3484,6 +3510,19 @@ static void encode_mb(MpegEncContext *s, int motion_x, int motion_y)
|
|||||||
s->block[5][0]= (1024 + s->c_dc_scale/2)/ s->c_dc_scale;
|
s->block[5][0]= (1024 + s->c_dc_scale/2)/ s->c_dc_scale;
|
||||||
}
|
}
|
||||||
|
|
||||||
|
//non c quantize code returns incorrect block_last_index FIXME
|
||||||
|
if(s->alternate_scan && s->dct_quantize != dct_quantize_c){
|
||||||
|
for(i=0; i<6; i++){
|
||||||
|
int j;
|
||||||
|
if(s->block_last_index[i]>0){
|
||||||
|
for(j=63; j>0; j--){
|
||||||
|
if(s->block[i][ s->intra_scantable.permutated[j] ]) break;
|
||||||
|
}
|
||||||
|
s->block_last_index[i]= j;
|
||||||
|
}
|
||||||
|
}
|
||||||
|
}
|
||||||
|
|
||||||
/* huffman encode */
|
/* huffman encode */
|
||||||
switch(s->codec_id){ //FIXME funct ptr could be slightly faster
|
switch(s->codec_id){ //FIXME funct ptr could be slightly faster
|
||||||
case CODEC_ID_MPEG1VIDEO:
|
case CODEC_ID_MPEG1VIDEO:
|
||||||
@ -3724,9 +3763,9 @@ static int sse(MpegEncContext *s, uint8_t *src1, uint8_t *src2, int w, int h, in
|
|||||||
int x,y;
|
int x,y;
|
||||||
|
|
||||||
if(w==16 && h==16)
|
if(w==16 && h==16)
|
||||||
return s->dsp.sse[0](NULL, src1, src2, stride);
|
return s->dsp.sse[0](NULL, src1, src2, stride, 16);
|
||||||
else if(w==8 && h==8)
|
else if(w==8 && h==8)
|
||||||
return s->dsp.sse[1](NULL, src1, src2, stride);
|
return s->dsp.sse[1](NULL, src1, src2, stride, 8);
|
||||||
|
|
||||||
for(y=0; y<h; y++){
|
for(y=0; y<h; y++){
|
||||||
for(x=0; x<w; x++){
|
for(x=0; x<w; x++){
|
||||||
@ -3747,9 +3786,9 @@ static int sse_mb(MpegEncContext *s){
|
|||||||
if(s->mb_y*16 + 16 > s->height) h= s->height- s->mb_y*16;
|
if(s->mb_y*16 + 16 > s->height) h= s->height- s->mb_y*16;
|
||||||
|
|
||||||
if(w==16 && h==16)
|
if(w==16 && h==16)
|
||||||
return s->dsp.sse[0](NULL, s->new_picture.data[0] + s->mb_x*16 + s->mb_y*s->linesize*16, s->dest[0], s->linesize)
|
return s->dsp.sse[0](NULL, s->new_picture.data[0] + s->mb_x*16 + s->mb_y*s->linesize*16, s->dest[0], s->linesize, 16)
|
||||||
+s->dsp.sse[1](NULL, s->new_picture.data[1] + s->mb_x*8 + s->mb_y*s->uvlinesize*8,s->dest[1], s->uvlinesize)
|
+s->dsp.sse[1](NULL, s->new_picture.data[1] + s->mb_x*8 + s->mb_y*s->uvlinesize*8,s->dest[1], s->uvlinesize, 8)
|
||||||
+s->dsp.sse[1](NULL, s->new_picture.data[2] + s->mb_x*8 + s->mb_y*s->uvlinesize*8,s->dest[2], s->uvlinesize);
|
+s->dsp.sse[1](NULL, s->new_picture.data[2] + s->mb_x*8 + s->mb_y*s->uvlinesize*8,s->dest[2], s->uvlinesize, 8);
|
||||||
else
|
else
|
||||||
return sse(s, s->new_picture.data[0] + s->mb_x*16 + s->mb_y*s->linesize*16, s->dest[0], w, h, s->linesize)
|
return sse(s, s->new_picture.data[0] + s->mb_x*16 + s->mb_y*s->linesize*16, s->dest[0], w, h, s->linesize)
|
||||||
+sse(s, s->new_picture.data[1] + s->mb_x*8 + s->mb_y*s->uvlinesize*8,s->dest[1], w>>1, h>>1, s->uvlinesize)
|
+sse(s, s->new_picture.data[1] + s->mb_x*8 + s->mb_y*s->uvlinesize*8,s->dest[1], w>>1, h>>1, s->uvlinesize)
|
||||||
@ -3759,7 +3798,7 @@ static int sse_mb(MpegEncContext *s){
|
|||||||
static void encode_picture(MpegEncContext *s, int picture_number)
|
static void encode_picture(MpegEncContext *s, int picture_number)
|
||||||
{
|
{
|
||||||
int mb_x, mb_y, pdif = 0;
|
int mb_x, mb_y, pdif = 0;
|
||||||
int i;
|
int i, j;
|
||||||
int bits;
|
int bits;
|
||||||
MpegEncContext best_s, backup_s;
|
MpegEncContext best_s, backup_s;
|
||||||
uint8_t bit_buf[2][3000];
|
uint8_t bit_buf[2][3000];
|
||||||
@ -3843,7 +3882,8 @@ static void encode_picture(MpegEncContext *s, int picture_number)
|
|||||||
//FIXME do we need to zero them?
|
//FIXME do we need to zero them?
|
||||||
memset(s->current_picture.motion_val[0][0], 0, sizeof(int16_t)*(s->mb_width*2 + 2)*(s->mb_height*2 + 2)*2);
|
memset(s->current_picture.motion_val[0][0], 0, sizeof(int16_t)*(s->mb_width*2 + 2)*(s->mb_height*2 + 2)*2);
|
||||||
memset(s->p_mv_table , 0, sizeof(int16_t)*(s->mb_stride)*s->mb_height*2);
|
memset(s->p_mv_table , 0, sizeof(int16_t)*(s->mb_stride)*s->mb_height*2);
|
||||||
memset(s->mb_type , MB_TYPE_INTRA, sizeof(uint8_t)*s->mb_stride*s->mb_height);
|
for(i=0; i<s->mb_stride*s->mb_height; i++)
|
||||||
|
s->mb_type[i]= CANDIDATE_MB_TYPE_INTRA;
|
||||||
|
|
||||||
if(!s->fixed_qscale){
|
if(!s->fixed_qscale){
|
||||||
/* finding spatial complexity for I-frame rate control */
|
/* finding spatial complexity for I-frame rate control */
|
||||||
@ -3868,32 +3908,61 @@ static void encode_picture(MpegEncContext *s, int picture_number)
|
|||||||
|
|
||||||
if(s->scene_change_score > s->avctx->scenechange_threshold && s->pict_type == P_TYPE){
|
if(s->scene_change_score > s->avctx->scenechange_threshold && s->pict_type == P_TYPE){
|
||||||
s->pict_type= I_TYPE;
|
s->pict_type= I_TYPE;
|
||||||
memset(s->mb_type , MB_TYPE_INTRA, sizeof(uint8_t)*s->mb_stride*s->mb_height);
|
for(i=0; i<s->mb_stride*s->mb_height; i++)
|
||||||
|
s->mb_type[i]= CANDIDATE_MB_TYPE_INTRA;
|
||||||
//printf("Scene change detected, encoding as I Frame %d %d\n", s->current_picture.mb_var_sum, s->current_picture.mc_mb_var_sum);
|
//printf("Scene change detected, encoding as I Frame %d %d\n", s->current_picture.mb_var_sum, s->current_picture.mc_mb_var_sum);
|
||||||
}
|
}
|
||||||
|
|
||||||
if(!s->umvplus){
|
if(!s->umvplus){
|
||||||
if(s->pict_type==P_TYPE || s->pict_type==S_TYPE) {
|
if(s->pict_type==P_TYPE || s->pict_type==S_TYPE) {
|
||||||
s->f_code= ff_get_best_fcode(s, s->p_mv_table, MB_TYPE_INTER);
|
s->f_code= ff_get_best_fcode(s, s->p_mv_table, CANDIDATE_MB_TYPE_INTER);
|
||||||
|
|
||||||
|
if(s->flags & CODEC_FLAG_INTERLACED_ME){
|
||||||
|
int a,b;
|
||||||
|
a= ff_get_best_fcode(s, s->p_field_mv_table[0][0], CANDIDATE_MB_TYPE_INTER_I); //FIXME field_select
|
||||||
|
b= ff_get_best_fcode(s, s->p_field_mv_table[1][1], CANDIDATE_MB_TYPE_INTER_I);
|
||||||
|
s->f_code= FFMAX(s->f_code, FFMAX(a,b));
|
||||||
|
}
|
||||||
|
|
||||||
ff_fix_long_p_mvs(s);
|
ff_fix_long_p_mvs(s);
|
||||||
|
ff_fix_long_mvs(s, NULL, 0, s->p_mv_table, s->f_code, CANDIDATE_MB_TYPE_INTER, 0);
|
||||||
|
if(s->flags & CODEC_FLAG_INTERLACED_ME){
|
||||||
|
for(i=0; i<2; i++){
|
||||||
|
for(j=0; j<2; j++)
|
||||||
|
ff_fix_long_mvs(s, s->p_field_select_table[i], j,
|
||||||
|
s->p_field_mv_table[i][j], s->f_code, CANDIDATE_MB_TYPE_INTER_I, 0);
|
||||||
|
}
|
||||||
|
}
|
||||||
}
|
}
|
||||||
|
|
||||||
if(s->pict_type==B_TYPE){
|
if(s->pict_type==B_TYPE){
|
||||||
int a, b;
|
int a, b;
|
||||||
|
|
||||||
a = ff_get_best_fcode(s, s->b_forw_mv_table, MB_TYPE_FORWARD);
|
a = ff_get_best_fcode(s, s->b_forw_mv_table, CANDIDATE_MB_TYPE_FORWARD);
|
||||||
b = ff_get_best_fcode(s, s->b_bidir_forw_mv_table, MB_TYPE_BIDIR);
|
b = ff_get_best_fcode(s, s->b_bidir_forw_mv_table, CANDIDATE_MB_TYPE_BIDIR);
|
||||||
s->f_code = FFMAX(a, b);
|
s->f_code = FFMAX(a, b);
|
||||||
|
|
||||||
a = ff_get_best_fcode(s, s->b_back_mv_table, MB_TYPE_BACKWARD);
|
a = ff_get_best_fcode(s, s->b_back_mv_table, CANDIDATE_MB_TYPE_BACKWARD);
|
||||||
b = ff_get_best_fcode(s, s->b_bidir_back_mv_table, MB_TYPE_BIDIR);
|
b = ff_get_best_fcode(s, s->b_bidir_back_mv_table, CANDIDATE_MB_TYPE_BIDIR);
|
||||||
s->b_code = FFMAX(a, b);
|
s->b_code = FFMAX(a, b);
|
||||||
|
|
||||||
ff_fix_long_b_mvs(s, s->b_forw_mv_table, s->f_code, MB_TYPE_FORWARD);
|
ff_fix_long_mvs(s, NULL, 0, s->b_forw_mv_table, s->f_code, CANDIDATE_MB_TYPE_FORWARD, 1);
|
||||||
ff_fix_long_b_mvs(s, s->b_back_mv_table, s->b_code, MB_TYPE_BACKWARD);
|
ff_fix_long_mvs(s, NULL, 0, s->b_back_mv_table, s->b_code, CANDIDATE_MB_TYPE_BACKWARD, 1);
|
||||||
ff_fix_long_b_mvs(s, s->b_bidir_forw_mv_table, s->f_code, MB_TYPE_BIDIR);
|
ff_fix_long_mvs(s, NULL, 0, s->b_bidir_forw_mv_table, s->f_code, CANDIDATE_MB_TYPE_BIDIR, 1);
|
||||||
ff_fix_long_b_mvs(s, s->b_bidir_back_mv_table, s->b_code, MB_TYPE_BIDIR);
|
ff_fix_long_mvs(s, NULL, 0, s->b_bidir_back_mv_table, s->b_code, CANDIDATE_MB_TYPE_BIDIR, 1);
|
||||||
|
if(s->flags & CODEC_FLAG_INTERLACED_ME){
|
||||||
|
int dir;
|
||||||
|
for(dir=0; dir<2; dir++){
|
||||||
|
for(i=0; i<2; i++){
|
||||||
|
for(j=0; j<2; j++){
|
||||||
|
int type= dir ? (CANDIDATE_MB_TYPE_BACKWARD_I|CANDIDATE_MB_TYPE_BIDIR_I)
|
||||||
|
: (CANDIDATE_MB_TYPE_FORWARD_I |CANDIDATE_MB_TYPE_BIDIR_I);
|
||||||
|
ff_fix_long_mvs(s, s->b_field_select_table[dir][i], j,
|
||||||
|
s->b_field_mv_table[dir][i][j], dir ? s->b_code : s->f_code, type, 1);
|
||||||
|
}
|
||||||
|
}
|
||||||
|
}
|
||||||
|
}
|
||||||
}
|
}
|
||||||
}
|
}
|
||||||
|
|
||||||
@ -3990,10 +4059,7 @@ static void encode_picture(MpegEncContext *s, int picture_number)
|
|||||||
s->current_picture_ptr->error[i] = 0;
|
s->current_picture_ptr->error[i] = 0;
|
||||||
}
|
}
|
||||||
s->mb_skip_run = 0;
|
s->mb_skip_run = 0;
|
||||||
s->last_mv[0][0][0] = 0;
|
memset(s->last_mv, 0, sizeof(s->last_mv));
|
||||||
s->last_mv[0][0][1] = 0;
|
|
||||||
s->last_mv[1][0][0] = 0;
|
|
||||||
s->last_mv[1][0][1] = 0;
|
|
||||||
|
|
||||||
s->last_mv_dir = 0;
|
s->last_mv_dir = 0;
|
||||||
|
|
||||||
@ -4027,6 +4093,7 @@ static void encode_picture(MpegEncContext *s, int picture_number)
|
|||||||
int mb_type= s->mb_type[xy];
|
int mb_type= s->mb_type[xy];
|
||||||
// int d;
|
// int d;
|
||||||
int dmin= INT_MAX;
|
int dmin= INT_MAX;
|
||||||
|
int dir;
|
||||||
|
|
||||||
s->mb_x = mb_x;
|
s->mb_x = mb_x;
|
||||||
ff_update_block_index(s);
|
ff_update_block_index(s);
|
||||||
@ -4134,25 +4201,37 @@ static void encode_picture(MpegEncContext *s, int picture_number)
|
|||||||
backup_s.tex_pb= s->tex_pb;
|
backup_s.tex_pb= s->tex_pb;
|
||||||
}
|
}
|
||||||
|
|
||||||
if(mb_type&MB_TYPE_INTER){
|
if(mb_type&CANDIDATE_MB_TYPE_INTER){
|
||||||
s->mv_dir = MV_DIR_FORWARD;
|
s->mv_dir = MV_DIR_FORWARD;
|
||||||
s->mv_type = MV_TYPE_16X16;
|
s->mv_type = MV_TYPE_16X16;
|
||||||
s->mb_intra= 0;
|
s->mb_intra= 0;
|
||||||
s->mv[0][0][0] = s->p_mv_table[xy][0];
|
s->mv[0][0][0] = s->p_mv_table[xy][0];
|
||||||
s->mv[0][0][1] = s->p_mv_table[xy][1];
|
s->mv[0][0][1] = s->p_mv_table[xy][1];
|
||||||
encode_mb_hq(s, &backup_s, &best_s, MB_TYPE_INTER, pb, pb2, tex_pb,
|
encode_mb_hq(s, &backup_s, &best_s, CANDIDATE_MB_TYPE_INTER, pb, pb2, tex_pb,
|
||||||
&dmin, &next_block, s->mv[0][0][0], s->mv[0][0][1]);
|
&dmin, &next_block, s->mv[0][0][0], s->mv[0][0][1]);
|
||||||
}
|
}
|
||||||
if(mb_type&MB_TYPE_SKIPED){
|
if(mb_type&CANDIDATE_MB_TYPE_INTER_I){
|
||||||
|
s->mv_dir = MV_DIR_FORWARD;
|
||||||
|
s->mv_type = MV_TYPE_FIELD;
|
||||||
|
s->mb_intra= 0;
|
||||||
|
for(i=0; i<2; i++){
|
||||||
|
j= s->field_select[0][i] = s->p_field_select_table[i][xy];
|
||||||
|
s->mv[0][i][0] = s->p_field_mv_table[i][j][xy][0];
|
||||||
|
s->mv[0][i][1] = s->p_field_mv_table[i][j][xy][1];
|
||||||
|
}
|
||||||
|
encode_mb_hq(s, &backup_s, &best_s, CANDIDATE_MB_TYPE_INTER_I, pb, pb2, tex_pb,
|
||||||
|
&dmin, &next_block, 0, 0);
|
||||||
|
}
|
||||||
|
if(mb_type&CANDIDATE_MB_TYPE_SKIPED){
|
||||||
s->mv_dir = MV_DIR_FORWARD;
|
s->mv_dir = MV_DIR_FORWARD;
|
||||||
s->mv_type = MV_TYPE_16X16;
|
s->mv_type = MV_TYPE_16X16;
|
||||||
s->mb_intra= 0;
|
s->mb_intra= 0;
|
||||||
s->mv[0][0][0] = 0;
|
s->mv[0][0][0] = 0;
|
||||||
s->mv[0][0][1] = 0;
|
s->mv[0][0][1] = 0;
|
||||||
encode_mb_hq(s, &backup_s, &best_s, MB_TYPE_SKIPED, pb, pb2, tex_pb,
|
encode_mb_hq(s, &backup_s, &best_s, CANDIDATE_MB_TYPE_SKIPED, pb, pb2, tex_pb,
|
||||||
&dmin, &next_block, s->mv[0][0][0], s->mv[0][0][1]);
|
&dmin, &next_block, s->mv[0][0][0], s->mv[0][0][1]);
|
||||||
}
|
}
|
||||||
if(mb_type&MB_TYPE_INTER4V){
|
if(mb_type&CANDIDATE_MB_TYPE_INTER4V){
|
||||||
s->mv_dir = MV_DIR_FORWARD;
|
s->mv_dir = MV_DIR_FORWARD;
|
||||||
s->mv_type = MV_TYPE_8X8;
|
s->mv_type = MV_TYPE_8X8;
|
||||||
s->mb_intra= 0;
|
s->mb_intra= 0;
|
||||||
@ -4160,28 +4239,28 @@ static void encode_picture(MpegEncContext *s, int picture_number)
|
|||||||
s->mv[0][i][0] = s->current_picture.motion_val[0][s->block_index[i]][0];
|
s->mv[0][i][0] = s->current_picture.motion_val[0][s->block_index[i]][0];
|
||||||
s->mv[0][i][1] = s->current_picture.motion_val[0][s->block_index[i]][1];
|
s->mv[0][i][1] = s->current_picture.motion_val[0][s->block_index[i]][1];
|
||||||
}
|
}
|
||||||
encode_mb_hq(s, &backup_s, &best_s, MB_TYPE_INTER4V, pb, pb2, tex_pb,
|
encode_mb_hq(s, &backup_s, &best_s, CANDIDATE_MB_TYPE_INTER4V, pb, pb2, tex_pb,
|
||||||
&dmin, &next_block, 0, 0);
|
&dmin, &next_block, 0, 0);
|
||||||
}
|
}
|
||||||
if(mb_type&MB_TYPE_FORWARD){
|
if(mb_type&CANDIDATE_MB_TYPE_FORWARD){
|
||||||
s->mv_dir = MV_DIR_FORWARD;
|
s->mv_dir = MV_DIR_FORWARD;
|
||||||
s->mv_type = MV_TYPE_16X16;
|
s->mv_type = MV_TYPE_16X16;
|
||||||
s->mb_intra= 0;
|
s->mb_intra= 0;
|
||||||
s->mv[0][0][0] = s->b_forw_mv_table[xy][0];
|
s->mv[0][0][0] = s->b_forw_mv_table[xy][0];
|
||||||
s->mv[0][0][1] = s->b_forw_mv_table[xy][1];
|
s->mv[0][0][1] = s->b_forw_mv_table[xy][1];
|
||||||
encode_mb_hq(s, &backup_s, &best_s, MB_TYPE_FORWARD, pb, pb2, tex_pb,
|
encode_mb_hq(s, &backup_s, &best_s, CANDIDATE_MB_TYPE_FORWARD, pb, pb2, tex_pb,
|
||||||
&dmin, &next_block, s->mv[0][0][0], s->mv[0][0][1]);
|
&dmin, &next_block, s->mv[0][0][0], s->mv[0][0][1]);
|
||||||
}
|
}
|
||||||
if(mb_type&MB_TYPE_BACKWARD){
|
if(mb_type&CANDIDATE_MB_TYPE_BACKWARD){
|
||||||
s->mv_dir = MV_DIR_BACKWARD;
|
s->mv_dir = MV_DIR_BACKWARD;
|
||||||
s->mv_type = MV_TYPE_16X16;
|
s->mv_type = MV_TYPE_16X16;
|
||||||
s->mb_intra= 0;
|
s->mb_intra= 0;
|
||||||
s->mv[1][0][0] = s->b_back_mv_table[xy][0];
|
s->mv[1][0][0] = s->b_back_mv_table[xy][0];
|
||||||
s->mv[1][0][1] = s->b_back_mv_table[xy][1];
|
s->mv[1][0][1] = s->b_back_mv_table[xy][1];
|
||||||
encode_mb_hq(s, &backup_s, &best_s, MB_TYPE_BACKWARD, pb, pb2, tex_pb,
|
encode_mb_hq(s, &backup_s, &best_s, CANDIDATE_MB_TYPE_BACKWARD, pb, pb2, tex_pb,
|
||||||
&dmin, &next_block, s->mv[1][0][0], s->mv[1][0][1]);
|
&dmin, &next_block, s->mv[1][0][0], s->mv[1][0][1]);
|
||||||
}
|
}
|
||||||
if(mb_type&MB_TYPE_BIDIR){
|
if(mb_type&CANDIDATE_MB_TYPE_BIDIR){
|
||||||
s->mv_dir = MV_DIR_FORWARD | MV_DIR_BACKWARD;
|
s->mv_dir = MV_DIR_FORWARD | MV_DIR_BACKWARD;
|
||||||
s->mv_type = MV_TYPE_16X16;
|
s->mv_type = MV_TYPE_16X16;
|
||||||
s->mb_intra= 0;
|
s->mb_intra= 0;
|
||||||
@ -4189,10 +4268,10 @@ static void encode_picture(MpegEncContext *s, int picture_number)
|
|||||||
s->mv[0][0][1] = s->b_bidir_forw_mv_table[xy][1];
|
s->mv[0][0][1] = s->b_bidir_forw_mv_table[xy][1];
|
||||||
s->mv[1][0][0] = s->b_bidir_back_mv_table[xy][0];
|
s->mv[1][0][0] = s->b_bidir_back_mv_table[xy][0];
|
||||||
s->mv[1][0][1] = s->b_bidir_back_mv_table[xy][1];
|
s->mv[1][0][1] = s->b_bidir_back_mv_table[xy][1];
|
||||||
encode_mb_hq(s, &backup_s, &best_s, MB_TYPE_BIDIR, pb, pb2, tex_pb,
|
encode_mb_hq(s, &backup_s, &best_s, CANDIDATE_MB_TYPE_BIDIR, pb, pb2, tex_pb,
|
||||||
&dmin, &next_block, 0, 0);
|
&dmin, &next_block, 0, 0);
|
||||||
}
|
}
|
||||||
if(mb_type&MB_TYPE_DIRECT){
|
if(mb_type&CANDIDATE_MB_TYPE_DIRECT){
|
||||||
int mx= s->b_direct_mv_table[xy][0];
|
int mx= s->b_direct_mv_table[xy][0];
|
||||||
int my= s->b_direct_mv_table[xy][1];
|
int my= s->b_direct_mv_table[xy][1];
|
||||||
|
|
||||||
@ -4201,16 +4280,54 @@ static void encode_picture(MpegEncContext *s, int picture_number)
|
|||||||
#ifdef CONFIG_RISKY
|
#ifdef CONFIG_RISKY
|
||||||
ff_mpeg4_set_direct_mv(s, mx, my);
|
ff_mpeg4_set_direct_mv(s, mx, my);
|
||||||
#endif
|
#endif
|
||||||
encode_mb_hq(s, &backup_s, &best_s, MB_TYPE_DIRECT, pb, pb2, tex_pb,
|
encode_mb_hq(s, &backup_s, &best_s, CANDIDATE_MB_TYPE_DIRECT, pb, pb2, tex_pb,
|
||||||
&dmin, &next_block, mx, my);
|
&dmin, &next_block, mx, my);
|
||||||
}
|
}
|
||||||
if(mb_type&MB_TYPE_INTRA){
|
if(mb_type&CANDIDATE_MB_TYPE_FORWARD_I){
|
||||||
|
s->mv_dir = MV_DIR_FORWARD;
|
||||||
|
s->mv_type = MV_TYPE_FIELD;
|
||||||
|
s->mb_intra= 0;
|
||||||
|
for(i=0; i<2; i++){
|
||||||
|
j= s->field_select[0][i] = s->b_field_select_table[0][i][xy];
|
||||||
|
s->mv[0][i][0] = s->b_field_mv_table[0][i][j][xy][0];
|
||||||
|
s->mv[0][i][1] = s->b_field_mv_table[0][i][j][xy][1];
|
||||||
|
}
|
||||||
|
encode_mb_hq(s, &backup_s, &best_s, CANDIDATE_MB_TYPE_FORWARD_I, pb, pb2, tex_pb,
|
||||||
|
&dmin, &next_block, 0, 0);
|
||||||
|
}
|
||||||
|
if(mb_type&CANDIDATE_MB_TYPE_BACKWARD_I){
|
||||||
|
s->mv_dir = MV_DIR_BACKWARD;
|
||||||
|
s->mv_type = MV_TYPE_FIELD;
|
||||||
|
s->mb_intra= 0;
|
||||||
|
for(i=0; i<2; i++){
|
||||||
|
j= s->field_select[1][i] = s->b_field_select_table[1][i][xy];
|
||||||
|
s->mv[1][i][0] = s->b_field_mv_table[1][i][j][xy][0];
|
||||||
|
s->mv[1][i][1] = s->b_field_mv_table[1][i][j][xy][1];
|
||||||
|
}
|
||||||
|
encode_mb_hq(s, &backup_s, &best_s, CANDIDATE_MB_TYPE_BACKWARD_I, pb, pb2, tex_pb,
|
||||||
|
&dmin, &next_block, 0, 0);
|
||||||
|
}
|
||||||
|
if(mb_type&CANDIDATE_MB_TYPE_BIDIR_I){
|
||||||
|
s->mv_dir = MV_DIR_FORWARD | MV_DIR_BACKWARD;
|
||||||
|
s->mv_type = MV_TYPE_FIELD;
|
||||||
|
s->mb_intra= 0;
|
||||||
|
for(dir=0; dir<2; dir++){
|
||||||
|
for(i=0; i<2; i++){
|
||||||
|
j= s->field_select[dir][i] = s->b_field_select_table[dir][i][xy];
|
||||||
|
s->mv[dir][i][0] = s->b_field_mv_table[dir][i][j][xy][0];
|
||||||
|
s->mv[dir][i][1] = s->b_field_mv_table[dir][i][j][xy][1];
|
||||||
|
}
|
||||||
|
}
|
||||||
|
encode_mb_hq(s, &backup_s, &best_s, CANDIDATE_MB_TYPE_BIDIR_I, pb, pb2, tex_pb,
|
||||||
|
&dmin, &next_block, 0, 0);
|
||||||
|
}
|
||||||
|
if(mb_type&CANDIDATE_MB_TYPE_INTRA){
|
||||||
s->mv_dir = 0;
|
s->mv_dir = 0;
|
||||||
s->mv_type = MV_TYPE_16X16;
|
s->mv_type = MV_TYPE_16X16;
|
||||||
s->mb_intra= 1;
|
s->mb_intra= 1;
|
||||||
s->mv[0][0][0] = 0;
|
s->mv[0][0][0] = 0;
|
||||||
s->mv[0][0][1] = 0;
|
s->mv[0][0][1] = 0;
|
||||||
encode_mb_hq(s, &backup_s, &best_s, MB_TYPE_INTRA, pb, pb2, tex_pb,
|
encode_mb_hq(s, &backup_s, &best_s, CANDIDATE_MB_TYPE_INTRA, pb, pb2, tex_pb,
|
||||||
&dmin, &next_block, 0, 0);
|
&dmin, &next_block, 0, 0);
|
||||||
if(s->h263_pred || s->h263_aic){
|
if(s->h263_pred || s->h263_aic){
|
||||||
if(best_s.mb_intra)
|
if(best_s.mb_intra)
|
||||||
@ -4252,7 +4369,7 @@ static void encode_picture(MpegEncContext *s, int picture_number)
|
|||||||
}
|
}
|
||||||
}
|
}
|
||||||
|
|
||||||
encode_mb_hq(s, &backup_s, &best_s, MB_TYPE_INTER /* wrong but unused */, pb, pb2, tex_pb,
|
encode_mb_hq(s, &backup_s, &best_s, CANDIDATE_MB_TYPE_INTER /* wrong but unused */, pb, pb2, tex_pb,
|
||||||
&dmin, &next_block, s->mv[mvdir][0][0], s->mv[mvdir][0][1]);
|
&dmin, &next_block, s->mv[mvdir][0][0], s->mv[mvdir][0][1]);
|
||||||
if(best_s.qscale != qp){
|
if(best_s.qscale != qp){
|
||||||
if(s->mb_intra){
|
if(s->mb_intra){
|
||||||
@ -4312,19 +4429,30 @@ static void encode_picture(MpegEncContext *s, int picture_number)
|
|||||||
// only one MB-Type possible
|
// only one MB-Type possible
|
||||||
|
|
||||||
switch(mb_type){
|
switch(mb_type){
|
||||||
case MB_TYPE_INTRA:
|
case CANDIDATE_MB_TYPE_INTRA:
|
||||||
s->mv_dir = 0;
|
s->mv_dir = 0;
|
||||||
s->mb_intra= 1;
|
s->mb_intra= 1;
|
||||||
motion_x= s->mv[0][0][0] = 0;
|
motion_x= s->mv[0][0][0] = 0;
|
||||||
motion_y= s->mv[0][0][1] = 0;
|
motion_y= s->mv[0][0][1] = 0;
|
||||||
break;
|
break;
|
||||||
case MB_TYPE_INTER:
|
case CANDIDATE_MB_TYPE_INTER:
|
||||||
s->mv_dir = MV_DIR_FORWARD;
|
s->mv_dir = MV_DIR_FORWARD;
|
||||||
s->mb_intra= 0;
|
s->mb_intra= 0;
|
||||||
motion_x= s->mv[0][0][0] = s->p_mv_table[xy][0];
|
motion_x= s->mv[0][0][0] = s->p_mv_table[xy][0];
|
||||||
motion_y= s->mv[0][0][1] = s->p_mv_table[xy][1];
|
motion_y= s->mv[0][0][1] = s->p_mv_table[xy][1];
|
||||||
break;
|
break;
|
||||||
case MB_TYPE_INTER4V:
|
case CANDIDATE_MB_TYPE_INTER_I:
|
||||||
|
s->mv_dir = MV_DIR_FORWARD;
|
||||||
|
s->mv_type = MV_TYPE_FIELD;
|
||||||
|
s->mb_intra= 0;
|
||||||
|
for(i=0; i<2; i++){
|
||||||
|
j= s->field_select[0][i] = s->p_field_select_table[i][xy];
|
||||||
|
s->mv[0][i][0] = s->p_field_mv_table[i][j][xy][0];
|
||||||
|
s->mv[0][i][1] = s->p_field_mv_table[i][j][xy][1];
|
||||||
|
}
|
||||||
|
motion_x = motion_y = 0;
|
||||||
|
break;
|
||||||
|
case CANDIDATE_MB_TYPE_INTER4V:
|
||||||
s->mv_dir = MV_DIR_FORWARD;
|
s->mv_dir = MV_DIR_FORWARD;
|
||||||
s->mv_type = MV_TYPE_8X8;
|
s->mv_type = MV_TYPE_8X8;
|
||||||
s->mb_intra= 0;
|
s->mb_intra= 0;
|
||||||
@ -4334,7 +4462,7 @@ static void encode_picture(MpegEncContext *s, int picture_number)
|
|||||||
}
|
}
|
||||||
motion_x= motion_y= 0;
|
motion_x= motion_y= 0;
|
||||||
break;
|
break;
|
||||||
case MB_TYPE_DIRECT:
|
case CANDIDATE_MB_TYPE_DIRECT:
|
||||||
s->mv_dir = MV_DIR_FORWARD | MV_DIR_BACKWARD | MV_DIRECT;
|
s->mv_dir = MV_DIR_FORWARD | MV_DIR_BACKWARD | MV_DIRECT;
|
||||||
s->mb_intra= 0;
|
s->mb_intra= 0;
|
||||||
motion_x=s->b_direct_mv_table[xy][0];
|
motion_x=s->b_direct_mv_table[xy][0];
|
||||||
@ -4343,7 +4471,7 @@ static void encode_picture(MpegEncContext *s, int picture_number)
|
|||||||
ff_mpeg4_set_direct_mv(s, motion_x, motion_y);
|
ff_mpeg4_set_direct_mv(s, motion_x, motion_y);
|
||||||
#endif
|
#endif
|
||||||
break;
|
break;
|
||||||
case MB_TYPE_BIDIR:
|
case CANDIDATE_MB_TYPE_BIDIR:
|
||||||
s->mv_dir = MV_DIR_FORWARD | MV_DIR_BACKWARD;
|
s->mv_dir = MV_DIR_FORWARD | MV_DIR_BACKWARD;
|
||||||
s->mb_intra= 0;
|
s->mb_intra= 0;
|
||||||
motion_x=0;
|
motion_x=0;
|
||||||
@ -4353,19 +4481,54 @@ static void encode_picture(MpegEncContext *s, int picture_number)
|
|||||||
s->mv[1][0][0] = s->b_bidir_back_mv_table[xy][0];
|
s->mv[1][0][0] = s->b_bidir_back_mv_table[xy][0];
|
||||||
s->mv[1][0][1] = s->b_bidir_back_mv_table[xy][1];
|
s->mv[1][0][1] = s->b_bidir_back_mv_table[xy][1];
|
||||||
break;
|
break;
|
||||||
case MB_TYPE_BACKWARD:
|
case CANDIDATE_MB_TYPE_BACKWARD:
|
||||||
s->mv_dir = MV_DIR_BACKWARD;
|
s->mv_dir = MV_DIR_BACKWARD;
|
||||||
s->mb_intra= 0;
|
s->mb_intra= 0;
|
||||||
motion_x= s->mv[1][0][0] = s->b_back_mv_table[xy][0];
|
motion_x= s->mv[1][0][0] = s->b_back_mv_table[xy][0];
|
||||||
motion_y= s->mv[1][0][1] = s->b_back_mv_table[xy][1];
|
motion_y= s->mv[1][0][1] = s->b_back_mv_table[xy][1];
|
||||||
break;
|
break;
|
||||||
case MB_TYPE_FORWARD:
|
case CANDIDATE_MB_TYPE_FORWARD:
|
||||||
s->mv_dir = MV_DIR_FORWARD;
|
s->mv_dir = MV_DIR_FORWARD;
|
||||||
s->mb_intra= 0;
|
s->mb_intra= 0;
|
||||||
motion_x= s->mv[0][0][0] = s->b_forw_mv_table[xy][0];
|
motion_x= s->mv[0][0][0] = s->b_forw_mv_table[xy][0];
|
||||||
motion_y= s->mv[0][0][1] = s->b_forw_mv_table[xy][1];
|
motion_y= s->mv[0][0][1] = s->b_forw_mv_table[xy][1];
|
||||||
// printf(" %d %d ", motion_x, motion_y);
|
// printf(" %d %d ", motion_x, motion_y);
|
||||||
break;
|
break;
|
||||||
|
case CANDIDATE_MB_TYPE_FORWARD_I:
|
||||||
|
s->mv_dir = MV_DIR_FORWARD;
|
||||||
|
s->mv_type = MV_TYPE_FIELD;
|
||||||
|
s->mb_intra= 0;
|
||||||
|
for(i=0; i<2; i++){
|
||||||
|
j= s->field_select[0][i] = s->b_field_select_table[0][i][xy];
|
||||||
|
s->mv[0][i][0] = s->b_field_mv_table[0][i][j][xy][0];
|
||||||
|
s->mv[0][i][1] = s->b_field_mv_table[0][i][j][xy][1];
|
||||||
|
}
|
||||||
|
motion_x=motion_y=0;
|
||||||
|
break;
|
||||||
|
case CANDIDATE_MB_TYPE_BACKWARD_I:
|
||||||
|
s->mv_dir = MV_DIR_BACKWARD;
|
||||||
|
s->mv_type = MV_TYPE_FIELD;
|
||||||
|
s->mb_intra= 0;
|
||||||
|
for(i=0; i<2; i++){
|
||||||
|
j= s->field_select[1][i] = s->b_field_select_table[1][i][xy];
|
||||||
|
s->mv[1][i][0] = s->b_field_mv_table[1][i][j][xy][0];
|
||||||
|
s->mv[1][i][1] = s->b_field_mv_table[1][i][j][xy][1];
|
||||||
|
}
|
||||||
|
motion_x=motion_y=0;
|
||||||
|
break;
|
||||||
|
case CANDIDATE_MB_TYPE_BIDIR_I:
|
||||||
|
s->mv_dir = MV_DIR_FORWARD | MV_DIR_BACKWARD;
|
||||||
|
s->mv_type = MV_TYPE_FIELD;
|
||||||
|
s->mb_intra= 0;
|
||||||
|
for(dir=0; dir<2; dir++){
|
||||||
|
for(i=0; i<2; i++){
|
||||||
|
j= s->field_select[dir][i] = s->b_field_select_table[dir][i][xy];
|
||||||
|
s->mv[dir][i][0] = s->b_field_mv_table[dir][i][j][xy][0];
|
||||||
|
s->mv[dir][i][1] = s->b_field_mv_table[dir][i][j][xy][1];
|
||||||
|
}
|
||||||
|
}
|
||||||
|
motion_x=motion_y=0;
|
||||||
|
break;
|
||||||
default:
|
default:
|
||||||
motion_x=motion_y=0; //gcc warning fix
|
motion_x=motion_y=0; //gcc warning fix
|
||||||
av_log(s->avctx, AV_LOG_ERROR, "illegal MB type\n");
|
av_log(s->avctx, AV_LOG_ERROR, "illegal MB type\n");
|
||||||
|
@ -137,6 +137,7 @@ typedef struct Picture{
|
|||||||
int16_t (*motion_val_base[2])[2];
|
int16_t (*motion_val_base[2])[2];
|
||||||
int8_t *ref_index[2];
|
int8_t *ref_index[2];
|
||||||
uint32_t *mb_type_base;
|
uint32_t *mb_type_base;
|
||||||
|
#define MB_TYPE_INTRA MB_TYPE_INTRA4x4 //default mb_type if theres just one type
|
||||||
#define IS_INTRA4x4(a) ((a)&MB_TYPE_INTRA4x4)
|
#define IS_INTRA4x4(a) ((a)&MB_TYPE_INTRA4x4)
|
||||||
#define IS_INTRA16x16(a) ((a)&MB_TYPE_INTRA16x16)
|
#define IS_INTRA16x16(a) ((a)&MB_TYPE_INTRA16x16)
|
||||||
#define IS_PCM(a) ((a)&MB_TYPE_INTRA_PCM)
|
#define IS_PCM(a) ((a)&MB_TYPE_INTRA_PCM)
|
||||||
@ -206,23 +207,28 @@ typedef struct MotionEstContext{
|
|||||||
int mb_penalty_factor;
|
int mb_penalty_factor;
|
||||||
int pre_pass; ///< = 1 for the pre pass
|
int pre_pass; ///< = 1 for the pre pass
|
||||||
int dia_size;
|
int dia_size;
|
||||||
|
int xmin;
|
||||||
|
int xmax;
|
||||||
|
int ymin;
|
||||||
|
int ymax;
|
||||||
uint8_t (*mv_penalty)[MAX_MV*2+1]; ///< amount of bits needed to encode a MV
|
uint8_t (*mv_penalty)[MAX_MV*2+1]; ///< amount of bits needed to encode a MV
|
||||||
int (*sub_motion_search)(struct MpegEncContext * s,
|
int (*sub_motion_search)(struct MpegEncContext * s,
|
||||||
int *mx_ptr, int *my_ptr, int dmin,
|
int *mx_ptr, int *my_ptr, int dmin,
|
||||||
int xmin, int ymin, int xmax, int ymax,
|
int pred_x, int pred_y, uint8_t *src_data[3],
|
||||||
int pred_x, int pred_y, Picture *ref_picture,
|
uint8_t *ref_data[6], int stride, int uvstride,
|
||||||
int n, int size, uint8_t * const mv_penalty);
|
int size, int h, uint8_t * const mv_penalty);
|
||||||
int (*motion_search[7])(struct MpegEncContext * s, int block,
|
int (*motion_search[7])(struct MpegEncContext * s,
|
||||||
int *mx_ptr, int *my_ptr,
|
int *mx_ptr, int *my_ptr,
|
||||||
int P[10][2], int pred_x, int pred_y,
|
int P[10][2], int pred_x, int pred_y, uint8_t *src_data[3],
|
||||||
int xmin, int ymin, int xmax, int ymax, Picture *ref_picture, int16_t (*last_mv)[2],
|
uint8_t *ref_data[6], int stride, int uvstride, int16_t (*last_mv)[2],
|
||||||
int ref_mv_scale, uint8_t * const mv_penalty);
|
int ref_mv_scale, uint8_t * const mv_penalty);
|
||||||
int (*pre_motion_search)(struct MpegEncContext * s, int block,
|
int (*pre_motion_search)(struct MpegEncContext * s,
|
||||||
int *mx_ptr, int *my_ptr,
|
int *mx_ptr, int *my_ptr,
|
||||||
int P[10][2], int pred_x, int pred_y,
|
int P[10][2], int pred_x, int pred_y, uint8_t *src_data[3],
|
||||||
int xmin, int ymin, int xmax, int ymax, Picture *ref_picture, int16_t (*last_mv)[2],
|
uint8_t *ref_data[6], int stride, int uvstride, int16_t (*last_mv)[2],
|
||||||
int ref_mv_scale, uint8_t * const mv_penalty);
|
int ref_mv_scale, uint8_t * const mv_penalty);
|
||||||
int (*get_mb_score)(struct MpegEncContext * s, int mx, int my, int pred_x, int pred_y, Picture *ref_picture,
|
int (*get_mb_score)(struct MpegEncContext * s, int mx, int my, int pred_x, int pred_y, uint8_t *src_data[3],
|
||||||
|
uint8_t *ref_data[6], int stride, int uvstride,
|
||||||
uint8_t * const mv_penalty);
|
uint8_t * const mv_penalty);
|
||||||
}MotionEstContext;
|
}MotionEstContext;
|
||||||
|
|
||||||
@ -351,12 +357,18 @@ typedef struct MpegEncContext {
|
|||||||
int16_t (*b_bidir_forw_mv_table_base)[2];
|
int16_t (*b_bidir_forw_mv_table_base)[2];
|
||||||
int16_t (*b_bidir_back_mv_table_base)[2];
|
int16_t (*b_bidir_back_mv_table_base)[2];
|
||||||
int16_t (*b_direct_mv_table_base)[2];
|
int16_t (*b_direct_mv_table_base)[2];
|
||||||
|
int16_t (*p_field_mv_table_base[2][2])[2];
|
||||||
|
int16_t (*b_field_mv_table_base[2][2][2])[2];
|
||||||
int16_t (*p_mv_table)[2]; ///< MV table (1MV per MB) p-frame encoding
|
int16_t (*p_mv_table)[2]; ///< MV table (1MV per MB) p-frame encoding
|
||||||
int16_t (*b_forw_mv_table)[2]; ///< MV table (1MV per MB) forward mode b-frame encoding
|
int16_t (*b_forw_mv_table)[2]; ///< MV table (1MV per MB) forward mode b-frame encoding
|
||||||
int16_t (*b_back_mv_table)[2]; ///< MV table (1MV per MB) backward mode b-frame encoding
|
int16_t (*b_back_mv_table)[2]; ///< MV table (1MV per MB) backward mode b-frame encoding
|
||||||
int16_t (*b_bidir_forw_mv_table)[2]; ///< MV table (1MV per MB) bidir mode b-frame encoding
|
int16_t (*b_bidir_forw_mv_table)[2]; ///< MV table (1MV per MB) bidir mode b-frame encoding
|
||||||
int16_t (*b_bidir_back_mv_table)[2]; ///< MV table (1MV per MB) bidir mode b-frame encoding
|
int16_t (*b_bidir_back_mv_table)[2]; ///< MV table (1MV per MB) bidir mode b-frame encoding
|
||||||
int16_t (*b_direct_mv_table)[2]; ///< MV table (1MV per MB) direct mode b-frame encoding
|
int16_t (*b_direct_mv_table)[2]; ///< MV table (1MV per MB) direct mode b-frame encoding
|
||||||
|
int16_t (*p_field_mv_table[2][2])[2]; ///< MV table (2MV per MB) interlaced p-frame encoding
|
||||||
|
int16_t (*b_field_mv_table[2][2][2])[2];///< MV table (4MV per MB) interlaced b-frame encoding
|
||||||
|
uint8_t (*p_field_select_table[2]);
|
||||||
|
uint8_t (*b_field_select_table[2][2]);
|
||||||
int me_method; ///< ME algorithm
|
int me_method; ///< ME algorithm
|
||||||
int scene_change_score;
|
int scene_change_score;
|
||||||
int mv_dir;
|
int mv_dir;
|
||||||
@ -391,17 +403,22 @@ typedef struct MpegEncContext {
|
|||||||
int mb_x, mb_y;
|
int mb_x, mb_y;
|
||||||
int mb_skip_run;
|
int mb_skip_run;
|
||||||
int mb_intra;
|
int mb_intra;
|
||||||
uint8_t *mb_type; ///< Table for MB type FIXME remove and use picture->mb_type
|
uint16_t *mb_type; ///< Table for candidate MB types for encoding
|
||||||
#define MB_TYPE_INTRA 0x01
|
#define CANDIDATE_MB_TYPE_INTRA 0x01
|
||||||
#define MB_TYPE_INTER 0x02
|
#define CANDIDATE_MB_TYPE_INTER 0x02
|
||||||
#define MB_TYPE_INTER4V 0x04
|
#define CANDIDATE_MB_TYPE_INTER4V 0x04
|
||||||
#define MB_TYPE_SKIPED 0x08
|
#define CANDIDATE_MB_TYPE_SKIPED 0x08
|
||||||
//#define MB_TYPE_GMC 0x10
|
//#define MB_TYPE_GMC 0x10
|
||||||
|
|
||||||
#define MB_TYPE_DIRECT 0x10
|
#define CANDIDATE_MB_TYPE_DIRECT 0x10
|
||||||
#define MB_TYPE_FORWARD 0x20
|
#define CANDIDATE_MB_TYPE_FORWARD 0x20
|
||||||
#define MB_TYPE_BACKWARD 0x40
|
#define CANDIDATE_MB_TYPE_BACKWARD 0x40
|
||||||
#define MB_TYPE_BIDIR 0x80
|
#define CANDIDATE_MB_TYPE_BIDIR 0x80
|
||||||
|
|
||||||
|
#define CANDIDATE_MB_TYPE_INTER_I 0x100
|
||||||
|
#define CANDIDATE_MB_TYPE_FORWARD_I 0x200
|
||||||
|
#define CANDIDATE_MB_TYPE_BACKWARD_I 0x400
|
||||||
|
#define CANDIDATE_MB_TYPE_BIDIR_I 0x800
|
||||||
|
|
||||||
int block_index[6]; ///< index to current MB in block based arrays with edges
|
int block_index[6]; ///< index to current MB in block based arrays with edges
|
||||||
int block_wrap[6];
|
int block_wrap[6];
|
||||||
@ -551,8 +568,6 @@ typedef struct MpegEncContext {
|
|||||||
uint8_t *tex_pb_buffer;
|
uint8_t *tex_pb_buffer;
|
||||||
uint8_t *pb2_buffer;
|
uint8_t *pb2_buffer;
|
||||||
int mpeg_quant;
|
int mpeg_quant;
|
||||||
int16_t (*field_mv_table)[2][2]; ///< used for interlaced b frame decoding
|
|
||||||
int8_t (*field_select_table)[2]; ///< wtf, no really another table for interlaced b frames
|
|
||||||
int t_frame; ///< time distance of first I -> B, used for interlaced b frames
|
int t_frame; ///< time distance of first I -> B, used for interlaced b frames
|
||||||
int padding_bug_score; ///< used to detect the VERY common padding bug in MPEG4
|
int padding_bug_score; ///< used to detect the VERY common padding bug in MPEG4
|
||||||
|
|
||||||
@ -748,7 +763,8 @@ void ff_estimate_b_frame_motion(MpegEncContext * s,
|
|||||||
int mb_x, int mb_y);
|
int mb_x, int mb_y);
|
||||||
int ff_get_best_fcode(MpegEncContext * s, int16_t (*mv_table)[2], int type);
|
int ff_get_best_fcode(MpegEncContext * s, int16_t (*mv_table)[2], int type);
|
||||||
void ff_fix_long_p_mvs(MpegEncContext * s);
|
void ff_fix_long_p_mvs(MpegEncContext * s);
|
||||||
void ff_fix_long_b_mvs(MpegEncContext * s, int16_t (*mv_table)[2], int f_code, int type);
|
void ff_fix_long_mvs(MpegEncContext * s, uint8_t *field_select_table, int field_select,
|
||||||
|
int16_t (*mv_table)[2], int f_code, int type, int truncate);
|
||||||
void ff_init_me(MpegEncContext *s);
|
void ff_init_me(MpegEncContext *s);
|
||||||
int ff_pre_estimate_p_frame_motion(MpegEncContext * s, int mb_x, int mb_y);
|
int ff_pre_estimate_p_frame_motion(MpegEncContext * s, int mb_x, int mb_y);
|
||||||
|
|
||||||
|
@ -45,7 +45,7 @@ static void sigill_handler (int sig)
|
|||||||
}
|
}
|
||||||
#endif /* CONFIG_DARWIN */
|
#endif /* CONFIG_DARWIN */
|
||||||
|
|
||||||
int pix_abs16x16_x2_altivec(uint8_t *pix1, uint8_t *pix2, int line_size)
|
int sad16_x2_altivec(void *v, uint8_t *pix1, uint8_t *pix2, int line_size, int h)
|
||||||
{
|
{
|
||||||
int i;
|
int i;
|
||||||
int s __attribute__((aligned(16)));
|
int s __attribute__((aligned(16)));
|
||||||
@ -57,7 +57,7 @@ int pix_abs16x16_x2_altivec(uint8_t *pix1, uint8_t *pix2, int line_size)
|
|||||||
|
|
||||||
s = 0;
|
s = 0;
|
||||||
sad = (vector unsigned int)vec_splat_u32(0);
|
sad = (vector unsigned int)vec_splat_u32(0);
|
||||||
for(i=0;i<16;i++) {
|
for(i=0;i<h;i++) {
|
||||||
/*
|
/*
|
||||||
Read unaligned pixels into our vectors. The vectors are as follows:
|
Read unaligned pixels into our vectors. The vectors are as follows:
|
||||||
pix1v: pix1[0]-pix1[15]
|
pix1v: pix1[0]-pix1[15]
|
||||||
@ -92,7 +92,7 @@ int pix_abs16x16_x2_altivec(uint8_t *pix1, uint8_t *pix2, int line_size)
|
|||||||
return s;
|
return s;
|
||||||
}
|
}
|
||||||
|
|
||||||
int pix_abs16x16_y2_altivec(uint8_t *pix1, uint8_t *pix2, int line_size)
|
int sad16_y2_altivec(void *v, uint8_t *pix1, uint8_t *pix2, int line_size, int h)
|
||||||
{
|
{
|
||||||
int i;
|
int i;
|
||||||
int s __attribute__((aligned(16)));
|
int s __attribute__((aligned(16)));
|
||||||
@ -118,7 +118,7 @@ int pix_abs16x16_y2_altivec(uint8_t *pix1, uint8_t *pix2, int line_size)
|
|||||||
tv = (vector unsigned char *) &pix2[0];
|
tv = (vector unsigned char *) &pix2[0];
|
||||||
pix2v = vec_perm(tv[0], tv[1], vec_lvsl(0, &pix2[0]));
|
pix2v = vec_perm(tv[0], tv[1], vec_lvsl(0, &pix2[0]));
|
||||||
|
|
||||||
for(i=0;i<16;i++) {
|
for(i=0;i<h;i++) {
|
||||||
/*
|
/*
|
||||||
Read unaligned pixels into our vectors. The vectors are as follows:
|
Read unaligned pixels into our vectors. The vectors are as follows:
|
||||||
pix1v: pix1[0]-pix1[15]
|
pix1v: pix1[0]-pix1[15]
|
||||||
@ -152,7 +152,7 @@ int pix_abs16x16_y2_altivec(uint8_t *pix1, uint8_t *pix2, int line_size)
|
|||||||
return s;
|
return s;
|
||||||
}
|
}
|
||||||
|
|
||||||
int pix_abs16x16_xy2_altivec(uint8_t *pix1, uint8_t *pix2, int line_size)
|
int sad16_xy2_altivec(void *v, uint8_t *pix1, uint8_t *pix2, int line_size, int h)
|
||||||
{
|
{
|
||||||
int i;
|
int i;
|
||||||
int s __attribute__((aligned(16)));
|
int s __attribute__((aligned(16)));
|
||||||
@ -194,7 +194,7 @@ int pix_abs16x16_xy2_altivec(uint8_t *pix1, uint8_t *pix2, int line_size)
|
|||||||
t1 = vec_add(pix2hv, pix2ihv);
|
t1 = vec_add(pix2hv, pix2ihv);
|
||||||
t2 = vec_add(pix2lv, pix2ilv);
|
t2 = vec_add(pix2lv, pix2ilv);
|
||||||
|
|
||||||
for(i=0;i<16;i++) {
|
for(i=0;i<h;i++) {
|
||||||
/*
|
/*
|
||||||
Read unaligned pixels into our vectors. The vectors are as follows:
|
Read unaligned pixels into our vectors. The vectors are as follows:
|
||||||
pix1v: pix1[0]-pix1[15]
|
pix1v: pix1[0]-pix1[15]
|
||||||
@ -253,7 +253,7 @@ int pix_abs16x16_xy2_altivec(uint8_t *pix1, uint8_t *pix2, int line_size)
|
|||||||
return s;
|
return s;
|
||||||
}
|
}
|
||||||
|
|
||||||
int pix_abs16x16_altivec(uint8_t *pix1, uint8_t *pix2, int line_size)
|
int sad16_altivec(void *v, uint8_t *pix1, uint8_t *pix2, int line_size, int h)
|
||||||
{
|
{
|
||||||
int i;
|
int i;
|
||||||
int s __attribute__((aligned(16)));
|
int s __attribute__((aligned(16)));
|
||||||
@ -266,7 +266,7 @@ int pix_abs16x16_altivec(uint8_t *pix1, uint8_t *pix2, int line_size)
|
|||||||
sad = (vector unsigned int)vec_splat_u32(0);
|
sad = (vector unsigned int)vec_splat_u32(0);
|
||||||
|
|
||||||
|
|
||||||
for(i=0;i<16;i++) {
|
for(i=0;i<h;i++) {
|
||||||
/* Read potentially unaligned pixels into t1 and t2 */
|
/* Read potentially unaligned pixels into t1 and t2 */
|
||||||
perm1 = vec_lvsl(0, pix1);
|
perm1 = vec_lvsl(0, pix1);
|
||||||
pix1v = (vector unsigned char *) pix1;
|
pix1v = (vector unsigned char *) pix1;
|
||||||
@ -295,7 +295,7 @@ int pix_abs16x16_altivec(uint8_t *pix1, uint8_t *pix2, int line_size)
|
|||||||
return s;
|
return s;
|
||||||
}
|
}
|
||||||
|
|
||||||
int pix_abs8x8_altivec(uint8_t *pix1, uint8_t *pix2, int line_size)
|
int sad8_altivec(void *v, uint8_t *pix1, uint8_t *pix2, int line_size, int h)
|
||||||
{
|
{
|
||||||
int i;
|
int i;
|
||||||
int s __attribute__((aligned(16)));
|
int s __attribute__((aligned(16)));
|
||||||
@ -309,7 +309,7 @@ int pix_abs8x8_altivec(uint8_t *pix1, uint8_t *pix2, int line_size)
|
|||||||
|
|
||||||
permclear = (vector unsigned char)AVV(255,255,255,255,255,255,255,255,0,0,0,0,0,0,0,0);
|
permclear = (vector unsigned char)AVV(255,255,255,255,255,255,255,255,0,0,0,0,0,0,0,0);
|
||||||
|
|
||||||
for(i=0;i<8;i++) {
|
for(i=0;i<h;i++) {
|
||||||
/* Read potentially unaligned pixels into t1 and t2
|
/* Read potentially unaligned pixels into t1 and t2
|
||||||
Since we're reading 16 pixels, and actually only want 8,
|
Since we're reading 16 pixels, and actually only want 8,
|
||||||
mask out the last 8 pixels. The 0s don't change the sum. */
|
mask out the last 8 pixels. The 0s don't change the sum. */
|
||||||
@ -374,9 +374,9 @@ int pix_norm1_altivec(uint8_t *pix, int line_size)
|
|||||||
/**
|
/**
|
||||||
* Sum of Squared Errors for a 8x8 block.
|
* Sum of Squared Errors for a 8x8 block.
|
||||||
* AltiVec-enhanced.
|
* AltiVec-enhanced.
|
||||||
* It's the pix_abs8x8_altivec code above w/ squaring added.
|
* It's the sad8_altivec code above w/ squaring added.
|
||||||
*/
|
*/
|
||||||
int sse8_altivec(void *v, uint8_t *pix1, uint8_t *pix2, int line_size)
|
int sse8_altivec(void *v, uint8_t *pix1, uint8_t *pix2, int line_size, int h)
|
||||||
{
|
{
|
||||||
int i;
|
int i;
|
||||||
int s __attribute__((aligned(16)));
|
int s __attribute__((aligned(16)));
|
||||||
@ -391,7 +391,7 @@ int sse8_altivec(void *v, uint8_t *pix1, uint8_t *pix2, int line_size)
|
|||||||
permclear = (vector unsigned char)AVV(255,255,255,255,255,255,255,255,0,0,0,0,0,0,0,0);
|
permclear = (vector unsigned char)AVV(255,255,255,255,255,255,255,255,0,0,0,0,0,0,0,0);
|
||||||
|
|
||||||
|
|
||||||
for(i=0;i<8;i++) {
|
for(i=0;i<h;i++) {
|
||||||
/* Read potentially unaligned pixels into t1 and t2
|
/* Read potentially unaligned pixels into t1 and t2
|
||||||
Since we're reading 16 pixels, and actually only want 8,
|
Since we're reading 16 pixels, and actually only want 8,
|
||||||
mask out the last 8 pixels. The 0s don't change the sum. */
|
mask out the last 8 pixels. The 0s don't change the sum. */
|
||||||
@ -430,9 +430,9 @@ int sse8_altivec(void *v, uint8_t *pix1, uint8_t *pix2, int line_size)
|
|||||||
/**
|
/**
|
||||||
* Sum of Squared Errors for a 16x16 block.
|
* Sum of Squared Errors for a 16x16 block.
|
||||||
* AltiVec-enhanced.
|
* AltiVec-enhanced.
|
||||||
* It's the pix_abs16x16_altivec code above w/ squaring added.
|
* It's the sad16_altivec code above w/ squaring added.
|
||||||
*/
|
*/
|
||||||
int sse16_altivec(void *v, uint8_t *pix1, uint8_t *pix2, int line_size)
|
int sse16_altivec(void *v, uint8_t *pix1, uint8_t *pix2, int line_size, int h)
|
||||||
{
|
{
|
||||||
int i;
|
int i;
|
||||||
int s __attribute__((aligned(16)));
|
int s __attribute__((aligned(16)));
|
||||||
@ -444,7 +444,7 @@ int sse16_altivec(void *v, uint8_t *pix1, uint8_t *pix2, int line_size)
|
|||||||
|
|
||||||
sum = (vector unsigned int)vec_splat_u32(0);
|
sum = (vector unsigned int)vec_splat_u32(0);
|
||||||
|
|
||||||
for(i=0;i<16;i++) {
|
for(i=0;i<h;i++) {
|
||||||
/* Read potentially unaligned pixels into t1 and t2 */
|
/* Read potentially unaligned pixels into t1 and t2 */
|
||||||
perm1 = vec_lvsl(0, pix1);
|
perm1 = vec_lvsl(0, pix1);
|
||||||
pix1v = (vector unsigned char *) pix1;
|
pix1v = (vector unsigned char *) pix1;
|
||||||
@ -609,14 +609,6 @@ void diff_pixels_altivec(DCTELEM *restrict block, const uint8_t *s1,
|
|||||||
}
|
}
|
||||||
}
|
}
|
||||||
|
|
||||||
int sad16x16_altivec(void *s, uint8_t *a, uint8_t *b, int stride) {
|
|
||||||
return pix_abs16x16_altivec(a,b,stride);
|
|
||||||
}
|
|
||||||
|
|
||||||
int sad8x8_altivec(void *s, uint8_t *a, uint8_t *b, int stride) {
|
|
||||||
return pix_abs8x8_altivec(a,b,stride);
|
|
||||||
}
|
|
||||||
|
|
||||||
void add_bytes_altivec(uint8_t *dst, uint8_t *src, int w) {
|
void add_bytes_altivec(uint8_t *dst, uint8_t *src, int w) {
|
||||||
#ifdef ALTIVEC_USE_REFERENCE_C_CODE
|
#ifdef ALTIVEC_USE_REFERENCE_C_CODE
|
||||||
int i;
|
int i;
|
||||||
|
@ -24,16 +24,14 @@
|
|||||||
|
|
||||||
#ifdef HAVE_ALTIVEC
|
#ifdef HAVE_ALTIVEC
|
||||||
|
|
||||||
extern int pix_abs16x16_x2_altivec(uint8_t *pix1, uint8_t *pix2, int line_size);
|
extern int sad16_x2_altivec(void *v, uint8_t *pix1, uint8_t *pix2, int line_size, int h);
|
||||||
extern int pix_abs16x16_y2_altivec(uint8_t *pix1, uint8_t *pix2, int line_size);
|
extern int sad16_y2_altivec(void *v, uint8_t *pix1, uint8_t *pix2, int line_size, int h);
|
||||||
extern int pix_abs16x16_xy2_altivec(uint8_t *pix1, uint8_t *pix2, int line_size);
|
extern int sad16_xy2_altivec(void *v, uint8_t *pix1, uint8_t *pix2, int line_size, int h);
|
||||||
extern int pix_abs16x16_altivec(uint8_t *pix1, uint8_t *pix2, int line_size);
|
extern int sad16_altivec(void *v, uint8_t *pix1, uint8_t *pix2, int line_size, int h);
|
||||||
extern int pix_abs8x8_altivec(uint8_t *pix1, uint8_t *pix2, int line_size);
|
extern int sad8_altivec(void *v, uint8_t *pix1, uint8_t *pix2, int line_size, int h);
|
||||||
extern int sad16x16_altivec(void *s, uint8_t *a, uint8_t *b, int stride);
|
|
||||||
extern int sad8x8_altivec(void *s, uint8_t *a, uint8_t *b, int stride);
|
|
||||||
extern int pix_norm1_altivec(uint8_t *pix, int line_size);
|
extern int pix_norm1_altivec(uint8_t *pix, int line_size);
|
||||||
extern int sse8_altivec(void *v, uint8_t *pix1, uint8_t *pix2, int line_size);
|
extern int sse8_altivec(void *v, uint8_t *pix1, uint8_t *pix2, int line_size, int h);
|
||||||
extern int sse16_altivec(void *v, uint8_t *pix1, uint8_t *pix2, int line_size);
|
extern int sse16_altivec(void *v, uint8_t *pix1, uint8_t *pix2, int line_size, int h);
|
||||||
extern int pix_sum_altivec(uint8_t * pix, int line_size);
|
extern int pix_sum_altivec(uint8_t * pix, int line_size);
|
||||||
extern void diff_pixels_altivec(DCTELEM* block, const uint8_t* s1, const uint8_t* s2, int stride);
|
extern void diff_pixels_altivec(DCTELEM* block, const uint8_t* s1, const uint8_t* s2, int stride);
|
||||||
extern void get_pixels_altivec(DCTELEM* block, const uint8_t * pixels, int line_size);
|
extern void get_pixels_altivec(DCTELEM* block, const uint8_t * pixels, int line_size);
|
||||||
|
@ -240,13 +240,13 @@ void dsputil_init_ppc(DSPContext* c, AVCodecContext *avctx)
|
|||||||
mm_flags |= MM_ALTIVEC;
|
mm_flags |= MM_ALTIVEC;
|
||||||
|
|
||||||
// Altivec specific optimisations
|
// Altivec specific optimisations
|
||||||
c->pix_abs16x16_x2 = pix_abs16x16_x2_altivec;
|
c->pix_abs[0][1] = sad16_x2_altivec;
|
||||||
c->pix_abs16x16_y2 = pix_abs16x16_y2_altivec;
|
c->pix_abs[0][2] = sad16_y2_altivec;
|
||||||
c->pix_abs16x16_xy2 = pix_abs16x16_xy2_altivec;
|
c->pix_abs[0][3] = sad16_xy2_altivec;
|
||||||
c->pix_abs16x16 = pix_abs16x16_altivec;
|
c->pix_abs[0][0] = sad16_altivec;
|
||||||
c->pix_abs8x8 = pix_abs8x8_altivec;
|
c->pix_abs[1][0] = sad8_altivec;
|
||||||
c->sad[0]= sad16x16_altivec;
|
c->sad[0]= sad16_altivec;
|
||||||
c->sad[1]= sad8x8_altivec;
|
c->sad[1]= sad8_altivec;
|
||||||
c->pix_norm1 = pix_norm1_altivec;
|
c->pix_norm1 = pix_norm1_altivec;
|
||||||
c->sse[1]= sse8_altivec;
|
c->sse[1]= sse8_altivec;
|
||||||
c->sse[0]= sse16_altivec;
|
c->sse[0]= sse16_altivec;
|
||||||
|
@ -520,7 +520,7 @@ static void adaptive_quantization(MpegEncContext *s, double q){
|
|||||||
if(spat_cplx < 4) spat_cplx= 4; //FIXME finetune
|
if(spat_cplx < 4) spat_cplx= 4; //FIXME finetune
|
||||||
if(temp_cplx < 4) temp_cplx= 4; //FIXME finetune
|
if(temp_cplx < 4) temp_cplx= 4; //FIXME finetune
|
||||||
|
|
||||||
if((s->mb_type[mb_xy]&MB_TYPE_INTRA)){//FIXME hq mode
|
if((s->mb_type[mb_xy]&CANDIDATE_MB_TYPE_INTRA)){//FIXME hq mode
|
||||||
cplx= spat_cplx;
|
cplx= spat_cplx;
|
||||||
factor= 1.0 + p_masking;
|
factor= 1.0 + p_masking;
|
||||||
}else{
|
}else{
|
||||||
|
@ -26,21 +26,21 @@ stddev: 8.18 bytes:7602176
|
|||||||
920a0a8a0063655d1f34dcaad7857f98 *./data/a-h263p.avi
|
920a0a8a0063655d1f34dcaad7857f98 *./data/a-h263p.avi
|
||||||
0eb167c9dfcbeeecbf3debed8af8f811 *./data/out.yuv
|
0eb167c9dfcbeeecbf3debed8af8f811 *./data/out.yuv
|
||||||
stddev: 2.08 bytes:7602176
|
stddev: 2.08 bytes:7602176
|
||||||
a8cc41cd5016bbb821e7c2691f5090ea *./data/a-odivx.mp4
|
66f8b4b5b4f0655cff7bdbc44969cab3 *./data/a-odivx.mp4
|
||||||
e48114a50ef4cfb4fe2016fa5b34ae4c *./data/out.yuv
|
5bd332c77ef45e58b7017e06a0467dd3 *./data/out.yuv
|
||||||
stddev: 8.02 bytes:7602176
|
stddev: 7.94 bytes:7602176
|
||||||
5704a082cc5c5970620123ae20566286 *./data/a-huffyuv.avi
|
5704a082cc5c5970620123ae20566286 *./data/a-huffyuv.avi
|
||||||
799d3db687f6cdd7a837ec156efc171f *./data/out.yuv
|
799d3db687f6cdd7a837ec156efc171f *./data/out.yuv
|
||||||
stddev: 0.00 bytes:7602176
|
stddev: 0.00 bytes:7602176
|
||||||
e9f63126859b97cd23cd1413038f8f7b *./data/a-mpeg4-rc.avi
|
e9f63126859b97cd23cd1413038f8f7b *./data/a-mpeg4-rc.avi
|
||||||
90a159074b1b109569914ee63f387860 *./data/out.yuv
|
90a159074b1b109569914ee63f387860 *./data/out.yuv
|
||||||
stddev: 10.18 bytes:7145472
|
stddev: 10.18 bytes:7145472
|
||||||
b3f1425e266569d5d726b88eadc13dd4 *./data/a-mpeg4-adv.avi
|
d7d295f97a1e07b633f973d2325880ce *./data/a-mpeg4-adv.avi
|
||||||
fb61365b22c947adbaeab74478579020 *./data/out.yuv
|
612f79510c8098f1421aa154047e2bf2 *./data/out.yuv
|
||||||
stddev: 7.31 bytes:7602176
|
stddev: 7.25 bytes:7602176
|
||||||
25ec5ab399fd4db0c8aaea78cb692611 *./data/a-error-mpeg4-adv.avi
|
f863f4198521bd76930ea33991b47273 *./data/a-error-mpeg4-adv.avi
|
||||||
bd441fc1e2fb9a3c0bdc9c5f1ed25ef0 *./data/out.yuv
|
ba7fcd126c7c9fead5a5de71aaaf0624 *./data/out.yuv
|
||||||
stddev: 13.57 bytes:7602176
|
stddev: 16.80 bytes:7602176
|
||||||
328ebd044362116e274739e23c482ee7 *./data/a-mpeg1b.mpg
|
328ebd044362116e274739e23c482ee7 *./data/a-mpeg1b.mpg
|
||||||
788a9d500dc8986231a18076fc80fd73 *./data/out.yuv
|
788a9d500dc8986231a18076fc80fd73 *./data/out.yuv
|
||||||
stddev: 10.07 bytes:7145472
|
stddev: 10.07 bytes:7145472
|
||||||
|
@ -138,7 +138,7 @@ do_ffmpeg $raw_dst -y -i $file -f rawvideo $raw_dst
|
|||||||
|
|
||||||
# mpeg2 encoding interlaced
|
# mpeg2 encoding interlaced
|
||||||
file=${outfile}mpeg2i.mpg
|
file=${outfile}mpeg2i.mpg
|
||||||
do_ffmpeg $file -y -qscale 10 -f pgmyuv -i $raw_src -vcodec mpeg2video -f mpeg1video -interlace $file
|
do_ffmpeg $file -y -qscale 10 -f pgmyuv -i $raw_src -vcodec mpeg2video -f mpeg1video -ildct $file
|
||||||
|
|
||||||
# mpeg2 decoding
|
# mpeg2 decoding
|
||||||
do_ffmpeg $raw_dst -y -i $file -f rawvideo $raw_dst
|
do_ffmpeg $raw_dst -y -i $file -f rawvideo $raw_dst
|
||||||
|
@ -26,21 +26,21 @@ stddev: 5.41 bytes:7602176
|
|||||||
f7828488c31ccb6787367ef4e4a2ad42 *./data/a-h263p.avi
|
f7828488c31ccb6787367ef4e4a2ad42 *./data/a-h263p.avi
|
||||||
7d39d1f272205a6a231d0e0baf32ff9d *./data/out.yuv
|
7d39d1f272205a6a231d0e0baf32ff9d *./data/out.yuv
|
||||||
stddev: 1.91 bytes:7602176
|
stddev: 1.91 bytes:7602176
|
||||||
f17dc7346f5d1d4307ecf4507f10fcc6 *./data/a-odivx.mp4
|
a831828595e5764e6ee30c2d9e548385 *./data/a-odivx.mp4
|
||||||
ff7ddb57d9038b94f08c43bae7e1329f *./data/out.yuv
|
ad75d173bd30d642147f00da21df0012 *./data/out.yuv
|
||||||
stddev: 5.28 bytes:7602176
|
stddev: 5.27 bytes:7602176
|
||||||
242a7a18c2793e115007bc163861ef4e *./data/a-huffyuv.avi
|
242a7a18c2793e115007bc163861ef4e *./data/a-huffyuv.avi
|
||||||
dde5895817ad9d219f79a52d0bdfb001 *./data/out.yuv
|
dde5895817ad9d219f79a52d0bdfb001 *./data/out.yuv
|
||||||
stddev: 0.00 bytes:7602176
|
stddev: 0.00 bytes:7602176
|
||||||
6a469f42ce6946dd4c708f9e51e3da6a *./data/a-mpeg4-rc.avi
|
6a469f42ce6946dd4c708f9e51e3da6a *./data/a-mpeg4-rc.avi
|
||||||
df9de7134d961119705b4e0cabca1f12 *./data/out.yuv
|
df9de7134d961119705b4e0cabca1f12 *./data/out.yuv
|
||||||
stddev: 4.20 bytes:7145472
|
stddev: 4.20 bytes:7145472
|
||||||
742ffadf3c309d2c4ac888a6a0905bf9 *./data/a-mpeg4-adv.avi
|
483504d060b0bd8ac1acfa3a823c2ad7 *./data/a-mpeg4-adv.avi
|
||||||
b02f71e91e9368ce94814ab3d74f91ba *./data/out.yuv
|
08d24bdd7da80cffaf8abaa3e71b1843 *./data/out.yuv
|
||||||
stddev: 4.97 bytes:7602176
|
stddev: 4.96 bytes:7602176
|
||||||
f2888ab759ac28aba85a16d3d54b80d0 *./data/a-error-mpeg4-adv.avi
|
03ff35856faefb4882eaf4d86d95bea7 *./data/a-error-mpeg4-adv.avi
|
||||||
93ab926aad2e658a5bb00c25b7cefdab *./data/out.yuv
|
8550acff0851ee915bd5800f1e20f37c *./data/out.yuv
|
||||||
stddev: 5.22 bytes:7602176
|
stddev: 9.66 bytes:7602176
|
||||||
671802a2c5078e69f7f422765ea87f2a *./data/a-mpeg1b.mpg
|
671802a2c5078e69f7f422765ea87f2a *./data/a-mpeg1b.mpg
|
||||||
d3d5876cef34b728602d5a22eee9249f *./data/out.yuv
|
d3d5876cef34b728602d5a22eee9249f *./data/out.yuv
|
||||||
stddev: 5.93 bytes:7145472
|
stddev: 5.93 bytes:7145472
|
||||||
|
Loading…
Reference in New Issue
Block a user