# FFmpeg/libavfilter/x86/Makefile

# x86 filter objects.
# Each assignment appends one object to the list named OBJS-<value>, where
# <value> is whatever the matching CONFIG_*_FILTER variable expands to.
# NOTE(review): presumably only the list selected by an enabled filter is
# actually built -- confirm against the Makefile that includes this one.
OBJS-$(CONFIG_GRADFUN_FILTER) += x86/vf_gradfun.o
OBJS-$(CONFIG_HQDN3D_FILTER)  += x86/vf_hqdn3d_init.o
OBJS-$(CONFIG_VOLUME_FILTER)  += x86/af_volume_init.o
OBJS-$(CONFIG_YADIF_FILTER)   += x86/vf_yadif_init.o

# Objects appended to the YASM-OBJS-<value> lists, where <value> is the
# expansion of the matching CONFIG_*_FILTER variable.
# NOTE(review): presumably these are built from assembly sources by the
# assembler rules of the including Makefile -- confirm there.
YASM-OBJS-$(CONFIG_HQDN3D_FILTER) += x86/vf_hqdn3d.o
YASM-OBJS-$(CONFIG_VOLUME_FILTER) += x86/af_volume.o
# yadif contributes three objects; the continuation lines collapse to the
# same single space-separated value as a one-line assignment.
YASM-OBJS-$(CONFIG_YADIF_FILTER)  += x86/vf_yadif.o                      \
                                     x86/yadif-16.o                      \
                                     x86/yadif-10.o
# Change history (blame annotations: commit subject, commit date, and the
# annotated line where one was recorded):
#
# - avfilter: x86: consistent filenames for filter optimizations
#   (2013-02-01 15:14:31 +03:00)
#     `OBJS-$(CONFIG_GRADFUN_FILTER) += x86/vf_gradfun.o`
# - vf_hqdn3d: x86: Add proper arch optimization initialization
#   (2013-01-22 03:39:37 +03:00)
#     `OBJS-$(CONFIG_HQDN3D_FILTER) += x86/vf_hqdn3d_init.o`
# - x86: af_volume: add SSE2-optimized s16 volume scaling
#   (2012-09-23 21:49:26 +03:00)
#     `OBJS-$(CONFIG_VOLUME_FILTER) += x86/af_volume_init.o`
# - avfilter: x86: consistent filenames for filter optimizations
#   (2013-02-01 15:14:31 +03:00)
#     `OBJS-$(CONFIG_YADIF_FILTER) += x86/vf_yadif_init.o`
# - avfilter: call x86 init functions under if (ARCH_X86), not if (HAVE_MMX)
#   (2012-08-29 20:37:14 +03:00)
# - avfilter: x86: consistent filenames for filter optimizations
#   (2013-02-01 15:14:31 +03:00)
#     `YASM-OBJS-$(CONFIG_HQDN3D_FILTER) += x86/vf_hqdn3d.o`
# - x86: af_volume: add SSE2-optimized s16 volume scaling
#   (2012-09-23 21:49:26 +03:00)
#     `YASM-OBJS-$(CONFIG_VOLUME_FILTER) += x86/af_volume.o`
# - yadif: x86 assembly for 9 to 14-bit samples
#   (2013-03-16 23:42:24 +03:00)
#     `YASM-OBJS-$(CONFIG_YADIF_FILTER) += x86/vf_yadif.o x86/yadif-16.o x86/yadif-10.o`
#
#   These smaller samples do not need to be unpacked to double words,
#   allowing the code to process more pixels every iteration (still 2 in
#   MMX but 6 in SSE2). It also avoids emulating the missing double word
#   instructions on older instruction sets.
#
#   Like with the previous code for 16-bit samples, this has been tested on
#   an Athlon64 and a Core2Quad.
#
#   Athlon64:
#     1809275 decicycles in C,     32718 runs, 50 skips
#      911675 decicycles in mmx,   32727 runs, 41 skips, 2.0x faster
#      495284 decicycles in sse2,  32747 runs, 21 skips, 3.7x faster
#
#   Core2Quad:
#      921363 decicycles in C,     32756 runs, 12 skips
#      486537 decicycles in mmx,   32764 runs,  4 skips, 1.9x faster
#      293296 decicycles in sse2,  32759 runs,  9 skips, 3.1x faster
#      284910 decicycles in ssse3, 32759 runs,  9 skips, 3.2x faster
#
#   Signed-off-by: Michael Niedermayer <michaelni@gmx.at>