You've already forked FFmpeg
mirror of
https://github.com/FFmpeg/FFmpeg.git
synced 2025-08-15 14:13:16 +02:00
vf_gradfun: move x86 init code to x86/gradfun.c
Signed-off-by: Mans Rullgard <mans@mansr.com>
This commit is contained in:
@@ -37,12 +37,9 @@ typedef struct {
|
|||||||
void (*blur_line) (uint16_t *dc, uint16_t *buf, uint16_t *buf1, uint8_t *src, int src_linesize, int width);
|
void (*blur_line) (uint16_t *dc, uint16_t *buf, uint16_t *buf1, uint8_t *src, int src_linesize, int width);
|
||||||
} GradFunContext;
|
} GradFunContext;
|
||||||
|
|
||||||
|
void ff_gradfun_init_x86(GradFunContext *gf);
|
||||||
|
|
||||||
void ff_gradfun_filter_line_c(uint8_t *dst, uint8_t *src, uint16_t *dc, int width, int thresh, const uint16_t *dithers);
|
void ff_gradfun_filter_line_c(uint8_t *dst, uint8_t *src, uint16_t *dc, int width, int thresh, const uint16_t *dithers);
|
||||||
void ff_gradfun_blur_line_c(uint16_t *dc, uint16_t *buf, uint16_t *buf1, uint8_t *src, int src_linesize, int width);
|
void ff_gradfun_blur_line_c(uint16_t *dc, uint16_t *buf, uint16_t *buf1, uint8_t *src, int src_linesize, int width);
|
||||||
|
|
||||||
void ff_gradfun_filter_line_mmx2(uint8_t *dst, uint8_t *src, uint16_t *dc, int width, int thresh, const uint16_t *dithers);
|
|
||||||
void ff_gradfun_filter_line_ssse3(uint8_t *dst, uint8_t *src, uint16_t *dc, int width, int thresh, const uint16_t *dithers);
|
|
||||||
|
|
||||||
void ff_gradfun_blur_line_sse2(uint16_t *dc, uint16_t *buf, uint16_t *buf1, uint8_t *src, int src_linesize, int width);
|
|
||||||
|
|
||||||
#endif /* AVFILTER_GRADFUN_H */
|
#endif /* AVFILTER_GRADFUN_H */
|
||||||
|
@@ -123,7 +123,6 @@ static av_cold int init(AVFilterContext *ctx, const char *args)
|
|||||||
GradFunContext *gf = ctx->priv;
|
GradFunContext *gf = ctx->priv;
|
||||||
float thresh = 1.2;
|
float thresh = 1.2;
|
||||||
int radius = 16;
|
int radius = 16;
|
||||||
int cpu_flags = av_get_cpu_flags();
|
|
||||||
|
|
||||||
if (args)
|
if (args)
|
||||||
sscanf(args, "%f:%d", &thresh, &radius);
|
sscanf(args, "%f:%d", &thresh, &radius);
|
||||||
@@ -135,12 +134,8 @@ static av_cold int init(AVFilterContext *ctx, const char *args)
|
|||||||
gf->blur_line = ff_gradfun_blur_line_c;
|
gf->blur_line = ff_gradfun_blur_line_c;
|
||||||
gf->filter_line = ff_gradfun_filter_line_c;
|
gf->filter_line = ff_gradfun_filter_line_c;
|
||||||
|
|
||||||
if (HAVE_MMX && cpu_flags & AV_CPU_FLAG_MMX2)
|
if (HAVE_MMX)
|
||||||
gf->filter_line = ff_gradfun_filter_line_mmx2;
|
ff_gradfun_init_x86(gf);
|
||||||
if (HAVE_SSSE3 && cpu_flags & AV_CPU_FLAG_SSSE3)
|
|
||||||
gf->filter_line = ff_gradfun_filter_line_ssse3;
|
|
||||||
if (HAVE_SSE && cpu_flags & AV_CPU_FLAG_SSE2)
|
|
||||||
gf->blur_line = ff_gradfun_blur_line_sse2;
|
|
||||||
|
|
||||||
av_log(ctx, AV_LOG_VERBOSE, "threshold:%.2f radius:%d\n", thresh, gf->radius);
|
av_log(ctx, AV_LOG_VERBOSE, "threshold:%.2f radius:%d\n", thresh, gf->radius);
|
||||||
|
|
||||||
|
@@ -18,6 +18,7 @@
|
|||||||
* Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
|
* Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
|
||||||
*/
|
*/
|
||||||
|
|
||||||
|
#include "libavutil/attributes.h"
|
||||||
#include "libavutil/cpu.h"
|
#include "libavutil/cpu.h"
|
||||||
#include "libavutil/x86_cpu.h"
|
#include "libavutil/x86_cpu.h"
|
||||||
#include "libavfilter/gradfun.h"
|
#include "libavfilter/gradfun.h"
|
||||||
@@ -25,9 +26,9 @@
|
|||||||
DECLARE_ALIGNED(16, static const uint16_t, pw_7f)[8] = {0x7F,0x7F,0x7F,0x7F,0x7F,0x7F,0x7F,0x7F};
|
DECLARE_ALIGNED(16, static const uint16_t, pw_7f)[8] = {0x7F,0x7F,0x7F,0x7F,0x7F,0x7F,0x7F,0x7F};
|
||||||
DECLARE_ALIGNED(16, static const uint16_t, pw_ff)[8] = {0xFF,0xFF,0xFF,0xFF,0xFF,0xFF,0xFF,0xFF};
|
DECLARE_ALIGNED(16, static const uint16_t, pw_ff)[8] = {0xFF,0xFF,0xFF,0xFF,0xFF,0xFF,0xFF,0xFF};
|
||||||
|
|
||||||
void ff_gradfun_filter_line_mmx2(uint8_t *dst, uint8_t *src, uint16_t *dc, int width, int thresh, const uint16_t *dithers)
|
#if HAVE_MMX2
|
||||||
|
static void gradfun_filter_line_mmx2(uint8_t *dst, uint8_t *src, uint16_t *dc, int width, int thresh, const uint16_t *dithers)
|
||||||
{
|
{
|
||||||
#if HAVE_MMX
|
|
||||||
intptr_t x;
|
intptr_t x;
|
||||||
if (width & 3) {
|
if (width & 3) {
|
||||||
x = width & ~3;
|
x = width & ~3;
|
||||||
@@ -70,12 +71,12 @@ void ff_gradfun_filter_line_mmx2(uint8_t *dst, uint8_t *src, uint16_t *dc, int w
|
|||||||
"rm"(thresh), "m"(*dithers), "m"(*pw_7f)
|
"rm"(thresh), "m"(*dithers), "m"(*pw_7f)
|
||||||
:"memory"
|
:"memory"
|
||||||
);
|
);
|
||||||
#endif
|
|
||||||
}
|
}
|
||||||
|
#endif
|
||||||
|
|
||||||
void ff_gradfun_filter_line_ssse3(uint8_t *dst, uint8_t *src, uint16_t *dc, int width, int thresh, const uint16_t *dithers)
|
|
||||||
{
|
|
||||||
#if HAVE_SSSE3
|
#if HAVE_SSSE3
|
||||||
|
static void gradfun_filter_line_ssse3(uint8_t *dst, uint8_t *src, uint16_t *dc, int width, int thresh, const uint16_t *dithers)
|
||||||
|
{
|
||||||
intptr_t x;
|
intptr_t x;
|
||||||
if (width & 7) {
|
if (width & 7) {
|
||||||
// could be 10% faster if I somehow eliminated this
|
// could be 10% faster if I somehow eliminated this
|
||||||
@@ -117,12 +118,12 @@ void ff_gradfun_filter_line_ssse3(uint8_t *dst, uint8_t *src, uint16_t *dc, int
|
|||||||
"rm"(thresh), "m"(*dithers), "m"(*pw_7f)
|
"rm"(thresh), "m"(*dithers), "m"(*pw_7f)
|
||||||
:"memory"
|
:"memory"
|
||||||
);
|
);
|
||||||
#endif // HAVE_SSSE3
|
|
||||||
}
|
}
|
||||||
|
#endif // HAVE_SSSE3
|
||||||
|
|
||||||
void ff_gradfun_blur_line_sse2(uint16_t *dc, uint16_t *buf, uint16_t *buf1, uint8_t *src, int src_linesize, int width)
|
|
||||||
{
|
|
||||||
#if HAVE_SSE
|
#if HAVE_SSE
|
||||||
|
static void gradfun_blur_line_sse2(uint16_t *dc, uint16_t *buf, uint16_t *buf1, uint8_t *src, int src_linesize, int width)
|
||||||
|
{
|
||||||
#define BLURV(load)\
|
#define BLURV(load)\
|
||||||
intptr_t x = -2*width;\
|
intptr_t x = -2*width;\
|
||||||
__asm__ volatile(\
|
__asm__ volatile(\
|
||||||
@@ -160,5 +161,17 @@ void ff_gradfun_blur_line_sse2(uint16_t *dc, uint16_t *buf, uint16_t *buf1, uint
|
|||||||
} else {
|
} else {
|
||||||
BLURV("movdqa");
|
BLURV("movdqa");
|
||||||
}
|
}
|
||||||
#endif // HAVE_SSE
|
}
|
||||||
|
#endif // HAVE_SSE
|
||||||
|
|
||||||
|
av_cold void ff_gradfun_init_x86(GradFunContext *gf)
|
||||||
|
{
|
||||||
|
int cpu_flags = av_get_cpu_flags();
|
||||||
|
|
||||||
|
if (HAVE_MMX2 && cpu_flags & AV_CPU_FLAG_MMX2)
|
||||||
|
gf->filter_line = gradfun_filter_line_mmx2;
|
||||||
|
if (HAVE_SSSE3 && cpu_flags & AV_CPU_FLAG_SSSE3)
|
||||||
|
gf->filter_line = gradfun_filter_line_ssse3;
|
||||||
|
if (HAVE_SSE && cpu_flags & AV_CPU_FLAG_SSE2)
|
||||||
|
gf->blur_line = gradfun_blur_line_sse2;
|
||||||
}
|
}
|
||||||
|
Reference in New Issue
Block a user