mirror of
https://github.com/FFmpeg/FFmpeg.git
synced 2024-12-07 11:13:41 +02:00
06f94149c6
Separate dsp.resample into dsp.resample_common and dsp.resample_linear, and choose to call the faster resample_common even when linear_interp=on, when c->frac and c->dst_incr_mod are both zero. This speeds up resampling when exact_rational and linear_interp are both enabled, because exact_rational forces c->frac and c->dst_incr_mod to be zero when soft compensation does not happen. Benchmark on exact_rational=on:linear_interp=on (old -> new): real 8.432s -> 5.097s, user 7.679s -> 4.989s, sys 0.125s -> 0.107s. Reviewed-by: Michael Niedermayer <michael@niedermayer.cc> Signed-off-by: Muhammad Faiz <mfcc64@gmail.com>
91 lines
3.3 KiB
C
91 lines
3.3 KiB
C
/*
|
|
* audio resampling
|
|
* Copyright (c) 2004-2012 Michael Niedermayer <michaelni@gmx.at>
|
|
*
|
|
* This file is part of FFmpeg.
|
|
*
|
|
* FFmpeg is free software; you can redistribute it and/or
|
|
* modify it under the terms of the GNU Lesser General Public
|
|
* License as published by the Free Software Foundation; either
|
|
* version 2.1 of the License, or (at your option) any later version.
|
|
*
|
|
* FFmpeg is distributed in the hope that it will be useful,
|
|
* but WITHOUT ANY WARRANTY; without even the implied warranty of
|
|
* MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
|
|
* Lesser General Public License for more details.
|
|
*
|
|
* You should have received a copy of the GNU Lesser General Public
|
|
* License along with FFmpeg; if not, write to the Free Software
|
|
* Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
|
|
*/
|
|
|
|
/**
|
|
* @file
|
|
* audio resampling
|
|
* @author Michael Niedermayer <michaelni@gmx.at>
|
|
*/
|
|
|
|
#include "libavutil/x86/cpu.h"
|
|
#include "libswresample/resample.h"
|
|
|
|
/*
 * Declare the two resampling entry points for one sample type / instruction
 * set pair:
 *   ff_resample_common_<fmt>_<isa>
 *   ff_resample_linear_<fmt>_<isa>
 * Both share the same signature. The second prototype is deliberately left
 * without a trailing semicolon, so every use of the macro must supply it.
 * The functions themselves are defined outside this file.
 */
#define RESAMPLE_FUNCS(fmt, isa)                                            \
int ff_resample_common_##fmt##_##isa(ResampleContext *c, void *dst,         \
                                     const void *src, int sz, int upd);     \
int ff_resample_linear_##fmt##_##isa(ResampleContext *c, void *dst,         \
                                     const void *src, int sz, int upd)
|
|
|
|
RESAMPLE_FUNCS(int16, mmxext);
|
|
RESAMPLE_FUNCS(int16, sse2);
|
|
RESAMPLE_FUNCS(int16, xop);
|
|
RESAMPLE_FUNCS(float, sse);
|
|
RESAMPLE_FUNCS(float, avx);
|
|
RESAMPLE_FUNCS(float, fma3);
|
|
RESAMPLE_FUNCS(float, fma4);
|
|
RESAMPLE_FUNCS(double, sse2);
|
|
|
|
/**
 * Install x86-specific resampling routines into a resample context.
 *
 * Depending on c->format, the resample_common and resample_linear pointers
 * in c->dsp are set to the matching ff_resample_*() variants. Within one
 * format the checks run one after another, so when several of them succeed
 * the assignment made by the last successful check is the one that remains.
 * If no check succeeds, or the format is none of S16P / FLTP / DBLP, c->dsp
 * is left unmodified.
 *
 * @param c resample context; c->format is read and c->dsp is updated
 */
av_cold void swri_resample_dsp_x86_init(ResampleContext *c)
{
    /* NOTE(review): av_unused presumably silences an unused-variable warning
     * in builds where the EXTERNAL_*() checks do not evaluate their argument
     * -- confirm against libavutil/x86/cpu.h. */
    int av_unused cpu_flags = av_get_cpu_flags();

    switch (c->format) {
    case AV_SAMPLE_FMT_S16P:
        /* The MMXEXT variant is only considered when ARCH_X86_32 is set. */
        if (ARCH_X86_32 && EXTERNAL_MMXEXT(cpu_flags)) {
            c->dsp.resample_common = ff_resample_common_int16_mmxext;
            c->dsp.resample_linear = ff_resample_linear_int16_mmxext;
        }
        if (EXTERNAL_SSE2(cpu_flags)) {
            c->dsp.resample_common = ff_resample_common_int16_sse2;
            c->dsp.resample_linear = ff_resample_linear_int16_sse2;
        }
        if (EXTERNAL_XOP(cpu_flags)) {
            c->dsp.resample_common = ff_resample_common_int16_xop;
            c->dsp.resample_linear = ff_resample_linear_int16_xop;
        }
        break;

    case AV_SAMPLE_FMT_FLTP:
        if (EXTERNAL_SSE(cpu_flags)) {
            c->dsp.resample_common = ff_resample_common_float_sse;
            c->dsp.resample_linear = ff_resample_linear_float_sse;
        }
        if (EXTERNAL_AVX_FAST(cpu_flags)) {
            c->dsp.resample_common = ff_resample_common_float_avx;
            c->dsp.resample_linear = ff_resample_linear_float_avx;
        }
        if (EXTERNAL_FMA3_FAST(cpu_flags)) {
            c->dsp.resample_common = ff_resample_common_float_fma3;
            c->dsp.resample_linear = ff_resample_linear_float_fma3;
        }
        /* Checked last, so FMA4 wins over FMA3 when both checks pass. */
        if (EXTERNAL_FMA4(cpu_flags)) {
            c->dsp.resample_common = ff_resample_common_float_fma4;
            c->dsp.resample_linear = ff_resample_linear_float_fma4;
        }
        break;

    case AV_SAMPLE_FMT_DBLP:
        if (EXTERNAL_SSE2(cpu_flags)) {
            c->dsp.resample_common = ff_resample_common_double_sse2;
            c->dsp.resample_linear = ff_resample_linear_double_sse2;
        }
        break;

    default:
        /* No x86 routines for other formats; keep whatever is already set. */
        break;
    }
}
|