1
0
mirror of https://github.com/FFmpeg/FFmpeg.git synced 2025-01-13 21:28:01 +02:00

configure: Add wasm as a fake arch

And add wasm simd128 flag, so we can add simd128 optimizations.
It can be enabled by put -msimd128 to extra cflags. There is
no runtime detection on simd128 support yet. I think that needs to
be done with JavaScript.

Signed-off-by: Zhao Zhili <zhilizhao@tencent.com>
This commit is contained in:
Zhao Zhili 2024-11-20 20:44:59 +08:00
parent 7c1e732ad2
commit 2dc55f5993
9 changed files with 76 additions and 1 deletions

View File

@ -104,7 +104,8 @@ SUBDIR_VARS := CLEANFILES FFLIBS HOSTPROGS TESTPROGS TOOLS \
ALTIVEC-OBJS VSX-OBJS MMX-OBJS X86ASM-OBJS \ ALTIVEC-OBJS VSX-OBJS MMX-OBJS X86ASM-OBJS \
MIPSFPU-OBJS MIPSDSPR2-OBJS MIPSDSP-OBJS MSA-OBJS \ MIPSFPU-OBJS MIPSDSPR2-OBJS MIPSDSP-OBJS MSA-OBJS \
MMI-OBJS LSX-OBJS LASX-OBJS RV-OBJS RVV-OBJS RVVB-OBJS \ MMI-OBJS LSX-OBJS LASX-OBJS RV-OBJS RVV-OBJS RVVB-OBJS \
OBJS SLIBOBJS SHLIBOBJS STLIBOBJS HOSTOBJS TESTOBJS OBJS SLIBOBJS SHLIBOBJS STLIBOBJS HOSTOBJS TESTOBJS \
SIMD128-OBJS
define RESET define RESET
$(1) := $(1) :=

16
configure vendored
View File

@ -480,6 +480,7 @@ Optimization options (experts only):
--disable-lasx disable Loongson LASX optimizations --disable-lasx disable Loongson LASX optimizations
--disable-rvv disable RISC-V Vector optimizations --disable-rvv disable RISC-V Vector optimizations
--disable-fast-unaligned consider unaligned accesses slow --disable-fast-unaligned consider unaligned accesses slow
--disable-simd128 disable WebAssembly simd128 optimizations
Developer options (useful when working on FFmpeg itself): Developer options (useful when working on FFmpeg itself):
--disable-debug disable debugging symbols --disable-debug disable debugging symbols
@ -2149,6 +2150,7 @@ ARCH_LIST="
sparc64 sparc64
tilegx tilegx
tilepro tilepro
wasm
x86 x86
x86_32 x86_32
x86_64 x86_64
@ -2189,6 +2191,10 @@ ARCH_EXT_LIST_LOONGSON="
lasx lasx
" "
ARCH_EXT_LIST_WASM="
simd128
"
ARCH_EXT_LIST_X86_SIMD=" ARCH_EXT_LIST_X86_SIMD="
aesni aesni
amd3dnow amd3dnow
@ -2235,6 +2241,7 @@ ARCH_EXT_LIST="
$ARCH_EXT_LIST_ARM $ARCH_EXT_LIST_ARM
$ARCH_EXT_LIST_PPC $ARCH_EXT_LIST_PPC
$ARCH_EXT_LIST_RISCV $ARCH_EXT_LIST_RISCV
$ARCH_EXT_LIST_WASM
$ARCH_EXT_LIST_X86 $ARCH_EXT_LIST_X86
$ARCH_EXT_LIST_MIPS $ARCH_EXT_LIST_MIPS
$ARCH_EXT_LIST_LOONGSON $ARCH_EXT_LIST_LOONGSON
@ -2791,6 +2798,8 @@ mipsdsp_deps="mips"
mipsdspr2_deps="mips" mipsdspr2_deps="mips"
msa_deps="mipsfpu" msa_deps="mipsfpu"
simd128_deps="wasm"
x86_64_select="i686" x86_64_select="i686"
x86_64_suggest="fast_cmov" x86_64_suggest="fast_cmov"
@ -5293,6 +5302,9 @@ case "$arch" in
tilegx|tile-gx) tilegx|tile-gx)
arch="tilegx" arch="tilegx"
;; ;;
wasm*)
arch="wasm"
;;
i[3-6]86*|i86pc|BePC|x86pc|x86_64|x86_32|amd64) i[3-6]86*|i86pc|BePC|x86pc|x86_64|x86_32|amd64)
arch="x86" arch="x86"
;; ;;
@ -6403,6 +6415,10 @@ elif enabled riscv; then
enabled rv_zicbop && check_inline_asm rv_zicbop '".option arch, +zicbop\nprefetch.r 64(a0)"' enabled rv_zicbop && check_inline_asm rv_zicbop '".option arch, +zicbop\nprefetch.r 64(a0)"'
enabled rv_zvbb && check_inline_asm rv_zvbb '".option arch, +zvbb\nvclz.v v0, v8"' enabled rv_zvbb && check_inline_asm rv_zvbb '".option arch, +zvbb\nvclz.v v0, v8"'
elif enabled wasm; then
enabled simd128 && check_cc simd128 wasm_simd128.h "v128_t v = wasm_v128_load(0);"
elif enabled x86; then elif enabled x86; then
check_builtin rdtsc intrin.h "__rdtsc()" check_builtin rdtsc intrin.h "__rdtsc()"

View File

@ -21,5 +21,7 @@ OBJS-$(HAVE_RV) += $(RV-OBJS) $(RV-OBJS-yes)
OBJS-$(HAVE_RVV) += $(RVV-OBJS) $(RVV-OBJS-yes) OBJS-$(HAVE_RVV) += $(RVV-OBJS) $(RVV-OBJS-yes)
OBJS-$(HAVE_RV_ZVBB) += $(RVVB-OBJS) $(RVVB-OBJS-yes) OBJS-$(HAVE_RV_ZVBB) += $(RVVB-OBJS) $(RVVB-OBJS-yes)
OBJS-$(HAVE_SIMD128) += $(SIMD128-OBJS) $(SIMD128-OBJS-yes)
OBJS-$(HAVE_MMX) += $(MMX-OBJS) $(MMX-OBJS-yes) OBJS-$(HAVE_MMX) += $(MMX-OBJS) $(MMX-OBJS-yes)
OBJS-$(HAVE_X86ASM) += $(X86ASM-OBJS) $(X86ASM-OBJS-yes) OBJS-$(HAVE_X86ASM) += $(X86ASM-OBJS) $(X86ASM-OBJS-yes)

View File

@ -68,6 +68,8 @@ static int get_cpu_flags(void)
return ff_get_cpu_flags_ppc(); return ff_get_cpu_flags_ppc();
#elif ARCH_RISCV #elif ARCH_RISCV
return ff_get_cpu_flags_riscv(); return ff_get_cpu_flags_riscv();
#elif ARCH_WASM
return ff_get_cpu_flags_wasm();
#elif ARCH_X86 #elif ARCH_X86
return ff_get_cpu_flags_x86(); return ff_get_cpu_flags_x86();
#elif ARCH_LOONGARCH #elif ARCH_LOONGARCH
@ -200,6 +202,8 @@ int av_parse_cpu_caps(unsigned *flags, const char *s)
{ "zbb", NULL, 0, AV_OPT_TYPE_CONST, { .i64 = AV_CPU_FLAG_RVB_BASIC }, .unit = "flags" }, { "zbb", NULL, 0, AV_OPT_TYPE_CONST, { .i64 = AV_CPU_FLAG_RVB_BASIC }, .unit = "flags" },
{ "zvbb", NULL, 0, AV_OPT_TYPE_CONST, { .i64 = AV_CPU_FLAG_RV_ZVBB }, .unit = "flags" }, { "zvbb", NULL, 0, AV_OPT_TYPE_CONST, { .i64 = AV_CPU_FLAG_RV_ZVBB }, .unit = "flags" },
{ "misaligned", NULL, 0, AV_OPT_TYPE_CONST, { .i64 = AV_CPU_FLAG_RV_MISALIGNED }, .unit = "flags" }, { "misaligned", NULL, 0, AV_OPT_TYPE_CONST, { .i64 = AV_CPU_FLAG_RV_MISALIGNED }, .unit = "flags" },
#elif ARCH_WASM
{ "simd128", NULL, 0, AV_OPT_TYPE_CONST, { .i64 = AV_CPU_FLAG_SIMD128 }, .unit = "flags" },
#endif #endif
{ NULL }, { NULL },
}; };
@ -283,6 +287,8 @@ size_t av_cpu_max_align(void)
return ff_get_cpu_max_align_arm(); return ff_get_cpu_max_align_arm();
#elif ARCH_PPC #elif ARCH_PPC
return ff_get_cpu_max_align_ppc(); return ff_get_cpu_max_align_ppc();
#elif ARCH_WASM
return ff_get_cpu_max_align_wasm();
#elif ARCH_X86 #elif ARCH_X86
return ff_get_cpu_max_align_x86(); return ff_get_cpu_max_align_x86();
#elif ARCH_LOONGARCH #elif ARCH_LOONGARCH

View File

@ -101,6 +101,9 @@
#define AV_CPU_FLAG_RV_MISALIGNED (1 <<10) ///< Fast misaligned accesses #define AV_CPU_FLAG_RV_MISALIGNED (1 <<10) ///< Fast misaligned accesses
#define AV_CPU_FLAG_RVB (1 <<11) ///< B (bit manipulations) #define AV_CPU_FLAG_RVB (1 <<11) ///< B (bit manipulations)
// WASM extensions
#define AV_CPU_FLAG_SIMD128 (1 << 0)
/** /**
* Return the flags which specify extensions supported by the CPU. * Return the flags which specify extensions supported by the CPU.
* The returned value is affected by av_force_cpu_flags() if that was used * The returned value is affected by av_force_cpu_flags() if that was used

View File

@ -49,6 +49,7 @@ int ff_get_cpu_flags_aarch64(void);
int ff_get_cpu_flags_arm(void); int ff_get_cpu_flags_arm(void);
int ff_get_cpu_flags_ppc(void); int ff_get_cpu_flags_ppc(void);
int ff_get_cpu_flags_riscv(void); int ff_get_cpu_flags_riscv(void);
int ff_get_cpu_flags_wasm(void);
int ff_get_cpu_flags_x86(void); int ff_get_cpu_flags_x86(void);
int ff_get_cpu_flags_loongarch(void); int ff_get_cpu_flags_loongarch(void);
@ -56,6 +57,7 @@ size_t ff_get_cpu_max_align_mips(void);
size_t ff_get_cpu_max_align_aarch64(void); size_t ff_get_cpu_max_align_aarch64(void);
size_t ff_get_cpu_max_align_arm(void); size_t ff_get_cpu_max_align_arm(void);
size_t ff_get_cpu_max_align_ppc(void); size_t ff_get_cpu_max_align_ppc(void);
size_t ff_get_cpu_max_align_wasm(void);
size_t ff_get_cpu_max_align_x86(void); size_t ff_get_cpu_max_align_x86(void);
size_t ff_get_cpu_max_align_loongarch(void); size_t ff_get_cpu_max_align_loongarch(void);

View File

@ -104,6 +104,8 @@ static const struct {
{ AV_CPU_FLAG_RVV_F64, "zve64d" }, { AV_CPU_FLAG_RVV_F64, "zve64d" },
{ AV_CPU_FLAG_RV_ZVBB, "zvbb" }, { AV_CPU_FLAG_RV_ZVBB, "zvbb" },
{ AV_CPU_FLAG_RV_MISALIGNED, "misaligned" }, { AV_CPU_FLAG_RV_MISALIGNED, "misaligned" },
#elif ARCH_WASM
{ AV_CPU_FLAG_SIMD128, "simd128" },
#endif #endif
{ 0 } { 0 }
}; };

1
libavutil/wasm/Makefile Normal file
View File

@ -0,0 +1 @@
OBJS += wasm/cpu.o

42
libavutil/wasm/cpu.c Normal file
View File

@ -0,0 +1,42 @@
/*
* Copyright (c) 2024 Zhao Zhili
*
* This file is part of FFmpeg.
*
* FFmpeg is free software; you can redistribute it and/or
* modify it under the terms of the GNU Lesser General Public
* License as published by the Free Software Foundation; either
* version 2.1 of the License, or (at your option) any later version.
*
* FFmpeg is distributed in the hope that it will be useful,
* but WITHOUT ANY WARRANTY; without even the implied warranty of
* MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
* Lesser General Public License for more details.
*
* You should have received a copy of the GNU Lesser General Public
* License along with FFmpeg; if not, write to the Free Software
* Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
*/
#include <stdint.h>
#include "libavutil/cpu_internal.h"
int ff_get_cpu_flags_wasm(void)
{
int flags = 0;
#if HAVE_SIMD128
flags |= AV_CPU_FLAG_SIMD128;
#endif
return flags;
}
size_t ff_get_cpu_max_align_wasm(void)
{
#if HAVE_SIMD128
return 16;
#else
return 8;
#endif
}