1
0
mirror of https://github.com/FFmpeg/FFmpeg.git synced 2025-01-03 05:10:03 +02:00

lavc/fmtconvert: RISC-V V int32_to_float_fmul_array8

This commit is contained in:
Rémi Denis-Courmont 2022-09-26 17:52:44 +03:00 committed by Lynne
parent 47a10b9a99
commit 220dfd0945
2 changed files with 34 additions and 1 deletions

View File

@ -27,13 +27,18 @@
void ff_int32_to_float_fmul_scalar_rvv(float *dst, const int32_t *src,
float mul, int len);
void ff_int32_to_float_fmul_array8_rvv(FmtConvertContext *c, float *dst,
const int32_t *src, const float *mul,
int len);
av_cold void ff_fmt_convert_init_riscv(FmtConvertContext *c)
{
#ifdef HAVE_RVV
int flags = av_get_cpu_flags();
if (flags & AV_CPU_FLAG_RVV_F32)
if (flags & AV_CPU_FLAG_RVV_F32) {
c->int32_to_float_fmul_scalar = ff_int32_to_float_fmul_scalar_rvv;
c->int32_to_float_fmul_array8 = ff_int32_to_float_fmul_array8_rvv;
}
#endif
}

View File

@ -37,3 +37,31 @@ NOHWF mv a2, a3
ret
endfunc
func ff_int32_to_float_fmul_array8_rvv, zve32f
srai a4, a4, 3
1: vsetvli t0, a4, e32, m1, ta, ma
vle32.v v24, (a3)
slli t2, t0, 2 + 3
vlseg8e32.v v16, (a2)
vsetvli t3, zero, e32, m8, ta, ma
vfcvt.f.x.v v16, v16
vsetvli zero, a4, e32, m1, ta, ma
vfmul.vv v16, v16, v24
sub a4, a4, t0
vfmul.vv v17, v17, v24
sh2add a3, t0, a3
vfmul.vv v18, v18, v24
add a2, a2, t2
vfmul.vv v19, v19, v24
vfmul.vv v20, v20, v24
vfmul.vv v21, v21, v24
vfmul.vv v22, v22, v24
vfmul.vv v23, v23, v24
vsseg8e32.v v16, (a1)
add a1, a1, t2
bnez a4, 1b
ret
endfunc