1
0
mirror of https://github.com/FFmpeg/FFmpeg.git synced 2024-12-23 12:43:46 +02:00

Merge commit 'd7320ca3ed10f0d35b3740fa03341161e74275ea'

* commit 'd7320ca3ed10f0d35b3740fa03341161e74275ea':
  arm: Avoid using .dn register aliases

Merged-by: James Almer <jamrial@gmail.com>
This commit is contained in:
James Almer 2017-10-30 21:00:51 -03:00
commit 921993503b
3 changed files with 5 additions and 25 deletions

5
configure vendored
View File

@ -2053,7 +2053,6 @@ SYSTEM_FUNCS="
TOOLCHAIN_FEATURES=" TOOLCHAIN_FEATURES="
as_arch_directive as_arch_directive
as_dn_directive
as_fpu_directive as_fpu_directive
as_func as_func
as_object_arch as_object_arch
@ -5526,10 +5525,6 @@ EOF
check_as <<EOF && enable as_arch_directive check_as <<EOF && enable as_arch_directive
.arch armv7-a .arch armv7-a
EOF
check_as <<EOF && enable as_dn_directive
ra .dn d0.i16
.unreq ra
EOF EOF
check_as <<EOF && enable as_fpu_directive check_as <<EOF && enable as_fpu_directive
.fpu neon .fpu neon

View File

@ -22,8 +22,6 @@
#include "libavcodec/vc1dsp.h" #include "libavcodec/vc1dsp.h"
#include "vc1dsp.h" #include "vc1dsp.h"
#include "config.h"
void ff_vc1_inv_trans_8x8_neon(int16_t *block); void ff_vc1_inv_trans_8x8_neon(int16_t *block);
void ff_vc1_inv_trans_4x8_neon(uint8_t *dest, ptrdiff_t stride, int16_t *block); void ff_vc1_inv_trans_4x8_neon(uint8_t *dest, ptrdiff_t stride, int16_t *block);
void ff_vc1_inv_trans_8x4_neon(uint8_t *dest, ptrdiff_t stride, int16_t *block); void ff_vc1_inv_trans_8x4_neon(uint8_t *dest, ptrdiff_t stride, int16_t *block);
@ -95,7 +93,6 @@ av_cold void ff_vc1dsp_init_neon(VC1DSPContext *dsp)
dsp->vc1_inv_trans_4x4_dc = ff_vc1_inv_trans_4x4_dc_neon; dsp->vc1_inv_trans_4x4_dc = ff_vc1_inv_trans_4x4_dc_neon;
dsp->put_vc1_mspel_pixels_tab[1][ 0] = ff_put_pixels8x8_neon; dsp->put_vc1_mspel_pixels_tab[1][ 0] = ff_put_pixels8x8_neon;
if (HAVE_AS_DN_DIRECTIVE) {
FN_ASSIGN(1, 0); FN_ASSIGN(1, 0);
FN_ASSIGN(2, 0); FN_ASSIGN(2, 0);
FN_ASSIGN(3, 0); FN_ASSIGN(3, 0);
@ -114,7 +111,6 @@ av_cold void ff_vc1dsp_init_neon(VC1DSPContext *dsp)
FN_ASSIGN(1, 3); FN_ASSIGN(1, 3);
FN_ASSIGN(2, 3); FN_ASSIGN(2, 3);
FN_ASSIGN(3, 3); FN_ASSIGN(3, 3);
}
dsp->put_no_rnd_vc1_chroma_pixels_tab[0] = ff_put_vc1_chroma_mc8_neon; dsp->put_no_rnd_vc1_chroma_pixels_tab[0] = ff_put_vc1_chroma_mc8_neon;
dsp->avg_no_rnd_vc1_chroma_pixels_tab[0] = ff_avg_vc1_chroma_mc8_neon; dsp->avg_no_rnd_vc1_chroma_pixels_tab[0] = ff_avg_vc1_chroma_mc8_neon;

View File

@ -663,7 +663,6 @@ function ff_vc1_inv_trans_4x4_neon, export=1
bx lr bx lr
endfunc endfunc
#if HAVE_AS_DN_DIRECTIVE
@ The absolute value of multiplication constants from vc1_mspel_filter and vc1_mspel_{ver,hor}_filter_16bits. @ The absolute value of multiplication constants from vc1_mspel_filter and vc1_mspel_{ver,hor}_filter_16bits.
@ The sign is embedded in the code below that carries out the multiplication (mspel_filter{,.16}). @ The sign is embedded in the code below that carries out the multiplication (mspel_filter{,.16}).
#define MSPEL_MODE_1_MUL_CONSTANTS 4 53 18 3 #define MSPEL_MODE_1_MUL_CONSTANTS 4 53 18 3
@ -689,22 +688,18 @@ endfunc
@ Setup constants in registers for a subsequent use of mspel_filter{,.16}. @ Setup constants in registers for a subsequent use of mspel_filter{,.16}.
.macro mspel_constants typesize reg_a reg_b reg_c reg_d filter_a filter_b filter_c filter_d reg_add filter_add_register .macro mspel_constants typesize reg_a reg_b reg_c reg_d filter_a filter_b filter_c filter_d reg_add filter_add_register
@ Define double-word register aliases. Typesize should be i8 or i16. @ Typesize should be i8 or i16.
ra .dn \reg_a\().\typesize
rb .dn \reg_b\().\typesize
rc .dn \reg_c\().\typesize
rd .dn \reg_d\().\typesize
@ Only set the register if the value is not 1 and unique @ Only set the register if the value is not 1 and unique
.if \filter_a != 1 .if \filter_a != 1
vmov ra, #\filter_a @ ra = filter_a vmov.\typesize \reg_a, #\filter_a @ reg_a = filter_a
.endif .endif
vmov rb, #\filter_b @ rb = filter_b vmov.\typesize \reg_b, #\filter_b @ reg_b = filter_b
.if \filter_b != \filter_c .if \filter_b != \filter_c
vmov rc, #\filter_c @ rc = filter_c vmov.\typesize \reg_c, #\filter_c @ reg_c = filter_c
.endif .endif
.if \filter_d != 1 .if \filter_d != 1
vmov rd, #\filter_d @ rd = filter_d vmov.\typesize \reg_d, #\filter_d @ reg_d = filter_d
.endif .endif
@ vdup to double the size of typesize @ vdup to double the size of typesize
.ifc \typesize,i8 .ifc \typesize,i8
@ -712,11 +707,6 @@ endfunc
.else .else
vdup.32 \reg_add, \filter_add_register @ reg_add = filter_add_register vdup.32 \reg_add, \filter_add_register @ reg_add = filter_add_register
.endif .endif
.unreq ra
.unreq rb
.unreq rc
.unreq rd
.endm .endm
@ After mspel_constants has been used, do the filtering. @ After mspel_constants has been used, do the filtering.
@ -987,7 +977,6 @@ PUT_VC1_MSPEL_MC_V_ONLY(2)
PUT_VC1_MSPEL_MC_V_ONLY(3) PUT_VC1_MSPEL_MC_V_ONLY(3)
#undef PUT_VC1_MSPEL_MC_V_ONLY #undef PUT_VC1_MSPEL_MC_V_ONLY
#endif
function ff_put_pixels8x8_neon, export=1 function ff_put_pixels8x8_neon, export=1
vld1.64 {d0}, [r1], r2 vld1.64 {d0}, [r1], r2