mirror of
https://github.com/FFmpeg/FFmpeg.git
synced 2025-03-28 12:32:17 +02:00
swscale/x86/rgb2rgb_template: Fall back to MMX in interleaveBytes() if the alignment is insufficient for SSE*
As a side effect, this also fixes the non-aligned case. Signed-off-by: Michael Niedermayer <michael@niedermayer.cc> (cherry picked from commit a066ff89bcbae6033c2ffda9271cad84f6c1b807)
This commit is contained in:
parent
45430c3753
commit
26e98f9ae5
@ -1887,10 +1887,9 @@ static void RENAME(interleaveBytes)(const uint8_t *src1, const uint8_t *src2, ui
|
|||||||
for (h=0; h < height; h++) {
|
for (h=0; h < height; h++) {
|
||||||
int w;
|
int w;
|
||||||
|
|
||||||
if (width >= 16
|
if (width >= 16) {
|
||||||
#if COMPILE_TEMPLATE_SSE2
|
#if COMPILE_TEMPLATE_SSE2
|
||||||
&& !((((intptr_t)src1) | ((intptr_t)src2) | ((intptr_t)dest))&15)
|
if (!((((intptr_t)src1) | ((intptr_t)src2) | ((intptr_t)dest))&15)) {
|
||||||
)
|
|
||||||
__asm__(
|
__asm__(
|
||||||
"xor %%"REG_a", %%"REG_a" \n\t"
|
"xor %%"REG_a", %%"REG_a" \n\t"
|
||||||
"1: \n\t"
|
"1: \n\t"
|
||||||
@ -1909,8 +1908,8 @@ static void RENAME(interleaveBytes)(const uint8_t *src1, const uint8_t *src2, ui
|
|||||||
::"r"(dest), "r"(src1), "r"(src2), "r" ((x86_reg)width-15)
|
::"r"(dest), "r"(src1), "r"(src2), "r" ((x86_reg)width-15)
|
||||||
: "memory", XMM_CLOBBERS("xmm0", "xmm1", "xmm2",) "%"REG_a
|
: "memory", XMM_CLOBBERS("xmm0", "xmm1", "xmm2",) "%"REG_a
|
||||||
);
|
);
|
||||||
#else
|
} else
|
||||||
)
|
#endif
|
||||||
__asm__(
|
__asm__(
|
||||||
"xor %%"REG_a", %%"REG_a" \n\t"
|
"xor %%"REG_a", %%"REG_a" \n\t"
|
||||||
"1: \n\t"
|
"1: \n\t"
|
||||||
@ -1936,7 +1935,8 @@ static void RENAME(interleaveBytes)(const uint8_t *src1, const uint8_t *src2, ui
|
|||||||
::"r"(dest), "r"(src1), "r"(src2), "r" ((x86_reg)width-15)
|
::"r"(dest), "r"(src1), "r"(src2), "r" ((x86_reg)width-15)
|
||||||
: "memory", "%"REG_a
|
: "memory", "%"REG_a
|
||||||
);
|
);
|
||||||
#endif
|
|
||||||
|
}
|
||||||
for (w= (width&(~15)); w < width; w++) {
|
for (w= (width&(~15)); w < width; w++) {
|
||||||
dest[2*w+0] = src1[w];
|
dest[2*w+0] = src1[w];
|
||||||
dest[2*w+1] = src2[w];
|
dest[2*w+1] = src2[w];
|
||||||
|
Loading…
x
Reference in New Issue
Block a user