1
0
mirror of https://github.com/FFmpeg/FFmpeg.git synced 2024-12-23 12:43:46 +02:00

comment about failed optimization

Originally committed as revision 6887 to svn://svn.ffmpeg.org/ffmpeg/trunk
This commit is contained in:
Michael Niedermayer 2006-11-03 15:17:36 +00:00
parent 80c5b9a161
commit 9347118237

View File

@ -402,7 +402,7 @@ static inline void h264_loop_filter_luma_mmx2(uint8_t *pix, int stride, int alph
"pandn %%mm7, %%mm6 \n\t"
"pcmpeqb %%mm7, %%mm6 \n\t"
"pand %%mm7, %%mm6 \n\t" // mask & |p2-p0|<beta
"movq 8+%0, %%mm4 \n\t"
"movq 8+%0, %%mm4 \n\t" // could be merged with the pand below, but that is slower
"pand %%mm7, %%mm4 \n\t" // mask & tc0
"movq %%mm4, %%mm7 \n\t"
"psubb %%mm6, %%mm7 \n\t"
@ -415,7 +415,7 @@ static inline void h264_loop_filter_luma_mmx2(uint8_t *pix, int stride, int alph
"pandn %0, %%mm6 \n\t"
"pcmpeqb %0, %%mm6 \n\t"
"pand %0, %%mm6 \n\t"
"movq 8+%0, %%mm5 \n\t"
"movq 8+%0, %%mm5 \n\t" // could be merged with the pand below, but that is slower
"pand %%mm6, %%mm5 \n\t"
"psubb %%mm6, %%mm7 \n\t"
"movq (%2,%3), %%mm3 \n\t"