Commit 41eb0192 authored by michael's avatar michael

yuv9 -> yv12 bugfixes


git-svn-id: file:///var/local/repositories/mplayer/trunk/postproc@9257 b3059339-0415-0410-9bf9-f77b7e298cf2
parent 0f29f2de
...@@ -1619,16 +1619,20 @@ static inline void RENAME(planar2x)(const uint8_t *src, uint8_t *dst, int srcWid ...@@ -1619,16 +1619,20 @@ static inline void RENAME(planar2x)(const uint8_t *src, uint8_t *dst, int srcWid
{ {
int x,y; int x,y;
dst[0]= src[0];
// first line // first line
for(x=0; x<srcWidth; x++){ for(x=0; x<srcWidth-1; x++){
dst[2*x+0]= dst[2*x+1]= (3*src[x] + src[x+1])>>2;
dst[2*x+1]= src[x]; dst[2*x+2]= ( src[x] + 3*src[x+1])>>2;
} }
dst[2*srcWidth-1]= src[srcWidth-1];
dst+= dstStride; dst+= dstStride;
for(y=1; y<srcHeight; y++){ for(y=1; y<srcHeight; y++){
#if defined (HAVE_MMX2) || defined (HAVE_3DNOW) #if defined (HAVE_MMX2) || defined (HAVE_3DNOW)
const int mmxSize= srcWidth; const int mmxSize= srcWidth&~15;
asm volatile( asm volatile(
"movl %4, %%eax \n\t" "movl %4, %%eax \n\t"
"1: \n\t" "1: \n\t"
...@@ -1636,67 +1640,76 @@ static inline void RENAME(planar2x)(const uint8_t *src, uint8_t *dst, int srcWid ...@@ -1636,67 +1640,76 @@ static inline void RENAME(planar2x)(const uint8_t *src, uint8_t *dst, int srcWid
"movq (%1, %%eax), %%mm1 \n\t" "movq (%1, %%eax), %%mm1 \n\t"
"movq 1(%0, %%eax), %%mm2 \n\t" "movq 1(%0, %%eax), %%mm2 \n\t"
"movq 1(%1, %%eax), %%mm3 \n\t" "movq 1(%1, %%eax), %%mm3 \n\t"
"movq %%mm0, %%mm4 \n\t" "movq -1(%0, %%eax), %%mm4 \n\t"
"movq %%mm1, %%mm5 \n\t" "movq -1(%1, %%eax), %%mm5 \n\t"
PAVGB" %%mm3, %%mm0 \n\t" PAVGB" %%mm0, %%mm5 \n\t"
PAVGB" %%mm3, %%mm0 \n\t" PAVGB" %%mm0, %%mm3 \n\t"
PAVGB" %%mm4, %%mm3 \n\t" PAVGB" %%mm0, %%mm5 \n\t"
PAVGB" %%mm4, %%mm3 \n\t" PAVGB" %%mm0, %%mm3 \n\t"
PAVGB" %%mm2, %%mm1 \n\t" PAVGB" %%mm1, %%mm4 \n\t"
PAVGB" %%mm2, %%mm1 \n\t" PAVGB" %%mm1, %%mm2 \n\t"
PAVGB" %%mm5, %%mm2 \n\t" PAVGB" %%mm1, %%mm4 \n\t"
PAVGB" %%mm5, %%mm2 \n\t" PAVGB" %%mm1, %%mm2 \n\t"
"movq %%mm3, %%mm4 \n\t" "movq %%mm5, %%mm7 \n\t"
"movq %%mm2, %%mm5 \n\t" "movq %%mm4, %%mm6 \n\t"
"punpcklbw %%mm1, %%mm3 \n\t" "punpcklbw %%mm3, %%mm5 \n\t"
"punpckhbw %%mm1, %%mm4 \n\t" "punpckhbw %%mm3, %%mm7 \n\t"
"punpcklbw %%mm0, %%mm2 \n\t" "punpcklbw %%mm2, %%mm4 \n\t"
"punpckhbw %%mm0, %%mm5 \n\t" "punpckhbw %%mm2, %%mm6 \n\t"
#if 1 #if 1
MOVNTQ" %%mm3, (%2, %%eax, 2) \n\t" MOVNTQ" %%mm5, (%2, %%eax, 2) \n\t"
MOVNTQ" %%mm4, 8(%2, %%eax, 2) \n\t" MOVNTQ" %%mm7, 8(%2, %%eax, 2) \n\t"
MOVNTQ" %%mm2, (%3, %%eax, 2) \n\t" MOVNTQ" %%mm4, (%3, %%eax, 2) \n\t"
MOVNTQ" %%mm5, 8(%3, %%eax, 2) \n\t" MOVNTQ" %%mm6, 8(%3, %%eax, 2) \n\t"
#else #else
"movq %%mm3, (%2, %%eax, 2) \n\t" "movq %%mm5, (%2, %%eax, 2) \n\t"
"movq %%mm4, 8(%2, %%eax, 2) \n\t" "movq %%mm7, 8(%2, %%eax, 2) \n\t"
"movq %%mm2, (%3, %%eax, 2) \n\t" "movq %%mm4, (%3, %%eax, 2) \n\t"
"movq %%mm5, 8(%3, %%eax, 2) \n\t" "movq %%mm6, 8(%3, %%eax, 2) \n\t"
#endif #endif
"addl $8, %%eax \n\t" "addl $8, %%eax \n\t"
" js 1b \n\t" " js 1b \n\t"
:: "r" (src + mmxSize-1), "r" (src + srcStride + mmxSize-1), :: "r" (src + mmxSize ), "r" (src + srcStride + mmxSize ),
"r" (dst + mmxSize*2), "r" (dst + dstStride + mmxSize*2), "r" (dst + mmxSize*2), "r" (dst + dstStride + mmxSize*2),
"g" (-mmxSize) "g" (-mmxSize)
: "%eax" : "%eax"
); );
dst[0]=
dst[dstStride]= src[0];
#else #else
dst[0]= const int mmxSize=1;
dst[dstStride]= src[0]; #endif
dst[0 ]= (3*src[0] + src[srcStride])>>2;
dst[dstStride]= ( src[0] + 3*src[srcStride])>>2;
for(x=0; x<srcWidth-1; x++){ for(x=mmxSize-1; x<srcWidth-1; x++){
dst[2*x +1]= (3*src[x+0] + src[x+srcStride+1])>>2; dst[2*x +1]= (3*src[x+0] + src[x+srcStride+1])>>2;
dst[2*x+dstStride+2]= ( src[x+0] + 3*src[x+srcStride+1])>>2; dst[2*x+dstStride+2]= ( src[x+0] + 3*src[x+srcStride+1])>>2;
dst[2*x+dstStride+1]= ( src[x+1] + 3*src[x+srcStride ])>>2; dst[2*x+dstStride+1]= ( src[x+1] + 3*src[x+srcStride ])>>2;
dst[2*x +2]= (3*src[x+1] + src[x+srcStride ])>>2; dst[2*x +2]= (3*src[x+1] + src[x+srcStride ])>>2;
} }
#endif dst[srcWidth*2 -1 ]= (3*src[srcWidth-1] + src[srcWidth-1 + srcStride])>>2;
dst[srcWidth*2 -1]= dst[srcWidth*2 -1 + dstStride]= ( src[srcWidth-1] + 3*src[srcWidth-1 + srcStride])>>2;
dst[srcWidth*2 -1 + dstStride]= src[srcWidth-1];
dst+=dstStride*2; dst+=dstStride*2;
src+=srcStride; src+=srcStride;
} }
src-=srcStride;
// last line // last line
#if 1
dst[0]= src[0];
for(x=0; x<srcWidth-1; x++){
dst[2*x+1]= (3*src[x] + src[x+1])>>2;
dst[2*x+2]= ( src[x] + 3*src[x+1])>>2;
}
dst[2*srcWidth-1]= src[srcWidth-1];
#else
for(x=0; x<srcWidth; x++){ for(x=0; x<srcWidth; x++){
dst[2*x+0]= dst[2*x+0]=
dst[2*x+1]= src[x]; dst[2*x+1]= src[x];
} }
#endif
#ifdef HAVE_MMX #ifdef HAVE_MMX
asm volatile( EMMS" \n\t" asm volatile( EMMS" \n\t"
SFENCE" \n\t" SFENCE" \n\t"
......
Markdown is supported
0%
or
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or to comment