mplayer.hg: postproc/swscale_template.c comparison

comparison postproc/swscale_template.c @ 11122:c552fe6acbaa

rounding fixes

author	michael
date	Wed, 15 Oct 2003 11:21:54 +0000
parents	6e35326c742f
children	21e5cb258a95

comparison

Legend: equal | deleted | inserted | replaced

-:554b829860c3
+:c552fe6acbaa
 #define MOVNTQ(a,b) "movq " #a ", " #b " \n\t"
 #endif
 #define YSCALEYUV2YV12X(x, offset) \
 			"xorl %%eax, %%eax		\n\t"\
-			"pxor %%mm3, %%mm3		\n\t"\
+			"movq "VROUNDER_OFFSET"(%0), %%mm3\n\t"\
-			"pxor %%mm4, %%mm4		\n\t"\
+			"movq %%mm3, %%mm4		\n\t"\
 			"leal " offset "(%0), %%edx	\n\t"\
 			"movl (%%edx), %%esi		\n\t"\
 			".balign 16			\n\t" /* FIXME Unroll? */\
 			"1:				\n\t"\
 			"movq 8(%%edx), %%mm0		\n\t" /* filterCoeff */\
 			"psraw $3, %%mm4		\n\t"\
 			"packuswb %%mm4, %%mm3		\n\t"\
 			MOVNTQ(%%mm3, (%1, %%eax))\
 			"addl $8, %%eax			\n\t"\
 			"cmpl %2, %%eax			\n\t"\
-			"pxor %%mm3, %%mm3		\n\t"\
+			"movq "VROUNDER_OFFSET"(%0), %%mm3\n\t"\
-			"pxor %%mm4, %%mm4		\n\t"\
+			"movq %%mm3, %%mm4		\n\t"\
 			"leal " offset "(%0), %%edx	\n\t"\
 			"movl (%%edx), %%esi		\n\t"\
 			"jb 1b				\n\t"
 #define YSCALEYUV2YV121 \
 		".balign 16			\n\t"\
 		"nop				\n\t"\
 		"1:				\n\t"\
 		"leal "CHR_MMX_FILTER_OFFSET"(%0), %%edx	\n\t"\
 		"movl (%%edx), %%esi		\n\t"\
-		"pxor %%mm3, %%mm3		\n\t"\
+		"movq "VROUNDER_OFFSET"(%0), %%mm3\n\t"\
-		"pxor %%mm4, %%mm4		\n\t"\
+		"movq %%mm3, %%mm4		\n\t"\
 		".balign 16			\n\t"\
 		"2:				\n\t"\
 		"movq 8(%%edx), %%mm0		\n\t" /* filterCoeff */\
 		"movq (%%esi, %%eax), %%mm2	\n\t" /* UsrcData */\
 		"movq 4096(%%esi, %%eax), %%mm5	\n\t" /* VsrcData */\
 		"testl %%esi, %%esi		\n\t"\
 		" jnz 2b			\n\t"\
 \
 		"leal "LUM_MMX_FILTER_OFFSET"(%0), %%edx	\n\t"\
 		"movl (%%edx), %%esi		\n\t"\
-		"pxor %%mm1, %%mm1		\n\t"\
+		"movq "VROUNDER_OFFSET"(%0), %%mm1\n\t"\
-		"pxor %%mm7, %%mm7		\n\t"\
+		"movq %%mm1, %%mm7		\n\t"\
 		".balign 16			\n\t"\
 		"2:				\n\t"\
 		"movq 8(%%edx), %%mm0		\n\t" /* filterCoeff */\
 		"movq (%%esi, %%eax, 2), %%mm2	\n\t" /* Y1srcData */\
 		"movq 8(%%esi, %%eax, 2), %%mm5	\n\t" /* Y2srcData */\
 		const int firstLumSrcY= vLumFilterPos[dstY]; //First line needed as input
 		const int firstChrSrcY= vChrFilterPos[chrDstY]; //First line needed as input
 		const int lastLumSrcY= firstLumSrcY + vLumFilterSize -1; // Last line needed as input
 		const int lastChrSrcY= firstChrSrcY + vChrFilterSize -1; // Last line needed as input
+//printf("dstY:%d dstH:%d firstLumSrcY:%d lastInLumBuf:%d vLumBufSize: %d vChrBufSize: %d slice: %d %d vLumFilterSize: %d firstChrSrcY: %d vChrFilterSize: %d c->chrSrcVSubSample: %d\n",
+// dstY, dstH, firstLumSrcY, lastInLumBuf, vLumBufSize, vChrBufSize, srcSliceY, srcSliceH, vLumFilterSize, firstChrSrcY, vChrFilterSize,  c->chrSrcVSubSample);
 		//handle holes (FAST_BILINEAR & weird filters)
 		if(firstLumSrcY > lastInLumBuf) lastInLumBuf= firstLumSrcY-1;
 		if(firstChrSrcY > lastInChrBuf) lastInChrBuf= firstChrSrcY-1;
 //printf("%d %d %d\n", firstChrSrcY, lastInChrBuf, vChrBufSize);
 		ASSERT(firstLumSrcY >= lastInLumBuf - vLumBufSize + 1)

Mercurial > mplayer.hg

comparison postproc/swscale_template.c @ 11122:c552fe6acbaa