changeset 2625:a8145a712f25

mmx opt ,untested, i have no mga
author michael
date Fri, 02 Nov 2001 03:17:33 +0000
parents 64844fccf623
children da9777831e1b
files libvo/mga_common.c
diffstat 1 files changed, 41 insertions(+), 0 deletions(-) [+]
line wrap: on
line diff
--- a/libvo/mga_common.c	Fri Nov 02 02:55:51 2001 +0000
+++ b/libvo/mga_common.c	Fri Nov 02 03:17:33 2001 +0000
@@ -1,5 +1,6 @@
 
 #include "fastmemcpy.h"
+#include "../mmx_defs.h"
 
 // mga_vid drawing functions
 
@@ -57,15 +58,55 @@
         src2 = image[2];
 	for(h=0; h < height; h++)
 	{
+#ifdef HAVE_MMX
+		asm(
+			"xorl %%eax, %%eax		\n\t"
+			"1:				\n\t"
+			PREFETCH" 64(%1, %%eax)		\n\t"
+			PREFETCH" 64(%2, %%eax)		\n\t"
+			"movq (%1, %%eax), %%mm0	\n\t"
+			"movq 8(%1, %%eax), %%mm2	\n\t"
+			"movq %%mm0, %%mm1		\n\t"
+			"movq %%mm2, %%mm3		\n\t"
+			"movq (%2, %%eax), %%mm4	\n\t"
+			"movq 8(%2, %%eax), %%mm5	\n\t"
+			"punpcklbw %%mm4, %%mm0		\n\t"
+			"punpckhbw %%mm4, %%mm1		\n\t"
+			"punpcklbw %%mm5, %%mm2		\n\t"
+			"punpckhbw %%mm5, %%mm3		\n\t"
+			MOVNTQ" %%mm0, (%0, %%eax, 2)	\n\t"
+			MOVNTQ" %%mm1, 8(%0, %%eax, 2)	\n\t"
+			MOVNTQ" %%mm2, 16(%0, %%eax, 2)	\n\t"
+			MOVNTQ" %%mm3, 24(%0, %%eax, 2)	\n\t"
+			"addl $16, %%eax			\n\t"
+			"cmpl %3, %%eax			\n\t"
+			" jb 1b				\n\t"
+			::"r"(dest), "r"(src), "r"(src2), "r" (width-15)
+			: "memory", "%eax"
+		);
+		for(w= (width&(~15)); w < width; w++)
+		{
+			dest[2*w+0] = src[w];
+			dest[2*w+1] = src2[w];
+		}
+#else
 		for(w=0; w < width; w++)
 		{
 			dest[2*w+0] = src[w];
 			dest[2*w+1] = src2[w];
 		}
+#endif
 		dest += bespitch;
                 src += stride[1];
                 src2+= stride[2];
 	}
+#ifdef HAVE_MMX
+	asm(
+		EMMS" \n\t"
+		SFENCE" \n\t"
+		::: "memory"
+		);
+#endif
 }
 
 static void