diff x86/vp8dsp-init.c @ 11992:da388061b227 libavcodec

Add x86 asm functions for VP8 put_pixels
author darkshikari
date Mon, 28 Jun 2010 19:14:40 +0000
parents a6d24fc1deb7
children c15e87b9767b
line wrap: on
line diff
--- a/x86/vp8dsp-init.c	Mon Jun 28 18:56:24 2010 +0000
+++ b/x86/vp8dsp-init.c	Mon Jun 28 19:14:40 2010 +0000
@@ -87,6 +87,16 @@
                                           uint8_t *src, int srcstride,
                                           int height, int mx, int my);
 
+extern void ff_put_vp8_pixels8_mmx (uint8_t *dst, int dststride,
+                                    uint8_t *src, int srcstride,
+                                    int height, int mx, int my);
+extern void ff_put_vp8_pixels16_mmx(uint8_t *dst, int dststride,
+                                    uint8_t *src, int srcstride,
+                                    int height, int mx, int my);
+extern void ff_put_vp8_pixels16_sse(uint8_t *dst, int dststride,
+                                    uint8_t *src, int srcstride,
+                                    int height, int mx, int my);
+
 #define TAP_W16(OPT, FILTERTYPE, TAPTYPE) \
 static void ff_put_vp8_ ## FILTERTYPE ## 16_ ## TAPTYPE ## _ ## OPT( \
     uint8_t *dst,  int dststride, uint8_t *src, \
@@ -218,6 +228,10 @@
 #if HAVE_YASM
     if (mm_flags & FF_MM_MMX) {
         c->vp8_idct_dc_add                  = ff_vp8_idct_dc_add_mmx;
+        c->put_vp8_epel_pixels_tab[0][0][0]     =
+        c->put_vp8_bilinear_pixels_tab[0][0][0] = ff_put_vp8_pixels16_mmx;
+        c->put_vp8_epel_pixels_tab[1][0][0]     =
+        c->put_vp8_bilinear_pixels_tab[1][0][0] = ff_put_vp8_pixels8_mmx;
     }
 
     /* note that 4-tap width=16 functions are missing because w=16
@@ -231,6 +245,11 @@
         VP8_BILINEAR_MC_FUNC(1, 4, mmxext);
     }
 
+    if (mm_flags & FF_MM_SSE) {
+        c->put_vp8_epel_pixels_tab[0][0][0]     =
+        c->put_vp8_bilinear_pixels_tab[0][0][0] = ff_put_vp8_pixels16_sse;
+    }
+
     if (mm_flags & FF_MM_SSE2) {
         VP8_LUMA_MC_FUNC(0, 16, sse2);
         VP8_MC_FUNC(1, 8, sse2);