diff x86/vp8dsp-init.c @ 12086:d780ae746855 libavcodec

Simple H/V loopfilter for VP8 in MMX, MMX2 and SSE2 (yay for yasm macros).
author rbultje
date Sat, 03 Jul 2010 19:26:30 +0000
parents 8527154f6e81
children b246b214c2e9
line wrap: on
line diff
--- a/x86/vp8dsp-init.c	Sat Jul 03 18:36:10 2010 +0000
+++ b/x86/vp8dsp-init.c	Sat Jul 03 19:26:30 2010 +0000
@@ -222,6 +222,13 @@
 extern void ff_vp8_idct_dc_add_sse4(uint8_t *dst, DCTELEM block[16], int stride);
 extern void ff_vp8_luma_dc_wht_mmxext(DCTELEM block[4][4][16], DCTELEM dc[16]);
 extern void ff_vp8_idct_add_mmx(uint8_t *dst, DCTELEM block[16], int stride);
+
+extern void ff_vp8_v_loop_filter_simple_mmx   (uint8_t *dst, int stride, int flim);
+extern void ff_vp8_v_loop_filter_simple_mmxext(uint8_t *dst, int stride, int flim);
+extern void ff_vp8_v_loop_filter_simple_sse2  (uint8_t *dst, int stride, int flim);
+extern void ff_vp8_h_loop_filter_simple_mmx   (uint8_t *dst, int stride, int flim);
+extern void ff_vp8_h_loop_filter_simple_mmxext(uint8_t *dst, int stride, int flim);
+extern void ff_vp8_h_loop_filter_simple_sse2  (uint8_t *dst, int stride, int flim);
 #endif
 
 #define VP8_LUMA_MC_FUNC(IDX, SIZE, OPT) \
@@ -260,6 +267,9 @@
         c->put_vp8_bilinear_pixels_tab[0][0][0] = ff_put_vp8_pixels16_mmx;
         c->put_vp8_epel_pixels_tab[1][0][0]     =
         c->put_vp8_bilinear_pixels_tab[1][0][0] = ff_put_vp8_pixels8_mmx;
+
+        c->vp8_v_loop_filter_simple = ff_vp8_v_loop_filter_simple_mmx;
+        c->vp8_h_loop_filter_simple = ff_vp8_h_loop_filter_simple_mmx;
     }
 
     /* note that 4-tap width=16 functions are missing because w=16
@@ -272,6 +282,9 @@
         VP8_BILINEAR_MC_FUNC(0, 16, mmxext);
         VP8_BILINEAR_MC_FUNC(1, 8, mmxext);
         VP8_BILINEAR_MC_FUNC(2, 4, mmxext);
+
+        c->vp8_v_loop_filter_simple = ff_vp8_v_loop_filter_simple_mmxext;
+        c->vp8_h_loop_filter_simple = ff_vp8_h_loop_filter_simple_mmxext;
     }
 
     if (mm_flags & FF_MM_SSE) {
@@ -284,6 +297,9 @@
         VP8_MC_FUNC(1, 8, sse2);
         VP8_BILINEAR_MC_FUNC(0, 16, sse2);
         VP8_BILINEAR_MC_FUNC(1, 8, sse2);
+
+        c->vp8_v_loop_filter_simple = ff_vp8_v_loop_filter_simple_sse2;
+        c->vp8_h_loop_filter_simple = ff_vp8_h_loop_filter_simple_sse2;
     }
 
     if (mm_flags & FF_MM_SSSE3) {