# HG changeset patch
# User darkshikari
# Date 1277489647 0
# Node ID 56aba5a9761ceea6de9e45eaefdae9368c5925f3
# Parent  778bdafd5496ac91b601c87a5281a2b7881a9fed
Make VP8 DSP functions take two strides
This isn't useful for the C functions, but will allow re-using H and V functions
for HV functions without adding separate H and V wrappers.

diff -r 778bdafd5496 -r 56aba5a9761c dsputil.c
--- a/dsputil.c	Fri Jun 25 13:43:55 2010 +0000
+++ b/dsputil.c	Fri Jun 25 18:14:07 2010 +0000
@@ -2657,18 +2657,6 @@
 }
 #endif /* CONFIG_RV40_DECODER */
 
-#if CONFIG_VP8_DECODER
-void ff_put_vp8_pixels16_c(uint8_t *dst, uint8_t *src, int stride, int h, int x, int y) {
-    put_pixels16_c(dst, src, stride, h);
-}
-void ff_put_vp8_pixels8_c(uint8_t *dst, uint8_t *src, int stride, int h, int x, int y) {
-    put_pixels8_c(dst, src, stride, h);
-}
-void ff_put_vp8_pixels4_c(uint8_t *dst, uint8_t *src, int stride, int h, int x, int y) {
-    put_pixels4_c(dst, src, stride, h);
-}
-#endif
-
 static void wmv2_mspel8_v_lowpass(uint8_t *dst, uint8_t *src, int dstStride, int srcStride, int w){
     uint8_t *cm = ff_cropTbl + MAX_NEG_CROP;
     int i;
diff -r 778bdafd5496 -r 56aba5a9761c vp8.c
--- a/vp8.c	Fri Jun 25 13:43:55 2010 +0000
+++ b/vp8.c	Fri Jun 25 18:14:07 2010 +0000
@@ -912,7 +912,7 @@
                           uint8_t *dst, uint8_t *src, const VP56mv *mv,
                           int x_off, int y_off, int block_w, int block_h,
                           int width, int height, int linesize,
-                          h264_chroma_mc_func mc_func[3][3])
+                          vp8_mc_func mc_func[3][3])
 {
     static const uint8_t idx[8] = { 0, 1, 2, 1, 2, 1, 2, 1 };
     int mx = (mv->x << luma)&7, mx_idx = idx[mx];
@@ -931,7 +931,7 @@
         src = s->edge_emu_buffer + 2 + linesize * 2;
     }
 
-    mc_func[my_idx][mx_idx](dst, src, linesize, block_h, mx, my);
+    mc_func[my_idx][mx_idx](dst, linesize, src, linesize, block_h, mx, my);
 }
 
 /**
diff -r 778bdafd5496 -r 56aba5a9761c vp8dsp.c
--- a/vp8dsp.c	Fri Jun 25 13:43:55 2010 +0000
+++ b/vp8dsp.c	Fri Jun 25 18:14:07 2010 +0000
@@ -250,6 +250,16 @@
     { 0,   1,  12, 123,   6,   0 },
 };
 
+#define PUT_PIXELS(WIDTH) \
+static void put_vp8_pixels ## WIDTH ##_c(uint8_t *dst, int dststride, uint8_t *src, int srcstride, int h, int x, int y) { \
+    for (int y = 0; y < h; y++, dst+= dststride, src+= srcstride) { \
+        memcpy(dst, src, WIDTH); \
+    } \
+}
+
+PUT_PIXELS(16)
+PUT_PIXELS(8)
+PUT_PIXELS(4)
 
 #define FILTER_6TAP(src, F, stride) \
     av_clip_uint8((F[2]*src[x+0*stride] - F[1]*src[x-1*stride] + F[0]*src[x-2*stride] + \
@@ -260,7 +270,7 @@
                    F[3]*src[x+1*stride] - F[4]*src[x+2*stride] + 64) >> 7)
 
 #define VP8_EPEL_H(SIZE, FILTER, FILTERNAME) \
-static void put_vp8_epel ## SIZE ## _ ## FILTERNAME ## _c(uint8_t *dst, uint8_t *src, int stride, int h, int mx, int my) \
+static void put_vp8_epel ## SIZE ## _ ## FILTERNAME ## _c(uint8_t *dst, int dststride, uint8_t *src, int srcstride, int h, int mx, int my) \
 { \
     const uint8_t *filter = subpel_filters[mx-1]; \
     int x, y; \
@@ -268,37 +278,37 @@
     for (y = 0; y < h; y++) { \
         for (x = 0; x < SIZE; x++) \
             dst[x] = FILTER(src, filter, 1); \
-        dst += stride; \
-        src += stride; \
+        dst += dststride; \
+        src += srcstride; \
     } \
 }
 #define VP8_EPEL_V(SIZE, FILTER, FILTERNAME) \
-static void put_vp8_epel ## SIZE ## _ ## FILTERNAME ## _c(uint8_t *dst, uint8_t *src, int stride, int h, int mx, int my) \
+static void put_vp8_epel ## SIZE ## _ ## FILTERNAME ## _c(uint8_t *dst, int dststride, uint8_t *src, int srcstride, int h, int mx, int my) \
 { \
     const uint8_t *filter = subpel_filters[my-1]; \
     int x, y; \
 \
     for (y = 0; y < h; y++) { \
         for (x = 0; x < SIZE; x++) \
-            dst[x] = FILTER(src, filter, stride); \
-        dst += stride; \
-        src += stride; \
+            dst[x] = FILTER(src, filter, srcstride); \
+        dst += dststride; \
+        src += srcstride; \
     } \
 }
 #define VP8_EPEL_HV(SIZE, FILTERX, FILTERY, FILTERNAME) \
-static void put_vp8_epel ## SIZE ## _ ## FILTERNAME ## _c(uint8_t *dst, uint8_t *src, int stride, int h, int mx, int my) \
+static void put_vp8_epel ## SIZE ## _ ## FILTERNAME ## _c(uint8_t *dst, int dststride, uint8_t *src, int srcstride, int h, int mx, int my) \
 { \
     const uint8_t *filter = subpel_filters[mx-1]; \
     int x, y; \
     uint8_t tmp_array[(2*SIZE+5)*SIZE]; \
     uint8_t *tmp = tmp_array; \
-    src -= 2*stride; \
+    src -= 2*srcstride; \
 \
     for (y = 0; y < h+5; y++) { \
         for (x = 0; x < SIZE; x++) \
             tmp[x] = FILTERX(src, filter, 1); \
         tmp += SIZE; \
-        src += stride; \
+        src += srcstride; \
     } \
 \
     tmp = tmp_array + 2*SIZE; \
@@ -307,7 +317,7 @@
     for (y = 0; y < h; y++) { \
         for (x = 0; x < SIZE; x++) \
             dst[x] = FILTERY(tmp, filter, SIZE); \
-        dst += stride; \
+        dst += dststride; \
         tmp += SIZE; \
     } \
 }
@@ -338,7 +348,7 @@
 VP8_EPEL_HV(4,  FILTER_6TAP, FILTER_6TAP, h6v6)
 
 #define VP8_MC_FUNC(IDX, SIZE) \
-    dsp->put_vp8_epel_pixels_tab[IDX][0][0] = ff_put_vp8_pixels ## SIZE ## _c; \
+    dsp->put_vp8_epel_pixels_tab[IDX][0][0] = put_vp8_pixels ## SIZE ## _c; \
     dsp->put_vp8_epel_pixels_tab[IDX][0][1] = put_vp8_epel ## SIZE ## _h4_c; \
     dsp->put_vp8_epel_pixels_tab[IDX][0][2] = put_vp8_epel ## SIZE ## _h6_c; \
     dsp->put_vp8_epel_pixels_tab[IDX][1][0] = put_vp8_epel ## SIZE ## _v4_c; \
diff -r 778bdafd5496 -r 56aba5a9761c vp8dsp.h
--- a/vp8dsp.h	Fri Jun 25 13:43:55 2010 +0000
+++ b/vp8dsp.h	Fri Jun 25 18:14:07 2010 +0000
@@ -27,6 +27,8 @@
 
 #include "dsputil.h"
 
+typedef void (*vp8_mc_func)(uint8_t *dst/*align 8*/, int dstStride, uint8_t *src/*align 1*/, int srcStride, int h, int x, int y);
+
 typedef struct VP8DSPContext {
     void (*vp8_luma_dc_wht)(DCTELEM block[4][4][16], DCTELEM dc[16]);
     void (*vp8_idct_add)(uint8_t *dst, DCTELEM block[16], int stride);
@@ -55,7 +57,7 @@
      * third dimension: same as second dimention, for horizontal interpolation
      * so something like put_vp8_epel_pixels_tab[width>>3][2*!!my-(my&1)][2*!!mx-(mx&1)](..., mx, my)
      */
-    h264_chroma_mc_func put_vp8_epel_pixels_tab[3][3][3];
+    vp8_mc_func put_vp8_epel_pixels_tab[3][3][3];
 } VP8DSPContext;
 
 void ff_put_vp8_pixels16_c(uint8_t *dst, uint8_t *src, int stride, int h, int x, int y);