libavcodec.hg: snow.c comparison

comparison snow.c @ 5634:9960732c7d7b libavcodec

Replace constants by HTAPS (half pel interpolation filter taps) where appropriate.

author	michael
date	Wed, 05 Sep 2007 00:49:09 +0000
parents	873ea64637d9
children	473cada682a1

comparison

equal deleted inserted replaced

-:873ea64637d9
+:9960732c7d7b
 };
 #define LOG2_MB_SIZE 4
 #define MB_SIZE (1<<LOG2_MB_SIZE)
 #define ENCODER_EXTRA_BITS 4
+#define HTAPS 6
 typedef struct x_and_coeff{
 int16_t x;
 uint16_t coeff;
 } x_and_coeff;
 }
 static void mc_block(uint8_t *dst, const uint8_t *src, uint8_t *tmp, int stride, int b_w, int b_h, int dx, int dy){
 int x, y;
 START_TIMER
-for(y=0; y < b_h+5; y++){
+for(y=0; y < b_h+HTAPS-1; y++){
 for(x=0; x < b_w; x++){
-int a0= src[x    ];
+int a_2=src[x + HTAPS/2-5];
-int a1= src[x + 1];
+int a_1=src[x + HTAPS/2-4];
-int a2= src[x + 2];
+int a0= src[x + HTAPS/2-3];
-int a3= src[x + 3];
+int a1= src[x + HTAPS/2-2];
-int a4= src[x + 4];
+int a2= src[x + HTAPS/2-1];
-int a5= src[x + 5];
+int a3= src[x + HTAPS/2+0];
+int a4= src[x + HTAPS/2+1];
+int a5= src[x + HTAPS/2+2];
+int a6= src[x + HTAPS/2+3];
+int a7= src[x + HTAPS/2+4];
 //            int am= 9*(a1+a2) - (a0+a3);
 int am= 20*(a2+a3) - 5*(a1+a4) + (a0+a5);
 //            int am= 18*(a2+a3) - 2*(a1+a4);
 //             int aL= (-7*a0 + 105*a1 + 35*a2 - 5*a3)>>3;
 //             int aR= (-7*a3 + 105*a2 + 35*a1 - 5*a0)>>3;
 else           tmp[x + y*stride]= (   aR*(16-dx) + 16*a2*(dx-12) + 32)>>6;*/
 }
 tmp += stride;
 src += stride;
 }
-tmp -= (b_h+5)*stride;
+tmp -= (b_h+HTAPS-1)*stride;
 for(y=0; y < b_h; y++){
 for(x=0; x < b_w; x++){
-int a0= tmp[x + 0*stride];
+int a_2=tmp[x + (HTAPS/2-5)*stride];
-int a1= tmp[x + 1*stride];
+int a_1=tmp[x + (HTAPS/2-4)*stride];
-int a2= tmp[x + 2*stride];
+int a0= tmp[x + (HTAPS/2-3)*stride];
-int a3= tmp[x + 3*stride];
+int a1= tmp[x + (HTAPS/2-2)*stride];
-int a4= tmp[x + 4*stride];
+int a2= tmp[x + (HTAPS/2-1)*stride];
-int a5= tmp[x + 5*stride];
+int a3= tmp[x + (HTAPS/2+0)*stride];
+int a4= tmp[x + (HTAPS/2+1)*stride];
+int a5= tmp[x + (HTAPS/2+2)*stride];
+int a6= tmp[x + (HTAPS/2+3)*stride];
+int a7= tmp[x + (HTAPS/2+4)*stride];
 int am= 20*(a2+a3) - 5*(a1+a4) + (a0+a5);
 //            int am= 18*(a2+a3) - 2*(a1+a4);
 /*            int aL= (-7*a0 + 105*a1 + 35*a2 - 5*a3)>>3;
 int aR= (-7*a3 + 105*a2 + 35*a1 - 5*a0)>>3;*/
 STOP_TIMER("mc_block")
 }
 #define mca(dx,dy,b_w)\
 static void mc_block_hpel ## dx ## dy ## b_w(uint8_t *dst, const uint8_t *src, int stride, int h){\
-uint8_t tmp[stride*(b_w+5)];\
+uint8_t tmp[stride*(b_w+HTAPS-1)];\
 assert(h==b_w);\
-mc_block(dst, src-2-2*stride, tmp, stride, b_w, b_w, dx, dy);\
+mc_block(dst, src-(HTAPS/2-1)-(HTAPS/2-1)*stride, tmp, stride, b_w, b_w, dx, dy);\
 }
 mca( 0, 0,16)
 mca( 8, 0,16)
 mca( 0, 8,16)
 int mx= block->mx*scale;
 int my= block->my*scale;
 const int dx= mx&15;
 const int dy= my&15;
 const int tab_index= 3 - (b_w>>2) + (b_w>>4);
-sx += (mx>>4) - 2;
+sx += (mx>>4) - (HTAPS/2-1);
-sy += (my>>4) - 2;
+sy += (my>>4) - (HTAPS/2-1);
 src += sx + sy*stride;
-if(   (unsigned)sx >= w - b_w - 4
+if(   (unsigned)sx >= w - b_w - (HTAPS-2)
-|| (unsigned)sy >= h - b_h - 4){
+|| (unsigned)sy >= h - b_h - (HTAPS-2)){
-ff_emulated_edge_mc(tmp + MB_SIZE, src, stride, b_w+5, b_h+5, sx, sy, w, h);
+ff_emulated_edge_mc(tmp + MB_SIZE, src, stride, b_w+HTAPS-1, b_h+HTAPS-1, sx, sy, w, h);
 src= tmp + MB_SIZE;
 }
 //        assert(b_w == b_h || 2*b_w == b_h || b_w == 2*b_h);
 //        assert(!(b_w&(b_w-1)));
 assert(b_w>1 && b_h>1);
 assert(tab_index>=0 && tab_index<4 || b_w==32);
-if((dx&3) || (dy&3) || !(b_w == b_h || 2*b_w == b_h || b_w == 2*b_h) || (b_w&(b_w-1)))
+if((dx&3) || (dy&3) || !(b_w == b_h || 2*b_w == b_h || b_w == 2*b_h) || (b_w&(b_w-1)) || HTAPS != 6)
 mc_block(dst, src, tmp, stride, b_w, b_h, dx, dy);
 else if(b_w==32){
 int y;
 for(y=0; y<b_h; y+=16){
 s->dsp.put_h264_qpel_pixels_tab[0][dy+(dx>>2)](dst + y*stride, src + 2 + (y+2)*stride,stride);
 const int ref_stride= s->current_picture.linesize[plane_index];
 uint8_t *dst= s->current_picture.data[plane_index];
 uint8_t *src= s->  input_picture.data[plane_index];
 IDWTELEM *pred= (IDWTELEM*)s->m.obmc_scratchpad + plane_index*block_size*block_size*4;
 uint8_t cur[ref_stride*2*MB_SIZE]; //FIXME alignment
-uint8_t tmp[ref_stride*(2*MB_SIZE+5)];
+uint8_t tmp[ref_stride*(2*MB_SIZE+HTAPS-1)];
 const int b_stride = s->b_width << s->block_max_depth;
 const int b_height = s->b_height<< s->block_max_depth;
 const int w= p->width;
 const int h= p->height;
 int distortion;

Mercurial > libavcodec.hg

comparison snow.c @ 5634:9960732c7d7b libavcodec