libavcodec.hg: simple_idct.c comparison

comparison simple_idct.c @ 1008:fb6cbb8a04a3 libavcodec

fixing DCTELEM != short

author	michaelni
date	Wed, 15 Jan 2003 19:21:21 +0000
parents	caa77cd960c0
children	b32afefe7d33

comparison

equal deleted inserted replaced

-:b2cf2a1d9a51
+:fb6cbb8a04a3
 /* signed 16x16 -> 32 multiply */
 #define MUL16(rt, ra, rb) rt = (ra) * (rb)
 #endif
-static inline void idctRowCondDC (int16_t * row)
+static inline void idctRowCondDC (DCTELEM * row)
 {
 	int a0, a1, a2, a3, b0, b1, b2, b3;
 #ifdef FAST_64BIT
 uint64_t temp;
 #else
 #ifdef WORDS_BIGENDIAN
 #define ROW0_MASK 0xffff000000000000LL
 #else
 #define ROW0_MASK 0xffffLL
 #endif
-	if ( ((((uint64_t *)row)[0] & ~ROW0_MASK) |
+if(sizeof(DCTELEM)==2){
-((uint64_t *)row)[1]) == 0) {
+if ( ((((uint64_t *)row)[0] & ~ROW0_MASK) |
-temp = (row[0] << 3) & 0xffff;
+((uint64_t *)row)[1]) == 0) {
-temp += temp << 16;
+temp = (row[0] << 3) & 0xffff;
-temp += temp << 32;
+temp += temp << 16;
-((uint64_t *)row)[0] = temp;
+temp += temp << 32;
-((uint64_t *)row)[1] = temp;
+((uint64_t *)row)[0] = temp;
-return;
+((uint64_t *)row)[1] = temp;
-	}
+return;
+	    }
+}else{
+if (!(row[1]|row[2]|row[3]|row[4]|row[5]|row[6]|row[7])) {
+row[0]=row[1]=row[2]=row[3]=row[4]=row[5]=row[6]=row[7]= row[0] << 3;
+return;
+}
+}
 #else
-	if (!(((uint32_t*)row)[1] |
+if(sizeof(DCTELEM)==2){
-((uint32_t*)row)[2] |
+if (!(((uint32_t*)row)[1] |
-((uint32_t*)row)[3] |
+((uint32_t*)row)[2] |
-row[1])) {
+((uint32_t*)row)[3] |
-temp = (row[0] << 3) & 0xffff;
+row[1])) {
-temp += temp << 16;
+temp = (row[0] << 3) & 0xffff;
-((uint32_t*)row)[0]=((uint32_t*)row)[1] =
+temp += temp << 16;
-		((uint32_t*)row)[2]=((uint32_t*)row)[3] = temp;
+((uint32_t*)row)[0]=((uint32_t*)row)[1] =
-		return;
+((uint32_t*)row)[2]=((uint32_t*)row)[3] = temp;
-	}
+return;
+}
+}else{
+if (!(row[1]|row[2]|row[3]|row[4]|row[5]|row[6]|row[7])) {
+row[0]=row[1]=row[2]=row[3]=row[4]=row[5]=row[6]=row[7]= row[0] << 3;
+return;
+}
+}
 #endif
 a0 = (W4 * row[0]) + (1 << (ROW_SHIFT - 1));
 	a1 = a0;
 	a2 = a0;
 	row[3] = (a3 + b3) >> ROW_SHIFT;
 	row[4] = (a3 - b3) >> ROW_SHIFT;
 }
 static inline void idctSparseColPut (UINT8 *dest, int line_size,
-int16_t * col)
+DCTELEM * col)
 {
 	int a0, a1, a2, a3, b0, b1, b2, b3;
 UINT8 *cm = cropTbl + MAX_NEG_CROP;
 /* XXX: I did that only to give the same values as the previous code */
 dest += line_size;
 dest[0] = cm[(a0 - b0) >> COL_SHIFT];
 }
 static inline void idctSparseColAdd (UINT8 *dest, int line_size,
-int16_t * col)
+DCTELEM * col)
 {
 	int a0, a1, a2, a3, b0, b1, b2, b3;
 UINT8 *cm = cropTbl + MAX_NEG_CROP;
 /* XXX: I did that only to give the same values as the previous code */
 dest[0] = cm[dest[0] + ((a1 - b1) >> COL_SHIFT)];
 dest += line_size;
 dest[0] = cm[dest[0] + ((a0 - b0) >> COL_SHIFT)];
 }
-static inline void idctSparseCol (int16_t * col)
+static inline void idctSparseCol (DCTELEM * col)
 {
 	int a0, a1, a2, a3, b0, b1, b2, b3;
 /* XXX: I did that only to give the same values as the previous code */
 	a0 = W4 * (col[8*0] + ((1<<(COL_SHIFT-1))/W4));
 col[40] = ((a2 - b2) >> COL_SHIFT);
 col[48] = ((a1 - b1) >> COL_SHIFT);
 col[56] = ((a0 - b0) >> COL_SHIFT);
 }
-void simple_idct_put(UINT8 *dest, int line_size, INT16 *block)
+void simple_idct_put(UINT8 *dest, int line_size, DCTELEM *block)
 {
 int i;
 for(i=0; i<8; i++)
 idctRowCondDC(block + i*8);
 for(i=0; i<8; i++)
 idctSparseColPut(dest + i, line_size, block + i);
 }
-void simple_idct_add(UINT8 *dest, int line_size, INT16 *block)
+void simple_idct_add(UINT8 *dest, int line_size, DCTELEM *block)
 {
 int i;
 for(i=0; i<8; i++)
 idctRowCondDC(block + i*8);
 for(i=0; i<8; i++)
 idctSparseColAdd(dest + i, line_size, block + i);
 }
-void simple_idct(INT16 *block)
+void simple_idct(DCTELEM *block)
 {
 int i;
 for(i=0; i<8; i++)
 idctRowCondDC(block + i*8);
 /* row idct is multiplied by 16 * sqrt(2.0), col idct4 is normalized,
 and the butterfly must be multiplied by 0.5 * sqrt(2.0) */
 #define C_SHIFT (4+1+12)
-static inline void idct4col(UINT8 *dest, int line_size, const INT16 *col)
+static inline void idct4col(UINT8 *dest, int line_size, const DCTELEM *col)
 {
 int c0, c1, c2, c3, a0, a1, a2, a3;
 const UINT8 *cm = cropTbl + MAX_NEG_CROP;
 a0 = col[8*0];
 to the pixels before clamping to avoid systematic error
 (1024*sqrt(2)) offset would be needed otherwise. */
 /* XXX: I think a 1.0/sqrt(2) normalization should be needed to
 compensate the extra butterfly stage - I don't have the full DV
 specification */
-void simple_idct248_put(UINT8 *dest, int line_size, INT16 *block)
+void simple_idct248_put(UINT8 *dest, int line_size, DCTELEM *block)
 {
 int i;
-INT16 *ptr;
+DCTELEM *ptr;
 /* butterfly */
 ptr = block;
 for(i=0;i<4;i++) {
 BF(0);
 #define C_FIX(x) ((int)((x) * 1.414213562 * (1 << CN_SHIFT) + 0.5))
 #define C1 C_FIX(0.6532814824)
 #define C2 C_FIX(0.2705980501)
 #define C3 C_FIX(0.5)
 #define C_SHIFT (4+1+12)
-static inline void idct4col_add(UINT8 *dest, int line_size, const INT16 *col)
+static inline void idct4col_add(UINT8 *dest, int line_size, const DCTELEM *col)
 {
 int c0, c1, c2, c3, a0, a1, a2, a3;
 const UINT8 *cm = cropTbl + MAX_NEG_CROP;
 a0 = col[8*0];
 #define R_FIX(x) ((int)((x) * 1.414213562 * (1 << RN_SHIFT) + 0.5))
 #define R1 R_FIX(0.6532814824)
 #define R2 R_FIX(0.2705980501)
 #define R3 R_FIX(0.5)
 #define R_SHIFT 11
-static inline void idct4row(INT16 *row)
+static inline void idct4row(DCTELEM *row)
 {
 int c0, c1, c2, c3, a0, a1, a2, a3;
 const UINT8 *cm = cropTbl + MAX_NEG_CROP;
 a0 = row[0];
 row[1]= (c2 + c3) >> R_SHIFT;
 row[2]= (c2 - c3) >> R_SHIFT;
 row[3]= (c0 - c1) >> R_SHIFT;
 }
-void simple_idct84_add(UINT8 *dest, int line_size, INT16 *block)
+void simple_idct84_add(UINT8 *dest, int line_size, DCTELEM *block)
 {
 int i;
 /* IDCT8 on each line */
 for(i=0; i<4; i++) {
 for(i=0;i<8;i++) {
 idct4col_add(dest + i, line_size, block + i);
 }
 }
-void simple_idct48_add(UINT8 *dest, int line_size, INT16 *block)
+void simple_idct48_add(UINT8 *dest, int line_size, DCTELEM *block)
 {
 int i;
 /* IDCT4 on each line */
 for(i=0; i<8; i++) {

Mercurial > libavcodec.hg

comparison simple_idct.c @ 1008:fb6cbb8a04a3 libavcodec