changeset 174:ac5075a55488 libavcodec

new IDCT code by Michael Niedermayer (michaelni@gmx.at) - #define SIMPLE_IDCT to enable
author arpi_esp
date Sun, 09 Dec 2001 12:04:09 +0000
parents 37eaaa9596cc
children bd77d3cbb233
files Makefile dsputil.c dsputil.h h263.c i386/dsputil_mmx.c
diffstat 5 files changed, 67 insertions(+), 7 deletions(-) [+]
line wrap: on
line diff
--- a/Makefile	Wed Nov 28 01:26:03 2001 +0000
+++ b/Makefile	Sun Dec 09 12:04:09 2001 +0000
@@ -6,7 +6,7 @@
 OBJS= common.o utils.o mpegvideo.o h263.o jrevdct.o jfdctfst.o \
       mpegaudio.o ac3enc.o mjpeg.o resample.o dsputil.o \
       motion_est.o imgconvert.o imgresample.o msmpeg4.o \
-      mpeg12.o h263dec.o rv10.o mpegaudiodec.o pcm.o
+      mpeg12.o h263dec.o rv10.o mpegaudiodec.o pcm.o simple_idct.o
 ASM_OBJS=
 
 # currently using libac3 for ac3 decoding
@@ -20,7 +20,8 @@
 ifeq ($(TARGET_MMX),yes)
 OBJS += i386/fdct_mmx.o i386/cputest.o \
 	i386/dsputil_mmx.o i386/mpegvideo_mmx.o \
-        i386/idct_mmx.o i386/motion_est_mmx.o
+        i386/idct_mmx.o i386/motion_est_mmx.o \
+	i386/simple_idct_mmx.o
 endif
 
 # armv4l specific stuff
--- a/dsputil.c	Wed Nov 28 01:26:03 2001 +0000
+++ b/dsputil.c	Sun Dec 09 12:04:09 2001 +0000
@@ -20,6 +20,7 @@
 #include <stdio.h>
 #include "avcodec.h"
 #include "dsputil.h"
+#include "simple_idct.h"
 
 void (*ff_idct)(DCTELEM *block);
 void (*get_pixels)(DCTELEM *block, const UINT8 *pixels, int line_size);
@@ -388,6 +389,27 @@
 
 /* permute block according so that it corresponds to the MMX idct
    order */
+#ifdef SIMPLE_IDCT
+void block_permute(INT16 *block)
+{
+	int i;
+	INT16 temp[64];
+	/* In-place reorder of 64 coefficients: block[i] moves to index block_permute_op(i). */
+//	for(i=0; i<64; i++) temp[i] = block[ block_permute_op(i) ];
+	for(i=0; i<64; i++) temp[ block_permute_op(i) ] = block[i];
+	/* NOTE(review): assumes block_permute_op() is one-to-one on 0..63, else temp[] keeps unwritten slots. */
+	for(i=0; i<64; i++) block[i] = temp[i];
+/* Disabled debug dump of the permuted block, 8 values per row:
+	for(i=0; i<64; i++)
+	{
+		if((i&7)==0) printf("\n");
+		printf("%2d ", block[i]);
+	}
+*/
+}
+
+#else
+
 void block_permute(INT16 *block)
 {
     int tmp1, tmp2, tmp3, tmp4, tmp5, tmp6;
@@ -409,6 +431,7 @@
         block += 8;
     }
 }
+#endif
 
 void dsputil_init(void)
 {
@@ -425,7 +448,11 @@
         squareTbl[i] = (i - 256) * (i - 256);
     }
 
+#ifdef SIMPLE_IDCT
+    ff_idct = simple_idct;
+#else
     ff_idct = j_rev_dct;
+#endif
     get_pixels = get_pixels_c;
     put_pixels_clamped = put_pixels_clamped_c;
     add_pixels_clamped = add_pixels_clamped_c;
@@ -449,6 +476,10 @@
     use_permuted_idct = 0;
 #endif
 
+#ifdef SIMPLE_IDCT
+    if(ff_idct == simple_idct) use_permuted_idct=0;
+#endif
+
     if (use_permuted_idct) {
         /* permute for IDCT */
         for(i=0;i<64;i++) {
--- a/dsputil.h	Wed Nov 28 01:26:03 2001 +0000
+++ b/dsputil.h	Sun Dec 09 12:04:09 2001 +0000
@@ -67,10 +67,33 @@
 int pix_abs16x16_y2_c(UINT8 *blk1, UINT8 *blk2, int lx, int h);
 int pix_abs16x16_xy2_c(UINT8 *blk1, UINT8 *blk2, int lx, int h);
 
+#if defined (SIMPLE_IDCT) && defined (HAVE_MMX)
+static inline int block_permute_op(int j)
+{
+static const int table[64]={ /* table[j] is the index returned for input index j */
+	0x00, 0x08, 0x01, 0x09, 0x04, 0x0C, 0x05, 0x0D,
+	0x10, 0x18, 0x11, 0x19, 0x14, 0x1C, 0x15, 0x1D,
+	0x02, 0x0A, 0x03, 0x0B, 0x06, 0x0E, 0x07, 0x0F,
+	0x12, 0x1A, 0x13, 0x1B, 0x16, 0x1E, 0x17, 0x1F,
+	0x20, 0x28, 0x21, 0x29, 0x24, 0x2C, 0x25, 0x2D,
+	0x30, 0x38, 0x31, 0x39, 0x34, 0x3C, 0x35, 0x3D,
+	0x22, 0x2A, 0x23, 0x2B, 0x26, 0x2E, 0x27, 0x2F,
+	0x32, 0x3A, 0x33, 0x3B, 0x36, 0x3E, 0x37, 0x3F,
+};
+	/* Plain table lookup with no range check: j must be in 0..63. */
+	return table[j];
+}
+#elif defined (SIMPLE_IDCT)
+static inline int block_permute_op(int j)
+{
+    return j; /* identity mapping: the index is returned unchanged */
+}
+#else
 static inline int block_permute_op(int j)
 {
     return (j & 0x38) | ((j & 6) >> 1) | ((j & 1) << 2);
 }
+#endif
 
 void block_permute(INT16 *block);
 
--- a/h263.c	Wed Nov 28 01:26:03 2001 +0000
+++ b/h263.c	Sun Dec 09 12:04:09 2001 +0000
@@ -554,7 +554,7 @@
     return pred;
 }
 
-void mpeg4_pred_ac(MpegEncContext * s, INT16 *block, int n, 
+void mpeg4_pred_ac(MpegEncContext * s, INT16 *block, int n,
                    int dir)
 {
     int x, y, wrap, i;
@@ -579,22 +579,22 @@
             /* left prediction */
             ac_val -= 16;
             for(i=1;i<8;i++) {
-                block[i*8] += ac_val[i];
+                block[block_permute_op(i*8)] += ac_val[i];
             }
         } else {
             /* top prediction */
             ac_val -= 16 * wrap;
             for(i=1;i<8;i++) {
-                block[i] += ac_val[i + 8];
+                block[block_permute_op(i)] += ac_val[i + 8];
             }
         }
     }
     /* left copy */
     for(i=1;i<8;i++)
-        ac_val1[i] = block[i * 8];
+        ac_val1[i] = block[block_permute_op(i * 8)];
     /* top copy */
     for(i=1;i<8;i++)
-        ac_val1[8 + i] = block[i];
+        ac_val1[8 + i] = block[block_permute_op(i)];
 }
 
 static inline void mpeg4_encode_dc(MpegEncContext * s, int level, int n, int *dir_ptr)
--- a/i386/dsputil_mmx.c	Wed Nov 28 01:26:03 2001 +0000
+++ b/i386/dsputil_mmx.c	Sun Dec 09 12:04:09 2001 +0000
@@ -20,6 +20,7 @@
  */
 
 #include "../dsputil.h"
+#include "../simple_idct.h"
 
 int mm_flags; /* multimedia extension flags */
 
@@ -1047,5 +1048,9 @@
         } else {
             ff_idct = ff_mmx_idct;
         }
+#ifdef SIMPLE_IDCT
+//	ff_idct = simple_idct;
+	ff_idct = simple_idct_mmx;
+#endif
     }
 }