comparison dct-test.c @ 33:7cf705a32d1c libavcodec

updated dct-test to test IDCTs too
author glantau
date Tue, 07 Aug 2001 22:42:45 +0000
parents 986e461dc072
children 718a22dc121f
comparison
equal deleted inserted replaced
32:a524484f9adf 33:7cf705a32d1c
4 #include <stdlib.h> 4 #include <stdlib.h>
5 #include <stdio.h> 5 #include <stdio.h>
6 #include <string.h> 6 #include <string.h>
7 #include <sys/time.h> 7 #include <sys/time.h>
8 #include <unistd.h> 8 #include <unistd.h>
9 #include <getopt.h>
9 10
10 #include "dsputil.h" 11 #include "dsputil.h"
11 12
13 #include "i386/mmx.h"
14
15 /* reference fdct/idct: main() passes fdct as the reference for the forward tests and idct for the inverse tests */
12 extern void fdct(DCTELEM *block); 16 extern void fdct(DCTELEM *block);
17 extern void idct(DCTELEM *block);
13 extern void init_fdct(); 18 extern void init_fdct();
19
/* IDCT implementations that main() compares against idct() when -i is given;
 * the ff_mmxext_idct test call in main() is commented out, so only its
 * declaration is live in this revision */
20 extern void j_rev_dct(DCTELEM *data);
21 extern void ff_mmx_idct(DCTELEM *data);
22 extern void ff_mmxext_idct(DCTELEM *data);
14 23
15 #define AANSCALE_BITS 12 24 #define AANSCALE_BITS 12
16 static const unsigned short aanscales[64] = { 25 static const unsigned short aanscales[64] = {
17 /* precomputed values scaled up by 14 bits */ 26 /* precomputed values scaled up by 14 bits */
18 16384, 22725, 21407, 19266, 16384, 12873, 8867, 4520, 27 16384, 22725, 21407, 19266, 16384, 12873, 8867, 4520,
33 } 42 }
34 43
/* NB_ITS: number of random blocks per accuracy run in dct_error().
 * NB_ITS_SPEED: number of transform calls per batch between two clock reads
 * in the timing loop of dct_error(). */
35 #define NB_ITS 20000 44 #define NB_ITS 20000
36 #define NB_ITS_SPEED 50000 45 #define NB_ITS_SPEED 50000
37 46
38 void dct_error(const char *name, 47 static short idct_mmx_perm[64];
39 void (*fdct_func)(DCTELEM *block)) 48
/*
 * Fill idct_mmx_perm[], the index table dct_error() uses to scatter a block
 * before handing it to ff_mmx_idct or j_rev_dct.
 *
 * For every index i in 0..63 the entry keeps bits 3-5 of i and rotates the
 * low three bits right by one position (bit 0 moves to bit 2, bits 1-2 move
 * down to bits 0-1). Within each group of eight this maps
 * 0,1,2,3,4,5,6,7 to 0,4,1,5,2,6,3,7.
 * NOTE(review): presumably bits 3-5 are the row of a row-major 8x8 block and
 * the low bits the column - confirm against the idct sources.
 */
49 void idct_mmx_init(void)
50 {
51 int i;
52
53 /* the mmx/mmxext idct uses a reordered input; build the index permutation applied by dct_error() */
54 for (i = 0; i < 64; i++) {
55 idct_mmx_perm[i] = (i & 0x38) | ((i & 6) >> 1) | ((i & 1) << 2);
56 }
57 }
58
/* Work buffers shared by every dct_error() call: block is handed to the
 * function under test, block1 to the reference. They replace the automatic
 * arrays of the old revision (left column, old line 42) and are aligned to
 * 8 bytes, presumably for the MMX routines - confirm. */
59 static DCTELEM block[64] __attribute__ ((aligned (8)));
60 static DCTELEM block1[64] __attribute__ ((aligned (8)));
61
/*
 * Compare one DCT or IDCT implementation against a reference, then time it.
 *
 * name       label printed in both result lines
 * is_idct    nonzero: the input is first passed through fdct() and the
 *            result lines are labelled IDCT instead of DCT
 * fdct_func  function under test (despite the name it may be an IDCT)
 * fdct_ref   reference transform applied to the unpermuted copy of the input
 *
 * Output, via printf: the largest absolute coefficient difference (err_inf),
 * the sum of squared differences divided by NB_ITS and by 64 (err2), and the
 * measured call rate.
 */
62 void dct_error(const char *name, int is_idct,
63 void (*fdct_func)(DCTELEM *block),
64 void (*fdct_ref)(DCTELEM *block))
40 { 65 {
41 int it, i, scale; 66 int it, i, scale;
42 DCTELEM block[64], block1[64];
43 int err_inf, v; 67 int err_inf, v;
44 INT64 err2, ti, ti1, it1; 68 INT64 err2, ti, ti1, it1;
45 69
/* fixed seed: every call draws the same sequence from random() */
46 srandom(0); 70 srandom(0);
47 71
/* accuracy test over NB_ITS random blocks with values 0..255 */
48 err_inf = 0; 72 err_inf = 0;
49 err2 = 0; 73 err2 = 0;
50 for(it=0;it<NB_ITS;it++) { 74 for(it=0;it<NB_ITS;it++) {
51 for(i=0;i<64;i++) 75 for(i=0;i<64;i++)
52 block1[i] = random() % 256; 76 block1[i] = random() % 256;
53 memcpy(block, block1, sizeof(DCTELEM) * 64); 77
54 78 /* for idct test, turn the random samples into coefficients with the forward fdct() */
79 if (is_idct)
80 fdct(block1);
81
/* ff_mmx_idct and j_rev_dct receive the input scattered through
 * idct_mmx_perm; every other function gets a plain copy */
82 if (fdct_func == ff_mmx_idct ||
83 fdct_func == j_rev_dct) {
84 for(i=0;i<64;i++)
85 block[idct_mmx_perm[i]] = block1[i];
86 } else {
87 memcpy(block, block1, sizeof(DCTELEM) * 64);
88 }
89
55 fdct_func(block); 90 fdct_func(block);
91 emms(); /* for ff_mmx_idct */
92
/* the output of jpeg_fdct_ifast is rescaled per coefficient with aanscales[]
 * before it is compared */
56 if (fdct_func == jpeg_fdct_ifast) { 93 if (fdct_func == jpeg_fdct_ifast) {
57 for(i=0; i<64; i++) { 94 for(i=0; i<64; i++) {
58 scale = (1 << (AANSCALE_BITS + 11)) / aanscales[i]; 95 scale = (1 << (AANSCALE_BITS + 11)) / aanscales[i];
59 block[i] = (block[i] * scale) >> AANSCALE_BITS; 96 block[i] = (block[i] * scale) >> AANSCALE_BITS;
60 } 97 }
61 } 98 }
62 99
/* the reference transforms block1 in place (new revision: fdct_ref, old: fdct) */
63 fdct(block1); 100 fdct_ref(block1);
64 101
/* track the maximum absolute difference and accumulate the squared differences */
65 for(i=0;i<64;i++) { 102 for(i=0;i<64;i++) {
66 v = abs(block[i] - block1[i]); 103 v = abs(block[i] - block1[i]);
67 if (v > err_inf) 104 if (v > err_inf)
68 err_inf = v; 105 err_inf = v;
69 err2 += v * v; 106 err2 += v * v;
70 } 107 }
71 } 108 }
72 printf("DCT %s: err_inf=%d err2=%0.2f\n", 109 printf("%s %s: err_inf=%d err2=%0.2f\n",
110 is_idct ? "IDCT" : "DCT",
73 name, err_inf, (double)err2 / NB_ITS / 64.0); 111 name, err_inf, (double)err2 / NB_ITS / 64.0);
74 112
75 /* speed test */ 113 /* speed test */
/* fixed input: a ramp from 192 (index 0) to 255 (index 63) */
76 for(i=0;i<64;i++) 114 for(i=0;i<64;i++)
77 block1[i] = 255 - 63 + i; 115 block1[i] = 255 - 63 + i;
116
117 /* for idct test, turn the ramp into coefficients with the forward fdct() */
118 if (is_idct)
119 fdct(block1);
/* NOTE(review): unlike the accuracy loop there is no else branch here, so in
 * the rows shown block is written only for ff_mmx_idct and j_rev_dct. One row
 * of the timing loop (old 83 / new 130) is missing from this listing; if it
 * copies block1 into block on every iteration, the permuted data stored here
 * is overwritten before the first call - verify against the full file. */
120 if (fdct_func == ff_mmx_idct ||
121 fdct_func == j_rev_dct) {
122 for(i=0;i<64;i++)
123 block[idct_mmx_perm[i]] = block1[i];
124 }
78 125
/* run batches of NB_ITS_SPEED calls until gettime() has advanced by at least
 * 1000000.
 * NOTE(review): gettime() is not defined in this listing; the kdct/s formula
 * below is only consistent if it counts microseconds - confirm. */
79 ti = gettime(); 126 ti = gettime();
80 it1 = 0; 127 it1 = 0;
81 do { 128 do {
82 for(it=0;it<NB_ITS_SPEED;it++) { 129 for(it=0;it<NB_ITS_SPEED;it++) {
84 fdct_func(block); 131 fdct_func(block);
85 } 132 }
86 it1 += NB_ITS_SPEED; 133 it1 += NB_ITS_SPEED;
87 ti1 = gettime() - ti; 134 ti1 = gettime() - ti;
88 } while (ti1 < 1000000);
136 emms();
89 137
/* the unit is printed as kdct/s for IDCT runs as well */
90 printf("DCT %s: %0.1f kdct/s\n", 138 printf("%s %s: %0.1f kdct/s\n",
139 is_idct ? "IDCT" : "DCT",
91 name, (double)it1 * 1000.0 / (double)ti1); 140 name, (double)it1 * 1000.0 / (double)ti1);
141 }
142
/*
 * Print the usage text on stdout and terminate the program with exit
 * status 1; this function does not return.
 * NOTE(review): the usage line lists only -i, while main() also accepts -h,
 * and the text does not say that -i selects the IDCT tests.
 */
143 void help(void)
144 {
145 printf("dct-test [-i]\n"
146 "test DCT implementations\n");
147 exit(1);
92 } 148 }
93 149
/*
 * Entry point (comments describe the right-hand, new-revision column).
 *
 * Calls init_fdct() and idct_mmx_init(), parses the command line and runs one
 * of two test sets through dct_error():
 *   default  forward tests REF, AAN and MMX, each compared against fdct
 *   -i       inverse tests REF, INT and MMX, each compared against idct
 *   -h       calls help(), which exits with status 1
 * Returns 0 after the selected tests have run.
 */
94 int main(int argc, char **argv) 150 int main(int argc, char **argv)
95 { 151 {
152 int test_idct = 0;
153 int c;
154
96 init_fdct(); 155 init_fdct();
97 156 idct_mmx_init();
98 printf("ffmpeg DCT test\n");
99 157
/* option loop: getopt() returns -1 once all options are consumed.
 * NOTE(review): the switch has no branch for the question-mark value that
 * getopt() returns for an unrecognised option, so such options are skipped
 * and the forward tests still run. */
100 dct_error("REF", fdct); /* only to verify code ! */ 158 for(;;) {
101 dct_error("AAN", jpeg_fdct_ifast); 159 c = getopt(argc, argv, "ih");
102 dct_error("MMX", fdct_mmx); 160 if (c == -1)
161 break;
162 switch(c) {
163 case 'i':
164 test_idct = 1;
165 break;
166 case 'h':
/* help() calls exit(), so the break below is never reached */
167 help();
168 break;
169 }
170 }
171
172 printf("ffmpeg DCT/IDCT test\n");
173
/* second argument of dct_error(): 0 for the forward tests, 1 for the inverse tests */
174 if (!test_idct) {
175 dct_error("REF", 0, fdct, fdct); /* only to verify code ! */
176 dct_error("AAN", 0, jpeg_fdct_ifast, fdct);
177 dct_error("MMX", 0, fdct_mmx, fdct);
178 } else {
179 dct_error("REF", 1, idct, idct);
180 dct_error("INT", 1, j_rev_dct, idct);
181 dct_error("MMX", 1, ff_mmx_idct, idct);
182 // dct_error("MMX", 1, ff_mmxext_idct, idct);
183 }
103 return 0; 184 return 0;
104 } 185 }
105