annotate dsputil.c @ 19:82d4c9be9873 libavcodec

MMX/MMXEXT iDCT support, using external functions currently defined in libmpeg2. Gives an average 13-20% MPEG decoding speedup on x86 systems.
author arpi_esp
date Fri, 03 Aug 2001 18:33:03 +0000
parents ec4642daa6fe
children 2733a4c1c693
Ignore whitespace changes - Everywhere: Within whitespace: At end of lines:
rev   line source
0
986e461dc072 Initial revision
glantau
parents:
diff changeset
1 /*
986e461dc072 Initial revision
glantau
parents:
diff changeset
2 * DSP utils
986e461dc072 Initial revision
glantau
parents:
diff changeset
3 * Copyright (c) 2000, 2001 Gerard Lantau.
986e461dc072 Initial revision
glantau
parents:
diff changeset
4 *
986e461dc072 Initial revision
glantau
parents:
diff changeset
5 * This program is free software; you can redistribute it and/or modify
986e461dc072 Initial revision
glantau
parents:
diff changeset
6 * it under the terms of the GNU General Public License as published by
986e461dc072 Initial revision
glantau
parents:
diff changeset
7 * the Free Software Foundation; either version 2 of the License, or
986e461dc072 Initial revision
glantau
parents:
diff changeset
8 * (at your option) any later version.
986e461dc072 Initial revision
glantau
parents:
diff changeset
9 *
986e461dc072 Initial revision
glantau
parents:
diff changeset
10 * This program is distributed in the hope that it will be useful,
986e461dc072 Initial revision
glantau
parents:
diff changeset
11 * but WITHOUT ANY WARRANTY; without even the implied warranty of
986e461dc072 Initial revision
glantau
parents:
diff changeset
12 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
986e461dc072 Initial revision
glantau
parents:
diff changeset
13 * GNU General Public License for more details.
986e461dc072 Initial revision
glantau
parents:
diff changeset
14 *
986e461dc072 Initial revision
glantau
parents:
diff changeset
15 * You should have received a copy of the GNU General Public License
986e461dc072 Initial revision
glantau
parents:
diff changeset
16 * along with this program; if not, write to the Free Software
986e461dc072 Initial revision
glantau
parents:
diff changeset
17 * Foundation, Inc., 675 Mass Ave, Cambridge, MA 02139, USA.
986e461dc072 Initial revision
glantau
parents:
diff changeset
18 */
986e461dc072 Initial revision
glantau
parents:
diff changeset
19 #include <stdlib.h>
986e461dc072 Initial revision
glantau
parents:
diff changeset
20 #include <stdio.h>
986e461dc072 Initial revision
glantau
parents:
diff changeset
21 #include "avcodec.h"
986e461dc072 Initial revision
glantau
parents:
diff changeset
22 #include "dsputil.h"
986e461dc072 Initial revision
glantau
parents:
diff changeset
23
19
82d4c9be9873 MMX/MMXEXT iDCT support, using external functions currently defined in libmpeg2
arpi_esp
parents: 6
diff changeset
24 void (*ff_idct)(DCTELEM *block);
0
986e461dc072 Initial revision
glantau
parents:
diff changeset
25 void (*get_pixels)(DCTELEM *block, const UINT8 *pixels, int line_size);
986e461dc072 Initial revision
glantau
parents:
diff changeset
26 void (*put_pixels_clamped)(const DCTELEM *block, UINT8 *pixels, int line_size);
986e461dc072 Initial revision
glantau
parents:
diff changeset
27 void (*add_pixels_clamped)(const DCTELEM *block, UINT8 *pixels, int line_size);
986e461dc072 Initial revision
glantau
parents:
diff changeset
28
986e461dc072 Initial revision
glantau
parents:
diff changeset
29 op_pixels_abs_func pix_abs16x16;
986e461dc072 Initial revision
glantau
parents:
diff changeset
30 op_pixels_abs_func pix_abs16x16_x2;
986e461dc072 Initial revision
glantau
parents:
diff changeset
31 op_pixels_abs_func pix_abs16x16_y2;
986e461dc072 Initial revision
glantau
parents:
diff changeset
32 op_pixels_abs_func pix_abs16x16_xy2;
986e461dc072 Initial revision
glantau
parents:
diff changeset
33
986e461dc072 Initial revision
glantau
parents:
diff changeset
34 static UINT8 cropTbl[256 + 2 * MAX_NEG_CROP];
986e461dc072 Initial revision
glantau
parents:
diff changeset
35 UINT32 squareTbl[512];
986e461dc072 Initial revision
glantau
parents:
diff changeset
36
986e461dc072 Initial revision
glantau
parents:
diff changeset
37 void get_pixels_c(DCTELEM *block, const UINT8 *pixels, int line_size)
986e461dc072 Initial revision
glantau
parents:
diff changeset
38 {
986e461dc072 Initial revision
glantau
parents:
diff changeset
39 DCTELEM *p;
986e461dc072 Initial revision
glantau
parents:
diff changeset
40 const UINT8 *pix;
986e461dc072 Initial revision
glantau
parents:
diff changeset
41 int i;
986e461dc072 Initial revision
glantau
parents:
diff changeset
42
986e461dc072 Initial revision
glantau
parents:
diff changeset
43 /* read the pixels */
986e461dc072 Initial revision
glantau
parents:
diff changeset
44 p = block;
986e461dc072 Initial revision
glantau
parents:
diff changeset
45 pix = pixels;
986e461dc072 Initial revision
glantau
parents:
diff changeset
46 for(i=0;i<8;i++) {
986e461dc072 Initial revision
glantau
parents:
diff changeset
47 p[0] = pix[0];
986e461dc072 Initial revision
glantau
parents:
diff changeset
48 p[1] = pix[1];
986e461dc072 Initial revision
glantau
parents:
diff changeset
49 p[2] = pix[2];
986e461dc072 Initial revision
glantau
parents:
diff changeset
50 p[3] = pix[3];
986e461dc072 Initial revision
glantau
parents:
diff changeset
51 p[4] = pix[4];
986e461dc072 Initial revision
glantau
parents:
diff changeset
52 p[5] = pix[5];
986e461dc072 Initial revision
glantau
parents:
diff changeset
53 p[6] = pix[6];
986e461dc072 Initial revision
glantau
parents:
diff changeset
54 p[7] = pix[7];
986e461dc072 Initial revision
glantau
parents:
diff changeset
55 pix += line_size;
986e461dc072 Initial revision
glantau
parents:
diff changeset
56 p += 8;
986e461dc072 Initial revision
glantau
parents:
diff changeset
57 }
986e461dc072 Initial revision
glantau
parents:
diff changeset
58 }
986e461dc072 Initial revision
glantau
parents:
diff changeset
59
986e461dc072 Initial revision
glantau
parents:
diff changeset
60 void put_pixels_clamped_c(const DCTELEM *block, UINT8 *pixels, int line_size)
986e461dc072 Initial revision
glantau
parents:
diff changeset
61 {
986e461dc072 Initial revision
glantau
parents:
diff changeset
62 const DCTELEM *p;
986e461dc072 Initial revision
glantau
parents:
diff changeset
63 UINT8 *pix;
986e461dc072 Initial revision
glantau
parents:
diff changeset
64 int i;
986e461dc072 Initial revision
glantau
parents:
diff changeset
65 UINT8 *cm = cropTbl + MAX_NEG_CROP;
986e461dc072 Initial revision
glantau
parents:
diff changeset
66
986e461dc072 Initial revision
glantau
parents:
diff changeset
67 /* read the pixels */
986e461dc072 Initial revision
glantau
parents:
diff changeset
68 p = block;
986e461dc072 Initial revision
glantau
parents:
diff changeset
69 pix = pixels;
986e461dc072 Initial revision
glantau
parents:
diff changeset
70 for(i=0;i<8;i++) {
986e461dc072 Initial revision
glantau
parents:
diff changeset
71 pix[0] = cm[p[0]];
986e461dc072 Initial revision
glantau
parents:
diff changeset
72 pix[1] = cm[p[1]];
986e461dc072 Initial revision
glantau
parents:
diff changeset
73 pix[2] = cm[p[2]];
986e461dc072 Initial revision
glantau
parents:
diff changeset
74 pix[3] = cm[p[3]];
986e461dc072 Initial revision
glantau
parents:
diff changeset
75 pix[4] = cm[p[4]];
986e461dc072 Initial revision
glantau
parents:
diff changeset
76 pix[5] = cm[p[5]];
986e461dc072 Initial revision
glantau
parents:
diff changeset
77 pix[6] = cm[p[6]];
986e461dc072 Initial revision
glantau
parents:
diff changeset
78 pix[7] = cm[p[7]];
986e461dc072 Initial revision
glantau
parents:
diff changeset
79 pix += line_size;
986e461dc072 Initial revision
glantau
parents:
diff changeset
80 p += 8;
986e461dc072 Initial revision
glantau
parents:
diff changeset
81 }
986e461dc072 Initial revision
glantau
parents:
diff changeset
82 }
986e461dc072 Initial revision
glantau
parents:
diff changeset
83
986e461dc072 Initial revision
glantau
parents:
diff changeset
84 void add_pixels_clamped_c(const DCTELEM *block, UINT8 *pixels, int line_size)
986e461dc072 Initial revision
glantau
parents:
diff changeset
85 {
986e461dc072 Initial revision
glantau
parents:
diff changeset
86 const DCTELEM *p;
986e461dc072 Initial revision
glantau
parents:
diff changeset
87 UINT8 *pix;
986e461dc072 Initial revision
glantau
parents:
diff changeset
88 int i;
986e461dc072 Initial revision
glantau
parents:
diff changeset
89 UINT8 *cm = cropTbl + MAX_NEG_CROP;
986e461dc072 Initial revision
glantau
parents:
diff changeset
90
986e461dc072 Initial revision
glantau
parents:
diff changeset
91 /* read the pixels */
986e461dc072 Initial revision
glantau
parents:
diff changeset
92 p = block;
986e461dc072 Initial revision
glantau
parents:
diff changeset
93 pix = pixels;
986e461dc072 Initial revision
glantau
parents:
diff changeset
94 for(i=0;i<8;i++) {
986e461dc072 Initial revision
glantau
parents:
diff changeset
95 pix[0] = cm[pix[0] + p[0]];
986e461dc072 Initial revision
glantau
parents:
diff changeset
96 pix[1] = cm[pix[1] + p[1]];
986e461dc072 Initial revision
glantau
parents:
diff changeset
97 pix[2] = cm[pix[2] + p[2]];
986e461dc072 Initial revision
glantau
parents:
diff changeset
98 pix[3] = cm[pix[3] + p[3]];
986e461dc072 Initial revision
glantau
parents:
diff changeset
99 pix[4] = cm[pix[4] + p[4]];
986e461dc072 Initial revision
glantau
parents:
diff changeset
100 pix[5] = cm[pix[5] + p[5]];
986e461dc072 Initial revision
glantau
parents:
diff changeset
101 pix[6] = cm[pix[6] + p[6]];
986e461dc072 Initial revision
glantau
parents:
diff changeset
102 pix[7] = cm[pix[7] + p[7]];
986e461dc072 Initial revision
glantau
parents:
diff changeset
103 pix += line_size;
986e461dc072 Initial revision
glantau
parents:
diff changeset
104 p += 8;
986e461dc072 Initial revision
glantau
parents:
diff changeset
105 }
986e461dc072 Initial revision
glantau
parents:
diff changeset
106 }
986e461dc072 Initial revision
glantau
parents:
diff changeset
107
986e461dc072 Initial revision
glantau
parents:
diff changeset
/*
 * PIXOP(BTYPE, OPNAME, OP, INCR) generates four static 8-pixel-wide block
 * routines and one public dispatch table, OPNAME_pixels_tab[4]:
 *
 *   [0] OPNAME_pixels      source pixels used as they are
 *   [1] OPNAME_pixels_x2   avg2 of each pixel and its right-hand neighbour
 *   [2] OPNAME_pixels_y2   avg2 of each pixel and the one in the next row
 *   [3] OPNAME_pixels_xy2  avg4 of each pixel, its right-hand neighbour and
 *                          the two pixels below them
 *
 * BTYPE  element type of the destination block
 * OP     two-argument macro OP(dst, value) that combines value into dst
 * INCR   destination row stride in BTYPE elements; it is expanded inside the
 *        generated functions, so it may name their line_size parameter
 *
 * avg2() and avg4() are looked up when PIXOP is invoked, not here, so the
 * rounding behaviour is whatever those macros are defined as at that point.
 *
 * Each routine processes h rows. The x2/xy2 variants read 9 pixels per
 * source row and the y2/xy2 variants read h + 1 source rows.
 *
 * The row loops are "for (; h > 0; h--)": identical to the former
 * "do { } while (--h)" for h >= 1, but they do nothing for h <= 0, where
 * the old form ran the body and then kept counting down through negative
 * values.
 *
 * The expansion ends with the table's terminating ';', so invocations are
 * written without a trailing semicolon.
 */
#define PIXOP(BTYPE, OPNAME, OP, INCR) \
\
static void OPNAME ## _pixels(BTYPE *block, const UINT8 *pixels, int line_size, int h) \
{ \
    BTYPE *dst = block; \
    const UINT8 *src = pixels; \
    int x; \
\
    for (; h > 0; h--) { \
        for (x = 0; x < 8; x++) { \
            OP(dst[x], src[x]); \
        } \
        src += line_size; \
        dst += INCR; \
    } \
} \
\
static void OPNAME ## _pixels_x2(BTYPE *block, const UINT8 *pixels, int line_size, int h) \
{ \
    BTYPE *dst = block; \
    const UINT8 *src = pixels; \
    int x; \
\
    for (; h > 0; h--) { \
        for (x = 0; x < 8; x++) { \
            OP(dst[x], avg2(src[x], src[x + 1])); \
        } \
        src += line_size; \
        dst += INCR; \
    } \
} \
\
static void OPNAME ## _pixels_y2(BTYPE *block, const UINT8 *pixels, int line_size, int h) \
{ \
    BTYPE *dst = block; \
    const UINT8 *src = pixels; \
    const UINT8 *next = pixels + line_size; \
    int x; \
\
    for (; h > 0; h--) { \
        for (x = 0; x < 8; x++) { \
            OP(dst[x], avg2(src[x], next[x])); \
        } \
        src += line_size; \
        next += line_size; \
        dst += INCR; \
    } \
} \
\
static void OPNAME ## _pixels_xy2(BTYPE *block, const UINT8 *pixels, int line_size, int h) \
{ \
    BTYPE *dst = block; \
    const UINT8 *src = pixels; \
    const UINT8 *next = pixels + line_size; \
    int x; \
\
    for (; h > 0; h--) { \
        for (x = 0; x < 8; x++) { \
            OP(dst[x], avg4(src[x], src[x + 1], next[x], next[x + 1])); \
        } \
        src += line_size; \
        next += line_size; \
        dst += INCR; \
    } \
} \
\
void (*OPNAME ## _pixels_tab[4])(BTYPE *block, const UINT8 *pixels, int line_size, int h) = { \
    OPNAME ## _pixels, \
    OPNAME ## _pixels_x2, \
    OPNAME ## _pixels_y2, \
    OPNAME ## _pixels_xy2, \
};
986e461dc072 Initial revision
glantau
parents:
diff changeset
206
986e461dc072 Initial revision
glantau
parents:
diff changeset
207
986e461dc072 Initial revision
glantau
parents:
diff changeset
208 /* rounding primitives */
986e461dc072 Initial revision
glantau
parents:
diff changeset
209 #define avg2(a,b) ((a+b+1)>>1)
986e461dc072 Initial revision
glantau
parents:
diff changeset
210 #define avg4(a,b,c,d) ((a+b+c+d+2)>>2)
986e461dc072 Initial revision
glantau
parents:
diff changeset
211
986e461dc072 Initial revision
glantau
parents:
diff changeset
212 #define op_put(a, b) a = b
986e461dc072 Initial revision
glantau
parents:
diff changeset
213 #define op_avg(a, b) a = avg2(a, b)
986e461dc072 Initial revision
glantau
parents:
diff changeset
214 #define op_sub(a, b) a -= b
986e461dc072 Initial revision
glantau
parents:
diff changeset
215
986e461dc072 Initial revision
glantau
parents:
diff changeset
216 PIXOP(UINT8, put, op_put, line_size)
986e461dc072 Initial revision
glantau
parents:
diff changeset
217 PIXOP(UINT8, avg, op_avg, line_size)
986e461dc072 Initial revision
glantau
parents:
diff changeset
218
986e461dc072 Initial revision
glantau
parents:
diff changeset
219 PIXOP(DCTELEM, sub, op_sub, 8)
986e461dc072 Initial revision
glantau
parents:
diff changeset
220
986e461dc072 Initial revision
glantau
parents:
diff changeset
221 /* not rounding primitives */
986e461dc072 Initial revision
glantau
parents:
diff changeset
222 #undef avg2
986e461dc072 Initial revision
glantau
parents:
diff changeset
223 #undef avg4
986e461dc072 Initial revision
glantau
parents:
diff changeset
224 #define avg2(a,b) ((a+b)>>1)
986e461dc072 Initial revision
glantau
parents:
diff changeset
225 #define avg4(a,b,c,d) ((a+b+c+d+1)>>2)
986e461dc072 Initial revision
glantau
parents:
diff changeset
226
986e461dc072 Initial revision
glantau
parents:
diff changeset
227 PIXOP(UINT8, put_no_rnd, op_put, line_size)
986e461dc072 Initial revision
glantau
parents:
diff changeset
228 PIXOP(UINT8, avg_no_rnd, op_avg, line_size)
986e461dc072 Initial revision
glantau
parents:
diff changeset
229
986e461dc072 Initial revision
glantau
parents:
diff changeset
230 /* motion estimation */
986e461dc072 Initial revision
glantau
parents:
diff changeset
231
986e461dc072 Initial revision
glantau
parents:
diff changeset
232 #undef avg2
986e461dc072 Initial revision
glantau
parents:
diff changeset
233 #undef avg4
986e461dc072 Initial revision
glantau
parents:
diff changeset
234 #define avg2(a,b) ((a+b+1)>>1)
986e461dc072 Initial revision
glantau
parents:
diff changeset
235 #define avg4(a,b,c,d) ((a+b+c+d+2)>>2)
986e461dc072 Initial revision
glantau
parents:
diff changeset
236
986e461dc072 Initial revision
glantau
parents:
diff changeset
237 int pix_abs16x16_c(UINT8 *pix1, UINT8 *pix2, int line_size, int h)
986e461dc072 Initial revision
glantau
parents:
diff changeset
238 {
986e461dc072 Initial revision
glantau
parents:
diff changeset
239 int s, i;
986e461dc072 Initial revision
glantau
parents:
diff changeset
240
986e461dc072 Initial revision
glantau
parents:
diff changeset
241 s = 0;
986e461dc072 Initial revision
glantau
parents:
diff changeset
242 for(i=0;i<h;i++) {
986e461dc072 Initial revision
glantau
parents:
diff changeset
243 s += abs(pix1[0] - pix2[0]);
986e461dc072 Initial revision
glantau
parents:
diff changeset
244 s += abs(pix1[1] - pix2[1]);
986e461dc072 Initial revision
glantau
parents:
diff changeset
245 s += abs(pix1[2] - pix2[2]);
986e461dc072 Initial revision
glantau
parents:
diff changeset
246 s += abs(pix1[3] - pix2[3]);
986e461dc072 Initial revision
glantau
parents:
diff changeset
247 s += abs(pix1[4] - pix2[4]);
986e461dc072 Initial revision
glantau
parents:
diff changeset
248 s += abs(pix1[5] - pix2[5]);
986e461dc072 Initial revision
glantau
parents:
diff changeset
249 s += abs(pix1[6] - pix2[6]);
986e461dc072 Initial revision
glantau
parents:
diff changeset
250 s += abs(pix1[7] - pix2[7]);
986e461dc072 Initial revision
glantau
parents:
diff changeset
251 s += abs(pix1[8] - pix2[8]);
986e461dc072 Initial revision
glantau
parents:
diff changeset
252 s += abs(pix1[9] - pix2[9]);
986e461dc072 Initial revision
glantau
parents:
diff changeset
253 s += abs(pix1[10] - pix2[10]);
986e461dc072 Initial revision
glantau
parents:
diff changeset
254 s += abs(pix1[11] - pix2[11]);
986e461dc072 Initial revision
glantau
parents:
diff changeset
255 s += abs(pix1[12] - pix2[12]);
986e461dc072 Initial revision
glantau
parents:
diff changeset
256 s += abs(pix1[13] - pix2[13]);
986e461dc072 Initial revision
glantau
parents:
diff changeset
257 s += abs(pix1[14] - pix2[14]);
986e461dc072 Initial revision
glantau
parents:
diff changeset
258 s += abs(pix1[15] - pix2[15]);
986e461dc072 Initial revision
glantau
parents:
diff changeset
259 pix1 += line_size;
986e461dc072 Initial revision
glantau
parents:
diff changeset
260 pix2 += line_size;
986e461dc072 Initial revision
glantau
parents:
diff changeset
261 }
986e461dc072 Initial revision
glantau
parents:
diff changeset
262 return s;
986e461dc072 Initial revision
glantau
parents:
diff changeset
263 }
986e461dc072 Initial revision
glantau
parents:
diff changeset
264
986e461dc072 Initial revision
glantau
parents:
diff changeset
265 int pix_abs16x16_x2_c(UINT8 *pix1, UINT8 *pix2, int line_size, int h)
986e461dc072 Initial revision
glantau
parents:
diff changeset
266 {
986e461dc072 Initial revision
glantau
parents:
diff changeset
267 int s, i;
986e461dc072 Initial revision
glantau
parents:
diff changeset
268
986e461dc072 Initial revision
glantau
parents:
diff changeset
269 s = 0;
986e461dc072 Initial revision
glantau
parents:
diff changeset
270 for(i=0;i<h;i++) {
986e461dc072 Initial revision
glantau
parents:
diff changeset
271 s += abs(pix1[0] - avg2(pix2[0], pix2[1]));
986e461dc072 Initial revision
glantau
parents:
diff changeset
272 s += abs(pix1[1] - avg2(pix2[1], pix2[2]));
986e461dc072 Initial revision
glantau
parents:
diff changeset
273 s += abs(pix1[2] - avg2(pix2[2], pix2[3]));
986e461dc072 Initial revision
glantau
parents:
diff changeset
274 s += abs(pix1[3] - avg2(pix2[3], pix2[4]));
986e461dc072 Initial revision
glantau
parents:
diff changeset
275 s += abs(pix1[4] - avg2(pix2[4], pix2[5]));
986e461dc072 Initial revision
glantau
parents:
diff changeset
276 s += abs(pix1[5] - avg2(pix2[5], pix2[6]));
986e461dc072 Initial revision
glantau
parents:
diff changeset
277 s += abs(pix1[6] - avg2(pix2[6], pix2[7]));
986e461dc072 Initial revision
glantau
parents:
diff changeset
278 s += abs(pix1[7] - avg2(pix2[7], pix2[8]));
986e461dc072 Initial revision
glantau
parents:
diff changeset
279 s += abs(pix1[8] - avg2(pix2[8], pix2[9]));
986e461dc072 Initial revision
glantau
parents:
diff changeset
280 s += abs(pix1[9] - avg2(pix2[9], pix2[10]));
986e461dc072 Initial revision
glantau
parents:
diff changeset
281 s += abs(pix1[10] - avg2(pix2[10], pix2[11]));
986e461dc072 Initial revision
glantau
parents:
diff changeset
282 s += abs(pix1[11] - avg2(pix2[11], pix2[12]));
986e461dc072 Initial revision
glantau
parents:
diff changeset
283 s += abs(pix1[12] - avg2(pix2[12], pix2[13]));
986e461dc072 Initial revision
glantau
parents:
diff changeset
284 s += abs(pix1[13] - avg2(pix2[13], pix2[14]));
986e461dc072 Initial revision
glantau
parents:
diff changeset
285 s += abs(pix1[14] - avg2(pix2[14], pix2[15]));
986e461dc072 Initial revision
glantau
parents:
diff changeset
286 s += abs(pix1[15] - avg2(pix2[15], pix2[16]));
986e461dc072 Initial revision
glantau
parents:
diff changeset
287 pix1 += line_size;
986e461dc072 Initial revision
glantau
parents:
diff changeset
288 pix2 += line_size;
986e461dc072 Initial revision
glantau
parents:
diff changeset
289 }
986e461dc072 Initial revision
glantau
parents:
diff changeset
290 return s;
986e461dc072 Initial revision
glantau
parents:
diff changeset
291 }
986e461dc072 Initial revision
glantau
parents:
diff changeset
292
986e461dc072 Initial revision
glantau
parents:
diff changeset
293 int pix_abs16x16_y2_c(UINT8 *pix1, UINT8 *pix2, int line_size, int h)
986e461dc072 Initial revision
glantau
parents:
diff changeset
294 {
986e461dc072 Initial revision
glantau
parents:
diff changeset
295 int s, i;
986e461dc072 Initial revision
glantau
parents:
diff changeset
296 UINT8 *pix3 = pix2 + line_size;
986e461dc072 Initial revision
glantau
parents:
diff changeset
297
986e461dc072 Initial revision
glantau
parents:
diff changeset
298 s = 0;
986e461dc072 Initial revision
glantau
parents:
diff changeset
299 for(i=0;i<h;i++) {
986e461dc072 Initial revision
glantau
parents:
diff changeset
300 s += abs(pix1[0] - avg2(pix2[0], pix3[0]));
986e461dc072 Initial revision
glantau
parents:
diff changeset
301 s += abs(pix1[1] - avg2(pix2[1], pix3[1]));
986e461dc072 Initial revision
glantau
parents:
diff changeset
302 s += abs(pix1[2] - avg2(pix2[2], pix3[2]));
986e461dc072 Initial revision
glantau
parents:
diff changeset
303 s += abs(pix1[3] - avg2(pix2[3], pix3[3]));
986e461dc072 Initial revision
glantau
parents:
diff changeset
304 s += abs(pix1[4] - avg2(pix2[4], pix3[4]));
986e461dc072 Initial revision
glantau
parents:
diff changeset
305 s += abs(pix1[5] - avg2(pix2[5], pix3[5]));
986e461dc072 Initial revision
glantau
parents:
diff changeset
306 s += abs(pix1[6] - avg2(pix2[6], pix3[6]));
986e461dc072 Initial revision
glantau
parents:
diff changeset
307 s += abs(pix1[7] - avg2(pix2[7], pix3[7]));
986e461dc072 Initial revision
glantau
parents:
diff changeset
308 s += abs(pix1[8] - avg2(pix2[8], pix3[8]));
986e461dc072 Initial revision
glantau
parents:
diff changeset
309 s += abs(pix1[9] - avg2(pix2[9], pix3[9]));
986e461dc072 Initial revision
glantau
parents:
diff changeset
310 s += abs(pix1[10] - avg2(pix2[10], pix3[10]));
986e461dc072 Initial revision
glantau
parents:
diff changeset
311 s += abs(pix1[11] - avg2(pix2[11], pix3[11]));
986e461dc072 Initial revision
glantau
parents:
diff changeset
312 s += abs(pix1[12] - avg2(pix2[12], pix3[12]));
986e461dc072 Initial revision
glantau
parents:
diff changeset
313 s += abs(pix1[13] - avg2(pix2[13], pix3[13]));
986e461dc072 Initial revision
glantau
parents:
diff changeset
314 s += abs(pix1[14] - avg2(pix2[14], pix3[14]));
986e461dc072 Initial revision
glantau
parents:
diff changeset
315 s += abs(pix1[15] - avg2(pix2[15], pix3[15]));
986e461dc072 Initial revision
glantau
parents:
diff changeset
316 pix1 += line_size;
986e461dc072 Initial revision
glantau
parents:
diff changeset
317 pix2 += line_size;
986e461dc072 Initial revision
glantau
parents:
diff changeset
318 pix3 += line_size;
986e461dc072 Initial revision
glantau
parents:
diff changeset
319 }
986e461dc072 Initial revision
glantau
parents:
diff changeset
320 return s;
986e461dc072 Initial revision
glantau
parents:
diff changeset
321 }
986e461dc072 Initial revision
glantau
parents:
diff changeset
322
986e461dc072 Initial revision
glantau
parents:
diff changeset
323 int pix_abs16x16_xy2_c(UINT8 *pix1, UINT8 *pix2, int line_size, int h)
986e461dc072 Initial revision
glantau
parents:
diff changeset
324 {
986e461dc072 Initial revision
glantau
parents:
diff changeset
325 int s, i;
986e461dc072 Initial revision
glantau
parents:
diff changeset
326 UINT8 *pix3 = pix2 + line_size;
986e461dc072 Initial revision
glantau
parents:
diff changeset
327
986e461dc072 Initial revision
glantau
parents:
diff changeset
328 s = 0;
986e461dc072 Initial revision
glantau
parents:
diff changeset
329 for(i=0;i<h;i++) {
986e461dc072 Initial revision
glantau
parents:
diff changeset
330 s += abs(pix1[0] - avg4(pix2[0], pix2[1], pix3[0], pix3[1]));
986e461dc072 Initial revision
glantau
parents:
diff changeset
331 s += abs(pix1[1] - avg4(pix2[1], pix2[2], pix3[1], pix3[2]));
986e461dc072 Initial revision
glantau
parents:
diff changeset
332 s += abs(pix1[2] - avg4(pix2[2], pix2[3], pix3[2], pix3[3]));
986e461dc072 Initial revision
glantau
parents:
diff changeset
333 s += abs(pix1[3] - avg4(pix2[3], pix2[4], pix3[3], pix3[4]));
986e461dc072 Initial revision
glantau
parents:
diff changeset
334 s += abs(pix1[4] - avg4(pix2[4], pix2[5], pix3[4], pix3[5]));
986e461dc072 Initial revision
glantau
parents:
diff changeset
335 s += abs(pix1[5] - avg4(pix2[5], pix2[6], pix3[5], pix3[6]));
986e461dc072 Initial revision
glantau
parents:
diff changeset
336 s += abs(pix1[6] - avg4(pix2[6], pix2[7], pix3[6], pix3[7]));
986e461dc072 Initial revision
glantau
parents:
diff changeset
337 s += abs(pix1[7] - avg4(pix2[7], pix2[8], pix3[7], pix3[8]));
986e461dc072 Initial revision
glantau
parents:
diff changeset
338 s += abs(pix1[8] - avg4(pix2[8], pix2[9], pix3[8], pix3[9]));
986e461dc072 Initial revision
glantau
parents:
diff changeset
339 s += abs(pix1[9] - avg4(pix2[9], pix2[10], pix3[9], pix3[10]));
986e461dc072 Initial revision
glantau
parents:
diff changeset
340 s += abs(pix1[10] - avg4(pix2[10], pix2[11], pix3[10], pix3[11]));
986e461dc072 Initial revision
glantau
parents:
diff changeset
341 s += abs(pix1[11] - avg4(pix2[11], pix2[12], pix3[11], pix3[12]));
986e461dc072 Initial revision
glantau
parents:
diff changeset
342 s += abs(pix1[12] - avg4(pix2[12], pix2[13], pix3[12], pix3[13]));
986e461dc072 Initial revision
glantau
parents:
diff changeset
343 s += abs(pix1[13] - avg4(pix2[13], pix2[14], pix3[13], pix3[14]));
986e461dc072 Initial revision
glantau
parents:
diff changeset
344 s += abs(pix1[14] - avg4(pix2[14], pix2[15], pix3[14], pix3[15]));
986e461dc072 Initial revision
glantau
parents:
diff changeset
345 s += abs(pix1[15] - avg4(pix2[15], pix2[16], pix3[15], pix3[16]));
986e461dc072 Initial revision
glantau
parents:
diff changeset
346 pix1 += line_size;
986e461dc072 Initial revision
glantau
parents:
diff changeset
347 pix2 += line_size;
986e461dc072 Initial revision
glantau
parents:
diff changeset
348 pix3 += line_size;
986e461dc072 Initial revision
glantau
parents:
diff changeset
349 }
986e461dc072 Initial revision
glantau
parents:
diff changeset
350 return s;
986e461dc072 Initial revision
glantau
parents:
diff changeset
351 }
986e461dc072 Initial revision
glantau
parents:
diff changeset
352
986e461dc072 Initial revision
glantau
parents:
diff changeset
353 void dsputil_init(void)
986e461dc072 Initial revision
glantau
parents:
diff changeset
354 {
986e461dc072 Initial revision
glantau
parents:
diff changeset
355 int i;
986e461dc072 Initial revision
glantau
parents:
diff changeset
356
986e461dc072 Initial revision
glantau
parents:
diff changeset
357 for(i=0;i<256;i++) cropTbl[i + MAX_NEG_CROP] = i;
986e461dc072 Initial revision
glantau
parents:
diff changeset
358 for(i=0;i<MAX_NEG_CROP;i++) {
986e461dc072 Initial revision
glantau
parents:
diff changeset
359 cropTbl[i] = 0;
986e461dc072 Initial revision
glantau
parents:
diff changeset
360 cropTbl[i + MAX_NEG_CROP + 256] = 255;
986e461dc072 Initial revision
glantau
parents:
diff changeset
361 }
986e461dc072 Initial revision
glantau
parents:
diff changeset
362
986e461dc072 Initial revision
glantau
parents:
diff changeset
363 for(i=0;i<512;i++) {
986e461dc072 Initial revision
glantau
parents:
diff changeset
364 squareTbl[i] = (i - 256) * (i - 256);
986e461dc072 Initial revision
glantau
parents:
diff changeset
365 }
986e461dc072 Initial revision
glantau
parents:
diff changeset
366
19
82d4c9be9873 MMX/MMXEXT iDCT support, using external functions currently defined in libmpeg2
arpi_esp
parents: 6
diff changeset
367 ff_idct = j_rev_dct;
0
986e461dc072 Initial revision
glantau
parents:
diff changeset
368 get_pixels = get_pixels_c;
986e461dc072 Initial revision
glantau
parents:
diff changeset
369 put_pixels_clamped = put_pixels_clamped_c;
986e461dc072 Initial revision
glantau
parents:
diff changeset
370 add_pixels_clamped = add_pixels_clamped_c;
986e461dc072 Initial revision
glantau
parents:
diff changeset
371
986e461dc072 Initial revision
glantau
parents:
diff changeset
372 pix_abs16x16 = pix_abs16x16_c;
986e461dc072 Initial revision
glantau
parents:
diff changeset
373 pix_abs16x16_x2 = pix_abs16x16_x2_c;
986e461dc072 Initial revision
glantau
parents:
diff changeset
374 pix_abs16x16_y2 = pix_abs16x16_y2_c;
986e461dc072 Initial revision
glantau
parents:
diff changeset
375 pix_abs16x16_xy2 = pix_abs16x16_xy2_c;
986e461dc072 Initial revision
glantau
parents:
diff changeset
376 av_fdct = jpeg_fdct_ifast;
986e461dc072 Initial revision
glantau
parents:
diff changeset
377
2
2e2c46c87460 fixed config for direct mplayer build compatibility
glantau
parents: 0
diff changeset
378 #ifdef HAVE_MMX
0
986e461dc072 Initial revision
glantau
parents:
diff changeset
379 dsputil_init_mmx();
986e461dc072 Initial revision
glantau
parents:
diff changeset
380 #endif
986e461dc072 Initial revision
glantau
parents:
diff changeset
381 }