comparison vc1dsp.c @ 5997:90de28dfd8d6 libavcodec

Switch VC-1 decoder to output decoded residual immediately.
author kostya
date Sat, 08 Dec 2007 10:41:18 +0000
parents 90d90aecc83c
children 953c8efd5298
comparison
equal deleted inserted replaced
5996:9319837c5d02 5997:90de28dfd8d6
150 } 150 }
151 } 151 }
152 152
153 /** Do inverse transform on 8x4 part of block 153 /** Do inverse transform on 8x4 part of block
154 */ 154 */
155 static void vc1_inv_trans_8x4_c(DCTELEM block[64], int n) 155 static void vc1_inv_trans_8x4_c(uint8_t *dest, int linesize, DCTELEM *block)
156 { 156 {
157 int i; 157 int i;
158 register int t1,t2,t3,t4,t5,t6,t7,t8; 158 register int t1,t2,t3,t4,t5,t6,t7,t8;
159 DCTELEM *src, *dst; 159 DCTELEM *src, *dst;
160 int off; 160 const uint8_t *cm = ff_cropTbl + MAX_NEG_CROP;
161 161
162 off = n * 32; 162 src = block;
163 src = block + off; 163 dst = block;
164 dst = block + off;
165 for(i = 0; i < 4; i++){ 164 for(i = 0; i < 4; i++){
166 t1 = 12 * (src[0] + src[4]); 165 t1 = 12 * (src[0] + src[4]);
167 t2 = 12 * (src[0] - src[4]); 166 t2 = 12 * (src[0] - src[4]);
168 t3 = 16 * src[2] + 6 * src[6]; 167 t3 = 16 * src[2] + 6 * src[6];
169 t4 = 6 * src[2] - 16 * src[6]; 168 t4 = 6 * src[2] - 16 * src[6];
189 188
190 src += 8; 189 src += 8;
191 dst += 8; 190 dst += 8;
192 } 191 }
193 192
194 src = block + off; 193 src = block;
195 dst = block + off;
196 for(i = 0; i < 8; i++){ 194 for(i = 0; i < 8; i++){
197 t1 = 17 * (src[ 0] + src[16]); 195 t1 = 17 * (src[ 0] + src[16]);
198 t2 = 17 * (src[ 0] - src[16]); 196 t2 = 17 * (src[ 0] - src[16]);
199 t3 = 22 * src[ 8]; 197 t3 = 22 * src[ 8];
200 t4 = 22 * src[24]; 198 t4 = 22 * src[24];
201 t5 = 10 * src[ 8]; 199 t5 = 10 * src[ 8];
202 t6 = 10 * src[24]; 200 t6 = 10 * src[24];
203 201
204 dst[ 0] = (t1 + t3 + t6 + 64) >> 7; 202 dest[0*linesize] = cm[dest[0*linesize] + ((t1 + t3 + t6 + 64) >> 7)];
205 dst[ 8] = (t2 - t4 + t5 + 64) >> 7; 203 dest[1*linesize] = cm[dest[1*linesize] + ((t2 - t4 + t5 + 64) >> 7)];
206 dst[16] = (t2 + t4 - t5 + 64) >> 7; 204 dest[2*linesize] = cm[dest[2*linesize] + ((t2 + t4 - t5 + 64) >> 7)];
207 dst[24] = (t1 - t3 - t6 + 64) >> 7; 205 dest[3*linesize] = cm[dest[3*linesize] + ((t1 - t3 - t6 + 64) >> 7)];
208 206
209 src ++; 207 src ++;
210 dst ++; 208 dest++;
211 } 209 }
212 } 210 }
213 211
214 /** Do inverse transform on 4x8 parts of block 212 /** Do inverse transform on 4x8 parts of block
215 */ 213 */
216 static void vc1_inv_trans_4x8_c(DCTELEM block[64], int n) 214 static void vc1_inv_trans_4x8_c(uint8_t *dest, int linesize, DCTELEM *block)
217 { 215 {
218 int i; 216 int i;
219 register int t1,t2,t3,t4,t5,t6,t7,t8; 217 register int t1,t2,t3,t4,t5,t6,t7,t8;
220 DCTELEM *src, *dst; 218 DCTELEM *src, *dst;
221 int off; 219 const uint8_t *cm = ff_cropTbl + MAX_NEG_CROP;
222 220
223 off = n * 4; 221 src = block;
224 src = block + off; 222 dst = block;
225 dst = block + off;
226 for(i = 0; i < 8; i++){ 223 for(i = 0; i < 8; i++){
227 t1 = 17 * (src[0] + src[2]); 224 t1 = 17 * (src[0] + src[2]);
228 t2 = 17 * (src[0] - src[2]); 225 t2 = 17 * (src[0] - src[2]);
229 t3 = 22 * src[1]; 226 t3 = 22 * src[1];
230 t4 = 22 * src[3]; 227 t4 = 22 * src[3];
238 235
239 src += 8; 236 src += 8;
240 dst += 8; 237 dst += 8;
241 } 238 }
242 239
243 src = block + off; 240 src = block;
244 dst = block + off;
245 for(i = 0; i < 4; i++){ 241 for(i = 0; i < 4; i++){
246 t1 = 12 * (src[ 0] + src[32]); 242 t1 = 12 * (src[ 0] + src[32]);
247 t2 = 12 * (src[ 0] - src[32]); 243 t2 = 12 * (src[ 0] - src[32]);
248 t3 = 16 * src[16] + 6 * src[48]; 244 t3 = 16 * src[16] + 6 * src[48];
249 t4 = 6 * src[16] - 16 * src[48]; 245 t4 = 6 * src[16] - 16 * src[48];
256 t1 = 16 * src[ 8] + 15 * src[24] + 9 * src[40] + 4 * src[56]; 252 t1 = 16 * src[ 8] + 15 * src[24] + 9 * src[40] + 4 * src[56];
257 t2 = 15 * src[ 8] - 4 * src[24] - 16 * src[40] - 9 * src[56]; 253 t2 = 15 * src[ 8] - 4 * src[24] - 16 * src[40] - 9 * src[56];
258 t3 = 9 * src[ 8] - 16 * src[24] + 4 * src[40] + 15 * src[56]; 254 t3 = 9 * src[ 8] - 16 * src[24] + 4 * src[40] + 15 * src[56];
259 t4 = 4 * src[ 8] - 9 * src[24] + 15 * src[40] - 16 * src[56]; 255 t4 = 4 * src[ 8] - 9 * src[24] + 15 * src[40] - 16 * src[56];
260 256
261 dst[ 0] = (t5 + t1 + 64) >> 7; 257 dest[0*linesize] = cm[dest[0*linesize] + ((t5 + t1 + 64) >> 7)];
262 dst[ 8] = (t6 + t2 + 64) >> 7; 258 dest[1*linesize] = cm[dest[1*linesize] + ((t6 + t2 + 64) >> 7)];
263 dst[16] = (t7 + t3 + 64) >> 7; 259 dest[2*linesize] = cm[dest[2*linesize] + ((t7 + t3 + 64) >> 7)];
264 dst[24] = (t8 + t4 + 64) >> 7; 260 dest[3*linesize] = cm[dest[3*linesize] + ((t8 + t4 + 64) >> 7)];
265 dst[32] = (t8 - t4 + 64 + 1) >> 7; 261 dest[4*linesize] = cm[dest[4*linesize] + ((t8 - t4 + 64 + 1) >> 7)];
266 dst[40] = (t7 - t3 + 64 + 1) >> 7; 262 dest[5*linesize] = cm[dest[5*linesize] + ((t7 - t3 + 64 + 1) >> 7)];
267 dst[48] = (t6 - t2 + 64 + 1) >> 7; 263 dest[6*linesize] = cm[dest[6*linesize] + ((t6 - t2 + 64 + 1) >> 7)];
268 dst[56] = (t5 - t1 + 64 + 1) >> 7; 264 dest[7*linesize] = cm[dest[7*linesize] + ((t5 - t1 + 64 + 1) >> 7)];
269 265
270 src++; 266 src ++;
271 dst++; 267 dest++;
272 } 268 }
273 } 269 }
274 270
275 /** Do inverse transform on 4x4 part of block 271 /** Do inverse transform on 4x4 part of block
276 */ 272 */
277 static void vc1_inv_trans_4x4_c(DCTELEM block[64], int n) 273 static void vc1_inv_trans_4x4_c(uint8_t *dest, int linesize, DCTELEM *block)
278 { 274 {
279 int i; 275 int i;
280 register int t1,t2,t3,t4,t5,t6; 276 register int t1,t2,t3,t4,t5,t6;
281 DCTELEM *src, *dst; 277 DCTELEM *src, *dst;
282 int off; 278 const uint8_t *cm = ff_cropTbl + MAX_NEG_CROP;
283 279
284 off = (n&1) * 4 + (n&2) * 16; 280 src = block;
285 src = block + off; 281 dst = block;
286 dst = block + off;
287 for(i = 0; i < 4; i++){ 282 for(i = 0; i < 4; i++){
288 t1 = 17 * (src[0] + src[2]); 283 t1 = 17 * (src[0] + src[2]);
289 t2 = 17 * (src[0] - src[2]); 284 t2 = 17 * (src[0] - src[2]);
290 t3 = 22 * src[1]; 285 t3 = 22 * src[1];
291 t4 = 22 * src[3]; 286 t4 = 22 * src[3];
299 294
300 src += 8; 295 src += 8;
301 dst += 8; 296 dst += 8;
302 } 297 }
303 298
304 src = block + off; 299 src = block;
305 dst = block + off;
306 for(i = 0; i < 4; i++){ 300 for(i = 0; i < 4; i++){
307 t1 = 17 * (src[ 0] + src[16]); 301 t1 = 17 * (src[ 0] + src[16]);
308 t2 = 17 * (src[ 0] - src[16]); 302 t2 = 17 * (src[ 0] - src[16]);
309 t3 = 22 * src[ 8]; 303 t3 = 22 * src[ 8];
310 t4 = 22 * src[24]; 304 t4 = 22 * src[24];
311 t5 = 10 * src[ 8]; 305 t5 = 10 * src[ 8];
312 t6 = 10 * src[24]; 306 t6 = 10 * src[24];
313 307
314 dst[ 0] = (t1 + t3 + t6 + 64) >> 7; 308 dest[0*linesize] = cm[dest[0*linesize] + ((t1 + t3 + t6 + 64) >> 7)];
315 dst[ 8] = (t2 - t4 + t5 + 64) >> 7; 309 dest[1*linesize] = cm[dest[1*linesize] + ((t2 - t4 + t5 + 64) >> 7)];
316 dst[16] = (t2 + t4 - t5 + 64) >> 7; 310 dest[2*linesize] = cm[dest[2*linesize] + ((t2 + t4 - t5 + 64) >> 7)];
317 dst[24] = (t1 - t3 - t6 + 64) >> 7; 311 dest[3*linesize] = cm[dest[3*linesize] + ((t1 - t3 - t6 + 64) >> 7)];
318 312
319 src ++; 313 src ++;
320 dst ++; 314 dest++;
321 } 315 }
322 } 316 }
323 317
324 /* motion compensation functions */ 318 /* motion compensation functions */
325 /** Filter in case of 2 filters */ 319 /** Filter in case of 2 filters */