Mercurial > libavcodec.hg
annotate motion_est.c @ 815:78accc54493b libavcodec
put a few large tables under #ifdef CONFIG_ENCODERS or dynamically allocate them
author | michaelni |
---|---|
date | Thu, 31 Oct 2002 16:11:03 +0000 |
parents | 79de6308c34d |
children | f3c369b8ddca |
rev | line source |
---|---|
0 | 1 /* |
2 * Motion estimation | |
429 | 3 * Copyright (c) 2000,2001 Fabrice Bellard. |
455 | 4 * Copyright (c) 2002 Michael Niedermayer |
0 | 5 * |
6 * | |
429 | 7 * This library is free software; you can redistribute it and/or |
8 * modify it under the terms of the GNU Lesser General Public | |
9 * License as published by the Free Software Foundation; either | |
10 * version 2 of the License, or (at your option) any later version. | |
0 | 11 * |
429 | 12 * This library is distributed in the hope that it will be useful, |
0 | 13 * but WITHOUT ANY WARRANTY; without even the implied warranty of |
429 | 14 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU |
15 * Lesser General Public License for more details. | |
0 | 16 * |
429 | 17 * You should have received a copy of the GNU Lesser General Public |
18 * License along with this library; if not, write to the Free Software | |
19 * Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA 02111-1307 USA | |
277
5cb2978e701f
new motion estimation (epzs) not complete yet but allready pretty good :)
michaelni
parents:
275
diff
changeset
|
20 * |
5cb2978e701f
new motion estimation (epzs) not complete yet but allready pretty good :)
michaelni
parents:
275
diff
changeset
|
21 * new Motion Estimation (X1/EPZS) by Michael Niedermayer <michaelni@gmx.at> |
0 | 22 */ |
23 #include <stdlib.h> | |
24 #include <stdio.h> | |
25 #include "avcodec.h" | |
26 #include "dsputil.h" | |
27 #include "mpegvideo.h" | |
28 | |
455 | 29 #define SQ(a) ((a)*(a)) |
284 | 30 #define INTER_BIAS 257 |
31 | |
455 | 32 #define P_LAST P[0] |
33 #define P_LEFT P[1] | |
34 #define P_TOP P[2] | |
35 #define P_TOPRIGHT P[3] | |
36 #define P_MEDIAN P[4] | |
37 #define P_LAST_LEFT P[5] | |
38 #define P_LAST_RIGHT P[6] | |
39 #define P_LAST_TOP P[7] | |
40 #define P_LAST_BOTTOM P[8] | |
41 #define P_MV1 P[9] | |
42 | |
0 | 43 |
284 | 44 static int pix_dev(UINT8 * pix, int line_size, int mean) |
45 { | |
46 int s, i, j; | |
47 | |
48 s = 0; | |
49 for (i = 0; i < 16; i++) { | |
50 for (j = 0; j < 16; j += 8) { | |
51 s += ABS(pix[0]-mean); | |
52 s += ABS(pix[1]-mean); | |
53 s += ABS(pix[2]-mean); | |
54 s += ABS(pix[3]-mean); | |
55 s += ABS(pix[4]-mean); | |
56 s += ABS(pix[5]-mean); | |
57 s += ABS(pix[6]-mean); | |
58 s += ABS(pix[7]-mean); | |
59 pix += 8; | |
60 } | |
61 pix += line_size - 16; | |
62 } | |
63 return s; | |
64 } | |
65 | |
0 | 66 static int pix_norm(UINT8 * pix1, UINT8 * pix2, int line_size) |
67 { | |
68 int s, i, j; | |
69 UINT32 *sq = squareTbl + 256; | |
70 | |
71 s = 0; | |
72 for (i = 0; i < 16; i++) { | |
73 for (j = 0; j < 16; j += 8) { | |
74 s += sq[pix1[0] - pix2[0]]; | |
75 s += sq[pix1[1] - pix2[1]]; | |
76 s += sq[pix1[2] - pix2[2]]; | |
77 s += sq[pix1[3] - pix2[3]]; | |
78 s += sq[pix1[4] - pix2[4]]; | |
79 s += sq[pix1[5] - pix2[5]]; | |
80 s += sq[pix1[6] - pix2[6]]; | |
81 s += sq[pix1[7] - pix2[7]]; | |
82 pix1 += 8; | |
83 pix2 += 8; | |
84 } | |
85 pix1 += line_size - 16; | |
86 pix2 += line_size - 16; | |
87 } | |
88 return s; | |
89 } | |
90 | |
91 static void no_motion_search(MpegEncContext * s, | |
92 int *mx_ptr, int *my_ptr) | |
93 { | |
94 *mx_ptr = 16 * s->mb_x; | |
95 *my_ptr = 16 * s->mb_y; | |
96 } | |
97 | |
98 static int full_motion_search(MpegEncContext * s, | |
99 int *mx_ptr, int *my_ptr, int range, | |
324 | 100 int xmin, int ymin, int xmax, int ymax, uint8_t *ref_picture) |
0 | 101 { |
102 int x1, y1, x2, y2, xx, yy, x, y; | |
103 int mx, my, dmin, d; | |
104 UINT8 *pix; | |
105 | |
106 xx = 16 * s->mb_x; | |
107 yy = 16 * s->mb_y; | |
108 x1 = xx - range + 1; /* we loose one pixel to avoid boundary pb with half pixel pred */ | |
109 if (x1 < xmin) | |
110 x1 = xmin; | |
111 x2 = xx + range - 1; | |
112 if (x2 > xmax) | |
113 x2 = xmax; | |
114 y1 = yy - range + 1; | |
115 if (y1 < ymin) | |
116 y1 = ymin; | |
117 y2 = yy + range - 1; | |
118 if (y2 > ymax) | |
119 y2 = ymax; | |
120 pix = s->new_picture[0] + (yy * s->linesize) + xx; | |
121 dmin = 0x7fffffff; | |
122 mx = 0; | |
123 my = 0; | |
124 for (y = y1; y <= y2; y++) { | |
125 for (x = x1; x <= x2; x++) { | |
324 | 126 d = pix_abs16x16(pix, ref_picture + (y * s->linesize) + x, |
294 | 127 s->linesize); |
0 | 128 if (d < dmin || |
129 (d == dmin && | |
130 (abs(x - xx) + abs(y - yy)) < | |
131 (abs(mx - xx) + abs(my - yy)))) { | |
132 dmin = d; | |
133 mx = x; | |
134 my = y; | |
135 } | |
136 } | |
137 } | |
138 | |
139 *mx_ptr = mx; | |
140 *my_ptr = my; | |
141 | |
142 #if 0 | |
143 if (*mx_ptr < -(2 * range) || *mx_ptr >= (2 * range) || | |
144 *my_ptr < -(2 * range) || *my_ptr >= (2 * range)) { | |
145 fprintf(stderr, "error %d %d\n", *mx_ptr, *my_ptr); | |
146 } | |
147 #endif | |
148 return dmin; | |
149 } | |
150 | |
151 | |
152 static int log_motion_search(MpegEncContext * s, | |
153 int *mx_ptr, int *my_ptr, int range, | |
324 | 154 int xmin, int ymin, int xmax, int ymax, uint8_t *ref_picture) |
0 | 155 { |
156 int x1, y1, x2, y2, xx, yy, x, y; | |
157 int mx, my, dmin, d; | |
158 UINT8 *pix; | |
159 | |
160 xx = s->mb_x << 4; | |
161 yy = s->mb_y << 4; | |
162 | |
163 /* Left limit */ | |
164 x1 = xx - range; | |
165 if (x1 < xmin) | |
166 x1 = xmin; | |
167 | |
168 /* Right limit */ | |
169 x2 = xx + range; | |
170 if (x2 > xmax) | |
171 x2 = xmax; | |
172 | |
173 /* Upper limit */ | |
174 y1 = yy - range; | |
175 if (y1 < ymin) | |
176 y1 = ymin; | |
177 | |
178 /* Lower limit */ | |
179 y2 = yy + range; | |
180 if (y2 > ymax) | |
181 y2 = ymax; | |
182 | |
183 pix = s->new_picture[0] + (yy * s->linesize) + xx; | |
184 dmin = 0x7fffffff; | |
185 mx = 0; | |
186 my = 0; | |
187 | |
188 do { | |
189 for (y = y1; y <= y2; y += range) { | |
190 for (x = x1; x <= x2; x += range) { | |
324 | 191 d = pix_abs16x16(pix, ref_picture + (y * s->linesize) + x, s->linesize); |
0 | 192 if (d < dmin || (d == dmin && (abs(x - xx) + abs(y - yy)) < (abs(mx - xx) + abs(my - yy)))) { |
193 dmin = d; | |
194 mx = x; | |
195 my = y; | |
196 } | |
197 } | |
198 } | |
199 | |
200 range = range >> 1; | |
201 | |
202 x1 = mx - range; | |
203 if (x1 < xmin) | |
204 x1 = xmin; | |
205 | |
206 x2 = mx + range; | |
207 if (x2 > xmax) | |
208 x2 = xmax; | |
209 | |
210 y1 = my - range; | |
211 if (y1 < ymin) | |
212 y1 = ymin; | |
213 | |
214 y2 = my + range; | |
215 if (y2 > ymax) | |
216 y2 = ymax; | |
217 | |
218 } while (range >= 1); | |
219 | |
220 #ifdef DEBUG | |
221 fprintf(stderr, "log - MX: %d\tMY: %d\n", mx, my); | |
222 #endif | |
223 *mx_ptr = mx; | |
224 *my_ptr = my; | |
225 return dmin; | |
226 } | |
227 | |
228 static int phods_motion_search(MpegEncContext * s, | |
229 int *mx_ptr, int *my_ptr, int range, | |
324 | 230 int xmin, int ymin, int xmax, int ymax, uint8_t *ref_picture) |
0 | 231 { |
232 int x1, y1, x2, y2, xx, yy, x, y, lastx, d; | |
233 int mx, my, dminx, dminy; | |
234 UINT8 *pix; | |
235 | |
236 xx = s->mb_x << 4; | |
237 yy = s->mb_y << 4; | |
238 | |
239 /* Left limit */ | |
240 x1 = xx - range; | |
241 if (x1 < xmin) | |
242 x1 = xmin; | |
243 | |
244 /* Right limit */ | |
245 x2 = xx + range; | |
246 if (x2 > xmax) | |
247 x2 = xmax; | |
248 | |
249 /* Upper limit */ | |
250 y1 = yy - range; | |
251 if (y1 < ymin) | |
252 y1 = ymin; | |
253 | |
254 /* Lower limit */ | |
255 y2 = yy + range; | |
256 if (y2 > ymax) | |
257 y2 = ymax; | |
258 | |
259 pix = s->new_picture[0] + (yy * s->linesize) + xx; | |
260 mx = 0; | |
261 my = 0; | |
262 | |
263 x = xx; | |
264 y = yy; | |
265 do { | |
266 dminx = 0x7fffffff; | |
267 dminy = 0x7fffffff; | |
268 | |
269 lastx = x; | |
270 for (x = x1; x <= x2; x += range) { | |
324 | 271 d = pix_abs16x16(pix, ref_picture + (y * s->linesize) + x, s->linesize); |
0 | 272 if (d < dminx || (d == dminx && (abs(x - xx) + abs(y - yy)) < (abs(mx - xx) + abs(my - yy)))) { |
273 dminx = d; | |
274 mx = x; | |
275 } | |
276 } | |
277 | |
278 x = lastx; | |
279 for (y = y1; y <= y2; y += range) { | |
324 | 280 d = pix_abs16x16(pix, ref_picture + (y * s->linesize) + x, s->linesize); |
0 | 281 if (d < dminy || (d == dminy && (abs(x - xx) + abs(y - yy)) < (abs(mx - xx) + abs(my - yy)))) { |
282 dminy = d; | |
283 my = y; | |
284 } | |
285 } | |
286 | |
287 range = range >> 1; | |
288 | |
289 x = mx; | |
290 y = my; | |
291 x1 = mx - range; | |
292 if (x1 < xmin) | |
293 x1 = xmin; | |
294 | |
295 x2 = mx + range; | |
296 if (x2 > xmax) | |
297 x2 = xmax; | |
298 | |
299 y1 = my - range; | |
300 if (y1 < ymin) | |
301 y1 = ymin; | |
302 | |
303 y2 = my + range; | |
304 if (y2 > ymax) | |
305 y2 = ymax; | |
306 | |
307 } while (range >= 1); | |
308 | |
309 #ifdef DEBUG | |
310 fprintf(stderr, "phods - MX: %d\tMY: %d\n", mx, my); | |
311 #endif | |
312 | |
313 /* half pixel search */ | |
314 *mx_ptr = mx; | |
315 *my_ptr = my; | |
316 return dminy; | |
317 } | |
318 | |
277
5cb2978e701f
new motion estimation (epzs) not complete yet but allready pretty good :)
michaelni
parents:
275
diff
changeset
|
319 |
5cb2978e701f
new motion estimation (epzs) not complete yet but allready pretty good :)
michaelni
parents:
275
diff
changeset
|
320 #define Z_THRESHOLD 256 |
5cb2978e701f
new motion estimation (epzs) not complete yet but allready pretty good :)
michaelni
parents:
275
diff
changeset
|
321 |
5cb2978e701f
new motion estimation (epzs) not complete yet but allready pretty good :)
michaelni
parents:
275
diff
changeset
|
322 #define CHECK_MV(x,y)\ |
281
1fc96b02142e
mpeg4 aspect_ratio_info in AVCodecContext (requested by alex)
michaelni
parents:
280
diff
changeset
|
323 {\ |
455 | 324 const int key= ((y)<<ME_MAP_MV_BITS) + (x) + map_generation;\ |
325 const int index= (((y)<<ME_MAP_SHIFT) + (x))&(ME_MAP_SIZE-1);\ | |
326 if(map[index]!=key){\ | |
327 d = pix_abs16x16(new_pic, old_pic + (x) + (y)*pic_stride, pic_stride);\ | |
328 d += (mv_penalty[((x)<<shift)-pred_x] + mv_penalty[((y)<<shift)-pred_y])*quant;\ | |
329 COPY3_IF_LT(dmin, d, best[0], x, best[1], y)\ | |
330 map[index]= key;\ | |
331 score_map[index]= d;\ | |
281
1fc96b02142e
mpeg4 aspect_ratio_info in AVCodecContext (requested by alex)
michaelni
parents:
280
diff
changeset
|
332 }\ |
1fc96b02142e
mpeg4 aspect_ratio_info in AVCodecContext (requested by alex)
michaelni
parents:
280
diff
changeset
|
333 } |
277
5cb2978e701f
new motion estimation (epzs) not complete yet but allready pretty good :)
michaelni
parents:
275
diff
changeset
|
334 |
5cb2978e701f
new motion estimation (epzs) not complete yet but allready pretty good :)
michaelni
parents:
275
diff
changeset
|
335 #define CHECK_MV_DIR(x,y,new_dir)\ |
5cb2978e701f
new motion estimation (epzs) not complete yet but allready pretty good :)
michaelni
parents:
275
diff
changeset
|
336 {\ |
455 | 337 const int key= ((y)<<ME_MAP_MV_BITS) + (x) + map_generation;\ |
338 const int index= (((y)<<ME_MAP_SHIFT) + (x))&(ME_MAP_SIZE-1);\ | |
339 if(map[index]!=key){\ | |
340 d = pix_abs(new_pic, old_pic + (x) + (y)*pic_stride, pic_stride);\ | |
341 d += (mv_penalty[((x)<<shift)-pred_x] + mv_penalty[((y)<<shift)-pred_y])*quant;\ | |
342 if(d<dmin){\ | |
343 best[0]=x;\ | |
344 best[1]=y;\ | |
345 dmin=d;\ | |
346 next_dir= new_dir;\ | |
347 }\ | |
348 map[index]= key;\ | |
349 score_map[index]= d;\ | |
277
5cb2978e701f
new motion estimation (epzs) not complete yet but allready pretty good :)
michaelni
parents:
275
diff
changeset
|
350 }\ |
5cb2978e701f
new motion estimation (epzs) not complete yet but allready pretty good :)
michaelni
parents:
275
diff
changeset
|
351 } |
5cb2978e701f
new motion estimation (epzs) not complete yet but allready pretty good :)
michaelni
parents:
275
diff
changeset
|
352 |
294 | 353 #define CHECK_MV4(x,y)\ |
354 {\ | |
455 | 355 const int key= ((y)<<ME_MAP_MV_BITS) + (x) + map_generation;\ |
356 const int index= (((y)<<ME_MAP_SHIFT) + (x))&(ME_MAP_SIZE-1);\ | |
357 if(map[index]!=key){\ | |
358 d = pix_abs8x8(new_pic, old_pic + (x) + (y)*pic_stride, pic_stride);\ | |
359 d += (mv_penalty[((x)<<shift)-pred_x] + mv_penalty[((y)<<shift)-pred_y])*quant;\ | |
360 COPY3_IF_LT(dmin, d, best[0], x, best[1], y)\ | |
361 map[index]= key;\ | |
362 score_map[index]= d;\ | |
294 | 363 }\ |
364 } | |
365 | |
281
1fc96b02142e
mpeg4 aspect_ratio_info in AVCodecContext (requested by alex)
michaelni
parents:
280
diff
changeset
|
366 #define check(x,y,S,v)\ |
455 | 367 if( (x)<(xmin<<(S)) ) printf("%d %d %d %d %d xmin" #v, xmin, (x), (y), s->mb_x, s->mb_y);\ |
368 if( (x)>(xmax<<(S)) ) printf("%d %d %d %d %d xmax" #v, xmax, (x), (y), s->mb_x, s->mb_y);\ | |
369 if( (y)<(ymin<<(S)) ) printf("%d %d %d %d %d ymin" #v, ymin, (x), (y), s->mb_x, s->mb_y);\ | |
370 if( (y)>(ymax<<(S)) ) printf("%d %d %d %d %d ymax" #v, ymax, (x), (y), s->mb_x, s->mb_y);\ | |
281
1fc96b02142e
mpeg4 aspect_ratio_info in AVCodecContext (requested by alex)
michaelni
parents:
280
diff
changeset
|
371 |
1fc96b02142e
mpeg4 aspect_ratio_info in AVCodecContext (requested by alex)
michaelni
parents:
280
diff
changeset
|
372 |
277
5cb2978e701f
new motion estimation (epzs) not complete yet but allready pretty good :)
michaelni
parents:
275
diff
changeset
|
373 static inline int small_diamond_search(MpegEncContext * s, int *best, int dmin, |
5cb2978e701f
new motion estimation (epzs) not complete yet but allready pretty good :)
michaelni
parents:
275
diff
changeset
|
374 UINT8 *new_pic, UINT8 *old_pic, int pic_stride, |
5cb2978e701f
new motion estimation (epzs) not complete yet but allready pretty good :)
michaelni
parents:
275
diff
changeset
|
375 int pred_x, int pred_y, UINT16 *mv_penalty, int quant, |
455 | 376 int xmin, int ymin, int xmax, int ymax, int shift, |
377 uint32_t *map, uint16_t *score_map, int map_generation, | |
378 op_pixels_abs_func pix_abs) | |
277
5cb2978e701f
new motion estimation (epzs) not complete yet but allready pretty good :)
michaelni
parents:
275
diff
changeset
|
379 { |
5cb2978e701f
new motion estimation (epzs) not complete yet but allready pretty good :)
michaelni
parents:
275
diff
changeset
|
380 int next_dir=-1; |
5cb2978e701f
new motion estimation (epzs) not complete yet but allready pretty good :)
michaelni
parents:
275
diff
changeset
|
381 |
5cb2978e701f
new motion estimation (epzs) not complete yet but allready pretty good :)
michaelni
parents:
275
diff
changeset
|
382 for(;;){ |
5cb2978e701f
new motion estimation (epzs) not complete yet but allready pretty good :)
michaelni
parents:
275
diff
changeset
|
383 int d; |
5cb2978e701f
new motion estimation (epzs) not complete yet but allready pretty good :)
michaelni
parents:
275
diff
changeset
|
384 const int dir= next_dir; |
5cb2978e701f
new motion estimation (epzs) not complete yet but allready pretty good :)
michaelni
parents:
275
diff
changeset
|
385 const int x= best[0]; |
5cb2978e701f
new motion estimation (epzs) not complete yet but allready pretty good :)
michaelni
parents:
275
diff
changeset
|
386 const int y= best[1]; |
5cb2978e701f
new motion estimation (epzs) not complete yet but allready pretty good :)
michaelni
parents:
275
diff
changeset
|
387 next_dir=-1; |
5cb2978e701f
new motion estimation (epzs) not complete yet but allready pretty good :)
michaelni
parents:
275
diff
changeset
|
388 |
5cb2978e701f
new motion estimation (epzs) not complete yet but allready pretty good :)
michaelni
parents:
275
diff
changeset
|
389 //printf("%d", dir); |
280 | 390 if(dir!=2 && x>xmin) CHECK_MV_DIR(x-1, y , 0) |
391 if(dir!=3 && y>ymin) CHECK_MV_DIR(x , y-1, 1) | |
392 if(dir!=0 && x<xmax) CHECK_MV_DIR(x+1, y , 2) | |
393 if(dir!=1 && y<ymax) CHECK_MV_DIR(x , y+1, 3) | |
277
5cb2978e701f
new motion estimation (epzs) not complete yet but allready pretty good :)
michaelni
parents:
275
diff
changeset
|
394 |
5cb2978e701f
new motion estimation (epzs) not complete yet but allready pretty good :)
michaelni
parents:
275
diff
changeset
|
395 if(next_dir==-1){ |
5cb2978e701f
new motion estimation (epzs) not complete yet but allready pretty good :)
michaelni
parents:
275
diff
changeset
|
396 return dmin; |
5cb2978e701f
new motion estimation (epzs) not complete yet but allready pretty good :)
michaelni
parents:
275
diff
changeset
|
397 } |
5cb2978e701f
new motion estimation (epzs) not complete yet but allready pretty good :)
michaelni
parents:
275
diff
changeset
|
398 } |
281
1fc96b02142e
mpeg4 aspect_ratio_info in AVCodecContext (requested by alex)
michaelni
parents:
280
diff
changeset
|
399 |
1fc96b02142e
mpeg4 aspect_ratio_info in AVCodecContext (requested by alex)
michaelni
parents:
280
diff
changeset
|
400 /* for(;;){ |
1fc96b02142e
mpeg4 aspect_ratio_info in AVCodecContext (requested by alex)
michaelni
parents:
280
diff
changeset
|
401 int d; |
1fc96b02142e
mpeg4 aspect_ratio_info in AVCodecContext (requested by alex)
michaelni
parents:
280
diff
changeset
|
402 const int x= best[0]; |
1fc96b02142e
mpeg4 aspect_ratio_info in AVCodecContext (requested by alex)
michaelni
parents:
280
diff
changeset
|
403 const int y= best[1]; |
1fc96b02142e
mpeg4 aspect_ratio_info in AVCodecContext (requested by alex)
michaelni
parents:
280
diff
changeset
|
404 const int last_min=dmin; |
1fc96b02142e
mpeg4 aspect_ratio_info in AVCodecContext (requested by alex)
michaelni
parents:
280
diff
changeset
|
405 if(x>xmin) CHECK_MV(x-1, y ) |
1fc96b02142e
mpeg4 aspect_ratio_info in AVCodecContext (requested by alex)
michaelni
parents:
280
diff
changeset
|
406 if(y>xmin) CHECK_MV(x , y-1) |
1fc96b02142e
mpeg4 aspect_ratio_info in AVCodecContext (requested by alex)
michaelni
parents:
280
diff
changeset
|
407 if(x<xmax) CHECK_MV(x+1, y ) |
1fc96b02142e
mpeg4 aspect_ratio_info in AVCodecContext (requested by alex)
michaelni
parents:
280
diff
changeset
|
408 if(y<xmax) CHECK_MV(x , y+1) |
1fc96b02142e
mpeg4 aspect_ratio_info in AVCodecContext (requested by alex)
michaelni
parents:
280
diff
changeset
|
409 if(x>xmin && y>ymin) CHECK_MV(x-1, y-1) |
1fc96b02142e
mpeg4 aspect_ratio_info in AVCodecContext (requested by alex)
michaelni
parents:
280
diff
changeset
|
410 if(x>xmin && y<ymax) CHECK_MV(x-1, y+1) |
1fc96b02142e
mpeg4 aspect_ratio_info in AVCodecContext (requested by alex)
michaelni
parents:
280
diff
changeset
|
411 if(x<xmax && y>ymin) CHECK_MV(x+1, y-1) |
1fc96b02142e
mpeg4 aspect_ratio_info in AVCodecContext (requested by alex)
michaelni
parents:
280
diff
changeset
|
412 if(x<xmax && y<ymax) CHECK_MV(x+1, y+1) |
1fc96b02142e
mpeg4 aspect_ratio_info in AVCodecContext (requested by alex)
michaelni
parents:
280
diff
changeset
|
413 if(x-1>xmin) CHECK_MV(x-2, y ) |
1fc96b02142e
mpeg4 aspect_ratio_info in AVCodecContext (requested by alex)
michaelni
parents:
280
diff
changeset
|
414 if(y-1>xmin) CHECK_MV(x , y-2) |
1fc96b02142e
mpeg4 aspect_ratio_info in AVCodecContext (requested by alex)
michaelni
parents:
280
diff
changeset
|
415 if(x+1<xmax) CHECK_MV(x+2, y ) |
1fc96b02142e
mpeg4 aspect_ratio_info in AVCodecContext (requested by alex)
michaelni
parents:
280
diff
changeset
|
416 if(y+1<xmax) CHECK_MV(x , y+2) |
1fc96b02142e
mpeg4 aspect_ratio_info in AVCodecContext (requested by alex)
michaelni
parents:
280
diff
changeset
|
417 if(x-1>xmin && y-1>ymin) CHECK_MV(x-2, y-2) |
1fc96b02142e
mpeg4 aspect_ratio_info in AVCodecContext (requested by alex)
michaelni
parents:
280
diff
changeset
|
418 if(x-1>xmin && y+1<ymax) CHECK_MV(x-2, y+2) |
1fc96b02142e
mpeg4 aspect_ratio_info in AVCodecContext (requested by alex)
michaelni
parents:
280
diff
changeset
|
419 if(x+1<xmax && y-1>ymin) CHECK_MV(x+2, y-2) |
1fc96b02142e
mpeg4 aspect_ratio_info in AVCodecContext (requested by alex)
michaelni
parents:
280
diff
changeset
|
420 if(x+1<xmax && y+1<ymax) CHECK_MV(x+2, y+2) |
1fc96b02142e
mpeg4 aspect_ratio_info in AVCodecContext (requested by alex)
michaelni
parents:
280
diff
changeset
|
421 if(dmin==last_min) return dmin; |
1fc96b02142e
mpeg4 aspect_ratio_info in AVCodecContext (requested by alex)
michaelni
parents:
280
diff
changeset
|
422 } |
1fc96b02142e
mpeg4 aspect_ratio_info in AVCodecContext (requested by alex)
michaelni
parents:
280
diff
changeset
|
423 */ |
1fc96b02142e
mpeg4 aspect_ratio_info in AVCodecContext (requested by alex)
michaelni
parents:
280
diff
changeset
|
424 } |
1fc96b02142e
mpeg4 aspect_ratio_info in AVCodecContext (requested by alex)
michaelni
parents:
280
diff
changeset
|
425 |
455 | 426 #if 1 |
427 #define SNAKE_1 3 | |
428 #define SNAKE_2 2 | |
429 #else | |
430 #define SNAKE_1 7 | |
431 #define SNAKE_2 3 | |
432 #endif | |
281
1fc96b02142e
mpeg4 aspect_ratio_info in AVCodecContext (requested by alex)
michaelni
parents:
280
diff
changeset
|
433 static inline int snake_search(MpegEncContext * s, int *best, int dmin, |
1fc96b02142e
mpeg4 aspect_ratio_info in AVCodecContext (requested by alex)
michaelni
parents:
280
diff
changeset
|
434 UINT8 *new_pic, UINT8 *old_pic, int pic_stride, |
1fc96b02142e
mpeg4 aspect_ratio_info in AVCodecContext (requested by alex)
michaelni
parents:
280
diff
changeset
|
435 int pred_x, int pred_y, UINT16 *mv_penalty, int quant, |
455 | 436 int xmin, int ymin, int xmax, int ymax, int shift, |
437 uint32_t *map, uint16_t *score_map,int map_generation, | |
438 op_pixels_abs_func pix_abs) | |
281
1fc96b02142e
mpeg4 aspect_ratio_info in AVCodecContext (requested by alex)
michaelni
parents:
280
diff
changeset
|
439 { |
1fc96b02142e
mpeg4 aspect_ratio_info in AVCodecContext (requested by alex)
michaelni
parents:
280
diff
changeset
|
440 int dir=0; |
1fc96b02142e
mpeg4 aspect_ratio_info in AVCodecContext (requested by alex)
michaelni
parents:
280
diff
changeset
|
441 int c=1; |
1fc96b02142e
mpeg4 aspect_ratio_info in AVCodecContext (requested by alex)
michaelni
parents:
280
diff
changeset
|
442 static int x_dir[8]= {1,1,0,-1,-1,-1, 0, 1}; |
1fc96b02142e
mpeg4 aspect_ratio_info in AVCodecContext (requested by alex)
michaelni
parents:
280
diff
changeset
|
443 static int y_dir[8]= {0,1,1, 1, 0,-1,-1,-1}; |
1fc96b02142e
mpeg4 aspect_ratio_info in AVCodecContext (requested by alex)
michaelni
parents:
280
diff
changeset
|
444 int fails=0; |
1fc96b02142e
mpeg4 aspect_ratio_info in AVCodecContext (requested by alex)
michaelni
parents:
280
diff
changeset
|
445 int last_d[2]={dmin, dmin}; |
1fc96b02142e
mpeg4 aspect_ratio_info in AVCodecContext (requested by alex)
michaelni
parents:
280
diff
changeset
|
446 |
1fc96b02142e
mpeg4 aspect_ratio_info in AVCodecContext (requested by alex)
michaelni
parents:
280
diff
changeset
|
447 /*static int good=0; |
1fc96b02142e
mpeg4 aspect_ratio_info in AVCodecContext (requested by alex)
michaelni
parents:
280
diff
changeset
|
448 static int bad=0; |
1fc96b02142e
mpeg4 aspect_ratio_info in AVCodecContext (requested by alex)
michaelni
parents:
280
diff
changeset
|
449 static int point=0; |
1fc96b02142e
mpeg4 aspect_ratio_info in AVCodecContext (requested by alex)
michaelni
parents:
280
diff
changeset
|
450 |
1fc96b02142e
mpeg4 aspect_ratio_info in AVCodecContext (requested by alex)
michaelni
parents:
280
diff
changeset
|
451 point++; |
1fc96b02142e
mpeg4 aspect_ratio_info in AVCodecContext (requested by alex)
michaelni
parents:
280
diff
changeset
|
452 if(256*256*256*64%point==0) |
1fc96b02142e
mpeg4 aspect_ratio_info in AVCodecContext (requested by alex)
michaelni
parents:
280
diff
changeset
|
453 { |
1fc96b02142e
mpeg4 aspect_ratio_info in AVCodecContext (requested by alex)
michaelni
parents:
280
diff
changeset
|
454 printf("%d %d %d\n", good, bad, point); |
1fc96b02142e
mpeg4 aspect_ratio_info in AVCodecContext (requested by alex)
michaelni
parents:
280
diff
changeset
|
455 }*/ |
1fc96b02142e
mpeg4 aspect_ratio_info in AVCodecContext (requested by alex)
michaelni
parents:
280
diff
changeset
|
456 |
1fc96b02142e
mpeg4 aspect_ratio_info in AVCodecContext (requested by alex)
michaelni
parents:
280
diff
changeset
|
457 for(;;){ |
1fc96b02142e
mpeg4 aspect_ratio_info in AVCodecContext (requested by alex)
michaelni
parents:
280
diff
changeset
|
458 int x= best[0]; |
1fc96b02142e
mpeg4 aspect_ratio_info in AVCodecContext (requested by alex)
michaelni
parents:
280
diff
changeset
|
459 int y= best[1]; |
1fc96b02142e
mpeg4 aspect_ratio_info in AVCodecContext (requested by alex)
michaelni
parents:
280
diff
changeset
|
460 int d; |
1fc96b02142e
mpeg4 aspect_ratio_info in AVCodecContext (requested by alex)
michaelni
parents:
280
diff
changeset
|
461 x+=x_dir[dir]; |
1fc96b02142e
mpeg4 aspect_ratio_info in AVCodecContext (requested by alex)
michaelni
parents:
280
diff
changeset
|
462 y+=y_dir[dir]; |
1fc96b02142e
mpeg4 aspect_ratio_info in AVCodecContext (requested by alex)
michaelni
parents:
280
diff
changeset
|
463 if(x>=xmin && x<=xmax && y>=ymin && y<=ymax){ |
455 | 464 const int key= ((y)<<ME_MAP_MV_BITS) + (x) + map_generation; |
465 const int index= (((y)<<ME_MAP_SHIFT) + (x))&(ME_MAP_SIZE-1); | |
466 if(map[index]!=key){ | |
467 d = pix_abs(new_pic, old_pic + (x) + (y)*pic_stride, pic_stride); | |
468 d += (mv_penalty[((x)<<shift)-pred_x] + mv_penalty[((y)<<shift)-pred_y])*quant; | |
469 map[index]=key; | |
470 score_map[index]=d; | |
471 }else | |
472 d= dmin+1; | |
281
1fc96b02142e
mpeg4 aspect_ratio_info in AVCodecContext (requested by alex)
michaelni
parents:
280
diff
changeset
|
473 }else{ |
1fc96b02142e
mpeg4 aspect_ratio_info in AVCodecContext (requested by alex)
michaelni
parents:
280
diff
changeset
|
474 d = dmin + 10000; //FIXME smarter boundary handling |
1fc96b02142e
mpeg4 aspect_ratio_info in AVCodecContext (requested by alex)
michaelni
parents:
280
diff
changeset
|
475 } |
1fc96b02142e
mpeg4 aspect_ratio_info in AVCodecContext (requested by alex)
michaelni
parents:
280
diff
changeset
|
476 if(d<dmin){ |
1fc96b02142e
mpeg4 aspect_ratio_info in AVCodecContext (requested by alex)
michaelni
parents:
280
diff
changeset
|
477 best[0]=x; |
1fc96b02142e
mpeg4 aspect_ratio_info in AVCodecContext (requested by alex)
michaelni
parents:
280
diff
changeset
|
478 best[1]=y; |
1fc96b02142e
mpeg4 aspect_ratio_info in AVCodecContext (requested by alex)
michaelni
parents:
280
diff
changeset
|
479 dmin=d; |
1fc96b02142e
mpeg4 aspect_ratio_info in AVCodecContext (requested by alex)
michaelni
parents:
280
diff
changeset
|
480 |
1fc96b02142e
mpeg4 aspect_ratio_info in AVCodecContext (requested by alex)
michaelni
parents:
280
diff
changeset
|
481 if(last_d[1] - last_d[0] > last_d[0] - d) c= -c; |
1fc96b02142e
mpeg4 aspect_ratio_info in AVCodecContext (requested by alex)
michaelni
parents:
280
diff
changeset
|
482 dir+=c; |
1fc96b02142e
mpeg4 aspect_ratio_info in AVCodecContext (requested by alex)
michaelni
parents:
280
diff
changeset
|
483 |
1fc96b02142e
mpeg4 aspect_ratio_info in AVCodecContext (requested by alex)
michaelni
parents:
280
diff
changeset
|
484 fails=0; |
1fc96b02142e
mpeg4 aspect_ratio_info in AVCodecContext (requested by alex)
michaelni
parents:
280
diff
changeset
|
485 //good++; |
1fc96b02142e
mpeg4 aspect_ratio_info in AVCodecContext (requested by alex)
michaelni
parents:
280
diff
changeset
|
486 last_d[1]=last_d[0]; |
1fc96b02142e
mpeg4 aspect_ratio_info in AVCodecContext (requested by alex)
michaelni
parents:
280
diff
changeset
|
487 last_d[0]=d; |
1fc96b02142e
mpeg4 aspect_ratio_info in AVCodecContext (requested by alex)
michaelni
parents:
280
diff
changeset
|
488 }else{ |
1fc96b02142e
mpeg4 aspect_ratio_info in AVCodecContext (requested by alex)
michaelni
parents:
280
diff
changeset
|
489 //bad++; |
1fc96b02142e
mpeg4 aspect_ratio_info in AVCodecContext (requested by alex)
michaelni
parents:
280
diff
changeset
|
490 if(fails){ |
455 | 491 if(fails>=SNAKE_1+1) return dmin; |
281
1fc96b02142e
mpeg4 aspect_ratio_info in AVCodecContext (requested by alex)
michaelni
parents:
280
diff
changeset
|
492 }else{ |
455 | 493 if(dir&1) dir-= c*3; |
494 else c= -c; | |
495 // c= -c; | |
281
1fc96b02142e
mpeg4 aspect_ratio_info in AVCodecContext (requested by alex)
michaelni
parents:
280
diff
changeset
|
496 } |
455 | 497 dir+=c*SNAKE_2; |
281
1fc96b02142e
mpeg4 aspect_ratio_info in AVCodecContext (requested by alex)
michaelni
parents:
280
diff
changeset
|
498 fails++; |
1fc96b02142e
mpeg4 aspect_ratio_info in AVCodecContext (requested by alex)
michaelni
parents:
280
diff
changeset
|
499 } |
1fc96b02142e
mpeg4 aspect_ratio_info in AVCodecContext (requested by alex)
michaelni
parents:
280
diff
changeset
|
500 dir&=7; |
1fc96b02142e
mpeg4 aspect_ratio_info in AVCodecContext (requested by alex)
michaelni
parents:
280
diff
changeset
|
501 } |
277
5cb2978e701f
new motion estimation (epzs) not complete yet but allready pretty good :)
michaelni
parents:
275
diff
changeset
|
502 } |
5cb2978e701f
new motion estimation (epzs) not complete yet but allready pretty good :)
michaelni
parents:
275
diff
changeset
|
503 |
455 | 504 static inline int cross_search(MpegEncContext * s, int *best, int dmin, |
505 UINT8 *new_pic, UINT8 *old_pic, int pic_stride, | |
506 int pred_x, int pred_y, UINT16 *mv_penalty, int quant, | |
507 int xmin, int ymin, int xmax, int ymax, int shift, | |
508 uint32_t *map, uint16_t *score_map,int map_generation, | |
509 op_pixels_abs_func pix_abs) | |
510 { | |
511 static int x_dir[4]= {-1, 0, 1, 0}; | |
512 static int y_dir[4]= { 0,-1, 0, 1}; | |
513 int improvement[2]={100000, 100000}; | |
514 int dirs[2]={2, 3}; | |
515 int dir; | |
516 int last_dir= -1; | |
517 | |
518 for(;;){ | |
519 dir= dirs[ improvement[0] > improvement[1] ? 0 : 1 ]; | |
520 if(improvement[dir&1]==-1) return dmin; | |
521 | |
522 { | |
523 const int x= best[0] + x_dir[dir]; | |
524 const int y= best[1] + y_dir[dir]; | |
525 const int key= (y<<ME_MAP_MV_BITS) + x + map_generation; | |
526 const int index= ((y<<ME_MAP_SHIFT) + x)&(ME_MAP_SIZE-1); | |
527 int d; | |
528 if(x>=xmin && x<=xmax && y>=ymin && y<=ymax){ | |
529 if(map[index]!=key){ | |
530 d = pix_abs(new_pic, old_pic + x + y*pic_stride, pic_stride); | |
531 d += (mv_penalty[(x<<shift)-pred_x] + mv_penalty[(y<<shift)-pred_y])*quant; | |
532 map[index]=key; | |
533 score_map[index]=d; | |
534 if(d<dmin){ | |
535 improvement[dir&1]= dmin-d; | |
536 improvement[(dir&1)^1]++; | |
537 dmin=d; | |
538 best[0]= x; | |
539 best[1]= y; | |
540 last_dir=dir; | |
541 continue; | |
542 } | |
543 }else{ | |
544 d= score_map[index]; | |
545 } | |
546 }else{ | |
547 d= dmin + 1000; //FIXME is this a good idea? | |
548 } | |
549 /* evaluated point was cached or checked and worse */ | |
550 | |
551 if(last_dir==dir){ | |
552 improvement[dir&1]= -1; | |
553 }else{ | |
554 improvement[dir&1]= d-dmin; | |
555 last_dir= dirs[dir&1]= dir^2; | |
556 } | |
557 } | |
558 } | |
559 } | |
560 | |
561 static inline int update_map_generation(MpegEncContext * s) | |
562 { | |
563 s->me_map_generation+= 1<<(ME_MAP_MV_BITS*2); | |
564 if(s->me_map_generation==0){ | |
565 s->me_map_generation= 1<<(ME_MAP_MV_BITS*2); | |
566 memset(s->me_map, 0, sizeof(uint32_t)*ME_MAP_SIZE); | |
567 } | |
568 return s->me_map_generation; | |
569 } | |
570 | |
277
5cb2978e701f
new motion estimation (epzs) not complete yet but allready pretty good :)
michaelni
parents:
275
diff
changeset
|
571 static int epzs_motion_search(MpegEncContext * s, |
5cb2978e701f
new motion estimation (epzs) not complete yet but allready pretty good :)
michaelni
parents:
275
diff
changeset
|
572 int *mx_ptr, int *my_ptr, |
455 | 573 int P[10][2], int pred_x, int pred_y, |
324 | 574 int xmin, int ymin, int xmax, int ymax, uint8_t * ref_picture) |
277
5cb2978e701f
new motion estimation (epzs) not complete yet but allready pretty good :)
michaelni
parents:
275
diff
changeset
|
575 { |
5cb2978e701f
new motion estimation (epzs) not complete yet but allready pretty good :)
michaelni
parents:
275
diff
changeset
|
576 int best[2]={0, 0}; |
5cb2978e701f
new motion estimation (epzs) not complete yet but allready pretty good :)
michaelni
parents:
275
diff
changeset
|
577 int d, dmin; |
5cb2978e701f
new motion estimation (epzs) not complete yet but allready pretty good :)
michaelni
parents:
275
diff
changeset
|
578 UINT8 *new_pic, *old_pic; |
5cb2978e701f
new motion estimation (epzs) not complete yet but allready pretty good :)
michaelni
parents:
275
diff
changeset
|
579 const int pic_stride= s->linesize; |
5cb2978e701f
new motion estimation (epzs) not complete yet but allready pretty good :)
michaelni
parents:
275
diff
changeset
|
580 const int pic_xy= (s->mb_y*pic_stride + s->mb_x)*16; |
5cb2978e701f
new motion estimation (epzs) not complete yet but allready pretty good :)
michaelni
parents:
275
diff
changeset
|
581 UINT16 *mv_penalty= s->mv_penalty[s->f_code] + MAX_MV; // f_code of the prev frame |
5cb2978e701f
new motion estimation (epzs) not complete yet but allready pretty good :)
michaelni
parents:
275
diff
changeset
|
582 int quant= s->qscale; // qscale of the prev frame |
5cb2978e701f
new motion estimation (epzs) not complete yet but allready pretty good :)
michaelni
parents:
275
diff
changeset
|
583 const int shift= 1+s->quarter_sample; |
455 | 584 uint32_t *map= s->me_map; |
585 uint16_t *score_map= s->me_score_map; | |
586 int map_generation; | |
277
5cb2978e701f
new motion estimation (epzs) not complete yet but allready pretty good :)
michaelni
parents:
275
diff
changeset
|
587 |
5cb2978e701f
new motion estimation (epzs) not complete yet but allready pretty good :)
michaelni
parents:
275
diff
changeset
|
588 new_pic = s->new_picture[0] + pic_xy; |
324 | 589 old_pic = ref_picture + pic_xy; |
455 | 590 |
591 map_generation= update_map_generation(s); | |
592 | |
294 | 593 dmin = pix_abs16x16(new_pic, old_pic, pic_stride); |
455 | 594 map[0]= map_generation; |
595 score_map[0]= dmin; | |
277
5cb2978e701f
new motion estimation (epzs) not complete yet but allready pretty good :)
michaelni
parents:
275
diff
changeset
|
596 |
280 | 597 /* first line */ |
455 | 598 if ((s->mb_y == 0 || s->first_slice_line)) { |
599 CHECK_MV(P_LEFT[0]>>shift, P_LEFT[1]>>shift) | |
600 CHECK_MV(P_LAST[0]>>shift, P_LAST[1]>>shift) | |
280 | 601 }else{ |
455 | 602 if(dmin<256 && ( P_LEFT[0] |P_LEFT[1] |
603 |P_TOP[0] |P_TOP[1] | |
604 |P_TOPRIGHT[0]|P_TOPRIGHT[1])==0){ | |
605 *mx_ptr= 0; | |
606 *my_ptr= 0; | |
607 s->skip_me=1; | |
277
5cb2978e701f
new motion estimation (epzs) not complete yet but allready pretty good :)
michaelni
parents:
275
diff
changeset
|
608 return dmin; |
5cb2978e701f
new motion estimation (epzs) not complete yet but allready pretty good :)
michaelni
parents:
275
diff
changeset
|
609 } |
455 | 610 CHECK_MV(P_MEDIAN[0]>>shift, P_MEDIAN[1]>>shift) |
611 if(dmin>256*2){ | |
612 CHECK_MV(P_LAST[0] >>shift, P_LAST[1] >>shift) | |
613 CHECK_MV(P_LEFT[0] >>shift, P_LEFT[1] >>shift) | |
614 CHECK_MV(P_TOP[0] >>shift, P_TOP[1] >>shift) | |
615 CHECK_MV(P_TOPRIGHT[0]>>shift, P_TOPRIGHT[1]>>shift) | |
616 } | |
617 } | |
618 if(dmin>256*4){ | |
619 CHECK_MV(P_LAST_RIGHT[0] >>shift, P_LAST_RIGHT[1] >>shift) | |
620 CHECK_MV(P_LAST_BOTTOM[0]>>shift, P_LAST_BOTTOM[1]>>shift) | |
277
5cb2978e701f
new motion estimation (epzs) not complete yet but allready pretty good :)
michaelni
parents:
275
diff
changeset
|
621 } |
455 | 622 #if 0 //doest only slow things down |
623 if(dmin>512*3){ | |
624 int step; | |
625 dmin= score_map[0]; | |
626 best[0]= best[1]=0; | |
627 for(step=128; step>0; step>>=1){ | |
628 const int step2= step; | |
629 int y; | |
630 for(y=-step2+best[1]; y<=step2+best[1]; y+=step){ | |
631 int x; | |
632 if(y<ymin || y>ymax) continue; | |
277
5cb2978e701f
new motion estimation (epzs) not complete yet but allready pretty good :)
michaelni
parents:
275
diff
changeset
|
633 |
455 | 634 for(x=-step2+best[0]; x<=step2+best[0]; x+=step){ |
635 if(x<xmin || x>xmax) continue; | |
636 if(x==best[0] && y==best[1]) continue; | |
637 CHECK_MV(x,y) | |
638 } | |
639 } | |
640 } | |
641 } | |
642 #endif | |
281
1fc96b02142e
mpeg4 aspect_ratio_info in AVCodecContext (requested by alex)
michaelni
parents:
280
diff
changeset
|
643 //check(best[0],best[1],0, b0) |
320
cda7d0857baf
- ME setting moved to AVCodecContext/MpegEncContext, no longer a global.
pulento
parents:
304
diff
changeset
|
644 if(s->me_method==ME_EPZS) |
281
1fc96b02142e
mpeg4 aspect_ratio_info in AVCodecContext (requested by alex)
michaelni
parents:
280
diff
changeset
|
645 dmin= small_diamond_search(s, best, dmin, new_pic, old_pic, pic_stride, |
455 | 646 pred_x, pred_y, mv_penalty, quant, xmin, ymin, xmax, ymax, |
647 shift, map, score_map, map_generation, pix_abs16x16); | |
281
1fc96b02142e
mpeg4 aspect_ratio_info in AVCodecContext (requested by alex)
michaelni
parents:
280
diff
changeset
|
648 else |
455 | 649 dmin= cross_search(s, best, dmin, new_pic, old_pic, pic_stride, |
650 pred_x, pred_y, mv_penalty, quant, xmin, ymin, xmax, ymax, | |
651 shift, map, score_map, map_generation, pix_abs16x16); | |
281
1fc96b02142e
mpeg4 aspect_ratio_info in AVCodecContext (requested by alex)
michaelni
parents:
280
diff
changeset
|
652 //check(best[0],best[1],0, b1) |
277
5cb2978e701f
new motion estimation (epzs) not complete yet but allready pretty good :)
michaelni
parents:
275
diff
changeset
|
653 *mx_ptr= best[0]; |
280 | 654 *my_ptr= best[1]; |
277
5cb2978e701f
new motion estimation (epzs) not complete yet but allready pretty good :)
michaelni
parents:
275
diff
changeset
|
655 |
5cb2978e701f
new motion estimation (epzs) not complete yet but allready pretty good :)
michaelni
parents:
275
diff
changeset
|
656 // printf("%d %d %d \n", best[0], best[1], dmin); |
5cb2978e701f
new motion estimation (epzs) not complete yet but allready pretty good :)
michaelni
parents:
275
diff
changeset
|
657 return dmin; |
5cb2978e701f
new motion estimation (epzs) not complete yet but allready pretty good :)
michaelni
parents:
275
diff
changeset
|
658 } |
5cb2978e701f
new motion estimation (epzs) not complete yet but allready pretty good :)
michaelni
parents:
275
diff
changeset
|
659 |
294 | 660 static int epzs_motion_search4(MpegEncContext * s, int block, |
661 int *mx_ptr, int *my_ptr, | |
455 | 662 int P[10][2], int pred_x, int pred_y, |
324 | 663 int xmin, int ymin, int xmax, int ymax, uint8_t *ref_picture) |
294 | 664 { |
665 int best[2]={0, 0}; | |
666 int d, dmin; | |
667 UINT8 *new_pic, *old_pic; | |
668 const int pic_stride= s->linesize; | |
669 const int pic_xy= ((s->mb_y*2 + (block>>1))*pic_stride + s->mb_x*2 + (block&1))*8; | |
670 UINT16 *mv_penalty= s->mv_penalty[s->f_code] + MAX_MV; // f_code of the prev frame | |
671 int quant= s->qscale; // qscale of the prev frame | |
672 const int shift= 1+s->quarter_sample; | |
455 | 673 uint32_t *map= s->me_map; |
674 uint16_t *score_map= s->me_score_map; | |
675 int map_generation; | |
294 | 676 |
677 new_pic = s->new_picture[0] + pic_xy; | |
324 | 678 old_pic = ref_picture + pic_xy; |
455 | 679 |
680 map_generation= update_map_generation(s); | |
294 | 681 |
455 | 682 dmin = 1000000; |
683 //printf("%d %d %d %d //",xmin, ymin, xmax, ymax); | |
294 | 684 /* first line */ |
455 | 685 if ((s->mb_y == 0 || s->first_slice_line) && block<2) { |
686 CHECK_MV4(P_LEFT[0]>>shift, P_LEFT[1]>>shift) | |
687 CHECK_MV4(P_LAST[0]>>shift, P_LAST[1]>>shift) | |
688 CHECK_MV4(P_MV1[0]>>shift, P_MV1[1]>>shift) | |
294 | 689 }else{ |
455 | 690 CHECK_MV4(P_MV1[0]>>shift, P_MV1[1]>>shift) |
691 //FIXME try some early stop | |
692 if(dmin>64*2){ | |
693 CHECK_MV4(P_MEDIAN[0]>>shift, P_MEDIAN[1]>>shift) | |
694 CHECK_MV4(P_LEFT[0]>>shift, P_LEFT[1]>>shift) | |
695 CHECK_MV4(P_TOP[0]>>shift, P_TOP[1]>>shift) | |
696 CHECK_MV4(P_TOPRIGHT[0]>>shift, P_TOPRIGHT[1]>>shift) | |
697 CHECK_MV4(P_LAST[0]>>shift, P_LAST[1]>>shift) | |
294 | 698 } |
455 | 699 } |
700 if(dmin>64*4){ | |
701 CHECK_MV4(P_LAST_RIGHT[0]>>shift, P_LAST_RIGHT[1]>>shift) | |
702 CHECK_MV4(P_LAST_BOTTOM[0]>>shift, P_LAST_BOTTOM[1]>>shift) | |
294 | 703 } |
704 | |
455 | 705 if(s->me_method==ME_EPZS) |
706 dmin= small_diamond_search(s, best, dmin, new_pic, old_pic, pic_stride, | |
707 pred_x, pred_y, mv_penalty, quant, xmin, ymin, xmax, ymax, | |
708 shift, map, score_map, map_generation, pix_abs8x8); | |
709 else | |
710 dmin= cross_search(s, best, dmin, new_pic, old_pic, pic_stride, | |
711 pred_x, pred_y, mv_penalty, quant, xmin, ymin, xmax, ymax, | |
712 shift, map, score_map, map_generation, pix_abs8x8); | |
713 | |
294 | 714 *mx_ptr= best[0]; |
715 *my_ptr= best[1]; | |
716 | |
717 // printf("%d %d %d \n", best[0], best[1], dmin); | |
718 return dmin; | |
719 } | |
720 | |
277
5cb2978e701f
new motion estimation (epzs) not complete yet but allready pretty good :)
michaelni
parents:
275
diff
changeset
|
721 #define CHECK_HALF_MV(suffix, x, y) \ |
455 | 722 {\ |
723 d= pix_abs_ ## suffix(pix, ptr+((x)>>1), s->linesize);\ | |
277
5cb2978e701f
new motion estimation (epzs) not complete yet but allready pretty good :)
michaelni
parents:
275
diff
changeset
|
724 d += (mv_penalty[pen_x + x] + mv_penalty[pen_y + y])*quant;\ |
455 | 725 COPY3_IF_LT(dminh, d, dx, x, dy, y)\ |
726 } | |
277
5cb2978e701f
new motion estimation (epzs) not complete yet but allready pretty good :)
michaelni
parents:
275
diff
changeset
|
727 |
294 | 728 |
0 | 729 /* The idea would be to make half pel ME after Inter/Intra decision to |
730 save time. */ | |
327 | 731 static inline int halfpel_motion_search(MpegEncContext * s, |
0 | 732 int *mx_ptr, int *my_ptr, int dmin, |
277
5cb2978e701f
new motion estimation (epzs) not complete yet but allready pretty good :)
michaelni
parents:
275
diff
changeset
|
733 int xmin, int ymin, int xmax, int ymax, |
455 | 734 int pred_x, int pred_y, uint8_t *ref_picture, |
735 op_pixels_abs_func pix_abs_x2, | |
736 op_pixels_abs_func pix_abs_y2, op_pixels_abs_func pix_abs_xy2, int n) | |
0 | 737 { |
277
5cb2978e701f
new motion estimation (epzs) not complete yet but allready pretty good :)
michaelni
parents:
275
diff
changeset
|
738 UINT16 *mv_penalty= s->mv_penalty[s->f_code] + MAX_MV; // f_code of the prev frame |
5cb2978e701f
new motion estimation (epzs) not complete yet but allready pretty good :)
michaelni
parents:
275
diff
changeset
|
739 const int quant= s->qscale; |
455 | 740 int mx, my, xx, yy, dminh; |
277
5cb2978e701f
new motion estimation (epzs) not complete yet but allready pretty good :)
michaelni
parents:
275
diff
changeset
|
741 UINT8 *pix, *ptr; |
0 | 742 |
455 | 743 if(s->skip_me){ |
744 *mx_ptr = 0; | |
745 *my_ptr = 0; | |
746 return dmin; | |
747 }else | |
748 | |
749 xx = 16 * s->mb_x + 8*(n&1); | |
750 yy = 16 * s->mb_y + 8*(n>>1); | |
751 pix = s->new_picture[0] + (yy * s->linesize) + xx; | |
752 | |
277
5cb2978e701f
new motion estimation (epzs) not complete yet but allready pretty good :)
michaelni
parents:
275
diff
changeset
|
753 mx = *mx_ptr; |
5cb2978e701f
new motion estimation (epzs) not complete yet but allready pretty good :)
michaelni
parents:
275
diff
changeset
|
754 my = *my_ptr; |
455 | 755 ptr = ref_picture + ((yy + my) * s->linesize) + (xx + mx); |
277
5cb2978e701f
new motion estimation (epzs) not complete yet but allready pretty good :)
michaelni
parents:
275
diff
changeset
|
756 |
0 | 757 dminh = dmin; |
758 | |
277
5cb2978e701f
new motion estimation (epzs) not complete yet but allready pretty good :)
michaelni
parents:
275
diff
changeset
|
759 if (mx > xmin && mx < xmax && |
5cb2978e701f
new motion estimation (epzs) not complete yet but allready pretty good :)
michaelni
parents:
275
diff
changeset
|
760 my > ymin && my < ymax) { |
455 | 761 int dx=0, dy=0; |
762 int d, pen_x, pen_y; | |
0 | 763 |
455 | 764 mx<<=1; |
765 my<<=1; | |
277
5cb2978e701f
new motion estimation (epzs) not complete yet but allready pretty good :)
michaelni
parents:
275
diff
changeset
|
766 |
5cb2978e701f
new motion estimation (epzs) not complete yet but allready pretty good :)
michaelni
parents:
275
diff
changeset
|
767 pen_x= pred_x + mx; |
5cb2978e701f
new motion estimation (epzs) not complete yet but allready pretty good :)
michaelni
parents:
275
diff
changeset
|
768 pen_y= pred_y + my; |
0 | 769 |
277
5cb2978e701f
new motion estimation (epzs) not complete yet but allready pretty good :)
michaelni
parents:
275
diff
changeset
|
770 ptr-= s->linesize; |
5cb2978e701f
new motion estimation (epzs) not complete yet but allready pretty good :)
michaelni
parents:
275
diff
changeset
|
771 CHECK_HALF_MV(xy2, -1, -1) |
5cb2978e701f
new motion estimation (epzs) not complete yet but allready pretty good :)
michaelni
parents:
275
diff
changeset
|
772 CHECK_HALF_MV(y2 , 0, -1) |
5cb2978e701f
new motion estimation (epzs) not complete yet but allready pretty good :)
michaelni
parents:
275
diff
changeset
|
773 CHECK_HALF_MV(xy2, +1, -1) |
5cb2978e701f
new motion estimation (epzs) not complete yet but allready pretty good :)
michaelni
parents:
275
diff
changeset
|
774 |
5cb2978e701f
new motion estimation (epzs) not complete yet but allready pretty good :)
michaelni
parents:
275
diff
changeset
|
775 ptr+= s->linesize; |
5cb2978e701f
new motion estimation (epzs) not complete yet but allready pretty good :)
michaelni
parents:
275
diff
changeset
|
776 CHECK_HALF_MV(x2 , -1, 0) |
5cb2978e701f
new motion estimation (epzs) not complete yet but allready pretty good :)
michaelni
parents:
275
diff
changeset
|
777 CHECK_HALF_MV(x2 , +1, 0) |
5cb2978e701f
new motion estimation (epzs) not complete yet but allready pretty good :)
michaelni
parents:
275
diff
changeset
|
778 CHECK_HALF_MV(xy2, -1, +1) |
5cb2978e701f
new motion estimation (epzs) not complete yet but allready pretty good :)
michaelni
parents:
275
diff
changeset
|
779 CHECK_HALF_MV(y2 , 0, +1) |
5cb2978e701f
new motion estimation (epzs) not complete yet but allready pretty good :)
michaelni
parents:
275
diff
changeset
|
780 CHECK_HALF_MV(xy2, +1, +1) |
294 | 781 |
455 | 782 mx+=dx; |
783 my+=dy; | |
277
5cb2978e701f
new motion estimation (epzs) not complete yet but allready pretty good :)
michaelni
parents:
275
diff
changeset
|
784 }else{ |
455 | 785 mx<<=1; |
786 my<<=1; | |
0 | 787 } |
788 | |
277
5cb2978e701f
new motion estimation (epzs) not complete yet but allready pretty good :)
michaelni
parents:
275
diff
changeset
|
789 *mx_ptr = mx; |
5cb2978e701f
new motion estimation (epzs) not complete yet but allready pretty good :)
michaelni
parents:
275
diff
changeset
|
790 *my_ptr = my; |
327 | 791 return dminh; |
0 | 792 } |
793 | |
455 | 794 static inline int fast_halfpel_motion_search(MpegEncContext * s, |
294 | 795 int *mx_ptr, int *my_ptr, int dmin, |
796 int xmin, int ymin, int xmax, int ymax, | |
455 | 797 int pred_x, int pred_y, uint8_t *ref_picture, |
798 op_pixels_abs_func pix_abs_x2, | |
799 op_pixels_abs_func pix_abs_y2, op_pixels_abs_func pix_abs_xy2, int n) | |
294 | 800 { |
801 UINT16 *mv_penalty= s->mv_penalty[s->f_code] + MAX_MV; // f_code of the prev frame | |
455 | 802 uint16_t *score_map= s->me_score_map; |
294 | 803 const int quant= s->qscale; |
455 | 804 int mx, my, xx, yy, dminh; |
294 | 805 UINT8 *pix, *ptr; |
806 | |
455 | 807 if(s->skip_me){ |
808 // printf("S"); | |
809 *mx_ptr = 0; | |
810 *my_ptr = 0; | |
811 return dmin; | |
812 } | |
813 // printf("N"); | |
814 | |
815 xx = 16 * s->mb_x + 8*(n&1); | |
816 yy = 16 * s->mb_y + 8*(n>>1); | |
294 | 817 pix = s->new_picture[0] + (yy * s->linesize) + xx; |
455 | 818 |
294 | 819 mx = *mx_ptr; |
820 my = *my_ptr; | |
455 | 821 ptr = ref_picture + ((yy + my) * s->linesize) + (xx + mx); |
822 | |
294 | 823 dminh = dmin; |
824 | |
825 if (mx > xmin && mx < xmax && | |
826 my > ymin && my < ymax) { | |
455 | 827 int dx=0, dy=0; |
828 int d, pen_x, pen_y; | |
829 const int index= (my<<ME_MAP_SHIFT) + mx; | |
830 const int t= score_map[(index-(1<<ME_MAP_SHIFT))&(ME_MAP_SIZE-1)]; | |
831 const int l= score_map[(index- 1 )&(ME_MAP_SIZE-1)]; | |
832 const int r= score_map[(index+ 1 )&(ME_MAP_SIZE-1)]; | |
833 const int b= score_map[(index+(1<<ME_MAP_SHIFT))&(ME_MAP_SIZE-1)]; | |
834 mx<<=1; | |
835 my<<=1; | |
294 | 836 |
837 | |
838 pen_x= pred_x + mx; | |
839 pen_y= pred_y + my; | |
840 | |
841 ptr-= s->linesize; | |
455 | 842 if(t<=b){ |
843 CHECK_HALF_MV(y2 , 0, -1) | |
844 if(l<=r){ | |
845 CHECK_HALF_MV(xy2, -1, -1) | |
846 if(t+r<=b+l){ | |
847 CHECK_HALF_MV(xy2, +1, -1) | |
848 ptr+= s->linesize; | |
849 }else{ | |
850 ptr+= s->linesize; | |
851 CHECK_HALF_MV(xy2, -1, +1) | |
852 } | |
853 CHECK_HALF_MV(x2 , -1, 0) | |
854 }else{ | |
855 CHECK_HALF_MV(xy2, +1, -1) | |
856 if(t+l<=b+r){ | |
857 CHECK_HALF_MV(xy2, -1, -1) | |
858 ptr+= s->linesize; | |
859 }else{ | |
860 ptr+= s->linesize; | |
861 CHECK_HALF_MV(xy2, +1, +1) | |
862 } | |
863 CHECK_HALF_MV(x2 , +1, 0) | |
864 } | |
865 }else{ | |
866 if(l<=r){ | |
867 if(t+l<=b+r){ | |
868 CHECK_HALF_MV(xy2, -1, -1) | |
869 ptr+= s->linesize; | |
870 }else{ | |
871 ptr+= s->linesize; | |
872 CHECK_HALF_MV(xy2, +1, +1) | |
873 } | |
874 CHECK_HALF_MV(x2 , -1, 0) | |
875 CHECK_HALF_MV(xy2, -1, +1) | |
876 }else{ | |
877 if(t+r<=b+l){ | |
878 CHECK_HALF_MV(xy2, +1, -1) | |
879 ptr+= s->linesize; | |
880 }else{ | |
881 ptr+= s->linesize; | |
882 CHECK_HALF_MV(xy2, -1, +1) | |
883 } | |
884 CHECK_HALF_MV(x2 , +1, 0) | |
885 CHECK_HALF_MV(xy2, +1, +1) | |
886 } | |
887 CHECK_HALF_MV(y2 , 0, +1) | |
888 } | |
889 mx+=dx; | |
890 my+=dy; | |
294 | 891 |
892 }else{ | |
455 | 893 mx<<=1; |
894 my<<=1; | |
294 | 895 } |
896 | |
897 *mx_ptr = mx; | |
898 *my_ptr = my; | |
455 | 899 return dminh; |
294 | 900 } |
901 | |
455 | 902 static inline void set_p_mv_tables(MpegEncContext * s, int mx, int my, int mv4) |
294 | 903 { |
324 | 904 const int xy= s->mb_x + 1 + (s->mb_y + 1)*(s->mb_width + 2); |
294 | 905 |
324 | 906 s->p_mv_table[xy][0] = mx; |
907 s->p_mv_table[xy][1] = my; | |
294 | 908 |
909 /* has allready been set to the 4 MV if 4MV is done */ | |
455 | 910 if(mv4){ |
294 | 911 int mot_xy= s->block_index[0]; |
912 | |
913 s->motion_val[mot_xy ][0]= mx; | |
914 s->motion_val[mot_xy ][1]= my; | |
915 s->motion_val[mot_xy+1][0]= mx; | |
916 s->motion_val[mot_xy+1][1]= my; | |
917 | |
918 mot_xy += s->block_wrap[0]; | |
919 s->motion_val[mot_xy ][0]= mx; | |
920 s->motion_val[mot_xy ][1]= my; | |
921 s->motion_val[mot_xy+1][0]= mx; | |
922 s->motion_val[mot_xy+1][1]= my; | |
923 } | |
924 } | |
925 | |
324 | 926 static inline void get_limits(MpegEncContext *s, int *range, int *xmin, int *ymin, int *xmax, int *ymax, int f_code) |
927 { | |
928 *range = 8 * (1 << (f_code - 1)); | |
929 /* XXX: temporary kludge to avoid overflow for msmpeg4 */ | |
930 if (s->out_format == FMT_H263 && !s->h263_msmpeg4) | |
931 *range *= 2; | |
0 | 932 |
324 | 933 if (s->unrestricted_mv) { |
934 *xmin = -16; | |
935 *ymin = -16; | |
936 if (s->h263_plus) | |
937 *range *= 2; | |
938 if(s->avctx==NULL || s->avctx->codec->id!=CODEC_ID_MPEG4){ | |
939 *xmax = s->mb_width*16; | |
940 *ymax = s->mb_height*16; | |
941 }else { | |
942 /* XXX: dunno if this is correct but ffmpeg4 decoder wont like it otherwise | |
943 (cuz the drawn edge isnt large enough))*/ | |
944 *xmax = s->width; | |
945 *ymax = s->height; | |
946 } | |
947 } else { | |
948 *xmin = 0; | |
949 *ymin = 0; | |
950 *xmax = s->mb_width*16 - 16; | |
951 *ymax = s->mb_height*16 - 16; | |
952 } | |
953 } | |
954 | |
455 | 955 static inline int mv4_search(MpegEncContext *s, int xmin, int ymin, int xmax, int ymax, int mx, int my, int shift) |
956 { | |
957 int block; | |
958 int P[10][2]; | |
959 uint8_t *ref_picture= s->last_picture[0]; | |
960 int dmin_sum=0; | |
961 | |
962 for(block=0; block<4; block++){ | |
963 int mx4, my4; | |
964 int pred_x4, pred_y4; | |
965 int dmin4; | |
966 static const int off[4]= {2, 1, 1, -1}; | |
967 const int mot_stride = s->block_wrap[0]; | |
968 const int mot_xy = s->block_index[block]; | |
969 // const int block_x= (block&1); | |
970 // const int block_y= (block>>1); | |
971 #if 1 // this saves us a bit of cliping work and shouldnt affect compression in a negative way | |
972 const int rel_xmin4= xmin; | |
973 const int rel_xmax4= xmax; | |
974 const int rel_ymin4= ymin; | |
975 const int rel_ymax4= ymax; | |
976 #else | |
977 const int rel_xmin4= xmin - block_x*8; | |
978 const int rel_xmax4= xmax - block_x*8 + 8; | |
979 const int rel_ymin4= ymin - block_y*8; | |
980 const int rel_ymax4= ymax - block_y*8 + 8; | |
981 #endif | |
982 P_LAST[0] = s->motion_val[mot_xy ][0]; | |
983 P_LAST[1] = s->motion_val[mot_xy ][1]; | |
984 P_LEFT[0] = s->motion_val[mot_xy - 1][0]; | |
985 P_LEFT[1] = s->motion_val[mot_xy - 1][1]; | |
986 P_LAST_RIGHT[0] = s->motion_val[mot_xy + 1][0]; | |
987 P_LAST_RIGHT[1] = s->motion_val[mot_xy + 1][1]; | |
988 P_LAST_BOTTOM[0]= s->motion_val[mot_xy + 1*mot_stride][0]; | |
989 P_LAST_BOTTOM[1]= s->motion_val[mot_xy + 1*mot_stride][1]; | |
990 | |
991 if(P_LEFT[0] > (rel_xmax4<<shift)) P_LEFT[0] = (rel_xmax4<<shift); | |
992 if(P_LAST_RIGHT[0] < (rel_xmin4<<shift)) P_LAST_RIGHT[0] = (rel_xmin4<<shift); | |
993 if(P_LAST_BOTTOM[1]< (rel_ymin4<<shift)) P_LAST_BOTTOM[1]= (rel_ymin4<<shift); | |
994 | |
995 /* special case for first line */ | |
996 if ((s->mb_y == 0 || s->first_slice_line) && block<2) { | |
997 pred_x4= P_LEFT[0]; | |
998 pred_y4= P_LEFT[1]; | |
999 } else { | |
1000 P_TOP[0] = s->motion_val[mot_xy - mot_stride ][0]; | |
1001 P_TOP[1] = s->motion_val[mot_xy - mot_stride ][1]; | |
1002 P_TOPRIGHT[0] = s->motion_val[mot_xy - mot_stride + off[block]][0]; | |
1003 P_TOPRIGHT[1] = s->motion_val[mot_xy - mot_stride + off[block]][1]; | |
1004 if(P_TOP[1] > (rel_ymax4<<shift)) P_TOP[1] = (rel_ymax4<<shift); | |
1005 if(P_TOPRIGHT[0] < (rel_xmin4<<shift)) P_TOPRIGHT[0]= (rel_xmin4<<shift); | |
1006 if(P_TOPRIGHT[0] > (rel_xmax4<<shift)) P_TOPRIGHT[0]= (rel_xmax4<<shift); | |
1007 if(P_TOPRIGHT[1] > (rel_ymax4<<shift)) P_TOPRIGHT[1]= (rel_ymax4<<shift); | |
1008 | |
1009 P_MEDIAN[0]= mid_pred(P_LEFT[0], P_TOP[0], P_TOPRIGHT[0]); | |
1010 P_MEDIAN[1]= mid_pred(P_LEFT[1], P_TOP[1], P_TOPRIGHT[1]); | |
1011 | |
1012 if(s->out_format == FMT_H263){ | |
1013 pred_x4 = P_MEDIAN[0]; | |
1014 pred_y4 = P_MEDIAN[1]; | |
1015 }else { /* mpeg1 at least */ | |
1016 pred_x4= P_LEFT[0]; | |
1017 pred_y4= P_LEFT[1]; | |
1018 } | |
1019 } | |
1020 P_MV1[0]= mx; | |
1021 P_MV1[1]= my; | |
1022 | |
1023 dmin4 = epzs_motion_search4(s, block, &mx4, &my4, P, pred_x4, pred_y4, rel_xmin4, rel_ymin4, rel_xmax4, rel_ymax4, ref_picture); | |
1024 | |
1025 dmin4= fast_halfpel_motion_search(s, &mx4, &my4, dmin4, rel_xmin4, rel_ymin4, rel_xmax4, rel_ymax4, | |
1026 pred_x4, pred_y4, ref_picture, pix_abs8x8_x2, | |
1027 pix_abs8x8_y2, pix_abs8x8_xy2, block); | |
1028 | |
1029 s->motion_val[ s->block_index[block] ][0]= mx4; | |
1030 s->motion_val[ s->block_index[block] ][1]= my4; | |
1031 dmin_sum+= dmin4; | |
1032 } | |
1033 return dmin_sum; | |
1034 } | |
1035 | |
324 | 1036 void ff_estimate_p_frame_motion(MpegEncContext * s, |
1037 int mb_x, int mb_y) | |
0 | 1038 { |
1039 UINT8 *pix, *ppix; | |
1040 int sum, varc, vard, mx, my, range, dmin, xx, yy; | |
1041 int xmin, ymin, xmax, ymax; | |
280 | 1042 int rel_xmin, rel_ymin, rel_xmax, rel_ymax; |
277
5cb2978e701f
new motion estimation (epzs) not complete yet but allready pretty good :)
michaelni
parents:
275
diff
changeset
|
1043 int pred_x=0, pred_y=0; |
455 | 1044 int P[10][2]; |
280 | 1045 const int shift= 1+s->quarter_sample; |
294 | 1046 int mb_type=0; |
324 | 1047 uint8_t *ref_picture= s->last_picture[0]; |
0 | 1048 |
324 | 1049 get_limits(s, &range, &xmin, &ymin, &xmax, &ymax, s->f_code); |
455 | 1050 rel_xmin= xmin - mb_x*16; |
1051 rel_xmax= xmax - mb_x*16; | |
1052 rel_ymin= ymin - mb_y*16; | |
1053 rel_ymax= ymax - mb_y*16; | |
1054 s->skip_me=0; | |
324 | 1055 |
320
cda7d0857baf
- ME setting moved to AVCodecContext/MpegEncContext, no longer a global.
pulento
parents:
304
diff
changeset
|
1056 switch(s->me_method) { |
0 | 1057 case ME_ZERO: |
1058 default: | |
1059 no_motion_search(s, &mx, &my); | |
455 | 1060 mx-= mb_x*16; |
1061 my-= mb_y*16; | |
0 | 1062 dmin = 0; |
1063 break; | |
1064 case ME_FULL: | |
324 | 1065 dmin = full_motion_search(s, &mx, &my, range, xmin, ymin, xmax, ymax, ref_picture); |
455 | 1066 mx-= mb_x*16; |
1067 my-= mb_y*16; | |
0 | 1068 break; |
1069 case ME_LOG: | |
324 | 1070 dmin = log_motion_search(s, &mx, &my, range / 2, xmin, ymin, xmax, ymax, ref_picture); |
455 | 1071 mx-= mb_x*16; |
1072 my-= mb_y*16; | |
0 | 1073 break; |
1074 case ME_PHODS: | |
324 | 1075 dmin = phods_motion_search(s, &mx, &my, range / 2, xmin, ymin, xmax, ymax, ref_picture); |
455 | 1076 mx-= mb_x*16; |
1077 my-= mb_y*16; | |
0 | 1078 break; |
288 | 1079 case ME_X1: |
277
5cb2978e701f
new motion estimation (epzs) not complete yet but allready pretty good :)
michaelni
parents:
275
diff
changeset
|
1080 case ME_EPZS: |
288 | 1081 { |
294 | 1082 const int mot_stride = s->block_wrap[0]; |
1083 const int mot_xy = s->block_index[0]; | |
288 | 1084 |
455 | 1085 P_LAST[0] = s->motion_val[mot_xy ][0]; |
1086 P_LAST[1] = s->motion_val[mot_xy ][1]; | |
1087 P_LEFT[0] = s->motion_val[mot_xy - 1][0]; | |
1088 P_LEFT[1] = s->motion_val[mot_xy - 1][1]; | |
1089 P_LAST_RIGHT[0] = s->motion_val[mot_xy + 2][0]; | |
1090 P_LAST_RIGHT[1] = s->motion_val[mot_xy + 2][1]; | |
1091 P_LAST_BOTTOM[0]= s->motion_val[mot_xy + 2*mot_stride][0]; | |
1092 P_LAST_BOTTOM[1]= s->motion_val[mot_xy + 2*mot_stride][1]; | |
288 | 1093 |
455 | 1094 if(P_LEFT[0] > (rel_xmax<<shift)) P_LEFT[0] = (rel_xmax<<shift); |
1095 if(P_LAST_RIGHT[0] < (rel_xmin<<shift)) P_LAST_RIGHT[0] = (rel_xmin<<shift); | |
1096 if(P_LAST_BOTTOM[1]< (rel_ymin<<shift)) P_LAST_BOTTOM[1]= (rel_ymin<<shift); | |
280 | 1097 |
1098 /* special case for first line */ | |
455 | 1099 if ((mb_y == 0 || s->first_slice_line)) { |
1100 pred_x= P_LEFT[0]; | |
1101 pred_y= P_LEFT[1]; | |
280 | 1102 } else { |
455 | 1103 P_TOP[0] = s->motion_val[mot_xy - mot_stride ][0]; |
1104 P_TOP[1] = s->motion_val[mot_xy - mot_stride ][1]; | |
1105 P_TOPRIGHT[0] = s->motion_val[mot_xy - mot_stride + 2][0]; | |
1106 P_TOPRIGHT[1] = s->motion_val[mot_xy - mot_stride + 2][1]; | |
1107 if(P_TOP[1] > (rel_ymax<<shift)) P_TOP[1] = (rel_ymax<<shift); | |
1108 if(P_TOPRIGHT[0] < (rel_xmin<<shift)) P_TOPRIGHT[0]= (rel_xmin<<shift); | |
1109 if(P_TOPRIGHT[1] > (rel_ymax<<shift)) P_TOPRIGHT[1]= (rel_ymax<<shift); | |
280 | 1110 |
455 | 1111 P_MEDIAN[0]= mid_pred(P_LEFT[0], P_TOP[0], P_TOPRIGHT[0]); |
1112 P_MEDIAN[1]= mid_pred(P_LEFT[1], P_TOP[1], P_TOPRIGHT[1]); | |
1113 | |
1114 if(s->out_format == FMT_H263){ | |
1115 pred_x = P_MEDIAN[0]; | |
1116 pred_y = P_MEDIAN[1]; | |
1117 }else { /* mpeg1 at least */ | |
1118 pred_x= P_LEFT[0]; | |
1119 pred_y= P_LEFT[1]; | |
1120 } | |
288 | 1121 } |
280 | 1122 } |
324 | 1123 dmin = epzs_motion_search(s, &mx, &my, P, pred_x, pred_y, rel_xmin, rel_ymin, rel_xmax, rel_ymax, ref_picture); |
281
1fc96b02142e
mpeg4 aspect_ratio_info in AVCodecContext (requested by alex)
michaelni
parents:
280
diff
changeset
|
1124 |
277
5cb2978e701f
new motion estimation (epzs) not complete yet but allready pretty good :)
michaelni
parents:
275
diff
changeset
|
1125 break; |
0 | 1126 } |
1127 | |
1128 /* intra / predictive decision */ | |
1129 xx = mb_x * 16; | |
1130 yy = mb_y * 16; | |
1131 | |
1132 pix = s->new_picture[0] + (yy * s->linesize) + xx; | |
455 | 1133 /* At this point (mx,my) are full-pell and the relative displacement */ |
1134 ppix = ref_picture + ((yy+my) * s->linesize) + (xx+mx); | |
289
648e9245546d
seems the old intra/inter decission is slightly better with a threshold, than the new one
michaelni
parents:
288
diff
changeset
|
1135 |
0 | 1136 sum = pix_sum(pix, s->linesize); |
455 | 1137 |
809
79de6308c34d
fixing another assert q>0.0 issue caused by variance < 0, this fix allso changes the inter/intra decission very slightly -> all regression checksums need to be updated
michaelni
parents:
807
diff
changeset
|
1138 varc = (pix_norm1(pix, s->linesize) - (((unsigned)(sum*sum))>>8) + 500 + 128)>>8; |
289
648e9245546d
seems the old intra/inter decission is slightly better with a threshold, than the new one
michaelni
parents:
288
diff
changeset
|
1139 vard = (pix_norm(pix, ppix, s->linesize)+128)>>8; |
608 | 1140 |
455 | 1141 //printf("%d %d %d %X %X %X\n", s->mb_width, mb_x, mb_y,(int)s, (int)s->mb_var, (int)s->mc_mb_var); fflush(stdout); |
1142 s->mb_var [s->mb_width * mb_y + mb_x] = varc; | |
1143 s->mc_mb_var[s->mb_width * mb_y + mb_x] = vard; | |
809
79de6308c34d
fixing another assert q>0.0 issue caused by variance < 0, this fix allso changes the inter/intra decission very slightly -> all regression checksums need to be updated
michaelni
parents:
807
diff
changeset
|
1144 s->mb_mean [s->mb_width * mb_y + mb_x] = (sum+128)>>8; |
455 | 1145 s->mb_var_sum += varc; |
1146 s->mc_mb_var_sum += vard; | |
1147 //printf("E%d %d %d %X %X %X\n", s->mb_width, mb_x, mb_y,(int)s, (int)s->mb_var, (int)s->mc_mb_var); fflush(stdout); | |
320
cda7d0857baf
- ME setting moved to AVCodecContext/MpegEncContext, no longer a global.
pulento
parents:
304
diff
changeset
|
1148 |
0 | 1149 #if 0 |
233
3f5b72726118
- More work on preliminary bit rate control, just to be able to get an
pulento
parents:
232
diff
changeset
|
1150 printf("varc=%4d avg_var=%4d (sum=%4d) vard=%4d mx=%2d my=%2d\n", |
3f5b72726118
- More work on preliminary bit rate control, just to be able to get an
pulento
parents:
232
diff
changeset
|
1151 varc, s->avg_mb_var, sum, vard, mx - xx, my - yy); |
0 | 1152 #endif |
294 | 1153 if(s->flags&CODEC_FLAG_HQ){ |
608 | 1154 if (vard <= 64 || vard < varc) |
1155 s->scene_change_score+= ff_sqrt(vard) - ff_sqrt(varc); | |
1156 else | |
1157 s->scene_change_score+= 20; | |
1158 | |
294 | 1159 if (vard*2 + 200 > varc) |
1160 mb_type|= MB_TYPE_INTRA; | |
1161 if (varc*2 + 200 > vard){ | |
1162 mb_type|= MB_TYPE_INTER; | |
455 | 1163 if(s->me_method >= ME_EPZS) |
1164 fast_halfpel_motion_search(s, &mx, &my, dmin, rel_xmin, rel_ymin, rel_xmax, rel_ymax, | |
1165 pred_x, pred_y, ref_picture, pix_abs16x16_x2, pix_abs16x16_y2, | |
1166 pix_abs16x16_xy2, 0); | |
1167 else | |
1168 halfpel_motion_search( s, &mx, &my, dmin, rel_xmin, rel_ymin, rel_xmax, rel_ymax, | |
1169 pred_x, pred_y, ref_picture, pix_abs16x16_x2, pix_abs16x16_y2, | |
1170 pix_abs16x16_xy2, 0); | |
304 | 1171 }else{ |
455 | 1172 mx <<=1; |
1173 my <<=1; | |
0 | 1174 } |
455 | 1175 if((s->flags&CODEC_FLAG_4MV) |
1176 && !s->skip_me && varc>50 && vard>10){ | |
1177 mv4_search(s, rel_xmin, rel_ymin, rel_xmax, rel_ymax, mx, my, shift); | |
1178 mb_type|=MB_TYPE_INTER4V; | |
1179 | |
1180 set_p_mv_tables(s, mx, my, 0); | |
1181 }else | |
1182 set_p_mv_tables(s, mx, my, 1); | |
294 | 1183 }else{ |
1184 if (vard <= 64 || vard < varc) { | |
608 | 1185 s->scene_change_score+= ff_sqrt(vard) - ff_sqrt(varc); |
294 | 1186 mb_type|= MB_TYPE_INTER; |
320
cda7d0857baf
- ME setting moved to AVCodecContext/MpegEncContext, no longer a global.
pulento
parents:
304
diff
changeset
|
1187 if (s->me_method != ME_ZERO) { |
455 | 1188 if(s->me_method >= ME_EPZS) |
1189 dmin= fast_halfpel_motion_search(s, &mx, &my, dmin, rel_xmin, rel_ymin, rel_xmax, rel_ymax, | |
1190 pred_x, pred_y, ref_picture, pix_abs16x16_x2, pix_abs16x16_y2, | |
1191 pix_abs16x16_xy2, 0); | |
1192 else | |
1193 dmin= halfpel_motion_search(s, &mx, &my, dmin, rel_xmin, rel_ymin, rel_xmax, rel_ymax, | |
1194 pred_x, pred_y, ref_picture, pix_abs16x16_x2, pix_abs16x16_y2, | |
1195 pix_abs16x16_xy2, 0); | |
1196 if((s->flags&CODEC_FLAG_4MV) | |
1197 && !s->skip_me && varc>50 && vard>10){ | |
1198 int dmin4= mv4_search(s, rel_xmin, rel_ymin, rel_xmax, rel_ymax, mx, my, shift); | |
1199 if(dmin4 + 128 <dmin) | |
1200 mb_type= MB_TYPE_INTER4V; | |
1201 } | |
1202 set_p_mv_tables(s, mx, my, mb_type!=MB_TYPE_INTER4V); | |
1203 | |
294 | 1204 } else { |
455 | 1205 mx <<=1; |
1206 my <<=1; | |
294 | 1207 } |
320
cda7d0857baf
- ME setting moved to AVCodecContext/MpegEncContext, no longer a global.
pulento
parents:
304
diff
changeset
|
1208 #if 0 |
cda7d0857baf
- ME setting moved to AVCodecContext/MpegEncContext, no longer a global.
pulento
parents:
304
diff
changeset
|
1209 if (vard < 10) { |
cda7d0857baf
- ME setting moved to AVCodecContext/MpegEncContext, no longer a global.
pulento
parents:
304
diff
changeset
|
1210 skip++; |
cda7d0857baf
- ME setting moved to AVCodecContext/MpegEncContext, no longer a global.
pulento
parents:
304
diff
changeset
|
1211 fprintf(stderr,"\nEarly skip: %d vard: %2d varc: %5d dmin: %d", |
cda7d0857baf
- ME setting moved to AVCodecContext/MpegEncContext, no longer a global.
pulento
parents:
304
diff
changeset
|
1212 skip, vard, varc, dmin); |
cda7d0857baf
- ME setting moved to AVCodecContext/MpegEncContext, no longer a global.
pulento
parents:
304
diff
changeset
|
1213 } |
cda7d0857baf
- ME setting moved to AVCodecContext/MpegEncContext, no longer a global.
pulento
parents:
304
diff
changeset
|
1214 #endif |
294 | 1215 }else{ |
608 | 1216 s->scene_change_score+= 20; |
294 | 1217 mb_type|= MB_TYPE_INTRA; |
455 | 1218 mx = 0; |
1219 my = 0; | |
294 | 1220 } |
1221 } | |
284 | 1222 |
294 | 1223 s->mb_type[mb_y*s->mb_width + mb_x]= mb_type; |
0 | 1224 } |
1225 | |
327 | 1226 int ff_estimate_motion_b(MpegEncContext * s, |
324 | 1227 int mb_x, int mb_y, int16_t (*mv_table)[2], uint8_t *ref_picture, int f_code) |
0 | 1228 { |
327 | 1229 int mx, my, range, dmin; |
324 | 1230 int xmin, ymin, xmax, ymax; |
1231 int rel_xmin, rel_ymin, rel_xmax, rel_ymax; | |
1232 int pred_x=0, pred_y=0; | |
455 | 1233 int P[10][2]; |
324 | 1234 const int shift= 1+s->quarter_sample; |
1235 const int mot_stride = s->mb_width + 2; | |
1236 const int mot_xy = (mb_y + 1)*mot_stride + mb_x + 1; | |
1237 | |
1238 get_limits(s, &range, &xmin, &ymin, &xmax, &ymax, f_code); | |
455 | 1239 rel_xmin= xmin - mb_x*16; |
1240 rel_xmax= xmax - mb_x*16; | |
1241 rel_ymin= ymin - mb_y*16; | |
1242 rel_ymax= ymax - mb_y*16; | |
324 | 1243 |
1244 switch(s->me_method) { | |
1245 case ME_ZERO: | |
1246 default: | |
1247 no_motion_search(s, &mx, &my); | |
1248 dmin = 0; | |
455 | 1249 mx-= mb_x*16; |
1250 my-= mb_y*16; | |
324 | 1251 break; |
1252 case ME_FULL: | |
1253 dmin = full_motion_search(s, &mx, &my, range, xmin, ymin, xmax, ymax, ref_picture); | |
455 | 1254 mx-= mb_x*16; |
1255 my-= mb_y*16; | |
324 | 1256 break; |
1257 case ME_LOG: | |
1258 dmin = log_motion_search(s, &mx, &my, range / 2, xmin, ymin, xmax, ymax, ref_picture); | |
455 | 1259 mx-= mb_x*16; |
1260 my-= mb_y*16; | |
324 | 1261 break; |
1262 case ME_PHODS: | |
1263 dmin = phods_motion_search(s, &mx, &my, range / 2, xmin, ymin, xmax, ymax, ref_picture); | |
455 | 1264 mx-= mb_x*16; |
1265 my-= mb_y*16; | |
324 | 1266 break; |
1267 case ME_X1: | |
1268 case ME_EPZS: | |
1269 { | |
0 | 1270 |
455 | 1271 P_LAST[0] = mv_table[mot_xy ][0]; |
1272 P_LAST[1] = mv_table[mot_xy ][1]; | |
1273 P_LEFT[0] = mv_table[mot_xy - 1][0]; | |
1274 P_LEFT[1] = mv_table[mot_xy - 1][1]; | |
1275 P_LAST_RIGHT[0] = mv_table[mot_xy + 1][0]; | |
1276 P_LAST_RIGHT[1] = mv_table[mot_xy + 1][1]; | |
1277 P_LAST_BOTTOM[0] = mv_table[mot_xy + mot_stride][0]; | |
1278 P_LAST_BOTTOM[1] = mv_table[mot_xy + mot_stride][1]; | |
324 | 1279 |
455 | 1280 if(P_LEFT[0] > (rel_xmax<<shift)) P_LEFT[0] = (rel_xmax<<shift); |
1281 if(P_LAST_RIGHT[0] < (rel_xmin<<shift)) P_LAST_RIGHT[0] = (rel_xmin<<shift); | |
1282 if(P_LAST_BOTTOM[1]< (rel_ymin<<shift)) P_LAST_BOTTOM[1]= (rel_ymin<<shift); | |
324 | 1283 |
1284 /* special case for first line */ | |
455 | 1285 if ((mb_y == 0 || s->first_slice_line)) { |
324 | 1286 } else { |
455 | 1287 P_TOP[0] = mv_table[mot_xy - mot_stride ][0]; |
1288 P_TOP[1] = mv_table[mot_xy - mot_stride ][1]; | |
1289 P_TOPRIGHT[0] = mv_table[mot_xy - mot_stride + 1 ][0]; | |
1290 P_TOPRIGHT[1] = mv_table[mot_xy - mot_stride + 1 ][1]; | |
1291 if(P_TOP[1] > (rel_ymax<<shift)) P_TOP[1]= (rel_ymax<<shift); | |
1292 if(P_TOPRIGHT[0] < (rel_xmin<<shift)) P_TOPRIGHT[0]= (rel_xmin<<shift); | |
1293 if(P_TOPRIGHT[1] > (rel_ymax<<shift)) P_TOPRIGHT[1]= (rel_ymax<<shift); | |
324 | 1294 |
455 | 1295 P_MEDIAN[0]= mid_pred(P_LEFT[0], P_TOP[0], P_TOPRIGHT[0]); |
1296 P_MEDIAN[1]= mid_pred(P_LEFT[1], P_TOP[1], P_TOPRIGHT[1]); | |
324 | 1297 } |
455 | 1298 pred_x= P_LEFT[0]; |
1299 pred_y= P_LEFT[1]; | |
324 | 1300 } |
1301 dmin = epzs_motion_search(s, &mx, &my, P, pred_x, pred_y, rel_xmin, rel_ymin, rel_xmax, rel_ymax, ref_picture); | |
1302 | |
1303 break; | |
1304 } | |
1305 | |
455 | 1306 dmin= fast_halfpel_motion_search(s, &mx, &my, dmin, rel_xmin, rel_ymin, rel_xmax, rel_ymax, |
1307 pred_x, pred_y, ref_picture, pix_abs16x16_x2, pix_abs16x16_y2, | |
1308 pix_abs16x16_xy2, 0); | |
1309 //printf("%d %d %d %d//", s->mb_x, s->mb_y, mx, my); | |
324 | 1310 // s->mb_type[mb_y*s->mb_width + mb_x]= mb_type; |
1311 mv_table[mot_xy][0]= mx; | |
1312 mv_table[mot_xy][1]= my; | |
327 | 1313 return dmin; |
324 | 1314 } |
1315 | |
1316 | |
327 | 1317 static inline int check_bidir_mv(MpegEncContext * s, |
1318 int mb_x, int mb_y, | |
1319 int motion_fx, int motion_fy, | |
1320 int motion_bx, int motion_by, | |
1321 int pred_fx, int pred_fy, | |
1322 int pred_bx, int pred_by) | |
1323 { | |
1324 //FIXME optimize? | |
455 | 1325 //FIXME direct mode penalty |
327 | 1326 UINT16 *mv_penalty= s->mv_penalty[s->f_code] + MAX_MV; // f_code of the prev frame |
1327 uint8_t *dest_y = s->me_scratchpad; | |
1328 uint8_t *ptr; | |
1329 int dxy; | |
1330 int src_x, src_y; | |
1331 int fbmin; | |
1332 | |
1333 fbmin = (mv_penalty[motion_fx-pred_fx] + mv_penalty[motion_fy-pred_fy])*s->qscale; | |
1334 | |
1335 dxy = ((motion_fy & 1) << 1) | (motion_fx & 1); | |
1336 src_x = mb_x * 16 + (motion_fx >> 1); | |
1337 src_y = mb_y * 16 + (motion_fy >> 1); | |
765 | 1338 src_x = clip(src_x, -16, s->width); |
1339 if (src_x == s->width) | |
1340 dxy&= 2; | |
1341 src_y = clip(src_y, -16, s->height); | |
1342 if (src_y == s->height) | |
1343 dxy&= 1; | |
1344 | |
327 | 1345 ptr = s->last_picture[0] + (src_y * s->linesize) + src_x; |
651 | 1346 put_pixels_tab[0][dxy](dest_y , ptr , s->linesize, 16); |
327 | 1347 |
1348 fbmin += (mv_penalty[motion_bx-pred_bx] + mv_penalty[motion_by-pred_by])*s->qscale; | |
1349 | |
1350 dxy = ((motion_by & 1) << 1) | (motion_bx & 1); | |
1351 src_x = mb_x * 16 + (motion_bx >> 1); | |
1352 src_y = mb_y * 16 + (motion_by >> 1); | |
765 | 1353 src_x = clip(src_x, -16, s->width); |
1354 if (src_x == s->width) | |
1355 dxy&= 2; | |
1356 src_y = clip(src_y, -16, s->height); | |
1357 if (src_y == s->height) | |
1358 dxy&= 1; | |
327 | 1359 |
1360 ptr = s->next_picture[0] + (src_y * s->linesize) + src_x; | |
651 | 1361 avg_pixels_tab[0][dxy](dest_y , ptr , s->linesize, 16); |
327 | 1362 |
1363 fbmin += pix_abs16x16(s->new_picture[0] + mb_x*16 + mb_y*16*s->linesize, dest_y, s->linesize); | |
1364 return fbmin; | |
1365 } | |
1366 | |
1367 /* refine the bidir vectors in hq mode and return the score in both lq & hq mode*/ | |
1368 static inline int bidir_refine(MpegEncContext * s, | |
1369 int mb_x, int mb_y) | |
1370 { | |
1371 const int mot_stride = s->mb_width + 2; | |
1372 const int xy = (mb_y + 1)*mot_stride + mb_x + 1; | |
1373 int fbmin; | |
1374 int pred_fx= s->b_bidir_forw_mv_table[xy-1][0]; | |
1375 int pred_fy= s->b_bidir_forw_mv_table[xy-1][1]; | |
1376 int pred_bx= s->b_bidir_back_mv_table[xy-1][0]; | |
1377 int pred_by= s->b_bidir_back_mv_table[xy-1][1]; | |
1378 int motion_fx= s->b_bidir_forw_mv_table[xy][0]= s->b_forw_mv_table[xy][0]; | |
1379 int motion_fy= s->b_bidir_forw_mv_table[xy][1]= s->b_forw_mv_table[xy][1]; | |
1380 int motion_bx= s->b_bidir_back_mv_table[xy][0]= s->b_back_mv_table[xy][0]; | |
1381 int motion_by= s->b_bidir_back_mv_table[xy][1]= s->b_back_mv_table[xy][1]; | |
1382 | |
1383 //FIXME do refinement and add flag | |
1384 | |
1385 fbmin= check_bidir_mv(s, mb_x, mb_y, | |
1386 motion_fx, motion_fy, | |
1387 motion_bx, motion_by, | |
1388 pred_fx, pred_fy, | |
1389 pred_bx, pred_by); | |
1390 | |
1391 return fbmin; | |
1392 } | |
1393 | |
1394 static inline int direct_search(MpegEncContext * s, | |
1395 int mb_x, int mb_y) | |
324 | 1396 { |
455 | 1397 int P[10][2]; |
327 | 1398 const int mot_stride = s->mb_width + 2; |
1399 const int mot_xy = (mb_y + 1)*mot_stride + mb_x + 1; | |
1400 int dmin, dmin2; | |
1401 int motion_fx, motion_fy, motion_bx, motion_by, motion_bx0, motion_by0; | |
1402 int motion_dx, motion_dy; | |
1403 const int motion_px= s->p_mv_table[mot_xy][0]; | |
1404 const int motion_py= s->p_mv_table[mot_xy][1]; | |
1405 const int time_pp= s->pp_time; | |
664 | 1406 const int time_pb= s->pb_time; |
1407 const int time_bp= time_pp - time_pb; | |
327 | 1408 int bx, by; |
1409 int mx, my, mx2, my2; | |
587
4d41fe7eb780
b frame direct mode bugfix (bug found by CM <chenm001 at 163 dot com>)
michaelni
parents:
502
diff
changeset
|
1410 uint8_t *ref_picture= s->me_scratchpad - (mb_x - 1 + (mb_y - 1)*s->linesize)*16; |
327 | 1411 int16_t (*mv_table)[2]= s->b_direct_mv_table; |
620
a5aa53b6e648
warning patch by (Dominik Mierzejewski <dominik at rangers dot eu dot org>)
michaelni
parents:
612
diff
changeset
|
1412 /* uint16_t *mv_penalty= s->mv_penalty[s->f_code] + MAX_MV; */ // f_code of the prev frame |
324 | 1413 |
327 | 1414 /* thanks to iso-mpeg the rounding is different for the zero vector, so we need to handle that ... */ |
1415 motion_fx= (motion_px*time_pb)/time_pp; | |
1416 motion_fy= (motion_py*time_pb)/time_pp; | |
1417 motion_bx0= (-motion_px*time_bp)/time_pp; | |
1418 motion_by0= (-motion_py*time_bp)/time_pp; | |
1419 motion_dx= motion_dy=0; | |
1420 dmin2= check_bidir_mv(s, mb_x, mb_y, | |
1421 motion_fx, motion_fy, | |
1422 motion_bx0, motion_by0, | |
1423 motion_fx, motion_fy, | |
1424 motion_bx0, motion_by0) - s->qscale; | |
1425 | |
1426 motion_bx= motion_fx - motion_px; | |
1427 motion_by= motion_fy - motion_py; | |
1428 for(by=-1; by<2; by++){ | |
1429 for(bx=-1; bx<2; bx++){ | |
1430 uint8_t *dest_y = s->me_scratchpad + (by+1)*s->linesize*16 + (bx+1)*16; | |
1431 uint8_t *ptr; | |
1432 int dxy; | |
1433 int src_x, src_y; | |
1434 const int width= s->width; | |
1435 const int height= s->height; | |
1436 | |
1437 dxy = ((motion_fy & 1) << 1) | (motion_fx & 1); | |
1438 src_x = (mb_x + bx) * 16 + (motion_fx >> 1); | |
1439 src_y = (mb_y + by) * 16 + (motion_fy >> 1); | |
1440 src_x = clip(src_x, -16, width); | |
1441 if (src_x == width) dxy &= ~1; | |
1442 src_y = clip(src_y, -16, height); | |
1443 if (src_y == height) dxy &= ~2; | |
1444 | |
1445 ptr = s->last_picture[0] + (src_y * s->linesize) + src_x; | |
651 | 1446 put_pixels_tab[0][dxy](dest_y , ptr , s->linesize, 16); |
327 | 1447 |
1448 dxy = ((motion_by & 1) << 1) | (motion_bx & 1); | |
1449 src_x = (mb_x + bx) * 16 + (motion_bx >> 1); | |
1450 src_y = (mb_y + by) * 16 + (motion_by >> 1); | |
1451 src_x = clip(src_x, -16, width); | |
1452 if (src_x == width) dxy &= ~1; | |
1453 src_y = clip(src_y, -16, height); | |
1454 if (src_y == height) dxy &= ~2; | |
1455 | |
651 | 1456 avg_pixels_tab[0][dxy](dest_y , ptr , s->linesize, 16); |
327 | 1457 } |
1458 } | |
1459 | |
455 | 1460 P_LAST[0] = mv_table[mot_xy ][0]; |
1461 P_LAST[1] = mv_table[mot_xy ][1]; | |
1462 P_LEFT[0] = mv_table[mot_xy - 1][0]; | |
1463 P_LEFT[1] = mv_table[mot_xy - 1][1]; | |
1464 P_LAST_RIGHT[0] = mv_table[mot_xy + 1][0]; | |
1465 P_LAST_RIGHT[1] = mv_table[mot_xy + 1][1]; | |
1466 P_LAST_BOTTOM[0] = mv_table[mot_xy + mot_stride][0]; | |
1467 P_LAST_BOTTOM[1] = mv_table[mot_xy + mot_stride][1]; | |
1468 /* | |
1469 if(P_LEFT[0] > (rel_xmax<<shift)) P_LEFT[0] = (rel_xmax<<shift); | |
1470 if(P_LAST_RIGHT[0] < (rel_xmin<<shift)) P_LAST_RIGHT[0] = (rel_xmin<<shift); | |
1471 if(P_LAST_BOTTOM[1]< (rel_ymin<<shift)) P_LAST_BOTTOM[1]= (rel_ymin<<shift); | |
1472 */ | |
327 | 1473 /* special case for first line */ |
455 | 1474 if ((mb_y == 0 || s->first_slice_line)) { |
327 | 1475 } else { |
455 | 1476 P_TOP[0] = mv_table[mot_xy - mot_stride ][0]; |
1477 P_TOP[1] = mv_table[mot_xy - mot_stride ][1]; | |
1478 P_TOPRIGHT[0] = mv_table[mot_xy - mot_stride + 1 ][0]; | |
1479 P_TOPRIGHT[1] = mv_table[mot_xy - mot_stride + 1 ][1]; | |
327 | 1480 |
455 | 1481 P_MEDIAN[0]= mid_pred(P_LEFT[0], P_TOP[0], P_TOPRIGHT[0]); |
1482 P_MEDIAN[1]= mid_pred(P_LEFT[1], P_TOP[1], P_TOPRIGHT[1]); | |
327 | 1483 } |
1484 dmin = epzs_motion_search(s, &mx, &my, P, 0, 0, -16, -16, 15, 15, ref_picture); | |
1485 if(mx==0 && my==0) dmin=99999999; // not representable, due to rounding stuff | |
1486 if(dmin2<dmin){ | |
1487 dmin= dmin2; | |
1488 mx=0; | |
1489 my=0; | |
1490 } | |
1491 #if 1 | |
1492 mx2= mx= mx*2; | |
1493 my2= my= my*2; | |
1494 for(by=-1; by<2; by++){ | |
1495 if(my2+by < -32) continue; | |
1496 for(bx=-1; bx<2; bx++){ | |
1497 if(bx==0 && by==0) continue; | |
1498 if(mx2+bx < -32) continue; | |
1499 dmin2= check_bidir_mv(s, mb_x, mb_y, | |
1500 mx2+bx+motion_fx, my2+by+motion_fy, | |
1501 mx2+bx+motion_bx, my2+by+motion_by, | |
1502 mx2+bx+motion_fx, my2+by+motion_fy, | |
1503 motion_bx, motion_by) - s->qscale; | |
1504 | |
1505 if(dmin2<dmin){ | |
1506 dmin=dmin2; | |
1507 mx= mx2 + bx; | |
1508 my= my2 + by; | |
1509 } | |
1510 } | |
1511 } | |
1512 #else | |
1513 mx*=2; my*=2; | |
1514 #endif | |
1515 if(mx==0 && my==0){ | |
1516 motion_bx= motion_bx0; | |
1517 motion_by= motion_by0; | |
1518 } | |
1519 | |
1520 s->b_direct_mv_table[mot_xy][0]= mx; | |
1521 s->b_direct_mv_table[mot_xy][1]= my; | |
1522 s->b_direct_forw_mv_table[mot_xy][0]= motion_fx + mx; | |
1523 s->b_direct_forw_mv_table[mot_xy][1]= motion_fy + my; | |
1524 s->b_direct_back_mv_table[mot_xy][0]= motion_bx + mx; | |
1525 s->b_direct_back_mv_table[mot_xy][1]= motion_by + my; | |
1526 return dmin; | |
324 | 1527 } |
1528 | |
1529 void ff_estimate_b_frame_motion(MpegEncContext * s, | |
1530 int mb_x, int mb_y) | |
1531 { | |
327 | 1532 const int quant= s->qscale; |
1533 int fmin, bmin, dmin, fbmin; | |
1534 int type=0; | |
1535 | |
1536 dmin= direct_search(s, mb_x, mb_y); | |
324 | 1537 |
327 | 1538 fmin= ff_estimate_motion_b(s, mb_x, mb_y, s->b_forw_mv_table, s->last_picture[0], s->f_code); |
1539 bmin= ff_estimate_motion_b(s, mb_x, mb_y, s->b_back_mv_table, s->next_picture[0], s->b_code) - quant; | |
324 | 1540 //printf(" %d %d ", s->b_forw_mv_table[xy][0], s->b_forw_mv_table[xy][1]); |
327 | 1541 |
1542 fbmin= bidir_refine(s, mb_x, mb_y); | |
1543 | |
612 | 1544 { |
327 | 1545 int score= dmin; |
1546 type=MB_TYPE_DIRECT; | |
1547 | |
1548 if(fmin<score){ | |
1549 score=fmin; | |
1550 type= MB_TYPE_FORWARD; | |
1551 } | |
1552 if(bmin<score){ | |
1553 score=bmin; | |
1554 type= MB_TYPE_BACKWARD; | |
1555 } | |
1556 if(fbmin<score){ | |
1557 score=fbmin; | |
1558 type= MB_TYPE_BIDIR; | |
1559 } | |
807
0e1d375c537f
fixing q>0.0 assert failure caused by overflow of variance for b frames
michaelni
parents:
765
diff
changeset
|
1560 score= ((unsigned)(score*score + 128*256))>>16; |
455 | 1561 s->mc_mb_var_sum += score; |
612 | 1562 s->mc_mb_var[mb_y*s->mb_width + mb_x] = score; //FIXME use SSD |
327 | 1563 } |
612 | 1564 |
1565 if(s->flags&CODEC_FLAG_HQ){ | |
1566 type= MB_TYPE_FORWARD | MB_TYPE_BACKWARD | MB_TYPE_BIDIR | MB_TYPE_DIRECT; //FIXME something smarter | |
1567 } | |
1568 | |
455 | 1569 /* |
1570 { | |
1571 static int count=0; | |
1572 static int sum=0; | |
1573 if(type==MB_TYPE_DIRECT){ | |
1574 int diff= ABS(s->b_forw_mv_table) | |
1575 } | |
1576 }*/ | |
327 | 1577 |
1578 s->mb_type[mb_y*s->mb_width + mb_x]= type; | |
455 | 1579 /* if(mb_y==0 && mb_x==0) printf("\n"); |
1580 if(mb_x==0) printf("\n"); | |
1581 printf("%d", av_log2(type)); | |
1582 */ | |
324 | 1583 } |
0 | 1584 |
324 | 1585 /* find best f_code for ME which do unlimited searches */ |
1586 int ff_get_best_fcode(MpegEncContext * s, int16_t (*mv_table)[2], int type) | |
1587 { | |
1588 if(s->me_method>=ME_EPZS){ | |
455 | 1589 int score[8]; |
324 | 1590 int i, y; |
1591 UINT8 * fcode_tab= s->fcode_tab; | |
455 | 1592 int best_fcode=-1; |
1593 int best_score=-10000000; | |
324 | 1594 |
455 | 1595 for(i=0; i<8; i++) score[i]= s->mb_num*(8-i); //FIXME *2 and all other too so its the same but nicer |
324 | 1596 |
1597 for(y=0; y<s->mb_height; y++){ | |
1598 int x; | |
1599 int xy= (y+1)* (s->mb_width+2) + 1; | |
1600 i= y*s->mb_width; | |
1601 for(x=0; x<s->mb_width; x++){ | |
1602 if(s->mb_type[i] & type){ | |
455 | 1603 int fcode= MAX(fcode_tab[mv_table[xy][0] + MAX_MV], |
1604 fcode_tab[mv_table[xy][1] + MAX_MV]); | |
1605 int j; | |
1606 | |
1607 for(j=0; j<fcode && j<8; j++){ | |
1608 if(s->pict_type==B_TYPE || s->mc_mb_var[i] < s->mb_var[i]) | |
1609 score[j]-= 170; | |
1610 } | |
324 | 1611 } |
1612 i++; | |
1613 xy++; | |
1614 } | |
1615 } | |
455 | 1616 |
1617 for(i=1; i<8; i++){ | |
1618 if(score[i] > best_score){ | |
1619 best_score= score[i]; | |
1620 best_fcode= i; | |
1621 } | |
1622 // printf("%d %d\n", i, score[i]); | |
1623 } | |
327 | 1624 |
324 | 1625 // printf("fcode: %d type: %d\n", i, s->pict_type); |
455 | 1626 return best_fcode; |
324 | 1627 /* for(i=0; i<=MAX_FCODE; i++){ |
1628 printf("%d ", mv_num[i]); | |
1629 } | |
1630 printf("\n");*/ | |
1631 }else{ | |
1632 return 1; | |
0 | 1633 } |
1634 } | |
1635 | |
324 | 1636 void ff_fix_long_p_mvs(MpegEncContext * s) |
1637 { | |
1638 const int f_code= s->f_code; | |
1639 int y; | |
1640 UINT8 * fcode_tab= s->fcode_tab; | |
455 | 1641 //int clip=0; |
1642 //int noclip=0; | |
324 | 1643 /* clip / convert to intra 16x16 type MVs */ |
1644 for(y=0; y<s->mb_height; y++){ | |
1645 int x; | |
1646 int xy= (y+1)* (s->mb_width+2)+1; | |
1647 int i= y*s->mb_width; | |
1648 for(x=0; x<s->mb_width; x++){ | |
1649 if(s->mb_type[i]&MB_TYPE_INTER){ | |
1650 if( fcode_tab[s->p_mv_table[xy][0] + MAX_MV] > f_code | |
1651 || fcode_tab[s->p_mv_table[xy][0] + MAX_MV] == 0 | |
1652 || fcode_tab[s->p_mv_table[xy][1] + MAX_MV] > f_code | |
1653 || fcode_tab[s->p_mv_table[xy][1] + MAX_MV] == 0 ){ | |
1654 s->mb_type[i] &= ~MB_TYPE_INTER; | |
1655 s->mb_type[i] |= MB_TYPE_INTRA; | |
1656 s->p_mv_table[xy][0] = 0; | |
1657 s->p_mv_table[xy][1] = 0; | |
455 | 1658 //clip++; |
324 | 1659 } |
455 | 1660 //else |
1661 // noclip++; | |
324 | 1662 } |
1663 xy++; | |
1664 i++; | |
1665 } | |
1666 } | |
455 | 1667 //printf("%d no:%d %d//\n", clip, noclip, f_code); |
324 | 1668 if(s->flags&CODEC_FLAG_4MV){ |
1669 const int wrap= 2+ s->mb_width*2; | |
1670 | |
1671 /* clip / convert to intra 8x8 type MVs */ | |
1672 for(y=0; y<s->mb_height; y++){ | |
1673 int xy= (y*2 + 1)*wrap + 1; | |
1674 int i= y*s->mb_width; | |
1675 int x; | |
1676 | |
1677 for(x=0; x<s->mb_width; x++){ | |
1678 if(s->mb_type[i]&MB_TYPE_INTER4V){ | |
1679 int block; | |
1680 for(block=0; block<4; block++){ | |
1681 int off= (block& 1) + (block>>1)*wrap; | |
1682 int mx= s->motion_val[ xy + off ][0]; | |
1683 int my= s->motion_val[ xy + off ][1]; | |
1684 | |
1685 if( fcode_tab[mx + MAX_MV] > f_code | |
1686 || fcode_tab[mx + MAX_MV] == 0 | |
1687 || fcode_tab[my + MAX_MV] > f_code | |
1688 || fcode_tab[my + MAX_MV] == 0 ){ | |
1689 s->mb_type[i] &= ~MB_TYPE_INTER4V; | |
1690 s->mb_type[i] |= MB_TYPE_INTRA; | |
1691 } | |
1692 } | |
1693 } | |
502 | 1694 xy+=2; |
1695 i++; | |
324 | 1696 } |
1697 } | |
1698 } | |
1699 } | |
1700 | |
1701 void ff_fix_long_b_mvs(MpegEncContext * s, int16_t (*mv_table)[2], int f_code, int type) | |
1702 { | |
1703 int y; | |
1704 UINT8 * fcode_tab= s->fcode_tab; | |
1705 | |
1706 /* clip / convert to intra 16x16 type MVs */ | |
1707 for(y=0; y<s->mb_height; y++){ | |
1708 int x; | |
1709 int xy= (y+1)* (s->mb_width+2)+1; | |
1710 int i= y*s->mb_width; | |
1711 for(x=0; x<s->mb_width; x++){ | |
691
199b324b2693
fixing variance scaling for b frames (messed adaptive quants up)
michaelni
parents:
690
diff
changeset
|
1712 if( fcode_tab[mv_table[xy][0] + MAX_MV] > f_code |
199b324b2693
fixing variance scaling for b frames (messed adaptive quants up)
michaelni
parents:
690
diff
changeset
|
1713 || fcode_tab[mv_table[xy][0] + MAX_MV] == 0){ |
199b324b2693
fixing variance scaling for b frames (messed adaptive quants up)
michaelni
parents:
690
diff
changeset
|
1714 if(mv_table[xy][0]>0) mv_table[xy][0]= (16<<f_code)-1; |
199b324b2693
fixing variance scaling for b frames (messed adaptive quants up)
michaelni
parents:
690
diff
changeset
|
1715 else mv_table[xy][0]= -(16<<f_code); |
199b324b2693
fixing variance scaling for b frames (messed adaptive quants up)
michaelni
parents:
690
diff
changeset
|
1716 } |
199b324b2693
fixing variance scaling for b frames (messed adaptive quants up)
michaelni
parents:
690
diff
changeset
|
1717 if( fcode_tab[mv_table[xy][1] + MAX_MV] > f_code |
199b324b2693
fixing variance scaling for b frames (messed adaptive quants up)
michaelni
parents:
690
diff
changeset
|
1718 || fcode_tab[mv_table[xy][1] + MAX_MV] == 0){ |
199b324b2693
fixing variance scaling for b frames (messed adaptive quants up)
michaelni
parents:
690
diff
changeset
|
1719 if(mv_table[xy][1]>0) mv_table[xy][1]= (16<<f_code)-1; |
199b324b2693
fixing variance scaling for b frames (messed adaptive quants up)
michaelni
parents:
690
diff
changeset
|
1720 else mv_table[xy][1]= -(16<<f_code); |
324 | 1721 } |
1722 xy++; | |
1723 i++; | |
1724 } | |
1725 } | |
1726 } |