[svn] / branches / dev-api-3 / xvidcore / src / motion / motion_est.c Repository:
ViewVC logotype

Annotation of /branches/dev-api-3/xvidcore/src/motion/motion_est.c

Parent Directory Parent Directory | Revision Log Revision Log


Revision 539 - (view) (download)

1 : Isibaar 3 /**************************************************************************
2 :     *
3 : chl 259 * XVID MPEG-4 VIDEO CODEC
4 :     * motion estimation
5 :     *
6 :     * This program is an implementation of a part of one or more MPEG-4
7 :     * Video tools as specified in ISO/IEC 14496-2 standard. Those intending
8 :     * to use this software module in hardware or software products are
9 :     * advised that its use may infringe existing patents or copyrights, and
10 :     * any such use would be at such party's own risk. The original
11 :     * developer of this software module and his/her company, and subsequent
12 :     * editors and their companies, will have no liability for use of this
13 :     * software or modifications or derivatives thereof.
14 :     *
15 :     * This program is free software; you can redistribute it and/or modify
16 :     * it under the terms of the GNU General Public License as published by
17 :     * the Free Software Foundation; either version 2 of the License, or
18 :     * (at your option) any later version.
19 :     *
20 :     * This program is distributed in the hope that it will be useful,
21 :     * but WITHOUT ANY WARRANTY; without even the implied warranty of
22 :     * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
23 :     * GNU General Public License for more details.
24 :     *
25 :     * You should have received a copy of the GNU General Public License
26 :     * along with this program; if not, write to the Free Software
27 :     * Foundation, Inc., 675 Mass Ave, Cambridge, MA 02139, USA.
28 :     *
29 :     *************************************************************************/
30 :    
31 : Isibaar 3 #include <assert.h>
32 :     #include <stdio.h>
33 : chl 96 #include <stdlib.h>
34 : Isibaar 3
35 :     #include "../encoder.h"
36 :     #include "../utils/mbfunctions.h"
37 :     #include "../prediction/mbprediction.h"
38 :     #include "../global.h"
39 :     #include "../utils/timer.h"
40 : chl 530 #include "motion_est.h"
41 : suxen_drol 118 #include "motion.h"
42 : Isibaar 3 #include "sad.h"
43 : Isibaar 539 #include "../utils/emms.h"
44 : Isibaar 3
45 : chl 530 #define INITIAL_SKIP_THRESH (10)
46 :     #define FINAL_SKIP_THRESH (50)
47 :     #define MAX_SAD00_FOR_SKIP (20)
48 : Isibaar 539 #define MAX_CHROMA_SAD_FOR_SKIP (22)
49 :     #define SKIP_THRESH_B (25)
50 : Isibaar 3
51 : chl 530 #define CHECK_CANDIDATE(X,Y,D) { \
52 :     (*CheckCandidate)((const int)(X),(const int)(Y), (D), &iDirection, data ); }
53 : Isibaar 3
54 : chl 530 #define iDiamondSize 2
55 : chl 141
56 : chl 530 static __inline int
57 :     d_mv_bits(int x, int y, const uint32_t iFcode)
58 : Isibaar 3 {
59 : chl 530 int xb, yb;
60 :    
61 :     if (x == 0) xb = 1;
62 :     else {
63 :     if (x < 0) x = -x;
64 :     x += (1 << (iFcode - 1)) - 1;
65 :     x >>= (iFcode - 1);
66 :     if (x > 32) x = 32;
67 :     xb = mvtab[x] + iFcode;
68 : edgomez 195 }
69 : Isibaar 3
70 : chl 530 if (y == 0) yb = 1;
71 :     else {
72 :     if (y < 0) y = -y;
73 :     y += (1 << (iFcode - 1)) - 1;
74 :     y >>= (iFcode - 1);
75 :     if (y > 32) y = 32;
76 :     yb = mvtab[y] + iFcode;
77 :     }
78 :     return xb + yb;
79 : Isibaar 3 }
80 :    
81 :    
82 : Isibaar 539 /* CHECK_CANDIDATE FUNCTIONS START */
83 :    
84 : chl 530 static void
85 :     CheckCandidate16(const int x, const int y, const int Direction, int * const dir, const SearchData * const data)
86 : Isibaar 3 {
87 : chl 530 int32_t * const sad = data->temp;
88 :     int t;
89 :     const uint8_t * Reference;
90 : Isibaar 3
91 : chl 530 if (( x > data->max_dx) || ( x < data->min_dx)
92 :     || ( y > data->max_dy) || (y < data->min_dy)) return;
93 : suxen_drol 136
94 : chl 530 switch ( ((x&1)<<1) + (y&1) ) {
95 :     case 0 : Reference = data->Ref + x/2 + (y/2)*(data->iEdgedWidth); break;
96 :     case 1 : Reference = data->RefV + x/2 + ((y-1)/2)*(data->iEdgedWidth); break;
97 :     case 2 : Reference = data->RefH + (x-1)/2 + (y/2)*(data->iEdgedWidth); break;
98 :     default : Reference = data->RefHV + (x-1)/2 + ((y-1)/2)*(data->iEdgedWidth); break;
99 :     }
100 : chl 259
101 : chl 530 data->temp[0] = sad16v(data->Cur, Reference, data->iEdgedWidth, sad+1);
102 : Isibaar 3
103 : chl 530 t = d_mv_bits(x - data->predMV.x, y - data->predMV.y, data->iFcode);
104 :     data->temp[0] += lambda_vec16[data->iQuant] * t;
105 :     data->temp[1] += lambda_vec8[data->iQuant] * t;
106 : chl 326
107 : chl 530 if (data->temp[0] < data->iMinSAD[0]) {
108 :     data->iMinSAD[0] = data->temp[0];
109 :     data->currentMV[0].x = x; data->currentMV[0].y = y;
110 :     *dir = Direction; }
111 : chl 184
112 : chl 530 if (data->temp[1] < data->iMinSAD[1]) {
113 :     data->iMinSAD[1] = data->temp[1]; data->currentMV[1].x = x; data->currentMV[1].y = y; }
114 :     if (data->temp[2] < data->iMinSAD[2]) {
115 :     data->iMinSAD[2] = data->temp[2]; data->currentMV[2].x = x; data->currentMV[2].y = y; }
116 :     if (data->temp[3] < data->iMinSAD[3]) {
117 :     data->iMinSAD[3] = data->temp[3]; data->currentMV[3].x = x; data->currentMV[3].y = y; }
118 :     if (data->temp[4] < data->iMinSAD[4]) {
119 :     data->iMinSAD[4] = data->temp[4]; data->currentMV[4].x = x; data->currentMV[4].y = y; }
120 : chl 184
121 : Isibaar 3 }
122 :    
123 : chl 530 static void
124 :     CheckCandidate16no4v(const int x, const int y, const int Direction, int * const dir, const SearchData * const data)
125 :     {
126 :     int32_t sad;
127 :     const uint8_t * Reference;
128 : chl 326
129 : chl 530 if (( x > data->max_dx) || ( x < data->min_dx)
130 :     || ( y > data->max_dy) || (y < data->min_dy)) return;
131 : Isibaar 3
132 : chl 530 switch ( ((x&1)<<1) + (y&1) )
133 :     {
134 :     case 0 : Reference = data->Ref + x/2 + (y/2)*(data->iEdgedWidth); break;
135 :     case 1 : Reference = data->RefV + x/2 + ((y-1)/2)*(data->iEdgedWidth); break;
136 :     case 2 : Reference = data->RefH + (x-1)/2 + (y/2)*(data->iEdgedWidth); break;
137 :     default : Reference = data->RefHV + (x-1)/2 + ((y-1)/2)*(data->iEdgedWidth); break;
138 :     }
139 : Isibaar 3
140 : chl 530 sad = lambda_vec16[data->iQuant] *
141 :     d_mv_bits(x - data->predMV.x, y - data->predMV.y, data->iFcode);
142 :     sad += sad16(data->Cur, Reference, data->iEdgedWidth, 256*4096);
143 : Isibaar 3
144 : chl 530 if (sad < *(data->iMinSAD)) {
145 :     *(data->iMinSAD) = sad;
146 :     data->currentMV[0].x = x; data->currentMV[0].y = y;
147 :     *dir = Direction; }
148 : Isibaar 3 }
149 :    
150 : chl 530 static void
151 : Isibaar 539 CheckCandidate16no4vI(const int x, const int y, const int Direction, int * const dir, const SearchData * const data)
152 :     {
153 :     int32_t sad;
154 :    
155 :     if (( x > data->max_dx) || ( x < data->min_dx)
156 :     || ( y > data->max_dy) || (y < data->min_dy)) return;
157 :    
158 :     sad = lambda_vec16[data->iQuant] *
159 :     d_mv_bits(x - data->predMV.x, y - data->predMV.y, data->iFcode);
160 :    
161 :     sad += sad16(data->Cur, data->Ref + x/2 + (y/2)*(data->iEdgedWidth),
162 :     data->iEdgedWidth, 256*4096);
163 :    
164 :     if (sad < *(data->iMinSAD)) {
165 :     *(data->iMinSAD) = sad;
166 :     data->currentMV[0].x = x; data->currentMV[0].y = y;
167 :     *dir = Direction; }
168 :     }
169 :    
170 :    
171 :     static void
172 : chl 530 CheckCandidateInt(const int xf, const int yf, const int Direction, int * const dir, const SearchData * const data)
173 :     {
174 :     int32_t sad;
175 :     const int xb = data->currentMV[1].x;
176 :     const int yb = data->currentMV[1].y;
177 :     const uint8_t *ReferenceF, *ReferenceB;
178 : Isibaar 3
179 : chl 530 if (( xf > data->max_dx) || ( xf < data->min_dx)
180 :     || ( yf > data->max_dy) || (yf < data->min_dy)) return;
181 : Isibaar 3
182 : chl 530 switch ( ((xf&1)<<1) + (yf&1) ) {
183 :     case 0 : ReferenceF = data->Ref + xf/2 + (yf/2)*(data->iEdgedWidth); break;
184 :     case 1 : ReferenceF = data->RefV + xf/2 + ((yf-1)/2)*(data->iEdgedWidth); break;
185 :     case 2 : ReferenceF = data->RefH + (xf-1)/2 + (yf/2)*(data->iEdgedWidth); break;
186 :     default : ReferenceF = data->RefHV + (xf-1)/2 + ((yf-1)/2)*(data->iEdgedWidth); break;
187 :     }
188 : edgomez 195
189 : chl 530 switch ( ((xb&1)<<1) + (yb&1) ) {
190 :     case 0 : ReferenceB = data->bRef + xb/2 + (yb/2)*(data->iEdgedWidth); break;
191 :     case 1 : ReferenceB = data->bRefV + xb/2 + ((yb-1)/2)*(data->iEdgedWidth); break;
192 :     case 2 : ReferenceB = data->bRefH + (xb-1)/2 + (yb/2)*(data->iEdgedWidth); break;
193 :     default : ReferenceB = data->bRefHV + (xb-1)/2 + ((yb-1)/2)*(data->iEdgedWidth); break;
194 :     }
195 : Isibaar 3
196 : chl 530 sad = lambda_vec16[data->iQuant] *
197 :     ( d_mv_bits(xf - data->predMV.x, yf - data->predMV.y, data->iFcode) +
198 :     d_mv_bits(xb - data->bpredMV.x, yb - data->bpredMV.y, data->iFcode) );
199 : Isibaar 3
200 : chl 530 sad += sad16bi(data->Cur, ReferenceF, ReferenceB, data->iEdgedWidth);
201 : Isibaar 3
202 : chl 530 if (sad < *(data->iMinSAD)) {
203 :     *(data->iMinSAD) = sad;
204 :     data->currentMV->x = xf; data->currentMV->y = yf;
205 :     *dir = Direction; }
206 : Isibaar 3 }
207 :    
208 : chl 530 static void
209 :     CheckCandidateDirect(const int x, const int y, const int Direction, int * const dir, const SearchData * const data)
210 : Isibaar 3 {
211 : chl 530 int32_t sad;
212 :     int k;
213 :     const uint8_t *ReferenceF;
214 :     const uint8_t *ReferenceB;
215 :     VECTOR mvs, b_mvs;
216 : Isibaar 3
217 : chl 530 if (( x > 31) || ( x < -32) || ( y > 31) || (y < -32)) return;
218 : Isibaar 3
219 : chl 530 sad = lambda_vec16[data->iQuant] * d_mv_bits(x, y, 1);
220 : Isibaar 3
221 : chl 530 for (k = 0; k < 4; k++) {
222 :     mvs.x = data->directmvF[k].x + x;
223 :     b_mvs.x = ((x == 0) ?
224 :     data->directmvB[k].x
225 :     : mvs.x - data->referencemv[k].x);
226 : Isibaar 3
227 : chl 530 mvs.y = data->directmvF[k].y + y;
228 :     b_mvs.y = ((y == 0) ?
229 :     data->directmvB[k].y
230 :     : mvs.y - data->referencemv[k].y);
231 :    
232 :     if (( mvs.x > data->max_dx ) || ( mvs.x < data->min_dx )
233 :     || ( mvs.y > data->max_dy ) || ( mvs.y < data->min_dy )
234 :     || ( b_mvs.x > data->max_dx ) || ( b_mvs.x < data->min_dx )
235 :     || ( b_mvs.y > data->max_dy ) || ( b_mvs.y < data->min_dy )) return;
236 : Isibaar 3
237 : chl 530 switch ( ((mvs.x&1)<<1) + (mvs.y&1) ) {
238 :     case 0 : ReferenceF = data->Ref + mvs.x/2 + (mvs.y/2)*(data->iEdgedWidth); break;
239 :     case 1 : ReferenceF = data->RefV + mvs.x/2 + ((mvs.y-1)/2)*(data->iEdgedWidth); break;
240 :     case 2 : ReferenceF = data->RefH + (mvs.x-1)/2 + (mvs.y/2)*(data->iEdgedWidth); break;
241 :     default : ReferenceF = data->RefHV + (mvs.x-1)/2 + ((mvs.y-1)/2)*(data->iEdgedWidth); break;
242 :     }
243 : Isibaar 3
244 : chl 530 switch ( ((b_mvs.x&1)<<1) + (b_mvs.y&1) ) {
245 :     case 0 : ReferenceB = data->bRef + b_mvs.x/2 + (b_mvs.y/2)*(data->iEdgedWidth); break;
246 :     case 1 : ReferenceB = data->bRefV + b_mvs.x/2 + ((b_mvs.y-1)/2)*(data->iEdgedWidth); break;
247 :     case 2 : ReferenceB = data->bRefH + (b_mvs.x-1)/2 + (b_mvs.y/2)*(data->iEdgedWidth); break;
248 :     default : ReferenceB = data->bRefHV + (b_mvs.x-1)/2 + ((b_mvs.y-1)/2)*(data->iEdgedWidth); break;
249 : chl 344 }
250 : chl 530
251 :     sad += sad8bi(data->Cur + 8*(k&1) + 8*(k>>1)*(data->iEdgedWidth),
252 :     ReferenceF + 8*(k&1) + 8*(k>>1)*(data->iEdgedWidth),
253 :     ReferenceB + 8*(k&1) + 8*(k>>1)*(data->iEdgedWidth),
254 :     data->iEdgedWidth);
255 :     if (sad > *(data->iMinSAD)) return;
256 : edgomez 78 }
257 : chl 530
258 :     if (sad < *(data->iMinSAD)) {
259 :     *(data->iMinSAD) = sad;
260 :     data->currentMV->x = x; data->currentMV->y = y;
261 :     *dir = Direction; }
262 : Isibaar 3 }
263 :    
264 : chl 530 static void
265 :     CheckCandidateDirectno4v(const int x, const int y, const int Direction, int * const dir, const SearchData * const data)
266 : chl 96 {
267 : chl 530 int32_t sad;
268 :     const uint8_t *ReferenceF;
269 :     const uint8_t *ReferenceB;
270 :     VECTOR mvs, b_mvs;
271 : chl 96
272 : chl 530 if (( x > 31) || ( x < -31) || ( y > 31) || (y < -31)) return;
273 :    
274 :     sad = lambda_vec16[data->iQuant] * d_mv_bits(x, y, 1);
275 : edgomez 195
276 : chl 530 mvs.x = data->directmvF[0].x + x;
277 :     b_mvs.x = ((x == 0) ?
278 :     data->directmvB[0].x
279 :     : mvs.x - data->referencemv[0].x);
280 : edgomez 195
281 : chl 530 mvs.y = data->directmvF[0].y + y;
282 :     b_mvs.y = ((y == 0) ?
283 :     data->directmvB[0].y
284 :     : mvs.y - data->referencemv[0].y);
285 :    
286 :     if (( mvs.x > data->max_dx ) || ( mvs.x < data->min_dx )
287 :     || ( mvs.y > data->max_dy ) || ( mvs.y < data->min_dy )
288 :     || ( b_mvs.x > data->max_dx ) || ( b_mvs.x < data->min_dx )
289 :     || ( b_mvs.y > data->max_dy ) || ( b_mvs.y < data->min_dy )) return;
290 : chl 96
291 : chl 530 switch ( ((mvs.x&1)<<1) + (mvs.y&1) ) {
292 :     case 0 : ReferenceF = data->Ref + mvs.x/2 + (mvs.y/2)*(data->iEdgedWidth); break;
293 :     case 1 : ReferenceF = data->RefV + mvs.x/2 + ((mvs.y-1)/2)*(data->iEdgedWidth); break;
294 :     case 2 : ReferenceF = data->RefH + (mvs.x-1)/2 + (mvs.y/2)*(data->iEdgedWidth); break;
295 :     default : ReferenceF = data->RefHV + (mvs.x-1)/2 + ((mvs.y-1)/2)*(data->iEdgedWidth); break;
296 :     }
297 : chl 96
298 : chl 530 switch ( ((b_mvs.x&1)<<1) + (b_mvs.y&1) ) {
299 :     case 0 : ReferenceB = data->bRef + b_mvs.x/2 + (b_mvs.y/2)*(data->iEdgedWidth); break;
300 :     case 1 : ReferenceB = data->bRefV + b_mvs.x/2 + ((b_mvs.y-1)/2)*(data->iEdgedWidth); break;
301 :     case 2 : ReferenceB = data->bRefH + (b_mvs.x-1)/2 + (b_mvs.y/2)*(data->iEdgedWidth); break;
302 :     default : ReferenceB = data->bRefHV + (b_mvs.x-1)/2 + ((b_mvs.y-1)/2)*(data->iEdgedWidth); break;
303 :     }
304 :    
305 :     sad += sad16bi(data->Cur, ReferenceF, ReferenceB, data->iEdgedWidth);
306 : chl 96
307 : chl 530 if (sad < *(data->iMinSAD)) {
308 :     *(data->iMinSAD) = sad;
309 :     data->currentMV->x = x; data->currentMV->y = y;
310 :     *dir = Direction; }
311 :     }
312 : chl 96
313 : chl 530 static void
314 :     CheckCandidate8(const int x, const int y, const int Direction, int * const dir, const SearchData * const data)
315 :     {
316 :     int32_t sad;
317 :     const uint8_t * Reference;
318 : edgomez 195
319 : chl 530 if (( x > data->max_dx) || ( x < data->min_dx)
320 :     || ( y > data->max_dy) || (y < data->min_dy)) return;
321 : chl 96
322 : chl 530 switch ( ((x&1)<<1) + (y&1) )
323 :     {
324 :     case 0 : Reference = data->Ref + x/2 + (y/2)*(data->iEdgedWidth); break;
325 :     case 1 : Reference = data->RefV + x/2 + ((y-1)/2)*(data->iEdgedWidth); break;
326 :     case 2 : Reference = data->RefH + (x-1)/2 + (y/2)*(data->iEdgedWidth); break;
327 :     default : Reference = data->RefHV + (x-1)/2 + ((y-1)/2)*(data->iEdgedWidth); break;
328 :     }
329 : edgomez 195
330 : chl 530 sad = sad8(data->Cur, Reference, data->iEdgedWidth);
331 :     sad += lambda_vec8[data->iQuant] * d_mv_bits(x - data->predMV.x, y - data->predMV.y, data->iFcode);
332 : edgomez 195
333 : chl 530 if (sad < *(data->iMinSAD)) {
334 :     *(data->iMinSAD) = sad;
335 :     data->currentMV->x = x; data->currentMV->y = y;
336 :     *dir = Direction; }
337 : chl 96 }
338 :    
339 : Isibaar 539 /* CHECK_CANDIDATE FUNCTIONS END */
340 : chl 96
341 : chl 530 /* MAINSEARCH FUNCTIONS START */
342 : edgomez 195
343 : chl 530 static void
344 :     AdvDiamondSearch(int x, int y, const SearchData * const data, int bDirection)
345 : chl 181 {
346 :    
347 :     /* directions: 1 - left (x-1); 2 - right (x+1), 4 - up (y-1); 8 - down (y+1) */
348 :    
349 : chl 530 int iDirection;
350 : edgomez 195
351 :     do {
352 : chl 181 iDirection = 0;
353 : chl 530 if (bDirection & 1) CHECK_CANDIDATE(x - iDiamondSize, y, 1);
354 :     if (bDirection & 2) CHECK_CANDIDATE(x + iDiamondSize, y, 2);
355 :     if (bDirection & 4) CHECK_CANDIDATE(x, y - iDiamondSize, 4);
356 :     if (bDirection & 8) CHECK_CANDIDATE(x, y + iDiamondSize, 8);
357 : chl 181
358 :     /* now we're doing diagonal checks near our candidate */
359 :    
360 : chl 530 if (iDirection) { //checking if anything found
361 : chl 181 bDirection = iDirection;
362 :     iDirection = 0;
363 : chl 530 x = data->currentMV->x; y = data->currentMV->y;
364 :     if (bDirection & 3) { //our candidate is left or right
365 :     CHECK_CANDIDATE(x, y + iDiamondSize, 8);
366 :     CHECK_CANDIDATE(x, y - iDiamondSize, 4);
367 :     } else { // what remains here is up or down
368 :     CHECK_CANDIDATE(x + iDiamondSize, y, 2);
369 :     CHECK_CANDIDATE(x - iDiamondSize, y, 1); }
370 : chl 181
371 : edgomez 195 if (iDirection) {
372 :     bDirection += iDirection;
373 : chl 530 x = data->currentMV->x; y = data->currentMV->y; }
374 :     } else { //about to quit, eh? not so fast....
375 : edgomez 195 switch (bDirection) {
376 : chl 181 case 2:
377 : chl 530 CHECK_CANDIDATE(x + iDiamondSize, y - iDiamondSize, 2 + 4);
378 :     CHECK_CANDIDATE(x + iDiamondSize, y + iDiamondSize, 2 + 8);
379 : chl 181 break;
380 :     case 1:
381 : chl 530 CHECK_CANDIDATE(x - iDiamondSize, y - iDiamondSize, 1 + 4);
382 :     CHECK_CANDIDATE(x - iDiamondSize, y + iDiamondSize, 1 + 8);
383 : chl 181 break;
384 : edgomez 195 case 2 + 4:
385 : chl 530 CHECK_CANDIDATE(x - iDiamondSize, y - iDiamondSize, 1 + 4);
386 :     CHECK_CANDIDATE(x + iDiamondSize, y - iDiamondSize, 2 + 4);
387 :     CHECK_CANDIDATE(x + iDiamondSize, y + iDiamondSize, 2 + 8);
388 : chl 181 break;
389 :     case 4:
390 : chl 530 CHECK_CANDIDATE(x + iDiamondSize, y - iDiamondSize, 2 + 4);
391 :     CHECK_CANDIDATE(x - iDiamondSize, y - iDiamondSize, 1 + 4);
392 : chl 181 break;
393 :     case 8:
394 : chl 530 CHECK_CANDIDATE(x + iDiamondSize, y + iDiamondSize, 2 + 8);
395 :     CHECK_CANDIDATE(x - iDiamondSize, y + iDiamondSize, 1 + 8);
396 : chl 181 break;
397 : edgomez 195 case 1 + 4:
398 : chl 530 CHECK_CANDIDATE(x - iDiamondSize, y + iDiamondSize, 1 + 8);
399 :     CHECK_CANDIDATE(x - iDiamondSize, y - iDiamondSize, 1 + 4);
400 :     CHECK_CANDIDATE(x + iDiamondSize, y - iDiamondSize, 2 + 4);
401 : chl 181 break;
402 : edgomez 195 case 2 + 8:
403 : chl 530 CHECK_CANDIDATE(x - iDiamondSize, y - iDiamondSize, 1 + 4);
404 :     CHECK_CANDIDATE(x - iDiamondSize, y + iDiamondSize, 1 + 8);
405 :     CHECK_CANDIDATE(x + iDiamondSize, y + iDiamondSize, 2 + 8);
406 : chl 181 break;
407 : edgomez 195 case 1 + 8:
408 : chl 530 CHECK_CANDIDATE(x + iDiamondSize, y - iDiamondSize, 2 + 4);
409 :     CHECK_CANDIDATE(x + iDiamondSize, y + iDiamondSize, 2 + 8);
410 :     CHECK_CANDIDATE(x - iDiamondSize, y + iDiamondSize, 1 + 8);
411 : chl 181 break;
412 : edgomez 195 default: //1+2+4+8 == we didn't find anything at all
413 : chl 530 CHECK_CANDIDATE(x - iDiamondSize, y - iDiamondSize, 1 + 4);
414 :     CHECK_CANDIDATE(x - iDiamondSize, y + iDiamondSize, 1 + 8);
415 :     CHECK_CANDIDATE(x + iDiamondSize, y - iDiamondSize, 2 + 4);
416 :     CHECK_CANDIDATE(x + iDiamondSize, y + iDiamondSize, 2 + 8);
417 : chl 181 break;
418 :     }
419 : chl 530 if (!iDirection) break; //ok, the end. really
420 :     bDirection = iDirection;
421 :     x = data->currentMV->x; y = data->currentMV->y;
422 : chl 181 }
423 :     }
424 : edgomez 195 while (1); //forever
425 : chl 181 }
426 :    
427 : chl 530 static void
428 :     SquareSearch(int x, int y, const SearchData * const data, int bDirection)
429 : chl 326 {
430 : chl 530 int iDirection;
431 : chl 326
432 : chl 530 do {
433 :     iDirection = 0;
434 :     if (bDirection & 1) CHECK_CANDIDATE(x - iDiamondSize, y, 1+16+64);
435 :     if (bDirection & 2) CHECK_CANDIDATE(x + iDiamondSize, y, 2+32+128);
436 :     if (bDirection & 4) CHECK_CANDIDATE(x, y - iDiamondSize, 4+16+32);
437 :     if (bDirection & 8) CHECK_CANDIDATE(x, y + iDiamondSize, 8+64+128);
438 :     if (bDirection & 16) CHECK_CANDIDATE(x - iDiamondSize, y - iDiamondSize, 1+4+16+32+64);
439 :     if (bDirection & 32) CHECK_CANDIDATE(x + iDiamondSize, y - iDiamondSize, 2+4+16+32+128);
440 :     if (bDirection & 64) CHECK_CANDIDATE(x - iDiamondSize, y + iDiamondSize, 1+8+16+64+128);
441 :     if (bDirection & 128) CHECK_CANDIDATE(x + iDiamondSize, y + iDiamondSize, 2+8+32+64+128);
442 : chl 326
443 : chl 530 bDirection = iDirection;
444 :     x = data->currentMV->x; y = data->currentMV->y;
445 :     } while (iDirection);
446 : chl 346 }
447 :    
448 : chl 530 static void
449 :     DiamondSearch(int x, int y, const SearchData * const data, int bDirection)
450 : chl 346 {
451 :    
452 : chl 181 /* directions: 1 - left (x-1); 2 - right (x+1), 4 - up (y-1); 8 - down (y+1) */
453 :    
454 : chl 530 int iDirection;
455 : edgomez 195
456 :     do {
457 : chl 181 iDirection = 0;
458 : chl 530 if (bDirection & 1) CHECK_CANDIDATE(x - iDiamondSize, y, 1);
459 :     if (bDirection & 2) CHECK_CANDIDATE(x + iDiamondSize, y, 2);
460 :     if (bDirection & 4) CHECK_CANDIDATE(x, y - iDiamondSize, 4);
461 :     if (bDirection & 8) CHECK_CANDIDATE(x, y + iDiamondSize, 8);
462 : chl 181
463 :     /* now we're doing diagonal checks near our candidate */
464 :    
465 : chl 530 if (iDirection) { //checking if anything found
466 : chl 181 bDirection = iDirection;
467 :     iDirection = 0;
468 : chl 530 x = data->currentMV->x; y = data->currentMV->y;
469 :     if (bDirection & 3) { //our candidate is left or right
470 :     CHECK_CANDIDATE(x, y + iDiamondSize, 8);
471 :     CHECK_CANDIDATE(x, y - iDiamondSize, 4);
472 :     } else { // what remains here is up or down
473 :     CHECK_CANDIDATE(x + iDiamondSize, y, 2);
474 :     CHECK_CANDIDATE(x - iDiamondSize, y, 1); }
475 : chl 181
476 : chl 530 bDirection += iDirection;
477 :     x = data->currentMV->x; y = data->currentMV->y;
478 : chl 181 }
479 :     }
480 : chl 530 while (iDirection);
481 : chl 181 }
482 :    
483 : chl 530 /* MAINSEARCH FUNCTIONS END */
484 : chl 181
485 : chl 530 /* HALFPELREFINE COULD BE A MAINSEARCH FUNCTION, BUT THERE IS NO NEED FOR IT */
486 :    
487 :     static void
488 :     HalfpelRefine(const SearchData * const data)
489 : chl 96 {
490 : chl 530 /* Do a half-pel refinement (or rather a "smallest possible amount" refinement) */
491 : edgomez 195
492 : chl 530 VECTOR backupMV = *(data->currentMV);
493 :     int iDirection; //not needed
494 : chl 96
495 : chl 530 CHECK_CANDIDATE(backupMV.x - 1, backupMV.y - 1, 0);
496 :     CHECK_CANDIDATE(backupMV.x + 1, backupMV.y - 1, 0);
497 :     CHECK_CANDIDATE(backupMV.x - 1, backupMV.y + 1, 0);
498 :     CHECK_CANDIDATE(backupMV.x + 1, backupMV.y + 1, 0);
499 : edgomez 195
500 : chl 530 CHECK_CANDIDATE(backupMV.x - 1, backupMV.y, 0);
501 :     CHECK_CANDIDATE(backupMV.x + 1, backupMV.y, 0);
502 :    
503 :     CHECK_CANDIDATE(backupMV.x, backupMV.y + 1, 0);
504 :     CHECK_CANDIDATE(backupMV.x, backupMV.y - 1, 0);
505 : chl 96 }
506 :    
507 : chl 530 static __inline int
508 :     SkipDecisionP(const IMAGE * current, const IMAGE * reference,
509 :     const int x, const int y,
510 :     const uint32_t iEdgedWidth, const uint32_t iQuant)
511 : chl 96
512 : Isibaar 3 {
513 : chl 530 /* keep repeating checks for all b-frames before this P frame,
514 :     to make sure that SKIP is possible (todo)
515 :     how: if skip is not possible set sad00 to a very high value */
516 : Isibaar 3
517 : chl 530 uint32_t sadC = sad8(current->u + x*8 + y*(iEdgedWidth/2)*8,
518 :     reference->u + x*8 + y*(iEdgedWidth/2)*8, iEdgedWidth/2);
519 :     if (sadC > iQuant * MAX_CHROMA_SAD_FOR_SKIP) return 0;
520 :     sadC += sad8(current->v + x*8 + y*(iEdgedWidth/2)*8,
521 :     reference->v + x*8 + y*(iEdgedWidth/2)*8, iEdgedWidth/2);
522 :     if (sadC > iQuant * MAX_CHROMA_SAD_FOR_SKIP) return 0;
523 : edgomez 195
524 : chl 530 return 1;
525 :     }
526 : edgomez 195
527 : chl 530 static __inline void
528 :     SkipMacroblockP(MACROBLOCK *pMB, const int32_t sad)
529 :     {
530 :     pMB->mode = MODE_NOT_CODED;
531 : Isibaar 539 pMB->mvs[0].x = pMB->mvs[1].x = pMB->mvs[2].x = pMB->mvs[3].x = 0;
532 :     pMB->mvs[0].y = pMB->mvs[1].y = pMB->mvs[2].y = pMB->mvs[3].y = 0;
533 : chl 530 pMB->sad16 = pMB->sad8[0] = pMB->sad8[1] = pMB->sad8[2] = pMB->sad8[3] = sad;
534 : Isibaar 3 }
535 :    
536 : chl 530 bool
537 :     MotionEstimation(MBParam * const pParam,
538 :     FRAMEINFO * const current,
539 :     FRAMEINFO * const reference,
540 :     const IMAGE * const pRefH,
541 :     const IMAGE * const pRefV,
542 :     const IMAGE * const pRefHV,
543 :     const uint32_t iLimit)
544 : Isibaar 3 {
545 : chl 530 MACROBLOCK *const pMBs = current->mbs;
546 :     const IMAGE *const pCurrent = &current->image;
547 :     const IMAGE *const pRef = &reference->image;
548 : Isibaar 3
549 : chl 530 const VECTOR zeroMV = { 0, 0 };
550 : Isibaar 3
551 : chl 530 uint32_t x, y;
552 :     uint32_t iIntra = 0;
553 :     int32_t InterBias;
554 : edgomez 195
555 : Isibaar 539 // some pre-initialized thingies for SearchP
556 :     int32_t temp[5];
557 :     VECTOR currentMV[5];
558 :     int32_t iMinSAD[5];
559 :     SearchData Data;
560 :     Data.iEdgedWidth = pParam->edged_width;
561 :     Data.currentMV = currentMV;
562 :     Data.iMinSAD = iMinSAD;
563 :     Data.temp = temp;
564 :     Data.iFcode = current->fcode;
565 :    
566 : chl 530 if (sadInit) (*sadInit) ();
567 : edgomez 195
568 : chl 530 for (y = 0; y < pParam->mb_height; y++) {
569 :     for (x = 0; x < pParam->mb_width; x++) {
570 : Isibaar 3
571 : chl 530 MACROBLOCK *pMB = &pMBs[x + y * pParam->mb_width];
572 :     int32_t sad00 = pMB->sad16
573 :     = sad16v(pCurrent->y + (x + y * pParam->edged_width) * 16,
574 :     pRef->y + (x + y * pParam->edged_width) * 16,
575 :     pParam->edged_width, pMB->sad8 );
576 : edgomez 195
577 : chl 530 if (!(current->global_flags & XVID_LUMIMASKING)) {
578 :     pMB->dquant = NO_CHANGE;
579 :     pMB->quant = current->quant; }
580 : chl 181
581 : chl 530 //initial skip decision
582 : Isibaar 3
583 : chl 530 if ((pMB->dquant == NO_CHANGE) && (sad00 <= MAX_SAD00_FOR_SKIP * pMB->quant)
584 :     && (SkipDecisionP(pCurrent, pRef, x, y, pParam->edged_width, pMB->quant)) ) {
585 :     if (pMB->sad16 < pMB->quant * INITIAL_SKIP_THRESH) {
586 :     SkipMacroblockP(pMB, sad00);
587 :     continue;
588 :     }
589 :     } else sad00 = 256*4096; // skip not allowed - for final skip decision
590 : Isibaar 3
591 : chl 530 SearchP(pRef->y, pRefH->y, pRefV->y, pRefHV->y, pCurrent, x,
592 :     y, current->motion_flags, pMB->quant,
593 : Isibaar 539 &Data, pParam, pMBs, reference->mbs,
594 : chl 530 current->global_flags & XVID_INTER4V, pMB);
595 : edgomez 195
596 : chl 530 /* final skip decision, a.k.a. "the vector you found, really that good?" */
597 :     if (sad00 < pMB->quant * MAX_SAD00_FOR_SKIP)
598 :     if ((100*pMB->sad16)/(sad00+1) > FINAL_SKIP_THRESH)
599 :     { SkipMacroblockP(pMB, sad00); continue; }
600 :    
601 :     /* finally, intra decision */
602 : Isibaar 3
603 : chl 530 InterBias = MV16_INTER_BIAS;
604 :     if (pMB->quant > 8) InterBias += 50 * (pMB->quant - 8); // to make high quants work
605 :     if (y != 0)
606 :     if ((pMB - pParam->mb_width)->mode == MODE_INTER ) InterBias -= 50;
607 :     if (x != 0)
608 :     if ((pMB - 1)->mode == MODE_INTER ) InterBias -= 50;
609 : Isibaar 3
610 : chl 530 if (InterBias < pMB->sad16) {
611 :     const int32_t deviation =
612 :     dev16(pCurrent->y + (x + y * pParam->edged_width) * 16,
613 :     pParam->edged_width);
614 : Isibaar 3
615 : chl 530 if (deviation < (pMB->sad16 - InterBias)) {
616 :     if (++iIntra >= iLimit) return 1;
617 :     pMB->mode = MODE_INTRA;
618 : Isibaar 539 pMB->mvs[0] = pMB->mvs[1] = pMB->mvs[2] =
619 :     pMB->mvs[3] = zeroMV;
620 : chl 530 pMB->sad16 = pMB->sad8[0] = pMB->sad8[1] = pMB->sad8[2] =
621 :     pMB->sad8[3] = 0;
622 :     }
623 :     }
624 :     }
625 : Isibaar 3 }
626 : chl 530 return 0;
627 :     }
628 : Isibaar 3
629 : edgomez 195
630 : chl 530 #define PMV_HALFPEL16 (PMV_HALFPELDIAMOND16|PMV_HALFPELREFINE16)
631 : Isibaar 3
632 : chl 530 static __inline int
633 :     make_mask(const VECTOR * const pmv, const int i)
634 :     {
635 : Isibaar 539 int mask = 255, j;
636 : chl 530 for (j = 0; j < i; j++) {
637 :     if (MVequal(pmv[i], pmv[j])) return 0; // same vector has been checked already
638 :     if (pmv[i].x == pmv[j].x) {
639 :     if (pmv[i].y == pmv[j].y + iDiamondSize) { mask &= ~4; continue; }
640 :     if (pmv[i].y == pmv[j].y - iDiamondSize) { mask &= ~8; continue; }
641 :     } else
642 :     if (pmv[i].y == pmv[j].y) {
643 :     if (pmv[i].x == pmv[j].x + iDiamondSize) { mask &= ~1; continue; }
644 :     if (pmv[i].x == pmv[j].x - iDiamondSize) { mask &= ~2; continue; }
645 :     }
646 : Isibaar 3 }
647 : chl 530 return mask;
648 :     }
649 : edgomez 195
650 : chl 530 static __inline void
651 :     PreparePredictionsP(VECTOR * const pmv, int x, int y, const int iWcount,
652 :     const int iHcount, const MACROBLOCK * const prevMB)
653 :     {
654 : edgomez 195
655 : chl 530 //this function depends on get_pmvdata which means that it sucks. It should get the predictions by itself
656 : edgomez 195
657 : chl 530 if ( (y != 0) && (x != (iWcount-1)) ) { // [5] top-right neighbour
658 :     pmv[5].x = EVEN(pmv[3].x);
659 : Isibaar 539 pmv[5].y = EVEN(pmv[3].y);
660 :     } else pmv[5].x = pmv[5].y = 0;
661 : chl 169
662 : chl 530 if (x != 0) { pmv[3].x = EVEN(pmv[1].x); pmv[3].y = EVEN(pmv[1].y); }// pmv[3] is left neighbour
663 :     else pmv[3].x = pmv[3].y = 0;
664 : Isibaar 3
665 : chl 530 if (y != 0) { pmv[4].x = EVEN(pmv[2].x); pmv[4].y = EVEN(pmv[2].y); }// [4] top neighbour
666 :     else pmv[4].x = pmv[4].y = 0;
667 : chl 169
668 : chl 530 // [1] median prediction
669 :     pmv[1].x = EVEN(pmv[0].x); pmv[1].y = EVEN(pmv[0].y);
670 : chl 169
671 : chl 530 pmv[0].x = pmv[0].y = 0; // [0] is zero; not used in the loop (checked before) but needed here for make_mask
672 : chl 169
673 : chl 530 pmv[2].x = EVEN(prevMB->mvs[0].x); // [2] is last frame
674 :     pmv[2].y = EVEN(prevMB->mvs[0].y);
675 : chl 169
676 : chl 530 if ((x != iWcount-1) && (y != iHcount-1)) {
677 :     pmv[6].x = EVEN((prevMB+1+iWcount)->mvs[0].x); //[6] right-down neighbour in last frame
678 : Isibaar 539 pmv[6].y = EVEN((prevMB+1+iWcount)->mvs[0].y);
679 :     } else pmv[6].x = pmv[6].y = 0;
680 : chl 530 }
681 : chl 169
682 : chl 530 static void
683 :     SearchP(const uint8_t * const pRef,
684 :     const uint8_t * const pRefH,
685 :     const uint8_t * const pRefV,
686 :     const uint8_t * const pRefHV,
687 :     const IMAGE * const pCur,
688 :     const int x,
689 :     const int y,
690 :     const uint32_t MotionFlags,
691 :     const uint32_t iQuant,
692 : Isibaar 539 SearchData * const Data,
693 : chl 530 const MBParam * const pParam,
694 :     const MACROBLOCK * const pMBs,
695 :     const MACROBLOCK * const prevMBs,
696 :     int inter4v,
697 :     MACROBLOCK * const pMB)
698 :     {
699 : chl 169
700 : chl 530 int i, iDirection = 255, mask, threshA;
701 : Isibaar 539 VECTOR pmv[7];
702 : Isibaar 3
703 : Isibaar 539 get_pmvdata2(pMBs, pParam->mb_width, 0, x, y, 0, pmv, Data->temp); //has to be changed to get_pmv(2)()
704 :     get_range(&Data->min_dx, &Data->max_dx, &Data->min_dy, &Data->max_dy, x, y, 16,
705 :     pParam->width, pParam->height, Data->iFcode);
706 : Isibaar 3
707 : Isibaar 539 Data->predMV = pmv[0];
708 :     Data->Cur = pCur->y + (x + y * Data->iEdgedWidth) * 16;
709 :     Data->Ref = pRef + (x + Data->iEdgedWidth*y)*16;
710 :     Data->RefH = pRefH + (x + Data->iEdgedWidth*y) * 16;
711 :     Data->RefV = pRefV + (x + Data->iEdgedWidth*y) * 16;
712 :     Data->RefHV = pRefHV + (x + Data->iEdgedWidth*y) * 16;
713 : Isibaar 3
714 : Isibaar 539 Data->iQuant = iQuant;
715 : chl 169
716 : chl 530 if (!(MotionFlags & PMV_HALFPEL16)) {
717 : Isibaar 539 Data->min_dx = EVEN(Data->min_dx);
718 :     Data->max_dx = EVEN(Data->max_dx);
719 :     Data->min_dy = EVEN(Data->min_dy);
720 :     Data->max_dy = EVEN(Data->max_dy); }
721 : edgomez 195
722 : Isibaar 539 for(i = 0; i < 5; i++) Data->iMinSAD[i] = 256*4096;
723 : chl 169
724 : Isibaar 539 if (inter4v) CheckCandidate = CheckCandidate16;
725 :     else CheckCandidate = CheckCandidate16no4v;
726 : chl 169
727 : Isibaar 539 (*CheckCandidate)(Data->predMV.x, Data->predMV.y, 0, &iDirection, Data);
728 : edgomez 195
729 : Isibaar 539 for(i = 0; i < 5; i++) Data->currentMV[i].x = Data->currentMV[i].y = 0;
730 :    
731 :     i = d_mv_bits(Data->predMV.x, Data->predMV.y, Data->iFcode);
732 :     Data->iMinSAD[0] = pMB->sad16 + lambda_vec16[iQuant] * i;
733 :     Data->iMinSAD[1] = pMB->sad8[0] + lambda_vec8[iQuant] * i;
734 :     Data->iMinSAD[2] = pMB->sad8[1];
735 :     Data->iMinSAD[3] = pMB->sad8[2];
736 :     Data->iMinSAD[4] = pMB->sad8[3];
737 :    
738 : chl 530 if (pMB->dquant != NO_CHANGE) inter4v = 0;
739 : edgomez 195
740 : chl 530 if ((x == 0) && (y == 0)) threshA = 512;
741 :     else {
742 : Isibaar 539 threshA = Data->temp[0] + 20;
743 : chl 530 if (threshA < 512) threshA = 512;
744 :     if (threshA > 1024) threshA = 1024; }
745 : Isibaar 3
746 : chl 530 PreparePredictionsP(pmv, x, y, pParam->mb_width, pParam->mb_height,
747 :     prevMBs + x + y * pParam->mb_width);
748 : edgomez 195
749 : chl 530 /* main loop. checking all predictions */
750 :    
751 :     for (i = 1; i < 7; i++) {
752 :     if (!(mask = make_mask(pmv, i)) ) continue;
753 : Isibaar 539 CheckCandidate16(pmv[i].x, pmv[i].y, mask, &iDirection, Data);
754 :     if (Data->iMinSAD[0] <= threshA) break;
755 : chl 530 }
756 :    
757 : Isibaar 539 if ((Data->iMinSAD[0] <= threshA) ||
758 :     (MVequal(Data->currentMV[0], (prevMBs+x+y*pParam->mb_width)->mvs[0]) &&
759 :     (Data->iMinSAD[0] < (prevMBs+x+y*pParam->mb_width)->sad16))) {
760 : chl 530 inter4v = 0;
761 : Isibaar 539 } else {
762 : Isibaar 3
763 : Isibaar 539 MainSearchFunc * MainSearchPtr;
764 :     if (MotionFlags & PMV_USESQUARES16) MainSearchPtr = SquareSearch;
765 :     else if (MotionFlags & PMV_ADVANCEDDIAMOND16) MainSearchPtr = AdvDiamondSearch;
766 :     else MainSearchPtr = DiamondSearch;
767 : chl 181
768 : Isibaar 539 (*MainSearchPtr)(Data->currentMV->x, Data->currentMV->y, Data, iDirection);
769 : Isibaar 3
770 : chl 530 /* extended search, diamond starting in 0,0 and in prediction.
771 :     note that this search is/might be done in halfpel positions,
772 :     which makes it more different than the diamond above */
773 : chl 259
774 : Isibaar 539 if (MotionFlags & PMV_EXTSEARCH16) {
775 :     int32_t bSAD;
776 :     VECTOR startMV = Data->predMV, backupMV = Data->currentMV[0];
777 :     if (!(MotionFlags & PMV_HALFPELREFINE16)) // who's gonna use extsearch and no halfpel?
778 :     startMV.x = EVEN(startMV.x); startMV.y = EVEN(startMV.y);
779 :     if (!(MVequal(startMV, backupMV))) {
780 :     bSAD = Data->iMinSAD[0]; Data->iMinSAD[0] = MV_MAX_ERROR;
781 : Isibaar 3
782 : Isibaar 539 CheckCandidate16(startMV.x, startMV.y, 255, &iDirection, Data);
783 :     (*MainSearchPtr)(startMV.x, startMV.y, Data, 255);
784 :     if (bSAD < Data->iMinSAD[0]) {
785 :     Data->currentMV[0] = backupMV;
786 :     Data->iMinSAD[0] = bSAD; }
787 :     }
788 : Isibaar 3
789 : Isibaar 539 backupMV = Data->currentMV[0];
790 :     if (MotionFlags & PMV_HALFPELREFINE16) startMV.x = startMV.y = 1;
791 :     else startMV.x = startMV.y = 0;
792 :     if (!(MVequal(startMV, backupMV))) {
793 :     bSAD = Data->iMinSAD[0]; Data->iMinSAD[0] = MV_MAX_ERROR;
794 : edgomez 195
795 : Isibaar 539 CheckCandidate16(startMV.x, startMV.y, 255, &iDirection, Data);
796 :     (*MainSearchPtr)(startMV.x, startMV.y, Data, 255);
797 :     if (bSAD < Data->iMinSAD[0]) {
798 :     Data->currentMV[0] = backupMV;
799 :     Data->iMinSAD[0] = bSAD; }
800 :     }
801 : Isibaar 3 }
802 :     }
803 :    
804 : Isibaar 539 if (MotionFlags & PMV_HALFPELREFINE16) HalfpelRefine(Data);
805 : Isibaar 3
806 : Isibaar 539 if (inter4v) {
807 :     SearchData Data8;
808 :     Data8.iFcode = Data->iFcode;
809 :     Data8.iQuant = Data->iQuant;
810 :     Data8.iEdgedWidth = Data->iEdgedWidth;
811 :     Search8(Data, 2*x, 2*y, MotionFlags, pParam, pMB, pMBs, 0, &Data8);
812 :     Search8(Data, 2*x + 1, 2*y, MotionFlags, pParam, pMB, pMBs, 1, &Data8);
813 :     Search8(Data, 2*x, 2*y + 1, MotionFlags, pParam, pMB, pMBs, 2, &Data8);
814 :     Search8(Data, 2*x + 1, 2*y + 1, MotionFlags, pParam, pMB, pMBs, 3, &Data8);
815 :     }
816 : Isibaar 3
817 : chl 530 if (!(inter4v) ||
818 : Isibaar 539 (Data->iMinSAD[0] < Data->iMinSAD[1] + Data->iMinSAD[2] +
819 :     Data->iMinSAD[3] + Data->iMinSAD[4] + IMV16X16 * (int32_t)iQuant )) {
820 : chl 530 // INTER MODE
821 :     pMB->mode = MODE_INTER;
822 : Isibaar 539 pMB->mvs[0] = pMB->mvs[1]
823 :     = pMB->mvs[2] = pMB->mvs[3] = Data->currentMV[0];
824 : Isibaar 3
825 : chl 530 pMB->sad16 = pMB->sad8[0] = pMB->sad8[1] =
826 : Isibaar 539 pMB->sad8[2] = pMB->sad8[3] = Data->iMinSAD[0];
827 : Isibaar 3
828 : Isibaar 539 pMB->pmvs[0].x = Data->currentMV[0].x - Data->predMV.x;
829 :     pMB->pmvs[0].y = Data->currentMV[0].y - Data->predMV.y;
830 : edgomez 195 } else {
831 : chl 530 // INTER4V MODE; all other things are already set in Search8
832 :     pMB->mode = MODE_INTER4V;
833 : Isibaar 539 pMB->sad16 = Data->iMinSAD[1] + Data->iMinSAD[2] +
834 :     Data->iMinSAD[3] + Data->iMinSAD[4] + IMV16X16 * iQuant;
835 : edgomez 78 }
836 : chl 530
837 : Isibaar 3 }
838 :    
839 : chl 530 static void
840 :     Search8(const SearchData * const OldData,
841 :     const int x, const int y,
842 :     const uint32_t MotionFlags,
843 :     const MBParam * const pParam,
844 :     MACROBLOCK * const pMB,
845 :     const MACROBLOCK * const pMBs,
846 : Isibaar 539 const int block,
847 :     SearchData * const Data)
848 : chl 345 {
849 : Isibaar 539 Data->predMV = get_pmv2(pMBs, pParam->mb_width, 0, x/2 , y/2, block);
850 :     Data->iMinSAD = OldData->iMinSAD + 1 + block;
851 :     Data->currentMV = OldData->currentMV + 1 + block;
852 : chl 345
853 : chl 530 if (block != 0)
854 : Isibaar 539 *(Data->iMinSAD) += lambda_vec8[Data->iQuant] *
855 :     d_mv_bits( Data->currentMV->x - Data->predMV.x,
856 :     Data->currentMV->y - Data->predMV.y,
857 :     Data->iFcode);
858 : chl 345
859 : chl 530 if (MotionFlags & (PMV_EXTSEARCH8|PMV_HALFPELREFINE8)) {
860 : chl 345
861 : Isibaar 539 Data->Ref = OldData->Ref + 8 * ((block&1) + pParam->edged_width*(block>>1));
862 :     Data->RefH = OldData->RefH + 8 * ((block&1) + pParam->edged_width*(block>>1));
863 :     Data->RefV = OldData->RefV + 8 * ((block&1) + pParam->edged_width*(block>>1));
864 :     Data->RefHV = OldData->RefHV + 8 * ((block&1) + pParam->edged_width*(block>>1));
865 : chl 345
866 : Isibaar 539 Data->Cur = OldData->Cur + 8 * ((block&1) + pParam->edged_width*(block>>1));
867 : chl 530
868 : Isibaar 539 get_range(&Data->min_dx, &Data->max_dx, &Data->min_dy, &Data->max_dy, x, y, 8,
869 : chl 530 pParam->width, pParam->height, OldData->iFcode);
870 : chl 345
871 : chl 530 CheckCandidate = CheckCandidate8;
872 : chl 345
873 : chl 530 if (MotionFlags & PMV_EXTSEARCH8) {
874 : chl 345
875 : chl 530 MainSearchFunc *MainSearchPtr;
876 :     if (MotionFlags & PMV_USESQUARES8) MainSearchPtr = SquareSearch;
877 :     else if (MotionFlags & PMV_ADVANCEDDIAMOND8) MainSearchPtr = AdvDiamondSearch;
878 :     else MainSearchPtr = DiamondSearch;
879 : chl 345
880 : Isibaar 539 (*MainSearchPtr)(Data->currentMV->x, Data->currentMV->y, Data, 255); }
881 : chl 345
882 : Isibaar 539 if (MotionFlags & PMV_HALFPELREFINE8) HalfpelRefine(Data);
883 : chl 345 }
884 : chl 530
885 : Isibaar 539 pMB->pmvs[block].x = Data->currentMV->x - Data->predMV.x;
886 :     pMB->pmvs[block].y = Data->currentMV->y - Data->predMV.y;
887 :     pMB->mvs[block] = *(Data->currentMV);
888 :     pMB->sad8[block] = 4 * (*Data->iMinSAD);
889 :    
890 : chl 345 }
891 :    
892 : chl 530 /* B-frames code starts here */
893 : chl 345
894 : chl 530 static __inline VECTOR
895 :     ChoosePred(const MACROBLOCK * const pMB, const uint32_t mode)
896 : Isibaar 3 {
897 : chl 530 /* the stupidiest function ever */
898 :     if (mode == MODE_FORWARD) return pMB->mvs[0];
899 :     else return pMB->b_mvs[0];
900 : Isibaar 3 }
901 :    
902 : chl 530 static void __inline
903 :     PreparePredictionsBF(VECTOR * const pmv, const int x, const int y,
904 :     const uint32_t iWcount,
905 :     const MACROBLOCK * const pMB,
906 :     const uint32_t mode_curr)
907 : Isibaar 3 {
908 :    
909 : chl 530 // [0] is prediction
910 :     pmv[0].x = EVEN(pmv[0].x); pmv[0].y = EVEN(pmv[0].y);
911 : Isibaar 3
912 : chl 530 pmv[1].x = pmv[1].y = 0; // [1] is zero
913 : Isibaar 3
914 : chl 530 pmv[2] = ChoosePred(pMB, mode_curr);
915 :     pmv[2].x = EVEN(pmv[2].x); pmv[2].y = EVEN(pmv[2].y);
916 : edgomez 195
917 : chl 530 if ((y != 0)&&(x != (int)(iWcount+1))) { // [3] top-right neighbour
918 :     pmv[3] = ChoosePred(pMB+1-iWcount, mode_curr);
919 : Isibaar 539 pmv[3].x = EVEN(pmv[3].x); pmv[3].y = EVEN(pmv[3].y);
920 :     } else pmv[3].x = pmv[3].y = 0;
921 : Isibaar 3
922 : chl 530 if (y != 0) {
923 :     pmv[4] = ChoosePred(pMB-iWcount, mode_curr);
924 :     pmv[4].x = EVEN(pmv[4].x); pmv[4].y = EVEN(pmv[4].y);
925 :     } else pmv[4].x = pmv[4].y = 0;
926 : Isibaar 3
927 : chl 530 if (x != 0) {
928 :     pmv[5] = ChoosePred(pMB-1, mode_curr);
929 :     pmv[5].x = EVEN(pmv[5].x); pmv[5].y = EVEN(pmv[5].y);
930 :     } else pmv[5].x = pmv[5].y = 0;
931 : Isibaar 3
932 : chl 530 if ((x != 0)&&(y != 0)) {
933 :     pmv[6] = ChoosePred(pMB-1-iWcount, mode_curr);
934 :     pmv[6].x = EVEN(pmv[5].x); pmv[5].y = EVEN(pmv[5].y);
935 :     } else pmv[6].x = pmv[6].y = 0;
936 : edgomez 195
937 : chl 530 // more?
938 :     }
939 : chl 181
940 : edgomez 170
941 : chl 530 /* search backward or forward, for b-frames */
942 :     static void
943 :     SearchBF( const uint8_t * const pRef,
944 :     const uint8_t * const pRefH,
945 :     const uint8_t * const pRefV,
946 :     const uint8_t * const pRefHV,
947 :     const IMAGE * const pCur,
948 :     const int x, const int y,
949 :     const uint32_t MotionFlags,
950 :     const uint32_t iQuant,
951 :     const uint32_t iFcode,
952 :     const MBParam * const pParam,
953 :     MACROBLOCK * const pMB,
954 :     const VECTOR * const predMV,
955 :     int32_t * const best_sad,
956 :     const int32_t mode_current)
957 :     {
958 : Isibaar 3
959 : chl 530 const int32_t iEdgedWidth = pParam->edged_width;
960 :    
961 :     int i, iDirection, mask;
962 :     VECTOR currentMV, pmv[7];
963 :     MainSearchFunc *MainSearchPtr;
964 :     int32_t iMinSAD = MV_MAX_ERROR;
965 :     SearchData Data;
966 : Isibaar 3
967 : chl 530 Data.iMinSAD = &iMinSAD;
968 :     Data.Cur = pCur->y + (x + y * iEdgedWidth) * 16;
969 :     Data.iEdgedWidth = iEdgedWidth;
970 :     Data.currentMV = &currentMV;
971 :     Data.iMinSAD = &iMinSAD;
972 :     Data.Ref = pRef + (x + y * iEdgedWidth) * 16;
973 :     Data.RefH = pRefH + (x + y * iEdgedWidth) * 16;
974 :     Data.RefV = pRefV + (x + y * iEdgedWidth) * 16;
975 :     Data.RefHV = pRefHV + (x + y * iEdgedWidth) * 16;
976 : Isibaar 3
977 : chl 530 Data.iQuant = iQuant;
978 :     Data.iFcode = iFcode;
979 :     Data.predMV = *predMV;
980 : edgomez 195
981 : chl 530 get_range(&Data.min_dx, &Data.max_dx, &Data.min_dy, &Data.max_dy, x, y, 16,
982 :     pParam->width, pParam->height, iFcode);
983 : Isibaar 3
984 : chl 530 if (!(MotionFlags & PMV_HALFPEL16)) {
985 :     Data.min_dx = EVEN(Data.min_dx);
986 :     Data.max_dx = EVEN(Data.max_dx);
987 :     Data.min_dy = EVEN(Data.min_dy);
988 :     Data.max_dy = EVEN(Data.max_dy); } // no-halpel and b-frames. do we need it?
989 : edgomez 195
990 : Isibaar 3
991 : chl 530 pmv[0] = Data.predMV;
992 :     PreparePredictionsBF(pmv, x, y, pParam->mb_width,
993 :     pMB, mode_current);
994 : Isibaar 3
995 : chl 530 currentMV.x = currentMV.y = 0;
996 : Isibaar 3
997 : chl 530 CheckCandidate = CheckCandidate16no4v;
998 : chl 181
999 : chl 530 // main loop. checking all predictions
1000 :     for (i = 0; i < 8; i++) {
1001 :     if (!(mask = make_mask(pmv, i)) ) continue;
1002 :     CheckCandidate16no4v(pmv[i].x, pmv[i].y, mask, &iDirection, &Data);
1003 : edgomez 78 }
1004 : Isibaar 3
1005 : chl 530 if (MotionFlags & PMV_USESQUARES16)
1006 :     MainSearchPtr = SquareSearch;
1007 :     else if (MotionFlags & PMV_ADVANCEDDIAMOND16)
1008 :     MainSearchPtr = AdvDiamondSearch;
1009 :     else MainSearchPtr = DiamondSearch;
1010 : chl 96
1011 : chl 530 (*MainSearchPtr)(currentMV.x, currentMV.y, &Data, 255);
1012 : chl 169
1013 : chl 530 if (MotionFlags & PMV_HALFPELREFINE16) HalfpelRefine(&Data);
1014 : chl 169
1015 : chl 530 // three bits are needed to code backward mode. four for forward
1016 :     // we treat the bits just like they were vector's
1017 :     if (mode_current == MODE_FORWARD) iMinSAD += 4 * lambda_vec16[iQuant];
1018 :     else iMinSAD += 3 * lambda_vec16[iQuant];
1019 : chl 169
1020 :    
1021 : chl 530 if (iMinSAD < *best_sad) {
1022 :     *best_sad = iMinSAD;
1023 :     pMB->mode = mode_current;
1024 :     pMB->pmvs[0].x = currentMV.x - predMV->x;
1025 :     pMB->pmvs[0].y = currentMV.y - predMV->y;
1026 :     if (mode_current == MODE_FORWARD) pMB->mvs[0] = currentMV;
1027 :     else pMB->b_mvs[0] = currentMV;
1028 : chl 169 }
1029 : chl 530
1030 :     }
1031 : chl 169
1032 : chl 530 static int32_t
1033 : Isibaar 539 SearchDirect(const IMAGE * const f_Ref,
1034 : chl 530 const uint8_t * const f_RefH,
1035 :     const uint8_t * const f_RefV,
1036 :     const uint8_t * const f_RefHV,
1037 : Isibaar 539 const IMAGE * const b_Ref,
1038 : chl 530 const uint8_t * const b_RefH,
1039 :     const uint8_t * const b_RefV,
1040 :     const uint8_t * const b_RefHV,
1041 :     const IMAGE * const pCur,
1042 :     const int x, const int y,
1043 :     const uint32_t MotionFlags,
1044 :     const uint32_t iQuant,
1045 :     const int32_t TRB, const int32_t TRD,
1046 :     const MBParam * const pParam,
1047 :     MACROBLOCK * const pMB,
1048 :     const MACROBLOCK * const b_mb,
1049 :     int32_t * const best_sad)
1050 : edgomez 195
1051 : chl 530 {
1052 :     const uint32_t iEdgedWidth = pParam->edged_width;
1053 : Isibaar 539 int32_t iMinSAD = 266*4096, skip_sad;
1054 : chl 530 int k;
1055 :     VECTOR currentMV;
1056 :     MainSearchFunc *MainSearchPtr;
1057 :     SearchData Data;
1058 : Isibaar 3
1059 : chl 530 Data.iMinSAD = &iMinSAD;
1060 :     Data.Cur = pCur->y + x * 16 + y * 16 * iEdgedWidth;
1061 :     Data.iEdgedWidth = iEdgedWidth;
1062 :     Data.currentMV = &currentMV;
1063 :     Data.iQuant = iQuant;
1064 :     Data.referencemv = b_mb->mvs;
1065 : chl 140
1066 : Isibaar 539 Data.Ref= f_Ref->y + (x + iEdgedWidth*y) * 16;
1067 : chl 530 Data.RefH = f_RefH + (x + iEdgedWidth*y) * 16;
1068 :     Data.RefV = f_RefV + (x + iEdgedWidth*y) * 16;
1069 :     Data.RefHV = f_RefHV + (x + iEdgedWidth*y) * 16;
1070 : Isibaar 539 Data.bRef = b_Ref->y + (x + iEdgedWidth*y) * 16;
1071 : chl 530 Data.bRefH = b_RefH + (x + iEdgedWidth*y) * 16;
1072 :     Data.bRefV = b_RefV + (x + iEdgedWidth*y) * 16;
1073 :     Data.bRefHV = b_RefHV + (x + iEdgedWidth*y) * 16;
1074 :     /*
1075 :     //What we do here is a complicated version of CheckCandidateDirect(0,0);
1076 :     get_range(&Data.min_dx, &Data.max_dx, &Data.min_dy, &Data.max_dy, x, y, 16, pParam->width, pParam->height, 19);
1077 : chl 140
1078 : Isibaar 3 */
1079 : chl 530 Data.max_dx = 2 * pParam->width - 2 * (x) * 16;
1080 :     Data.max_dy = 2 * pParam->height - 2 * (y) * 16;
1081 :     Data.min_dx = -(2 * 16 + 2 * (x) * 16);
1082 :     Data.min_dy = -(2 * 16 + 2 * (y) * 16);
1083 : Isibaar 3
1084 : chl 530 for (k = 0; k < 4; k++) {
1085 :     pMB->mvs[k].x = Data.directmvF[k].x = ((TRB * Data.referencemv[k].x) / TRD);
1086 :     pMB->b_mvs[k].x = Data.directmvB[k].x = ((TRB - TRD) * Data.referencemv[k].x) / TRD;
1087 :     pMB->mvs[k].y = Data.directmvF[k].y = ((TRB * Data.referencemv[k].y) / TRD);
1088 :     pMB->b_mvs[k].y = Data.directmvB[k].y = ((TRB - TRD) * Data.referencemv[k].y) / TRD;
1089 : Isibaar 3
1090 : Isibaar 539 if (( pMB->mvs[k].x > Data.max_dx ) || ( pMB->mvs[k].x < Data.min_dx )
1091 : chl 530 || ( pMB->mvs[k].y > Data.max_dy ) || ( pMB->mvs[k].y < Data.min_dy )
1092 :     || ( pMB->b_mvs[k].x > Data.max_dx ) || ( pMB->b_mvs[k].x < Data.min_dx )
1093 :     || ( pMB->b_mvs[k].y > Data.max_dy ) || ( pMB->b_mvs[k].y < Data.min_dy )) {
1094 : Isibaar 3
1095 : Isibaar 539 *best_sad = 256*4096; // in that case, we won't use direct mode
1096 :     pMB->mode = MODE_DIRECT; // just to make sure it doesn't say "MODE_DIRECT_NONE_MV"
1097 :     pMB->b_mvs[0].x = pMB->b_mvs[0].y = 0;
1098 :     return 0;
1099 :     }
1100 :     if (b_mb->mode != MODE_INTER4V) {
1101 :     pMB->mvs[1] = pMB->mvs[2] = pMB->mvs[3] = pMB->mvs[0];
1102 :     pMB->b_mvs[1] = pMB->b_mvs[2] = pMB->b_mvs[3] = pMB->b_mvs[0];
1103 :     Data.directmvF[1] = Data.directmvF[2] = Data.directmvF[3] = Data.directmvF[0];
1104 :     Data.directmvB[1] = Data.directmvB[2] = Data.directmvB[3] = Data.directmvB[0];
1105 :     break;
1106 :     }
1107 :     }
1108 : Isibaar 3
1109 : Isibaar 539 if (b_mb->mode == MODE_INTER4V)
1110 :     CheckCandidate = CheckCandidateDirect;
1111 :     else CheckCandidate = CheckCandidateDirectno4v;
1112 : edgomez 195
1113 : Isibaar 539 (*CheckCandidate)(0, 0, 255, &k, &Data);
1114 : Isibaar 3
1115 : chl 530 // skip decision
1116 : Isibaar 539 if (iMinSAD - 2 * lambda_vec16[iQuant] < (int32_t)iQuant * SKIP_THRESH_B) {
1117 :     //checking chroma. everything copied from MC
1118 :     //this is not full chroma compensation, only it's fullpel approximation. should work though
1119 :     int sum, dx, dy, b_dx, b_dy;
1120 : Isibaar 3
1121 : Isibaar 539 sum = pMB->mvs[0].x + pMB->mvs[1].x + pMB->mvs[2].x + pMB->mvs[3].x;
1122 :     dx = (sum == 0 ? 0 : SIGN(sum) * (roundtab[ABS(sum) % 16] + (ABS(sum) / 16) * 2));
1123 :    
1124 :     sum = pMB->mvs[0].y + pMB->mvs[1].y + pMB->mvs[2].y + pMB->mvs[3].y;
1125 :     dy = (sum == 0 ? 0 : SIGN(sum) * (roundtab[ABS(sum) % 16] + (ABS(sum) / 16) * 2));
1126 :    
1127 :     sum = pMB->b_mvs[0].x + pMB->b_mvs[1].x + pMB->b_mvs[2].x + pMB->b_mvs[3].x;
1128 :     b_dx = (sum == 0 ? 0 : SIGN(sum) * (roundtab[ABS(sum) % 16] + (ABS(sum) / 16) * 2));
1129 :    
1130 :     sum = pMB->b_mvs[0].y + pMB->b_mvs[1].y + pMB->b_mvs[2].y + pMB->b_mvs[3].y;
1131 :     b_dy = (sum == 0 ? 0 : SIGN(sum) * (roundtab[ABS(sum) % 16] + (ABS(sum) / 16) * 2));
1132 :    
1133 :     sum = sad8bi(pCur->u + 8*x + 8*y*(iEdgedWidth/2),
1134 :     f_Ref->u + (y*8 + dy/2) * (iEdgedWidth/2) + x*8 + dx/2,
1135 :     b_Ref->u + (y*8 + b_dy/2) * (iEdgedWidth/2) + x*8 + b_dx/2,
1136 :     iEdgedWidth/2);
1137 :     sum += sad8bi(pCur->v + 8*x + 8*y*(iEdgedWidth/2),
1138 :     f_Ref->v + (y*8 + dy/2) * (iEdgedWidth/2) + x*8 + dx/2,
1139 :     b_Ref->v + (y*8 + b_dy/2) * (iEdgedWidth/2) + x*8 + b_dx/2,
1140 :     iEdgedWidth/2);
1141 :    
1142 :     if ((uint32_t) sum < MAX_CHROMA_SAD_FOR_SKIP * Data.iQuant) {
1143 :     pMB->mode = MODE_DIRECT_NONE_MV;
1144 :     return iMinSAD;
1145 :     }
1146 :     }
1147 :    
1148 : chl 530 skip_sad = iMinSAD;
1149 : edgomez 195
1150 : chl 530 // DIRECT MODE DELTA VECTOR SEARCH.
1151 :     // This has to be made more effective, but at the moment I'm happy it's running at all
1152 : Isibaar 3
1153 : chl 530 if (MotionFlags & PMV_USESQUARES16) MainSearchPtr = SquareSearch;
1154 :     else if (MotionFlags & PMV_ADVANCEDDIAMOND16) MainSearchPtr = AdvDiamondSearch;
1155 :     else MainSearchPtr = DiamondSearch;
1156 : edgomez 195
1157 : chl 530 (*MainSearchPtr)(0, 0, &Data, 255);
1158 : Isibaar 3
1159 : chl 530 HalfpelRefine(&Data);
1160 : Isibaar 3
1161 : chl 530 iMinSAD += 1 * lambda_vec16[iQuant]; // one bit is needed to code direct mode. we treat this bit just like it was vector's
1162 :     *best_sad = iMinSAD;
1163 : Isibaar 3
1164 : chl 530 if (b_mb->mode == MODE_INTER4V)
1165 :     pMB->mode = MODE_DIRECT;
1166 :     else pMB->mode = MODE_DIRECT_NO4V; //for faster compensation
1167 : edgomez 195
1168 : chl 530 pMB->pmvs[3] = currentMV;
1169 : edgomez 195
1170 : chl 530 for (k = 0; k < 4; k++) {
1171 :     pMB->mvs[k].x = Data.directmvF[k].x + currentMV.x;
1172 :     pMB->b_mvs[k].x = ((currentMV.x == 0)
1173 :     ? Data.directmvB[k].x
1174 :     : pMB->mvs[k].x - Data.referencemv[k].x);
1175 :     pMB->mvs[k].y = (Data.directmvF[k].y + currentMV.y);
1176 :     pMB->b_mvs[k].y = ((currentMV.y == 0)
1177 :     ? Data.directmvB[k].y
1178 :     : pMB->mvs[k].y - Data.referencemv[k].y);
1179 :     if (b_mb->mode != MODE_INTER4V) {
1180 :     pMB->mvs[3] = pMB->mvs[2] = pMB->mvs[1] = pMB->mvs[0];
1181 :     pMB->b_mvs[3] = pMB->b_mvs[2] = pMB->b_mvs[1] = pMB->b_mvs[0];
1182 :     break;
1183 :     }
1184 :     }
1185 :     return 0;//skip_sad;
1186 : Isibaar 3 }
1187 : chl 96
1188 : chl 530 static __inline void
1189 :     SearchInterpolate(const uint8_t * const f_Ref,
1190 :     const uint8_t * const f_RefH,
1191 :     const uint8_t * const f_RefV,
1192 :     const uint8_t * const f_RefHV,
1193 :     const uint8_t * const b_Ref,
1194 :     const uint8_t * const b_RefH,
1195 :     const uint8_t * const b_RefV,
1196 :     const uint8_t * const b_RefHV,
1197 :     const IMAGE * const pCur,
1198 :     const int x, const int y,
1199 :     const uint32_t fcode,
1200 :     const uint32_t bcode,
1201 :     const uint32_t MotionFlags,
1202 :     const uint32_t iQuant,
1203 :     const MBParam * const pParam,
1204 :     const VECTOR * const f_predMV,
1205 :     const VECTOR * const b_predMV,
1206 :     MACROBLOCK * const pMB,
1207 :     int32_t * const best_sad)
1208 :    
1209 : chl 96 {
1210 : chl 530 /* Interpolated MC motion vector search, this is tedious and more complicated because there are
1211 :     two values for everything, always one for backward and one for forward ME. Still, we don't gain
1212 :     much from this search, maybe it should simply be skipped and simply current i_sad16 value used
1213 :     as "optimal". */
1214 : chl 96
1215 : edgomez 195 const int32_t iEdgedWidth = pParam->edged_width;
1216 : chl 96
1217 : chl 530 int iDirection, i, j;
1218 :     int32_t iMinSAD = 256*4096;
1219 :     VECTOR currentMV[3];
1220 :     SearchData fData, bData;
1221 : chl 96
1222 : chl 530 fData.iMinSAD = bData.iMinSAD = &iMinSAD;
1223 : edgomez 195
1224 : chl 530 fData.Cur = bData.Cur = pCur->y + (x + y * iEdgedWidth) * 16;
1225 :     fData.iEdgedWidth = bData.iEdgedWidth = iEdgedWidth;
1226 :     fData.currentMV = currentMV; bData.currentMV = currentMV + 1;
1227 :     fData.iQuant = bData.iQuant = iQuant;
1228 :     fData.iFcode = bData.bFcode = fcode; fData.bFcode = bData.iFcode = bcode;
1229 : chl 96
1230 : chl 530 bData.bRef = fData.Ref = f_Ref + (x + y * iEdgedWidth) * 16;
1231 :     bData.bRefH = fData.RefH = f_RefH + (x + y * iEdgedWidth) * 16;
1232 :     bData.bRefV = fData.RefV = f_RefV + (x + y * iEdgedWidth) * 16;
1233 :     bData.bRefHV = fData.RefHV = f_RefHV + (x + y * iEdgedWidth) * 16;
1234 :     bData.Ref = fData.bRef = b_Ref + (x + y * iEdgedWidth) * 16;
1235 :     bData.RefH = fData.bRefH = b_RefH + (x + y * iEdgedWidth) * 16;
1236 :     bData.RefV = fData.bRefV = b_RefV + (x + y * iEdgedWidth) * 16;
1237 :     bData.RefHV = fData.bRefHV = b_RefHV + (x + y * iEdgedWidth) * 16;
1238 : edgomez 195
1239 : chl 530 bData.bpredMV = fData.predMV = *f_predMV;
1240 :     fData.bpredMV = bData.predMV = *b_predMV;
1241 : chl 96
1242 : chl 530 currentMV[0] = pMB->mvs[0];
1243 :     currentMV[1] = pMB->b_mvs[0];
1244 :     get_range(&fData.min_dx, &fData.max_dx, &fData.min_dy, &fData.max_dy, x, y, 16, pParam->width, pParam->height, fcode);
1245 :     get_range(&bData.min_dx, &bData.max_dx, &bData.min_dy, &bData.max_dy, x, y, 16, pParam->width, pParam->height, bcode);
1246 : chl 96
1247 : Isibaar 539 if (currentMV[0].x > fData.max_dx) currentMV[0].x = fData.max_dx;
1248 :     if (currentMV[0].x < fData.min_dx) currentMV[0].x = fData.min_dy;
1249 :     if (currentMV[0].y > fData.max_dy) currentMV[0].y = fData.max_dx;
1250 :     if (currentMV[0].y > fData.min_dy) currentMV[0].y = fData.min_dy;
1251 :    
1252 :     if (currentMV[1].x > bData.max_dx) currentMV[1].x = bData.max_dx;
1253 :     if (currentMV[1].x < bData.min_dx) currentMV[1].x = bData.min_dy;
1254 :     if (currentMV[1].y > bData.max_dy) currentMV[1].y = bData.max_dx;
1255 :     if (currentMV[1].y > bData.min_dy) currentMV[1].y = bData.min_dy;
1256 :    
1257 : chl 530 CheckCandidateInt(currentMV[0].x, currentMV[0].y, 255, &iDirection, &fData);
1258 : chl 96
1259 : chl 530 //diamond. I wish we could use normal mainsearch functions (square, advdiamond)
1260 : chl 96
1261 : chl 530 do {
1262 :     iDirection = 255;
1263 :     // forward MV moves
1264 :     i = currentMV[0].x; j = currentMV[0].y;
1265 : chl 96
1266 : Isibaar 539 CheckCandidateInt(i + 1, j, 0, &iDirection, &fData);
1267 :     CheckCandidateInt(i, j + 1, 0, &iDirection, &fData);
1268 :     CheckCandidateInt(i - 1, j, 0, &iDirection, &fData);
1269 :     CheckCandidateInt(i, j - 1, 0, &iDirection, &fData);
1270 : chl 96
1271 : chl 530 // backward MV moves
1272 :     i = currentMV[1].x; j = currentMV[1].y;
1273 :     currentMV[2] = currentMV[0];
1274 : chl 326
1275 : Isibaar 539 CheckCandidateInt(i + 1, j, 0, &iDirection, &bData);
1276 :     CheckCandidateInt(i, j + 1, 0, &iDirection, &bData);
1277 :     CheckCandidateInt(i - 1, j, 0, &iDirection, &bData);
1278 :     CheckCandidateInt(i, j - 1, 0, &iDirection, &bData);
1279 : chl 96
1280 : chl 530 } while (!(iDirection));
1281 : edgomez 195
1282 : chl 530 // two bits are needed to code interpolate mode. we treat the bits just like they were vector's
1283 :     iMinSAD += 2 * lambda_vec16[iQuant];
1284 :     if (iMinSAD < *best_sad) {
1285 :     *best_sad = iMinSAD;
1286 :     pMB->mvs[0] = currentMV[0];
1287 :     pMB->b_mvs[0] = currentMV[1];
1288 :     pMB->mode = MODE_INTERPOLATE;
1289 : chl 96
1290 : chl 530 pMB->pmvs[1].x = pMB->mvs[0].x - f_predMV->x;
1291 :     pMB->pmvs[1].y = pMB->mvs[0].y - f_predMV->y;
1292 :     pMB->pmvs[0].x = pMB->b_mvs[0].x - b_predMV->x;
1293 :     pMB->pmvs[0].y = pMB->b_mvs[0].y - b_predMV->y;
1294 :     }
1295 :     }
1296 : chl 96
1297 : chl 530 void
1298 :     MotionEstimationBVOP(MBParam * const pParam,
1299 :     FRAMEINFO * const frame,
1300 :     const int32_t time_bp,
1301 :     const int32_t time_pp,
1302 :     // forward (past) reference
1303 :     const MACROBLOCK * const f_mbs,
1304 :     const IMAGE * const f_ref,
1305 :     const IMAGE * const f_refH,
1306 :     const IMAGE * const f_refV,
1307 :     const IMAGE * const f_refHV,
1308 :     // backward (future) reference
1309 :     const MACROBLOCK * const b_mbs,
1310 :     const IMAGE * const b_ref,
1311 :     const IMAGE * const b_refH,
1312 :     const IMAGE * const b_refV,
1313 :     const IMAGE * const b_refHV)
1314 :     {
1315 :     uint32_t i, j;
1316 :     int32_t best_sad, skip_sad;
1317 :     int f_count = 0, b_count = 0, i_count = 0, d_count = 0, n_count = 0;
1318 :     static const VECTOR zeroMV={0,0};
1319 : chl 96
1320 : chl 530 VECTOR f_predMV, b_predMV; /* there is no prediction for direct mode*/
1321 : chl 96
1322 : chl 530 const int32_t TRB = time_pp - time_bp;
1323 :     const int32_t TRD = time_pp;
1324 : chl 96
1325 : chl 530 // note: i==horizontal, j==vertical
1326 : chl 96
1327 : chl 530 for (j = 0; j < pParam->mb_height; j++) {
1328 : chl 96
1329 : chl 530 f_predMV = b_predMV = zeroMV; /* prediction is reset at left boundary */
1330 : edgomez 195
1331 : chl 530 for (i = 0; i < pParam->mb_width; i++) {
1332 :     MACROBLOCK * const pMB = frame->mbs + i + j * pParam->mb_width;
1333 :     const MACROBLOCK * const b_mb = b_mbs + i + j * pParam->mb_width;
1334 : edgomez 195
1335 : chl 530 /* special case, if collocated block is SKIPed: encoding is forward (0,0), cpb=0 without further ado */
1336 :     if (b_mb->mode == MODE_NOT_CODED) {
1337 :     pMB->mode = MODE_NOT_CODED;
1338 :     continue;
1339 : chl 96 }
1340 :    
1341 : chl 530 /* direct search comes first, because it (1) checks for SKIP-mode
1342 :     and (2) sets very good predictions for forward and backward search */
1343 : chl 96
1344 : Isibaar 539 skip_sad = SearchDirect(f_ref, f_refH->y, f_refV->y, f_refHV->y,
1345 :     b_ref, b_refH->y, b_refV->y, b_refHV->y,
1346 : chl 530 &frame->image,
1347 :     i, j,
1348 :     frame->motion_flags,
1349 :     frame->quant,
1350 :     TRB, TRD,
1351 :     pParam,
1352 :     pMB, b_mb,
1353 :     &best_sad);
1354 : chl 96
1355 : Isibaar 539 if (pMB->mode == MODE_DIRECT_NONE_MV) { n_count++; continue; }
1356 : chl 96
1357 : chl 530 // best_sad = 256*4096; //uncomment to disable Directsearch.
1358 :     // To disable any other mode, just comment the function call
1359 : chl 96
1360 : chl 530 // forward search
1361 :     SearchBF(f_ref->y, f_refH->y, f_refV->y, f_refHV->y,
1362 :     &frame->image, i, j,
1363 :     frame->motion_flags,
1364 :     frame->quant, frame->fcode, pParam,
1365 :     pMB, &f_predMV, &best_sad,
1366 :     MODE_FORWARD);
1367 : chl 96
1368 : chl 530 // backward search
1369 :     SearchBF(b_ref->y, b_refH->y, b_refV->y, b_refHV->y,
1370 :     &frame->image, i, j,
1371 :     frame->motion_flags,
1372 :     frame->quant, frame->bcode, pParam,
1373 :     pMB, &b_predMV, &best_sad,
1374 :     MODE_BACKWARD);
1375 : chl 96
1376 : chl 530 // interpolate search comes last, because it uses data from forward and backward as prediction
1377 : chl 96
1378 : chl 530 SearchInterpolate(f_ref->y, f_refH->y, f_refV->y, f_refHV->y,
1379 :     b_ref->y, b_refH->y, b_refV->y, b_refHV->y,
1380 :     &frame->image,
1381 :     i, j,
1382 :     frame->fcode, frame->bcode,
1383 :     frame->motion_flags,
1384 :     frame->quant, pParam,
1385 :     &f_predMV, &b_predMV,
1386 :     pMB, &best_sad);
1387 : chl 96
1388 : chl 530 switch (pMB->mode) {
1389 :     case MODE_FORWARD:
1390 :     f_count++;
1391 :     f_predMV = pMB->mvs[0];
1392 :     break;
1393 :     case MODE_BACKWARD:
1394 :     b_count++;
1395 :     b_predMV = pMB->b_mvs[0];
1396 :     break;
1397 :     case MODE_INTERPOLATE:
1398 :     i_count++;
1399 :     f_predMV = pMB->mvs[0];
1400 :     b_predMV = pMB->b_mvs[0];
1401 :     break;
1402 :     case MODE_DIRECT:
1403 :     case MODE_DIRECT_NO4V:
1404 :     d_count++;
1405 :     break;
1406 :     default:
1407 :     break;
1408 : chl 96 }
1409 :     }
1410 :     }
1411 :    
1412 : chl 530 // fprintf(debug,"B-Stat: F: %04d B: %04d I: %04d D: %04d, N: %04d\n",
1413 :     // f_count,b_count,i_count,d_count,n_count);
1414 : chl 96
1415 :     }
1416 :    
1417 : chl 530 /* Hinted ME starts here */
1418 : chl 96
1419 : chl 530 static __inline void
1420 :     Search8hinted( const SearchData * const OldData,
1421 :     const int x, const int y,
1422 :     const uint32_t MotionFlags,
1423 :     const MBParam * const pParam,
1424 :     MACROBLOCK * const pMB,
1425 :     const MACROBLOCK * const pMBs,
1426 :     const int block)
1427 : chl 96 {
1428 : chl 530 SearchData Data;
1429 :     MainSearchFunc *MainSearchPtr;
1430 : chl 141
1431 : chl 530 Data.predMV = get_pmv2(pMBs, pParam->mb_width, 0, x/2 , y/2, block);
1432 :     Data.iMinSAD = OldData->iMinSAD + 1 + block;
1433 :     Data.currentMV = OldData->currentMV+1+block;
1434 :     Data.iFcode = OldData->iFcode;
1435 :     Data.iQuant = OldData->iQuant;
1436 : chl 96
1437 : chl 530 Data.Ref = OldData->Ref + 8 * ((block&1) + pParam->edged_width*(block>>1));
1438 :     Data.RefH = OldData->RefH + 8 * ((block&1) + pParam->edged_width*(block>>1));
1439 :     Data.RefV = OldData->RefV + 8 * ((block&1) + pParam->edged_width*(block>>1));
1440 :     Data.RefHV = OldData->RefHV + 8 * ((block&1) + pParam->edged_width*(block>>1));
1441 :     Data.iEdgedWidth = pParam->edged_width;
1442 :     Data.Cur = OldData->Cur + 8 * ((block&1) + pParam->edged_width*(block>>1));
1443 : chl 96
1444 : chl 530 CheckCandidate = CheckCandidate8;
1445 : edgomez 195
1446 : chl 530 if (block != 0)
1447 :     *(Data.iMinSAD) += lambda_vec8[Data.iQuant] *
1448 :     d_mv_bits( Data.currentMV->x - Data.predMV.x,
1449 :     Data.currentMV->y - Data.predMV.y,
1450 :     Data.iFcode);
1451 : edgomez 195
1452 :    
1453 : chl 530 get_range(&Data.min_dx, &Data.max_dx, &Data.min_dy, &Data.max_dy, x, y, 8,
1454 :     pParam->width, pParam->height, OldData->iFcode);
1455 : chl 96
1456 : chl 530 if (pMB->mode == MODE_INTER4V) {
1457 :     int dummy;
1458 :     CheckCandidate8(pMB->mvs[block].x, pMB->mvs[block].y, 0, &dummy, &Data); }
1459 : chl 96
1460 : chl 530 if (MotionFlags & PMV_USESQUARES8) MainSearchPtr = SquareSearch;
1461 :     else if (MotionFlags & PMV_ADVANCEDDIAMOND8) MainSearchPtr = AdvDiamondSearch;
1462 :     else MainSearchPtr = DiamondSearch;
1463 : chl 96
1464 : chl 530 (*MainSearchPtr)(Data.currentMV->x, Data.currentMV->y, &Data, 255);
1465 : edgomez 195
1466 : chl 530 if (MotionFlags & PMV_HALFPELREFINE8) HalfpelRefine(&Data);
1467 : chl 96
1468 : chl 530 pMB->pmvs[block].x = Data.currentMV->x - Data.predMV.x;
1469 :     pMB->pmvs[block].y = Data.currentMV->y - Data.predMV.y;
1470 :     pMB->mvs[block] = *(Data.currentMV);
1471 :     pMB->sad8[block] = 4 * (*(Data.iMinSAD));
1472 : chl 96 }
1473 :    
1474 : suxen_drol 118
1475 : chl 530 static void
1476 :     SearchPhinted ( const uint8_t * const pRef,
1477 : chl 289 const uint8_t * const pRefH,
1478 :     const uint8_t * const pRefV,
1479 :     const uint8_t * const pRefHV,
1480 :     const IMAGE * const pCur,
1481 :     const int x,
1482 :     const int y,
1483 :     const uint32_t MotionFlags,
1484 :     const uint32_t iQuant,
1485 :     const uint32_t iFcode,
1486 :     const MBParam * const pParam,
1487 :     const MACROBLOCK * const pMBs,
1488 : chl 530 int inter4v,
1489 :     MACROBLOCK * const pMB)
1490 : chl 289 {
1491 : chl 530
1492 : chl 289 const int32_t iEdgedWidth = pParam->edged_width;
1493 : chl 530
1494 :     int i;
1495 :     VECTOR currentMV[5];
1496 :     int32_t iMinSAD[5];
1497 :     int32_t temp[5];
1498 :     MainSearchFunc * MainSearchPtr;
1499 :     SearchData Data;
1500 : suxen_drol 118
1501 : chl 530 Data.predMV = get_pmv2(pMBs, pParam->mb_width, 0, x, y, 0);
1502 :     get_range(&Data.min_dx, &Data.max_dx, &Data.min_dy, &Data.max_dy, x, y, 16,
1503 :     pParam->width, pParam->height, iFcode);
1504 : suxen_drol 118
1505 : chl 530 Data.Cur = pCur->y + (x + y * iEdgedWidth) * 16;
1506 :     Data.iEdgedWidth = iEdgedWidth;
1507 :     Data.currentMV = currentMV;
1508 :     Data.iMinSAD = iMinSAD;
1509 :     Data.Ref = pRef + (x + iEdgedWidth*y)*16;
1510 :     Data.RefH = pRefH + (x + iEdgedWidth*y) * 16;
1511 :     Data.RefV = pRefV + (x + iEdgedWidth*y) * 16;
1512 :     Data.RefHV = pRefHV + (x + iEdgedWidth*y) * 16;
1513 :     Data.temp = temp;
1514 :     Data.iQuant = iQuant;
1515 :     Data.iFcode = iFcode;
1516 : chl 326
1517 : chl 530 if (!(MotionFlags & PMV_HALFPEL16)) {
1518 :     Data.min_dx = EVEN(Data.min_dx);
1519 :     Data.max_dx = EVEN(Data.max_dx);
1520 :     Data.min_dy = EVEN(Data.min_dy);
1521 :     Data.max_dy = EVEN(Data.max_dy);
1522 :     }
1523 : chl 289
1524 : chl 530 for(i = 0; i < 5; i++) iMinSAD[i] = MV_MAX_ERROR;
1525 : chl 289
1526 : chl 530 if (pMB->dquant != NO_CHANGE) inter4v = 0;
1527 : chl 289
1528 : chl 530 if (inter4v)
1529 :     CheckCandidate = CheckCandidate16;
1530 :     else CheckCandidate = CheckCandidate16no4v;
1531 : chl 289
1532 :    
1533 : chl 530 pMB->mvs[0].x = EVEN(pMB->mvs[0].x);
1534 :     pMB->mvs[0].y = EVEN(pMB->mvs[0].y);
1535 :     if (pMB->mvs[0].x > Data.max_dx) pMB->mvs[0].x = Data.max_dx; // this is in case iFcode changed
1536 :     if (pMB->mvs[0].x < Data.min_dx) pMB->mvs[0].x = Data.min_dx;
1537 :     if (pMB->mvs[0].y > Data.max_dy) pMB->mvs[0].y = Data.max_dy;
1538 :     if (pMB->mvs[0].y < Data.min_dy) pMB->mvs[0].y = Data.min_dy;
1539 : chl 370
1540 : chl 530 CheckCandidate16(pMB->mvs[0].x, pMB->mvs[0].y, 0, &i, &Data);
1541 : chl 289
1542 : chl 530 if (pMB->mode == MODE_INTER4V)
1543 :     for (i = 1; i < 4; i++) { // all four vectors will be used as four predictions for 16x16 search
1544 :     pMB->mvs[i].x = EVEN(pMB->mvs[i].x);
1545 :     pMB->mvs[i].y = EVEN(pMB->mvs[i].y);
1546 :     if (!(make_mask(pMB->mvs, i)))
1547 :     CheckCandidate16(pMB->mvs[i].x, pMB->mvs[i].y, 0, &i, &Data);
1548 : chl 289 }
1549 :    
1550 :     if (MotionFlags & PMV_USESQUARES16)
1551 : chl 530 MainSearchPtr = SquareSearch;
1552 : chl 289 else if (MotionFlags & PMV_ADVANCEDDIAMOND16)
1553 : chl 530 MainSearchPtr = AdvDiamondSearch;
1554 :     else MainSearchPtr = DiamondSearch;
1555 : chl 289
1556 : chl 530 (*MainSearchPtr)(currentMV->x, currentMV->y, &Data, 255);
1557 : chl 289
1558 : chl 530 if (MotionFlags & PMV_HALFPELREFINE16) HalfpelRefine(&Data);
1559 : chl 289
1560 : chl 530 if (inter4v)
1561 :     for(i = 0; i < 4; i++)
1562 :     Search8hinted(&Data, 2*x+(i&1), 2*y+(i>>1), MotionFlags, pParam, pMB, pMBs, i);
1563 : chl 289
1564 : chl 530 if (!(inter4v) ||
1565 :     (iMinSAD[0] < iMinSAD[1] + iMinSAD[2] + iMinSAD[3] + iMinSAD[4] + IMV16X16 * (int32_t)iQuant )) {
1566 :     // INTER MODE
1567 : chl 289
1568 : chl 530 pMB->mode = MODE_INTER;
1569 : Isibaar 539 pMB->mvs[0] = pMB->mvs[1]
1570 : chl 530 = pMB->mvs[2] = pMB->mvs[3] = currentMV[0];
1571 : chl 289
1572 : chl 530 pMB->sad16 = pMB->sad8[0] = pMB->sad8[1] =
1573 :     pMB->sad8[2] = pMB->sad8[3] = iMinSAD[0];
1574 : chl 289
1575 : chl 530 pMB->pmvs[0].x = currentMV[0].x - Data.predMV.x;
1576 :     pMB->pmvs[0].y = currentMV[0].y - Data.predMV.y;
1577 :     } else {
1578 :     // INTER4V MODE; all other things are already set in Search8hinted
1579 :     pMB->mode = MODE_INTER4V;
1580 :     pMB->sad16 = iMinSAD[1] + iMinSAD[2] + iMinSAD[3] + iMinSAD[4] + IMV16X16 * iQuant;
1581 : chl 289 }
1582 :    
1583 :     }
1584 :    
1585 : edgomez 195 void
1586 : chl 530 MotionEstimationHinted( MBParam * const pParam,
1587 :     FRAMEINFO * const current,
1588 :     FRAMEINFO * const reference,
1589 :     const IMAGE * const pRefH,
1590 :     const IMAGE * const pRefV,
1591 :     const IMAGE * const pRefHV)
1592 : suxen_drol 118 {
1593 : chl 530 MACROBLOCK *const pMBs = current->mbs;
1594 :     const IMAGE *const pCurrent = &current->image;
1595 :     const IMAGE *const pRef = &reference->image;
1596 : suxen_drol 118
1597 : chl 530 uint32_t x, y;
1598 : chl 312
1599 : chl 530 if (sadInit) (*sadInit) ();
1600 : suxen_drol 118
1601 : chl 530 for (y = 0; y < pParam->mb_height; y++) {
1602 :     for (x = 0; x < pParam->mb_width; x++) {
1603 : chl 312
1604 : chl 530 MACROBLOCK *pMB = &pMBs[x + y * pParam->mb_width];
1605 : suxen_drol 118
1606 : chl 530 //intra mode is copied from the first pass. At least for the time being
1607 :     if ((pMB->mode == MODE_INTRA) || (pMB->mode == MODE_NOT_CODED) ) continue;
1608 : chl 346
1609 : chl 530 if (!(current->global_flags & XVID_LUMIMASKING)) {
1610 :     pMB->dquant = NO_CHANGE;
1611 :     pMB->quant = current->quant; }
1612 : chl 341
1613 : Isibaar 539 SearchPhinted(pRef->y, pRefH->y, pRefV->y, pRefHV->y, pCurrent, x,
1614 :     y, current->motion_flags, pMB->quant,
1615 :     current->fcode, pParam, pMBs,
1616 :     current->global_flags & XVID_INTER4V, pMB);
1617 : chl 317
1618 : Isibaar 539 }
1619 :     }
1620 :     }
1621 : suxen_drol 118
1622 : Isibaar 539 static __inline int
1623 :     MEanalyzeMB ( const uint8_t * const pRef,
1624 :     const uint8_t * const pCur,
1625 :     const int x,
1626 :     const int y,
1627 :     const uint32_t iFcode,
1628 :     const MBParam * const pParam,
1629 :     const MACROBLOCK * const pMBs,
1630 :     MACROBLOCK * const pMB)
1631 :     {
1632 : chl 317
1633 : Isibaar 539 const int32_t iEdgedWidth = pParam->edged_width;
1634 :     int i, mask;
1635 :     VECTOR currentMV, pmv[3];
1636 :     int32_t iMinSAD = MV_MAX_ERROR;
1637 :     SearchData Data;
1638 : suxen_drol 118
1639 : Isibaar 539 Data.predMV = get_pmv2(pMBs, pParam->mb_width, 0, x, y, 0);
1640 :     get_range(&Data.min_dx, &Data.max_dx, &Data.min_dy, &Data.max_dy, x, y, 16,
1641 :     pParam->width, pParam->height, iFcode);
1642 : chl 326
1643 : Isibaar 539 Data.Cur = pCur + (x + y * iEdgedWidth) * 16;
1644 :     Data.iEdgedWidth = iEdgedWidth;
1645 :     Data.currentMV = &currentMV;
1646 :     Data.iMinSAD = &iMinSAD;
1647 :     Data.Ref = pRef + (x + iEdgedWidth*y)*16;
1648 :     Data.iQuant = 2;
1649 :     Data.iFcode = iFcode;
1650 :    
1651 :     CheckCandidate = CheckCandidate16no4vI;
1652 : chl 326
1653 : Isibaar 539 pmv[1].x = EVEN(pMB->mvs[0].x);
1654 :     pmv[1].y = EVEN(pMB->mvs[0].y);
1655 :     pmv[0].x = EVEN(Data.predMV.x);
1656 :     pmv[0].y = EVEN(Data.predMV.y);
1657 :     pmv[2].x = pmv[2].y = 0;
1658 : chl 326
1659 : Isibaar 539 CheckCandidate16no4vI(pmv[0].x, pmv[0].y, 255, &i, &Data);
1660 :     if (!(mask = make_mask(pmv, 1)))
1661 :     CheckCandidate16no4vI(pmv[1].x, pmv[1].y, mask, &i, &Data);
1662 :     if (!(mask = make_mask(pmv, 2)))
1663 :     CheckCandidate16no4vI(0, 0, mask, &i, &Data);
1664 :    
1665 :     DiamondSearch(currentMV.x, currentMV.y, &Data, i);
1666 :    
1667 :     pMB->mvs[0] = pMB->mvs[1]
1668 :     = pMB->mvs[2] = pMB->mvs[3] = currentMV; // all, for future get_pmv()
1669 :    
1670 :     return iMinSAD;
1671 :     }
1672 :    
1673 :     #define INTRA_THRESH 1350
1674 :     #define INTER_THRESH 900
1675 :    
1676 :     int
1677 :     MEanalysis( const IMAGE * const pRef,
1678 :     const IMAGE * const pCurrent,
1679 :     MBParam * const pParam,
1680 :     MACROBLOCK * const pMBs,
1681 :     const uint32_t iFcode)
1682 :     {
1683 :     uint32_t x, y, intra = 0;
1684 :     int sSAD = 0;
1685 :    
1686 :     if (sadInit) (*sadInit) ();
1687 :    
1688 :     for (y = 0; y < pParam->mb_height-1; y++) {
1689 :     for (x = 0; x < pParam->mb_width; x++) {
1690 :     int sad, dev;
1691 :    
1692 :     MACROBLOCK *pMB = &pMBs[x + y * pParam->mb_width];
1693 :    
1694 :     sad = MEanalyzeMB(pRef->y, pCurrent->y, x, y,
1695 :     iFcode, pParam, pMBs, pMB);
1696 :    
1697 :     if ( x != 0 && y != 0 && x != pParam->mb_width-1 ) { //no edge macroblocks, they just don't work
1698 :     if (sad > INTRA_THRESH) {
1699 :     dev = dev16(pCurrent->y + (x + y * pParam->edged_width) * 16,
1700 :     pParam->edged_width);
1701 :     if (dev + INTRA_THRESH < sad) intra++;
1702 :     if (intra > (pParam->mb_height-2)*(pParam->mb_width-2)/2) return 2; // I frame
1703 :     }
1704 :     sSAD += sad;
1705 :     }
1706 :    
1707 : suxen_drol 118 }
1708 :     }
1709 : Isibaar 539 sSAD /= (pParam->mb_height-2)*(pParam->mb_width-2);
1710 :     if (sSAD > INTER_THRESH ) return 1; //P frame
1711 :     emms();
1712 :     return 0; // B frame
1713 :    
1714 : suxen_drol 118 }

No admin address has been configured
ViewVC Help
Powered by ViewVC 1.0.4