[svn] / branches / dev-api-3 / xvidcore / src / motion / motion_est.c Repository:
ViewVC logotype

Annotation of /branches/dev-api-3/xvidcore/src/motion/motion_est.c

Parent Directory Parent Directory | Revision Log Revision Log


Revision 568 - (view) (download)

1 : Isibaar 3 /**************************************************************************
2 :     *
3 : chl 259 * XVID MPEG-4 VIDEO CODEC
4 :     * motion estimation
5 :     *
6 :     * This program is an implementation of a part of one or more MPEG-4
7 :     * Video tools as specified in ISO/IEC 14496-2 standard. Those intending
8 :     * to use this software module in hardware or software products are
9 :     * advised that its use may infringe existing patents or copyrights, and
10 :     * any such use would be at such party's own risk. The original
11 :     * developer of this software module and his/her company, and subsequent
12 :     * editors and their companies, will have no liability for use of this
13 :     * software or modifications or derivatives thereof.
14 :     *
15 :     * This program is free software; you can redistribute it and/or modify
16 :     * it under the terms of the GNU General Public License as published by
17 :     * the Free Software Foundation; either version 2 of the License, or
18 :     * (at your option) any later version.
19 :     *
20 :     * This program is distributed in the hope that it will be useful,
21 :     * but WITHOUT ANY WARRANTY; without even the implied warranty of
22 :     * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
23 :     * GNU General Public License for more details.
24 :     *
25 :     * You should have received a copy of the GNU General Public License
26 :     * along with this program; if not, write to the Free Software
27 :     * Foundation, Inc., 675 Mass Ave, Cambridge, MA 02139, USA.
28 :     *
29 :     *************************************************************************/
30 :    
31 : Isibaar 3 #include <assert.h>
32 :     #include <stdio.h>
33 : chl 96 #include <stdlib.h>
34 : Isibaar 3
35 :     #include "../encoder.h"
36 :     #include "../utils/mbfunctions.h"
37 :     #include "../prediction/mbprediction.h"
38 :     #include "../global.h"
39 :     #include "../utils/timer.h"
40 : chl 530 #include "motion_est.h"
41 : suxen_drol 118 #include "motion.h"
42 : Isibaar 3 #include "sad.h"
43 : Isibaar 539 #include "../utils/emms.h"
44 : Isibaar 3
/*
 * Skip-decision thresholds.
 * INITIAL_SKIP_THRESH, MAX_SAD00_FOR_SKIP and MAX_CHROMA_SAD_FOR_SKIP are
 * each multiplied by the macroblock quantiser before being compared with a
 * SAD value (see MotionEstimation() and SkipDecisionP()).
 * FINAL_SKIP_THRESH is compared with the ratio 100*sad16/(sad00+1), i.e. a
 * percentage.  SKIP_THRESH_B is not referenced in the part of the file
 * documented here.
 */
45 : chl 530 #define INITIAL_SKIP_THRESH (10)
46 :     #define FINAL_SKIP_THRESH (50)
47 :     #define MAX_SAD00_FOR_SKIP (20)
48 : Isibaar 539 #define MAX_CHROMA_SAD_FOR_SKIP (22)
49 :     #define SKIP_THRESH_B (25)
50 : Isibaar 3
/*
 * CHECK_CANDIDATE(X, Y, D): evaluate the vector (X, Y) through the
 * CheckCandidate function pointer, tagging it with direction mask D.
 * The expansion is a braced block that uses two names from the call site:
 * a local int `iDirection` (its address is passed and receives D when the
 * candidate is accepted) and a SearchData pointer called `data`.
 */
51 : chl 530 #define CHECK_CANDIDATE(X,Y,D) { \
52 :     (*CheckCandidate)((const int)(X),(const int)(Y), (D), &iDirection, data ); }
53 : Isibaar 3
/* Step, in motion-vector units, used by the search patterns and make_mask()
 * (presumably one full pixel in half-pel units -- confirm). */
54 : chl 530 #define iDiamondSize 2
55 : chl 141
56 : chl 530 static __inline int
57 :     d_mv_bits(int x, int y, const uint32_t iFcode)
58 : Isibaar 3 {
59 : chl 530 int xb, yb;
60 :    
61 :     if (x == 0) xb = 1;
62 :     else {
63 :     if (x < 0) x = -x;
64 :     x += (1 << (iFcode - 1)) - 1;
65 :     x >>= (iFcode - 1);
66 :     if (x > 32) x = 32;
67 :     xb = mvtab[x] + iFcode;
68 : edgomez 195 }
69 : Isibaar 3
70 : chl 530 if (y == 0) yb = 1;
71 :     else {
72 :     if (y < 0) y = -y;
73 :     y += (1 << (iFcode - 1)) - 1;
74 :     y >>= (iFcode - 1);
75 :     if (y > 32) y = 32;
76 :     yb = mvtab[y] + iFcode;
77 :     }
78 :     return xb + yb;
79 : Isibaar 3 }
80 :    
81 :    
82 : Isibaar 539 /* CHECK_CANDIDATE FUNCTIONS START */
83 :    
84 : chl 530 static void
85 :     CheckCandidate16(const int x, const int y, const int Direction, int * const dir, const SearchData * const data)
86 : Isibaar 3 {
87 : chl 530 int32_t * const sad = data->temp;
88 :     int t;
89 :     const uint8_t * Reference;
90 : Isibaar 3
91 : chl 530 if (( x > data->max_dx) || ( x < data->min_dx)
92 :     || ( y > data->max_dy) || (y < data->min_dy)) return;
93 : suxen_drol 136
94 : chl 530 switch ( ((x&1)<<1) + (y&1) ) {
95 :     case 0 : Reference = data->Ref + x/2 + (y/2)*(data->iEdgedWidth); break;
96 :     case 1 : Reference = data->RefV + x/2 + ((y-1)/2)*(data->iEdgedWidth); break;
97 :     case 2 : Reference = data->RefH + (x-1)/2 + (y/2)*(data->iEdgedWidth); break;
98 :     default : Reference = data->RefHV + (x-1)/2 + ((y-1)/2)*(data->iEdgedWidth); break;
99 :     }
100 : chl 259
101 : chl 530 data->temp[0] = sad16v(data->Cur, Reference, data->iEdgedWidth, sad+1);
102 : Isibaar 3
103 : chl 530 t = d_mv_bits(x - data->predMV.x, y - data->predMV.y, data->iFcode);
104 :     data->temp[0] += lambda_vec16[data->iQuant] * t;
105 :     data->temp[1] += lambda_vec8[data->iQuant] * t;
106 : chl 326
107 : chl 530 if (data->temp[0] < data->iMinSAD[0]) {
108 :     data->iMinSAD[0] = data->temp[0];
109 :     data->currentMV[0].x = x; data->currentMV[0].y = y;
110 :     *dir = Direction; }
111 : chl 184
112 : chl 530 if (data->temp[1] < data->iMinSAD[1]) {
113 :     data->iMinSAD[1] = data->temp[1]; data->currentMV[1].x = x; data->currentMV[1].y = y; }
114 :     if (data->temp[2] < data->iMinSAD[2]) {
115 :     data->iMinSAD[2] = data->temp[2]; data->currentMV[2].x = x; data->currentMV[2].y = y; }
116 :     if (data->temp[3] < data->iMinSAD[3]) {
117 :     data->iMinSAD[3] = data->temp[3]; data->currentMV[3].x = x; data->currentMV[3].y = y; }
118 :     if (data->temp[4] < data->iMinSAD[4]) {
119 :     data->iMinSAD[4] = data->temp[4]; data->currentMV[4].x = x; data->currentMV[4].y = y; }
120 : chl 184
121 : Isibaar 3 }
122 :    
123 : chl 530 static void
124 :     CheckCandidate16no4v(const int x, const int y, const int Direction, int * const dir, const SearchData * const data)
125 :     {
126 :     int32_t sad;
127 :     const uint8_t * Reference;
128 : chl 326
129 : chl 530 if (( x > data->max_dx) || ( x < data->min_dx)
130 :     || ( y > data->max_dy) || (y < data->min_dy)) return;
131 : Isibaar 3
132 : chl 530 switch ( ((x&1)<<1) + (y&1) )
133 :     {
134 :     case 0 : Reference = data->Ref + x/2 + (y/2)*(data->iEdgedWidth); break;
135 :     case 1 : Reference = data->RefV + x/2 + ((y-1)/2)*(data->iEdgedWidth); break;
136 :     case 2 : Reference = data->RefH + (x-1)/2 + (y/2)*(data->iEdgedWidth); break;
137 :     default : Reference = data->RefHV + (x-1)/2 + ((y-1)/2)*(data->iEdgedWidth); break;
138 :     }
139 : Isibaar 3
140 : chl 530 sad = lambda_vec16[data->iQuant] *
141 :     d_mv_bits(x - data->predMV.x, y - data->predMV.y, data->iFcode);
142 :     sad += sad16(data->Cur, Reference, data->iEdgedWidth, 256*4096);
143 : Isibaar 3
144 : chl 530 if (sad < *(data->iMinSAD)) {
145 :     *(data->iMinSAD) = sad;
146 :     data->currentMV[0].x = x; data->currentMV[0].y = y;
147 :     *dir = Direction; }
148 : Isibaar 3 }
149 :    
150 : chl 530 static void
151 : Isibaar 539 CheckCandidate16no4vI(const int x, const int y, const int Direction, int * const dir, const SearchData * const data)
152 :     {
153 :     int32_t sad;
154 :    
155 :     if (( x > data->max_dx) || ( x < data->min_dx)
156 :     || ( y > data->max_dy) || (y < data->min_dy)) return;
157 :    
158 :     sad = lambda_vec16[data->iQuant] *
159 :     d_mv_bits(x - data->predMV.x, y - data->predMV.y, data->iFcode);
160 :    
161 :     sad += sad16(data->Cur, data->Ref + x/2 + (y/2)*(data->iEdgedWidth),
162 :     data->iEdgedWidth, 256*4096);
163 :    
164 :     if (sad < *(data->iMinSAD)) {
165 :     *(data->iMinSAD) = sad;
166 :     data->currentMV[0].x = x; data->currentMV[0].y = y;
167 :     *dir = Direction; }
168 :     }
169 :    
170 :    
171 :     static void
172 : chl 530 CheckCandidateInt(const int xf, const int yf, const int Direction, int * const dir, const SearchData * const data)
173 :     {
174 :     int32_t sad;
175 :     const int xb = data->currentMV[1].x;
176 :     const int yb = data->currentMV[1].y;
177 :     const uint8_t *ReferenceF, *ReferenceB;
178 : Isibaar 3
179 : chl 530 if (( xf > data->max_dx) || ( xf < data->min_dx)
180 :     || ( yf > data->max_dy) || (yf < data->min_dy)) return;
181 : Isibaar 3
182 : chl 530 switch ( ((xf&1)<<1) + (yf&1) ) {
183 :     case 0 : ReferenceF = data->Ref + xf/2 + (yf/2)*(data->iEdgedWidth); break;
184 :     case 1 : ReferenceF = data->RefV + xf/2 + ((yf-1)/2)*(data->iEdgedWidth); break;
185 :     case 2 : ReferenceF = data->RefH + (xf-1)/2 + (yf/2)*(data->iEdgedWidth); break;
186 :     default : ReferenceF = data->RefHV + (xf-1)/2 + ((yf-1)/2)*(data->iEdgedWidth); break;
187 :     }
188 : edgomez 195
189 : chl 530 switch ( ((xb&1)<<1) + (yb&1) ) {
190 :     case 0 : ReferenceB = data->bRef + xb/2 + (yb/2)*(data->iEdgedWidth); break;
191 :     case 1 : ReferenceB = data->bRefV + xb/2 + ((yb-1)/2)*(data->iEdgedWidth); break;
192 :     case 2 : ReferenceB = data->bRefH + (xb-1)/2 + (yb/2)*(data->iEdgedWidth); break;
193 :     default : ReferenceB = data->bRefHV + (xb-1)/2 + ((yb-1)/2)*(data->iEdgedWidth); break;
194 :     }
195 : Isibaar 3
196 : chl 530 sad = lambda_vec16[data->iQuant] *
197 :     ( d_mv_bits(xf - data->predMV.x, yf - data->predMV.y, data->iFcode) +
198 :     d_mv_bits(xb - data->bpredMV.x, yb - data->bpredMV.y, data->iFcode) );
199 : Isibaar 3
200 : chl 530 sad += sad16bi(data->Cur, ReferenceF, ReferenceB, data->iEdgedWidth);
201 : Isibaar 3
202 : chl 530 if (sad < *(data->iMinSAD)) {
203 :     *(data->iMinSAD) = sad;
204 :     data->currentMV->x = xf; data->currentMV->y = yf;
205 :     *dir = Direction; }
206 : Isibaar 3 }
207 :    
208 : chl 530 static void
209 :     CheckCandidateDirect(const int x, const int y, const int Direction, int * const dir, const SearchData * const data)
210 : Isibaar 3 {
211 : chl 530 int32_t sad;
212 :     int k;
213 :     const uint8_t *ReferenceF;
214 :     const uint8_t *ReferenceB;
215 :     VECTOR mvs, b_mvs;
216 : Isibaar 3
217 : chl 530 if (( x > 31) || ( x < -32) || ( y > 31) || (y < -32)) return;
218 : Isibaar 3
219 : chl 530 sad = lambda_vec16[data->iQuant] * d_mv_bits(x, y, 1);
220 : Isibaar 3
221 : chl 530 for (k = 0; k < 4; k++) {
222 :     mvs.x = data->directmvF[k].x + x;
223 :     b_mvs.x = ((x == 0) ?
224 :     data->directmvB[k].x
225 :     : mvs.x - data->referencemv[k].x);
226 : Isibaar 3
227 : chl 530 mvs.y = data->directmvF[k].y + y;
228 :     b_mvs.y = ((y == 0) ?
229 :     data->directmvB[k].y
230 :     : mvs.y - data->referencemv[k].y);
231 :    
232 :     if (( mvs.x > data->max_dx ) || ( mvs.x < data->min_dx )
233 :     || ( mvs.y > data->max_dy ) || ( mvs.y < data->min_dy )
234 :     || ( b_mvs.x > data->max_dx ) || ( b_mvs.x < data->min_dx )
235 :     || ( b_mvs.y > data->max_dy ) || ( b_mvs.y < data->min_dy )) return;
236 : Isibaar 3
237 : chl 530 switch ( ((mvs.x&1)<<1) + (mvs.y&1) ) {
238 :     case 0 : ReferenceF = data->Ref + mvs.x/2 + (mvs.y/2)*(data->iEdgedWidth); break;
239 :     case 1 : ReferenceF = data->RefV + mvs.x/2 + ((mvs.y-1)/2)*(data->iEdgedWidth); break;
240 :     case 2 : ReferenceF = data->RefH + (mvs.x-1)/2 + (mvs.y/2)*(data->iEdgedWidth); break;
241 :     default : ReferenceF = data->RefHV + (mvs.x-1)/2 + ((mvs.y-1)/2)*(data->iEdgedWidth); break;
242 :     }
243 : Isibaar 3
244 : chl 530 switch ( ((b_mvs.x&1)<<1) + (b_mvs.y&1) ) {
245 :     case 0 : ReferenceB = data->bRef + b_mvs.x/2 + (b_mvs.y/2)*(data->iEdgedWidth); break;
246 :     case 1 : ReferenceB = data->bRefV + b_mvs.x/2 + ((b_mvs.y-1)/2)*(data->iEdgedWidth); break;
247 :     case 2 : ReferenceB = data->bRefH + (b_mvs.x-1)/2 + (b_mvs.y/2)*(data->iEdgedWidth); break;
248 :     default : ReferenceB = data->bRefHV + (b_mvs.x-1)/2 + ((b_mvs.y-1)/2)*(data->iEdgedWidth); break;
249 : chl 344 }
250 : chl 530
251 :     sad += sad8bi(data->Cur + 8*(k&1) + 8*(k>>1)*(data->iEdgedWidth),
252 :     ReferenceF + 8*(k&1) + 8*(k>>1)*(data->iEdgedWidth),
253 :     ReferenceB + 8*(k&1) + 8*(k>>1)*(data->iEdgedWidth),
254 :     data->iEdgedWidth);
255 :     if (sad > *(data->iMinSAD)) return;
256 : edgomez 78 }
257 : chl 530
258 :     if (sad < *(data->iMinSAD)) {
259 :     *(data->iMinSAD) = sad;
260 :     data->currentMV->x = x; data->currentMV->y = y;
261 :     *dir = Direction; }
262 : Isibaar 3 }
263 :    
264 : chl 530 static void
265 :     CheckCandidateDirectno4v(const int x, const int y, const int Direction, int * const dir, const SearchData * const data)
266 : chl 96 {
267 : chl 530 int32_t sad;
268 :     const uint8_t *ReferenceF;
269 :     const uint8_t *ReferenceB;
270 :     VECTOR mvs, b_mvs;
271 : chl 96
272 : chl 530 if (( x > 31) || ( x < -31) || ( y > 31) || (y < -31)) return;
273 :    
274 :     sad = lambda_vec16[data->iQuant] * d_mv_bits(x, y, 1);
275 : edgomez 195
276 : chl 530 mvs.x = data->directmvF[0].x + x;
277 :     b_mvs.x = ((x == 0) ?
278 :     data->directmvB[0].x
279 :     : mvs.x - data->referencemv[0].x);
280 : edgomez 195
281 : chl 530 mvs.y = data->directmvF[0].y + y;
282 :     b_mvs.y = ((y == 0) ?
283 :     data->directmvB[0].y
284 :     : mvs.y - data->referencemv[0].y);
285 :    
286 :     if (( mvs.x > data->max_dx ) || ( mvs.x < data->min_dx )
287 :     || ( mvs.y > data->max_dy ) || ( mvs.y < data->min_dy )
288 :     || ( b_mvs.x > data->max_dx ) || ( b_mvs.x < data->min_dx )
289 :     || ( b_mvs.y > data->max_dy ) || ( b_mvs.y < data->min_dy )) return;
290 : chl 96
291 : chl 530 switch ( ((mvs.x&1)<<1) + (mvs.y&1) ) {
292 :     case 0 : ReferenceF = data->Ref + mvs.x/2 + (mvs.y/2)*(data->iEdgedWidth); break;
293 :     case 1 : ReferenceF = data->RefV + mvs.x/2 + ((mvs.y-1)/2)*(data->iEdgedWidth); break;
294 :     case 2 : ReferenceF = data->RefH + (mvs.x-1)/2 + (mvs.y/2)*(data->iEdgedWidth); break;
295 :     default : ReferenceF = data->RefHV + (mvs.x-1)/2 + ((mvs.y-1)/2)*(data->iEdgedWidth); break;
296 :     }
297 : chl 96
298 : chl 530 switch ( ((b_mvs.x&1)<<1) + (b_mvs.y&1) ) {
299 :     case 0 : ReferenceB = data->bRef + b_mvs.x/2 + (b_mvs.y/2)*(data->iEdgedWidth); break;
300 :     case 1 : ReferenceB = data->bRefV + b_mvs.x/2 + ((b_mvs.y-1)/2)*(data->iEdgedWidth); break;
301 :     case 2 : ReferenceB = data->bRefH + (b_mvs.x-1)/2 + (b_mvs.y/2)*(data->iEdgedWidth); break;
302 :     default : ReferenceB = data->bRefHV + (b_mvs.x-1)/2 + ((b_mvs.y-1)/2)*(data->iEdgedWidth); break;
303 :     }
304 :    
305 :     sad += sad16bi(data->Cur, ReferenceF, ReferenceB, data->iEdgedWidth);
306 : chl 96
307 : chl 530 if (sad < *(data->iMinSAD)) {
308 :     *(data->iMinSAD) = sad;
309 :     data->currentMV->x = x; data->currentMV->y = y;
310 :     *dir = Direction; }
311 :     }
312 : chl 96
313 : chl 530 static void
314 :     CheckCandidate8(const int x, const int y, const int Direction, int * const dir, const SearchData * const data)
315 :     {
316 :     int32_t sad;
317 :     const uint8_t * Reference;
318 : edgomez 195
319 : chl 530 if (( x > data->max_dx) || ( x < data->min_dx)
320 :     || ( y > data->max_dy) || (y < data->min_dy)) return;
321 : chl 96
322 : chl 530 switch ( ((x&1)<<1) + (y&1) )
323 :     {
324 :     case 0 : Reference = data->Ref + x/2 + (y/2)*(data->iEdgedWidth); break;
325 :     case 1 : Reference = data->RefV + x/2 + ((y-1)/2)*(data->iEdgedWidth); break;
326 :     case 2 : Reference = data->RefH + (x-1)/2 + (y/2)*(data->iEdgedWidth); break;
327 :     default : Reference = data->RefHV + (x-1)/2 + ((y-1)/2)*(data->iEdgedWidth); break;
328 :     }
329 : edgomez 195
330 : chl 530 sad = sad8(data->Cur, Reference, data->iEdgedWidth);
331 :     sad += lambda_vec8[data->iQuant] * d_mv_bits(x - data->predMV.x, y - data->predMV.y, data->iFcode);
332 : edgomez 195
333 : chl 530 if (sad < *(data->iMinSAD)) {
334 :     *(data->iMinSAD) = sad;
335 :     data->currentMV->x = x; data->currentMV->y = y;
336 :     *dir = Direction; }
337 : chl 96 }
338 :    
339 : Isibaar 539 /* CHECK_CANDIDATE FUNCTIONS END */
340 : chl 96
341 : chl 530 /* MAINSEARCH FUNCTIONS START */
342 : edgomez 195
343 : chl 530 static void
344 :     AdvDiamondSearch(int x, int y, const SearchData * const data, int bDirection)
345 : chl 181 {
346 :    
347 :     /* directions: 1 - left (x-1); 2 - right (x+1), 4 - up (y-1); 8 - down (y+1) */
348 :    
349 : chl 530 int iDirection;
350 : edgomez 195
351 :     do {
352 : chl 181 iDirection = 0;
353 : chl 530 if (bDirection & 1) CHECK_CANDIDATE(x - iDiamondSize, y, 1);
354 :     if (bDirection & 2) CHECK_CANDIDATE(x + iDiamondSize, y, 2);
355 :     if (bDirection & 4) CHECK_CANDIDATE(x, y - iDiamondSize, 4);
356 :     if (bDirection & 8) CHECK_CANDIDATE(x, y + iDiamondSize, 8);
357 : chl 181
358 :     /* now we're doing diagonal checks near our candidate */
359 :    
360 : chl 530 if (iDirection) { //checking if anything found
361 : chl 181 bDirection = iDirection;
362 :     iDirection = 0;
363 : chl 530 x = data->currentMV->x; y = data->currentMV->y;
364 :     if (bDirection & 3) { //our candidate is left or right
365 :     CHECK_CANDIDATE(x, y + iDiamondSize, 8);
366 :     CHECK_CANDIDATE(x, y - iDiamondSize, 4);
367 :     } else { // what remains here is up or down
368 :     CHECK_CANDIDATE(x + iDiamondSize, y, 2);
369 :     CHECK_CANDIDATE(x - iDiamondSize, y, 1); }
370 : chl 181
371 : edgomez 195 if (iDirection) {
372 :     bDirection += iDirection;
373 : chl 530 x = data->currentMV->x; y = data->currentMV->y; }
374 :     } else { //about to quit, eh? not so fast....
375 : edgomez 195 switch (bDirection) {
376 : chl 181 case 2:
377 : chl 530 CHECK_CANDIDATE(x + iDiamondSize, y - iDiamondSize, 2 + 4);
378 :     CHECK_CANDIDATE(x + iDiamondSize, y + iDiamondSize, 2 + 8);
379 : chl 181 break;
380 :     case 1:
381 : chl 530 CHECK_CANDIDATE(x - iDiamondSize, y - iDiamondSize, 1 + 4);
382 :     CHECK_CANDIDATE(x - iDiamondSize, y + iDiamondSize, 1 + 8);
383 : chl 181 break;
384 : edgomez 195 case 2 + 4:
385 : chl 530 CHECK_CANDIDATE(x - iDiamondSize, y - iDiamondSize, 1 + 4);
386 :     CHECK_CANDIDATE(x + iDiamondSize, y - iDiamondSize, 2 + 4);
387 :     CHECK_CANDIDATE(x + iDiamondSize, y + iDiamondSize, 2 + 8);
388 : chl 181 break;
389 :     case 4:
390 : chl 530 CHECK_CANDIDATE(x + iDiamondSize, y - iDiamondSize, 2 + 4);
391 :     CHECK_CANDIDATE(x - iDiamondSize, y - iDiamondSize, 1 + 4);
392 : chl 181 break;
393 :     case 8:
394 : chl 530 CHECK_CANDIDATE(x + iDiamondSize, y + iDiamondSize, 2 + 8);
395 :     CHECK_CANDIDATE(x - iDiamondSize, y + iDiamondSize, 1 + 8);
396 : chl 181 break;
397 : edgomez 195 case 1 + 4:
398 : chl 530 CHECK_CANDIDATE(x - iDiamondSize, y + iDiamondSize, 1 + 8);
399 :     CHECK_CANDIDATE(x - iDiamondSize, y - iDiamondSize, 1 + 4);
400 :     CHECK_CANDIDATE(x + iDiamondSize, y - iDiamondSize, 2 + 4);
401 : chl 181 break;
402 : edgomez 195 case 2 + 8:
403 : chl 530 CHECK_CANDIDATE(x - iDiamondSize, y - iDiamondSize, 1 + 4);
404 :     CHECK_CANDIDATE(x - iDiamondSize, y + iDiamondSize, 1 + 8);
405 :     CHECK_CANDIDATE(x + iDiamondSize, y + iDiamondSize, 2 + 8);
406 : chl 181 break;
407 : edgomez 195 case 1 + 8:
408 : chl 530 CHECK_CANDIDATE(x + iDiamondSize, y - iDiamondSize, 2 + 4);
409 :     CHECK_CANDIDATE(x + iDiamondSize, y + iDiamondSize, 2 + 8);
410 :     CHECK_CANDIDATE(x - iDiamondSize, y + iDiamondSize, 1 + 8);
411 : chl 181 break;
412 : edgomez 195 default: //1+2+4+8 == we didn't find anything at all
413 : chl 530 CHECK_CANDIDATE(x - iDiamondSize, y - iDiamondSize, 1 + 4);
414 :     CHECK_CANDIDATE(x - iDiamondSize, y + iDiamondSize, 1 + 8);
415 :     CHECK_CANDIDATE(x + iDiamondSize, y - iDiamondSize, 2 + 4);
416 :     CHECK_CANDIDATE(x + iDiamondSize, y + iDiamondSize, 2 + 8);
417 : chl 181 break;
418 :     }
419 : chl 530 if (!iDirection) break; //ok, the end. really
420 :     bDirection = iDirection;
421 :     x = data->currentMV->x; y = data->currentMV->y;
422 : chl 181 }
423 :     }
424 : edgomez 195 while (1); //forever
425 : chl 181 }
426 :    
427 : chl 530 static void
428 :     SquareSearch(int x, int y, const SearchData * const data, int bDirection)
429 : chl 326 {
430 : chl 530 int iDirection;
431 : chl 326
432 : chl 530 do {
433 :     iDirection = 0;
434 :     if (bDirection & 1) CHECK_CANDIDATE(x - iDiamondSize, y, 1+16+64);
435 :     if (bDirection & 2) CHECK_CANDIDATE(x + iDiamondSize, y, 2+32+128);
436 :     if (bDirection & 4) CHECK_CANDIDATE(x, y - iDiamondSize, 4+16+32);
437 :     if (bDirection & 8) CHECK_CANDIDATE(x, y + iDiamondSize, 8+64+128);
438 :     if (bDirection & 16) CHECK_CANDIDATE(x - iDiamondSize, y - iDiamondSize, 1+4+16+32+64);
439 :     if (bDirection & 32) CHECK_CANDIDATE(x + iDiamondSize, y - iDiamondSize, 2+4+16+32+128);
440 :     if (bDirection & 64) CHECK_CANDIDATE(x - iDiamondSize, y + iDiamondSize, 1+8+16+64+128);
441 :     if (bDirection & 128) CHECK_CANDIDATE(x + iDiamondSize, y + iDiamondSize, 2+8+32+64+128);
442 : chl 326
443 : chl 530 bDirection = iDirection;
444 :     x = data->currentMV->x; y = data->currentMV->y;
445 :     } while (iDirection);
446 : chl 346 }
447 :    
448 : chl 530 static void
449 :     DiamondSearch(int x, int y, const SearchData * const data, int bDirection)
450 : chl 346 {
451 :    
452 : chl 181 /* directions: 1 - left (x-1); 2 - right (x+1), 4 - up (y-1); 8 - down (y+1) */
453 :    
454 : chl 530 int iDirection;
455 : edgomez 195
456 :     do {
457 : chl 181 iDirection = 0;
458 : chl 530 if (bDirection & 1) CHECK_CANDIDATE(x - iDiamondSize, y, 1);
459 :     if (bDirection & 2) CHECK_CANDIDATE(x + iDiamondSize, y, 2);
460 :     if (bDirection & 4) CHECK_CANDIDATE(x, y - iDiamondSize, 4);
461 :     if (bDirection & 8) CHECK_CANDIDATE(x, y + iDiamondSize, 8);
462 : chl 181
463 :     /* now we're doing diagonal checks near our candidate */
464 :    
465 : chl 530 if (iDirection) { //checking if anything found
466 : chl 181 bDirection = iDirection;
467 :     iDirection = 0;
468 : chl 530 x = data->currentMV->x; y = data->currentMV->y;
469 :     if (bDirection & 3) { //our candidate is left or right
470 :     CHECK_CANDIDATE(x, y + iDiamondSize, 8);
471 :     CHECK_CANDIDATE(x, y - iDiamondSize, 4);
472 :     } else { // what remains here is up or down
473 :     CHECK_CANDIDATE(x + iDiamondSize, y, 2);
474 :     CHECK_CANDIDATE(x - iDiamondSize, y, 1); }
475 : chl 181
476 : chl 530 bDirection += iDirection;
477 :     x = data->currentMV->x; y = data->currentMV->y;
478 : chl 181 }
479 :     }
480 : chl 530 while (iDirection);
481 : chl 181 }
482 :    
483 : chl 530 /* MAINSEARCH FUNCTIONS END */
484 : chl 181
485 : chl 530 /* HALFPELREFINE COULD BE A MAINSEARCH FUNCTION, BUT THERE IS NO NEED FOR IT */
486 :    
487 :     static void
488 :     HalfpelRefine(const SearchData * const data)
489 : chl 96 {
490 : chl 530 /* Do a half-pel refinement (or rather a "smallest possible amount" refinement) */
491 : edgomez 195
492 : chl 530 VECTOR backupMV = *(data->currentMV);
493 :     int iDirection; //not needed
494 : chl 96
495 : chl 530 CHECK_CANDIDATE(backupMV.x - 1, backupMV.y - 1, 0);
496 :     CHECK_CANDIDATE(backupMV.x + 1, backupMV.y - 1, 0);
497 :     CHECK_CANDIDATE(backupMV.x - 1, backupMV.y + 1, 0);
498 :     CHECK_CANDIDATE(backupMV.x + 1, backupMV.y + 1, 0);
499 : edgomez 195
500 : chl 530 CHECK_CANDIDATE(backupMV.x - 1, backupMV.y, 0);
501 :     CHECK_CANDIDATE(backupMV.x + 1, backupMV.y, 0);
502 :    
503 :     CHECK_CANDIDATE(backupMV.x, backupMV.y + 1, 0);
504 :     CHECK_CANDIDATE(backupMV.x, backupMV.y - 1, 0);
505 : chl 96 }
506 :    
507 : chl 530 static __inline int
508 :     SkipDecisionP(const IMAGE * current, const IMAGE * reference,
509 :     const int x, const int y,
510 :     const uint32_t iEdgedWidth, const uint32_t iQuant)
511 : chl 96
512 : Isibaar 3 {
513 : chl 530 /* keep repeating checks for all b-frames before this P frame,
514 :     to make sure that SKIP is possible (todo)
515 :     how: if skip is not possible set sad00 to a very high value */
516 : Isibaar 3
517 : chl 530 uint32_t sadC = sad8(current->u + x*8 + y*(iEdgedWidth/2)*8,
518 :     reference->u + x*8 + y*(iEdgedWidth/2)*8, iEdgedWidth/2);
519 :     if (sadC > iQuant * MAX_CHROMA_SAD_FOR_SKIP) return 0;
520 : h 545 sadC += sad8(current->v + (x + y*(iEdgedWidth/2))*8,
521 :     reference->v + (x + y*(iEdgedWidth/2))*8, iEdgedWidth/2);
522 : chl 530 if (sadC > iQuant * MAX_CHROMA_SAD_FOR_SKIP) return 0;
523 : edgomez 195
524 : chl 530 return 1;
525 :     }
526 : edgomez 195
527 : chl 530 static __inline void
528 :     SkipMacroblockP(MACROBLOCK *pMB, const int32_t sad)
529 :     {
530 :     pMB->mode = MODE_NOT_CODED;
531 : Isibaar 539 pMB->mvs[0].x = pMB->mvs[1].x = pMB->mvs[2].x = pMB->mvs[3].x = 0;
532 :     pMB->mvs[0].y = pMB->mvs[1].y = pMB->mvs[2].y = pMB->mvs[3].y = 0;
533 : chl 530 pMB->sad16 = pMB->sad8[0] = pMB->sad8[1] = pMB->sad8[2] = pMB->sad8[3] = sad;
534 : Isibaar 3 }
535 :    
536 : chl 530 bool
537 :     MotionEstimation(MBParam * const pParam,
538 :     FRAMEINFO * const current,
539 :     FRAMEINFO * const reference,
540 :     const IMAGE * const pRefH,
541 :     const IMAGE * const pRefV,
542 :     const IMAGE * const pRefHV,
543 :     const uint32_t iLimit)
544 : Isibaar 3 {
545 : chl 530 MACROBLOCK *const pMBs = current->mbs;
546 :     const IMAGE *const pCurrent = &current->image;
547 :     const IMAGE *const pRef = &reference->image;
548 : Isibaar 3
549 : chl 530 const VECTOR zeroMV = { 0, 0 };
550 : Isibaar 3
551 : chl 530 uint32_t x, y;
552 :     uint32_t iIntra = 0;
553 :     int32_t InterBias;
554 : edgomez 195
555 : Isibaar 539 // some pre-initialized thingies for SearchP
556 :     int32_t temp[5];
557 :     VECTOR currentMV[5];
558 :     int32_t iMinSAD[5];
559 :     SearchData Data;
560 :     Data.iEdgedWidth = pParam->edged_width;
561 :     Data.currentMV = currentMV;
562 :     Data.iMinSAD = iMinSAD;
563 :     Data.temp = temp;
564 :     Data.iFcode = current->fcode;
565 :    
566 : chl 530 if (sadInit) (*sadInit) ();
567 : edgomez 195
568 : chl 530 for (y = 0; y < pParam->mb_height; y++) {
569 :     for (x = 0; x < pParam->mb_width; x++) {
570 : Isibaar 3
571 : chl 530 MACROBLOCK *pMB = &pMBs[x + y * pParam->mb_width];
572 :     int32_t sad00 = pMB->sad16
573 :     = sad16v(pCurrent->y + (x + y * pParam->edged_width) * 16,
574 :     pRef->y + (x + y * pParam->edged_width) * 16,
575 :     pParam->edged_width, pMB->sad8 );
576 : edgomez 195
577 : chl 530 if (!(current->global_flags & XVID_LUMIMASKING)) {
578 :     pMB->dquant = NO_CHANGE;
579 :     pMB->quant = current->quant; }
580 : chl 181
581 : chl 530 //initial skip decision
582 : Isibaar 3
583 : chl 530 if ((pMB->dquant == NO_CHANGE) && (sad00 <= MAX_SAD00_FOR_SKIP * pMB->quant)
584 :     && (SkipDecisionP(pCurrent, pRef, x, y, pParam->edged_width, pMB->quant)) ) {
585 :     if (pMB->sad16 < pMB->quant * INITIAL_SKIP_THRESH) {
586 :     SkipMacroblockP(pMB, sad00);
587 :     continue;
588 :     }
589 :     } else sad00 = 256*4096; // skip not allowed - for final skip decision
590 : Isibaar 3
591 : chl 530 SearchP(pRef->y, pRefH->y, pRefV->y, pRefHV->y, pCurrent, x,
592 :     y, current->motion_flags, pMB->quant,
593 : Isibaar 539 &Data, pParam, pMBs, reference->mbs,
594 : chl 530 current->global_flags & XVID_INTER4V, pMB);
595 : edgomez 195
596 : chl 530 /* final skip decision, a.k.a. "the vector you found, really that good?" */
597 :     if (sad00 < pMB->quant * MAX_SAD00_FOR_SKIP)
598 :     if ((100*pMB->sad16)/(sad00+1) > FINAL_SKIP_THRESH)
599 :     { SkipMacroblockP(pMB, sad00); continue; }
600 :    
601 :     /* finally, intra decision */
602 : Isibaar 3
603 : chl 530 InterBias = MV16_INTER_BIAS;
604 :     if (pMB->quant > 8) InterBias += 50 * (pMB->quant - 8); // to make high quants work
605 :     if (y != 0)
606 :     if ((pMB - pParam->mb_width)->mode == MODE_INTER ) InterBias -= 50;
607 :     if (x != 0)
608 :     if ((pMB - 1)->mode == MODE_INTER ) InterBias -= 50;
609 : Isibaar 3
610 : chl 530 if (InterBias < pMB->sad16) {
611 :     const int32_t deviation =
612 :     dev16(pCurrent->y + (x + y * pParam->edged_width) * 16,
613 :     pParam->edged_width);
614 : Isibaar 3
615 : chl 530 if (deviation < (pMB->sad16 - InterBias)) {
616 :     if (++iIntra >= iLimit) return 1;
617 :     pMB->mode = MODE_INTRA;
618 : Isibaar 539 pMB->mvs[0] = pMB->mvs[1] = pMB->mvs[2] =
619 :     pMB->mvs[3] = zeroMV;
620 : chl 530 pMB->sad16 = pMB->sad8[0] = pMB->sad8[1] = pMB->sad8[2] =
621 :     pMB->sad8[3] = 0;
622 :     }
623 :     }
624 :     }
625 : Isibaar 3 }
626 : chl 530 return 0;
627 :     }
628 : Isibaar 3
629 : edgomez 195
630 : chl 530 #define PMV_HALFPEL16 (PMV_HALFPELDIAMOND16|PMV_HALFPELREFINE16)
631 : Isibaar 3
632 : chl 530 static __inline int
633 :     make_mask(const VECTOR * const pmv, const int i)
634 :     {
635 : Isibaar 539 int mask = 255, j;
636 : chl 530 for (j = 0; j < i; j++) {
637 :     if (MVequal(pmv[i], pmv[j])) return 0; // same vector has been checked already
638 :     if (pmv[i].x == pmv[j].x) {
639 :     if (pmv[i].y == pmv[j].y + iDiamondSize) { mask &= ~4; continue; }
640 :     if (pmv[i].y == pmv[j].y - iDiamondSize) { mask &= ~8; continue; }
641 :     } else
642 :     if (pmv[i].y == pmv[j].y) {
643 :     if (pmv[i].x == pmv[j].x + iDiamondSize) { mask &= ~1; continue; }
644 :     if (pmv[i].x == pmv[j].x - iDiamondSize) { mask &= ~2; continue; }
645 :     }
646 : Isibaar 3 }
647 : chl 530 return mask;
648 :     }
649 : edgomez 195
650 : chl 530 static __inline void
651 :     PreparePredictionsP(VECTOR * const pmv, int x, int y, const int iWcount,
652 :     const int iHcount, const MACROBLOCK * const prevMB)
653 :     {
654 : edgomez 195
655 : chl 530 //this function depends on get_pmvdata which means that it sucks. It should get the predictions by itself
656 : edgomez 195
657 : chl 530 if ( (y != 0) && (x != (iWcount-1)) ) { // [5] top-right neighbour
658 :     pmv[5].x = EVEN(pmv[3].x);
659 : Isibaar 539 pmv[5].y = EVEN(pmv[3].y);
660 :     } else pmv[5].x = pmv[5].y = 0;
661 : chl 169
662 : chl 530 if (x != 0) { pmv[3].x = EVEN(pmv[1].x); pmv[3].y = EVEN(pmv[1].y); }// pmv[3] is left neighbour
663 :     else pmv[3].x = pmv[3].y = 0;
664 : Isibaar 3
665 : chl 530 if (y != 0) { pmv[4].x = EVEN(pmv[2].x); pmv[4].y = EVEN(pmv[2].y); }// [4] top neighbour
666 :     else pmv[4].x = pmv[4].y = 0;
667 : chl 169
668 : chl 530 // [1] median prediction
669 :     pmv[1].x = EVEN(pmv[0].x); pmv[1].y = EVEN(pmv[0].y);
670 : chl 169
671 : chl 530 pmv[0].x = pmv[0].y = 0; // [0] is zero; not used in the loop (checked before) but needed here for make_mask
672 : chl 169
673 : chl 530 pmv[2].x = EVEN(prevMB->mvs[0].x); // [2] is last frame
674 :     pmv[2].y = EVEN(prevMB->mvs[0].y);
675 : chl 169
676 : chl 530 if ((x != iWcount-1) && (y != iHcount-1)) {
677 :     pmv[6].x = EVEN((prevMB+1+iWcount)->mvs[0].x); //[6] right-down neighbour in last frame
678 : Isibaar 539 pmv[6].y = EVEN((prevMB+1+iWcount)->mvs[0].y);
679 :     } else pmv[6].x = pmv[6].y = 0;
680 : chl 530 }
681 : chl 169
682 : chl 530 static void
683 :     SearchP(const uint8_t * const pRef,
684 :     const uint8_t * const pRefH,
685 :     const uint8_t * const pRefV,
686 :     const uint8_t * const pRefHV,
687 :     const IMAGE * const pCur,
688 :     const int x,
689 :     const int y,
690 :     const uint32_t MotionFlags,
691 :     const uint32_t iQuant,
692 : Isibaar 539 SearchData * const Data,
693 : chl 530 const MBParam * const pParam,
694 :     const MACROBLOCK * const pMBs,
695 :     const MACROBLOCK * const prevMBs,
696 :     int inter4v,
697 :     MACROBLOCK * const pMB)
698 :     {
699 : chl 169
700 : chl 530 int i, iDirection = 255, mask, threshA;
701 : Isibaar 539 VECTOR pmv[7];
702 : Isibaar 3
703 : Isibaar 539 get_pmvdata2(pMBs, pParam->mb_width, 0, x, y, 0, pmv, Data->temp); //has to be changed to get_pmv(2)()
704 :     get_range(&Data->min_dx, &Data->max_dx, &Data->min_dy, &Data->max_dy, x, y, 16,
705 :     pParam->width, pParam->height, Data->iFcode);
706 : Isibaar 3
707 : Isibaar 539 Data->predMV = pmv[0];
708 :     Data->Cur = pCur->y + (x + y * Data->iEdgedWidth) * 16;
709 :     Data->Ref = pRef + (x + Data->iEdgedWidth*y)*16;
710 :     Data->RefH = pRefH + (x + Data->iEdgedWidth*y) * 16;
711 :     Data->RefV = pRefV + (x + Data->iEdgedWidth*y) * 16;
712 :     Data->RefHV = pRefHV + (x + Data->iEdgedWidth*y) * 16;
713 : Isibaar 3
714 : Isibaar 539 Data->iQuant = iQuant;
715 : chl 169
716 : chl 530 if (!(MotionFlags & PMV_HALFPEL16)) {
717 : Isibaar 539 Data->min_dx = EVEN(Data->min_dx);
718 :     Data->max_dx = EVEN(Data->max_dx);
719 :     Data->min_dy = EVEN(Data->min_dy);
720 :     Data->max_dy = EVEN(Data->max_dy); }
721 : edgomez 568
722 :     if (pMB->dquant != NO_CHANGE) inter4v = 0;
723 : edgomez 195
724 : Isibaar 539 if (inter4v) CheckCandidate = CheckCandidate16;
725 :     else CheckCandidate = CheckCandidate16no4v;
726 : chl 169
727 : Isibaar 539 for(i = 0; i < 5; i++) Data->currentMV[i].x = Data->currentMV[i].y = 0;
728 :    
729 :     i = d_mv_bits(Data->predMV.x, Data->predMV.y, Data->iFcode);
730 :     Data->iMinSAD[0] = pMB->sad16 + lambda_vec16[iQuant] * i;
731 :     Data->iMinSAD[1] = pMB->sad8[0] + lambda_vec8[iQuant] * i;
732 :     Data->iMinSAD[2] = pMB->sad8[1];
733 :     Data->iMinSAD[3] = pMB->sad8[2];
734 :     Data->iMinSAD[4] = pMB->sad8[3];
735 :    
736 : chl 530 if ((x == 0) && (y == 0)) threshA = 512;
737 :     else {
738 : edgomez 568 threshA = Data->temp[0]; // that's when we keep this SAD atm
739 : chl 530 if (threshA < 512) threshA = 512;
740 :     if (threshA > 1024) threshA = 1024; }
741 : Isibaar 3
742 : chl 530 PreparePredictionsP(pmv, x, y, pParam->mb_width, pParam->mb_height,
743 :     prevMBs + x + y * pParam->mb_width);
744 : edgomez 195
745 : edgomez 568 if (inter4v) CheckCandidate = CheckCandidate16;
746 :     else CheckCandidate = CheckCandidate16no4v;
747 :    
748 :    
749 : chl 530 /* main loop. checking all predictions */
750 :    
751 :     for (i = 1; i < 7; i++) {
752 :     if (!(mask = make_mask(pmv, i)) ) continue;
753 : edgomez 568 (*CheckCandidate)(pmv[i].x, pmv[i].y, mask, &iDirection, Data);
754 : Isibaar 539 if (Data->iMinSAD[0] <= threshA) break;
755 : chl 530 }
756 :    
757 : Isibaar 539 if ((Data->iMinSAD[0] <= threshA) ||
758 :     (MVequal(Data->currentMV[0], (prevMBs+x+y*pParam->mb_width)->mvs[0]) &&
759 :     (Data->iMinSAD[0] < (prevMBs+x+y*pParam->mb_width)->sad16))) {
760 : chl 530 inter4v = 0;
761 : Isibaar 539 } else {
762 : Isibaar 3
763 : Isibaar 539 MainSearchFunc * MainSearchPtr;
764 :     if (MotionFlags & PMV_USESQUARES16) MainSearchPtr = SquareSearch;
765 :     else if (MotionFlags & PMV_ADVANCEDDIAMOND16) MainSearchPtr = AdvDiamondSearch;
766 :     else MainSearchPtr = DiamondSearch;
767 : chl 181
768 : Isibaar 539 (*MainSearchPtr)(Data->currentMV->x, Data->currentMV->y, Data, iDirection);
769 : Isibaar 3
770 : chl 530 /* extended search, diamond starting in 0,0 and in prediction.
771 :     note that this search is/might be done in halfpel positions,
772 :     which makes it more different than the diamond above */
773 : chl 259
774 : Isibaar 539 if (MotionFlags & PMV_EXTSEARCH16) {
775 :     int32_t bSAD;
776 :     VECTOR startMV = Data->predMV, backupMV = Data->currentMV[0];
777 :     if (!(MotionFlags & PMV_HALFPELREFINE16)) // who's gonna use extsearch and no halfpel?
778 :     startMV.x = EVEN(startMV.x); startMV.y = EVEN(startMV.y);
779 :     if (!(MVequal(startMV, backupMV))) {
780 :     bSAD = Data->iMinSAD[0]; Data->iMinSAD[0] = MV_MAX_ERROR;
781 : Isibaar 3
782 : Isibaar 539 CheckCandidate16(startMV.x, startMV.y, 255, &iDirection, Data);
783 :     (*MainSearchPtr)(startMV.x, startMV.y, Data, 255);
784 :     if (bSAD < Data->iMinSAD[0]) {
785 :     Data->currentMV[0] = backupMV;
786 :     Data->iMinSAD[0] = bSAD; }
787 :     }
788 : Isibaar 3
789 : Isibaar 539 backupMV = Data->currentMV[0];
790 :     if (MotionFlags & PMV_HALFPELREFINE16) startMV.x = startMV.y = 1;
791 :     else startMV.x = startMV.y = 0;
792 :     if (!(MVequal(startMV, backupMV))) {
793 :     bSAD = Data->iMinSAD[0]; Data->iMinSAD[0] = MV_MAX_ERROR;
794 : edgomez 195
795 : Isibaar 539 CheckCandidate16(startMV.x, startMV.y, 255, &iDirection, Data);
796 :     (*MainSearchPtr)(startMV.x, startMV.y, Data, 255);
797 :     if (bSAD < Data->iMinSAD[0]) {
798 :     Data->currentMV[0] = backupMV;
799 :     Data->iMinSAD[0] = bSAD; }
800 :     }
801 : Isibaar 3 }
802 :     }
803 :    
804 : Isibaar 539 if (MotionFlags & PMV_HALFPELREFINE16) HalfpelRefine(Data);
805 : Isibaar 3
806 : Isibaar 539 if (inter4v) {
807 :     SearchData Data8;
808 :     Data8.iFcode = Data->iFcode;
809 :     Data8.iQuant = Data->iQuant;
810 :     Data8.iEdgedWidth = Data->iEdgedWidth;
811 :     Search8(Data, 2*x, 2*y, MotionFlags, pParam, pMB, pMBs, 0, &Data8);
812 :     Search8(Data, 2*x + 1, 2*y, MotionFlags, pParam, pMB, pMBs, 1, &Data8);
813 :     Search8(Data, 2*x, 2*y + 1, MotionFlags, pParam, pMB, pMBs, 2, &Data8);
814 :     Search8(Data, 2*x + 1, 2*y + 1, MotionFlags, pParam, pMB, pMBs, 3, &Data8);
815 :     }
816 : Isibaar 3
817 : chl 530 if (!(inter4v) ||
818 : Isibaar 539 (Data->iMinSAD[0] < Data->iMinSAD[1] + Data->iMinSAD[2] +
819 :     Data->iMinSAD[3] + Data->iMinSAD[4] + IMV16X16 * (int32_t)iQuant )) {
820 : chl 530 // INTER MODE
821 :     pMB->mode = MODE_INTER;
822 : Isibaar 539 pMB->mvs[0] = pMB->mvs[1]
823 :     = pMB->mvs[2] = pMB->mvs[3] = Data->currentMV[0];
824 : Isibaar 3
825 : chl 530 pMB->sad16 = pMB->sad8[0] = pMB->sad8[1] =
826 : Isibaar 539 pMB->sad8[2] = pMB->sad8[3] = Data->iMinSAD[0];
827 : Isibaar 3
828 : Isibaar 539 pMB->pmvs[0].x = Data->currentMV[0].x - Data->predMV.x;
829 :     pMB->pmvs[0].y = Data->currentMV[0].y - Data->predMV.y;
830 : edgomez 195 } else {
831 : chl 530 // INTER4V MODE; all other things are already set in Search8
832 :     pMB->mode = MODE_INTER4V;
833 : Isibaar 539 pMB->sad16 = Data->iMinSAD[1] + Data->iMinSAD[2] +
834 :     Data->iMinSAD[3] + Data->iMinSAD[4] + IMV16X16 * iQuant;
835 : edgomez 78 }
836 : chl 530
837 : Isibaar 3 }
838 :    
839 : chl 530 static void
840 :     Search8(const SearchData * const OldData,
841 :     const int x, const int y,
842 :     const uint32_t MotionFlags,
843 :     const MBParam * const pParam,
844 :     MACROBLOCK * const pMB,
845 :     const MACROBLOCK * const pMBs,
846 : Isibaar 539 const int block,
847 :     SearchData * const Data)
848 : chl 345 {
849 : Isibaar 539 Data->predMV = get_pmv2(pMBs, pParam->mb_width, 0, x/2 , y/2, block);
850 :     Data->iMinSAD = OldData->iMinSAD + 1 + block;
851 :     Data->currentMV = OldData->currentMV + 1 + block;
852 : chl 345
853 : chl 530 if (block != 0)
854 : Isibaar 539 *(Data->iMinSAD) += lambda_vec8[Data->iQuant] *
855 :     d_mv_bits( Data->currentMV->x - Data->predMV.x,
856 :     Data->currentMV->y - Data->predMV.y,
857 :     Data->iFcode);
858 : chl 345
859 : chl 530 if (MotionFlags & (PMV_EXTSEARCH8|PMV_HALFPELREFINE8)) {
860 : chl 345
861 : Isibaar 539 Data->Ref = OldData->Ref + 8 * ((block&1) + pParam->edged_width*(block>>1));
862 :     Data->RefH = OldData->RefH + 8 * ((block&1) + pParam->edged_width*(block>>1));
863 :     Data->RefV = OldData->RefV + 8 * ((block&1) + pParam->edged_width*(block>>1));
864 :     Data->RefHV = OldData->RefHV + 8 * ((block&1) + pParam->edged_width*(block>>1));
865 : chl 345
866 : Isibaar 539 Data->Cur = OldData->Cur + 8 * ((block&1) + pParam->edged_width*(block>>1));
867 : chl 530
868 : Isibaar 539 get_range(&Data->min_dx, &Data->max_dx, &Data->min_dy, &Data->max_dy, x, y, 8,
869 : chl 530 pParam->width, pParam->height, OldData->iFcode);
870 : chl 345
871 : chl 530 CheckCandidate = CheckCandidate8;
872 : chl 345
873 : chl 530 if (MotionFlags & PMV_EXTSEARCH8) {
874 : chl 345
875 : chl 530 MainSearchFunc *MainSearchPtr;
876 :     if (MotionFlags & PMV_USESQUARES8) MainSearchPtr = SquareSearch;
877 :     else if (MotionFlags & PMV_ADVANCEDDIAMOND8) MainSearchPtr = AdvDiamondSearch;
878 :     else MainSearchPtr = DiamondSearch;
879 : chl 345
880 : Isibaar 539 (*MainSearchPtr)(Data->currentMV->x, Data->currentMV->y, Data, 255); }
881 : chl 345
882 : Isibaar 539 if (MotionFlags & PMV_HALFPELREFINE8) HalfpelRefine(Data);
883 : chl 345 }
884 : chl 530
885 : Isibaar 539 pMB->pmvs[block].x = Data->currentMV->x - Data->predMV.x;
886 :     pMB->pmvs[block].y = Data->currentMV->y - Data->predMV.y;
887 :     pMB->mvs[block] = *(Data->currentMV);
888 :     pMB->sad8[block] = 4 * (*Data->iMinSAD);
889 :    
890 : chl 345 }
891 :    
892 : chl 530 /* B-frames code starts here */
893 : chl 345
894 : chl 530 static __inline VECTOR
895 :     ChoosePred(const MACROBLOCK * const pMB, const uint32_t mode)
896 : Isibaar 3 {
897 : chl 530 /* the stupidiest function ever */
898 :     if (mode == MODE_FORWARD) return pMB->mvs[0];
899 :     else return pMB->b_mvs[0];
900 : Isibaar 3 }
901 :    
902 : chl 530 static void __inline
903 :     PreparePredictionsBF(VECTOR * const pmv, const int x, const int y,
904 :     const uint32_t iWcount,
905 :     const MACROBLOCK * const pMB,
906 :     const uint32_t mode_curr)
907 : Isibaar 3 {
908 :    
909 : chl 530 // [0] is prediction
910 :     pmv[0].x = EVEN(pmv[0].x); pmv[0].y = EVEN(pmv[0].y);
911 : Isibaar 3
912 : chl 530 pmv[1].x = pmv[1].y = 0; // [1] is zero
913 : Isibaar 3
914 : chl 530 pmv[2] = ChoosePred(pMB, mode_curr);
915 :     pmv[2].x = EVEN(pmv[2].x); pmv[2].y = EVEN(pmv[2].y);
916 : edgomez 195
917 : chl 530 if ((y != 0)&&(x != (int)(iWcount+1))) { // [3] top-right neighbour
918 :     pmv[3] = ChoosePred(pMB+1-iWcount, mode_curr);
919 : Isibaar 539 pmv[3].x = EVEN(pmv[3].x); pmv[3].y = EVEN(pmv[3].y);
920 :     } else pmv[3].x = pmv[3].y = 0;
921 : Isibaar 3
922 : chl 530 if (y != 0) {
923 :     pmv[4] = ChoosePred(pMB-iWcount, mode_curr);
924 :     pmv[4].x = EVEN(pmv[4].x); pmv[4].y = EVEN(pmv[4].y);
925 :     } else pmv[4].x = pmv[4].y = 0;
926 : Isibaar 3
927 : chl 530 if (x != 0) {
928 :     pmv[5] = ChoosePred(pMB-1, mode_curr);
929 :     pmv[5].x = EVEN(pmv[5].x); pmv[5].y = EVEN(pmv[5].y);
930 :     } else pmv[5].x = pmv[5].y = 0;
931 : Isibaar 3
932 : chl 530 if ((x != 0)&&(y != 0)) {
933 :     pmv[6] = ChoosePred(pMB-1-iWcount, mode_curr);
934 :     pmv[6].x = EVEN(pmv[5].x); pmv[5].y = EVEN(pmv[5].y);
935 :     } else pmv[6].x = pmv[6].y = 0;
936 : edgomez 195
937 : chl 530 // more?
938 :     }
939 : chl 181
940 : edgomez 170
941 : chl 530 /* search backward or forward, for b-frames */
942 :     static void
943 :     SearchBF( const uint8_t * const pRef,
944 :     const uint8_t * const pRefH,
945 :     const uint8_t * const pRefV,
946 :     const uint8_t * const pRefHV,
947 :     const IMAGE * const pCur,
948 :     const int x, const int y,
949 :     const uint32_t MotionFlags,
950 :     const uint32_t iFcode,
951 :     const MBParam * const pParam,
952 :     MACROBLOCK * const pMB,
953 :     const VECTOR * const predMV,
954 :     int32_t * const best_sad,
955 : h 545 const int32_t mode_current,
956 :     SearchData * const Data)
957 : chl 530 {
958 : Isibaar 3
959 : chl 530 const int32_t iEdgedWidth = pParam->edged_width;
960 :    
961 :     int i, iDirection, mask;
962 : h 545 VECTOR pmv[7];
963 : chl 530 MainSearchFunc *MainSearchPtr;
964 : h 545 *Data->iMinSAD = MV_MAX_ERROR;
965 :     Data->iFcode = iFcode;
966 : Isibaar 3
967 : h 545 Data->Ref = pRef + (x + y * iEdgedWidth) * 16;
968 :     Data->RefH = pRefH + (x + y * iEdgedWidth) * 16;
969 :     Data->RefV = pRefV + (x + y * iEdgedWidth) * 16;
970 :     Data->RefHV = pRefHV + (x + y * iEdgedWidth) * 16;
971 : Isibaar 3
972 : h 545 Data->predMV = *predMV;
973 : edgomez 195
974 : h 545 get_range(&Data->min_dx, &Data->max_dx, &Data->min_dy, &Data->max_dy, x, y, 16,
975 : chl 530 pParam->width, pParam->height, iFcode);
976 : Isibaar 3
977 : h 545 pmv[0] = Data->predMV;
978 :     PreparePredictionsBF(pmv, x, y, pParam->mb_width, pMB, mode_current);
979 : edgomez 195
980 : h 545 Data->currentMV->x = Data->currentMV->y = 0;
981 : Isibaar 3
982 : chl 530 CheckCandidate = CheckCandidate16no4v;
983 : chl 181
984 : chl 530 // main loop. checking all predictions
985 :     for (i = 0; i < 8; i++) {
986 :     if (!(mask = make_mask(pmv, i)) ) continue;
987 : h 545 CheckCandidate16no4v(pmv[i].x, pmv[i].y, mask, &iDirection, Data);
988 : edgomez 78 }
989 : Isibaar 3
990 : chl 530 if (MotionFlags & PMV_USESQUARES16)
991 :     MainSearchPtr = SquareSearch;
992 :     else if (MotionFlags & PMV_ADVANCEDDIAMOND16)
993 :     MainSearchPtr = AdvDiamondSearch;
994 :     else MainSearchPtr = DiamondSearch;
995 : chl 96
996 : h 545 (*MainSearchPtr)(Data->currentMV->x, Data->currentMV->y, Data, 255);
997 : chl 169
998 : h 545 HalfpelRefine(Data);
999 : chl 169
1000 : chl 530 // three bits are needed to code backward mode. four for forward
1001 :     // we treat the bits just like they were vector's
1002 : h 545 if (mode_current == MODE_FORWARD) *Data->iMinSAD += 4 * lambda_vec16[Data->iQuant];
1003 :     else *Data->iMinSAD += 3 * lambda_vec16[Data->iQuant];
1004 : chl 169
1005 :    
1006 : h 545 if (*Data->iMinSAD < *best_sad) {
1007 :     *best_sad = *Data->iMinSAD;
1008 : chl 530 pMB->mode = mode_current;
1009 : h 545 pMB->pmvs[0].x = Data->currentMV->x - predMV->x;
1010 :     pMB->pmvs[0].y = Data->currentMV->y - predMV->y;
1011 :     if (mode_current == MODE_FORWARD) pMB->mvs[0] = *Data->currentMV;
1012 :     else pMB->b_mvs[0] = *Data->currentMV;
1013 : chl 169 }
1014 : chl 530
1015 :     }
1016 : chl 169
1017 : chl 530 static int32_t
1018 : Isibaar 539 SearchDirect(const IMAGE * const f_Ref,
1019 : chl 530 const uint8_t * const f_RefH,
1020 :     const uint8_t * const f_RefV,
1021 :     const uint8_t * const f_RefHV,
1022 : Isibaar 539 const IMAGE * const b_Ref,
1023 : chl 530 const uint8_t * const b_RefH,
1024 :     const uint8_t * const b_RefV,
1025 :     const uint8_t * const b_RefHV,
1026 :     const IMAGE * const pCur,
1027 :     const int x, const int y,
1028 :     const uint32_t MotionFlags,
1029 :     const int32_t TRB, const int32_t TRD,
1030 :     const MBParam * const pParam,
1031 :     MACROBLOCK * const pMB,
1032 :     const MACROBLOCK * const b_mb,
1033 : h 545 int32_t * const best_sad,
1034 :     SearchData * const Data)
1035 : edgomez 195
1036 : chl 530 {
1037 : h 545 int32_t skip_sad;
1038 : chl 530 int k;
1039 : h 545
1040 : chl 530 MainSearchFunc *MainSearchPtr;
1041 : Isibaar 3
1042 : h 545 *Data->iMinSAD = 256*4096;
1043 :     Data->referencemv = b_mb->mvs;
1044 : chl 140
1045 : h 545 Data->Ref = f_Ref->y + (x + Data->iEdgedWidth*y) * 16;
1046 :     Data->RefH = f_RefH + (x + Data->iEdgedWidth*y) * 16;
1047 :     Data->RefV = f_RefV + (x + Data->iEdgedWidth*y) * 16;
1048 :     Data->RefHV = f_RefHV + (x + Data->iEdgedWidth*y) * 16;
1049 :     Data->bRef = b_Ref->y + (x + Data->iEdgedWidth*y) * 16;
1050 :     Data->bRefH = b_RefH + (x + Data->iEdgedWidth*y) * 16;
1051 :     Data->bRefV = b_RefV + (x + Data->iEdgedWidth*y) * 16;
1052 :     Data->bRefHV = b_RefHV + (x + Data->iEdgedWidth*y) * 16;
1053 : chl 140
1054 : h 545 Data->max_dx = 2 * pParam->width - 2 * (x) * 16;
1055 :     Data->max_dy = 2 * pParam->height - 2 * (y) * 16;
1056 :     Data->min_dx = -(2 * 16 + 2 * (x) * 16);
1057 :     Data->min_dy = -(2 * 16 + 2 * (y) * 16);
1058 : Isibaar 3
1059 : chl 530 for (k = 0; k < 4; k++) {
1060 : h 545 pMB->mvs[k].x = Data->directmvF[k].x = ((TRB * Data->referencemv[k].x) / TRD);
1061 :     pMB->b_mvs[k].x = Data->directmvB[k].x = ((TRB - TRD) * Data->referencemv[k].x) / TRD;
1062 :     pMB->mvs[k].y = Data->directmvF[k].y = ((TRB * Data->referencemv[k].y) / TRD);
1063 :     pMB->b_mvs[k].y = Data->directmvB[k].y = ((TRB - TRD) * Data->referencemv[k].y) / TRD;
1064 : Isibaar 3
1065 : h 545 if ( ( pMB->b_mvs[k].x > Data->max_dx ) || ( pMB->b_mvs[k].x < Data->min_dx )
1066 :     || ( pMB->b_mvs[k].y > Data->max_dy ) || ( pMB->b_mvs[k].y < Data->min_dy )) {
1067 : Isibaar 3
1068 : Isibaar 539 *best_sad = 256*4096; // in that case, we won't use direct mode
1069 :     pMB->mode = MODE_DIRECT; // just to make sure it doesn't say "MODE_DIRECT_NONE_MV"
1070 :     pMB->b_mvs[0].x = pMB->b_mvs[0].y = 0;
1071 :     return 0;
1072 :     }
1073 :     if (b_mb->mode != MODE_INTER4V) {
1074 :     pMB->mvs[1] = pMB->mvs[2] = pMB->mvs[3] = pMB->mvs[0];
1075 :     pMB->b_mvs[1] = pMB->b_mvs[2] = pMB->b_mvs[3] = pMB->b_mvs[0];
1076 : h 545 Data->directmvF[1] = Data->directmvF[2] = Data->directmvF[3] = Data->directmvF[0];
1077 :     Data->directmvB[1] = Data->directmvB[2] = Data->directmvB[3] = Data->directmvB[0];
1078 : Isibaar 539 break;
1079 :     }
1080 :     }
1081 : Isibaar 3
1082 : Isibaar 539 if (b_mb->mode == MODE_INTER4V)
1083 :     CheckCandidate = CheckCandidateDirect;
1084 :     else CheckCandidate = CheckCandidateDirectno4v;
1085 : edgomez 195
1086 : h 545 (*CheckCandidate)(0, 0, 255, &k, Data);
1087 : Isibaar 3
1088 : chl 530 // skip decision
1089 : h 545 if (*Data->iMinSAD - 2 * lambda_vec16[Data->iQuant] < (int32_t)Data->iQuant * SKIP_THRESH_B) {
1090 : Isibaar 539 //checking chroma. everything copied from MC
1091 :     //this is not full chroma compensation, only it's fullpel approximation. should work though
1092 :     int sum, dx, dy, b_dx, b_dy;
1093 : Isibaar 3
1094 : Isibaar 539 sum = pMB->mvs[0].x + pMB->mvs[1].x + pMB->mvs[2].x + pMB->mvs[3].x;
1095 :     dx = (sum == 0 ? 0 : SIGN(sum) * (roundtab[ABS(sum) % 16] + (ABS(sum) / 16) * 2));
1096 :    
1097 :     sum = pMB->mvs[0].y + pMB->mvs[1].y + pMB->mvs[2].y + pMB->mvs[3].y;
1098 :     dy = (sum == 0 ? 0 : SIGN(sum) * (roundtab[ABS(sum) % 16] + (ABS(sum) / 16) * 2));
1099 :    
1100 :     sum = pMB->b_mvs[0].x + pMB->b_mvs[1].x + pMB->b_mvs[2].x + pMB->b_mvs[3].x;
1101 :     b_dx = (sum == 0 ? 0 : SIGN(sum) * (roundtab[ABS(sum) % 16] + (ABS(sum) / 16) * 2));
1102 :    
1103 :     sum = pMB->b_mvs[0].y + pMB->b_mvs[1].y + pMB->b_mvs[2].y + pMB->b_mvs[3].y;
1104 :     b_dy = (sum == 0 ? 0 : SIGN(sum) * (roundtab[ABS(sum) % 16] + (ABS(sum) / 16) * 2));
1105 :    
1106 : h 545 sum = sad8bi(pCur->u + 8*x + 8*y*(Data->iEdgedWidth/2),
1107 :     f_Ref->u + (y*8 + dy/2) * (Data->iEdgedWidth/2) + x*8 + dx/2,
1108 :     b_Ref->u + (y*8 + b_dy/2) * (Data->iEdgedWidth/2) + x*8 + b_dx/2,
1109 :     Data->iEdgedWidth/2);
1110 :     sum += sad8bi(pCur->v + 8*x + 8*y*(Data->iEdgedWidth/2),
1111 :     f_Ref->v + (y*8 + dy/2) * (Data->iEdgedWidth/2) + x*8 + dx/2,
1112 :     b_Ref->v + (y*8 + b_dy/2) * (Data->iEdgedWidth/2) + x*8 + b_dx/2,
1113 :     Data->iEdgedWidth/2);
1114 : Isibaar 539
1115 : h 545 if ((uint32_t) sum < MAX_CHROMA_SAD_FOR_SKIP * Data->iQuant) {
1116 : Isibaar 539 pMB->mode = MODE_DIRECT_NONE_MV;
1117 : h 545 return *Data->iMinSAD;
1118 : Isibaar 539 }
1119 :     }
1120 :    
1121 : h 545 skip_sad = *Data->iMinSAD;
1122 : edgomez 195
1123 : chl 530 // DIRECT MODE DELTA VECTOR SEARCH.
1124 :     // This has to be made more effective, but at the moment I'm happy it's running at all
1125 : Isibaar 3
1126 : chl 530 if (MotionFlags & PMV_USESQUARES16) MainSearchPtr = SquareSearch;
1127 :     else if (MotionFlags & PMV_ADVANCEDDIAMOND16) MainSearchPtr = AdvDiamondSearch;
1128 :     else MainSearchPtr = DiamondSearch;
1129 : edgomez 195
1130 : h 545 (*MainSearchPtr)(0, 0, Data, 255);
1131 : Isibaar 3
1132 : h 545 HalfpelRefine(Data);
1133 : Isibaar 3
1134 : h 545 *Data->iMinSAD += 1 * lambda_vec16[Data->iQuant]; // one bit is needed to code direct mode. we treat this bit just like it was vector's
1135 :     *best_sad = *Data->iMinSAD;
1136 : Isibaar 3
1137 : chl 530 if (b_mb->mode == MODE_INTER4V)
1138 :     pMB->mode = MODE_DIRECT;
1139 :     else pMB->mode = MODE_DIRECT_NO4V; //for faster compensation
1140 : edgomez 195
1141 : h 545 pMB->pmvs[3] = *Data->currentMV;
1142 : edgomez 195
1143 : chl 530 for (k = 0; k < 4; k++) {
1144 : h 545 pMB->mvs[k].x = Data->directmvF[k].x + Data->currentMV->x;
1145 :     pMB->b_mvs[k].x = ((Data->currentMV->x == 0)
1146 :     ? Data->directmvB[k].x
1147 :     : pMB->mvs[k].x - Data->referencemv[k].x);
1148 :     pMB->mvs[k].y = (Data->directmvF[k].y + Data->currentMV->y);
1149 :     pMB->b_mvs[k].y = ((Data->currentMV->y == 0)
1150 :     ? Data->directmvB[k].y
1151 :     : pMB->mvs[k].y - Data->referencemv[k].y);
1152 : chl 530 if (b_mb->mode != MODE_INTER4V) {
1153 :     pMB->mvs[3] = pMB->mvs[2] = pMB->mvs[1] = pMB->mvs[0];
1154 :     pMB->b_mvs[3] = pMB->b_mvs[2] = pMB->b_mvs[1] = pMB->b_mvs[0];
1155 :     break;
1156 :     }
1157 :     }
1158 : h 545 return skip_sad;
1159 : Isibaar 3 }
1160 : chl 96
1161 : h 545
1162 : chl 530 static __inline void
1163 :     SearchInterpolate(const uint8_t * const f_Ref,
1164 :     const uint8_t * const f_RefH,
1165 :     const uint8_t * const f_RefV,
1166 :     const uint8_t * const f_RefHV,
1167 :     const uint8_t * const b_Ref,
1168 :     const uint8_t * const b_RefH,
1169 :     const uint8_t * const b_RefV,
1170 :     const uint8_t * const b_RefHV,
1171 :     const IMAGE * const pCur,
1172 :     const int x, const int y,
1173 :     const uint32_t fcode,
1174 :     const uint32_t bcode,
1175 :     const uint32_t MotionFlags,
1176 :     const MBParam * const pParam,
1177 :     const VECTOR * const f_predMV,
1178 :     const VECTOR * const b_predMV,
1179 :     MACROBLOCK * const pMB,
1180 : h 545 int32_t * const best_sad,
1181 :     SearchData * const fData)
1182 : chl 530
1183 : chl 96 {
1184 :    
1185 : edgomez 195 const int32_t iEdgedWidth = pParam->edged_width;
1186 : chl 96
1187 : chl 530 int iDirection, i, j;
1188 : h 545 SearchData bData;
1189 : chl 96
1190 : h 545 bData.iMinSAD = fData->iMinSAD;
1191 :     *bData.iMinSAD = 4096*256;
1192 :     bData.Cur = fData->Cur;
1193 :     fData->iEdgedWidth = bData.iEdgedWidth = iEdgedWidth;
1194 :     bData.currentMV = fData->currentMV + 1;
1195 :     bData.iQuant = fData->iQuant;
1196 :     fData->iFcode = bData.bFcode = fcode; fData->bFcode = bData.iFcode = bcode;
1197 : edgomez 195
1198 : h 545 bData.bRef = fData->Ref = f_Ref + (x + y * iEdgedWidth) * 16;
1199 :     bData.bRefH = fData->RefH = f_RefH + (x + y * iEdgedWidth) * 16;
1200 :     bData.bRefV = fData->RefV = f_RefV + (x + y * iEdgedWidth) * 16;
1201 :     bData.bRefHV = fData->RefHV = f_RefHV + (x + y * iEdgedWidth) * 16;
1202 :     bData.Ref = fData->bRef = b_Ref + (x + y * iEdgedWidth) * 16;
1203 :     bData.RefH = fData->bRefH = b_RefH + (x + y * iEdgedWidth) * 16;
1204 :     bData.RefV = fData->bRefV = b_RefV + (x + y * iEdgedWidth) * 16;
1205 :     bData.RefHV = fData->bRefHV = b_RefHV + (x + y * iEdgedWidth) * 16;
1206 : chl 96
1207 : h 545 bData.bpredMV = fData->predMV = *f_predMV;
1208 :     fData->bpredMV = bData.predMV = *b_predMV;
1209 : edgomez 195
1210 : h 545 fData->currentMV[0] = pMB->mvs[0];
1211 :     fData->currentMV[1] = pMB->b_mvs[0];
1212 :     get_range(&fData->min_dx, &fData->max_dx, &fData->min_dy, &fData->max_dy, x, y, 16, pParam->width, pParam->height, fcode);
1213 : chl 530 get_range(&bData.min_dx, &bData.max_dx, &bData.min_dy, &bData.max_dy, x, y, 16, pParam->width, pParam->height, bcode);
1214 : chl 96
1215 : h 545 if (fData->currentMV[0].x > fData->max_dx) fData->currentMV[0].x = fData->max_dx;
1216 :     if (fData->currentMV[0].x < fData->min_dx) fData->currentMV[0].x = fData->min_dy;
1217 :     if (fData->currentMV[0].y > fData->max_dy) fData->currentMV[0].y = fData->max_dx;
1218 :     if (fData->currentMV[0].y > fData->min_dy) fData->currentMV[0].y = fData->min_dy;
1219 : Isibaar 539
1220 : h 545 if (fData->currentMV[1].x > bData.max_dx) fData->currentMV[1].x = bData.max_dx;
1221 :     if (fData->currentMV[1].x < bData.min_dx) fData->currentMV[1].x = bData.min_dy;
1222 :     if (fData->currentMV[1].y > bData.max_dy) fData->currentMV[1].y = bData.max_dx;
1223 :     if (fData->currentMV[1].y > bData.min_dy) fData->currentMV[1].y = bData.min_dy;
1224 : Isibaar 539
1225 : h 545 CheckCandidateInt(fData->currentMV[0].x, fData->currentMV[0].y, 255, &iDirection, fData);
1226 : chl 96
1227 : chl 530 //diamond. I wish we could use normal mainsearch functions (square, advdiamond)
1228 : chl 96
1229 : chl 530 do {
1230 :     iDirection = 255;
1231 :     // forward MV moves
1232 : h 545 i = fData->currentMV[0].x; j = fData->currentMV[0].y;
1233 : chl 96
1234 : h 545 CheckCandidateInt(i + 1, j, 0, &iDirection, fData);
1235 :     CheckCandidateInt(i, j + 1, 0, &iDirection, fData);
1236 :     CheckCandidateInt(i - 1, j, 0, &iDirection, fData);
1237 :     CheckCandidateInt(i, j - 1, 0, &iDirection, fData);
1238 : chl 96
1239 : chl 530 // backward MV moves
1240 : h 545 i = fData->currentMV[1].x; j = fData->currentMV[1].y;
1241 :     fData->currentMV[2] = fData->currentMV[0];
1242 : chl 326
1243 : Isibaar 539 CheckCandidateInt(i + 1, j, 0, &iDirection, &bData);
1244 :     CheckCandidateInt(i, j + 1, 0, &iDirection, &bData);
1245 :     CheckCandidateInt(i - 1, j, 0, &iDirection, &bData);
1246 :     CheckCandidateInt(i, j - 1, 0, &iDirection, &bData);
1247 : chl 96
1248 : chl 530 } while (!(iDirection));
1249 : edgomez 195
1250 : chl 530 // two bits are needed to code interpolate mode. we treat the bits just like they were vector's
1251 : h 545 *fData->iMinSAD += 2 * lambda_vec16[fData->iQuant];
1252 :     if (*fData->iMinSAD < *best_sad) {
1253 :     *best_sad = *fData->iMinSAD;
1254 :     pMB->mvs[0] = fData->currentMV[0];
1255 :     pMB->b_mvs[0] = fData->currentMV[1];
1256 : chl 530 pMB->mode = MODE_INTERPOLATE;
1257 : chl 96
1258 : chl 530 pMB->pmvs[1].x = pMB->mvs[0].x - f_predMV->x;
1259 :     pMB->pmvs[1].y = pMB->mvs[0].y - f_predMV->y;
1260 :     pMB->pmvs[0].x = pMB->b_mvs[0].x - b_predMV->x;
1261 :     pMB->pmvs[0].y = pMB->b_mvs[0].y - b_predMV->y;
1262 :     }
1263 :     }
1264 : chl 96
1265 : h 545
1266 : chl 530 void
1267 :     MotionEstimationBVOP(MBParam * const pParam,
1268 :     FRAMEINFO * const frame,
1269 :     const int32_t time_bp,
1270 :     const int32_t time_pp,
1271 :     // forward (past) reference
1272 :     const MACROBLOCK * const f_mbs,
1273 :     const IMAGE * const f_ref,
1274 :     const IMAGE * const f_refH,
1275 :     const IMAGE * const f_refV,
1276 :     const IMAGE * const f_refHV,
1277 :     // backward (future) reference
1278 :     const MACROBLOCK * const b_mbs,
1279 :     const IMAGE * const b_ref,
1280 :     const IMAGE * const b_refH,
1281 :     const IMAGE * const b_refV,
1282 :     const IMAGE * const b_refHV)
1283 :     {
1284 :     uint32_t i, j;
1285 :     int32_t best_sad, skip_sad;
1286 :     int f_count = 0, b_count = 0, i_count = 0, d_count = 0, n_count = 0;
1287 :     static const VECTOR zeroMV={0,0};
1288 : chl 96
1289 : chl 530 VECTOR f_predMV, b_predMV; /* there is no prediction for direct mode*/
1290 : chl 96
1291 : chl 530 const int32_t TRB = time_pp - time_bp;
1292 :     const int32_t TRD = time_pp;
1293 : chl 96
1294 : h 545 // some pre-inintialized data for the rest of the search
1295 :    
1296 :     SearchData Data;
1297 :     int32_t iMinSAD;
1298 :     VECTOR currentMV[3];
1299 :     Data.iEdgedWidth = pParam->edged_width;
1300 :     Data.currentMV = currentMV;
1301 :     Data.iMinSAD = &iMinSAD;
1302 :     Data.iQuant = frame->quant;
1303 :    
1304 : chl 530 // note: i==horizontal, j==vertical
1305 : chl 96
1306 : chl 530 for (j = 0; j < pParam->mb_height; j++) {
1307 : chl 96
1308 : chl 530 f_predMV = b_predMV = zeroMV; /* prediction is reset at left boundary */
1309 : edgomez 195
1310 : chl 530 for (i = 0; i < pParam->mb_width; i++) {
1311 :     MACROBLOCK * const pMB = frame->mbs + i + j * pParam->mb_width;
1312 :     const MACROBLOCK * const b_mb = b_mbs + i + j * pParam->mb_width;
1313 : edgomez 195
1314 : chl 530 /* special case, if collocated block is SKIPed: encoding is forward (0,0), cpb=0 without further ado */
1315 :     if (b_mb->mode == MODE_NOT_CODED) {
1316 :     pMB->mode = MODE_NOT_CODED;
1317 :     continue;
1318 : chl 96 }
1319 :    
1320 : h 545 Data.Cur = frame->image.y + (j * Data.iEdgedWidth + i) * 16;
1321 : chl 530 /* direct search comes first, because it (1) checks for SKIP-mode
1322 :     and (2) sets very good predictions for forward and backward search */
1323 : chl 96
1324 : Isibaar 539 skip_sad = SearchDirect(f_ref, f_refH->y, f_refV->y, f_refHV->y,
1325 :     b_ref, b_refH->y, b_refV->y, b_refHV->y,
1326 : chl 530 &frame->image,
1327 :     i, j,
1328 :     frame->motion_flags,
1329 :     TRB, TRD,
1330 :     pParam,
1331 :     pMB, b_mb,
1332 : h 545 &best_sad,
1333 :     &Data);
1334 : chl 96
1335 : Isibaar 539 if (pMB->mode == MODE_DIRECT_NONE_MV) { n_count++; continue; }
1336 : chl 96
1337 : chl 530 // best_sad = 256*4096; //uncomment to disable Directsearch.
1338 :     // To disable any other mode, just comment the function call
1339 : chl 96
1340 : chl 530 // forward search
1341 :     SearchBF(f_ref->y, f_refH->y, f_refV->y, f_refHV->y,
1342 :     &frame->image, i, j,
1343 :     frame->motion_flags,
1344 : h 545 frame->fcode, pParam,
1345 : chl 530 pMB, &f_predMV, &best_sad,
1346 : h 545 MODE_FORWARD, &Data);
1347 : chl 96
1348 : chl 530 // backward search
1349 :     SearchBF(b_ref->y, b_refH->y, b_refV->y, b_refHV->y,
1350 :     &frame->image, i, j,
1351 :     frame->motion_flags,
1352 : h 545 frame->bcode, pParam,
1353 : chl 530 pMB, &b_predMV, &best_sad,
1354 : h 545 MODE_BACKWARD, &Data);
1355 : chl 96
1356 : chl 530 // interpolate search comes last, because it uses data from forward and backward as prediction
1357 : chl 96
1358 : chl 530 SearchInterpolate(f_ref->y, f_refH->y, f_refV->y, f_refHV->y,
1359 :     b_ref->y, b_refH->y, b_refV->y, b_refHV->y,
1360 :     &frame->image,
1361 :     i, j,
1362 :     frame->fcode, frame->bcode,
1363 :     frame->motion_flags,
1364 : h 545 pParam,
1365 : chl 530 &f_predMV, &b_predMV,
1366 : h 545 pMB, &best_sad,
1367 :     &Data);
1368 : chl 96
1369 : chl 530 switch (pMB->mode) {
1370 :     case MODE_FORWARD:
1371 :     f_count++;
1372 :     f_predMV = pMB->mvs[0];
1373 :     break;
1374 :     case MODE_BACKWARD:
1375 :     b_count++;
1376 :     b_predMV = pMB->b_mvs[0];
1377 :     break;
1378 :     case MODE_INTERPOLATE:
1379 :     i_count++;
1380 :     f_predMV = pMB->mvs[0];
1381 :     b_predMV = pMB->b_mvs[0];
1382 :     break;
1383 :     case MODE_DIRECT:
1384 :     case MODE_DIRECT_NO4V:
1385 :     d_count++;
1386 :     break;
1387 :     default:
1388 :     break;
1389 : chl 96 }
1390 :     }
1391 :     }
1392 :    
1393 : chl 530 // fprintf(debug,"B-Stat: F: %04d B: %04d I: %04d D: %04d, N: %04d\n",
1394 :     // f_count,b_count,i_count,d_count,n_count);
1395 : chl 96
1396 :     }
1397 :    
1398 : chl 530 /* Hinted ME starts here */
1399 : chl 96
1400 : chl 530 static __inline void
1401 :     Search8hinted( const SearchData * const OldData,
1402 :     const int x, const int y,
1403 :     const uint32_t MotionFlags,
1404 :     const MBParam * const pParam,
1405 :     MACROBLOCK * const pMB,
1406 :     const MACROBLOCK * const pMBs,
1407 :     const int block)
1408 : chl 96 {
1409 : chl 530 SearchData Data;
1410 :     MainSearchFunc *MainSearchPtr;
1411 : chl 141
1412 : chl 530 Data.predMV = get_pmv2(pMBs, pParam->mb_width, 0, x/2 , y/2, block);
1413 :     Data.iMinSAD = OldData->iMinSAD + 1 + block;
1414 :     Data.currentMV = OldData->currentMV+1+block;
1415 :     Data.iFcode = OldData->iFcode;
1416 :     Data.iQuant = OldData->iQuant;
1417 : chl 96
1418 : chl 530 Data.Ref = OldData->Ref + 8 * ((block&1) + pParam->edged_width*(block>>1));
1419 :     Data.RefH = OldData->RefH + 8 * ((block&1) + pParam->edged_width*(block>>1));
1420 :     Data.RefV = OldData->RefV + 8 * ((block&1) + pParam->edged_width*(block>>1));
1421 :     Data.RefHV = OldData->RefHV + 8 * ((block&1) + pParam->edged_width*(block>>1));
1422 :     Data.iEdgedWidth = pParam->edged_width;
1423 :     Data.Cur = OldData->Cur + 8 * ((block&1) + pParam->edged_width*(block>>1));
1424 : chl 96
1425 : chl 530 CheckCandidate = CheckCandidate8;
1426 : edgomez 195
1427 : chl 530 if (block != 0)
1428 :     *(Data.iMinSAD) += lambda_vec8[Data.iQuant] *
1429 :     d_mv_bits( Data.currentMV->x - Data.predMV.x,
1430 :     Data.currentMV->y - Data.predMV.y,
1431 :     Data.iFcode);
1432 : edgomez 195
1433 :    
1434 : chl 530 get_range(&Data.min_dx, &Data.max_dx, &Data.min_dy, &Data.max_dy, x, y, 8,
1435 :     pParam->width, pParam->height, OldData->iFcode);
1436 : chl 96
1437 : chl 530 if (pMB->mode == MODE_INTER4V) {
1438 :     int dummy;
1439 :     CheckCandidate8(pMB->mvs[block].x, pMB->mvs[block].y, 0, &dummy, &Data); }
1440 : chl 96
1441 : chl 530 if (MotionFlags & PMV_USESQUARES8) MainSearchPtr = SquareSearch;
1442 :     else if (MotionFlags & PMV_ADVANCEDDIAMOND8) MainSearchPtr = AdvDiamondSearch;
1443 :     else MainSearchPtr = DiamondSearch;
1444 : chl 96
1445 : chl 530 (*MainSearchPtr)(Data.currentMV->x, Data.currentMV->y, &Data, 255);
1446 : edgomez 195
1447 : chl 530 if (MotionFlags & PMV_HALFPELREFINE8) HalfpelRefine(&Data);
1448 : chl 96
1449 : chl 530 pMB->pmvs[block].x = Data.currentMV->x - Data.predMV.x;
1450 :     pMB->pmvs[block].y = Data.currentMV->y - Data.predMV.y;
1451 :     pMB->mvs[block] = *(Data.currentMV);
1452 :     pMB->sad8[block] = 4 * (*(Data.iMinSAD));
1453 : chl 96 }
1454 :    
1455 : suxen_drol 118
1456 : chl 530 static void
1457 :     SearchPhinted ( const uint8_t * const pRef,
1458 : chl 289 const uint8_t * const pRefH,
1459 :     const uint8_t * const pRefV,
1460 :     const uint8_t * const pRefHV,
1461 :     const IMAGE * const pCur,
1462 :     const int x,
1463 :     const int y,
1464 :     const uint32_t MotionFlags,
1465 :     const uint32_t iQuant,
1466 :     const MBParam * const pParam,
1467 :     const MACROBLOCK * const pMBs,
1468 : chl 530 int inter4v,
1469 : h 545 MACROBLOCK * const pMB,
1470 : edgomez 568 SearchData * const Data)
1471 : chl 289 {
1472 : chl 530
1473 : chl 289 const int32_t iEdgedWidth = pParam->edged_width;
1474 : chl 530
1475 : edgomez 568 int i, t;
1476 : chl 530 MainSearchFunc * MainSearchPtr;
1477 : suxen_drol 118
1478 : h 545 Data->predMV = get_pmv2(pMBs, pParam->mb_width, 0, x, y, 0);
1479 :     get_range(&Data->min_dx, &Data->max_dx, &Data->min_dy, &Data->max_dy, x, y, 16,
1480 :     pParam->width, pParam->height, Data->iFcode);
1481 : suxen_drol 118
1482 : h 545 Data->Cur = pCur->y + (x + y * iEdgedWidth) * 16;
1483 :     Data->Ref = pRef + (x + iEdgedWidth*y)*16;
1484 :     Data->RefH = pRefH + (x + iEdgedWidth*y) * 16;
1485 :     Data->RefV = pRefV + (x + iEdgedWidth*y) * 16;
1486 :     Data->RefHV = pRefHV + (x + iEdgedWidth*y) * 16;
1487 :     Data->iQuant = iQuant;
1488 : edgomez 568
1489 : chl 530 if (!(MotionFlags & PMV_HALFPEL16)) {
1490 : h 545 Data->min_dx = EVEN(Data->min_dx);
1491 :     Data->max_dx = EVEN(Data->max_dx);
1492 :     Data->min_dy = EVEN(Data->min_dy);
1493 :     Data->max_dy = EVEN(Data->max_dy);
1494 : chl 530 }
1495 : chl 289
1496 : h 545 for(i = 0; i < 5; i++) Data->iMinSAD[i] = MV_MAX_ERROR;
1497 : chl 289
1498 : chl 530 if (pMB->dquant != NO_CHANGE) inter4v = 0;
1499 : chl 289
1500 : chl 530 if (inter4v)
1501 :     CheckCandidate = CheckCandidate16;
1502 :     else CheckCandidate = CheckCandidate16no4v;
1503 : chl 289
1504 :    
1505 : chl 530 pMB->mvs[0].x = EVEN(pMB->mvs[0].x);
1506 :     pMB->mvs[0].y = EVEN(pMB->mvs[0].y);
1507 : h 545 if (pMB->mvs[0].x > Data->max_dx) pMB->mvs[0].x = Data->max_dx; // this is in case iFcode changed
1508 :     if (pMB->mvs[0].x < Data->min_dx) pMB->mvs[0].x = Data->min_dx;
1509 :     if (pMB->mvs[0].y > Data->max_dy) pMB->mvs[0].y = Data->max_dy;
1510 :     if (pMB->mvs[0].y < Data->min_dy) pMB->mvs[0].y = Data->min_dy;
1511 : chl 370
1512 : edgomez 568 (*CheckCandidate)(pMB->mvs[0].x, pMB->mvs[0].y, 0, &t, Data);
1513 : chl 289
1514 : chl 530 if (pMB->mode == MODE_INTER4V)
1515 :     for (i = 1; i < 4; i++) { // all four vectors will be used as four predictions for 16x16 search
1516 :     pMB->mvs[i].x = EVEN(pMB->mvs[i].x);
1517 :     pMB->mvs[i].y = EVEN(pMB->mvs[i].y);
1518 :     if (!(make_mask(pMB->mvs, i)))
1519 : edgomez 568 (*CheckCandidate)(pMB->mvs[i].x, pMB->mvs[i].y, 0, &t, Data);
1520 : chl 289 }
1521 :    
1522 :     if (MotionFlags & PMV_USESQUARES16)
1523 : chl 530 MainSearchPtr = SquareSearch;
1524 : chl 289 else if (MotionFlags & PMV_ADVANCEDDIAMOND16)
1525 : chl 530 MainSearchPtr = AdvDiamondSearch;
1526 :     else MainSearchPtr = DiamondSearch;
1527 : chl 289
1528 : h 545 (*MainSearchPtr)(Data->currentMV->x, Data->currentMV->y, Data, 255);
1529 : chl 289
1530 : h 545 if (MotionFlags & PMV_HALFPELREFINE16) HalfpelRefine(Data);
1531 : chl 289
1532 : chl 530 if (inter4v)
1533 :     for(i = 0; i < 4; i++)
1534 : h 545 Search8hinted(Data, 2*x+(i&1), 2*y+(i>>1), MotionFlags, pParam, pMB, pMBs, i);
1535 : chl 289
1536 : chl 530 if (!(inter4v) ||
1537 : h 545 (Data->iMinSAD[0] < Data->iMinSAD[1] + Data->iMinSAD[2] + Data->iMinSAD[3] +
1538 :     Data->iMinSAD[4] + IMV16X16 * (int32_t)iQuant )) {
1539 : chl 530 // INTER MODE
1540 : chl 289
1541 : chl 530 pMB->mode = MODE_INTER;
1542 : Isibaar 539 pMB->mvs[0] = pMB->mvs[1]
1543 : h 545 = pMB->mvs[2] = pMB->mvs[3] = Data->currentMV[0];
1544 : chl 289
1545 : chl 530 pMB->sad16 = pMB->sad8[0] = pMB->sad8[1] =
1546 : h 545 pMB->sad8[2] = pMB->sad8[3] = Data->iMinSAD[0];
1547 : chl 289
1548 : h 545 pMB->pmvs[0].x = Data->currentMV[0].x - Data->predMV.x;
1549 :     pMB->pmvs[0].y = Data->currentMV[0].y - Data->predMV.y;
1550 : chl 530 } else {
1551 :     // INTER4V MODE; all other things are already set in Search8hinted
1552 :     pMB->mode = MODE_INTER4V;
1553 : h 545 pMB->sad16 = Data->iMinSAD[1] + Data->iMinSAD[2] + Data->iMinSAD[3]
1554 :     + Data->iMinSAD[4] + IMV16X16 * iQuant;
1555 : chl 289 }
1556 :    
1557 :     }
1558 :    
1559 : edgomez 195 void
1560 : chl 530 MotionEstimationHinted( MBParam * const pParam,
1561 :     FRAMEINFO * const current,
1562 :     FRAMEINFO * const reference,
1563 :     const IMAGE * const pRefH,
1564 :     const IMAGE * const pRefV,
1565 :     const IMAGE * const pRefHV)
1566 : suxen_drol 118 {
1567 : chl 530 MACROBLOCK *const pMBs = current->mbs;
1568 :     const IMAGE *const pCurrent = &current->image;
1569 :     const IMAGE *const pRef = &reference->image;
1570 : suxen_drol 118
1571 : chl 530 uint32_t x, y;
1572 : h 545 int32_t temp[5];
1573 :     int32_t iMinSAD[5];
1574 :     VECTOR currentMV[5];
1575 :     SearchData Data;
1576 :     Data.iEdgedWidth = pParam->edged_width;
1577 :     Data.currentMV = currentMV;
1578 :     Data.iMinSAD = iMinSAD;
1579 :     Data.temp = temp;
1580 :     Data.iFcode = current->fcode;
1581 :    
1582 : chl 530 if (sadInit) (*sadInit) ();
1583 : suxen_drol 118
1584 : chl 530 for (y = 0; y < pParam->mb_height; y++) {
1585 :     for (x = 0; x < pParam->mb_width; x++) {
1586 : chl 312
1587 : chl 530 MACROBLOCK *pMB = &pMBs[x + y * pParam->mb_width];
1588 : suxen_drol 118
1589 : chl 530 //intra mode is copied from the first pass. At least for the time being
1590 :     if ((pMB->mode == MODE_INTRA) || (pMB->mode == MODE_NOT_CODED) ) continue;
1591 : chl 346
1592 : chl 530 if (!(current->global_flags & XVID_LUMIMASKING)) {
1593 :     pMB->dquant = NO_CHANGE;
1594 :     pMB->quant = current->quant; }
1595 : chl 341
1596 : Isibaar 539 SearchPhinted(pRef->y, pRefH->y, pRefV->y, pRefHV->y, pCurrent, x,
1597 :     y, current->motion_flags, pMB->quant,
1598 : h 545 pParam, pMBs, current->global_flags & XVID_INTER4V, pMB,
1599 :     &Data);
1600 : chl 317
1601 : Isibaar 539 }
1602 :     }
1603 :     }
1604 : suxen_drol 118
1605 : Isibaar 539 static __inline int
1606 :     MEanalyzeMB ( const uint8_t * const pRef,
1607 :     const uint8_t * const pCur,
1608 :     const int x,
1609 :     const int y,
1610 :     const MBParam * const pParam,
1611 :     const MACROBLOCK * const pMBs,
1612 : h 545 MACROBLOCK * const pMB,
1613 :     SearchData * const Data)
1614 : Isibaar 539 {
1615 : chl 317
1616 : Isibaar 539 int i, mask;
1617 : h 545 VECTOR pmv[3];
1618 : suxen_drol 118
1619 : h 545 *(Data->iMinSAD) = MV_MAX_ERROR;
1620 :     Data->predMV = get_pmv2(pMBs, pParam->mb_width, 0, x, y, 0);
1621 :     get_range(&Data->min_dx, &Data->max_dx, &Data->min_dy, &Data->max_dy, x, y, 16,
1622 :     pParam->width, pParam->height, Data->iFcode);
1623 : chl 326
1624 : h 545 Data->Cur = pCur + (x + y * pParam->edged_width) * 16;
1625 :     Data->Ref = pRef + (x + y * pParam->edged_width) * 16;
1626 : Isibaar 539
1627 :     CheckCandidate = CheckCandidate16no4vI;
1628 : chl 326
1629 : Isibaar 539 pmv[1].x = EVEN(pMB->mvs[0].x);
1630 :     pmv[1].y = EVEN(pMB->mvs[0].y);
1631 : h 545 pmv[0].x = EVEN(Data->predMV.x);
1632 :     pmv[0].y = EVEN(Data->predMV.y);
1633 : Isibaar 539 pmv[2].x = pmv[2].y = 0;
1634 : chl 326
1635 : h 545 CheckCandidate16no4vI(pmv[0].x, pmv[0].y, 255, &i, Data);
1636 : Isibaar 539 if (!(mask = make_mask(pmv, 1)))
1637 : h 545 CheckCandidate16no4vI(pmv[1].x, pmv[1].y, mask, &i, Data);
1638 : Isibaar 539 if (!(mask = make_mask(pmv, 2)))
1639 : h 545 CheckCandidate16no4vI(0, 0, mask, &i, Data);
1640 : Isibaar 539
1641 : h 545 DiamondSearch(Data->currentMV->x, Data->currentMV->y, Data, i);
1642 : Isibaar 539
1643 :     pMB->mvs[0] = pMB->mvs[1]
1644 : h 545 = pMB->mvs[2] = pMB->mvs[3] = *Data->currentMV; // all, for future get_pmv()
1645 : Isibaar 539
1646 : h 545 return *(Data->iMinSAD);
1647 : Isibaar 539 }
1648 :    
1649 :     #define INTRA_THRESH 1350
1650 :     #define INTER_THRESH 900
1651 :    
1652 :     int
1653 :     MEanalysis( const IMAGE * const pRef,
1654 :     const IMAGE * const pCurrent,
1655 :     MBParam * const pParam,
1656 :     MACROBLOCK * const pMBs,
1657 :     const uint32_t iFcode)
1658 :     {
1659 :     uint32_t x, y, intra = 0;
1660 :     int sSAD = 0;
1661 : h 545
1662 :     VECTOR currentMV;
1663 :     int32_t iMinSAD;
1664 :     SearchData Data;
1665 :     Data.iEdgedWidth = pParam->edged_width;
1666 :     Data.currentMV = &currentMV;
1667 :     Data.iMinSAD = &iMinSAD;
1668 :     Data.iFcode = iFcode;
1669 :     Data.iQuant = 2;
1670 :    
1671 : Isibaar 539 if (sadInit) (*sadInit) ();
1672 :    
1673 :     for (y = 0; y < pParam->mb_height-1; y++) {
1674 :     for (x = 0; x < pParam->mb_width; x++) {
1675 :     int sad, dev;
1676 :     MACROBLOCK *pMB = &pMBs[x + y * pParam->mb_width];
1677 :    
1678 :     sad = MEanalyzeMB(pRef->y, pCurrent->y, x, y,
1679 : h 545 pParam, pMBs, pMB, &Data);
1680 : Isibaar 539
1681 :     if ( x != 0 && y != 0 && x != pParam->mb_width-1 ) { //no edge macroblocks, they just don't work
1682 :     if (sad > INTRA_THRESH) {
1683 :     dev = dev16(pCurrent->y + (x + y * pParam->edged_width) * 16,
1684 :     pParam->edged_width);
1685 :     if (dev + INTRA_THRESH < sad) intra++;
1686 :     if (intra > (pParam->mb_height-2)*(pParam->mb_width-2)/2) return 2; // I frame
1687 :     }
1688 :     sSAD += sad;
1689 :     }
1690 :    
1691 : suxen_drol 118 }
1692 :     }
1693 : Isibaar 539 sSAD /= (pParam->mb_height-2)*(pParam->mb_width-2);
1694 :     if (sSAD > INTER_THRESH ) return 1; //P frame
1695 :     emms();
1696 :     return 0; // B frame
1697 :    
1698 : suxen_drol 118 }

No admin address has been configured
ViewVC Help
Powered by ViewVC 1.0.4