[svn] / branches / dev-api-4 / xvidcore / src / motion / motion_est.h Repository:
ViewVC logotype

Annotation of /branches/dev-api-4/xvidcore/src/motion/motion_est.h

Parent Directory Parent Directory | Revision Log Revision Log


Revision 1077 - (view) (download)

1 : edgomez 1054 /*****************************************************************************
2 : edgomez 851 *
3 :     * XVID MPEG-4 VIDEO CODEC
4 : edgomez 1054 * - Motion Estimation related header -
5 : edgomez 851 *
6 : edgomez 1054 * Copyright(C) 2002 Christoph Lampert <gruel@web.de>
7 :     * 2002 Michael Militzer <michael@xvid.org>
8 :     * 2002-2003 Radoslaw Czyz <xvid@syskin.cjb.net>
9 : edgomez 851 *
10 : edgomez 1054 * This program is free software ; you can redistribute it and/or modify
11 : edgomez 851 * it under the terms of the GNU General Public License as published by
12 : edgomez 1054 * the Free Software Foundation ; either version 2 of the License, or
13 : edgomez 851 * (at your option) any later version.
14 :     *
15 :     * This program is distributed in the hope that it will be useful,
16 : edgomez 1054 * but WITHOUT ANY WARRANTY ; without even the implied warranty of
17 : edgomez 851 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
18 :     * GNU General Public License for more details.
19 :     *
20 :     * You should have received a copy of the GNU General Public License
21 : edgomez 1054 * along with this program ; if not, write to the Free Software
22 : edgomez 851 * Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA 02111-1307 USA
23 :     *
24 : chl 1077 * $Id: motion_est.h,v 1.3.2.12 2003-06-28 15:51:54 chl Exp $
25 : edgomez 851 *
26 : edgomez 1054 ****************************************************************************/
27 : edgomez 851
28 :     #ifndef _MOTION_EST_H_
29 :     #define _MOTION_EST_H_
30 :    
31 :     #include "../portab.h"
32 :     #include "../global.h"
33 :     #include "../image/reduced.h"
34 :    
35 :     /* hard coded motion search parameters for motion_est and smp_motion_est */
36 :    
37 : edgomez 1053 /* very large value */
38 : edgomez 851 #define MV_MAX_ERROR (4096 * 256)
39 :    
40 :     /* INTER bias for INTER/INTRA decision; mpeg4 spec suggests 2*nb */
41 :     #define MV16_INTER_BIAS 512
42 :    
/* vector map (vlc delta size) smoother parameters ! float ! */
#define NEIGH_TEND_16X16	10.5
#define NEIGH_TEND_8X8		40.0
#define NEIGH_8X8_BIAS		30

#define BITS_MULT			16

/* Parameters which control inter/inter4v decision */
#define IMV16X16			2

/*
 * lambda_vec16[i] = (int)(factor[i] * NEIGH_TEND_16X16 + 0.5), entry 0 is 0.
 * The factor list is identical to the one used for lambda_vec8 below.
 * NOTE(review): presumably indexed by quantizer value -- confirm against the
 * code that fills SearchData.lambda16.
 */
static const int lambda_vec16[32] =
	{     0    ,(int)(1.00235 * NEIGH_TEND_16X16 + 0.5),
	(int)(1.15582*NEIGH_TEND_16X16 + 0.5), (int)(1.31976*NEIGH_TEND_16X16 + 0.5),
	(int)(1.49591*NEIGH_TEND_16X16 + 0.5), (int)(1.68601*NEIGH_TEND_16X16 + 0.5),
	(int)(1.89187*NEIGH_TEND_16X16 + 0.5), (int)(2.11542*NEIGH_TEND_16X16 + 0.5),
	(int)(2.35878*NEIGH_TEND_16X16 + 0.5), (int)(2.62429*NEIGH_TEND_16X16 + 0.5),
	(int)(2.91455*NEIGH_TEND_16X16 + 0.5), (int)(3.23253*NEIGH_TEND_16X16 + 0.5),
	(int)(3.58158*NEIGH_TEND_16X16 + 0.5), (int)(3.96555*NEIGH_TEND_16X16 + 0.5),
	(int)(4.38887*NEIGH_TEND_16X16 + 0.5), (int)(4.85673*NEIGH_TEND_16X16 + 0.5),
	(int)(5.37519*NEIGH_TEND_16X16 + 0.5), (int)(5.95144*NEIGH_TEND_16X16 + 0.5),
	(int)(6.59408*NEIGH_TEND_16X16 + 0.5), (int)(7.31349*NEIGH_TEND_16X16 + 0.5),
	(int)(8.12242*NEIGH_TEND_16X16 + 0.5), (int)(9.03669*NEIGH_TEND_16X16 + 0.5),
	(int)(10.0763*NEIGH_TEND_16X16 + 0.5), (int)(11.2669*NEIGH_TEND_16X16 + 0.5),
	(int)(12.6426*NEIGH_TEND_16X16 + 0.5), (int)(14.2493*NEIGH_TEND_16X16 + 0.5),
	(int)(16.1512*NEIGH_TEND_16X16 + 0.5), (int)(18.442*NEIGH_TEND_16X16 + 0.5),
	(int)(21.2656*NEIGH_TEND_16X16 + 0.5), (int)(24.8580*NEIGH_TEND_16X16 + 0.5),
	(int)(29.6436*NEIGH_TEND_16X16 + 0.5), (int)(36.4949*NEIGH_TEND_16X16 + 0.5)	};

/*
 * lambda_vec8[i] = (int)(factor[i] * NEIGH_TEND_8X8 + 0.5), entry 0 is 0.
 * Entry 2 previously read "1.15582 + NEIGH_TEND_8X8" (addition instead of
 * multiplication), which produced 41 instead of 46 and broke the pattern
 * followed by every other entry of both tables.
 * NOTE(review): presumably indexed by quantizer value -- confirm against the
 * code that fills SearchData.lambda8.
 */
static const int lambda_vec8[32] =
	{     0    ,(int)(1.00235 * NEIGH_TEND_8X8 + 0.5),
	(int)(1.15582*NEIGH_TEND_8X8 + 0.5), (int)(1.31976*NEIGH_TEND_8X8 + 0.5),
	(int)(1.49591*NEIGH_TEND_8X8 + 0.5), (int)(1.68601*NEIGH_TEND_8X8 + 0.5),
	(int)(1.89187*NEIGH_TEND_8X8 + 0.5), (int)(2.11542*NEIGH_TEND_8X8 + 0.5),
	(int)(2.35878*NEIGH_TEND_8X8 + 0.5), (int)(2.62429*NEIGH_TEND_8X8 + 0.5),
	(int)(2.91455*NEIGH_TEND_8X8 + 0.5), (int)(3.23253*NEIGH_TEND_8X8 + 0.5),
	(int)(3.58158*NEIGH_TEND_8X8 + 0.5), (int)(3.96555*NEIGH_TEND_8X8 + 0.5),
	(int)(4.38887*NEIGH_TEND_8X8 + 0.5), (int)(4.85673*NEIGH_TEND_8X8 + 0.5),
	(int)(5.37519*NEIGH_TEND_8X8 + 0.5), (int)(5.95144*NEIGH_TEND_8X8 + 0.5),
	(int)(6.59408*NEIGH_TEND_8X8 + 0.5), (int)(7.31349*NEIGH_TEND_8X8 + 0.5),
	(int)(8.12242*NEIGH_TEND_8X8 + 0.5), (int)(9.03669*NEIGH_TEND_8X8 + 0.5),
	(int)(10.0763*NEIGH_TEND_8X8 + 0.5), (int)(11.2669*NEIGH_TEND_8X8 + 0.5),
	(int)(12.6426*NEIGH_TEND_8X8 + 0.5), (int)(14.2493*NEIGH_TEND_8X8 + 0.5),
	(int)(16.1512*NEIGH_TEND_8X8 + 0.5), (int)(18.442*NEIGH_TEND_8X8 + 0.5),
	(int)(21.2656*NEIGH_TEND_8X8 + 0.5), (int)(24.8580*NEIGH_TEND_8X8 + 0.5),
	(int)(29.6436*NEIGH_TEND_8X8 + 0.5), (int)(36.4949*NEIGH_TEND_8X8 + 0.5)	};
88 :    
/*
 * mv.length table
 *
 * The array has 64 slots but only indices 0..56 carry listed values; the
 * last seven slots are zero.
 * NOTE(review): the zeros at 57..63 were implicit in the original initializer
 * (57 values for 64 slots) -- confirm that callers never index past 56, or
 * that 0 is really the intended value there.
 */
static const int mvtab[64] = {
	 1,  2,  3,  4,  6,  7,  7,  7,		/*  0.. 7 */
	 9,  9,  9, 10, 10, 10, 10, 10,		/*  8..15 */
	10, 10, 10, 10, 10, 10, 10, 10,		/* 16..23 */
	10, 11, 11, 11, 11, 11, 11, 12,		/* 24..31 */
	12, 12, 12, 12, 12, 12, 12, 12,		/* 32..39 */
	12, 12, 12, 12, 12, 12, 12, 12,		/* 40..47 */
	12, 12, 12, 12, 12, 12, 12, 12,		/* 48..55 */
	12,									/* 56     */
	 0,  0,  0,  0,  0,  0,  0			/* 57..63 */
};
98 : edgomez 851
/*
 * Four signed step values: -1, -2, +1, +2.
 * NOTE(review): presumably the quantizer deltas tried during mode decision --
 * confirm against the users of this table.
 */
static const int DQtab[4] = { -1, -2, 1, 2 };
102 :    
/*
 * Halve a value, adding 1 to non-negative inputs and subtracting 1 from
 * negative inputs before the (truncating) division by two.
 * Examples: 3 -> 2, 4 -> 2, -3 -> -2, -4 -> -2, 0 -> 0.
 *
 * Every use of the argument is parenthesized so that expressions with
 * lower-precedence operators (e.g. "1 << 2", "a & b") are scaled as a whole.
 * The argument is expanded more than once: do not pass expressions with
 * side effects.
 */
#define RRV_MV_SCALEDOWN(a)	( (a) >= 0 ? ((a) + 1) / 2 : ((a) - 1) / 2 )
104 :    
105 :     typedef struct
106 :     {
107 : edgomez 1053 /* general fields */
108 : edgomez 851 int max_dx, min_dx, max_dy, min_dy;
109 :     uint32_t rounding;
110 :     VECTOR predMV;
111 :     VECTOR * currentMV;
112 :     VECTOR * currentQMV;
113 :     int32_t * iMinSAD;
114 : edgomez 1053 const uint8_t * RefP[6]; /* N, V, H, HV, cU, cV */
115 : edgomez 851 const uint8_t * CurU;
116 :     const uint8_t * CurV;
117 :     uint8_t * RefQ;
118 :     const uint8_t * Cur;
119 :     uint32_t lambda16;
120 :     uint32_t lambda8;
121 :     uint32_t iEdgedWidth;
122 :     uint32_t iFcode;
123 :     int * temp;
124 :     int qpel, qpel_precision;
125 :     int chroma;
126 :     int rrv;
127 : edgomez 1053
128 :     /* fields for interpolate and direct modes */
129 :     const uint8_t * b_RefP[6]; /* N, V, H, HV, cU, cV */
130 : edgomez 851 VECTOR bpredMV;
131 :     uint32_t bFcode;
132 : edgomez 1053
133 :     /* fields for direct mode */
134 : edgomez 851 VECTOR directmvF[4];
135 :     VECTOR directmvB[4];
136 :     const VECTOR * referencemv;
137 : edgomez 1053
138 :     /* BITS/R-D stuff */
139 : edgomez 959 int16_t * dctSpace;
140 : edgomez 1022 uint32_t iQuant;
141 :     uint32_t quant_type;
142 : edgomez 851
143 :     } SearchData;
144 :    
145 :    
/*
 * Function type of the candidate-check callbacks: receives a candidate
 * position (x, y), a direction value, a pointer through which a direction
 * can be written back, and the current search state.
 */
typedef void(CheckFunc)(const int x, const int y,
					const int Direction, int * const dir,
					const SearchData * const Data);
/*
 * Currently selected candidate-check callback.
 * NOTE(review): this is an object definition (no `extern`, no `static`)
 * placed in a header. Every translation unit that includes this header
 * emits its own tentative definition, which fails to link when common
 * symbols are disabled (e.g. -fno-common). Consider `extern` here plus one
 * definition in a .c file -- needs a check of all includers first.
 */
CheckFunc *CheckCandidate;
150 :    
/*
 * Calculate the min/max range
 * relative to the _MACROBLOCK_ position
 *
 * The basic window is [-R, R-1] with R = 32 << (fcode - 1). When rrv is set
 * both ends go through RRV_MV_SCALEUP() and block_sz is doubled. The window
 * is then clipped against limits derived from the block position:
 *   max_dx <=  s * (width  - x * block_sz)
 *   max_dy <=  s * (height - y * block_sz)
 *   min_dx >= -s * ((x + 1) * block_sz)
 *   min_dy >= -s * ((y + 1) * block_sz)
 * where s is 4 when qpel is non-zero and 2 otherwise.
 *
 * fcode must be at least 1 (it is used as a shift count after subtracting 1).
 */
static void __inline
get_range(int32_t * const min_dx,
		  int32_t * const max_dx,
		  int32_t * const min_dy,
		  int32_t * const max_dy,
		  const uint32_t x,
		  const uint32_t y,
		  uint32_t block_sz, /* block dimension, 8 or 16 */
		  const uint32_t width,
		  const uint32_t height,
		  const uint32_t fcode,
		  const int qpel, /* 1 if the resulting range should be in qpel precision; otherwise 0 */
		  const int rrv)
{
	const int scale = qpel ? 4 : 2;
	const int search_range = 32 << (fcode - 1);
	int upper = search_range - 1;
	int lower = -search_range;
	int bound;

	if (rrv) {
		upper = RRV_MV_SCALEUP(upper);
		lower = RRV_MV_SCALEUP(lower);
		block_sz *= 2;
	}

	/* upper limits */
	bound = scale * (int)(width - x * block_sz);
	*max_dx = MIN(upper, bound);

	bound = scale * (int)(height - y * block_sz);
	*max_dy = MIN(upper, bound);

	/* lower limits */
	bound = -scale * (int)((x + 1) * block_sz);
	*min_dx = MAX(lower, bound);

	bound = -scale * (int)((y + 1) * block_sz);
	*min_dy = MAX(lower, bound);
}
190 :    
/* Function type shared by the three main search routines declared below. */
typedef void MainSearchFunc(int x, int y, const SearchData * const Data, int bDirection);

/*
 * Internal-linkage declarations: because they are `static`, each translation
 * unit including this header must supply its own definitions.
 */
static MainSearchFunc DiamondSearch, AdvDiamondSearch, SquareSearch;

/*
 * Prototype only; the definition is not in this header.
 * Takes a read-only search state (OldData) and a separate writable one (Data).
 * NOTE(review): presumably the 8x8 sub-block search for block index `block`
 * of macroblock (x, y) -- confirm against the definition.
 */
static void Search8(const SearchData * const OldData,
					const int x, const int y,
					const uint32_t MotionFlags,
					const MBParam * const pParam,
					MACROBLOCK * const pMB,
					const MACROBLOCK * const pMBs,
					const int block,
					SearchData * const Data);
203 :    
/*
 * Externally visible entry point; prototype only, returns bool.
 * `current` and `reference` are passed as non-const FRAMEINFO pointers, the
 * IMAGE arguments are read-only.
 * NOTE(review): pRefH / pRefV / pRefHV are presumably the H, V and HV
 * interpolated reference planes; the meaning of the return value and of
 * iLimit is not visible here -- confirm against the definition.
 */
bool
MotionEstimation(MBParam * const pParam,
				 FRAMEINFO * const current,
				 FRAMEINFO * const reference,
				 const IMAGE * const pRefH,
				 const IMAGE * const pRefV,
				 const IMAGE * const pRefHV,
				const IMAGE * const pGMC,
				 const uint32_t iLimit);

/*
 * Internal-linkage prototype; the definition is not in this header.
 * Only pMB and Data are writable through their pointers, all other pointer
 * arguments are read-only.
 * NOTE(review): presumably the per-macroblock search for macroblock (x, y) --
 * confirm against the definition.
 */
static void
SearchP(const IMAGE * const pRef,
		const uint8_t * const pRefH,
		const uint8_t * const pRefV,
		const uint8_t * const pRefHV,
		const IMAGE * const pCur,
		const int x,
		const int y,
		const uint32_t MotionFlags,
		const uint32_t VopFlags,
		const uint32_t VolFlags,
		SearchData * const Data,
		const MBParam * const pParam,
		const MACROBLOCK * const pMBs,
		const MACROBLOCK * const prevMBs,
		MACROBLOCK * const pMB);
230 :    
/*
 * Internal-linkage inline prototype; as it is `static`, each translation
 * unit that calls it must also define it.
 * pMBs and Data are writable, the pixel pointers are read-only.
 */
static __inline void
GMEanalyzeMB (const uint8_t * const pCur,
			const uint8_t * const pRef,
			const uint8_t * const pRefH,
			const uint8_t * const pRefV,
			const uint8_t * const pRefHV,
			const int x,
			const int y,
			const MBParam * const pParam,
			MACROBLOCK * const pMBs,
			SearchData * const Data);

/*
 * Externally visible prototype; returns nothing and takes only read-only
 * pointers, so any result must be stored through data reachable from them.
 * NOTE(review): where the results end up is not visible here -- confirm.
 */
void
GMEanalysis(const MBParam * const pParam,
			const FRAMEINFO * const current,
			const FRAMEINFO * const reference,
			const IMAGE * const pRefH,
			const IMAGE * const pRefV,
			const IMAGE * const pRefHV);



/*
 * Externally visible prototype; returns a WARPPOINTS value by value.
 * pMBs is the only writable pointer argument.
 */
WARPPOINTS
GlobalMotionEst(MACROBLOCK * const pMBs,
				const MBParam * const pParam,
				const FRAMEINFO * const current,
				const FRAMEINFO * const reference,
				const IMAGE * const pRefH,
				const IMAGE * const pRefV,
				const IMAGE * const pRefHV	);


/*
 * Externally visible prototype; returns int.
 * startwp and pMBs are writable, all other pointer arguments are read-only.
 * NOTE(review): presumably refines *startwp in place; the meaning of the
 * return value is not visible here -- confirm against the definition.
 */
int
GlobalMotionEstRefine(WARPPOINTS *const startwp,
				MACROBLOCK * const pMBs,
				const MBParam * const pParam,
				const FRAMEINFO * const current,
				const FRAMEINFO * const reference,
				const IMAGE * const pCurr,
				const IMAGE * const pRef,
				const IMAGE * const pRefH,
				const IMAGE * const pRefV,
				const IMAGE * const pRefHV);




/*
 * Externally visible prototype; returns int.
 * GMCblock is the only writable pointer argument.
 * NOTE(review): presumably a sum-of-absolute-differences for the warp
 * described by wp, with GMCblock as scratch space -- confirm.
 */
int
globalSAD(const WARPPOINTS *const wp,
		  const MBParam * const pParam,
		  const MACROBLOCK * const pMBs,
		  const FRAMEINFO * const current,
		  const IMAGE * const pRef,
		  const IMAGE * const pCurr,
		  uint8_t *const GMCblock);
286 :    
287 : edgomez 851 #define iDiamondSize 2
288 :    
289 :     static __inline uint32_t
290 : suxen_drol 890 MakeGoodMotionFlags(const uint32_t MotionFlags, const uint32_t VopFlags, const uint32_t VolFlags)
291 : edgomez 851 {
292 :     uint32_t Flags = MotionFlags;
293 :    
294 : edgomez 949 if (!(VopFlags & XVID_VOP_MODEDECISION_BITS))
295 :     Flags &= ~(XVID_ME_QUARTERPELREFINE16_BITS+XVID_ME_QUARTERPELREFINE8_BITS+XVID_ME_HALFPELREFINE16_BITS+XVID_ME_HALFPELREFINE8_BITS+XVID_ME_EXTSEARCH_BITS);
296 : edgomez 851
297 : edgomez 949 if (Flags & XVID_ME_EXTSEARCH_BITS)
298 :     Flags |= XVID_ME_HALFPELREFINE16_BITS;
299 : edgomez 851
300 : edgomez 949 if (Flags & XVID_ME_EXTSEARCH_BITS && MotionFlags & XVID_ME_EXTSEARCH8)
301 :     Flags |= XVID_ME_HALFPELREFINE8_BITS;
302 : edgomez 851
303 : edgomez 949 if (Flags & XVID_ME_HALFPELREFINE16_BITS)
304 :     Flags |= XVID_ME_QUARTERPELREFINE16_BITS;
305 : edgomez 851
306 : edgomez 949 if (Flags & XVID_ME_HALFPELREFINE8_BITS) {
307 :     Flags |= XVID_ME_QUARTERPELREFINE8_BITS;
308 :     Flags &= ~XVID_ME_HALFPELREFINE8;
309 : edgomez 851 }
310 :    
311 : edgomez 949 if (Flags & XVID_ME_QUARTERPELREFINE8_BITS)
312 :     Flags &= ~XVID_ME_QUARTERPELREFINE8;
313 : edgomez 851
314 : edgomez 949 if (!(VolFlags & XVID_VOL_QUARTERPEL))
315 :     Flags &= ~(XVID_ME_QUARTERPELREFINE16+XVID_ME_QUARTERPELREFINE8+XVID_ME_QUARTERPELREFINE16_BITS+XVID_ME_QUARTERPELREFINE8_BITS);
316 : edgomez 851
317 : edgomez 949 if (!(VopFlags & XVID_VOP_HALFPEL))
318 :     Flags &= ~(XVID_ME_EXTSEARCH16+XVID_ME_HALFPELREFINE16+XVID_ME_HALFPELREFINE8+XVID_ME_HALFPELREFINE16_BITS+XVID_ME_HALFPELREFINE8_BITS);
319 : edgomez 851
320 : edgomez 949 if ((VopFlags & XVID_VOP_GREYSCALE) || (VopFlags & XVID_VOP_REDUCED))
321 :     Flags &= ~(XVID_ME_CHROMA16 + XVID_ME_CHROMA8);
322 : edgomez 851
323 :     return Flags;
324 :     }
325 :    
326 :     /* BITS mode decision and search */
327 :    
328 :     #include "../bitstream/zigzag.h"
329 :     #include "../quant/quant_mpeg4.h"
330 :     #include "../quant/quant_h263.h"
331 :     #include "../bitstream/vlc_codes.h"
332 : edgomez 1022 #include "../dct/fdct.h"
333 : edgomez 851
/*
 * Internal-linkage prototypes of the three CountMBBits* routines; the
 * definitions are not in this header. Each returns int.
 * NOTE(review): presumably each returns the cost of coding the macroblock in
 * the named mode (inter, inter4v, intra) -- confirm unit and scaling against
 * the definitions.
 */
static int
CountMBBitsInter(SearchData * const Data,
				const MACROBLOCK * const pMBs, const int x, const int y,
				const MBParam * const pParam,
				const uint32_t MotionFlags);

static int
CountMBBitsInter4v(const SearchData * const Data,
					MACROBLOCK * const pMB, const MACROBLOCK * const pMBs,
					const int x, const int y,
					const MBParam * const pParam, const uint32_t MotionFlags,
					const VECTOR * const backup);

static int
CountMBBitsIntra(const SearchData * const Data);

/*
 * Externally visible prototypes. Both take 64 quantized coefficients and a
 * scan table and return int; Block_CalcBits() and Block_CalcBitsIntra()
 * multiply the result by BITS_MULT.
 */
int CodeCoeffIntra_CalcBits(const int16_t qcoeff[64], const uint16_t * zigzag);
int CodeCoeffInter_CalcBits(const int16_t qcoeff[64], const uint16_t * zigzag);
352 : edgomez 1023
353 : syskin 1075 /* one over lambda for R-D mode decision and motion search */
354 :     #define LAMBDA ( (int)(BITS_MULT/1.0) )
355 : edgomez 1023
356 : edgomez 1022 static __inline unsigned int
357 : edgomez 1023 Block_CalcBits( int16_t * const coeff,
358 :     int16_t * const data,
359 : syskin 1075 int16_t * const dqcoeff,
360 : edgomez 1023 const uint32_t quant, const int quant_type,
361 :     uint32_t * cbp,
362 :     const int block)
363 : edgomez 1022 {
364 :     int sum;
365 : edgomez 1023 int bits;
366 :     int distortion = 0;
367 :     int i;
368 : edgomez 851
369 : edgomez 1022 fdct(data);
370 :    
371 :     if (quant_type == 0) sum = quant_inter(coeff, data, quant);
372 :     else sum = quant4_inter(coeff, data, quant);
373 :    
374 :     if (sum > 0) {
375 :     *cbp |= 1 << (5 - block);
376 : edgomez 1023 bits = BITS_MULT * CodeCoeffInter_CalcBits(coeff, scan_tables[0]);
377 :     } else bits = 0;
378 :    
379 : syskin 1075 if (quant_type == 0) dequant_inter(dqcoeff, coeff, quant);
380 :     else dequant4_inter(dqcoeff, coeff, quant);
381 : edgomez 1023
382 :     for (i = 0; i < 64; i++) {
383 : syskin 1075 distortion += (data[i] - dqcoeff[i])*(data[i] - dqcoeff[i]);
384 : edgomez 1023 }
385 :    
386 : syskin 1075 bits += (LAMBDA*distortion)/(quant*quant);
387 : edgomez 1023
388 :     return bits;
389 : edgomez 1022 }
390 :    
391 : edgomez 1023 static __inline unsigned int
392 :     Block_CalcBitsIntra(int16_t * const coeff,
393 :     int16_t * const data,
394 : syskin 1075 int16_t * const dqcoeff,
395 : edgomez 1023 const uint32_t quant, const int quant_type,
396 :     uint32_t * cbp,
397 :     const int block,
398 :     int * dcpred)
399 :     {
400 :     int bits, i;
401 :     int distortion = 0;
402 : syskin 1071 uint32_t iDcScaler = get_dc_scaler(quant, block < 4);
403 : edgomez 1023 int b_dc;
404 :    
405 :     fdct(data);
406 :     data[0] -= 1024;
407 :    
408 : syskin 1075 if (quant_type == 0) quant_intra(coeff, data, quant, iDcScaler);
409 :     else quant4_intra(coeff, data, quant, iDcScaler);
410 : edgomez 1023
411 :     b_dc = coeff[0];
412 :     if (block < 4) {
413 :     coeff[0] -= *dcpred;
414 :     *dcpred = b_dc;
415 :     }
416 :    
417 :     bits = BITS_MULT*CodeCoeffIntra_CalcBits(coeff, scan_tables[0]);
418 :     if (bits != 0) *cbp |= 1 << (5 - block);
419 :    
420 : syskin 1071 if (block < 4) bits += BITS_MULT*dcy_tab[coeff[0] + 255].len;
421 :     else bits += BITS_MULT*dcc_tab[coeff[0] + 255].len;
422 :    
423 : edgomez 1023 coeff[0] = b_dc;
424 : syskin 1075 if (quant_type == 0) dequant_intra(dqcoeff, coeff, quant, iDcScaler);
425 :     else dequant4_intra(dqcoeff, coeff, quant, iDcScaler);
426 : edgomez 1023
427 :     for (i = 0; i < 64; i++) {
428 : syskin 1075 distortion += (data[i] - dqcoeff[i])*(data[i] - dqcoeff[i]);
429 : edgomez 1023 }
430 :    
431 : syskin 1075 bits += (LAMBDA*distortion)/(quant*quant);
432 : edgomez 1023
433 :     return bits;
434 :     }
435 :    
436 : edgomez 851 #endif /* _MOTION_EST_H_ */

No admin address has been configured
ViewVC Help
Powered by ViewVC 1.0.4