[svn] / branches / dev-api-4 / xvidcore / src / motion / motion_est.h Repository:
ViewVC logotype

Annotation of /branches/dev-api-4/xvidcore/src/motion/motion_est.h

Parent Directory Parent Directory | Revision Log Revision Log


Revision 1071 - (view) (download)

1 : edgomez 1054 /*****************************************************************************
2 : edgomez 851 *
3 :     * XVID MPEG-4 VIDEO CODEC
4 : edgomez 1054 * - Motion Estimation related header -
5 : edgomez 851 *
6 : edgomez 1054 * Copyright(C) 2002 Christoph Lampert <gruel@web.de>
7 :     * 2002 Michael Militzer <michael@xvid.org>
8 :     * 2002-2003 Radoslaw Czyz <xvid@syskin.cjb.net>
9 : edgomez 851 *
10 : edgomez 1054 * This program is free software ; you can redistribute it and/or modify
11 : edgomez 851 * it under the terms of the GNU General Public License as published by
12 : edgomez 1054 * the Free Software Foundation ; either version 2 of the License, or
13 : edgomez 851 * (at your option) any later version.
14 :     *
15 :     * This program is distributed in the hope that it will be useful,
16 : edgomez 1054 * but WITHOUT ANY WARRANTY ; without even the implied warranty of
17 : edgomez 851 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
18 :     * GNU General Public License for more details.
19 :     *
20 :     * You should have received a copy of the GNU General Public License
21 : edgomez 1054 * along with this program ; if not, write to the Free Software
22 : edgomez 851 * Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA 02111-1307 USA
23 :     *
24 : syskin 1071 * $Id: motion_est.h,v 1.3.2.10 2003-06-19 09:59:37 syskin Exp $
25 : edgomez 851 *
26 : edgomez 1054 ****************************************************************************/
27 : edgomez 851
28 :     #ifndef _MOTION_EST_H_
29 :     #define _MOTION_EST_H_
30 :    
31 :     #include "../portab.h"
32 :     #include "../global.h"
33 :     #include "../image/reduced.h"
34 :    
/* hard coded motion search parameters for motion_est and smp_motion_est */

/* very large value */
#define MV_MAX_ERROR	(4096 * 256)

/* INTER bias for INTER/INTRA decision; mpeg4 spec suggests 2*nb */
#define MV16_INTER_BIAS	512

/* vector map (vlc delta size) smoother parameters ! float !*/
#define NEIGH_TEND_16X16	10.5
#define NEIGH_TEND_8X8		40.0
#define NEIGH_8X8_BIAS		30

#define BITS_MULT			16

/* Parameters which control inter/inter4v decision */
#define IMV16X16			2

/*
 * lambda_vec16[i] == (int)(c[i] * NEIGH_TEND_16X16 + 0.5) for i >= 1, i.e. a
 * fixed coefficient curve scaled by the 16x16 smoother parameter and rounded
 * to the nearest integer. Entry 0 is 0.
 * NOTE(review): presumably indexed by quantizer (0..31) - confirm in callers.
 */
static const int lambda_vec16[32] = {
	0,
	(int)(1.00235 * NEIGH_TEND_16X16 + 0.5),
	(int)(1.15582 * NEIGH_TEND_16X16 + 0.5),
	(int)(1.31976 * NEIGH_TEND_16X16 + 0.5),
	(int)(1.49591 * NEIGH_TEND_16X16 + 0.5),
	(int)(1.68601 * NEIGH_TEND_16X16 + 0.5),
	(int)(1.89187 * NEIGH_TEND_16X16 + 0.5),
	(int)(2.11542 * NEIGH_TEND_16X16 + 0.5),
	(int)(2.35878 * NEIGH_TEND_16X16 + 0.5),
	(int)(2.62429 * NEIGH_TEND_16X16 + 0.5),
	(int)(2.91455 * NEIGH_TEND_16X16 + 0.5),
	(int)(3.23253 * NEIGH_TEND_16X16 + 0.5),
	(int)(3.58158 * NEIGH_TEND_16X16 + 0.5),
	(int)(3.96555 * NEIGH_TEND_16X16 + 0.5),
	(int)(4.38887 * NEIGH_TEND_16X16 + 0.5),
	(int)(4.85673 * NEIGH_TEND_16X16 + 0.5),
	(int)(5.37519 * NEIGH_TEND_16X16 + 0.5),
	(int)(5.95144 * NEIGH_TEND_16X16 + 0.5),
	(int)(6.59408 * NEIGH_TEND_16X16 + 0.5),
	(int)(7.31349 * NEIGH_TEND_16X16 + 0.5),
	(int)(8.12242 * NEIGH_TEND_16X16 + 0.5),
	(int)(9.03669 * NEIGH_TEND_16X16 + 0.5),
	(int)(10.0763 * NEIGH_TEND_16X16 + 0.5),
	(int)(11.2669 * NEIGH_TEND_16X16 + 0.5),
	(int)(12.6426 * NEIGH_TEND_16X16 + 0.5),
	(int)(14.2493 * NEIGH_TEND_16X16 + 0.5),
	(int)(16.1512 * NEIGH_TEND_16X16 + 0.5),
	(int)(18.442 * NEIGH_TEND_16X16 + 0.5),
	(int)(21.2656 * NEIGH_TEND_16X16 + 0.5),
	(int)(24.8580 * NEIGH_TEND_16X16 + 0.5),
	(int)(29.6436 * NEIGH_TEND_16X16 + 0.5),
	(int)(36.4949 * NEIGH_TEND_16X16 + 0.5)
};

/*
 * Same coefficient curve as lambda_vec16, scaled by NEIGH_TEND_8X8.
 * Every entry multiplies the coefficient by the smoother parameter; entry 2
 * used to add it instead (giving 41 rather than 46), which broke the
 * otherwise parallel construction of the two tables.
 */
static const int lambda_vec8[32] = {
	0,
	(int)(1.00235 * NEIGH_TEND_8X8 + 0.5),
	(int)(1.15582 * NEIGH_TEND_8X8 + 0.5),
	(int)(1.31976 * NEIGH_TEND_8X8 + 0.5),
	(int)(1.49591 * NEIGH_TEND_8X8 + 0.5),
	(int)(1.68601 * NEIGH_TEND_8X8 + 0.5),
	(int)(1.89187 * NEIGH_TEND_8X8 + 0.5),
	(int)(2.11542 * NEIGH_TEND_8X8 + 0.5),
	(int)(2.35878 * NEIGH_TEND_8X8 + 0.5),
	(int)(2.62429 * NEIGH_TEND_8X8 + 0.5),
	(int)(2.91455 * NEIGH_TEND_8X8 + 0.5),
	(int)(3.23253 * NEIGH_TEND_8X8 + 0.5),
	(int)(3.58158 * NEIGH_TEND_8X8 + 0.5),
	(int)(3.96555 * NEIGH_TEND_8X8 + 0.5),
	(int)(4.38887 * NEIGH_TEND_8X8 + 0.5),
	(int)(4.85673 * NEIGH_TEND_8X8 + 0.5),
	(int)(5.37519 * NEIGH_TEND_8X8 + 0.5),
	(int)(5.95144 * NEIGH_TEND_8X8 + 0.5),
	(int)(6.59408 * NEIGH_TEND_8X8 + 0.5),
	(int)(7.31349 * NEIGH_TEND_8X8 + 0.5),
	(int)(8.12242 * NEIGH_TEND_8X8 + 0.5),
	(int)(9.03669 * NEIGH_TEND_8X8 + 0.5),
	(int)(10.0763 * NEIGH_TEND_8X8 + 0.5),
	(int)(11.2669 * NEIGH_TEND_8X8 + 0.5),
	(int)(12.6426 * NEIGH_TEND_8X8 + 0.5),
	(int)(14.2493 * NEIGH_TEND_8X8 + 0.5),
	(int)(16.1512 * NEIGH_TEND_8X8 + 0.5),
	(int)(18.442 * NEIGH_TEND_8X8 + 0.5),
	(int)(21.2656 * NEIGH_TEND_8X8 + 0.5),
	(int)(24.8580 * NEIGH_TEND_8X8 + 0.5),
	(int)(29.6436 * NEIGH_TEND_8X8 + 0.5),
	(int)(36.4949 * NEIGH_TEND_8X8 + 0.5)
};
88 :    
/*
 * mv.length table.
 * Only the first 57 of the 64 slots carry an explicit initialiser; the
 * remaining slots (57..63) are zero, as C guarantees for a partially
 * initialised array.
 */
static const int mvtab[64] = {
	/*  0.. 7 */  1,  2,  3,  4,  6,  7,  7,  7,
	/*  8..15 */  9,  9,  9, 10, 10, 10, 10, 10,
	/* 16..23 */ 10, 10, 10, 10, 10, 10, 10, 10,
	/* 24..31 */ 10, 11, 11, 11, 11, 11, 11, 12,
	/* 32..39 */ 12, 12, 12, 12, 12, 12, 12, 12,
	/* 40..47 */ 12, 12, 12, 12, 12, 12, 12, 12,
	/* 48..56 */ 12, 12, 12, 12, 12, 12, 12, 12, 12
};
98 : edgomez 851
/* Four signed steps: -1, -2, +1, +2 (presumably quantizer deltas - confirm in callers). */
static const int DQtab[4] = { -1, -2, 1, 2 };
102 :    
/*
 * Halve a signed value, rounding halves away from zero
 * (3 -> 2, 1 -> 1, -1 -> -1, -3 -> -2).
 * Every use of the argument is parenthesised so that expressions with
 * low-precedence operators (e.g. `a | b`, `c ? x : y`) expand correctly.
 * The argument is still evaluated twice: do not pass expressions with
 * side effects.
 */
#define RRV_MV_SCALEDOWN(a)	( (a) >= 0 ? ((a) + 1) / 2 : ((a) - 1) / 2 )
104 :    
105 :     typedef struct
106 :     {
107 : edgomez 1053 /* general fields */
108 : edgomez 851 int max_dx, min_dx, max_dy, min_dy;
109 :     uint32_t rounding;
110 :     VECTOR predMV;
111 :     VECTOR * currentMV;
112 :     VECTOR * currentQMV;
113 :     int32_t * iMinSAD;
114 : edgomez 1053 const uint8_t * RefP[6]; /* N, V, H, HV, cU, cV */
115 : edgomez 851 const uint8_t * CurU;
116 :     const uint8_t * CurV;
117 :     uint8_t * RefQ;
118 :     const uint8_t * Cur;
119 :     uint32_t lambda16;
120 :     uint32_t lambda8;
121 :     uint32_t iEdgedWidth;
122 :     uint32_t iFcode;
123 :     int * temp;
124 :     int qpel, qpel_precision;
125 :     int chroma;
126 :     int rrv;
127 : edgomez 1053
128 :     /* fields for interpolate and direct modes */
129 :     const uint8_t * b_RefP[6]; /* N, V, H, HV, cU, cV */
130 : edgomez 851 VECTOR bpredMV;
131 :     uint32_t bFcode;
132 : edgomez 1053
133 :     /* fields for direct mode */
134 : edgomez 851 VECTOR directmvF[4];
135 :     VECTOR directmvB[4];
136 :     const VECTOR * referencemv;
137 : edgomez 1053
138 :     /* BITS/R-D stuff */
139 : edgomez 959 int16_t * dctSpace;
140 : edgomez 1022 uint32_t iQuant;
141 :     uint32_t quant_type;
142 : edgomez 851
143 :     } SearchData;
144 :    
145 :    
146 :     typedef void(CheckFunc)(const int x, const int y,
147 :     const int Direction, int * const dir,
148 :     const SearchData * const Data);
149 :     CheckFunc *CheckCandidate;
150 :    
/*
 * Calculate the min/max range
 * relative to the _MACROBLOCK_ position.
 *
 * The vector range allowed by fcode is [-(32 << (fcode-1)), (32 << (fcode-1)) - 1];
 * it is passed through RRV_MV_SCALEUP when rrv is set, in which case the
 * block size is doubled as well. That range is then clipped against limits
 * derived from the block position (x, y), the block size and the picture
 * width/height, scaled by 4 when qpel is set and by 2 otherwise.
 *
 * fcode must be at least 1 (it is used as a shift count minus one).
 * Results are stored through min_dx / max_dx / min_dy / max_dy.
 */
static void __inline
get_range(int32_t * const min_dx,
		  int32_t * const max_dx,
		  int32_t * const min_dy,
		  int32_t * const max_dy,
		  const uint32_t x,
		  const uint32_t y,
		  uint32_t block_sz, /* block dimension, 8 or 16 */
		  const uint32_t width,
		  const uint32_t height,
		  const uint32_t fcode,
		  const int qpel, /* 1 if the resulting range should be in qpel precision; otherwise 0 */
		  const int rrv)
{
	const int scale = qpel ? 4 : 2;
	const int search_range = 32 << (fcode - 1);
	int upper = search_range - 1;
	int lower = -search_range;
	int limit;

	if (rrv) {
		upper = RRV_MV_SCALEUP(upper);
		lower = RRV_MV_SCALEUP(lower);
		block_sz *= 2;
	}

	/* positive limits: distance from the block origin to width / height */
	limit = scale * (int)(width - x * block_sz);
	*max_dx = MIN(upper, limit);
	limit = scale * (int)(height - y * block_sz);
	*max_dy = MIN(upper, limit);

	/* negative limits: one block beyond the picture origin */
	limit = -scale * (int)((x + 1) * block_sz);
	*min_dx = MAX(lower, limit);
	limit = -scale * (int)((y + 1) * block_sz);
	*min_dy = MAX(lower, limit);
}
190 :    
191 :     typedef void MainSearchFunc(int x, int y, const SearchData * const Data, int bDirection);
192 :    
193 :     static MainSearchFunc DiamondSearch, AdvDiamondSearch, SquareSearch;
194 :    
195 :     static void Search8(const SearchData * const OldData,
196 :     const int x, const int y,
197 :     const uint32_t MotionFlags,
198 :     const MBParam * const pParam,
199 :     MACROBLOCK * const pMB,
200 :     const MACROBLOCK * const pMBs,
201 :     const int block,
202 :     SearchData * const Data);
203 :    
204 :     bool
205 :     MotionEstimation(MBParam * const pParam,
206 : syskin 884 FRAMEINFO * const current,
207 :     FRAMEINFO * const reference,
208 :     const IMAGE * const pRefH,
209 :     const IMAGE * const pRefV,
210 :     const IMAGE * const pRefHV,
211 :     const uint32_t iLimit);
212 : edgomez 851
213 :     static void
214 :     SearchP(const IMAGE * const pRef,
215 :     const uint8_t * const pRefH,
216 :     const uint8_t * const pRefV,
217 :     const uint8_t * const pRefHV,
218 :     const IMAGE * const pCur,
219 :     const int x,
220 :     const int y,
221 :     const uint32_t MotionFlags,
222 : edgomez 1022 const uint32_t VopFlags,
223 :     const uint32_t VolFlags,
224 : edgomez 851 SearchData * const Data,
225 :     const MBParam * const pParam,
226 :     const MACROBLOCK * const pMBs,
227 :     const MACROBLOCK * const prevMBs,
228 :     MACROBLOCK * const pMB);
229 :    
230 :     static WARPPOINTS
231 :     GlobalMotionEst(const MACROBLOCK * const pMBs,
232 :     const MBParam * const pParam,
233 :     const FRAMEINFO * const current,
234 :     const FRAMEINFO * const reference,
235 :     const IMAGE * const pRefH,
236 :     const IMAGE * const pRefV,
237 :     const IMAGE * const pRefHV );
238 :    
239 :     #define iDiamondSize 2
240 :    
241 :     static __inline uint32_t
242 : suxen_drol 890 MakeGoodMotionFlags(const uint32_t MotionFlags, const uint32_t VopFlags, const uint32_t VolFlags)
243 : edgomez 851 {
244 :     uint32_t Flags = MotionFlags;
245 :    
246 : edgomez 949 if (!(VopFlags & XVID_VOP_MODEDECISION_BITS))
247 :     Flags &= ~(XVID_ME_QUARTERPELREFINE16_BITS+XVID_ME_QUARTERPELREFINE8_BITS+XVID_ME_HALFPELREFINE16_BITS+XVID_ME_HALFPELREFINE8_BITS+XVID_ME_EXTSEARCH_BITS);
248 : edgomez 851
249 : edgomez 949 if (Flags & XVID_ME_EXTSEARCH_BITS)
250 :     Flags |= XVID_ME_HALFPELREFINE16_BITS;
251 : edgomez 851
252 : edgomez 949 if (Flags & XVID_ME_EXTSEARCH_BITS && MotionFlags & XVID_ME_EXTSEARCH8)
253 :     Flags |= XVID_ME_HALFPELREFINE8_BITS;
254 : edgomez 851
255 : edgomez 949 if (Flags & XVID_ME_HALFPELREFINE16_BITS)
256 :     Flags |= XVID_ME_QUARTERPELREFINE16_BITS;
257 : edgomez 851
258 : edgomez 949 if (Flags & XVID_ME_HALFPELREFINE8_BITS) {
259 :     Flags |= XVID_ME_QUARTERPELREFINE8_BITS;
260 :     Flags &= ~XVID_ME_HALFPELREFINE8;
261 : edgomez 851 }
262 :    
263 : edgomez 949 if (Flags & XVID_ME_QUARTERPELREFINE8_BITS)
264 :     Flags &= ~XVID_ME_QUARTERPELREFINE8;
265 : edgomez 851
266 : edgomez 949 if (!(VolFlags & XVID_VOL_QUARTERPEL))
267 :     Flags &= ~(XVID_ME_QUARTERPELREFINE16+XVID_ME_QUARTERPELREFINE8+XVID_ME_QUARTERPELREFINE16_BITS+XVID_ME_QUARTERPELREFINE8_BITS);
268 : edgomez 851
269 : edgomez 949 if (!(VopFlags & XVID_VOP_HALFPEL))
270 :     Flags &= ~(XVID_ME_EXTSEARCH16+XVID_ME_HALFPELREFINE16+XVID_ME_HALFPELREFINE8+XVID_ME_HALFPELREFINE16_BITS+XVID_ME_HALFPELREFINE8_BITS);
271 : edgomez 851
272 : edgomez 949 if ((VopFlags & XVID_VOP_GREYSCALE) || (VopFlags & XVID_VOP_REDUCED))
273 :     Flags &= ~(XVID_ME_CHROMA16 + XVID_ME_CHROMA8);
274 : edgomez 851
275 :     return Flags;
276 :     }
277 :    
278 :     /* BITS mode decision and search */
279 :    
280 :     #include "../bitstream/zigzag.h"
281 :     #include "../quant/quant_mpeg4.h"
282 :     #include "../quant/quant_h263.h"
283 :     #include "../bitstream/vlc_codes.h"
284 : edgomez 1022 #include "../dct/fdct.h"
285 : edgomez 851
286 :     static int
287 :     CountMBBitsInter(SearchData * const Data,
288 :     const MACROBLOCK * const pMBs, const int x, const int y,
289 :     const MBParam * const pParam,
290 :     const uint32_t MotionFlags);
291 :    
292 :     static int
293 :     CountMBBitsInter4v(const SearchData * const Data,
294 :     MACROBLOCK * const pMB, const MACROBLOCK * const pMBs,
295 :     const int x, const int y,
296 :     const MBParam * const pParam, const uint32_t MotionFlags,
297 :     const VECTOR * const backup);
298 :    
299 :     static int
300 :     CountMBBitsIntra(const SearchData * const Data);
301 :    
/*
 * Externally defined bit counters for a block of 64 quantized coefficients
 * read through the given zigzag scan table (intra and inter variants).
 */
int CodeCoeffIntra_CalcBits(const int16_t qcoeff[64],
							const uint16_t * zigzag);
int CodeCoeffInter_CalcBits(const int16_t qcoeff[64],
							const uint16_t * zigzag);
304 : edgomez 1023
305 :     #define LAMBDA ( (int)(1.0*BITS_MULT) )
306 :    
307 : edgomez 1022 static __inline unsigned int
308 : edgomez 1023 Block_CalcBits( int16_t * const coeff,
309 :     int16_t * const data,
310 :     const uint32_t quant, const int quant_type,
311 :     uint32_t * cbp,
312 :     const int block)
313 : edgomez 1022 {
314 :     int sum;
315 : edgomez 1023 int bits;
316 :     const int lambda = LAMBDA*quant*quant;
317 :     int distortion = 0;
318 :     int i;
319 : edgomez 851
320 : edgomez 1022 fdct(data);
321 :    
322 :     if (quant_type == 0) sum = quant_inter(coeff, data, quant);
323 :     else sum = quant4_inter(coeff, data, quant);
324 :    
325 :     if (sum > 0) {
326 :     *cbp |= 1 << (5 - block);
327 : edgomez 1023 bits = BITS_MULT * CodeCoeffInter_CalcBits(coeff, scan_tables[0]);
328 :     } else bits = 0;
329 :    
330 :     if (quant_type == 0) dequant_inter(coeff, coeff, quant);
331 :     else dequant4_inter(coeff, coeff, quant);
332 :    
333 :     for (i = 0; i < 64; i++) {
334 :     distortion += (data[i] - coeff[i])*(data[i] - coeff[i]);
335 :     }
336 :     bits += (BITS_MULT*BITS_MULT*distortion)/lambda;
337 :    
338 :    
339 :     return bits;
340 : edgomez 1022 }
341 :    
342 : edgomez 1023 static __inline unsigned int
343 :     Block_CalcBitsIntra(int16_t * const coeff,
344 :     int16_t * const data,
345 :     const uint32_t quant, const int quant_type,
346 :     uint32_t * cbp,
347 :     const int block,
348 :     int * dcpred)
349 :     {
350 :     int bits, i;
351 :     const int lambda = LAMBDA*quant*quant;
352 :     int distortion = 0;
353 : syskin 1071 uint32_t iDcScaler = get_dc_scaler(quant, block < 4);
354 : edgomez 1023 int b_dc;
355 :    
356 :     fdct(data);
357 :     data[0] -= 1024;
358 :    
359 : syskin 1071 if (quant_type == 0) quant_intra_c(coeff, data, quant, iDcScaler); // MUST BE _C
360 :     else quant4_intra_c(coeff, data, quant, iDcScaler); // MUST BE _C
361 : edgomez 1023
362 :     b_dc = coeff[0];
363 :     if (block < 4) {
364 :     coeff[0] -= *dcpred;
365 :     *dcpred = b_dc;
366 :     }
367 :    
368 :     bits = BITS_MULT*CodeCoeffIntra_CalcBits(coeff, scan_tables[0]);
369 :     if (bits != 0) *cbp |= 1 << (5 - block);
370 :    
371 : syskin 1071 if (block < 4) bits += BITS_MULT*dcy_tab[coeff[0] + 255].len;
372 :     else bits += BITS_MULT*dcc_tab[coeff[0] + 255].len;
373 :    
374 : edgomez 1023 coeff[0] = b_dc;
375 :     if (quant_type == 0) dequant_intra(coeff, coeff, quant, iDcScaler);
376 :     else dequant4_intra(coeff, coeff, quant, iDcScaler);
377 :    
378 :     for (i = 0; i < 64; i++) {
379 :     distortion += (data[i] - coeff[i])*(data[i] - coeff[i]);
380 :     }
381 :    
382 :     bits += (BITS_MULT*BITS_MULT*distortion)/lambda;
383 :    
384 :     return bits;
385 :     }
386 :    
387 : syskin 1071
388 : edgomez 851 #endif /* _MOTION_EST_H_ */

No admin address has been configured
ViewVC Help
Powered by ViewVC 1.0.4