Parent Directory | Revision Log
Revision 1054 - (view) (download)
/*****************************************************************************
 *
 *  XVID MPEG-4 VIDEO CODEC
 *  - Motion Estimation related header -
 *
 *  Copyright(C) 2002 Christoph Lampert <gruel@web.de>
 *               2002 Michael Militzer <michael@xvid.org>
 *               2002-2003 Radoslaw Czyz <xvid@syskin.cjb.net>
 *
 *  This program is free software ; you can redistribute it and/or modify
 *  it under the terms of the GNU General Public License as published by
 *  the Free Software Foundation ; either version 2 of the License, or
 *  (at your option) any later version.
 *
 *  This program is distributed in the hope that it will be useful,
 *  but WITHOUT ANY WARRANTY ; without even the implied warranty of
 *  MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
 *  GNU General Public License for more details.
 *
 *  You should have received a copy of the GNU General Public License
 *  along with this program ; if not, write to the Free Software
 *  Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA  02111-1307 USA
 *
 * $Id: motion_est.h,v 1.3.2.9 2003-06-09 13:54:41 edgomez Exp $
 *
 ****************************************************************************/
27 : | edgomez | 851 | |
28 : | #ifndef _MOTION_EST_H_ | ||
29 : | #define _MOTION_EST_H_ | ||
30 : | |||
31 : | #include "../portab.h" | ||
32 : | #include "../global.h" | ||
33 : | #include "../image/reduced.h" | ||
34 : | |||
/* Hard-coded motion search parameters for motion_est and smp_motion_est. */

/* Very large error value: 4096 * 256 == 1 << 20 == 1048576. */
#define MV_MAX_ERROR	(1 << 20)

/* Bias towards INTER in the INTER/INTRA decision; the MPEG-4 spec suggests 2*nb. */
#define MV16_INTER_BIAS	512
42 : | |||
/* Vector map (vlc delta size) smoother parameters.  These are floating-point! */
#define NEIGH_TEND_16X16	10.5
#define NEIGH_TEND_8X8		40.0
#define NEIGH_8X8_BIAS		30

#define BITS_MULT			16

/* Parameters which control inter/inter4v decision */
#define IMV16X16			2

/*
 * One lambda table entry: a per-index scale factor multiplied by the
 * smoother parameter for the block size, rounded to the nearest integer.
 * Only needed while the two tables below are being initialised.
 */
#define LAMBDA_ENTRY(scale, tend)	((int)((scale) * (tend) + 0.5))

/*
 * 32-entry lambda table built from NEIGH_TEND_16X16.
 * Entry 0 is 0; entry i is round(scale[i] * NEIGH_TEND_16X16).
 * NOTE(review): presumably indexed by quantizer -- confirm against the users.
 */
static const int lambda_vec16[32] = {
	0,
	LAMBDA_ENTRY(1.00235, NEIGH_TEND_16X16),
	LAMBDA_ENTRY(1.15582, NEIGH_TEND_16X16), LAMBDA_ENTRY(1.31976, NEIGH_TEND_16X16),
	LAMBDA_ENTRY(1.49591, NEIGH_TEND_16X16), LAMBDA_ENTRY(1.68601, NEIGH_TEND_16X16),
	LAMBDA_ENTRY(1.89187, NEIGH_TEND_16X16), LAMBDA_ENTRY(2.11542, NEIGH_TEND_16X16),
	LAMBDA_ENTRY(2.35878, NEIGH_TEND_16X16), LAMBDA_ENTRY(2.62429, NEIGH_TEND_16X16),
	LAMBDA_ENTRY(2.91455, NEIGH_TEND_16X16), LAMBDA_ENTRY(3.23253, NEIGH_TEND_16X16),
	LAMBDA_ENTRY(3.58158, NEIGH_TEND_16X16), LAMBDA_ENTRY(3.96555, NEIGH_TEND_16X16),
	LAMBDA_ENTRY(4.38887, NEIGH_TEND_16X16), LAMBDA_ENTRY(4.85673, NEIGH_TEND_16X16),
	LAMBDA_ENTRY(5.37519, NEIGH_TEND_16X16), LAMBDA_ENTRY(5.95144, NEIGH_TEND_16X16),
	LAMBDA_ENTRY(6.59408, NEIGH_TEND_16X16), LAMBDA_ENTRY(7.31349, NEIGH_TEND_16X16),
	LAMBDA_ENTRY(8.12242, NEIGH_TEND_16X16), LAMBDA_ENTRY(9.03669, NEIGH_TEND_16X16),
	LAMBDA_ENTRY(10.0763, NEIGH_TEND_16X16), LAMBDA_ENTRY(11.2669, NEIGH_TEND_16X16),
	LAMBDA_ENTRY(12.6426, NEIGH_TEND_16X16), LAMBDA_ENTRY(14.2493, NEIGH_TEND_16X16),
	LAMBDA_ENTRY(16.1512, NEIGH_TEND_16X16), LAMBDA_ENTRY(18.442, NEIGH_TEND_16X16),
	LAMBDA_ENTRY(21.2656, NEIGH_TEND_16X16), LAMBDA_ENTRY(24.8580, NEIGH_TEND_16X16),
	LAMBDA_ENTRY(29.6436, NEIGH_TEND_16X16), LAMBDA_ENTRY(36.4949, NEIGH_TEND_16X16)
};

/*
 * 32-entry lambda table built from NEIGH_TEND_8X8, using the same scale
 * factors as lambda_vec16.
 *
 * Entry 2 multiplies its scale factor by NEIGH_TEND_8X8 like every other
 * entry.  It used to add the two, which produced 41 where the progression
 * 40, 46, 53, ... requires 46.
 */
static const int lambda_vec8[32] = {
	0,
	LAMBDA_ENTRY(1.00235, NEIGH_TEND_8X8),
	LAMBDA_ENTRY(1.15582, NEIGH_TEND_8X8), LAMBDA_ENTRY(1.31976, NEIGH_TEND_8X8),
	LAMBDA_ENTRY(1.49591, NEIGH_TEND_8X8), LAMBDA_ENTRY(1.68601, NEIGH_TEND_8X8),
	LAMBDA_ENTRY(1.89187, NEIGH_TEND_8X8), LAMBDA_ENTRY(2.11542, NEIGH_TEND_8X8),
	LAMBDA_ENTRY(2.35878, NEIGH_TEND_8X8), LAMBDA_ENTRY(2.62429, NEIGH_TEND_8X8),
	LAMBDA_ENTRY(2.91455, NEIGH_TEND_8X8), LAMBDA_ENTRY(3.23253, NEIGH_TEND_8X8),
	LAMBDA_ENTRY(3.58158, NEIGH_TEND_8X8), LAMBDA_ENTRY(3.96555, NEIGH_TEND_8X8),
	LAMBDA_ENTRY(4.38887, NEIGH_TEND_8X8), LAMBDA_ENTRY(4.85673, NEIGH_TEND_8X8),
	LAMBDA_ENTRY(5.37519, NEIGH_TEND_8X8), LAMBDA_ENTRY(5.95144, NEIGH_TEND_8X8),
	LAMBDA_ENTRY(6.59408, NEIGH_TEND_8X8), LAMBDA_ENTRY(7.31349, NEIGH_TEND_8X8),
	LAMBDA_ENTRY(8.12242, NEIGH_TEND_8X8), LAMBDA_ENTRY(9.03669, NEIGH_TEND_8X8),
	LAMBDA_ENTRY(10.0763, NEIGH_TEND_8X8), LAMBDA_ENTRY(11.2669, NEIGH_TEND_8X8),
	LAMBDA_ENTRY(12.6426, NEIGH_TEND_8X8), LAMBDA_ENTRY(14.2493, NEIGH_TEND_8X8),
	LAMBDA_ENTRY(16.1512, NEIGH_TEND_8X8), LAMBDA_ENTRY(18.442, NEIGH_TEND_8X8),
	LAMBDA_ENTRY(21.2656, NEIGH_TEND_8X8), LAMBDA_ENTRY(24.8580, NEIGH_TEND_8X8),
	LAMBDA_ENTRY(29.6436, NEIGH_TEND_8X8), LAMBDA_ENTRY(36.4949, NEIGH_TEND_8X8)
};

#undef LAMBDA_ENTRY
88 : | |||
/*
 * mv.length table.
 *
 * The array is declared with 64 elements but only 57 initialisers are
 * listed, so elements 57..63 are implicitly zero.
 * NOTE(review): confirm the zero tail is intended and not a truncated table.
 */
static const int mvtab[64] = {
	/*  0.. 7 */  1,  2,  3,  4,  6,  7,  7,  7,
	/*  8..15 */  9,  9,  9, 10, 10, 10, 10, 10,
	/* 16..23 */ 10, 10, 10, 10, 10, 10, 10, 10,
	/* 24..31 */ 10, 11, 11, 11, 11, 11, 11, 12,
	/* 32..39 */ 12, 12, 12, 12, 12, 12, 12, 12,
	/* 40..47 */ 12, 12, 12, 12, 12, 12, 12, 12,
	/* 48..55 */ 12, 12, 12, 12, 12, 12, 12, 12,
	/* 56     */ 12
};
98 : | edgomez | 851 | |
/* Four-entry table of signed quantizer deltas: -1, -2, +1, +2. */
static const int DQtab[4] = { -1, -2, 1, 2 };
102 : | |||
/*
 * Halve a motion vector component, rounding halves away from zero
 * (3 -> 2, 1 -> 1, -1 -> -1, -3 -> -2).
 *
 * Every use of the argument is parenthesised so that expression arguments
 * such as RRV_MV_SCALEDOWN(x | 1) expand with the intended precedence.
 * The argument is still evaluated more than once: do not pass expressions
 * with side effects.
 */
#define RRV_MV_SCALEDOWN(a)	( (a) >= 0 ? ((a) + 1) / 2 : ((a) - 1) / 2 )
104 : | |||
105 : | typedef struct | ||
106 : | { | ||
107 : | edgomez | 1053 | /* general fields */ |
108 : | edgomez | 851 | int max_dx, min_dx, max_dy, min_dy; |
109 : | uint32_t rounding; | ||
110 : | VECTOR predMV; | ||
111 : | VECTOR * currentMV; | ||
112 : | VECTOR * currentQMV; | ||
113 : | int32_t * iMinSAD; | ||
114 : | edgomez | 1053 | const uint8_t * RefP[6]; /* N, V, H, HV, cU, cV */ |
115 : | edgomez | 851 | const uint8_t * CurU; |
116 : | const uint8_t * CurV; | ||
117 : | uint8_t * RefQ; | ||
118 : | const uint8_t * Cur; | ||
119 : | uint32_t lambda16; | ||
120 : | uint32_t lambda8; | ||
121 : | uint32_t iEdgedWidth; | ||
122 : | uint32_t iFcode; | ||
123 : | int * temp; | ||
124 : | int qpel, qpel_precision; | ||
125 : | int chroma; | ||
126 : | int rrv; | ||
127 : | edgomez | 1053 | |
128 : | /* fields for interpolate and direct modes */ | ||
129 : | const uint8_t * b_RefP[6]; /* N, V, H, HV, cU, cV */ | ||
130 : | edgomez | 851 | VECTOR bpredMV; |
131 : | uint32_t bFcode; | ||
132 : | edgomez | 1053 | |
133 : | /* fields for direct mode */ | ||
134 : | edgomez | 851 | VECTOR directmvF[4]; |
135 : | VECTOR directmvB[4]; | ||
136 : | const VECTOR * referencemv; | ||
137 : | edgomez | 1053 | |
138 : | /* BITS/R-D stuff */ | ||
139 : | edgomez | 959 | int16_t * dctSpace; |
140 : | edgomez | 1022 | uint32_t iQuant; |
141 : | uint32_t quant_type; | ||
142 : | edgomez | 851 | |
143 : | } SearchData; | ||
144 : | |||
145 : | |||
146 : | typedef void(CheckFunc)(const int x, const int y, | ||
147 : | const int Direction, int * const dir, | ||
148 : | const SearchData * const Data); | ||
149 : | CheckFunc *CheckCandidate; | ||
150 : | |||
/*
 * Compute the allowed motion vector range for one block, relative to the
 * _MACROBLOCK_ position.
 *
 * min_dx/max_dx/min_dy/max_dy  receive the resulting limits
 * x, y       block coordinates, in units of block_sz pixels
 * block_sz   block dimension, 8 or 16 (doubled internally when rrv is set)
 * width      picture width in pixels
 * height     picture height in pixels
 * fcode      selects the search range: 32 << (fcode - 1)
 * qpel       1 if the resulting range should be in qpel precision; otherwise 0
 * rrv        non-zero: scale the fcode limits with RRV_MV_SCALEUP
 *
 * Each limit is the tighter of the fcode-derived range and the distance to
 * a bound derived from the block position and the picture size.
 */
static void __inline
get_range(int32_t * const min_dx,
		  int32_t * const max_dx,
		  int32_t * const min_dy,
		  int32_t * const max_dy,
		  const uint32_t x,
		  const uint32_t y,
		  uint32_t block_sz,
		  const uint32_t width,
		  const uint32_t height,
		  const uint32_t fcode,
		  const int qpel,
		  const int rrv)
{
	/* vector units per pixel: 4 when qpel precision is requested, else 2 */
	const int units = qpel ? 4 : 2;
	const int search_range = 32 << (fcode - 1);
	int upper = search_range - 1;
	int lower = -search_range;
	int bound;

	if (rrv) {
		upper = RRV_MV_SCALEUP(upper);
		lower = RRV_MV_SCALEUP(lower);
		block_sz *= 2;
	}

	/* upper limits: distance from the block origin to the picture size */
	bound = units * (int)(width - x * block_sz);
	*max_dx = MIN(upper, bound);

	bound = units * (int)(height - y * block_sz);
	*max_dy = MIN(upper, bound);

	/* lower limits: one block beyond the block origin, negated */
	bound = -units * (int)((x+1) * block_sz);
	*min_dx = MAX(lower, bound);

	bound = -units * (int)((y+1) * block_sz);
	*min_dy = MAX(lower, bound);
}
190 : | |||
191 : | typedef void MainSearchFunc(int x, int y, const SearchData * const Data, int bDirection); | ||
192 : | |||
193 : | static MainSearchFunc DiamondSearch, AdvDiamondSearch, SquareSearch; | ||
194 : | |||
195 : | static void Search8(const SearchData * const OldData, | ||
196 : | const int x, const int y, | ||
197 : | const uint32_t MotionFlags, | ||
198 : | const MBParam * const pParam, | ||
199 : | MACROBLOCK * const pMB, | ||
200 : | const MACROBLOCK * const pMBs, | ||
201 : | const int block, | ||
202 : | SearchData * const Data); | ||
203 : | |||
204 : | bool | ||
205 : | MotionEstimation(MBParam * const pParam, | ||
206 : | syskin | 884 | FRAMEINFO * const current, |
207 : | FRAMEINFO * const reference, | ||
208 : | const IMAGE * const pRefH, | ||
209 : | const IMAGE * const pRefV, | ||
210 : | const IMAGE * const pRefHV, | ||
211 : | const uint32_t iLimit); | ||
212 : | edgomez | 851 | |
213 : | static void | ||
214 : | SearchP(const IMAGE * const pRef, | ||
215 : | const uint8_t * const pRefH, | ||
216 : | const uint8_t * const pRefV, | ||
217 : | const uint8_t * const pRefHV, | ||
218 : | const IMAGE * const pCur, | ||
219 : | const int x, | ||
220 : | const int y, | ||
221 : | const uint32_t MotionFlags, | ||
222 : | edgomez | 1022 | const uint32_t VopFlags, |
223 : | const uint32_t VolFlags, | ||
224 : | edgomez | 851 | SearchData * const Data, |
225 : | const MBParam * const pParam, | ||
226 : | const MACROBLOCK * const pMBs, | ||
227 : | const MACROBLOCK * const prevMBs, | ||
228 : | MACROBLOCK * const pMB); | ||
229 : | |||
230 : | static WARPPOINTS | ||
231 : | GlobalMotionEst(const MACROBLOCK * const pMBs, | ||
232 : | const MBParam * const pParam, | ||
233 : | const FRAMEINFO * const current, | ||
234 : | const FRAMEINFO * const reference, | ||
235 : | const IMAGE * const pRefH, | ||
236 : | const IMAGE * const pRefV, | ||
237 : | const IMAGE * const pRefHV ); | ||
238 : | |||
/*
 * Diamond size constant.
 * NOTE(review): presumably the step used by the diamond search routines;
 * its users are not visible in this header.
 */
#define iDiamondSize	2
240 : | |||
241 : | static __inline uint32_t | ||
242 : | suxen_drol | 890 | MakeGoodMotionFlags(const uint32_t MotionFlags, const uint32_t VopFlags, const uint32_t VolFlags) |
243 : | edgomez | 851 | { |
244 : | uint32_t Flags = MotionFlags; | ||
245 : | |||
246 : | edgomez | 949 | if (!(VopFlags & XVID_VOP_MODEDECISION_BITS)) |
247 : | Flags &= ~(XVID_ME_QUARTERPELREFINE16_BITS+XVID_ME_QUARTERPELREFINE8_BITS+XVID_ME_HALFPELREFINE16_BITS+XVID_ME_HALFPELREFINE8_BITS+XVID_ME_EXTSEARCH_BITS); | ||
248 : | edgomez | 851 | |
249 : | edgomez | 949 | if (Flags & XVID_ME_EXTSEARCH_BITS) |
250 : | Flags |= XVID_ME_HALFPELREFINE16_BITS; | ||
251 : | edgomez | 851 | |
252 : | edgomez | 949 | if (Flags & XVID_ME_EXTSEARCH_BITS && MotionFlags & XVID_ME_EXTSEARCH8) |
253 : | Flags |= XVID_ME_HALFPELREFINE8_BITS; | ||
254 : | edgomez | 851 | |
255 : | edgomez | 949 | if (Flags & XVID_ME_HALFPELREFINE16_BITS) |
256 : | Flags |= XVID_ME_QUARTERPELREFINE16_BITS; | ||
257 : | edgomez | 851 | |
258 : | edgomez | 949 | if (Flags & XVID_ME_HALFPELREFINE8_BITS) { |
259 : | Flags |= XVID_ME_QUARTERPELREFINE8_BITS; | ||
260 : | Flags &= ~XVID_ME_HALFPELREFINE8; | ||
261 : | edgomez | 851 | } |
262 : | |||
263 : | edgomez | 949 | if (Flags & XVID_ME_QUARTERPELREFINE8_BITS) |
264 : | Flags &= ~XVID_ME_QUARTERPELREFINE8; | ||
265 : | edgomez | 851 | |
266 : | edgomez | 949 | if (!(VolFlags & XVID_VOL_QUARTERPEL)) |
267 : | Flags &= ~(XVID_ME_QUARTERPELREFINE16+XVID_ME_QUARTERPELREFINE8+XVID_ME_QUARTERPELREFINE16_BITS+XVID_ME_QUARTERPELREFINE8_BITS); | ||
268 : | edgomez | 851 | |
269 : | edgomez | 949 | if (!(VopFlags & XVID_VOP_HALFPEL)) |
270 : | Flags &= ~(XVID_ME_EXTSEARCH16+XVID_ME_HALFPELREFINE16+XVID_ME_HALFPELREFINE8+XVID_ME_HALFPELREFINE16_BITS+XVID_ME_HALFPELREFINE8_BITS); | ||
271 : | edgomez | 851 | |
272 : | edgomez | 949 | if ((VopFlags & XVID_VOP_GREYSCALE) || (VopFlags & XVID_VOP_REDUCED)) |
273 : | Flags &= ~(XVID_ME_CHROMA16 + XVID_ME_CHROMA8); | ||
274 : | edgomez | 851 | |
275 : | return Flags; | ||
276 : | } | ||
277 : | |||
278 : | /* BITS mode decision and search */ | ||
279 : | |||
280 : | #include "../bitstream/zigzag.h" | ||
281 : | #include "../quant/quant_mpeg4.h" | ||
282 : | #include "../quant/quant_h263.h" | ||
283 : | #include "../bitstream/vlc_codes.h" | ||
284 : | edgomez | 1022 | #include "../dct/fdct.h" |
285 : | edgomez | 851 | |
286 : | static int | ||
287 : | CountMBBitsInter(SearchData * const Data, | ||
288 : | const MACROBLOCK * const pMBs, const int x, const int y, | ||
289 : | const MBParam * const pParam, | ||
290 : | const uint32_t MotionFlags); | ||
291 : | |||
292 : | static int | ||
293 : | CountMBBitsInter4v(const SearchData * const Data, | ||
294 : | MACROBLOCK * const pMB, const MACROBLOCK * const pMBs, | ||
295 : | const int x, const int y, | ||
296 : | const MBParam * const pParam, const uint32_t MotionFlags, | ||
297 : | const VECTOR * const backup); | ||
298 : | |||
299 : | static int | ||
300 : | CountMBBitsIntra(const SearchData * const Data); | ||
301 : | |||
/*
 * Coefficient bit counters (external linkage, defined elsewhere).  Each
 * takes a block of 64 coefficients and a scan table and returns an int;
 * the callers in this header scale that result by BITS_MULT.
 */
int CodeCoeffIntra_CalcBits(const int16_t qcoeff[64], const uint16_t *zigzag);
int CodeCoeffInter_CalcBits(const int16_t qcoeff[64], const uint16_t *zigzag);
304 : | edgomez | 1023 | |
305 : | #define LAMBDA ( (int)(1.0*BITS_MULT) ) | ||
306 : | |||
307 : | edgomez | 1022 | static __inline unsigned int |
308 : | edgomez | 1023 | Block_CalcBits( int16_t * const coeff, |
309 : | int16_t * const data, | ||
310 : | const uint32_t quant, const int quant_type, | ||
311 : | uint32_t * cbp, | ||
312 : | const int block) | ||
313 : | edgomez | 1022 | { |
314 : | int sum; | ||
315 : | edgomez | 1023 | int bits; |
316 : | const int lambda = LAMBDA*quant*quant; | ||
317 : | int distortion = 0; | ||
318 : | int i; | ||
319 : | edgomez | 851 | |
320 : | edgomez | 1022 | fdct(data); |
321 : | |||
322 : | if (quant_type == 0) sum = quant_inter(coeff, data, quant); | ||
323 : | else sum = quant4_inter(coeff, data, quant); | ||
324 : | |||
325 : | if (sum > 0) { | ||
326 : | *cbp |= 1 << (5 - block); | ||
327 : | edgomez | 1023 | bits = BITS_MULT * CodeCoeffInter_CalcBits(coeff, scan_tables[0]); |
328 : | } else bits = 0; | ||
329 : | |||
330 : | if (quant_type == 0) dequant_inter(coeff, coeff, quant); | ||
331 : | else dequant4_inter(coeff, coeff, quant); | ||
332 : | |||
333 : | for (i = 0; i < 64; i++) { | ||
334 : | distortion += (data[i] - coeff[i])*(data[i] - coeff[i]); | ||
335 : | } | ||
336 : | bits += (BITS_MULT*BITS_MULT*distortion)/lambda; | ||
337 : | |||
338 : | |||
339 : | return bits; | ||
340 : | edgomez | 1022 | } |
341 : | |||
342 : | edgomez | 1023 | static __inline unsigned int |
343 : | Block_CalcBitsIntra(int16_t * const coeff, | ||
344 : | int16_t * const data, | ||
345 : | const uint32_t quant, const int quant_type, | ||
346 : | uint32_t * cbp, | ||
347 : | const int block, | ||
348 : | int * dcpred) | ||
349 : | { | ||
350 : | int bits, i; | ||
351 : | const int lambda = LAMBDA*quant*quant; | ||
352 : | int distortion = 0; | ||
353 : | uint32_t iDcScaler = get_dc_scaler(quant, block > 3); | ||
354 : | int b_dc; | ||
355 : | |||
356 : | fdct(data); | ||
357 : | data[0] -= 1024; | ||
358 : | |||
359 : | if (quant_type == 0) quant_intra(coeff, data, quant, iDcScaler); | ||
360 : | else quant4_intra(coeff, data, quant, iDcScaler); | ||
361 : | |||
362 : | b_dc = coeff[0]; | ||
363 : | if (block < 4) { | ||
364 : | coeff[0] -= *dcpred; | ||
365 : | *dcpred = b_dc; | ||
366 : | } | ||
367 : | |||
368 : | *cbp |= 1 << (5 - block); | ||
369 : | bits = BITS_MULT*CodeCoeffIntra_CalcBits(coeff, scan_tables[0]); | ||
370 : | bits += BITS_MULT*dcy_tab[coeff[0] + 255].len; | ||
371 : | if (bits != 0) *cbp |= 1 << (5 - block); | ||
372 : | |||
373 : | coeff[0] = b_dc; | ||
374 : | if (quant_type == 0) dequant_intra(coeff, coeff, quant, iDcScaler); | ||
375 : | else dequant4_intra(coeff, coeff, quant, iDcScaler); | ||
376 : | |||
377 : | for (i = 0; i < 64; i++) { | ||
378 : | distortion += (data[i] - coeff[i])*(data[i] - coeff[i]); | ||
379 : | } | ||
380 : | |||
381 : | bits += (BITS_MULT*BITS_MULT*distortion)/lambda; | ||
382 : | |||
383 : | return bits; | ||
384 : | } | ||
385 : | |||
386 : | edgomez | 851 | #endif /* _MOTION_EST_H_ */ |
No admin address has been configured | ViewVC Help |
Powered by ViewVC 1.0.4 |