Parent Directory | Revision Log
Revision 1053 - (view) (download)
1 : | edgomez | 851 | /************************************************************************** |
2 : | * | ||
3 : | * XVID MPEG-4 VIDEO CODEC | ||
4 : | * - Motion estimation header - | ||
5 : | * | ||
6 : | * This program is an implementation of a part of one or more MPEG-4 | ||
7 : | * Video tools as specified in ISO/IEC 14496-2 standard. Those intending | ||
8 : | * to use this software module in hardware or software products are | ||
9 : | * advised that its use may infringe existing patents or copyrights, and | ||
10 : | * any such use would be at such party's own risk. The original | ||
11 : | * developer of this software module and his/her company, and subsequent | ||
12 : | * editors and their companies, will have no liability for use of this | ||
13 : | * software or modifications or derivatives thereof. | ||
14 : | * | ||
15 : | * This program is free software; you can redistribute it and/or modify | ||
16 : | * it under the terms of the GNU General Public License as published by | ||
17 : | * the Free Software Foundation; either version 2 of the License, or | ||
18 : | * (at your option) any later version. | ||
19 : | * | ||
20 : | * This program is distributed in the hope that it will be useful, | ||
21 : | * but WITHOUT ANY WARRANTY; without even the implied warranty of | ||
22 : | * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the | ||
23 : | * GNU General Public License for more details. | ||
24 : | * | ||
25 : | * You should have received a copy of the GNU General Public License | ||
26 : | * along with this program; if not, write to the Free Software | ||
27 : | * Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA 02111-1307 USA | ||
28 : | * | ||
29 : | edgomez | 1053 | * $Id: motion_est.h,v 1.3.2.8 2003-06-09 01:22:18 edgomez Exp $ |
30 : | edgomez | 851 | * |
31 : | ***************************************************************************/ | ||
32 : | |||
33 : | #ifndef _MOTION_EST_H_ | ||
34 : | #define _MOTION_EST_H_ | ||
35 : | |||
36 : | #include "../portab.h" | ||
37 : | #include "../global.h" | ||
38 : | #include "../image/reduced.h" | ||
39 : | |||
/* hard coded motion search parameters for motion_est and smp_motion_est */

/* very large value */
#define MV_MAX_ERROR	(4096 * 256)

/* INTER bias for INTER/INTRA decision; mpeg4 spec suggests 2*nb */
#define MV16_INTER_BIAS	512

/* vector map (vlc delta size) smoother parameters -- these are floating-point constants */
#define NEIGH_TEND_16X16	10.5
#define NEIGH_TEND_8X8		40.0
#define NEIGH_8X8_BIAS		30

#define BITS_MULT			16

/* Parameters which control inter/inter4v decision */
#define IMV16X16			2

/*
 * Lambda tables, 32 entries each.  Entry 0 is 0; every other entry is a
 * per-index factor multiplied by the matching NEIGH_TEND_* constant and
 * rounded to the nearest integer.  Both tables use the same factor list.
 *
 * ME_LAMBDA_ENTRY exists only while the tables are being built.  Routing
 * every entry through it guarantees that the factor and the tendency
 * constant are always combined by multiplication: lambda_vec8[2] was
 * previously written with '+' instead of '*', which produced 41 where the
 * surrounding entries (40, 53) call for 46.
 */
#define ME_LAMBDA_ENTRY(factor, tend)	((int)((factor) * (tend) + 0.5))

static const int lambda_vec16[32] = {
	0,
	ME_LAMBDA_ENTRY(1.00235, NEIGH_TEND_16X16),
	ME_LAMBDA_ENTRY(1.15582, NEIGH_TEND_16X16),
	ME_LAMBDA_ENTRY(1.31976, NEIGH_TEND_16X16),
	ME_LAMBDA_ENTRY(1.49591, NEIGH_TEND_16X16),
	ME_LAMBDA_ENTRY(1.68601, NEIGH_TEND_16X16),
	ME_LAMBDA_ENTRY(1.89187, NEIGH_TEND_16X16),
	ME_LAMBDA_ENTRY(2.11542, NEIGH_TEND_16X16),
	ME_LAMBDA_ENTRY(2.35878, NEIGH_TEND_16X16),
	ME_LAMBDA_ENTRY(2.62429, NEIGH_TEND_16X16),
	ME_LAMBDA_ENTRY(2.91455, NEIGH_TEND_16X16),
	ME_LAMBDA_ENTRY(3.23253, NEIGH_TEND_16X16),
	ME_LAMBDA_ENTRY(3.58158, NEIGH_TEND_16X16),
	ME_LAMBDA_ENTRY(3.96555, NEIGH_TEND_16X16),
	ME_LAMBDA_ENTRY(4.38887, NEIGH_TEND_16X16),
	ME_LAMBDA_ENTRY(4.85673, NEIGH_TEND_16X16),
	ME_LAMBDA_ENTRY(5.37519, NEIGH_TEND_16X16),
	ME_LAMBDA_ENTRY(5.95144, NEIGH_TEND_16X16),
	ME_LAMBDA_ENTRY(6.59408, NEIGH_TEND_16X16),
	ME_LAMBDA_ENTRY(7.31349, NEIGH_TEND_16X16),
	ME_LAMBDA_ENTRY(8.12242, NEIGH_TEND_16X16),
	ME_LAMBDA_ENTRY(9.03669, NEIGH_TEND_16X16),
	ME_LAMBDA_ENTRY(10.0763, NEIGH_TEND_16X16),
	ME_LAMBDA_ENTRY(11.2669, NEIGH_TEND_16X16),
	ME_LAMBDA_ENTRY(12.6426, NEIGH_TEND_16X16),
	ME_LAMBDA_ENTRY(14.2493, NEIGH_TEND_16X16),
	ME_LAMBDA_ENTRY(16.1512, NEIGH_TEND_16X16),
	ME_LAMBDA_ENTRY(18.442,  NEIGH_TEND_16X16),
	ME_LAMBDA_ENTRY(21.2656, NEIGH_TEND_16X16),
	ME_LAMBDA_ENTRY(24.8580, NEIGH_TEND_16X16),
	ME_LAMBDA_ENTRY(29.6436, NEIGH_TEND_16X16),
	ME_LAMBDA_ENTRY(36.4949, NEIGH_TEND_16X16)
};

static const int lambda_vec8[32] = {
	0,
	ME_LAMBDA_ENTRY(1.00235, NEIGH_TEND_8X8),
	ME_LAMBDA_ENTRY(1.15582, NEIGH_TEND_8X8),	/* was "1.15582 + NEIGH_TEND_8X8" */
	ME_LAMBDA_ENTRY(1.31976, NEIGH_TEND_8X8),
	ME_LAMBDA_ENTRY(1.49591, NEIGH_TEND_8X8),
	ME_LAMBDA_ENTRY(1.68601, NEIGH_TEND_8X8),
	ME_LAMBDA_ENTRY(1.89187, NEIGH_TEND_8X8),
	ME_LAMBDA_ENTRY(2.11542, NEIGH_TEND_8X8),
	ME_LAMBDA_ENTRY(2.35878, NEIGH_TEND_8X8),
	ME_LAMBDA_ENTRY(2.62429, NEIGH_TEND_8X8),
	ME_LAMBDA_ENTRY(2.91455, NEIGH_TEND_8X8),
	ME_LAMBDA_ENTRY(3.23253, NEIGH_TEND_8X8),
	ME_LAMBDA_ENTRY(3.58158, NEIGH_TEND_8X8),
	ME_LAMBDA_ENTRY(3.96555, NEIGH_TEND_8X8),
	ME_LAMBDA_ENTRY(4.38887, NEIGH_TEND_8X8),
	ME_LAMBDA_ENTRY(4.85673, NEIGH_TEND_8X8),
	ME_LAMBDA_ENTRY(5.37519, NEIGH_TEND_8X8),
	ME_LAMBDA_ENTRY(5.95144, NEIGH_TEND_8X8),
	ME_LAMBDA_ENTRY(6.59408, NEIGH_TEND_8X8),
	ME_LAMBDA_ENTRY(7.31349, NEIGH_TEND_8X8),
	ME_LAMBDA_ENTRY(8.12242, NEIGH_TEND_8X8),
	ME_LAMBDA_ENTRY(9.03669, NEIGH_TEND_8X8),
	ME_LAMBDA_ENTRY(10.0763, NEIGH_TEND_8X8),
	ME_LAMBDA_ENTRY(11.2669, NEIGH_TEND_8X8),
	ME_LAMBDA_ENTRY(12.6426, NEIGH_TEND_8X8),
	ME_LAMBDA_ENTRY(14.2493, NEIGH_TEND_8X8),
	ME_LAMBDA_ENTRY(16.1512, NEIGH_TEND_8X8),
	ME_LAMBDA_ENTRY(18.442,  NEIGH_TEND_8X8),
	ME_LAMBDA_ENTRY(21.2656, NEIGH_TEND_8X8),
	ME_LAMBDA_ENTRY(24.8580, NEIGH_TEND_8X8),
	ME_LAMBDA_ENTRY(29.6436, NEIGH_TEND_8X8),
	ME_LAMBDA_ENTRY(36.4949, NEIGH_TEND_8X8)
};

#undef ME_LAMBDA_ENTRY
93 : | |||
/*
 * mv.length table: 64 slots, the first 57 of which are listed explicitly.
 *
 * NOTE(review): slots 57..63 have no initializer and are therefore 0.
 * Confirm that callers never index past 56, or that 0 is the intended
 * value there.
 */
static const int mvtab[64] = {
	/*  0.. 7 */  1,  2,  3,  4,  6,  7,  7,  7,
	/*  8..15 */  9,  9,  9, 10, 10, 10, 10, 10,
	/* 16..23 */ 10, 10, 10, 10, 10, 10, 10, 10,
	/* 24..31 */ 10, 11, 11, 11, 11, 11, 11, 12,
	/* 32..39 */ 12, 12, 12, 12, 12, 12, 12, 12,
	/* 40..47 */ 12, 12, 12, 12, 12, 12, 12, 12,
	/* 48..55 */ 12, 12, 12, 12, 12, 12, 12, 12,
	/* 56     */ 12
};
103 : | edgomez | 851 | |
/* Four-entry table of signed steps: -1, -2, +1, +2 (in that order). */
static const int DQtab[4] = { -1, -2, 1, 2 };
107 : | |||
/*
 * Halve a value, rounding halves away from zero (3 -> 2, -3 -> -2).
 * Every use of the argument is parenthesized so that compound expressions
 * such as `v & 3` are scaled as a whole.  The argument is still evaluated
 * more than once, so it must not have side effects.
 */
#define RRV_MV_SCALEDOWN(a)	( (a) >= 0 ? ((a) + 1) / 2 : ((a) - 1) / 2 )
109 : | |||
110 : | typedef struct | ||
111 : | { | ||
112 : | edgomez | 1053 | /* general fields */ |
113 : | edgomez | 851 | int max_dx, min_dx, max_dy, min_dy; |
114 : | uint32_t rounding; | ||
115 : | VECTOR predMV; | ||
116 : | VECTOR * currentMV; | ||
117 : | VECTOR * currentQMV; | ||
118 : | int32_t * iMinSAD; | ||
119 : | edgomez | 1053 | const uint8_t * RefP[6]; /* N, V, H, HV, cU, cV */ |
120 : | edgomez | 851 | const uint8_t * CurU; |
121 : | const uint8_t * CurV; | ||
122 : | uint8_t * RefQ; | ||
123 : | const uint8_t * Cur; | ||
124 : | uint32_t lambda16; | ||
125 : | uint32_t lambda8; | ||
126 : | uint32_t iEdgedWidth; | ||
127 : | uint32_t iFcode; | ||
128 : | int * temp; | ||
129 : | int qpel, qpel_precision; | ||
130 : | int chroma; | ||
131 : | int rrv; | ||
132 : | edgomez | 1053 | |
133 : | /* fields for interpolate and direct modes */ | ||
134 : | const uint8_t * b_RefP[6]; /* N, V, H, HV, cU, cV */ | ||
135 : | edgomez | 851 | VECTOR bpredMV; |
136 : | uint32_t bFcode; | ||
137 : | edgomez | 1053 | |
138 : | /* fields for direct mode */ | ||
139 : | edgomez | 851 | VECTOR directmvF[4]; |
140 : | VECTOR directmvB[4]; | ||
141 : | const VECTOR * referencemv; | ||
142 : | edgomez | 1053 | |
143 : | /* BITS/R-D stuff */ | ||
144 : | edgomez | 959 | int16_t * dctSpace; |
145 : | edgomez | 1022 | uint32_t iQuant; |
146 : | uint32_t quant_type; | ||
147 : | edgomez | 851 | |
148 : | } SearchData; | ||
149 : | |||
150 : | |||
151 : | typedef void(CheckFunc)(const int x, const int y, | ||
152 : | const int Direction, int * const dir, | ||
153 : | const SearchData * const Data); | ||
154 : | CheckFunc *CheckCandidate; | ||
155 : | |||
/*
 * Calculate the min/max range
 * relative to the _MACROBLOCK_ position
 *
 * The range implied by fcode is [-(32 << (fcode-1)), (32 << (fcode-1)) - 1].
 * It is scaled with RRV_MV_SCALEUP (and the block size doubled) when rrv is
 * set, then clamped against limits derived from the block position (x, y),
 * the block size and the picture dimensions.  The four results are written
 * through min_dx, max_dx, min_dy and max_dy.
 */
static void __inline
get_range(int32_t * const min_dx,
		  int32_t * const max_dx,
		  int32_t * const min_dy,
		  int32_t * const max_dy,
		  const uint32_t x,
		  const uint32_t y,
		  uint32_t block_sz, /* block dimension, 8 or 16 */
		  const uint32_t width,
		  const uint32_t height,
		  const uint32_t fcode,
		  const int qpel, /* 1 if the resulting range should be in qpel precision; otherwise 0 */
		  const int rrv)
{
	/* multiplier applied to pixel distances: 4 in qpel precision, 2 otherwise */
	const int unit = qpel ? 4 : 2;
	const int search_range = 32 << (fcode - 1);
	int upper = search_range - 1;
	int lower = -search_range;
	int bound;

	if (rrv) {
		upper = RRV_MV_SCALEUP(upper);
		lower = RRV_MV_SCALEUP(lower);
		block_sz *= 2;
	}

	/* horizontal limits */
	bound = unit * (int)(width - x * block_sz);
	*max_dx = MIN(upper, bound);
	bound = -unit * (int)((x+1) * block_sz);
	*min_dx = MAX(lower, bound);

	/* vertical limits */
	bound = unit * (int)(height - y * block_sz);
	*max_dy = MIN(upper, bound);
	bound = -unit * (int)((y+1) * block_sz);
	*min_dy = MAX(lower, bound);
}
195 : | |||
196 : | typedef void MainSearchFunc(int x, int y, const SearchData * const Data, int bDirection); | ||
197 : | |||
198 : | static MainSearchFunc DiamondSearch, AdvDiamondSearch, SquareSearch; | ||
199 : | |||
200 : | static void Search8(const SearchData * const OldData, | ||
201 : | const int x, const int y, | ||
202 : | const uint32_t MotionFlags, | ||
203 : | const MBParam * const pParam, | ||
204 : | MACROBLOCK * const pMB, | ||
205 : | const MACROBLOCK * const pMBs, | ||
206 : | const int block, | ||
207 : | SearchData * const Data); | ||
208 : | |||
209 : | bool | ||
210 : | MotionEstimation(MBParam * const pParam, | ||
211 : | syskin | 884 | FRAMEINFO * const current, |
212 : | FRAMEINFO * const reference, | ||
213 : | const IMAGE * const pRefH, | ||
214 : | const IMAGE * const pRefV, | ||
215 : | const IMAGE * const pRefHV, | ||
216 : | const uint32_t iLimit); | ||
217 : | edgomez | 851 | |
218 : | static void | ||
219 : | SearchP(const IMAGE * const pRef, | ||
220 : | const uint8_t * const pRefH, | ||
221 : | const uint8_t * const pRefV, | ||
222 : | const uint8_t * const pRefHV, | ||
223 : | const IMAGE * const pCur, | ||
224 : | const int x, | ||
225 : | const int y, | ||
226 : | const uint32_t MotionFlags, | ||
227 : | edgomez | 1022 | const uint32_t VopFlags, |
228 : | const uint32_t VolFlags, | ||
229 : | edgomez | 851 | SearchData * const Data, |
230 : | const MBParam * const pParam, | ||
231 : | const MACROBLOCK * const pMBs, | ||
232 : | const MACROBLOCK * const prevMBs, | ||
233 : | MACROBLOCK * const pMB); | ||
234 : | |||
235 : | static WARPPOINTS | ||
236 : | GlobalMotionEst(const MACROBLOCK * const pMBs, | ||
237 : | const MBParam * const pParam, | ||
238 : | const FRAMEINFO * const current, | ||
239 : | const FRAMEINFO * const reference, | ||
240 : | const IMAGE * const pRefH, | ||
241 : | const IMAGE * const pRefV, | ||
242 : | const IMAGE * const pRefHV ); | ||
243 : | |||
244 : | #define iDiamondSize 2 | ||
245 : | |||
246 : | static __inline uint32_t | ||
247 : | suxen_drol | 890 | MakeGoodMotionFlags(const uint32_t MotionFlags, const uint32_t VopFlags, const uint32_t VolFlags) |
248 : | edgomez | 851 | { |
249 : | uint32_t Flags = MotionFlags; | ||
250 : | |||
251 : | edgomez | 949 | if (!(VopFlags & XVID_VOP_MODEDECISION_BITS)) |
252 : | Flags &= ~(XVID_ME_QUARTERPELREFINE16_BITS+XVID_ME_QUARTERPELREFINE8_BITS+XVID_ME_HALFPELREFINE16_BITS+XVID_ME_HALFPELREFINE8_BITS+XVID_ME_EXTSEARCH_BITS); | ||
253 : | edgomez | 851 | |
254 : | edgomez | 949 | if (Flags & XVID_ME_EXTSEARCH_BITS) |
255 : | Flags |= XVID_ME_HALFPELREFINE16_BITS; | ||
256 : | edgomez | 851 | |
257 : | edgomez | 949 | if (Flags & XVID_ME_EXTSEARCH_BITS && MotionFlags & XVID_ME_EXTSEARCH8) |
258 : | Flags |= XVID_ME_HALFPELREFINE8_BITS; | ||
259 : | edgomez | 851 | |
260 : | edgomez | 949 | if (Flags & XVID_ME_HALFPELREFINE16_BITS) |
261 : | Flags |= XVID_ME_QUARTERPELREFINE16_BITS; | ||
262 : | edgomez | 851 | |
263 : | edgomez | 949 | if (Flags & XVID_ME_HALFPELREFINE8_BITS) { |
264 : | Flags |= XVID_ME_QUARTERPELREFINE8_BITS; | ||
265 : | Flags &= ~XVID_ME_HALFPELREFINE8; | ||
266 : | edgomez | 851 | } |
267 : | |||
268 : | edgomez | 949 | if (Flags & XVID_ME_QUARTERPELREFINE8_BITS) |
269 : | Flags &= ~XVID_ME_QUARTERPELREFINE8; | ||
270 : | edgomez | 851 | |
271 : | edgomez | 949 | if (!(VolFlags & XVID_VOL_QUARTERPEL)) |
272 : | Flags &= ~(XVID_ME_QUARTERPELREFINE16+XVID_ME_QUARTERPELREFINE8+XVID_ME_QUARTERPELREFINE16_BITS+XVID_ME_QUARTERPELREFINE8_BITS); | ||
273 : | edgomez | 851 | |
274 : | edgomez | 949 | if (!(VopFlags & XVID_VOP_HALFPEL)) |
275 : | Flags &= ~(XVID_ME_EXTSEARCH16+XVID_ME_HALFPELREFINE16+XVID_ME_HALFPELREFINE8+XVID_ME_HALFPELREFINE16_BITS+XVID_ME_HALFPELREFINE8_BITS); | ||
276 : | edgomez | 851 | |
277 : | edgomez | 949 | if ((VopFlags & XVID_VOP_GREYSCALE) || (VopFlags & XVID_VOP_REDUCED)) |
278 : | Flags &= ~(XVID_ME_CHROMA16 + XVID_ME_CHROMA8); | ||
279 : | edgomez | 851 | |
280 : | return Flags; | ||
281 : | } | ||
282 : | |||
283 : | /* BITS mode decision and search */ | ||
284 : | |||
285 : | #include "../bitstream/zigzag.h" | ||
286 : | #include "../quant/quant_mpeg4.h" | ||
287 : | #include "../quant/quant_h263.h" | ||
288 : | #include "../bitstream/vlc_codes.h" | ||
289 : | edgomez | 1022 | #include "../dct/fdct.h" |
290 : | edgomez | 851 | |
291 : | static int | ||
292 : | CountMBBitsInter(SearchData * const Data, | ||
293 : | const MACROBLOCK * const pMBs, const int x, const int y, | ||
294 : | const MBParam * const pParam, | ||
295 : | const uint32_t MotionFlags); | ||
296 : | |||
297 : | static int | ||
298 : | CountMBBitsInter4v(const SearchData * const Data, | ||
299 : | MACROBLOCK * const pMB, const MACROBLOCK * const pMBs, | ||
300 : | const int x, const int y, | ||
301 : | const MBParam * const pParam, const uint32_t MotionFlags, | ||
302 : | const VECTOR * const backup); | ||
303 : | |||
304 : | static int | ||
305 : | CountMBBitsIntra(const SearchData * const Data); | ||
306 : | |||
307 : | int CodeCoeffIntra_CalcBits(const int16_t qcoeff[64], const uint16_t * zigzag); | ||
308 : | int CodeCoeffInter_CalcBits(const int16_t qcoeff[64], const uint16_t * zigzag); | ||
309 : | edgomez | 1023 | |
310 : | #define LAMBDA ( (int)(1.0*BITS_MULT) ) | ||
311 : | |||
312 : | edgomez | 1022 | static __inline unsigned int |
313 : | edgomez | 1023 | Block_CalcBits( int16_t * const coeff, |
314 : | int16_t * const data, | ||
315 : | const uint32_t quant, const int quant_type, | ||
316 : | uint32_t * cbp, | ||
317 : | const int block) | ||
318 : | edgomez | 1022 | { |
319 : | int sum; | ||
320 : | edgomez | 1023 | int bits; |
321 : | const int lambda = LAMBDA*quant*quant; | ||
322 : | int distortion = 0; | ||
323 : | int i; | ||
324 : | edgomez | 851 | |
325 : | edgomez | 1022 | fdct(data); |
326 : | |||
327 : | if (quant_type == 0) sum = quant_inter(coeff, data, quant); | ||
328 : | else sum = quant4_inter(coeff, data, quant); | ||
329 : | |||
330 : | if (sum > 0) { | ||
331 : | *cbp |= 1 << (5 - block); | ||
332 : | edgomez | 1023 | bits = BITS_MULT * CodeCoeffInter_CalcBits(coeff, scan_tables[0]); |
333 : | } else bits = 0; | ||
334 : | |||
335 : | if (quant_type == 0) dequant_inter(coeff, coeff, quant); | ||
336 : | else dequant4_inter(coeff, coeff, quant); | ||
337 : | |||
338 : | for (i = 0; i < 64; i++) { | ||
339 : | distortion += (data[i] - coeff[i])*(data[i] - coeff[i]); | ||
340 : | } | ||
341 : | bits += (BITS_MULT*BITS_MULT*distortion)/lambda; | ||
342 : | |||
343 : | |||
344 : | return bits; | ||
345 : | edgomez | 1022 | } |
346 : | |||
347 : | edgomez | 1023 | static __inline unsigned int |
348 : | Block_CalcBitsIntra(int16_t * const coeff, | ||
349 : | int16_t * const data, | ||
350 : | const uint32_t quant, const int quant_type, | ||
351 : | uint32_t * cbp, | ||
352 : | const int block, | ||
353 : | int * dcpred) | ||
354 : | { | ||
355 : | int bits, i; | ||
356 : | const int lambda = LAMBDA*quant*quant; | ||
357 : | int distortion = 0; | ||
358 : | uint32_t iDcScaler = get_dc_scaler(quant, block > 3); | ||
359 : | int b_dc; | ||
360 : | |||
361 : | fdct(data); | ||
362 : | data[0] -= 1024; | ||
363 : | |||
364 : | if (quant_type == 0) quant_intra(coeff, data, quant, iDcScaler); | ||
365 : | else quant4_intra(coeff, data, quant, iDcScaler); | ||
366 : | |||
367 : | b_dc = coeff[0]; | ||
368 : | if (block < 4) { | ||
369 : | coeff[0] -= *dcpred; | ||
370 : | *dcpred = b_dc; | ||
371 : | } | ||
372 : | |||
373 : | *cbp |= 1 << (5 - block); | ||
374 : | bits = BITS_MULT*CodeCoeffIntra_CalcBits(coeff, scan_tables[0]); | ||
375 : | bits += BITS_MULT*dcy_tab[coeff[0] + 255].len; | ||
376 : | if (bits != 0) *cbp |= 1 << (5 - block); | ||
377 : | |||
378 : | coeff[0] = b_dc; | ||
379 : | if (quant_type == 0) dequant_intra(coeff, coeff, quant, iDcScaler); | ||
380 : | else dequant4_intra(coeff, coeff, quant, iDcScaler); | ||
381 : | |||
382 : | for (i = 0; i < 64; i++) { | ||
383 : | distortion += (data[i] - coeff[i])*(data[i] - coeff[i]); | ||
384 : | } | ||
385 : | |||
386 : | bits += (BITS_MULT*BITS_MULT*distortion)/lambda; | ||
387 : | |||
388 : | return bits; | ||
389 : | } | ||
390 : | |||
391 : | edgomez | 851 | #endif /* _MOTION_EST_H_ */ |
No admin address has been configured | ViewVC Help |
Powered by ViewVC 1.0.4 |