Parent Directory
|
Revision Log
Revision 1959 - (view) (download)
1 : | edgomez | 194 | /***************************************************************************** |
2 : | edgomez | 145 | * |
3 : | * XVID MPEG-4 VIDEO CODEC | ||
4 : | edgomez | 1382 | * - Encoder main module - |
5 : | edgomez | 145 | * |
6 : | Isibaar | 1883 | * Copyright(C) 2002-2010 Michael Militzer <isibaar@xvid.org> |
7 : | * 2002-2003 Peter Ross <pross@xvid.org> | ||
8 : | * 2002 Daniel Smith <danielsmith@astroboymail.com> | ||
9 : | edgomez | 402 | * |
10 : | edgomez | 1382 | * This program is free software ; you can redistribute it and/or modify |
11 : | edgomez | 851 | * it under the terms of the GNU General Public License as published by |
12 : | edgomez | 1382 | * the Free Software Foundation ; either version 2 of the License, or |
13 : | edgomez | 145 | * (at your option) any later version. |
14 : | * | ||
15 : | * This program is distributed in the hope that it will be useful, | ||
16 : | edgomez | 1382 | * but WITHOUT ANY WARRANTY ; without even the implied warranty of |
17 : | edgomez | 145 | * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the |
18 : | * GNU General Public License for more details. | ||
19 : | * | ||
20 : | * You should have received a copy of the GNU General Public License | ||
21 : | edgomez | 1382 | * along with this program ; if not, write to the Free Software |
22 : | edgomez | 145 | * Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA 02111-1307 USA |
23 : | * | ||
24 : | Isibaar | 1959 | * $Id: encoder.c,v 1.140 2011-03-08 19:16:26 Isibaar Exp $ |
25 : | edgomez | 405 | * |
26 : | edgomez | 194 | ****************************************************************************/ |
27 : | suxen_drol | 118 | |
28 : | Isibaar | 3 | #include <stdlib.h> |
29 : | #include <stdio.h> | ||
30 : | #include <math.h> | ||
31 : | edgomez | 198 | #include <string.h> |
32 : | Isibaar | 3 | |
33 : | #include "encoder.h" | ||
34 : | #include "prediction/mbprediction.h" | ||
35 : | #include "global.h" | ||
36 : | #include "utils/timer.h" | ||
37 : | #include "image/image.h" | ||
38 : | edgomez | 851 | #include "image/font.h" |
39 : | #include "motion/sad.h" | ||
40 : | suxen_drol | 152 | #include "motion/motion.h" |
41 : | edgomez | 1382 | #include "motion/gmc.h" |
42 : | |||
43 : | Isibaar | 3 | #include "bitstream/cbp.h" |
44 : | #include "utils/mbfunctions.h" | ||
45 : | #include "bitstream/bitstream.h" | ||
46 : | #include "bitstream/mbcoding.h" | ||
47 : | #include "utils/emms.h" | ||
48 : | #include "bitstream/mbcoding.h" | ||
49 : | Isibaar | 4 | #include "quant/quant_matrix.h" |
50 : | Isibaar | 41 | #include "utils/mem_align.h" |
51 : | Isibaar | 3 | |
52 : | syskin | 1682 | # include "motion/motion_smp.h" |
53 : | |||
54 : | |||
55 : | edgomez | 194 | /***************************************************************************** |
56 : | * Local function prototypes | ||
57 : | ****************************************************************************/ | ||
58 : | |||
59 : | edgomez | 192 | static int FrameCodeI(Encoder * pEnc, |
60 : | edgomez | 1382 | Bitstream * bs); |
61 : | Isibaar | 3 | |
62 : | edgomez | 192 | static int FrameCodeP(Encoder * pEnc, |
63 : | syskin | 1403 | Bitstream * bs); |
64 : | Isibaar | 3 | |
65 : | edgomez | 851 | static void FrameCodeB(Encoder * pEnc, |
66 : | FRAMEINFO * frame, | ||
67 : | edgomez | 1382 | Bitstream * bs); |
68 : | edgomez | 851 | |
69 : | edgomez | 194 | |
70 : | /***************************************************************************** | ||
71 : | * Encoder creation | ||
72 : | * | ||
73 : | * This function creates an Encoder instance, it allocates all necessary | ||
74 : | edgomez | 851 | * image buffers (reference, current and bframes) and initializes the internal |
75 : | * xvid encoder parameters according to the xvid_enc_create_t input parameter. | ||
76 : | edgomez | 194 | * |
77 : | * The code seems to be very long but is very basic, mainly memory allocation | ||
78 : | * and cleaning code. | ||
79 : | * | ||
80 : | * Returned values : | ||
81 : | edgomez | 1382 | * - 0 - no errors |
82 : | syskin | 903 | * - XVID_ERR_MEMORY - the libc could not allocate memory, the function |
83 : | * cleans the structure before exiting. | ||
84 : | * create->handle is also set to NULL. | ||
85 : | edgomez | 194 | * |
86 : | ****************************************************************************/ | ||
87 : | |||
88 : | edgomez | 1382 | /* |
89 : | * Simplify the "fincr/fbase" fraction | ||
90 : | */ | ||
/*
 * Greatest common divisor of a and b, computed with Euclid's algorithm.
 *
 * The result is meant to be used as a divisor, so it is never 0:
 *  - if exactly one operand is 0, the other operand is returned;
 *  - if both operands are 0, 1 is returned.
 *
 * For non-zero operands the result is the last non-zero remainder of the
 * Euclidean sequence (its sign follows C's '%' semantics for negative
 * operands).
 */
static int
gcd(int a, int b)
{
	int r;

	/* order the operands so that a >= b */
	if (b > a) {
		r = a;
		a = b;
		b = r;
	}

	/*
	 * 'a % 0' is undefined behaviour (a crash on most targets). After the
	 * swap, b == 0 implies a >= 0, so 'a' itself is the common divisor
	 * unless it is 0 too.
	 */
	if (b == 0)
		return (a != 0) ? a : 1;

	while ((r = a % b)) {
		a = b;
		b = r;
	}
	return b;
}
108 : | |||
/*
 * Reduce the "inc/base" fraction in place.
 *
 * 1. Both terms are divided by their greatest common divisor.
 * 2. If either term is still larger than 65535, both terms are scaled down
 *    by the same factor so that the larger one lands at (about) 65535.
 *
 * A term that is 0 on entry stays 0. A positive term is never rounded down
 * to 0 by step 2: it is clamped to 1 instead, so that a valid non-zero
 * increment/base cannot silently turn into a zero divisor for the caller.
 */
static void
simplify_time(int *inc, int *base)
{
	/* common factor -- gcd() must not be handed a zero operand */
	if (*inc != 0 && *base != 0) {
		const int s = gcd(*inc, *base);
		*inc  /= s;
		*base /= s;
	}

	if (*base > 65535 || *inc > 65535) {
		int *biggest;
		int *other;
		int other_was_positive;
		float div;

		if (*base > *inc) {
			biggest = base;
			other = inc;
		} else {
			biggest = inc;
			other = base;
		}

		other_was_positive = (*other > 0);

		/* scale factor that brings the larger term down to 65535 */
		div = ((float)*biggest)/((float)65535);
		*biggest = (unsigned int)(((float)*biggest)/div);
		*other = (unsigned int)(((float)*other)/div);

		/* truncation must not turn a positive term into 0 */
		if (other_was_positive && *other == 0)
			*other = 1;
	}
}
135 : | Isibaar | 3 | |
136 : | edgomez | 192 | |
137 : | edgomez | 1382 | int |
138 : | enc_create(xvid_enc_create_t * create) | ||
139 : | { | ||
140 : | Encoder *pEnc; | ||
141 : | syskin | 1682 | int n; |
142 : | Isibaar | 3 | |
143 : | edgomez | 1382 | if (XVID_VERSION_MAJOR(create->version) != 1) /* v1.x.x */ |
144 : | return XVID_ERR_VERSION; | ||
145 : | Isibaar | 3 | |
146 : | edgomez | 1382 | if (create->width%2 || create->height%2) |
147 : | return XVID_ERR_FAIL; | ||
148 : | h | 121 | |
149 : | syskin | 1391 | if (create->width<=0 || create->height<=0) |
150 : | return XVID_ERR_FAIL; | ||
151 : | |||
152 : | edgomez | 1382 | /* allocate encoder struct */ |
153 : | h | 121 | |
154 : | edgomez | 192 | pEnc = (Encoder *) xvid_malloc(sizeof(Encoder), CACHE_LINE); |
155 : | if (pEnc == NULL) | ||
156 : | Isibaar | 3 | return XVID_ERR_MEMORY; |
157 : | edgomez | 198 | memset(pEnc, 0, sizeof(Encoder)); |
158 : | |||
159 : | edgomez | 1382 | pEnc->mbParam.profile = create->profile; |
160 : | Isibaar | 3 | |
161 : | edgomez | 1382 | /* global flags */ |
162 : | pEnc->mbParam.global_flags = create->global; | ||
163 : | suxen_drol | 1607 | if ((pEnc->mbParam.global_flags & XVID_GLOBAL_PACKED)) |
164 : | pEnc->mbParam.global_flags |= XVID_GLOBAL_DIVX5_USERDATA; | ||
165 : | Isibaar | 3 | |
166 : | edgomez | 1382 | /* width, height */ |
167 : | pEnc->mbParam.width = create->width; | ||
168 : | pEnc->mbParam.height = create->height; | ||
169 : | Isibaar | 3 | pEnc->mbParam.mb_width = (pEnc->mbParam.width + 15) / 16; |
170 : | pEnc->mbParam.mb_height = (pEnc->mbParam.height + 15) / 16; | ||
171 : | edgomez | 195 | pEnc->mbParam.edged_width = 16 * pEnc->mbParam.mb_width + 2 * EDGE_SIZE; |
172 : | pEnc->mbParam.edged_height = 16 * pEnc->mbParam.mb_height + 2 * EDGE_SIZE; | ||
173 : | Isibaar | 3 | |
174 : | edgomez | 1382 | /* framerate */ |
175 : | pEnc->mbParam.fincr = MAX(create->fincr, 0); | ||
176 : | pEnc->mbParam.fbase = create->fincr <= 0 ? 25 : create->fbase; | ||
177 : | if (pEnc->mbParam.fincr>0) | ||
178 : | Skal | 1617 | simplify_time((int*)&pEnc->mbParam.fincr, (int*)&pEnc->mbParam.fbase); |
179 : | Isibaar | 1627 | |
180 : | edgomez | 1382 | /* zones */ |
181 : | if(create->num_zones > 0) { | ||
182 : | pEnc->num_zones = create->num_zones; | ||
183 : | pEnc->zones = xvid_malloc(sizeof(xvid_enc_zone_t) * pEnc->num_zones, CACHE_LINE); | ||
184 : | if (pEnc->zones == NULL) | ||
185 : | goto xvid_err_memory0; | ||
186 : | memcpy(pEnc->zones, create->zones, sizeof(xvid_enc_zone_t) * pEnc->num_zones); | ||
187 : | } else { | ||
188 : | pEnc->num_zones = 0; | ||
189 : | pEnc->zones = NULL; | ||
190 : | } | ||
191 : | Isibaar | 208 | |
192 : | edgomez | 1382 | /* plugins */ |
193 : | if(create->num_plugins > 0) { | ||
194 : | pEnc->num_plugins = create->num_plugins; | ||
195 : | pEnc->plugins = xvid_malloc(sizeof(xvid_enc_plugin_t) * pEnc->num_plugins, CACHE_LINE); | ||
196 : | if (pEnc->plugins == NULL) | ||
197 : | goto xvid_err_memory0; | ||
198 : | } else { | ||
199 : | pEnc->num_plugins = 0; | ||
200 : | pEnc->plugins = NULL; | ||
201 : | } | ||
202 : | Isibaar | 3 | |
203 : | edgomez | 1382 | for (n=0; n<pEnc->num_plugins;n++) { |
204 : | xvid_plg_create_t pcreate; | ||
205 : | xvid_plg_info_t pinfo; | ||
206 : | Isibaar | 3 | |
207 : | edgomez | 1382 | memset(&pinfo, 0, sizeof(xvid_plg_info_t)); |
208 : | pinfo.version = XVID_VERSION; | ||
209 : | suxen_drol | 1653 | if (create->plugins[n].func(NULL, XVID_PLG_INFO, &pinfo, NULL) >= 0) { |
210 : | edgomez | 1382 | pEnc->mbParam.plugin_flags |= pinfo.flags; |
211 : | } | ||
212 : | Isibaar | 3 | |
213 : | edgomez | 1382 | memset(&pcreate, 0, sizeof(xvid_plg_create_t)); |
214 : | pcreate.version = XVID_VERSION; | ||
215 : | pcreate.num_zones = pEnc->num_zones; | ||
216 : | pcreate.zones = pEnc->zones; | ||
217 : | pcreate.width = pEnc->mbParam.width; | ||
218 : | pcreate.height = pEnc->mbParam.height; | ||
219 : | pcreate.mb_width = pEnc->mbParam.mb_width; | ||
220 : | pcreate.mb_height = pEnc->mbParam.mb_height; | ||
221 : | pcreate.fincr = pEnc->mbParam.fincr; | ||
222 : | pcreate.fbase = pEnc->mbParam.fbase; | ||
223 : | pcreate.param = create->plugins[n].param; | ||
224 : | Isibaar | 3 | |
225 : | edgomez | 1382 | pEnc->plugins[n].func = NULL; /* disable plugins that fail */ |
226 : | suxen_drol | 1653 | if (create->plugins[n].func(NULL, XVID_PLG_CREATE, &pcreate, &pEnc->plugins[n].param) >= 0) { |
227 : | edgomez | 1382 | pEnc->plugins[n].func = create->plugins[n].func; |
228 : | } | ||
229 : | } | ||
230 : | Isibaar | 3 | |
231 : | edgomez | 1382 | if ((pEnc->mbParam.global_flags & XVID_GLOBAL_EXTRASTATS_ENABLE) || |
232 : | (pEnc->mbParam.plugin_flags & XVID_REQPSNR)) { | ||
233 : | pEnc->mbParam.plugin_flags |= XVID_REQORIGINAL; /* psnr calculation requires the original */ | ||
234 : | } | ||
235 : | |||
236 : | /* temp dquants */ | ||
237 : | if ((pEnc->mbParam.plugin_flags & XVID_REQDQUANTS)) { | ||
238 : | pEnc->temp_dquants = (int *) xvid_malloc(pEnc->mbParam.mb_width * | ||
239 : | pEnc->mbParam.mb_height * sizeof(int), CACHE_LINE); | ||
240 : | if (pEnc->temp_dquants==NULL) | ||
241 : | goto xvid_err_memory1a; | ||
242 : | } | ||
243 : | |||
244 : | syskin | 1660 | /* temp lambdas */ |
245 : | if (pEnc->mbParam.plugin_flags & XVID_REQLAMBDA) { | ||
246 : | pEnc->temp_lambda = (float *) xvid_malloc(pEnc->mbParam.mb_width * | ||
247 : | pEnc->mbParam.mb_height * 6 * sizeof(float), CACHE_LINE); | ||
248 : | if (pEnc->temp_lambda == NULL) | ||
249 : | goto xvid_err_memory1a; | ||
250 : | } | ||
251 : | |||
252 : | edgomez | 1382 | /* bframes */ |
253 : | pEnc->mbParam.max_bframes = MAX(create->max_bframes, 0); | ||
254 : | pEnc->mbParam.bquant_ratio = MAX(create->bquant_ratio, 0); | ||
255 : | pEnc->mbParam.bquant_offset = create->bquant_offset; | ||
256 : | |||
257 : | /* min/max quant */ | ||
258 : | for (n=0; n<3; n++) { | ||
259 : | pEnc->mbParam.min_quant[n] = create->min_quant[n] > 0 ? create->min_quant[n] : 2; | ||
260 : | pEnc->mbParam.max_quant[n] = create->max_quant[n] > 0 ? create->max_quant[n] : 31; | ||
261 : | } | ||
262 : | |||
263 : | /* frame drop ratio */ | ||
264 : | pEnc->mbParam.frame_drop_ratio = MAX(create->frame_drop_ratio, 0); | ||
265 : | |||
266 : | /* max keyframe interval */ | ||
267 : | pEnc->mbParam.iMaxKeyInterval = create->max_key_interval <= 0 ? (10 * (int)pEnc->mbParam.fbase) / (int)pEnc->mbParam.fincr : create->max_key_interval; | ||
268 : | |||
269 : | /* allocate working frame-image memory */ | ||
270 : | |||
271 : | edgomez | 192 | pEnc->current = xvid_malloc(sizeof(FRAMEINFO), CACHE_LINE); |
272 : | pEnc->reference = xvid_malloc(sizeof(FRAMEINFO), CACHE_LINE); | ||
273 : | Isibaar | 3 | |
274 : | edgomez | 195 | if (pEnc->current == NULL || pEnc->reference == NULL) |
275 : | edgomez | 192 | goto xvid_err_memory1; |
276 : | |||
277 : | edgomez | 1382 | /* allocate macroblock memory */ |
278 : | Isibaar | 3 | |
279 : | edgomez | 195 | pEnc->current->mbs = |
280 : | xvid_malloc(sizeof(MACROBLOCK) * pEnc->mbParam.mb_width * | ||
281 : | pEnc->mbParam.mb_height, CACHE_LINE); | ||
282 : | pEnc->reference->mbs = | ||
283 : | xvid_malloc(sizeof(MACROBLOCK) * pEnc->mbParam.mb_width * | ||
284 : | pEnc->mbParam.mb_height, CACHE_LINE); | ||
285 : | suxen_drol | 136 | |
286 : | edgomez | 192 | if (pEnc->current->mbs == NULL || pEnc->reference->mbs == NULL) |
287 : | goto xvid_err_memory2; | ||
288 : | suxen_drol | 136 | |
289 : | edgomez | 1382 | /* allocate quant matrix memory */ |
290 : | suxen_drol | 136 | |
291 : | edgomez | 1382 | pEnc->mbParam.mpeg_quant_matrices = |
292 : | xvid_malloc(sizeof(uint16_t) * 64 * 8, CACHE_LINE); | ||
293 : | |||
294 : | if (pEnc->mbParam.mpeg_quant_matrices == NULL) | ||
295 : | goto xvid_err_memory2a; | ||
296 : | |||
297 : | /* allocate interpolation image memory */ | ||
298 : | |||
299 : | if ((pEnc->mbParam.plugin_flags & XVID_REQORIGINAL)) { | ||
300 : | edgomez | 851 | image_null(&pEnc->sOriginal); |
301 : | edgomez | 1382 | image_null(&pEnc->sOriginal2); |
302 : | } | ||
303 : | edgomez | 851 | |
304 : | image_null(&pEnc->f_refh); | ||
305 : | image_null(&pEnc->f_refv); | ||
306 : | image_null(&pEnc->f_refhv); | ||
307 : | |||
308 : | suxen_drol | 136 | image_null(&pEnc->current->image); |
309 : | image_null(&pEnc->reference->image); | ||
310 : | image_null(&pEnc->vInterH); | ||
311 : | image_null(&pEnc->vInterV); | ||
312 : | image_null(&pEnc->vInterHV); | ||
313 : | edgomez | 192 | |
314 : | edgomez | 1382 | if ((pEnc->mbParam.plugin_flags & XVID_REQORIGINAL)) { |
315 : | if (image_create | ||
316 : | edgomez | 851 | (&pEnc->sOriginal, pEnc->mbParam.edged_width, |
317 : | pEnc->mbParam.edged_height) < 0) | ||
318 : | goto xvid_err_memory3; | ||
319 : | edgomez | 1382 | |
320 : | if (image_create | ||
321 : | (&pEnc->sOriginal2, pEnc->mbParam.edged_width, | ||
322 : | pEnc->mbParam.edged_height) < 0) | ||
323 : | goto xvid_err_memory3; | ||
324 : | edgomez | 851 | } |
325 : | |||
326 : | edgomez | 195 | if (image_create |
327 : | edgomez | 851 | (&pEnc->f_refh, pEnc->mbParam.edged_width, |
328 : | edgomez | 195 | pEnc->mbParam.edged_height) < 0) |
329 : | edgomez | 192 | goto xvid_err_memory3; |
330 : | edgomez | 195 | if (image_create |
331 : | edgomez | 851 | (&pEnc->f_refv, pEnc->mbParam.edged_width, |
332 : | pEnc->mbParam.edged_height) < 0) | ||
333 : | goto xvid_err_memory3; | ||
334 : | if (image_create | ||
335 : | (&pEnc->f_refhv, pEnc->mbParam.edged_width, | ||
336 : | pEnc->mbParam.edged_height) < 0) | ||
337 : | goto xvid_err_memory3; | ||
338 : | |||
339 : | if (image_create | ||
340 : | edgomez | 195 | (&pEnc->current->image, pEnc->mbParam.edged_width, |
341 : | pEnc->mbParam.edged_height) < 0) | ||
342 : | edgomez | 192 | goto xvid_err_memory3; |
343 : | edgomez | 195 | if (image_create |
344 : | (&pEnc->reference->image, pEnc->mbParam.edged_width, | ||
345 : | pEnc->mbParam.edged_height) < 0) | ||
346 : | edgomez | 192 | goto xvid_err_memory3; |
347 : | edgomez | 195 | if (image_create |
348 : | (&pEnc->vInterH, pEnc->mbParam.edged_width, | ||
349 : | pEnc->mbParam.edged_height) < 0) | ||
350 : | edgomez | 192 | goto xvid_err_memory3; |
351 : | edgomez | 195 | if (image_create |
352 : | (&pEnc->vInterV, pEnc->mbParam.edged_width, | ||
353 : | pEnc->mbParam.edged_height) < 0) | ||
354 : | edgomez | 192 | goto xvid_err_memory3; |
355 : | edgomez | 195 | if (image_create |
356 : | (&pEnc->vInterHV, pEnc->mbParam.edged_width, | ||
357 : | pEnc->mbParam.edged_height) < 0) | ||
358 : | edgomez | 192 | goto xvid_err_memory3; |
359 : | suxen_drol | 136 | |
360 : | edgomez | 851 | /* Create full bitplane for GMC, this might be wasteful */ |
361 : | if (image_create | ||
362 : | (&pEnc->vGMC, pEnc->mbParam.edged_width, | ||
363 : | pEnc->mbParam.edged_height) < 0) | ||
364 : | goto xvid_err_memory3; | ||
365 : | |||
366 : | edgomez | 1382 | /* init bframe image buffers */ |
367 : | edgomez | 851 | |
368 : | edgomez | 1382 | pEnc->bframenum_head = 0; |
369 : | pEnc->bframenum_tail = 0; | ||
370 : | pEnc->flush_bframes = 0; | ||
371 : | pEnc->closed_bframenum = -1; | ||
372 : | edgomez | 851 | |
373 : | /* B Frames specific init */ | ||
374 : | pEnc->bframes = NULL; | ||
375 : | |||
376 : | if (pEnc->mbParam.max_bframes > 0) { | ||
377 : | |||
378 : | pEnc->bframes = | ||
379 : | xvid_malloc(pEnc->mbParam.max_bframes * sizeof(FRAMEINFO *), | ||
380 : | CACHE_LINE); | ||
381 : | |||
382 : | if (pEnc->bframes == NULL) | ||
383 : | goto xvid_err_memory3; | ||
384 : | |||
385 : | for (n = 0; n < pEnc->mbParam.max_bframes; n++) | ||
386 : | pEnc->bframes[n] = NULL; | ||
387 : | |||
388 : | |||
389 : | for (n = 0; n < pEnc->mbParam.max_bframes; n++) { | ||
390 : | pEnc->bframes[n] = xvid_malloc(sizeof(FRAMEINFO), CACHE_LINE); | ||
391 : | |||
392 : | if (pEnc->bframes[n] == NULL) | ||
393 : | goto xvid_err_memory4; | ||
394 : | |||
395 : | pEnc->bframes[n]->mbs = | ||
396 : | xvid_malloc(sizeof(MACROBLOCK) * pEnc->mbParam.mb_width * | ||
397 : | pEnc->mbParam.mb_height, CACHE_LINE); | ||
398 : | |||
399 : | if (pEnc->bframes[n]->mbs == NULL) | ||
400 : | goto xvid_err_memory4; | ||
401 : | |||
402 : | image_null(&pEnc->bframes[n]->image); | ||
403 : | |||
404 : | if (image_create | ||
405 : | (&pEnc->bframes[n]->image, pEnc->mbParam.edged_width, | ||
406 : | pEnc->mbParam.edged_height) < 0) | ||
407 : | goto xvid_err_memory4; | ||
408 : | |||
409 : | } | ||
410 : | } | ||
411 : | |||
412 : | edgomez | 1382 | /* init incoming frame queue */ |
413 : | pEnc->queue_head = 0; | ||
414 : | pEnc->queue_tail = 0; | ||
415 : | pEnc->queue_size = 0; | ||
416 : | edgomez | 851 | |
417 : | edgomez | 1382 | pEnc->queue = |
418 : | xvid_malloc((pEnc->mbParam.max_bframes+1) * sizeof(QUEUEINFO), | ||
419 : | CACHE_LINE); | ||
420 : | edgomez | 851 | |
421 : | edgomez | 1382 | if (pEnc->queue == NULL) |
422 : | goto xvid_err_memory4; | ||
423 : | edgomez | 851 | |
424 : | edgomez | 1382 | for (n = 0; n < pEnc->mbParam.max_bframes+1; n++) |
425 : | image_null(&pEnc->queue[n].image); | ||
426 : | edgomez | 851 | |
427 : | |||
428 : | edgomez | 1382 | for (n = 0; n < pEnc->mbParam.max_bframes+1; n++) { |
429 : | if (image_create | ||
430 : | (&pEnc->queue[n].image, pEnc->mbParam.edged_width, | ||
431 : | pEnc->mbParam.edged_height) < 0) | ||
432 : | goto xvid_err_memory5; | ||
433 : | edgomez | 851 | } |
434 : | |||
435 : | edgomez | 1382 | /* timestamp stuff */ |
436 : | edgomez | 851 | |
437 : | pEnc->mbParam.m_stamp = 0; | ||
438 : | Isibaar | 1883 | pEnc->m_framenum = create->start_frame_num; |
439 : | edgomez | 851 | pEnc->current->stamp = 0; |
440 : | pEnc->reference->stamp = 0; | ||
441 : | |||
442 : | edgomez | 1382 | /* other stuff */ |
443 : | Isibaar | 3 | |
444 : | edgomez | 1382 | pEnc->iFrameNum = 0; |
445 : | pEnc->fMvPrevSigma = -1; | ||
446 : | Isibaar | 3 | |
447 : | Isibaar | 1913 | /* slices */ |
448 : | pEnc->num_slices = MIN(MAX(1, create->num_slices), (int) pEnc->mbParam.mb_height); | ||
449 : | |||
450 : | syskin | 1682 | /* multithreaded stuff */ |
451 : | if (create->num_threads > 0) { | ||
452 : | Isibaar | 1913 | int t = MIN(create->num_threads, (int) (pEnc->mbParam.mb_height>>1)); /* at least two rows per thread */ |
453 : | int threads_per_slice = MAX(1, (t / pEnc->num_slices)); | ||
454 : | int rows_per_thread = (pEnc->mbParam.mb_height + threads_per_slice - 1) / threads_per_slice; | ||
455 : | |||
456 : | syskin | 1682 | pEnc->num_threads = t; |
457 : | Isibaar | 1913 | pEnc->smpData = xvid_malloc(t*sizeof(SMPData), CACHE_LINE); |
458 : | if (!pEnc->smpData) | ||
459 : | syskin | 1682 | goto xvid_err_nosmp; |
460 : | Isibaar | 1913 | |
461 : | /* tmp bitstream buffer for slice coding */ | ||
462 : | pEnc->smpData[0].tmp_buffer = xvid_malloc(16*pEnc->mbParam.edged_width*pEnc->mbParam.mb_height*sizeof(uint8_t), CACHE_LINE); | ||
463 : | if (! pEnc->smpData[0].tmp_buffer) goto xvid_err_nosmp; | ||
464 : | |||
465 : | syskin | 1682 | for (n = 0; n < t; n++) { |
466 : | Isibaar | 1913 | int s = MIN(pEnc->num_threads, pEnc->num_slices); |
467 : | |||
468 : | pEnc->smpData[n].complete_count_self = | ||
469 : | syskin | 1682 | xvid_malloc(rows_per_thread * sizeof(int), CACHE_LINE); |
470 : | |||
471 : | Isibaar | 1913 | if (!pEnc->smpData[n].complete_count_self) |
472 : | syskin | 1682 | goto xvid_err_nosmp; |
473 : | Isibaar | 1913 | |
474 : | if (n > 0 && n < s) { | ||
475 : | pEnc->smpData[n].bs = (Bitstream *) xvid_malloc(sizeof(Bitstream), CACHE_LINE); | ||
476 : | if (!pEnc->smpData[n].bs) | ||
477 : | goto xvid_err_nosmp; | ||
478 : | |||
479 : | pEnc->smpData[n].sStat = (Statistics *) xvid_malloc(sizeof(Statistics), CACHE_LINE); | ||
480 : | if (!pEnc->smpData[n].sStat) | ||
481 : | goto xvid_err_nosmp; | ||
482 : | |||
483 : | pEnc->smpData[n].tmp_buffer = pEnc->smpData[0].tmp_buffer + 16*(((n-1)*pEnc->mbParam.edged_width*pEnc->mbParam.mb_height)/s); | ||
484 : | BitstreamInit(pEnc->smpData[n].bs, pEnc->smpData[n].tmp_buffer, 0); | ||
485 : | } | ||
486 : | |||
487 : | syskin | 1682 | if (n != 0) |
488 : | Isibaar | 1913 | pEnc->smpData[n].complete_count_above = |
489 : | pEnc->smpData[n-1].complete_count_self; | ||
490 : | syskin | 1682 | } |
491 : | Isibaar | 1913 | pEnc->smpData[0].complete_count_above = |
492 : | pEnc->smpData[t-1].complete_count_self - 1; | ||
493 : | syskin | 1682 | |
494 : | } else { | ||
495 : | xvid_err_nosmp: | ||
496 : | /* no SMP */ | ||
497 : | Isibaar | 1913 | if (pEnc->smpData) { |
498 : | if (pEnc->smpData[0].tmp_buffer) | ||
499 : | xvid_free(pEnc->smpData[0].tmp_buffer); | ||
500 : | } | ||
501 : | else { | ||
502 : | pEnc->smpData = xvid_malloc(1*sizeof(SMPData), CACHE_LINE); | ||
503 : | if (pEnc->smpData == NULL) | ||
504 : | goto xvid_err_memory5; | ||
505 : | } | ||
506 : | |||
507 : | syskin | 1682 | create->num_threads = 0; |
508 : | } | ||
509 : | |||
510 : | edgomez | 1382 | create->handle = (void *) pEnc; |
511 : | |||
512 : | Isibaar | 36 | init_timer(); |
513 : | edgomez | 1382 | init_mpeg_matrix(pEnc->mbParam.mpeg_quant_matrices); |
514 : | Isibaar | 3 | |
515 : | edgomez | 1382 | return 0; /* ok */ |
516 : | edgomez | 192 | |
517 : | /* | ||
518 : | * We handle all XVID_ERR_MEMORY here, this makes the code lighter | ||
519 : | */ | ||
520 : | suxen_drol | 229 | |
521 : | edgomez | 851 | xvid_err_memory5: |
522 : | |||
523 : | edgomez | 1382 | for (n = 0; n < pEnc->mbParam.max_bframes+1; n++) { |
524 : | image_destroy(&pEnc->queue[n].image, pEnc->mbParam.edged_width, | ||
525 : | edgomez | 851 | pEnc->mbParam.edged_height); |
526 : | } | ||
527 : | |||
528 : | edgomez | 1382 | xvid_free(pEnc->queue); |
529 : | |||
530 : | edgomez | 851 | xvid_err_memory4: |
531 : | |||
532 : | if (pEnc->mbParam.max_bframes > 0) { | ||
533 : | edgomez | 1382 | int i; |
534 : | edgomez | 851 | |
535 : | for (i = 0; i < pEnc->mbParam.max_bframes; i++) { | ||
536 : | |||
537 : | if (pEnc->bframes[i] == NULL) | ||
538 : | continue; | ||
539 : | |||
540 : | image_destroy(&pEnc->bframes[i]->image, pEnc->mbParam.edged_width, | ||
541 : | pEnc->mbParam.edged_height); | ||
542 : | xvid_free(pEnc->bframes[i]->mbs); | ||
543 : | xvid_free(pEnc->bframes[i]); | ||
544 : | syskin | 903 | } |
545 : | edgomez | 851 | |
546 : | xvid_free(pEnc->bframes); | ||
547 : | } | ||
548 : | |||
549 : | edgomez | 195 | xvid_err_memory3: |
550 : | edgomez | 851 | |
551 : | edgomez | 1382 | if ((pEnc->mbParam.plugin_flags & XVID_REQORIGINAL)) { |
552 : | image_destroy(&pEnc->sOriginal, pEnc->mbParam.edged_width, | ||
553 : | edgomez | 851 | pEnc->mbParam.edged_height); |
554 : | edgomez | 1382 | image_destroy(&pEnc->sOriginal2, pEnc->mbParam.edged_width, |
555 : | pEnc->mbParam.edged_height); | ||
556 : | edgomez | 851 | } |
557 : | |||
558 : | image_destroy(&pEnc->f_refh, pEnc->mbParam.edged_width, | ||
559 : | edgomez | 195 | pEnc->mbParam.edged_height); |
560 : | edgomez | 851 | image_destroy(&pEnc->f_refv, pEnc->mbParam.edged_width, |
561 : | pEnc->mbParam.edged_height); | ||
562 : | image_destroy(&pEnc->f_refhv, pEnc->mbParam.edged_width, | ||
563 : | pEnc->mbParam.edged_height); | ||
564 : | edgomez | 192 | |
565 : | edgomez | 195 | image_destroy(&pEnc->current->image, pEnc->mbParam.edged_width, |
566 : | pEnc->mbParam.edged_height); | ||
567 : | image_destroy(&pEnc->reference->image, pEnc->mbParam.edged_width, | ||
568 : | pEnc->mbParam.edged_height); | ||
569 : | image_destroy(&pEnc->vInterH, pEnc->mbParam.edged_width, | ||
570 : | pEnc->mbParam.edged_height); | ||
571 : | image_destroy(&pEnc->vInterV, pEnc->mbParam.edged_width, | ||
572 : | pEnc->mbParam.edged_height); | ||
573 : | image_destroy(&pEnc->vInterHV, pEnc->mbParam.edged_width, | ||
574 : | pEnc->mbParam.edged_height); | ||
575 : | edgomez | 192 | |
576 : | edgomez | 851 | /* destroy GMC image */ |
577 : | image_destroy(&pEnc->vGMC, pEnc->mbParam.edged_width, | ||
578 : | pEnc->mbParam.edged_height); | ||
579 : | |||
580 : | edgomez | 1382 | xvid_err_memory2a: |
581 : | xvid_free(pEnc->mbParam.mpeg_quant_matrices); | ||
582 : | edgomez | 851 | |
583 : | edgomez | 195 | xvid_err_memory2: |
584 : | edgomez | 192 | xvid_free(pEnc->current->mbs); |
585 : | xvid_free(pEnc->reference->mbs); | ||
586 : | |||
587 : | edgomez | 195 | xvid_err_memory1: |
588 : | edgomez | 192 | xvid_free(pEnc->current); |
589 : | xvid_free(pEnc->reference); | ||
590 : | edgomez | 1382 | |
591 : | xvid_err_memory1a: | ||
592 : | if ((pEnc->mbParam.plugin_flags & XVID_REQDQUANTS)) { | ||
593 : | xvid_free(pEnc->temp_dquants); | ||
594 : | } | ||
595 : | |||
596 : | syskin | 1660 | if(pEnc->mbParam.plugin_flags & XVID_REQLAMBDA) { |
597 : | xvid_free(pEnc->temp_lambda); | ||
598 : | } | ||
599 : | |||
600 : | edgomez | 1382 | xvid_err_memory0: |
601 : | for (n=0; n<pEnc->num_plugins;n++) { | ||
602 : | if (pEnc->plugins[n].func) { | ||
603 : | suxen_drol | 1653 | pEnc->plugins[n].func(pEnc->plugins[n].param, XVID_PLG_DESTROY, NULL, NULL); |
604 : | edgomez | 1382 | } |
605 : | } | ||
606 : | xvid_free(pEnc->plugins); | ||
607 : | |||
608 : | xvid_free(pEnc->zones); | ||
609 : | |||
610 : | edgomez | 192 | xvid_free(pEnc); |
611 : | |||
612 : | edgomez | 1382 | create->handle = NULL; |
613 : | edgomez | 194 | |
614 : | edgomez | 192 | return XVID_ERR_MEMORY; |
615 : | Isibaar | 3 | } |
616 : | |||
617 : | edgomez | 194 | /***************************************************************************** |
618 : | * Encoder destruction | ||
619 : | * | ||
620 : | * This function destroys the entire encoder structure created by a previous | ||
621 : | edgomez | 1382 | * successful enc_create call. |
622 : | edgomez | 194 | * |
623 : | * Returned values (for now only one returned value) : | ||
624 : | edgomez | 1382 | * - 0 - no errors |
625 : | edgomez | 194 | * |
626 : | ****************************************************************************/ | ||
627 : | |||
628 : | int | ||
629 : | edgomez | 1382 | enc_destroy(Encoder * pEnc) |
630 : | Isibaar | 3 | { |
631 : | edgomez | 851 | int i; |
632 : | syskin | 903 | |
633 : | edgomez | 851 | /* B Frames specific */ |
634 : | edgomez | 1382 | for (i = 0; i < pEnc->mbParam.max_bframes+1; i++) { |
635 : | image_destroy(&pEnc->queue[i].image, pEnc->mbParam.edged_width, | ||
636 : | edgomez | 851 | pEnc->mbParam.edged_height); |
637 : | } | ||
638 : | |||
639 : | edgomez | 1382 | xvid_free(pEnc->queue); |
640 : | |||
641 : | edgomez | 851 | if (pEnc->mbParam.max_bframes > 0) { |
642 : | |||
643 : | for (i = 0; i < pEnc->mbParam.max_bframes; i++) { | ||
644 : | |||
645 : | if (pEnc->bframes[i] == NULL) | ||
646 : | continue; | ||
647 : | |||
648 : | image_destroy(&pEnc->bframes[i]->image, pEnc->mbParam.edged_width, | ||
649 : | pEnc->mbParam.edged_height); | ||
650 : | xvid_free(pEnc->bframes[i]->mbs); | ||
651 : | xvid_free(pEnc->bframes[i]); | ||
652 : | } | ||
653 : | |||
654 : | xvid_free(pEnc->bframes); | ||
655 : | syskin | 903 | |
656 : | edgomez | 851 | } |
657 : | |||
658 : | edgomez | 192 | /* All images, reference, current etc ... */ |
659 : | edgomez | 851 | |
660 : | edgomez | 195 | image_destroy(&pEnc->current->image, pEnc->mbParam.edged_width, |
661 : | pEnc->mbParam.edged_height); | ||
662 : | image_destroy(&pEnc->reference->image, pEnc->mbParam.edged_width, | ||
663 : | pEnc->mbParam.edged_height); | ||
664 : | image_destroy(&pEnc->vInterH, pEnc->mbParam.edged_width, | ||
665 : | pEnc->mbParam.edged_height); | ||
666 : | image_destroy(&pEnc->vInterV, pEnc->mbParam.edged_width, | ||
667 : | pEnc->mbParam.edged_height); | ||
668 : | image_destroy(&pEnc->vInterHV, pEnc->mbParam.edged_width, | ||
669 : | pEnc->mbParam.edged_height); | ||
670 : | edgomez | 851 | image_destroy(&pEnc->f_refh, pEnc->mbParam.edged_width, |
671 : | edgomez | 195 | pEnc->mbParam.edged_height); |
672 : | edgomez | 851 | image_destroy(&pEnc->f_refv, pEnc->mbParam.edged_width, |
673 : | pEnc->mbParam.edged_height); | ||
674 : | image_destroy(&pEnc->f_refhv, pEnc->mbParam.edged_width, | ||
675 : | pEnc->mbParam.edged_height); | ||
676 : | edgomez | 1382 | image_destroy(&pEnc->vGMC, pEnc->mbParam.edged_width, |
677 : | pEnc->mbParam.edged_height); | ||
678 : | edgomez | 192 | |
679 : | edgomez | 1382 | if ((pEnc->mbParam.plugin_flags & XVID_REQORIGINAL)) { |
680 : | image_destroy(&pEnc->sOriginal, pEnc->mbParam.edged_width, | ||
681 : | edgomez | 851 | pEnc->mbParam.edged_height); |
682 : | edgomez | 1382 | image_destroy(&pEnc->sOriginal2, pEnc->mbParam.edged_width, |
683 : | pEnc->mbParam.edged_height); | ||
684 : | edgomez | 851 | } |
685 : | |||
686 : | edgomez | 192 | /* Encoder structure */ |
687 : | edgomez | 851 | |
688 : | suxen_drol | 136 | xvid_free(pEnc->current->mbs); |
689 : | xvid_free(pEnc->current); | ||
690 : | |||
691 : | xvid_free(pEnc->reference->mbs); | ||
692 : | xvid_free(pEnc->reference); | ||
693 : | |||
694 : | edgomez | 1382 | if ((pEnc->mbParam.plugin_flags & XVID_REQDQUANTS)) { |
695 : | xvid_free(pEnc->temp_dquants); | ||
696 : | } | ||
697 : | edgomez | 192 | |
698 : | syskin | 1693 | if ((pEnc->mbParam.plugin_flags & XVID_REQLAMBDA)) { |
699 : | xvid_free(pEnc->temp_lambda); | ||
700 : | } | ||
701 : | Isibaar | 3 | |
702 : | edgomez | 1382 | if (pEnc->num_plugins>0) { |
703 : | xvid_plg_destroy_t pdestroy; | ||
704 : | memset(&pdestroy, 0, sizeof(xvid_plg_destroy_t)); | ||
705 : | suxen_drol | 229 | |
706 : | edgomez | 1382 | pdestroy.version = XVID_VERSION; |
707 : | pdestroy.num_frames = pEnc->m_framenum; | ||
708 : | suxen_drol | 229 | |
709 : | edgomez | 1382 | for (i=0; i<pEnc->num_plugins;i++) { |
710 : | if (pEnc->plugins[i].func) { | ||
711 : | suxen_drol | 1653 | pEnc->plugins[i].func(pEnc->plugins[i].param, XVID_PLG_DESTROY, &pdestroy, NULL); |
712 : | edgomez | 1382 | } |
713 : | } | ||
714 : | xvid_free(pEnc->plugins); | ||
715 : | edgomez | 851 | } |
716 : | |||
717 : | edgomez | 1382 | xvid_free(pEnc->mbParam.mpeg_quant_matrices); |
718 : | edgomez | 851 | |
719 : | syskin | 1682 | if (pEnc->num_zones > 0) |
720 : | edgomez | 1382 | xvid_free(pEnc->zones); |
721 : | edgomez | 851 | |
722 : | syskin | 1682 | if (pEnc->num_threads > 0) { |
723 : | Isibaar | 1913 | for (i = 1; i < MAX(1, MIN(pEnc->num_threads, pEnc->num_slices)); i++) { |
724 : | xvid_free(pEnc->smpData[i].bs); | ||
725 : | xvid_free(pEnc->smpData[i].sStat); | ||
726 : | } | ||
727 : | if (pEnc->smpData[0].tmp_buffer) xvid_free(pEnc->smpData[0].tmp_buffer); | ||
728 : | |||
729 : | syskin | 1682 | for (i = 0; i < pEnc->num_threads; i++) |
730 : | Isibaar | 1913 | xvid_free(pEnc->smpData[i].complete_count_self); |
731 : | syskin | 1682 | } |
732 : | Isibaar | 1913 | xvid_free(pEnc->smpData); |
733 : | syskin | 1682 | |
734 : | edgomez | 1382 | xvid_free(pEnc); |
735 : | edgomez | 851 | |
736 : | edgomez | 1382 | return 0; /* ok */ |
737 : | edgomez | 851 | } |
738 : | |||
739 : | |||
740 : | edgomez | 1382 | /* |
741 : | call the plugins | ||
742 : | */ | ||
743 : | edgomez | 851 | |
744 : | edgomez | 1382 | static void call_plugins(Encoder * pEnc, FRAMEINFO * frame, IMAGE * original, |
745 : | int opt, int * type, int * quant, xvid_enc_stats_t * stats) | ||
746 : | { | ||
747 : | syskin | 1660 | unsigned int i, j, k; |
748 : | edgomez | 1382 | xvid_plg_data_t data; |
749 : | edgomez | 851 | |
750 : | edgomez | 1382 | /* set data struct */ |
751 : | edgomez | 851 | |
752 : | edgomez | 1382 | memset(&data, 0, sizeof(xvid_plg_data_t)); |
753 : | data.version = XVID_VERSION; | ||
754 : | edgomez | 851 | |
755 : | edgomez | 1382 | /* find zone */ |
756 : | for(i=0; i<pEnc->num_zones && pEnc->zones[i].frame<=frame->frame_num; i++) ; | ||
757 : | data.zone = i>0 ? &pEnc->zones[i-1] : NULL; | ||
758 : | edgomez | 851 | |
759 : | edgomez | 1382 | data.width = pEnc->mbParam.width; |
760 : | data.height = pEnc->mbParam.height; | ||
761 : | data.mb_width = pEnc->mbParam.mb_width; | ||
762 : | data.mb_height = pEnc->mbParam.mb_height; | ||
763 : | data.fincr = frame->fincr; | ||
764 : | data.fbase = pEnc->mbParam.fbase; | ||
765 : | data.bquant_ratio = pEnc->mbParam.bquant_ratio; | ||
766 : | data.bquant_offset = pEnc->mbParam.bquant_offset; | ||
767 : | edgomez | 851 | |
768 : | edgomez | 1382 | for (i=0; i<3; i++) { |
769 : | data.min_quant[i] = pEnc->mbParam.min_quant[i]; | ||
770 : | data.max_quant[i] = pEnc->mbParam.max_quant[i]; | ||
771 : | } | ||
772 : | edgomez | 851 | |
773 : | edgomez | 1382 | data.reference.csp = XVID_CSP_PLANAR; |
774 : | data.reference.plane[0] = pEnc->reference->image.y; | ||
775 : | data.reference.plane[1] = pEnc->reference->image.u; | ||
776 : | data.reference.plane[2] = pEnc->reference->image.v; | ||
777 : | data.reference.stride[0] = pEnc->mbParam.edged_width; | ||
778 : | data.reference.stride[1] = pEnc->mbParam.edged_width/2; | ||
779 : | data.reference.stride[2] = pEnc->mbParam.edged_width/2; | ||
780 : | edgomez | 851 | |
781 : | edgomez | 1382 | data.current.csp = XVID_CSP_PLANAR; |
782 : | data.current.plane[0] = frame->image.y; | ||
783 : | data.current.plane[1] = frame->image.u; | ||
784 : | data.current.plane[2] = frame->image.v; | ||
785 : | data.current.stride[0] = pEnc->mbParam.edged_width; | ||
786 : | data.current.stride[1] = pEnc->mbParam.edged_width/2; | ||
787 : | data.current.stride[2] = pEnc->mbParam.edged_width/2; | ||
788 : | edgomez | 851 | |
789 : | edgomez | 1382 | data.frame_num = frame->frame_num; |
790 : | edgomez | 851 | |
791 : | edgomez | 1382 | if (opt == XVID_PLG_BEFORE) { |
792 : | data.type = *type; | ||
793 : | data.quant = *quant; | ||
794 : | edgomez | 851 | |
795 : | edgomez | 1382 | data.vol_flags = frame->vol_flags; |
796 : | data.vop_flags = frame->vop_flags; | ||
797 : | data.motion_flags = frame->motion_flags; | ||
798 : | edgomez | 851 | |
799 : | edgomez | 1382 | } else if (opt == XVID_PLG_FRAME) { |
800 : | data.type = coding2type(frame->coding_type); | ||
801 : | data.quant = frame->quant; | ||
802 : | edgomez | 851 | |
803 : | edgomez | 1382 | if ((pEnc->mbParam.plugin_flags & XVID_REQDQUANTS)) { |
804 : | data.dquant = pEnc->temp_dquants; | ||
805 : | data.dquant_stride = pEnc->mbParam.mb_width; | ||
806 : | syskin | 1680 | memset(data.dquant, 0, data.mb_width*data.mb_height*sizeof(int)); |
807 : | edgomez | 1382 | } |
808 : | syskin | 1660 | |
809 : | if(pEnc->mbParam.plugin_flags & XVID_REQLAMBDA) { | ||
810 : | int block = 0; | ||
811 : | Isibaar | 1766 | emms(); |
812 : | syskin | 1660 | data.lambda = pEnc->temp_lambda; |
813 : | for(i = 0;i < pEnc->mbParam.mb_height; i++) | ||
814 : | for(j = 0;j < pEnc->mbParam.mb_width; j++) | ||
815 : | for (k = 0; k < 6; k++) | ||
816 : | data.lambda[block++] = 1.0f; | ||
817 : | } | ||
818 : | |||
819 : | edgomez | 1382 | } else { /* XVID_PLG_AFTER */ |
820 : | if ((pEnc->mbParam.plugin_flags & XVID_REQORIGINAL)) { | ||
821 : | data.original.csp = XVID_CSP_PLANAR; | ||
822 : | data.original.plane[0] = original->y; | ||
823 : | data.original.plane[1] = original->u; | ||
824 : | data.original.plane[2] = original->v; | ||
825 : | data.original.stride[0] = pEnc->mbParam.edged_width; | ||
826 : | data.original.stride[1] = pEnc->mbParam.edged_width/2; | ||
827 : | data.original.stride[2] = pEnc->mbParam.edged_width/2; | ||
828 : | } | ||
829 : | edgomez | 851 | |
830 : | edgomez | 1382 | if ((frame->vol_flags & XVID_VOL_EXTRASTATS) || |
831 : | (pEnc->mbParam.plugin_flags & XVID_REQPSNR)) { | ||
832 : | edgomez | 851 | |
833 : | edgomez | 1382 | data.sse_y = |
834 : | plane_sse( original->y, frame->image.y, | ||
835 : | pEnc->mbParam.edged_width, pEnc->mbParam.width, | ||
836 : | pEnc->mbParam.height); | ||
837 : | edgomez | 851 | |
838 : | edgomez | 1382 | data.sse_u = |
839 : | plane_sse( original->u, frame->image.u, | ||
840 : | pEnc->mbParam.edged_width/2, pEnc->mbParam.width/2, | ||
841 : | pEnc->mbParam.height/2); | ||
842 : | edgomez | 851 | |
843 : | edgomez | 1382 | data.sse_v = |
844 : | plane_sse( original->v, frame->image.v, | ||
845 : | pEnc->mbParam.edged_width/2, pEnc->mbParam.width/2, | ||
846 : | pEnc->mbParam.height/2); | ||
847 : | } | ||
848 : | edgomez | 851 | |
849 : | edgomez | 1382 | data.type = coding2type(frame->coding_type); |
850 : | data.quant = frame->quant; | ||
851 : | edgomez | 851 | |
852 : | edgomez | 1382 | if ((pEnc->mbParam.plugin_flags & XVID_REQDQUANTS)) { |
853 : | data.dquant = pEnc->temp_dquants; | ||
854 : | data.dquant_stride = pEnc->mbParam.mb_width; | ||
855 : | edgomez | 851 | |
856 : | edgomez | 1382 | for (j=0; j<pEnc->mbParam.mb_height; j++) |
857 : | for (i=0; i<pEnc->mbParam.mb_width; i++) { | ||
858 : | data.dquant[j*data.dquant_stride + i] = frame->mbs[j*pEnc->mbParam.mb_width + i].dquant; | ||
859 : | } | ||
860 : | } | ||
861 : | edgomez | 851 | |
862 : | edgomez | 1382 | data.vol_flags = frame->vol_flags; |
863 : | data.vop_flags = frame->vop_flags; | ||
864 : | data.motion_flags = frame->motion_flags; | ||
865 : | edgomez | 851 | |
866 : | edgomez | 1382 | data.length = frame->length; |
867 : | data.kblks = frame->sStat.kblks; | ||
868 : | data.mblks = frame->sStat.mblks; | ||
869 : | data.ublks = frame->sStat.ublks; | ||
870 : | edgomez | 851 | |
871 : | edgomez | 1382 | /* New code */ |
872 : | data.stats.type = coding2type(frame->coding_type); | ||
873 : | data.stats.quant = frame->quant; | ||
874 : | data.stats.vol_flags = frame->vol_flags; | ||
875 : | data.stats.vop_flags = frame->vop_flags; | ||
876 : | data.stats.length = frame->length; | ||
877 : | data.stats.hlength = frame->length - (frame->sStat.iTextBits / 8); | ||
878 : | data.stats.kblks = frame->sStat.kblks; | ||
879 : | data.stats.mblks = frame->sStat.mblks; | ||
880 : | data.stats.ublks = frame->sStat.ublks; | ||
881 : | data.stats.sse_y = data.sse_y; | ||
882 : | data.stats.sse_u = data.sse_u; | ||
883 : | data.stats.sse_v = data.sse_v; | ||
884 : | edgomez | 851 | |
885 : | edgomez | 1382 | if (stats) |
886 : | *stats = data.stats; | ||
887 : | } | ||
888 : | edgomez | 851 | |
889 : | edgomez | 1382 | /* call plugins */ |
890 : | for (i=0; i<(unsigned int)pEnc->num_plugins;i++) { | ||
891 : | emms(); | ||
892 : | if (pEnc->plugins[i].func) { | ||
893 : | suxen_drol | 1653 | if (pEnc->plugins[i].func(pEnc->plugins[i].param, opt, &data, NULL) < 0) { |
894 : | edgomez | 1382 | continue; |
895 : | edgomez | 851 | } |
896 : | } | ||
897 : | edgomez | 1382 | } |
898 : | emms(); | ||
899 : | edgomez | 851 | |
900 : | edgomez | 1382 | /* copy modified values back into frame*/ |
901 : | if (opt == XVID_PLG_BEFORE) { | ||
902 : | *type = data.type; | ||
903 : | *quant = data.quant > 0 ? data.quant : 2; /* default */ | ||
904 : | |||
905 : | frame->vol_flags = data.vol_flags; | ||
906 : | frame->vop_flags = data.vop_flags; | ||
907 : | frame->motion_flags = data.motion_flags; | ||
908 : | syskin | 903 | |
909 : | edgomez | 1382 | } else if (opt == XVID_PLG_FRAME) { |
910 : | edgomez | 851 | |
911 : | edgomez | 1382 | if ((pEnc->mbParam.plugin_flags & XVID_REQDQUANTS)) { |
912 : | for (j=0; j<pEnc->mbParam.mb_height; j++) | ||
913 : | for (i=0; i<pEnc->mbParam.mb_width; i++) { | ||
914 : | frame->mbs[j*pEnc->mbParam.mb_width + i].dquant = data.dquant[j*data.mb_width + i]; | ||
915 : | } | ||
916 : | } else { | ||
917 : | for (j=0; j<pEnc->mbParam.mb_height; j++) | ||
918 : | for (i=0; i<pEnc->mbParam.mb_width; i++) { | ||
919 : | frame->mbs[j*pEnc->mbParam.mb_width + i].dquant = 0; | ||
920 : | } | ||
921 : | } | ||
922 : | syskin | 1660 | |
923 : | if (pEnc->mbParam.plugin_flags & XVID_REQLAMBDA) { | ||
924 : | for (j = 0; j < pEnc->mbParam.mb_height; j++) | ||
925 : | for (i = 0; i < pEnc->mbParam.mb_width; i++) | ||
926 : | for (k = 0; k < 6; k++) { | ||
927 : | frame->mbs[j*pEnc->mbParam.mb_width + i].lambda[k] = | ||
928 : | (int) ((float)(1<<LAMBDA_EXP) * data.lambda[6 * (j * data.mb_width + i) + k]); | ||
929 : | Isibaar | 1909 | } |
930 : | syskin | 1660 | } else { |
931 : | for (j = 0; j<pEnc->mbParam.mb_height; j++) | ||
932 : | for (i = 0; i<pEnc->mbParam.mb_width; i++) | ||
933 : | for (k = 0; k < 6; k++) { | ||
934 : | frame->mbs[j*pEnc->mbParam.mb_width + i].lambda[k] = 1<<LAMBDA_EXP; | ||
935 : | Isibaar | 1909 | } |
936 : | syskin | 1660 | } |
937 : | |||
938 : | |||
939 : | edgomez | 1382 | frame->mbs[0].quant = data.quant; /* FRAME will not affect the quant in stats */ |
940 : | } | ||
941 : | edgomez | 851 | |
942 : | |||
943 : | edgomez | 1382 | } |
944 : | edgomez | 851 | |
945 : | Isibaar | 967 | |
946 : | edgomez | 1382 | static __inline void inc_frame_num(Encoder * pEnc) |
947 : | { | ||
948 : | pEnc->current->frame_num = pEnc->m_framenum; | ||
949 : | pEnc->current->stamp = pEnc->mbParam.m_stamp; /* first frame is zero */ | ||
950 : | Isibaar | 967 | |
951 : | edgomez | 1382 | pEnc->mbParam.m_stamp += pEnc->current->fincr; |
952 : | pEnc->m_framenum++; /* debug ticker */ | ||
953 : | } | ||
954 : | edgomez | 851 | |
955 : | edgomez | 1382 | static __inline void dec_frame_num(Encoder * pEnc) |
956 : | { | ||
957 : | pEnc->mbParam.m_stamp -= pEnc->mbParam.fincr; | ||
958 : | pEnc->m_framenum--; /* debug ticker */ | ||
959 : | } | ||
960 : | edgomez | 851 | |
961 : | edgomez | 1382 | static __inline void |
962 : | MBSetDquant(MACROBLOCK * pMB, int x, int y, MBParam * mbParam) | ||
963 : | { | ||
964 : | if (pMB->cbp == 0) { | ||
965 : | /* we want to code dquant but the quantizer value will not be used yet | ||
966 : | let's find out if we can postpone dquant to next MB | ||
967 : | */ | ||
968 : | if (x == mbParam->mb_width-1 && y == mbParam->mb_height-1) { | ||
969 : | pMB->dquant = 0; /* it's the last MB of all, the easiest case */ | ||
970 : | return; | ||
971 : | } else { | ||
972 : | MACROBLOCK * next = pMB + 1; | ||
973 : | const MACROBLOCK * prev = pMB - 1; | ||
974 : | if (next->mode != MODE_INTER4V && next->mode != MODE_NOT_CODED) | ||
975 : | /* mode allows dquant change in the future */ | ||
976 : | if (abs(next->quant - prev->quant) <= 2) { | ||
977 : | /* quant change is not out of range */ | ||
978 : | pMB->quant = prev->quant; | ||
979 : | pMB->dquant = 0; | ||
980 : | next->dquant = next->quant - prev->quant; | ||
981 : | return; | ||
982 : | } | ||
983 : | } | ||
984 : | edgomez | 851 | } |
985 : | edgomez | 1382 | /* couldn't skip this dquant */ |
986 : | pMB->mode = MODE_INTER_Q; | ||
987 : | } | ||
988 : | |||
989 : | edgomez | 851 | |
990 : | |||
991 : | edgomez | 1382 | static __inline void |
992 : | set_timecodes(FRAMEINFO* pCur,FRAMEINFO *pRef, int32_t time_base) | ||
993 : | { | ||
994 : | edgomez | 851 | |
995 : | edgomez | 1382 | pCur->ticks = (int32_t)pCur->stamp % time_base; |
996 : | pCur->seconds = ((int32_t)pCur->stamp / time_base) - ((int32_t)pRef->stamp / time_base) ; | ||
997 : | syskin | 903 | |
998 : | edgomez | 1382 | #if 0 /* HEAVY DEBUG OUTPUT */ |
999 : | fprintf(stderr,"WriteVop: %d - %d \n", | ||
1000 : | ((int32_t)pCur->stamp / time_base), ((int32_t)pRef->stamp / time_base)); | ||
1001 : | fprintf(stderr,"set_timecodes: VOP %1d stamp=%lld ref_stamp=%lld base=%d\n", | ||
1002 : | pCur->coding_type, pCur->stamp, pRef->stamp, time_base); | ||
1003 : | fprintf(stderr,"set_timecodes: VOP %1d seconds=%d ticks=%d (ref-sec=%d ref-tick=%d)\n", | ||
1004 : | pCur->coding_type, pCur->seconds, pCur->ticks, pRef->seconds, pRef->ticks); | ||
1005 : | #endif | ||
1006 : | } | ||
1007 : | edgomez | 851 | |
/*
 * simplify_par
 *
 * Normalize a pixel aspect ratio in place.
 *
 *   par_width, par_height - in/out ratio terms
 *
 * Steps:
 *   1. a zero term becomes 1, a negative term is replaced by its magnitude;
 *   2. the ratio is reduced by its greatest common divisor;
 *   3. if a term still exceeds 255, both are scaled down so the larger
 *      one becomes 255 (8 bit precision).
 *
 * On return both terms are at least 1. The rescale in step 3 truncates,
 * so for very lopsided ratios (e.g. 1000:1) the smaller term would end up
 * as 0; it is clamped to 1 to keep the ratio valid, consistent with the
 * zero handling of step 1.
 */
static void
simplify_par(int *par_width, int *par_height)
{
	int w = *par_width;
	int h = *par_height;
	int divisor;

	/* step 1: sanitize the inputs */
	if (w == 0)
		w = 1;
	else if (w < 0)
		w = -w;

	if (h == 0)
		h = 1;
	else if (h < 0)
		h = -h;

	/* step 2: reduce the fraction */
	divisor = gcd(w, h);
	w /= divisor;
	h /= divisor;

	/* step 3: 2^8 precision maximum */
	if (w > 255 || h > 255) {
		float div;
		emms();
		div = (float)((w > h) ? w : h) / 255;

		w = (int)((float)w/div);
		h = (int)((float)h/div);

		/* truncation must not produce a zero term */
		if (w < 1)
			w = 1;
		if (h < 1)
			h = 1;
	}

	*par_width = w;
	*par_height = h;
}
1037 : | edgomez | 851 | |
1038 : | edgomez | 1382 | /***************************************************************************** |
1039 : | * IPB frame encoder entry point | ||
1040 : | * | ||
1041 : | * Returned values : | ||
1042 : | * - >0 - output bytes | ||
1043 : | * - 0 - no output | ||
1044 : | * - XVID_ERR_VERSION - wrong version passed to core | ||
1045 : | * - XVID_ERR_END - End of stream reached before end of coding | ||
1046 : | * - XVID_ERR_FORMAT - the image subsystem reported the image had a wrong | ||
1047 : | * format | ||
1048 : | ****************************************************************************/ | ||
1049 : | edgomez | 851 | |
1050 : | |||
1051 : | edgomez | 1382 | int |
1052 : | enc_encode(Encoder * pEnc, | ||
1053 : | xvid_enc_frame_t * xFrame, | ||
1054 : | xvid_enc_stats_t * stats) | ||
1055 : | { | ||
1056 : | xvid_enc_frame_t * frame; | ||
1057 : | int type; | ||
1058 : | Bitstream bs; | ||
1059 : | edgomez | 851 | |
1060 : | edgomez | 1382 | if (XVID_VERSION_MAJOR(xFrame->version) != 1 || (stats && XVID_VERSION_MAJOR(stats->version) != 1)) /* v1.x.x */ |
1061 : | return XVID_ERR_VERSION; | ||
1062 : | edgomez | 851 | |
1063 : | edgomez | 1382 | xFrame->out_flags = 0; |
1064 : | edgomez | 851 | |
1065 : | edgomez | 1382 | start_global_timer(); |
1066 : | BitstreamInit(&bs, xFrame->bitstream, 0); | ||
1067 : | |||
1068 : | |||
1069 : | /* %%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%% | ||
1070 : | * enqueue image to the encoding-queue | ||
1071 : | * %%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%% */ | ||
1072 : | |||
1073 : | if (xFrame->input.csp != XVID_CSP_NULL) | ||
1074 : | { | ||
1075 : | QUEUEINFO * q = &pEnc->queue[pEnc->queue_tail]; | ||
1076 : | |||
1077 : | edgomez | 851 | start_timer(); |
1078 : | if (image_input | ||
1079 : | edgomez | 1382 | (&q->image, pEnc->mbParam.width, pEnc->mbParam.height, |
1080 : | pEnc->mbParam.edged_width, (uint8_t**)xFrame->input.plane, xFrame->input.stride, | ||
1081 : | xFrame->input.csp, xFrame->vol_flags & XVID_VOL_INTERLACING)) | ||
1082 : | edgomez | 851 | { |
1083 : | emms(); | ||
1084 : | return XVID_ERR_FORMAT; | ||
1085 : | } | ||
1086 : | stop_conv_timer(); | ||
1087 : | |||
1088 : | edgomez | 1382 | if ((xFrame->vop_flags & XVID_VOP_CHROMAOPT)) { |
1089 : | image_chroma_optimize(&q->image, | ||
1090 : | edgomez | 853 | pEnc->mbParam.width, pEnc->mbParam.height, pEnc->mbParam.edged_width); |
1091 : | } | ||
1092 : | |||
1093 : | edgomez | 1382 | q->frame = *xFrame; |
1094 : | |||
1095 : | if (xFrame->quant_intra_matrix) | ||
1096 : | edgomez | 851 | { |
1097 : | edgomez | 1382 | memcpy(q->quant_intra_matrix, xFrame->quant_intra_matrix, 64*sizeof(unsigned char)); |
1098 : | q->frame.quant_intra_matrix = q->quant_intra_matrix; | ||
1099 : | edgomez | 851 | } |
1100 : | |||
1101 : | edgomez | 1382 | if (xFrame->quant_inter_matrix) |
1102 : | { | ||
1103 : | memcpy(q->quant_inter_matrix, xFrame->quant_inter_matrix, 64*sizeof(unsigned char)); | ||
1104 : | q->frame.quant_inter_matrix = q->quant_inter_matrix; | ||
1105 : | } | ||
1106 : | edgomez | 851 | |
1107 : | edgomez | 1382 | pEnc->queue_tail = (pEnc->queue_tail + 1) % (pEnc->mbParam.max_bframes+1); |
1108 : | pEnc->queue_size++; | ||
1109 : | } | ||
1110 : | edgomez | 851 | |
1111 : | |||
1112 : | edgomez | 1382 | /* %%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%% |
1113 : | * bframe flush code | ||
1114 : | * %%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%% */ | ||
1115 : | edgomez | 851 | |
1116 : | edgomez | 1382 | repeat: |
1117 : | edgomez | 851 | |
1118 : | edgomez | 1382 | if (pEnc->flush_bframes) |
1119 : | { | ||
1120 : | if (pEnc->bframenum_head < pEnc->bframenum_tail) { | ||
1121 : | edgomez | 851 | |
1122 : | edgomez | 1382 | DPRINTF(XVID_DEBUG_DEBUG,"*** BFRAME (flush) bf: head=%i tail=%i queue: head=%i tail=%i size=%i\n", |
1123 : | pEnc->bframenum_head, pEnc->bframenum_tail, | ||
1124 : | pEnc->queue_head, pEnc->queue_tail, pEnc->queue_size); | ||
1125 : | edgomez | 851 | |
1126 : | edgomez | 1382 | if ((pEnc->mbParam.plugin_flags & XVID_REQORIGINAL)) { |
1127 : | image_copy(&pEnc->sOriginal2, &pEnc->bframes[pEnc->bframenum_head]->image, | ||
1128 : | pEnc->mbParam.edged_width, pEnc->mbParam.height); | ||
1129 : | edgomez | 851 | } |
1130 : | |||
1131 : | edgomez | 1382 | FrameCodeB(pEnc, pEnc->bframes[pEnc->bframenum_head], &bs); |
1132 : | suxen_drol | 1653 | call_plugins(pEnc, pEnc->bframes[pEnc->bframenum_head], &pEnc->sOriginal2, XVID_PLG_AFTER, NULL, NULL, stats); |
1133 : | edgomez | 1382 | pEnc->bframenum_head++; |
1134 : | edgomez | 851 | |
1135 : | edgomez | 1382 | goto done; |
1136 : | edgomez | 851 | } |
1137 : | |||
1138 : | edgomez | 1382 | /* write an empty marker to the bitstream. |
1139 : | edgomez | 851 | |
1140 : | edgomez | 1382 | for divx5 decoder compatibility, this marker must consist |
1141 : | of a not-coded p-vop, with a time_base of zero, and time_increment | ||
1142 : | identical to the future-reference frame. | |
1143 : | */ | ||
1144 : | edgomez | 851 | |
1145 : | edgomez | 1382 | if ((pEnc->mbParam.global_flags & XVID_GLOBAL_PACKED && pEnc->bframenum_tail > 0)) { |
1146 : | int tmp; | ||
1147 : | int bits; | ||
1148 : | edgomez | 851 | |
1149 : | edgomez | 1382 | DPRINTF(XVID_DEBUG_DEBUG,"*** EMPTY bf: head=%i tail=%i queue: head=%i tail=%i size=%i\n", |
1150 : | pEnc->bframenum_head, pEnc->bframenum_tail, | ||
1151 : | pEnc->queue_head, pEnc->queue_tail, pEnc->queue_size); | ||
1152 : | edgomez | 851 | |
1153 : | edgomez | 1382 | bits = BitstreamPos(&bs); |
1154 : | edgomez | 851 | |
1155 : | edgomez | 1382 | tmp = pEnc->current->seconds; |
1156 : | pEnc->current->seconds = 0; /* force time_base = 0 */ | ||
1157 : | edgomez | 851 | |
1158 : | edgomez | 1382 | BitstreamWriteVopHeader(&bs, &pEnc->mbParam, pEnc->current, 0, pEnc->current->quant); |
1159 : | BitstreamPad(&bs); | ||
1160 : | pEnc->current->seconds = tmp; | ||
1161 : | edgomez | 851 | |
1162 : | edgomez | 1382 | /* add the not-coded length to the reference frame size */ |
1163 : | pEnc->current->length += (BitstreamPos(&bs) - bits) / 8; | ||
1164 : | suxen_drol | 1653 | call_plugins(pEnc, pEnc->current, &pEnc->sOriginal, XVID_PLG_AFTER, NULL, NULL, stats); |
1165 : | edgomez | 851 | |
1166 : | edgomez | 1382 | /* flush complete: reset counters */ |
1167 : | pEnc->flush_bframes = 0; | ||
1168 : | pEnc->bframenum_head = pEnc->bframenum_tail = 0; | ||
1169 : | goto done; | ||
1170 : | edgomez | 851 | |
1171 : | } | ||
1172 : | |||
1173 : | edgomez | 1382 | /* flush complete: reset counters */ |
1174 : | pEnc->flush_bframes = 0; | ||
1175 : | pEnc->bframenum_head = pEnc->bframenum_tail = 0; | ||
1176 : | } | ||
1177 : | edgomez | 851 | |
1178 : | /* %%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%% | ||
1179 : | edgomez | 1382 | * dequeue frame from the encoding queue |
1180 : | edgomez | 851 | * %%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%% */ |
1181 : | |||
1182 : | edgomez | 1382 | if (pEnc->queue_size == 0) /* empty */ |
1183 : | { | ||
1184 : | if (xFrame->input.csp == XVID_CSP_NULL) /* no futher input */ | ||
1185 : | { | ||
1186 : | edgomez | 851 | |
1187 : | edgomez | 1382 | DPRINTF(XVID_DEBUG_DEBUG,"*** FINISH bf: head=%i tail=%i queue: head=%i tail=%i size=%i\n", |
1188 : | pEnc->bframenum_head, pEnc->bframenum_tail, | ||
1189 : | pEnc->queue_head, pEnc->queue_tail, pEnc->queue_size); | ||
1190 : | edgomez | 851 | |
1191 : | edgomez | 1382 | if (!(pEnc->mbParam.global_flags & XVID_GLOBAL_PACKED) && pEnc->mbParam.max_bframes > 0) { |
1192 : | suxen_drol | 1653 | call_plugins(pEnc, pEnc->current, &pEnc->sOriginal, XVID_PLG_AFTER, NULL, NULL, stats); |
1193 : | edgomez | 1382 | } |
1194 : | edgomez | 851 | |
1195 : | edgomez | 1382 | /* if the very last frame is to be b-vop, we must change it to a p-vop */ |
1196 : | if (pEnc->bframenum_tail > 0) { | ||
1197 : | edgomez | 851 | |
1198 : | edgomez | 1382 | SWAP(FRAMEINFO*, pEnc->current, pEnc->reference); |
1199 : | pEnc->bframenum_tail--; | ||
1200 : | SWAP(FRAMEINFO*, pEnc->current, pEnc->bframes[pEnc->bframenum_tail]); | ||
1201 : | edgomez | 851 | |
1202 : | edgomez | 1382 | /* convert B-VOP to P-VOP */ |
1203 : | pEnc->current->quant = 100*pEnc->current->quant - pEnc->mbParam.bquant_offset; | ||
1204 : | pEnc->current->quant += pEnc->mbParam.bquant_ratio - 1; /* to avoid rouding issues */ | ||
1205 : | pEnc->current->quant /= pEnc->mbParam.bquant_ratio; | ||
1206 : | |||
1207 : | if ((pEnc->mbParam.plugin_flags & XVID_REQORIGINAL)) { | ||
1208 : | image_copy(&pEnc->sOriginal, &pEnc->current->image, | ||
1209 : | pEnc->mbParam.edged_width, pEnc->mbParam.height); | ||
1210 : | edgomez | 851 | } |
1211 : | |||
1212 : | edgomez | 1382 | DPRINTF(XVID_DEBUG_DEBUG,"*** PFRAME bf: head=%i tail=%i queue: head=%i tail=%i size=%i\n", |
1213 : | pEnc->bframenum_head, pEnc->bframenum_tail, | ||
1214 : | pEnc->queue_head, pEnc->queue_tail, pEnc->queue_size); | ||
1215 : | syskin | 1391 | pEnc->mbParam.frame_drop_ratio = -1; /* it must be a coded vop */ |
1216 : | edgomez | 851 | |
1217 : | syskin | 1403 | FrameCodeP(pEnc, &bs); |
1218 : | edgomez | 851 | |
1219 : | |||
1220 : | edgomez | 1382 | if ((pEnc->mbParam.global_flags & XVID_GLOBAL_PACKED) && pEnc->bframenum_tail==0) { |
1221 : | suxen_drol | 1653 | call_plugins(pEnc, pEnc->current, &pEnc->sOriginal, XVID_PLG_AFTER, NULL, NULL, stats); |
1222 : | edgomez | 1382 | }else{ |
1223 : | pEnc->flush_bframes = 1; | ||
1224 : | goto done; | ||
1225 : | } | ||
1226 : | } | ||
1227 : | DPRINTF(XVID_DEBUG_DEBUG, "*** END\n"); | ||
1228 : | edgomez | 851 | |
1229 : | edgomez | 1382 | emms(); |
1230 : | return XVID_ERR_END; /* end of stream reached */ | ||
1231 : | edgomez | 851 | } |
1232 : | edgomez | 1382 | goto done; /* nothing to encode yet; encoder lag */ |
1233 : | } | ||
1234 : | edgomez | 851 | |
1235 : | edgomez | 1382 | /* the current FRAME becomes the reference */ |
1236 : | SWAP(FRAMEINFO*, pEnc->current, pEnc->reference); | ||
1237 : | edgomez | 851 | |
1238 : | edgomez | 1382 | /* remove frame from encoding-queue (head), and move it into the current */ |
1239 : | image_swap(&pEnc->current->image, &pEnc->queue[pEnc->queue_head].image); | ||
1240 : | frame = &pEnc->queue[pEnc->queue_head].frame; | ||
1241 : | pEnc->queue_head = (pEnc->queue_head + 1) % (pEnc->mbParam.max_bframes+1); | ||
1242 : | pEnc->queue_size--; | ||
1243 : | edgomez | 851 | |
1244 : | |||
1245 : | edgomez | 1382 | /* %%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%% |
1246 : | * init pEnc->current fields | ||
1247 : | * %%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%% */ | ||
1248 : | edgomez | 851 | |
1249 : | edgomez | 1382 | pEnc->current->fincr = pEnc->mbParam.fincr>0 ? pEnc->mbParam.fincr : frame->fincr; |
1250 : | inc_frame_num(pEnc); | ||
1251 : | pEnc->current->vol_flags = frame->vol_flags; | ||
1252 : | pEnc->current->vop_flags = frame->vop_flags; | ||
1253 : | pEnc->current->motion_flags = frame->motion; | ||
1254 : | pEnc->current->fcode = pEnc->mbParam.m_fcode; | ||
1255 : | pEnc->current->bcode = pEnc->mbParam.m_fcode; | ||
1256 : | edgomez | 851 | |
1257 : | |||
1258 : | edgomez | 1382 | if ((xFrame->vop_flags & XVID_VOP_CHROMAOPT)) { |
1259 : | image_chroma_optimize(&pEnc->current->image, | ||
1260 : | pEnc->mbParam.width, pEnc->mbParam.height, pEnc->mbParam.edged_width); | ||
1261 : | } | ||
1262 : | edgomez | 851 | |
1263 : | edgomez | 1382 | /* %%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%% |
1264 : | * frame type & quant selection | ||
1265 : | * %%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%% */ | ||
1266 : | edgomez | 851 | |
1267 : | edgomez | 1382 | type = frame->type; |
1268 : | pEnc->current->quant = frame->quant; | ||
1269 : | edgomez | 851 | |
1270 : | Skal | 1617 | call_plugins(pEnc, pEnc->current, NULL, XVID_PLG_BEFORE, &type, (int*)&pEnc->current->quant, stats); |
1271 : | edgomez | 851 | |
1272 : | edgomez | 1382 | if (type > 0){ /* XVID_TYPE_?VOP */ |
1273 : | type = type2coding(type); /* convert XVID_TYPE_?VOP to bitstream coding type */ | ||
1274 : | } else{ /* XVID_TYPE_AUTO */ | ||
1275 : | if (pEnc->iFrameNum == 0 || (pEnc->mbParam.iMaxKeyInterval > 0 && pEnc->iFrameNum >= pEnc->mbParam.iMaxKeyInterval)){ | ||
1276 : | pEnc->iFrameNum = 0; | ||
1277 : | type = I_VOP; | ||
1278 : | }else{ | ||
1279 : | type = MEanalysis(&pEnc->reference->image, pEnc->current, | ||
1280 : | &pEnc->mbParam, pEnc->mbParam.iMaxKeyInterval, | ||
1281 : | pEnc->iFrameNum, pEnc->bframenum_tail, xFrame->bframe_threshold, | ||
1282 : | (pEnc->bframes) ? pEnc->bframes[pEnc->bframenum_head]->mbs: NULL); | ||
1283 : | edgomez | 851 | } |
1284 : | edgomez | 1382 | } |
1285 : | edgomez | 851 | |
1286 : | edgomez | 1382 | if (type != I_VOP) |
1287 : | pEnc->current->vol_flags = pEnc->mbParam.vol_flags; /* don't allow VOL changes here */ | ||
1288 : | edgomez | 851 | |
1289 : | edgomez | 1382 | /* bframes buffer overflow check */ |
1290 : | if (type == B_VOP && pEnc->bframenum_tail >= pEnc->mbParam.max_bframes) { | ||
1291 : | type = P_VOP; | ||
1292 : | } | ||
1293 : | edgomez | 851 | |
1294 : | edgomez | 1382 | pEnc->iFrameNum++; |
1295 : | edgomez | 851 | |
1296 : | edgomez | 1382 | if ((pEnc->current->vop_flags & XVID_VOP_DEBUG)) { |
1297 : | image_printf(&pEnc->current->image, pEnc->mbParam.edged_width, pEnc->mbParam.height, 5, 5, | ||
1298 : | "%d st:%lld if:%d", pEnc->current->frame_num, pEnc->current->stamp, pEnc->iFrameNum); | ||
1299 : | } | ||
1300 : | edgomez | 851 | |
1301 : | edgomez | 1382 | /* %%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%% |
1302 : | * encode this frame as a b-vop | ||
1303 : | * (we dont encode here, rather we store the frame in the bframes queue, to be encoded later) | ||
1304 : | * %%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%% */ | ||
1305 : | if (type == B_VOP) { | ||
1306 : | if ((pEnc->current->vop_flags & XVID_VOP_DEBUG)) { | ||
1307 : | edgomez | 851 | image_printf(&pEnc->current->image, pEnc->mbParam.edged_width, pEnc->mbParam.height, 5, 200, "BVOP"); |
1308 : | } | ||
1309 : | |||
1310 : | edgomez | 1382 | if (frame->quant < 1) { |
1311 : | syskin | 903 | pEnc->current->quant = ((((pEnc->reference->quant + pEnc->current->quant) * |
1312 : | edgomez | 851 | pEnc->mbParam.bquant_ratio) / 2) + pEnc->mbParam.bquant_offset)/100; |
1313 : | |||
1314 : | } else { | ||
1315 : | edgomez | 1382 | pEnc->current->quant = frame->quant; |
1316 : | edgomez | 851 | } |
1317 : | |||
1318 : | if (pEnc->current->quant < 1) | ||
1319 : | pEnc->current->quant = 1; | ||
1320 : | else if (pEnc->current->quant > 31) | ||
1321 : | syskin | 903 | pEnc->current->quant = 31; |
1322 : | |||
1323 : | edgomez | 1382 | DPRINTF(XVID_DEBUG_DEBUG,"*** BFRAME (store) bf: head=%i tail=%i queue: head=%i tail=%i size=%i quant=%i\n", |
1324 : | edgomez | 851 | pEnc->bframenum_head, pEnc->bframenum_tail, |
1325 : | pEnc->queue_head, pEnc->queue_tail, pEnc->queue_size,pEnc->current->quant); | ||
1326 : | |||
1327 : | /* store frame into bframe buffer & swap ref back to current */ | ||
1328 : | edgomez | 1382 | SWAP(FRAMEINFO*, pEnc->current, pEnc->bframes[pEnc->bframenum_tail]); |
1329 : | SWAP(FRAMEINFO*, pEnc->current, pEnc->reference); | ||
1330 : | edgomez | 851 | |
1331 : | pEnc->bframenum_tail++; | ||
1332 : | |||
1333 : | edgomez | 1382 | goto repeat; |
1334 : | edgomez | 851 | } |
1335 : | |||
1336 : | |||
1337 : | edgomez | 1382 | DPRINTF(XVID_DEBUG_DEBUG,"*** XXXXXX bf: head=%i tail=%i queue: head=%i tail=%i size=%i\n", |
1338 : | pEnc->bframenum_head, pEnc->bframenum_tail, | ||
1339 : | pEnc->queue_head, pEnc->queue_tail, pEnc->queue_size); | ||
1340 : | edgomez | 851 | |
1341 : | edgomez | 1382 | /* for unpacked bframes, output the stats for the last encoded frame */ |
1342 : | if (!(pEnc->mbParam.global_flags & XVID_GLOBAL_PACKED) && pEnc->mbParam.max_bframes > 0) | ||
1343 : | { | ||
1344 : | if (pEnc->current->stamp > 0) { | ||
1345 : | suxen_drol | 1653 | call_plugins(pEnc, pEnc->reference, &pEnc->sOriginal, XVID_PLG_AFTER, NULL, NULL, stats); |
1346 : | edgomez | 851 | } |
1347 : | Isibaar | 1770 | else if (stats) { |
1348 : | stats->type = XVID_TYPE_NOTHING; | ||
1349 : | } | ||
1350 : | edgomez | 851 | } |
1351 : | |||
1352 : | edgomez | 1382 | /* %%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%% |
1353 : | * closed-gop | ||
1354 : | * if the frame prior to an iframe is scheduled as a bframe, we must change it to a pframe | ||
1355 : | * %%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%% */ | ||
1356 : | edgomez | 851 | |
1357 : | edgomez | 1382 | if (type == I_VOP && (pEnc->mbParam.global_flags & XVID_GLOBAL_CLOSED_GOP) && pEnc->bframenum_tail > 0) { |
1358 : | edgomez | 851 | |
1359 : | edgomez | 1382 | /* place this frame back on the encoding-queue (head) */ |
1360 : | /* we will deal with it next time */ | ||
1361 : | dec_frame_num(pEnc); | ||
1362 : | pEnc->iFrameNum--; | ||
1363 : | edgomez | 851 | |
1364 : | edgomez | 1382 | pEnc->queue_head = (pEnc->queue_head + (pEnc->mbParam.max_bframes+1) - 1) % (pEnc->mbParam.max_bframes+1); |
1365 : | pEnc->queue_size++; | ||
1366 : | image_swap(&pEnc->current->image, &pEnc->queue[pEnc->queue_head].image); | ||
1367 : | edgomez | 851 | |
1368 : | edgomez | 1382 | /* grab the last frame from the bframe-queue */ |
1369 : | edgomez | 851 | |
1370 : | edgomez | 1382 | pEnc->bframenum_tail--; |
1371 : | SWAP(FRAMEINFO*, pEnc->current, pEnc->bframes[pEnc->bframenum_tail]); | ||
1372 : | edgomez | 851 | |
1373 : | edgomez | 1382 | if ((pEnc->current->vop_flags & XVID_VOP_DEBUG)) { |
1374 : | suxen_drol | 1607 | image_printf(&pEnc->current->image, pEnc->mbParam.edged_width, pEnc->mbParam.height, 5, 100, "CLOSED GOP BVOP->PVOP"); |
1375 : | edgomez | 1382 | } |
1376 : | suxen_drol | 229 | |
1377 : | edgomez | 1382 | /* convert B-VOP quant to P-VOP */ |
1378 : | pEnc->current->quant = 100*pEnc->current->quant - pEnc->mbParam.bquant_offset; | ||
1379 : | pEnc->current->quant += pEnc->mbParam.bquant_ratio - 1; /* to avoid rouding issues */ | ||
1380 : | pEnc->current->quant /= pEnc->mbParam.bquant_ratio; | ||
1381 : | type = P_VOP; | ||
1382 : | edgomez | 851 | } |
1383 : | |||
1384 : | Isibaar | 3 | |
1385 : | edgomez | 1382 | /* %%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%% |
1386 : | * encode this frame as an i-vop | ||
1387 : | * %%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%% */ | ||
1388 : | edgomez | 853 | |
1389 : | edgomez | 1382 | if (type == I_VOP) { |
1390 : | Isibaar | 113 | |
1391 : | edgomez | 1382 | DPRINTF(XVID_DEBUG_DEBUG,"*** IFRAME bf: head=%i tail=%i queue: head=%i tail=%i size=%i\n", |
1392 : | pEnc->bframenum_head, pEnc->bframenum_tail, | ||
1393 : | pEnc->queue_head, pEnc->queue_tail, pEnc->queue_size); | ||
1394 : | suxen_drol | 136 | |
1395 : | edgomez | 1382 | if ((pEnc->current->vop_flags & XVID_VOP_DEBUG)) { |
1396 : | image_printf(&pEnc->current->image, pEnc->mbParam.edged_width, pEnc->mbParam.height, 5, 200, "IVOP"); | ||
1397 : | } | ||
1398 : | Isibaar | 3 | |
1399 : | edgomez | 1382 | pEnc->iFrameNum = 1; |
1400 : | Isibaar | 3 | |
1401 : | edgomez | 1382 | /* ---- update vol flags at IVOP ----------- */ |
1402 : | pEnc->mbParam.vol_flags = pEnc->current->vol_flags; | ||
1403 : | edgomez | 851 | |
1404 : | edgomez | 1382 | /* Aspect ratio */ |
1405 : | switch(frame->par) { | ||
1406 : | case XVID_PAR_11_VGA: | ||
1407 : | case XVID_PAR_43_PAL: | ||
1408 : | case XVID_PAR_43_NTSC: | ||
1409 : | case XVID_PAR_169_PAL: | ||
1410 : | case XVID_PAR_169_NTSC: | ||
1411 : | case XVID_PAR_EXT: | ||
1412 : | pEnc->mbParam.par = frame->par; | ||
1413 : | break; | ||
1414 : | default: | ||
1415 : | pEnc->mbParam.par = XVID_PAR_11_VGA; | ||
1416 : | break; | ||
1417 : | } | ||
1418 : | edgomez | 195 | |
1419 : | edgomez | 1382 | /* For extended PAR only, we try to sanitize/simplify par values */ |
1420 : | if (pEnc->mbParam.par == XVID_PAR_EXT) { | ||
1421 : | pEnc->mbParam.par_width = frame->par_width; | ||
1422 : | pEnc->mbParam.par_height = frame->par_height; | ||
1423 : | simplify_par(&pEnc->mbParam.par_width, &pEnc->mbParam.par_height); | ||
1424 : | } | ||
1425 : | edgomez | 194 | |
1426 : | edgomez | 1382 | if ((pEnc->mbParam.vol_flags & XVID_VOL_MPEGQUANT)) { |
1427 : | if (frame->quant_intra_matrix != NULL) | ||
1428 : | set_intra_matrix(pEnc->mbParam.mpeg_quant_matrices, frame->quant_intra_matrix); | ||
1429 : | if (frame->quant_inter_matrix != NULL) | ||
1430 : | set_inter_matrix(pEnc->mbParam.mpeg_quant_matrices, frame->quant_inter_matrix); | ||
1431 : | } | ||
1432 : | edgomez | 194 | |
1433 : | edgomez | 1382 | /* prevent vol/vop misuse */ |
1434 : | edgomez | 194 | |
1435 : | edgomez | 1382 | if (!(pEnc->current->vol_flags & XVID_VOL_INTERLACING)) |
1436 : | pEnc->current->vop_flags &= ~(XVID_VOP_TOPFIELDFIRST|XVID_VOP_ALTERNATESCAN); | ||
1437 : | edgomez | 195 | |
1438 : | edgomez | 1382 | /* ^^^------------------------ */ |
1439 : | edgomez | 195 | |
1440 : | edgomez | 1382 | if ((pEnc->mbParam.plugin_flags & XVID_REQORIGINAL)) { |
1441 : | image_copy(&pEnc->sOriginal, &pEnc->current->image, | ||
1442 : | pEnc->mbParam.edged_width, pEnc->mbParam.height); | ||
1443 : | edgomez | 194 | } |
1444 : | |||
1445 : | edgomez | 1382 | FrameCodeI(pEnc, &bs); |
1446 : | xFrame->out_flags |= XVID_KEYFRAME; | ||
1447 : | Isibaar | 3 | |
1448 : | edgomez | 1382 | /* %%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%% |
1449 : | * encode this frame as a p-vop | ||
1450 : | * %%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%% */ | ||
1451 : | Isibaar | 3 | |
1452 : | edgomez | 1382 | } else { /* (type == P_VOP || type == S_VOP) */ |
1453 : | edgomez | 78 | |
1454 : | edgomez | 1382 | DPRINTF(XVID_DEBUG_DEBUG,"*** PFRAME bf: head=%i tail=%i queue: head=%i tail=%i size=%i\n", |
1455 : | pEnc->bframenum_head, pEnc->bframenum_tail, | ||
1456 : | pEnc->queue_head, pEnc->queue_tail, pEnc->queue_size); | ||
1457 : | edgomez | 195 | |
1458 : | edgomez | 1382 | if ((pEnc->current->vop_flags & XVID_VOP_DEBUG)) { |
1459 : | image_printf(&pEnc->current->image, pEnc->mbParam.edged_width, pEnc->mbParam.height, 5, 200, "PVOP"); | ||
1460 : | Isibaar | 20 | } |
1461 : | Isibaar | 3 | |
1462 : | edgomez | 1382 | if ((pEnc->mbParam.plugin_flags & XVID_REQORIGINAL)) { |
1463 : | image_copy(&pEnc->sOriginal, &pEnc->current->image, | ||
1464 : | pEnc->mbParam.edged_width, pEnc->mbParam.height); | ||
1465 : | edgomez | 194 | } |
1466 : | |||
1467 : | syskin | 1403 | if ( FrameCodeP(pEnc, &bs) == 0 ) { |
1468 : | syskin | 1391 | /* N-VOP, we mustn't code b-frames yet */ |
1469 : | Isibaar | 1679 | if ((pEnc->mbParam.global_flags & XVID_GLOBAL_PACKED) || |
1470 : | pEnc->mbParam.max_bframes == 0) | ||
1471 : | call_plugins(pEnc, pEnc->current, &pEnc->sOriginal, XVID_PLG_AFTER, NULL, NULL, stats); | ||
1472 : | syskin | 1391 | goto done; |
1473 : | } | ||
1474 : | edgomez | 13 | } |
1475 : | Isibaar | 3 | |
1476 : | edgomez | 867 | |
1477 : | edgomez | 1382 | /* %%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%% |
1478 : | * on next enc_encode call we must flush bframes | ||
1479 : | * %%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%% */ | ||
1480 : | h | 29 | |
1481 : | edgomez | 1382 | /*done_flush:*/ |
1482 : | edgomez | 195 | |
1483 : | edgomez | 1382 | pEnc->flush_bframes = 1; |
1484 : | Isibaar | 41 | |
1485 : | edgomez | 1382 | /* packed & queued_bframes: dont bother outputting stats here, we do so after the flush */ |
1486 : | if ((pEnc->mbParam.global_flags & XVID_GLOBAL_PACKED) && pEnc->bframenum_tail > 0) { | ||
1487 : | goto repeat; | ||
1488 : | Isibaar | 3 | } |
1489 : | syskin | 903 | |
1490 : | edgomez | 1382 | /* packed or no-bframes or no-bframes-queued: output stats */ |
1491 : | if ((pEnc->mbParam.global_flags & XVID_GLOBAL_PACKED) || pEnc->mbParam.max_bframes == 0 ) { | ||
1492 : | suxen_drol | 1653 | call_plugins(pEnc, pEnc->current, &pEnc->sOriginal, XVID_PLG_AFTER, NULL, NULL, stats); |
1493 : | edgomez | 851 | } |
1494 : | Isibaar | 113 | |
1495 : | edgomez | 1382 | /* %%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%% |
1496 : | * done; return number of bytes consumed | ||
1497 : | * %%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%% */ | ||
1498 : | edgomez | 195 | |
1499 : | edgomez | 1382 | done: |
1500 : | |||
1501 : | Isibaar | 3 | stop_global_timer(); |
1502 : | write_timer(); | ||
1503 : | |||
1504 : | edgomez | 1382 | emms(); |
1505 : | return BitstreamLength(&bs); | ||
1506 : | Isibaar | 3 | } |
1507 : | |||
1508 : | |||
1509 : | edgomez | 1382 | static void SetMacroblockQuants(MBParam * const pParam, FRAMEINFO * frame) |
1510 : | { | ||
1511 : | unsigned int i; | ||
1512 : | MACROBLOCK * pMB = frame->mbs; | ||
1513 : | int quant = frame->mbs[0].quant; /* set by XVID_PLG_FRAME */ | ||
1514 : | if (quant > 31) | ||
1515 : | frame->quant = quant = 31; | ||
1516 : | else if (quant < 1) | ||
1517 : | frame->quant = quant = 1; | ||
1518 : | |||
1519 : | for (i = 0; i < pParam->mb_height * pParam->mb_width; i++) { | ||
1520 : | quant += pMB->dquant; | ||
1521 : | if (quant > 31) | ||
1522 : | quant = 31; | ||
1523 : | else if (quant < 1) | ||
1524 : | quant = 1; | ||
1525 : | pMB->quant = quant; | ||
1526 : | pMB++; | ||
1527 : | } | ||
1528 : | } | ||
1529 : | |||
1530 : | |||
1531 : | edgomez | 195 | static __inline void |
1532 : | Isibaar | 1913 | CodeIntraMB(MACROBLOCK * pMB) |
1533 : | edgomez | 195 | { |
1534 : | Isibaar | 3 | pMB->mode = MODE_INTRA; |
1535 : | |||
1536 : | suxen_drol | 136 | /* zero mv statistics */ |
1537 : | pMB->mvs[0].x = pMB->mvs[1].x = pMB->mvs[2].x = pMB->mvs[3].x = 0; | ||
1538 : | pMB->mvs[0].y = pMB->mvs[1].y = pMB->mvs[2].y = pMB->mvs[3].y = 0; | ||
1539 : | pMB->sad8[0] = pMB->sad8[1] = pMB->sad8[2] = pMB->sad8[3] = 0; | ||
1540 : | pMB->sad16 = 0; | ||
1541 : | |||
1542 : | edgomez | 1382 | if (pMB->dquant != 0) { |
1543 : | pMB->mode = MODE_INTRA_Q; | ||
1544 : | Isibaar | 3 | } |
1545 : | } | ||
1546 : | |||
1547 : | Isibaar | 1913 | static void |
1548 : | SliceCodeI(SMPData *data) | ||
1549 : | { | ||
1550 : | Encoder *pEnc = (Encoder *) data->pEnc; | ||
1551 : | Bitstream *bs = (Bitstream *) data->bs; | ||
1552 : | Isibaar | 3 | |
1553 : | Isibaar | 1913 | uint16_t x, y; |
1554 : | int mb_width = pEnc->mbParam.mb_width; | ||
1555 : | int mb_height = pEnc->mbParam.mb_height; | ||
1556 : | h | 101 | |
1557 : | Isibaar | 1913 | int bound = 0, num_slices = pEnc->num_slices; |
1558 : | FRAMEINFO *const current = pEnc->current; | ||
1559 : | |||
1560 : | DECLARE_ALIGNED_MATRIX(dct_codes, 6, 64, int16_t, CACHE_LINE); | ||
1561 : | DECLARE_ALIGNED_MATRIX(qcoeff, 6, 64, int16_t, CACHE_LINE); | ||
1562 : | |||
1563 : | if (data->start_y > 0) { /* write resync marker */ | ||
1564 : | bound = data->start_y*mb_width; | ||
1565 : | write_video_packet_header(bs, &pEnc->mbParam, current, bound); | ||
1566 : | } | ||
1567 : | |||
1568 : | for (y = data->start_y; y < data->stop_y; y++) { | ||
1569 : | int new_bound = mb_width * ((((y*num_slices) / mb_height) * mb_height + (num_slices-1)) / num_slices); | ||
1570 : | |||
1571 : | if (new_bound > bound) { | ||
1572 : | bound = new_bound; | ||
1573 : | BitstreamPadAlways(bs); | ||
1574 : | write_video_packet_header(bs, &pEnc->mbParam, current, bound); | ||
1575 : | } | ||
1576 : | |||
1577 : | for (x = 0; x < mb_width; x++) { | ||
1578 : | MACROBLOCK *pMB = ¤t->mbs[x + y * mb_width]; | ||
1579 : | |||
1580 : | CodeIntraMB(pMB); | ||
1581 : | |||
1582 : | MBTransQuantIntra(&pEnc->mbParam, current, pMB, x, y, | ||
1583 : | dct_codes, qcoeff); | ||
1584 : | |||
1585 : | start_timer(); | ||
1586 : | MBPrediction(current, x, y, mb_width, qcoeff, bound); | ||
1587 : | stop_prediction_timer(); | ||
1588 : | |||
1589 : | start_timer(); | ||
1590 : | MBCoding(current, pMB, qcoeff, bs, data->sStat); | ||
1591 : | stop_coding_timer(); | ||
1592 : | |||
1593 : | } | ||
1594 : | } | ||
1595 : | |||
1596 : | emms(); | ||
1597 : | BitstreamPadAlways(bs); | ||
1598 : | } | ||
1599 : | |||
1600 : | static __inline void | ||
1601 : | SerializeBitstreams(Encoder *pEnc, FRAMEINFO *current, Bitstream *bs, int num_threads) | ||
1602 : | { | ||
1603 : | int k; | ||
1604 : | uint32_t pos = BitstreamLength(bs); | ||
1605 : | |||
1606 : | for (k = 1; k < num_threads; k++) { | ||
1607 : | uint32_t len = BitstreamLength(pEnc->smpData[k].bs); | ||
1608 : | |||
1609 : | memcpy((void *)((ptr_t)bs->start + pos), | ||
1610 : | (void *)((ptr_t)pEnc->smpData[k].bs->start), len); | ||
1611 : | |||
1612 : | Isibaar | 1935 | current->length += len; |
1613 : | pos += len; | ||
1614 : | Isibaar | 1913 | |
1615 : | /* collect stats */ | ||
1616 : | current->sStat.iTextBits += pEnc->smpData[k].sStat->iTextBits; | ||
1617 : | current->sStat.kblks += pEnc->smpData[k].sStat->kblks; | ||
1618 : | current->sStat.mblks += pEnc->smpData[k].sStat->mblks; | ||
1619 : | current->sStat.ublks += pEnc->smpData[k].sStat->ublks; | ||
1620 : | current->sStat.iMVBits += pEnc->smpData[k].sStat->iMVBits; | ||
1621 : | } | ||
1622 : | |||
1623 : | if (num_threads > 1) { | ||
1624 : | uint32_t pos32 = pos>>2; | ||
1625 : | bs->tail = bs->start + pos32; | ||
1626 : | bs->pos = 8*(pos - (pos32<<2)); | ||
1627 : | bs->buf = 0; | ||
1628 : | |||
1629 : | if (bs->pos > 0) { | ||
1630 : | uint32_t pos8 = bs->pos/8; | ||
1631 : | memset((void *)((ptr_t)bs->tail+pos8), 0, (4-pos8)); | ||
1632 : | pos = *bs->tail; | ||
1633 : | #ifndef ARCH_IS_BIG_ENDIAN | ||
1634 : | BSWAP(pos); | ||
1635 : | #endif | ||
1636 : | bs->buf = pos; | ||
1637 : | } | ||
1638 : | } | ||
1639 : | } | ||
1640 : | |||
1641 : | edgomez | 195 | static int |
1642 : | FrameCodeI(Encoder * pEnc, | ||
1643 : | edgomez | 1382 | Bitstream * bs) |
1644 : | h | 104 | { |
1645 : | edgomez | 1382 | int bits = BitstreamPos(bs); |
1646 : | Isibaar | 1913 | int bound = 0, num_slices = pEnc->num_slices; |
1647 : | int num_threads = MAX(1, MIN(pEnc->num_threads, num_slices)); | ||
1648 : | int slices_per_thread = (num_slices*1024 / num_threads); | ||
1649 : | edgomez | 851 | int mb_height = pEnc->mbParam.mb_height; |
1650 : | Isibaar | 1913 | void * status = NULL; |
1651 : | uint16_t k; | ||
1652 : | h | 104 | |
1653 : | suxen_drol | 136 | pEnc->mbParam.m_rounding_type = 1; |
1654 : | pEnc->current->rounding_type = pEnc->mbParam.m_rounding_type; | ||
1655 : | pEnc->current->coding_type = I_VOP; | ||
1656 : | h | 104 | |
1657 : | edgomez | 1382 | call_plugins(pEnc, pEnc->current, NULL, XVID_PLG_FRAME, NULL, NULL, NULL); |
1658 : | |||
1659 : | SetMacroblockQuants(&pEnc->mbParam, pEnc->current); | ||
1660 : | |||
1661 : | Isibaar | 1913 | BitstreamWriteVolHeader(bs, &pEnc->mbParam, pEnc->current, num_slices); |
1662 : | edgomez | 403 | |
1663 : | edgomez | 851 | set_timecodes(pEnc->current,pEnc->reference,pEnc->mbParam.fbase); |
1664 : | |||
1665 : | edgomez | 1098 | BitstreamPad(bs); |
1666 : | h | 104 | |
1667 : | edgomez | 1382 | BitstreamWriteVopHeader(bs, &pEnc->mbParam, pEnc->current, 1, pEnc->current->mbs[0].quant); |
1668 : | h | 104 | |
1669 : | edgomez | 851 | pEnc->current->sStat.iTextBits = 0; |
1670 : | h | 104 | |
1671 : | Isibaar | 1913 | /* multithreaded intra coding - dispatch threads */ |
1672 : | for (k = 0; k < num_threads; k++) { | ||
1673 : | int add = ((slices_per_thread + 512) >> 10); | ||
1674 : | h | 104 | |
1675 : | Isibaar | 1913 | slices_per_thread += ((num_slices*1024 / num_threads) - add*1024); |
1676 : | h | 104 | |
1677 : | Isibaar | 1913 | pEnc->smpData[k].pEnc = (void *) pEnc; |
1678 : | pEnc->smpData[k].stop_y = (((bound+add) * mb_height + (num_slices-1)) / num_slices); | ||
1679 : | pEnc->smpData[k].start_y = ((bound * mb_height + (num_slices-1)) / num_slices); | ||
1680 : | h | 104 | |
1681 : | Isibaar | 1913 | bound += add; |
1682 : | h | 104 | |
1683 : | Isibaar | 1913 | if (k > 0) { |
1684 : | BitstreamReset(pEnc->smpData[k].bs); | ||
1685 : | pEnc->smpData[k].sStat->iTextBits = 0; | ||
1686 : | h | 104 | } |
1687 : | Isibaar | 1913 | } |
1688 : | pEnc->smpData[0].bs = bs; | ||
1689 : | pEnc->smpData[0].sStat = &pEnc->current->sStat; | ||
1690 : | |||
1691 : | /* create threads */ | ||
1692 : | for (k = 1; k < num_threads; k++) { | ||
1693 : | pthread_create(&pEnc->smpData[k].handle, NULL, | ||
1694 : | (void*)SliceCodeI, (void*)&pEnc->smpData[k]); | ||
1695 : | } | ||
1696 : | h | 104 | |
1697 : | Isibaar | 1913 | SliceCodeI(&pEnc->smpData[0]); |
1698 : | h | 104 | |
1699 : | Isibaar | 1913 | /* wait until all threads are finished */ |
1700 : | for (k = 1; k < num_threads; k++) { | ||
1701 : | pthread_join(pEnc->smpData[k].handle, &status); | ||
1702 : | } | ||
1703 : | edgomez | 1382 | |
1704 : | Isibaar | 1913 | pEnc->current->length = BitstreamLength(bs) - (bits/8); |
1705 : | edgomez | 1382 | |
1706 : | Isibaar | 1913 | /* reassemble the pieces together */ |
1707 : | SerializeBitstreams(pEnc, pEnc->current, bs, num_threads); | ||
1708 : | |||
1709 : | pEnc->current->sStat.iMVBits = 0; | ||
1710 : | pEnc->current->sStat.mblks = pEnc->current->sStat.ublks = 0; | ||
1711 : | pEnc->current->sStat.kblks = pEnc->mbParam.mb_width * pEnc->mbParam.mb_height; | ||
1712 : | |||
1713 : | edgomez | 851 | pEnc->fMvPrevSigma = -1; |
1714 : | suxen_drol | 136 | pEnc->mbParam.m_fcode = 2; |
1715 : | h | 104 | |
1716 : | edgomez | 1382 | pEnc->current->is_edged = 0; /* not edged */ |
1717 : | pEnc->current->is_interpolated = -1; /* not interpolated (fake rounding -1) */ | ||
1718 : | h | 104 | |
1719 : | edgomez | 867 | return 1; /* intra */ |
1720 : | h | 104 | } |
1721 : | |||
1722 : | syskin | 1572 | static __inline void |
1723 : | updateFcode(Statistics * sStat, Encoder * pEnc) | ||
1724 : | { | ||
1725 : | float fSigma; | ||
1726 : | int iSearchRange; | ||
1727 : | h | 104 | |
1728 : | syskin | 1572 | if (sStat->iMvCount == 0) |
1729 : | sStat->iMvCount = 1; | ||
1730 : | |||
1731 : | fSigma = (float) sqrt((float) sStat->iMvSum / sStat->iMvCount); | ||
1732 : | |||
1733 : | iSearchRange = 16 << pEnc->mbParam.m_fcode; | ||
1734 : | |||
1735 : | if ((3.0 * fSigma > iSearchRange) && (pEnc->mbParam.m_fcode <= 5) ) | ||
1736 : | pEnc->mbParam.m_fcode++; | ||
1737 : | |||
1738 : | else if ((5.0 * fSigma < iSearchRange) | ||
1739 : | && (4.0 * pEnc->fMvPrevSigma < iSearchRange) | ||
1740 : | && (pEnc->mbParam.m_fcode >= 2) ) | ||
1741 : | pEnc->mbParam.m_fcode--; | ||
1742 : | |||
1743 : | pEnc->fMvPrevSigma = fSigma; | ||
1744 : | } | ||
1745 : | |||
1746 : | edgomez | 851 | #define BFRAME_SKIP_THRESHHOLD 30 |
1747 : | Isibaar | 3 | |
1748 : | Isibaar | 1913 | static void |
1749 : | SliceCodeP(SMPData *data) | ||
1750 : | { | ||
1751 : | Encoder *pEnc = (Encoder *) data->pEnc; | ||
1752 : | Bitstream *bs = (Bitstream *) data->bs; | ||
1753 : | |||
1754 : | int x, y, k; | ||
1755 : | FRAMEINFO *const current = pEnc->current; | ||
1756 : | FRAMEINFO *const reference = pEnc->reference; | ||
1757 : | MBParam * const pParam = &pEnc->mbParam; | ||
1758 : | int mb_width = pParam->mb_width; | ||
1759 : | int mb_height = pParam->mb_height; | ||
1760 : | |||
1761 : | DECLARE_ALIGNED_MATRIX(dct_codes, 6, 64, int16_t, CACHE_LINE); | ||
1762 : | DECLARE_ALIGNED_MATRIX(qcoeff, 6, 64, int16_t, CACHE_LINE); | ||
1763 : | |||
1764 : | int bound = 0, num_slices = pEnc->num_slices; | ||
1765 : | |||
1766 : | if (data->start_y > 0) { /* write resync marker */ | ||
1767 : | bound = data->start_y*mb_width; | ||
1768 : | write_video_packet_header(bs, pParam, current, bound); | ||
1769 : | } | ||
1770 : | |||
1771 : | for (y = data->start_y; y < data->stop_y; y++) { | ||
1772 : | int new_bound = mb_width * ((((y*num_slices) / mb_height) * mb_height + (num_slices-1)) / num_slices); | ||
1773 : | |||
1774 : | if (new_bound > bound) { | ||
1775 : | bound = new_bound; | ||
1776 : | BitstreamPadAlways(bs); | ||
1777 : | write_video_packet_header(bs, pParam, current, bound); | ||
1778 : | } | ||
1779 : | |||
1780 : | for (x = 0; x < mb_width; x++) { | ||
1781 : | MACROBLOCK *pMB = ¤t->mbs[x + y * pParam->mb_width]; | ||
1782 : | int skip_possible; | ||
1783 : | |||
1784 : | if (pMB->mode == MODE_INTRA || pMB->mode == MODE_INTRA_Q) { | ||
1785 : | CodeIntraMB(pMB); | ||
1786 : | MBTransQuantIntra(pParam, current, pMB, x, y, | ||
1787 : | dct_codes, qcoeff); | ||
1788 : | |||
1789 : | start_timer(); | ||
1790 : | MBPrediction(current, x, y, pParam->mb_width, qcoeff, bound); | ||
1791 : | stop_prediction_timer(); | ||
1792 : | |||
1793 : | data->sStat->kblks++; | ||
1794 : | |||
1795 : | MBCoding(current, pMB, qcoeff, bs, data->sStat); | ||
1796 : | stop_coding_timer(); | ||
1797 : | continue; | ||
1798 : | } | ||
1799 : | |||
1800 : | start_timer(); | ||
1801 : | MBMotionCompensation(pMB, x, y, &reference->image, | ||
1802 : | &pEnc->vInterH, &pEnc->vInterV, | ||
1803 : | &pEnc->vInterHV, &pEnc->vGMC, | ||
1804 : | ¤t->image, | ||
1805 : | dct_codes, pParam->width, | ||
1806 : | pParam->height, | ||
1807 : | pParam->edged_width, | ||
1808 : | (current->vol_flags & XVID_VOL_QUARTERPEL), | ||
1809 : | current->rounding_type, | ||
1810 : | data->RefQ); | ||
1811 : | |||
1812 : | stop_comp_timer(); | ||
1813 : | |||
1814 : | pMB->field_pred = 0; | ||
1815 : | |||
1816 : | if (pMB->cbp != 0) { | ||
1817 : | pMB->cbp = MBTransQuantInter(pParam, current, pMB, x, y, | ||
1818 : | dct_codes, qcoeff); | ||
1819 : | } | ||
1820 : | |||
1821 : | if (pMB->dquant != 0) | ||
1822 : | MBSetDquant(pMB, x, y, pParam); | ||
1823 : | |||
1824 : | |||
1825 : | if (pMB->cbp || pMB->mvs[0].x || pMB->mvs[0].y || | ||
1826 : | pMB->mvs[1].x || pMB->mvs[1].y || pMB->mvs[2].x || | ||
1827 : | pMB->mvs[2].y || pMB->mvs[3].x || pMB->mvs[3].y) { | ||
1828 : | data->sStat->mblks++; | ||
1829 : | } else { | ||
1830 : | data->sStat->ublks++; | ||
1831 : | } | ||
1832 : | |||
1833 : | start_timer(); | ||
1834 : | |||
1835 : | /* Finished processing the MB, now check if to CODE or SKIP */ | ||
1836 : | |||
1837 : | skip_possible = (pMB->cbp == 0) && (pMB->mode == MODE_INTER); | ||
1838 : | |||
1839 : | if (current->coding_type == S_VOP) | ||
1840 : | skip_possible &= (pMB->mcsel == 1); | ||
1841 : | else { /* PVOP */ | ||
1842 : | const VECTOR * const mv = (pParam->vol_flags & XVID_VOL_QUARTERPEL) ? | ||
1843 : | pMB->qmvs : pMB->mvs; | ||
1844 : | skip_possible &= ((mv->x|mv->y) == 0); | ||
1845 : | } | ||
1846 : | |||
1847 : | if ((pMB->mode == MODE_NOT_CODED) || (skip_possible)) { | ||
1848 : | /* This is a candidate for SKIPping, but for P-VOPs check intermediate B-frames first */ | ||
1849 : | int bSkip = 1; | ||
1850 : | |||
1851 : | if (current->coding_type == P_VOP) { /* special rule for P-VOP's SKIP */ | ||
1852 : | for (k = pEnc->bframenum_head; k < pEnc->bframenum_tail; k++) { | ||
1853 : | int iSAD; | ||
1854 : | iSAD = sad16(reference->image.y + 16*y*pParam->edged_width + 16*x, | ||
1855 : | pEnc->bframes[k]->image.y + 16*y*pParam->edged_width + 16*x, | ||
1856 : | pParam->edged_width, BFRAME_SKIP_THRESHHOLD * pMB->quant); | ||
1857 : | Isibaar | 1919 | if (iSAD >= BFRAME_SKIP_THRESHHOLD * pMB->quant || ((bound > 1) && |
1858 : | ((y*mb_width+x == bound) || (y*mb_width+x == bound+1)))) { /* Some third-party decoders have problems with coloc skip MB before or after | ||
1859 : | resync marker in BVOP. We avoid any ambiguity and force no skip at slice boundary */ | ||
1860 : | Isibaar | 1913 | bSkip = 0; /* could not SKIP */ |
1861 : | if (pParam->vol_flags & XVID_VOL_QUARTERPEL) { | ||
1862 : | VECTOR predMV = get_qpmv2(current->mbs, pParam->mb_width, bound, x, y, 0); | ||
1863 : | pMB->pmvs[0].x = - predMV.x; | ||
1864 : | pMB->pmvs[0].y = - predMV.y; | ||
1865 : | } else { | ||
1866 : | VECTOR predMV = get_pmv2(current->mbs, pParam->mb_width, bound, x, y, 0); | ||
1867 : | pMB->pmvs[0].x = - predMV.x; | ||
1868 : | pMB->pmvs[0].y = - predMV.y; | ||
1869 : | } | ||
1870 : | pMB->mode = MODE_INTER; | ||
1871 : | pMB->cbp = 0; | ||
1872 : | break; | ||
1873 : | } | ||
1874 : | } | ||
1875 : | } | ||
1876 : | |||
1877 : | if (bSkip) { | ||
1878 : | /* do SKIP */ | ||
1879 : | pMB->mode = MODE_NOT_CODED; | ||
1880 : | MBSkip(bs); | ||
1881 : | stop_coding_timer(); | ||
1882 : | continue; /* next MB */ | ||
1883 : | } | ||
1884 : | } | ||
1885 : | |||
1886 : | /* ordinary case: normal coded INTER/INTER4V block */ | ||
1887 : | MBCoding(current, pMB, qcoeff, bs, data->sStat); | ||
1888 : | stop_coding_timer(); | ||
1889 : | } | ||
1890 : | } | ||
1891 : | |||
1892 : | BitstreamPadAlways(bs); /* next_start_code() at the end of VideoObjectPlane() */ | ||
1893 : | emms(); | ||
1894 : | } | ||
1895 : | |||
1896 : | edgomez | 851 | /* FrameCodeP also handles S(GMC)-VOPs */ |
1897 : | edgomez | 195 | static int |
1898 : | Isibaar | 1913 | FrameCodeP(Encoder * pEnc, Bitstream * bs) |
1899 : | Isibaar | 3 | { |
1900 : | edgomez | 1382 | int bits = BitstreamPos(bs); |
1901 : | Isibaar | 42 | |
1902 : | edgomez | 1382 | FRAMEINFO *const current = pEnc->current; |
1903 : | FRAMEINFO *const reference = pEnc->reference; | ||
1904 : | MBParam * const pParam = &pEnc->mbParam; | ||
1905 : | int mb_width = pParam->mb_width; | ||
1906 : | int mb_height = pParam->mb_height; | ||
1907 : | syskin | 1391 | int coded = 1; |
1908 : | syskin | 903 | |
1909 : | Isibaar | 1913 | int k = 0, bound = 0, num_slices = pEnc->num_slices; |
1910 : | int num_threads = MAX(1, MIN(pEnc->num_threads, num_slices)); | ||
1911 : | void * status = NULL; | ||
1912 : | int slices_per_thread = (num_slices*1024 / num_threads); | ||
1913 : | int threads_per_slice = (pEnc->num_threads*1024 / num_threads); | ||
1914 : | |||
1915 : | edgomez | 1382 | IMAGE *pRef = &reference->image; |
1916 : | |||
1917 : | if (!reference->is_edged) { | ||
1918 : | start_timer(); | ||
1919 : | image_setedges(pRef, pParam->edged_width, pParam->edged_height, | ||
1920 : | Isibaar | 1959 | pParam->width, pParam->height, XVID_BS_VERSION); |
1921 : | edgomez | 1382 | stop_edges_timer(); |
1922 : | reference->is_edged = 1; | ||
1923 : | } | ||
1924 : | Isibaar | 3 | |
1925 : | edgomez | 1382 | pParam->m_rounding_type = 1 - pParam->m_rounding_type; |
1926 : | current->rounding_type = pParam->m_rounding_type; | ||
1927 : | current->fcode = pParam->m_fcode; | ||
1928 : | |||
1929 : | if ((current->vop_flags & XVID_VOP_HALFPEL)) { | ||
1930 : | if (reference->is_interpolated != current->rounding_type) { | ||
1931 : | start_timer(); | ||
1932 : | syskin | 1665 | image_interpolate(pRef->y, pEnc->vInterH.y, pEnc->vInterV.y, |
1933 : | pEnc->vInterHV.y, pParam->edged_width, | ||
1934 : | edgomez | 1382 | pParam->edged_height, |
1935 : | (pParam->vol_flags & XVID_VOL_QUARTERPEL), | ||
1936 : | current->rounding_type); | ||
1937 : | stop_inter_timer(); | ||
1938 : | reference->is_interpolated = current->rounding_type; | ||
1939 : | } | ||
1940 : | Isibaar | 3 | } |
1941 : | |||
1942 : | syskin | 1567 | current->sStat.iTextBits = current->sStat.iMvSum = current->sStat.iMvCount = |
1943 : | Isibaar | 1677 | current->sStat.kblks = current->sStat.mblks = current->sStat.ublks = |
1944 : | current->sStat.iMVBits = 0; | ||
1945 : | syskin | 1567 | |
1946 : | edgomez | 1382 | current->coding_type = P_VOP; |
1947 : | syskin | 903 | |
1948 : | Isibaar | 1909 | if (current->vop_flags & XVID_VOP_RD_PSNRHVSM) { |
1949 : | image_block_variance(¤t->image, pParam->edged_width, current->mbs, | ||
1950 : | pParam->mb_width, pParam->mb_height); | ||
1951 : | } | ||
1952 : | |||
1953 : | edgomez | 1382 | call_plugins(pEnc, pEnc->current, NULL, XVID_PLG_FRAME, NULL, NULL, NULL); |
1954 : | |||
1955 : | SetMacroblockQuants(&pEnc->mbParam, current); | ||
1956 : | |||
1957 : | Isibaar | 3 | start_timer(); |
1958 : | Isibaar | 1913 | if (current->vol_flags & XVID_VOL_GMC) /* GMC only for S(GMC)-VOPs */ |
1959 : | edgomez | 1382 | { int gmcval; |
1960 : | current->warp = GlobalMotionEst( current->mbs, pParam, current, reference, | ||
1961 : | Isibaar | 1913 | &pEnc->vInterH, &pEnc->vInterV, &pEnc->vInterHV, num_slices); |
1962 : | edgomez | 851 | |
1963 : | edgomez | 1382 | if (current->motion_flags & XVID_ME_GME_REFINE) { |
1964 : | gmcval = GlobalMotionEstRefine(¤t->warp, | ||
1965 : | current->mbs, pParam, | ||
1966 : | current, reference, | ||
1967 : | ¤t->image, | ||
1968 : | &reference->image, | ||
1969 : | &pEnc->vInterH, | ||
1970 : | &pEnc->vInterV, | ||
1971 : | &pEnc->vInterHV); | ||
1972 : | } else { | ||
1973 : | gmcval = globalSAD(¤t->warp, pParam, current->mbs, | ||
1974 : | current, | ||
1975 : | &reference->image, | ||
1976 : | ¤t->image, | ||
1977 : | pEnc->vGMC.y); | ||
1978 : | } | ||
1979 : | Isibaar | 3 | |
1980 : | edgomez | 1382 | gmcval += /*current->quant*/ 2 * (int)(pParam->mb_width*pParam->mb_height); |
1981 : | edgomez | 851 | |
1982 : | edgomez | 1382 | /* 1st '3': 3 warpoints, 2nd '3': 16th pel res (2<<3) */ |
1983 : | generate_GMCparameters( 3, 3, ¤t->warp, | ||
1984 : | pParam->width, pParam->height, | ||
1985 : | ¤t->new_gmc_data); | ||
1986 : | edgomez | 851 | |
1987 : | edgomez | 1382 | if ( (gmcval<0) && ( (current->warp.duv[1].x != 0) || (current->warp.duv[1].y != 0) || |
1988 : | (current->warp.duv[2].x != 0) || (current->warp.duv[2].y != 0) ) ) | ||
1989 : | { | ||
1990 : | current->coding_type = S_VOP; | ||
1991 : | edgomez | 851 | |
1992 : | edgomez | 1382 | generate_GMCimage(¤t->new_gmc_data, &reference->image, |
1993 : | pParam->mb_width, pParam->mb_height, | ||
1994 : | pParam->edged_width, pParam->edged_width/2, | ||
1995 : | pParam->m_fcode, ((pParam->vol_flags & XVID_VOL_QUARTERPEL)?1:0), 0, | ||
1996 : | current->rounding_type, current->mbs, &pEnc->vGMC); | ||
1997 : | edgomez | 851 | |
1998 : | edgomez | 1382 | } else { |
1999 : | |||
2000 : | generate_GMCimage(¤t->new_gmc_data, &reference->image, | ||
2001 : | pParam->mb_width, pParam->mb_height, | ||
2002 : | pParam->edged_width, pParam->edged_width/2, | ||
2003 : | pParam->m_fcode, ((pParam->vol_flags & XVID_VOL_QUARTERPEL)?1:0), 0, | ||
2004 : | current->rounding_type, current->mbs, NULL); /* no warping, just AMV */ | ||
2005 : | } | ||
2006 : | h | 101 | } |
2007 : | Isibaar | 3 | |
2008 : | Isibaar | 1913 | if (pEnc->num_threads > 0) { |
2009 : | edgomez | 1382 | |
2010 : | syskin | 1682 | /* multithreaded motion estimation - dispatch threads */ |
2011 : | Isibaar | 1913 | while (k < pEnc->num_threads) { |
2012 : | int i, add_s = (slices_per_thread + 512) >> 10; | ||
2013 : | int add_t = (threads_per_slice + 512) >> 10; | ||
2014 : | |||
2015 : | int start_y = (bound * mb_height + (num_slices-1)) / num_slices; | ||
2016 : | int stop_y = ((bound+add_s) * mb_height + (num_slices-1)) / num_slices; | ||
2017 : | int rows_per_thread = (stop_y - start_y + add_t - 1) / add_t; | ||
2018 : | syskin | 1684 | |
2019 : | Isibaar | 1913 | slices_per_thread += ((num_slices*1024 / num_threads) - add_s*1024); |
2020 : | threads_per_slice += ((pEnc->num_threads*1024 / num_threads) - add_t*1024); | ||
2021 : | edgomez | 1382 | |
2022 : | Isibaar | 1913 | for (i = 0; i < add_t; i++) { |
2023 : | memset(pEnc->smpData[k+i].complete_count_self, 0, rows_per_thread * sizeof(int)); | ||
2024 : | |||
2025 : | pEnc->smpData[k+i].pEnc = (void *) pEnc; | ||
2026 : | pEnc->smpData[k+i].y_row = i; | ||
2027 : | pEnc->smpData[k+i].y_step = add_t; | ||
2028 : | pEnc->smpData[k+i].stop_y = stop_y; | ||
2029 : | pEnc->smpData[k+i].start_y = start_y; | ||
2030 : | |||
2031 : | /* todo: sort out temp space once and for all */ | ||
2032 : | pEnc->smpData[k+i].RefQ = (((k+i)&1) ? pEnc->vInterV.u : pEnc->vInterV.v) + | ||
2033 : | 16*((k+i)>>1)*pParam->edged_width; | ||
2034 : | } | ||
2035 : | |||
2036 : | pEnc->smpData[k].complete_count_above = | ||
2037 : | pEnc->smpData[k+add_t-1].complete_count_self - 1; | ||
2038 : | |||
2039 : | bound += add_s; | ||
2040 : | k += add_t; | ||
2041 : | syskin | 1682 | } |
2042 : | |||
2043 : | syskin | 1684 | for (k = 1; k < pEnc->num_threads; k++) { |
2044 : | Isibaar | 1913 | pthread_create(&pEnc->smpData[k].handle, NULL, |
2045 : | (void*)MotionEstimateSMP, (void*)&pEnc->smpData[k]); | ||
2046 : | syskin | 1682 | } |
2047 : | syskin | 1684 | |
2048 : | Isibaar | 1913 | MotionEstimateSMP(&pEnc->smpData[0]); |
2049 : | syskin | 1684 | |
2050 : | for (k = 1; k < pEnc->num_threads; k++) { | ||
2051 : | Isibaar | 1913 | pthread_join(pEnc->smpData[k].handle, &status); |
2052 : | syskin | 1684 | } |
2053 : | |||
2054 : | current->fcode = 0; | ||
2055 : | for (k = 0; k < pEnc->num_threads; k++) { | ||
2056 : | Isibaar | 1913 | current->sStat.iMvSum += pEnc->smpData[k].mvSum; |
2057 : | current->sStat.iMvCount += pEnc->smpData[k].mvCount; | ||
2058 : | if (pEnc->smpData[k].minfcode > current->fcode) | ||
2059 : | current->fcode = pEnc->smpData[k].minfcode; | ||
2060 : | syskin | 1684 | } |
2061 : | |||
2062 : | syskin | 1682 | } else { |
2063 : | Isibaar | 1913 | |
2064 : | syskin | 1682 | /* regular ME */ |
2065 : | |||
2066 : | MotionEstimation(&pEnc->mbParam, current, reference, | ||
2067 : | &pEnc->vInterH, &pEnc->vInterV, &pEnc->vInterHV, | ||
2068 : | Isibaar | 1913 | &pEnc->vGMC, 256*4096, num_slices); |
2069 : | |||
2070 : | syskin | 1682 | } |
2071 : | |||
2072 : | edgomez | 1382 | stop_motion_timer(); |
2073 : | |||
2074 : | set_timecodes(current,reference,pParam->fbase); | ||
2075 : | Isibaar | 3 | |
2076 : | edgomez | 1382 | BitstreamWriteVopHeader(bs, &pEnc->mbParam, current, 1, current->mbs[0].quant); |
2077 : | Isibaar | 3 | |
2078 : | Isibaar | 1913 | /* multithreaded inter coding - dispatch threads */ |
2079 : | Isibaar | 3 | |
2080 : | Isibaar | 1913 | bound = 0; |
2081 : | slices_per_thread = (num_slices*1024 / num_threads); | ||
2082 : | chl | 419 | |
2083 : | Isibaar | 1913 | for (k = 0; k < num_threads; k++) { |
2084 : | int add = ((slices_per_thread + 512) >> 10); | ||
2085 : | edgomez | 851 | |
2086 : | Isibaar | 1913 | slices_per_thread += ((num_slices*1024 / num_threads) - add*1024); |
2087 : | edgomez | 851 | |
2088 : | Isibaar | 1913 | pEnc->smpData[k].pEnc = (void *) pEnc; |
2089 : | pEnc->smpData[k].stop_y = (((bound+add) * mb_height + (num_slices-1)) / num_slices); | ||
2090 : | pEnc->smpData[k].start_y = ((bound * mb_height + (num_slices-1)) / num_slices); | ||
2091 : | pEnc->smpData[k].RefQ = ((k&1) ? pEnc->vInterV.u : pEnc->vInterV.v) + 16*(k>>1)*pParam->edged_width; | ||
2092 : | Isibaar | 3 | |
2093 : | Isibaar | 1913 | bound += add; |
2094 : | chl | 347 | |
2095 : | Isibaar | 1913 | if (k > 0) { |
2096 : | pEnc->smpData[k].sStat->iTextBits = pEnc->smpData[k].sStat->kblks = | ||
2097 : | pEnc->smpData[k].sStat->mblks = pEnc->smpData[k].sStat->ublks = | ||
2098 : | pEnc->smpData[k].sStat->iMVBits = 0; | ||
2099 : | |||
2100 : | BitstreamReset(pEnc->smpData[k].bs); | ||
2101 : | } | ||
2102 : | } | ||
2103 : | pEnc->smpData[0].bs = bs; | ||
2104 : | pEnc->smpData[0].sStat = &current->sStat; | ||
2105 : | edgomez | 851 | |
2106 : | Isibaar | 1913 | /* create threads */ |
2107 : | for (k = 1; k < num_threads; k++) { | ||
2108 : | pthread_create(&pEnc->smpData[k].handle, NULL, | ||
2109 : | (void*)SliceCodeP, (void*)&pEnc->smpData[k]); | ||
2110 : | } | ||
2111 : | edgomez | 851 | |
2112 : | Isibaar | 1913 | SliceCodeP(&pEnc->smpData[0]); |
2113 : | edgomez | 851 | |
2114 : | Isibaar | 1913 | /* wait until all threads are finished */ |
2115 : | for (k = 1; k < num_threads; k++) { | ||
2116 : | pthread_join(pEnc->smpData[k].handle, &status); | ||
2117 : | } | ||
2118 : | edgomez | 1382 | |
2119 : | Isibaar | 1913 | current->length = BitstreamLength(bs) - (bits/8); |
2120 : | edgomez | 1382 | |
2121 : | Isibaar | 1913 | /* reassemble the pieces together */ |
2122 : | SerializeBitstreams(pEnc, pEnc->current, bs, num_threads); | ||
2123 : | edgomez | 1382 | |
2124 : | syskin | 1572 | updateFcode(&current->sStat, pEnc); |
2125 : | Isibaar | 3 | |
2126 : | edgomez | 851 | /* frame drop code */ |
2127 : | edgomez | 1382 | #if 0 |
2128 : | DPRINTF(XVID_DEBUG_DEBUG, "kmu %i %i %i\n", current->sStat.kblks, current->sStat.mblks, current->sStat.ublks); | ||
2129 : | #endif | ||
2130 : | Isibaar | 1913 | |
2131 : | Isibaar | 1908 | if (current->sStat.kblks + current->sStat.mblks < |
2132 : | syskin | 1406 | (pParam->frame_drop_ratio * mb_width * mb_height) / 100 && |
2133 : | Isibaar | 1948 | ( (pEnc->bframenum_head >= pEnc->bframenum_tail) || !(pEnc->mbParam.global_flags & XVID_GLOBAL_CLOSED_GOP)) && |
2134 : | (current->coding_type == P_VOP) ) | ||
2135 : | edgomez | 851 | { |
2136 : | Isibaar | 1679 | current->sStat.kblks = current->sStat.mblks = current->sStat.iTextBits = 0; |
2137 : | edgomez | 1382 | current->sStat.ublks = mb_width * mb_height; |
2138 : | edgomez | 851 | |
2139 : | BitstreamReset(bs); | ||
2140 : | |||
2141 : | edgomez | 1382 | set_timecodes(current,reference,pParam->fbase); |
2142 : | BitstreamWriteVopHeader(bs, &pEnc->mbParam, current, 0, current->mbs[0].quant); | ||
2143 : | edgomez | 851 | |
2144 : | edgomez | 867 | /* copy reference frame details into the current frame */ |
2145 : | edgomez | 1382 | current->quant = reference->quant; |
2146 : | current->motion_flags = reference->motion_flags; | ||
2147 : | current->rounding_type = reference->rounding_type; | ||
2148 : | current->fcode = reference->fcode; | ||
2149 : | current->bcode = reference->bcode; | ||
2150 : | syskin | 1391 | current->stamp = reference->stamp; |
2151 : | edgomez | 1382 | image_copy(&current->image, &reference->image, pParam->edged_width, pParam->height); |
2152 : | memcpy(current->mbs, reference->mbs, sizeof(MACROBLOCK) * mb_width * mb_height); | ||
2153 : | syskin | 1391 | coded = 0; |
2154 : | |||
2155 : | Isibaar | 1913 | BitstreamPadAlways(bs); /* next_start_code() at the end of VideoObjectPlane() */ |
2156 : | |||
2157 : | current->length = (BitstreamPos(bs) - bits) / 8; | ||
2158 : | |||
2159 : | syskin | 1391 | } else { |
2160 : | edgomez | 851 | |
2161 : | syskin | 1391 | pEnc->current->is_edged = 0; /* not edged */ |
2162 : | pEnc->current->is_interpolated = -1; /* not interpolated (fake rounding -1) */ | ||
2163 : | edgomez | 1382 | |
2164 : | syskin | 1391 | /* what was this frame's interpolated reference will become |
2165 : | forward (past) reference in b-frame coding */ | ||
2166 : | edgomez | 1382 | |
2167 : | syskin | 1391 | image_swap(&pEnc->vInterH, &pEnc->f_refh); |
2168 : | image_swap(&pEnc->vInterV, &pEnc->f_refv); | ||
2169 : | image_swap(&pEnc->vInterHV, &pEnc->f_refhv); | ||
2170 : | } | ||
2171 : | edgomez | 1382 | |
2172 : | edgomez | 851 | /* XXX: debug |
2173 : | { | ||
2174 : | char s[100]; | ||
2175 : | sprintf(s, "\\%05i_cur.pgm", pEnc->m_framenum); | ||
2176 : | edgomez | 1382 | image_dump_yuvpgm(&current->image, |
2177 : | pParam->edged_width, | ||
2178 : | pParam->width, pParam->height, s); | ||
2179 : | |||
2180 : | edgomez | 851 | sprintf(s, "\\%05i_ref.pgm", pEnc->m_framenum); |
2181 : | edgomez | 1382 | image_dump_yuvpgm(&reference->image, |
2182 : | pParam->edged_width, | ||
2183 : | pParam->width, pParam->height, s); | ||
2184 : | syskin | 903 | } |
2185 : | edgomez | 851 | */ |
2186 : | |||
2187 : | Isibaar | 1913 | return coded; |
2188 : | } | ||
2189 : | edgomez | 851 | |
2190 : | Isibaar | 1913 | static void |
2191 : | SliceCodeB(SMPData *data) | ||
2192 : | { | ||
2193 : | Encoder *pEnc = (Encoder *) data->pEnc; | ||
2194 : | Bitstream *bs = (Bitstream *) data->bs; | ||
2195 : | Isibaar | 3 | |
2196 : | Isibaar | 1913 | DECLARE_ALIGNED_MATRIX(dct_codes, 6, 64, int16_t, CACHE_LINE); |
2197 : | DECLARE_ALIGNED_MATRIX(qcoeff, 6, 64, int16_t, CACHE_LINE); | ||
2198 : | |||
2199 : | int x, y; | ||
2200 : | FRAMEINFO * const frame = (FRAMEINFO * const) data->current; | ||
2201 : | MBParam * const pParam = &pEnc->mbParam; | ||
2202 : | int mb_width = pParam->mb_width; | ||
2203 : | int mb_height = pParam->mb_height; | ||
2204 : | IMAGE *f_ref = &pEnc->reference->image; | ||
2205 : | IMAGE *b_ref = &pEnc->current->image; | ||
2206 : | |||
2207 : | int bound = data->start_y*mb_width; | ||
2208 : | int num_slices = pEnc->num_slices; | ||
2209 : | |||
2210 : | if (data->start_y > 0) { /* write resync marker */ | ||
2211 : | Isibaar | 1919 | write_video_packet_header(bs, pParam, frame, bound+1); |
2212 : | Isibaar | 1913 | } |
2213 : | |||
2214 : | Isibaar | 1919 | for (y = data->start_y; y < MIN(data->stop_y+1, mb_height); y++) { |
2215 : | Isibaar | 1913 | int new_bound = mb_width * ((((y*num_slices) / mb_height) * mb_height + (num_slices-1)) / num_slices); |
2216 : | Isibaar | 1919 | int stop_x = (y == data->stop_y) ? 1 : mb_width; |
2217 : | int start_x = (y == data->start_y && y > 0) ? 1 : 0; | ||
2218 : | Isibaar | 1913 | |
2219 : | Isibaar | 1919 | for (x = start_x; x < stop_x; x++) { |
2220 : | Isibaar | 1913 | MACROBLOCK * const mb = &frame->mbs[x + y * pEnc->mbParam.mb_width]; |
2221 : | |||
2222 : | /* decoder ignores mb when refence block is INTER(0,0), CBP=0 */ | ||
2223 : | if (mb->mode == MODE_NOT_CODED) { | ||
2224 : | if (pParam->plugin_flags & XVID_REQORIGINAL) { | ||
2225 : | MBMotionCompensation(mb, x, y, f_ref, NULL, f_ref, NULL, NULL, &frame->image, | ||
2226 : | NULL, 0, 0, pParam->edged_width, 0, 0, data->RefQ); | ||
2227 : | } | ||
2228 : | continue; | ||
2229 : | } | ||
2230 : | |||
2231 : | Isibaar | 1919 | if (new_bound > bound && x > 0) { |
2232 : | bound = new_bound; | ||
2233 : | BitstreamPadAlways(bs); | ||
2234 : | write_video_packet_header(bs, pParam, frame, y*mb_width+x); | ||
2235 : | } | ||
2236 : | |||
2237 : | Isibaar | 1913 | mb->quant = frame->quant; |
2238 : | |||
2239 : | if (mb->cbp != 0 || pParam->plugin_flags & XVID_REQORIGINAL) { | ||
2240 : | /* we have to motion-compensate, transfer etc, | ||
2241 : | because there might be blocks to code */ | ||
2242 : | |||
2243 : | MBMotionCompensationBVOP(pParam, mb, x, y, &frame->image, | ||
2244 : | f_ref, &pEnc->f_refh, &pEnc->f_refv, | ||
2245 : | &pEnc->f_refhv, b_ref, &pEnc->vInterH, | ||
2246 : | &pEnc->vInterV, &pEnc->vInterHV, dct_codes, | ||
2247 : | data->RefQ); | ||
2248 : | |||
2249 : | mb->cbp = MBTransQuantInterBVOP(pParam, frame, mb, x, y, dct_codes, qcoeff); | ||
2250 : | } | ||
2251 : | |||
2252 : | if (mb->mode == MODE_DIRECT_NO4V) | ||
2253 : | mb->mode = MODE_DIRECT; | ||
2254 : | |||
2255 : | if (mb->mode == MODE_DIRECT && (mb->cbp | mb->pmvs[3].x | mb->pmvs[3].y) == 0) | ||
2256 : | mb->mode = MODE_DIRECT_NONE_MV; /* skipped */ | ||
2257 : | else | ||
2258 : | if (frame->vop_flags & XVID_VOP_GREYSCALE) | ||
2259 : | /* keep only bits 5-2 -- Chroma blocks will just be skipped by MBCodingBVOP */ | ||
2260 : | mb->cbp &= 0x3C; | ||
2261 : | |||
2262 : | start_timer(); | ||
2263 : | MBCodingBVOP(frame, mb, qcoeff, frame->fcode, frame->bcode, bs, data->sStat); | ||
2264 : | stop_coding_timer(); | ||
2265 : | } | ||
2266 : | } | ||
2267 : | |||
2268 : | BitstreamPadAlways(bs); /* next_start_code() at the end of VideoObjectPlane() */ | ||
2269 : | emms(); | ||
2270 : | edgomez | 851 | } |
2271 : | suxen_drol | 118 | |
2272 : | edgomez | 851 | static void |
2273 : | FrameCodeB(Encoder * pEnc, | ||
2274 : | FRAMEINFO * frame, | ||
2275 : | edgomez | 1382 | Bitstream * bs) |
2276 : | edgomez | 851 | { |
2277 : | edgomez | 1382 | int bits = BitstreamPos(bs); |
2278 : | Isibaar | 1913 | int k = 0, bound = 0, num_slices = pEnc->num_slices; |
2279 : | int num_threads = MAX(1, MIN(pEnc->num_threads, num_slices)); | ||
2280 : | void * status = NULL; | ||
2281 : | int slices_per_thread = (num_slices*1024 / num_threads); | ||
2282 : | int threads_per_slice = (pEnc->num_threads*1024 / num_threads); | ||
2283 : | edgomez | 851 | |
2284 : | IMAGE *f_ref = &pEnc->reference->image; | ||
2285 : | IMAGE *b_ref = &pEnc->current->image; | ||
2286 : | |||
2287 : | Isibaar | 1913 | MBParam * const pParam = &pEnc->mbParam; |
2288 : | int mb_height = pParam->mb_height; | ||
2289 : | |||
2290 : | edgomez | 1382 | #ifdef BFRAMES_DEC_DEBUG |
2291 : | edgomez | 851 | FILE *fp; |
2292 : | static char first=0; | ||
2293 : | #define BFRAME_DEBUG if (!first && fp){ \ | ||
2294 : | fprintf(fp,"Y=%3d X=%3d MB=%2d CBP=%02X\n",y,x,mb->mode,mb->cbp); \ | ||
2295 : | } | ||
2296 : | |||
2297 : | if (!first){ | ||
2298 : | fp=fopen("C:\\XVIDDBGE.TXT","w"); | ||
2299 : | } | ||
2300 : | #endif | ||
2301 : | |||
2302 : | edgomez | 867 | /* forward */ |
2303 : | edgomez | 1382 | if (!pEnc->reference->is_edged) { |
2304 : | image_setedges(f_ref, pEnc->mbParam.edged_width, | ||
2305 : | pEnc->mbParam.edged_height, pEnc->mbParam.width, | ||
2306 : | Isibaar | 1959 | pEnc->mbParam.height, XVID_BS_VERSION); |
2307 : | Isibaar | 1931 | pEnc->reference->is_edged = 1; |
2308 : | edgomez | 1382 | } |
2309 : | edgomez | 851 | |
2310 : | edgomez | 1382 | if (pEnc->reference->is_interpolated != 0) { |
2311 : | start_timer(); | ||
2312 : | syskin | 1665 | image_interpolate(f_ref->y, pEnc->f_refh.y, pEnc->f_refv.y, pEnc->f_refhv.y, |
2313 : | edgomez | 1382 | pEnc->mbParam.edged_width, pEnc->mbParam.edged_height, |
2314 : | (pEnc->mbParam.vol_flags & XVID_VOL_QUARTERPEL), 0); | ||
2315 : | stop_inter_timer(); | ||
2316 : | pEnc->reference->is_interpolated = 0; | ||
2317 : | } | ||
2318 : | |||
2319 : | edgomez | 867 | /* backward */ |
2320 : | edgomez | 1382 | if (!pEnc->current->is_edged) { |
2321 : | image_setedges(b_ref, pEnc->mbParam.edged_width, | ||
2322 : | pEnc->mbParam.edged_height, pEnc->mbParam.width, | ||
2323 : | Isibaar | 1959 | pEnc->mbParam.height, XVID_BS_VERSION); |
2324 : | edgomez | 1382 | pEnc->current->is_edged = 1; |
2325 : | } | ||
2326 : | edgomez | 851 | |
2327 : | edgomez | 1382 | if (pEnc->current->is_interpolated != 0) { |
2328 : | start_timer(); | ||
2329 : | syskin | 1665 | image_interpolate(b_ref->y, pEnc->vInterH.y, pEnc->vInterV.y, pEnc->vInterHV.y, |
2330 : | edgomez | 1382 | pEnc->mbParam.edged_width, pEnc->mbParam.edged_height, |
2331 : | (pEnc->mbParam.vol_flags & XVID_VOL_QUARTERPEL), 0); | ||
2332 : | stop_inter_timer(); | ||
2333 : | pEnc->current->is_interpolated = 0; | ||
2334 : | } | ||
2335 : | edgomez | 851 | |
2336 : | edgomez | 1382 | frame->coding_type = B_VOP; |
2337 : | Isibaar | 1909 | |
2338 : | Isibaar | 1931 | if ((frame->vop_flags & XVID_VOP_RD_PSNRHVSM) && (frame->vop_flags & XVID_VOP_RD_BVOP)) { |
2339 : | image_block_variance(&frame->image, pEnc->mbParam.edged_width, frame->mbs, | ||
2340 : | Isibaar | 1909 | pEnc->mbParam.mb_width, pEnc->mbParam.mb_height); |
2341 : | } | ||
2342 : | |||
2343 : | syskin | 1660 | call_plugins(pEnc, frame, NULL, XVID_PLG_FRAME, NULL, NULL, NULL); |
2344 : | edgomez | 1382 | |
2345 : | syskin | 1682 | frame->fcode = frame->bcode = pEnc->current->fcode; |
2346 : | edgomez | 851 | |
2347 : | syskin | 1684 | start_timer(); |
2348 : | Isibaar | 1913 | |
2349 : | syskin | 1682 | if (pEnc->num_threads > 0) { |
2350 : | Isibaar | 1913 | |
2351 : | syskin | 1682 | /* multithreaded motion estimation - dispatch threads */ |
2352 : | Isibaar | 1913 | while (k < pEnc->num_threads) { |
2353 : | int i, add_s = (slices_per_thread + 512) >> 10; | ||
2354 : | int add_t = (threads_per_slice + 512) >> 10; | ||
2355 : | |||
2356 : | int start_y = (bound * mb_height + (num_slices-1)) / num_slices; | ||
2357 : | int stop_y = ((bound+add_s) * mb_height + (num_slices-1)) / num_slices; | ||
2358 : | int rows_per_thread = (stop_y - start_y + add_t - 1) / add_t; | ||
2359 : | syskin | 1682 | |
2360 : | Isibaar | 1913 | slices_per_thread += ((num_slices*1024 / num_threads) - add_s*1024); |
2361 : | threads_per_slice += ((pEnc->num_threads*1024 / num_threads) - add_t*1024); | ||
2362 : | |||
2363 : | for (i = 0; i < add_t; i++) { | ||
2364 : | memset(pEnc->smpData[k+i].complete_count_self, 0, rows_per_thread * sizeof(int)); | ||
2365 : | |||
2366 : | pEnc->smpData[k+i].pEnc = (void *) pEnc; | ||
2367 : | pEnc->smpData[k+i].current = frame; | ||
2368 : | |||
2369 : | pEnc->smpData[k+i].y_row = i; | ||
2370 : | pEnc->smpData[k+i].y_step = add_t; | ||
2371 : | pEnc->smpData[k+i].stop_y = stop_y; | ||
2372 : | pEnc->smpData[k+i].start_y = start_y; | ||
2373 : | |||
2374 : | /* todo: sort out temp space once and for all */ | ||
2375 : | pEnc->smpData[k+i].RefQ = (((k+i)&1) ? pEnc->vInterV.u : pEnc->vInterV.v) + | ||
2376 : | 16*((k+i)>>1)*pParam->edged_width; | ||
2377 : | } | ||
2378 : | |||
2379 : | pEnc->smpData[k].complete_count_above = | ||
2380 : | pEnc->smpData[k+add_t-1].complete_count_self - 1; | ||
2381 : | |||
2382 : | bound += add_s; | ||
2383 : | k += add_t; | ||
2384 : | syskin | 1682 | } |
2385 : | |||
2386 : | syskin | 1684 | for (k = 1; k < pEnc->num_threads; k++) { |
2387 : | Isibaar | 1913 | pthread_create(&pEnc->smpData[k].handle, NULL, |
2388 : | (void*)SMPMotionEstimationBVOP, (void*)&pEnc->smpData[k]); | ||
2389 : | syskin | 1682 | } |
2390 : | syskin | 1693 | |
2391 : | Isibaar | 1913 | SMPMotionEstimationBVOP(&pEnc->smpData[0]); |
2392 : | syskin | 1684 | |
2393 : | for (k = 1; k < pEnc->num_threads; k++) { | ||
2394 : | Isibaar | 1913 | pthread_join(pEnc->smpData[k].handle, &status); |
2395 : | syskin | 1684 | } |
2396 : | |||
2397 : | frame->fcode = frame->bcode = 0; | ||
2398 : | for (k = 0; k < pEnc->num_threads; k++) { | ||
2399 : | Isibaar | 1913 | if (pEnc->smpData[k].minfcode > frame->fcode) |
2400 : | frame->fcode = pEnc->smpData[k].minfcode; | ||
2401 : | if (pEnc->smpData[k].minbcode > frame->bcode) | ||
2402 : | frame->bcode = pEnc->smpData[k].minbcode; | ||
2403 : | syskin | 1684 | } |
2404 : | syskin | 1682 | } else { |
2405 : | Isibaar | 1913 | |
2406 : | syskin | 1682 | MotionEstimationBVOP(&pEnc->mbParam, frame, |
2407 : | ((int32_t)(pEnc->current->stamp - frame->stamp)), /* time_bp */ | ||
2408 : | ((int32_t)(pEnc->current->stamp - pEnc->reference->stamp)), /* time_pp */ | ||
2409 : | pEnc->reference->mbs, f_ref, | ||
2410 : | &pEnc->f_refh, &pEnc->f_refv, &pEnc->f_refhv, | ||
2411 : | pEnc->current, b_ref, &pEnc->vInterH, | ||
2412 : | Isibaar | 1919 | &pEnc->vInterV, &pEnc->vInterHV, |
2413 : | pEnc->num_slices); | ||
2414 : | syskin | 1682 | } |
2415 : | syskin | 1684 | stop_motion_timer(); |
2416 : | syskin | 1682 | |
2417 : | edgomez | 851 | set_timecodes(frame, pEnc->reference,pEnc->mbParam.fbase); |
2418 : | edgomez | 1382 | BitstreamWriteVopHeader(bs, &pEnc->mbParam, frame, 1, frame->quant); |
2419 : | edgomez | 851 | |
2420 : | Isibaar | 1913 | /* reset stats */ |
2421 : | edgomez | 851 | frame->sStat.iTextBits = 0; |
2422 : | Isibaar | 1677 | frame->sStat.iMVBits = 0; |
2423 : | edgomez | 851 | frame->sStat.iMvSum = 0; |
2424 : | frame->sStat.iMvCount = 0; | ||
2425 : | frame->sStat.kblks = frame->sStat.mblks = frame->sStat.ublks = 0; | ||
2426 : | edgomez | 1382 | frame->sStat.mblks = pEnc->mbParam.mb_width * pEnc->mbParam.mb_height; |
2427 : | frame->sStat.kblks = frame->sStat.ublks = 0; | ||
2428 : | Isibaar | 1913 | |
2429 : | /* multithreaded inter coding - dispatch threads */ | ||
2430 : | bound = 0; | ||
2431 : | slices_per_thread = (num_slices*1024 / num_threads); | ||
2432 : | |||
2433 : | for (k = 0; k < num_threads; k++) { | ||
2434 : | int add = ((slices_per_thread + 512) >> 10); | ||
2435 : | edgomez | 851 | |
2436 : | Isibaar | 1913 | slices_per_thread += ((num_slices*1024 / num_threads) - add*1024); |
2437 : | edgomez | 851 | |
2438 : | Isibaar | 1913 | pEnc->smpData[k].pEnc = (void *) pEnc; |
2439 : | pEnc->smpData[k].current = frame; | ||
2440 : | pEnc->smpData[k].stop_y = (((bound+add) * mb_height + (num_slices-1)) / num_slices); | ||
2441 : | pEnc->smpData[k].start_y = ((bound * mb_height + (num_slices-1)) / num_slices); | ||
2442 : | bound += add; | ||
2443 : | edgomez | 851 | |
2444 : | Isibaar | 1913 | /* todo: sort out temp space once and for all */ |
2445 : | pEnc->smpData[k].RefQ = ((k&1) ? pEnc->vInterV.u : pEnc->vInterV.v) + 16*(k>>1)*pParam->edged_width; | ||
2446 : | edgomez | 851 | |
2447 : | Isibaar | 1913 | if (k > 0) { |
2448 : | BitstreamReset(pEnc->smpData[k].bs); | ||
2449 : | pEnc->smpData[k].sStat->iTextBits = pEnc->smpData[k].sStat->kblks = | ||
2450 : | pEnc->smpData[k].sStat->mblks = pEnc->smpData[k].sStat->ublks = pEnc->smpData[k].sStat->iMVBits = 0; | ||
2451 : | } | ||
2452 : | } | ||
2453 : | edgomez | 851 | |
2454 : | Isibaar | 1913 | for (k = 1; k < num_threads; k++) { |
2455 : | pthread_create(&pEnc->smpData[k].handle, NULL, | ||
2456 : | (void*)SliceCodeB, (void*)&pEnc->smpData[k]); | ||
2457 : | } | ||
2458 : | edgomez | 1382 | |
2459 : | Isibaar | 1913 | pEnc->smpData[0].bs = bs; |
2460 : | pEnc->smpData[0].sStat = &frame->sStat; | ||
2461 : | SliceCodeB(&pEnc->smpData[0]); | ||
2462 : | edgomez | 851 | |
2463 : | Isibaar | 1913 | for (k = 1; k < num_threads; k++) { |
2464 : | pthread_join(pEnc->smpData[k].handle, &status); | ||
2465 : | edgomez | 851 | } |
2466 : | |||
2467 : | Isibaar | 1913 | frame->length = BitstreamLength(bs) - (bits/8); |
2468 : | edgomez | 851 | |
2469 : | Isibaar | 1913 | /* reassemble the pieces together */ |
2470 : | SerializeBitstreams(pEnc, frame, bs, num_threads); | ||
2471 : | |||
2472 : | edgomez | 851 | #ifdef BFRAMES_DEC_DEBUG |
2473 : | if (!first){ | ||
2474 : | first=1; | ||
2475 : | if (fp) | ||
2476 : | fclose(fp); | ||
2477 : | } | ||
2478 : | #endif | ||
2479 : | suxen_drol | 118 | } |
No admin address has been configured | ViewVC Help |
Powered by ViewVC 1.0.4 |