Parent Directory | Revision Log
Revision 1424 - (view) (download)
1 : | edgomez | 851 | /************************************************************************** |
2 : | albeu | 315 | * |
3 : | edgomez | 1382 | * XVID MPEG-4 VIDEO CODEC |
4 : | * - Image management functions - | ||
5 : | albeu | 315 | * |
6 : | suxen_drol | 1397 | * Copyright(C) 2001-2004 Peter Ross <pross@xvid.org> |
7 : | albeu | 315 | * |
8 : | edgomez | 1382 | * This program is free software ; you can redistribute it and/or modify |
9 : | * it under the terms of the GNU General Public License as published by | ||
10 : | * the Free Software Foundation ; either version 2 of the License, or | ||
11 : | * (at your option) any later version. | ||
12 : | albeu | 315 | * |
13 : | edgomez | 1382 | * This program is distributed in the hope that it will be useful, |
14 : | * but WITHOUT ANY WARRANTY ; without even the implied warranty of | ||
15 : | * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the | ||
16 : | * GNU General Public License for more details. | ||
17 : | albeu | 315 | * |
18 : | edgomez | 1382 | * You should have received a copy of the GNU General Public License |
19 : | * along with this program ; if not, write to the Free Software | ||
20 : | * Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA 02111-1307 USA | ||
21 : | albeu | 315 | * |
22 : | edgomez | 1424 | * $Id: image.c,v 1.29 2004-04-12 15:49:56 edgomez Exp $ |
23 : | albeu | 315 | * |
24 : | edgomez | 1382 | ****************************************************************************/ |
25 : | albeu | 315 | |
26 : | #include <stdlib.h> | ||
27 : | edgomez | 1382 | #include <string.h> /* memcpy, memset */ |
28 : | albeu | 315 | #include <math.h> |
29 : | |||
30 : | #include "../portab.h" | ||
31 : | edgomez | 1382 | #include "../global.h" |
32 : | #include "../xvid.h" | ||
33 : | albeu | 315 | #include "image.h" |
34 : | #include "colorspace.h" | ||
35 : | #include "interpolate8x8.h" | ||
36 : | edgomez | 851 | #include "reduced.h" |
37 : | albeu | 315 | #include "../utils/mem_align.h" |
38 : | edgomez | 1424 | #include "../motion/sad.h" |
39 : | albeu | 315 | |
40 : | edgomez | 1382 | #include "font.h" |
41 : | edgomez | 851 | |
42 : | albeu | 315 | #define SAFETY 64 |
43 : | #define EDGE_SIZE2 (EDGE_SIZE/2) | ||
44 : | |||
45 : | |||
46 : | int32_t | ||
47 : | image_create(IMAGE * image, | ||
48 : | uint32_t edged_width, | ||
49 : | uint32_t edged_height) | ||
50 : | { | ||
51 : | const uint32_t edged_width2 = edged_width / 2; | ||
52 : | const uint32_t edged_height2 = edged_height / 2; | ||
53 : | |||
54 : | image->y = | ||
55 : | xvid_malloc(edged_width * (edged_height + 1) + SAFETY, CACHE_LINE); | ||
56 : | if (image->y == NULL) { | ||
57 : | return -1; | ||
58 : | } | ||
59 : | edgomez | 1382 | memset(image->y, 0, edged_width * (edged_height + 1) + SAFETY); |
60 : | albeu | 315 | |
61 : | image->u = xvid_malloc(edged_width2 * edged_height2 + SAFETY, CACHE_LINE); | ||
62 : | if (image->u == NULL) { | ||
63 : | xvid_free(image->y); | ||
64 : | edgomez | 1382 | image->y = NULL; |
65 : | albeu | 315 | return -1; |
66 : | } | ||
67 : | edgomez | 1382 | memset(image->u, 0, edged_width2 * edged_height2 + SAFETY); |
68 : | |||
69 : | albeu | 315 | image->v = xvid_malloc(edged_width2 * edged_height2 + SAFETY, CACHE_LINE); |
70 : | if (image->v == NULL) { | ||
71 : | xvid_free(image->u); | ||
72 : | edgomez | 1382 | image->u = NULL; |
73 : | albeu | 315 | xvid_free(image->y); |
74 : | edgomez | 1382 | image->y = NULL; |
75 : | albeu | 315 | return -1; |
76 : | } | ||
77 : | edgomez | 1382 | memset(image->v, 0, edged_width2 * edged_height2 + SAFETY); |
78 : | albeu | 315 | |
79 : | image->y += EDGE_SIZE * edged_width + EDGE_SIZE; | ||
80 : | image->u += EDGE_SIZE2 * edged_width2 + EDGE_SIZE2; | ||
81 : | image->v += EDGE_SIZE2 * edged_width2 + EDGE_SIZE2; | ||
82 : | |||
83 : | return 0; | ||
84 : | } | ||
85 : | |||
86 : | |||
87 : | |||
88 : | void | ||
89 : | image_destroy(IMAGE * image, | ||
90 : | uint32_t edged_width, | ||
91 : | uint32_t edged_height) | ||
92 : | { | ||
93 : | const uint32_t edged_width2 = edged_width / 2; | ||
94 : | |||
95 : | if (image->y) { | ||
96 : | xvid_free(image->y - (EDGE_SIZE * edged_width + EDGE_SIZE)); | ||
97 : | edgomez | 1382 | image->y = NULL; |
98 : | albeu | 315 | } |
99 : | if (image->u) { | ||
100 : | xvid_free(image->u - (EDGE_SIZE2 * edged_width2 + EDGE_SIZE2)); | ||
101 : | edgomez | 1382 | image->u = NULL; |
102 : | albeu | 315 | } |
103 : | if (image->v) { | ||
104 : | xvid_free(image->v - (EDGE_SIZE2 * edged_width2 + EDGE_SIZE2)); | ||
105 : | edgomez | 1382 | image->v = NULL; |
106 : | albeu | 315 | } |
107 : | } | ||
108 : | |||
109 : | |||
110 : | void | ||
111 : | image_swap(IMAGE * image1, | ||
112 : | IMAGE * image2) | ||
113 : | { | ||
114 : | edgomez | 1382 | SWAP(uint8_t*, image1->y, image2->y); |
115 : | SWAP(uint8_t*, image1->u, image2->u); | ||
116 : | SWAP(uint8_t*, image1->v, image2->v); | ||
117 : | albeu | 315 | } |
118 : | |||
119 : | |||
120 : | void | ||
121 : | image_copy(IMAGE * image1, | ||
122 : | IMAGE * image2, | ||
123 : | uint32_t edged_width, | ||
124 : | uint32_t height) | ||
125 : | { | ||
126 : | memcpy(image1->y, image2->y, edged_width * height); | ||
127 : | memcpy(image1->u, image2->u, edged_width * height / 4); | ||
128 : | memcpy(image1->v, image2->v, edged_width * height / 4); | ||
129 : | } | ||
130 : | |||
131 : | edgomez | 1382 | /* setedges bug was fixed in this BS version */ |
132 : | #define SETEDGES_BUG_BEFORE 18 | ||
133 : | albeu | 315 | |
134 : | void | ||
135 : | image_setedges(IMAGE * image, | ||
136 : | uint32_t edged_width, | ||
137 : | uint32_t edged_height, | ||
138 : | uint32_t width, | ||
139 : | edgomez | 1382 | uint32_t height, |
140 : | int bs_version) | ||
141 : | albeu | 315 | { |
142 : | const uint32_t edged_width2 = edged_width / 2; | ||
143 : | edgomez | 1382 | uint32_t width2; |
144 : | albeu | 315 | uint32_t i; |
145 : | uint8_t *dst; | ||
146 : | uint8_t *src; | ||
147 : | |||
148 : | dst = image->y - (EDGE_SIZE + EDGE_SIZE * edged_width); | ||
149 : | src = image->y; | ||
150 : | |||
151 : | edgomez | 1382 | /* According to the Standard Clause 7.6.4, padding is done starting at 16 |
152 : | * pixel width and height multiples. This was not respected in old xvids */ | ||
153 : | if (bs_version == 0 || bs_version >= SETEDGES_BUG_BEFORE) { | ||
154 : | width = (width+15)&~15; | ||
155 : | height = (height+15)&~15; | ||
156 : | } | ||
157 : | |||
158 : | width2 = width/2; | ||
159 : | |||
160 : | albeu | 315 | for (i = 0; i < EDGE_SIZE; i++) { |
161 : | edgomez | 851 | memset(dst, *src, EDGE_SIZE); |
162 : | memcpy(dst + EDGE_SIZE, src, width); | ||
163 : | memset(dst + edged_width - EDGE_SIZE, *(src + width - 1), | ||
164 : | EDGE_SIZE); | ||
165 : | albeu | 315 | dst += edged_width; |
166 : | } | ||
167 : | |||
168 : | for (i = 0; i < height; i++) { | ||
169 : | memset(dst, *src, EDGE_SIZE); | ||
170 : | memset(dst + edged_width - EDGE_SIZE, src[width - 1], EDGE_SIZE); | ||
171 : | dst += edged_width; | ||
172 : | src += edged_width; | ||
173 : | } | ||
174 : | |||
175 : | src -= edged_width; | ||
176 : | for (i = 0; i < EDGE_SIZE; i++) { | ||
177 : | edgomez | 851 | memset(dst, *src, EDGE_SIZE); |
178 : | memcpy(dst + EDGE_SIZE, src, width); | ||
179 : | memset(dst + edged_width - EDGE_SIZE, *(src + width - 1), | ||
180 : | albeu | 315 | EDGE_SIZE); |
181 : | dst += edged_width; | ||
182 : | } | ||
183 : | |||
184 : | |||
185 : | edgomez | 1382 | /* U */ |
186 : | albeu | 315 | dst = image->u - (EDGE_SIZE2 + EDGE_SIZE2 * edged_width2); |
187 : | src = image->u; | ||
188 : | |||
189 : | for (i = 0; i < EDGE_SIZE2; i++) { | ||
190 : | memset(dst, *src, EDGE_SIZE2); | ||
191 : | memcpy(dst + EDGE_SIZE2, src, width2); | ||
192 : | memset(dst + edged_width2 - EDGE_SIZE2, *(src + width2 - 1), | ||
193 : | EDGE_SIZE2); | ||
194 : | dst += edged_width2; | ||
195 : | } | ||
196 : | |||
197 : | for (i = 0; i < height / 2; i++) { | ||
198 : | memset(dst, *src, EDGE_SIZE2); | ||
199 : | memset(dst + edged_width2 - EDGE_SIZE2, src[width2 - 1], EDGE_SIZE2); | ||
200 : | dst += edged_width2; | ||
201 : | src += edged_width2; | ||
202 : | } | ||
203 : | src -= edged_width2; | ||
204 : | for (i = 0; i < EDGE_SIZE2; i++) { | ||
205 : | memset(dst, *src, EDGE_SIZE2); | ||
206 : | memcpy(dst + EDGE_SIZE2, src, width2); | ||
207 : | memset(dst + edged_width2 - EDGE_SIZE2, *(src + width2 - 1), | ||
208 : | EDGE_SIZE2); | ||
209 : | dst += edged_width2; | ||
210 : | } | ||
211 : | |||
212 : | |||
213 : | edgomez | 1382 | /* V */ |
214 : | albeu | 315 | dst = image->v - (EDGE_SIZE2 + EDGE_SIZE2 * edged_width2); |
215 : | src = image->v; | ||
216 : | |||
217 : | for (i = 0; i < EDGE_SIZE2; i++) { | ||
218 : | memset(dst, *src, EDGE_SIZE2); | ||
219 : | memcpy(dst + EDGE_SIZE2, src, width2); | ||
220 : | memset(dst + edged_width2 - EDGE_SIZE2, *(src + width2 - 1), | ||
221 : | EDGE_SIZE2); | ||
222 : | dst += edged_width2; | ||
223 : | } | ||
224 : | |||
225 : | for (i = 0; i < height / 2; i++) { | ||
226 : | memset(dst, *src, EDGE_SIZE2); | ||
227 : | memset(dst + edged_width2 - EDGE_SIZE2, src[width2 - 1], EDGE_SIZE2); | ||
228 : | dst += edged_width2; | ||
229 : | src += edged_width2; | ||
230 : | } | ||
231 : | src -= edged_width2; | ||
232 : | for (i = 0; i < EDGE_SIZE2; i++) { | ||
233 : | memset(dst, *src, EDGE_SIZE2); | ||
234 : | memcpy(dst + EDGE_SIZE2, src, width2); | ||
235 : | memset(dst + edged_width2 - EDGE_SIZE2, *(src + width2 - 1), | ||
236 : | EDGE_SIZE2); | ||
237 : | dst += edged_width2; | ||
238 : | } | ||
239 : | } | ||
240 : | |||
241 : | edgomez | 1382 | /* bframe encoding requires image-based u,v interpolation */ |
242 : | albeu | 315 | void |
243 : | image_interpolate(const IMAGE * refn, | ||
244 : | IMAGE * refh, | ||
245 : | IMAGE * refv, | ||
246 : | IMAGE * refhv, | ||
247 : | uint32_t edged_width, | ||
248 : | uint32_t edged_height, | ||
249 : | edgomez | 851 | uint32_t quarterpel, |
250 : | albeu | 315 | uint32_t rounding) |
251 : | { | ||
252 : | edgomez | 1382 | const uint32_t offset = EDGE_SIZE2 * (edged_width + 1); /* we only interpolate half of the edge area */ |
253 : | albeu | 315 | const uint32_t stride_add = 7 * edged_width; |
254 : | edgomez | 1382 | #if 0 |
255 : | edgomez | 851 | const uint32_t edged_width2 = edged_width / 2; |
256 : | const uint32_t edged_height2 = edged_height / 2; | ||
257 : | const uint32_t offset2 = EDGE_SIZE2 * (edged_width2 + 1); | ||
258 : | const uint32_t stride_add2 = 7 * edged_width2; | ||
259 : | #endif | ||
260 : | albeu | 315 | uint8_t *n_ptr, *h_ptr, *v_ptr, *hv_ptr; |
261 : | uint32_t x, y; | ||
262 : | |||
263 : | |||
264 : | n_ptr = refn->y; | ||
265 : | h_ptr = refh->y; | ||
266 : | v_ptr = refv->y; | ||
267 : | |||
268 : | n_ptr -= offset; | ||
269 : | h_ptr -= offset; | ||
270 : | v_ptr -= offset; | ||
271 : | |||
272 : | edgomez | 1382 | /* Note we initialize the hv pointer later, as we can optimize code a bit |
273 : | * doing it down to up in quarterpel and up to down in halfpel */ | ||
274 : | edgomez | 851 | if(quarterpel) { |
275 : | edgomez | 1382 | |
276 : | edgomez | 851 | for (y = 0; y < (edged_height - EDGE_SIZE); y += 8) { |
277 : | for (x = 0; x < (edged_width - EDGE_SIZE); x += 8) { | ||
278 : | interpolate8x8_6tap_lowpass_h(h_ptr, n_ptr, edged_width, rounding); | ||
279 : | interpolate8x8_6tap_lowpass_v(v_ptr, n_ptr, edged_width, rounding); | ||
280 : | albeu | 315 | |
281 : | edgomez | 851 | n_ptr += 8; |
282 : | h_ptr += 8; | ||
283 : | v_ptr += 8; | ||
284 : | } | ||
285 : | edgomez | 1382 | |
286 : | edgomez | 851 | n_ptr += EDGE_SIZE; |
287 : | h_ptr += EDGE_SIZE; | ||
288 : | v_ptr += EDGE_SIZE; | ||
289 : | |||
290 : | h_ptr += stride_add; | ||
291 : | v_ptr += stride_add; | ||
292 : | n_ptr += stride_add; | ||
293 : | } | ||
294 : | |||
295 : | edgomez | 1382 | h_ptr = refh->y + (edged_height - EDGE_SIZE - EDGE_SIZE2)*edged_width - EDGE_SIZE2; |
296 : | hv_ptr = refhv->y + (edged_height - EDGE_SIZE - EDGE_SIZE2)*edged_width - EDGE_SIZE2; | ||
297 : | edgomez | 851 | |
298 : | for (y = 0; y < (edged_height - EDGE_SIZE); y = y + 8) { | ||
299 : | edgomez | 1382 | hv_ptr -= stride_add; |
300 : | h_ptr -= stride_add; | ||
301 : | hv_ptr -= EDGE_SIZE; | ||
302 : | h_ptr -= EDGE_SIZE; | ||
303 : | |||
304 : | edgomez | 851 | for (x = 0; x < (edged_width - EDGE_SIZE); x = x + 8) { |
305 : | edgomez | 1382 | hv_ptr -= 8; |
306 : | h_ptr -= 8; | ||
307 : | edgomez | 851 | interpolate8x8_6tap_lowpass_v(hv_ptr, h_ptr, edged_width, rounding); |
308 : | } | ||
309 : | } | ||
310 : | edgomez | 1382 | } else { |
311 : | edgomez | 851 | |
312 : | edgomez | 1382 | hv_ptr = refhv->y; |
313 : | hv_ptr -= offset; | ||
314 : | |||
315 : | edgomez | 851 | for (y = 0; y < (edged_height - EDGE_SIZE); y += 8) { |
316 : | for (x = 0; x < (edged_width - EDGE_SIZE); x += 8) { | ||
317 : | interpolate8x8_halfpel_h(h_ptr, n_ptr, edged_width, rounding); | ||
318 : | interpolate8x8_halfpel_v(v_ptr, n_ptr, edged_width, rounding); | ||
319 : | interpolate8x8_halfpel_hv(hv_ptr, n_ptr, edged_width, rounding); | ||
320 : | |||
321 : | n_ptr += 8; | ||
322 : | h_ptr += 8; | ||
323 : | v_ptr += 8; | ||
324 : | hv_ptr += 8; | ||
325 : | } | ||
326 : | edgomez | 1382 | |
327 : | edgomez | 851 | h_ptr += EDGE_SIZE; |
328 : | v_ptr += EDGE_SIZE; | ||
329 : | hv_ptr += EDGE_SIZE; | ||
330 : | n_ptr += EDGE_SIZE; | ||
331 : | |||
332 : | h_ptr += stride_add; | ||
333 : | v_ptr += stride_add; | ||
334 : | hv_ptr += stride_add; | ||
335 : | n_ptr += stride_add; | ||
336 : | } | ||
337 : | } | ||
338 : | /* | ||
339 : | #ifdef BFRAMES | ||
340 : | n_ptr = refn->u; | ||
341 : | h_ptr = refh->u; | ||
342 : | v_ptr = refv->u; | ||
343 : | hv_ptr = refhv->u; | ||
344 : | |||
345 : | n_ptr -= offset2; | ||
346 : | h_ptr -= offset2; | ||
347 : | v_ptr -= offset2; | ||
348 : | hv_ptr -= offset2; | ||
349 : | |||
350 : | for (y = 0; y < edged_height2; y += 8) { | ||
351 : | for (x = 0; x < edged_width2; x += 8) { | ||
352 : | interpolate8x8_halfpel_h(h_ptr, n_ptr, edged_width2, rounding); | ||
353 : | interpolate8x8_halfpel_v(v_ptr, n_ptr, edged_width2, rounding); | ||
354 : | interpolate8x8_halfpel_hv(hv_ptr, n_ptr, edged_width2, rounding); | ||
355 : | |||
356 : | albeu | 315 | n_ptr += 8; |
357 : | h_ptr += 8; | ||
358 : | v_ptr += 8; | ||
359 : | hv_ptr += 8; | ||
360 : | } | ||
361 : | edgomez | 851 | h_ptr += stride_add2; |
362 : | v_ptr += stride_add2; | ||
363 : | hv_ptr += stride_add2; | ||
364 : | n_ptr += stride_add2; | ||
365 : | albeu | 315 | } |
366 : | |||
367 : | edgomez | 851 | n_ptr = refn->v; |
368 : | h_ptr = refh->v; | ||
369 : | v_ptr = refv->v; | ||
370 : | hv_ptr = refhv->v; | ||
371 : | |||
372 : | n_ptr -= offset2; | ||
373 : | h_ptr -= offset2; | ||
374 : | v_ptr -= offset2; | ||
375 : | hv_ptr -= offset2; | ||
376 : | |||
377 : | for (y = 0; y < edged_height2; y = y + 8) { | ||
378 : | for (x = 0; x < edged_width2; x = x + 8) { | ||
379 : | interpolate8x8_halfpel_h(h_ptr, n_ptr, edged_width2, rounding); | ||
380 : | interpolate8x8_halfpel_v(v_ptr, n_ptr, edged_width2, rounding); | ||
381 : | interpolate8x8_halfpel_hv(hv_ptr, n_ptr, edged_width2, rounding); | ||
382 : | |||
383 : | n_ptr += 8; | ||
384 : | h_ptr += 8; | ||
385 : | v_ptr += 8; | ||
386 : | hv_ptr += 8; | ||
387 : | } | ||
388 : | h_ptr += stride_add2; | ||
389 : | v_ptr += stride_add2; | ||
390 : | hv_ptr += stride_add2; | ||
391 : | n_ptr += stride_add2; | ||
392 : | } | ||
393 : | #endif | ||
394 : | */ | ||
395 : | albeu | 315 | /* |
396 : | interpolate_halfpel_h( | ||
397 : | refh->y - offset, | ||
398 : | edgomez | 1382 | refn->y - offset, |
399 : | albeu | 315 | edged_width, edged_height, |
400 : | rounding); | ||
401 : | |||
402 : | interpolate_halfpel_v( | ||
403 : | refv->y - offset, | ||
404 : | edgomez | 1382 | refn->y - offset, |
405 : | albeu | 315 | edged_width, edged_height, |
406 : | rounding); | ||
407 : | |||
408 : | interpolate_halfpel_hv( | ||
409 : | refhv->y - offset, | ||
410 : | refn->y - offset, | ||
411 : | edged_width, edged_height, | ||
412 : | rounding); | ||
413 : | */ | ||
414 : | |||
415 : | /* uv-image-based compensation | ||
416 : | offset = EDGE_SIZE2 * (edged_width / 2 + 1); | ||
417 : | |||
418 : | interpolate_halfpel_h( | ||
419 : | refh->u - offset, | ||
420 : | edgomez | 1382 | refn->u - offset, |
421 : | albeu | 315 | edged_width / 2, edged_height / 2, |
422 : | rounding); | ||
423 : | |||
424 : | interpolate_halfpel_v( | ||
425 : | refv->u - offset, | ||
426 : | edgomez | 1382 | refn->u - offset, |
427 : | albeu | 315 | edged_width / 2, edged_height / 2, |
428 : | rounding); | ||
429 : | |||
430 : | interpolate_halfpel_hv( | ||
431 : | refhv->u - offset, | ||
432 : | edgomez | 1382 | refn->u - offset, |
433 : | albeu | 315 | edged_width / 2, edged_height / 2, |
434 : | rounding); | ||
435 : | |||
436 : | |||
437 : | interpolate_halfpel_h( | ||
438 : | refh->v - offset, | ||
439 : | edgomez | 1382 | refn->v - offset, |
440 : | albeu | 315 | edged_width / 2, edged_height / 2, |
441 : | rounding); | ||
442 : | |||
443 : | interpolate_halfpel_v( | ||
444 : | refv->v - offset, | ||
445 : | edgomez | 1382 | refn->v - offset, |
446 : | albeu | 315 | edged_width / 2, edged_height / 2, |
447 : | rounding); | ||
448 : | |||
449 : | interpolate_halfpel_hv( | ||
450 : | refhv->v - offset, | ||
451 : | edgomez | 1382 | refn->v - offset, |
452 : | albeu | 315 | edged_width / 2, edged_height / 2, |
453 : | rounding); | ||
454 : | */ | ||
455 : | } | ||
456 : | |||
457 : | |||
458 : | edgomez | 851 | /* |
459 : | chroma optimize filter, invented by mf | ||
460 : | a chroma pixel is average from the surrounding pixels, when the | ||
461 : | correpsonding luma pixels are pure black or white. | ||
462 : | */ | ||
463 : | |||
464 : | void | ||
465 : | image_chroma_optimize(IMAGE * img, int width, int height, int edged_width) | ||
466 : | { | ||
467 : | int x,y; | ||
468 : | int pixels = 0; | ||
469 : | |||
470 : | for (y = 1; y < height/2 - 1; y++) | ||
471 : | for (x = 1; x < width/2 - 1; x++) | ||
472 : | { | ||
473 : | #define IS_PURE(a) ((a)<=16||(a)>=235) | ||
474 : | #define IMG_Y(Y,X) img->y[(Y)*edged_width + (X)] | ||
475 : | #define IMG_U(Y,X) img->u[(Y)*edged_width/2 + (X)] | ||
476 : | #define IMG_V(Y,X) img->v[(Y)*edged_width/2 + (X)] | ||
477 : | |||
478 : | edgomez | 1382 | if (IS_PURE(IMG_Y(y*2 ,x*2 )) && |
479 : | edgomez | 851 | IS_PURE(IMG_Y(y*2 ,x*2+1)) && |
480 : | edgomez | 1382 | IS_PURE(IMG_Y(y*2+1,x*2 )) && |
481 : | edgomez | 851 | IS_PURE(IMG_Y(y*2+1,x*2+1))) |
482 : | { | ||
483 : | IMG_U(y,x) = (IMG_U(y,x-1) + IMG_U(y-1, x) + IMG_U(y, x+1) + IMG_U(y+1, x)) / 4; | ||
484 : | IMG_V(y,x) = (IMG_V(y,x-1) + IMG_V(y-1, x) + IMG_V(y, x+1) + IMG_V(y+1, x)) / 4; | ||
485 : | pixels++; | ||
486 : | } | ||
487 : | |||
488 : | #undef IS_PURE | ||
489 : | #undef IMG_Y | ||
490 : | #undef IMG_U | ||
491 : | #undef IMG_V | ||
492 : | } | ||
493 : | edgomez | 1382 | |
494 : | DPRINTF(XVID_DEBUG_DEBUG,"chroma_optimized_pixels = %i/%i\n", pixels, width*height/4); | ||
495 : | edgomez | 851 | } |
496 : | |||
497 : | |||
498 : | |||
499 : | |||
500 : | |||
501 : | /* | ||
502 : | perform safe packed colorspace conversion, by splitting | ||
503 : | the image up into an optimized area (pixel width divisible by 16), | ||
504 : | and two unoptimized/plain-c areas (pixel width divisible by 2) | ||
505 : | */ | ||
506 : | |||
507 : | edgomez | 1382 | static void |
508 : | edgomez | 851 | safe_packed_conv(uint8_t * x_ptr, int x_stride, |
509 : | uint8_t * y_ptr, uint8_t * u_ptr, uint8_t * v_ptr, | ||
510 : | int y_stride, int uv_stride, | ||
511 : | int width, int height, int vflip, | ||
512 : | packedFunc * func_opt, packedFunc func_c, int size) | ||
513 : | { | ||
514 : | int width_opt, width_c; | ||
515 : | |||
516 : | if (func_opt != func_c && x_stride < size*((width+15)/16)*16) | ||
517 : | { | ||
518 : | width_opt = width & (~15); | ||
519 : | width_c = width - width_opt; | ||
520 : | } | ||
521 : | else | ||
522 : | { | ||
523 : | width_opt = width; | ||
524 : | width_c = 0; | ||
525 : | } | ||
526 : | |||
527 : | func_opt(x_ptr, x_stride, | ||
528 : | y_ptr, u_ptr, v_ptr, y_stride, uv_stride, | ||
529 : | width_opt, height, vflip); | ||
530 : | |||
531 : | if (width_c) | ||
532 : | { | ||
533 : | func_c(x_ptr + size*width_opt, x_stride, | ||
534 : | y_ptr + width_opt, u_ptr + width_opt/2, v_ptr + width_opt/2, | ||
535 : | y_stride, uv_stride, width_c, height, vflip); | ||
536 : | } | ||
537 : | } | ||
538 : | |||
539 : | |||
540 : | |||
541 : | albeu | 315 | int |
542 : | image_input(IMAGE * image, | ||
543 : | uint32_t width, | ||
544 : | int height, | ||
545 : | uint32_t edged_width, | ||
546 : | edgomez | 1382 | uint8_t * src[4], |
547 : | int src_stride[4], | ||
548 : | edgomez | 851 | int csp, |
549 : | int interlacing) | ||
550 : | albeu | 315 | { |
551 : | edgomez | 851 | const int edged_width2 = edged_width/2; |
552 : | const int width2 = width/2; | ||
553 : | const int height2 = height/2; | ||
554 : | edgomez | 1382 | #if 0 |
555 : | const int height_signed = (csp & XVID_CSP_VFLIP) ? -height : height; | ||
556 : | #endif | ||
557 : | albeu | 315 | |
558 : | switch (csp & ~XVID_CSP_VFLIP) { | ||
559 : | case XVID_CSP_RGB555: | ||
560 : | edgomez | 851 | safe_packed_conv( |
561 : | edgomez | 1382 | src[0], src_stride[0], image->y, image->u, image->v, |
562 : | edgomez | 851 | edged_width, edged_width2, width, height, (csp & XVID_CSP_VFLIP), |
563 : | interlacing?rgb555i_to_yv12 :rgb555_to_yv12, | ||
564 : | interlacing?rgb555i_to_yv12_c:rgb555_to_yv12_c, 2); | ||
565 : | break; | ||
566 : | albeu | 315 | |
567 : | case XVID_CSP_RGB565: | ||
568 : | edgomez | 851 | safe_packed_conv( |
569 : | edgomez | 1382 | src[0], src_stride[0], image->y, image->u, image->v, |
570 : | edgomez | 851 | edged_width, edged_width2, width, height, (csp & XVID_CSP_VFLIP), |
571 : | interlacing?rgb565i_to_yv12 :rgb565_to_yv12, | ||
572 : | interlacing?rgb565i_to_yv12_c:rgb565_to_yv12_c, 2); | ||
573 : | break; | ||
574 : | albeu | 315 | |
575 : | |||
576 : | edgomez | 1382 | case XVID_CSP_BGR: |
577 : | edgomez | 851 | safe_packed_conv( |
578 : | edgomez | 1382 | src[0], src_stride[0], image->y, image->u, image->v, |
579 : | edgomez | 851 | edged_width, edged_width2, width, height, (csp & XVID_CSP_VFLIP), |
580 : | interlacing?bgri_to_yv12 :bgr_to_yv12, | ||
581 : | interlacing?bgri_to_yv12_c:bgr_to_yv12_c, 3); | ||
582 : | break; | ||
583 : | albeu | 315 | |
584 : | edgomez | 1382 | case XVID_CSP_BGRA: |
585 : | edgomez | 851 | safe_packed_conv( |
586 : | edgomez | 1382 | src[0], src_stride[0], image->y, image->u, image->v, |
587 : | edgomez | 851 | edged_width, edged_width2, width, height, (csp & XVID_CSP_VFLIP), |
588 : | interlacing?bgrai_to_yv12 :bgra_to_yv12, | ||
589 : | interlacing?bgrai_to_yv12_c:bgra_to_yv12_c, 4); | ||
590 : | break; | ||
591 : | albeu | 315 | |
592 : | edgomez | 851 | case XVID_CSP_ABGR : |
593 : | safe_packed_conv( | ||
594 : | edgomez | 1382 | src[0], src_stride[0], image->y, image->u, image->v, |
595 : | edgomez | 851 | edged_width, edged_width2, width, height, (csp & XVID_CSP_VFLIP), |
596 : | interlacing?abgri_to_yv12 :abgr_to_yv12, | ||
597 : | interlacing?abgri_to_yv12_c:abgr_to_yv12_c, 4); | ||
598 : | break; | ||
599 : | albeu | 315 | |
600 : | edgomez | 851 | case XVID_CSP_RGBA : |
601 : | safe_packed_conv( | ||
602 : | edgomez | 1382 | src[0], src_stride[0], image->y, image->u, image->v, |
603 : | edgomez | 851 | edged_width, edged_width2, width, height, (csp & XVID_CSP_VFLIP), |
604 : | interlacing?rgbai_to_yv12 :rgba_to_yv12, | ||
605 : | interlacing?rgbai_to_yv12_c:rgba_to_yv12_c, 4); | ||
606 : | break; | ||
607 : | edgomez | 1382 | |
608 : | case XVID_CSP_ARGB: | ||
609 : | safe_packed_conv( | ||
610 : | src[0], src_stride[0], image->y, image->u, image->v, | ||
611 : | edged_width, edged_width2, width, height, (csp & XVID_CSP_VFLIP), | ||
612 : | interlacing?argbi_to_yv12 : argb_to_yv12, | ||
613 : | interlacing?argbi_to_yv12_c: argb_to_yv12_c, 4); | ||
614 : | break; | ||
615 : | albeu | 315 | |
616 : | case XVID_CSP_YUY2: | ||
617 : | edgomez | 851 | safe_packed_conv( |
618 : | edgomez | 1382 | src[0], src_stride[0], image->y, image->u, image->v, |
619 : | edgomez | 851 | edged_width, edged_width2, width, height, (csp & XVID_CSP_VFLIP), |
620 : | interlacing?yuyvi_to_yv12 :yuyv_to_yv12, | ||
621 : | interlacing?yuyvi_to_yv12_c:yuyv_to_yv12_c, 2); | ||
622 : | break; | ||
623 : | albeu | 315 | |
624 : | case XVID_CSP_YVYU: /* u/v swapped */ | ||
625 : | edgomez | 851 | safe_packed_conv( |
626 : | edgomez | 1382 | src[0], src_stride[0], image->y, image->v, image->u, |
627 : | edgomez | 851 | edged_width, edged_width2, width, height, (csp & XVID_CSP_VFLIP), |
628 : | interlacing?yuyvi_to_yv12 :yuyv_to_yv12, | ||
629 : | interlacing?yuyvi_to_yv12_c:yuyv_to_yv12_c, 2); | ||
630 : | break; | ||
631 : | albeu | 315 | |
632 : | case XVID_CSP_UYVY: | ||
633 : | edgomez | 851 | safe_packed_conv( |
634 : | edgomez | 1382 | src[0], src_stride[0], image->y, image->u, image->v, |
635 : | edgomez | 851 | edged_width, edged_width2, width, height, (csp & XVID_CSP_VFLIP), |
636 : | interlacing?uyvyi_to_yv12 :uyvy_to_yv12, | ||
637 : | interlacing?uyvyi_to_yv12_c:uyvy_to_yv12_c, 2); | ||
638 : | break; | ||
639 : | albeu | 315 | |
640 : | edgomez | 1382 | case XVID_CSP_I420: /* YCbCr == YUV == internal colorspace for MPEG */ |
641 : | edgomez | 851 | yv12_to_yv12(image->y, image->u, image->v, edged_width, edged_width2, |
642 : | edgomez | 1382 | src[0], src[0] + src_stride[0]*height, src[0] + src_stride[0]*height + (src_stride[0]/2)*height2, |
643 : | src_stride[0], src_stride[0]/2, width, height, (csp & XVID_CSP_VFLIP)); | ||
644 : | break; | ||
645 : | |||
646 : | case XVID_CSP_YV12: /* YCrCb == YVA == U and V plane swapped */ | ||
647 : | edgomez | 851 | yv12_to_yv12(image->y, image->v, image->u, edged_width, edged_width2, |
648 : | edgomez | 1382 | src[0], src[0] + src_stride[0]*height, src[0] + src_stride[0]*height + (src_stride[0]/2)*height2, |
649 : | src_stride[0], src_stride[0]/2, width, height, (csp & XVID_CSP_VFLIP)); | ||
650 : | edgomez | 851 | break; |
651 : | |||
652 : | edgomez | 1382 | case XVID_CSP_PLANAR: /* YCbCr with arbitrary pointers and different strides for Y and UV */ |
653 : | yv12_to_yv12(image->y, image->u, image->v, edged_width, edged_width2, | ||
654 : | src[0], src[1], src[2], src_stride[0], src_stride[1], /* v: dst_stride[2] not yet supported */ | ||
655 : | width, height, (csp & XVID_CSP_VFLIP)); | ||
656 : | edgomez | 851 | break; |
657 : | albeu | 315 | |
658 : | case XVID_CSP_NULL: | ||
659 : | break; | ||
660 : | |||
661 : | edgomez | 851 | default : |
662 : | return -1; | ||
663 : | albeu | 315 | } |
664 : | |||
665 : | edgomez | 851 | |
666 : | /* pad out image when the width and/or height is not a multiple of 16 */ | ||
667 : | |||
668 : | if (width & 15) | ||
669 : | { | ||
670 : | int i; | ||
671 : | int pad_width = 16 - (width&15); | ||
672 : | for (i = 0; i < height; i++) | ||
673 : | { | ||
674 : | edgomez | 1382 | memset(image->y + i*edged_width + width, |
675 : | edgomez | 851 | *(image->y + i*edged_width + width - 1), pad_width); |
676 : | } | ||
677 : | for (i = 0; i < height/2; i++) | ||
678 : | { | ||
679 : | edgomez | 1382 | memset(image->u + i*edged_width2 + width2, |
680 : | edgomez | 851 | *(image->u + i*edged_width2 + width2 - 1),pad_width/2); |
681 : | edgomez | 1382 | memset(image->v + i*edged_width2 + width2, |
682 : | edgomez | 851 | *(image->v + i*edged_width2 + width2 - 1),pad_width/2); |
683 : | } | ||
684 : | } | ||
685 : | |||
686 : | if (height & 15) | ||
687 : | { | ||
688 : | edgomez | 1382 | int pad_height = 16 - (height&15); |
689 : | edgomez | 851 | int length = ((width+15)/16)*16; |
690 : | int i; | ||
691 : | for (i = 0; i < pad_height; i++) | ||
692 : | { | ||
693 : | memcpy(image->y + (height+i)*edged_width, | ||
694 : | image->y + (height-1)*edged_width,length); | ||
695 : | } | ||
696 : | |||
697 : | for (i = 0; i < pad_height/2; i++) | ||
698 : | { | ||
699 : | memcpy(image->u + (height2+i)*edged_width2, | ||
700 : | image->u + (height2-1)*edged_width2,length/2); | ||
701 : | memcpy(image->v + (height2+i)*edged_width2, | ||
702 : | image->v + (height2-1)*edged_width2,length/2); | ||
703 : | } | ||
704 : | } | ||
705 : | |||
706 : | /* | ||
707 : | if (interlacing) | ||
708 : | image_printf(image, edged_width, height, 5,5, "[i]"); | ||
709 : | image_dump_yuvpgm(image, edged_width, ((width+15)/16)*16, ((height+15)/16)*16, "\\encode.pgm"); | ||
710 : | */ | ||
711 : | return 0; | ||
712 : | albeu | 315 | } |
713 : | |||
714 : | |||
715 : | |||
716 : | int | ||
717 : | image_output(IMAGE * image, | ||
718 : | uint32_t width, | ||
719 : | int height, | ||
720 : | uint32_t edged_width, | ||
721 : | edgomez | 1382 | uint8_t * dst[4], |
722 : | uint32_t dst_stride[4], | ||
723 : | edgomez | 851 | int csp, |
724 : | int interlacing) | ||
725 : | albeu | 315 | { |
726 : | edgomez | 851 | const int edged_width2 = edged_width/2; |
727 : | int height2 = height/2; | ||
728 : | |||
729 : | /* | ||
730 : | if (interlacing) | ||
731 : | image_printf(image, edged_width, height, 5,100, "[i]=%i,%i",width,height); | ||
732 : | image_dump_yuvpgm(image, edged_width, width, height, "\\decode.pgm"); | ||
733 : | */ | ||
734 : | |||
735 : | albeu | 315 | switch (csp & ~XVID_CSP_VFLIP) { |
736 : | case XVID_CSP_RGB555: | ||
737 : | edgomez | 851 | safe_packed_conv( |
738 : | edgomez | 1382 | dst[0], dst_stride[0], image->y, image->u, image->v, |
739 : | edgomez | 851 | edged_width, edged_width2, width, height, (csp & XVID_CSP_VFLIP), |
740 : | interlacing?yv12_to_rgb555i :yv12_to_rgb555, | ||
741 : | interlacing?yv12_to_rgb555i_c:yv12_to_rgb555_c, 2); | ||
742 : | albeu | 315 | return 0; |
743 : | |||
744 : | case XVID_CSP_RGB565: | ||
745 : | edgomez | 851 | safe_packed_conv( |
746 : | edgomez | 1382 | dst[0], dst_stride[0], image->y, image->u, image->v, |
747 : | edgomez | 851 | edged_width, edged_width2, width, height, (csp & XVID_CSP_VFLIP), |
748 : | interlacing?yv12_to_rgb565i :yv12_to_rgb565, | ||
749 : | interlacing?yv12_to_rgb565i_c:yv12_to_rgb565_c, 2); | ||
750 : | albeu | 315 | return 0; |
751 : | |||
752 : | edgomez | 1382 | case XVID_CSP_BGR: |
753 : | edgomez | 851 | safe_packed_conv( |
754 : | edgomez | 1382 | dst[0], dst_stride[0], image->y, image->u, image->v, |
755 : | edgomez | 851 | edged_width, edged_width2, width, height, (csp & XVID_CSP_VFLIP), |
756 : | interlacing?yv12_to_bgri :yv12_to_bgr, | ||
757 : | interlacing?yv12_to_bgri_c:yv12_to_bgr_c, 3); | ||
758 : | albeu | 315 | return 0; |
759 : | |||
760 : | edgomez | 1382 | case XVID_CSP_BGRA: |
761 : | edgomez | 851 | safe_packed_conv( |
762 : | edgomez | 1382 | dst[0], dst_stride[0], image->y, image->u, image->v, |
763 : | edgomez | 851 | edged_width, edged_width2, width, height, (csp & XVID_CSP_VFLIP), |
764 : | interlacing?yv12_to_bgrai :yv12_to_bgra, | ||
765 : | interlacing?yv12_to_bgrai_c:yv12_to_bgra_c, 4); | ||
766 : | albeu | 315 | return 0; |
767 : | |||
768 : | edgomez | 851 | case XVID_CSP_ABGR: |
769 : | safe_packed_conv( | ||
770 : | edgomez | 1382 | dst[0], dst_stride[0], image->y, image->u, image->v, |
771 : | edgomez | 851 | edged_width, edged_width2, width, height, (csp & XVID_CSP_VFLIP), |
772 : | interlacing?yv12_to_abgri :yv12_to_abgr, | ||
773 : | interlacing?yv12_to_abgri_c:yv12_to_abgr_c, 4); | ||
774 : | albeu | 315 | return 0; |
775 : | |||
776 : | edgomez | 851 | case XVID_CSP_RGBA: |
777 : | safe_packed_conv( | ||
778 : | edgomez | 1382 | dst[0], dst_stride[0], image->y, image->u, image->v, |
779 : | edgomez | 851 | edged_width, edged_width2, width, height, (csp & XVID_CSP_VFLIP), |
780 : | interlacing?yv12_to_rgbai :yv12_to_rgba, | ||
781 : | interlacing?yv12_to_rgbai_c:yv12_to_rgba_c, 4); | ||
782 : | albeu | 315 | return 0; |
783 : | |||
784 : | edgomez | 1382 | case XVID_CSP_ARGB: |
785 : | safe_packed_conv( | ||
786 : | dst[0], dst_stride[0], image->y, image->u, image->v, | ||
787 : | edged_width, edged_width2, width, height, (csp & XVID_CSP_VFLIP), | ||
788 : | interlacing?yv12_to_argbi :yv12_to_argb, | ||
789 : | interlacing?yv12_to_argbi_c:yv12_to_argb_c, 4); | ||
790 : | return 0; | ||
791 : | |||
792 : | albeu | 315 | case XVID_CSP_YUY2: |
793 : | edgomez | 851 | safe_packed_conv( |
794 : | edgomez | 1382 | dst[0], dst_stride[0], image->y, image->u, image->v, |
795 : | edgomez | 851 | edged_width, edged_width2, width, height, (csp & XVID_CSP_VFLIP), |
796 : | interlacing?yv12_to_yuyvi :yv12_to_yuyv, | ||
797 : | interlacing?yv12_to_yuyvi_c:yv12_to_yuyv_c, 2); | ||
798 : | albeu | 315 | return 0; |
799 : | |||
800 : | edgomez | 1382 | case XVID_CSP_YVYU: /* u,v swapped */ |
801 : | edgomez | 851 | safe_packed_conv( |
802 : | edgomez | 1382 | dst[0], dst_stride[0], image->y, image->v, image->u, |
803 : | edgomez | 851 | edged_width, edged_width2, width, height, (csp & XVID_CSP_VFLIP), |
804 : | interlacing?yv12_to_yuyvi :yv12_to_yuyv, | ||
805 : | interlacing?yv12_to_yuyvi_c:yv12_to_yuyv_c, 2); | ||
806 : | albeu | 315 | return 0; |
807 : | |||
808 : | case XVID_CSP_UYVY: | ||
809 : | edgomez | 851 | safe_packed_conv( |
810 : | edgomez | 1382 | dst[0], dst_stride[0], image->y, image->u, image->v, |
811 : | edgomez | 851 | edged_width, edged_width2, width, height, (csp & XVID_CSP_VFLIP), |
812 : | interlacing?yv12_to_uyvyi :yv12_to_uyvy, | ||
813 : | interlacing?yv12_to_uyvyi_c:yv12_to_uyvy_c, 2); | ||
814 : | albeu | 315 | return 0; |
815 : | |||
816 : | edgomez | 1382 | case XVID_CSP_I420: /* YCbCr == YUV == internal colorspace for MPEG */ |
817 : | yv12_to_yv12(dst[0], dst[0] + dst_stride[0]*height, dst[0] + dst_stride[0]*height + (dst_stride[0]/2)*height2, | ||
818 : | dst_stride[0], dst_stride[0]/2, | ||
819 : | edgomez | 851 | image->y, image->u, image->v, edged_width, edged_width2, |
820 : | width, height, (csp & XVID_CSP_VFLIP)); | ||
821 : | return 0; | ||
822 : | |||
823 : | edgomez | 1382 | case XVID_CSP_YV12: /* YCrCb == YVU == U and V plane swapped */ |
824 : | yv12_to_yv12(dst[0], dst[0] + dst_stride[0]*height, dst[0] + dst_stride[0]*height + (dst_stride[0]/2)*height2, | ||
825 : | dst_stride[0], dst_stride[0]/2, | ||
826 : | edgomez | 851 | image->y, image->v, image->u, edged_width, edged_width2, |
827 : | width, height, (csp & XVID_CSP_VFLIP)); | ||
828 : | return 0; | ||
829 : | |||
830 : | edgomez | 1382 | case XVID_CSP_PLANAR: /* YCbCr with arbitrary pointers and different strides for Y and UV */ |
831 : | yv12_to_yv12(dst[0], dst[1], dst[2], | ||
832 : | dst_stride[0], dst_stride[1], /* v: dst_stride[2] not yet supported */ | ||
833 : | image->y, image->u, image->v, edged_width, edged_width2, | ||
834 : | width, height, (csp & XVID_CSP_VFLIP)); | ||
835 : | albeu | 315 | return 0; |
836 : | |||
837 : | edgomez | 1382 | case XVID_CSP_INTERNAL : |
838 : | dst[0] = image->y; | ||
839 : | dst[1] = image->u; | ||
840 : | dst[2] = image->v; | ||
841 : | dst_stride[0] = edged_width; | ||
842 : | dst_stride[1] = edged_width/2; | ||
843 : | dst_stride[2] = edged_width/2; | ||
844 : | return 0; | ||
845 : | |||
846 : | albeu | 315 | case XVID_CSP_NULL: |
847 : | edgomez | 1382 | case XVID_CSP_SLICE: |
848 : | albeu | 315 | return 0; |
849 : | |||
850 : | } | ||
851 : | |||
852 : | return -1; | ||
853 : | } | ||
854 : | |||
855 : | float | ||
856 : | image_psnr(IMAGE * orig_image, | ||
857 : | IMAGE * recon_image, | ||
858 : | uint16_t stride, | ||
859 : | uint16_t width, | ||
860 : | uint16_t height) | ||
861 : | { | ||
862 : | int32_t diff, x, y, quad = 0; | ||
863 : | uint8_t *orig = orig_image->y; | ||
864 : | uint8_t *recon = recon_image->y; | ||
865 : | float psnr_y; | ||
866 : | |||
867 : | for (y = 0; y < height; y++) { | ||
868 : | for (x = 0; x < width; x++) { | ||
869 : | diff = *(orig + x) - *(recon + x); | ||
870 : | quad += diff * diff; | ||
871 : | } | ||
872 : | orig += stride; | ||
873 : | recon += stride; | ||
874 : | } | ||
875 : | |||
876 : | psnr_y = (float) quad / (float) (width * height); | ||
877 : | |||
878 : | if (psnr_y) { | ||
879 : | psnr_y = (float) (255 * 255) / psnr_y; | ||
880 : | psnr_y = 10 * (float) log10(psnr_y); | ||
881 : | } else | ||
882 : | psnr_y = (float) 99.99; | ||
883 : | |||
884 : | return psnr_y; | ||
885 : | } | ||
886 : | |||
887 : | |||
888 : | edgomez | 851 | float sse_to_PSNR(long sse, int pixels) |
889 : | { | ||
890 : | if (sse==0) | ||
891 : | return 99.99F; | ||
892 : | |||
893 : | edgomez | 1382 | return 48.131F - 10*(float)log10((float)sse/(float)(pixels)); /* log10(255*255)=4.8131 */ |
894 : | edgomez | 851 | |
895 : | } | ||
896 : | |||
/*
 * Sum of squared differences between two 8 bit planes.
 *
 * The width x height area is split in three parts:
 *  - whole 8x8 blocks, handed to sse8_8bit()
 *  - the columns right of the last whole block, for each 8 row band
 *  - the rows below the last whole band, over the full width
 *
 * Both planes use the same `stride` (bytes between rows).
 */
long plane_sse(uint8_t *orig,
			   uint8_t *recon,
			   uint16_t stride,
			   uint16_t width,
			   uint16_t height)
{
	const int full_w = width & (~0x07);		/* width rounded down to 8 */
	const int full_h = height & (~0x07);	/* height rounded down to 8 */
	long total = 0;
	int row, col, line;

	/* 8 row bands */
	for (row = 0; row < full_h; row += 8) {

		/* whole 8x8 blocks of the band */
		for (col = 0; col < full_w; col += 8)
			total += sse8_8bit(orig + col, recon + col, stride);

		/* leftover columns of the band, 8 rows each */
		for (col = full_w; col < width; col++) {
			for (line = 0; line < 8; line++) {
				const int d = orig[line*stride + col] - recon[line*stride + col];
				total += d * d;
			}
		}

		orig += 8*stride;
		recon += 8*stride;
	}

	/* leftover rows below the last band */
	for (row = full_h; row < height; row++) {
		for (col = 0; col < width; col++) {
			const int d = orig[col] - recon[col];
			total += d * d;
		}
		orig += stride;
		recon += stride;
	}

	return total;
}
956 : | |||
957 : | edgomez | 1382 | #if 0 |
958 : | edgomez | 851 | |
959 : | albeu | 315 | #include <stdio.h> |
960 : | #include <string.h> | ||
961 : | |||
/*
 * Write a width x height 8 bit buffer to `filename` as a binary PGM (P5).
 *
 * `bmp` is read as width*height contiguous bytes.
 * Returns 0 on success, -1 if the file cannot be opened or if writing or
 * closing it fails.
 */
int image_dump_pgm(uint8_t * bmp, uint32_t width, uint32_t height, char * filename)
{
	FILE * f;
	int ok;

	f = fopen(filename, "wb");
	if (f == NULL)
		return -1;

	/* dimensions are unsigned: print them as such */
	ok = (fprintf(f, "P5\n#xvid\n%lu %lu\n255\n",
				  (unsigned long) width, (unsigned long) height) >= 0);

	/* fwrite() returns 0 for an empty request, so only check real payloads */
	if (ok && width > 0 && height > 0)
		ok = (fwrite(bmp, width, height, f) == height);

	/* fclose() flushes: a failure here means the file is incomplete */
	if (fclose(f) != 0)
		ok = 0;

	return ok ? 0 : -1;
}
979 : | |||
980 : | |||
981 : | edgomez | 1382 | /* dump image+edges to yuv pgm files */ |
982 : | albeu | 315 | |
983 : | int image_dump(IMAGE * image, uint32_t edged_width, uint32_t edged_height, char * path, int number) | ||
984 : | { | ||
985 : | char filename[1024]; | ||
986 : | |||
987 : | sprintf(filename, "%s_%i_%c.pgm", path, number, 'y'); | ||
988 : | image_dump_pgm( | ||
989 : | image->y - (EDGE_SIZE * edged_width + EDGE_SIZE), | ||
990 : | edged_width, edged_height, filename); | ||
991 : | |||
992 : | sprintf(filename, "%s_%i_%c.pgm", path, number, 'u'); | ||
993 : | image_dump_pgm( | ||
994 : | image->u - (EDGE_SIZE2 * edged_width / 2 + EDGE_SIZE2), | ||
995 : | edged_width / 2, edged_height / 2, filename); | ||
996 : | |||
997 : | sprintf(filename, "%s_%i_%c.pgm", path, number, 'v'); | ||
998 : | image_dump_pgm( | ||
999 : | image->v - (EDGE_SIZE2 * edged_width / 2 + EDGE_SIZE2), | ||
1000 : | edged_width / 2, edged_height / 2, filename); | ||
1001 : | |||
1002 : | return 0; | ||
1003 : | } | ||
1004 : | edgomez | 1382 | #endif |
1005 : | albeu | 315 | |
1006 : | |||
1007 : | |||
1008 : | /* dump image to yuvpgm file */ | ||
1009 : | |||
1010 : | #include <stdio.h> | ||
1011 : | |||
1012 : | int | ||
1013 : | image_dump_yuvpgm(const IMAGE * image, | ||
1014 : | const uint32_t edged_width, | ||
1015 : | const uint32_t width, | ||
1016 : | const uint32_t height, | ||
1017 : | char *filename) | ||
1018 : | { | ||
1019 : | FILE *f; | ||
1020 : | char hdr[1024]; | ||
1021 : | uint32_t i; | ||
1022 : | uint8_t *bmp1; | ||
1023 : | uint8_t *bmp2; | ||
1024 : | |||
1025 : | |||
1026 : | f = fopen(filename, "wb"); | ||
1027 : | if (f == NULL) { | ||
1028 : | return -1; | ||
1029 : | } | ||
1030 : | sprintf(hdr, "P5\n#xvid\n%i %i\n255\n", width, (3 * height) / 2); | ||
1031 : | fwrite(hdr, strlen(hdr), 1, f); | ||
1032 : | |||
1033 : | bmp1 = image->y; | ||
1034 : | for (i = 0; i < height; i++) { | ||
1035 : | fwrite(bmp1, width, 1, f); | ||
1036 : | bmp1 += edged_width; | ||
1037 : | } | ||
1038 : | |||
1039 : | bmp1 = image->u; | ||
1040 : | bmp2 = image->v; | ||
1041 : | for (i = 0; i < height / 2; i++) { | ||
1042 : | fwrite(bmp1, width / 2, 1, f); | ||
1043 : | fwrite(bmp2, width / 2, 1, f); | ||
1044 : | bmp1 += edged_width / 2; | ||
1045 : | bmp2 += edged_width / 2; | ||
1046 : | } | ||
1047 : | |||
1048 : | fclose(f); | ||
1049 : | return 0; | ||
1050 : | } | ||
1051 : | |||
1052 : | |||
1053 : | float | ||
1054 : | image_mad(const IMAGE * img1, | ||
1055 : | const IMAGE * img2, | ||
1056 : | uint32_t stride, | ||
1057 : | uint32_t width, | ||
1058 : | uint32_t height) | ||
1059 : | { | ||
1060 : | const uint32_t stride2 = stride / 2; | ||
1061 : | const uint32_t width2 = width / 2; | ||
1062 : | const uint32_t height2 = height / 2; | ||
1063 : | |||
1064 : | uint32_t x, y; | ||
1065 : | uint32_t sum = 0; | ||
1066 : | |||
1067 : | for (y = 0; y < height; y++) | ||
1068 : | for (x = 0; x < width; x++) | ||
1069 : | edgomez | 1382 | sum += abs(img1->y[x + y * stride] - img2->y[x + y * stride]); |
1070 : | albeu | 315 | |
1071 : | for (y = 0; y < height2; y++) | ||
1072 : | for (x = 0; x < width2; x++) | ||
1073 : | edgomez | 1382 | sum += abs(img1->u[x + y * stride2] - img2->u[x + y * stride2]); |
1074 : | albeu | 315 | |
1075 : | for (y = 0; y < height2; y++) | ||
1076 : | for (x = 0; x < width2; x++) | ||
1077 : | edgomez | 1382 | sum += abs(img1->v[x + y * stride2] - img2->v[x + y * stride2]); |
1078 : | albeu | 315 | |
1079 : | return (float) sum / (width * height * 3 / 2); | ||
1080 : | } | ||
1081 : | |||
1082 : | void | ||
1083 : | edgomez | 1382 | output_slice(IMAGE * cur, int std, int width, xvid_image_t* out_frm, int mbx, int mby,int mbl) { |
1084 : | albeu | 315 | uint8_t *dY,*dU,*dV,*sY,*sU,*sV; |
1085 : | int std2 = std >> 1; | ||
1086 : | int w = mbl << 4, w2,i; | ||
1087 : | |||
1088 : | if(w > width) | ||
1089 : | w = width; | ||
1090 : | w2 = w >> 1; | ||
1091 : | suxen_drol | 323 | |
1092 : | edgomez | 1382 | dY = (uint8_t*)out_frm->plane[0] + (mby << 4) * out_frm->stride[0] + (mbx << 4); |
1093 : | dU = (uint8_t*)out_frm->plane[1] + (mby << 3) * out_frm->stride[1] + (mbx << 3); | ||
1094 : | dV = (uint8_t*)out_frm->plane[2] + (mby << 3) * out_frm->stride[2] + (mbx << 3); | ||
1095 : | albeu | 315 | sY = cur->y + (mby << 4) * std + (mbx << 4); |
1096 : | sU = cur->u + (mby << 3) * std2 + (mbx << 3); | ||
1097 : | sV = cur->v + (mby << 3) * std2 + (mbx << 3); | ||
1098 : | |||
1099 : | for(i = 0 ; i < 16 ; i++) { | ||
1100 : | memcpy(dY,sY,w); | ||
1101 : | edgomez | 1382 | dY += out_frm->stride[0]; |
1102 : | suxen_drol | 323 | sY += std; |
1103 : | } | ||
1104 : | albeu | 315 | for(i = 0 ; i < 8 ; i++) { |
1105 : | memcpy(dU,sU,w2); | ||
1106 : | edgomez | 1382 | dU += out_frm->stride[1]; |
1107 : | albeu | 315 | sU += std2; |
1108 : | } | ||
1109 : | for(i = 0 ; i < 8 ; i++) { | ||
1110 : | memcpy(dV,sV,w2); | ||
1111 : | edgomez | 1382 | dV += out_frm->stride[2]; |
1112 : | albeu | 315 | sV += std2; |
1113 : | } | ||
1114 : | } | ||
1115 : | edgomez | 851 | |
1116 : | |||
1117 : | void | ||
1118 : | image_clear(IMAGE * img, int width, int height, int edged_width, | ||
1119 : | int y, int u, int v) | ||
1120 : | { | ||
1121 : | uint8_t * p; | ||
1122 : | int i; | ||
1123 : | |||
1124 : | p = img->y; | ||
1125 : | for (i = 0; i < height; i++) { | ||
1126 : | memset(p, y, width); | ||
1127 : | p += edged_width; | ||
1128 : | } | ||
1129 : | |||
1130 : | p = img->u; | ||
1131 : | for (i = 0; i < height/2; i++) { | ||
1132 : | memset(p, u, width/2); | ||
1133 : | p += edged_width/2; | ||
1134 : | } | ||
1135 : | |||
1136 : | p = img->v; | ||
1137 : | for (i = 0; i < height/2; i++) { | ||
1138 : | memset(p, v, width/2); | ||
1139 : | p += edged_width/2; | ||
1140 : | } | ||
1141 : | } | ||
1142 : | |||
1143 : | |||
1144 : | edgomez | 1382 | /* reduced resolution deblocking filter |
1145 : | edgomez | 851 | block = block size (16=rrv, 8=full resolution) |
1146 : | flags = XVID_DEC_YDEBLOCK|XVID_DEC_UVDEBLOCK | ||
1147 : | */ | ||
1148 : | void | ||
1149 : | image_deblock_rrv(IMAGE * img, int edged_width, | ||
1150 : | const MACROBLOCK * mbs, int mb_width, int mb_height, int mb_stride, | ||
1151 : | int block, int flags) | ||
1152 : | { | ||
1153 : | const int edged_width2 = edged_width /2; | ||
1154 : | const int nblocks = block / 8; /* skals code uses 8pixel block uints */ | ||
1155 : | int i,j; | ||
1156 : | |||
1157 : | /* luma: j,i in block units */ | ||
1158 : | edgomez | 1382 | |
1159 : | edgomez | 851 | for (j = 1; j < mb_height*2; j++) /* horizontal deblocking */ |
1160 : | for (i = 0; i < mb_width*2; i++) | ||
1161 : | { | ||
1162 : | if (mbs[(j-1)/2*mb_stride + (i/2)].mode != MODE_NOT_CODED || | ||
1163 : | mbs[(j+0)/2*mb_stride + (i/2)].mode != MODE_NOT_CODED) | ||
1164 : | { | ||
1165 : | hfilter_31(img->y + (j*block - 1)*edged_width + i*block, | ||
1166 : | img->y + (j*block + 0)*edged_width + i*block, nblocks); | ||
1167 : | } | ||
1168 : | } | ||
1169 : | |||
1170 : | for (j = 0; j < mb_height*2; j++) /* vertical deblocking */ | ||
1171 : | for (i = 1; i < mb_width*2; i++) | ||
1172 : | { | ||
1173 : | if (mbs[(j/2)*mb_stride + (i-1)/2].mode != MODE_NOT_CODED || | ||
1174 : | mbs[(j/2)*mb_stride + (i+0)/2].mode != MODE_NOT_CODED) | ||
1175 : | { | ||
1176 : | vfilter_31(img->y + (j*block)*edged_width + i*block - 1, | ||
1177 : | img->y + (j*block)*edged_width + i*block + 0, | ||
1178 : | edged_width, nblocks); | ||
1179 : | } | ||
1180 : | } | ||
1181 : | |||
1182 : | |||
1183 : | edgomez | 1382 | |
1184 : | edgomez | 851 | /* chroma */ |
1185 : | edgomez | 1382 | |
1186 : | edgomez | 851 | for (j = 1; j < mb_height; j++) /* horizontal deblocking */ |
1187 : | for (i = 0; i < mb_width; i++) | ||
1188 : | { | ||
1189 : | edgomez | 1382 | if (mbs[(j-1)*mb_stride + i].mode != MODE_NOT_CODED || |
1190 : | edgomez | 851 | mbs[(j+0)*mb_stride + i].mode != MODE_NOT_CODED) |
1191 : | { | ||
1192 : | hfilter_31(img->u + (j*block - 1)*edged_width2 + i*block, | ||
1193 : | img->u + (j*block + 0)*edged_width2 + i*block, nblocks); | ||
1194 : | hfilter_31(img->v + (j*block - 1)*edged_width2 + i*block, | ||
1195 : | img->v + (j*block + 0)*edged_width2 + i*block, nblocks); | ||
1196 : | } | ||
1197 : | } | ||
1198 : | |||
1199 : | edgomez | 1382 | for (j = 0; j < mb_height; j++) /* vertical deblocking */ |
1200 : | edgomez | 851 | for (i = 1; i < mb_width; i++) |
1201 : | { | ||
1202 : | if (mbs[j*mb_stride + i - 1].mode != MODE_NOT_CODED || | ||
1203 : | edgomez | 1382 | mbs[j*mb_stride + i + 0].mode != MODE_NOT_CODED) |
1204 : | edgomez | 851 | { |
1205 : | vfilter_31(img->u + (j*block)*edged_width2 + i*block - 1, | ||
1206 : | img->u + (j*block)*edged_width2 + i*block + 0, | ||
1207 : | edged_width2, nblocks); | ||
1208 : | vfilter_31(img->v + (j*block)*edged_width2 + i*block - 1, | ||
1209 : | img->v + (j*block)*edged_width2 + i*block + 0, | ||
1210 : | edged_width2, nblocks); | ||
1211 : | } | ||
1212 : | } | ||
1213 : | |||
1214 : | edgomez | 1382 | |
1215 : | edgomez | 851 | } |
1216 : |
No admin address has been configured | ViewVC Help |
Powered by ViewVC 1.0.4 |