Annotation of /trunk/xvidcore/src/image/image.c

Revision 1959 - (view) (download)

1 :	edgomez	851	/**************************************************************************
2 :	albeu	315	*
3 :	edgomez	1382	* XVID MPEG-4 VIDEO CODEC
4 :			* - Image management functions -
5 :	albeu	315	*
6 :	Isibaar	1909	* Copyright(C) 2001-2010 Peter Ross <pross@xvid.org>
7 :	albeu	315	*
8 :	edgomez	1382	* This program is free software ; you can redistribute it and/or modify
9 :			* it under the terms of the GNU General Public License as published by
10 :			* the Free Software Foundation ; either version 2 of the License, or
11 :			* (at your option) any later version.
12 :	albeu	315	*
13 :	edgomez	1382	* This program is distributed in the hope that it will be useful,
14 :			* but WITHOUT ANY WARRANTY ; without even the implied warranty of
15 :			* MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
16 :			* GNU General Public License for more details.
17 :	albeu	315	*
18 :	edgomez	1382	* You should have received a copy of the GNU General Public License
19 :			* along with this program ; if not, write to the Free Software
20 :			* Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA 02111-1307 USA
21 :	albeu	315	*
22 :	Isibaar	1959	* $Id: image.c,v 1.48 2011-03-08 19:16:32 Isibaar Exp $
23 :	albeu	315	*
24 :	edgomez	1382	****************************************************************************/
25 :	albeu	315
26 :			#include <stdlib.h>
27 :	edgomez	1382	#include <string.h> /* memcpy, memset */
28 :	albeu	315	#include <math.h>
29 :			#include "../portab.h"
30 :	edgomez	1382	#include "../global.h"
31 :			#include "../xvid.h"
32 :	albeu	315	#include "image.h"
33 :			#include "colorspace.h"
34 :			#include "interpolate8x8.h"
35 :			#include "../utils/mem_align.h"
36 :	edgomez	1424	#include "../motion/sad.h"
37 :	Skal	1733	#include "../utils/emms.h"
38 :	albeu	315
39 :	edgomez	1382	#include "font.h"
40 :	edgomez	851
41 :	albeu	315	#define SAFETY 64
42 :			#define EDGE_SIZE2 (EDGE_SIZE/2)
43 :
44 :
45 :			int32_t
46 :			image_create(IMAGE * image,
47 :			uint32_t edged_width,
48 :			uint32_t edged_height)
49 :			{
50 :			const uint32_t edged_width2 = edged_width / 2;
51 :			const uint32_t edged_height2 = edged_height / 2;
52 :
53 :			image->y =
54 :			xvid_malloc(edged_width * (edged_height + 1) + SAFETY, CACHE_LINE);
55 :			if (image->y == NULL) {
56 :			return -1;
57 :			}
58 :	edgomez	1382	memset(image->y, 0, edged_width * (edged_height + 1) + SAFETY);
59 :	albeu	315
60 :			image->u = xvid_malloc(edged_width2 * edged_height2 + SAFETY, CACHE_LINE);
61 :			if (image->u == NULL) {
62 :			xvid_free(image->y);
63 :	edgomez	1382	image->y = NULL;
64 :	albeu	315	return -1;
65 :			}
66 :	edgomez	1382	memset(image->u, 0, edged_width2 * edged_height2 + SAFETY);
67 :
68 :	albeu	315	image->v = xvid_malloc(edged_width2 * edged_height2 + SAFETY, CACHE_LINE);
69 :			if (image->v == NULL) {
70 :			xvid_free(image->u);
71 :	edgomez	1382	image->u = NULL;
72 :	albeu	315	xvid_free(image->y);
73 :	edgomez	1382	image->y = NULL;
74 :	albeu	315	return -1;
75 :			}
76 :	edgomez	1382	memset(image->v, 0, edged_width2 * edged_height2 + SAFETY);
77 :	albeu	315
78 :			image->y += EDGE_SIZE * edged_width + EDGE_SIZE;
79 :			image->u += EDGE_SIZE2 * edged_width2 + EDGE_SIZE2;
80 :			image->v += EDGE_SIZE2 * edged_width2 + EDGE_SIZE2;
81 :
82 :			return 0;
83 :			}
84 :
85 :
86 :
87 :			void
88 :			image_destroy(IMAGE * image,
89 :			uint32_t edged_width,
90 :			uint32_t edged_height)
91 :			{
92 :			const uint32_t edged_width2 = edged_width / 2;
93 :
94 :			if (image->y) {
95 :			xvid_free(image->y - (EDGE_SIZE * edged_width + EDGE_SIZE));
96 :	edgomez	1382	image->y = NULL;
97 :	albeu	315	}
98 :			if (image->u) {
99 :			xvid_free(image->u - (EDGE_SIZE2 * edged_width2 + EDGE_SIZE2));
100 :	edgomez	1382	image->u = NULL;
101 :	albeu	315	}
102 :			if (image->v) {
103 :			xvid_free(image->v - (EDGE_SIZE2 * edged_width2 + EDGE_SIZE2));
104 :	edgomez	1382	image->v = NULL;
105 :	albeu	315	}
106 :			}
107 :
108 :
109 :			void
110 :			image_swap(IMAGE * image1,
111 :			IMAGE * image2)
112 :			{
113 :	edgomez	1382	SWAP(uint8_t*, image1->y, image2->y);
114 :			SWAP(uint8_t*, image1->u, image2->u);
115 :			SWAP(uint8_t*, image1->v, image2->v);
116 :	albeu	315	}
117 :
118 :
119 :			void
120 :			image_copy(IMAGE * image1,
121 :			IMAGE * image2,
122 :			uint32_t edged_width,
123 :			uint32_t height)
124 :			{
125 :			memcpy(image1->y, image2->y, edged_width * height);
126 :			memcpy(image1->u, image2->u, edged_width * height / 4);
127 :			memcpy(image1->v, image2->v, edged_width * height / 4);
128 :			}
129 :
130 :	Isibaar	1959	/* setedges bug was in this BS versions */
131 :	edgomez	1382	#define SETEDGES_BUG_BEFORE 18
132 :	Isibaar	1959	#define SETEDGES_BUG_AFTER 57
133 :			#define SETEDGES_BUG_REFIXED 63
134 :	albeu	315
135 :			void
136 :			image_setedges(IMAGE * image,
137 :			uint32_t edged_width,
138 :			uint32_t edged_height,
139 :			uint32_t width,
140 :	edgomez	1382	uint32_t height,
141 :			int bs_version)
142 :	albeu	315	{
143 :			const uint32_t edged_width2 = edged_width / 2;
144 :	edgomez	1382	uint32_t width2;
145 :	albeu	315	uint32_t i;
146 :			uint8_t *dst;
147 :			uint8_t *src;
148 :
149 :			dst = image->y - (EDGE_SIZE + EDGE_SIZE * edged_width);
150 :			src = image->y;
151 :
152 :	edgomez	1382	/* According to the Standard Clause 7.6.4, padding is done starting at 16
153 :			* pixel width and height multiples. This was not respected in old xvids */
154 :	Isibaar	1959	if (bs_version >= SETEDGES_BUG_BEFORE &&
155 :			bs_version < SETEDGES_BUG_AFTER \|\|
156 :			bs_version >= SETEDGES_BUG_REFIXED) {
157 :	edgomez	1382	width = (width+15)&~15;
158 :			height = (height+15)&~15;
159 :			}
160 :
161 :			width2 = width/2;
162 :
163 :	albeu	315	for (i = 0; i < EDGE_SIZE; i++) {
164 :	edgomez	851	memset(dst, *src, EDGE_SIZE);
165 :			memcpy(dst + EDGE_SIZE, src, width);
166 :			memset(dst + edged_width - EDGE_SIZE, *(src + width - 1),
167 :			EDGE_SIZE);
168 :	albeu	315	dst += edged_width;
169 :			}
170 :
171 :			for (i = 0; i < height; i++) {
172 :			memset(dst, *src, EDGE_SIZE);
173 :			memset(dst + edged_width - EDGE_SIZE, src[width - 1], EDGE_SIZE);
174 :			dst += edged_width;
175 :			src += edged_width;
176 :			}
177 :
178 :			src -= edged_width;
179 :			for (i = 0; i < EDGE_SIZE; i++) {
180 :	edgomez	851	memset(dst, *src, EDGE_SIZE);
181 :			memcpy(dst + EDGE_SIZE, src, width);
182 :			memset(dst + edged_width - EDGE_SIZE, *(src + width - 1),
183 :	albeu	315	EDGE_SIZE);
184 :			dst += edged_width;
185 :			}
186 :
187 :
188 :	edgomez	1382	/* U */
189 :	albeu	315	dst = image->u - (EDGE_SIZE2 + EDGE_SIZE2 * edged_width2);
190 :			src = image->u;
191 :
192 :			for (i = 0; i < EDGE_SIZE2; i++) {
193 :			memset(dst, *src, EDGE_SIZE2);
194 :			memcpy(dst + EDGE_SIZE2, src, width2);
195 :			memset(dst + edged_width2 - EDGE_SIZE2, *(src + width2 - 1),
196 :			EDGE_SIZE2);
197 :			dst += edged_width2;
198 :			}
199 :
200 :			for (i = 0; i < height / 2; i++) {
201 :			memset(dst, *src, EDGE_SIZE2);
202 :			memset(dst + edged_width2 - EDGE_SIZE2, src[width2 - 1], EDGE_SIZE2);
203 :			dst += edged_width2;
204 :			src += edged_width2;
205 :			}
206 :			src -= edged_width2;
207 :			for (i = 0; i < EDGE_SIZE2; i++) {
208 :			memset(dst, *src, EDGE_SIZE2);
209 :			memcpy(dst + EDGE_SIZE2, src, width2);
210 :			memset(dst + edged_width2 - EDGE_SIZE2, *(src + width2 - 1),
211 :			EDGE_SIZE2);
212 :			dst += edged_width2;
213 :			}
214 :
215 :
216 :	edgomez	1382	/* V */
217 :	albeu	315	dst = image->v - (EDGE_SIZE2 + EDGE_SIZE2 * edged_width2);
218 :			src = image->v;
219 :
220 :			for (i = 0; i < EDGE_SIZE2; i++) {
221 :			memset(dst, *src, EDGE_SIZE2);
222 :			memcpy(dst + EDGE_SIZE2, src, width2);
223 :			memset(dst + edged_width2 - EDGE_SIZE2, *(src + width2 - 1),
224 :			EDGE_SIZE2);
225 :			dst += edged_width2;
226 :			}
227 :
228 :			for (i = 0; i < height / 2; i++) {
229 :			memset(dst, *src, EDGE_SIZE2);
230 :			memset(dst + edged_width2 - EDGE_SIZE2, src[width2 - 1], EDGE_SIZE2);
231 :			dst += edged_width2;
232 :			src += edged_width2;
233 :			}
234 :			src -= edged_width2;
235 :			for (i = 0; i < EDGE_SIZE2; i++) {
236 :			memset(dst, *src, EDGE_SIZE2);
237 :			memcpy(dst + EDGE_SIZE2, src, width2);
238 :			memset(dst + edged_width2 - EDGE_SIZE2, *(src + width2 - 1),
239 :			EDGE_SIZE2);
240 :			dst += edged_width2;
241 :			}
242 :			}
243 :
244 :			void
245 :	syskin	1665	image_interpolate(const uint8_t * refn,
246 :			uint8_t * refh,
247 :			uint8_t * refv,
248 :			uint8_t * refhv,
249 :	albeu	315	uint32_t edged_width,
250 :			uint32_t edged_height,
251 :	edgomez	851	uint32_t quarterpel,
252 :	albeu	315	uint32_t rounding)
253 :			{
254 :	edgomez	1382	const uint32_t offset = EDGE_SIZE2 * (edged_width + 1); /* we only interpolate half of the edge area */
255 :	albeu	315	const uint32_t stride_add = 7 * edged_width;
256 :	syskin	1664
257 :	syskin	1665	uint8_t *n_ptr;
258 :			uint8_t h_ptr, v_ptr, *hv_ptr;
259 :	albeu	315	uint32_t x, y;
260 :
261 :	syskin	1665	n_ptr = (uint8_t*)refn;
262 :			h_ptr = refh;
263 :	syskin	1666	v_ptr = refv;
264 :	albeu	315
265 :			n_ptr -= offset;
266 :			h_ptr -= offset;
267 :			v_ptr -= offset;
268 :
269 :	edgomez	1382	/* Note we initialize the hv pointer later, as we can optimize code a bit
270 :			* doing it down to up in quarterpel and up to down in halfpel */
271 :	edgomez	851	if(quarterpel) {
272 :	edgomez	1382
273 :	edgomez	851	for (y = 0; y < (edged_height - EDGE_SIZE); y += 8) {
274 :			for (x = 0; x < (edged_width - EDGE_SIZE); x += 8) {
275 :			interpolate8x8_6tap_lowpass_h(h_ptr, n_ptr, edged_width, rounding);
276 :			interpolate8x8_6tap_lowpass_v(v_ptr, n_ptr, edged_width, rounding);
277 :	albeu	315
278 :	edgomez	851	n_ptr += 8;
279 :			h_ptr += 8;
280 :			v_ptr += 8;
281 :			}
282 :	edgomez	1382
283 :	edgomez	851	n_ptr += EDGE_SIZE;
284 :			h_ptr += EDGE_SIZE;
285 :			v_ptr += EDGE_SIZE;
286 :
287 :			h_ptr += stride_add;
288 :			v_ptr += stride_add;
289 :			n_ptr += stride_add;
290 :			}
291 :
292 :	syskin	1665	h_ptr = refh + (edged_height - EDGE_SIZE - EDGE_SIZE2)*edged_width - EDGE_SIZE2;
293 :			hv_ptr = refhv + (edged_height - EDGE_SIZE - EDGE_SIZE2)*edged_width - EDGE_SIZE2;
294 :	edgomez	851
295 :			for (y = 0; y < (edged_height - EDGE_SIZE); y = y + 8) {
296 :	edgomez	1382	hv_ptr -= stride_add;
297 :			h_ptr -= stride_add;
298 :			hv_ptr -= EDGE_SIZE;
299 :			h_ptr -= EDGE_SIZE;
300 :
301 :	edgomez	851	for (x = 0; x < (edged_width - EDGE_SIZE); x = x + 8) {
302 :	edgomez	1382	hv_ptr -= 8;
303 :			h_ptr -= 8;
304 :	edgomez	851	interpolate8x8_6tap_lowpass_v(hv_ptr, h_ptr, edged_width, rounding);
305 :			}
306 :			}
307 :	edgomez	1382	} else {
308 :	edgomez	851
309 :	syskin	1665	hv_ptr = refhv;
310 :	edgomez	1382	hv_ptr -= offset;
311 :
312 :	edgomez	851	for (y = 0; y < (edged_height - EDGE_SIZE); y += 8) {
313 :			for (x = 0; x < (edged_width - EDGE_SIZE); x += 8) {
314 :			interpolate8x8_halfpel_h(h_ptr, n_ptr, edged_width, rounding);
315 :			interpolate8x8_halfpel_v(v_ptr, n_ptr, edged_width, rounding);
316 :			interpolate8x8_halfpel_hv(hv_ptr, n_ptr, edged_width, rounding);
317 :
318 :			n_ptr += 8;
319 :			h_ptr += 8;
320 :			v_ptr += 8;
321 :			hv_ptr += 8;
322 :			}
323 :	edgomez	1382
324 :	edgomez	851	h_ptr += EDGE_SIZE;
325 :			v_ptr += EDGE_SIZE;
326 :			hv_ptr += EDGE_SIZE;
327 :			n_ptr += EDGE_SIZE;
328 :
329 :			h_ptr += stride_add;
330 :			v_ptr += stride_add;
331 :			hv_ptr += stride_add;
332 :			n_ptr += stride_add;
333 :			}
334 :			}
335 :	albeu	315	}
336 :
337 :
338 :	edgomez	851	/*
339 :			chroma optimize filter, invented by mf
340 :			a chroma pixel is average from the surrounding pixels, when the
341 :			correpsonding luma pixels are pure black or white.
342 :			*/
343 :
344 :			void
345 :			image_chroma_optimize(IMAGE * img, int width, int height, int edged_width)
346 :			{
347 :			int x,y;
348 :			int pixels = 0;
349 :
350 :			for (y = 1; y < height/2 - 1; y++)
351 :			for (x = 1; x < width/2 - 1; x++)
352 :			{
353 :			#define IS_PURE(a) ((a)<=16\|\|(a)>=235)
354 :			#define IMG_Y(Y,X) img->y[(Y)*edged_width + (X)]
355 :			#define IMG_U(Y,X) img->u[(Y)*edged_width/2 + (X)]
356 :			#define IMG_V(Y,X) img->v[(Y)*edged_width/2 + (X)]
357 :
358 :	edgomez	1382	if (IS_PURE(IMG_Y(y2 ,x2 )) &&
359 :	edgomez	851	IS_PURE(IMG_Y(y2 ,x2+1)) &&
360 :	edgomez	1382	IS_PURE(IMG_Y(y2+1,x2 )) &&
361 :	edgomez	851	IS_PURE(IMG_Y(y2+1,x2+1)))
362 :			{
363 :			IMG_U(y,x) = (IMG_U(y,x-1) + IMG_U(y-1, x) + IMG_U(y, x+1) + IMG_U(y+1, x)) / 4;
364 :			IMG_V(y,x) = (IMG_V(y,x-1) + IMG_V(y-1, x) + IMG_V(y, x+1) + IMG_V(y+1, x)) / 4;
365 :			pixels++;
366 :			}
367 :
368 :			#undef IS_PURE
369 :			#undef IMG_Y
370 :			#undef IMG_U
371 :			#undef IMG_V
372 :			}
373 :	edgomez	1382
374 :			DPRINTF(XVID_DEBUG_DEBUG,"chroma_optimized_pixels = %i/%i\n", pixels, width*height/4);
375 :	edgomez	851	}
376 :
377 :
378 :
379 :
380 :
381 :			/*
382 :			perform safe packed colorspace conversion, by splitting
383 :			the image up into an optimized area (pixel width divisible by 16),
384 :			and two unoptimized/plain-c areas (pixel width divisible by 2)
385 :			*/
386 :
387 :	edgomez	1382	static void
388 :	edgomez	851	safe_packed_conv(uint8_t * x_ptr, int x_stride,
389 :			uint8_t * y_ptr, uint8_t * u_ptr, uint8_t * v_ptr,
390 :			int y_stride, int uv_stride,
391 :			int width, int height, int vflip,
392 :	Isibaar	1815	packedFunc * func_opt, packedFunc func_c,
393 :			int size, int interlacing)
394 :	edgomez	851	{
395 :	Isibaar	1815	int width_opt, width_c, height_opt;
396 :	edgomez	851
397 :	Isibaar	1856	if (width<0 \|\| width==1 \|\| height==1) return; /* forget about it */
398 :	Isibaar	1815
399 :	edgomez	851	if (func_opt != func_c && x_stride < size((width+15)/16)16)
400 :			{
401 :			width_opt = width & (~15);
402 :	Isibaar	1815	width_c = (width - width_opt) & (~1);
403 :	edgomez	851	}
404 :	Isibaar	1856	else if (func_opt != func_c && !(width&1) && (size==3))
405 :	edgomez	851	{
406 :	Isibaar	1856	/* MMX reads 4 bytes per pixel for RGB/BGR */
407 :			width_opt = width - 2;
408 :			width_c = 2;
409 :			}
410 :			else {
411 :	Isibaar	1815	/* Enforce the width to be divisable by two. */
412 :			width_opt = width & (~1);
413 :	edgomez	851	width_c = 0;
414 :			}
415 :
416 :	Isibaar	1815	/* packed conversions require height to be divisable by 2
417 :			(or even by 4 for interlaced conversion) */
418 :			if (interlacing)
419 :			height_opt = height & (~3);
420 :			else
421 :			height_opt = height & (~1);
422 :
423 :	edgomez	851	func_opt(x_ptr, x_stride,
424 :			y_ptr, u_ptr, v_ptr, y_stride, uv_stride,
425 :	Isibaar	1815	width_opt, height_opt, vflip);
426 :	edgomez	851
427 :			if (width_c)
428 :			{
429 :			func_c(x_ptr + size*width_opt, x_stride,
430 :			y_ptr + width_opt, u_ptr + width_opt/2, v_ptr + width_opt/2,
431 :	Isibaar	1815	y_stride, uv_stride, width_c, height_opt, vflip);
432 :	edgomez	851	}
433 :			}
434 :
435 :
436 :
437 :	albeu	315	int
438 :			image_input(IMAGE * image,
439 :			uint32_t width,
440 :			int height,
441 :			uint32_t edged_width,
442 :	edgomez	1382	uint8_t * src[4],
443 :			int src_stride[4],
444 :	edgomez	851	int csp,
445 :			int interlacing)
446 :	albeu	315	{
447 :	edgomez	851	const int edged_width2 = edged_width/2;
448 :			const int width2 = width/2;
449 :			const int height2 = height/2;
450 :	edgomez	1382	#if 0
451 :			const int height_signed = (csp & XVID_CSP_VFLIP) ? -height : height;
452 :			#endif
453 :	albeu	315
454 :			switch (csp & ~XVID_CSP_VFLIP) {
455 :			case XVID_CSP_RGB555:
456 :	edgomez	851	safe_packed_conv(
457 :	edgomez	1382	src[0], src_stride[0], image->y, image->u, image->v,
458 :	edgomez	851	edged_width, edged_width2, width, height, (csp & XVID_CSP_VFLIP),
459 :			interlacing?rgb555i_to_yv12 :rgb555_to_yv12,
460 :	Isibaar	1815	interlacing?rgb555i_to_yv12_c:rgb555_to_yv12_c, 2, interlacing);
461 :	edgomez	851	break;
462 :	albeu	315
463 :			case XVID_CSP_RGB565:
464 :	edgomez	851	safe_packed_conv(
465 :	edgomez	1382	src[0], src_stride[0], image->y, image->u, image->v,
466 :	edgomez	851	edged_width, edged_width2, width, height, (csp & XVID_CSP_VFLIP),
467 :			interlacing?rgb565i_to_yv12 :rgb565_to_yv12,
468 :	Isibaar	1815	interlacing?rgb565i_to_yv12_c:rgb565_to_yv12_c, 2, interlacing);
469 :	edgomez	851	break;
470 :	albeu	315
471 :
472 :	edgomez	1382	case XVID_CSP_BGR:
473 :	edgomez	851	safe_packed_conv(
474 :	edgomez	1382	src[0], src_stride[0], image->y, image->u, image->v,
475 :	edgomez	851	edged_width, edged_width2, width, height, (csp & XVID_CSP_VFLIP),
476 :			interlacing?bgri_to_yv12 :bgr_to_yv12,
477 :	Isibaar	1815	interlacing?bgri_to_yv12_c:bgr_to_yv12_c, 3, interlacing);
478 :	edgomez	851	break;
479 :	albeu	315
480 :	edgomez	1382	case XVID_CSP_BGRA:
481 :	edgomez	851	safe_packed_conv(
482 :	edgomez	1382	src[0], src_stride[0], image->y, image->u, image->v,
483 :	edgomez	851	edged_width, edged_width2, width, height, (csp & XVID_CSP_VFLIP),
484 :			interlacing?bgrai_to_yv12 :bgra_to_yv12,
485 :	Isibaar	1815	interlacing?bgrai_to_yv12_c:bgra_to_yv12_c, 4, interlacing);
486 :	edgomez	851	break;
487 :	albeu	315
488 :	edgomez	851	case XVID_CSP_ABGR :
489 :			safe_packed_conv(
490 :	edgomez	1382	src[0], src_stride[0], image->y, image->u, image->v,
491 :	edgomez	851	edged_width, edged_width2, width, height, (csp & XVID_CSP_VFLIP),
492 :			interlacing?abgri_to_yv12 :abgr_to_yv12,
493 :	Isibaar	1815	interlacing?abgri_to_yv12_c:abgr_to_yv12_c, 4, interlacing);
494 :	edgomez	851	break;
495 :	albeu	315
496 :	chl	1759	case XVID_CSP_RGB:
497 :			safe_packed_conv(
498 :			src[0], src_stride[0], image->y, image->u, image->v,
499 :			edged_width, edged_width2, width, height, (csp & XVID_CSP_VFLIP),
500 :			interlacing?rgbi_to_yv12 :rgb_to_yv12,
501 :	Isibaar	1815	interlacing?rgbi_to_yv12_c:rgb_to_yv12_c, 3, interlacing);
502 :	chl	1759	break;
503 :
504 :	edgomez	851	case XVID_CSP_RGBA :
505 :			safe_packed_conv(
506 :	edgomez	1382	src[0], src_stride[0], image->y, image->u, image->v,
507 :	edgomez	851	edged_width, edged_width2, width, height, (csp & XVID_CSP_VFLIP),
508 :			interlacing?rgbai_to_yv12 :rgba_to_yv12,
509 :	Isibaar	1815	interlacing?rgbai_to_yv12_c:rgba_to_yv12_c, 4, interlacing);
510 :	edgomez	851	break;
511 :	edgomez	1382
512 :			case XVID_CSP_ARGB:
513 :			safe_packed_conv(
514 :			src[0], src_stride[0], image->y, image->u, image->v,
515 :			edged_width, edged_width2, width, height, (csp & XVID_CSP_VFLIP),
516 :			interlacing?argbi_to_yv12 : argb_to_yv12,
517 :	Isibaar	1815	interlacing?argbi_to_yv12_c: argb_to_yv12_c, 4, interlacing);
518 :	edgomez	1382	break;
519 :	albeu	315
520 :			case XVID_CSP_YUY2:
521 :	edgomez	851	safe_packed_conv(
522 :	edgomez	1382	src[0], src_stride[0], image->y, image->u, image->v,
523 :	edgomez	851	edged_width, edged_width2, width, height, (csp & XVID_CSP_VFLIP),
524 :			interlacing?yuyvi_to_yv12 :yuyv_to_yv12,
525 :	Isibaar	1815	interlacing?yuyvi_to_yv12_c:yuyv_to_yv12_c, 2, interlacing);
526 :	edgomez	851	break;
527 :	albeu	315
528 :			case XVID_CSP_YVYU: /* u/v swapped */
529 :	edgomez	851	safe_packed_conv(
530 :	edgomez	1382	src[0], src_stride[0], image->y, image->v, image->u,
531 :	edgomez	851	edged_width, edged_width2, width, height, (csp & XVID_CSP_VFLIP),
532 :			interlacing?yuyvi_to_yv12 :yuyv_to_yv12,
533 :	Isibaar	1815	interlacing?yuyvi_to_yv12_c:yuyv_to_yv12_c, 2, interlacing);
534 :	edgomez	851	break;
535 :	albeu	315
536 :			case XVID_CSP_UYVY:
537 :	edgomez	851	safe_packed_conv(
538 :	edgomez	1382	src[0], src_stride[0], image->y, image->u, image->v,
539 :	edgomez	851	edged_width, edged_width2, width, height, (csp & XVID_CSP_VFLIP),
540 :			interlacing?uyvyi_to_yv12 :uyvy_to_yv12,
541 :	Isibaar	1815	interlacing?uyvyi_to_yv12_c:uyvy_to_yv12_c, 2, interlacing);
542 :	edgomez	851	break;
543 :	albeu	315
544 :	edgomez	1382	case XVID_CSP_I420: /* YCbCr == YUV == internal colorspace for MPEG */
545 :	edgomez	851	yv12_to_yv12(image->y, image->u, image->v, edged_width, edged_width2,
546 :	edgomez	1382	src[0], src[0] + src_stride[0]height, src[0] + src_stride[0]height + (src_stride[0]/2)*height2,
547 :			src_stride[0], src_stride[0]/2, width, height, (csp & XVID_CSP_VFLIP));
548 :			break;
549 :
550 :			case XVID_CSP_YV12: /* YCrCb == YVA == U and V plane swapped */
551 :	edgomez	851	yv12_to_yv12(image->y, image->v, image->u, edged_width, edged_width2,
552 :	edgomez	1382	src[0], src[0] + src_stride[0]height, src[0] + src_stride[0]height + (src_stride[0]/2)*height2,
553 :			src_stride[0], src_stride[0]/2, width, height, (csp & XVID_CSP_VFLIP));
554 :	edgomez	851	break;
555 :
556 :	edgomez	1382	case XVID_CSP_PLANAR: /* YCbCr with arbitrary pointers and different strides for Y and UV */
557 :			yv12_to_yv12(image->y, image->u, image->v, edged_width, edged_width2,
558 :			src[0], src[1], src[2], src_stride[0], src_stride[1], /* v: dst_stride[2] not yet supported */
559 :			width, height, (csp & XVID_CSP_VFLIP));
560 :	edgomez	851	break;
561 :	albeu	315
562 :			case XVID_CSP_NULL:
563 :			break;
564 :
565 :	edgomez	851	default :
566 :			return -1;
567 :	albeu	315	}
568 :
569 :	edgomez	851
570 :			/* pad out image when the width and/or height is not a multiple of 16 */
571 :
572 :			if (width & 15)
573 :			{
574 :			int i;
575 :			int pad_width = 16 - (width&15);
576 :			for (i = 0; i < height; i++)
577 :			{
578 :	edgomez	1382	memset(image->y + i*edged_width + width,
579 :	edgomez	851	(image->y + iedged_width + width - 1), pad_width);
580 :			}
581 :			for (i = 0; i < height/2; i++)
582 :			{
583 :	edgomez	1382	memset(image->u + i*edged_width2 + width2,
584 :	edgomez	851	(image->u + iedged_width2 + width2 - 1),pad_width/2);
585 :	edgomez	1382	memset(image->v + i*edged_width2 + width2,
586 :	edgomez	851	(image->v + iedged_width2 + width2 - 1),pad_width/2);
587 :			}
588 :			}
589 :
590 :			if (height & 15)
591 :			{
592 :	edgomez	1382	int pad_height = 16 - (height&15);
593 :	edgomez	851	int length = ((width+15)/16)*16;
594 :			int i;
595 :			for (i = 0; i < pad_height; i++)
596 :			{
597 :			memcpy(image->y + (height+i)*edged_width,
598 :			image->y + (height-1)*edged_width,length);
599 :			}
600 :
601 :			for (i = 0; i < pad_height/2; i++)
602 :			{
603 :			memcpy(image->u + (height2+i)*edged_width2,
604 :			image->u + (height2-1)*edged_width2,length/2);
605 :			memcpy(image->v + (height2+i)*edged_width2,
606 :			image->v + (height2-1)*edged_width2,length/2);
607 :			}
608 :			}
609 :
610 :			/*
611 :			if (interlacing)
612 :			image_printf(image, edged_width, height, 5,5, "[i]");
613 :			image_dump_yuvpgm(image, edged_width, ((width+15)/16)16, ((height+15)/16)16, "\\encode.pgm");
614 :			*/
615 :			return 0;
616 :	albeu	315	}
617 :
618 :
619 :
620 :			int
621 :			image_output(IMAGE * image,
622 :			uint32_t width,
623 :			int height,
624 :			uint32_t edged_width,
625 :	edgomez	1382	uint8_t * dst[4],
626 :	Skal	1617	int dst_stride[4],
627 :	edgomez	851	int csp,
628 :			int interlacing)
629 :	albeu	315	{
630 :	edgomez	851	const int edged_width2 = edged_width/2;
631 :			int height2 = height/2;
632 :
633 :			/*
634 :			if (interlacing)
635 :			image_printf(image, edged_width, height, 5,100, "[i]=%i,%i",width,height);
636 :			image_dump_yuvpgm(image, edged_width, width, height, "\\decode.pgm");
637 :			*/
638 :
639 :	albeu	315	switch (csp & ~XVID_CSP_VFLIP) {
640 :			case XVID_CSP_RGB555:
641 :	edgomez	851	safe_packed_conv(
642 :	edgomez	1382	dst[0], dst_stride[0], image->y, image->u, image->v,
643 :	edgomez	851	edged_width, edged_width2, width, height, (csp & XVID_CSP_VFLIP),
644 :			interlacing?yv12_to_rgb555i :yv12_to_rgb555,
645 :	Isibaar	1815	interlacing?yv12_to_rgb555i_c:yv12_to_rgb555_c, 2, interlacing);
646 :	albeu	315	return 0;
647 :
648 :			case XVID_CSP_RGB565:
649 :	edgomez	851	safe_packed_conv(
650 :	edgomez	1382	dst[0], dst_stride[0], image->y, image->u, image->v,
651 :	edgomez	851	edged_width, edged_width2, width, height, (csp & XVID_CSP_VFLIP),
652 :			interlacing?yv12_to_rgb565i :yv12_to_rgb565,
653 :	Isibaar	1815	interlacing?yv12_to_rgb565i_c:yv12_to_rgb565_c, 2, interlacing);
654 :	albeu	315	return 0;
655 :
656 :	edgomez	1382	case XVID_CSP_BGR:
657 :	edgomez	851	safe_packed_conv(
658 :	edgomez	1382	dst[0], dst_stride[0], image->y, image->u, image->v,
659 :	edgomez	851	edged_width, edged_width2, width, height, (csp & XVID_CSP_VFLIP),
660 :			interlacing?yv12_to_bgri :yv12_to_bgr,
661 :	Isibaar	1815	interlacing?yv12_to_bgri_c:yv12_to_bgr_c, 3, interlacing);
662 :	albeu	315	return 0;
663 :
664 :	edgomez	1382	case XVID_CSP_BGRA:
665 :	edgomez	851	safe_packed_conv(
666 :	edgomez	1382	dst[0], dst_stride[0], image->y, image->u, image->v,
667 :	edgomez	851	edged_width, edged_width2, width, height, (csp & XVID_CSP_VFLIP),
668 :			interlacing?yv12_to_bgrai :yv12_to_bgra,
669 :	Isibaar	1815	interlacing?yv12_to_bgrai_c:yv12_to_bgra_c, 4, interlacing);
670 :	albeu	315	return 0;
671 :
672 :	edgomez	851	case XVID_CSP_ABGR:
673 :			safe_packed_conv(
674 :	edgomez	1382	dst[0], dst_stride[0], image->y, image->u, image->v,
675 :	edgomez	851	edged_width, edged_width2, width, height, (csp & XVID_CSP_VFLIP),
676 :			interlacing?yv12_to_abgri :yv12_to_abgr,
677 :	Isibaar	1815	interlacing?yv12_to_abgri_c:yv12_to_abgr_c, 4, interlacing);
678 :	albeu	315	return 0;
679 :
680 :	chl	1759	case XVID_CSP_RGB:
681 :			safe_packed_conv(
682 :			dst[0], dst_stride[0], image->y, image->u, image->v,
683 :			edged_width, edged_width2, width, height, (csp & XVID_CSP_VFLIP),
684 :			interlacing?yv12_to_rgbi :yv12_to_rgb,
685 :	Isibaar	1815	interlacing?yv12_to_rgbi_c:yv12_to_rgb_c, 3, interlacing);
686 :	chl	1759	return 0;
687 :
688 :	edgomez	851	case XVID_CSP_RGBA:
689 :			safe_packed_conv(
690 :	edgomez	1382	dst[0], dst_stride[0], image->y, image->u, image->v,
691 :	edgomez	851	edged_width, edged_width2, width, height, (csp & XVID_CSP_VFLIP),
692 :			interlacing?yv12_to_rgbai :yv12_to_rgba,
693 :	Isibaar	1815	interlacing?yv12_to_rgbai_c:yv12_to_rgba_c, 4, interlacing);
694 :	albeu	315	return 0;
695 :
696 :	edgomez	1382	case XVID_CSP_ARGB:
697 :			safe_packed_conv(
698 :			dst[0], dst_stride[0], image->y, image->u, image->v,
699 :			edged_width, edged_width2, width, height, (csp & XVID_CSP_VFLIP),
700 :			interlacing?yv12_to_argbi :yv12_to_argb,
701 :	Isibaar	1815	interlacing?yv12_to_argbi_c:yv12_to_argb_c, 4, interlacing);
702 :	edgomez	1382	return 0;
703 :
704 :	albeu	315	case XVID_CSP_YUY2:
705 :	edgomez	851	safe_packed_conv(
706 :	edgomez	1382	dst[0], dst_stride[0], image->y, image->u, image->v,
707 :	edgomez	851	edged_width, edged_width2, width, height, (csp & XVID_CSP_VFLIP),
708 :			interlacing?yv12_to_yuyvi :yv12_to_yuyv,
709 :	Isibaar	1815	interlacing?yv12_to_yuyvi_c:yv12_to_yuyv_c, 2, interlacing);
710 :	albeu	315	return 0;
711 :
712 :	edgomez	1382	case XVID_CSP_YVYU: /* u,v swapped */
713 :	edgomez	851	safe_packed_conv(
714 :	edgomez	1382	dst[0], dst_stride[0], image->y, image->v, image->u,
715 :	edgomez	851	edged_width, edged_width2, width, height, (csp & XVID_CSP_VFLIP),
716 :			interlacing?yv12_to_yuyvi :yv12_to_yuyv,
717 :	Isibaar	1815	interlacing?yv12_to_yuyvi_c:yv12_to_yuyv_c, 2, interlacing);
718 :	albeu	315	return 0;
719 :
720 :			case XVID_CSP_UYVY:
721 :	edgomez	851	safe_packed_conv(
722 :	edgomez	1382	dst[0], dst_stride[0], image->y, image->u, image->v,
723 :	edgomez	851	edged_width, edged_width2, width, height, (csp & XVID_CSP_VFLIP),
724 :			interlacing?yv12_to_uyvyi :yv12_to_uyvy,
725 :	Isibaar	1815	interlacing?yv12_to_uyvyi_c:yv12_to_uyvy_c, 2, interlacing);
726 :	albeu	315	return 0;
727 :
728 :	edgomez	1382	case XVID_CSP_I420: /* YCbCr == YUV == internal colorspace for MPEG */
729 :			yv12_to_yv12(dst[0], dst[0] + dst_stride[0]height, dst[0] + dst_stride[0]height + (dst_stride[0]/2)*height2,
730 :			dst_stride[0], dst_stride[0]/2,
731 :	edgomez	851	image->y, image->u, image->v, edged_width, edged_width2,
732 :			width, height, (csp & XVID_CSP_VFLIP));
733 :			return 0;
734 :
735 :	edgomez	1382	case XVID_CSP_YV12: /* YCrCb == YVU == U and V plane swapped */
736 :			yv12_to_yv12(dst[0], dst[0] + dst_stride[0]height, dst[0] + dst_stride[0]height + (dst_stride[0]/2)*height2,
737 :			dst_stride[0], dst_stride[0]/2,
738 :	edgomez	851	image->y, image->v, image->u, edged_width, edged_width2,
739 :			width, height, (csp & XVID_CSP_VFLIP));
740 :			return 0;
741 :
742 :	edgomez	1382	case XVID_CSP_PLANAR: /* YCbCr with arbitrary pointers and different strides for Y and UV */
743 :			yv12_to_yv12(dst[0], dst[1], dst[2],
744 :			dst_stride[0], dst_stride[1], /* v: dst_stride[2] not yet supported */
745 :			image->y, image->u, image->v, edged_width, edged_width2,
746 :			width, height, (csp & XVID_CSP_VFLIP));
747 :	albeu	315	return 0;
748 :
749 :	edgomez	1382	case XVID_CSP_INTERNAL :
750 :			dst[0] = image->y;
751 :			dst[1] = image->u;
752 :			dst[2] = image->v;
753 :			dst_stride[0] = edged_width;
754 :			dst_stride[1] = edged_width/2;
755 :			dst_stride[2] = edged_width/2;
756 :			return 0;
757 :
758 :	albeu	315	case XVID_CSP_NULL:
759 :	edgomez	1382	case XVID_CSP_SLICE:
760 :	albeu	315	return 0;
761 :
762 :			}
763 :
764 :			return -1;
765 :			}
766 :
767 :			float
768 :			image_psnr(IMAGE * orig_image,
769 :			IMAGE * recon_image,
770 :			uint16_t stride,
771 :			uint16_t width,
772 :			uint16_t height)
773 :			{
774 :			int32_t diff, x, y, quad = 0;
775 :			uint8_t *orig = orig_image->y;
776 :			uint8_t *recon = recon_image->y;
777 :			float psnr_y;
778 :
779 :			for (y = 0; y < height; y++) {
780 :			for (x = 0; x < width; x++) {
781 :			diff = (orig + x) - (recon + x);
782 :			quad += diff * diff;
783 :			}
784 :			orig += stride;
785 :			recon += stride;
786 :			}
787 :
788 :			psnr_y = (float) quad / (float) (width * height);
789 :
790 :			if (psnr_y) {
791 :			psnr_y = (float) (255 * 255) / psnr_y;
792 :			psnr_y = 10 * (float) log10(psnr_y);
793 :			} else
794 :			psnr_y = (float) 99.99;
795 :
796 :			return psnr_y;
797 :			}
798 :
799 :
800 :	edgomez	851	float sse_to_PSNR(long sse, int pixels)
801 :			{
802 :			if (sse==0)
803 :			return 99.99F;
804 :
805 :	edgomez	1382	return 48.131F - 10(float)log10((float)sse/(float)(pixels)); / log10(255255)=4.8131 /
806 :	edgomez	851
807 :			}
808 :
/*
 * Sum of squared errors between two planes.
 *
 * orig   - reference plane
 * recon  - plane to compare against the reference
 * stride - row length in bytes of both planes
 * width  - number of pixels compared per row
 * height - number of rows compared
 *
 * The area covered by whole 8x8 blocks is handed to sse8_8bit (presumably the
 * SSE of one 8x8 block); the columns right of it and the rows below it are
 * summed pixel by pixel.
 */
long plane_sse(uint8_t *orig,
			   uint8_t *recon,
			   uint16_t stride,
			   uint16_t width,
			   uint16_t height)
{
	int y, bwidth, bheight;
	long sse = 0;

	/* largest multiples of 8 that fit into the plane */
	bwidth  = width  & (~0x07);
	bheight = height & (~0x07);

	/* Compute the 8x8 integer part */
	for (y = 0; y<bheight; y += 8) {
		int x;

		/* Compute sse for the band */
		for (x = 0; x<bwidth; x += 8)
			sse += sse8_8bit(orig  + x, recon + x, stride);

		/* remaining pixels of the 8 pixels high band */
		for (x = bwidth; x < width; x++) {
			int row;
			for (row = 0; row < 8; row++) {
				int diff = *(orig + row*stride + x) - *(recon + row*stride + x);
				sse += diff * diff;
			}
		}

		orig  += 8*stride;
		recon += 8*stride;
	}

	/* Compute the down rectangle sse */
	for (y = bheight; y < height; y++) {
		int x;
		for (x = 0; x < width; x++) {
			int diff;
			diff = *(orig + x) - *(recon + x);
			sse += diff * diff;
		}
		orig += stride;
		recon += stride;
	}

	return (sse);
}
868 :
869 :	Isibaar	1909	void image_block_variance(IMAGE * orig_image,
870 :			uint16_t stride,
871 :			MACROBLOCK *mbs,
872 :			uint16_t mb_width,
873 :			uint16_t mb_height)
874 :			{
875 :			DECLARE_ALIGNED_MATRIX(sums, 1, 4, uint16_t, CACHE_LINE);
876 :			DECLARE_ALIGNED_MATRIX(squares, 1, 4, uint32_t, CACHE_LINE);
877 :
878 :			int x, y, i, j;
879 :	Isibaar	1932	uint8_t *orig_y = orig_image->y;
880 :			uint8_t *orig_u = orig_image->u;
881 :			uint8_t *orig_v = orig_image->v;
882 :	Isibaar	1909
883 :			for (y = 0; y < mb_height; y++) {
884 :			for (x = 0; x < mb_width; x++) {
885 :			MACROBLOCK pMB = &mbs[x + y mb_width];
886 :			uint32_t var4[4];
887 :			uint32_t sum = 0, square = 0;
888 :
889 :	Isibaar	1932	/* y-blocks */
890 :	Isibaar	1909	for (j = 0; j < 2; j++) {
891 :			for (i = 0; i < 2; i++) {
892 :	Isibaar	1932	int lsum = blocksum8(orig_y + ((y<<4) + (j<<3))*stride + (x<<4) + (i<<3),
893 :	Isibaar	1909	stride, sums, squares);
894 :	Isibaar	1932	int lsquare = (squares[0] + squares[1] + squares[2] + squares[3])<<6;
895 :	Isibaar	1909
896 :			sum += lsum;
897 :			square += lsquare;
898 :
899 :			var4[0] = (squares[0]<<4) - sums[0]*sums[0];
900 :			var4[1] = (squares[1]<<4) - sums[1]*sums[1];
901 :			var4[2] = (squares[2]<<4) - sums[2]*sums[2];
902 :			var4[3] = (squares[3]<<4) - sums[3]*sums[3];
903 :
904 :			pMB->rel_var8[j2 + i] = lsquare - lsumlsum;
905 :			if (pMB->rel_var8[j*2 + i])
906 :	Isibaar	1932	pMB->rel_var8[j*2 + i] = ((var4[0] + var4[1] + var4[2] + var4[3])<<8) /
907 :	Isibaar	1909	pMB->rel_var8[j2 + i]; / 4(Var(Di)/Var(D)) /
908 :			else
909 :			pMB->rel_var8[j*2 + i] = 64;
910 :			}
911 :			}
912 :	Isibaar	1932
913 :			/* u */
914 :			{
915 :			int lsum = blocksum8(orig_u + (y<<3)*(stride>>1) + (x<<3),
916 :			stride, sums, squares);
917 :			int lsquare = (squares[0] + squares[1] + squares[2] + squares[3])<<6;
918 :
919 :			sum += lsum;
920 :			square += lsquare;
921 :
922 :			var4[0] = (squares[0]<<4) - sums[0]*sums[0];
923 :			var4[1] = (squares[1]<<4) - sums[1]*sums[1];
924 :			var4[2] = (squares[2]<<4) - sums[2]*sums[2];
925 :			var4[3] = (squares[3]<<4) - sums[3]*sums[3];
926 :
927 :			pMB->rel_var8[4] = lsquare - lsum*lsum;
928 :			if (pMB->rel_var8[4])
929 :			pMB->rel_var8[4] = ((var4[0] + var4[1] + var4[2] + var4[3])<<8) /
930 :			pMB->rel_var8[4]; /* 4(Var(Di)/Var(D)) /
931 :			else
932 :			pMB->rel_var8[4] = 64;
933 :			}
934 :
935 :			/* v */
936 :			{
937 :			int lsum = blocksum8(orig_v + (y<<3)*(stride>>1) + (x<<3),
938 :			stride, sums, squares);
939 :			int lsquare = (squares[0] + squares[1] + squares[2] + squares[3])<<6;
940 :
941 :			sum += lsum;
942 :			square += lsquare;
943 :
944 :			var4[0] = (squares[0]<<4) - sums[0]*sums[0];
945 :			var4[1] = (squares[1]<<4) - sums[1]*sums[1];
946 :			var4[2] = (squares[2]<<4) - sums[2]*sums[2];
947 :			var4[3] = (squares[3]<<4) - sums[3]*sums[3];
948 :
949 :			pMB->rel_var8[5] = lsquare - lsum*lsum;
950 :			if (pMB->rel_var8[5])
951 :			pMB->rel_var8[5] = ((var4[0] + var4[1] + var4[2] + var4[3])<<8) /
952 :			pMB->rel_var8[5]; /* 4(Var(Di)/Var(D)) /
953 :			else
954 :			pMB->rel_var8[5] = 64;
955 :			}
956 :
957 :	Isibaar	1909	}
958 :			}
959 :			}
960 :
#if 0

/* Debug-only dump helpers; compiled out. */

#include <stdio.h>
#include <string.h>

/*
 * Write a width x height block of bytes starting at bmp as a binary PGM (P5)
 * file.  Returns 0 on success, -1 if the file cannot be opened or written.
 */
int image_dump_pgm(uint8_t * bmp, uint32_t width, uint32_t height, char * filename)
{
	FILE * f;
	int failed = 0;

	f = fopen(filename, "wb");
	if ( f == NULL)
	{
		return -1;
	}

	if (fprintf(f, "P5\n#xvid\n%u %u\n255\n", (unsigned int) width, (unsigned int) height) < 0)
		failed = 1;

	/* fwrite() returns 0 for zero-sized requests, so only check real ones */
	if (!failed && width > 0 && height > 0 && fwrite(bmp, width, height, f) != height)
		failed = 1;

	if (fclose(f) != 0)
		failed = 1;

	return failed ? -1 : 0;
}


/* dump image+edges to yuv pgm files */

/*
 * Writes <path>_<number>_y.pgm, _u.pgm and _v.pgm, each plane including its
 * edge area.  Returns 0 when all three files were written, -1 otherwise.
 */
int image_dump(IMAGE * image, uint32_t edged_width, uint32_t edged_height, char * path, int number)
{
	char filename[1024];
	int failed = 0;

	/* "%.1000s" bounds the caller-supplied path so the name fits the buffer */
	sprintf(filename, "%.1000s_%i_%c.pgm", path, number, 'y');
	if (image_dump_pgm(
			image->y - (EDGE_SIZE * edged_width + EDGE_SIZE),
			edged_width, edged_height, filename) != 0)
		failed = 1;

	sprintf(filename, "%.1000s_%i_%c.pgm", path, number, 'u');
	if (image_dump_pgm(
			image->u - (EDGE_SIZE2 * edged_width / 2 + EDGE_SIZE2),
			edged_width / 2, edged_height / 2, filename) != 0)
		failed = 1;

	sprintf(filename, "%.1000s_%i_%c.pgm", path, number, 'v');
	if (image_dump_pgm(
			image->v - (EDGE_SIZE2 * edged_width / 2 + EDGE_SIZE2),
			edged_width / 2, edged_height / 2, filename) != 0)
		failed = 1;

	return failed ? -1 : 0;
}
#endif
1009 :	albeu	315
1010 :
1011 :
1012 :			/* dump image to yuvpgm file */
1013 :
1014 :			#include <stdio.h>
1015 :
1016 :			int
1017 :			image_dump_yuvpgm(const IMAGE * image,
1018 :			const uint32_t edged_width,
1019 :			const uint32_t width,
1020 :			const uint32_t height,
1021 :			char *filename)
1022 :			{
1023 :			FILE *f;
1024 :			char hdr[1024];
1025 :			uint32_t i;
1026 :			uint8_t *bmp1;
1027 :			uint8_t *bmp2;
1028 :
1029 :
1030 :			f = fopen(filename, "wb");
1031 :			if (f == NULL) {
1032 :			return -1;
1033 :			}
1034 :			sprintf(hdr, "P5\n#xvid\n%i %i\n255\n", width, (3 * height) / 2);
1035 :			fwrite(hdr, strlen(hdr), 1, f);
1036 :
1037 :			bmp1 = image->y;
1038 :			for (i = 0; i < height; i++) {
1039 :			fwrite(bmp1, width, 1, f);
1040 :			bmp1 += edged_width;
1041 :			}
1042 :
1043 :			bmp1 = image->u;
1044 :			bmp2 = image->v;
1045 :			for (i = 0; i < height / 2; i++) {
1046 :			fwrite(bmp1, width / 2, 1, f);
1047 :			fwrite(bmp2, width / 2, 1, f);
1048 :			bmp1 += edged_width / 2;
1049 :			bmp2 += edged_width / 2;
1050 :			}
1051 :
1052 :			fclose(f);
1053 :			return 0;
1054 :			}
1055 :
1056 :
1057 :			float
1058 :			image_mad(const IMAGE * img1,
1059 :			const IMAGE * img2,
1060 :			uint32_t stride,
1061 :			uint32_t width,
1062 :			uint32_t height)
1063 :			{
1064 :			const uint32_t stride2 = stride / 2;
1065 :			const uint32_t width2 = width / 2;
1066 :			const uint32_t height2 = height / 2;
1067 :
1068 :			uint32_t x, y;
1069 :			uint32_t sum = 0;
1070 :
1071 :			for (y = 0; y < height; y++)
1072 :			for (x = 0; x < width; x++)
1073 :	edgomez	1382	sum += abs(img1->y[x + y * stride] - img2->y[x + y * stride]);
1074 :	albeu	315
1075 :			for (y = 0; y < height2; y++)
1076 :			for (x = 0; x < width2; x++)
1077 :	edgomez	1382	sum += abs(img1->u[x + y * stride2] - img2->u[x + y * stride2]);
1078 :	albeu	315
1079 :			for (y = 0; y < height2; y++)
1080 :			for (x = 0; x < width2; x++)
1081 :	edgomez	1382	sum += abs(img1->v[x + y * stride2] - img2->v[x + y * stride2]);
1082 :	albeu	315
1083 :			return (float) sum / (width * height * 3 / 2);
1084 :			}
1085 :
1086 :			void
1087 :	suxen_drol	1631	output_slice(IMAGE * cur, int stride, int width, xvid_image_t* out_frm, int mbx, int mby,int mbl) {
1088 :	albeu	315	uint8_t dY,dU,dV,sY,sU,sV;
1089 :	suxen_drol	1631	int stride2 = stride >> 1;
1090 :	albeu	315	int w = mbl << 4, w2,i;
1091 :
1092 :			if(w > width)
1093 :			w = width;
1094 :			w2 = w >> 1;
1095 :	suxen_drol	323
1096 :	edgomez	1382	dY = (uint8_t)out_frm->plane[0] + (mby << 4) out_frm->stride[0] + (mbx << 4);
1097 :			dU = (uint8_t)out_frm->plane[1] + (mby << 3) out_frm->stride[1] + (mbx << 3);
1098 :			dV = (uint8_t)out_frm->plane[2] + (mby << 3) out_frm->stride[2] + (mbx << 3);
1099 :	suxen_drol	1631	sY = cur->y + (mby << 4) * stride + (mbx << 4);
1100 :			sU = cur->u + (mby << 3) * stride2 + (mbx << 3);
1101 :			sV = cur->v + (mby << 3) * stride2 + (mbx << 3);
1102 :	albeu	315
1103 :			for(i = 0 ; i < 16 ; i++) {
1104 :			memcpy(dY,sY,w);
1105 :	edgomez	1382	dY += out_frm->stride[0];
1106 :	suxen_drol	1631	sY += stride;
1107 :	suxen_drol	323	}
1108 :	albeu	315	for(i = 0 ; i < 8 ; i++) {
1109 :			memcpy(dU,sU,w2);
1110 :	edgomez	1382	dU += out_frm->stride[1];
1111 :	suxen_drol	1631	sU += stride2;
1112 :	albeu	315	}
1113 :			for(i = 0 ; i < 8 ; i++) {
1114 :			memcpy(dV,sV,w2);
1115 :	edgomez	1382	dV += out_frm->stride[2];
1116 :	suxen_drol	1631	sV += stride2;
1117 :	albeu	315	}
1118 :			}
1119 :	edgomez	851
1120 :
1121 :			void
1122 :			image_clear(IMAGE * img, int width, int height, int edged_width,
1123 :			int y, int u, int v)
1124 :			{
1125 :			uint8_t * p;
1126 :			int i;
1127 :
1128 :			p = img->y;
1129 :			for (i = 0; i < height; i++) {
1130 :			memset(p, y, width);
1131 :			p += edged_width;
1132 :			}
1133 :
1134 :			p = img->u;
1135 :			for (i = 0; i < height/2; i++) {
1136 :			memset(p, u, width/2);
1137 :			p += edged_width/2;
1138 :			}
1139 :
1140 :			p = img->v;
1141 :			for (i = 0; i < height/2; i++) {
1142 :			memset(p, v, width/2);
1143 :			p += edged_width/2;
1144 :			}
1145 :			}
1146 :	Skal	1733
1147 :			/****************************************************************************/
1148 :
/* Deinterlacing routine in use; 0 until xvid_image_deinterlace() picks one. */
static void (*deintl_core)(uint8_t *, int width, int height, const int stride) = 0;
/* Alternative routine with the same signature; its definition is not in this file section. */
extern void xvid_deinterlace_sse(uint8_t *, int width, int height, const int stride);
1151 :	Skal	1733
/* Clamp v to the 8-bit sample range [0, 255]. */
static int deintl_clip_255(int v)
{
	if (v < 0)
		return 0;
	if (v > 255)
		return 255;
	return v;
}

/*
 * Plain C deinterlacer for one plane, working column by column.
 *
 * Rows 0, 2, 4, ... are left untouched.  Every odd row is replaced by the
 * average of the rows directly above and below it, plus a quarter of the
 * difference between the row's own value and the average of the odd rows
 * two lines above and below, clamped to [0, 255].  At the top and bottom
 * the missing neighbours are substituted by the nearest available row.
 *
 *   pix    - first sample of the first row
 *   width  - number of columns to process
 *   height - number of rows in the plane
 *   bps    - distance in bytes between consecutive rows; may be negative
 *            when the plane is walked from its last row upwards
 */
static void deinterlace_c(uint8_t *pix, int width, int height, const int bps)
{
	/*
	 * The code below always reads and writes row 1, so a plane with fewer
	 * than two rows (e.g. the chroma of a 2-row picture) must be skipped.
	 */
	if (height < 2)
		return;

	pix += bps;
	while (width-- > 0)
	{
		int p1 = pix[-bps];
		int p2 = pix[0];
		int p0 = p2;
		int j = (height>>1) - 1;
		int V;
		unsigned char *P = pix++;

		while (j-- > 0)
		{
			const int p3 = P[  bps];
			const int p4 = P[2*bps];

			V = ((p1+p3+1)>>1) + ((p2 - ((p0+p4+1)>>1)) >> 2);
			P[0] = deintl_clip_255(V);
			p0 = p2;
			p1 = p3;
			p2 = p4;
			P += 2*bps;
		}

		/* last odd row: no rows below, so reuse p1 and p2 */
		V = ((p1+p1+1)>>1) + ((p2 - ((p0+p2+1)>>1)) >> 2);
		P[0] = deintl_clip_255(V);
	}
}
1181 :
1182 :			int xvid_image_deinterlace(xvid_image_t* img, int width, int height, int bottom_first)
1183 :			{
1184 :			if (height&1)
1185 :			return 0;
1186 :			if (img->csp!=XVID_CSP_PLANAR && img->csp!=XVID_CSP_I420 && img->csp!=XVID_CSP_YV12)
1187 :			return 0; /* not yet supported */
1188 :			if (deintl_core==0) {
1189 :			deintl_core = deinterlace_c;
1190 :	Isibaar	1795	#if defined(ARCH_IS_IA32) \|\| defined(ARCH_IS_X86_64)
1191 :	Skal	1736	{
1192 :			int cpu_flags = check_cpu_features();
1193 :			if (cpu_flags & XVID_CPU_MMX)
1194 :			deintl_core = xvid_deinterlace_sse;
1195 :			}
1196 :	Skal	1733	#endif
1197 :			}
1198 :			if (!bottom_first) {
1199 :			deintl_core(img->plane[0], width, height, img->stride[0]);
1200 :			deintl_core(img->plane[1], width>>1, height>>1, img->stride[1]);
1201 :			deintl_core(img->plane[2], width>>1, height>>1, img->stride[2]);
1202 :			}
1203 :			else {
1204 :	Isibaar	1734	deintl_core((uint8_t )img->plane[0] + ( height -1)img->stride[0], width, height, -img->stride[0]);
1205 :			deintl_core((uint8_t )img->plane[1] + ((height>>1)-1)img->stride[1], width>>1, height>>1, -img->stride[1]);
1206 :			deintl_core((uint8_t )img->plane[2] + ((height>>1)-1)img->stride[2], width>>1, height>>1, -img->stride[2]);
1207 :	Skal	1733	}
1208 :			emms();
1209 :
1210 :			return 1;
1211 :			}
1212 :

No admin address has been configured	ViewVC Help
Powered by ViewVC 1.0.4