19 |
* along with this program ; if not, write to the Free Software |
* along with this program ; if not, write to the Free Software |
20 |
* Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA 02111-1307 USA |
* Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA 02111-1307 USA |
21 |
* |
* |
22 |
* $Id: image.c,v 1.26.2.7 2003-06-09 13:53:50 edgomez Exp $ |
* $Id: image.c,v 1.26.2.11 2003-11-05 16:15:47 edgomez Exp $ |
23 |
* |
* |
24 |
****************************************************************************/ |
****************************************************************************/ |
25 |
|
|
49 |
{ |
{ |
50 |
const uint32_t edged_width2 = edged_width / 2; |
const uint32_t edged_width2 = edged_width / 2; |
51 |
const uint32_t edged_height2 = edged_height / 2; |
const uint32_t edged_height2 = edged_height / 2; |
|
uint32_t i; |
|
52 |
|
|
53 |
image->y = |
image->y = |
54 |
xvid_malloc(edged_width * (edged_height + 1) + SAFETY, CACHE_LINE); |
xvid_malloc(edged_width * (edged_height + 1) + SAFETY, CACHE_LINE); |
55 |
if (image->y == NULL) { |
if (image->y == NULL) { |
56 |
return -1; |
return -1; |
57 |
} |
} |
58 |
|
memset(image->y, 0, edged_width * (edged_height + 1) + SAFETY); |
|
for (i = 0; i < edged_width * edged_height + SAFETY; i++) { |
|
|
image->y[i] = 0; |
|
|
} |
|
59 |
|
|
60 |
image->u = xvid_malloc(edged_width2 * edged_height2 + SAFETY, CACHE_LINE); |
image->u = xvid_malloc(edged_width2 * edged_height2 + SAFETY, CACHE_LINE); |
61 |
if (image->u == NULL) { |
if (image->u == NULL) { |
62 |
xvid_free(image->y); |
xvid_free(image->y); |
63 |
|
image->y = NULL; |
64 |
return -1; |
return -1; |
65 |
} |
} |
66 |
|
memset(image->u, 0, edged_width2 * edged_height2 + SAFETY); |
67 |
|
|
68 |
image->v = xvid_malloc(edged_width2 * edged_height2 + SAFETY, CACHE_LINE); |
image->v = xvid_malloc(edged_width2 * edged_height2 + SAFETY, CACHE_LINE); |
69 |
if (image->v == NULL) { |
if (image->v == NULL) { |
70 |
xvid_free(image->u); |
xvid_free(image->u); |
71 |
|
image->u = NULL; |
72 |
xvid_free(image->y); |
xvid_free(image->y); |
73 |
|
image->y = NULL; |
74 |
return -1; |
return -1; |
75 |
} |
} |
76 |
|
memset(image->v, 0, edged_width2 * edged_height2 + SAFETY); |
77 |
|
|
78 |
image->y += EDGE_SIZE * edged_width + EDGE_SIZE; |
image->y += EDGE_SIZE * edged_width + EDGE_SIZE; |
79 |
image->u += EDGE_SIZE2 * edged_width2 + EDGE_SIZE2; |
image->u += EDGE_SIZE2 * edged_width2 + EDGE_SIZE2; |
93 |
|
|
94 |
if (image->y) { |
if (image->y) { |
95 |
xvid_free(image->y - (EDGE_SIZE * edged_width + EDGE_SIZE)); |
xvid_free(image->y - (EDGE_SIZE * edged_width + EDGE_SIZE)); |
96 |
|
image->y = NULL; |
97 |
} |
} |
98 |
if (image->u) { |
if (image->u) { |
99 |
xvid_free(image->u - (EDGE_SIZE2 * edged_width2 + EDGE_SIZE2)); |
xvid_free(image->u - (EDGE_SIZE2 * edged_width2 + EDGE_SIZE2)); |
100 |
|
image->u = NULL; |
101 |
} |
} |
102 |
if (image->v) { |
if (image->v) { |
103 |
xvid_free(image->v - (EDGE_SIZE2 * edged_width2 + EDGE_SIZE2)); |
xvid_free(image->v - (EDGE_SIZE2 * edged_width2 + EDGE_SIZE2)); |
104 |
|
image->v = NULL; |
105 |
} |
} |
106 |
} |
} |
107 |
|
|
136 |
uint32_t height) |
uint32_t height) |
137 |
{ |
{ |
138 |
const uint32_t edged_width2 = edged_width / 2; |
const uint32_t edged_width2 = edged_width / 2; |
139 |
const uint32_t width2 = width / 2; |
uint32_t width2; |
140 |
uint32_t i; |
uint32_t i; |
141 |
uint8_t *dst; |
uint8_t *dst; |
142 |
uint8_t *src; |
uint8_t *src; |
145 |
dst = image->y - (EDGE_SIZE + EDGE_SIZE * edged_width); |
dst = image->y - (EDGE_SIZE + EDGE_SIZE * edged_width); |
146 |
src = image->y; |
src = image->y; |
147 |
|
|
148 |
|
/* According to the Standard Clause 7.6.4, padding is done starting at 16 |
149 |
|
* pixel width and height multiples */ |
150 |
|
width = (width+15)&~15; |
151 |
|
height = (height+15)&~15; |
152 |
|
width2 = width/2; |
153 |
|
|
154 |
for (i = 0; i < EDGE_SIZE; i++) { |
for (i = 0; i < EDGE_SIZE; i++) { |
155 |
memset(dst, *src, EDGE_SIZE); |
memset(dst, *src, EDGE_SIZE); |
156 |
memcpy(dst + EDGE_SIZE, src, width); |
memcpy(dst + EDGE_SIZE, src, width); |
258 |
n_ptr = refn->y; |
n_ptr = refn->y; |
259 |
h_ptr = refh->y; |
h_ptr = refh->y; |
260 |
v_ptr = refv->y; |
v_ptr = refv->y; |
|
hv_ptr = refhv->y; |
|
261 |
|
|
262 |
n_ptr -= offset; |
n_ptr -= offset; |
263 |
h_ptr -= offset; |
h_ptr -= offset; |
264 |
v_ptr -= offset; |
v_ptr -= offset; |
|
hv_ptr -= offset; |
|
265 |
|
|
266 |
|
/* Note we initialize the hv pointer later, as we can optimize code a bit |
267 |
|
* doing it down to up in quarterpel and up to down in halfpel */ |
268 |
if(quarterpel) { |
if(quarterpel) { |
269 |
|
|
270 |
for (y = 0; y < (edged_height - EDGE_SIZE); y += 8) { |
for (y = 0; y < (edged_height - EDGE_SIZE); y += 8) { |
286 |
n_ptr += stride_add; |
n_ptr += stride_add; |
287 |
} |
} |
288 |
|
|
289 |
h_ptr = refh->y; |
h_ptr = refh->y + (edged_height - EDGE_SIZE - EDGE_SIZE2)*edged_width - EDGE_SIZE2; |
290 |
h_ptr -= offset; |
hv_ptr = refhv->y + (edged_height - EDGE_SIZE - EDGE_SIZE2)*edged_width - EDGE_SIZE2; |
291 |
|
|
292 |
for (y = 0; y < (edged_height - EDGE_SIZE); y = y + 8) { |
for (y = 0; y < (edged_height - EDGE_SIZE); y = y + 8) { |
293 |
|
hv_ptr -= stride_add; |
294 |
|
h_ptr -= stride_add; |
295 |
|
hv_ptr -= EDGE_SIZE; |
296 |
|
h_ptr -= EDGE_SIZE; |
297 |
|
|
298 |
for (x = 0; x < (edged_width - EDGE_SIZE); x = x + 8) { |
for (x = 0; x < (edged_width - EDGE_SIZE); x = x + 8) { |
299 |
|
hv_ptr -= 8; |
300 |
|
h_ptr -= 8; |
301 |
interpolate8x8_6tap_lowpass_v(hv_ptr, h_ptr, edged_width, rounding); |
interpolate8x8_6tap_lowpass_v(hv_ptr, h_ptr, edged_width, rounding); |
|
hv_ptr += 8; |
|
|
h_ptr += 8; |
|
|
} |
|
|
|
|
|
hv_ptr += EDGE_SIZE; |
|
|
h_ptr += EDGE_SIZE; |
|
|
|
|
|
hv_ptr += stride_add; |
|
|
h_ptr += stride_add; |
|
302 |
} |
} |
303 |
} |
} |
304 |
else { |
} else { |
305 |
|
|
306 |
|
hv_ptr = refhv->y; |
307 |
|
hv_ptr -= offset; |
308 |
|
|
309 |
for (y = 0; y < (edged_height - EDGE_SIZE); y += 8) { |
for (y = 0; y < (edged_height - EDGE_SIZE); y += 8) { |
310 |
for (x = 0; x < (edged_width - EDGE_SIZE); x += 8) { |
for (x = 0; x < (edged_width - EDGE_SIZE); x += 8) { |