3 |
* XVID MPEG-4 VIDEO CODEC |
* XVID MPEG-4 VIDEO CODEC |
4 |
* - 8bit<->16bit transfer - |
* - 8bit<->16bit transfer - |
5 |
* |
* |
6 |
* Copyright(C) 2001-2002 Peter Ross <pross@xvid.org> |
* Copyright(C) 2001-2003 Peter Ross <pross@xvid.org> |
|
* |
|
|
* This program is an implementation of a part of one or more MPEG-4 |
|
|
* Video tools as specified in ISO/IEC 14496-2 standard. Those intending |
|
|
* to use this software module in hardware or software products are |
|
|
* advised that its use may infringe existing patents or copyrights, and |
|
|
* any such use would be at such party's own risk. The original |
|
|
* developer of this software module and his/her company, and subsequent |
|
|
* editors and their companies, will have no liability for use of this |
|
|
* software or modifications or derivatives thereof. |
|
7 |
* |
* |
8 |
* This program is free software; you can redistribute it and/or modify |
* This program is free software; you can redistribute it and/or modify |
9 |
* it under the terms of the GNU General Public License as published by |
* it under the terms of the GNU General Public License as published by |
19 |
* along with this program; if not, write to the Free Software |
* along with this program; if not, write to the Free Software |
20 |
* Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA 02111-1307 USA |
* Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA 02111-1307 USA |
21 |
* |
* |
22 |
* $Id: mem_transfer.c,v 1.6 2002-09-21 03:07:56 suxen_drol Exp $ |
* $Id: mem_transfer.c,v 1.15 2005-08-01 10:53:46 Isibaar Exp $ |
23 |
* |
* |
24 |
****************************************************************************/ |
****************************************************************************/ |
25 |
|
|
32 |
TRANSFER_16TO8COPY_PTR transfer_16to8copy; |
TRANSFER_16TO8COPY_PTR transfer_16to8copy; |
33 |
|
|
34 |
TRANSFER_8TO16SUB_PTR transfer_8to16sub; |
TRANSFER_8TO16SUB_PTR transfer_8to16sub; |
35 |
|
TRANSFER_8TO16SUBRO_PTR transfer_8to16subro; |
36 |
TRANSFER_8TO16SUB2_PTR transfer_8to16sub2; |
TRANSFER_8TO16SUB2_PTR transfer_8to16sub2; |
37 |
|
TRANSFER_8TO16SUB2RO_PTR transfer_8to16sub2ro; |
38 |
TRANSFER_16TO8ADD_PTR transfer_16to8add; |
TRANSFER_16TO8ADD_PTR transfer_16to8add; |
39 |
|
|
40 |
TRANSFER8X8_COPY_PTR transfer8x8_copy; |
TRANSFER8X8_COPY_PTR transfer8x8_copy; |
41 |
|
|
42 |
|
#define USE_REFERENCE_C |
43 |
|
|
44 |
/***************************************************************************** |
/***************************************************************************** |
45 |
* |
* |
66 |
const uint8_t * const src, |
const uint8_t * const src, |
67 |
uint32_t stride) |
uint32_t stride) |
68 |
{ |
{ |
69 |
uint32_t i, j; |
int i, j; |
|
|
|
70 |
for (j = 0; j < 8; j++) { |
for (j = 0; j < 8; j++) { |
71 |
for (i = 0; i < 8; i++) { |
for (i = 0; i < 8; i++) { |
72 |
dst[j * 8 + i] = (int16_t) src[j * stride + i]; |
dst[j * 8 + i] = (int16_t) src[j * stride + i]; |
88 |
const int16_t * const src, |
const int16_t * const src, |
89 |
uint32_t stride) |
uint32_t stride) |
90 |
{ |
{ |
91 |
uint32_t i, j; |
int i, j; |
92 |
|
|
93 |
for (j = 0; j < 8; j++) { |
for (j = 0; j < 8; j++) { |
94 |
for (i = 0; i < 8; i++) { |
for (i = 0; i < 8; i++) { |
95 |
|
#ifdef USE_REFERENCE_C |
96 |
int16_t pixel = src[j * 8 + i]; |
int16_t pixel = src[j * 8 + i]; |
97 |
|
|
98 |
if (pixel < 0) { |
if (pixel < 0) { |
101 |
pixel = 255; |
pixel = 255; |
102 |
} |
} |
103 |
dst[j * stride + i] = (uint8_t) pixel; |
dst[j * stride + i] = (uint8_t) pixel; |
104 |
|
#else |
105 |
|
const int16_t pixel = src[j * 8 + i]; |
106 |
|
const uint8_t value = (uint8_t)( (pixel&~255) ? (-pixel)>>(8*sizeof(pixel)-1) : pixel ); |
107 |
|
dst[j*stride + i] = value; |
108 |
|
#endif |
109 |
} |
} |
110 |
} |
} |
111 |
} |
} |
130 |
const uint8_t * ref, |
const uint8_t * ref, |
131 |
const uint32_t stride) |
const uint32_t stride) |
132 |
{ |
{ |
133 |
uint32_t i, j; |
int i, j; |
134 |
|
|
135 |
for (j = 0; j < 8; j++) { |
for (j = 0; j < 8; j++) { |
136 |
for (i = 0; i < 8; i++) { |
for (i = 0; i < 8; i++) { |
137 |
uint8_t c = cur[j * stride + i]; |
const uint8_t c = cur[j * stride + i]; |
138 |
uint8_t r = ref[j * stride + i]; |
const uint8_t r = ref[j * stride + i]; |
139 |
|
|
140 |
cur[j * stride + i] = r; |
cur[j * stride + i] = r; |
141 |
dct[j * 8 + i] = (int16_t) c - (int16_t) r; |
dct[j * 8 + i] = (int16_t) c - (int16_t) r; |
144 |
} |
} |
145 |
|
|
146 |
|
|
147 |
|
void |
148 |
|
transfer_8to16subro_c(int16_t * const dct, |
149 |
|
const uint8_t * const cur, |
150 |
|
const uint8_t * ref, |
151 |
|
const uint32_t stride) |
152 |
|
{ |
153 |
|
int i, j; |
154 |
|
|
155 |
|
for (j = 0; j < 8; j++) { |
156 |
|
for (i = 0; i < 8; i++) { |
157 |
|
const uint8_t c = cur[j * stride + i]; |
158 |
|
const uint8_t r = ref[j * stride + i]; |
159 |
|
dct[j * 8 + i] = (int16_t) c - (int16_t) r; |
160 |
|
} |
161 |
|
} |
162 |
|
} |
163 |
|
|
164 |
|
|
165 |
|
|
166 |
/* |
/* |
167 |
* C - the current buffer |
* C - the current buffer |
168 |
* R1 - the 1st reference buffer |
* R1 - the 1st reference buffer |
173 |
* |
* |
174 |
* R1 (8bit) = R1 |
* R1 (8bit) = R1 |
175 |
* R2 (8bit) = R2 |
* R2 (8bit) = R2 |
176 |
* C (8bit) = C |
* R (temp) = min((R1 + R2)/2, 255) |
177 |
* DCT (16bit)= C - min((R1 + R2)/2, 255) |
* DCT (16bit)= C - R |
178 |
|
* C (8bit) = R |
179 |
*/ |
*/ |
180 |
void |
void |
181 |
transfer_8to16sub2_c(int16_t * const dct, |
transfer_8to16sub2_c(int16_t * const dct, |
188 |
|
|
189 |
for (j = 0; j < 8; j++) { |
for (j = 0; j < 8; j++) { |
190 |
for (i = 0; i < 8; i++) { |
for (i = 0; i < 8; i++) { |
191 |
uint8_t c = cur[j * stride + i]; |
const uint8_t c = cur[j * stride + i]; |
192 |
int r = (ref1[j * stride + i] + ref2[j * stride + i] + 1) / 2; |
const uint8_t r = (ref1[j * stride + i] + ref2[j * stride + i] + 1) >> 1; |
193 |
|
cur[j * stride + i] = r; |
194 |
if (r > 255) { |
dct[j * 8 + i] = (int16_t) c - (int16_t) r; |
195 |
r = 255; |
} |
196 |
} |
} |
197 |
//cur[j * stride + i] = r; |
} |
198 |
|
|
199 |
|
void |
200 |
|
transfer_8to16sub2ro_c(int16_t * const dct, |
201 |
|
const uint8_t * const cur, |
202 |
|
const uint8_t * ref1, |
203 |
|
const uint8_t * ref2, |
204 |
|
const uint32_t stride) |
205 |
|
{ |
206 |
|
uint32_t i, j; |
207 |
|
|
208 |
|
for (j = 0; j < 8; j++) { |
209 |
|
for (i = 0; i < 8; i++) { |
210 |
|
const uint8_t c = cur[j * stride + i]; |
211 |
|
const uint8_t r = (ref1[j * stride + i] + ref2[j * stride + i] + 1) >> 1; |
212 |
dct[j * 8 + i] = (int16_t) c - (int16_t) r; |
dct[j * 8 + i] = (int16_t) c - (int16_t) r; |
213 |
} |
} |
214 |
} |
} |
229 |
const int16_t * const src, |
const int16_t * const src, |
230 |
uint32_t stride) |
uint32_t stride) |
231 |
{ |
{ |
232 |
uint32_t i, j; |
int i, j; |
233 |
|
|
234 |
for (j = 0; j < 8; j++) { |
for (j = 0; j < 8; j++) { |
235 |
for (i = 0; i < 8; i++) { |
for (i = 0; i < 8; i++) { |
236 |
|
#ifdef USE_REFERENCE_C |
237 |
int16_t pixel = (int16_t) dst[j * stride + i] + src[j * 8 + i]; |
int16_t pixel = (int16_t) dst[j * stride + i] + src[j * 8 + i]; |
238 |
|
|
239 |
if (pixel < 0) { |
if (pixel < 0) { |
242 |
pixel = 255; |
pixel = 255; |
243 |
} |
} |
244 |
dst[j * stride + i] = (uint8_t) pixel; |
dst[j * stride + i] = (uint8_t) pixel; |
245 |
|
#else |
246 |
|
const int16_t pixel = (int16_t) dst[j * stride + i] + src[j * 8 + i]; |
247 |
|
const uint8_t value = (uint8_t)( (pixel&~255) ? (-pixel)>>(8*sizeof(pixel)-1) : pixel ); |
248 |
|
dst[j*stride + i] = value; |
249 |
|
#endif |
250 |
|
|
251 |
} |
} |
252 |
} |
} |
253 |
} |
} |
266 |
const uint8_t * const src, |
const uint8_t * const src, |
267 |
const uint32_t stride) |
const uint32_t stride) |
268 |
{ |
{ |
269 |
uint32_t i, j; |
int j, i; |
270 |
|
|
271 |
for (j = 0; j < 8; j++) { |
for (j = 0; j < 8; ++j) { |
272 |
for (i = 0; i < 8; i++) { |
uint8_t *d = dst + j*stride; |
273 |
dst[j * stride + i] = src[j * stride + i]; |
const uint8_t *s = src + j*stride; |
274 |
|
|
275 |
|
for (i = 0; i < 8; ++i) |
276 |
|
{ |
277 |
|
*d++ = *s++; |
278 |
} |
} |
279 |
} |
} |
280 |
} |
} |