3 |
* XVID MPEG-4 VIDEO CODEC |
* XVID MPEG-4 VIDEO CODEC |
4 |
* - Native API implementation - |
* - Native API implementation - |
5 |
* |
* |
6 |
|
* Copyright(C) 2001-2003 Peter Ross <pross@xvid.org> |
7 |
|
* |
8 |
* This program is free software ; you can redistribute it and/or modify |
* This program is free software ; you can redistribute it and/or modify |
9 |
* it under the terms of the GNU General Public License as published by |
* it under the terms of the GNU General Public License as published by |
10 |
* the Free Software Foundation ; either version 2 of the License, or |
* the Free Software Foundation ; either version 2 of the License, or |
19 |
* along with this program ; if not, write to the Free Software |
* along with this program ; if not, write to the Free Software |
20 |
* Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA 02111-1307 USA |
* Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA 02111-1307 USA |
21 |
* |
* |
22 |
* $Id: xvid.c,v 1.45.2.5 2003-06-09 01:16:57 edgomez Exp $ |
* $Id: xvid.c,v 1.45.2.15 2003-10-01 23:23:01 edgomez Exp $ |
23 |
* |
* |
24 |
****************************************************************************/ |
****************************************************************************/ |
25 |
|
|
46 |
#include "utils/emms.h" |
#include "utils/emms.h" |
47 |
#include "utils/timer.h" |
#include "utils/timer.h" |
48 |
#include "bitstream/mbcoding.h" |
#include "bitstream/mbcoding.h" |
49 |
|
#include "image/qpel.h" |
50 |
|
|
51 |
#if defined(_DEBUG) |
#if defined(_DEBUG) |
52 |
unsigned int xvid_debug = 0; /* xvid debug mask */ |
unsigned int xvid_debug = 0; /* xvid debug mask */ |
164 |
{ |
{ |
165 |
unsigned int cpu_flags; |
unsigned int cpu_flags; |
166 |
|
|
167 |
if (XVID_MAJOR(init->version) != 1) /* v1.x.x */ |
if (XVID_VERSION_MAJOR(init->version) != 1) /* v1.x.x */ |
168 |
return XVID_ERR_VERSION; |
return XVID_ERR_VERSION; |
169 |
|
|
170 |
cpu_flags = (init->cpu_flags & XVID_CPU_FORCE) ? init->cpu_flags : detect_cpu_flags(); |
cpu_flags = (init->cpu_flags & XVID_CPU_FORCE) ? init->cpu_flags : detect_cpu_flags(); |
183 |
/* Restore FPU context : emms_c is a nop functions */ |
/* Restore FPU context : emms_c is a nop functions */ |
184 |
emms = emms_c; |
emms = emms_c; |
185 |
|
|
186 |
|
/* Qpel stuff */ |
187 |
|
xvid_QP_Funcs = &xvid_QP_Funcs_C; |
188 |
|
xvid_QP_Add_Funcs = &xvid_QP_Add_Funcs_C; |
189 |
|
xvid_Init_QP(); |
190 |
|
|
191 |
/* Quantization functions */ |
/* Quantization functions */ |
192 |
quant_intra = quant_intra_c; |
quant_intra = quant_intra_c; |
193 |
dequant_intra = dequant_intra_c; |
dequant_intra = dequant_intra_c; |
294 |
|
|
295 |
#if defined(ARCH_IS_IA32) |
#if defined(ARCH_IS_IA32) |
296 |
|
|
297 |
if ((cpu_flags & XVID_CPU_ASM)) |
if ((cpu_flags & XVID_CPU_ASM)) { |
|
{ |
|
298 |
vfilter_31 = xvid_VFilter_31_x86; |
vfilter_31 = xvid_VFilter_31_x86; |
299 |
hfilter_31 = xvid_HFilter_31_x86; |
hfilter_31 = xvid_HFilter_31_x86; |
300 |
} |
} |
313 |
fdct = fdct_mmx; |
fdct = fdct_mmx; |
314 |
idct = idct_mmx; |
idct = idct_mmx; |
315 |
|
|
316 |
|
/* Qpel stuff */ |
317 |
|
xvid_QP_Funcs = &xvid_QP_Funcs_mmx; |
318 |
|
xvid_QP_Add_Funcs = &xvid_QP_Add_Funcs_mmx; |
319 |
|
|
320 |
/* Quantization related functions */ |
/* Quantization related functions */ |
321 |
quant_intra = quant_intra_mmx; |
quant_intra = quant_intra_mmx; |
322 |
dequant_intra = dequant_intra_mmx; |
dequant_intra = dequant_intra_mmx; |
480 |
interpolate8x8_halfpel_hv = interpolate8x8_halfpel_hv_3dne; |
interpolate8x8_halfpel_hv = interpolate8x8_halfpel_hv_3dne; |
481 |
} |
} |
482 |
|
|
483 |
|
#if defined(EXPERIMENTAL_SSE2_CODE) /* mark the whole SSE2 stuff as experimental. At least on |
484 |
|
my P4, it crashes... */ |
485 |
if ((cpu_flags & XVID_CPU_SSE2)) { |
if ((cpu_flags & XVID_CPU_SSE2)) { |
486 |
|
|
487 |
calc_cbp = calc_cbp_sse2; |
calc_cbp = calc_cbp_sse2; |
492 |
quant_inter = quant_inter_sse2; |
quant_inter = quant_inter_sse2; |
493 |
dequant_inter = dequant_inter_sse2; |
dequant_inter = dequant_inter_sse2; |
494 |
|
|
|
#if defined(EXPERIMENTAL_SSE2_CODE) |
|
495 |
/* ME; slower than xmm */ |
/* ME; slower than xmm */ |
496 |
sad16 = sad16_sse2; |
sad16 = sad16_sse2; |
497 |
dev16 = dev16_sse2; |
dev16 = dev16_sse2; |
|
#endif |
|
498 |
/* Forward and Inverse DCT */ |
/* Forward and Inverse DCT */ |
499 |
|
#if 0 /* Both function are known to be unprecise, better keep them deactivated */ |
500 |
idct = idct_sse2; |
idct = idct_sse2; |
501 |
fdct = fdct_sse2; |
fdct = fdct_sse2; |
502 |
|
#endif |
503 |
} |
} |
504 |
#endif |
#endif |
505 |
|
#endif |
506 |
|
|
507 |
#if defined(ARCH_IS_IA64) |
#if defined(ARCH_IS_IA64) |
508 |
if ((cpu_flags & XVID_CPU_ASM)) { /* use assembler routines? */ |
if ((cpu_flags & XVID_CPU_ASM)) { /* use assembler routines? */ |
527 |
transfer_8to16sub2 = transfer_8to16sub2_ia64; |
transfer_8to16sub2 = transfer_8to16sub2_ia64; |
528 |
transfer_16to8add = transfer_16to8add_ia64; |
transfer_16to8add = transfer_16to8add_ia64; |
529 |
transfer8x8_copy = transfer8x8_copy_ia64; |
transfer8x8_copy = transfer8x8_copy_ia64; |
|
DPRINTF(DPRINTF_DEBUG, "Using IA-64 assembler routines."); |
|
530 |
} |
} |
531 |
#endif |
#endif |
532 |
|
|
559 |
static int |
static int |
560 |
xvid_gbl_info(xvid_gbl_info_t * info) |
xvid_gbl_info(xvid_gbl_info_t * info) |
561 |
{ |
{ |
562 |
if (XVID_MAJOR(info->version) != 1) /* v1.x.x */ |
if (XVID_VERSION_MAJOR(info->version) != 1) /* v1.x.x */ |
563 |
return XVID_ERR_VERSION; |
return XVID_ERR_VERSION; |
564 |
|
|
565 |
info->actual_version = XVID_VERSION; |
info->actual_version = XVID_VERSION; |
585 |
int height2; |
int height2; |
586 |
IMAGE img; |
IMAGE img; |
587 |
|
|
588 |
if (XVID_MAJOR(convert->version) != 1) /* v1.x.x */ |
if (XVID_VERSION_MAJOR(convert->version) != 1) /* v1.x.x */ |
589 |
return XVID_ERR_VERSION; |
return XVID_ERR_VERSION; |
590 |
|
|
591 |
#if 0 |
#if 0 |