--- trunk/xvidcore/src/encoder.c 2002/03/26 11:16:08 69 +++ trunk/xvidcore/src/encoder.c 2002/03/29 07:03:24 84 @@ -121,55 +121,38 @@ pEnc->iFrameNum = 0; pEnc->iMaxKeyInterval = pParam->max_key_interval; - if (image_create(&pEnc->sCurrent, pEnc->mbParam.edged_width, pEnc->mbParam.edged_height) < 0) - { - xvid_free(pEnc); - return XVID_ERR_MEMORY; - } - - if (image_create(&pEnc->sReference, pEnc->mbParam.edged_width, pEnc->mbParam.edged_height) < 0) - { - image_destroy(&pEnc->sCurrent, pEnc->mbParam.edged_width, pEnc->mbParam.edged_height); - xvid_free(pEnc); - return XVID_ERR_MEMORY; - } - - if (image_create(&pEnc->vInterH, pEnc->mbParam.edged_width, pEnc->mbParam.edged_height) < 0) - { - image_destroy(&pEnc->sCurrent, pEnc->mbParam.edged_width, pEnc->mbParam.edged_height); - image_destroy(&pEnc->sReference, pEnc->mbParam.edged_width, pEnc->mbParam.edged_height); - xvid_free(pEnc); - return XVID_ERR_MEMORY; - } - - if (image_create(&pEnc->vInterV, pEnc->mbParam.edged_width, pEnc->mbParam.edged_height) < 0) - { - image_destroy(&pEnc->sCurrent, pEnc->mbParam.edged_width, pEnc->mbParam.edged_height); - image_destroy(&pEnc->sReference, pEnc->mbParam.edged_width, pEnc->mbParam.edged_height); - image_destroy(&pEnc->vInterH, pEnc->mbParam.edged_width, pEnc->mbParam.edged_height); - xvid_free(pEnc); - return XVID_ERR_MEMORY; - } + /* try to allocate memory */ - if (image_create(&pEnc->vInterHV, pEnc->mbParam.edged_width, pEnc->mbParam.edged_height) < 0) - { - image_destroy(&pEnc->sCurrent, pEnc->mbParam.edged_width, pEnc->mbParam.edged_height); - image_destroy(&pEnc->sReference, pEnc->mbParam.edged_width, pEnc->mbParam.edged_height); - image_destroy(&pEnc->vInterH, pEnc->mbParam.edged_width, pEnc->mbParam.edged_height); - image_destroy(&pEnc->vInterV, pEnc->mbParam.edged_width, pEnc->mbParam.edged_height); - xvid_free(pEnc); - return XVID_ERR_MEMORY; - } - - pEnc->pMBs = xvid_malloc(sizeof(MACROBLOCK) * pEnc->mbParam.mb_width * pEnc->mbParam.mb_height, CACHE_LINE); - if (pEnc->pMBs == NULL) + pEnc->sCurrent.y = pEnc->sCurrent.u = pEnc->sCurrent.v = NULL; + pEnc->sReference.y = pEnc->sReference.u = pEnc->sReference.v = NULL; + pEnc->vInterH.y = pEnc->vInterH.u = pEnc->vInterH.v = NULL; + pEnc->vInterV.y = pEnc->vInterV.u = pEnc->vInterV.v = NULL; + pEnc->vInterVf.y = pEnc->vInterVf.u = pEnc->vInterVf.v = NULL; + pEnc->vInterHV.y = pEnc->vInterHV.u = pEnc->vInterHV.v = NULL; + pEnc->vInterHVf.y = pEnc->vInterHVf.u = pEnc->vInterHVf.v = NULL; + + pEnc->pMBs = NULL; + + if (image_create(&pEnc->sCurrent, pEnc->mbParam.edged_width, pEnc->mbParam.edged_height) < 0 || + image_create(&pEnc->sReference, pEnc->mbParam.edged_width, pEnc->mbParam.edged_height) < 0 || + image_create(&pEnc->vInterH, pEnc->mbParam.edged_width, pEnc->mbParam.edged_height) < 0 || + image_create(&pEnc->vInterV, pEnc->mbParam.edged_width, pEnc->mbParam.edged_height) < 0 || + image_create(&pEnc->vInterVf, pEnc->mbParam.edged_width, pEnc->mbParam.edged_height) < 0 || + image_create(&pEnc->vInterHV, pEnc->mbParam.edged_width, pEnc->mbParam.edged_height) < 0 || + image_create(&pEnc->vInterHVf, pEnc->mbParam.edged_width, pEnc->mbParam.edged_height) < 0 || + (pEnc->pMBs = xvid_malloc(sizeof(MACROBLOCK) * pEnc->mbParam.mb_width * pEnc->mbParam.mb_height, CACHE_LINE)) == NULL) { image_destroy(&pEnc->sCurrent, pEnc->mbParam.edged_width, pEnc->mbParam.edged_height); image_destroy(&pEnc->sReference, pEnc->mbParam.edged_width, pEnc->mbParam.edged_height); image_destroy(&pEnc->vInterH, pEnc->mbParam.edged_width, pEnc->mbParam.edged_height); image_destroy(&pEnc->vInterV, pEnc->mbParam.edged_width, pEnc->mbParam.edged_height); + image_destroy(&pEnc->vInterVf, pEnc->mbParam.edged_width, pEnc->mbParam.edged_height); image_destroy(&pEnc->vInterHV, pEnc->mbParam.edged_width, pEnc->mbParam.edged_height); - xvid_free(pEnc); + image_destroy(&pEnc->vInterHVf, pEnc->mbParam.edged_width, pEnc->mbParam.edged_height); + if (pEnc) + { + xvid_free(pEnc); + } return XVID_ERR_MEMORY; } @@ -255,9 +238,14 @@ { int * temp_dquants = (int *) xvid_malloc(pEnc->mbParam.mb_width * pEnc->mbParam.mb_height * sizeof(int), CACHE_LINE); - pEnc->mbParam.quant = adaptive_quantization(pEnc->sCurrent.y, pEnc->mbParam.width, - temp_dquants, pFrame->quant, pFrame->quant, - 2*pFrame->quant, pEnc->mbParam.mb_width, pEnc->mbParam.mb_height); + pEnc->mbParam.quant = adaptive_quantization(pEnc->sCurrent.y, + pEnc->mbParam.width, + temp_dquants, + pEnc->mbParam.quant, + pEnc->mbParam.quant, + 2*pEnc->mbParam.quant, + pEnc->mbParam.mb_width, + pEnc->mbParam.mb_height); for (y = 0; y < pEnc->mbParam.mb_height; y++) for (x = 0; x < pEnc->mbParam.mb_width; x++) @@ -276,6 +264,8 @@ else if(pEnc->mbParam.global_flags & XVID_MPEGQUANT) { int ret1, ret2; + ret1 = ret2 = 0; + if(pEnc->mbParam.quant_type != MPEG4_QUANT) write_vol_header = 1; @@ -364,8 +354,10 @@ static int FrameCodeI(Encoder * pEnc, Bitstream * bs, uint32_t *pBits) { - CACHE_ALIGN int16_t dct_codes[6][64]; - CACHE_ALIGN int16_t qcoeff[6][64]; + + DECLARE_ALIGNED_MATRIX(dct_codes, 6, 64, int16_t, CACHE_LINE); + DECLARE_ALIGNED_MATRIX(qcoeff, 6, 64, int16_t, CACHE_LINE); + uint16_t x, y; pEnc->iFrameNum = 0; @@ -417,8 +409,8 @@ { float fSigma; - CACHE_ALIGN int16_t dct_codes[6][64]; - CACHE_ALIGN int16_t qcoeff[6][64]; + DECLARE_ALIGNED_MATRIX(dct_codes, 6, 64, int16_t, CACHE_LINE); + DECLARE_ALIGNED_MATRIX(qcoeff, 6, 64, int16_t, CACHE_LINE); int iLimit; uint32_t x, y; @@ -429,7 +421,12 @@ IMAGE *pRef = &pEnc->sReference; start_timer(); - image_setedges(pRef,pEnc->mbParam.edged_width, pEnc->mbParam.edged_height, pEnc->mbParam.width, pEnc->mbParam.height, pEnc->mbParam.global_flags & XVID_INTERLACING); + image_setedges(pRef, + pEnc->mbParam.edged_width, + pEnc->mbParam.edged_height, + pEnc->mbParam.width, + pEnc->mbParam.height, + pEnc->mbParam.global_flags & XVID_INTERLACING); stop_edges_timer(); pEnc->mbParam.rounding_type = 1 - pEnc->mbParam.rounding_type; @@ -439,18 +436,49 @@ else iLimit = pEnc->mbParam.mb_width * pEnc->mbParam.mb_height + 1; - if ((pEnc->mbParam.global_flags & XVID_HALFPEL) > 0) { + if ((pEnc->mbParam.global_flags & XVID_HALFPEL) > 0) + { + IMAGE *vInterV = NULL; + IMAGE *vInterVf = NULL; + IMAGE *vInterHV = NULL; + IMAGE *vInterHVf = NULL; + + // interpolate fields together if field ME is used + if (pEnc->mbParam.global_flags & XVID_INTERLACING && + pEnc->mbParam.global_flags & XVID_FIELDME) + { + vInterVf = &pEnc->vInterVf; + vInterHVf = &pEnc->vInterHVf; + } + + // perform normal interpolation, unless only field-based ME is allowed + if (!(pEnc->mbParam.global_flags & XVID_INTERLACING) || + !(pEnc->mbParam.global_flags & XVID_FIELDMEONLY)) + { + vInterV = &pEnc->vInterV; + vInterHV = &pEnc->vInterHV; + } + start_timer(); - image_interpolate(pRef, &pEnc->vInterH, &pEnc->vInterV, &pEnc->vInterHV, - pEnc->mbParam.edged_width, pEnc->mbParam.edged_height, - pEnc->mbParam.rounding_type); + image_interpolate(pRef, + &pEnc->vInterH, + vInterV, vInterVf, + vInterHV, vInterHVf, + pEnc->mbParam.edged_width, + pEnc->mbParam.edged_height, + pEnc->mbParam.rounding_type); stop_inter_timer(); } start_timer(); - bIntra = MotionEstimation(pEnc->pMBs, &pEnc->mbParam, &pEnc->sReference, - &pEnc->vInterH, &pEnc->vInterV, - &pEnc->vInterHV, &pEnc->sCurrent, iLimit); + bIntra = MotionEstimation(pEnc->pMBs, + &pEnc->mbParam, + &pEnc->sReference, + &pEnc->vInterH, + &pEnc->vInterV, &pEnc->vInterVf, + &pEnc->vInterHV, &pEnc->vInterHVf, + &pEnc->sCurrent, + iLimit); stop_motion_timer(); if (bIntra == 1) @@ -481,9 +509,14 @@ if (!bIntra) { start_timer(); - MBMotionCompensation(pMB, x, y, &pEnc->sReference, - &pEnc->vInterH, &pEnc->vInterV, - &pEnc->vInterHV, &pEnc->sCurrent, dct_codes, + MBMotionCompensation(pMB, + x, y, + &pEnc->sReference, + &pEnc->vInterH, + &pEnc->vInterV, &pEnc->vInterVf, + &pEnc->vInterHV, &pEnc->vInterHVf, + &pEnc->sCurrent, + dct_codes, pEnc->mbParam.width, pEnc->mbParam.height, pEnc->mbParam.edged_width,