21 |
* along with this program ; if not, write to the Free Software |
* along with this program ; if not, write to the Free Software |
22 |
* Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA 02111-1307 USA |
* Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA 02111-1307 USA |
23 |
* |
* |
24 |
* $Id: estimation_bvop.c,v 1.1.2.5 2003-11-19 12:24:25 syskin Exp $ |
* $Id: estimation_bvop.c,v 1.1.2.8 2003-12-18 02:02:08 Isibaar Exp $ |
25 |
* |
* |
26 |
****************************************************************************/ |
****************************************************************************/ |
27 |
|
|
298 |
} |
} |
299 |
} |
} |
300 |
|
|
301 |
|
void |
302 |
|
CheckCandidate16no4v_qpel(const int x, const int y, SearchData * const data, const unsigned int Direction) |
303 |
|
{ |
304 |
|
int32_t sad, xc, yc; |
305 |
|
const uint8_t * Reference; |
306 |
|
uint32_t t; |
307 |
|
|
308 |
|
if ( (x > data->max_dx) || ( x < data->min_dx) |
309 |
|
|| (y > data->max_dy) || (y < data->min_dy) ) return; |
310 |
|
|
311 |
|
if (data->rrv && (!(x&1) && x !=0) | (!(y&1) && y !=0) ) return; /* non-zero even value */ |
312 |
|
|
313 |
|
Reference = xvid_me_interpolate16x16qpel(x, y, 0, data); |
314 |
|
|
315 |
|
xc = x/2; yc = y/2; |
316 |
|
t = d_mv_bits(x, y, data->predMV, data->iFcode, |
317 |
|
data->qpel^data->qpel_precision, data->rrv); |
318 |
|
|
319 |
|
sad = sad16(data->Cur, Reference, data->iEdgedWidth, 256*4096); |
320 |
|
sad += (data->lambda16 * t * sad)>>10; |
321 |
|
|
322 |
|
if (data->chroma && sad < *data->iMinSAD) |
323 |
|
sad += xvid_me_ChromaSAD((xc >> 1) + roundtab_79[xc & 0x3], |
324 |
|
(yc >> 1) + roundtab_79[yc & 0x3], data); |
325 |
|
|
326 |
|
if (sad < *(data->iMinSAD)) { |
327 |
|
data->iMinSAD2 = *(data->iMinSAD); |
328 |
|
data->currentQMV2.x = data->currentQMV->x; |
329 |
|
data->currentQMV2.y = data->currentQMV->y; |
330 |
|
|
331 |
|
data->iMinSAD[0] = sad; |
332 |
|
data->currentQMV[0].x = x; data->currentQMV[0].y = y; |
333 |
|
} else if (sad < data->iMinSAD2) { |
334 |
|
data->iMinSAD2 = sad; |
335 |
|
data->currentQMV2.x = x; data->currentQMV2.y = y; |
336 |
|
} |
337 |
|
} |
338 |
|
|
339 |
static __inline VECTOR |
static __inline VECTOR |
340 |
ChoosePred(const MACROBLOCK * const pMB, const uint32_t mode) |
ChoosePred(const MACROBLOCK * const pMB, const uint32_t mode) |
341 |
{ |
{ |
399 |
|
|
400 |
int i; |
int i; |
401 |
VECTOR pmv[7]; |
VECTOR pmv[7]; |
|
MainSearchFunc *MainSearchPtr; |
|
402 |
*Data->iMinSAD = MV_MAX_ERROR; |
*Data->iMinSAD = MV_MAX_ERROR; |
403 |
Data->iFcode = iFcode; |
Data->iFcode = iFcode; |
404 |
Data->qpel_precision = 0; |
Data->qpel_precision = 0; |
405 |
Data->chromaX = Data->chromaX = Data->chromaSAD = 256*4096; /* reset chroma-sad cache */ |
Data->chromaX = Data->chromaY = Data->chromaSAD = 256*4096; /* reset chroma-sad cache */ |
406 |
|
|
407 |
Data->RefP[0] = pRef->y + (x + Data->iEdgedWidth*y) * 16; |
Data->RefP[0] = pRef->y + (x + Data->iEdgedWidth*y) * 16; |
408 |
Data->RefP[2] = pRefH + (x + Data->iEdgedWidth*y) * 16; |
Data->RefP[2] = pRefH + (x + Data->iEdgedWidth*y) * 16; |
428 |
if (!vector_repeats(pmv, i) ) |
if (!vector_repeats(pmv, i) ) |
429 |
CheckCandidate16no4v(pmv[i].x, pmv[i].y, Data, i); |
CheckCandidate16no4v(pmv[i].x, pmv[i].y, Data, i); |
430 |
|
|
431 |
|
if (*Data->iMinSAD > 512) { |
432 |
|
unsigned int mask = make_mask(pmv, 7, Data->dir); |
433 |
|
|
434 |
|
MainSearchFunc *MainSearchPtr; |
435 |
if (MotionFlags & XVID_ME_USESQUARES16) MainSearchPtr = xvid_me_SquareSearch; |
if (MotionFlags & XVID_ME_USESQUARES16) MainSearchPtr = xvid_me_SquareSearch; |
436 |
else if (MotionFlags & XVID_ME_ADVANCEDDIAMOND16) MainSearchPtr = xvid_me_AdvDiamondSearch; |
else if (MotionFlags & XVID_ME_ADVANCEDDIAMOND16) MainSearchPtr = xvid_me_AdvDiamondSearch; |
437 |
else MainSearchPtr = xvid_me_DiamondSearch; |
else MainSearchPtr = xvid_me_DiamondSearch; |
438 |
|
|
|
if (*Data->iMinSAD > 512) { |
|
|
unsigned int mask = make_mask(pmv, 7, Data->dir); |
|
439 |
MainSearchPtr(Data->currentMV->x, Data->currentMV->y, Data, mask, CheckCandidate16no4v); |
MainSearchPtr(Data->currentMV->x, Data->currentMV->y, Data, mask, CheckCandidate16no4v); |
440 |
} |
} |
441 |
|
|
447 |
Data->qpel_precision = 1; |
Data->qpel_precision = 1; |
448 |
get_range(&Data->min_dx, &Data->max_dx, &Data->min_dy, &Data->max_dy, x, y, 4, |
get_range(&Data->min_dx, &Data->max_dx, &Data->min_dy, &Data->max_dy, x, y, 4, |
449 |
pParam->width, pParam->height, iFcode, 2, 0); |
pParam->width, pParam->height, iFcode, 2, 0); |
450 |
|
|
451 |
|
if (MotionFlags & XVID_ME_QUARTERPELREFINE16) { |
452 |
|
if(MotionFlags & XVID_ME_FASTREFINE16) |
453 |
|
SubpelRefine_Fast(Data, CheckCandidate16no4v_qpel); |
454 |
|
else |
455 |
xvid_me_SubpelRefine(Data, CheckCandidate16no4v); |
xvid_me_SubpelRefine(Data, CheckCandidate16no4v); |
456 |
} |
} |
457 |
|
} |
458 |
|
|
459 |
/* three bits are needed to code backward mode. four for forward */ |
/* three bits are needed to code backward mode. four for forward */ |
460 |
|
|
491 |
const uint32_t x, const uint32_t y, |
const uint32_t x, const uint32_t y, |
492 |
const SearchData * const Data) |
const SearchData * const Data) |
493 |
{ |
{ |
494 |
|
int k; |
495 |
|
|
496 |
|
if (!Data->chroma) { |
497 |
int dx = 0, dy = 0, b_dx = 0, b_dy = 0; |
int dx = 0, dy = 0, b_dx = 0, b_dy = 0; |
498 |
int32_t sum; |
int32_t sum; |
|
int k; |
|
499 |
const uint32_t stride = Data->iEdgedWidth/2; |
const uint32_t stride = Data->iEdgedWidth/2; |
500 |
/* this is not full chroma compensation, only its fullpel approximation. should work though */ |
/* this is not full chroma compensation, only its fullpel approximation. should work though */ |
501 |
|
|
523 |
b_Ref->v + (y*8 + b_dy/2) * stride + x*8 + b_dx/2, |
b_Ref->v + (y*8 + b_dy/2) * stride + x*8 + b_dx/2, |
524 |
stride); |
stride); |
525 |
|
|
526 |
if (sum < MAX_CHROMA_SAD_FOR_SKIP * (int)Data->iQuant) { |
if (sum >= MAX_CHROMA_SAD_FOR_SKIP * (int)Data->iQuant) return; /* no skip */ |
527 |
|
} |
528 |
|
|
529 |
|
/* skip */ |
530 |
pMB->mode = MODE_DIRECT_NONE_MV; /* skipped */ |
pMB->mode = MODE_DIRECT_NONE_MV; /* skipped */ |
531 |
for (k = 0; k < 4; k++) { |
for (k = 0; k < 4; k++) { |
532 |
pMB->qmvs[k] = pMB->mvs[k] = Data->directmvF[k]; |
pMB->qmvs[k] = pMB->mvs[k] = Data->directmvF[k]; |
533 |
pMB->b_qmvs[k] = pMB->b_mvs[k] = Data->directmvB[k]; |
pMB->b_qmvs[k] = pMB->b_mvs[k] = Data->directmvB[k]; |
534 |
} |
} |
535 |
} |
} |
|
} |
|
536 |
|
|
537 |
static uint32_t |
static uint32_t |
538 |
SearchDirect(const IMAGE * const f_Ref, |
SearchDirect(const IMAGE * const f_Ref, |
612 |
/* initial (fast) skip decision */ |
/* initial (fast) skip decision */ |
613 |
if (*Data->iMinSAD < (int)Data->iQuant * INITIAL_SKIP_THRESH * (Data->chroma?3:2)) { |
if (*Data->iMinSAD < (int)Data->iQuant * INITIAL_SKIP_THRESH * (Data->chroma?3:2)) { |
614 |
/* possible skip */ |
/* possible skip */ |
|
if (Data->chroma) { |
|
|
pMB->mode = MODE_DIRECT_NONE_MV; |
|
|
return *Data->iMinSAD; /* skip. */ |
|
|
} else { |
|
615 |
SkipDecisionB(pCur, f_Ref, b_Ref, pMB, x, y, Data); |
SkipDecisionB(pCur, f_Ref, b_Ref, pMB, x, y, Data); |
616 |
if (pMB->mode == MODE_DIRECT_NONE_MV) return *Data->iMinSAD; /* skip. */ |
if (pMB->mode == MODE_DIRECT_NONE_MV) return *Data->iMinSAD; /* skipped */ |
|
} |
|
617 |
} |
} |
618 |
|
|
619 |
*Data->iMinSAD += Data->lambda16; |
*Data->iMinSAD += Data->lambda16; |
620 |
skip_sad = *Data->iMinSAD; |
skip_sad = *Data->iMinSAD; |
621 |
|
|
622 |
/* |
if (!(MotionFlags & XVID_ME_SKIP_DELTASEARCH)) { |
|
* DIRECT MODE DELTA VECTOR SEARCH. |
|
|
* This has to be made more effective, but at the moment I'm happy it's running at all |
|
|
*/ |
|
|
|
|
623 |
if (MotionFlags & XVID_ME_USESQUARES16) MainSearchPtr = xvid_me_SquareSearch; |
if (MotionFlags & XVID_ME_USESQUARES16) MainSearchPtr = xvid_me_SquareSearch; |
624 |
else if (MotionFlags & XVID_ME_ADVANCEDDIAMOND16) MainSearchPtr = xvid_me_AdvDiamondSearch; |
else if (MotionFlags & XVID_ME_ADVANCEDDIAMOND16) MainSearchPtr = xvid_me_AdvDiamondSearch; |
625 |
else MainSearchPtr = xvid_me_DiamondSearch; |
else MainSearchPtr = xvid_me_DiamondSearch; |
627 |
MainSearchPtr(0, 0, Data, 255, CheckCandidate); |
MainSearchPtr(0, 0, Data, 255, CheckCandidate); |
628 |
|
|
629 |
xvid_me_SubpelRefine(Data, CheckCandidate); |
xvid_me_SubpelRefine(Data, CheckCandidate); |
630 |
|
} |
631 |
|
|
632 |
*best_sad = *Data->iMinSAD; |
*best_sad = *Data->iMinSAD; |
633 |
|
|
794 |
SubpelRefine_dir(Data, CheckCandidateInt, 2); |
SubpelRefine_dir(Data, CheckCandidateInt, 2); |
795 |
} |
} |
796 |
|
|
797 |
*Data->iMinSAD += (2+3) * Data->lambda16; /* two bits are needed to code interpolate mode. */ |
*Data->iMinSAD += 2 * Data->lambda16; /* two bits are needed to code interpolate mode. */ |
798 |
|
|
799 |
if (*Data->iMinSAD < *best_sad) { |
if (*Data->iMinSAD < *best_sad) { |
800 |
*best_sad = *Data->iMinSAD; |
*best_sad = *Data->iMinSAD; |
852 |
memset(&Data, 0, sizeof(SearchData)); |
memset(&Data, 0, sizeof(SearchData)); |
853 |
|
|
854 |
Data.iEdgedWidth = pParam->edged_width; |
Data.iEdgedWidth = pParam->edged_width; |
|
Data.lambda16 = xvid_me_lambda_vec16[MAX(frame->quant-2, 2)]; |
|
855 |
Data.qpel = pParam->vol_flags & XVID_VOL_QUARTERPEL ? 1 : 0; |
Data.qpel = pParam->vol_flags & XVID_VOL_QUARTERPEL ? 1 : 0; |
856 |
Data.rounding = 0; |
Data.rounding = 0; |
857 |
Data.chroma = frame->motion_flags & XVID_ME_CHROMA_BVOP; |
Data.chroma = frame->motion_flags & XVID_ME_CHROMA_BVOP; |
876 |
continue; |
continue; |
877 |
} |
} |
878 |
|
|
879 |
|
Data.lambda16 = xvid_me_lambda_vec16[b_mb->quant]; |
880 |
|
|
881 |
Data.Cur = frame->image.y + (j * Data.iEdgedWidth + i) * 16; |
Data.Cur = frame->image.y + (j * Data.iEdgedWidth + i) * 16; |
882 |
Data.CurU = frame->image.u + (j * Data.iEdgedWidth/2 + i) * 8; |
Data.CurU = frame->image.u + (j * Data.iEdgedWidth/2 + i) * 8; |
883 |
Data.CurV = frame->image.v + (j * Data.iEdgedWidth/2 + i) * 8; |
Data.CurV = frame->image.v + (j * Data.iEdgedWidth/2 + i) * 8; |
925 |
&Data); |
&Data); |
926 |
|
|
927 |
/* final skip decision */ |
/* final skip decision */ |
928 |
if ( (skip_sad < Data.iQuant * MAX_SAD00_FOR_SKIP * 2) |
if ( (skip_sad < Data.iQuant * MAX_SAD00_FOR_SKIP * (Data.chroma ? 3:2) ) |
929 |
&& ((100*best_sad)/(skip_sad+1) > FINAL_SKIP_THRESH) ) |
&& ((100*best_sad)/(skip_sad+1) > FINAL_SKIP_THRESH) ) |
930 |
|
|
931 |
SkipDecisionB(&frame->image, f_ref, b_ref, pMB, i, j, &Data); |
SkipDecisionB(&frame->image, f_ref, b_ref, pMB, i, j, &Data); |
932 |
|
|
933 |
switch (pMB->mode) { |
switch (pMB->mode) { |