--- trunk/xvidcore/src/prediction/mbprediction.c 2002/04/25 06:55:00 136 +++ trunk/xvidcore/src/prediction/mbprediction.c 2002/06/30 10:46:29 252 @@ -42,6 +42,7 @@ * * * Revision history: * * * + * 29.06.2002 predict_acdc() bounding * * 12.12.2001 improved calc_acdc_prediction; removed need for memcpy * * 15.12.2001 moved pmv displacement to motion estimation * * 30.11.2001 mmx cbp support * @@ -59,13 +60,17 @@ #define DIV_DIV(A,B) ( (A) > 0 ? ((A)+((B)>>1))/(B) : ((A)-((B)>>1))/(B) ) -static int __inline rescale(int predict_quant, int current_quant, int coeff) +static int __inline +rescale(int predict_quant, + int current_quant, + int coeff) { - return (coeff != 0) ? DIV_DIV((coeff) * (predict_quant), (current_quant)) : 0; + return (coeff != 0) ? DIV_DIV((coeff) * (predict_quant), + (current_quant)) : 0; } -static const int16_t default_acdc_values[15] = { +static const int16_t default_acdc_values[15] = { 1024, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0 @@ -77,14 +82,20 @@ */ -void predict_acdc(MACROBLOCK *pMBs, - uint32_t x, uint32_t y, uint32_t mb_width, - uint32_t block, - int16_t qcoeff[64], - uint32_t current_quant, - int32_t iDcScaler, - int16_t predictors[8]) +void +predict_acdc(MACROBLOCK * pMBs, + uint32_t x, + uint32_t y, + uint32_t mb_width, + uint32_t block, + int16_t qcoeff[64], + uint32_t current_quant, + int32_t iDcScaler, + int16_t predictors[8], + const int bound) + { + const int mbpos = (y * mb_width) + x; int16_t *left, *top, *diag, *current; int32_t left_quant = current_quant; @@ -94,8 +105,8 @@ const int16_t *pTop = default_acdc_values; const int16_t *pDiag = default_acdc_values; - uint32_t index = x + y * mb_width; // current macroblock - int * acpred_direction = &pMBs[index].acpred_directions[block]; + uint32_t index = x + y * mb_width; // current macroblock + int *acpred_direction = &pMBs[index].acpred_directions[block]; uint32_t i; left = top = diag = current = 0; @@ -104,27 +115,28 @@ // left macroblock - if(x && (pMBs[index - 1].mode == MODE_INTRA - || pMBs[index - 1].mode == MODE_INTRA_Q)) { + if (x && mbpos >= bound + 1 && + (pMBs[index - 1].mode == MODE_INTRA || + pMBs[index - 1].mode == MODE_INTRA_Q)) { left = pMBs[index - 1].pred_values[0]; left_quant = pMBs[index - 1].quant; //DEBUGI("LEFT", *(left+MBPRED_SIZE)); } - // top macroblock - - if(y && (pMBs[index - mb_width].mode == MODE_INTRA - || pMBs[index - mb_width].mode == MODE_INTRA_Q)) { + + if (mbpos >= bound + (int)mb_width && + (pMBs[index - mb_width].mode == MODE_INTRA || + pMBs[index - mb_width].mode == MODE_INTRA_Q)) { top = pMBs[index - mb_width].pred_values[0]; top_quant = pMBs[index - mb_width].quant; } - // diag macroblock - - if(x && y && (pMBs[index - 1 - mb_width].mode == MODE_INTRA - || pMBs[index - 1 - mb_width].mode == MODE_INTRA_Q)) { + + if (x && mbpos >= bound + (int)mb_width + 1 && + (pMBs[index - 1 - mb_width].mode == MODE_INTRA || + pMBs[index - 1 - mb_width].mode == MODE_INTRA_Q)) { diag = pMBs[index - 1 - mb_width].pred_values[0]; } @@ -132,89 +144,85 @@ current = pMBs[index].pred_values[0]; // now grab pLeft, pTop, pDiag _blocks_ - + switch (block) { - - case 0: - if(left) + + case 0: + if (left) pLeft = left + MBPRED_SIZE; - - if(top) + + if (top) pTop = top + (MBPRED_SIZE << 1); - - if(diag) + + if (diag) pDiag = diag + 3 * MBPRED_SIZE; - + break; - + case 1: pLeft = current; left_quant = current_quant; - - if(top) { + + if (top) { pTop = top + 3 * MBPRED_SIZE; pDiag = top + (MBPRED_SIZE << 1); } break; - + case 2: - if(left) { + if (left) { pLeft = left + 3 * MBPRED_SIZE; pDiag = left + MBPRED_SIZE; } - + pTop = current; top_quant = current_quant; break; - + case 3: pLeft = current + (MBPRED_SIZE << 1); left_quant = current_quant; - + pTop = current + MBPRED_SIZE; top_quant = current_quant; - + pDiag = current; - + break; - + case 4: - if(left) + if (left) pLeft = left + (MBPRED_SIZE << 2); - if(top) + if (top) pTop = top + (MBPRED_SIZE << 2); - if(diag) + if (diag) pDiag = diag + (MBPRED_SIZE << 2); break; - + case 5: - if(left) + if (left) pLeft = left + 5 * MBPRED_SIZE; - if(top) + if (top) pTop = top + 5 * MBPRED_SIZE; - if(diag) + if (diag) pDiag = diag + 5 * MBPRED_SIZE; break; } - // determine ac prediction direction & ac/dc predictor - // place rescaled ac/dc predictions into predictors[] for later use + // determine ac prediction direction & ac/dc predictor + // place rescaled ac/dc predictions into predictors[] for later use - if(ABS(pLeft[0] - pDiag[0]) < ABS(pDiag[0] - pTop[0])) { - *acpred_direction = 1; // vertical + if (ABS(pLeft[0] - pDiag[0]) < ABS(pDiag[0] - pTop[0])) { + *acpred_direction = 1; // vertical predictors[0] = DIV_DIV(pTop[0], iDcScaler); - for (i = 1; i < 8; i++) - { + for (i = 1; i < 8; i++) { predictors[i] = rescale(top_quant, current_quant, pTop[i]); } - } - else - { - *acpred_direction = 2; // horizontal + } else { + *acpred_direction = 2; // horizontal predictors[0] = DIV_DIV(pLeft[0], iDcScaler); - for (i = 1; i < 8; i++) - { + for (i = 1; i < 8; i++) { predictors[i] = rescale(left_quant, current_quant, pLeft[i + 7]); } } @@ -226,45 +234,45 @@ */ -void add_acdc(MACROBLOCK *pMB, - uint32_t block, - int16_t dct_codes[64], - uint32_t iDcScaler, - int16_t predictors[8]) +void +add_acdc(MACROBLOCK * pMB, + uint32_t block, + int16_t dct_codes[64], + uint32_t iDcScaler, + int16_t predictors[8]) { uint8_t acpred_direction = pMB->acpred_directions[block]; - int16_t * pCurrent = pMB->pred_values[block]; + int16_t *pCurrent = pMB->pred_values[block]; uint32_t i; + DPRINTF(DPRINTF_COEFF,"predictor[0] %i", predictors[0]); + dct_codes[0] += predictors[0]; // dc prediction pCurrent[0] = dct_codes[0] * iDcScaler; - if (acpred_direction == 1) - { - for (i = 1; i < 8; i++) - { + if (acpred_direction == 1) { + for (i = 1; i < 8; i++) { int level = dct_codes[i] + predictors[i]; + + DPRINTF(DPRINTF_COEFF,"predictor[%i] %i",i, predictors[i]); + dct_codes[i] = level; pCurrent[i] = level; - pCurrent[i+7] = dct_codes[i*8]; + pCurrent[i + 7] = dct_codes[i * 8]; } - } - else if (acpred_direction == 2) - { - for (i = 1; i < 8; i++) - { - int level = dct_codes[i*8] + predictors[i]; - dct_codes[i*8] = level; - pCurrent[i+7] = level; + } else if (acpred_direction == 2) { + for (i = 1; i < 8; i++) { + int level = dct_codes[i * 8] + predictors[i]; + DPRINTF(DPRINTF_COEFF,"predictor[%i] %i",i*8, predictors[i]); + + dct_codes[i * 8] = level; + pCurrent[i + 7] = level; pCurrent[i] = dct_codes[i]; } - } - else - { - for (i = 1; i < 8; i++) - { + } else { + for (i = 1; i < 8; i++) { pCurrent[i] = dct_codes[i]; - pCurrent[i+7] = dct_codes[i*8]; + pCurrent[i + 7] = dct_codes[i * 8]; } } } @@ -284,13 +292,14 @@ S2 = sum of all qcoeff */ -uint32_t calc_acdc(MACROBLOCK *pMB, - uint32_t block, - int16_t qcoeff[64], - uint32_t iDcScaler, - int16_t predictors[8]) +uint32_t +calc_acdc(MACROBLOCK * pMB, + uint32_t block, + int16_t qcoeff[64], + uint32_t iDcScaler, + int16_t predictors[8]) { - int16_t * pCurrent = pMB->pred_values[block]; + int16_t *pCurrent = pMB->pred_values[block]; uint32_t i; uint32_t S1 = 0, S2 = 0; @@ -298,7 +307,7 @@ /* store current coeffs to pred_values[] for future prediction */ pCurrent[0] = qcoeff[0] * iDcScaler; - for(i = 1; i < 8; i++) { + for (i = 1; i < 8; i++) { pCurrent[i] = qcoeff[i]; pCurrent[i + 7] = qcoeff[i * 8]; } @@ -307,9 +316,8 @@ qcoeff[0] = qcoeff[0] - predictors[0]; - if (pMB->acpred_directions[block] == 1) - { - for(i = 1; i < 8; i++) { + if (pMB->acpred_directions[block] == 1) { + for (i = 1; i < 8; i++) { int16_t level; level = qcoeff[i]; @@ -318,13 +326,12 @@ S1 += ABS(level); predictors[i] = level; } - } - else // acpred_direction == 2 + } else // acpred_direction == 2 { - for(i = 1; i < 8; i++) { + for (i = 1; i < 8; i++) { int16_t level; - level = qcoeff[i*8]; + level = qcoeff[i * 8]; S2 += ABS(level); level -= predictors[i]; S1 += ABS(level); @@ -333,42 +340,39 @@ } - + return S2 - S1; } /* apply predictors[] to qcoeff */ -void apply_acdc(MACROBLOCK *pMB, - uint32_t block, - int16_t qcoeff[64], - int16_t predictors[8]) +void +apply_acdc(MACROBLOCK * pMB, + uint32_t block, + int16_t qcoeff[64], + int16_t predictors[8]) { uint32_t i; - if (pMB->acpred_directions[block] == 1) - { - for(i = 1; i < 8; i++) - { + if (pMB->acpred_directions[block] == 1) { + for (i = 1; i < 8; i++) { qcoeff[i] = predictors[i]; } - } - else - { - for(i = 1; i < 8; i++) - { - qcoeff[i*8] = predictors[i]; + } else { + for (i = 1; i < 8; i++) { + qcoeff[i * 8] = predictors[i]; } } } -void MBPrediction(FRAMEINFO *frame, - uint32_t x, - uint32_t y, - uint32_t mb_width, - int16_t qcoeff[6*64]) +void +MBPrediction(FRAMEINFO * frame, + uint32_t x, + uint32_t y, + uint32_t mb_width, + int16_t qcoeff[6 * 64]) { int32_t j; @@ -379,44 +383,207 @@ MACROBLOCK *pMB = &frame->mbs[x + y * mb_width]; if ((pMB->mode == MODE_INTRA) || (pMB->mode == MODE_INTRA_Q)) { - - for(j = 0; j < 6; j++) - { + + for (j = 0; j < 6; j++) { iDcScaler = get_dc_scaler(iQuant, (j < 4) ? 1 : 0); - predict_acdc(frame->mbs, - x, - y, - mb_width, - j, - &qcoeff[j*64], - iQuant, - iDcScaler, - predictors[j]); - - S += calc_acdc(pMB, - j, - &qcoeff[j*64], - iDcScaler, - predictors[j]); + predict_acdc(frame->mbs, x, y, mb_width, j, &qcoeff[j * 64], + iQuant, iDcScaler, predictors[j], 0); + + S += calc_acdc(pMB, j, &qcoeff[j * 64], iDcScaler, predictors[j]); } - if (S < 0) // dont predict - { - for(j = 0; j < 6; j++) - { + if (S < 0) // dont predict + { + for (j = 0; j < 6; j++) { pMB->acpred_directions[j] = 0; } - } - else - { - for(j = 0; j < 6; j++) - { - apply_acdc(pMB, j, &qcoeff[j*64], predictors[j]); + } else { + for (j = 0; j < 6; j++) { + apply_acdc(pMB, j, &qcoeff[j * 64], predictors[j]); } } pMB->cbp = calc_cbp(qcoeff); } } + + + + +/* + get_pmvdata2: get_pmvdata with bounding +*/ +#define OFFSET(x,y,stride) ((x)+((y)*(stride))) + +int +get_pmvdata2(const MACROBLOCK * const pMBs, + const uint32_t x, + const uint32_t y, + const uint32_t x_dim, + const uint32_t block, + VECTOR * const pmv, + int32_t * const psad, + const int bound) +{ + const int mbpos = OFFSET(x, y ,x_dim); + + /* + * pmv are filled with: + * [0]: Median (or whatever is correct in a special case) + * [1]: left neighbour + * [2]: top neighbour + * [3]: topright neighbour + * psad are filled with: + * [0]: minimum of [1] to [3] + * [1]: left neighbour's SAD (NB:[1] to [3] are actually not needed) + * [2]: top neighbour's SAD + * [3]: topright neighbour's SAD + */ + + int xin1, xin2, xin3; + int yin1, yin2, yin3; + int vec1, vec2, vec3; + + int pos1, pos2, pos3; + int num_cand = 0; // number of candidates + int last_cand; // last candidate + + uint32_t index = x + y * x_dim; + const VECTOR zeroMV = { 0, 0 }; + + /* + * MODE_INTER, vm18 page 48 + * MODE_INTER4V vm18 page 51 + * + * (x,y-1) (x+1,y-1) + * [ | ] [ | ] + * [ 2 | 3 ] [ 2 | ] + * + * (x-1,y) (x,y) (x+1,y) + * [ | 1 ] [ 0 | 1 ] [ 0 | ] + * [ | 3 ] [ 2 | 3 ] [ | ] + */ + + switch (block) { + case 0: + xin1 = x - 1; + yin1 = y; + vec1 = 1; /* left */ + xin2 = x; + yin2 = y - 1; + vec2 = 2; /* top */ + xin3 = x + 1; + yin3 = y - 1; + vec3 = 2; /* top right */ + break; + case 1: + xin1 = x; + yin1 = y; + vec1 = 0; + xin2 = x; + yin2 = y - 1; + vec2 = 3; + xin3 = x + 1; + yin3 = y - 1; + vec3 = 2; + break; + case 2: + xin1 = x - 1; + yin1 = y; + vec1 = 3; + xin2 = x; + yin2 = y; + vec2 = 0; + xin3 = x; + yin3 = y; + vec3 = 1; + break; + default: + xin1 = x; + yin1 = y; + vec1 = 2; + xin2 = x; + yin2 = y; + vec2 = 0; + xin3 = x; + yin3 = y; + vec3 = 1; + } + + pos1 = OFFSET(xin1, yin1, x_dim); + pos2 = OFFSET(xin2, yin2, x_dim); + pos3 = OFFSET(xin3, yin3, x_dim); + + // left + if (xin1 < 0 || pos1 < bound) { + pmv[1] = zeroMV; + psad[1] = MV_MAX_ERROR; + } else { + pmv[1] = pMBs[xin1 + yin1 * x_dim].mvs[vec1]; + psad[1] = pMBs[xin1 + yin1 * x_dim].sad8[vec1]; + num_cand++; + last_cand = 1; + } + + // top + if (yin2 < 0 || pos2 < bound) { + pmv[2] = zeroMV; + psad[2] = MV_MAX_ERROR; + } else { + pmv[2] = pMBs[xin2 + yin2 * x_dim].mvs[vec2]; + psad[2] = pMBs[xin2 + yin2 * x_dim].sad8[vec2]; + num_cand++; + last_cand = 2; + } + + + // top right + if (yin3 < 0 || pos3 < bound || xin3 >= (int)x_dim) { + pmv[3] = zeroMV; + psad[3] = MV_MAX_ERROR; + //DPRINTF(DPRINTF_MV, "top-right"); + } else { + pmv[3] = pMBs[xin3 + yin3 * x_dim].mvs[vec3]; + psad[3] = pMBs[xin2 + yin2 * x_dim].sad8[vec3]; + num_cand++; + last_cand = 3; + } + + if (num_cand == 1) + { + /* DPRINTF(DPRINTF_MV,"cand0=(%i,%i), cand1=(%i,%i) cand2=(%i,%i) last=%i", + pmv[1].x, pmv[1].y, + pmv[2].x, pmv[2].y, + pmv[3].x, pmv[3].y, last_cand - 1); + */ + + pmv[0] = pmv[last_cand]; + psad[0] = psad[last_cand]; + return 0; + } + + /* DPRINTF(DPRINTF_MV,"cand0=(%i,%i), cand1=(%i,%i) cand2=(%i,%i)", + pmv[1].x, pmv[1].y, + pmv[2].x, pmv[2].y, + pmv[3].x, pmv[3].y);*/ + + if ((MVequal(pmv[1], pmv[2])) && (MVequal(pmv[1], pmv[3]))) { + pmv[0] = pmv[1]; + psad[0] = MIN(MIN(psad[1], psad[2]), psad[3]); + return 1; + } + + /* median,minimum */ + + pmv[0].x = + MIN(MAX(pmv[1].x, pmv[2].x), + MIN(MAX(pmv[2].x, pmv[3].x), MAX(pmv[1].x, pmv[3].x))); + pmv[0].y = + MIN(MAX(pmv[1].y, pmv[2].y), + MIN(MAX(pmv[2].y, pmv[3].y), MAX(pmv[1].y, pmv[3].y))); + psad[0] = MIN(MIN(psad[1], psad[2]), psad[3]); + + return 0; +}