--- trunk/xvidcore/src/bitstream/mbcoding.c 2002/03/15 09:20:03 28 +++ trunk/xvidcore/src/bitstream/mbcoding.c 2003/02/15 15:22:19 851 @@ -1,490 +1,1088 @@ + /****************************************************************************** + * * + * This file is part of XviD, a free MPEG-4 video encoder/decoder * + * * + * XviD is an implementation of a part of one or more MPEG-4 Video tools * + * as specified in ISO/IEC 14496-2 standard. Those intending to use this * + * software module in hardware or software products are advised that its * + * use may infringe existing patents or copyrights, and any such use * + * would be at such party's own risk. The original developer of this * + * software module and his/her company, and subsequent editors and their * + * companies, will have no liability for use of this software or * + * modifications or derivatives thereof. * + * * + * XviD is free software; you can redistribute it and/or modify it * + * under the terms of the GNU General Public License as published by * + * the Free Software Foundation; either version 2 of the License, or * + * (at your option) any later version. * + * * + * XviD is distributed in the hope that it will be useful, but * + * WITHOUT ANY WARRANTY; without even the implied warranty of * + * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the * + * GNU General Public License for more details. * + * * + * You should have received a copy of the GNU General Public License * + * along with this program; if not, write to the Free Software * + * Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA 02111-1307 USA * + * * + ******************************************************************************/ + + /****************************************************************************** + * * + * mbcoding.c * + * * + * Copyright (C) 2002 - Michael Militzer * + * * + * For more information visit the XviD homepage: http://www.xvid.org * + * * + ******************************************************************************/ + + /****************************************************************************** + * * + * Revision history: * + * * + * 28.10.2002 GMC support - gruel * + * 28.06.2002 added check_resync_marker() * + * 14.04.2002 bframe encoding * + * 08.03.2002 initial version; isibaar * + * * + ******************************************************************************/ + + +#include +#include #include "../portab.h" +#include "../global.h" #include "bitstream.h" #include "zigzag.h" #include "vlc_codes.h" +#include "mbcoding.h" #include "../utils/mbfunctions.h" -#include /* malloc, free */ +/* #define BIGLUT */ -#define ESCAPE 7167 -#define ABS(X) (((X)>0)?(X):-(X)) -#define CLIP(X,A) (X > A) ? (A) : (X) +#ifdef BIGLUT +#define LEVELOFFSET 2048 +#else +#define LEVELOFFSET 32 +#endif + +static REVERSE_EVENT DCT3D[2][4096]; + +#ifdef BIGLUT +static VLC coeff_VLC[2][2][4096][64]; +VLC *intra_table; +static VLC *inter_table; +#else +static VLC coeff_VLC[2][2][64][64]; +#endif -static VLC *DCT3D[2]; +/* not really MB related, but VLCs are only available here */ +void bs_put_spritetrajectory(Bitstream * bs, const int val) +{ + const int code = sprite_trajectory_code[val+16384].code; + const int len = sprite_trajectory_code[val+16384].len; + const int code2 = sprite_trajectory_len[len].code; + const int len2 = sprite_trajectory_len[len].len; -VLC *intra_table, *inter_table; -static short clip_table[4096]; +// printf("GMC=%d Code/Len = %d / %d ",val, code,len); +// printf("Code2 / Len2 = %d / %d \n",code2,len2); + + BitstreamPutBits(bs, code2, len2); + if (len) BitstreamPutBits(bs, code, len); +} -void create_vlc_tables(void) +int bs_get_spritetrajectory(Bitstream * bs) { - int32_t k, l, i, intra, last; - VLC *vlc[2]; - VLC **coeff_ptr; - VLC *vlc1, *vlc2; + int i; + for (i = 0; i < 12; i++) + { + if (BitstreamShowBits(bs, sprite_trajectory_len[i].len) == sprite_trajectory_len[i].code) + { + BitstreamSkip(bs, sprite_trajectory_len[i].len); + return i; + } + } + return -1; +} - VLC *DCT3Dintra; - VLC *DCT3Dinter; +void +init_vlc_tables(void) +{ + uint32_t i, j, k, intra, last, run, run_esc, level, level_esc, escape, escape_len, offset; + int32_t l; - DCT3Dintra = (VLC *) malloc(sizeof(VLC) * 4096); - DCT3Dinter = (VLC *) malloc(sizeof(VLC) * 4096); +#ifdef BIGLUT + intra_table = coeff_VLC[1]; + inter_table = coeff_VLC[0]; +#endif - vlc1 = DCT3Dintra; - vlc2 = DCT3Dinter; - - vlc[0] = intra_table = (VLC *) malloc(128 * 511 * sizeof(VLC)); - vlc[1] = inter_table = (VLC *) malloc(128 * 511 * sizeof(VLC)); - - // initialize the clipping table - for(i = -2048; i < 2048; i++) { - clip_table[i + 2048] = i; - if(i < -255) - clip_table[i + 2048] = -255; - if(i > 255) - clip_table[i + 2048] = 255; - } - - // generate intra/inter vlc lookup table - for(i = 0; i < 4; i++) { - intra = i % 2; - last = i >> 1; - coeff_ptr = coeff_vlc[last + (intra << 1)]; - - for(k = -255; k < 256; k++) { // level - char *max_level_ptr = max_level[last + (intra << 1)]; - char *max_run_ptr = max_run[last + (intra << 1)]; - - for(l = 0; l < 64; l++) { // run - int32_t level = k, run = l; - - if(abs(level) <= max_level_ptr[run] && run <= max_run_ptr[abs(level)]) { + for (intra = 0; intra < 2; intra++) + for (i = 0; i < 4096; i++) + DCT3D[intra][i].event.level = 0; - if(level > 0) { - vlc[intra]->code = (coeff_ptr[run][level - 1].code) << 1; - vlc[intra]->len = coeff_ptr[run][level - 1].len + 1; - } - else if(level < 0) { - vlc[intra]->code = ((coeff_ptr[run][-level - 1].code) << 1) + 1; - vlc[intra]->len = coeff_ptr[run][-level - 1].len + 1; - } - else { - vlc[intra]->code = 0; - vlc[intra]->len = 0; + for (intra = 0; intra < 2; intra++) + for (last = 0; last < 2; last++) + { + for (run = 0; run < 63 + last; run++) + for (level = 0; level < (uint32_t)(32 << intra); level++) + { +#ifdef BIGLUT + offset = LEVELOFFSET; +#else + offset = !intra * LEVELOFFSET; +#endif + coeff_VLC[intra][last][level + offset][run].len = 128; + } + } + + for (intra = 0; intra < 2; intra++) + for (i = 0; i < 102; i++) + { +#ifdef BIGLUT + offset = LEVELOFFSET; +#else + offset = !intra * LEVELOFFSET; +#endif + for (j = 0; j < (uint32_t)(1 << (12 - coeff_tab[intra][i].vlc.len)); j++) + { + DCT3D[intra][(coeff_tab[intra][i].vlc.code << (12 - coeff_tab[intra][i].vlc.len)) | j].len = coeff_tab[intra][i].vlc.len; + DCT3D[intra][(coeff_tab[intra][i].vlc.code << (12 - coeff_tab[intra][i].vlc.len)) | j].event = coeff_tab[intra][i].event; + } + + coeff_VLC[intra][coeff_tab[intra][i].event.last][coeff_tab[intra][i].event.level + offset][coeff_tab[intra][i].event.run].code + = coeff_tab[intra][i].vlc.code << 1; + coeff_VLC[intra][coeff_tab[intra][i].event.last][coeff_tab[intra][i].event.level + offset][coeff_tab[intra][i].event.run].len + = coeff_tab[intra][i].vlc.len + 1; +#ifndef BIGLUT + if (!intra) +#endif + { + coeff_VLC[intra][coeff_tab[intra][i].event.last][offset - coeff_tab[intra][i].event.level][coeff_tab[intra][i].event.run].code + = (coeff_tab[intra][i].vlc.code << 1) | 1; + coeff_VLC[intra][coeff_tab[intra][i].event.last][offset - coeff_tab[intra][i].event.level][coeff_tab[intra][i].event.run].len + = coeff_tab[intra][i].vlc.len + 1; + } + } + + for (intra = 0; intra < 2; intra++) + for (last = 0; last < 2; last++) + for (run = 0; run < 63 + last; run++) + { + for (level = 1; level < (uint32_t)(32 << intra); level++) + { + if (level <= max_level[intra][last][run] && run <= max_run[intra][last][level]) + continue; + +#ifdef BIGLUT + offset = LEVELOFFSET; +#else + offset = !intra * LEVELOFFSET; +#endif + level_esc = level - max_level[intra][last][run]; + run_esc = run - 1 - max_run[intra][last][level]; + /*use this test to use shorter esc2 codes when possible + if (level_esc <= max_level[intra][last][run] && run <= max_run[intra][last][level_esc] + && !(coeff_VLC[intra][last][level_esc + offset][run].len + 7 + 1 + > coeff_VLC[intra][last][level + offset][run_esc].code + 7 + 2))*/ + + if (level_esc <= max_level[intra][last][run] && run <= max_run[intra][last][level_esc]) + { + escape = ESCAPE1; + escape_len = 7 + 1; + run_esc = run; } - } else { - if(level > 0) - level -= max_level_ptr[run]; else - level += max_level_ptr[run]; - - if(abs(level) <= max_level_ptr[run] && - run <= max_run_ptr[abs(level)]) { - - if(level > 0) { - vlc[intra]->code = (0x06 << (coeff_ptr[run][level - 1].len + 1)) | - (coeff_ptr[run][level - 1].code << 1); - vlc[intra]->len = (coeff_ptr[run][level - 1].len + 1) + 8; - } - else if(level < 0) { - vlc[intra]->code = (0x06 << (coeff_ptr[run][-level - 1].len + 1)) | - ((coeff_ptr[run][-level - 1].code << 1) + 1); - vlc[intra]->len = (coeff_ptr[run][-level - 1].len + 1) + 8; - } - else { - vlc[intra]->code = 0x06; - vlc[intra]->len = 8; + { + if (run_esc <= max_run[intra][last][level] && level <= max_level[intra][last][run_esc]) + { + escape = ESCAPE2; + escape_len = 7 + 2; + level_esc = level; } - } else { - if(level > 0) - level += max_level_ptr[run]; else - level -= max_level_ptr[run]; - DEBUG1("1) run:", run); - run -= max_run_ptr[abs(level)] + 1; - DEBUG1("2) run:", run); - - if(abs(level) <= max_level_ptr[run] && - run <= max_run_ptr[abs(level)]) { - - if(level > 0) { - vlc[intra]->code = (0x0e << (coeff_ptr[run][level - 1].len + 1)) | - (coeff_ptr[run][level - 1].code << 1); - vlc[intra]->len = (coeff_ptr[run][level - 1].len + 1) + 9; - } - else if(level < 0) { - vlc[intra]->code = (0x0e << (coeff_ptr[run][-level - 1].len + 1)) | - ((coeff_ptr[run][-level - 1].code << 1) + 1); - vlc[intra]->len = (coeff_ptr[run][-level - 1].len + 1) + 9; - } - else { - vlc[intra]->code = 0x0e; - vlc[intra]->len = 9; + { +#ifndef BIGLUT + if (!intra) +#endif + { + coeff_VLC[intra][last][level + offset][run].code + = (ESCAPE3 << 21) | (last << 20) | (run << 14) | (1 << 13) | ((level & 0xfff) << 1) | 1; + coeff_VLC[intra][last][level + offset][run].len = 30; + coeff_VLC[intra][last][offset - level][run].code + = (ESCAPE3 << 21) | (last << 20) | (run << 14) | (1 << 13) | ((-level & 0xfff) << 1) | 1; + coeff_VLC[intra][last][offset - level][run].len = 30; } - } else { - if(level != 0) - run += max_run_ptr[abs(level)] + 1; - else - run++; - - DEBUG1("3) run:", run); - - vlc[intra]->code = (uint32_t) ((0x1e + last) << 20) | - (l << 14) | (1 << 13) | ((k & 0xfff) << 1) | 1; - - vlc[intra]->len = 30; + continue; } } - } - vlc[intra]++; - } - } - } - intra_table += 64*255; // center vlc tables - inter_table += 64*255; // center vlc tables - for(i = 0; i < 4096; i++) { - if(i >= 512) { - *vlc1 = DCT3Dtab3[(i >> 5) - 16]; - *vlc2 = DCT3Dtab0[(i >> 5) - 16]; - } - else if(i >= 128) { - *vlc1 = DCT3Dtab4[(i >> 2) - 32]; - *vlc2 = DCT3Dtab1[(i >> 2) - 32]; - } - else if(i >= 8) { - *vlc1 = DCT3Dtab5[i - 8]; - *vlc2 = DCT3Dtab2[i - 8]; - } - else { - *vlc1 = ERRtab[i]; - *vlc2 = ERRtab[i]; - } - - vlc1++; - vlc2++; - } - DCT3D[0] = DCT3Dinter; - DCT3D[1] = DCT3Dintra; - -} + coeff_VLC[intra][last][level + offset][run].code + = (escape << coeff_VLC[intra][last][level_esc + offset][run_esc].len) + | coeff_VLC[intra][last][level_esc + offset][run_esc].code; + coeff_VLC[intra][last][level + offset][run].len + = coeff_VLC[intra][last][level_esc + offset][run_esc].len + escape_len; +#ifndef BIGLUT + if (!intra) +#endif + { + coeff_VLC[intra][last][offset - level][run].code + = (escape << coeff_VLC[intra][last][level_esc + offset][run_esc].len) + | coeff_VLC[intra][last][level_esc + offset][run_esc].code | 1; + coeff_VLC[intra][last][offset - level][run].len + = coeff_VLC[intra][last][level_esc + offset][run_esc].len + escape_len; + } + } -void destroy_vlc_tables(void) { +#ifdef BIGLUT + for (level = 32 << intra; level < 2048; level++) + { + coeff_VLC[intra][last][level + offset][run].code + = (ESCAPE3 << 21) | (last << 20) | (run << 14) | (1 << 13) | ((level & 0xfff) << 1) | 1; + coeff_VLC[intra][last][level + offset][run].len = 30; + + coeff_VLC[intra][last][offset - level][run].code + = (ESCAPE3 << 21) | (last << 20) | (run << 14) | (1 << 13) | ((-level & 0xfff) << 1) | 1; + coeff_VLC[intra][last][offset - level][run].len = 30; + } +#else + if (!intra) + { + coeff_VLC[intra][last][0][run].code + = (ESCAPE3 << 21) | (last << 20) | (run << 14) | (1 << 13) | ((-32 & 0xfff) << 1) | 1; + coeff_VLC[intra][last][0][run].len = 30; + } +#endif + } +/* init sprite_trajectory tables */ +/* even if GMC is not specified (it might be used later...) */ - if(intra_table != NULL && inter_table != NULL) { - intra_table -= 64*255; // uncenter vlc tables - inter_table -= 64*255; // uncenter vlc tables + sprite_trajectory_code[0+16384].code = 0; + sprite_trajectory_code[0+16384].len = 0; + for (k=0;k<14;k++) + { + int limit = (1< (cmp - 1)) + + if (value > (cmp - 1)) value -= 64 * scale_factor; - pStat->iMvSum += value * value; - pStat->iMvCount++; + pStat->iMvSum += value * value; + pStat->iMvCount++; - if (value == 0) - BitstreamPutBits(bs, mb_motion_table[32].code, mb_motion_table[32].len); - else { + if (value == 0) { + BitstreamPutBits(bs, mb_motion_table[32].code, + mb_motion_table[32].len); + } else { uint16_t length, code, mv_res, sign; - + length = 16 << f_code; f_code--; - + sign = (value < 0); - if(value >= length) + if (value >= length) value -= 2 * length; - else if(value < -length) + else if (value < -length) value += 2 * length; - if(sign) + if (sign) value = -value; value--; mv_res = value & ((1 << f_code) - 1); code = ((value - mv_res) >> f_code) + 1; - if(sign) + if (sign) code = -code; code += 32; - BitstreamPutBits(bs, mb_motion_table[code].code, mb_motion_table[code].len); - - if(f_code) + BitstreamPutBits(bs, mb_motion_table[code].code, + mb_motion_table[code].len); + + if (f_code) BitstreamPutBits(bs, mv_res, f_code); - } + } + } +#ifdef BIGLUT + +static __inline void +CodeCoeff(Bitstream * bs, + const int16_t qcoeff[64], + VLC * table, + const uint16_t * zigzag, + uint16_t intra) +{ -static __inline void CodeCoeff(Bitstream *bs, int16_t qcoeff[64], VLC *table, - const uint16_t *zigzag, uint16_t intra) { uint32_t j, last; short v; VLC *vlc; - + j = intra; - last = 1 + intra; + last = intra; + + while (j < 64 && (v = qcoeff[zigzag[j]]) == 0) + j++; - while((v = qcoeff[zigzag[j++]]) == 0); - do { - // count zeroes - vlc = table + (clip_table[2048+v] << 6) + j - last; - last = j + 1; - while(j < 64 && (v = qcoeff[zigzag[j++]]) == 0); - - // write code - if(j != 64) { + vlc = table + 64 * 2048 + (v << 6) + j - last; + last = ++j; + + /* count zeroes */ + while (j < 64 && (v = qcoeff[zigzag[j]]) == 0) + j++; + + /* write code */ + if (j != 64) { BitstreamPutBits(bs, vlc->code, vlc->len); } else { - vlc += 64*511; + vlc += 64 * 4096; BitstreamPutBits(bs, vlc->code, vlc->len); break; } - } while(1); + } while (1); + } -static void CodeBlockIntra(const MBParam * pParam, const MACROBLOCK *pMB, - int16_t qcoeff[][64], Bitstream * bs, Statistics * pStat) + +/* returns the number of bits required to encode qcoeff */ +int +CodeCoeff_CalcBits(const int16_t qcoeff[64], + VLC * table, + const uint16_t * zigzag, + uint16_t intra) { + int bits = 0; + uint32_t j, last; + short v; + VLC *vlc; + + j = intra; + last = intra; + + while (j < 64 && (v = qcoeff[zigzag[j]]) == 0) + j++; + + if (j >= 64) return 0; /* empty block */ + + do { + vlc = table + 64 * 2048 + (v << 6) + j - last; + last = ++j; + + /* count zeroes */ + while (j < 64 && (v = qcoeff[zigzag[j]]) == 0) + j++; + + /* write code */ + if (j != 64) { + bits += vlc->len; + } else { + vlc += 64 * 4096; + bits += vlc->len; + break; + } + } while (1); + + return bits; +} + + +#else + +static __inline void +CodeCoeffInter(Bitstream * bs, + const int16_t qcoeff[64], + const uint16_t * zigzag) +{ + uint32_t i, run, prev_run, code, len; + int32_t level, prev_level, level_shifted; + + i = 0; + run = 0; + + while (!(level = qcoeff[zigzag[i++]])) + run++; + + prev_level = level; + prev_run = run; + run = 0; + + while (i < 64) + { + if ((level = qcoeff[zigzag[i++]]) != 0) + { + level_shifted = prev_level + 32; + if (!(level_shifted & -64)) + { + code = coeff_VLC[0][0][level_shifted][prev_run].code; + len = coeff_VLC[0][0][level_shifted][prev_run].len; + } + else + { + code = (ESCAPE3 << 21) | (prev_run << 14) | (1 << 13) | ((prev_level & 0xfff) << 1) | 1; + len = 30; + } + BitstreamPutBits(bs, code, len); + prev_level = level; + prev_run = run; + run = 0; + } + else + run++; + } + + level_shifted = prev_level + 32; + if (!(level_shifted & -64)) + { + code = coeff_VLC[0][1][level_shifted][prev_run].code; + len = coeff_VLC[0][1][level_shifted][prev_run].len; + } + else + { + code = (ESCAPE3 << 21) | (1 << 20) | (prev_run << 14) | (1 << 13) | ((prev_level & 0xfff) << 1) | 1; + len = 30; + } + BitstreamPutBits(bs, code, len); +} + +static __inline void +CodeCoeffIntra(Bitstream * bs, + const int16_t qcoeff[64], + const uint16_t * zigzag) +{ + uint32_t i, abs_level, run, prev_run, code, len; + int32_t level, prev_level; + + i = 1; + run = 0; + + while (i<64 && !(level = qcoeff[zigzag[i++]])) + run++; + + prev_level = level; + prev_run = run; + run = 0; + + while (i < 64) + { + if ((level = qcoeff[zigzag[i++]]) != 0) + { + abs_level = ABS(prev_level); + abs_level = abs_level < 64 ? abs_level : 0; + code = coeff_VLC[1][0][abs_level][prev_run].code; + len = coeff_VLC[1][0][abs_level][prev_run].len; + if (len != 128) + code |= (prev_level < 0); + else + { + code = (ESCAPE3 << 21) | (prev_run << 14) | (1 << 13) | ((prev_level & 0xfff) << 1) | 1; + len = 30; + } + BitstreamPutBits(bs, code, len); + prev_level = level; + prev_run = run; + run = 0; + } + else + run++; + } + + abs_level = ABS(prev_level); + abs_level = abs_level < 64 ? abs_level : 0; + code = coeff_VLC[1][1][abs_level][prev_run].code; + len = coeff_VLC[1][1][abs_level][prev_run].len; + if (len != 128) + code |= (prev_level < 0); + else + { + code = (ESCAPE3 << 21) | (1 << 20) | (prev_run << 14) | (1 << 13) | ((prev_level & 0xfff) << 1) | 1; + len = 30; + } + BitstreamPutBits(bs, code, len); +} + + + +/* returns the number of bits required to encode qcoeff */ + +int +CodeCoeffIntra_CalcBits(const int16_t qcoeff[64], const uint16_t * zigzag) +{ + int bits = 0; + uint32_t i, abs_level, run, prev_run, len; + int32_t level, prev_level; + + i = 1; + run = 0; + + while (i<64 && !(level = qcoeff[zigzag[i++]])) + run++; + + if (i >= 64) return 0; /* empty block */ + + prev_level = level; + prev_run = run; + run = 0; + + while (i < 64) + { + if ((level = qcoeff[zigzag[i++]]) != 0) + { + abs_level = ABS(prev_level); + abs_level = abs_level < 64 ? abs_level : 0; + len = coeff_VLC[1][0][abs_level][prev_run].len; + bits += len!=128 ? len : 30; + + prev_level = level; + prev_run = run; + run = 0; + } + else + run++; + } + + abs_level = ABS(prev_level); + abs_level = abs_level < 64 ? abs_level : 0; + len = coeff_VLC[1][1][abs_level][prev_run].len; + bits += len!=128 ? len : 30; + + return bits; +} + +int +CodeCoeffInter_CalcBits(const int16_t qcoeff[64], const uint16_t * zigzag) +{ + uint32_t i, run, prev_run, len; + int32_t level, prev_level, level_shifted; + int bits = 0; + + i = 0; + run = 0; + + while (!(level = qcoeff[zigzag[i++]])) + run++; + + prev_level = level; + prev_run = run; + run = 0; + + while (i < 64) { + if ((level = qcoeff[zigzag[i++]]) != 0) { + level_shifted = prev_level + 32; + if (!(level_shifted & -64)) + len = coeff_VLC[0][0][level_shifted][prev_run].len; + else + len = 30; + + bits += len; + prev_level = level; + prev_run = run; + run = 0; + } + else + run++; + } + + level_shifted = prev_level + 32; + if (!(level_shifted & -64)) + len = coeff_VLC[0][1][level_shifted][prev_run].len; + else + len = 30; + bits += len; + + return bits; +} + + +#endif + +static __inline void +CodeBlockIntra(const FRAMEINFO * const frame, + const MACROBLOCK * pMB, + int16_t qcoeff[6 * 64], + Bitstream * bs, + Statistics * pStat) +{ + uint32_t i, mcbpc, cbpy, bits; cbpy = pMB->cbp >> 2; - // write mcbpc - if(pParam->coding_type == I_VOP) { - mcbpc = ((pMB->mode >> 1) & 3) | ((pMB->cbp & 3) << 2); - BitstreamPutBits(bs, mcbpc_intra_tab[mcbpc].code, mcbpc_intra_tab[mcbpc].len); - } - else { - mcbpc = (pMB->mode & 7) | ((pMB->cbp & 3) << 3); - BitstreamPutBits(bs, mcbpc_inter_tab[mcbpc].code, mcbpc_inter_tab[mcbpc].len); + // write mcbpc + if (frame->coding_type == I_VOP) { + mcbpc = ((pMB->mode >> 1) & 3) | ((pMB->cbp & 3) << 2); + BitstreamPutBits(bs, mcbpc_intra_tab[mcbpc].code, + mcbpc_intra_tab[mcbpc].len); + } else { + mcbpc = (pMB->mode & 7) | ((pMB->cbp & 3) << 3); + BitstreamPutBits(bs, mcbpc_inter_tab[mcbpc].code, + mcbpc_inter_tab[mcbpc].len); } // ac prediction flag - if(pMB->acpred_directions[0]) - BitstreamPutBits(bs, 1, 1); + if (pMB->acpred_directions[0]) + BitstreamPutBits(bs, 1, 1); else - BitstreamPutBits(bs, 0, 1); + BitstreamPutBits(bs, 0, 1); - // write cbpy - BitstreamPutBits (bs, cbpy_tab[cbpy].code, cbpy_tab[cbpy].len); + // write cbpy + BitstreamPutBits(bs, cbpy_tab[cbpy].code, cbpy_tab[cbpy].len); // write dquant - if(pMB->mode == MODE_INTRA_Q) + if (pMB->mode == MODE_INTRA_Q) BitstreamPutBits(bs, pMB->dquant, 2); + // write interlacing + if (frame->global_flags & XVID_INTERLACING) { + BitstreamPutBit(bs, pMB->field_dct); + } // code block coeffs - for(i = 0; i < 6; i++) - { - if(i < 4) - BitstreamPutBits(bs, dcy_tab[qcoeff[i][0] + 255].code, - dcy_tab[qcoeff[i][0] + 255].len); + for (i = 0; i < 6; i++) { + if (i < 4) + BitstreamPutBits(bs, dcy_tab[qcoeff[i * 64 + 0] + 255].code, + dcy_tab[qcoeff[i * 64 + 0] + 255].len); else - BitstreamPutBits(bs, dcc_tab[qcoeff[i][0] + 255].code, - dcc_tab[qcoeff[i][0] + 255].len); - - if(pMB->cbp & (1 << (5 - i))) - { + BitstreamPutBits(bs, dcc_tab[qcoeff[i * 64 + 0] + 255].code, + dcc_tab[qcoeff[i * 64 + 0] + 255].len); + + if (pMB->cbp & (1 << (5 - i))) { + const uint16_t *scan_table = + frame->global_flags & XVID_ALTERNATESCAN ? + scan_tables[2] : scan_tables[pMB->acpred_directions[i]]; + bits = BitstreamPos(bs); - CodeCoeff(bs, qcoeff[i], intra_table, scan_tables[pMB->acpred_directions[i]], 1); +#ifdef BIGLUT + CodeCoeff(bs, &qcoeff[i * 64], intra_table, scan_table, 1); +#else + CodeCoeffIntra(bs, &qcoeff[i * 64], scan_table); +#endif bits = BitstreamPos(bs) - bits; pStat->iTextBits += bits; } } + } -static void CodeBlockInter(const MBParam * pParam, const MACROBLOCK *pMB, - int16_t qcoeff[][64], Bitstream * bs, Statistics * pStat) +static void +CodeBlockInter(const FRAMEINFO * const frame, + const MACROBLOCK * pMB, + int16_t qcoeff[6 * 64], + Bitstream * bs, + Statistics * pStat) { + int32_t i; uint32_t bits, mcbpc, cbpy; - mcbpc = (pMB->mode & 7) | ((pMB->cbp & 3) << 3); + mcbpc = (pMB->mode & 7) | ((pMB->cbp & 3) << 3); cbpy = 15 - (pMB->cbp >> 2); // write mcbpc - BitstreamPutBits(bs, mcbpc_inter_tab[mcbpc].code, mcbpc_inter_tab[mcbpc].len); + BitstreamPutBits(bs, mcbpc_inter_tab[mcbpc].code, + mcbpc_inter_tab[mcbpc].len); + + if ( (frame->coding_type == S_VOP) && (pMB->mode == MODE_INTER || pMB->mode == MODE_INTER_Q) ) + BitstreamPutBit(bs, pMB->mcsel); // mcsel: '0'=local motion, '1'=GMC // write cbpy BitstreamPutBits(bs, cbpy_tab[cbpy].code, cbpy_tab[cbpy].len); // write dquant - if(pMB->mode == MODE_INTER_Q) + if (pMB->mode == MODE_INTER_Q) BitstreamPutBits(bs, pMB->dquant, 2); - - // code motion vector(s) - for(i = 0; i < (pMB->mode == MODE_INTER4V ? 4 : 1); i++) - { - CodeVector(bs, pMB->pmvs[i].x, pParam->fixed_code, pStat); - CodeVector(bs, pMB->pmvs[i].y, pParam->fixed_code, pStat); + + // interlacing + if (frame->global_flags & XVID_INTERLACING) { + if (pMB->cbp) { + BitstreamPutBit(bs, pMB->field_dct); + DPRINTF(DPRINTF_MB,"codep: field_dct: %i", pMB->field_dct); + } + + // if inter block, write field ME flag + if (pMB->mode == MODE_INTER || pMB->mode == MODE_INTER_Q) { + BitstreamPutBit(bs, pMB->field_pred); + DPRINTF(DPRINTF_MB,"codep: field_pred: %i", pMB->field_pred); + + // write field prediction references + if (pMB->field_pred) { + BitstreamPutBit(bs, pMB->field_for_top); + BitstreamPutBit(bs, pMB->field_for_bot); + } + } } + // code motion vector(s) if motion is local + if (!pMB->mcsel) + for (i = 0; i < (pMB->mode == MODE_INTER4V ? 4 : 1); i++) { + CodeVector(bs, pMB->pmvs[i].x, frame->fcode, pStat); + CodeVector(bs, pMB->pmvs[i].y, frame->fcode, pStat); + } bits = BitstreamPos(bs); - + // code block coeffs - for(i = 0; i < 6; i++) - if(pMB->cbp & (1 << (5 - i))) - CodeCoeff(bs, qcoeff[i], inter_table, scan_tables[0], 0); + for (i = 0; i < 6; i++) + if (pMB->cbp & (1 << (5 - i))) + { + const uint16_t *scan_table = + frame->global_flags & XVID_ALTERNATESCAN ? + scan_tables[2] : scan_tables[0]; + +#ifdef BIGLUT + CodeCoeff(bs, &qcoeff[i * 64], inter_table, scan_table, 0); +#else + CodeCoeffInter(bs, &qcoeff[i * 64], scan_table); +#endif + } bits = BitstreamPos(bs) - bits; pStat->iTextBits += bits; } -void MBCoding(const MBParam * pParam, MACROBLOCK *pMB, - int16_t qcoeff[][64], - Bitstream * bs, Statistics * pStat) -{ - int intra = (pMB->mode == MODE_INTRA || pMB->mode == MODE_INTRA_Q); - - if(pParam->coding_type == P_VOP) { - if(pMB->cbp == 0 && pMB->mode == MODE_INTER && - pMB->mvs[0].x == 0 && pMB->mvs[0].y == 0) - { - BitstreamPutBit(bs, 1); // not_coded - return; - } - else - BitstreamPutBit(bs, 0); // coded +void +MBCoding(const FRAMEINFO * const frame, + MACROBLOCK * pMB, + int16_t qcoeff[6 * 64], + Bitstream * bs, + Statistics * pStat) +{ + if (frame->coding_type != I_VOP) + BitstreamPutBit(bs, 0); // not_coded + + if (pMB->mode == MODE_INTRA || pMB->mode == MODE_INTRA_Q) + CodeBlockIntra(frame, pMB, qcoeff, bs, pStat); + else + CodeBlockInter(frame, pMB, qcoeff, bs, pStat); + +} + +/* +// moved to mbcoding.h so that in can be 'static __inline' +void +MBSkip(Bitstream * bs) +{ + BitstreamPutBit(bs, 1); // not coded +} +*/ + +/*************************************************************** + * bframe encoding start + ***************************************************************/ + +/* + mbtype + 0 1b direct(h263) mvdb + 1 01b interpolate mc+q dbquant, mvdf, mvdb + 2 001b backward mc+q dbquant, mvdb + 3 0001b forward mc+q dbquant, mvdf +*/ + +static __inline void +put_bvop_mbtype(Bitstream * bs, + int value) +{ + switch (value) { + case MODE_FORWARD: + BitstreamPutBit(bs, 0); + case MODE_BACKWARD: + BitstreamPutBit(bs, 0); + case MODE_INTERPOLATE: + BitstreamPutBit(bs, 0); + case MODE_DIRECT: + BitstreamPutBit(bs, 1); + default: + break; } +} - if(intra) - CodeBlockIntra(pParam, pMB, qcoeff, bs, pStat); - else - CodeBlockInter(pParam, pMB, qcoeff, bs, pStat); +/* + dbquant + -2 10b + 0 0b + +2 11b +*/ + +static __inline void +put_bvop_dbquant(Bitstream * bs, + int value) +{ + switch (value) { + case 0: + BitstreamPutBit(bs, 0); + return; + + case -2: + BitstreamPutBit(bs, 1); + BitstreamPutBit(bs, 0); + return; + + case 2: + BitstreamPutBit(bs, 1); + BitstreamPutBit(bs, 1); + return; + + default:; // invalid + } } + +void +MBCodingBVOP(const MACROBLOCK * mb, + const int16_t qcoeff[6 * 64], + const int32_t fcode, + const int32_t bcode, + Bitstream * bs, + Statistics * pStat, + int direction) +{ + int vcode = fcode; + unsigned int i; + +/* ------------------------------------------------------------------ + when a block is skipped it is decoded DIRECT(0,0) + hence is interpolated from forward & backward frames + ------------------------------------------------------------------ */ + + if (mb->mode == MODE_DIRECT_NONE_MV) { + BitstreamPutBit(bs, 1); // skipped + return; + } + + BitstreamPutBit(bs, 0); // not skipped + + if (mb->cbp == 0) { + BitstreamPutBit(bs, 1); // cbp == 0 + } else { + BitstreamPutBit(bs, 0); // cbp == xxx + } + + put_bvop_mbtype(bs, mb->mode); + + if (mb->cbp) { + BitstreamPutBits(bs, mb->cbp, 6); + } + + if (mb->mode != MODE_DIRECT && mb->cbp != 0) { + put_bvop_dbquant(bs, 0); // todo: mb->dquant = 0 + } + + switch (mb->mode) { + case MODE_INTERPOLATE: + CodeVector(bs, mb->pmvs[1].x, vcode, pStat); //forward vector of interpolate mode + CodeVector(bs, mb->pmvs[1].y, vcode, pStat); + case MODE_BACKWARD: + vcode = bcode; + case MODE_FORWARD: + CodeVector(bs, mb->pmvs[0].x, vcode, pStat); + CodeVector(bs, mb->pmvs[0].y, vcode, pStat); + break; + case MODE_DIRECT: + CodeVector(bs, mb->pmvs[3].x, 1, pStat); // fcode is always 1 for delta vector + CodeVector(bs, mb->pmvs[3].y, 1, pStat); // prediction is always (0,0) + default: break; + } + + for (i = 0; i < 6; i++) { + if (mb->cbp & (1 << (5 - i))) { +#ifdef BIGLUT + CodeCoeff(bs, &qcoeff[i * 64], inter_table, scan_tables[0], 0); +#else + CodeCoeffInter(bs, &qcoeff[i * 64], scan_tables[0]); +#endif + } + } +} + + + /*************************************************************** * decoding stuff starts here * ***************************************************************/ -int get_mcbpc_intra(Bitstream * bs) + +// for IVOP addbits == 0 +// for PVOP addbits == fcode - 1 +// for BVOP addbits == max(fcode,bcode) - 1 +// returns true or false +int +check_resync_marker(Bitstream * bs, int addbits) +{ + uint32_t nbits; + uint32_t code; + uint32_t nbitsresyncmarker = NUMBITS_VP_RESYNC_MARKER + addbits; + + nbits = BitstreamNumBitsToByteAlign(bs); + code = BitstreamShowBits(bs, nbits); + + if (code == (((uint32_t)1 << (nbits - 1)) - 1)) + { + return BitstreamShowBitsFromByteAlign(bs, nbitsresyncmarker) == RESYNC_MARKER; + } + + return 0; +} + + + +int +get_mcbpc_intra(Bitstream * bs) { + uint32_t index; - - while((index = BitstreamShowBits(bs, 9)) == 1) - BitstreamSkip(bs, 9); + index = BitstreamShowBits(bs, 9); index >>= 3; BitstreamSkip(bs, mcbpc_intra_table[index].len); + return mcbpc_intra_table[index].code; + } -int get_mcbpc_inter(Bitstream * bs) +int +get_mcbpc_inter(Bitstream * bs) { + uint32_t index; - while((index = CLIP(BitstreamShowBits(bs, 9), 256)) == 1) - BitstreamSkip(bs, 9); + index = MIN(BitstreamShowBits(bs, 9), 256); + + BitstreamSkip(bs, mcbpc_inter_table[index].len); - BitstreamSkip(bs, mcbpc_inter_table[index].len); return mcbpc_inter_table[index].code; + } -int get_cbpy(Bitstream * bs, int intra) +int +get_cbpy(Bitstream * bs, + int intra) { + int cbpy; uint32_t index = BitstreamShowBits(bs, 6); BitstreamSkip(bs, cbpy_table[index].len); cbpy = cbpy_table[index].code; - if(!intra) + if (!intra) cbpy = 15 - cbpy; return cbpy; + } -int get_mv_data(Bitstream * bs) +static __inline int +get_mv_data(Bitstream * bs) { + uint32_t index; - if(BitstreamGetBit(bs)) + if (BitstreamGetBit(bs)) return 0; - + index = BitstreamShowBits(bs, 12); - if(index >= 512) - { + if (index >= 512) { index = (index >> 8) - 2; BitstreamSkip(bs, TMNMVtab0[index].len); return TMNMVtab0[index].code; } - - if(index >= 128) - { + + if (index >= 128) { index = (index >> 2) - 32; BitstreamSkip(bs, TMNMVtab1[index].len); return TMNMVtab1[index].code; } - index -= 4; + index -= 4; BitstreamSkip(bs, TMNMVtab2[index].len); return TMNMVtab2[index].code; + } -int get_mv(Bitstream * bs, int fcode) +int +get_mv(Bitstream * bs, + int fcode) { + int data; int res; int mv; int scale_fac = 1 << (fcode - 1); data = get_mv_data(bs); - - if(scale_fac == 1 || data == 0) + + if (scale_fac == 1 || data == 0) return data; res = BitstreamGetBits(bs, fcode - 1); mv = ((ABS(data) - 1) * scale_fac) + res + 1; - + return data < 0 ? -mv : mv; + } -int get_dc_dif(Bitstream * bs, uint32_t dc_size) +int +get_dc_dif(Bitstream * bs, + uint32_t dc_size) { + int code = BitstreamGetBits(bs, dc_size); int msb = code >> (dc_size - 1); - if(msb == 0) - return (-1 * (code^((1 << dc_size) - 1))); + if (msb == 0) + return (-1 * (code ^ ((1 << dc_size) - 1))); return code; + } -int get_dc_size_lum(Bitstream * bs) +int +get_dc_size_lum(Bitstream * bs) { + int code, i; + code = BitstreamShowBits(bs, 11); - for(i = 11; i > 3; i--) { - if(code == 1) { + for (i = 11; i > 3; i--) { + if (code == 1) { BitstreamSkip(bs, i); return i + 1; } @@ -493,16 +1091,20 @@ BitstreamSkip(bs, dc_lum_tab[code].len); return dc_lum_tab[code].code; + } -int get_dc_size_chrom(Bitstream * bs) +int +get_dc_size_chrom(Bitstream * bs) { + uint32_t code, i; + code = BitstreamShowBits(bs, 12); - for(i = 12; i > 2; i--) { - if(code == 1) { + for (i = 12; i > 2; i--) { + if (code == 1) { BitstreamSkip(bs, i); return i; } @@ -510,148 +1112,150 @@ } return 3 - BitstreamGetBits(bs, 2); + } -int get_coeff(Bitstream * bs, int *run, int *last, int intra, int short_video_header) +static __inline int +get_coeff(Bitstream * bs, + int *run, + int *last, + int intra, + int short_video_header) { - uint32_t mode; - const VLC *tab; + + uint32_t mode; int32_t level; + REVERSE_EVENT *reverse_event; - if(short_video_header) // inter-VLCs will be used for both intra and inter blocks + if (short_video_header) /* inter-VLCs will be used for both intra and inter blocks */ intra = 0; - - tab = &DCT3D[intra][BitstreamShowBits(bs, 12)]; - - if(tab->code == -1) - goto error; - BitstreamSkip(bs, tab->len); + if (BitstreamShowBits(bs, 7) != ESCAPE) { + reverse_event = &DCT3D[intra][BitstreamShowBits(bs, 12)]; - if(tab->code != ESCAPE) { - if(!intra) - { - *run = (tab->code >> 4) & 255; - level = tab->code & 15; - *last = (tab->code >> 12) & 1; - } - else - { - *run = (tab->code >> 8) & 255; - level = tab->code & 255; - *last = (tab->code >> 16) & 1; - } - return BitstreamGetBit(bs) ? -level : level; + if ((level = reverse_event->event.level) == 0) + goto error; + + *last = reverse_event->event.last; + *run = reverse_event->event.run; + + BitstreamSkip(bs, reverse_event->len); + + return BitstreamGetBits(bs, 1) ? -level : level; } - if(short_video_header) - { - // escape mode 4 - H.263 type, only used if short_video_header = 1 + BitstreamSkip(bs, 7); + + if (short_video_header) { + /* escape mode 4 - H.263 type, only used if short_video_header = 1 */ *last = BitstreamGetBit(bs); *run = BitstreamGetBits(bs, 6); level = BitstreamGetBits(bs, 8); - if (level == 0 || level == 128) - DEBUG1("Illegal LEVEL for ESCAPE mode 4:", level); + if (level == 0 || level == 128) + DPRINTF(DPRINTF_ERROR, "Illegal LEVEL for ESCAPE mode 4: %d", level); - return (level >= 128 ? -(256 - level) : level); + return (level << 24) >> 24; } - + mode = BitstreamShowBits(bs, 2); - if(mode < 3) { + if (mode < 3) { BitstreamSkip(bs, (mode == 2) ? 2 : 1); - tab = &DCT3D[intra][BitstreamShowBits(bs, 12)]; - if (tab->code == -1) + reverse_event = &DCT3D[intra][BitstreamShowBits(bs, 12)]; + + if ((level = reverse_event->event.level) == 0) goto error; - BitstreamSkip(bs, tab->len); + *last = reverse_event->event.last; + *run = reverse_event->event.run; - if (!intra) { - *run = (tab->code >> 4) & 255; - level = tab->code & 15; - *last = (tab->code >> 12) & 1; - } - else - { - *run = (tab->code >> 8) & 255; - level = tab->code & 255; - *last = (tab->code >> 16) & 1; - } - - if(mode < 2) // first escape mode, level is offset - level += max_level[*last + (!intra<<1)][*run]; // need to add back the max level - else if(mode == 2) // second escape mode, run is offset - *run += max_run[*last + (!intra<<1)][level] + 1; - - return BitstreamGetBit(bs) ? -level : level; - } + BitstreamSkip(bs, reverse_event->len); - // third escape mode - fixed length codes + if (mode < 2) /* first escape mode, level is offset */ + level += max_level[intra][*last][*run]; + else /* second escape mode, run is offset */ + *run += max_run[intra][*last][level] + 1; + + return BitstreamGetBits(bs, 1) ? -level : level; + } + + /* third escape mode - fixed length codes */ BitstreamSkip(bs, 2); *last = BitstreamGetBits(bs, 1); - *run = BitstreamGetBits(bs, 6); - BitstreamSkip(bs, 1); // marker - level = BitstreamGetBits(bs, 12); - BitstreamSkip(bs, 1); // marker + *run = BitstreamGetBits(bs, 6); + BitstreamSkip(bs, 1); /* marker */ + level = BitstreamGetBits(bs, 12); + BitstreamSkip(bs, 1); /* marker */ - return (level & 0x800) ? (level | (-1 ^ 0xfff)) : level; + return (level << 20) >> 20; -error: + error: *run = VLC_ERROR; return 0; } - -void get_intra_block(Bitstream * bs, int16_t * block, int direction, int coeff) +void +get_intra_block(Bitstream * bs, + int16_t * block, + int direction, + int coeff) { - const uint16_t * scan = scan_tables[ direction ]; - int level; - int run; - int last; - do - { + const uint16_t *scan = scan_tables[direction]; + int level, run, last; + + do { level = get_coeff(bs, &run, &last, 1, 0); - if (run == -1) - { - DEBUG("fatal: invalid run"); + if (run == -1) { + DPRINTF(DPRINTF_ERROR,"fatal: invalid run"); break; } coeff += run; - block[ scan[coeff] ] = level; - if (level < -127 || level > 127) - { - DEBUG1("warning: intra_overflow", level); + block[scan[coeff]] = level; + + DPRINTF(DPRINTF_COEFF,"block[%i] %i", scan[coeff], level); + //DPRINTF(DPRINTF_COEFF,"block[%i] %i %08x", scan[coeff], level, BitstreamShowBits(bs, 32)); + + if (level < -2047 || level > 2047) { + DPRINTF(DPRINTF_ERROR,"warning: intra_overflow %i", level); } coeff++; } while (!last); + } -void get_inter_block(Bitstream * bs, int16_t * block) +void +get_inter_block(Bitstream * bs, + int16_t * block, + int direction) { - const uint16_t * scan = scan_tables[0]; + + const uint16_t *scan = scan_tables[direction]; int p; int level; int run; int last; p = 0; - do - { + do { level = get_coeff(bs, &run, &last, 0, 0); - if (run == -1) - { - DEBUG("fatal: invalid run"); + if (run == -1) { + DPRINTF(DPRINTF_ERROR,"fatal: invalid run"); break; } p += run; - block[ scan[p] ] = level; - if (level < -127 || level > 127) - { - DEBUG1("warning: inter_overflow", level); + + block[scan[p]] = level; + + DPRINTF(DPRINTF_COEFF,"block[%i] %i", scan[p], level); + // DPRINTF(DPRINTF_COEFF,"block[%i] %i %08x", scan[p], level, BitstreamShowBits(bs, 32)); + + if (level < -2047 || level > 2047) { + DPRINTF(DPRINTF_ERROR,"warning: inter overflow %i", level); } p++; } while (!last); + }