--- trunk/xvidcore/examples/xvid_encraw.c 2002/08/17 20:03:36 376 +++ trunk/xvidcore/examples/xvid_encraw.c 2005/10/07 15:02:28 1646 @@ -1,572 +1,1319 @@ -/************************************************************************** +/***************************************************************************** * - * XVID MPEG-4 VIDEO CODEC - Example for encoding and decoding + * XVID MPEG-4 VIDEO CODEC + * - Console based test application - * - * This program is free software; you can redistribute it and/or modify - * it under the terms of the GNU General Public License as published by - * the Free Software Foundation; either version 2 of the License, or - * (at your option) any later version. + * Copyright(C) 2002-2003 Christoph Lampert + * 2002-2003 Edouard Gomez + * 2003 Peter Ross * - * This program is distributed in the hope that it will be useful, - * but WITHOUT ANY WARRANTY; without even the implied warranty of - * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the - * GNU General Public License for more details. + * This program is free software; you can redistribute it and/or modify + * it under the terms of the GNU General Public License as published by + * the Free Software Foundation; either version 2 of the License, or + * (at your option) any later version. * - * You should have received a copy of the GNU General Public License - * along with this program; if not, write to the Free Software - * Foundation, Inc., 675 Mass Ave, Cambridge, MA 02139, USA. + * This program is distributed in the hope that it will be useful, + * but WITHOUT ANY WARRANTY; without even the implied warranty of + * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the + * GNU General Public License for more details. * - *************************************************************************/ + * You should have received a copy of the GNU General Public License + * along with this program; if not, write to the Free Software + * Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA 02111-1307 USA + * + * $Id: xvid_encraw.c,v 1.22 2005-10-07 15:02:28 suxen_drol Exp $ + * + ****************************************************************************/ -/************************************************************************ +/***************************************************************************** + * Application notes : * - * Speed test routine for XviD using the XviD-API - * (C) Christoph Lampert, 2002/08/17 - * - * A sequence of YUV pics in PGM or RAW file format is encoded and the - * raw MPEG-4 stream is written to stdout. - * The encoding speed of this is measured, too. + * A sequence of raw YUV I420 pics or YUV I420 PGM file format is encoded + * The speed is measured and frames' PSNR are taken from core. * * The program is plain C and needs no libraries except for libxvidcore, - * and maths-lib, so with UN*X you simply compile by - * - * gcc xvid_encraw.c -lxvidcore -lm -o xvid_encraw - * - * Run without or with illegal parameters, then PGM input input is read - * from stdin. - * - * Parameters are: xvid_stat XDIM YDIM QUALITY BITRATE/QUANTIZER FRAMERATE - * - * if XDIM or YDIM are illegal (e.g. 0), they are ignored and input is - * considered to be PGM. Otherwise (X and Y both greater than 0) raw YUV - * is expected, as e.g. the standard MPEG test-files, like "foreman" - * - * 0 <= QUALITY <= 6 (default 5) - * - * BITRATE is in kbps (default 900), - * if BITRATE<32, then value is taken is fixed QUANTIZER - * - * FRAMERATE is a float (with or without decimal dot), default is 25.00 - * - * input/output and m4v-output is saved, if corresponding flags are set - * - * PGM input must in a very specific format, see read_pgmheader - * it can be generated e.g. from MPEG2 by mpeg2dec -o pgmpipe - * - ************************************************************************/ - -/************************************************************************ - * - * For EXAMPLES how to use this, see the seperate file xvid_stat.examples + * and maths-lib. * + * Use ./xvid_encraw -help for a list of options + * ************************************************************************/ #include #include -#include // needed for log10 -#include // only needed for gettimeofday +#include +#include +#ifndef WIN32 +#include +#else +#include +#include +#include +#define XVID_AVI_INPUT +#endif -#include "../src/xvid.h" /* comes with XviD */ +#include "xvid.h" -int motion_presets[7] = { - 0, // Q 0 - PMV_EARLYSTOP16, // Q 1 - PMV_EARLYSTOP16, // Q 2 - PMV_EARLYSTOP16 | PMV_HALFPELREFINE16, // Q 3 - PMV_EARLYSTOP16 | PMV_HALFPELREFINE16, // Q 4 - PMV_EARLYSTOP16 | PMV_HALFPELREFINE16 | PMV_EARLYSTOP8 // Q 5 - | PMV_HALFPELREFINE8, - PMV_EARLYSTOP16 | PMV_HALFPELREFINE16 | PMV_EXTSEARCH16 // Q 6 - | PMV_USESQUARES16 | PMV_EARLYSTOP8 | PMV_HALFPELREFINE8 - }; - -int general_presets[7] = { - XVID_H263QUANT, /* or use XVID_MPEGQUANT */ // Q 0 - XVID_MPEGQUANT, // Q 1 - XVID_H263QUANT, // Q 2 - XVID_H263QUANT | XVID_HALFPEL, // Q 3 - XVID_H263QUANT | XVID_HALFPEL | XVID_INTER4V, // Q 4 - XVID_H263QUANT | XVID_HALFPEL | XVID_INTER4V, // Q 5 - XVID_H263QUANT | XVID_HALFPEL | XVID_INTER4V }; // Q 6 - - -/* my default values for encoding */ - -#define ABS_MAXFRAMENR 9999 // max number of frames - -int ARG_BITRATE=900; -int ARG_QUANTI=0; - -int ARG_QUALITY =6; -int ARG_MINQUANT=1; -int ARG_MAXQUANT=31; -float ARG_FRAMERATE=25.00; +#undef READ_PNM -int ARG_MAXFRAMENR=ABS_MAXFRAMENR; +/***************************************************************************** + * Quality presets + ****************************************************************************/ + +static const int motion_presets[] = { + /* quality 0 */ + 0, + + /* quality 1 */ + XVID_ME_ADVANCEDDIAMOND16, + + /* quality 2 */ + XVID_ME_ADVANCEDDIAMOND16 | XVID_ME_HALFPELREFINE16, + + /* quality 3 */ + XVID_ME_ADVANCEDDIAMOND16 | XVID_ME_HALFPELREFINE16 | + XVID_ME_ADVANCEDDIAMOND8 | XVID_ME_HALFPELREFINE8, + + /* quality 4 */ + XVID_ME_ADVANCEDDIAMOND16 | XVID_ME_HALFPELREFINE16 | + XVID_ME_ADVANCEDDIAMOND8 | XVID_ME_HALFPELREFINE8 | + XVID_ME_CHROMA_PVOP | XVID_ME_CHROMA_BVOP, + + /* quality 5 */ + XVID_ME_ADVANCEDDIAMOND16 | XVID_ME_HALFPELREFINE16 | + XVID_ME_ADVANCEDDIAMOND8 | XVID_ME_HALFPELREFINE8 | + XVID_ME_CHROMA_PVOP | XVID_ME_CHROMA_BVOP, + + /* quality 6 */ + XVID_ME_ADVANCEDDIAMOND16 | XVID_ME_HALFPELREFINE16 | XVID_ME_EXTSEARCH16 | + XVID_ME_ADVANCEDDIAMOND8 | XVID_ME_HALFPELREFINE8 | XVID_ME_EXTSEARCH8 | + XVID_ME_CHROMA_PVOP | XVID_ME_CHROMA_BVOP, + +}; +#define ME_ELEMENTS (sizeof(motion_presets)/sizeof(motion_presets[0])) + +static const int vop_presets[] = { + /* quality 0 */ + 0, + + /* quality 1 */ + 0, + + /* quality 2 */ + XVID_VOP_HALFPEL, + + /* quality 3 */ + XVID_VOP_HALFPEL | XVID_VOP_INTER4V, + + /* quality 4 */ + XVID_VOP_HALFPEL | XVID_VOP_INTER4V, + + /* quality 5 */ + XVID_VOP_HALFPEL | XVID_VOP_INTER4V | + XVID_VOP_TRELLISQUANT, + + /* quality 6 */ + XVID_VOP_HALFPEL | XVID_VOP_INTER4V | + XVID_VOP_TRELLISQUANT | XVID_VOP_HQACPRED, + +}; +#define VOP_ELEMENTS (sizeof(vop_presets)/sizeof(vop_presets[0])) + +/***************************************************************************** + * Command line global variables + ****************************************************************************/ + +#define MAX_ZONES 64 + +static xvid_enc_zone_t ZONES[MAX_ZONES]; +static int NUM_ZONES = 0; + +/* Maximum number of frames to encode */ +#define ABS_MAXFRAMENR 9999 + +static int ARG_STATS = 0; +static int ARG_DUMP = 0; +static int ARG_LUMIMASKING = 0; +static int ARG_BITRATE = 0; +static int ARG_SINGLE = 0; +static char *ARG_PASS1 = 0; +static char *ARG_PASS2 = 0; +static int ARG_QUALITY = ME_ELEMENTS - 1; +static float ARG_FRAMERATE = 25.00f; +static int ARG_MAXFRAMENR = ABS_MAXFRAMENR; +static int ARG_MAXKEYINTERVAL = 0; +static char *ARG_INPUTFILE = NULL; +static int ARG_INPUTTYPE = 0; +static int ARG_SAVEMPEGSTREAM = 0; +static int ARG_SAVEINDIVIDUAL = 0; +static char *ARG_OUTPUTFILE = NULL; +static int XDIM = 0; +static int YDIM = 0; +static int ARG_BQRATIO = 150; +static int ARG_BQOFFSET = 100; +static int ARG_MAXBFRAMES = 0; +static int ARG_PACKED = 0; +static int ARG_DEBUG = 0; +static int ARG_VOPDEBUG = 0; +static int ARG_GREYSCALE = 0; +static int ARG_QTYPE = 0; +static int ARG_QMATRIX = 0; +static int ARG_GMC = 0; +static int ARG_INTERLACING = 0; +static int ARG_QPEL = 0; +static int ARG_TURBO = 0; +static int ARG_VHQMODE = 0; +static int ARG_BVHQ = 0; +static int ARG_CLOSED_GOP = 0; -#ifdef BFRAMES +#ifndef READ_PNM +#define IMAGE_SIZE(x,y) ((x)*(y)*3/2) +#else +#define IMAGE_SIZE(x,y) ((x)*(y)*3) +#endif + +#define MAX(A,B) ( ((A)>(B)) ? (A) : (B) ) +#define SMALL_EPS (1e-10) -int ARG_MAXBFRAMES=1; -int ARG_BQUANTRATIO=200; +#define SWAP(a) ( (((a)&0x000000ff)<<24) | (((a)&0x0000ff00)<<8) | \ + (((a)&0x00ff0000)>>8) | (((a)&0xff000000)>>24) ) +/**************************************************************************** + * Nasty global vars ;-) + ***************************************************************************/ + +static int i; + +/* the path where to save output */ +static char filepath[256] = "./"; + +/* Internal structures (handles) for encoding and decoding */ +static void *enc_handle = NULL; + +static unsigned char qmatrix_intra[64]; +static unsigned char qmatrix_inter[64]; + +#ifdef XVID_AVI_INPUT +static PAVISTREAM avi_stream = NULL; #endif -#define MAX(A,B) ( ((A)>(B)) ? (A) : (B) ) -#define SMALL_EPS 1e-10 +/***************************************************************************** + * Local prototypes + ****************************************************************************/ + +/* Prints program usage message */ +static void usage(); + +/* Statistical functions */ +static double msecond(); + +/* PGM related functions */ +#ifndef READ_PNM +static int read_pgmheader(FILE * handle); +static int read_pgmdata(FILE * handle, + unsigned char *image); +#else +static int read_pnmheader(FILE * handle); +static int read_pnmdata(FILE * handle, + unsigned char *image); +#endif +static int read_yuvdata(FILE * handle, + unsigned char *image); -/* these are global variables. Not very elegant, but easy, and this is an easy program */ - -int XDIM=0; -int YDIM=0; // will be set when reading first image -int i,filenr = 0; - -int save_m4v_flag = 1; // output MPEG4-bytestream? -int save_ref_flag = 0; // save input image - -int pgmflag = 0; // a flag, if input is in PGM format, overwritten in init-phase -char filepath[256] = "./"; // the path where to save output - -void *enc_handle = NULL; // internal structures (handles) for encoding - - -/*********************************************************************/ -/* "statistical" functions */ -/* */ -/* these are not needed for encoding or decoding, but for measuring */ -/* time and quality, there in nothing specific to XviD in these */ -/* */ -/*********************************************************************/ - -double msecond() -/* return the current time in seconds(!) */ -{ - struct timeval tv; - gettimeofday(&tv, 0); - return tv.tv_sec + tv.tv_usec * 1.0e-6; -} +/* Encoder related functions */ +static int enc_init(int use_assembler); +static int enc_stop(); +static int enc_main(unsigned char *image, + unsigned char *bitstream, + int *key, + int *stats_type, + int *stats_quant, + int *stats_length, + int stats[3]); + +/***************************************************************************** + * Main function + ****************************************************************************/ + +int +main(int argc, + char *argv[]) +{ -/*********************************************************************/ -/* input and output functions */ -/* */ -/* the are small and simple routines to read and write PGM and YUV */ -/* image. It's just for convenience, again nothing specific to XviD */ -/* */ -/*********************************************************************/ - -int read_pgmheader(FILE* handle) -{ - int bytes,xsize,ysize,depth; - char dummy[2]; - - bytes = fread(dummy,1,2,handle); + unsigned char *mp4_buffer = NULL; + unsigned char *in_buffer = NULL; + unsigned char *out_buffer = NULL; + + double enctime; + double totalenctime = 0.; + float totalPSNR[3] = {0., 0., 0.}; + + int totalsize; + int result; + int m4v_size; + int key; + int stats_type; + int stats_quant; + int stats_length; + int use_assembler = 1; + + int input_num; + int output_num; + + char filename[256]; + + FILE *in_file = stdin; + FILE *out_file = NULL; + + printf("xvid_encraw - raw mpeg4 bitstream encoder "); + printf("written by Christoph Lampert 2002-2003\n\n"); + + /* Is there a dumb XviD coder ? */ + if(ME_ELEMENTS != VOP_ELEMENTS) { + fprintf(stderr, "Presets' arrays should have the same number of elements -- Please fill a bug to xvid-devel@xvid.org\n"); + return(-1); + } + +/***************************************************************************** + * Command line parsing + ****************************************************************************/ + + for (i = 1; i < argc; i++) { + + if (strcmp("-asm", argv[i]) == 0) { + use_assembler = 1; + } else if (strcmp("-noasm", argv[i]) == 0) { + use_assembler = 0; + } else if (strcmp("-w", argv[i]) == 0 && i < argc - 1) { + i++; + XDIM = atoi(argv[i]); + } else if (strcmp("-h", argv[i]) == 0 && i < argc - 1) { + i++; + YDIM = atoi(argv[i]); + } else if (strcmp("-bitrate", argv[i]) == 0 && i < argc - 1) { + i++; + ARG_BITRATE = atoi(argv[i]); + } else if (strcmp("-single", argv[i]) == 0) { + ARG_SINGLE = 1; + } else if (strcmp("-pass1", argv[i]) == 0 && i < argc - 1) { + i++; + ARG_PASS1 = argv[i]; + } else if (strcmp("-pass2", argv[i]) == 0 && i < argc - 1) { + i++; + ARG_PASS2 = argv[i]; + } else if (strcmp("-max_bframes", argv[i]) == 0 && i < argc - 1) { + i++; + ARG_MAXBFRAMES = atoi(argv[i]); + } else if (strcmp("-packed", argv[i]) == 0) { + ARG_PACKED = 1; + } else if (strcmp("-bquant_ratio", argv[i]) == 0 && i < argc - 1) { + i++; + ARG_BQRATIO = atoi(argv[i]); + } else if (strcmp("-bquant_offset", argv[i]) == 0 && i < argc - 1) { + i++; + ARG_BQOFFSET = atoi(argv[i]); + + } else if ((strcmp("-zq", argv[i]) == 0 || strcmp("-zw", argv[i]) == 0) && i < argc - 2) { + + if (NUM_ZONES >= MAX_ZONES) { + fprintf(stderr,"warning: too many zones; zone ignored\n"); + continue; + } + ZONES[NUM_ZONES].mode = strcmp("-zq", argv[i])==0 ? XVID_ZONE_QUANT : XVID_ZONE_WEIGHT; + i++; + ZONES[NUM_ZONES].frame = atoi(argv[i]); + i++; + ZONES[NUM_ZONES].increment = (int)(atof(argv[i]) * 100); + ZONES[NUM_ZONES].base = 100; + NUM_ZONES++; + + } else if (strcmp("-quality", argv[i]) == 0 && i < argc - 1) { + i++; + ARG_QUALITY = atoi(argv[i]); + } else if (strcmp("-vhqmode", argv[i]) == 0 && i < argc - 1) { + i++; + ARG_VHQMODE = atoi(argv[i]); + } else if (strcmp("-framerate", argv[i]) == 0 && i < argc - 1) { + i++; + ARG_FRAMERATE = (float) atof(argv[i]); + } else if (strcmp("-max_key_interval", argv[i]) == 0 && i < argc - 1) { + i++; + ARG_MAXKEYINTERVAL = atoi(argv[i]); + } else if (strcmp("-i", argv[i]) == 0 && i < argc - 1) { + i++; + ARG_INPUTFILE = argv[i]; + } else if (strcmp("-stats", argv[i]) == 0) { + ARG_STATS = 1; + } else if (strcmp("-dump", argv[i]) == 0) { + ARG_DUMP = 1; + } else if (strcmp("-lumimasking", argv[i]) == 0) { + ARG_LUMIMASKING = 1; + } else if (strcmp("-type", argv[i]) == 0 && i < argc - 1) { + i++; + ARG_INPUTTYPE = atoi(argv[i]); + } else if (strcmp("-frames", argv[i]) == 0 && i < argc - 1) { + i++; + ARG_MAXFRAMENR = atoi(argv[i]); + } else if (strcmp("-qtype", argv[i]) == 0 && i < argc - 1) { + i++; + ARG_QTYPE = atoi(argv[i]); + } else if (strcmp("-qmatrix", argv[i]) == 0 && i < argc - 1) { + FILE *fp = fopen(argv[++i], "rb"); + if (fp == NULL) { + fprintf(stderr, "Error opening input file %s\n", argv[i]); + return (-1); + } + fseek(fp, 0, SEEK_END); + if (ftell(fp) != 128) { + fprintf(stderr, "Unexpected size of input file %s\n", argv[i]); + return (-1); + } + + fseek(fp, 0, SEEK_SET); + fread(qmatrix_intra, 1, 64, fp); + fread(qmatrix_inter, 1, 64, fp); + + ARG_QMATRIX = 1; + } else if (strcmp("-save", argv[i]) == 0) { + ARG_SAVEMPEGSTREAM = 1; + ARG_SAVEINDIVIDUAL = 1; + } else if (strcmp("-debug", argv[i]) == 0) { + i++; + if (sscanf(argv[i],"0x%x", &ARG_DEBUG) || sscanf(argv[i],"%d", &ARG_DEBUG)) ; + } else if (strcmp("-o", argv[i]) == 0 && i < argc - 1) { + ARG_SAVEMPEGSTREAM = 1; + i++; + ARG_OUTPUTFILE = argv[i]; + } else if (strcmp("-vop_debug", argv[i]) == 0) { + ARG_VOPDEBUG = 1; + } else if (strcmp("-grey", argv[i]) == 0) { + ARG_GREYSCALE = 1; + } else if (strcmp("-bvhq", argv[i]) == 0) { + ARG_BVHQ = 1; + } else if (strcmp("-qpel", argv[i]) == 0) { + ARG_QPEL = 1; + } else if (strcmp("-turbo", argv[i]) == 0) { + ARG_TURBO = 1; + } else if (strcmp("-gmc", argv[i]) == 0) { + ARG_GMC = 1; + } else if (strcmp("-interlaced", argv[i]) == 0) { + ARG_INTERLACING = 1; + } else if (strcmp("-closed_gop", argv[i]) == 0) { + ARG_CLOSED_GOP = 1; + } else if (strcmp("-help", argv[i])) { + usage(); + return (0); + } else { + usage(); + exit(-1); + } - if ( (bytes < 2) || (dummy[0] != 'P') || (dummy[1] != '5' )) - return 1; - fscanf(handle,"%d %d %d",&xsize,&ysize,&depth); - if ( (xsize > 1440) || (ysize > 2880 ) || (depth != 255) ) - { - return 2; } - if ( (XDIM==0) || (YDIM==0) ) - { XDIM=xsize; - YDIM=ysize; + +/***************************************************************************** + * Arguments checking + ****************************************************************************/ + + if (XDIM <= 0 || XDIM >= 4096 || YDIM <= 0 || YDIM >= 4096) { + fprintf(stderr, + "Trying to retrieve width and height from input header\n"); + if (!ARG_INPUTTYPE) + ARG_INPUTTYPE = 1; /* pgm */ } - return 0; -} + if (ARG_QUALITY < 0 ) { + ARG_QUALITY = 0; + } else if (ARG_QUALITY >= ME_ELEMENTS) { + ARG_QUALITY = ME_ELEMENTS - 1; + } -int read_pgmdata(FILE* handle, unsigned char *image) -{ - int i,status; - char dummy; - - unsigned char* buff1_ptr2 = image + XDIM*YDIM; - unsigned char* buff1_ptr3 = image + XDIM*YDIM + XDIM/2*YDIM/2; - - fread(image,XDIM*YDIM,1,stdin); // read Y component of picture - - for (i=0;i= ARG_MAXFRAMENR) { + result = 1; + } + + if (!result) { +#ifdef XVID_AVI_INPUT + if (ARG_INPUTTYPE==2) { + /* read avs/avi data (YUV-format) */ + if(AVIStreamRead(avi_stream, input_num, 1, in_buffer, IMAGE_SIZE(XDIM, YDIM), NULL, NULL ) != AVIERR_OK) + result = 1; + } else +#endif + if (ARG_INPUTTYPE==1) { + /* read PGM data (YUV-format) */ +#ifndef READ_PNM + result = read_pgmdata(in_file, in_buffer); #else - xinit.cpu_flags = 0; + result = read_pnmdata(in_file, in_buffer); #endif + } else { + /* read raw data (YUV-format) */ + result = read_yuvdata(in_file, in_buffer); + } + } - else - xinit.cpu_flags = XVID_CPU_FORCE; +/***************************************************************************** + * Encode and decode this frame + ****************************************************************************/ + + enctime = msecond(); + m4v_size = + enc_main(!result ? in_buffer : 0, mp4_buffer, &key, &stats_type, + &stats_quant, &stats_length, sse); + enctime = msecond() - enctime; + + /* Write the Frame statistics */ + + printf("%5d: key=%i, time= %6.0f, len= %7d", !result ? input_num : -1, + key, (float) enctime, (int) m4v_size); + + if (stats_type > 0) { /* !XVID_TYPE_NOTHING */ + + switch (stats_type) { + case XVID_TYPE_IVOP: + type = "I"; + break; + case XVID_TYPE_PVOP: + type = "P"; + break; + case XVID_TYPE_BVOP: + type = "B"; + break; + case XVID_TYPE_SVOP: + type = "S"; + break; + default: + type = "U"; + break; + } + + printf(" | type=%s, quant= %2d, len= %7d", type, stats_quant, + stats_length); + +#define SSE2PSNR(sse, width, height) ((!(sse))?0.0f : 48.131f - 10*(float)log10((float)(sse)/((float)((width)*(height))))) + + if (ARG_STATS) { + printf(", psnr y = %2.2f, psnr u = %2.2f, psnr v = %2.2f", + SSE2PSNR(sse[0], XDIM, YDIM), SSE2PSNR(sse[1], XDIM / 2, + YDIM / 2), + SSE2PSNR(sse[2], XDIM / 2, YDIM / 2)); + + totalPSNR[0] += SSE2PSNR(sse[0], XDIM, YDIM); + totalPSNR[1] += SSE2PSNR(sse[1], XDIM/2, YDIM/2); + totalPSNR[2] += SSE2PSNR(sse[2], XDIM/2, YDIM/2); + } + + } +#undef SSE2PSNR - xvid_init(NULL, 0, &xinit, NULL); + printf("\n"); - xparam.width = XDIM; - xparam.height = YDIM; - if ((ARG_FRAMERATE - (int)ARG_FRAMERATE) < SMALL_EPS) - { - xparam.fincr = 1; - xparam.fbase = (int)ARG_FRAMERATE; + if (m4v_size < 0) { + break; + } + + /* Update encoding time stats */ + totalenctime += enctime; + totalsize += m4v_size; + +/***************************************************************************** + * Save stream to file + ****************************************************************************/ + + if (m4v_size > 0 && ARG_SAVEMPEGSTREAM) { + + /* Save single files */ + if (ARG_SAVEINDIVIDUAL) { + FILE *out; + sprintf(filename, "%sframe%05d.m4v", filepath, output_num); + out = fopen(filename, "w+b"); + fwrite(mp4_buffer, m4v_size, 1, out); + fclose(out); + output_num++; + } + + /* Save ES stream */ + if (ARG_OUTPUTFILE && out_file) + fwrite(mp4_buffer, 1, m4v_size, out_file); + } + + input_num++; + + /* Read the header if it's pgm stream */ + if (!result && (ARG_INPUTTYPE==1)) +#ifndef READ_PNM + result = read_pgmheader(in_file); +#else + result = read_pnmheader(in_file); +#endif + } while (1); + + + +/***************************************************************************** + * Calculate totals and averages for output, print results + ****************************************************************************/ + + printf("Tot: enctime(ms) =%7.2f, length(bytes) = %7d\n", + totalenctime, (int) totalsize); + + if (input_num > 0) { + totalsize /= input_num; + totalenctime /= input_num; + totalPSNR[0] /= input_num; + totalPSNR[1] /= input_num; + totalPSNR[2] /= input_num; + } else { + totalsize = -1; + totalenctime = -1; } - else - { - xparam.fincr = FRAMERATE_INCR; - xparam.fbase = (int)(FRAMERATE_INCR * ARG_FRAMERATE); + + printf("Avg: enctime(ms) =%7.2f, fps =%7.2f, length(bytes) = %7d", + totalenctime, 1000 / totalenctime, (int) totalsize); + if (ARG_STATS) { + printf(", psnr y = %2.2f, psnr u = %2.2f, psnr v = %2.2f", + totalPSNR[0],totalPSNR[1],totalPSNR[2]); } - xparam.rc_reaction_delay_factor = 16; - xparam.rc_averaging_period = 100; - xparam.rc_buffer = 10; - xparam.rc_bitrate = ARG_BITRATE*1000; - xparam.min_quantizer = 1; - xparam.max_quantizer = 31; - xparam.max_key_interval = (int)ARG_FRAMERATE*10; + printf("\n"); + + +/***************************************************************************** + * XviD PART Stop + ****************************************************************************/ -#ifdef BFRAMES - xparam.global = XVID_GLOBAL_DX50BVOP; - xparam.max_bframes = ARG_MAXBFRAMES; - xparam.bquant_ratio = ARG_BQUANTRATIO; - xparam.frame_drop_ratio=0; + release_all: + +#ifdef XVID_AVI_INPUT + if (avi_stream) { + AVIStreamRelease(avi_stream); + AVIFileExit(); + } #endif - /* I use a small value here, since will not encode whole movies, - but short clips */ + if (enc_handle) { + result = enc_stop(); + if (result) + fprintf(stderr, "Encore RELEASE problem return value %d\n", + result); + } + + if (in_file) + fclose(in_file); + if (out_file) + fclose(out_file); + + free_all_memory: + free(out_buffer); + free(mp4_buffer); + free(in_buffer); - xerr = xvid_encore(NULL, XVID_ENC_CREATE, &xparam, NULL); - enc_handle=xparam.handle; + return (0); - return xerr; } -int enc_stop() -{ int xerr; - xerr = xvid_encore(enc_handle, XVID_ENC_DESTROY, NULL, NULL); - return xerr; +/***************************************************************************** + * "statistical" functions + * + * these are not needed for encoding or decoding, but for measuring + * time and quality, there in nothing specific to XviD in these + * + *****************************************************************************/ + +/* Return time elapsed time in miliseconds since the program started */ +static double +msecond() +{ +#ifndef WIN32 + struct timeval tv; + + gettimeofday(&tv, 0); + return (tv.tv_sec * 1.0e3 + tv.tv_usec * 1.0e-3); +#else + clock_t clk; + + clk = clock(); + return (clk * 1000.0 / CLOCKS_PER_SEC); +#endif } -int enc_main(unsigned char* image, unsigned char* bitstream, int *streamlength, int* frametype) -{ int xerr; +/***************************************************************************** + * Usage message + *****************************************************************************/ - XVID_ENC_FRAME xframe; - XVID_ENC_STATS xstats; +static void +usage() +{ + fprintf(stderr, "Usage : xvid_stat [OPTIONS]\n\n"); + fprintf(stderr, "Input options:\n"); + fprintf(stderr, " -i string : input filename (default=stdin)\n"); +#ifdef XVID_AVI_INPUT + fprintf(stderr, " -type integer: input data type (yuv=0, pgm=1, avi/avs=2)\n"); +#else + fprintf(stderr, " -type integer: input data type (yuv=0, pgm=1)\n"); +#endif + fprintf(stderr, " -w integer: frame width ([1.2048])\n"); + fprintf(stderr, " -h integer: frame height ([1.2048])\n"); + fprintf(stderr, " -frames integer: number of frames to encode\n"); + fprintf(stderr, "\n"); + fprintf(stderr, "Output options:\n"); + fprintf(stderr, " -dump : save decoder output\n"); + fprintf(stderr, " -save : save an Elementary Stream file per frame\n"); + fprintf(stderr, " -o string: save an Elementary Stream for the complete sequence\n"); + fprintf(stderr, "\n"); + fprintf(stderr, "BFrames options:\n"); + fprintf(stderr, " -max_bframes integer: max bframes (default=0)\n"); + fprintf(stderr, " -bquant_ratio integer: bframe quantizer ratio (default=150)\n"); + fprintf(stderr, " -bquant_offset integer: bframe quantizer offset (default=100)\n"); + fprintf(stderr, "\n"); + fprintf(stderr, "Rate control options:\n"); + fprintf(stderr, " -framerate float : target framerate (>0 | default=25.0)\n"); + fprintf(stderr, " -bitrate integer : target bitrate\n"); + fprintf(stderr, " -single : single pass mode\n"); + fprintf(stderr, " -pass1 filename : twopass mode (first pass)\n"); + fprintf(stderr, " -pass2 filename : twopass mode (2nd pass)\n"); + fprintf(stderr, " -zq starting_frame float : bitrate zone; quant\n"); + fprintf(stderr, " -zw starting_frame float : bitrate zone; weight\n"); + fprintf(stderr, " -max_key_interval integer : maximum keyframe interval\n"); + fprintf(stderr, "\n"); + fprintf(stderr, "Other options\n"); + fprintf(stderr, " -noasm : do not use assembly optmized code\n"); + fprintf(stderr, " -turbo : use turbo presets for higher encoding speed\n"); + fprintf(stderr, " -quality integer : quality ([0..%d])\n", ME_ELEMENTS - 1); + fprintf(stderr, " -vhqmode integer : level of Rate-Distortion optimizations ([0..4]) (default=0)\n"); + fprintf(stderr, " -bvhq : use Rate-Distortion optimizations for B-frames too\n"); + fprintf(stderr, " -qpel : use quarter pixel ME\n"); + fprintf(stderr, " -gmc : use global motion compensation\n"); + fprintf(stderr, " -qtype integer : quantization type (H263:0, MPEG4:1) (default=0)\n"); + fprintf(stderr, " -qmatrix filename: use custom MPEG4 quantization matrix\n"); + fprintf(stderr, " -interlaced : use interlaced encoding (this is NOT a deinterlacer!)\n"); + fprintf(stderr, " -packed : packed mode\n"); + fprintf(stderr, " -closed_gop : closed GOP mode\n"); + fprintf(stderr, " -grey : grey scale coding (chroma is discarded)\n"); + fprintf(stderr, " -lumimasking : use lumimasking algorithm\n"); + fprintf(stderr, " -stats : print stats about encoded frames\n"); + fprintf(stderr, " -debug : activates xvidcore internal debugging output\n"); + fprintf(stderr, " -vop_debug : print some info directly into encoded frames\n"); + fprintf(stderr, " -help : prints this help message\n"); + fprintf(stderr, "\n"); + fprintf(stderr, "NB: You can define %d zones repeating the -z[qw] option as many times as needed.\n", MAX_ZONES); + fprintf(stderr, "\n"); +} - xframe.bitstream = bitstream; - xframe.length = -1; // this is written by the routine +/***************************************************************************** + * Input and output functions + * + * the are small and simple routines to read and write PGM and YUV + * image. It's just for convenience, again nothing specific to XviD + * + *****************************************************************************/ - xframe.image = image; - xframe.colorspace = XVID_CSP_YV12; // defined in +#ifndef READ_PNM +static int +read_pgmheader(FILE * handle) +{ + int bytes, xsize, ysize, depth; + char dummy[2]; - xframe.intra = -1; // let the codec decide between I-frame (1) and P-frame (0) + bytes = fread(dummy, 1, 2, handle); - xframe.quant = ARG_QUANTI; // is quant != 0, use a fixed quant (and ignore bitrate) + if ((bytes < 2) || (dummy[0] != 'P') || (dummy[1] != '5')) + return (1); - xframe.motion = motion_presets[ARG_QUALITY]; - xframe.general = general_presets[ARG_QUALITY]; - xframe.quant_intra_matrix = xframe.quant_inter_matrix = NULL; + fscanf(handle, "%d %d %d", &xsize, &ysize, &depth); + if ((xsize > 4096) || (ysize > 4096*3/2) || (depth != 255)) { + fprintf(stderr, "%d %d %d\n", xsize, ysize, depth); + return (2); + } + if ((XDIM == 0) || (YDIM == 0)) { + XDIM = xsize; + YDIM = ysize * 2 / 3; + } -#ifdef BFRAMES - xframe.bquant = 0; -#endif + return (0); +} - xerr = xvid_encore(enc_handle, XVID_ENC_ENCODE, &xframe, &xstats); +static int +read_pgmdata(FILE * handle, + unsigned char *image) +{ + int i; + char dummy; -/* enc_result->is_key_frame = xframe.intra; - enc_result->quantizer = xframe.quant; - enc_result->total_bits = xframe.length * 8; - enc_result->motion_bits = xstats.hlength * 8; - enc_result->texture_bits = enc_result->total_bits - enc_result->motion_bits; -*/ + unsigned char *y = image; + unsigned char *u = image + XDIM * YDIM; + unsigned char *v = image + XDIM * YDIM + XDIM / 2 * YDIM / 2; + + /* read Y component of picture */ + fread(y, 1, XDIM * YDIM, handle); + + for (i = 0; i < YDIM / 2; i++) { + /* read U */ + fread(u, 1, XDIM / 2, handle); + + /* read V */ + fread(v, 1, XDIM / 2, handle); + + /* Update pointers */ + u += XDIM / 2; + v += XDIM / 2; + } -/* This is statictical data, e.g. for 2-pass. - If you are not interested in any of this, you can use - NULL instead of &xstats -*/ - *frametype = xframe.intra; - *streamlength = xframe.length; + /* I don't know why, but this seems needed */ + fread(&dummy, 1, 1, handle); - return xerr; + return (0); } +#else +static int +read_pnmheader(FILE * handle) +{ + int bytes, xsize, ysize, depth; + char dummy[2]; -/*********************************************************************/ -/* Main program */ -/*********************************************************************/ - -int main(int argc, char *argv[]) -{ - unsigned char *divx_buffer = NULL; - unsigned char *in_buffer = NULL; - - double enctime; - double totalenctime=0.; - - long totalsize=0; - int status; - - int m4v_size; - int frame_type[ABS_MAXFRAMENR]; - int Iframes=0, Pframes=0, Bframes=0; - int use_assembler=1; - - char filename[256]; - - FILE *filehandle; - -/* read YUV in pgm format from stdin */ - if (!pgmflag) - { - pgmflag = 1; - -// if (argc==2 && !strcmp(argv[1],"-noasm")) -// use_assembler = 0; - - if (argc>=3) - { XDIM = atoi(argv[1]); - YDIM = atoi(argv[2]); - if ( (XDIM <= 0) || (XDIM >= 2048) || (YDIM <=0) || (YDIM >= 2048) ) - { fprintf(stderr,"Wrong frames size %d %d, trying PGM \n",XDIM, YDIM); - } - else - { - YDIM = YDIM*3/2; /* for YUV */ - pgmflag = 0; - } + bytes = fread(dummy, 1, 2, handle); + + if ((bytes < 2) || (dummy[0] != 'P') || (dummy[1] != '6')) + return (1); + + fscanf(handle, "%d %d %d", &xsize, &ysize, &depth); + if ((xsize > 1440) || (ysize > 2880) || (depth != 255)) { + fprintf(stderr, "%d %d %d\n", xsize, ysize, depth); + return (2); } - } - - if (pgmflag) - { if (read_pgmheader(stdin)) - { - fprintf(stderr,"Wrong input format, I want YUV encapsulated in PGM\n"); - return 1; - } - } - if (argc>=4) - { ARG_QUALITY = atoi(argv[3]); - if ( (ARG_QUALITY < 0) || (ARG_QUALITY > 6) ) - { fprintf(stderr,"Wrong Quality\n"); return -1; } + + XDIM = xsize; + YDIM = ysize; + + return (0); +} + +static int +read_pnmdata(FILE * handle, + unsigned char *image) +{ + int i; + char dummy; + + /* read Y component of picture */ + fread(image, 1, XDIM * YDIM * 3, handle); + + /* I don't know why, but this seems needed */ + fread(&dummy, 1, 1, handle); + + return (0); +} +#endif + +static int +read_yuvdata(FILE * handle, + unsigned char *image) +{ + + if (fread(image, 1, IMAGE_SIZE(XDIM, YDIM), handle) != + (unsigned int) IMAGE_SIZE(XDIM, YDIM)) + return (1); else - fprintf(stderr,"Quality %d\n",ARG_QUALITY); - } - if (argc>=5) - { ARG_BITRATE = atoi(argv[4]); - if ( (ARG_BITRATE <= 0) ) - { fprintf(stderr,"Wrong Bitrate\n"); return -1; } - if ( (ARG_BITRATE < 32) ) - { ARG_QUANTI = ARG_BITRATE; - ARG_BITRATE=0; - fprintf(stderr,"Quantizer %d\n",ARG_QUANTI); + return (0); +} + +/***************************************************************************** + * Routines for encoding: init encoder, frame step, release encoder + ****************************************************************************/ + +/* sample plugin */ + +int +rawenc_debug(void *handle, + int opt, + void *param1, + void *param2) +{ + switch (opt) { + case XVID_PLG_INFO: + { + xvid_plg_info_t *info = (xvid_plg_info_t *) param1; + + info->flags = XVID_REQDQUANTS; + return 0; } - else - fprintf(stderr,"Bitrate %d kbps\n",ARG_BITRATE); - } - if (argc>=6) - { ARG_FRAMERATE = (float)atof(argv[5]); - if ( (ARG_FRAMERATE <= 0) ) - { fprintf(stderr,"Wrong Fraterate %s \n",argv[5]); return -1; } - fprintf(stderr,"Framerate %6.3f fps\n",ARG_FRAMERATE); - } - - if (argc>=7) - { ARG_MAXFRAMENR = atoi(argv[6]); - if ( (ARG_MAXFRAMENR <= 0) ) - { fprintf(stderr,"Wrong number of frames\n"); return -1; } - fprintf(stderr,"max. Framenr. %d\n",ARG_MAXFRAMENR); - } - -#ifdef BFRAMES - if (argc>=8) - { ARG_MAXBFRAMES = atoi(argv[7]); - if ( (ARG_MAXBFRAMES < -1) || ( ARG_MAXBFRAMES > ARG_FRAMERATE) ) - { fprintf(stderr,"Wrong maximumnumber of bframes\n"); return -1; } - fprintf(stderr,"max. B-frames %d\n",ARG_MAXBFRAMES); - } - - if (argc>=9) - { ARG_MAXFRAMENR = atoi(argv[8]); - if ( (ARG_BQUANTRATIO <= 0) ) - { fprintf(stderr,"Wrong B-frames Quantizer ratio \n"); return -1; } - fprintf(stderr,"B-frames quant-ratio %d\n",ARG_BQUANTRATIO); - } -#endif - -/* now we know the sizes, so allocate memory */ - - in_buffer = (unsigned char *) malloc(XDIM*YDIM); - if (!in_buffer) - goto free_all_memory; - - divx_buffer = (unsigned char *) malloc(XDIM*YDIM*2); - if (!divx_buffer) - goto free_all_memory; - - YDIM = YDIM*2/3; // PGM is YUV 4:2:0 format, so real image height is *2/3 of PGM picture -/*********************************************************************/ -/* XviD PART Start */ -/*********************************************************************/ - - status = enc_init(use_assembler); - if (status) - { - fprintf(stderr,"Encore INIT problem, return value %d\n", status); - goto release_all; + case XVID_PLG_CREATE: + case XVID_PLG_DESTROY: + case XVID_PLG_BEFORE: + return 0; + + case XVID_PLG_AFTER: + { + xvid_plg_data_t *data = (xvid_plg_data_t *) param1; + int i, j; + + printf("---[ frame: %5i quant: %2i length: %6i ]---\n", + data->frame_num, data->quant, data->length); + for (j = 0; j < data->mb_height; j++) { + for (i = 0; i < data->mb_width; i++) + printf("%2i ", data->dquant[j * data->dquant_stride + i]); + printf("\n"); + } + + return 0; + } } -/*********************************************************************/ -/* Main loop */ -/*********************************************************************/ - - do - { - if (pgmflag) - status = read_pgmdata(stdin, in_buffer); // read PGM data (YUV-format) - else - status = read_yuvdata(stdin, in_buffer); // read raw data (YUV-format) - - if (status) - { - // Couldn't read image, most likely end-of-file - continue; + return XVID_ERR_FAIL; +} + + +#define FRAMERATE_INCR 1001 + + +/* Initialize encoder for first use, pass all needed parameters to the codec */ +static int +enc_init(int use_assembler) +{ + int xerr; + //xvid_plugin_cbr_t cbr; + xvid_plugin_single_t single; + xvid_plugin_2pass1_t rc2pass1; + xvid_plugin_2pass2_t rc2pass2; + //xvid_plugin_fixed_t rcfixed; + xvid_enc_plugin_t plugins[7]; + xvid_gbl_init_t xvid_gbl_init; + xvid_enc_create_t xvid_enc_create; + + /*------------------------------------------------------------------------ + * XviD core initialization + *----------------------------------------------------------------------*/ + + /* Set version -- version checking will done by xvidcore */ + memset(&xvid_gbl_init, 0, sizeof(xvid_gbl_init)); + xvid_gbl_init.version = XVID_VERSION; + xvid_gbl_init.debug = ARG_DEBUG; + + + /* Do we have to enable ASM optimizations ? */ + if (use_assembler) { + +#ifdef ARCH_IS_IA64 + xvid_gbl_init.cpu_flags = XVID_CPU_FORCE | XVID_CPU_ASM; +#else + xvid_gbl_init.cpu_flags = 0; +#endif + } else { + xvid_gbl_init.cpu_flags = XVID_CPU_FORCE; } + /* Initialize XviD core -- Should be done once per __process__ */ + xvid_global(NULL, XVID_GBL_INIT, &xvid_gbl_init, NULL); - if (save_ref_flag) - { - sprintf(filename, "%s%05d.pgm", filepath, filenr); - write_pgm(filename,in_buffer); - } + /*------------------------------------------------------------------------ + * XviD encoder initialization + *----------------------------------------------------------------------*/ + + /* Version again */ + memset(&xvid_enc_create, 0, sizeof(xvid_enc_create)); + xvid_enc_create.version = XVID_VERSION; + + /* Width and Height of input frames */ + xvid_enc_create.width = XDIM; + xvid_enc_create.height = YDIM; + xvid_enc_create.profile = XVID_PROFILE_AS_L4; + + /* init plugins */ + xvid_enc_create.zones = ZONES; + xvid_enc_create.num_zones = NUM_ZONES; + + xvid_enc_create.plugins = plugins; + xvid_enc_create.num_plugins = 0; + + if (ARG_SINGLE) { + memset(&single, 0, sizeof(xvid_plugin_single_t)); + single.version = XVID_VERSION; + single.bitrate = ARG_BITRATE; + + plugins[xvid_enc_create.num_plugins].func = xvid_plugin_single; + plugins[xvid_enc_create.num_plugins].param = &single; + xvid_enc_create.num_plugins++; + } + if (ARG_PASS2) { + memset(&rc2pass2, 0, sizeof(xvid_plugin_2pass2_t)); + rc2pass2.version = XVID_VERSION; + rc2pass2.filename = ARG_PASS2; + rc2pass2.bitrate = ARG_BITRATE; + +/* An example of activating VBV could look like this + rc2pass2.vbv_size = 3145728; + rc2pass2.vbv_initial = 2359296; + rc2pass2.vbv_maxrate = 4000000; + rc2pass2.vbv_peakrate = 10000000; +*/ -/*********************************************************************/ -/* analyse this frame before encoding */ -/*********************************************************************/ + plugins[xvid_enc_create.num_plugins].func = xvid_plugin_2pass2; + plugins[xvid_enc_create.num_plugins].param = &rc2pass2; + xvid_enc_create.num_plugins++; + } -// nothing is done here at the moment, but you could e.g. create -// histograms or measure entropy or apply preprocessing filters... + if (ARG_PASS1) { + memset(&rc2pass1, 0, sizeof(xvid_plugin_2pass1_t)); + rc2pass1.version = XVID_VERSION; + rc2pass1.filename = ARG_PASS1; + + plugins[xvid_enc_create.num_plugins].func = xvid_plugin_2pass1; + plugins[xvid_enc_create.num_plugins].param = &rc2pass1; + xvid_enc_create.num_plugins++; + } -/*********************************************************************/ -/* encode and decode this frame */ -/*********************************************************************/ + if (ARG_LUMIMASKING) { + plugins[xvid_enc_create.num_plugins].func = xvid_plugin_lumimasking; + plugins[xvid_enc_create.num_plugins].param = NULL; + xvid_enc_create.num_plugins++; + } - enctime = -msecond(); - status = enc_main(in_buffer, divx_buffer, &m4v_size, &frame_type[filenr]); - enctime += msecond(); + if (ARG_DUMP) { + plugins[xvid_enc_create.num_plugins].func = xvid_plugin_dump; + plugins[xvid_enc_create.num_plugins].param = NULL; + xvid_enc_create.num_plugins++; + } - totalenctime += enctime; - totalsize += m4v_size; +#if 0 + if (ARG_DEBUG) { + plugins[xvid_enc_create.num_plugins].func = rawenc_debug; + plugins[xvid_enc_create.num_plugins].param = NULL; + xvid_enc_create.num_plugins++; + } +#endif - fprintf(stderr,"Frame %5d: intra %d, enctime =%6.1f ms length=%7d bytes\n", - filenr, frame_type[filenr], enctime*1000, m4v_size); + /* No fancy thread tests */ + xvid_enc_create.num_threads = 0; - if (save_m4v_flag) - { - fwrite(divx_buffer, m4v_size, 1, stdout); + /* Frame rate - Do some quick float fps = fincr/fbase hack */ + if ((ARG_FRAMERATE - (int) ARG_FRAMERATE) < SMALL_EPS) { + xvid_enc_create.fincr = 1; + xvid_enc_create.fbase = (int) ARG_FRAMERATE; + } else { + xvid_enc_create.fincr = FRAMERATE_INCR; + xvid_enc_create.fbase = (int) (FRAMERATE_INCR * ARG_FRAMERATE); } - - if (pgmflag) - status = read_pgmheader(stdin); - // because if this was the last PGM, stop now - filenr++; + /* Maximum key frame interval */ + if (ARG_MAXKEYINTERVAL > 0) { + xvid_enc_create.max_key_interval = ARG_MAXKEYINTERVAL; + }else { + xvid_enc_create.max_key_interval = (int) ARG_FRAMERATE *10; + } - } while ( (!status) && (filenr