--- trunk/xvidcore/examples/xvid_encraw.c 2003/02/15 15:22:19 851 +++ trunk/xvidcore/examples/xvid_encraw.c 2008/11/27 19:45:28 1811 @@ -3,7 +3,9 @@ * XVID MPEG-4 VIDEO CODEC * - Console based test application - * - * Copyright(C) 2002-2003 Christoph Lampert + * Copyright(C) 2002-2003 Christoph Lampert + * 2002-2003 Edouard Gomez + * 2003 Peter Ross * * This program is free software; you can redistribute it and/or modify * it under the terms of the GNU General Public License as published by @@ -19,109 +21,248 @@ * along with this program; if not, write to the Free Software * Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA 02111-1307 USA * - * $Id: xvid_encraw.c,v 1.10 2003-02-15 15:22:17 edgomez Exp $ + * $Id: xvid_encraw.c,v 1.36 2008-11-27 19:45:28 Isibaar Exp $ * ****************************************************************************/ /***************************************************************************** * Application notes : * - * A sequence of YUV pics in PGM file format is encoded and decoded - * The speed is measured and PSNR of decoded picture is calculated. + * A sequence of raw YUV I420 pics or YUV I420 PGM file format is encoded + * The speed is measured and frames' PSNR are taken from core. * * The program is plain C and needs no libraries except for libxvidcore, * and maths-lib. + * + * Use ./xvid_encraw -help for a list of options * ************************************************************************/ #include +//#include #include #include #include #ifndef WIN32 #include #else +#include +#include #include +#define XVID_AVI_INPUT +#define XVID_AVI_OUTPUT #endif #include "xvid.h" +#ifdef XVID_MKV_OUTPUT +#include "matroska.cpp" +#endif + +#undef READ_PNM + /***************************************************************************** * Quality presets ****************************************************************************/ -static int const motion_presets[7] = { - 0, /* Q 0 */ - PMV_EARLYSTOP16, /* Q 1 */ - PMV_EARLYSTOP16, /* Q 2 */ - PMV_EARLYSTOP16 | PMV_HALFPELREFINE16, /* Q 3 */ - PMV_EARLYSTOP16 | PMV_HALFPELREFINE16, /* Q 4 */ - PMV_EARLYSTOP16 | PMV_HALFPELREFINE16 | PMV_EARLYSTOP8 | /* Q 5 */ - PMV_HALFPELREFINE8, - PMV_EARLYSTOP16 | PMV_HALFPELREFINE16 | PMV_EXTSEARCH16 | /* Q 6 */ - PMV_USESQUARES16 | PMV_EARLYSTOP8 | PMV_HALFPELREFINE8 +// Equivalent to vfw's pmvfast_presets +static const int motion_presets[] = { + /* quality 0 */ + 0, + + /* quality 1 */ + 0, + + /* quality 2 */ + 0, + + /* quality 3 */ + 0, + + /* quality 4 */ + 0 | XVID_ME_HALFPELREFINE16 | 0, + + /* quality 5 */ + 0 | XVID_ME_HALFPELREFINE16 | 0 | XVID_ME_ADVANCEDDIAMOND16, + + /* quality 6 */ + XVID_ME_HALFPELREFINE16 | XVID_ME_EXTSEARCH16 | XVID_ME_HALFPELREFINE8 | 0 | XVID_ME_USESQUARES16 + }; +#define ME_ELEMENTS (sizeof(motion_presets)/sizeof(motion_presets[0])) + +static const int vop_presets[] = { + /* quality 0 */ + 0, + + /* quality 1 */ + 0, + + /* quality 2 */ + 0, + + /* quality 3 */ + 0, + + /* quality 4 */ + 0, + + /* quality 5 */ + XVID_VOP_INTER4V, + + /* quality 6 */ + XVID_VOP_INTER4V, -static int const general_presets[7] = { - XVID_H263QUANT, /* Q 0 */ - XVID_MPEGQUANT, /* Q 1 */ - XVID_H263QUANT, /* Q 2 */ - XVID_H263QUANT | XVID_HALFPEL, /* Q 3 */ - XVID_H263QUANT | XVID_HALFPEL | XVID_INTER4V, /* Q 4 */ - XVID_H263QUANT | XVID_HALFPEL | XVID_INTER4V, /* Q 5 */ - XVID_H263QUANT | XVID_HALFPEL | XVID_INTER4V /* Q 6 */ }; - +#define VOP_ELEMENTS (sizeof(vop_presets)/sizeof(vop_presets[0])) /***************************************************************************** * Command line global variables ****************************************************************************/ +#define MAX_ZONES 64 + +#define DEFAULT_QUANT 400 + +typedef struct +{ + int frame; + + int type; + int mode; + int modifier; + + unsigned int greyscale; + unsigned int chroma_opt; + unsigned int bvop_threshold; + unsigned int cartoon_mode; +} zone_t; + +typedef struct +{ + int count; + int size; + int quants[32]; +} frame_stats_t; + /* Maximum number of frames to encode */ -#define ABS_MAXFRAMENR 9999 +#define ABS_MAXFRAMENR -1 /* no limit */ -/* HINTMODEs */ -#define HINT_MODE_NONE 0 -#define HINT_MODE_GET 1 -#define HINT_MODE_SET 2 -#define HINT_FILE "hints.mv" - -static int ARG_BITRATE = 900; -static int ARG_QUANTI = 0; -static int ARG_QUALITY = 6; -static int ARG_MINQUANT = 1; -static int ARG_MAXQUANT = 31; -static float ARG_FRAMERATE = 25.00f; -static int ARG_MAXFRAMENR = ABS_MAXFRAMENR; -static char *ARG_INPUTFILE = NULL; -static int ARG_INPUTTYPE = 0; -static int ARG_SAVEMPEGSTREAM = 0; -static char *ARG_OUTPUTFILE = NULL; -static int ARG_HINTMODE = HINT_MODE_NONE; -static int XDIM = 0; -static int YDIM = 0; -static int ARG_BQRATIO = 120; -static int ARG_BQOFFSET = 0; -static int ARG_MAXBFRAMES = 0; +#ifndef READ_PNM #define IMAGE_SIZE(x,y) ((x)*(y)*3/2) +#else +#define IMAGE_SIZE(x,y) ((x)*(y)*3) +#endif #define MAX(A,B) ( ((A)>(B)) ? (A) : (B) ) -#define SMALL_EPS 1e-10 +#define SMALL_EPS (1e-10) #define SWAP(a) ( (((a)&0x000000ff)<<24) | (((a)&0x0000ff00)<<8) | \ (((a)&0x00ff0000)>>8) | (((a)&0xff000000)>>24) ) +static zone_t ZONES[MAX_ZONES]; +static int NUM_ZONES = 0; +static frame_stats_t framestats[7]; + +static int ARG_STATS = 0; +static int ARG_SSIM = -1; +static char* ARG_SSIM_PATH = NULL; +static int ARG_DUMP = 0; +static int ARG_LUMIMASKING = 0; +static int ARG_BITRATE = 0; +static int ARG_TARGETSIZE = 0; +static int ARG_SINGLE = 1; +static char *ARG_PASS1 = 0; +static char *ARG_PASS2 = 0; +//static int ARG_QUALITY = ME_ELEMENTS - 1; +static int ARG_QUALITY = 6; +static float ARG_FRAMERATE = 25.00f; +static int ARG_DWRATE = 25; +static int ARG_DWSCALE = 1; +static int ARG_MAXFRAMENR = ABS_MAXFRAMENR; +static int ARG_MAXKEYINTERVAL = 300; +static int ARG_STARTFRAMENR = 0; +static char *ARG_INPUTFILE = NULL; +static int ARG_INPUTTYPE = 0; +static int ARG_SAVEMPEGSTREAM = 0; +static int ARG_SAVEINDIVIDUAL = 0; +static char *ARG_OUTPUTFILE = NULL; +#ifdef XVID_AVI_OUTPUT +static char *ARG_AVIOUTPUTFILE = NULL; +#endif +#ifdef XVID_MKV_OUTPUT +static char *ARG_MKVOUTPUTFILE = NULL; +#endif +#ifdef XVID_AVI_INPUT +static PAVISTREAM avi_stream = NULL; +static PAVIFILE avi_file = NULL; +static LPBITMAPINFOHEADER info_header = NULL; +static PGETFRAME get_frame = NULL; +#else +#define get_frame NULL +#endif +static char *ARG_TIMECODEFILE = NULL; +static int XDIM = 0; +static int YDIM = 0; +static int ARG_BQRATIO = 150; +static int ARG_BQOFFSET = 100; +static int ARG_MAXBFRAMES = 2; +static int ARG_PACKED = 1; +static int ARG_DEBUG = 0; +static int ARG_VOPDEBUG = 0; +static int ARG_TRELLIS = 1; +static int ARG_QTYPE = 0; +static int ARG_QMATRIX = 0; +static int ARG_GMC = 0; +static int ARG_INTERLACING = 0; +static int ARG_QPEL = 0; +static int ARG_TURBO = 0; +static int ARG_VHQMODE = 1; +static int ARG_BVHQ = 0; +static int ARG_CLOSED_GOP = 1; +static int ARG_CHROMAME = 1; +static int ARG_PAR = 1; +static int ARG_PARHEIGHT; +static int ARG_PARWIDTH; +static int ARG_QUANTS[6] = {2, 31, 2, 31, 2, 31}; +static int ARG_FRAMEDROP = 0; +static double ARG_CQ = 0; +static int ARG_FULL1PASS = 0; +static int ARG_REACTION = 16; +static int ARG_AVERAGING = 100; +static int ARG_SMOOTHER = 100; +static int ARG_KBOOST = 10; +static int ARG_KREDUCTION = 20; +static int ARG_KTHRESH = 1; +static int ARG_CHIGH = 0; +static int ARG_CLOW = 0; +static int ARG_OVERSTRENGTH = 5; +static int ARG_OVERIMPROVE = 5; +static int ARG_OVERDEGRADE = 5; +static int ARG_OVERHEAD = 0; +static int ARG_VBVSIZE = 0; +static int ARG_VBVMAXRATE = 0; +static int ARG_VBVPEAKRATE = 0; +static int ARG_THREADS = 0; +static int ARG_VFR = 0; +static int ARG_PROGRESS = 0; +static int ARG_COLORSPACE = XVID_CSP_YV12; + /* the path where to save output */ +static char filepath[256] = "./"; + /* Internal structures (handles) for encoding and decoding */ +static void *enc_handle = NULL; +static unsigned char qmatrix_intra[64]; +static unsigned char qmatrix_inter[64]; + /**************************************************************************** * Nasty global vars ;-) ***************************************************************************/ -static int i,filenr = 0; +static const int height_ratios[] = {1, 1, 11, 11, 11, 33}; +static const int width_ratios[] = {1, 1, 12, 10, 16, 40}; -/* the path where to save output */ -static char filepath[256] = "./"; +const char userdata_start_code[] = "\0\0\x01\xb2"; -/* Internal structures (handles) for encoding and decoding */ -static void *enc_handle = NULL; /***************************************************************************** * Local prototypes @@ -132,230 +273,745 @@ /* Statistical functions */ static double msecond(); +int gcd(int a, int b); +int minquant(int quants[32]); +int maxquant(int quants[32]); +double avgquant(frame_stats_t frame); /* PGM related functions */ -static int read_pgmheader(FILE* handle); -static int read_pgmdata(FILE* handle, unsigned char *image); -static int read_yuvdata(FILE* handle, unsigned char *image); +#ifndef READ_PNM +static int read_pgmheader(FILE * handle); +static int read_pgmdata(FILE * handle, + unsigned char *image); +#else +static int read_pnmheader(FILE * handle); +static int read_pnmdata(FILE * handle, + unsigned char *image); +#endif +static int read_yuvdata(FILE * handle, + unsigned char *image); /* Encoder related functions */ static int enc_init(int use_assembler); +static int enc_info(); static int enc_stop(); -static int enc_main(unsigned char* image, unsigned char* bitstream, - unsigned char *hints_buffer, - long *streamlength, long* frametype, long *hints_size); +static int enc_main(unsigned char *image, + unsigned char *bitstream, + int *key, + int *stats_type, + int *stats_quant, + int *stats_length, + int stats[3], + int framenum); + +/* Zone Related Functions */ +static void apply_zone_modifiers(xvid_enc_frame_t * frame, int framenum); +static void prepare_full1pass_zones(); +static void prepare_cquant_zones(); +void sort_zones(zone_t * zones, int zone_num, int * sel); + + +void removedivxp(char *buf, int size); /***************************************************************************** * Main function ****************************************************************************/ -int main(int argc, char *argv[]) +int +main(int argc, + char *argv[]) { unsigned char *mp4_buffer = NULL; unsigned char *in_buffer = NULL; unsigned char *out_buffer = NULL; - unsigned char *hints_buffer = NULL; double enctime; - double totalenctime=0.; - - long totalsize; - long hints_size; - int status; - long frame_type; - long bigendian; - - long m4v_size; - int use_assembler=0; - + double totalenctime = 0.; + float totalPSNR[3] = {0., 0., 0.}; + FILE *statsfile; + + int totalsize; + int result; + int m4v_size; + int key; + int stats_type; + int stats_quant; + int stats_length; + int use_assembler = 1; + int fakenvop = 0; + int i; + int nvop_counter; + + int input_num; + int output_num; + char filename[256]; - + FILE *in_file = stdin; FILE *out_file = NULL; - FILE *hints_file = NULL; + FILE *time_file = NULL; + +#ifdef XVID_AVI_OUTPUT + int avierr; + PAVIFILE myAVIFile=NULL; + PAVISTREAM myAVIStream=NULL; + AVISTREAMINFO myAVIStreamInfo; + BITMAPINFOHEADER myBitmapInfoHeader; + AVIFileInit(); +#endif +#ifdef XVID_MKV_OUTPUT + PMKVFILE myMKVFile=NULL; + PMKVSTREAM myMKVStream=NULL; + MKVSTREAMINFO myMKVStreamInfo; +#endif printf("xvid_encraw - raw mpeg4 bitstream encoder "); printf("written by Christoph Lampert 2002-2003\n\n"); + /* Is there a dumb XviD coder ? */ + if(ME_ELEMENTS != VOP_ELEMENTS) { + fprintf(stderr, "Presets' arrays should have the same number of elements -- Please fill a bug to xvid-devel@xvid.org\n"); + return(-1); + } + /***************************************************************************** * Command line parsing ****************************************************************************/ - for (i=1; i< argc; i++) { - - if (strcmp("-asm", argv[i]) == 0 ) { + for (i = 1; i < argc; i++) { + + if (strcmp("-asm", argv[i]) == 0) { use_assembler = 1; - } - else if (strcmp("-w", argv[i]) == 0 && i < argc - 1 ) { + } else if (strcmp("-noasm", argv[i]) == 0) { + use_assembler = 0; + } else if (strcmp("-w", argv[i]) == 0 && i < argc - 1) { i++; XDIM = atoi(argv[i]); - } - else if (strcmp("-h", argv[i]) == 0 && i < argc - 1 ) { + } else if (strcmp("-h", argv[i]) == 0 && i < argc - 1) { i++; YDIM = atoi(argv[i]); - } - else if (strcmp("-b", argv[i]) == 0 && i < argc - 1 ) { + } else if (strcmp("-csp",argv[i]) == 0 && i < argc - 1) { i++; - ARG_BITRATE = atoi(argv[i]); - } - else if (strcmp("-bn", argv[i]) == 0 && i < argc - 1 ) { + if (strcmp(argv[i],"i420") == 0){ + ARG_COLORSPACE = XVID_CSP_I420; + } else if(strcmp(argv[i],"yv12") == 0){ + ARG_COLORSPACE = XVID_CSP_YV12; + } else { + printf("Invalid colorspace\n"); + return 0; + } + } else if (strcmp("-bitrate", argv[i]) == 0) { + if (i < argc - 1) + ARG_BITRATE = atoi(argv[i+1]); + if (ARG_BITRATE) { + i++; + if (ARG_BITRATE <= 10000) + /* if given parameter is <= 10000, assume it means kbps */ + ARG_BITRATE *= 1000; + } + else + ARG_BITRATE = 700000; + } else if (strcmp("-size", argv[i]) == 0 && i < argc - 1) { + i++; + ARG_TARGETSIZE = atoi(argv[i]); + } else if (strcmp("-cq", argv[i]) == 0 && i < argc - 1) { + i++; + ARG_CQ = atof(argv[i])*100; + } else if (strcmp("-single", argv[i]) == 0) { + ARG_SINGLE = 1; + ARG_PASS1 = NULL; + ARG_PASS2 = NULL; + } else if (strcmp("-pass1", argv[i]) == 0) { + ARG_SINGLE = 0; + if ((i < argc - 1) && (*argv[i+1] != '-')) { + i++; + ARG_PASS1 = argv[i]; + } else { + ARG_PASS1 = "xvid.stats"; + } + } else if (strcmp("-full1pass", argv[i]) == 0) { + ARG_FULL1PASS = 1; + } else if (strcmp("-pass2", argv[i]) == 0) { + ARG_SINGLE = 0; + if ((i < argc - 1) && (*argv[i+1] != '-')) { + i++; + ARG_PASS2 = argv[i]; + } else { + ARG_PASS2 = "xvid.stats"; + } + } else if (strcmp("-max_bframes", argv[i]) == 0 && i < argc - 1) { i++; ARG_MAXBFRAMES = atoi(argv[i]); - } - else if (strcmp("-bqr", argv[i]) == 0 && i < argc - 1 ) { + } else if (strcmp("-par", argv[i]) == 0 && i < argc - 1) { + i++; + if (sscanf(argv[i], "%d:%d", &(ARG_PARWIDTH), &(ARG_PARHEIGHT))!=2) + ARG_PAR = atoi(argv[i]); + else { + int div; + ARG_PAR = 0; + div = gcd(ARG_PARWIDTH, ARG_PARHEIGHT); + ARG_PARWIDTH /= div; + ARG_PARHEIGHT /= div; + } + } else if (strcmp("-nopacked", argv[i]) == 0) { + ARG_PACKED = 0; + } else if (strcmp("-packed", argv[i]) == 0) { + ARG_PACKED = 2; + } else if (strcmp("-nochromame", argv[i]) == 0) { + ARG_CHROMAME = 0; + } else if (strcmp("-threads", argv[i]) == 0 && i < argc -1) { + i++; + ARG_THREADS = atoi(argv[i]); + } else if (strcmp("-bquant_ratio", argv[i]) == 0 && i < argc - 1) { i++; ARG_BQRATIO = atoi(argv[i]); - } - else if (strcmp("-bqo", argv[i]) == 0 && i < argc - 1 ) { + } else if (strcmp("-bquant_offset", argv[i]) == 0 && i < argc - 1) { i++; ARG_BQOFFSET = atoi(argv[i]); - } - else if (strcmp("-q", argv[i]) == 0 && i < argc - 1 ) { + + } else if (strcmp("-zones", argv[i]) == 0 && i < argc -1) { + char c; + char *frameoptions, *rem; + int startframe; + char options[40]; + + i++; + + do { + rem = strrchr(argv[i], '/'); + if (rem==NULL) + rem=argv[i]; + else { + *rem = '\0'; + rem++; + } + if (sscanf(rem, "%d,%c,%s", &startframe, &c, options)<3) { + fprintf(stderr, "Zone error, bad parameters %s\n", rem); + continue; + } + if (NUM_ZONES >= MAX_ZONES) { + fprintf(stderr, "warning: too many zones; zone ignored\n"); + continue; + } + memset(&ZONES[NUM_ZONES], 0, sizeof(zone_t)); + + ZONES[NUM_ZONES].frame = startframe; + ZONES[NUM_ZONES].modifier = atof(options)*100; + if (toupper(c)=='Q') + ZONES[NUM_ZONES].mode = XVID_ZONE_QUANT; + else if (toupper(c)=='W') + ZONES[NUM_ZONES].mode = XVID_ZONE_WEIGHT; + else { + fprintf(stderr, "Bad zone type %c\n", c); + continue; + } + + if ((frameoptions=strchr(options, ','))!=NULL) { + int readchar=0, count; + frameoptions++; + while (readchar= MAX_ZONES) { + fprintf(stderr,"warning: too many zones; zone ignored\n"); + continue; + } + memset(&ZONES[NUM_ZONES], 0, sizeof(zone_t)); + if (strcmp("-zq", argv[i])== 0) { + ZONES[NUM_ZONES].mode = XVID_ZONE_QUANT; + } + else { + ZONES[NUM_ZONES].mode = XVID_ZONE_WEIGHT; + } + ZONES[NUM_ZONES].modifier = atof(argv[i+2])*100; + i++; + ZONES[NUM_ZONES].frame = atoi(argv[i]); + i++; + ZONES[NUM_ZONES].type = XVID_TYPE_AUTO; + ZONES[NUM_ZONES].greyscale = 0; + ZONES[NUM_ZONES].chroma_opt = 0; + ZONES[NUM_ZONES].bvop_threshold = 0; + ZONES[NUM_ZONES].cartoon_mode = 0; + + NUM_ZONES++; + } else if (strcmp("-quality", argv[i]) == 0 && i < argc - 1) { i++; ARG_QUALITY = atoi(argv[i]); - } - else if (strcmp("-f", argv[i]) == 0 && i < argc - 1 ) { + } else if (strcmp("-start", argv[i]) == 0 && i < argc - 1) { i++; - ARG_FRAMERATE = (float)atof(argv[i]); - } - else if (strcmp("-i", argv[i]) == 0 && i < argc - 1 ) { + ARG_STARTFRAMENR = atoi(argv[i]); + } else if (strcmp("-vhqmode", argv[i]) == 0 && i < argc - 1) { + i++; + ARG_VHQMODE = atoi(argv[i]); + } else if (strcmp("-framerate", argv[i]) == 0 && i < argc - 1) { + int exponent; + i++; + ARG_FRAMERATE = (float) atof(argv[i]); + exponent = strcspn(argv[i], "."); + if (exponent 0) + i++; + else + ARG_PROGRESS = 10; + } else if (strcmp("-help", argv[i])) { usage(); - return(0); - } - else { + return (0); + } else { usage(); exit(-1); } - + } - + /***************************************************************************** * Arguments checking ****************************************************************************/ - if (XDIM <= 0 || XDIM >= 2048 || YDIM <=0 || YDIM >= 2048 ) { - fprintf(stderr, "Trying to retreive width and height from PGM header\n"); - ARG_INPUTTYPE = 1; /* pgm */ + if (XDIM <= 0 || XDIM >= 4096 || YDIM <= 0 || YDIM >= 4096) { + fprintf(stderr, + "Trying to retrieve width and height from input header\n"); + if (!ARG_INPUTTYPE) + ARG_INPUTTYPE = 1; /* pgm */ } - - if ( ARG_QUALITY < 0 || ARG_QUALITY > 6) { - fprintf(stderr,"Wrong Quality\n"); - return -1; + + if (ARG_QUALITY < 0 ) { + ARG_QUALITY = 0; + } else if (ARG_QUALITY >= ME_ELEMENTS) { + ARG_QUALITY = ME_ELEMENTS - 1; } - if ( ARG_BITRATE <= 0 && ARG_QUANTI == 0) { - fprintf(stderr,"Wrong Bitrate\n"); - return -1; + if (ARG_STARTFRAMENR < 0) { + fprintf(stderr, "Bad starting frame number %d, cannot be negative\n", ARG_STARTFRAMENR); + return(-1); } - if ( ARG_FRAMERATE <= 0) { - fprintf(stderr,"Wrong Framerate %s \n",argv[5]); - return -1; + if (ARG_PASS2) { + if (ARG_PASS2 == ARG_PASS1) { + fprintf(stderr, "Can't use the same statsfile for pass1 and pass2: %s\n", ARG_PASS2); + return(-1); + } + statsfile = fopen(ARG_PASS2, "rb"); + if (statsfile == NULL) { + fprintf(stderr, "Couldn't open statsfile '%s'!\n", ARG_PASS2); + return (-1); + } + fclose(statsfile); } - if ( ARG_MAXFRAMENR <= 0) { - fprintf(stderr,"Wrong number of frames\n"); - return -1; +#ifdef XVID_AVI_OUTPUT + if (ARG_AVIOUTPUTFILE == NULL && ARG_PACKED <= 1) + ARG_PACKED = 0; +#endif + + if (ARG_BITRATE < 0) { + fprintf(stderr, "Bad bitrate %d, cannot be negative\n", ARG_BITRATE); + return(-1); } - if ( ARG_HINTMODE != HINT_MODE_NONE && - ARG_HINTMODE != HINT_MODE_GET && - ARG_HINTMODE != HINT_MODE_SET) - ARG_HINTMODE = HINT_MODE_NONE; + if (NUM_ZONES) { + int i; + sort_zones(ZONES, NUM_ZONES, &i); + } - if( ARG_HINTMODE != HINT_MODE_NONE) { - char *rights = "rb"; + if (ARG_PAR > 5) { + fprintf(stderr, "Bad PAR: %d. Must be [1..5] or width:height\n", ARG_PAR); + return(-1); + } - /* - * If we are getting hints from core, we will have to write them to - * hint file - */ - if(ARG_HINTMODE == HINT_MODE_GET) - rights = "w+b"; + if (ARG_MAXFRAMENR == 0) { + fprintf(stderr, "Wrong number of frames\n"); + return (-1); + } - /* Open the hint file */ - hints_file = fopen(HINT_FILE, rights); - if(hints_file == NULL) { - fprintf(stderr, "Error opening input file %s\n", HINT_FILE); - return -1; + if (ARG_INPUTFILE == NULL || strcmp(ARG_INPUTFILE, "stdin") == 0) { + in_file = stdin; + } else { +#ifdef XVID_AVI_INPUT + if (strcmp(ARG_INPUTFILE+(strlen(ARG_INPUTFILE)-3), "avs")==0 || + strcmp(ARG_INPUTFILE+(strlen(ARG_INPUTFILE)-3), "avi")==0 || + ARG_INPUTTYPE==2) + { + AVISTREAMINFO avi_info; +#ifndef XVID_AVI_OUTPUT + AVIFileInit(); +#endif + FILE *avi_fp = fopen(ARG_INPUTFILE, "rb"); + if (avi_fp == NULL) { + fprintf(stderr, "Couldn't open file '%s'!\n", ARG_INPUTFILE); + return (-1); + } + fclose(avi_fp); + + if (AVIFileOpen(&avi_file, ARG_INPUTFILE, OF_READ, NULL) != AVIERR_OK) { + fprintf(stderr, "Can't open avi/avs file %s\n", ARG_INPUTFILE); + AVIFileExit(); + return(-1); + } + + if (AVIFileGetStream(avi_file, &avi_stream, streamtypeVIDEO, 0) != AVIERR_OK) { + fprintf(stderr, "Can't open stream from file '%s'!\n", ARG_INPUTFILE); + AVIFileRelease(avi_file); + AVIFileExit(); + return (-1); + } + + AVIFileRelease(avi_file); + + if(AVIStreamInfo(avi_stream, &avi_info, sizeof(AVISTREAMINFO)) != AVIERR_OK) { + fprintf(stderr, "Can't get stream info from file '%s'!\n", ARG_INPUTFILE); + AVIStreamRelease(avi_stream); + AVIFileExit(); + return (-1); + } + + if (avi_info.fccHandler != MAKEFOURCC('Y', 'V', '1', '2')) { + LONG size; + fprintf(stderr, "Non YV12 input colorspace %c%c%c%c! Attempting conversion...\n", + avi_info.fccHandler%256, (avi_info.fccHandler>>8)%256, (avi_info.fccHandler>>16)%256, + (avi_info.fccHandler>>24)%256); + size = sizeof(myBitmapInfoHeader); + AVIStreamReadFormat(avi_stream, 0, &myBitmapInfoHeader, &size); + if (size==0) + fprintf(stderr, "AVIStreamReadFormat read 0 bytes.\n"); + else { + fprintf(stderr, "AVIStreamReadFormat read %d bytes.\n", size); + fprintf(stderr, "width = %d, height = %d, planes = %d\n", myBitmapInfoHeader.biWidth, + myBitmapInfoHeader.biHeight, myBitmapInfoHeader.biPlanes); + fprintf(stderr, "Compression = %c%c%c%c, %d\n", + myBitmapInfoHeader.biCompression%256, (myBitmapInfoHeader.biCompression>>8)%256, + (myBitmapInfoHeader.biCompression>>16)%256, (myBitmapInfoHeader.biCompression>>24)%256, + myBitmapInfoHeader.biCompression); + fprintf(stderr, "Bits Per Pixel = %d\n", myBitmapInfoHeader.biBitCount); + myBitmapInfoHeader.biCompression = MAKEFOURCC('Y', 'V', '1', '2'); + myBitmapInfoHeader.biBitCount = 12; + myBitmapInfoHeader.biSizeImage = (myBitmapInfoHeader.biWidth*myBitmapInfoHeader.biHeight)*3/2; + get_frame = AVIStreamGetFrameOpen(avi_stream, &myBitmapInfoHeader); + } + if (get_frame == NULL) { + AVIStreamRelease(avi_stream); + AVIFileExit(); + return (-1); + } + else { + unsigned char *temp; + fprintf(stderr, "AVIStreamGetFrameOpen successful.\n"); + temp = (unsigned char*)AVIStreamGetFrame(get_frame, 0); + if (temp != NULL) { + int i; + for (i = 0; i < ((DWORD*)temp)[0]; i++) { + fprintf(stderr, "%2d ", temp[i]); + } + fprintf(stderr, "\n"); + } + } + if (avi_info.fccHandler == MAKEFOURCC('D', 'I', 'B', ' ')) { + AVIStreamGetFrameClose(get_frame); + get_frame = NULL; + ARG_COLORSPACE = XVID_CSP_BGR | XVID_CSP_VFLIP; + } + } + + if (ARG_MAXFRAMENR<0) + ARG_MAXFRAMENR = avi_info.dwLength-ARG_STARTFRAMENR; + else + ARG_MAXFRAMENR = min(ARG_MAXFRAMENR, avi_info.dwLength-ARG_STARTFRAMENR); + + XDIM = avi_info.rcFrame.right - avi_info.rcFrame.left; + YDIM = avi_info.rcFrame.bottom - avi_info.rcFrame.top; + if (ARG_FRAMERATE==0) { + ARG_FRAMERATE = (float) avi_info.dwRate / (float) avi_info.dwScale; + ARG_DWRATE = avi_info.dwRate; + ARG_DWSCALE = avi_info.dwScale; + } + + ARG_INPUTTYPE = 2; + } + else +#endif + { + in_file = fopen(ARG_INPUTFILE, "rb"); + if (in_file == NULL) { + fprintf(stderr, "Error opening input file %s\n", ARG_INPUTFILE); + return (-1); + } } + } - /* Allocate hint memory space, we will be using rawhints */ - /* NB : Hope 1Mb is enough */ - if((hints_buffer = malloc(1024*1024)) == NULL) { - fprintf(stderr, "Memory allocation error\n"); - return -1; + // This should be after the avi input opening stuff + if (ARG_TIMECODEFILE != NULL) { + time_file = fopen(ARG_TIMECODEFILE, "r"); + if (time_file==NULL) { + fprintf(stderr, "Couldn't open timecode file '%s'!\n", ARG_TIMECODEFILE); + return(-1); + } + else { + fscanf(time_file, "# timecode format v2\n"); } - } - if ( ARG_INPUTFILE == NULL || strcmp(ARG_INPUTFILE, "stdin") == 0) { - in_file = stdin; + if (ARG_FRAMERATE <= 0) { + fprintf(stderr, "Wrong Framerate %f\n", ARG_FRAMERATE); + return (-1); } - else { - in_file = fopen(ARG_INPUTFILE, "rb"); - if (in_file == NULL) { - fprintf(stderr, "Error opening input file %s\n", ARG_INPUTFILE); - return -1; - } + if (ARG_TARGETSIZE) { + if (ARG_MAXFRAMENR <= 0) { + fprintf(stderr, "Bad target size; number of input frames unknown\n"); + goto release_all; + } else if (ARG_BITRATE) { + fprintf(stderr, "Parameter conflict: Do not specify both -bitrate and -size\n"); + goto release_all; + } else + ARG_BITRATE = ((ARG_TARGETSIZE * 8) / (ARG_MAXFRAMENR / ARG_FRAMERATE)) * 1024; } - if (ARG_INPUTTYPE) { + /* Set constant quant to default if no bitrate given for single pass */ + if (ARG_SINGLE && (!ARG_BITRATE) && (!ARG_CQ)) + ARG_CQ = DEFAULT_QUANT; + + if (ARG_INPUTTYPE==1) { +#ifndef READ_PNM if (read_pgmheader(in_file)) { - fprintf(stderr, "Wrong input format, I want YUV encapsulated in PGM\n"); - return -1; +#else + if (read_pnmheader(in_file)) { +#endif + fprintf(stderr, + "Wrong input format, I want YUV encapsulated in PGM\n"); + return (-1); } } + /* Jump to the starting frame */ + if (ARG_INPUTTYPE == 0) + fseek(in_file, ARG_STARTFRAMENR*IMAGE_SIZE(XDIM, YDIM), SEEK_SET); + /* now we know the sizes, so allocate memory */ - in_buffer = (unsigned char *) malloc(IMAGE_SIZE(XDIM,YDIM)); - if (!in_buffer) - goto free_all_memory; + if (get_frame == NULL) + { + in_buffer = (unsigned char *) malloc(4*XDIM*YDIM); + if (!in_buffer) + goto free_all_memory; + } /* this should really be enough memory ! */ - mp4_buffer = (unsigned char *) malloc(IMAGE_SIZE(XDIM,YDIM)*2); + mp4_buffer = (unsigned char *) malloc(IMAGE_SIZE(XDIM, YDIM) * 2); if (!mp4_buffer) - goto free_all_memory; + goto free_all_memory; /***************************************************************************** * XviD PART Start ****************************************************************************/ - status = enc_init(use_assembler); - if (status) - { - fprintf(stderr, "Encore INIT problem, return value %d\n", status); + result = enc_init(use_assembler); + if (result) { + fprintf(stderr, "Encore INIT problem, return value %d\n", result); goto release_all; } @@ -363,154 +1019,412 @@ * Main loop ****************************************************************************/ - if (ARG_SAVEMPEGSTREAM && ARG_OUTPUTFILE) { + if (ARG_SAVEMPEGSTREAM) { - if((out_file = fopen(ARG_OUTPUTFILE, "w+b")) == NULL) { - fprintf(stderr, "Error opening output file %s\n", ARG_OUTPUTFILE); - goto release_all; + if (ARG_OUTPUTFILE) { + if ((out_file = fopen(ARG_OUTPUTFILE, "w+b")) == NULL) { + fprintf(stderr, "Error opening output file %s\n", ARG_OUTPUTFILE); + goto release_all; + } } - } - else { +#ifdef XVID_AVI_OUTPUT + if (ARG_AVIOUTPUTFILE != NULL ) { + { + /* Open the .avi output then close it */ + /* Resets the file size to 0, which AVIFile doesn't seem to do */ + FILE *scrub; + if ((scrub = fopen(ARG_AVIOUTPUTFILE, "w+b")) == NULL) { + fprintf(stderr, "Error opening output file %s\n", ARG_AVIOUTPUTFILE); + goto release_all; + } + else + fclose(scrub); + } + memset(&myAVIStreamInfo, 0, sizeof(AVISTREAMINFO)); + myAVIStreamInfo.fccType = streamtypeVIDEO; + myAVIStreamInfo.fccHandler = MAKEFOURCC('x', 'v', 'i', 'd'); + myAVIStreamInfo.dwScale = ARG_DWSCALE; + myAVIStreamInfo.dwRate = ARG_DWRATE; + myAVIStreamInfo.dwLength = ARG_MAXFRAMENR; + myAVIStreamInfo.dwQuality = 10000; + SetRect(&myAVIStreamInfo.rcFrame, 0, 0, YDIM, XDIM); + + if (avierr=AVIFileOpen(&myAVIFile, ARG_AVIOUTPUTFILE, OF_CREATE|OF_WRITE, NULL)) { + fprintf(stderr, "AVIFileOpen failed opening output file %s, error code %d\n", ARG_AVIOUTPUTFILE, avierr); + goto release_all; + } + + if (avierr=AVIFileCreateStream(myAVIFile, &myAVIStream, &myAVIStreamInfo)) { + fprintf(stderr, "AVIFileCreateStream failed, error code %d\n", avierr); + goto release_all; + } + + memset(&myBitmapInfoHeader, 0, sizeof(BITMAPINFOHEADER)); + myBitmapInfoHeader.biHeight = YDIM; + myBitmapInfoHeader.biWidth = XDIM; + myBitmapInfoHeader.biPlanes = 1; + myBitmapInfoHeader.biSize = sizeof(BITMAPINFOHEADER); + myBitmapInfoHeader.biCompression = MAKEFOURCC('X', 'V', 'I', 'D'); + myBitmapInfoHeader.biBitCount = 12; + myBitmapInfoHeader.biSizeImage = 6*XDIM*YDIM; + if (avierr=AVIStreamSetFormat(myAVIStream, 0, &myBitmapInfoHeader, sizeof(BITMAPINFOHEADER))) { + fprintf(stderr, "AVIStreamSetFormat failed, error code %d\n", avierr); + goto release_all; + } + } +#endif +#ifdef XVID_MKV_OUTPUT + if (ARG_MKVOUTPUTFILE != NULL) { + { + /* Open the .mkv output then close it */ + /* Just to make sure we can write to it */ + FILE *scrub; + if ((scrub = fopen(ARG_MKVOUTPUTFILE, "w+b")) == NULL) { + fprintf(stderr, "Error opening output file %s\n", ARG_MKVOUTPUTFILE); + goto release_all; + } + else + fclose(scrub); + } + + MKVFileOpen(&myMKVFile, ARG_MKVOUTPUTFILE, OF_CREATE|OF_WRITE, NULL); + if (ARG_PAR) { + myMKVStreamInfo.display_height = YDIM*height_ratios[ARG_PAR]; + myMKVStreamInfo.display_width = XDIM*width_ratios[ARG_PAR]; + } + else { + myMKVStreamInfo.display_height = YDIM*ARG_PARHEIGHT; + myMKVStreamInfo.display_width = XDIM*ARG_PARWIDTH; + } + myMKVStreamInfo.height = YDIM; + myMKVStreamInfo.width = XDIM; + myMKVStreamInfo.framerate = ARG_DWRATE; + myMKVStreamInfo.framescale = ARG_DWSCALE; + myMKVStreamInfo.length = ARG_MAXFRAMENR; + MKVFileCreateStream(myMKVFile, &myMKVStream, &myMKVStreamInfo); + } +#endif + } else { out_file = NULL; } + /***************************************************************************** * Encoding loop ****************************************************************************/ totalsize = 0; + result = 0; + + input_num = 0; /* input frame counter */ + output_num = 0; /* output frame counter */ + + nvop_counter = 0; + do { - if (ARG_INPUTTYPE) - status = read_pgmdata(in_file, in_buffer); /* read PGM data (YUV-format) */ - else - status = read_yuvdata(in_file, in_buffer); /* read raw data (YUV-format) */ - - if (status) - { - /* Couldn't read image, most likely end-of-file */ - continue; - } + char *type; + int sse[3]; -/***************************************************************************** - * Read hints from file - ****************************************************************************/ + if (input_num >= ARG_MAXFRAMENR && ARG_MAXFRAMENR > 0) { + result = 1; + } - if(ARG_HINTMODE == HINT_MODE_SET) { - fread(&hints_size, 1, sizeof(long), hints_file); - hints_size = (!bigendian)?SWAP(hints_size):hints_size; - fread(hints_buffer, 1, hints_size, hints_file); + if (!result) { +#ifdef XVID_AVI_INPUT + if (ARG_INPUTTYPE==2) { + /* read avs/avi data (YUV-format) */ + if (get_frame != NULL) { + in_buffer = (unsigned char*)AVIStreamGetFrame(get_frame, input_num+ARG_STARTFRAMENR); + if (in_buffer == NULL) + result = 1; + else + in_buffer += ((DWORD*)in_buffer)[0]; + } else { + if(AVIStreamRead(avi_stream, input_num+ARG_STARTFRAMENR, 1, in_buffer, 4*XDIM*YDIM, NULL, NULL ) != AVIERR_OK) + result = 1; + } + } else +#endif + if (ARG_INPUTTYPE==1) { + /* read PGM data (YUV-format) */ +#ifndef READ_PNM + result = read_pgmdata(in_file, in_buffer); +#else + result = read_pnmdata(in_file, in_buffer); +#endif + } else { + /* read raw data (YUV-format) */ + result = read_yuvdata(in_file, in_buffer); + } } /***************************************************************************** * Encode and decode this frame ****************************************************************************/ + if (input_num >= (unsigned int)ARG_MAXFRAMENR-1 && ARG_MAXBFRAMES) { + stats_type = XVID_TYPE_PVOP; + } + else + stats_type = XVID_TYPE_AUTO; + enctime = msecond(); - status = enc_main(in_buffer, mp4_buffer, hints_buffer, - &m4v_size, &frame_type, &hints_size); + m4v_size = + enc_main(!result ? in_buffer : 0, mp4_buffer, &key, &stats_type, + &stats_quant, &stats_length, sse, input_num); enctime = msecond() - enctime; - /* if it's a not coded VOP (aka NVOP) then we write nothing */ - if(frame_type == 5) goto next_frame; + /* Write the Frame statistics */ - { - char *type[] = {"P", "I", "B", "S", "Packed", "N", "Unknown"}; + if (stats_type > 0) { /* !XVID_TYPE_NOTHING */ + switch (stats_type) { + case XVID_TYPE_IVOP: + type = "I"; + break; + case XVID_TYPE_PVOP: + type = "P"; + break; + case XVID_TYPE_BVOP: + type = "B"; + if (ARG_PACKED) + fakenvop = 1; + break; + case XVID_TYPE_SVOP: + type = "S"; + break; + default: + type = "U"; + break; + } - if(frame_type<0 || frame_type>5) frame_type = 6; + if (stats_length > 8) { + framestats[stats_type].count++; + framestats[stats_type].quants[stats_quant]++; + framestats[stats_type].size += stats_length; + } + else { + framestats[5].count++; + framestats[5].quants[stats_quant]++; + framestats[5].size += stats_length; + } - printf("Frame %5d: type = %s, enctime(ms) =%6.1f, length(bytes) =%7d\n", - (int)filenr, type[frame_type], (float)enctime, (int)m4v_size); +#define SSE2PSNR(sse, width, height) ((!(sse))?0.0f : 48.131f - 10*(float)log10((float)(sse)/((float)((width)*(height))))) + if (ARG_PROGRESS == 0) { + printf("%5d: key=%i, time= %6.0f, len= %7d", !result ? input_num : -1, + key, (float) enctime, (int) m4v_size); + printf(" | type=%s, quant= %2d, len= %7d", type, stats_quant, + stats_length); + + + if (ARG_STATS) { + printf(", psnr y = %2.2f, psnr u = %2.2f, psnr v = %2.2f", + SSE2PSNR(sse[0], XDIM, YDIM), SSE2PSNR(sse[1], XDIM / 2, YDIM / 2), + SSE2PSNR(sse[2], XDIM / 2, YDIM / 2)); + } + printf("\n"); + } else { + if (input_num % ARG_PROGRESS == 1) { + if (ARG_MAXFRAMENR > 0) { + fprintf(stderr, "\r%7d frames(%3d%%) encoded, %6.2f fps, Average Bitrate = %5.0fkbps", \ + input_num, input_num*100/ARG_MAXFRAMENR, input_num*1000/totalenctime, \ + (((totalsize/1000)*ARG_FRAMERATE)*8)/input_num); + } else { + fprintf(stderr, "\r%7d frames encoded, %6.2f fps, Average Bitrate = %5.0fkbps", \ + input_num, input_num*1000/totalenctime, \ + (((totalsize/1000)*ARG_FRAMERATE)*8)/input_num); + } + } + } + + if (ARG_STATS) { + totalPSNR[0] += SSE2PSNR(sse[0], XDIM, YDIM); + totalPSNR[1] += SSE2PSNR(sse[1], XDIM/2, YDIM/2); + totalPSNR[2] += SSE2PSNR(sse[2], XDIM/2, YDIM/2); + } +#undef SSE2PSNR } + if (m4v_size < 0) + break; + /* Update encoding time stats */ totalenctime += enctime; totalsize += m4v_size; /***************************************************************************** - * Save hints to file + * Save stream to file ****************************************************************************/ - if(ARG_HINTMODE == HINT_MODE_GET) { - hints_size = (!bigendian)?SWAP(hints_size):hints_size; - fwrite(&hints_size, 1, sizeof(long), hints_file); - hints_size = (!bigendian)?SWAP(hints_size):hints_size; - fwrite(hints_buffer, 1, hints_size, hints_file); - } + if (m4v_size > 0 && ARG_SAVEMPEGSTREAM) { + char timecode[50]; -/***************************************************************************** - * Save stream to file - ****************************************************************************/ + if (time_file != NULL) { + if (fscanf(time_file, "%s\n", timecode) != 1) { + fprintf(stderr, "Error reading timecode file, frame %d\n", output_num); + goto release_all; + } + } + else + sprintf(timecode, "%f", ((double)ARG_DWSCALE/ARG_DWRATE)*1000*output_num); - if (ARG_SAVEMPEGSTREAM) - { /* Save single files */ - if (out_file == NULL) { - sprintf(filename, "%sframe%05d.m4v", filepath, filenr); - out_file = fopen(filename, "wb"); - fwrite(mp4_buffer, m4v_size, 1, out_file); - fclose(out_file); - out_file = NULL; + if (ARG_SAVEINDIVIDUAL) { + FILE *out; + sprintf(filename, "%sframe%05d.m4v", filepath, output_num); + out = fopen(filename, "w+b"); + fwrite(mp4_buffer, m4v_size, 1, out); + fclose(out); } - else { +#ifdef XVID_AVI_OUTPUT + if (ARG_AVIOUTPUTFILE && myAVIStream) { + int output_frame; + + if (time_file == NULL) + output_frame = output_num; + else { + output_frame = (int)(atof(timecode)/1000/((double)ARG_DWSCALE/ARG_DWRATE)+.5); + } + if (AVIStreamWrite(myAVIStream, output_frame, 1, mp4_buffer, m4v_size, key ? AVIIF_KEYFRAME : 0, NULL, NULL)) { + fprintf(stderr, "AVIStreamWrite failed writing frame %d\n", output_num); + goto release_all; + } + } +#endif - /* Write mp4 data */ - fwrite(mp4_buffer, 1, m4v_size, out_file); + if (key && ARG_PACKED) + removedivxp((char*)mp4_buffer, m4v_size); - } + /* Save ES stream */ + if (ARG_OUTPUTFILE && out_file && !(fakenvop && m4v_size <= 8)) { + fwrite(mp4_buffer, 1, m4v_size, out_file); + } +#ifdef XVID_MKV_OUTPUT + if (ARG_MKVOUTPUTFILE && myMKVStream) { + MKVStreamWrite(myMKVStream, atof(timecode), 1, (ARG_PACKED && fakenvop && (m4v_size <= 8)) ? NULL : mp4_buffer, m4v_size, key ? AVIIF_KEYFRAME : 0, NULL, NULL); + } +#endif + + output_num++; + if (stats_type != XVID_TYPE_BVOP) + fakenvop=0; } - next_frame: - /* Read the header if it's pgm stream */ - if (ARG_INPUTTYPE) - status = read_pgmheader(in_file); + input_num++; + + /* Read the header if it's pgm stream */ + if (!result && (ARG_INPUTTYPE==1)) +#ifndef READ_PNM + result = read_pgmheader(in_file); +#else + result = read_pnmheader(in_file); +#endif + } while (1); - if(frame_type != 5) filenr++; - } while ( (!status) && (filenr 0) { + totalsize /= input_num; + totalenctime /= input_num; + totalPSNR[0] /= input_num; + totalPSNR[1] /= input_num; + totalPSNR[2] /= input_num; + } else { + totalsize = -1; + totalenctime = -1; + } + + printf("Avg: enctime(ms) =%7.2f, fps =%7.2f, length(bytes) = %7d", + totalenctime, 1000 / totalenctime, (int) totalsize); + if (ARG_STATS) { + printf(", psnr y = %2.2f, psnr u = %2.2f, psnr v = %2.2f", + totalPSNR[0],totalPSNR[1],totalPSNR[2]); + } + printf("\n"); + if (framestats[XVID_TYPE_IVOP].count) { + printf("I frames: %6d frames, size = %7d/%7d, quants = %2d / %.2f / %2d\n", \ + framestats[XVID_TYPE_IVOP].count, framestats[XVID_TYPE_IVOP].size/framestats[XVID_TYPE_IVOP].count, \ + framestats[XVID_TYPE_IVOP].size, minquant(framestats[XVID_TYPE_IVOP].quants), \ + avgquant(framestats[XVID_TYPE_IVOP]), maxquant(framestats[XVID_TYPE_IVOP].quants)); + } + if (framestats[XVID_TYPE_PVOP].count) { + printf("P frames: %6d frames, size = %7d/%7d, quants = %2d / %.2f / %2d\n", \ + framestats[XVID_TYPE_PVOP].count, framestats[XVID_TYPE_PVOP].size/framestats[XVID_TYPE_PVOP].count, \ + framestats[XVID_TYPE_PVOP].size, minquant(framestats[XVID_TYPE_PVOP].quants), \ + avgquant(framestats[XVID_TYPE_PVOP]), maxquant(framestats[XVID_TYPE_PVOP].quants)); + } + if (framestats[XVID_TYPE_BVOP].count) { + printf("B frames: %6d frames, size = %7d/%7d, quants = %2d / %.2f / %2d\n", \ + framestats[XVID_TYPE_BVOP].count, framestats[XVID_TYPE_BVOP].size/framestats[XVID_TYPE_BVOP].count, \ + framestats[XVID_TYPE_BVOP].size, minquant(framestats[XVID_TYPE_BVOP].quants), \ + avgquant(framestats[XVID_TYPE_BVOP]), maxquant(framestats[XVID_TYPE_BVOP].quants)); + } + if (framestats[XVID_TYPE_SVOP].count) { + printf("S frames: %6d frames, size = %7d/%7d, quants = %2d / %.2f / %2d\n", \ + framestats[XVID_TYPE_SVOP].count, framestats[XVID_TYPE_SVOP].size/framestats[XVID_TYPE_SVOP].count, \ + framestats[XVID_TYPE_SVOP].size, minquant(framestats[XVID_TYPE_SVOP].quants), \ + avgquant(framestats[XVID_TYPE_SVOP]), maxquant(framestats[XVID_TYPE_SVOP].quants)); + } + if (framestats[5].count) { + printf("N frames: %6d frames, size = %7d/%7d\n", \ + framestats[5].count, framestats[5].size/framestats[5].count, \ + framestats[5].size); + } - printf("Avg: enctime(ms) =%7.2f, fps =%7.2f, length(bytes) = %7d\n", - totalenctime, 1000/totalenctime, (int)totalsize); /***************************************************************************** * XviD PART Stop ****************************************************************************/ - release_all: + release_all: + +#ifdef XVID_AVI_INPUT + if (get_frame) AVIStreamGetFrameClose(get_frame); + if (avi_stream) AVIStreamRelease(avi_stream); +#ifndef XVID_AVI_OUTPUT + AVIFileExit(); +#endif +#endif - if (enc_handle) - { - status = enc_stop(); - if (status) - fprintf(stderr, "Encore RELEASE problem return value %d\n", status); + if (enc_handle) { + result = enc_stop(); + if (result) + fprintf(stderr, "Encore RELEASE problem return value %d\n", + result); } - if(in_file) + if (in_file) fclose(in_file); - if(out_file) + if (out_file) fclose(out_file); - if(hints_file) - fclose(hints_file); - free_all_memory: +#ifdef XVID_AVI_OUTPUT + if (myAVIStream) AVIStreamRelease(myAVIStream); + if (myAVIFile) AVIFileRelease(myAVIFile); + AVIFileExit(); +#endif +#ifdef XVID_MKV_OUTPUT + if (myMKVStream) MKVStreamRelease(myMKVStream); + if (myMKVFile) MKVFileRelease(myMKVFile); +#endif + + free_all_memory: free(out_buffer); free(mp4_buffer); free(in_buffer); - if(hints_buffer) free(hints_buffer); - return 0; + return (0); } @@ -524,51 +1438,177 @@ *****************************************************************************/ /* Return time elapsed time in miliseconds since the program started */ -static double msecond() -{ +static double +msecond() +{ #ifndef WIN32 - struct timeval tv; + struct timeval tv; + gettimeofday(&tv, 0); - return tv.tv_sec*1.0e3 + tv.tv_usec * 1.0e-3; + return (tv.tv_sec * 1.0e3 + tv.tv_usec * 1.0e-3); #else clock_t clk; + clk = clock(); - return clk * 1000 / CLOCKS_PER_SEC; + return (clk * 1000.0 / CLOCKS_PER_SEC); #endif } +int +gcd(int a, int b) +{ + int r ; + + if (b > a) { + r = a; + a = b; + b = r; + } + + while ((r = a % b)) { + a = b; + b = r; + } + return b; +} + +int minquant(int quants[32]) +{ + int i = 1; + while (quants[i] == 0) { + i++; + } + return i; +} + +int maxquant(int quants[32]) +{ + int i = 31; + while (quants[i] == 0) { + i--; + } + return i; +} + +double avgquant(frame_stats_t frame) +{ + double avg=0; + int i; + for (i=1; i < 32; i++) { + avg += frame.quants[i]*i; + } + avg /= frame.count; + return avg; +} + /***************************************************************************** * Usage message *****************************************************************************/ -static void usage() +static void +usage() { - - fprintf(stderr, "Usage : xvid_stat [OPTIONS]\n"); - fprintf(stderr, "Options :\n"); - fprintf(stderr, " -w integer : frame width ([1.2048])\n"); - fprintf(stderr, " -h integer : frame height ([1.2048])\n"); - fprintf(stderr, " -b integer : target bitrate (>0 | default=900kbit)\n"); - fprintf(stderr, " -b integer : target bitrate (>0 | default=900kbit)\n"); - fprintf(stderr, " -bn integer : max bframes (default=0)\n"); - fprintf(stderr, " -bqr integer : bframe quantizer ratio (default=150)\n"); - fprintf(stderr, " -bqo integer : bframe quantizer offset (default=100)\n"); - fprintf(stderr, " -f float : target framerate (>0)\n"); - fprintf(stderr, " -i string : input filename (default=stdin)\n"); - fprintf(stderr, " -t integer : input data type (yuv=0, pgm=1)\n"); - fprintf(stderr, " -n integer : number of frames to encode\n"); - fprintf(stderr, " -q integer : quality ([0..5])\n"); - fprintf(stderr, " -d boolean : save decoder output (0 False*, !=0 True)\n"); - fprintf(stderr, " -m boolean : save mpeg4 raw stream (0 False*, !=0 True)\n"); - fprintf(stderr, " -o string : output container filename (only usefull when -m 1 is used) :\n"); - fprintf(stderr, " When this option is not used : one file per encoded frame\n"); - fprintf(stderr, " When this option is used : save to 'string' (default=stream.m4v)\n"); - fprintf(stderr, " -mt integer : output type (m4v=0, mp4u=1)\n"); - fprintf(stderr, " -mv integer : Use motion vector hints (no hints=0, get hints=1, set hints=2)\n"); - fprintf(stderr, " -help : prints this help message\n"); - fprintf(stderr, " -quant integer : fixed quantizer (disables -b setting)\n"); - fprintf(stderr, " (* means default)\n"); - + fprintf(stderr, "xvid_encraw built at %s on %s\n", __TIME__, __DATE__); + fprintf(stderr, "Usage : xvid_encraw [OPTIONS]\n\n"); + fprintf(stderr, "Input options:\n"); + fprintf(stderr, " -i string : input filename (stdin)\n"); +#ifdef XVID_AVI_INPUT + fprintf(stderr, " -type integer: input data type (yuv=0, pgm=1, avi/avs=2)\n"); +#else + fprintf(stderr, " -type integer: input data type (yuv=0, pgm=1)\n"); +#endif + fprintf(stderr, " -w integer: frame width ([1.2048])\n"); + fprintf(stderr, " -h integer: frame height ([1.2048])\n"); + fprintf(stderr, " -csp string : colorspace of raw input file i420, yv12 (default)\n"); + fprintf(stderr, " -frames integer: number of frames to encode\n"); + fprintf(stderr, "\n"); + fprintf(stderr, "Output options:\n"); + fprintf(stderr, " -dump : save decoder output\n"); + fprintf(stderr, " -save : save an Elementary Stream file per frame\n"); + fprintf(stderr, " -o string : save an Elementary Stream for the complete sequence\n"); +#ifdef XVID_AVI_OUTPUT + fprintf(stderr, " -avi string: save an AVI file for the complete sequence\n"); +#endif + fprintf(stderr, " -mkv string: save a MKV file for the complete sequence\n"); + fprintf(stderr, "\n"); + fprintf(stderr, "BFrames options:\n"); + fprintf(stderr, " -max_bframes integer: max bframes (2)\n"); + fprintf(stderr, " -bquant_ratio integer: bframe quantizer ratio (150)\n"); + fprintf(stderr, " -bquant_offset integer: bframe quantizer offset (100)\n"); + fprintf(stderr, "\n"); + fprintf(stderr, "Rate control options:\n"); + fprintf(stderr, " -framerate float : target framerate (25.0)\n"); + fprintf(stderr, " -bitrate [integer] : target bitrate in kbps (700)\n"); + fprintf(stderr, " -size integer : target size in kilobytes\n"); + fprintf(stderr, " -single : single pass mode (default)\n"); + fprintf(stderr, " -cq float : single pass constant quantizer\n"); + fprintf(stderr, " -pass1 [filename] : twopass mode (first pass)\n"); + fprintf(stderr, " -full1pass : perform full first pass\n"); + fprintf(stderr, " -pass2 [filename] : twopass mode (2nd pass)\n"); + fprintf(stderr, " -zq starting_frame float : bitrate zone; quant\n"); + fprintf(stderr, " -zw starting_frame float : bitrate zone; weight\n"); + fprintf(stderr, " -max_key_interval integer : maximum keyframe interval (300)\n"); + fprintf(stderr, "\n"); + fprintf(stderr, "Single Pass options:\n"); + fprintf(stderr, "-reaction integer : reaction delay factor (16)\n"); + fprintf(stderr, "-averaging integer : averaging period (100)\n"); + fprintf(stderr, "-smoother integer : smoothing buffer (100)\n"); + fprintf(stderr, "\n"); + fprintf(stderr, "Second Pass options:\n"); + fprintf(stderr, "-kboost integer : I frame boost (10)\n"); + fprintf(stderr, "-kthresh integer : I frame reduction threshold (1)\n"); + fprintf(stderr, "-kreduction integer : I frame reduction amount (20)\n"); + fprintf(stderr, "-ostrength integer : overflow control strength (5)\n"); + fprintf(stderr, "-oimprove integer : max overflow improvement (5)\n"); + fprintf(stderr, "-odegrade integer : max overflow degradation (5)\n"); + fprintf(stderr, "-chigh integer : high bitrate scenes degradation (0)\n"); + fprintf(stderr, "-clow integer : low bitrate scenes improvement (0)\n"); + fprintf(stderr, "-overhead integer : container frame overhead (24)\n"); + fprintf(stderr, "-vbvsize integer : use vbv buffer size\n"); + fprintf(stderr, "-vbvmax integer : vbv max bitrate\n"); + fprintf(stderr, "-vbvpeak integer : vbv peak bitrate over 1 second\n"); + fprintf(stderr, "\n"); + fprintf(stderr, "Other options\n"); + fprintf(stderr, " -noasm : do not use assembly optmized code\n"); + fprintf(stderr, " -turbo : use turbo presets for higher encoding speed\n"); + fprintf(stderr, " -quality integer : quality ([0..%d]) (6)\n", ME_ELEMENTS - 1); + fprintf(stderr, " -vhqmode integer : level of R-D optimizations ([0..4]) (1)\n"); + fprintf(stderr, " -bvhq : use R-D optimizations for B-frames\n"); + fprintf(stderr, " -qpel : use quarter pixel ME\n"); + fprintf(stderr, " -gmc : use global motion compensation\n"); + fprintf(stderr, " -qtype integer : quantization type (H263:0, MPEG4:1) (0)\n"); + fprintf(stderr, " -qmatrix filename : use custom MPEG4 quantization matrix\n"); + fprintf(stderr, " -interlaced [integer] : interlaced encoding (BFF:1, TFF:2) (1)\n"); + fprintf(stderr, " -nopacked : Disable packed mode\n"); + fprintf(stderr, " -noclosed_gop : Disable closed GOP mode\n"); + fprintf(stderr, " -lumimasking : use lumimasking algorithm\n"); + fprintf(stderr, " -stats : print stats about encoded frames\n"); + fprintf(stderr, " -ssim [integer] : prints ssim for every frame (accurate: 0 fast: 4) (2)\n"); + fprintf(stderr, " -ssim_file filename : outputs the ssim stats into a file\n"); + fprintf(stderr, " -debug : activates xvidcore internal debugging output\n"); + fprintf(stderr, " -vop_debug : print some info directly into encoded frames\n"); + fprintf(stderr, " -nochromame : Disable chroma motion estimation\n"); + fprintf(stderr, " -notrellis : Disable trellis quantization\n"); + fprintf(stderr, " -imin integer : Minimum I Quantizer (1..31) (2)\n"); + fprintf(stderr, " -imax integer : Maximum I quantizer (1..31) (31)\n"); + fprintf(stderr, " -bmin integer : Minimum B Quantizer (1..31) (2)\n"); + fprintf(stderr, " -bmax integer : Maximum B quantizer (1..31) (31)\n"); + fprintf(stderr, " -pmin integer : Minimum P Quantizer (1..31) (2)\n"); + fprintf(stderr, " -pmax integer : Maximum P quantizer (1..31) (31)\n"); + fprintf(stderr, " -drop integer : Frame Drop Ratio (0..100) (0)\n"); + fprintf(stderr, " -start integer : Starting frame number\n"); + fprintf(stderr, " -threads integer : Number of threads\n"); + fprintf(stderr, " -progress [integer] : Show progress updates every n frames (10)\n"); + fprintf(stderr, " -par integer[:integer] : Set Pixel Aspect Ratio.\n"); + fprintf(stderr, " 1 = 1:1\n"); + fprintf(stderr, " 2 = 12:11 (4:3 PAL)\n"); + fprintf(stderr, " 3 = 10:11 (4:3 NTSC)\n"); + fprintf(stderr, " 4 = 16:11 (16:9 PAL)\n"); + fprintf(stderr, " 5 = 40:33 (16:9 NTSC)\n"); + fprintf(stderr, " other = custom (width:height)\n"); + fprintf(stderr, " -help : prints this help message\n"); + fprintf(stderr, "\n"); + fprintf(stderr, "NB: You can define %d zones repeating the -z[qw] option as needed.\n", MAX_ZONES); } /***************************************************************************** @@ -579,190 +1619,741 @@ * *****************************************************************************/ -static int read_pgmheader(FILE* handle) -{ - int bytes,xsize,ysize,depth; +#ifndef READ_PNM +static int +read_pgmheader(FILE * handle) +{ + int bytes, xsize, ysize, depth; char dummy[2]; - - bytes = fread(dummy,1,2,handle); - if ( (bytes < 2) || (dummy[0] != 'P') || (dummy[1] != '5' )) - return 1; + bytes = fread(dummy, 1, 2, handle); - fscanf(handle,"%d %d %d",&xsize,&ysize,&depth); - if ( (xsize > 1440) || (ysize > 2880 ) || (depth != 255) ) - { - fprintf(stderr,"%d %d %d\n",xsize,ysize,depth); - return 2; + if ((bytes < 2) || (dummy[0] != 'P') || (dummy[1] != '5')) + return (1); + + fscanf(handle, "%d %d %d", &xsize, &ysize, &depth); + if ((xsize > 4096) || (ysize > 4096*3/2) || (depth != 255)) { + fprintf(stderr, "%d %d %d\n", xsize, ysize, depth); + return (2); } - if ( (XDIM==0) || (YDIM==0) ) - { - XDIM=xsize; - YDIM=ysize*2/3; + if ((XDIM == 0) || (YDIM == 0)) { + XDIM = xsize; + YDIM = ysize * 2 / 3; } - return 0; + return (0); } -static int read_pgmdata(FILE* handle, unsigned char *image) -{ +static int +read_pgmdata(FILE * handle, + unsigned char *image) +{ int i; char dummy; - + unsigned char *y = image; - unsigned char *u = image + XDIM*YDIM; - unsigned char *v = image + XDIM*YDIM + XDIM/2*YDIM/2; + unsigned char *u = image + XDIM * YDIM; + unsigned char *v = image + XDIM * YDIM + XDIM / 2 * YDIM / 2; /* read Y component of picture */ - fread(y, 1, XDIM*YDIM, handle); - - for (i=0;i 1440) || (ysize > 2880) || (depth != 255)) { + fprintf(stderr, "%d %d %d\n", xsize, ysize, depth); + return (2); + } + + XDIM = xsize; + YDIM = ysize; + + return (0); +} + +static int +read_pnmdata(FILE * handle, + unsigned char *image) { - - if (fread(image, 1, IMAGE_SIZE(XDIM, YDIM), handle) != (unsigned int)IMAGE_SIZE(XDIM, YDIM)) - return 1; - else - return 0; + int i; + char dummy; + + /* read Y component of picture */ + fread(image, 1, XDIM * YDIM * 3, handle); + + /* I don't know why, but this seems needed */ + fread(&dummy, 1, 1, handle); + + return (0); +} +#endif + +static int +read_yuvdata(FILE * handle, + unsigned char *image) +{ + + if (fread(image, 1, IMAGE_SIZE(XDIM, YDIM), handle) != + (unsigned int) IMAGE_SIZE(XDIM, YDIM)) + return (1); + else + return (0); } /***************************************************************************** * Routines for encoding: init encoder, frame step, release encoder ****************************************************************************/ +/* sample plugin */ + +int +rawenc_debug(void *handle, + int opt, + void *param1, + void *param2) +{ + switch (opt) { + case XVID_PLG_INFO: + { + xvid_plg_info_t *info = (xvid_plg_info_t *) param1; + + info->flags = XVID_REQDQUANTS; + return 0; + } + + case XVID_PLG_CREATE: + case XVID_PLG_DESTROY: + case XVID_PLG_BEFORE: + return 0; + + case XVID_PLG_AFTER: + { + xvid_plg_data_t *data = (xvid_plg_data_t *) param1; + int i, j; + + printf("---[ frame: %5i quant: %2i length: %6i ]---\n", + data->frame_num, data->quant, data->length); + for (j = 0; j < data->mb_height; j++) { + for (i = 0; i < data->mb_width; i++) + printf("%2i ", data->dquant[j * data->dquant_stride + i]); + printf("\n"); + } + + return 0; + } + } + + return XVID_ERR_FAIL; +} + + #define FRAMERATE_INCR 1001 + /* Initialize encoder for first use, pass all needed parameters to the codec */ -static int enc_init(int use_assembler) +static int +enc_init(int use_assembler) { int xerr; - - XVID_INIT_PARAM xinit; - XVID_ENC_PARAM xparam; + //xvid_plugin_cbr_t cbr; + xvid_plugin_single_t single; + xvid_plugin_2pass1_t rc2pass1; + xvid_plugin_2pass2_t rc2pass2; + xvid_plugin_ssim_t ssim; + //xvid_plugin_fixed_t rcfixed; + xvid_enc_plugin_t plugins[8]; + xvid_gbl_init_t xvid_gbl_init; + xvid_enc_create_t xvid_enc_create; + int i; + + /*------------------------------------------------------------------------ + * XviD core initialization + *----------------------------------------------------------------------*/ - if(use_assembler) { + /* Set version -- version checking will done by xvidcore */ + memset(&xvid_gbl_init, 0, sizeof(xvid_gbl_init)); + xvid_gbl_init.version = XVID_VERSION; + xvid_gbl_init.debug = ARG_DEBUG; -#ifdef ARCH_IA64 - xinit.cpu_flags = XVID_CPU_FORCE | XVID_CPU_IA64; + + /* Do we have to enable ASM optimizations ? */ + if (use_assembler) { + +#ifdef ARCH_IS_IA64 + xvid_gbl_init.cpu_flags = XVID_CPU_FORCE | XVID_CPU_ASM; #else - xinit.cpu_flags = 0; + xvid_gbl_init.cpu_flags = 0; #endif + } else { + xvid_gbl_init.cpu_flags = XVID_CPU_FORCE; } - else { - xinit.cpu_flags = XVID_CPU_FORCE; + + /* Initialize XviD core -- Should be done once per __process__ */ + xvid_global(NULL, XVID_GBL_INIT, &xvid_gbl_init, NULL); + enc_info(); + + /*------------------------------------------------------------------------ + * XviD encoder initialization + *----------------------------------------------------------------------*/ + + /* Version again */ + memset(&xvid_enc_create, 0, sizeof(xvid_enc_create)); + xvid_enc_create.version = XVID_VERSION; + + /* Width and Height of input frames */ + xvid_enc_create.width = XDIM; + xvid_enc_create.height = YDIM; + xvid_enc_create.profile = 0xf5; /* Unrestricted */ + + /* init plugins */ +// xvid_enc_create.zones = ZONES; +// xvid_enc_create.num_zones = NUM_ZONES; + + xvid_enc_create.plugins = plugins; + xvid_enc_create.num_plugins = 0; + + if (ARG_SINGLE) { + memset(&single, 0, sizeof(xvid_plugin_single_t)); + single.version = XVID_VERSION; + single.bitrate = ARG_BITRATE; + single.reaction_delay_factor = ARG_REACTION; + single.averaging_period = ARG_AVERAGING; + single.buffer = ARG_SMOOTHER; + + + plugins[xvid_enc_create.num_plugins].func = xvid_plugin_single; + plugins[xvid_enc_create.num_plugins].param = &single; + xvid_enc_create.num_plugins++; + if (!ARG_BITRATE) + prepare_cquant_zones(); } - xvid_init(NULL, 0, &xinit, NULL); + if (ARG_PASS2) { + memset(&rc2pass2, 0, sizeof(xvid_plugin_2pass2_t)); + rc2pass2.version = XVID_VERSION; + rc2pass2.filename = ARG_PASS2; + rc2pass2.bitrate = ARG_BITRATE; - xparam.width = XDIM; - xparam.height = YDIM; - if ((ARG_FRAMERATE - (int)ARG_FRAMERATE) < SMALL_EPS) - { - xparam.fincr = 1; - xparam.fbase = (int)ARG_FRAMERATE; + rc2pass2.keyframe_boost = ARG_KBOOST; + rc2pass2.curve_compression_high = ARG_CHIGH; + rc2pass2.curve_compression_low = ARG_CLOW; + rc2pass2.overflow_control_strength = ARG_OVERSTRENGTH; + rc2pass2.max_overflow_improvement = ARG_OVERIMPROVE; + rc2pass2.max_overflow_degradation = ARG_OVERDEGRADE; + rc2pass2.kfreduction = ARG_KREDUCTION; + rc2pass2.kfthreshold = ARG_KTHRESH; + rc2pass2.container_frame_overhead = ARG_OVERHEAD; + +// An example of activating VBV could look like this + rc2pass2.vbv_size = ARG_VBVSIZE; + rc2pass2.vbv_initial = (ARG_VBVSIZE*3)/4; + rc2pass2.vbv_maxrate = ARG_VBVMAXRATE; + rc2pass2.vbv_peakrate = ARG_VBVPEAKRATE*3; + + + plugins[xvid_enc_create.num_plugins].func = xvid_plugin_2pass2; + plugins[xvid_enc_create.num_plugins].param = &rc2pass2; + xvid_enc_create.num_plugins++; } - else - { - xparam.fincr = FRAMERATE_INCR; - xparam.fbase = (int)(FRAMERATE_INCR * ARG_FRAMERATE); + + if (ARG_PASS1) { + memset(&rc2pass1, 0, sizeof(xvid_plugin_2pass1_t)); + rc2pass1.version = XVID_VERSION; + rc2pass1.filename = ARG_PASS1; + if (ARG_FULL1PASS) + prepare_full1pass_zones(); + plugins[xvid_enc_create.num_plugins].func = xvid_plugin_2pass1; + plugins[xvid_enc_create.num_plugins].param = &rc2pass1; + xvid_enc_create.num_plugins++; + } + + /* Zones stuff */ + xvid_enc_create.zones = (xvid_enc_zone_t*)malloc(sizeof(xvid_enc_zone_t) * NUM_ZONES); + xvid_enc_create.num_zones = NUM_ZONES; + for (i=0; i < xvid_enc_create.num_zones; i++) { + xvid_enc_create.zones[i].frame = ZONES[i].frame; + xvid_enc_create.zones[i].base = 100; + xvid_enc_create.zones[i].mode = ZONES[i].mode; + xvid_enc_create.zones[i].increment = ZONES[i].modifier; + } + + + if (ARG_LUMIMASKING) { + plugins[xvid_enc_create.num_plugins].func = xvid_plugin_lumimasking; + plugins[xvid_enc_create.num_plugins].param = NULL; + xvid_enc_create.num_plugins++; + } + + if (ARG_DUMP) { + plugins[xvid_enc_create.num_plugins].func = xvid_plugin_dump; + plugins[xvid_enc_create.num_plugins].param = NULL; + xvid_enc_create.num_plugins++; } - xparam.rc_reaction_delay_factor = 16; - xparam.rc_averaging_period = 100; - xparam.rc_buffer = 10; - xparam.rc_bitrate = ARG_BITRATE*1000; - xparam.min_quantizer = ARG_MINQUANT; - xparam.max_quantizer = ARG_MAXQUANT; - xparam.max_key_interval = (int)ARG_FRAMERATE*10; - xparam.bquant_ratio = ARG_BQRATIO; - xparam.bquant_offset = ARG_BQOFFSET; - xparam.max_bframes = ARG_MAXBFRAMES; - xparam.frame_drop_ratio = 0; - xparam.global = 0; + + if (ARG_SSIM>=0 || ARG_SSIM_PATH != NULL) { + memset(&ssim, 0, sizeof(xvid_plugin_ssim_t)); + + plugins[xvid_enc_create.num_plugins].func = xvid_plugin_ssim; + + if( ARG_SSIM >=0){ + ssim.b_printstat = 1; + ssim.acc = ARG_SSIM; + } else { + ssim.b_printstat = 0; + ssim.acc = 2; + } + + if(ARG_SSIM_PATH != NULL){ + ssim.stat_path = ARG_SSIM_PATH; + } + + ssim.b_visualize = 0; + plugins[xvid_enc_create.num_plugins].param = &ssim; + xvid_enc_create.num_plugins++; + } + +#if 0 + if (ARG_DEBUG) { + plugins[xvid_enc_create.num_plugins].func = rawenc_debug; + plugins[xvid_enc_create.num_plugins].param = NULL; + xvid_enc_create.num_plugins++; + } +#endif + + xvid_enc_create.num_threads = ARG_THREADS; + + /* Frame rate */ + xvid_enc_create.fincr = ARG_DWSCALE; + xvid_enc_create.fbase = ARG_DWRATE; + + /* Maximum key frame interval */ + if (ARG_MAXKEYINTERVAL > 0) { + xvid_enc_create.max_key_interval = ARG_MAXKEYINTERVAL; + }else { + xvid_enc_create.max_key_interval = (int) ARG_FRAMERATE *10; + } + + xvid_enc_create.min_quant[0]=ARG_QUANTS[0]; + xvid_enc_create.min_quant[1]=ARG_QUANTS[2]; + xvid_enc_create.min_quant[2]=ARG_QUANTS[4]; + xvid_enc_create.max_quant[0]=ARG_QUANTS[1]; + xvid_enc_create.max_quant[1]=ARG_QUANTS[3]; + xvid_enc_create.max_quant[2]=ARG_QUANTS[5]; + + /* Bframes settings */ + xvid_enc_create.max_bframes = ARG_MAXBFRAMES; + xvid_enc_create.bquant_ratio = ARG_BQRATIO; + xvid_enc_create.bquant_offset = ARG_BQOFFSET; + + /* Frame drop ratio */ + xvid_enc_create.frame_drop_ratio = ARG_FRAMEDROP; + + /* Global encoder options */ + xvid_enc_create.global = 0; + + if (ARG_PACKED) + xvid_enc_create.global |= XVID_GLOBAL_PACKED; + + if (ARG_CLOSED_GOP) + xvid_enc_create.global |= XVID_GLOBAL_CLOSED_GOP; + + if (ARG_STATS) + xvid_enc_create.global |= XVID_GLOBAL_EXTRASTATS_ENABLE; /* I use a small value here, since will not encode whole movies, but short clips */ + xerr = xvid_encore(NULL, XVID_ENC_CREATE, &xvid_enc_create, NULL); - xerr = xvid_encore(NULL, XVID_ENC_CREATE, &xparam, NULL); - enc_handle=xparam.handle; + /* Retrieve the encoder instance from the structure */ + enc_handle = xvid_enc_create.handle; - return xerr; + free(xvid_enc_create.zones); + + return (xerr); +} + +static int +enc_info() +{ + xvid_gbl_info_t xvid_gbl_info; + int ret; + + memset(&xvid_gbl_info, 0, sizeof(xvid_gbl_info)); + xvid_gbl_info.version = XVID_VERSION; + ret = xvid_global(NULL, XVID_GBL_INFO, &xvid_gbl_info, NULL); + if (xvid_gbl_info.build != NULL) { + fprintf(stderr, "xvidcore build version: %s\n", xvid_gbl_info.build); + } + fprintf(stderr, "Bitstream version: %d.%d.%d\n", XVID_VERSION_MAJOR(xvid_gbl_info.actual_version), XVID_VERSION_MINOR(xvid_gbl_info.actual_version), XVID_VERSION_PATCH(xvid_gbl_info.actual_version)); + fprintf(stderr, "Detected CPU flags: "); + if (xvid_gbl_info.cpu_flags & XVID_CPU_ASM) + fprintf(stderr, "ASM "); + if (xvid_gbl_info.cpu_flags & XVID_CPU_MMX) + fprintf(stderr, "MMX "); + if (xvid_gbl_info.cpu_flags & XVID_CPU_MMXEXT) + fprintf(stderr, "MMXEXT "); + if (xvid_gbl_info.cpu_flags & XVID_CPU_SSE) + fprintf(stderr, "SSE "); + if (xvid_gbl_info.cpu_flags & XVID_CPU_SSE2) + fprintf(stderr, "SSE2 "); + if (xvid_gbl_info.cpu_flags & XVID_CPU_SSE3) + fprintf(stderr, "SSE3 "); + if (xvid_gbl_info.cpu_flags & XVID_CPU_SSE41) + fprintf(stderr, "SSE41 "); + if (xvid_gbl_info.cpu_flags & XVID_CPU_3DNOW) + fprintf(stderr, "3DNOW "); + if (xvid_gbl_info.cpu_flags & XVID_CPU_3DNOWEXT) + fprintf(stderr, "3DNOWEXT "); + if (xvid_gbl_info.cpu_flags & XVID_CPU_TSC) + fprintf(stderr, "TSC "); + fprintf(stderr, "\n"); + fprintf(stderr, "Detected %d cpus,", xvid_gbl_info.num_threads); + if (!ARG_THREADS) + ARG_THREADS = xvid_gbl_info.num_threads; + fprintf(stderr, " using %d threads.\n", ARG_THREADS); + return ret; } -static int enc_stop() +static int +enc_stop() { int xerr; + /* Destroy the encoder instance */ xerr = xvid_encore(enc_handle, XVID_ENC_DESTROY, NULL, NULL); - return xerr; + return (xerr); } -static int enc_main(unsigned char* image, unsigned char* bitstream, - unsigned char* hints_buffer, - long *streamlength, long *frametype, long *hints_size) +static int +enc_main(unsigned char *image, + unsigned char *bitstream, + int *key, + int *stats_type, + int *stats_quant, + int *stats_length, + int sse[3], + int framenum) { - int xerr; + int ret; - XVID_ENC_FRAME xframe; - XVID_ENC_STATS xstats; + xvid_enc_frame_t xvid_enc_frame; + xvid_enc_stats_t xvid_enc_stats; - xframe.bitstream = bitstream; - xframe.length = -1; /* this is written by the routine */ + /* Version for the frame and the stats */ + memset(&xvid_enc_frame, 0, sizeof(xvid_enc_frame)); + xvid_enc_frame.version = XVID_VERSION; + + memset(&xvid_enc_stats, 0, sizeof(xvid_enc_stats)); + xvid_enc_stats.version = XVID_VERSION; + + /* Bind output buffer */ + xvid_enc_frame.bitstream = bitstream; + xvid_enc_frame.length = -1; + + /* Initialize input image fields */ + if (image) { + xvid_enc_frame.input.plane[0] = image; +#ifndef READ_PNM + xvid_enc_frame.input.csp = ARG_COLORSPACE; + xvid_enc_frame.input.stride[0] = XDIM; +#else + xvid_enc_frame.input.csp = XVID_CSP_BGR; + xvid_enc_frame.input.stride[0] = XDIM*3; +#endif + } else { + xvid_enc_frame.input.csp = XVID_CSP_NULL; + } + + /* Set up core's general features */ + xvid_enc_frame.vol_flags = 0; + if (ARG_STATS) + xvid_enc_frame.vol_flags |= XVID_VOL_EXTRASTATS; + if (ARG_QTYPE) { + xvid_enc_frame.vol_flags |= XVID_VOL_MPEGQUANT; + if (ARG_QMATRIX) { + xvid_enc_frame.quant_intra_matrix = qmatrix_intra; + xvid_enc_frame.quant_inter_matrix = qmatrix_inter; + } + else { + /* We don't use special matrices */ + xvid_enc_frame.quant_intra_matrix = NULL; + xvid_enc_frame.quant_inter_matrix = NULL; + } + } - xframe.image = image; - xframe.colorspace = XVID_CSP_YV12; /* defined in */ + if (ARG_PAR) + xvid_enc_frame.par = ARG_PAR; + else { + xvid_enc_frame.par = XVID_PAR_EXT; + xvid_enc_frame.par_width = ARG_PARWIDTH; + xvid_enc_frame.par_height = ARG_PARHEIGHT; + } - xframe.intra = -1; /* let the codec decide between I-frame (1) and P-frame (0) */ - xframe.quant = ARG_QUANTI; /* is quant != 0, use a fixed quant (and ignore bitrate) */ - xframe.bquant = 0; + if (ARG_QPEL) { + xvid_enc_frame.vol_flags |= XVID_VOL_QUARTERPEL; + xvid_enc_frame.motion |= XVID_ME_QUARTERPELREFINE16 | XVID_ME_QUARTERPELREFINE8; + } + if (ARG_GMC) { + xvid_enc_frame.vol_flags |= XVID_VOL_GMC; + xvid_enc_frame.motion |= XVID_ME_GME_REFINE; + } + + /* Set up core's general features */ + xvid_enc_frame.vop_flags = vop_presets[ARG_QUALITY]; + + if (ARG_INTERLACING) { + xvid_enc_frame.vol_flags |= XVID_VOL_INTERLACING; + if (ARG_INTERLACING == 2) + xvid_enc_frame.vop_flags |= XVID_VOP_TOPFIELDFIRST; + } + + xvid_enc_frame.vop_flags |= XVID_VOP_HALFPEL; + xvid_enc_frame.vop_flags |= XVID_VOP_HQACPRED; + + if (ARG_VOPDEBUG) { + xvid_enc_frame.vop_flags |= XVID_VOP_DEBUG; + } + + if (ARG_TRELLIS) { + xvid_enc_frame.vop_flags |= XVID_VOP_TRELLISQUANT; + } + + /* Frame type -- taken from function call parameter */ + /* Sometimes we might want to force the last frame to be a P Frame */ + xvid_enc_frame.type = *stats_type; + + /* Force the right quantizer -- It is internally managed by RC plugins */ + xvid_enc_frame.quant = 0; + + if (ARG_CHROMAME) + xvid_enc_frame.motion |= XVID_ME_CHROMA_PVOP + XVID_ME_CHROMA_BVOP; + + /* Set up motion estimation flags */ + xvid_enc_frame.motion |= motion_presets[ARG_QUALITY]; + + if (ARG_TURBO) + xvid_enc_frame.motion |= XVID_ME_FASTREFINE16 | XVID_ME_FASTREFINE8 | + XVID_ME_SKIP_DELTASEARCH | XVID_ME_FAST_MODEINTERPOLATE | + XVID_ME_BFRAME_EARLYSTOP; + + if (ARG_BVHQ) + xvid_enc_frame.vop_flags |= XVID_VOP_RD_BVOP; + + switch (ARG_VHQMODE) /* this is the same code as for vfw */ + { + case 1: /* VHQ_MODE_DECISION */ + xvid_enc_frame.vop_flags |= XVID_VOP_MODEDECISION_RD; + break; + + case 2: /* VHQ_LIMITED_SEARCH */ + xvid_enc_frame.vop_flags |= XVID_VOP_MODEDECISION_RD; + xvid_enc_frame.motion |= XVID_ME_HALFPELREFINE16_RD; + xvid_enc_frame.motion |= XVID_ME_QUARTERPELREFINE16_RD; + break; + + case 3: /* VHQ_MEDIUM_SEARCH */ + xvid_enc_frame.vop_flags |= XVID_VOP_MODEDECISION_RD; + xvid_enc_frame.motion |= XVID_ME_HALFPELREFINE16_RD; + xvid_enc_frame.motion |= XVID_ME_HALFPELREFINE8_RD; + xvid_enc_frame.motion |= XVID_ME_QUARTERPELREFINE16_RD; + xvid_enc_frame.motion |= XVID_ME_QUARTERPELREFINE8_RD; + xvid_enc_frame.motion |= XVID_ME_CHECKPREDICTION_RD; + break; + + case 4: /* VHQ_WIDE_SEARCH */ + xvid_enc_frame.vop_flags |= XVID_VOP_MODEDECISION_RD; + xvid_enc_frame.motion |= XVID_ME_HALFPELREFINE16_RD; + xvid_enc_frame.motion |= XVID_ME_HALFPELREFINE8_RD; + xvid_enc_frame.motion |= XVID_ME_QUARTERPELREFINE16_RD; + xvid_enc_frame.motion |= XVID_ME_QUARTERPELREFINE8_RD; + xvid_enc_frame.motion |= XVID_ME_CHECKPREDICTION_RD; + xvid_enc_frame.motion |= XVID_ME_EXTSEARCH_RD; + break; + + default : + break; + } + + /* Not sure what this does */ + // force keyframe spacing in 2-pass 1st pass + if (ARG_QUALITY == 0) + xvid_enc_frame.type = XVID_TYPE_IVOP; + + /* frame-based stuff */ + apply_zone_modifiers(&xvid_enc_frame, framenum); + + + /* Encode the frame */ + ret = xvid_encore(enc_handle, XVID_ENC_ENCODE, &xvid_enc_frame, + &xvid_enc_stats); + + *key = (xvid_enc_frame.out_flags & XVID_KEYFRAME); + *stats_type = xvid_enc_stats.type; + *stats_quant = xvid_enc_stats.quant; + *stats_length = xvid_enc_stats.length; + sse[0] = xvid_enc_stats.sse_y; + sse[1] = xvid_enc_stats.sse_u; + sse[2] = xvid_enc_stats.sse_v; + + return (ret); +} + +void +sort_zones(zone_t * zones, int zone_num, int * sel) +{ + int i, j; + zone_t tmp; + for (i = 0; i < zone_num; i++) { + int cur = i; + int min_f = zones[i].frame; + for (j = i + 1; j < zone_num; j++) { + if (zones[j].frame < min_f) { + min_f = zones[j].frame; + cur = j; + } + } + if (cur != i) { + tmp = zones[i]; + zones[i] = zones[cur]; + zones[cur] = tmp; + if (i == *sel) *sel = cur; + else if (cur == *sel) *sel = i; + } + } +} + +/* constant-quant zones for fixed quant encoding */ +static void +prepare_cquant_zones() { + + int i = 0; + if (NUM_ZONES == 0 || ZONES[0].frame != 0) { + /* first zone does not start at frame 0 or doesn't exist */ + + if (NUM_ZONES >= MAX_ZONES) NUM_ZONES--; /* we sacrifice last zone */ + + ZONES[NUM_ZONES].frame = 0; + ZONES[NUM_ZONES].mode = XVID_ZONE_QUANT; + ZONES[NUM_ZONES].modifier = ARG_CQ; + ZONES[NUM_ZONES].type = XVID_TYPE_AUTO; + ZONES[NUM_ZONES].greyscale = 0; + ZONES[NUM_ZONES].chroma_opt = 0; + ZONES[NUM_ZONES].bvop_threshold = 0; + ZONES[NUM_ZONES].cartoon_mode = 0; + NUM_ZONES++; + + sort_zones(ZONES, NUM_ZONES, &i); + } + + /* step 2: let's change all weight zones into quant zones */ - xframe.motion = motion_presets[ARG_QUALITY]; - xframe.general = general_presets[ARG_QUALITY]; - xframe.quant_intra_matrix = xframe.quant_inter_matrix = NULL; - xframe.stride = XDIM; + for(i = 0; i < NUM_ZONES; i++) + if (ZONES[i].mode == XVID_ZONE_WEIGHT) { + ZONES[i].mode = XVID_ZONE_QUANT; + ZONES[i].modifier = (100*ARG_CQ) / ZONES[i].modifier; + } +} - xframe.hint.hintstream = hints_buffer; +/* full first pass zones */ +static void +prepare_full1pass_zones() { + + int i = 0; + if (NUM_ZONES == 0 || ZONES[0].frame != 0) { + /* first zone does not start at frame 0 or doesn't exist */ + + if (NUM_ZONES >= MAX_ZONES) NUM_ZONES--; /* we sacrifice last zone */ + + ZONES[NUM_ZONES].frame = 0; + ZONES[NUM_ZONES].mode = XVID_ZONE_QUANT; + ZONES[NUM_ZONES].modifier = 200; + ZONES[NUM_ZONES].type = XVID_TYPE_AUTO; + ZONES[NUM_ZONES].greyscale = 0; + ZONES[NUM_ZONES].chroma_opt = 0; + ZONES[NUM_ZONES].bvop_threshold = 0; + ZONES[NUM_ZONES].cartoon_mode = 0; + NUM_ZONES++; - if(ARG_HINTMODE == HINT_MODE_SET) { - xframe.hint.hintlength = *hints_size; - xframe.hint.rawhints = 0; - xframe.general |= XVID_HINTEDME_SET; + sort_zones(ZONES, NUM_ZONES, &i); } - if(ARG_HINTMODE == HINT_MODE_GET) { - xframe.hint.rawhints = 0; - xframe.general |= XVID_HINTEDME_GET; + /* step 2: let's change all weight zones into quant zones */ + + for(i = 0; i < NUM_ZONES; i++) + if (ZONES[i].mode == XVID_ZONE_WEIGHT) { + ZONES[i].mode = XVID_ZONE_QUANT; + ZONES[i].modifier = 200; + } +} + +static void apply_zone_modifiers(xvid_enc_frame_t * frame, int framenum) +{ + int i; + + for (i=0; itype = ZONES[i].type; + + if (ZONES[i].greyscale) { + frame->vop_flags |= XVID_VOP_GREYSCALE; } - xerr = xvid_encore(enc_handle, XVID_ENC_ENCODE, &xframe, &xstats); + if (ZONES[i].chroma_opt) { + frame->vop_flags |= XVID_VOP_CHROMAOPT; + } + + if (ZONES[i].cartoon_mode) { + frame->vop_flags |= XVID_VOP_CARTOON; + frame->motion |= XVID_ME_DETECT_STATIC_MOTION; + } - if(ARG_HINTMODE == HINT_MODE_GET) - *hints_size = xframe.hint.hintlength; + if (ARG_MAXBFRAMES) { + frame->bframe_threshold = ZONES[i].bvop_threshold; + } +} - /* - * This is statictical data, e.g. for 2-pass. If you are not - * interested in any of this, you can use NULL instead of &xstats - */ - *frametype = xframe.intra; - *streamlength = xframe.length; +void removedivxp(char *buf, int bufsize) { + int i; + char* userdata; - return xerr; + for (i=0; i <= (bufsize-sizeof(userdata_start_code)); i++) { + if (memcmp((void*)userdata_start_code, (void*)(buf+i), strlen(userdata_start_code))==0) { + if ((userdata = strstr(buf+i+4, "DivX"))!=NULL) { + userdata[strlen(userdata)-1] = '\0'; + return; + } + } + } }