--- xvid.h 2003/03/16 12:04:14 1.27.2.9 +++ xvid.h 2004/03/03 20:57:36 1.27.2.66 @@ -1,25 +1,25 @@ /***************************************************************************** * - * XVID MPEG-4 VIDEO CODEC - * - XviD Main header file - + * XVID MPEG-4 VIDEO CODEC + * - XviD Main header file - * - * This file is part of XviD, a free MPEG-4 video encoder/decoder + * Copyright(C) 2001-2003 Peter Ross * - * This program is free software; you can redistribute it and/or modify + * This program is free software ; you can redistribute it and/or modify * it under the terms of the GNU General Public License as published by - * the Free Software Foundation; either version 2 of the License, or + * the Free Software Foundation ; either version 2 of the License, or * (at your option) any later version. * * This program is distributed in the hope that it will be useful, - * but WITHOUT ANY WARRANTY; without even the implied warranty of + * but WITHOUT ANY WARRANTY ; without even the implied warranty of * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the * GNU General Public License for more details. * * You should have received a copy of the GNU General Public License - * along with this program; if not, write to the Free Software + * along with this program ; if not, write to the Free Software * Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA 02111-1307 USA * - * $Id: xvid.h,v 1.27.2.9 2003/03/16 12:04:14 suxen_drol Exp $ + * $Id: xvid.h,v 1.27.2.66 2004/03/03 20:57:36 edgomez Exp $ * ****************************************************************************/ @@ -45,21 +45,27 @@ memset(&struct,0,sizeof(struct)); struct.version = XVID_VERSION; - XVID_UNSTABLE is defined only during development. + XVID_UNSTABLE is defined only during development. 
*/ -#define XVID_MAKE_VERSION(a,b,c) ( (((a)&0xff)<<16) | (((b)&0xff)<<8) | ((c)&0xff) ) -#define XVID_MAJOR(a) ( ((a)>>16) & 0xff ) -#define XVID_MINOR(b) ((char)( ((b)>>8) & 0xff )) -#define XVID_PATCH(c) ( (c) & 0xff ) +#define XVID_MAKE_VERSION(a,b,c) ((((a)&0xff)<<16) | (((b)&0xff)<<8) | ((c)&0xff)) +#define XVID_VERSION_MAJOR(a) ((char)(((a)>>16) & 0xff)) +#define XVID_VERSION_MINOR(a) ((char)(((a)>> 8) & 0xff)) +#define XVID_VERSION_PATCH(a) ((char)(((a)>> 0) & 0xff)) + +#define XVID_MAKE_API(a,b) ((((a)&0xff)<<16) | (((b)&0xff)<<0)) +#define XVID_API_MAJOR(a) (((a)>>16) & 0xff) +#define XVID_API_MINOR(a) (((a)>> 0) & 0xff) + +#define XVID_VERSION XVID_MAKE_VERSION(1,0,-124) +#define XVID_API XVID_MAKE_API(4, 0) -#define XVID_VERSION XVID_MAKE_VERSION(1,-127,0) #define XVID_UNSTABLE -/* Bitstream Version - * this will be writen into the bitstream to allow easy detection of xvid - * encoder bugs in the decoder, without this it might not possible to - * automatically distinquish between a file which has been encoded with an +/* Bitstream Version + * this will be writen into the bitstream to allow easy detection of xvid + * encoder bugs in the decoder, without this it might not possible to + * automatically distinquish between a file which has been encoded with an * old & buggy XVID from a file which has been encoded with a bugfree version * see the infamous interlacing bug ... 
* @@ -67,18 +73,18 @@ * doesnt hurt but not increasing it could cause difficulty for decoders in the * future */ -#define XVID_BS_VERSION "0009" +#define XVID_BS_VERSION "0029" /***************************************************************************** * error codes ****************************************************************************/ - /* all functions return values <0 indicate error */ + /* all functions return values <0 indicate error */ #define XVID_ERR_FAIL -1 /* general fault */ -#define XVID_ERR_MEMORY -2 /* memory allocation error */ -#define XVID_ERR_FORMAT -3 /* file format error */ +#define XVID_ERR_MEMORY -2 /* memory allocation error */ +#define XVID_ERR_FORMAT -3 /* file format error */ #define XVID_ERR_VERSION -4 /* structure version not supported */ #define XVID_ERR_END -5 /* encoder only; end of stream reached */ @@ -90,22 +96,24 @@ /* colorspace values */ -#define XVID_CSP_USER 0 /* 4:2:0 planar */ -#define XVID_CSP_I420 1 /* 4:2:0 packed(planar win32) */ -#define XVID_CSP_YV12 2 /* 4:2:0 packed(planar win32) */ -#define XVID_CSP_YUY2 3 /* 4:2:2 packed */ -#define XVID_CSP_UYVY 4 /* 4:2:2 packed */ -#define XVID_CSP_YVYU 5 /* 4:2:2 packed */ -#define XVID_CSP_BGRA 6 /* 32-bit bgra packed */ -#define XVID_CSP_ABGR 7 /* 32-bit abgr packed */ -#define XVID_CSP_RGBA 8 /* 32-bit rgba packed */ -#define XVID_CSP_BGR 9 /* 32-bit bgr packed */ -#define XVID_CSP_RGB555 10 /* 16-bit rgb555 packed */ -#define XVID_CSP_RGB565 11 /* 16-bit rgb565 packed */ -#define XVID_CSP_SLICE 12 /* decoder only: 4:2:0 planar, per slice rendering */ -#define XVID_CSP_INTERNAL 13 /* decoder only: 4:2:0 planar, returns ptrs to internal buffers */ -#define XVID_CSP_NULL 14 /* decoder only: dont output anything */ -#define XVID_CSP_VFLIP 0x80000000 /* vertical flip mask */ +#define XVID_CSP_PLANAR (1<< 0) /* 4:2:0 planar (==I420, except for pointers/strides) */ +#define XVID_CSP_USER XVID_CSP_PLANAR +#define XVID_CSP_I420 (1<< 1) /* 4:2:0 planar */ +#define 
XVID_CSP_YV12 (1<< 2) /* 4:2:0 planar */ +#define XVID_CSP_YUY2 (1<< 3) /* 4:2:2 packed */ +#define XVID_CSP_UYVY (1<< 4) /* 4:2:2 packed */ +#define XVID_CSP_YVYU (1<< 5) /* 4:2:2 packed */ +#define XVID_CSP_BGRA (1<< 6) /* 32-bit bgra packed */ +#define XVID_CSP_ABGR (1<< 7) /* 32-bit abgr packed */ +#define XVID_CSP_RGBA (1<< 8) /* 32-bit rgba packed */ +#define XVID_CSP_ARGB (1<<15) /* 32-bit argb packed */ +#define XVID_CSP_BGR (1<< 9) /* 24-bit bgr packed */ +#define XVID_CSP_RGB555 (1<<10) /* 16-bit rgb555 packed */ +#define XVID_CSP_RGB565 (1<<11) /* 16-bit rgb565 packed */ +#define XVID_CSP_SLICE (1<<12) /* decoder only: 4:2:0 planar, per slice rendering */ +#define XVID_CSP_INTERNAL (1<<13) /* decoder only: 4:2:0 planar, returns ptrs to internal buffers */ +#define XVID_CSP_NULL (1<<14) /* decoder only: dont output anything */ +#define XVID_CSP_VFLIP (1<<31) /* vertical flip mask */ /* xvid_image_t for non-planar colorspaces use only plane[0] and stride[0] @@ -116,144 +124,214 @@ int stride[4]; /* [in] image stride; "bytes per row"*/ } xvid_image_t; +/* video-object-sequence profiles */ +#define XVID_PROFILE_S_L0 0x08 /* simple */ +#define XVID_PROFILE_S_L1 0x01 +#define XVID_PROFILE_S_L2 0x02 +#define XVID_PROFILE_S_L3 0x03 +#define XVID_PROFILE_ARTS_L1 0x91 /* advanced realtime simple */ +#define XVID_PROFILE_ARTS_L2 0x92 +#define XVID_PROFILE_ARTS_L3 0x93 +#define XVID_PROFILE_ARTS_L4 0x94 +#define XVID_PROFILE_AS_L0 0xf0 /* advanced simple */ +#define XVID_PROFILE_AS_L1 0xf1 +#define XVID_PROFILE_AS_L2 0xf2 +#define XVID_PROFILE_AS_L3 0xf3 +#define XVID_PROFILE_AS_L4 0xf4 /* aspect ratios */ -#define XVID_PAR_11_VGA 1 /* 1:1 vga (square) */ -#define XVID_PAR_43_PAL 2 /* 4:3 pal (12:11 625-line) */ -#define XVID_PAR_43_NTSC 3 /* 4:3 ntsc (10:11 525-line) */ -#define XVID_PAR_169_PAL 4 /* 16:9 pal (16:11 625-line) */ -#define XVID_PAR_169_NTSC 5 /* 16:9 ntsc (40:33 525-line) */ -#define XVID_PAR_EXT 15 /* extended par; use par_width, par_height */ 
+#define XVID_PAR_11_VGA 1 /* 1:1 vga (square), default if supplied PAR is not a valid value */ +#define XVID_PAR_43_PAL 2 /* 4:3 pal (12:11 625-line) */ +#define XVID_PAR_43_NTSC 3 /* 4:3 ntsc (10:11 525-line) */ +#define XVID_PAR_169_PAL 4 /* 16:9 pal (16:11 625-line) */ +#define XVID_PAR_169_NTSC 5 /* 16:9 ntsc (40:33 525-line) */ +#define XVID_PAR_EXT 15 /* extended par; use par_width, par_height */ /* frame type flags */ -#define XVID_TYPE_VOL -1 /* decoder only: vol was decoded */ -#define XVID_TYPE_NOTHING 0 /* decoder only (encoder stats): nothing was decoded/encoded */ -#define XVID_TYPE_AUTO 0 /* encoder: automatically determine coding type */ -#define XVID_TYPE_IVOP 1 /* intra frame */ -#define XVID_TYPE_PVOP 2 /* predicted frame */ -#define XVID_TYPE_BVOP 3 /* bidirectionally encoded */ -#define XVID_TYPE_SVOP 4 /* predicted+sprite frame */ +#define XVID_TYPE_VOL -1 /* decoder only: vol was decoded */ +#define XVID_TYPE_NOTHING 0 /* decoder only (encoder stats): nothing was decoded/encoded */ +#define XVID_TYPE_AUTO 0 /* encoder: automatically determine coding type */ +#define XVID_TYPE_IVOP 1 /* intra frame */ +#define XVID_TYPE_PVOP 2 /* predicted frame */ +#define XVID_TYPE_BVOP 3 /* bidirectionally encoded */ +#define XVID_TYPE_SVOP 4 /* predicted+sprite frame */ + /***************************************************************************** * xvid_global() ****************************************************************************/ -/* cpu_flags definitions */ +/* cpu_flags definitions (make sure to sync this with cpuid.asm for ia32) */ -#define XVID_CPU_FORCE 0x80000000 /* force passed cpu flags */ -#define XVID_CPU_ASM 0x00000080 /* native assembly */ +#define XVID_CPU_FORCE (1<<31) /* force passed cpu flags */ +#define XVID_CPU_ASM (1<< 7) /* native assembly */ /* ARCH_IS_IA32 */ -#define XVID_CPU_MMX 0x00000001 /* mmx : pentiumMMX,k6 */ -#define XVID_CPU_MMXEXT 0x00000002 /* mmx-ext : pentium2, athlon */ -#define XVID_CPU_SSE 0x00000004 /* 
sse : pentium3, athlonXP */ -#define XVID_CPU_SSE2 0x00000008 /* sse2 : pentium4, athlon64 */ -#define XVID_CPU_3DNOW 0x00000010 /* 3dnow : k6-2 */ -#define XVID_CPU_3DNOWEXT 0x00000020 /* 3dnow-ext: athlon */ -#define XVID_CPU_TSC 0x00000040 /* timestamp counter */ +#define XVID_CPU_MMX (1<< 0) /* mmx : pentiumMMX,k6 */ +#define XVID_CPU_MMXEXT (1<< 1) /* mmx-ext : pentium2, athlon */ +#define XVID_CPU_SSE (1<< 2) /* sse : pentium3, athlonXP */ +#define XVID_CPU_SSE2 (1<< 3) /* sse2 : pentium4, athlon64 */ +#define XVID_CPU_3DNOW (1<< 4) /* 3dnow : k6-2 */ +#define XVID_CPU_3DNOWEXT (1<< 5) /* 3dnow-ext : athlon */ +#define XVID_CPU_TSC (1<< 6) /* tsc : Pentium */ /* ARCH_IS_PPC */ -#define XVID_CPU_ALTIVEC 0x00000001 /* altivec */ +#define XVID_CPU_ALTIVEC (1<< 0) /* altivec */ + +#define XVID_DEBUG_ERROR (1<< 0) +#define XVID_DEBUG_STARTCODE (1<< 1) +#define XVID_DEBUG_HEADER (1<< 2) +#define XVID_DEBUG_TIMECODE (1<< 3) +#define XVID_DEBUG_MB (1<< 4) +#define XVID_DEBUG_COEFF (1<< 5) +#define XVID_DEBUG_MV (1<< 6) +#define XVID_DEBUG_RC (1<< 7) +#define XVID_DEBUG_DEBUG (1<<31) /* XVID_GBL_INIT param1 */ typedef struct { int version; - int cpu_flags; /* [in:opt] zero = autodetect cpu - XVID_CPU_FORCE|{cpu features} = force cpu features */ + unsigned int cpu_flags; /* [in:opt] zero = autodetect cpu; XVID_CPU_FORCE|{cpu features} = force cpu features */ + int debug; /* [in:opt] debug level */ } xvid_gbl_init_t; /* XVID_GBL_INFO param1 */ typedef struct { int version; - int actual_version; /* [out] returns the actual xvidcore version */ - const char * build; /* [out] if !null, points to description of this xvid core build */ - int cpu_flags; /* [out] detected cpu features */ - int num_threads; /* [out] detected number of cpus/threads */ + int actual_version; /* [out] returns the actual xvidcore version */ + const char * build; /* [out] if !null, points to description of this xvid core build */ + unsigned int cpu_flags; /* [out] detected cpu features */ + int 
num_threads; /* [out] detected number of cpus/threads */ } xvid_gbl_info_t; /* XVID_GBL_CONVERT param1 */ typedef struct { int version; - xvid_image_t input; /* [in] input image & colorspace */ - xvid_image_t output; /* [in] output image & colorspace */ - int width; /* [in] width */ - int height; /* [in] height */ - int interlacing; /* [in] interlacing */ + xvid_image_t input; /* [in] input image & colorspace */ + xvid_image_t output; /* [in] output image & colorspace */ + int width; /* [in] width */ + int height; /* [in] height */ + int interlacing; /* [in] interlacing */ } xvid_gbl_convert_t; -#define XVID_GBL_INIT 0 /* initialize xvidcore; must be called before using xvid_decore, or xvid_encore) */ -#define XVID_GBL_INFO 1 /* return some info about xvidcore, and the host computer */ -#define XVID_GBL_CONVERT 2 /* colorspace conversion utility */ -#define XVID_GBL_TEST 3 /* testing.. */ +#define XVID_GBL_INIT 0 /* initialize xvidcore; must be called before using xvid_decore, or xvid_encore) */ +#define XVID_GBL_INFO 1 /* return some info about xvidcore, and the host computer */ +#define XVID_GBL_CONVERT 2 /* colorspace conversion utility */ -int xvid_global(void *handle, int opt, void *param1, void *param2); +extern int xvid_global(void *handle, int opt, void *param1, void *param2); /***************************************************************************** * xvid_decore() ****************************************************************************/ -#define XVID_DEC_CREATE 0 /* create decore instance; return 0 on success */ -#define XVID_DEC_DESTROY 1 /* destroy decore instance: return 0 on success */ -#define XVID_DEC_DECODE 2 /* decode a frame: returns number of bytes consumed >= 0 */ +#define XVID_DEC_CREATE 0 /* create decore instance; return 0 on success */ +#define XVID_DEC_DESTROY 1 /* destroy decore instance: return 0 on success */ +#define XVID_DEC_DECODE 2 /* decode a frame: returns number of bytes consumed >= 0 */ -int xvid_decore(void *handle, int 
opt, void *param1, void *param2); +extern int xvid_decore(void *handle, int opt, void *param1, void *param2); -/* XVID_DEC_CREATE param 1 +/* XVID_DEC_CREATE param 1 image width & height may be specified here when the dimensions are known in advance. */ typedef struct { int version; - int width; /* [in:opt] image width */ - int height; /* [in:opt] image width */ - void * handle; /* [out] decore context handle */ + int width; /* [in:opt] image width */ + int height; /* [in:opt] image width */ + void * handle; /* [out] decore context handle */ } xvid_dec_create_t; /* XVID_DEC_DECODE param1 */ /* general flags */ -#define XVID_LOWDELAY 0x00000001 /* lowdelay mode */ -#define XVID_DISCONTINUITY 0x00000002 /* indicates break in stream */ +#define XVID_LOWDELAY (1<<0) /* lowdelay mode */ +#define XVID_DISCONTINUITY (1<<1) /* indicates break in stream */ +#define XVID_DEBLOCKY (1<<2) /* perform luma deblocking */ +#define XVID_DEBLOCKUV (1<<3) /* perform chroma deblocking */ +#define XVID_FILMEFFECT (1<<4) /* adds film grain */ typedef struct { int version; - int general; /* [in:opt] general flags */ - void *bitstream; /* [in] bitstream (read from)*/ - int length; /* [in] bitstream length */ - xvid_image_t output; /* [in] output image (written to) */ -} -xvid_dec_frame_t; + int general; /* [in:opt] general flags */ + void *bitstream; /* [in] bitstream (read from)*/ + int length; /* [in] bitstream length */ + xvid_image_t output; /* [in] output image (written to) */ +} xvid_dec_frame_t; /* XVID_DEC_DECODE param2 :: optional */ typedef struct { int version; - int type; /* [out] output data type */ + + int type; /* [out] output data type */ union { - struct { /* type>0 {XVID_TYPE_IVOP,XVID_TYPE_PVOP,XVID_TYPE_BVOP,XVID_TYPE_SVOP} */ - int general; /* [out] flags */ - int time_base; /* [out] time base */ - int time_increment; /* [out] time increment */ + struct { /* type>0 {XVID_TYPE_IVOP,XVID_TYPE_PVOP,XVID_TYPE_BVOP,XVID_TYPE_SVOP} */ + int general; /* [out] flags */ + int 
time_base; /* [out] time base */ + int time_increment; /* [out] time increment */ /* XXX: external deblocking stuff */ - int * qscale; /* [out] pointer to quantizer table */ - int qscale_stride; /* [out] quantizer scale stride */ + int * qscale; /* [out] pointer to quantizer table */ + int qscale_stride; /* [out] quantizer scale stride */ } vop; struct { /* XVID_TYPE_VOL */ - int general; /* [out] flags */ - int width; /* [out] width */ - int height; /* [out] height */ - int par; /* [out] picture aspect ratio (refer to XVID_PAR_xxx above) */ - int par_width; /* [out] aspect ratio width */ - int par_height; /* [out] aspect ratio height */ + int general; /* [out] flags */ + int width; /* [out] width */ + int height; /* [out] height */ + int par; /* [out] pixel aspect ratio (refer to XVID_PAR_xxx above) */ + int par_width; /* [out] aspect ratio width [1..255] */ + int par_height; /* [out] aspect ratio height [1..255] */ } vol; } data; } xvid_dec_stats_t; +#define XVID_ZONE_QUANT (1<<0) +#define XVID_ZONE_WEIGHT (1<<1) + +typedef struct +{ + int frame; + int mode; + int increment; + int base; +} xvid_enc_zone_t; + + +/*---------------------------------------------------------------------------- + * xvid_enc_stats_t structure + * + * Used in: + * - xvid_plg_data_t structure + * - optional parameter in xvid_encore() function + * + * .coding_type = XVID_TYPE_NOTHING if the stats are not given + *--------------------------------------------------------------------------*/ + +typedef struct { + int version; + + /* encoding parameters */ + int type; /* [out] coding type */ + int quant; /* [out] frame quantizer */ + int vol_flags; /* [out] vol flags (see above) */ + int vop_flags; /* [out] vop flags (see above) */ + + /* bitrate */ + int length; /* [out] frame length */ + + int hlength; /* [out] header length (bytes) */ + int kblks; /* [out] number of blocks compressed as Intra */ + int mblks; /* [out] number of blocks compressed as Inter */ + int ublks; /* [out] number of 
blocks marked as not_coded */ + + int sse_y; /* [out] Y plane's sse */ + int sse_u; /* [out] U plane's sse */ + int sse_v; /* [out] V plane's sse */ +} xvid_enc_stats_t; /***************************************************************************** xvid plugin system -- internals @@ -264,71 +342,99 @@ xvidcore will call XVID_PLG_DESTROY during XVID_ENC_DESTROY ****************************************************************************/ -#define XVID_PLG_CREATE 0 -#define XVID_PLG_DESTROY 1 -#define XVID_PLG_INFO 2 -#define XVID_PLG_BEFORE 3 -#define XVID_PLG_AFTER 4 + +#define XVID_PLG_CREATE (1<<0) +#define XVID_PLG_DESTROY (1<<1) +#define XVID_PLG_INFO (1<<2) +#define XVID_PLG_BEFORE (1<<3) +#define XVID_PLG_FRAME (1<<4) +#define XVID_PLG_AFTER (1<<5) /* xvid_plg_info_t.flags */ -#define XVID_REQORIGINAL 1 /* plugin requires a copy of the original (uncompressed) image */ -#define XVID_REQPSNR 2 /* plugin requires psnr between the uncompressed and compressed image*/ -#define XVID_REQDQUANTS 3 /* plugin requires access to the dquant table */ +#define XVID_REQORIGINAL (1<<0) /* plugin requires a copy of the original (uncompressed) image */ +#define XVID_REQPSNR (1<<1) /* plugin requires psnr between the uncompressed and compressed image*/ +#define XVID_REQDQUANTS (1<<2) /* plugin requires access to the dquant table */ typedef struct { - int version; - int flags; /* plugin flags */ + int version; + int flags; /* [in:opt] plugin flags */ } xvid_plg_info_t; typedef struct { - int version; + int version; + + int num_zones; /* [out] */ + xvid_enc_zone_t * zones; /* [out] */ - int width; - int height; - int mb_width; - int mb_height; - int fincr; - int fbase; + int width; /* [out] */ + int height; /* [out] */ + int mb_width; /* [out] */ + int mb_height; /* [out] */ + int fincr; /* [out] */ + int fbase; /* [out] */ - void * param; + void * param; /* [out] */ } xvid_plg_create_t; typedef struct { - int version; + int version; + + int num_frames; /* [out] total frame 
encoded */ +} xvid_plg_destroy_t; + +typedef struct +{ + int version; + + xvid_enc_zone_t * zone; /* [out] current zone */ - int width; /* [out] */ - int height; /* [out] */ - int mb_width; /* [out] */ - int mb_height; /* [out] */ + int width; /* [out] */ + int height; /* [out] */ + int mb_width; /* [out] */ + int mb_height; /* [out] */ int fincr; /* [out] */ - int fbase; /* [out] */ - - xvid_image_t reference; /* [out] -> [out] */ - xvid_image_t current; /* [out] -> [in,out] */ - xvid_image_t original; /* [out] after: points the original (uncompressed) copy of the current frame */ - int frame_num; /* [out] frame number */ - - int type; /* [in,out] */ - int quant; /* [in,out] */ - - int * dquant; /* [in,out] pointer to diff quantizer table */ - int dquant_stride; /* [in,out] diff quantizer stride */ - - int vop_flags; /* [in,out] */ - int vol_flags; /* [in,out] */ - int motion_flags; /* [in,out] */ - - int length; /* [out] after: length of encoded frame */ - int kblks, mblks, ublks; /* [out] after: */ - int sse_y, sse_u, sse_v; /* [out] */ -} xvid_plg_data_t; + int fbase; /* [out] */ + + int min_quant[3]; /* [out] */ + int max_quant[3]; /* [out] */ + + xvid_image_t reference; /* [out] -> [out] */ + xvid_image_t current; /* [out] -> [in,out] */ + xvid_image_t original; /* [out] after: points the original (uncompressed) copy of the current frame */ + int frame_num; /* [out] frame number */ + + int type; /* [in,out] */ + int quant; /* [in,out] */ + + int * dquant; /* [in,out] pointer to diff quantizer table */ + int dquant_stride; /* [in,out] diff quantizer stride */ + + int vop_flags; /* [in,out] */ + int vol_flags; /* [in,out] */ + int motion_flags; /* [in,out] */ + +/* Deprecated, use the stats field instead. 
+ * Will disapear before 1.0 */ + int length; /* [out] after: length of encoded frame */ + int kblks; /* [out] number of blocks compressed as Intra */ + int mblks; /* [out] number of blocks compressed as Inter */ + int ublks; /* [out] number of blocks marked not_coded */ + int sse_y; /* [out] Y plane's sse */ + int sse_u; /* [out] U plane's sse */ + int sse_v; /* [out] V plane's sse */ +/* End of duplicated data, kept only for binary compatibility */ + int bquant_ratio; /* [in] */ + int bquant_offset; /* [in] */ + + xvid_enc_stats_t stats; /* [out] frame statistics */ +} xvid_plg_data_t; /***************************************************************************** xvid plugin system -- external @@ -344,7 +450,7 @@ plugins[0].param = NULL; plugins[1].func = xvid_cbr_func; plugins[1].param = &cbr_data; - + create.num_plugins = 2; create.plugins = plugins; @@ -354,235 +460,312 @@ typedef struct { - xvid_plugin_func * func; - void * param; + xvid_plugin_func * func; + void * param; } xvid_enc_plugin_t; -xvid_plugin_func xvid_plugin_psnr; /* write psnr values to stdout */ -xvid_plugin_func xvid_plugin_dump; /* dump before and after yuvpgms */ -xvid_plugin_func xvid_plugin_lumimasking; /* lumimasking */ +extern xvid_plugin_func xvid_plugin_single; /* single-pass rate control */ +extern xvid_plugin_func xvid_plugin_2pass1; /* two-pass rate control: first pass */ +extern xvid_plugin_func xvid_plugin_2pass2; /* two-pass rate control: second pass */ -/***************************************************************************** - * xvid_encore() - ****************************************************************************/ +extern xvid_plugin_func xvid_plugin_lumimasking; /* lumimasking */ -/* Encoder options */ -#define XVID_ENC_CREATE 0 /* create encoder instance; returns 0 on success */ -#define XVID_ENC_DESTROY 1 /* destroy encoder instance; returns 0 on success */ -#define XVID_ENC_ENCODE 2 /* encode a frame: returns number of ouput bytes - 0 means this frame should 
not be written (ie. encoder lag) */ +extern xvid_plugin_func xvid_plugin_psnr; /* write psnr values to stdout */ +extern xvid_plugin_func xvid_plugin_dump; /* dump before and after yuvpgms */ -int xvid_encore(void *handle, int opt, void *param1, void *param2); - -/* global flags */ -typedef enum +/* single pass rate control + * CBR and Constant quantizer modes */ +typedef struct { - XVID_PACKED = 0x00000001, /* packed bitstream */ - XVID_CLOSED_GOP = 0x00000002, /* closed_gop: was DX50BVOP dx50 bvop compatibility */ - XVID_EXTRASTATS_ENABLE = 0x00000004 -/*define XVID_VOL_AT_IVOP 0x00000008 write vol at every ivop: WIN32/divx compatibility */ -/*define XVID_FORCE_VOL 0x00000008 XXX: when vol-based parameters are changed, insert an ivop NOT recommended */ -} xvid_global_t; - - -/* XVID_ENC_ENCODE param1 */ -/* vol-based flags */ -typedef enum { - XVID_MPEGQUANT = 0x00000001, - XVID_EXTRASTATS = 0x00000002, - XVID_QUARTERPEL = 0x00000004, /* enable quarterpel: frames will encoded as quarterpel */ - XVID_GMC = 0x00000008, /* enable GMC; frames will be checked for gmc suitability */ - XVID_REDUCED_ENABLE = 0x00000010, /* enable reduced resolution vops: frames will be checked for rrv suitability */ - XVID_INTERLACING = 0x00000400, /* enable interlaced encoding */ -} xvid_vol_t; + int version; + int bitrate; /* [in] bits per second */ + int reaction_delay_factor; /* [in] */ + int averaging_period; /* [in] */ + int buffer; /* [in] */ +} xvid_plugin_single_t; -/* vop-based flags */ -typedef enum { - XVID_DEBUG = 0x00000001, - XVID_HALFPEL = 0x00000004, /* use halfpel interpolation */ - XVID_INTER4V = 0x00000008, - - XVID_CHROMAOPT = 0x00000020, /* enable chroma optimization pre-filter */ - XVID_GREYSCALE = 0x00000040, /* enable greyscale only mode (even for - color input material chroma is ignored) */ - XVID_HQACPRED = 0x00000080, /* 20030209: high quality ac prediction */ - XVID_MODEDECISION_BITS = 0x00000100, /* enable DCT-ME and use it for mode decision */ - 
XVID_DYNAMIC_BFRAMES = 0x00000200, +typedef struct { + int version; - /* only valid for vol_flags|=XVID_INTERLACING */ - XVID_TOPFIELDFIRST = 0x00000400, /* set top-field-first flag */ - XVID_ALTERNATESCAN = 0x00000800, /* set alternate vertical scan flag */ + char * filename; +} xvid_plugin_2pass1_t; - /* only valid for vol_flags|=XVID_REDUCED_ENABLED */ - XVID_REDUCED = 0x00001000, /* reduced resolution vop */ -} xvid_vop_t; +#define XVID_PAYBACK_BIAS 0 /* payback with bias */ +#define XVID_PAYBACK_PROP 1 /* payback proportionally */ -typedef enum { - PMV_ADVANCEDDIAMOND16 = 0x00008000, /* use advdiamonds instead of diamonds as search pattern */ - PMV_USESQUARES16 = 0x00800000, /* use squares instead of diamonds as search pattern */ +typedef struct { + int version; - PMV_HALFPELREFINE16 = 0x00020000, - PMV_HALFPELREFINE8 = 0x02000000, + int bitrate; /* [in] bits per second */ + char * filename; /* [in] first pass stats filename */ - PMV_QUARTERPELREFINE16 = 0x00040000, - PMV_QUARTERPELREFINE8 = 0x04000000, + int keyframe_boost; /* [in] keyframe boost percentage: [0..100] */ + int curve_compression_high; /* [in] percentage of compression performed on the high part of the curve (above average) */ + int curve_compression_low; /* [in] percentage of compression performed on the low part of the curve (below average) */ + int overflow_control_strength;/* [in] Payback delay expressed in number of frames */ + int max_overflow_improvement; /* [in] percentage of allowed range for a frame that gets bigger because of overflow bonus */ + int max_overflow_degradation; /* [in] percentage of allowed range for a frame that gets smaller because of overflow penalty */ + + int kfreduction; /* [in] maximum bitrate reduction applied to an iframe under the kfthreshold distance limit */ + int kfthreshold; /* [in] if an iframe is closer to the next iframe than this distance, a quantity of bits + * is substracted from its bit allocation. 
The reduction is computed as multiples of + * kfreduction/kthreshold. It reaches kfreduction when the distance == kfthreshold, + * 0 for 1global field during instance + * creation (operation XVID_ENC_CREATE) + *--------------------------------------------------------------------------*/ + +#define XVID_GLOBAL_PACKED (1<<0) /* packed bitstream */ +#define XVID_GLOBAL_CLOSED_GOP (1<<1) /* closed_gop: was DX50BVOP dx50 bvop compatibility */ +#define XVID_GLOBAL_EXTRASTATS_ENABLE (1<<2) +#if 0 +#define XVID_GLOBAL_VOL_AT_IVOP (1<<3) /* write vol at every ivop: WIN32/divx compatibility */ +#define XVID_GLOBAL_FORCE_VOL (1<<4) /* when vol-based parameters are changed, insert an ivop NOT recommended */ +#endif - xvid_global_t global; /* [in:opt] global flags; controls encoding behavior */ -/* --- vol-based stuff; included here for conveinience */ - int fincr; /* [in:opt] framerate increment; set to zero for variable framerate */ - int fbase; /* [in] framerate base - frame_duration = fincr/fbase seconds*/ -/* ^^^---------------------------------------------- */ +/*---------------------------------------------------------------------------- + * "VOL" flags + * + * These flags are used for xvid_enc_frame_t->vol_flags field during frame + * encoding (operation XVID_ENC_ENCODE) + *--------------------------------------------------------------------------*/ + +#define XVID_VOL_MPEGQUANT (1<<0) /* enable MPEG type quantization */ +#define XVID_VOL_EXTRASTATS (1<<1) /* enable plane sse stats */ +#define XVID_VOL_QUARTERPEL (1<<2) /* enable quarterpel: frames will encoded as quarterpel */ +#define XVID_VOL_GMC (1<<3) /* enable GMC; frames will be checked for gmc suitability */ +#define XVID_VOL_REDUCED_ENABLE (1<<4) /* enable reduced resolution vops: frames will be checked for rrv suitability */ +#define XVID_VOL_INTERLACING (1<<5) /* enable interlaced encoding */ -/* ---vop-based; included here for conveienience */ - int max_key_interval; /* [in:opt] the maximum interval between 
key frames */ - /*XXX: maybe call it gop_size? */ +/*---------------------------------------------------------------------------- + * "VOP" flags + * + * These flags are used for xvid_enc_frame_t->vop_flags field during frame + * encoding (operation XVID_ENC_ENCODE) + *--------------------------------------------------------------------------*/ + +/* Always valid */ +#define XVID_VOP_DEBUG (1<< 0) /* print debug messages in frames */ +#define XVID_VOP_HALFPEL (1<< 1) /* use halfpel interpolation */ +#define XVID_VOP_INTER4V (1<< 2) /* use 4 motion vectors per MB */ +#define XVID_VOP_TRELLISQUANT (1<< 3) /* use trellis based R-D "optimal" quantization */ +#define XVID_VOP_CHROMAOPT (1<< 4) /* enable chroma optimization pre-filter */ +#define XVID_VOP_CARTOON (1<< 5) /* use 'cartoon mode' */ +#define XVID_VOP_GREYSCALE (1<< 6) /* enable greyscale only mode (even for color input material chroma is ignored) */ +#define XVID_VOP_HQACPRED (1<< 7) /* high quality ac prediction */ +#define XVID_VOP_MODEDECISION_RD (1<< 8) /* enable DCT-ME and use it for mode decision */ +#define XVID_VOP_FAST_MODEDECISION_RD (1<<12) /* use simplified R-D mode decision */ + +/* Only valid for vol_flags|=XVID_VOL_INTERLACING */ +#define XVID_VOP_TOPFIELDFIRST (1<< 9) /* set top-field-first flag */ +#define XVID_VOP_ALTERNATESCAN (1<<10) /* set alternate vertical scan flag */ - int frame_drop_ratio; /* [in:opt] frame dropping: 0=drop none... 
100=drop all */ +/* only valid for vol_flags|=XVID_VOL_REDUCED_ENABLED */ +#define XVID_VOP_REDUCED (1<<11) /* reduced resolution vop */ - int bquant_ratio; /* [in:opt] bframe quantizer multipier/offeset; used to decide bframes quant when bquant==-1 */ - int bquant_offset; /* bquant = (avg(past_ref_quant,future_ref_quant)*bquant_ratio + bquant_offset) / 100 */ -/* ^^^ -------------------------------------------------------------------------*/ +/*---------------------------------------------------------------------------- + * "Motion" flags + * + * These flags are used for xvid_enc_frame_t->motion field during frame + * encoding (operation XVID_ENC_ENCODE) + *--------------------------------------------------------------------------*/ + +/* Motion Estimation Search Patterns */ +#define XVID_ME_ADVANCEDDIAMOND16 (1<< 0) /* use advdiamonds instead of diamonds as search pattern */ +#define XVID_ME_ADVANCEDDIAMOND8 (1<< 1) /* use advdiamond for XVID_ME_EXTSEARCH8 */ +#define XVID_ME_USESQUARES16 (1<< 2) /* use squares instead of diamonds as search pattern */ +#define XVID_ME_USESQUARES8 (1<< 3) /* use square for XVID_ME_EXTSEARCH8 */ + +/* SAD operator based flags */ +#define XVID_ME_HALFPELREFINE16 (1<< 4) +#define XVID_ME_HALFPELREFINE8 (1<< 6) +#define XVID_ME_QUARTERPELREFINE16 (1<< 7) +#define XVID_ME_QUARTERPELREFINE8 (1<< 8) +#define XVID_ME_GME_REFINE (1<< 9) +#define XVID_ME_EXTSEARCH16 (1<<10) /* extend PMV by more searches */ +#define XVID_ME_EXTSEARCH8 (1<<11) /* use diamond/square for extended 8x8 search */ +#define XVID_ME_CHROMA_PVOP (1<<12) /* also use chroma for P_VOP/S_VOP ME */ +#define XVID_ME_CHROMA_BVOP (1<<13) /* also use chroma for B_VOP ME */ +#define XVID_ME_FASTREFINE16 (1<<25) /* use low-complexity refinement functions */ +#define XVID_ME_FASTREFINE8 (1<<29) /* low-complexity 8x8 sub-block refinement */ + +/* Rate Distortion based flags + * Valid when XVID_VOP_MODEDECISION_RD is enabled */ +#define XVID_ME_HALFPELREFINE16_RD (1<<14) /* 
perform RD-based halfpel refinement */ +#define XVID_ME_HALFPELREFINE8_RD (1<<15) /* perform RD-based halfpel refinement for 8x8 mode */ +#define XVID_ME_QUARTERPELREFINE16_RD (1<<16) /* perform RD-based qpel refinement */ +#define XVID_ME_QUARTERPELREFINE8_RD (1<<17) /* perform RD-based qpel refinement for 8x8 mode */ +#define XVID_ME_EXTSEARCH_RD (1<<18) /* perform RD-based search using square pattern enable XVID_ME_EXTSEARCH8 to do this in 8x8 search as well */ +#define XVID_ME_CHECKPREDICTION_RD (1<<19) /* always check vector equal to prediction */ + +/* Other */ +#define XVID_ME_DETECT_STATIC_MOTION (1<<24) /* speed-up ME by detecting stationary scenes */ +#define XVID_ME_SKIP_DELTASEARCH (1<<26) /* speed-up by skipping b-frame delta search */ +#define XVID_ME_FAST_MODEINTERPOLATE (1<<27) /* speed-up by partly skipping interpolate mode */ +#define XVID_ME_BFRAME_EARLYSTOP (1<<28) /* speed-up by early exiting b-search */ + +/* Unused */ +#define XVID_ME_UNRESTRICTED16 (1<<20) /* unrestricted ME, not implemented */ +#define XVID_ME_OVERLAPPING16 (1<<21) /* overlapping ME, not implemented */ +#define XVID_ME_UNRESTRICTED8 (1<<22) /* unrestricted ME, not implemented */ +#define XVID_ME_OVERLAPPING8 (1<<23) /* overlapping ME, not implemented */ - void *handle; /* [out] encoder instance handle */ -} -xvid_enc_create_t; +/*---------------------------------------------------------------------------- + * xvid_enc_create_t structure definition + * + * This structure is passed as param1 during an instance creation (operation + * XVID_ENC_CREATE) + *--------------------------------------------------------------------------*/ typedef struct { - int version; - int type; /* [in] rate control type: XVID_RC_xxx */ + int version; - /* common stuff */ - int min_iquant; /* [in:opt] ivop quantizer upper/lower limit */ - int max_iquant; /* [in:opt] */ - int min_pquant; /* [in:opt] psvop quantizer upper/lower limit */ - int max_pquant; /* [in:opt] */ - int min_bquant; /* [in:opt] 
bvop quantizer upper/lower limit */ - int max_bquant; /* [in:opt] */ - - union { - struct { /* XVID_RC_FQUANT */ - float quant; /* [in] quantizer */ - } fquant; - struct { /* XVID_RC_CBR */ - int bitrate; /* [in] the bitrate of the target encoded stream, in bits/second */ - int reaction_delay_factor; /* [in] how fast the rate control reacts - lower values are faster */ - int averaging_period; /* [in] */ - int buffer; /* [in] */ - } cbr; - } data; -} xvid_enc_rc_t; + int profile; /* [in] profile@level; refer to XVID_PROFILE_xxx */ + int width; /* [in] frame dimensions; width, pixel units */ + int height; /* [in] frame dimensions; height, pixel units */ + int num_zones; /* [in:opt] number of bitrate zones */ + xvid_enc_zone_t * zones; /* ^^ zone array */ + int num_plugins; /* [in:opt] number of plugins */ + xvid_enc_plugin_t * plugins; /* ^^ plugin array */ -#define XVID_KEYFRAME 0x00000001 + int num_threads; /* [in:opt] number of threads */ + int max_bframes; /* [in:opt] max sequential bframes (0=disable bframes) */ -typedef struct { - int version; + int global; /* [in:opt] global flags; controls encoding behavior */ -/* --- VOL related stuff; unless XVID_FORCEVOL is set, the encoder will not react to any - changes here until the next VOL (keyframe). 
*/ - xvid_vol_t vol_flags; /* [in] vol flags */ - unsigned char * - quant_intra_matrix; /* [in:opt] custom intra qmatrix */ - unsigned char * - quant_inter_matrix; /* [in:opt] custom inter qmatrix */ + /* --- vol-based stuff; included here for convenience */ + int fincr; /* [in:opt] framerate increment; set to zero for variable framerate */ + int fbase; /* [in] framerate base frame_duration = fincr/fbase seconds*/ + /* ---------------------------------------------- */ - int par; /* [in:opt] picture aspect ratio (refer to XVID_PAR_xxx above) */ - int par_width; /* [in:opt] aspect ratio width */ - int par_height; /* [in:opt] aspect ratio height */ -/* ^^^----------------------------------------------------------------------------------*/ + /* --- vop-based; included here for convenience */ + int max_key_interval; /* [in:opt] the maximum interval between key frames */ - int fincr; /* framerate increment, for variable framerate only */ - xvid_vop_t vop_flags; /* [in] (general)vop-based flags */ - xvid_motion_t motion; /* [in] ME options */ + int frame_drop_ratio; /* [in:opt] frame dropping: 0=drop none... 
100=drop all */ - xvid_image_t input; /* [in] input image (read from) */ - - int type; /* [in:opt] coding type */ - int quant; /* [in] frame quantizer; if <=0, automatatic (ratecontrol) */ + int bquant_ratio; /* [in:opt] bframe quantizer multiplier/offset; used to decide bframes quant when bquant==-1 */ + int bquant_offset; /* bquant = (avg(past_ref_quant,future_ref_quant)*bquant_ratio + bquant_offset) / 100 */ - void *bitstream; /* [in:opt] bitstream ptr (written to)*/ - int length; /* [in:opt] bitstream length (bytes) */ + int min_quant[3]; /* [in:opt] */ + int max_quant[3]; /* [in:opt] */ + /* ---------------------------------------------- */ - int out_flags; /* [out] bitstream output flags */ -} -xvid_enc_frame_t; + void *handle; /* [out] encoder instance handle */ +} xvid_enc_create_t; -/* XVID_ENC_ENCODE param2 (optional) - xvid_enc_stats_t describes individual frame details - - coding_type==XVID_TYPE_NOTHING if the stats are not given -*/ +/*---------------------------------------------------------------------------- + * xvid_enc_frame_t structure definition + * + * This structure is passed as param1 during a frame encoding (operation + * XVID_ENC_ENCODE) + *--------------------------------------------------------------------------*/ + +/* out value for the frame structure->type field + * unlike stats output in param2, this field is not asynchronous and tells + * the client app whether the frame written into the stream buffer is an ivop; + * usually used for indexing purposes in the container */ +#define XVID_KEYFRAME (1<<1) + +/* The structure */ typedef struct { int version; - /* encoding parameters */ - int type; /* [out] coding type */ - int quant; /* [out] frame quantizer */ - xvid_vol_t vol_flags; /* [out] vol flags (see above) */ - int vop_flags; /* [out] vop flags (see above) */ - /* bitrate */ - int length; /* [out] frame length */ + /* VOL related stuff + * unless XVID_FORCEVOL is set, the encoder will not react to any changes + * here until the next VOL
(keyframe). */ - int hlength; /* [out] header length (bytes) */ - int kblks, mblks, ublks; /* [out] */ + int vol_flags; /* [in] vol flags */ + unsigned char *quant_intra_matrix; /* [in:opt] custom intra qmatrix */ + unsigned char *quant_inter_matrix; /* [in:opt] custom inter qmatrix */ - int sse_y, sse_u, sse_v; -} -xvid_enc_stats_t; + int par; /* [in:opt] pixel aspect ratio (refer to XVID_PAR_xxx above) */ + int par_width; /* [in:opt] aspect ratio width */ + int par_height; /* [in:opt] aspect ratio height */ + + /* Other fields that can change on a per-frame basis */ + + int fincr; /* [in:opt] framerate increment, for variable framerate only */ + int vop_flags; /* [in] (general)vop-based flags */ + int motion; /* [in] ME options */ + + xvid_image_t input; /* [in] input image (read from) */ + + int type; /* [in:opt] coding type */ + int quant; /* [in] frame quantizer; if <=0, automatic (ratecontrol) */ + int bframe_threshold; + + void *bitstream; /* [in:opt] bitstream ptr (written to)*/ + int length; /* [in:opt] bitstream length (bytes) */ + + int out_flags; /* [out] bitstream output flags */ +} xvid_enc_frame_t; #ifdef __cplusplus } #endif - #endif