[cvs] / xvidcore / src / xvid.c Repository:
ViewVC logotype

Diff of /xvidcore/src/xvid.c

Parent Directory Parent Directory | Revision Log Revision Log | View Patch Patch

revision 1.11, Sat Apr 13 16:30:01 2002 UTC revision 1.23, Wed Jun 26 15:59:51 2002 UTC
# Line 1  Line 1 
1  /**************************************************************************  /*****************************************************************************
2   *   *
3   *      XVID MPEG-4 VIDEO CODEC   *      XVID MPEG-4 VIDEO CODEC
4   *      native api   *  - Native API implementation  -
5   *   *
6   *      This program is an implementation of a part of one or more MPEG-4   *      This program is an implementation of a part of one or more MPEG-4
7   *      Video tools as specified in ISO/IEC 14496-2 standard.  Those intending   *      Video tools as specified in ISO/IEC 14496-2 standard.  Those intending
# Line 24  Line 24 
24   *   *
25   *      You should have received a copy of the GNU General Public License   *      You should have received a copy of the GNU General Public License
26   *      along with this program; if not, write to the Free Software   *      along with this program; if not, write to the Free Software
27   *      Foundation, Inc., 675 Mass Ave, Cambridge, MA 02139, USA.   *  Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA  02111-1307 USA
28   *   *
29   *************************************************************************/   ****************************************************************************/
30    /*****************************************************************************
 /**************************************************************************  
31   *   *
32   *      History:   *  History
33   *   *
34   *      17.03.2002      Added interpolate8x8_halfpel_hv_xmm   *      - 23.06.2002    added XVID_CPU_CHKONLY
35   *  22.12.2001  API change: added xvid_init() - Isibaar   *  - 17.03.2002        Added interpolate8x8_halfpel_hv_xmm
36   *      16.12.2001      initial version; (c)2001 peter ross <pross@cs.rmit.edu.au>   *  - 22.12.2001  API change: added xvid_init() - Isibaar
37     *  - 16.12.2001        initial version; (c)2001 peter ross <pross@cs.rmit.edu.au>
38   *   *
39   *************************************************************************/   *  $Id$
40     *
41     ****************************************************************************/
42    
43  #include "xvid.h"  #include "xvid.h"
44  #include "decoder.h"  #include "decoder.h"
# Line 55  Line 56 
56  #include "utils/timer.h"  #include "utils/timer.h"
57  #include "bitstream/mbcoding.h"  #include "bitstream/mbcoding.h"
58    
59  int xvid_init(void *handle, int opt, void *param1, void *param2)  /*****************************************************************************
60     * XviD Init Entry point
61     *
62     * This function initializes all internal function pointers according
63     * to the CPU features forced by the library client or autodetected (depending
64     * on the XVID_CPU_FORCE flag). It also initializes vlc coding tables and all
65     * image colorspace transformation tables.
66     *
67     * Returned value : XVID_ERR_OK
68     *                  + API_VERSION in the input XVID_INIT_PARAM structure
69     *                  + core build  "   "    "       "               "
70     *
71     ****************************************************************************/
72    
73    int
74    xvid_init(void *handle,
75                      int opt,
76                      void *param1,
77                      void *param2)
78  {  {
79          int cpu_flags;          int cpu_flags;
80          XVID_INIT_PARAM *init_param;          XVID_INIT_PARAM *init_param;
81    
82          init_param = (XVID_INIT_PARAM *) param1;          init_param = (XVID_INIT_PARAM *) param1;
83    
84          // force specific cpu settings?          /* Inform the client of the API version */
85          if((init_param->cpu_flags & XVID_CPU_FORCE) > 0)          init_param->api_version = API_VERSION;
86    
87            /* Inform the client of the core build - unused because we're still alpha */
88            init_param->core_build = 1000;
89    
90            if ((init_param->cpu_flags & XVID_CPU_CHKONLY))
91            {
92                    init_param->cpu_flags = check_cpu_features();
93                    return XVID_ERR_OK;
94            }
95    
96            /* Do we have to force CPU features  ? */
97            if ((init_param->cpu_flags & XVID_CPU_FORCE) > 0) {
98                  cpu_flags = init_param->cpu_flags;                  cpu_flags = init_param->cpu_flags;
99          else {          } else {
100    
 #ifdef ARCH_X86  
101                  cpu_flags = check_cpu_features();                  cpu_flags = check_cpu_features();
 #else  
                 cpu_flags = 0;  
 #endif  
102                  init_param->cpu_flags = cpu_flags;                  init_param->cpu_flags = cpu_flags;
103          }          }
104    
105          // initialize the function pointers          /* Initialize the function pointers */
106          idct_int32_init();          idct_int32_init();
107          init_vlc_tables();          init_vlc_tables();
108    
109            /* Fixed Point Forward/Inverse DCT transformations */
110          fdct = fdct_int32;          fdct = fdct_int32;
111          idct = idct_int32;          idct = idct_int32;
112    
113            /* Only needed on PPC Altivec archs */
114          sadInit = 0;          sadInit = 0;
115    
116            /* Restore FPU context : emms_c is a no-op function */
117          emms = emms_c;          emms = emms_c;
118    
119            /* Quantization functions */
120          quant_intra = quant_intra_c;          quant_intra = quant_intra_c;
121          dequant_intra = dequant_intra_c;          dequant_intra = dequant_intra_c;
122          quant_inter = quant_inter_c;          quant_inter = quant_inter_c;
# Line 96  Line 127 
127          quant4_inter = quant4_inter_c;          quant4_inter = quant4_inter_c;
128          dequant4_inter = dequant4_inter_c;          dequant4_inter = dequant4_inter_c;
129    
130            /* Block transfer related functions */
131          transfer_8to16copy = transfer_8to16copy_c;          transfer_8to16copy = transfer_8to16copy_c;
132          transfer_16to8copy = transfer_16to8copy_c;          transfer_16to8copy = transfer_16to8copy_c;
133          transfer_8to16sub = transfer_8to16sub_c;          transfer_8to16sub = transfer_8to16sub_c;
# Line 103  Line 135 
135          transfer_16to8add = transfer_16to8add_c;          transfer_16to8add = transfer_16to8add_c;
136          transfer8x8_copy = transfer8x8_copy_c;          transfer8x8_copy = transfer8x8_copy_c;
137    
138            /* Image interpolation related functions */
139          interpolate8x8_halfpel_h = interpolate8x8_halfpel_h_c;          interpolate8x8_halfpel_h = interpolate8x8_halfpel_h_c;
140          interpolate8x8_halfpel_v = interpolate8x8_halfpel_v_c;          interpolate8x8_halfpel_v = interpolate8x8_halfpel_v_c;
141          interpolate8x8_halfpel_hv = interpolate8x8_halfpel_hv_c;          interpolate8x8_halfpel_hv = interpolate8x8_halfpel_hv_c;
142    
143            /* Initialize internal colorspace transformation tables */
144          colorspace_init();          colorspace_init();
145    
146            /* All colorspace transformation functions User Format->YV12 */
147          rgb555_to_yv12 = rgb555_to_yv12_c;          rgb555_to_yv12 = rgb555_to_yv12_c;
148          rgb565_to_yv12 = rgb565_to_yv12_c;          rgb565_to_yv12 = rgb565_to_yv12_c;
149          rgb24_to_yv12 = rgb24_to_yv12_c;          rgb24_to_yv12 = rgb24_to_yv12_c;
# Line 117  Line 152 
152          yuyv_to_yv12 = yuyv_to_yv12_c;          yuyv_to_yv12 = yuyv_to_yv12_c;
153          uyvy_to_yv12 = uyvy_to_yv12_c;          uyvy_to_yv12 = uyvy_to_yv12_c;
154    
155            /* All colorspace transformation functions YV12->User format */
156          yv12_to_rgb555 = yv12_to_rgb555_c;          yv12_to_rgb555 = yv12_to_rgb555_c;
157          yv12_to_rgb565 = yv12_to_rgb565_c;          yv12_to_rgb565 = yv12_to_rgb565_c;
158          yv12_to_rgb24 = yv12_to_rgb24_c;          yv12_to_rgb24 = yv12_to_rgb24_c;
# Line 125  Line 161 
161          yv12_to_yuyv = yv12_to_yuyv_c;          yv12_to_yuyv = yv12_to_yuyv_c;
162          yv12_to_uyvy = yv12_to_uyvy_c;          yv12_to_uyvy = yv12_to_uyvy_c;
163    
164            /* Functions used in motion estimation algorithms */
165          calc_cbp = calc_cbp_c;          calc_cbp = calc_cbp_c;
166          sad16 = sad16_c;          sad16 = sad16_c;
167          sad16bi = sad16bi_c;          sad16bi = sad16bi_c;
# Line 133  Line 170 
170    
171  #ifdef ARCH_X86  #ifdef ARCH_X86
172          if((cpu_flags & XVID_CPU_MMX) > 0) {          if((cpu_flags & XVID_CPU_MMX) > 0) {
173    
174                    /* Forward and Inverse Discrete Cosine Transformation functions */
175                  fdct = fdct_mmx;                  fdct = fdct_mmx;
176                  idct = idct_mmx;                  idct = idct_mmx;
177    
178                    /* To restore FPU context after mmx use */
179                  emms = emms_mmx;                  emms = emms_mmx;
180    
181                    /* Quantization related functions */
182                  quant_intra = quant_intra_mmx;                  quant_intra = quant_intra_mmx;
183                  dequant_intra = dequant_intra_mmx;                  dequant_intra = dequant_intra_mmx;
184                  quant_inter = quant_inter_mmx;                  quant_inter = quant_inter_mmx;
# Line 148  Line 189 
189                  quant4_inter = quant4_inter_mmx;                  quant4_inter = quant4_inter_mmx;
190                  dequant4_inter = dequant4_inter_mmx;                  dequant4_inter = dequant4_inter_mmx;
191    
192                    /* Block related functions */
193                  transfer_8to16copy = transfer_8to16copy_mmx;                  transfer_8to16copy = transfer_8to16copy_mmx;
194                  transfer_16to8copy = transfer_16to8copy_mmx;                  transfer_16to8copy = transfer_16to8copy_mmx;
195                  transfer_8to16sub = transfer_8to16sub_mmx;                  transfer_8to16sub = transfer_8to16sub_mmx;
196                    transfer_8to16sub2 = transfer_8to16sub2_mmx;
197                  transfer_16to8add = transfer_16to8add_mmx;                  transfer_16to8add = transfer_16to8add_mmx;
198                  transfer8x8_copy = transfer8x8_copy_mmx;                  transfer8x8_copy = transfer8x8_copy_mmx;
199    
200    
201                    /* Image Interpolation related functions */
202                  interpolate8x8_halfpel_h = interpolate8x8_halfpel_h_mmx;                  interpolate8x8_halfpel_h = interpolate8x8_halfpel_h_mmx;
203                  interpolate8x8_halfpel_v = interpolate8x8_halfpel_v_mmx;                  interpolate8x8_halfpel_v = interpolate8x8_halfpel_v_mmx;
204                  interpolate8x8_halfpel_hv = interpolate8x8_halfpel_hv_mmx;                  interpolate8x8_halfpel_hv = interpolate8x8_halfpel_hv_mmx;
205    
206                    /* Image RGB->YV12 related functions */
207                  rgb24_to_yv12 = rgb24_to_yv12_mmx;                  rgb24_to_yv12 = rgb24_to_yv12_mmx;
208                  rgb32_to_yv12 = rgb32_to_yv12_mmx;                  rgb32_to_yv12 = rgb32_to_yv12_mmx;
209                  yuv_to_yv12 = yuv_to_yv12_mmx;                  yuv_to_yv12 = yuv_to_yv12_mmx;
210                  yuyv_to_yv12 = yuyv_to_yv12_mmx;                  yuyv_to_yv12 = yuyv_to_yv12_mmx;
211                  uyvy_to_yv12 = uyvy_to_yv12_mmx;                  uyvy_to_yv12 = uyvy_to_yv12_mmx;
212    
213                    /* Image YV12->RGB related functions */
214                  yv12_to_rgb24 = yv12_to_rgb24_mmx;                  yv12_to_rgb24 = yv12_to_rgb24_mmx;
215                  yv12_to_rgb32 = yv12_to_rgb32_mmx;                  yv12_to_rgb32 = yv12_to_rgb32_mmx;
216                  yv12_to_yuyv = yv12_to_yuyv_mmx;                  yv12_to_yuyv = yv12_to_yuyv_mmx;
217                  yv12_to_uyvy = yv12_to_uyvy_mmx;                  yv12_to_uyvy = yv12_to_uyvy_mmx;
218    
219                    /* Motion estimation related functions */
220                  calc_cbp = calc_cbp_mmx;                  calc_cbp = calc_cbp_mmx;
221                  sad16 = sad16_mmx;                  sad16 = sad16_mmx;
222                  sad8 = sad8_mmx;                  sad8 = sad8_mmx;
# Line 177  Line 225 
225          }          }
226    
227          if((cpu_flags & XVID_CPU_MMXEXT) > 0) {          if((cpu_flags & XVID_CPU_MMXEXT) > 0) {
228    
229                    /* Inverse DCT */
230                  idct = idct_xmm;                  idct = idct_xmm;
231    
232                    /* Interpolation */
233                  interpolate8x8_halfpel_h = interpolate8x8_halfpel_h_xmm;                  interpolate8x8_halfpel_h = interpolate8x8_halfpel_h_xmm;
234                  interpolate8x8_halfpel_v = interpolate8x8_halfpel_v_xmm;                  interpolate8x8_halfpel_v = interpolate8x8_halfpel_v_xmm;
235                  interpolate8x8_halfpel_hv = interpolate8x8_halfpel_hv_xmm;                  interpolate8x8_halfpel_hv = interpolate8x8_halfpel_hv_xmm;
236    
237                    /* Buffer transfer */
238                    transfer_8to16sub2 = transfer_8to16sub2_xmm;
239    
240                    /* Colorspace transformation */
241                  yuv_to_yv12 = yuv_to_yv12_xmm;                  yuv_to_yv12 = yuv_to_yv12_xmm;
242    
243                    /* ME functions */
244                  sad16 = sad16_xmm;                  sad16 = sad16_xmm;
245                  sad8 = sad8_xmm;                  sad8 = sad8_xmm;
246                  dev16 = dev16_xmm;                  dev16 = dev16_xmm;
# Line 190  Line 248 
248          }          }
249    
250          if((cpu_flags & XVID_CPU_3DNOW) > 0) {          if((cpu_flags & XVID_CPU_3DNOW) > 0) {
251    
252                    /* Interpolation */
253                  interpolate8x8_halfpel_h = interpolate8x8_halfpel_h_3dn;                  interpolate8x8_halfpel_h = interpolate8x8_halfpel_h_3dn;
254                  interpolate8x8_halfpel_v = interpolate8x8_halfpel_v_3dn;                  interpolate8x8_halfpel_v = interpolate8x8_halfpel_v_3dn;
255                  interpolate8x8_halfpel_hv = interpolate8x8_halfpel_hv_3dn;                  interpolate8x8_halfpel_hv = interpolate8x8_halfpel_hv_3dn;
256          }          }
257    
258            if ((cpu_flags & XVID_CPU_SSE2) > 0) {
259    #ifdef EXPERIMENTAL_SSE2_CODE
260    
261                    /* Quantization */
262                    quant_intra   = quant_intra_sse2;
263                    dequant_intra = dequant_intra_sse2;
264                    quant_inter   = quant_inter_sse2;
265                    dequant_inter = dequant_inter_sse2;
266    
267                    /* ME */
268                    calc_cbp = calc_cbp_sse2;
269                    sad16    = sad16_sse2;
270                    dev16    = dev16_sse2;
271    
272                    /* Forward and Inverse DCT */
273                    idct  = idct_sse2;
274                    fdct = fdct_sse2;
275    #endif
276            }
277    
278    #endif
279    
280    #ifdef ARCH_IA64
281            if ((cpu_flags & XVID_CPU_IA64) > 0) { //use assembler routines?
282              idct_ia64_init();
283              fdct = fdct_ia64;
284              idct = idct_ia64;   //not yet working, crashes
285              interpolate8x8_halfpel_h = interpolate8x8_halfpel_h_ia64;
286              interpolate8x8_halfpel_v = interpolate8x8_halfpel_v_ia64;
287              interpolate8x8_halfpel_hv = interpolate8x8_halfpel_hv_ia64;
288              sad16 = sad16_ia64;
289              sad16bi = sad16bi_ia64;
290              sad8 = sad8_ia64;
291              dev16 = dev16_ia64;
292              quant_intra = quant_intra_ia64;
293              dequant_intra = dequant_intra_ia64;
294              quant_inter = quant_inter_ia64;
295              dequant_inter = dequant_inter_ia64;
296              transfer_8to16copy = transfer_8to16copy_ia64;
297              transfer_16to8copy = transfer_16to8copy_ia64;
298              transfer_8to16sub = transfer_8to16sub_ia64;
299              transfer_8to16sub2 = transfer_8to16sub2_ia64;
300              transfer_16to8add = transfer_16to8add_ia64;
301              transfer8x8_copy = transfer8x8_copy_ia64;
302              DEBUG("Using IA-64 assembler routines.\n");
303            }
304  #endif  #endif
305    
306  #ifdef ARCH_PPC  #ifdef ARCH_PPC
307  #ifdef ARCH_PPC_ALTIVEC  #ifdef ARCH_PPC_ALTIVEC
308          calc_cbp = calc_cbp_altivec;          calc_cbp = calc_cbp_altivec;
# Line 210  Line 317 
317  #endif  #endif
318  #endif  #endif
319    
         // API version  
         init_param->api_version = API_VERSION;  
   
         // something clever has to be done for this  
         init_param->core_build = 1000;  
   
320          return XVID_ERR_OK;          return XVID_ERR_OK;
321  }  }
322    
323  int xvid_decore(void * handle, int opt, void * param1, void * param2)  /*****************************************************************************
324  {   * XviD Native decoder entry point
325          switch (opt)   *
326     * This function is just a wrapper to all the option cases.
327     *
328     * Returned values : XVID_ERR_FAIL when opt is invalid
329     *                   else returns the wrapped function result
330     *
331     ****************************************************************************/
332    
333    int
334    xvid_decore(void *handle,
335                            int opt,
336                            void *param1,
337                            void *param2)
338          {          {
339            switch (opt) {
340          case XVID_DEC_DECODE :          case XVID_DEC_DECODE :
341          return decoder_decode((DECODER *) handle, (XVID_DEC_FRAME *) param1);          return decoder_decode((DECODER *) handle, (XVID_DEC_FRAME *) param1);
342    
# Line 238  Line 352 
352  }  }
353    
354    
355  int xvid_encore(void * handle, int opt, void * param1, void * param2)  /*****************************************************************************
356  {   * XviD Native encoder entry point
357          switch (opt)   *
358     * This function is just a wrapper to all the option cases.
359     *
360     * Returned values : XVID_ERR_FAIL when opt is invalid
361     *                   else returns the wrapped function result
362     *
363     ****************************************************************************/
364    
365    int
366    xvid_encore(void *handle,
367                            int opt,
368                            void *param1,
369                            void *param2)
370          {          {
371            switch (opt) {
372          case XVID_ENC_ENCODE :          case XVID_ENC_ENCODE :
373          return encoder_encode((Encoder *) handle, (XVID_ENC_FRAME *) param1, (XVID_ENC_STATS *) param2);  #ifdef BFRAMES
374                    if (((Encoder *) handle)->mbParam.max_bframes >= 0)
375                    return encoder_encode_bframes((Encoder *) handle, (XVID_ENC_FRAME *) param1,
376                                                              (XVID_ENC_STATS *) param2);
377                    else
378    #endif
379                    return encoder_encode((Encoder *) handle, (XVID_ENC_FRAME *) param1,
380                                                              (XVID_ENC_STATS *) param2);
381    
382          case XVID_ENC_CREATE :          case XVID_ENC_CREATE :
383          return encoder_create((XVID_ENC_PARAM *) param1);          return encoder_create((XVID_ENC_PARAM *) param1);

Legend:
Removed from v.1.11  
changed lines
  Added in v.1.23

No admin address has been configured
ViewVC Help
Powered by ViewVC 1.0.4