[cvs] / xvidcore / src / xvid.c Repository:
ViewVC logotype

Annotation of /xvidcore/src/xvid.c

Parent Directory Parent Directory | Revision Log Revision Log


Revision 1.31 - (view) (download)

1 : edgomez 1.16 /*****************************************************************************
2 : edgomez 1.17 *
3 :     * XVID MPEG-4 VIDEO CODEC
4 :     * - Native API implementation -
5 :     *
6 :     * This program is an implementation of a part of one or more MPEG-4
7 :     * Video tools as specified in ISO/IEC 14496-2 standard. Those intending
8 :     * to use this software module in hardware or software products are
9 :     * advised that its use may infringe existing patents or copyrights, and
10 :     * any such use would be at such party's own risk. The original
11 :     * developer of this software module and his/her company, and subsequent
12 :     * editors and their companies, will have no liability for use of this
13 :     * software or modifications or derivatives thereof.
14 :     *
15 :     * This program is free software ; you can redistribute it and/or modify
16 :     * it under the terms of the GNU General Public License as published by
17 :     * the Free Software Foundation ; either version 2 of the License, or
18 :     * (at your option) any later version.
19 :     *
20 :     * This program is distributed in the hope that it will be useful,
21 :     * but WITHOUT ANY WARRANTY ; without even the implied warranty of
22 :     * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
23 :     * GNU General Public License for more details.
24 :     *
25 :     * You should have received a copy of the GNU General Public License
26 :     * along with this program ; if not, write to the Free Software
27 :     * Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA 02111-1307 USA
28 :     *
29 :     ****************************************************************************/
30 : chenm001 1.29
31 : edgomez 1.16 /*****************************************************************************
32 : edgomez 1.17 *
33 :     * History
34 :     *
35 : suxen_drol 1.21 * - 23.06.2002 added XVID_CPU_CHKONLY
36 : edgomez 1.17 * - 17.03.2002 Added interpolate8x8_halfpel_hv_xmm
37 :     * - 22.12.2001 API change: added xvid_init() - Isibaar
38 :     * - 16.12.2001 initial version; (c)2001 peter ross <pross@cs.rmit.edu.au>
39 :     *
40 : suxen_drol 1.31 * $Id: xvid.c,v 1.30 2002/07/16 11:15:15 ia64p Exp $
41 : edgomez 1.17 *
42 :     ****************************************************************************/
43 : Isibaar 1.1
44 :     #include "xvid.h"
45 :     #include "decoder.h"
46 :     #include "encoder.h"
47 :     #include "bitstream/cbp.h"
48 :     #include "dct/idct.h"
49 :     #include "dct/fdct.h"
50 :     #include "image/colorspace.h"
51 :     #include "image/interpolate8x8.h"
52 :     #include "utils/mem_transfer.h"
53 :     #include "quant/quant_h263.h"
54 :     #include "quant/quant_mpeg4.h"
55 : ia64p 1.30 #include "motion/motion.h"
56 : Isibaar 1.1 #include "motion/sad.h"
57 :     #include "utils/emms.h"
58 :     #include "utils/timer.h"
59 : Isibaar 1.9 #include "bitstream/mbcoding.h"
60 : Isibaar 1.1
61 : suxen_drol 1.31 #if defined(ARCH_X86) && defined(EXPERIMENTAL_SSE2_CODE)
62 :    
63 :     #ifdef WIN32
64 :     #include <windows.h>
65 :     #else
66 :     #include <signal.h>
67 :     #include <setjmp.h>
68 :     #endif
69 :    
70 :    
71 :     #ifndef WIN32
72 :    
/* Jump target used by sigill_handler() to unwind back into sigill_check(). */
static jmp_buf mark;

/*
 * SIGILL handler: never returns normally, it jumps back to the location
 * recorded in `mark`, making the corresponding setjmp() yield 1.
 */
static void
sigill_handler(int signum)
{
	(void) signum;		/* the signal number itself is not needed */
	longjmp(mark, 1);
}
80 :     #endif
81 :    
82 :    
83 :     /*
84 :     calls the funcptr, and returns whether SIGILL (illegal instruction) was signalled
85 :     return values:
86 :     -1 : could not determine
87 :     0 : SIGILL was *not* signalled
88 :     1 : SIGILL was signalled
89 :     */
90 :    
91 :     int
92 :     sigill_check(void (*func)())
93 :     {
94 :     #ifdef WIN32
95 :     _try {
96 :     func();
97 :     }
98 :     _except(EXCEPTION_EXECUTE_HANDLER) {
99 :    
100 :     if (_exception_code() == STATUS_ILLEGAL_INSTRUCTION)
101 :     return 1;
102 :     }
103 :     return 0;
104 :     #else
105 :     void * old_handler;
106 :     int jmpret;
107 :    
108 :    
109 :     old_handler = signal(SIGILL, sigill_handler);
110 :     if (old_handler == SIG_ERR)
111 :     {
112 :     return -1;
113 :     }
114 :    
115 :     jmpret = setjmp(mark);
116 :     if (jmpret == 0)
117 :     {
118 :     func();
119 :     }
120 :    
121 :     signal(SIGILL, old_handler);
122 :    
123 :     return jmpret;
124 :     #endif
125 :     }
126 :     #endif
127 :    
128 : edgomez 1.16 /*****************************************************************************
129 :     * XviD Init Entry point
130 :     *
131 :     * Well this function initialize all internal function pointers according
132 :     * to the CPU features forced by the library client or autodetected (depending
133 :     * on the XVID_CPU_FORCE flag). It also initializes vlc coding tables and all
134 :     * image colorspace transformation tables.
135 :     *
136 :     * Returned value : XVID_ERR_OK
137 :     * + API_VERSION in the input XVID_INIT_PARAM structure
138 :     * + core build " " " " "
139 :     *
140 :     ****************************************************************************/
141 :    
142 : edgomez 1.15 int
143 :     xvid_init(void *handle,
144 :     int opt,
145 :     void *param1,
146 :     void *param2)
147 : Isibaar 1.1 {
148 :     int cpu_flags;
149 :     XVID_INIT_PARAM *init_param;
150 :    
151 :     init_param = (XVID_INIT_PARAM *) param1;
152 :    
153 : suxen_drol 1.21 /* Inform the client the API version */
154 :     init_param->api_version = API_VERSION;
155 :    
156 :     /* Inform the client the core build - unused because we're still alpha */
157 :     init_param->core_build = 1000;
158 :    
159 : suxen_drol 1.31 /* Do we have to force CPU features ? */
160 :     if ((init_param->cpu_flags & XVID_CPU_FORCE)) {
161 : suxen_drol 1.21
162 : Isibaar 1.1 cpu_flags = init_param->cpu_flags;
163 : suxen_drol 1.31
164 : edgomez 1.16 } else {
165 : Isibaar 1.1
166 : chenm001 1.29 cpu_flags = check_cpu_features();
167 : suxen_drol 1.31
168 :     #if defined(ARCH_X86) && defined(EXPERIMENTAL_SSE2_CODE)
169 :     if ((cpu_flags & XVID_CPU_SSE) && sigill_check(sse_os_trigger))
170 :     cpu_flags &= ~XVID_CPU_SSE;
171 :    
172 :     if ((cpu_flags & XVID_CPU_SSE2) && sigill_check(sse2_os_trigger))
173 :     cpu_flags &= ~XVID_CPU_SSE2;
174 :     #endif
175 :     }
176 :    
177 :     if ((init_param->cpu_flags & XVID_CPU_CHKONLY))
178 :     {
179 : Isibaar 1.1 init_param->cpu_flags = cpu_flags;
180 : suxen_drol 1.31 return XVID_ERR_OK;
181 : Isibaar 1.1 }
182 : suxen_drol 1.31
183 :     init_param->cpu_flags = cpu_flags;
184 :    
185 : Isibaar 1.1
186 : edgomez 1.16 /* Initialize the function pointers */
187 : Isibaar 1.1 idct_int32_init();
188 : Isibaar 1.9 init_vlc_tables();
189 :    
190 : edgomez 1.16 /* Fixed Point Forward/Inverse DCT transformations */
191 : Isibaar 1.1 fdct = fdct_int32;
192 :     idct = idct_int32;
193 :    
194 : edgomez 1.16 /* Only needed on PPC Altivec archs */
195 : canard 1.10 sadInit = 0;
196 : edgomez 1.15
197 : edgomez 1.16 /* Restore FPU context : emms_c is a nop functions */
198 : Isibaar 1.1 emms = emms_c;
199 :    
200 : edgomez 1.16 /* Quantization functions */
201 :     quant_intra = quant_intra_c;
202 : Isibaar 1.1 dequant_intra = dequant_intra_c;
203 : edgomez 1.16 quant_inter = quant_inter_c;
204 : Isibaar 1.1 dequant_inter = dequant_inter_c;
205 :    
206 : edgomez 1.16 quant4_intra = quant4_intra_c;
207 : Isibaar 1.1 dequant4_intra = dequant4_intra_c;
208 : edgomez 1.16 quant4_inter = quant4_inter_c;
209 : Isibaar 1.1 dequant4_inter = dequant4_inter_c;
210 :    
211 : edgomez 1.16 /* Block transfer related functions */
212 : Isibaar 1.1 transfer_8to16copy = transfer_8to16copy_c;
213 :     transfer_16to8copy = transfer_16to8copy_c;
214 : edgomez 1.16 transfer_8to16sub = transfer_8to16sub_c;
215 : suxen_drol 1.11 transfer_8to16sub2 = transfer_8to16sub2_c;
216 : edgomez 1.16 transfer_16to8add = transfer_16to8add_c;
217 :     transfer8x8_copy = transfer8x8_copy_c;
218 : Isibaar 1.1
219 : edgomez 1.16 /* Image interpolation related functions */
220 :     interpolate8x8_halfpel_h = interpolate8x8_halfpel_h_c;
221 :     interpolate8x8_halfpel_v = interpolate8x8_halfpel_v_c;
222 : Isibaar 1.1 interpolate8x8_halfpel_hv = interpolate8x8_halfpel_hv_c;
223 :    
224 : edgomez 1.16 /* Initialize internal colorspace transformation tables */
225 : Isibaar 1.1 colorspace_init();
226 :    
227 : edgomez 1.16 /* All colorspace transformation functions User Format->YV12 */
228 : Isibaar 1.1 rgb555_to_yv12 = rgb555_to_yv12_c;
229 :     rgb565_to_yv12 = rgb565_to_yv12_c;
230 : edgomez 1.16 rgb24_to_yv12 = rgb24_to_yv12_c;
231 :     rgb32_to_yv12 = rgb32_to_yv12_c;
232 :     yuv_to_yv12 = yuv_to_yv12_c;
233 :     yuyv_to_yv12 = yuyv_to_yv12_c;
234 :     uyvy_to_yv12 = uyvy_to_yv12_c;
235 : Isibaar 1.1
236 : edgomez 1.16 /* All colorspace transformation functions YV12->User format */
237 : Isibaar 1.1 yv12_to_rgb555 = yv12_to_rgb555_c;
238 :     yv12_to_rgb565 = yv12_to_rgb565_c;
239 : edgomez 1.16 yv12_to_rgb24 = yv12_to_rgb24_c;
240 :     yv12_to_rgb32 = yv12_to_rgb32_c;
241 :     yv12_to_yuv = yv12_to_yuv_c;
242 :     yv12_to_yuyv = yv12_to_yuyv_c;
243 :     yv12_to_uyvy = yv12_to_uyvy_c;
244 : Isibaar 1.1
245 : edgomez 1.16 /* Functions used in motion estimation algorithms */
246 : Isibaar 1.1 calc_cbp = calc_cbp_c;
247 : edgomez 1.16 sad16 = sad16_c;
248 :     sad16bi = sad16bi_c;
249 :     sad8 = sad8_c;
250 :     dev16 = dev16_c;
251 : ia64p 1.30 Halfpel8_Refine = Halfpel8_Refine_c;
252 : Isibaar 1.1
253 :     #ifdef ARCH_X86
254 : edgomez 1.15 if ((cpu_flags & XVID_CPU_MMX) > 0) {
255 : edgomez 1.16
256 :     /* Forward and Inverse Discrete Cosine Transformation functions */
257 : Isibaar 1.1 fdct = fdct_mmx;
258 :     idct = idct_mmx;
259 :    
260 : edgomez 1.16 /* To restore FPU context after mmx use */
261 : Isibaar 1.1 emms = emms_mmx;
262 :    
263 : edgomez 1.16 /* Quantization related functions */
264 :     quant_intra = quant_intra_mmx;
265 : Isibaar 1.1 dequant_intra = dequant_intra_mmx;
266 : edgomez 1.16 quant_inter = quant_inter_mmx;
267 : Isibaar 1.1 dequant_inter = dequant_inter_mmx;
268 :    
269 : edgomez 1.16 quant4_intra = quant4_intra_mmx;
270 : Isibaar 1.1 dequant4_intra = dequant4_intra_mmx;
271 : edgomez 1.16 quant4_inter = quant4_inter_mmx;
272 : Isibaar 1.1 dequant4_inter = dequant4_inter_mmx;
273 :    
274 : edgomez 1.16 /* Block related functions */
275 : Isibaar 1.1 transfer_8to16copy = transfer_8to16copy_mmx;
276 :     transfer_16to8copy = transfer_16to8copy_mmx;
277 : edgomez 1.16 transfer_8to16sub = transfer_8to16sub_mmx;
278 : edgomez 1.22 transfer_8to16sub2 = transfer_8to16sub2_mmx;
279 : edgomez 1.16 transfer_16to8add = transfer_16to8add_mmx;
280 :     transfer8x8_copy = transfer8x8_copy_mmx;
281 : edgomez 1.22
282 : edgomez 1.16
283 :     /* Image Interpolation related functions */
284 :     interpolate8x8_halfpel_h = interpolate8x8_halfpel_h_mmx;
285 :     interpolate8x8_halfpel_v = interpolate8x8_halfpel_v_mmx;
286 : Isibaar 1.1 interpolate8x8_halfpel_hv = interpolate8x8_halfpel_hv_mmx;
287 :    
288 : edgomez 1.16 /* Image RGB->YV12 related functions */
289 : Isibaar 1.1 rgb24_to_yv12 = rgb24_to_yv12_mmx;
290 :     rgb32_to_yv12 = rgb32_to_yv12_mmx;
291 : edgomez 1.16 yuv_to_yv12 = yuv_to_yv12_mmx;
292 :     yuyv_to_yv12 = yuyv_to_yv12_mmx;
293 :     uyvy_to_yv12 = uyvy_to_yv12_mmx;
294 : Isibaar 1.1
295 : edgomez 1.16 /* Image YV12->RGB related functions */
296 : Isibaar 1.1 yv12_to_rgb24 = yv12_to_rgb24_mmx;
297 :     yv12_to_rgb32 = yv12_to_rgb32_mmx;
298 : edgomez 1.16 yv12_to_yuyv = yv12_to_yuyv_mmx;
299 :     yv12_to_uyvy = yv12_to_uyvy_mmx;
300 : Isibaar 1.1
301 : edgomez 1.16 /* Motion estimation related functions */
302 : Isibaar 1.1 calc_cbp = calc_cbp_mmx;
303 : edgomez 1.16 sad16 = sad16_mmx;
304 :     sad8 = sad8_mmx;
305 :     dev16 = dev16_mmx;
306 : Isibaar 1.1
307 :     }
308 :    
309 : edgomez 1.15 if ((cpu_flags & XVID_CPU_MMXEXT) > 0) {
310 : edgomez 1.16
311 :     /* Inverse DCT */
312 : Isibaar 1.1 idct = idct_xmm;
313 : edgomez 1.16
314 :     /* Interpolation */
315 :     interpolate8x8_halfpel_h = interpolate8x8_halfpel_h_xmm;
316 :     interpolate8x8_halfpel_v = interpolate8x8_halfpel_v_xmm;
317 : h 1.3 interpolate8x8_halfpel_hv = interpolate8x8_halfpel_hv_xmm;
318 : Isibaar 1.25
319 : chenm001 1.29 /* Quantization */
320 :     dequant_intra = dequant_intra_xmm;
321 :     dequant_inter = dequant_inter_xmm;
322 :    
323 : edgomez 1.19 /* Buffer transfer */
324 :     transfer_8to16sub2 = transfer_8to16sub2_xmm;
325 : edgomez 1.16
326 :     /* Colorspace transformation */
327 : Isibaar 1.1 yuv_to_yv12 = yuv_to_yv12_xmm;
328 :    
329 : edgomez 1.16 /* ME functions */
330 : Isibaar 1.1 sad16 = sad16_xmm;
331 : chenm001 1.29 sad16bi = sad16bi_xmm;
332 : edgomez 1.16 sad8 = sad8_xmm;
333 : Isibaar 1.1 dev16 = dev16_xmm;
334 :    
335 :     }
336 :    
337 : edgomez 1.15 if ((cpu_flags & XVID_CPU_3DNOW) > 0) {
338 : edgomez 1.16
339 :     /* Interpolation */
340 : Isibaar 1.1 interpolate8x8_halfpel_h = interpolate8x8_halfpel_h_3dn;
341 :     interpolate8x8_halfpel_v = interpolate8x8_halfpel_v_3dn;
342 : h 1.4 interpolate8x8_halfpel_hv = interpolate8x8_halfpel_hv_3dn;
343 : Isibaar 1.1 }
344 :    
345 : edgomez 1.15 if ((cpu_flags & XVID_CPU_SSE2) > 0) {
346 : Isibaar 1.14 #ifdef EXPERIMENTAL_SSE2_CODE
347 : edgomez 1.16
348 : chenm001 1.29 calc_cbp = calc_cbp_sse2;
349 :    
350 : edgomez 1.16 /* Quantization */
351 :     quant_intra = quant_intra_sse2;
352 : Isibaar 1.14 dequant_intra = dequant_intra_sse2;
353 : edgomez 1.16 quant_inter = quant_inter_sse2;
354 : Isibaar 1.14 dequant_inter = dequant_inter_sse2;
355 : h 1.13
356 : edgomez 1.16 /* ME */
357 :     sad16 = sad16_sse2;
358 :     dev16 = dev16_sse2;
359 :    
360 :     /* Forward and Inverse DCT */
361 :     idct = idct_sse2;
362 : Isibaar 1.14 fdct = fdct_sse2;
363 :     #endif
364 : h 1.12 }
365 : edgomez 1.16
366 : Isibaar 1.1 #endif
367 : Isibaar 1.18
368 :     #ifdef ARCH_IA64
369 :     if ((cpu_flags & XVID_CPU_IA64) > 0) { //use assembler routines?
370 :     idct_ia64_init();
371 :     fdct = fdct_ia64;
372 :     idct = idct_ia64; //not yet working, crashes
373 :     interpolate8x8_halfpel_h = interpolate8x8_halfpel_h_ia64;
374 :     interpolate8x8_halfpel_v = interpolate8x8_halfpel_v_ia64;
375 :     interpolate8x8_halfpel_hv = interpolate8x8_halfpel_hv_ia64;
376 :     sad16 = sad16_ia64;
377 :     sad16bi = sad16bi_ia64;
378 :     sad8 = sad8_ia64;
379 :     dev16 = dev16_ia64;
380 : ia64p 1.30 Halfpel8_Refine = Halfpel8_Refine_ia64;
381 : Isibaar 1.18 quant_intra = quant_intra_ia64;
382 :     dequant_intra = dequant_intra_ia64;
383 :     quant_inter = quant_inter_ia64;
384 :     dequant_inter = dequant_inter_ia64;
385 :     transfer_8to16copy = transfer_8to16copy_ia64;
386 :     transfer_16to8copy = transfer_16to8copy_ia64;
387 :     transfer_8to16sub = transfer_8to16sub_ia64;
388 :     transfer_8to16sub2 = transfer_8to16sub2_ia64;
389 :     transfer_16to8add = transfer_16to8add_ia64;
390 :     transfer8x8_copy = transfer8x8_copy_ia64;
391 :     DEBUG("Using IA-64 assembler routines.\n");
392 :     }
393 :     #endif
394 : edgomez 1.16
395 : canard 1.5 #ifdef ARCH_PPC
396 : canard 1.6 #ifdef ARCH_PPC_ALTIVEC
397 :     calc_cbp = calc_cbp_altivec;
398 : canard 1.7 fdct = fdct_altivec;
399 :     idct = idct_altivec;
400 : canard 1.10 sadInit = sadInit_altivec;
401 : canard 1.8 sad16 = sad16_altivec;
402 :     sad8 = sad8_altivec;
403 :     dev16 = dev16_altivec;
404 : canard 1.6 #else
405 : canard 1.5 calc_cbp = calc_cbp_ppc;
406 : canard 1.6 #endif
407 : canard 1.5 #endif
408 : Isibaar 1.1
409 :     return XVID_ERR_OK;
410 :     }
411 :    
412 : edgomez 1.16 /*****************************************************************************
413 :     * XviD Native decoder entry point
414 :     *
415 :     * This function is just a wrapper to all the option cases.
416 :     *
417 :     * Returned values : XVID_ERR_FAIL when opt is invalid
418 :     * else returns the wrapped function result
419 :     *
420 :     ****************************************************************************/
421 :    
422 : edgomez 1.15 int
423 :     xvid_decore(void *handle,
424 :     int opt,
425 :     void *param1,
426 :     void *param2)
427 : Isibaar 1.1 {
428 : edgomez 1.15 switch (opt) {
429 :     case XVID_DEC_DECODE:
430 :     return decoder_decode((DECODER *) handle, (XVID_DEC_FRAME *) param1);
431 :    
432 :     case XVID_DEC_CREATE:
433 : chenm001 1.29 return decoder_create((XVID_DEC_PARAM *) param1);
434 : edgomez 1.15
435 :     case XVID_DEC_DESTROY:
436 :     return decoder_destroy((DECODER *) handle);
437 : Isibaar 1.1
438 :     default:
439 : edgomez 1.15 return XVID_ERR_FAIL;
440 :     }
441 : Isibaar 1.1 }
442 :    
443 : edgomez 1.16
444 :     /*****************************************************************************
445 :     * XviD Native encoder entry point
446 :     *
447 :     * This function is just a wrapper to all the option cases.
448 :     *
449 :     * Returned values : XVID_ERR_FAIL when opt is invalid
450 :     * else returns the wrapped function result
451 :     *
452 :     ****************************************************************************/
453 : Isibaar 1.1
454 : edgomez 1.15 int
455 :     xvid_encore(void *handle,
456 :     int opt,
457 :     void *param1,
458 :     void *param2)
459 : Isibaar 1.1 {
460 : edgomez 1.15 switch (opt) {
461 :     case XVID_ENC_ENCODE:
462 : suxen_drol 1.20 #ifdef BFRAMES
463 :     if (((Encoder *) handle)->mbParam.max_bframes >= 0)
464 :     return encoder_encode_bframes((Encoder *) handle, (XVID_ENC_FRAME *) param1,
465 :     (XVID_ENC_STATS *) param2);
466 :     else
467 :     #endif
468 : edgomez 1.15 return encoder_encode((Encoder *) handle, (XVID_ENC_FRAME *) param1,
469 :     (XVID_ENC_STATS *) param2);
470 :    
471 :     case XVID_ENC_CREATE:
472 :     return encoder_create((XVID_ENC_PARAM *) param1);
473 :    
474 :     case XVID_ENC_DESTROY:
475 :     return encoder_destroy((Encoder *) handle);
476 : Isibaar 1.1
477 :     default:
478 : edgomez 1.15 return XVID_ERR_FAIL;
479 :     }
480 : Isibaar 1.1 }

No admin address has been configured
ViewVC Help
Powered by ViewVC 1.0.4