Diff of /xvidcore/src/xvid.c

-revision 1.33.2.21, Fri Jan  3 16:25:14 2003 UTC
+revision 1.43, Wed Feb 19 21:13:00 2003 UTC
 Line 3
   *  XVID MPEG-4 VIDEO CODEC
   *  - Native API implementation  -
   *
-  *  This program is an implementation of a part of one or more MPEG-4
-  *  Video tools as specified in ISO/IEC 14496-2 standard.  Those intending
-  *  to use this software module in hardware or software products are
-  *  advised that its use may infringe existing patents or copyrights, and
-  *  any such use would be at such party's own risk.  The original
-  *  developer of this software module and his/her company, and subsequent
-  *  editors and their companies, will have no liability for use of this
-  *  software or modifications or derivatives thereof.
-  *
   *  This program is free software ; you can redistribute it and/or modify
   *  it under the terms of the GNU General Public License as published by
   *  the Free Software Foundation ; either version 2 of the License, or
-Line 26
+Line 17
   *  along with this program ; if not, write to the Free Software
   *  Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA  02111-1307 USA
   *
-  ****************************************************************************/
- /*****************************************************************************
-  *
-  *  History
-  *
-  *      - 23.06.2002    added XVID_CPU_CHKONLY
-  *  - 17.03.2002        Added interpolate8x8_halfpel_hv_xmm
-  *  - 22.12.2001  API change: added xvid_init() - Isibaar
-  *  - 16.12.2001        inital version; (c)2001 peter ross <pross@cs.rmit.edu.au>
-  *
   *  $Id$
   *
   ****************************************************************************/
-Line 65
+Line 45
  #include "utils/timer.h"
  #include "bitstream/mbcoding.h"
- #if defined(ARCH_X86) && defined(EXPERIMENTAL_SSE2_CODE)
+ #if defined(ARCH_IS_IA32)
- #ifdef WIN32
+ #if defined(_MSC_VER)
  #include <windows.h>
  #else
  #include <signal.h>
  #include <setjmp.h>
- #endif
- #ifndef WIN32
  static jmp_buf mark;
-Line 88
+Line 64
  /*
- calls the funcptr, and returns whether SIGILL (illegal instruction) was signalled
+  * Calls the funcptr, and returns whether SIGILL (illegal instruction) was
- return values:
+  * signalled
- -1 : could not determine
+  *
- : SIGILL was *not* signalled
+  * Return values:
- : SIGILL was signalled
+  *  -1 : could not determine
+  *   0 : SIGILL was *not* signalled
+  *   1 : SIGILL was signalled
  */
  int
  sigill_check(void (*func)())
  {
- #ifdef WIN32
+ #if defined(_MSC_VER)
          _try {
                  func();
          }
-Line 132
+Line 110
  }
  #endif
+ /*
+  * Detect cpu flags.
+  *
+  * Builds the cpu capability bitmask:
+  *  - XVID_CPU_ASM is always set;
+  *  - on ARCH_IS_IA32 builds, the bits returned by check_cpu_features() are
+  *    OR-ed in, then XVID_CPU_SSE / XVID_CPU_SSE2 are cleared again whenever
+  *    sigill_check() on the matching *_os_trigger routine returns non-zero
+  *    (1 = SIGILL was signalled, -1 = could not determine);
+  *  - on ARCH_IS_PPC builds with ARCH_IS_PPC_ALTIVEC defined,
+  *    XVID_CPU_ALTIVEC is set.
+  *
+  * Returns the resulting flag mask.
+  */
+ static unsigned int
+ detect_cpu_flags()
+ {
+         /* enable native assembly optimizations by default */
+         unsigned int cpu_flags = XVID_CPU_ASM;
+ #if defined(ARCH_IS_IA32)
+         cpu_flags |= check_cpu_features();
+         if ((cpu_flags & XVID_CPU_SSE) && sigill_check(sse_os_trigger))
+                 cpu_flags &= ~XVID_CPU_SSE; /* trigger faulted or check inconclusive */
+         if ((cpu_flags & XVID_CPU_SSE2) && sigill_check(sse2_os_trigger))
+                 cpu_flags &= ~XVID_CPU_SSE2; /* trigger faulted or check inconclusive */
+ #endif /* ARCH_IS_IA32 */
+ #if defined(ARCH_IS_PPC)
+ #if defined(ARCH_IS_PPC_ALTIVEC)
+         cpu_flags |= XVID_CPU_ALTIVEC; /* selected at build time, no runtime probe here */
+ #endif /* ARCH_IS_PPC_ALTIVEC */
+ #endif /* ARCH_IS_PPC */
+         return cpu_flags;
+ }
  /*****************************************************************************
   * XviD Init Entry point
   *
-Line 165
+Line 170
          } else {
-                 cpu_flags = check_cpu_features();
+                 cpu_flags = detect_cpu_flags();
- #if defined(ARCH_X86) && defined(EXPERIMENTAL_SSE2_CODE)
-                 if ((cpu_flags & XVID_CPU_SSE) && sigill_check(sse_os_trigger))
-                         cpu_flags &= ~XVID_CPU_SSE;
-                 if ((cpu_flags & XVID_CPU_SSE2) && sigill_check(sse2_os_trigger))
-                         cpu_flags &= ~XVID_CPU_SSE2;
- #endif
          }
          if ((init_param->cpu_flags & XVID_CPU_CHKONLY))
-Line 214
+Line 211
          transfer_8to16copy = transfer_8to16copy_c;
          transfer_16to8copy = transfer_16to8copy_c;
          transfer_8to16sub  = transfer_8to16sub_c;
+         transfer_8to16subro  = transfer_8to16subro_c;
          transfer_8to16sub2 = transfer_8to16sub2_c;
          transfer_16to8add  = transfer_16to8add_c;
          transfer8x8_copy   = transfer8x8_copy_c;
-Line 241
+Line 239
          interpolate8x8_avg4 = interpolate8x8_avg4_c;
          /* reduced resolution */
          copy_upsampled_8x8_16to8 = xvid_Copy_Upsampled_8x8_16To8_C;
          add_upsampled_8x8_16to8 = xvid_Add_Upsampled_8x8_16To8_C;
- #ifdef ARCH_X86
-         vfilter_31 = xvid_VFilter_31_x86;
-         hfilter_31 = xvid_HFilter_31_x86;
- #else
          vfilter_31 = xvid_VFilter_31_C;
          hfilter_31 = xvid_HFilter_31_C;
- #endif
          filter_18x18_to_8x8 = xvid_Filter_18x18_To_8x8_C;
          filter_diff_18x18_to_8x8 = xvid_Filter_Diff_18x18_To_8x8_C;
-Line 306
+Line 298
          dev16    = dev16_c;
          sad16v   = sad16v_c;
- //      Halfpel8_Refine = Halfpel8_Refine_c;
+ /*      Halfpel8_Refine = Halfpel8_Refine_c; */
- #ifdef ARCH_X86
+ #if defined(ARCH_IS_IA32)
+         if ((cpu_flags & XVID_CPU_ASM))
+         {
+                 vfilter_31 = xvid_VFilter_31_x86;
+                 hfilter_31 = xvid_HFilter_31_x86;
+         }
          if ((cpu_flags & XVID_CPU_MMX) || (cpu_flags & XVID_CPU_MMXEXT) ||
                  (cpu_flags & XVID_CPU_3DNOW) || (cpu_flags & XVID_CPU_3DNOWEXT) ||
-Line 318
+Line 316
                  emms = emms_mmx;
          }
-         if ((cpu_flags & XVID_CPU_MMX) > 0) {
+         if ((cpu_flags & XVID_CPU_MMX)) {
                  /* Forward and Inverse Discrete Cosine Transformation functions */
                  fdct = fdct_mmx;
-Line 339
+Line 337
                  transfer_8to16copy = transfer_8to16copy_mmx;
                  transfer_16to8copy = transfer_16to8copy_mmx;
                  transfer_8to16sub  = transfer_8to16sub_mmx;
+                 transfer_8to16subro  = transfer_8to16subro_mmx;
                  transfer_8to16sub2 = transfer_8to16sub2_mmx;
                  transfer_16to8add  = transfer_16to8add_mmx;
                  transfer8x8_copy   = transfer8x8_copy_mmx;
-Line 388
+Line 387
                  sad8bi  = sad8bi_mmx;
                  dev16    = dev16_mmx;
                  sad16v   = sad16v_mmx;
          }
          /* these 3dnow functions are faster than mmx, but slower than xmm. */
-         if ((cpu_flags & XVID_CPU_3DNOW) > 0) {
+         if ((cpu_flags & XVID_CPU_3DNOW)) {
+                 emms = emms_3dn;
                  /* ME functions */
                  sad16bi = sad16bi_3dn;
 Line 403
          }
-         if ((cpu_flags & XVID_CPU_MMXEXT) > 0) {
+         if ((cpu_flags & XVID_CPU_MMXEXT)) {
                  /* Inverse DCT */
                  idct = idct_xmm;
 Line 441
                  sad16v   = sad16v_xmm;
          }
-         if ((cpu_flags & XVID_CPU_3DNOW) > 0) {
+         if ((cpu_flags & XVID_CPU_3DNOW)) {
                  /* Interpolation */
                  interpolate8x8_halfpel_h = interpolate8x8_halfpel_h_3dn;
 Line 449
                  interpolate8x8_halfpel_hv = interpolate8x8_halfpel_hv_3dn;
          }
-         if ((cpu_flags & XVID_CPU_3DNOWEXT) > 0) {
+         if ((cpu_flags & XVID_CPU_3DNOWEXT)) {
                  /* Inverse DCT */
                  idct =  idct_3dne;
 Line 458
                  transfer_8to16copy =  transfer_8to16copy_3dne;
                  transfer_16to8copy = transfer_16to8copy_3dne;
                  transfer_8to16sub =  transfer_8to16sub_3dne;
+                 transfer_8to16subro =  transfer_8to16subro_3dne;
                  transfer_8to16sub2 =  transfer_8to16sub2_3dne;
                  transfer_16to8add = transfer_16to8add_3dne;
                  transfer8x8_copy = transfer8x8_copy_3dne;
-Line 485
+Line 486
          }
-         if ((cpu_flags & XVID_CPU_SSE2) > 0) {
+         if ((cpu_flags & XVID_CPU_SSE2)) {
- #ifdef EXPERIMENTAL_SSE2_CODE
                  calc_cbp = calc_cbp_sse2;
 Line 496
                  quant_inter   = quant_inter_sse2;
                  dequant_inter = dequant_inter_sse2;
-                 /* ME */
+ #if defined(EXPERIMENTAL_SSE2_CODE)
+                 /* ME; slower than xmm */
                  sad16    = sad16_sse2;
                  dev16    = dev16_sse2;
+ #endif
                  /* Forward and Inverse DCT */
                  idct  = idct_sse2;
                  fdct = fdct_sse2;
- #endif
          }
  #endif
- #ifdef ARCH_IA64
+ #if defined(ARCH_IS_IA64)
-         if ((cpu_flags & XVID_CPU_IA64) > 0) { //use assembler routines?
+         if ((cpu_flags & XVID_CPU_ASM)) { /* use assembler routines? */
            idct_ia64_init();
            fdct = fdct_ia64;
-           idct = idct_ia64;   //not yet working, crashes
+           idct = idct_ia64;   /*not yet working, crashes */
            interpolate8x8_halfpel_h = interpolate8x8_halfpel_h_ia64;
            interpolate8x8_halfpel_v = interpolate8x8_halfpel_v_ia64;
            interpolate8x8_halfpel_hv = interpolate8x8_halfpel_hv_ia64;
-Line 520
+Line 519
            sad16bi = sad16bi_ia64;
            sad8 = sad8_ia64;
            dev16 = dev16_ia64;
- //        Halfpel8_Refine = Halfpel8_Refine_ia64;
+ /*        Halfpel8_Refine = Halfpel8_Refine_ia64; */
            quant_intra = quant_intra_ia64;
            dequant_intra = dequant_intra_ia64;
            quant_inter = quant_inter_ia64;
-Line 531
+Line 530
            transfer_8to16sub2 = transfer_8to16sub2_ia64;
            transfer_16to8add = transfer_16to8add_ia64;
            transfer8x8_copy = transfer8x8_copy_ia64;
-           DEBUG("Using IA-64 assembler routines.\n");
+           DPRINTF(DPRINTF_DEBUG, "Using IA-64 assembler routines.");
          }
  #endif
- #ifdef ARCH_PPC
+ #if defined(ARCH_IS_PPC)
- #ifdef ARCH_PPC_ALTIVEC
+         if ((cpu_flags & XVID_CPU_ASM))
+         {
+                 calc_cbp = calc_cbp_ppc;
+         }
+         if ((cpu_flags & XVID_CPU_ALTIVEC))
+         {
          calc_cbp = calc_cbp_altivec;
          fdct = fdct_altivec;
          idct = idct_altivec;
-Line 544
+Line 549
          sad16 = sad16_altivec;
          sad8 = sad8_altivec;
          dev16 = dev16_altivec;
- #else
+         }
-         calc_cbp = calc_cbp_ppc;
- #endif
  #endif
          return XVID_ERR_OK;
-Line 557
+Line 560
  static int
  xvid_init_convert(XVID_INIT_CONVERTINFO* convert)
  {
-         // const int flip1 = (convert->input.colorspace & XVID_CSP_VFLIP) ^ (convert->output.colorspace & XVID_CSP_VFLIP);
+ /*
+         const int flip1 =
+                 (convert->input.colorspace & XVID_CSP_VFLIP) ^
+                 (convert->output.colorspace & XVID_CSP_VFLIP);
+ */
          const int width = convert->width;
          const int height = convert->height;
          const int width2 = convert->width/2;
-Line 643
+Line 650
  #define TEST_FDCT  (TEST_FORWARD)
  #define TEST_IDCT  (0)
- int test_transform(void * funcA, void * funcB, const char * nameB,
+ static int test_transform(void * funcA, void * funcB, const char * nameB,
                                     int test, int flags)
  {
          int i;
-Line 723
+Line 730
  #define TEST_DEQUANT_INTRA      (TEST_INTRA)
  #define TEST_DEQUANT_INTER      (0)
- int test_quant(void * funcA, void * funcB, const char * nameB,
+ static int test_quant(void * funcA, void * funcB, const char * nameB,
                             int test, int flags)
  {
          int q,i;
          int64_t timeSTART;
          int64_t timeA = 0;
          int64_t timeB = 0;
-         int retA, retB;
+         int retA = 0, retB = 0;
          DECLARE_ALIGNED_MATRIX(arrayX, 1, 64, int16_t, CACHE_LINE);
          DECLARE_ALIGNED_MATRIX(arrayA, 1, 64, int16_t, CACHE_LINE);
          DECLARE_ALIGNED_MATRIX(arrayB, 1, 64, int16_t, CACHE_LINE);
-Line 810
+Line 817
          printf("xvid_init_test\n");
- #if defined(ARCH_X86)
+ #if defined(ARCH_IS_IA32)
-         cpu_flags = check_cpu_features();
+         cpu_flags = detect_cpu_flags();
          idct_int32_init();
          emms_mmx();

 Legend:
-Removed from v.1.33.2.21
 changed lines (shown as a removed line followed by its added replacement)
+Added in v.1.43

No admin address has been configured	ViewVC Help
Powered by ViewVC 1.0.4