[cvs] / xvidcore / src / xvid.c Repository:
ViewVC logotype

Diff of /xvidcore/src/xvid.c

Parent Directory Parent Directory | Revision Log Revision Log | View Patch Patch

revision 1.68, Sat Feb 25 04:41:12 2006 UTC revision 1.80, Mon Dec 1 15:06:48 2008 UTC
# Line 28  Line 28 
28  #include <string.h>  #include <string.h>
29  #include <time.h>  #include <time.h>
30    
31    #if !defined(_WIN32)
32    #include <unistd.h>
33    #endif
34    
35  #include "xvid.h"  #include "xvid.h"
36  #include "decoder.h"  #include "decoder.h"
37  #include "encoder.h"  #include "encoder.h"
# Line 40  Line 44 
44  #include "utils/mbfunctions.h"  #include "utils/mbfunctions.h"
45  #include "quant/quant.h"  #include "quant/quant.h"
46  #include "motion/motion.h"  #include "motion/motion.h"
47    #include "motion/gmc.h"
48  #include "motion/sad.h"  #include "motion/sad.h"
49  #include "utils/emms.h"  #include "utils/emms.h"
50  #include "utils/timer.h"  #include "utils/timer.h"
# Line 136  Line 141 
141          if ((cpu_flags & XVID_CPU_SSE) && sigill_check(sse_os_trigger))          if ((cpu_flags & XVID_CPU_SSE) && sigill_check(sse_os_trigger))
142                  cpu_flags &= ~XVID_CPU_SSE;                  cpu_flags &= ~XVID_CPU_SSE;
143    
144          if ((cpu_flags & XVID_CPU_SSE2) && sigill_check(sse2_os_trigger))          if ((cpu_flags & (XVID_CPU_SSE2|XVID_CPU_SSE3|XVID_CPU_SSE41)) && sigill_check(sse2_os_trigger))
145                  cpu_flags &= ~XVID_CPU_SSE2;                  cpu_flags &= ~(XVID_CPU_SSE2|XVID_CPU_SSE3|XVID_CPU_SSE41);
146  #endif  #endif
147    
148  #if defined(ARCH_IS_PPC)  #if defined(ARCH_IS_PPC)
# Line 256  Line 261 
261          yv12_to_yv12    = yv12_to_yv12_c;          yv12_to_yv12    = yv12_to_yv12_c;
262          rgb555_to_yv12  = rgb555_to_yv12_c;          rgb555_to_yv12  = rgb555_to_yv12_c;
263          rgb565_to_yv12  = rgb565_to_yv12_c;          rgb565_to_yv12  = rgb565_to_yv12_c;
264            rgb_to_yv12     = rgb_to_yv12_c;
265          bgr_to_yv12     = bgr_to_yv12_c;          bgr_to_yv12     = bgr_to_yv12_c;
266          bgra_to_yv12    = bgra_to_yv12_c;          bgra_to_yv12    = bgra_to_yv12_c;
267          abgr_to_yv12    = abgr_to_yv12_c;          abgr_to_yv12    = abgr_to_yv12_c;
# Line 277  Line 283 
283          /* All colorspace transformation functions YV12->User format */          /* All colorspace transformation functions YV12->User format */
284          yv12_to_rgb555  = yv12_to_rgb555_c;          yv12_to_rgb555  = yv12_to_rgb555_c;
285          yv12_to_rgb565  = yv12_to_rgb565_c;          yv12_to_rgb565  = yv12_to_rgb565_c;
286            yv12_to_rgb     = yv12_to_rgb_c;
287          yv12_to_bgr     = yv12_to_bgr_c;          yv12_to_bgr     = yv12_to_bgr_c;
288          yv12_to_bgra    = yv12_to_bgra_c;          yv12_to_bgra    = yv12_to_bgra_c;
289          yv12_to_abgr    = yv12_to_abgr_c;          yv12_to_abgr    = yv12_to_abgr_c;
# Line 306  Line 313 
313          sse8_16bit = sse8_16bit_c;          sse8_16bit = sse8_16bit_c;
314          sse8_8bit  = sse8_8bit_c;          sse8_8bit  = sse8_8bit_c;
315    
316  #if defined(ARCH_IS_IA32)          init_GMC(cpu_flags);
317    
318    #if defined(ARCH_IS_IA32) || defined(ARCH_IS_X86_64)
319    
320          if ((cpu_flags & XVID_CPU_MMX) || (cpu_flags & XVID_CPU_MMXEXT) ||          if ((cpu_flags & XVID_CPU_MMX) || (cpu_flags & XVID_CPU_MMXEXT) ||
321                  (cpu_flags & XVID_CPU_3DNOW) || (cpu_flags & XVID_CPU_3DNOWEXT) ||                  (cpu_flags & XVID_CPU_3DNOW) || (cpu_flags & XVID_CPU_3DNOWEXT) ||
322                  (cpu_flags & XVID_CPU_SSE) || (cpu_flags & XVID_CPU_SSE2))                  (cpu_flags & XVID_CPU_SSE) || (cpu_flags & XVID_CPU_SSE2) ||
323            (cpu_flags & XVID_CPU_SSE3) || (cpu_flags & XVID_CPU_SSE41))
324          {          {
325                  /* Restore FPU context : emms_c is a nop functions */                  /* Restore FPU context : emms_c is a nop functions */
326                  emms = emms_mmx;                  emms = emms_mmx;
# Line 331  Line 341 
341                  quant_h263_inter   = quant_h263_inter_mmx;                  quant_h263_inter   = quant_h263_inter_mmx;
342                  dequant_h263_intra = dequant_h263_intra_mmx;                  dequant_h263_intra = dequant_h263_intra_mmx;
343                  dequant_h263_inter = dequant_h263_inter_mmx;                  dequant_h263_inter = dequant_h263_inter_mmx;
   
344                  quant_mpeg_intra   = quant_mpeg_intra_mmx;                  quant_mpeg_intra   = quant_mpeg_intra_mmx;
345                  quant_mpeg_inter   = quant_mpeg_inter_mmx;                  quant_mpeg_inter   = quant_mpeg_inter_mmx;
346                  dequant_mpeg_intra = dequant_mpeg_intra_mmx;                  dequant_mpeg_intra = dequant_mpeg_intra_mmx;
347                  dequant_mpeg_inter = dequant_mpeg_inter_mmx;                  dequant_mpeg_inter = dequant_mpeg_inter_mmx;
348    
349    
350                  /* Block related functions */                  /* Block related functions */
351                  transfer_8to16copy = transfer_8to16copy_mmx;                  transfer_8to16copy = transfer_8to16copy_mmx;
352                  transfer_16to8copy = transfer_16to8copy_mmx;                  transfer_16to8copy = transfer_16to8copy_mmx;
# Line 374  Line 384 
384                  image_brightness = image_brightness_mmx;                  image_brightness = image_brightness_mmx;
385    
386                  /* image input xxx_to_yv12 related functions */                  /* image input xxx_to_yv12 related functions */
387    
388                  yv12_to_yv12  = yv12_to_yv12_mmx;                  yv12_to_yv12  = yv12_to_yv12_mmx;
389    
390                  bgr_to_yv12   = bgr_to_yv12_mmx;                  bgr_to_yv12   = bgr_to_yv12_mmx;
391                    rgb_to_yv12   = rgb_to_yv12_mmx;
392                  bgra_to_yv12  = bgra_to_yv12_mmx;                  bgra_to_yv12  = bgra_to_yv12_mmx;
393                    rgba_to_yv12  = rgba_to_yv12_mmx;
394                  yuyv_to_yv12  = yuyv_to_yv12_mmx;                  yuyv_to_yv12  = yuyv_to_yv12_mmx;
395                  uyvy_to_yv12  = uyvy_to_yv12_mmx;                  uyvy_to_yv12  = uyvy_to_yv12_mmx;
396    
# Line 412  Line 426 
426    
427                  yuyv_to_yv12  = yuyv_to_yv12_3dn;                  yuyv_to_yv12  = yuyv_to_yv12_3dn;
428                  uyvy_to_yv12  = uyvy_to_yv12_3dn;                  uyvy_to_yv12  = uyvy_to_yv12_3dn;
429    
430          }          }
431    
432    
# Line 436  Line 451 
451                  interpolate8x8_halfpel_hv_add = interpolate8x8_halfpel_hv_add_xmm;                  interpolate8x8_halfpel_hv_add = interpolate8x8_halfpel_hv_add_xmm;
452    
453                  /* Quantization */                  /* Quantization */
                 quant_mpeg_intra = quant_mpeg_intra_xmm;  
454                  quant_mpeg_inter = quant_mpeg_inter_xmm;                  quant_mpeg_inter = quant_mpeg_inter_xmm;
455    
456                  dequant_h263_intra = dequant_h263_intra_xmm;                  dequant_h263_intra = dequant_h263_intra_xmm;
# Line 447  Line 461 
461                  transfer_8to16sub2ro = transfer_8to16sub2ro_xmm;                  transfer_8to16sub2ro = transfer_8to16sub2ro_xmm;
462    
463                  /* Colorspace transformation */                  /* Colorspace transformation */
464                  yv12_to_yv12  = yv12_to_yv12_xmm;                  /* yv12_to_yv12  = yv12_to_yv12_xmm; */ /* appears to be slow on many machines */
465                  yuyv_to_yv12  = yuyv_to_yv12_xmm;                  yuyv_to_yv12  = yuyv_to_yv12_xmm;
466                  uyvy_to_yv12  = uyvy_to_yv12_xmm;                  uyvy_to_yv12  = uyvy_to_yv12_xmm;
467    
# Line 508  Line 522 
522                          dequant_h263_inter = dequant_h263_inter_3dne;                          dequant_h263_inter = dequant_h263_inter_3dne;
523    
524                          /* ME functions */                          /* ME functions */
                         calc_cbp = calc_cbp_3dne;  
   
525                          sad16 = sad16_3dne;                          sad16 = sad16_3dne;
526                          sad8 = sad8_3dne;                          sad8 = sad8_3dne;
527                          sad16bi = sad16bi_3dne;                          sad16bi = sad16bi_3dne;
# Line 534  Line 546 
546    
547                  /* DCT operators */                  /* DCT operators */
548                  fdct = fdct_sse2_skal;                  fdct = fdct_sse2_skal;
549      /* idct = idct_sse2_skal; */   /* Is now IEEE1180 and Walken compliant. Disabled until fully tested. */                  idct = idct_sse2_skal;   /* Is now IEEE1180 and Walken compliant. */
550    
551                  /* postprocessing */                  /* postprocessing */
552                  image_brightness = image_brightness_sse2;                  image_brightness = image_brightness_sse2;
553    
554            }
555    
556            if ((cpu_flags & XVID_CPU_SSE3)) {
557    
558                    /* SAD operators */
559                    sad16    = sad16_sse3;
560                    dev16    = dev16_sse3;
561          }          }
562    
563  #endif /* ARCH_IS_IA32 */  #endif /* ARCH_IS_IA32 */
564    
565  #if defined(ARCH_IS_IA64)  #if defined(ARCH_IS_IA64)
# Line 629  Line 650 
650          }          }
651  #endif  #endif
652    
 #if defined(ARCH_IS_X86_64)  
         /* For now, only XVID_CPU_ASM is looked for, so user can still  
          * disable asm usage the usual way. When Intel EMT64 cpus will  
          * be out, maybe we'll have to check more precisely what cpu  
          * features there really are. */  
         if (cpu_flags & XVID_CPU_ASM) {  
                 /* SIMD state flusher */  
                 emms = emms_mmx;  
   
                 /* DCT operators */  
                 fdct = fdct_skal_x86_64;  
                 idct = idct_x86_64;  
   
                 /* SAD operators */  
                 sad16      = sad16_x86_64;  
                 sad8       = sad8_x86_64;  
                 sad16bi    = sad16bi_x86_64;  
                 sad8bi     = sad8bi_x86_64;  
                 dev16      = dev16_x86_64;  
                 sad16v     = sad16v_x86_64;  
                 sse8_16bit = sse8_16bit_x86_64;  
                 sse8_8bit  = sse8_8bit_x86_64;  
   
                 /* Interpolation operators */  
                 interpolate8x8_halfpel_h  = interpolate8x8_halfpel_h_x86_64;  
                 interpolate8x8_halfpel_v  = interpolate8x8_halfpel_v_x86_64;  
                 interpolate8x8_halfpel_hv = interpolate8x8_halfpel_hv_x86_64;  
   
                 interpolate8x8_halfpel_add = interpolate8x8_halfpel_add_x86_64;  
                 interpolate8x8_halfpel_h_add = interpolate8x8_halfpel_h_add_x86_64;  
                 interpolate8x8_halfpel_v_add = interpolate8x8_halfpel_v_add_x86_64;  
                 interpolate8x8_halfpel_hv_add = interpolate8x8_halfpel_hv_add_x86_64;  
   
                 interpolate8x8_6tap_lowpass_h = interpolate8x8_6tap_lowpass_h_x86_64;  
                 interpolate8x8_6tap_lowpass_v = interpolate8x8_6tap_lowpass_v_x86_64;  
   
                 interpolate8x8_avg2 = interpolate8x8_avg2_x86_64;  
                 interpolate8x8_avg4 = interpolate8x8_avg4_x86_64;  
   
                 /* Quantization related functions */  
                 quant_h263_intra   = quant_h263_intra_x86_64;  
                 quant_h263_inter   = quant_h263_inter_x86_64;  
                 dequant_h263_intra = dequant_h263_intra_x86_64;  
                 dequant_h263_inter = dequant_h263_inter_x86_64;  
                 quant_mpeg_intra   = quant_mpeg_intra_x86_64;  
                 quant_mpeg_inter   = quant_mpeg_inter_x86_64;  
                 dequant_mpeg_intra   = dequant_mpeg_intra_x86_64;  
                 dequant_mpeg_inter   = dequant_mpeg_inter_x86_64;  
   
                 /* Block related functions */  
                 transfer_8to16copy  = transfer_8to16copy_x86_64;  
                 transfer_16to8copy  = transfer_16to8copy_x86_64;  
                 transfer_8to16sub   = transfer_8to16sub_x86_64;  
                 transfer_8to16subro = transfer_8to16subro_x86_64;  
                 transfer_8to16sub2  = transfer_8to16sub2_x86_64;  
                 transfer_8to16sub2ro= transfer_8to16sub2ro_x86_64;  
                 transfer_16to8add   = transfer_16to8add_x86_64;  
                 transfer8x8_copy    = transfer8x8_copy_x86_64;  
   
                 /* Qpel stuff */  
                 xvid_QP_Funcs = &xvid_QP_Funcs_x86_64;  
                 xvid_QP_Add_Funcs = &xvid_QP_Add_Funcs_x86_64;  
   
                 /* Interlacing Functions */  
                 MBFieldTest = MBFieldTest_x86_64;  
         }  
 #endif  
   
653  #if defined(_DEBUG)  #if defined(_DEBUG)
654      xvid_debug = init->debug;      xvid_debug = init->debug;
655  #endif  #endif
# Line 712  Line 665 
665                  return XVID_ERR_VERSION;                  return XVID_ERR_VERSION;
666    
667          info->actual_version = XVID_VERSION;          info->actual_version = XVID_VERSION;
668          info->build = "xvid-1.2.0-dev";          info->build = "xvid-1.3.0-dev";
669          info->cpu_flags = detect_cpu_flags();          info->cpu_flags = detect_cpu_flags();
670    info->num_threads = 0;    info->num_threads = 0;
671    
672  #if defined(WIN32)  #if defined(_WIN32)
673    
674    {    {
675      DWORD dwProcessAffinityMask, dwSystemAffinityMask;          SYSTEM_INFO siSysInfo;
676      if (GetProcessAffinityMask(GetCurrentProcess(), &dwProcessAffinityMask, &dwSystemAffinityMask)) {          GetSystemInfo(&siSysInfo);
677        int i;          info->num_threads = siSysInfo.dwNumberOfProcessors; /* number of _logical_ cores */
       for(i=0; i<32; i++) {  
         if ((dwProcessAffinityMask & (1<<i)))  
           info->num_threads++;  
       }  
     }  
678    }    }
679    
680    #else
681    
682      info->num_threads = sysconf(_SC_NPROCESSORS_CONF);
683    
684  #endif  #endif
685    
686          return 0;          return 0;

Legend:
Removed from v.1.68  
changed lines
  Added in v.1.80

No admin address has been configured
ViewVC Help
Powered by ViewVC 1.0.4