[cvs] / xvidcore / src / image / qpel.h Repository:
ViewVC logotype

Diff of /xvidcore/src/image/qpel.h

Parent Directory Parent Directory | Revision Log Revision Log | View Patch Patch

revision 1.1.2.1, Sat May 3 23:26:35 2003 UTC revision 1.6, Wed Jan 5 23:02:15 2005 UTC
# Line 3  Line 3 
3  *  XVID MPEG-4 VIDEO CODEC  *  XVID MPEG-4 VIDEO CODEC
4  *  - QPel interpolation -  *  - QPel interpolation -
5  *  *
6     *  Copyright(C) 2003 Pascal Massimino <skal@planet-d.net>
7     *
8  *  This program is free software ; you can redistribute it and/or modify  *  This program is free software ; you can redistribute it and/or modify
9  *  it under the terms of the GNU General Public License as published by  *  it under the terms of the GNU General Public License as published by
10  *  the Free Software Foundation ; either version 2 of the License, or  *  the Free Software Foundation ; either version 2 of the License, or
# Line 17  Line 19 
19  *  along with this program ; if not, write to the Free Software  *  along with this program ; if not, write to the Free Software
20  *  Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA  02111-1307 USA  *  Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA  02111-1307 USA
21  *  *
22  *****************************************************************************/   * $Id$
   
 /**************************************************************************  
  *  
  *      History:  
23   *   *
24   *  22.10.2002  initial coding  - Skal -   ****************************************************************************/
  *  
  *************************************************************************/  
25    
26  #ifndef _XVID_QPEL_H_  #ifndef _XVID_QPEL_H_
27  #define _XVID_QPEL_H_  #define _XVID_QPEL_H_
28    
29    #include "interpolate8x8.h"
30  #include "../utils/mem_transfer.h"  #include "../utils/mem_transfer.h"
31    
32  /*****************************************************************************  /*****************************************************************************
# Line 41  Line 38 
38    
39  typedef  XVID_QP_PASS_SIGNATURE(XVID_QP_PASS);  typedef  XVID_QP_PASS_SIGNATURE(XVID_QP_PASS);
40    
41      // We put everything in a single struct so it can easily be passed  /* We put everything in a single struct so it can easily be passed
42      // to prediction functions as a whole...   * to prediction functions as a whole... */
43    
44  struct XVID_QP_FUNCS {  typedef struct _XVID_QP_FUNCS {
45    
46      // filter for QPel 16x? prediction          /* filter for QPel 16x? prediction */
47    
48    XVID_QP_PASS *H_Pass;    XVID_QP_PASS *H_Pass;
49    XVID_QP_PASS *H_Pass_Avrg;    XVID_QP_PASS *H_Pass_Avrg;
# Line 55  Line 52 
52    XVID_QP_PASS *V_Pass_Avrg;    XVID_QP_PASS *V_Pass_Avrg;
53    XVID_QP_PASS *V_Pass_Avrg_Up;    XVID_QP_PASS *V_Pass_Avrg_Up;
54    
55      // filter for QPel 8x? prediction      /* filter for QPel 8x? prediction */
56    
57    XVID_QP_PASS *H_Pass_8;    XVID_QP_PASS *H_Pass_8;
58    XVID_QP_PASS *H_Pass_Avrg_8;    XVID_QP_PASS *H_Pass_Avrg_8;
# Line 63  Line 60 
60    XVID_QP_PASS *V_Pass_8;    XVID_QP_PASS *V_Pass_8;
61    XVID_QP_PASS *V_Pass_Avrg_8;    XVID_QP_PASS *V_Pass_Avrg_8;
62    XVID_QP_PASS *V_Pass_Avrg_Up_8;    XVID_QP_PASS *V_Pass_Avrg_Up_8;
63  };  } XVID_QP_FUNCS;
 typedef struct XVID_QP_FUNCS  XVID_QP_FUNCS;  
64    
65  /*****************************************************************************  /*****************************************************************************
66   * fwd dcl   * fwd dcl
67   ****************************************************************************/   ****************************************************************************/
68    extern void xvid_Init_QP();
69    
70    extern XVID_QP_FUNCS xvid_QP_Funcs_C_ref;       /* for P-frames */
71    extern XVID_QP_FUNCS xvid_QP_Add_Funcs_C_ref;   /* for B-frames */
72    
73  extern XVID_QP_FUNCS xvid_QP_Funcs_C;       // for P-frames  extern XVID_QP_FUNCS xvid_QP_Funcs_C;       /* for P-frames */
74  extern XVID_QP_FUNCS xvid_QP_Add_Funcs_C;   // for B-frames  extern XVID_QP_FUNCS xvid_QP_Add_Funcs_C;   /* for B-frames */
75    
76    #ifdef ARCH_IS_IA32
77  extern XVID_QP_FUNCS xvid_QP_Funcs_mmx;  extern XVID_QP_FUNCS xvid_QP_Funcs_mmx;
78  extern XVID_QP_FUNCS xvid_QP_Add_Funcs_mmx;  extern XVID_QP_FUNCS xvid_QP_Add_Funcs_mmx;
79  extern void xvid_Init_QP_mmx(); // should be called at mmx initialization  #endif
80    
81  extern XVID_QP_FUNCS *xvid_QP_Funcs;      // <- main pointer for enc/dec structure  #ifdef ARCH_IS_PPC
82  extern XVID_QP_FUNCS *xvid_QP_Add_Funcs;  // <- main pointer for enc/dec structure  extern XVID_QP_FUNCS xvid_QP_Funcs_Altivec_C;
83    extern XVID_QP_FUNCS xvid_QP_Add_Funcs_Altivec_C;
84    #endif
85    
86    #ifdef ARCH_IS_X86_64
87    extern XVID_QP_FUNCS xvid_QP_Funcs_x86_64;
88    extern XVID_QP_FUNCS xvid_QP_Add_Funcs_x86_64;
89    #endif
90    
91    extern XVID_QP_FUNCS *xvid_QP_Funcs;      /* <- main pointer for enc/dec structure */
92    extern XVID_QP_FUNCS *xvid_QP_Add_Funcs;  /* <- main pointer for enc/dec structure */
93    
94  /*****************************************************************************  /*****************************************************************************
95   * macros   * macros
# Line 100  Line 111 
111    
112   ****************************************************************************/   ****************************************************************************/
113    
114  static __inline void new_interpolate16x16_quarterpel(  static void __inline
115      uint8_t * const cur,  interpolate16x16_quarterpel(uint8_t * const cur,
116      uint8_t * const refn,      uint8_t * const refn,
117                  uint8_t * const refh,                  uint8_t * const refh,
118                  uint8_t * const refv,                  uint8_t * const refv,
# Line 119  Line 130 
130    
131          int32_t x_int, y_int;          int32_t x_int, y_int;
132    
133    const int32_t xRef = x*4 + dx;          const int32_t xRef = (int)x*4 + dx;
134    const int32_t yRef = y*4 + dy;          const int32_t yRef = (int)y*4 + dy;
135    
136       Ops = xvid_QP_Funcs; // TODO: pass as argument          Ops = xvid_QP_Funcs;
137       quads = (dx&3) | ((dy&3)<<2);       quads = (dx&3) | ((dy&3)<<2);
138    
139    x_int = xRef/4;    x_int = xRef/4;
# Line 134  Line 145 
145     y_int--;     y_int--;
146    
147      dst = cur + y * stride + x;      dst = cur + y * stride + x;
148          src = refn + y_int * stride + x_int;          src = refn + y_int * (int)stride + x_int;
149    
150    tmp = refh; // we need at least a 16 x stride scratch block          tmp = refh; /* we need at least a 16 x stride scratch block */
151    
152    switch(quads) {    switch(quads) {
153      case 0:      case 0:
# Line 202  Line 213 
213    }    }
214  }  }
215    
216  static __inline void new_interpolate16x8_quarterpel(  static void __inline
217      uint8_t * const cur,  interpolate16x16_add_quarterpel(uint8_t * const cur,
218      uint8_t * const refn,      uint8_t * const refn,
219                  uint8_t * const refh,                  uint8_t * const refh,
220                  uint8_t * const refv,                  uint8_t * const refv,
# Line 218  Line 229 
229          uint8_t *tmp;          uint8_t *tmp;
230          int32_t quads;          int32_t quads;
231          const XVID_QP_FUNCS *Ops;          const XVID_QP_FUNCS *Ops;
232            const XVID_QP_FUNCS *Ops_Copy;
233    
234          int32_t x_int, y_int;          int32_t x_int, y_int;
235    
236    const int32_t xRef = x*4 + dx;          const int32_t xRef = (int)x*4 + dx;
237    const int32_t yRef = y*4 + dy;          const int32_t yRef = (int)y*4 + dy;
238    
239       Ops = xvid_QP_Funcs; // TODO: pass as argument          Ops = xvid_QP_Add_Funcs;
240            Ops_Copy = xvid_QP_Funcs;
241       quads = (dx&3) | ((dy&3)<<2);       quads = (dx&3) | ((dy&3)<<2);
242    
243    x_int = xRef/4;    x_int = xRef/4;
# Line 236  Line 249 
249     y_int--;     y_int--;
250    
251      dst = cur + y * stride + x;      dst = cur + y * stride + x;
252          src = refn + y_int * stride + x_int;          src = refn + y_int * (int)stride + x_int;
253    
254    tmp = refh; // we need at least a 16 x stride scratch block          tmp = refh; /* we need at least a 16 x stride scratch block */
255    
256            switch(quads) {
257            case 0:
L258                    /* NB: there is no halfpel involved! the function's name can be
L259                     *     misleading */
260                    interpolate8x8_halfpel_add(dst, src, stride, rounding);
261                    interpolate8x8_halfpel_add(dst+8, src+8, stride, rounding);
262                    interpolate8x8_halfpel_add(dst+8*stride, src+8*stride, stride, rounding);
263                    interpolate8x8_halfpel_add(dst+8*stride+8, src+8*stride+8, stride, rounding);
264                    break;
265            case 1:
266                    Ops->H_Pass_Avrg(dst, src, 16, stride, rounding);
267                    break;
268            case 2:
269                    Ops->H_Pass(dst, src, 16, stride, rounding);
270                    break;
271            case 3:
272                    Ops->H_Pass_Avrg_Up(dst, src, 16, stride, rounding);
273                    break;
274            case 4:
275                    Ops->V_Pass_Avrg(dst, src, 16, stride, rounding);
276                    break;
277            case 5:
278                    Ops_Copy->H_Pass_Avrg(tmp, src, 17, stride, rounding);
279                    Ops->V_Pass_Avrg(dst, tmp, 16, stride, rounding);
280                    break;
281            case 6:
282                    Ops_Copy->H_Pass(tmp, src,        17, stride, rounding);
283                    Ops->V_Pass_Avrg(dst, tmp, 16, stride, rounding);
284                    break;
285            case 7:
286                    Ops_Copy->H_Pass_Avrg_Up(tmp, src, 17, stride, rounding);
287                    Ops->V_Pass_Avrg(dst, tmp, 16, stride, rounding);
288                    break;
289            case 8:
290                    Ops->V_Pass(dst, src, 16, stride, rounding);
291                    break;
292            case 9:
293                    Ops_Copy->H_Pass_Avrg(tmp, src, 17, stride, rounding);
294                    Ops->V_Pass(dst, tmp, 16, stride, rounding);
295                    break;
296            case 10:
297                    Ops_Copy->H_Pass(tmp, src, 17, stride, rounding);
298                    Ops->V_Pass(dst, tmp, 16, stride, rounding);
299                    break;
300            case 11:
301                    Ops_Copy->H_Pass_Avrg_Up(tmp, src, 17, stride, rounding);
302                    Ops->V_Pass(dst, tmp, 16, stride, rounding);
303                    break;
304            case 12:
305                    Ops->V_Pass_Avrg_Up(dst, src, 16, stride, rounding);
306                    break;
307            case 13:
308                    Ops_Copy->H_Pass_Avrg(tmp, src, 17, stride, rounding);
309                    Ops->V_Pass_Avrg_Up(dst, tmp, 16, stride, rounding);
310                    break;
311            case 14:
312                    Ops_Copy->H_Pass(tmp, src, 17, stride, rounding);
313                    Ops->V_Pass_Avrg_Up( dst, tmp, 16, stride, rounding);
314                    break;
315            case 15:
316                    Ops_Copy->H_Pass_Avrg_Up(tmp, src, 17, stride, rounding);
317                    Ops->V_Pass_Avrg_Up(dst, tmp, 16, stride, rounding);
318                    break;
319            }
320    }
321    
322    static void __inline
323    interpolate16x8_quarterpel(uint8_t * const cur,
324                                                               uint8_t * const refn,
325                                                               uint8_t * const refh,
326                                                               uint8_t * const refv,
327                                                               uint8_t * const refhv,
328                                                               const uint32_t x, const uint32_t y,
329                                                               const int32_t dx,  const int dy,
330                                                               const uint32_t stride,
331                                                               const uint32_t rounding)
332    {
333            const uint8_t *src;
334            uint8_t *dst;
335            uint8_t *tmp;
336            int32_t quads;
337            const XVID_QP_FUNCS *Ops;
338    
339            int32_t x_int, y_int;
340    
341            const int32_t xRef = (int)x*4 + dx;
342            const int32_t yRef = (int)y*4 + dy;
343    
344            Ops = xvid_QP_Funcs;
345            quads = (dx&3) | ((dy&3)<<2);
346    
347            x_int = xRef/4;
348            if (xRef < 0 && xRef % 4)
349                    x_int--;
350    
351            y_int    = yRef/4;
352            if (yRef < 0 && yRef % 4)
353                    y_int--;
354    
355            dst = cur + y * stride + x;
356            src = refn + y_int * (int)stride + x_int;
357    
358            tmp = refh; /* we need at least a 16 x stride scratch block */
359    
360    switch(quads) {    switch(quads) {
361      case 0:      case 0:
# Line 302  Line 419 
419    }    }
420  }  }
421    
422  static __inline void new_interpolate8x8_quarterpel(  static void __inline
423      uint8_t * const cur,  interpolate8x8_quarterpel(uint8_t * const cur,
424      uint8_t * const refn,      uint8_t * const refn,
425                  uint8_t * const refh,                  uint8_t * const refh,
426                  uint8_t * const refv,                  uint8_t * const refv,
# Line 321  Line 438 
438    
439          int32_t x_int, y_int;          int32_t x_int, y_int;
440    
441    const int32_t xRef = x*4 + dx;          const int32_t xRef = (int)x*4 + dx;
442    const int32_t yRef = y*4 + dy;          const int32_t yRef = (int)y*4 + dy;
443    
444       Ops = xvid_QP_Funcs; // TODO: pass as argument          Ops = xvid_QP_Funcs;
445       quads = (dx&3) | ((dy&3)<<2);       quads = (dx&3) | ((dy&3)<<2);
446    
447    x_int = xRef/4;    x_int = xRef/4;
# Line 336  Line 453 
453     y_int--;     y_int--;
454    
455      dst = cur + y * stride + x;      dst = cur + y * stride + x;
456          src = refn + y_int * stride + x_int;          src = refn + y_int * (int)stride + x_int;
457    
458    tmp = refh; // we need at least a 16 x stride scratch block          tmp = refh; /* we need at least a 16 x stride scratch block */
459    
460    switch(quads) {    switch(quads) {
461      case 0:      case 0:
# Line 400  Line 517 
517      break;      break;
518    }    }
519  }  }
520  /*****************************************************************************/  
521    static void __inline
522    interpolate8x8_add_quarterpel(uint8_t * const cur,
523                                                              uint8_t * const refn,
524                                                              uint8_t * const refh,
525                                                              uint8_t * const refv,
526                                                              uint8_t * const refhv,
527                                                              const uint32_t x, const uint32_t y,
528                                                              const int32_t dx,  const int dy,
529                                                              const uint32_t stride,
530                                                              const uint32_t rounding)
531    {
532            const uint8_t *src;
533            uint8_t *dst;
534            uint8_t *tmp;
535            int32_t quads;
536            const XVID_QP_FUNCS *Ops;
537            const XVID_QP_FUNCS *Ops_Copy;
538    
539            int32_t x_int, y_int;
540    
541            const int32_t xRef = (int)x*4 + dx;
542            const int32_t yRef = (int)y*4 + dy;
543    
544            Ops = xvid_QP_Add_Funcs;
545            Ops_Copy = xvid_QP_Funcs;
546            quads = (dx&3) | ((dy&3)<<2);
547    
548            x_int = xRef/4;
549            if (xRef < 0 && xRef % 4)
550                    x_int--;
551    
552            y_int    = yRef/4;
553            if (yRef < 0 && yRef % 4)
554                    y_int--;
555    
556            dst = cur + y * stride + x;
557            src = refn + y_int * (int)stride + x_int;
558    
559            tmp = refh; /* we need at least a 16 x stride scratch block */
560    
561            switch(quads) {
562            case 0:
563                    /* Misleading function name, there is no halfpel involved
564                     * just dst and src averaging with rounding=0 */
565                    interpolate8x8_halfpel_add(dst, src, stride, rounding);
566                    break;
567            case 1:
568                    Ops->H_Pass_Avrg_8(dst, src, 8, stride, rounding);
569                    break;
570            case 2:
571                    Ops->H_Pass_8(dst, src, 8, stride, rounding);
572                    break;
573            case 3:
574                    Ops->H_Pass_Avrg_Up_8(dst, src, 8, stride, rounding);
575                    break;
576            case 4:
577                    Ops->V_Pass_Avrg_8(dst, src, 8, stride, rounding);
578                    break;
579            case 5:
580                    Ops_Copy->H_Pass_Avrg_8(tmp, src, 9, stride, rounding);
581                    Ops->V_Pass_Avrg_8(dst, tmp, 8, stride, rounding);
582                    break;
583            case 6:
584                    Ops_Copy->H_Pass_8(tmp, src, 9, stride, rounding);
585                    Ops->V_Pass_Avrg_8(dst, tmp, 8, stride, rounding);
586                    break;
587            case 7:
588                    Ops_Copy->H_Pass_Avrg_Up_8(tmp, src, 9, stride, rounding);
589                    Ops->V_Pass_Avrg_8(dst, tmp, 8, stride, rounding);
590                    break;
591            case 8:
592                    Ops->V_Pass_8(dst, src, 8, stride, rounding);
593                    break;
594            case 9:
595                    Ops_Copy->H_Pass_Avrg_8(tmp, src, 9, stride, rounding);
596                    Ops->V_Pass_8(dst, tmp, 8, stride, rounding);
597                    break;
598            case 10:
599                    Ops_Copy->H_Pass_8(tmp, src, 9, stride, rounding);
600                    Ops->V_Pass_8(dst, tmp, 8, stride, rounding);
601                    break;
602            case 11:
603                    Ops_Copy->H_Pass_Avrg_Up_8(tmp, src, 9, stride, rounding);
604                    Ops->V_Pass_8(dst, tmp, 8, stride, rounding);
605                    break;
606            case 12:
607                    Ops->V_Pass_Avrg_Up_8(dst, src, 8, stride, rounding);
608                    break;
609            case 13:
610                    Ops_Copy->H_Pass_Avrg_8(tmp, src, 9, stride, rounding);
611                    Ops->V_Pass_Avrg_Up_8(dst, tmp, 8, stride, rounding);
612                    break;
613            case 14:
614                    Ops_Copy->H_Pass_8(tmp, src, 9, stride, rounding);
615                    Ops->V_Pass_Avrg_Up_8( dst, tmp, 8, stride, rounding);
616                    break;
617            case 15:
618                    Ops_Copy->H_Pass_Avrg_Up_8(tmp, src, 9, stride, rounding);
619                    Ops->V_Pass_Avrg_Up_8(dst, tmp, 8, stride, rounding);
620                    break;
621            }
622    }
623    
624  #endif  /* _XVID_QPEL_H_ */  #endif  /* _XVID_QPEL_H_ */

Legend:
Removed from v.1.1.2.1  
changed lines
  Added in v.1.6

No admin address has been configured
ViewVC Help
Powered by ViewVC 1.0.4