Diff of /xvidcore/src/motion/motion_est.c

-revision 1.39, Sat Jul 27 23:47:01 2002 UTC
+revision 1.45, Fri Sep  6 16:59:47 2002 UTC
 Line 1
- /**************************************************************************
+ /*****************************************************************************
   *
   *      XVID MPEG-4 VIDEO CODEC
-  *      motion estimation
+  *  - Motion Estimation module -
+  *
+  *  Copyright(C) 2002 Christoph Lampert <gruel@web.de>
+  *  Copyright(C) 2002 Michael Militzer <michael@xvid.org>
+  *  Copyright(C) 2002 Edouard Gomez <ed.gomez@wanadoo.fr>
+  *  Copyright(C) 2002 chenm001 <chenm001@163.com>
   *
   *      This program is an implementation of a part of one or more MPEG-4
   *      Video tools as specified in ISO/IEC 14496-2 standard.  Those intending
-Line 24
+Line 29
   *
   *      You should have received a copy of the GNU General Public License
   *      along with this program; if not, write to the Free Software
-  *      Foundation, Inc., 675 Mass Ave, Cambridge, MA 02139, USA.
+  *  Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA  02111-1307 USA
   *
   *************************************************************************/
- /**************************************************************************
-  *
-  *  Modifications:
-  *
-  *      01.05.2002      updated MotionEstimationBVOP
-  *      25.04.2002 partial prevMB conversion
-  *  22.04.2002 remove some compile warning by chenm001 <chenm001@163.com>
-  *  14.04.2002 added MotionEstimationBVOP()
-  *  02.04.2002 add EPZS(^2) as ME algorithm, use PMV_USESQUARES to choose between
-  *             EPZS and EPZS^2
-  *  08.02.2002 split up PMVfast into three routines: PMVFast, PMVFast_MainLoop
-  *             PMVFast_Refine to support multiple searches with different start points
-  *  07.01.2002 uv-block-based interpolation
-  *  06.01.2002 INTER/INTRA-decision is now done before any SEARCH8 (speedup)
-  *             changed INTER_BIAS to 150 (as suggested by suxen_drol)
-  *             removed halfpel refinement step in PMVfastSearch8 + quality=5
-  *             added new quality mode = 6 which performs halfpel refinement
-  *             filesize difference between quality 5 and 6 is smaller than 1%
-  *             (Isibaar)
-  *  31.12.2001 PMVfastSearch16 and PMVfastSearch8 (gruel)
-  *  30.12.2001 get_range/MotionSearchX simplified; blue/green bug fix
-  *  22.12.2001 commented best_point==99 check
-  *  19.12.2001 modified get_range (purple bug fix)
-  *  15.12.2001 moved pmv displacement from mbprediction
-  *  02.12.2001 motion estimation/compensation split (Isibaar)
-  *  16.11.2001 rewrote/tweaked search algorithms; pross@cs.rmit.edu.au
-  *  10.11.2001 support for sad16/sad8 functions
-  *  28.08.2001 reactivated MODE_INTER4V for EXT_MODE
-  *  24.08.2001 removed MODE_INTER4V_Q, disabled MODE_INTER4V for EXT_MODE
-  *  22.08.2001 added MODE_INTER4V_Q
-  *  20.08.2001 added pragma to get rid of internal compiler error with VC6
-  *             idea by Cyril. Thanks.
-  *
-  *  Michael Militzer <isibaar@videocoding.de>
-  *
-  **************************************************************************/
  #include <assert.h>
  #include <stdio.h>
  #include <stdlib.h>
-Line 186
+Line 154
                          MACROBLOCK *const pMB = &pMBs[x + y * iWcount];
+                         if (pMB->mode == MODE_NOT_CODED)
+                                 continue;
                          predMV = get_pmv2(pMBs, pParam->mb_width, 0, x, y, 0);
                          pMB->sad16 =
-Line 874
+Line 845
          return iMinSAD;
  }
+ #define CHECK_MV16_F_INTERPOL(X,Y) { \
- #define CHECK_MV16_F_INTERPOL(X,Y,BX,BY) { \
+   if ( ((X) <= f_max_dx) && ((X) >= f_min_dx) \
-   if ( ((X) <= max_dx) && ((X) >= min_dx) \
+     && ((Y) <= f_max_dy) && ((Y) >= f_min_dy) ) \
-     && ((Y) <= max_dy) && ((Y) >= min_dy) ) \
-   { \
-     iSAD = sad16( cur, get_ref(pRef, pRefH, pRefV, pRefHV, x, y, 16, X, Y, iEdgedWidth),iEdgedWidth, iMinSAD); \
-     iSAD += calc_delta_16((X) - center_x, (Y) - center_y, (uint8_t)iFcode, iQuant);\
-     if (iSAD < iMinSAD) \
-     {  iMinSAD=iSAD; currMV->x=(X); currMV->y=(Y); } } \
- }
- #define CHECK_MV16_F_INTERPOL_DIR(X,Y,BX,BY,D) { \
-   if ( ((X) <= max_dx) && ((X) >= min_dx) \
-     && ((Y) <= max_dy) && ((Y) >= min_dy) ) \
-   { \
-     iSAD = sad16( cur, get_ref(pRef, pRefH, pRefV, pRefHV, x, y, 16, X, Y, iEdgedWidth),iEdgedWidth, iMinSAD); \
-     iSAD += calc_delta_16((X) - center_x, (Y) - center_y, (uint8_t)iFcode, iQuant);\
-     if (iSAD < iMinSAD) \
-     {  iMinSAD=iSAD; currMV->x=(X); currMV->y=(Y); iDirection=(D); } } \
- }
- #define CHECK_MV16_F_INTERPOL_FOUND(X,Y,BX,BY,D) { \
-   if ( ((X) <= max_dx) && ((X) >= min_dx) \
-     && ((Y) <= max_dy) && ((Y) >= min_dy) ) \
    { \
-     iSAD = sad16( cur, get_ref(pRef, pRefH, pRefV, pRefHV, x, y, 16, X, Y, iEdgedWidth),iEdgedWidth, iMinSAD); \
+     iSAD = sad16bi( cur, \
-     iSAD += calc_delta_16((X) - center_x, (Y) - center_y, (uint8_t)iFcode, iQuant);\
+                         get_ref(f_pRef, f_pRefH, f_pRefV, f_pRefHV, x, y, 16, X, Y, iEdgedWidth),       \
+                         get_ref(b_pRef, b_pRefH, b_pRefV, b_pRefHV, x, y, 16, b_currMV->x, b_currMV->y, iEdgedWidth),   \
+                         iEdgedWidth); \
+     iSAD += calc_delta_16((X) - f_center_x, (Y) - f_center_y, (uint8_t)f_iFcode, iQuant);\
+     iSAD += calc_delta_16(b_currMV->x - b_center_x, b_currMV->y - b_center_y, (uint8_t)b_iFcode, iQuant);\
      if (iSAD < iMinSAD) \
-     {  iMinSAD=iSAD; currMV->x=(X); currMV->y=(Y); iDirection=(D); iFound=0; } } \
+     {  iMinSAD=iSAD; f_currMV->x=(X); f_currMV->y=(Y); } } \
  }
+ #define CHECK_MV16_F_INTERPOL_FOUND(X,Y) { \
- #define CHECK_MV16_B_INTERPOL(FX,FY,X,Y) { \
+   if ( ((X) <= f_max_dx) && ((X) >= f_min_dx) \
-   if ( ((X) <= max_dx) && ((X) >= min_dx) \
+     && ((Y) <= f_max_dy) && ((Y) >= f_min_dy) ) \
-     && ((Y) <= max_dy) && ((Y) >= min_dy) ) \
    { \
-     iSAD = sad16( cur, get_ref(pRef, pRefH, pRefV, pRefHV, x, y, 16, X, Y, iEdgedWidth),iEdgedWidth, iMinSAD); \
+     iSAD = sad16bi( cur, \
-     iSAD += calc_delta_16((X) - center_x, (Y) - center_y, (uint8_t)iFcode, iQuant);\
+                         get_ref(f_pRef, f_pRefH, f_pRefV, f_pRefHV, x, y, 16, X, Y, iEdgedWidth),       \
+                         get_ref(b_pRef, b_pRefH, b_pRefV, b_pRefHV, x, y, 16, b_currMV->x, b_currMV->y, iEdgedWidth),   \
+                         iEdgedWidth); \
+     iSAD += calc_delta_16((X) - f_center_x, (Y) - f_center_y, (uint8_t)f_iFcode, iQuant);\
+     iSAD += calc_delta_16(b_currMV->x - b_center_x, b_currMV->y - b_center_y, (uint8_t)b_iFcode, iQuant);\
      if (iSAD < iMinSAD) \
-     {  iMinSAD=iSAD; currMV->x=(X); currMV->y=(Y); } } \
+     {  iMinSAD=iSAD; f_currMV->x=(X); f_currMV->y=(Y); iFound=0;} } \
  }
+ #define CHECK_MV16_B_INTERPOL(X,Y) { \
- #define CHECK_MV16_B_INTERPOL_DIR(FX,FY,X,Y,D) { \
+   if ( ((X) <= b_max_dx) && ((X) >= b_min_dx) \
-   if ( ((X) <= max_dx) && ((X) >= min_dx) \
+     && ((Y) <= b_max_dy) && ((Y) >= b_min_dy) ) \
-     && ((Y) <= max_dy) && ((Y) >= min_dy) ) \
    { \
-     iSAD = sad16( cur, get_ref(pRef, pRefH, pRefV, pRefHV, x, y, 16, X, Y, iEdgedWidth),iEdgedWidth, iMinSAD); \
+     iSAD = sad16bi( cur, \
-     iSAD += calc_delta_16((X) - center_x, (Y) - center_y, (uint8_t)iFcode, iQuant);\
+                         get_ref(f_pRef, f_pRefH, f_pRefV, f_pRefHV, x, y, 16, f_currMV->x, f_currMV->y, iEdgedWidth),   \
+                         get_ref(b_pRef, b_pRefH, b_pRefV, b_pRefHV, x, y, 16, X, Y, iEdgedWidth),       \
+                         iEdgedWidth); \
+     iSAD += calc_delta_16(f_currMV->x - f_center_x, f_currMV->y - f_center_y, (uint8_t)f_iFcode, iQuant);\
+     iSAD += calc_delta_16((X) - b_center_x, (Y) - b_center_y, (uint8_t)b_iFcode, iQuant);\
      if (iSAD < iMinSAD) \
-     {  iMinSAD=iSAD; currMV->x=(X); currMV->y=(Y); iDirection=(D); } } \
+     {  iMinSAD=iSAD; b_currMV->x=(X); b_currMV->y=(Y); } } \
  }
+ #define CHECK_MV16_B_INTERPOL_FOUND(X,Y) { \
- #define CHECK_MV16_B_INTERPOL_FOUND(FX,FY,X,Y,D) { \
+   if ( ((X) <= b_max_dx) && ((X) >= b_min_dx) \
-   if ( ((X) <= max_dx) && ((X) >= min_dx) \
+     && ((Y) <= b_max_dy) && ((Y) >= b_min_dy) ) \
-     && ((Y) <= max_dy) && ((Y) >= min_dy) ) \
    { \
-     iSAD = sad16( cur, get_ref(pRef, pRefH, pRefV, pRefHV, x, y, 16, X, Y, iEdgedWidth),iEdgedWidth, iMinSAD); \
+     iSAD = sad16bi( cur, \
-     iSAD += calc_delta_16((X) - center_x, (Y) - center_y, (uint8_t)iFcode, iQuant);\
+                         get_ref(f_pRef, f_pRefH, f_pRefV, f_pRefHV, x, y, 16, f_currMV->x, f_currMV->y, iEdgedWidth),   \
+                         get_ref(b_pRef, b_pRefH, b_pRefV, b_pRefHV, x, y, 16, X, Y, iEdgedWidth),       \
+                         iEdgedWidth); \
+     iSAD += calc_delta_16(f_currMV->x - f_center_x, f_currMV->y - f_center_y, (uint8_t)f_iFcode, iQuant);\
+     iSAD += calc_delta_16((X) - b_center_x, (Y) - b_center_y, (uint8_t)b_iFcode, iQuant);\
      if (iSAD < iMinSAD) \
-     {  iMinSAD=iSAD; currMV->x=(X); currMV->y=(Y); iDirection=(D); iFound=0; } } \
+     {  iMinSAD=iSAD; b_currMV->x=(X); b_currMV->y=(Y); iFound=0;} } \
  }
- #if (0==1)
  int32_t
  Diamond16_InterpolMainSearch(
                                          const uint8_t * const f_pRef,
                                           const uint8_t * const f_pRefH,
                                           const uint8_t * const f_pRefV,
                                           const uint8_t * const f_pRefHV,
                                           const uint8_t * const cur,
                                          const uint8_t * const b_pRef,
-Line 970
+Line 932
                                     const int b_center_x,
                                     const int b_center_y,
-                                          const int32_t min_dx,
+                                     const int32_t f_min_dx,
-                                          const int32_t max_dx,
+                                         const int32_t f_max_dx,
-                                          const int32_t min_dy,
+                                         const int32_t f_min_dy,
-                                          const int32_t max_dy,
+                                         const int32_t f_max_dy,
+                                     const int32_t b_min_dx,
+                                         const int32_t b_max_dx,
+                                         const int32_t b_min_dy,
+                                         const int32_t b_max_dy,
                                           const int32_t iEdgedWidth,
                                           const int32_t iDiamondSize,
-Line 985
+Line 953
  {
  /* Do a diamond search around given starting point, return SAD of best */
-         int32_t f_iDirection = 0;
-         int32_t b_iDirection = 0;
          int32_t iSAD;
          VECTOR f_backupMV;
          VECTOR b_backupMV;
-         f_backupMV.x = start_x;
+         f_currMV->x = f_start_x;
-         f_backupMV.y = start_y;
+         f_currMV->y = f_start_y;
-         b_backupMV.x = start_x;
+         b_currMV->x = b_start_x;
-         b_backupMV.y = start_y;
+         b_currMV->y = b_start_y;
- /* It's one search with full Diamond pattern, and only 3 of 4 for all following diamonds */
+         do
+         {
+                 iFound = 1;
-         CHECK_MV16_CANDIDATE_DIR(backupMV.x - iDiamondSize, backupMV.y, 1);
+                 f_backupMV = *f_currMV;
-         CHECK_MV16_CANDIDATE_DIR(backupMV.x + iDiamondSize, backupMV.y, 2);
-         CHECK_MV16_CANDIDATE_DIR(backupMV.x, backupMV.y - iDiamondSize, 3);
-         CHECK_MV16_CANDIDATE_DIR(backupMV.x, backupMV.y + iDiamondSize, 4);
-         if (iDirection)
+                 CHECK_MV16_F_INTERPOL_FOUND(f_backupMV.x - iDiamondSize, f_backupMV.y);
-                 while (!iFound) {
+                 CHECK_MV16_F_INTERPOL_FOUND(f_backupMV.x + iDiamondSize, f_backupMV.y);
-                         iFound = 1;
+                 CHECK_MV16_F_INTERPOL_FOUND(f_backupMV.x, f_backupMV.y - iDiamondSize);
-                         backupMV = *currMV;
+                 CHECK_MV16_F_INTERPOL_FOUND(f_backupMV.x, f_backupMV.y + iDiamondSize);
+                 b_backupMV = *b_currMV;
+                 CHECK_MV16_B_INTERPOL_FOUND(b_backupMV.x - iDiamondSize, b_backupMV.y);
+                 CHECK_MV16_B_INTERPOL_FOUND(b_backupMV.x + iDiamondSize, b_backupMV.y);
+                 CHECK_MV16_B_INTERPOL_FOUND(b_backupMV.x, b_backupMV.y - iDiamondSize);
+                 CHECK_MV16_B_INTERPOL_FOUND(b_backupMV.x, b_backupMV.y + iDiamondSize);
+         } while (!iFound);
+         return iMinSAD;
+ }
+ /* Sorry, these MACROS really got too large... I'll turn them into function soon! */
+ #define CHECK_MV16_DIRECT_FOUND(X,Y) \
+         if ( (X)>=(-32) && (X)<=(31) && ((Y)>=-32) && ((Y)<=31) ) \
+         { int k;\
+         VECTOR mvs,b_mvs;       \
+         iSAD = 0;\
+         for (k = 0; k < 4; k++) {       \
+                                         mvs.x = (int32_t) ((TRB * directmv[k].x) / TRD + (X));          \
+                     b_mvs.x = (int32_t) (((X) == 0)                                                     \
+                                                                                 ? ((TRB - TRD) * directmv[k].x) / TRD   \
+                                             : mvs.x - directmv[k].x);                           \
+                                                                                                                                                                 \
+                     mvs.y = (int32_t) ((TRB * directmv[k].y) / TRD + (Y));              \
+                         b_mvs.y = (int32_t) (((Y) == 0)                                                         \
+                                                                                 ? ((TRB - TRD) * directmv[k].y) / TRD   \
+                                             : mvs.y - directmv[k].y);                           \
+                                                                                                                                                                 \
+   if ( (mvs.x <= max_dx) && (mvs.x >= min_dx) \
+     && (mvs.y <= max_dy) && (mvs.y >= min_dy)  \
+         && (b_mvs.x <= max_dx) && (b_mvs.x >= min_dx)  \
+     && (b_mvs.y <= max_dy) && (b_mvs.y >= min_dy) ) { \
+             iSAD += sad8bi( cur + 8*(k&1) + 8*(k>>1)*iEdgedWidth,                                                                                                       \
+                         get_ref(f_pRef, f_pRefH, f_pRefV, f_pRefHV, 2*x+(k&1), 2*y+(k>>1), 8, \
+                                         mvs.x, mvs.y, iEdgedWidth),                                                             \
+                         get_ref(b_pRef, b_pRefH, b_pRefV, b_pRefHV, 2*x+(k&1), 2*y+(k>>1), 8, \
+                                         b_mvs.x, b_mvs.y, iEdgedWidth),                                                         \
+                         iEdgedWidth); \
+                 }       \
+         else    \
+                 iSAD = 65535;   \
+         } \
+         iSAD += calc_delta_16((X),(Y), 1, iQuant);\
+         if (iSAD < iMinSAD) \
+             {  iMinSAD=iSAD; currMV->x=(X); currMV->y=(Y); iFound=0; } \
+ }
+ int32_t
+ Diamond16_DirectMainSearch(
+                                         const uint8_t * const f_pRef,
+                                         const uint8_t * const f_pRefH,
+                                         const uint8_t * const f_pRefV,
+                                         const uint8_t * const f_pRefHV,
+                                         const uint8_t * const cur,
+                                         const uint8_t * const b_pRef,
+                                         const uint8_t * const b_pRefH,
+                                         const uint8_t * const b_pRefV,
+                                         const uint8_t * const b_pRefHV,
+                                         const int x,
+                                         const int y,
+                                         const int TRB,
+                                         const int TRD,
+                                     const int start_x,
+                                     const int start_y,
+                                     int iMinSAD,
+                                     VECTOR * const currMV,
+                                         const VECTOR * const directmv,
+                                     const int32_t min_dx,
+                                         const int32_t max_dx,
+                                         const int32_t min_dy,
+                                         const int32_t max_dy,
+                                         const int32_t iEdgedWidth,
+                                         const int32_t iDiamondSize,
+                                         const int32_t iQuant,
+                                         int iFound)
+ {
+ /* Do a diamond search around given starting point, return SAD of best */
+         int32_t iSAD;
+         VECTOR backupMV;
-                         if (iDirection != 2)
-                                 CHECK_MV16_CANDIDATE_FOUND(backupMV.x - iDiamondSize,
-                                                                                    backupMV.y, 1);
-                         if (iDirection != 1)
-                                 CHECK_MV16_CANDIDATE_FOUND(backupMV.x + iDiamondSize,
-                                                                                    backupMV.y, 2);
-                         if (iDirection != 4)
-                                 CHECK_MV16_CANDIDATE_FOUND(backupMV.x,
-                                                                                    backupMV.y - iDiamondSize, 3);
-                         if (iDirection != 3)
-                                 CHECK_MV16_CANDIDATE_FOUND(backupMV.x,
-                                                                                    backupMV.y + iDiamondSize, 4);
-         } else {
                  currMV->x = start_x;
                  currMV->y = start_y;
-         }
+ /* It's one search with full Diamond pattern, and only 3 of 4 for all following diamonds */
+         do
+         {
+                 iFound = 1;
+                 backupMV = *currMV;
+                 CHECK_MV16_DIRECT_FOUND(backupMV.x - iDiamondSize, backupMV.y);
+                 CHECK_MV16_DIRECT_FOUND(backupMV.x + iDiamondSize, backupMV.y);
+                 CHECK_MV16_DIRECT_FOUND(backupMV.x, backupMV.y - iDiamondSize);
+                 CHECK_MV16_DIRECT_FOUND(backupMV.x, backupMV.y + iDiamondSize);
+         } while (!iFound);
          return iMinSAD;
  }
- #endif
  int32_t
-Line 1278
+Line 1339
                                  const IMAGE * const pCur,
                                  const int x,
                                  const int y,
-                                 const int start_x,
+                                 const int start_x,      /* start is searched first, so it should contain the most */
-                                 const int start_y,
+                                 const int start_y,  /* likely motion vector for this block */
-                                 const int center_x,
+                                 const int center_x,     /* center is from where length of MVs is measured */
                                  const int center_y,
                                  const uint32_t MotionFlags,
                                  const uint32_t iQuant,
-Line 2737
+Line 2798
                                  const IMAGE * const pCur,
                                  const int x,
                                  const int y,
-                         const int start_x,
+                                 const int start_x,              /* start should be most likely vector */
                          const int start_y,
-                         const int center_x,
+                                 const int center_x,             /* center is from where length of MVs is measured */
                          const int center_y,
                                  const uint32_t MotionFlags,
                                  const uint32_t iQuant,
-Line 2768
+Line 2829
          int32_t iFound;
          VECTOR newMV;
-         VECTOR backupMV;                        /* just for PMVFAST */
+         VECTOR backupMV;
          VECTOR pmv[4];
          int32_t psad[4];
-Line 2798
+Line 2859
                  *currMV = pmv[0] = pmv[1] = pmv[2] = pmv[3] = zeroMV;
          } else {
+                 bPredEq = get_ipmvdata(pMBs, iWcount, 0, x, y, 0, pmv, psad);
                  threshA = psad[0];
                  threshB = threshA + 256;
                  if (threshA < 512)
-Line 2807
+Line 2871
                  if (threshB > 1792)
                          threshB = 1792;
-                 bPredEq = get_ipmvdata(pMBs, iWcount, 0, x, y, 0, pmv, psad);
                  *currMV = pmv[0];                       /* current best := prediction */
          }
-Line 3023
+Line 3086
  /* ***********************************************************
          bvop motion estimation
- // TODO: need to incorporate prediction here (eg. sad += calc_delta_16)
  ***************************************************************/
- #define DIRECT_PENALTY 0
- #define DIRECT_UPPERLIMIT 256   // never use direct mode if SAD is larger than this
  void
  MotionEstimationBVOP(MBParam * const pParam,
                                           FRAMEINFO * const frame,
-Line 3052
+Line 3110
          const int mb_height = pParam->mb_height;
          const int edged_width = pParam->edged_width;
+         const int32_t iWidth = pParam->width;
+         const int32_t iHeight = pParam->height;
          int i, j, k;
          static const VECTOR zeroMV={0,0};
-Line 3059
+Line 3120
          int f_sad16;    /* forward (as usual) search */
          int b_sad16;    /* backward (only in b-frames) search */
          int i_sad16;    /* interpolated (both direction, b-frames only) */
-         int d_sad16;    /* direct mode (assume linear motion) */
+         int d_sad16;    /* direct mode (assume almost linear motion) */
          int best_sad;
          VECTOR f_predMV, b_predMV;      /* there is no prediction for direct mode*/
+         VECTOR f_interpolMV, b_interpolMV;
          VECTOR pmv_dontcare;
+         int min_dx, max_dx, min_dy, max_dy;
+         int f_min_dx, f_max_dx, f_min_dy, f_max_dy;
+         int b_min_dx, b_max_dx, b_min_dy, b_max_dy;
          int f_count=0;
          int b_count=0;
          int i_count=0;
          int d_count=0;
-         int s_count=0;
          const int64_t TRB = (int32_t)time_pp - (int32_t)time_bp;
      const int64_t TRD = (int32_t)time_pp;
-Line 3089
+Line 3154
                          mb->deltamv=zeroMV;
- /* special case, if collocated block is SKIPed: encoding is forward(0,0)  */
+ /* special case, if collocated block is SKIPed: encoding is forward (0,0), cpb=0 without further ado */
- #ifndef _DISABLE_SKIP
                          if (b_mb->mode == MODE_INTER && b_mb->cbp == 0 &&
                                  b_mb->mvs[0].x == 0 && b_mb->mvs[0].y == 0) {
                                  mb->mode = MODE_NOT_CODED;
-                                 mb->mvs[0].x = 0;
+                                 mb->b_mvs[0] = mb->mvs[0] = zeroMV;
-                                 mb->mvs[0].y = 0;
-                                 mb->b_mvs[0].x = 0;
-                                 mb->b_mvs[0].y = 0;
                                  continue;
                          }
- #endif
-                         d_sad16 = DIRECT_PENALTY;
                          if (b_mb->mode == MODE_INTER4V)
                          {
+                                 d_sad16 = 0;
                          /* same method of scaling as in decoder.c, so we copy from there */
                      for (k = 0; k < 4; k++) {
-Line 3119
+Line 3177
                                              : mb->mvs[k].x - mb->directmv[k].x);
                      mb->mvs[k].y = (int32_t) ((TRB * mb->directmv[k].y) / TRD + mb->deltamv.y);
-                         mb->b_mvs[k].y = (int32_t) ((mb->directmv[k].y == 0)
+                         mb->b_mvs[k].y = (int32_t) ((mb->deltamv.y == 0)
                                                                                  ? ((TRB - TRD) * mb->directmv[k].y) / TRD
                                              : mb->mvs[k].y - mb->directmv[k].y);
                                          d_sad16 +=
-                                                 sad8bi(frame->image.y + 2*(i+(k&1))*8 + 2*(j+(k>>1))*8*edged_width,
+                                                 sad8bi(frame->image.y + (2*i+(k&1))*8 + (2*j+(k>>1))*8*edged_width,
                                                    get_ref_mv(f_ref->y, f_refH->y, f_refV->y, f_refHV->y,
-*(i+(k&1)), 2*(j+(k>>1)), 8, &mb->mvs[k], edged_width),
+                                                                 (2*i+(k&1)), (2*j+(k>>1)), 8, &mb->mvs[k], edged_width),
                                                    get_ref_mv(b_ref->y, b_refH->y, b_refV->y, b_refHV->y,
-*(i+(k&1)), 2*(j+(k>>1)), 8, &mb->b_mvs[k], edged_width),
+                                                                 (2*i+(k&1)), (2*j+(k>>1)), 8, &mb->b_mvs[k], edged_width),
                                                    edged_width);
                                  }
                          }
-Line 3147
+Line 3205
                                                                          ? ((TRB - TRD) * mb->directmv[0].y) / TRD
                                      : mb->mvs[0].y - mb->directmv[0].y);
-                                 d_sad16 += sad16bi(frame->image.y + i * 16 + j * 16 * edged_width,
+                                 d_sad16 = sad16bi(frame->image.y + i * 16 + j * 16 * edged_width,
                                                    get_ref_mv(f_ref->y, f_refH->y, f_refV->y, f_refHV->y,
                                                                  i, j, 16, &mb->mvs[0], edged_width),
                                                    get_ref_mv(b_ref->y, b_refH->y, b_refV->y, b_refHV->y,
-Line 3190
+Line 3248
                      i_sad16 += calc_delta_16(mb->b_mvs[0].x-b_predMV.x, mb->b_mvs[0].y-b_predMV.y,
                                                                  frame->bcode, frame->quant);
-                         // TODO: direct search
+                         get_range(&f_min_dx, &f_max_dx, &f_min_dy, &f_max_dy, i, j, 16, iWidth, iHeight,
-                         // predictor + delta vector in range [-32,32] (fcode=1)
+                           frame->fcode);
+                         get_range(&b_min_dx, &b_max_dx, &b_min_dy, &b_max_dy, i, j, 16, iWidth, iHeight,
+                           frame->bcode);
+ /* Interpolated MC motion vector search, this is tedious and more complicated because there are
+    two values for everything, always one for backward and one for forward ME. Still, we don't gain
+    much from this search, maybe it should simply be skipped and simply current i_sad16 value used
+    as "optimal". */
+                         i_sad16 = Diamond16_InterpolMainSearch(
+                                                 f_ref->y, f_refH->y, f_refV->y, f_refHV->y,
+                                                 frame->image.y + i * 16 + j * 16 * edged_width,
+                                                 b_ref->y, b_refH->y, b_refV->y, b_refHV->y,
+                                                 i, j,
+                                                 mb->mvs[0].x, mb->mvs[0].y,
+                                                 mb->b_mvs[0].x, mb->b_mvs[0].y,
+                                                 i_sad16,
+                                                 &f_interpolMV, &b_interpolMV,
+                                                 f_predMV.x, f_predMV.y, b_predMV.x, b_predMV.y,
+                                                 f_min_dx, f_max_dx, f_min_dy, f_max_dy,
+                                                 b_min_dx, b_max_dx, b_min_dy, b_max_dy,
+                                                 edged_width,  2,
+                                                 frame->fcode, frame->bcode,frame->quant,0);
+                         i_sad16 = Diamond16_InterpolMainSearch(
+                                                 f_ref->y, f_refH->y, f_refV->y, f_refHV->y,
+                                                 frame->image.y + i * 16 + j * 16 * edged_width,
+                                                 b_ref->y, b_refH->y, b_refV->y, b_refHV->y,
+                                                 i, j,
+                                                 f_interpolMV.x, f_interpolMV.y,
+                                                 b_interpolMV.x, b_interpolMV.y,
+                                                 i_sad16,
+                                                 &f_interpolMV, &b_interpolMV,
+                                                 f_predMV.x, f_predMV.y, b_predMV.x, b_predMV.y,
+                                                 f_min_dx, f_max_dx, f_min_dy, f_max_dy,
+                                                 b_min_dx, b_max_dx, b_min_dy, b_max_dy,
+                                                 edged_width,  1,
+                                                 frame->fcode, frame->bcode,frame->quant,0);             // equiv to halfpel refine
+ /*  DIRECT MODE DELTA VECTOR SEARCH.
+     This has to be made more effective, but at the moment I'm happy it's running at all */
+ /* There are two range restrictions for direct mode: deltaMV is limited to [-32,31] in halfpel units, and
+    absolute vector must not lie outside of image dimensions. Constraint one is dealt with by CHECK_MV16_DIRECT
+    and for constraint two we need distance to boundary. This is done by get_range very large fcode (hack!) */
+                         get_range(&min_dx, &max_dx, &min_dy, &max_dy, i, j, 16, iWidth, iHeight, 19);
+                         d_sad16 = Diamond16_DirectMainSearch(
+                                                 f_ref->y, f_refH->y, f_refV->y, f_refHV->y,
+                                                 frame->image.y + i*16 + j*16*edged_width,
+                                                 b_ref->y, b_refH->y, b_refV->y, b_refHV->y,
+                                                 i, j,
+                                                 TRB,TRD,
+,0,
+                                                 d_sad16,
+                                                 &mb->deltamv,
+                                                 mb->directmv, // this has to be pre-initialized with b_mb->mvs[]
+                                         min_dx, max_dx, min_dy, max_dy,
+                                                 edged_width, 2, frame->quant, 0);
+                         d_sad16 = Diamond16_DirectMainSearch(
+                                                 f_ref->y, f_refH->y, f_refV->y, f_refHV->y,
+                                                 frame->image.y + i*16 + j*16*edged_width,
+                                                 b_ref->y, b_refH->y, b_refV->y, b_refHV->y,
+                                                 i, j,
+                                                 TRB,TRD,
+                                                 mb->deltamv.x, mb->deltamv.y,
+                                                 d_sad16,
+                                                 &mb->deltamv,
+                                                 mb->directmv, // this has to be pre-initialized with b_mb->mvs[]
+                                         min_dx, max_dx, min_dy, max_dy,
+                                                 edged_width, 1, frame->quant, 0);               // equiv to halfpel refine
-                         i_sad16 = 65535;
+ //                      i_sad16 = 65535;                /* remove the comment to disable any of the MODEs */
-                         f_sad16 = 65535;
+ //                      f_sad16 = 65535;
-                         b_sad16 = 65535;
+ //                      b_sad16 = 65535;
  //                      d_sad16 = 65535;
                          if (f_sad16 < b_sad16) {
-Line 3216
+Line 3348
                                  if (b_mb->mode == MODE_INTER4V)
                                  {
-                                 /* same method of scaling as in decoder.c, so we copy from there */
+                                 /* how to calc vectors is defined in standard. mvs[] and b_mvs[] are only for motion compensation */
+                                 /* for the bitstream, the value mb->deltamv is read directly */
                              for (k = 0; k < 4; k++) {
                                                  mb->mvs[k].x = (int32_t) ((TRB * mb->directmv[k].x) / TRD + mb->deltamv.x);
-Line 3225
+Line 3359
                                                      : mb->mvs[k].x - mb->directmv[k].x);
                              mb->mvs[k].y = (int32_t) ((TRB * mb->directmv[k].y) / TRD + mb->deltamv.y);
-                         mb->b_mvs[k].y = (int32_t) ((mb->directmv[k].y == 0)
+                         mb->b_mvs[k].y = (int32_t) ((mb->deltamv.y == 0)
                                                                                          ? ((TRB - TRD) * mb->directmv[k].y) / TRD
                                              : mb->mvs[k].y - mb->directmv[k].y);
                                          }
-Line 3240
+Line 3374
                              mb->mvs[0].y = (int32_t) ((TRB * mb->directmv[0].y) / TRD + mb->deltamv.y);
-                         mb->b_mvs[0].y = (int32_t) ((mb->directmv[0].y == 0)
+                         mb->b_mvs[0].y = (int32_t) ((mb->deltamv.y == 0)
                                                                                  ? ((TRB - TRD) * mb->directmv[0].y) / TRD
                                              : mb->mvs[0].y - mb->directmv[0].y);
-Line 3250
+Line 3384
                                  best_sad = d_sad16;
                                  mb->mode = MODE_DIRECT;
-                                 mb->mode = MODE_INTERPOLATE;            // direct mode still broken :-(
                          }
                          switch (mb->mode)
-Line 3266
+Line 3399
                                          break;
                                  case MODE_INTERPOLATE:
                                          i_count++;
+                                         mb->mvs[0] = f_interpolMV;
+                                         mb->b_mvs[0] = b_interpolMV;
                                          f_predMV = mb->mvs[0];
                                          b_predMV = mb->b_mvs[0];
                                          break;
-Line 3273
+Line 3408
                                          d_count++;
                                          break;
                                  default:
-                                         s_count++;              // ???
                                          break;
                          }
-Line 3281
+Line 3415
          }
  #ifdef _DEBUG_BFRAME_STAT
-         fprintf(stderr,"B-Stat: F: %04d   B: %04d   I: %04d  D: %04d   S: %04d\n",
+         fprintf(stderr,"B-Stat: F: %04d   B: %04d   I: %04d  D: %04d\n",
-                                 f_count,b_count,i_count,d_count,s_count);
+                                 f_count,b_count,i_count,d_count);
  #endif
  }

 Legend:



Removed from v.1.39
 


changed lines


 
Added in v.1.45
 Legend:



Removed from v.1.39
 


changed lines


 
Added in v.1.45
-Removed from v.1.39
+Added in v.1.45

No admin address has been configured	ViewVC Help
Powered by ViewVC 1.0.4