Diff of /xvidcore/src/motion/motion_est.c

-revision 1.69, Tue May 13 12:47:33 2003 UTC
+revision 1.72, Thu Jun 26 10:37:09 2003 UTC
 Line 667
          for(i = 0; i < 4; i++) {
                  int s = 8*((i&1) + (i>>1)*data->iEdgedWidth);
                  transfer_8to16subro(in, data->Cur + s, ptr + s, data->iEdgedWidth);
-                 bits += data->temp[i] = Block_CalcBits(coeff, in, data->iQuant, data->quant_type, &cbp, i, 0);
+                 bits += data->temp[i] = Block_CalcBits(coeff, in, data->dctSpace + 128, data->iQuant, data->quant_type, &cbp, i);
          }
-         bits += t = d_mv_bits(x, y, data->predMV, data->iFcode, data->qpel^data->qpel_precision, 0);
+         bits += t = BITS_MULT*d_mv_bits(x, y, data->predMV, data->iFcode, data->qpel^data->qpel_precision, 0);
-         bits += xvid_cbpy_tab[15-(cbp>>2)].len;
+         //8x8 blocks for inter4v mode
+         if (data->temp[0] + t < data->iMinSAD[1]) {
+                 data->iMinSAD[1] = data->temp[0] + t; current[1].x = x; current[1].y = y; }
+         if (data->temp[1] < data->iMinSAD[2]) {
+                 data->iMinSAD[2] = data->temp[1]; current[2].x = x; current[2].y = y; }
+         if (data->temp[2] < data->iMinSAD[3]) {
+                 data->iMinSAD[3] = data->temp[2]; current[3].x = x; current[3].y = y; }
+         if (data->temp[3] < data->iMinSAD[4]) {
+                 data->iMinSAD[4] = data->temp[3]; current[4].x = x; current[4].y = y; }
+         bits += BITS_MULT*xvid_cbpy_tab[15-(cbp>>2)].len;
          if (bits >= data->iMinSAD[0]) return;
-Line 683
+Line 693
          //chroma U
          ptr = interpolate8x8_switch2(data->RefQ + 64, data->RefP[4], 0, 0, xc, yc,  data->iEdgedWidth/2, data->rounding);
          transfer_8to16subro(in, ptr, data->CurU, data->iEdgedWidth/2);
-         bits += Block_CalcBits(coeff, in, data->iQuant, data->quant_type, &cbp, 4, 0);
+         bits += Block_CalcBits(coeff, in, data->dctSpace + 128, data->iQuant, data->quant_type, &cbp, 4);
          if (bits >= data->iMinSAD[0]) return;
          //chroma V
          ptr = interpolate8x8_switch2(data->RefQ + 64, data->RefP[5], 0, 0, xc, yc,  data->iEdgedWidth/2, data->rounding);
          transfer_8to16subro(in, ptr, data->CurV, data->iEdgedWidth/2);
-         bits += Block_CalcBits(coeff, in, data->iQuant, data->quant_type, &cbp, 5, 0);
+         bits += Block_CalcBits(coeff, in, data->dctSpace + 128, data->iQuant, data->quant_type, &cbp, 5);
-         bits += mcbpc_inter_tab[(MODE_INTER & 7) | ((cbp & 3) << 3)].len;
+         bits += BITS_MULT*mcbpc_inter_tab[(MODE_INTER & 7) | ((cbp & 3) << 3)].len;
          if (bits < data->iMinSAD[0]) {
                  data->iMinSAD[0] = bits;
                  current[0].x = x; current[0].y = y;
                  *dir = Direction;
          }
-         if (data->temp[0] + t < data->iMinSAD[1]) {
-                 data->iMinSAD[1] = data->temp[0] + t; current[1].x = x; current[1].y = y; }
-         if (data->temp[1] < data->iMinSAD[2]) {
-                 data->iMinSAD[2] = data->temp[1]; current[2].x = x; current[2].y = y; }
-         if (data->temp[2] < data->iMinSAD[3]) {
-                 data->iMinSAD[3] = data->temp[2]; current[3].x = x; current[3].y = y; }
-         if (data->temp[3] < data->iMinSAD[4]) {
-                 data->iMinSAD[4] = data->temp[3]; current[4].x = x; current[4].y = y; }
  }
  static void
  CheckCandidateBits8(const int x, const int y, const int Direction, int * const dir, const SearchData * const data)
 Line 731
          }
          transfer_8to16subro(in, data->Cur, ptr, data->iEdgedWidth);
-         bits = Block_CalcBits(coeff, in, data->iQuant, data->quant_type, &cbp, 5, 0);
+         bits = Block_CalcBits(coeff, in, data->dctSpace + 128, data->iQuant, data->quant_type, &cbp, 5);
-         bits += d_mv_bits(x, y, data->predMV, data->iFcode, data->qpel^data->qpel_precision, 0);
+         bits += BITS_MULT*d_mv_bits(x, y, data->predMV, data->iFcode, data->qpel^data->qpel_precision, 0);
          if (bits < data->iMinSAD[0]) {
                  data->temp[0] = cbp;
 Line 973
                          Data->iMinSAD[0] = sad;
                  }
-                 /* final skip decision, a.k.a. "the vector you found, really that good?" */
+                 // final skip decision, a.k.a. "the vector you found, really that good?"
                  if (skip_possible && (pMB->sad16 < (int)iQuant * MAX_SAD00_FOR_SKIP))
                          if ( (100*sad)/(pMB->sad16+1) > FINAL_SKIP_THRESH)
                                  if (Data->chroma || SkipDecisionP(pCurrent, pRef, x, y, Data->iEdgedWidth/2, iQuant, Data->rrv)) {
 Line 981
                                          sad = 0;
                                  }
-                 /* intra decision */
+                 // intra decision
                  if (iQuant > 8) InterBias += 100 * (iQuant - 8); // to make high quants work
                  if (y != 0)
 Line 1087
          VECTOR currentMV[5];
          VECTOR currentQMV[5];
          int32_t iMinSAD[5];
-         DECLARE_ALIGNED_MATRIX(dct_space, 2, 64, int16_t, CACHE_LINE);
+         DECLARE_ALIGNED_MATRIX(dct_space, 3, 64, int16_t, CACHE_LINE);
          SearchData Data;
          memset(&Data, 0, sizeof(SearchData));
          Data.iEdgedWidth = iEdgedWidth;
 Line 1150
  //initial skip decision
  /* no early skip for GMC (global vector = skip vector is unknown!)  */
                          if (!(current->global_flags & XVID_GMC))        { /* no fast SKIP for S(GMC)-VOPs */
-                                 if (pMB->dquant == NO_CHANGE && sad00 < pMB->quant * skip_thresh)
+                                 if (pMB->dquant == NO_CHANGE && sad00 < quant * skip_thresh)
                                          if (Data.chroma || SkipDecisionP(pCurrent, pRef, x, y, iEdgedWidth/2, pMB->quant, Data.rrv)) {
                                                  SkipMacroblockP(pMB, sad00);
                                                  continue;
 Line 1292
          Data->iMinSAD[3] = pMB->sad8[2];
          Data->iMinSAD[4] = pMB->sad8[3];
-         if ((!(GlobalFlags & XVID_MODEDECISION_BITS)) || (x | y)) {
+         if ((!(GlobalFlags & XVID_MODEDECISION_BITS)) && (x | y)) {
                  threshA = Data->temp[0]; // that's where we keep this SAD atm
                  if (threshA < 512) threshA = 512;
                  else if (threshA > 1024) threshA = 1024;
 Line 1371
                  Data->currentQMV[i].y = 2 * Data->currentMV[i].y;
          }
-         if (MotionFlags & PMV_QUARTERPELREFINE16) {
+         if (Data->qpel) {
                  get_range(&Data->min_dx, &Data->max_dx, &Data->min_dy, &Data->max_dy, x, y, 16,
                                  pParam->width, pParam->height, Data->iFcode, 1, 0);
                  Data->qpel_precision = 1;
+                 if (MotionFlags & PMV_QUARTERPELREFINE16)
                  SubpelRefine(Data);
          }
-         if ((!(GlobalFlags & XVID_MODEDECISION_BITS)) && (Data->iMinSAD[0] < (int32_t)pMB->quant * 30))
+         if (Data->iMinSAD[0] < (int32_t)pMB->quant * 30)
                  inter4v = 0;
          if (inter4v) {
 Line 1775
          CheckCandidate(0, 0, 255, &k, Data);
  // initial (fast) skip decision
-         if (*Data->iMinSAD < pMB->quant * INITIAL_SKIP_THRESH * (2 + Data->chroma?1:0)) {
+         if (*Data->iMinSAD < pMB->quant * INITIAL_SKIP_THRESH * (Data->chroma?3:2)) {
                  //possible skip
                  if (Data->chroma) {
                          pMB->mode = MODE_DIRECT_NONE_MV;
 Line 2159
          }
  }
- #define INTRA_THRESH    1800
+ #define INTRA_THRESH    2200
- #define INTER_THRESH    1200
+ #define INTER_THRESH    50
+ #define INTRA_THRESH2   95
  int
  MEanalysis(     const IMAGE * const pRef,
-Line 2175
+Line 2176
          int sSAD = 0;
          MACROBLOCK * const pMBs = Current->mbs;
          const IMAGE * const pCurrent = &Current->image;
-         int IntraThresh = INTRA_THRESH, InterThresh = INTER_THRESH + 10*b_thresh;
+         int IntraThresh = INTRA_THRESH, InterThresh = INTER_THRESH + b_thresh;
          int s = 0, blocks = 0;
+         int complexity = 0;
          int32_t iMinSAD[5], temp[5];
          VECTOR currentMV[5];
-Line 2188
+Line 2190
          Data.temp = temp;
          CheckCandidate = CheckCandidate32I;
-         if (intraCount != 0 && intraCount < 10) // we're right after an I frame
+         if (intraCount != 0) {
+                 if (intraCount < 10) // we're right after an I frame
                  IntraThresh += 15 * (intraCount - 10) * (intraCount - 10);
          else
                  if ( 5*(maxIntra - intraCount) < maxIntra) // we're close to maximum. 2 sec when max is 10 sec
                          IntraThresh -= (IntraThresh * (maxIntra - 8*(maxIntra - intraCount)))/maxIntra;
+         }
-         InterThresh -= (350 - 8*b_thresh) * bCount;
+         InterThresh -= 12 * bCount;
-         if (InterThresh < 300 + 5*b_thresh) InterThresh = 300 + 5*b_thresh;
+         if (InterThresh < 15 + b_thresh) InterThresh = 15 + b_thresh;
          if (sadInit) (*sadInit) ();
          for (y = 1; y < pParam->mb_height-1; y += 2) {
                  for (x = 1; x < pParam->mb_width-1; x += 2) {
                          int i;
-                         blocks += 4;
+                         blocks += 10;
                          if (bCount == 0) pMBs[x + y * pParam->mb_width].mvs[0] = zeroMV;
                          else { //extrapolation of the vector found for last frame
-Line 2217
+Line 2222
                          for (i = 0; i < 4; i++) {
                                  int dev;
                                  MACROBLOCK *pMB = &pMBs[x+(i&1) + (y+(i>>1)) * pParam->mb_width];
-                                 if (pMB->sad16 > IntraThresh) {
                                          dev = dev16(pCurrent->y + (x + (i&1) + (y + (i>>1)) * pParam->edged_width) * 16,
                                                                          pParam->edged_width);
+                                 complexity += dev;
                                          if (dev + IntraThresh < pMB->sad16) {
                                                  pMB->mode = MODE_INTRA;
                                                  if (++intra > ((pParam->mb_height-2)*(pParam->mb_width-2))/2) return I_VOP;
                                          }
-                                 }
-                                 if (pMB->mvs[0].x == 0 && pMB->mvs[0].y == 0) s++;
+                                 if (pMB->mvs[0].x == 0 && pMB->mvs[0].y == 0)
+                                         if (dev > 500 && pMB->sad16 < 1000)
+                                                 sSAD += 1000;
                                  sSAD += pMB->sad16;
                          }
                  }
          }
+         complexity >>= 7;
-         sSAD /= blocks;
+         sSAD /= complexity + 4*blocks;
-         s = (10*s) / blocks;
-         if (s > 4) sSAD += (s - 2) * (60 - 2*b_thresh); //static block - looks bad when in bframe...
+         if (intraCount > 12 && sSAD > INTRA_THRESH2 ) return I_VOP;
          if (sSAD > InterThresh ) return P_VOP;
          emms();
          return B_VOP;
-Line 2446
+Line 2453
                  Data->qpel_precision = 1;
                  CheckCandidateBits16(Data->currentQMV[0].x, Data->currentQMV[0].y, 255, &iDirection, Data);
-                 //checking if this vector is perfect. if it is, we stop.
-                 if (Data->temp[0] == 0 && Data->temp[1] == 0 && Data->temp[2] == 0 && Data->temp[3] == 0)
-                         return 0; //quick stop
                  if (MotionFlags & (HALFPELREFINE16_BITS | EXTSEARCH_BITS)) { //we have to prepare for halfpixel-precision search
                          for(i = 0; i < 5; i++) bsad[i] = Data->iMinSAD[i];
                          get_range(&Data->min_dx, &Data->max_dx, &Data->min_dy, &Data->max_dy, x, y, 16,
-Line 2462
+Line 2465
          } else { // not qpel
                  CheckCandidateBits16(Data->currentMV[0].x, Data->currentMV[0].y, 255, &iDirection, Data);
-                 //checking if this vector is perfect. if it is, we stop.
-                 if (Data->temp[0] == 0 && Data->temp[1] == 0 && Data->temp[2] == 0 && Data->temp[3] == 0) {
-                         return 0; //inter
-                 }
          }
          if (MotionFlags&EXTSEARCH_BITS) SquareSearch(Data->currentMV->x, Data->currentMV->y, Data, iDirection);
-Line 2495
+Line 2494
          return Data->iMinSAD[0];
  }
  static int
  CountMBBitsInter4v(const SearchData * const Data,
                                          MACROBLOCK * const pMB, const MACROBLOCK * const pMBs,
-Line 2537
+Line 2535
                  get_range(&Data8->min_dx, &Data8->max_dx, &Data8->min_dy, &Data8->max_dy, 2*x + (i&1), 2*y + (i>>1), 8,
                                          pParam->width, pParam->height, Data8->iFcode, Data8->qpel, 0);
-                 *Data8->iMinSAD += t;
+                 *Data8->iMinSAD += BITS_MULT*t;
                  Data8->qpel_precision = Data8->qpel;
                  // checking the vector which has been found by SAD-based 8x8 search (if it's different than the one found so far)
-Line 2615
+Line 2613
          } // /for all luma blocks
-         bits += xvid_cbpy_tab[15-(cbp>>2)].len;
+         bits += BITS_MULT*xvid_cbpy_tab[15-(cbp>>2)].len;
          // let's check chroma
          sumx = (sumx >> 3) + roundtab_76[sumx & 0xf];
-Line 2624
+Line 2622
          //chroma U
          ptr = interpolate8x8_switch2(Data->RefQ + 64, Data->RefP[4], 0, 0, sumx, sumy, Data->iEdgedWidth/2, Data->rounding);
          transfer_8to16subro(in, Data->CurU, ptr, Data->iEdgedWidth/2);
-         bits += Block_CalcBits(coeff, in, Data->iQuant, Data->quant_type, &cbp, 4, 0);
+         bits += Block_CalcBits(coeff, in, Data->dctSpace + 128, Data->iQuant, Data->quant_type, &cbp, 4);
          if (bits >= *Data->iMinSAD) return bits;
          //chroma V
          ptr = interpolate8x8_switch2(Data->RefQ + 64, Data->RefP[5], 0, 0, sumx, sumy, Data->iEdgedWidth/2, Data->rounding);
          transfer_8to16subro(in, Data->CurV, ptr, Data->iEdgedWidth/2);
-         bits += Block_CalcBits(coeff, in, Data->iQuant, Data->quant_type, &cbp, 5, 0);
+         bits += Block_CalcBits(coeff, in, Data->dctSpace + 128, Data->iQuant, Data->quant_type, &cbp, 5);
-         bits += mcbpc_inter_tab[(MODE_INTER4V & 7) | ((cbp & 3) << 3)].len;
+         bits += BITS_MULT*mcbpc_inter_tab[(MODE_INTER4V & 7) | ((cbp & 3) << 3)].len;
          return bits;
  }
  static int
  CountMBBitsIntra(const SearchData * const Data)
  {
-         int bits = 1; //this one is ac/dc prediction flag. always 1.
+         int bits = BITS_MULT*1; //this one is ac/dc prediction flag bit
-         int cbp = 0, i, t, dc = 1024, b_dc;
+         int cbp = 0, i, dc = 0;
          int16_t *in = Data->dctSpace, * coeff = Data->dctSpace + 64;
-         uint32_t iDcScaler = get_dc_scaler(Data->iQuant, 1);
          for(i = 0; i < 4; i++) {
                  int s = 8*((i&1) + (i>>1)*Data->iEdgedWidth);
                  transfer_8to16copy(in, Data->Cur + s, Data->iEdgedWidth);
-                 fdct(in);
+                 bits += Block_CalcBitsIntra(coeff, in, Data->dctSpace + 128, Data->iQuant, Data->quant_type, &cbp, i, &dc);
-                 b_dc = in[0];
-                 in[0] -= dc;
-                 dc = b_dc;
-                 if (Data->quant_type == 0) quant_intra(coeff, in, Data->iQuant, iDcScaler);
-                 else quant4_intra(coeff, in, Data->iQuant, iDcScaler);
-                 bits += t = CodeCoeffIntra_CalcBits(coeff, scan_tables[0]) + dcy_tab[coeff[0] + 255].len;
-                 Data->temp[i] = t;
-                 if (t != 0)  cbp |= 1 << (5 - i);
                  if (bits >= Data->iMinSAD[0]) return bits;
          }
-         bits += xvid_cbpy_tab[cbp>>2].len;
+         bits += BITS_MULT*xvid_cbpy_tab[cbp>>2].len;
-         iDcScaler = get_dc_scaler(Data->iQuant, 0);
          //chroma U
          transfer_8to16copy(in, Data->CurU, Data->iEdgedWidth/2);
-         fdct(in);
+         bits += Block_CalcBitsIntra(coeff, in, Data->dctSpace + 128, Data->iQuant, Data->quant_type, &cbp, 4, &dc);
-         in[0] -= 1024;
-         if (Data->quant_type == 0) quant_intra(coeff, in, Data->iQuant, iDcScaler);
-         else quant4_intra(coeff, in, Data->iQuant, iDcScaler);
-         bits += t = CodeCoeffIntra_CalcBits(coeff, scan_tables[0]) + dcc_tab[coeff[0] + 255].len;
-         if (t != 0) cbp |= 1 << (5 - 4);
          if (bits >= Data->iMinSAD[0]) return bits;
          //chroma V
          transfer_8to16copy(in, Data->CurV, Data->iEdgedWidth/2);
-         fdct(in);
+         bits += Block_CalcBitsIntra(coeff, in, Data->dctSpace + 128, Data->iQuant, Data->quant_type, &cbp, 5, &dc);
-         in[0] -= 1024;
-         if (Data->quant_type == 0) quant_intra(coeff, in, Data->iQuant, iDcScaler);
-         else quant4_intra(coeff, in, Data->iQuant, iDcScaler);
-         bits += t = CodeCoeffIntra_CalcBits(coeff, scan_tables[0]) + dcc_tab[coeff[0] + 255].len;
-         if (t != 0) cbp |= 1 << (5 - 5);
-         bits += mcbpc_inter_tab[(MODE_INTRA & 7) | ((cbp & 3) << 3)].len;
+         bits += BITS_MULT*mcbpc_inter_tab[(MODE_INTRA & 7) | ((cbp & 3) << 3)].len;
          return bits;
  }

 Legend:
-Removed from v.1.69
 changed lines
+Added in v.1.72

No admin address has been configured	ViewVC Help
Powered by ViewVC 1.0.4