Diff of /xvidcore/src/image/postprocessing.c

-revision 1.1.2.1, Sat May  3 23:26:55 2003 UTC
+revision 1.1.4.1, Wed Dec 10 01:02:40 2003 UTC
 Line 1
+ /*****************************************************************************
+  *
+  *  XVID MPEG-4 VIDEO CODEC
+  *  - Postprocessing  functions -
+  *
+  *  Copyright(C) 2003 Michael Militzer <isibaar@xvid.org>
+  *
+  *  This program is free software ; you can redistribute it and/or modify
+  *  it under the terms of the GNU General Public License as published by
+  *  the Free Software Foundation ; either version 2 of the License, or
+  *  (at your option) any later version.
+  *
+  *  This program is distributed in the hope that it will be useful,
+  *  but WITHOUT ANY WARRANTY ; without even the implied warranty of
+  *  MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
+  *  GNU General Public License for more details.
+  *
+  *  You should have received a copy of the GNU General Public License
+  *  along with this program ; if not, write to the Free Software
+  *  Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA  02111-1307 USA
+  *
+  ****************************************************************************/
  #include <stdlib.h>
  #include <string.h>
  #include <math.h>
-Line 7
+Line 30
  #include "image.h"
  #include "postprocessing.h"
+ /* Filtering thresholds */
+ #define THR1 2
+ #define THR2 6
+ /* Some useful (and fast) macros
+    Note that the MIN/MAX macros assume signed shift - if your compiler
+    doesn't do signed shifts, use the default MIN/MAX macros from global.h */
+ #define FAST_MAX(x,y) ((x) - ((((x) - (y))>>(32 - 1)) & ((x) - (y))))
+ #define FAST_MIN(x,y) ((x) + ((((y) - (x))>>(32 - 1)) & ((y) - (x))))
+ #define FAST_ABS(x) ((((int)(x)) >> 31) ^ ((int)(x))) - (((int)(x)) >> 31)
+ #define ABS(X)    (((X)>0)?(X):-(X))
+ static int8_t xvid_thresh_tbl[510];
+ static int8_t xvid_abs_tbl[510];
+ void init_postproc(void)
+ {
+         int i;
+         for(i = -255; i < 256; i++) {
+                 xvid_thresh_tbl[i + 255] = 0;
+                 if(ABS(i) < THR1)
+                         xvid_thresh_tbl[i + 255] = 1;
+                 xvid_abs_tbl[i + 255] = ABS(i);
+         }
+ }
  void
  image_deblock(IMAGE * img, int edged_width,
                                  const MACROBLOCK * mbs, int mb_width, int mb_height, int mb_stride,
-Line 17
+Line 69
          int quant;
          /* luma: j,i in block units */
-         if ((flags & XVID_DEC_DEBLOCKY))
+         if ((flags & XVID_DEBLOCKY))
          {
                  for (j = 1; j < mb_height*2; j++)               /* horizontal deblocking */
                  for (i = 0; i < mb_width*2; i++)
-Line 36
+Line 88
          /* chroma */
-         if ((flags & XVID_DEC_DEBLOCKUV))
+         if ((flags & XVID_DEBLOCKUV))
          {
                  for (j = 1; j < mb_height; j++)         /* horizontal deblocking */
                  for (i = 0; i < mb_width; i++)
-Line 56
+Line 108
          }
  }
- #define THR1 2
+ #define LOAD_DATA_HOR(x) \
- #define THR2 6
+                 /* Load pixel addresses and data for filtering */ \
+             s[0] = *(v[0] = img - 5*stride + x); \
+                 s[1] = *(v[1] = img - 4*stride + x); \
+                 s[2] = *(v[2] = img - 3*stride + x); \
+                 s[3] = *(v[3] = img - 2*stride + x); \
+                 s[4] = *(v[4] = img - 1*stride + x); \
+                 s[5] = *(v[5] = img + 0*stride + x); \
+                 s[6] = *(v[6] = img + 1*stride + x); \
+                 s[7] = *(v[7] = img + 2*stride + x); \
+                 s[8] = *(v[8] = img + 3*stride + x); \
+                 s[9] = *(v[9] = img + 4*stride + x);
+ #define LOAD_DATA_VER(x) \
+                 /* Load pixel addresses and data for filtering */ \
+                 s[0] = *(v[0] = img + x*stride - 5); \
+                 s[1] = *(v[1] = img + x*stride - 4); \
+                 s[2] = *(v[2] = img + x*stride - 3); \
+                 s[3] = *(v[3] = img + x*stride - 2); \
+                 s[4] = *(v[4] = img + x*stride - 1); \
+                 s[5] = *(v[5] = img + x*stride + 0); \
+                 s[6] = *(v[6] = img + x*stride + 1); \
+                 s[7] = *(v[7] = img + x*stride + 2); \
+                 s[8] = *(v[8] = img + x*stride + 3); \
+                 s[9] = *(v[9] = img + x*stride + 4);
+ #define APPLY_FILTER_CORE \
+                 /* First, decide whether to use default or DC-offset mode */ \
+                 \
+                 eq_cnt = 0; \
+                 \
+                 eq_cnt += xvid_thresh_tbl[s[0] - s[1] + 255]; \
+                 eq_cnt += xvid_thresh_tbl[s[1] - s[2] + 255]; \
+                 eq_cnt += xvid_thresh_tbl[s[2] - s[3] + 255]; \
+                 eq_cnt += xvid_thresh_tbl[s[3] - s[4] + 255]; \
+                 eq_cnt += xvid_thresh_tbl[s[4] - s[5] + 255]; \
+                 eq_cnt += xvid_thresh_tbl[s[5] - s[6] + 255]; \
+                 eq_cnt += xvid_thresh_tbl[s[6] - s[7] + 255]; \
+                 eq_cnt += xvid_thresh_tbl[s[7] - s[8] + 255]; \
+                 \
+                 if(eq_cnt < THR2) { /* Default mode */  \
+                         int a30, a31, a32;                                      \
+                         int diff, limit;                                        \
+                                                                                                 \
+                         a30 = ((s[3]<<1) - s[4] * 5 + s[5] * 5 - (s[6]<<1));    \
+                                                                                                                                         \
+                         if(xvid_abs_tbl[a30 + 255] < 8*quant) {                                                         \
+                                 a31 = ((s[1]<<1) - s[2] * 5 + s[3] * 5 - (s[4]<<1));    \
+                                 a32 = ((s[5]<<1) - s[6] * 5 + s[7] * 5 - (s[8]<<1));    \
+                                                                                                                                                 \
+                                 diff = (5 * ((SIGN(a30) * MIN(xvid_abs_tbl[a30 + 255], MIN(xvid_abs_tbl[a31 + 255], xvid_abs_tbl[a32 + 255]))) - a30) + 32) >> 6;       \
+                                 limit = (s[4] - s[5]) / 2;      \
+                                 \
+                                 if (limit > 0)                          \
+                                         diff = (diff < 0) ? 0 : ((diff > limit) ? limit : diff);        \
+                                 else    \
+                                         diff = (diff > 0) ? 0 : ((diff < limit) ? limit : diff);        \
+                                                                                                                                                                 \
+                                 *v[4] -= diff;  \
+                                 *v[5] += diff;  \
+                         }       \
+                 }       \
+                 else {  /* DC-offset mode */    \
+                         uint8_t p0, p9; \
+                         int min, max;   \
+                                                         \
+                         /* Now decide whether to apply smoothing filter or not */       \
+                         max = FAST_MAX(s[1], FAST_MAX(s[2], FAST_MAX(s[3], FAST_MAX(s[4], FAST_MAX(s[5], FAST_MAX(s[6], FAST_MAX(s[7], s[8])))))));     \
+                         min = FAST_MIN(s[1], FAST_MIN(s[2], FAST_MIN(s[3], FAST_MIN(s[4], FAST_MIN(s[5], FAST_MIN(s[6], FAST_MIN(s[7], s[8])))))));     \
+                         \
+                         if(((max-min)) < 2*quant) {     \
+                                                                                 \
+                                 /* Choose edge pixels */        \
+                                 p0 = (xvid_abs_tbl[(s[1] - s[0]) + 255] < quant) ? s[0] : s[1]; \
+                                 p9 = (xvid_abs_tbl[(s[8] - s[9]) + 255] < quant) ? s[9] : s[8]; \
+                                                                                                                                 \
+                                 *v[1] = (uint8_t) ((6*p0 + (s[1]<<2) + (s[2]<<1) + (s[3]<<1) + s[4] + s[5] + 8) >> 4);  \
+                                 *v[2] = (uint8_t) (((p0<<2) + (s[1]<<1) + (s[2]<<2) + (s[3]<<1) + (s[4]<<1) + s[5] + s[6] + 8) >> 4);   \
+                                 *v[3] = (uint8_t) (((p0<<1) + (s[1]<<1) + (s[2]<<1) + (s[3]<<2) + (s[4]<<1) + (s[5]<<1) + s[6] + s[7] + 8) >> 4);       \
+                                 *v[4] = (uint8_t) ((p0 + s[1] + (s[2]<<1) + (s[3]<<1) + (s[4]<<2) + (s[5]<<1) + (s[6]<<1) + s[7] + s[8] + 8) >> 4);     \
+                                 *v[5] = (uint8_t) ((s[1] + s[2] + (s[3]<<1) + (s[4]<<1) + (s[5]<<2) + (s[6]<<1) + (s[7]<<1) + s[8] + p9 + 8) >> 4);     \
+                                 *v[6] = (uint8_t) ((s[2] + s[3] + (s[4]<<1) + (s[5]<<1) + (s[6]<<2) + (s[7]<<1) + (s[8]<<1) + (p9<<1) + 8) >> 4);       \
+                                 *v[7] = (uint8_t) ((s[3] + s[4] + (s[5]<<1) + (s[6]<<1) + (s[7]<<2) + (s[8]<<1) + (p9<<2) + 8) >> 4);   \
+                                 *v[8] = (uint8_t) ((s[4] + s[5] + (s[6]<<1) + (s[7]<<1) + (s[8]<<2) + 6*p9 + 8) >> 4);  \
+                         }       \
+                 }
  void deblock8x8_h(uint8_t *img, int stride, int quant)
  {
-         int i, j;
          int eq_cnt;
-         uint8_t *v[10], p0, p9;
+         uint8_t *v[10];
-         int min, max;
+         int32_t s[10];
-         int a30, a31, a32;
-         int diff, limit;
-         for(j = 0; j < 8; j++) {
-                 eq_cnt = 0;
-                 /* Load pixel addresses for filtering */
-                 for(i = 0; i < 10; i++)
-                         v[i] = img + (i-5)*stride + j;
-                 /* First, decide whether to use default or DC-offset mode */
-                 for(i = 0; i < 9; i++)
-                 {
-                         if(ABS(*v[i] - *v[(i+1)]) < THR1)
-                                 eq_cnt++;
-                 }
-                 if(eq_cnt < THR2) { /* Default mode */
-                         a30 = (*v[3] * 2 - *v[4] * 5 + *v[5] * 5 - *v[6] * 2);
-                         if(ABS(a30) < 8*quant) {
+         LOAD_DATA_HOR(0)
-                                 a31 = (*v[1] * 2 - *v[2] * 5 + *v[3] * 5 - *v[4] * 2);
+         APPLY_FILTER_CORE
-                                 a32 = (*v[5] * 2 - *v[6] * 5 + *v[7] * 5 - *v[8] * 2);
-                                 diff = (5 * ((SIGN(a30) * MIN(ABS(a30), MIN(ABS(a31), ABS(a32)))) - a30) + 32) >> 6;
+         LOAD_DATA_HOR(1)
-                                 limit = (*v[4] - *v[5]) / 2;
+         APPLY_FILTER_CORE
-                                 if (limit > 0)
+         LOAD_DATA_HOR(2)
-                                         diff = (diff < 0) ? 0 : ((diff > limit) ? limit : diff);
+         APPLY_FILTER_CORE
-                                 else
-                                         diff = (diff > 0) ? 0 : ((diff < limit) ? limit : diff);
-                                 *v[4] -= diff;
+         LOAD_DATA_HOR(3)
-                                 *v[5] += diff;
+         APPLY_FILTER_CORE
-                         }
-                 }
-                 else {  /* DC-offset mode */
-                         /* Now decide whether to apply smoothing filter or not */
+         LOAD_DATA_HOR(4)
-                         max = MAX(*v[1], MAX(*v[2], MAX(*v[3], MAX(*v[4], MAX(*v[5], MAX(*v[6], MAX(*v[7], *v[8])))))));
+         APPLY_FILTER_CORE
-                         min = MIN(*v[1], MIN(*v[2], MIN(*v[3], MIN(*v[4], MIN(*v[5], MIN(*v[6], MIN(*v[7], *v[8])))))));
-                         if((max-min) < 2*quant) {
+         LOAD_DATA_HOR(5)
+         APPLY_FILTER_CORE
-                                 /* Choose edge pixels */
+         LOAD_DATA_HOR(6)
-                                 p0 = (ABS(*v[1]-*v[0]) < quant) ? *v[0] : *v[1];
+         APPLY_FILTER_CORE
-                                 p9 = (ABS(*v[8]-*v[9]) < quant) ? *v[9] : *v[8];
-                                 *v[1] = (6*p0 + (*v[1]<<2) + (*v[2]<<1) + (*v[3]<<1) + *v[4] + *v[5] + 8) >> 4;
+         LOAD_DATA_HOR(7)
-                                 *v[2] = ((p0<<2) + (*v[1]<<1) + (*v[2]<<2) + (*v[3]<<1) + (*v[4]<<1) + *v[5] + *v[6] + 8) >> 4;
+         APPLY_FILTER_CORE
-                                 *v[3] = ((p0<<1) + (*v[1]<<1) + (*v[2]<<1) + (*v[3]<<2) + (*v[4]<<1) + (*v[5]<<1) + *v[6] + *v[7] + 8) >> 4;
-                                 *v[4] = (p0 + *v[1] + (*v[2]<<1) + (*v[3]<<1) + (*v[4]<<2) + (*v[5]<<1) + (*v[6]<<1) + *v[7] + *v[8] + 8) >> 4;
-                                 *v[5] = (*v[1] + *v[2] + (*v[3]<<1) + (*v[4]<<1) + (*v[5]<<2) + (*v[6]<<1) + (*v[7]<<1) + *v[8] + p9 + 8) >> 4;
-                                 *v[6] = (*v[2] + *v[3] + (*v[4]<<1) + (*v[5]<<1) + (*v[6]<<2) + (*v[7]<<1) + (*v[8]<<1) + (p9<<1) + 8) >> 4;
-                                 *v[7] = (*v[3] + *v[4] + (*v[5]<<1) + (*v[6]<<1) + (*v[7]<<2) + (*v[8]<<1) + (p9<<2) + 8) >> 4;
-                                 *v[8] = (*v[4] + *v[5] + (*v[6]<<1) + (*v[7]<<1) + (*v[8]<<2) + 6*p9 + 8) >> 4;
-                         }
                  }
-         }
- }
  void deblock8x8_v(uint8_t *img, int stride, int quant)
  {
-         int i, j;
          int eq_cnt;
-         uint8_t *v[10], p0, p9;
+         uint8_t *v[10];
-         int min, max;
+         int s[10];
-         int a30, a31, a32;
-         int diff, limit;
-         for(j = 0; j < 8; j++) {
-                 eq_cnt = 0;
-                 /* Load pixel addresses for filtering */
-                 for(i = 0; i < 10; i++)
+         LOAD_DATA_VER(0)
-                         v[i] = img + j*stride + (i-5);
+         APPLY_FILTER_CORE
-                 /* First, decide whether to use default or DC-offset mode */
+         LOAD_DATA_VER(1)
+         APPLY_FILTER_CORE
-                 for(i = 0; i < 9; i++)
+         LOAD_DATA_VER(2)
-                 {
+         APPLY_FILTER_CORE
-                         if(ABS(*v[i] - *v[i+1]) < THR1)
-                                 eq_cnt++;
-                 }
-                 if(eq_cnt < THR2) { /* Default mode */
+         LOAD_DATA_VER(3)
+         APPLY_FILTER_CORE
-                         a30 = (*v[3] * 2 - *v[4] * 5 + *v[5] * 5 - *v[6] * 2);
+         LOAD_DATA_VER(4)
+         APPLY_FILTER_CORE
-                         if(ABS(a30) < 8*quant) {
+         LOAD_DATA_VER(5)
-                                 a31 = (*v[1] * 2 - *v[2] * 5 + *v[3] * 5 - *v[4] * 2);
+         APPLY_FILTER_CORE
-                                 a32 = (*v[5] * 2 - *v[6] * 5 + *v[7] * 5 - *v[8] * 2);
-                                 diff = (5 * ((SIGN(a30) * MIN(ABS(a30), MIN(ABS(a31), ABS(a32)))) - a30) + 32) >> 6;
+         LOAD_DATA_VER(6)
-                                 limit = (*v[4] - *v[5]) / 2;
+         APPLY_FILTER_CORE
-                                 if (limit > 0)
+         LOAD_DATA_VER(7)
-                                         diff = (diff < 0) ? 0 : ((diff > limit) ? limit : diff);
+         APPLY_FILTER_CORE
-                                 else
-                                         diff = (diff > 0) ? 0 : ((diff < limit) ? limit : diff);
-                                 *v[4] -= diff;
-                                 *v[5] += diff;
-                         }
-                 }
-                 else {  /* DC-offset mode */
-                         /* Now decide whether to apply smoothing filter or not */
-                         max = MAX(*v[1], MAX(*v[2], MAX(*v[3], MAX(*v[4], MAX(*v[5], MAX(*v[6], MAX(*v[7], *v[8])))))));
-                         min = MIN(*v[1], MIN(*v[2], MIN(*v[3], MIN(*v[4], MIN(*v[5], MIN(*v[6], MIN(*v[7], *v[8])))))));
-                         if((max-min) < 2*quant) {
-                                 /* Choose edge pixels */
-                                 p0 = (ABS(*v[1]-*v[0]) < quant) ? *v[0] : *v[1];
-                                 p9 = (ABS(*v[8]-*v[9]) < quant) ? *v[9] : *v[8];
-                                 *v[1] = (6*p0 + (*v[1]<<2) + (*v[2]<<1) + (*v[3]<<1) + *v[4] + *v[5] + 8) >> 4;
-                                 *v[2] = ((p0<<2) + (*v[1]<<1) + (*v[2]<<2) + (*v[3]<<1) + (*v[4]<<1) + *v[5] + *v[6] + 8) >> 4;
-                                 *v[3] = ((p0<<1) + (*v[1]<<1) + (*v[2]<<1) + (*v[3]<<2) + (*v[4]<<1) + (*v[5]<<1) + *v[6] + *v[7] + 8) >> 4;
-                                 *v[4] = (p0 + *v[1] + (*v[2]<<1) + (*v[3]<<1) + (*v[4]<<2) + (*v[5]<<1) + (*v[6]<<1) + *v[7] + *v[8] + 8) >> 4;
-                                 *v[5] = (*v[1] + *v[2] + (*v[3]<<1) + (*v[4]<<1) + (*v[5]<<2) + (*v[6]<<1) + (*v[7]<<1) + *v[8] + p9 + 8) >> 4;
-                                 *v[6] = (*v[2] + *v[3] + (*v[4]<<1) + (*v[5]<<1) + (*v[6]<<2) + (*v[7]<<1) + (*v[8]<<1) + (p9<<1) + 8) >> 4;
-                                 *v[7] = (*v[3] + *v[4] + (*v[5]<<1) + (*v[6]<<1) + (*v[7]<<2) + (*v[8]<<1) + (p9<<2) + 8) >> 4;
-                                 *v[8] = (*v[4] + *v[5] + (*v[6]<<1) + (*v[7]<<1) + (*v[8]<<2) + 6*p9 + 8) >> 4;
-                         }
-                 }
-         }
  }

 Legend:



Removed from v.1.1.2.1
 


changed lines


 
Added in v.1.1.4.1
 Legend:



Removed from v.1.1.2.1
 


changed lines


 
Added in v.1.1.4.1
-Removed from v.1.1.2.1
+Added in v.1.1.4.1

No admin address has been configured	ViewVC Help
Powered by ViewVC 1.0.4