1 |
/***************************************************************************** |
/************************************************************************** |
2 |
* |
* |
3 |
* XVID MPEG-4 VIDEO CODEC |
* XVID MPEG-4 VIDEO CODEC |
4 |
* - image module - |
* - Image management functions - |
5 |
* |
* |
6 |
* Copyright(C) 2002 Peter Ross <pross@xvid.org> |
* Copyright(C) 2001-2004 Peter Ross <pross@xvid.org> |
|
* |
|
|
* This program is an implementation of a part of one or more MPEG-4 |
|
|
* Video tools as specified in ISO/IEC 14496-2 standard. Those intending |
|
|
* to use this software module in hardware or software products are |
|
|
* advised that its use may infringe existing patents or copyrights, and |
|
|
* any such use would be at such party's own risk. The original |
|
|
* developer of this software module and his/her company, and subsequent |
|
|
* editors and their companies, will have no liability for use of this |
|
|
* software or modifications or derivatives thereof. |
|
7 |
* |
* |
8 |
* This program is free software; you can redistribute it and/or modify |
* This program is free software; you can redistribute it and/or modify |
9 |
* it under the terms of the GNU General Public License as published by |
* it under the terms of the GNU General Public License as published by |
19 |
* along with this program; if not, write to the Free Software |
* along with this program; if not, write to the Free Software |
20 |
* Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA 02111-1307 USA |
* Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA 02111-1307 USA |
21 |
* |
* |
22 |
|
* $Id$ |
23 |
|
* |
24 |
****************************************************************************/ |
****************************************************************************/ |
25 |
|
|
26 |
#include <stdlib.h> |
#include <stdlib.h> |
27 |
#include <string.h> // memcpy, memset |
#include <string.h> /* memcpy, memset */ |
28 |
#include <math.h> |
#include <math.h> |
|
|
|
29 |
#include "../portab.h" |
#include "../portab.h" |
30 |
#include "../xvid.h" // XVID_CSP_XXX's |
#include "../global.h" /* XVID_CSP_XXX's */ |
31 |
|
#include "../xvid.h" /* XVID_CSP_XXX's */ |
32 |
#include "image.h" |
#include "image.h" |
33 |
#include "colorspace.h" |
#include "colorspace.h" |
34 |
#include "interpolate8x8.h" |
#include "interpolate8x8.h" |
|
#include "../divx4.h" |
|
35 |
#include "../utils/mem_align.h" |
#include "../utils/mem_align.h" |
36 |
|
#include "../motion/sad.h" |
37 |
|
#include "../utils/emms.h" |
38 |
|
|
39 |
|
#include "font.h" /* XXX: remove later */ |
40 |
|
|
41 |
#define SAFETY 64 |
#define SAFETY 64 |
42 |
#define EDGE_SIZE2 (EDGE_SIZE/2) |
#define EDGE_SIZE2 (EDGE_SIZE/2) |
49 |
{ |
{ |
50 |
const uint32_t edged_width2 = edged_width / 2; |
const uint32_t edged_width2 = edged_width / 2; |
51 |
const uint32_t edged_height2 = edged_height / 2; |
const uint32_t edged_height2 = edged_height / 2; |
|
uint32_t i; |
|
52 |
|
|
53 |
image->y = |
image->y = |
54 |
xvid_malloc(edged_width * (edged_height + 1) + SAFETY, CACHE_LINE); |
xvid_malloc(edged_width * (edged_height + 1) + SAFETY, CACHE_LINE); |
55 |
if (image->y == NULL) { |
if (image->y == NULL) { |
56 |
return -1; |
return -1; |
57 |
} |
} |
58 |
|
memset(image->y, 0, edged_width * (edged_height + 1) + SAFETY); |
|
for (i = 0; i < edged_width * edged_height + SAFETY; i++) { |
|
|
image->y[i] = 0; |
|
|
} |
|
59 |
|
|
60 |
image->u = xvid_malloc(edged_width2 * edged_height2 + SAFETY, CACHE_LINE); |
image->u = xvid_malloc(edged_width2 * edged_height2 + SAFETY, CACHE_LINE); |
61 |
if (image->u == NULL) { |
if (image->u == NULL) { |
62 |
xvid_free(image->y); |
xvid_free(image->y); |
63 |
|
image->y = NULL; |
64 |
return -1; |
return -1; |
65 |
} |
} |
66 |
|
memset(image->u, 0, edged_width2 * edged_height2 + SAFETY); |
67 |
|
|
68 |
image->v = xvid_malloc(edged_width2 * edged_height2 + SAFETY, CACHE_LINE); |
image->v = xvid_malloc(edged_width2 * edged_height2 + SAFETY, CACHE_LINE); |
69 |
if (image->v == NULL) { |
if (image->v == NULL) { |
70 |
xvid_free(image->u); |
xvid_free(image->u); |
71 |
|
image->u = NULL; |
72 |
xvid_free(image->y); |
xvid_free(image->y); |
73 |
|
image->y = NULL; |
74 |
return -1; |
return -1; |
75 |
} |
} |
76 |
|
memset(image->v, 0, edged_width2 * edged_height2 + SAFETY); |
77 |
|
|
78 |
image->y += EDGE_SIZE * edged_width + EDGE_SIZE; |
image->y += EDGE_SIZE * edged_width + EDGE_SIZE; |
79 |
image->u += EDGE_SIZE2 * edged_width2 + EDGE_SIZE2; |
image->u += EDGE_SIZE2 * edged_width2 + EDGE_SIZE2; |
93 |
|
|
94 |
if (image->y) { |
if (image->y) { |
95 |
xvid_free(image->y - (EDGE_SIZE * edged_width + EDGE_SIZE)); |
xvid_free(image->y - (EDGE_SIZE * edged_width + EDGE_SIZE)); |
96 |
|
image->y = NULL; |
97 |
} |
} |
98 |
if (image->u) { |
if (image->u) { |
99 |
xvid_free(image->u - (EDGE_SIZE2 * edged_width2 + EDGE_SIZE2)); |
xvid_free(image->u - (EDGE_SIZE2 * edged_width2 + EDGE_SIZE2)); |
100 |
|
image->u = NULL; |
101 |
} |
} |
102 |
if (image->v) { |
if (image->v) { |
103 |
xvid_free(image->v - (EDGE_SIZE2 * edged_width2 + EDGE_SIZE2)); |
xvid_free(image->v - (EDGE_SIZE2 * edged_width2 + EDGE_SIZE2)); |
104 |
|
image->v = NULL; |
105 |
} |
} |
106 |
} |
} |
107 |
|
|
110 |
image_swap(IMAGE * image1, |
image_swap(IMAGE * image1, |
111 |
IMAGE * image2) |
IMAGE * image2) |
112 |
{ |
{ |
113 |
uint8_t *tmp; |
SWAP(uint8_t*, image1->y, image2->y); |
114 |
|
SWAP(uint8_t*, image1->u, image2->u); |
115 |
tmp = image1->y; |
SWAP(uint8_t*, image1->v, image2->v); |
|
image1->y = image2->y; |
|
|
image2->y = tmp; |
|
|
|
|
|
tmp = image1->u; |
|
|
image1->u = image2->u; |
|
|
image2->u = tmp; |
|
|
|
|
|
tmp = image1->v; |
|
|
image1->v = image2->v; |
|
|
image2->v = tmp; |
|
116 |
} |
} |
117 |
|
|
118 |
|
|
127 |
memcpy(image1->v, image2->v, edged_width * height / 4); |
memcpy(image1->v, image2->v, edged_width * height / 4); |
128 |
} |
} |
129 |
|
|
130 |
|
/* setedges bug was fixed in this BS version */ |
131 |
|
#define SETEDGES_BUG_BEFORE 18 |
132 |
|
|
133 |
void |
void |
134 |
image_setedges(IMAGE * image, |
image_setedges(IMAGE * image, |
135 |
uint32_t edged_width, |
uint32_t edged_width, |
136 |
uint32_t edged_height, |
uint32_t edged_height, |
137 |
uint32_t width, |
uint32_t width, |
138 |
uint32_t height) |
uint32_t height, |
139 |
|
int bs_version) |
140 |
{ |
{ |
141 |
const uint32_t edged_width2 = edged_width / 2; |
const uint32_t edged_width2 = edged_width / 2; |
142 |
const uint32_t width2 = width / 2; |
uint32_t width2; |
143 |
uint32_t i; |
uint32_t i; |
144 |
uint8_t *dst; |
uint8_t *dst; |
145 |
uint8_t *src; |
uint8_t *src; |
146 |
|
|
|
|
|
147 |
dst = image->y - (EDGE_SIZE + EDGE_SIZE * edged_width); |
dst = image->y - (EDGE_SIZE + EDGE_SIZE * edged_width); |
148 |
src = image->y; |
src = image->y; |
149 |
|
|
150 |
|
/* According to the Standard Clause 7.6.4, padding is done starting at 16 |
151 |
|
* pixel width and height multiples. This was not respected in old xvids */ |
152 |
|
if (bs_version == 0 || bs_version >= SETEDGES_BUG_BEFORE) { |
153 |
|
width = (width+15)&~15; |
154 |
|
height = (height+15)&~15; |
155 |
|
} |
156 |
|
|
157 |
|
width2 = width/2; |
158 |
|
|
159 |
for (i = 0; i < EDGE_SIZE; i++) { |
for (i = 0; i < EDGE_SIZE; i++) { |
160 |
memset(dst, *src, EDGE_SIZE); |
memset(dst, *src, EDGE_SIZE); |
161 |
memcpy(dst + EDGE_SIZE, src, width); |
memcpy(dst + EDGE_SIZE, src, width); |
181 |
} |
} |
182 |
|
|
183 |
|
|
184 |
//U |
/* U */ |
185 |
dst = image->u - (EDGE_SIZE2 + EDGE_SIZE2 * edged_width2); |
dst = image->u - (EDGE_SIZE2 + EDGE_SIZE2 * edged_width2); |
186 |
src = image->u; |
src = image->u; |
187 |
|
|
209 |
} |
} |
210 |
|
|
211 |
|
|
212 |
// V |
/* V */ |
213 |
dst = image->v - (EDGE_SIZE2 + EDGE_SIZE2 * edged_width2); |
dst = image->v - (EDGE_SIZE2 + EDGE_SIZE2 * edged_width2); |
214 |
src = image->v; |
src = image->v; |
215 |
|
|
237 |
} |
} |
238 |
} |
} |
239 |
|
|
|
// bframe encoding requires image-based u,v interpolation |
|
240 |
void |
void |
241 |
image_interpolate(const IMAGE * refn, |
image_interpolate(const uint8_t * refn, |
242 |
IMAGE * refh, |
uint8_t * refh, |
243 |
IMAGE * refv, |
uint8_t * refv, |
244 |
IMAGE * refhv, |
uint8_t * refhv, |
245 |
uint32_t edged_width, |
uint32_t edged_width, |
246 |
uint32_t edged_height, |
uint32_t edged_height, |
247 |
|
uint32_t quarterpel, |
248 |
uint32_t rounding) |
uint32_t rounding) |
249 |
{ |
{ |
250 |
const uint32_t offset = EDGE_SIZE * (edged_width + 1); |
const uint32_t offset = EDGE_SIZE2 * (edged_width + 1); /* we only interpolate half of the edge area */ |
251 |
const uint32_t stride_add = 7 * edged_width; |
const uint32_t stride_add = 7 * edged_width; |
252 |
|
|
253 |
uint8_t *n_ptr, *h_ptr, *v_ptr, *hv_ptr; |
uint8_t *n_ptr; |
254 |
|
uint8_t *h_ptr, *v_ptr, *hv_ptr; |
255 |
uint32_t x, y; |
uint32_t x, y; |
256 |
|
|
257 |
|
n_ptr = (uint8_t*)refn; |
258 |
n_ptr = refn->y; |
h_ptr = refh; |
259 |
h_ptr = refh->y; |
v_ptr = refv; |
|
v_ptr = refv->y; |
|
|
hv_ptr = refhv->y; |
|
260 |
|
|
261 |
n_ptr -= offset; |
n_ptr -= offset; |
262 |
h_ptr -= offset; |
h_ptr -= offset; |
263 |
v_ptr -= offset; |
v_ptr -= offset; |
264 |
|
|
265 |
|
/* Note we initialize the hv pointer later, as we can optimize code a bit |
266 |
|
* doing it down to up in quarterpel and up to down in halfpel */ |
267 |
|
if(quarterpel) { |
268 |
|
|
269 |
|
for (y = 0; y < (edged_height - EDGE_SIZE); y += 8) { |
270 |
|
for (x = 0; x < (edged_width - EDGE_SIZE); x += 8) { |
271 |
|
interpolate8x8_6tap_lowpass_h(h_ptr, n_ptr, edged_width, rounding); |
272 |
|
interpolate8x8_6tap_lowpass_v(v_ptr, n_ptr, edged_width, rounding); |
273 |
|
|
274 |
|
n_ptr += 8; |
275 |
|
h_ptr += 8; |
276 |
|
v_ptr += 8; |
277 |
|
} |
278 |
|
|
279 |
|
n_ptr += EDGE_SIZE; |
280 |
|
h_ptr += EDGE_SIZE; |
281 |
|
v_ptr += EDGE_SIZE; |
282 |
|
|
283 |
|
h_ptr += stride_add; |
284 |
|
v_ptr += stride_add; |
285 |
|
n_ptr += stride_add; |
286 |
|
} |
287 |
|
|
288 |
|
h_ptr = refh + (edged_height - EDGE_SIZE - EDGE_SIZE2)*edged_width - EDGE_SIZE2; |
289 |
|
hv_ptr = refhv + (edged_height - EDGE_SIZE - EDGE_SIZE2)*edged_width - EDGE_SIZE2; |
290 |
|
|
291 |
|
for (y = 0; y < (edged_height - EDGE_SIZE); y = y + 8) { |
292 |
|
hv_ptr -= stride_add; |
293 |
|
h_ptr -= stride_add; |
294 |
|
hv_ptr -= EDGE_SIZE; |
295 |
|
h_ptr -= EDGE_SIZE; |
296 |
|
|
297 |
|
for (x = 0; x < (edged_width - EDGE_SIZE); x = x + 8) { |
298 |
|
hv_ptr -= 8; |
299 |
|
h_ptr -= 8; |
300 |
|
interpolate8x8_6tap_lowpass_v(hv_ptr, h_ptr, edged_width, rounding); |
301 |
|
} |
302 |
|
} |
303 |
|
} else { |
304 |
|
|
305 |
|
hv_ptr = refhv; |
306 |
hv_ptr -= offset; |
hv_ptr -= offset; |
307 |
|
|
308 |
for (y = 0; y < edged_height; y = y + 8) { |
for (y = 0; y < (edged_height - EDGE_SIZE); y += 8) { |
309 |
for (x = 0; x < edged_width; x = x + 8) { |
for (x = 0; x < (edged_width - EDGE_SIZE); x += 8) { |
310 |
interpolate8x8_halfpel_h(h_ptr, n_ptr, edged_width, rounding); |
interpolate8x8_halfpel_h(h_ptr, n_ptr, edged_width, rounding); |
311 |
interpolate8x8_halfpel_v(v_ptr, n_ptr, edged_width, rounding); |
interpolate8x8_halfpel_v(v_ptr, n_ptr, edged_width, rounding); |
312 |
interpolate8x8_halfpel_hv(hv_ptr, n_ptr, edged_width, rounding); |
interpolate8x8_halfpel_hv(hv_ptr, n_ptr, edged_width, rounding); |
316 |
v_ptr += 8; |
v_ptr += 8; |
317 |
hv_ptr += 8; |
hv_ptr += 8; |
318 |
} |
} |
319 |
|
|
320 |
|
h_ptr += EDGE_SIZE; |
321 |
|
v_ptr += EDGE_SIZE; |
322 |
|
hv_ptr += EDGE_SIZE; |
323 |
|
n_ptr += EDGE_SIZE; |
324 |
|
|
325 |
h_ptr += stride_add; |
h_ptr += stride_add; |
326 |
v_ptr += stride_add; |
v_ptr += stride_add; |
327 |
hv_ptr += stride_add; |
hv_ptr += stride_add; |
328 |
n_ptr += stride_add; |
n_ptr += stride_add; |
329 |
} |
} |
330 |
|
} |
331 |
|
} |
332 |
|
|
333 |
|
|
334 |
/* |
/* |
335 |
interpolate_halfpel_h( |
chroma optimize filter, invented by mf |
336 |
refh->y - offset, |
a chroma pixel is average from the surrounding pixels, when the |
337 |
refn->y - offset, |
correpsonding luma pixels are pure black or white. |
|
edged_width, edged_height, |
|
|
rounding); |
|
|
|
|
|
interpolate_halfpel_v( |
|
|
refv->y - offset, |
|
|
refn->y - offset, |
|
|
edged_width, edged_height, |
|
|
rounding); |
|
|
|
|
|
interpolate_halfpel_hv( |
|
|
refhv->y - offset, |
|
|
refn->y - offset, |
|
|
edged_width, edged_height, |
|
|
rounding); |
|
338 |
*/ |
*/ |
339 |
|
|
340 |
/* uv-image-based compensation |
void |
341 |
offset = EDGE_SIZE2 * (edged_width / 2 + 1); |
image_chroma_optimize(IMAGE * img, int width, int height, int edged_width) |
342 |
|
{ |
343 |
|
int x,y; |
344 |
|
int pixels = 0; |
345 |
|
|
346 |
|
for (y = 1; y < height/2 - 1; y++) |
347 |
|
for (x = 1; x < width/2 - 1; x++) |
348 |
|
{ |
349 |
|
#define IS_PURE(a) ((a)<=16||(a)>=235) |
350 |
|
#define IMG_Y(Y,X) img->y[(Y)*edged_width + (X)] |
351 |
|
#define IMG_U(Y,X) img->u[(Y)*edged_width/2 + (X)] |
352 |
|
#define IMG_V(Y,X) img->v[(Y)*edged_width/2 + (X)] |
353 |
|
|
354 |
|
if (IS_PURE(IMG_Y(y*2 ,x*2 )) && |
355 |
|
IS_PURE(IMG_Y(y*2 ,x*2+1)) && |
356 |
|
IS_PURE(IMG_Y(y*2+1,x*2 )) && |
357 |
|
IS_PURE(IMG_Y(y*2+1,x*2+1))) |
358 |
|
{ |
359 |
|
IMG_U(y,x) = (IMG_U(y,x-1) + IMG_U(y-1, x) + IMG_U(y, x+1) + IMG_U(y+1, x)) / 4; |
360 |
|
IMG_V(y,x) = (IMG_V(y,x-1) + IMG_V(y-1, x) + IMG_V(y, x+1) + IMG_V(y+1, x)) / 4; |
361 |
|
pixels++; |
362 |
|
} |
363 |
|
|
364 |
interpolate_halfpel_h( |
#undef IS_PURE |
365 |
refh->u - offset, |
#undef IMG_Y |
366 |
refn->u - offset, |
#undef IMG_U |
367 |
edged_width / 2, edged_height / 2, |
#undef IMG_V |
368 |
rounding); |
} |
369 |
|
|
370 |
interpolate_halfpel_v( |
DPRINTF(XVID_DEBUG_DEBUG,"chroma_optimized_pixels = %i/%i\n", pixels, width*height/4); |
371 |
refv->u - offset, |
} |
372 |
refn->u - offset, |
|
373 |
edged_width / 2, edged_height / 2, |
|
374 |
rounding); |
|
375 |
|
|
376 |
interpolate_halfpel_hv( |
|
377 |
refhv->u - offset, |
/* |
378 |
refn->u - offset, |
perform safe packed colorspace conversion, by splitting |
379 |
edged_width / 2, edged_height / 2, |
the image up into an optimized area (pixel width divisible by 16), |
380 |
rounding); |
and two unoptimized/plain-c areas (pixel width divisible by 2) |
|
|
|
|
|
|
|
interpolate_halfpel_h( |
|
|
refh->v - offset, |
|
|
refn->v - offset, |
|
|
edged_width / 2, edged_height / 2, |
|
|
rounding); |
|
|
|
|
|
interpolate_halfpel_v( |
|
|
refv->v - offset, |
|
|
refn->v - offset, |
|
|
edged_width / 2, edged_height / 2, |
|
|
rounding); |
|
|
|
|
|
interpolate_halfpel_hv( |
|
|
refhv->v - offset, |
|
|
refn->v - offset, |
|
|
edged_width / 2, edged_height / 2, |
|
|
rounding); |
|
381 |
*/ |
*/ |
382 |
|
|
383 |
|
static void |
384 |
|
safe_packed_conv(uint8_t * x_ptr, int x_stride, |
385 |
|
uint8_t * y_ptr, uint8_t * u_ptr, uint8_t * v_ptr, |
386 |
|
int y_stride, int uv_stride, |
387 |
|
int width, int height, int vflip, |
388 |
|
packedFunc * func_opt, packedFunc func_c, int size) |
389 |
|
{ |
390 |
|
int width_opt, width_c; |
391 |
|
|
392 |
|
if (func_opt != func_c && x_stride < size*((width+15)/16)*16) |
393 |
|
{ |
394 |
|
width_opt = width & (~15); |
395 |
|
width_c = width - width_opt; |
396 |
|
} |
397 |
|
else |
398 |
|
{ |
399 |
|
width_opt = width; |
400 |
|
width_c = 0; |
401 |
} |
} |
402 |
|
|
403 |
|
func_opt(x_ptr, x_stride, |
404 |
|
y_ptr, u_ptr, v_ptr, y_stride, uv_stride, |
405 |
|
width_opt, height, vflip); |
406 |
|
|
407 |
|
if (width_c) |
408 |
|
{ |
409 |
|
func_c(x_ptr + size*width_opt, x_stride, |
410 |
|
y_ptr + width_opt, u_ptr + width_opt/2, v_ptr + width_opt/2, |
411 |
|
y_stride, uv_stride, width_c, height, vflip); |
412 |
|
} |
413 |
|
} |
414 |
|
|
415 |
|
|
416 |
|
|
417 |
int |
int |
418 |
image_input(IMAGE * image, |
image_input(IMAGE * image, |
419 |
uint32_t width, |
uint32_t width, |
420 |
int height, |
int height, |
421 |
uint32_t edged_width, |
uint32_t edged_width, |
422 |
uint8_t * src, |
uint8_t * src[4], |
423 |
int csp) |
int src_stride[4], |
424 |
|
int csp, |
425 |
|
int interlacing) |
426 |
{ |
{ |
427 |
|
const int edged_width2 = edged_width/2; |
428 |
/* if (csp & XVID_CSP_VFLIP) |
const int width2 = width/2; |
429 |
{ |
const int height2 = height/2; |
430 |
height = -height; |
#if 0 |
431 |
} |
const int height_signed = (csp & XVID_CSP_VFLIP) ? -height : height; |
432 |
*/ |
#endif |
433 |
|
|
434 |
switch (csp & ~XVID_CSP_VFLIP) { |
switch (csp & ~XVID_CSP_VFLIP) { |
435 |
case XVID_CSP_RGB555: |
case XVID_CSP_RGB555: |
436 |
rgb555_to_yv12(image->y, image->u, image->v, src, width, height, |
safe_packed_conv( |
437 |
edged_width); |
src[0], src_stride[0], image->y, image->u, image->v, |
438 |
return 0; |
edged_width, edged_width2, width, height, (csp & XVID_CSP_VFLIP), |
439 |
|
interlacing?rgb555i_to_yv12 :rgb555_to_yv12, |
440 |
|
interlacing?rgb555i_to_yv12_c:rgb555_to_yv12_c, 2); |
441 |
|
break; |
442 |
|
|
443 |
case XVID_CSP_RGB565: |
case XVID_CSP_RGB565: |
444 |
rgb565_to_yv12(image->y, image->u, image->v, src, width, height, |
safe_packed_conv( |
445 |
edged_width); |
src[0], src_stride[0], image->y, image->u, image->v, |
446 |
return 0; |
edged_width, edged_width2, width, height, (csp & XVID_CSP_VFLIP), |
447 |
|
interlacing?rgb565i_to_yv12 :rgb565_to_yv12, |
448 |
|
interlacing?rgb565i_to_yv12_c:rgb565_to_yv12_c, 2); |
449 |
|
break; |
450 |
|
|
451 |
|
|
452 |
case XVID_CSP_RGB24: |
case XVID_CSP_BGR: |
453 |
rgb24_to_yv12(image->y, image->u, image->v, src, width, height, |
safe_packed_conv( |
454 |
edged_width); |
src[0], src_stride[0], image->y, image->u, image->v, |
455 |
return 0; |
edged_width, edged_width2, width, height, (csp & XVID_CSP_VFLIP), |
456 |
|
interlacing?bgri_to_yv12 :bgr_to_yv12, |
457 |
|
interlacing?bgri_to_yv12_c:bgr_to_yv12_c, 3); |
458 |
|
break; |
459 |
|
|
460 |
case XVID_CSP_RGB32: |
case XVID_CSP_BGRA: |
461 |
rgb32_to_yv12(image->y, image->u, image->v, src, width, height, |
safe_packed_conv( |
462 |
edged_width); |
src[0], src_stride[0], image->y, image->u, image->v, |
463 |
return 0; |
edged_width, edged_width2, width, height, (csp & XVID_CSP_VFLIP), |
464 |
|
interlacing?bgrai_to_yv12 :bgra_to_yv12, |
465 |
|
interlacing?bgrai_to_yv12_c:bgra_to_yv12_c, 4); |
466 |
|
break; |
467 |
|
|
468 |
case XVID_CSP_I420: |
case XVID_CSP_ABGR : |
469 |
yuv_to_yv12(image->y, image->u, image->v, src, width, height, |
safe_packed_conv( |
470 |
edged_width); |
src[0], src_stride[0], image->y, image->u, image->v, |
471 |
return 0; |
edged_width, edged_width2, width, height, (csp & XVID_CSP_VFLIP), |
472 |
|
interlacing?abgri_to_yv12 :abgr_to_yv12, |
473 |
|
interlacing?abgri_to_yv12_c:abgr_to_yv12_c, 4); |
474 |
|
break; |
475 |
|
|
476 |
case XVID_CSP_YV12: /* u/v swapped */ |
case XVID_CSP_RGBA : |
477 |
yuv_to_yv12(image->y, image->v, image->u, src, width, height, |
safe_packed_conv( |
478 |
edged_width); |
src[0], src_stride[0], image->y, image->u, image->v, |
479 |
return 0; |
edged_width, edged_width2, width, height, (csp & XVID_CSP_VFLIP), |
480 |
|
interlacing?rgbai_to_yv12 :rgba_to_yv12, |
481 |
|
interlacing?rgbai_to_yv12_c:rgba_to_yv12_c, 4); |
482 |
|
break; |
483 |
|
|
484 |
|
case XVID_CSP_ARGB: |
485 |
|
safe_packed_conv( |
486 |
|
src[0], src_stride[0], image->y, image->u, image->v, |
487 |
|
edged_width, edged_width2, width, height, (csp & XVID_CSP_VFLIP), |
488 |
|
interlacing?argbi_to_yv12 : argb_to_yv12, |
489 |
|
interlacing?argbi_to_yv12_c: argb_to_yv12_c, 4); |
490 |
|
break; |
491 |
|
|
492 |
case XVID_CSP_YUY2: |
case XVID_CSP_YUY2: |
493 |
yuyv_to_yv12(image->y, image->u, image->v, src, width, height, |
safe_packed_conv( |
494 |
edged_width); |
src[0], src_stride[0], image->y, image->u, image->v, |
495 |
return 0; |
edged_width, edged_width2, width, height, (csp & XVID_CSP_VFLIP), |
496 |
|
interlacing?yuyvi_to_yv12 :yuyv_to_yv12, |
497 |
|
interlacing?yuyvi_to_yv12_c:yuyv_to_yv12_c, 2); |
498 |
|
break; |
499 |
|
|
500 |
case XVID_CSP_YVYU: /* u/v swapped */ |
case XVID_CSP_YVYU: /* u/v swapped */ |
501 |
yuyv_to_yv12(image->y, image->v, image->u, src, width, height, |
safe_packed_conv( |
502 |
edged_width); |
src[0], src_stride[0], image->y, image->v, image->u, |
503 |
return 0; |
edged_width, edged_width2, width, height, (csp & XVID_CSP_VFLIP), |
504 |
|
interlacing?yuyvi_to_yv12 :yuyv_to_yv12, |
505 |
|
interlacing?yuyvi_to_yv12_c:yuyv_to_yv12_c, 2); |
506 |
|
break; |
507 |
|
|
508 |
case XVID_CSP_UYVY: |
case XVID_CSP_UYVY: |
509 |
uyvy_to_yv12(image->y, image->u, image->v, src, width, height, |
safe_packed_conv( |
510 |
edged_width); |
src[0], src_stride[0], image->y, image->u, image->v, |
511 |
return 0; |
edged_width, edged_width2, width, height, (csp & XVID_CSP_VFLIP), |
512 |
|
interlacing?uyvyi_to_yv12 :uyvy_to_yv12, |
513 |
|
interlacing?uyvyi_to_yv12_c:uyvy_to_yv12_c, 2); |
514 |
|
break; |
515 |
|
|
516 |
case XVID_CSP_USER: |
case XVID_CSP_I420: /* YCbCr == YUV == internal colorspace for MPEG */ |
517 |
user_to_yuv_c(image->y, image->u, image->v, edged_width, |
yv12_to_yv12(image->y, image->u, image->v, edged_width, edged_width2, |
518 |
(DEC_PICTURE *) src, width, height); |
src[0], src[0] + src_stride[0]*height, src[0] + src_stride[0]*height + (src_stride[0]/2)*height2, |
519 |
return 0; |
src_stride[0], src_stride[0]/2, width, height, (csp & XVID_CSP_VFLIP)); |
520 |
|
break; |
521 |
|
|
522 |
|
case XVID_CSP_YV12: /* YCrCb == YVA == U and V plane swapped */ |
523 |
|
yv12_to_yv12(image->y, image->v, image->u, edged_width, edged_width2, |
524 |
|
src[0], src[0] + src_stride[0]*height, src[0] + src_stride[0]*height + (src_stride[0]/2)*height2, |
525 |
|
src_stride[0], src_stride[0]/2, width, height, (csp & XVID_CSP_VFLIP)); |
526 |
|
break; |
527 |
|
|
528 |
|
case XVID_CSP_PLANAR: /* YCbCr with arbitrary pointers and different strides for Y and UV */ |
529 |
|
yv12_to_yv12(image->y, image->u, image->v, edged_width, edged_width2, |
530 |
|
src[0], src[1], src[2], src_stride[0], src_stride[1], /* v: dst_stride[2] not yet supported */ |
531 |
|
width, height, (csp & XVID_CSP_VFLIP)); |
532 |
|
break; |
533 |
|
|
534 |
case XVID_CSP_NULL: |
case XVID_CSP_NULL: |
535 |
break; |
break; |
536 |
|
|
537 |
|
default : |
538 |
|
return -1; |
539 |
} |
} |
540 |
|
|
541 |
return -1; |
|
542 |
|
/* pad out image when the width and/or height is not a multiple of 16 */ |
543 |
|
|
544 |
|
if (width & 15) |
545 |
|
{ |
546 |
|
int i; |
547 |
|
int pad_width = 16 - (width&15); |
548 |
|
for (i = 0; i < height; i++) |
549 |
|
{ |
550 |
|
memset(image->y + i*edged_width + width, |
551 |
|
*(image->y + i*edged_width + width - 1), pad_width); |
552 |
|
} |
553 |
|
for (i = 0; i < height/2; i++) |
554 |
|
{ |
555 |
|
memset(image->u + i*edged_width2 + width2, |
556 |
|
*(image->u + i*edged_width2 + width2 - 1),pad_width/2); |
557 |
|
memset(image->v + i*edged_width2 + width2, |
558 |
|
*(image->v + i*edged_width2 + width2 - 1),pad_width/2); |
559 |
|
} |
560 |
|
} |
561 |
|
|
562 |
|
if (height & 15) |
563 |
|
{ |
564 |
|
int pad_height = 16 - (height&15); |
565 |
|
int length = ((width+15)/16)*16; |
566 |
|
int i; |
567 |
|
for (i = 0; i < pad_height; i++) |
568 |
|
{ |
569 |
|
memcpy(image->y + (height+i)*edged_width, |
570 |
|
image->y + (height-1)*edged_width,length); |
571 |
|
} |
572 |
|
|
573 |
|
for (i = 0; i < pad_height/2; i++) |
574 |
|
{ |
575 |
|
memcpy(image->u + (height2+i)*edged_width2, |
576 |
|
image->u + (height2-1)*edged_width2,length/2); |
577 |
|
memcpy(image->v + (height2+i)*edged_width2, |
578 |
|
image->v + (height2-1)*edged_width2,length/2); |
579 |
|
} |
580 |
|
} |
581 |
|
|
582 |
|
/* |
583 |
|
if (interlacing) |
584 |
|
image_printf(image, edged_width, height, 5,5, "[i]"); |
585 |
|
image_dump_yuvpgm(image, edged_width, ((width+15)/16)*16, ((height+15)/16)*16, "\\encode.pgm"); |
586 |
|
*/ |
587 |
|
return 0; |
588 |
} |
} |
589 |
|
|
590 |
|
|
594 |
uint32_t width, |
uint32_t width, |
595 |
int height, |
int height, |
596 |
uint32_t edged_width, |
uint32_t edged_width, |
597 |
uint8_t * dst, |
uint8_t * dst[4], |
598 |
uint32_t dst_stride, |
int dst_stride[4], |
599 |
int csp) |
int csp, |
600 |
|
int interlacing) |
601 |
{ |
{ |
602 |
if (csp & XVID_CSP_VFLIP) { |
const int edged_width2 = edged_width/2; |
603 |
height = -height; |
int height2 = height/2; |
604 |
} |
|
605 |
|
/* |
606 |
|
if (interlacing) |
607 |
|
image_printf(image, edged_width, height, 5,100, "[i]=%i,%i",width,height); |
608 |
|
image_dump_yuvpgm(image, edged_width, width, height, "\\decode.pgm"); |
609 |
|
*/ |
610 |
|
|
611 |
switch (csp & ~XVID_CSP_VFLIP) { |
switch (csp & ~XVID_CSP_VFLIP) { |
612 |
case XVID_CSP_RGB555: |
case XVID_CSP_RGB555: |
613 |
yv12_to_rgb555(dst, dst_stride, image->y, image->u, image->v, |
safe_packed_conv( |
614 |
edged_width, edged_width / 2, width, height); |
dst[0], dst_stride[0], image->y, image->u, image->v, |
615 |
|
edged_width, edged_width2, width, height, (csp & XVID_CSP_VFLIP), |
616 |
|
interlacing?yv12_to_rgb555i :yv12_to_rgb555, |
617 |
|
interlacing?yv12_to_rgb555i_c:yv12_to_rgb555_c, 2); |
618 |
return 0; |
return 0; |
619 |
|
|
620 |
case XVID_CSP_RGB565: |
case XVID_CSP_RGB565: |
621 |
yv12_to_rgb565(dst, dst_stride, image->y, image->u, image->v, |
safe_packed_conv( |
622 |
edged_width, edged_width / 2, width, height); |
dst[0], dst_stride[0], image->y, image->u, image->v, |
623 |
return 0; |
edged_width, edged_width2, width, height, (csp & XVID_CSP_VFLIP), |
624 |
|
interlacing?yv12_to_rgb565i :yv12_to_rgb565, |
625 |
case XVID_CSP_RGB24: |
interlacing?yv12_to_rgb565i_c:yv12_to_rgb565_c, 2); |
626 |
yv12_to_rgb24(dst, dst_stride, image->y, image->u, image->v, |
return 0; |
627 |
edged_width, edged_width / 2, width, height); |
|
628 |
return 0; |
case XVID_CSP_BGR: |
629 |
|
safe_packed_conv( |
630 |
case XVID_CSP_RGB32: |
dst[0], dst_stride[0], image->y, image->u, image->v, |
631 |
yv12_to_rgb32(dst, dst_stride, image->y, image->u, image->v, |
edged_width, edged_width2, width, height, (csp & XVID_CSP_VFLIP), |
632 |
edged_width, edged_width / 2, width, height); |
interlacing?yv12_to_bgri :yv12_to_bgr, |
633 |
return 0; |
interlacing?yv12_to_bgri_c:yv12_to_bgr_c, 3); |
634 |
|
return 0; |
635 |
case XVID_CSP_I420: |
|
636 |
yv12_to_yuv(dst, dst_stride, image->y, image->u, image->v, edged_width, |
case XVID_CSP_BGRA: |
637 |
edged_width / 2, width, height); |
safe_packed_conv( |
638 |
return 0; |
dst[0], dst_stride[0], image->y, image->u, image->v, |
639 |
|
edged_width, edged_width2, width, height, (csp & XVID_CSP_VFLIP), |
640 |
case XVID_CSP_YV12: // u,v swapped |
interlacing?yv12_to_bgrai :yv12_to_bgra, |
641 |
yv12_to_yuv(dst, dst_stride, image->y, image->v, image->u, edged_width, |
interlacing?yv12_to_bgrai_c:yv12_to_bgra_c, 4); |
642 |
edged_width / 2, width, height); |
return 0; |
643 |
|
|
644 |
|
case XVID_CSP_ABGR: |
645 |
|
safe_packed_conv( |
646 |
|
dst[0], dst_stride[0], image->y, image->u, image->v, |
647 |
|
edged_width, edged_width2, width, height, (csp & XVID_CSP_VFLIP), |
648 |
|
interlacing?yv12_to_abgri :yv12_to_abgr, |
649 |
|
interlacing?yv12_to_abgri_c:yv12_to_abgr_c, 4); |
650 |
|
return 0; |
651 |
|
|
652 |
|
case XVID_CSP_RGBA: |
653 |
|
safe_packed_conv( |
654 |
|
dst[0], dst_stride[0], image->y, image->u, image->v, |
655 |
|
edged_width, edged_width2, width, height, (csp & XVID_CSP_VFLIP), |
656 |
|
interlacing?yv12_to_rgbai :yv12_to_rgba, |
657 |
|
interlacing?yv12_to_rgbai_c:yv12_to_rgba_c, 4); |
658 |
|
return 0; |
659 |
|
|
660 |
|
case XVID_CSP_ARGB: |
661 |
|
safe_packed_conv( |
662 |
|
dst[0], dst_stride[0], image->y, image->u, image->v, |
663 |
|
edged_width, edged_width2, width, height, (csp & XVID_CSP_VFLIP), |
664 |
|
interlacing?yv12_to_argbi :yv12_to_argb, |
665 |
|
interlacing?yv12_to_argbi_c:yv12_to_argb_c, 4); |
666 |
return 0; |
return 0; |
667 |
|
|
668 |
case XVID_CSP_YUY2: |
case XVID_CSP_YUY2: |
669 |
yv12_to_yuyv(dst, dst_stride, image->y, image->u, image->v, |
safe_packed_conv( |
670 |
edged_width, edged_width / 2, width, height); |
dst[0], dst_stride[0], image->y, image->u, image->v, |
671 |
|
edged_width, edged_width2, width, height, (csp & XVID_CSP_VFLIP), |
672 |
|
interlacing?yv12_to_yuyvi :yv12_to_yuyv, |
673 |
|
interlacing?yv12_to_yuyvi_c:yv12_to_yuyv_c, 2); |
674 |
return 0; |
return 0; |
675 |
|
|
676 |
case XVID_CSP_YVYU: // u,v swapped |
case XVID_CSP_YVYU: /* u,v swapped */ |
677 |
yv12_to_yuyv(dst, dst_stride, image->y, image->v, image->u, |
safe_packed_conv( |
678 |
edged_width, edged_width / 2, width, height); |
dst[0], dst_stride[0], image->y, image->v, image->u, |
679 |
|
edged_width, edged_width2, width, height, (csp & XVID_CSP_VFLIP), |
680 |
|
interlacing?yv12_to_yuyvi :yv12_to_yuyv, |
681 |
|
interlacing?yv12_to_yuyvi_c:yv12_to_yuyv_c, 2); |
682 |
return 0; |
return 0; |
683 |
|
|
684 |
case XVID_CSP_UYVY: |
case XVID_CSP_UYVY: |
685 |
yv12_to_uyvy(dst, dst_stride, image->y, image->u, image->v, |
safe_packed_conv( |
686 |
edged_width, edged_width / 2, width, height); |
dst[0], dst_stride[0], image->y, image->u, image->v, |
687 |
return 0; |
edged_width, edged_width2, width, height, (csp & XVID_CSP_VFLIP), |
688 |
|
interlacing?yv12_to_uyvyi :yv12_to_uyvy, |
689 |
case XVID_CSP_USER: |
interlacing?yv12_to_uyvyi_c:yv12_to_uyvy_c, 2); |
690 |
((DEC_PICTURE *) dst)->y = image->y; |
return 0; |
691 |
((DEC_PICTURE *) dst)->u = image->u; |
|
692 |
((DEC_PICTURE *) dst)->v = image->v; |
case XVID_CSP_I420: /* YCbCr == YUV == internal colorspace for MPEG */ |
693 |
((DEC_PICTURE *) dst)->stride_y = edged_width; |
yv12_to_yv12(dst[0], dst[0] + dst_stride[0]*height, dst[0] + dst_stride[0]*height + (dst_stride[0]/2)*height2, |
694 |
((DEC_PICTURE *) dst)->stride_uv = edged_width / 2; |
dst_stride[0], dst_stride[0]/2, |
695 |
|
image->y, image->u, image->v, edged_width, edged_width2, |
696 |
|
width, height, (csp & XVID_CSP_VFLIP)); |
697 |
|
return 0; |
698 |
|
|
699 |
|
case XVID_CSP_YV12: /* YCrCb == YVU == U and V plane swapped */ |
700 |
|
yv12_to_yv12(dst[0], dst[0] + dst_stride[0]*height, dst[0] + dst_stride[0]*height + (dst_stride[0]/2)*height2, |
701 |
|
dst_stride[0], dst_stride[0]/2, |
702 |
|
image->y, image->v, image->u, edged_width, edged_width2, |
703 |
|
width, height, (csp & XVID_CSP_VFLIP)); |
704 |
|
return 0; |
705 |
|
|
706 |
|
case XVID_CSP_PLANAR: /* YCbCr with arbitrary pointers and different strides for Y and UV */ |
707 |
|
yv12_to_yv12(dst[0], dst[1], dst[2], |
708 |
|
dst_stride[0], dst_stride[1], /* v: dst_stride[2] not yet supported */ |
709 |
|
image->y, image->u, image->v, edged_width, edged_width2, |
710 |
|
width, height, (csp & XVID_CSP_VFLIP)); |
711 |
|
return 0; |
712 |
|
|
713 |
|
case XVID_CSP_INTERNAL : |
714 |
|
dst[0] = image->y; |
715 |
|
dst[1] = image->u; |
716 |
|
dst[2] = image->v; |
717 |
|
dst_stride[0] = edged_width; |
718 |
|
dst_stride[1] = edged_width/2; |
719 |
|
dst_stride[2] = edged_width/2; |
720 |
return 0; |
return 0; |
721 |
|
|
722 |
case XVID_CSP_NULL: |
case XVID_CSP_NULL: |
723 |
case XVID_CSP_EXTERN: |
case XVID_CSP_SLICE: |
724 |
return 0; |
return 0; |
725 |
|
|
726 |
} |
} |
760 |
return psnr_y; |
return psnr_y; |
761 |
} |
} |
762 |
|
|
763 |
/* |
|
764 |
|
float sse_to_PSNR(long sse, int pixels) |
765 |
|
{ |
766 |
|
if (sse==0) |
767 |
|
return 99.99F; |
768 |
|
|
769 |
|
return 48.131F - 10*(float)log10((float)sse/(float)(pixels)); /* log10(255*255)=4.8131 */ |
770 |
|
|
771 |
|
} |
772 |
|
|
773 |
|
long plane_sse(uint8_t *orig, |
774 |
|
uint8_t *recon, |
775 |
|
uint16_t stride, |
776 |
|
uint16_t width, |
777 |
|
uint16_t height) |
778 |
|
{ |
779 |
|
int y, bwidth, bheight; |
780 |
|
long sse = 0; |
781 |
|
|
782 |
|
bwidth = width & (~0x07); |
783 |
|
bheight = height & (~0x07); |
784 |
|
|
785 |
|
/* Compute the 8x8 integer part */ |
786 |
|
for (y = 0; y<bheight; y += 8) { |
787 |
|
int x; |
788 |
|
|
789 |
|
/* Compute sse for the band */ |
790 |
|
for (x = 0; x<bwidth; x += 8) |
791 |
|
sse += sse8_8bit(orig + x, recon + x, stride); |
792 |
|
|
793 |
|
/* remaining pixels of the 8 pixels high band */ |
794 |
|
for (x = bwidth; x < width; x++) { |
795 |
|
int diff; |
796 |
|
diff = *(orig + 0*stride + x) - *(recon + 0*stride + x); |
797 |
|
sse += diff * diff; |
798 |
|
diff = *(orig + 1*stride + x) - *(recon + 1*stride + x); |
799 |
|
sse += diff * diff; |
800 |
|
diff = *(orig + 2*stride + x) - *(recon + 2*stride + x); |
801 |
|
sse += diff * diff; |
802 |
|
diff = *(orig + 3*stride + x) - *(recon + 3*stride + x); |
803 |
|
sse += diff * diff; |
804 |
|
diff = *(orig + 4*stride + x) - *(recon + 4*stride + x); |
805 |
|
sse += diff * diff; |
806 |
|
diff = *(orig + 5*stride + x) - *(recon + 5*stride + x); |
807 |
|
sse += diff * diff; |
808 |
|
diff = *(orig + 6*stride + x) - *(recon + 6*stride + x); |
809 |
|
sse += diff * diff; |
810 |
|
diff = *(orig + 7*stride + x) - *(recon + 7*stride + x); |
811 |
|
sse += diff * diff; |
812 |
|
} |
813 |
|
|
814 |
|
orig += 8*stride; |
815 |
|
recon += 8*stride; |
816 |
|
} |
817 |
|
|
818 |
|
/* Compute the down rectangle sse */ |
819 |
|
for (y = bheight; y < height; y++) { |
820 |
|
int x; |
821 |
|
for (x = 0; x < width; x++) { |
822 |
|
int diff; |
823 |
|
diff = *(orig + x) - *(recon + x); |
824 |
|
sse += diff * diff; |
825 |
|
} |
826 |
|
orig += stride; |
827 |
|
recon += stride; |
828 |
|
} |
829 |
|
|
830 |
|
return (sse); |
831 |
|
} |
832 |
|
|
833 |
|
#if 0 |
834 |
|
|
835 |
#include <stdio.h> |
#include <stdio.h> |
836 |
#include <string.h> |
#include <string.h> |
854 |
} |
} |
855 |
|
|
856 |
|
|
857 |
// dump image+edges to yuv pgm files |
/* dump image+edges to yuv pgm files */ |
858 |
|
|
859 |
int image_dump(IMAGE * image, uint32_t edged_width, uint32_t edged_height, char * path, int number) |
int image_dump(IMAGE * image, uint32_t edged_width, uint32_t edged_height, char * path, int number) |
860 |
{ |
{ |
877 |
|
|
878 |
return 0; |
return 0; |
879 |
} |
} |
880 |
*/ |
#endif |
881 |
|
|
882 |
|
|
883 |
|
|
926 |
} |
} |
927 |
|
|
928 |
|
|
|
#define ABS(X) (((X)>0)?(X):-(X)) |
|
929 |
float |
float |
930 |
image_mad(const IMAGE * img1, |
image_mad(const IMAGE * img1, |
931 |
const IMAGE * img2, |
const IMAGE * img2, |
942 |
|
|
943 |
for (y = 0; y < height; y++) |
for (y = 0; y < height; y++) |
944 |
for (x = 0; x < width; x++) |
for (x = 0; x < width; x++) |
945 |
sum += ABS(img1->y[x + y * stride] - img2->y[x + y * stride]); |
sum += abs(img1->y[x + y * stride] - img2->y[x + y * stride]); |
946 |
|
|
947 |
for (y = 0; y < height2; y++) |
for (y = 0; y < height2; y++) |
948 |
for (x = 0; x < width2; x++) |
for (x = 0; x < width2; x++) |
949 |
sum += ABS(img1->u[x + y * stride2] - img2->u[x + y * stride2]); |
sum += abs(img1->u[x + y * stride2] - img2->u[x + y * stride2]); |
950 |
|
|
951 |
for (y = 0; y < height2; y++) |
for (y = 0; y < height2; y++) |
952 |
for (x = 0; x < width2; x++) |
for (x = 0; x < width2; x++) |
953 |
sum += ABS(img1->v[x + y * stride2] - img2->v[x + y * stride2]); |
sum += abs(img1->v[x + y * stride2] - img2->v[x + y * stride2]); |
954 |
|
|
955 |
return (float) sum / (width * height * 3 / 2); |
return (float) sum / (width * height * 3 / 2); |
956 |
} |
} |
957 |
|
|
958 |
void |
void |
959 |
output_slice(IMAGE * cur, int std, int width, XVID_DEC_PICTURE* out_frm, int mbx, int mby,int mbl) { |
output_slice(IMAGE * cur, int stride, int width, xvid_image_t* out_frm, int mbx, int mby,int mbl) { |
960 |
uint8_t *dY,*dU,*dV,*sY,*sU,*sV; |
uint8_t *dY,*dU,*dV,*sY,*sU,*sV; |
961 |
int std2 = std >> 1; |
int stride2 = stride >> 1; |
962 |
int w = mbl << 4, w2,i; |
int w = mbl << 4, w2,i; |
963 |
|
|
964 |
if(w > width) |
if(w > width) |
965 |
w = width; |
w = width; |
966 |
w2 = w >> 1; |
w2 = w >> 1; |
967 |
|
|
968 |
dY = (uint8_t*)out_frm->y + (mby << 4) * out_frm->stride_y + (mbx << 4); |
dY = (uint8_t*)out_frm->plane[0] + (mby << 4) * out_frm->stride[0] + (mbx << 4); |
969 |
dU = (uint8_t*)out_frm->u + (mby << 3) * out_frm->stride_u + (mbx << 3); |
dU = (uint8_t*)out_frm->plane[1] + (mby << 3) * out_frm->stride[1] + (mbx << 3); |
970 |
dV = (uint8_t*)out_frm->v + (mby << 3) * out_frm->stride_v + (mbx << 3); |
dV = (uint8_t*)out_frm->plane[2] + (mby << 3) * out_frm->stride[2] + (mbx << 3); |
971 |
sY = cur->y + (mby << 4) * std + (mbx << 4); |
sY = cur->y + (mby << 4) * stride + (mbx << 4); |
972 |
sU = cur->u + (mby << 3) * std2 + (mbx << 3); |
sU = cur->u + (mby << 3) * stride2 + (mbx << 3); |
973 |
sV = cur->v + (mby << 3) * std2 + (mbx << 3); |
sV = cur->v + (mby << 3) * stride2 + (mbx << 3); |
974 |
|
|
975 |
for(i = 0 ; i < 16 ; i++) { |
for(i = 0 ; i < 16 ; i++) { |
976 |
memcpy(dY,sY,w); |
memcpy(dY,sY,w); |
977 |
dY += out_frm->stride_y; |
dY += out_frm->stride[0]; |
978 |
sY += std; |
sY += stride; |
979 |
} |
} |
980 |
for(i = 0 ; i < 8 ; i++) { |
for(i = 0 ; i < 8 ; i++) { |
981 |
memcpy(dU,sU,w2); |
memcpy(dU,sU,w2); |
982 |
dU += out_frm->stride_u; |
dU += out_frm->stride[1]; |
983 |
sU += std2; |
sU += stride2; |
984 |
} |
} |
985 |
for(i = 0 ; i < 8 ; i++) { |
for(i = 0 ; i < 8 ; i++) { |
986 |
memcpy(dV,sV,w2); |
memcpy(dV,sV,w2); |
987 |
dV += out_frm->stride_v; |
dV += out_frm->stride[2]; |
988 |
sV += std2; |
sV += stride2; |
989 |
} |
} |
990 |
} |
} |
991 |
|
|
992 |
|
|
993 |
|
void |
994 |
|
image_clear(IMAGE * img, int width, int height, int edged_width, |
995 |
|
int y, int u, int v) |
996 |
|
{ |
997 |
|
uint8_t * p; |
998 |
|
int i; |
999 |
|
|
1000 |
|
p = img->y; |
1001 |
|
for (i = 0; i < height; i++) { |
1002 |
|
memset(p, y, width); |
1003 |
|
p += edged_width; |
1004 |
|
} |
1005 |
|
|
1006 |
|
p = img->u; |
1007 |
|
for (i = 0; i < height/2; i++) { |
1008 |
|
memset(p, u, width/2); |
1009 |
|
p += edged_width/2; |
1010 |
|
} |
1011 |
|
|
1012 |
|
p = img->v; |
1013 |
|
for (i = 0; i < height/2; i++) { |
1014 |
|
memset(p, v, width/2); |
1015 |
|
p += edged_width/2; |
1016 |
|
} |
1017 |
|
} |
1018 |
|
|
1019 |
|
/****************************************************************************/ |
1020 |
|
|
1021 |
|
static void (*deintl_core)(uint8_t *, int width, int height, const int stride) = 0; |
1022 |
|
extern void xvid_deinterlace_sse(uint8_t *, int width, int height, const int stride); |
1023 |
|
|
1024 |
|
#define CLIP_255(x) ( ((x)&~255) ? ((-(x)) >> (8*sizeof((x))-1))&0xff : (x) ) |
1025 |
|
|
1026 |
|
static void deinterlace_c(uint8_t *pix, int width, int height, const int bps) |
1027 |
|
{ |
1028 |
|
pix += bps; |
1029 |
|
while(width-->0) |
1030 |
|
{ |
1031 |
|
int p1 = pix[-bps]; |
1032 |
|
int p2 = pix[0]; |
1033 |
|
int p0 = p2; |
1034 |
|
int j = (height>>1) - 1; |
1035 |
|
int V; |
1036 |
|
unsigned char *P = pix++; |
1037 |
|
while(j-->0) |
1038 |
|
{ |
1039 |
|
const int p3 = P[ bps]; |
1040 |
|
const int p4 = P[2*bps]; |
1041 |
|
V = ((p1+p3+1)>>1) + ((p2 - ((p0+p4+1)>>1)) >> 2); |
1042 |
|
P[0] = CLIP_255( V ); |
1043 |
|
p0 = p2; |
1044 |
|
p1 = p3; |
1045 |
|
p2 = p4; |
1046 |
|
P += 2*bps; |
1047 |
|
} |
1048 |
|
V = ((p1+p1+1)>>1) + ((p2 - ((p0+p2+1)>>1)) >> 2); |
1049 |
|
P[0] = CLIP_255( V ); |
1050 |
|
} |
1051 |
|
} |
1052 |
|
#undef CLIP_255 |
1053 |
|
|
1054 |
|
int xvid_image_deinterlace(xvid_image_t* img, int width, int height, int bottom_first) |
1055 |
|
{ |
1056 |
|
if (height&1) |
1057 |
|
return 0; |
1058 |
|
if (img->csp!=XVID_CSP_PLANAR && img->csp!=XVID_CSP_I420 && img->csp!=XVID_CSP_YV12) |
1059 |
|
return 0; /* not yet supported */ |
1060 |
|
if (deintl_core==0) { |
1061 |
|
deintl_core = deinterlace_c; |
1062 |
|
#ifdef ARCH_IS_IA32 |
1063 |
|
{ |
1064 |
|
int cpu_flags = check_cpu_features(); |
1065 |
|
if (cpu_flags & XVID_CPU_MMX) |
1066 |
|
deintl_core = xvid_deinterlace_sse; |
1067 |
|
} |
1068 |
|
#endif |
1069 |
|
} |
1070 |
|
if (!bottom_first) { |
1071 |
|
deintl_core(img->plane[0], width, height, img->stride[0]); |
1072 |
|
deintl_core(img->plane[1], width>>1, height>>1, img->stride[1]); |
1073 |
|
deintl_core(img->plane[2], width>>1, height>>1, img->stride[2]); |
1074 |
|
} |
1075 |
|
else { |
1076 |
|
deintl_core((uint8_t *)img->plane[0] + ( height -1)*img->stride[0], width, height, -img->stride[0]); |
1077 |
|
deintl_core((uint8_t *)img->plane[1] + ((height>>1)-1)*img->stride[1], width>>1, height>>1, -img->stride[1]); |
1078 |
|
deintl_core((uint8_t *)img->plane[2] + ((height>>1)-1)*img->stride[2], width>>1, height>>1, -img->stride[2]); |
1079 |
|
} |
1080 |
|
emms(); |
1081 |
|
|
1082 |
|
return 1; |
1083 |
|
} |
1084 |
|
|