32 |
* |
* |
33 |
* History: |
* History: |
34 |
* |
* |
35 |
|
* 15.07.2002 fix a bug in B-frame decode at DIRECT mode |
36 |
|
* MinChen <chenm001@163.com> |
37 |
|
* 10.07.2002 added BFRAMES_DEC_DEBUG support |
38 |
|
* Fix a little bug for low_delay flag |
39 |
|
* MinChen <chenm001@163.com> |
40 |
* 28.06.2002 added basic resync support to iframe/pframe_decode() |
* 28.06.2002 added basic resync support to iframe/pframe_decode() |
41 |
* 22.06.2002 added primitive N_VOP support |
* 22.06.2002 added primitive N_VOP support |
42 |
* #define BFRAMES_DEC now enables Minchenm's bframe decoder |
* #define BFRAMES_DEC now enables Minchen's bframe decoder |
43 |
* 08.05.2002 add low_delay support for B_VOP decode |
* 08.05.2002 add low_delay support for B_VOP decode |
44 |
* MinChen <chenm001@163.com> |
* MinChen <chenm001@163.com> |
45 |
* 05.05.2002 fix some B-frame decode problem |
* 05.05.2002 fix some B-frame decode problem |
62 |
#include <stdlib.h> |
#include <stdlib.h> |
63 |
#include <string.h> |
#include <string.h> |
64 |
|
|
65 |
|
#ifdef BFRAMES_DEC_DEBUG |
66 |
|
#define BFRAMES_DEC |
67 |
|
#endif |
68 |
|
|
69 |
#include "xvid.h" |
#include "xvid.h" |
70 |
#include "portab.h" |
#include "portab.h" |
71 |
|
|
136 |
return XVID_ERR_MEMORY; |
return XVID_ERR_MEMORY; |
137 |
} |
} |
138 |
|
|
139 |
|
if (image_create(&dec->refh, dec->edged_width, dec->edged_height)) { |
140 |
|
image_destroy(&dec->cur, dec->edged_width, dec->edged_height); |
141 |
|
image_destroy(&dec->refn[0], dec->edged_width, dec->edged_height); |
142 |
|
image_destroy(&dec->refn[1], dec->edged_width, dec->edged_height); |
143 |
|
image_destroy(&dec->refn[2], dec->edged_width, dec->edged_height); |
144 |
|
xvid_free(dec); |
145 |
|
return XVID_ERR_MEMORY; |
146 |
|
} |
147 |
|
|
148 |
dec->mbs = |
dec->mbs = |
149 |
xvid_malloc(sizeof(MACROBLOCK) * dec->mb_width * dec->mb_height, |
xvid_malloc(sizeof(MACROBLOCK) * dec->mb_width * dec->mb_height, |
150 |
CACHE_LINE); |
CACHE_LINE); |
153 |
image_destroy(&dec->refn[0], dec->edged_width, dec->edged_height); |
image_destroy(&dec->refn[0], dec->edged_width, dec->edged_height); |
154 |
image_destroy(&dec->refn[1], dec->edged_width, dec->edged_height); |
image_destroy(&dec->refn[1], dec->edged_width, dec->edged_height); |
155 |
image_destroy(&dec->refn[2], dec->edged_width, dec->edged_height); |
image_destroy(&dec->refn[2], dec->edged_width, dec->edged_height); |
156 |
|
image_destroy(&dec->refh, dec->edged_width, dec->edged_height); |
157 |
xvid_free(dec); |
xvid_free(dec); |
158 |
return XVID_ERR_MEMORY; |
return XVID_ERR_MEMORY; |
159 |
} |
} |
171 |
image_destroy(&dec->refn[0], dec->edged_width, dec->edged_height); |
image_destroy(&dec->refn[0], dec->edged_width, dec->edged_height); |
172 |
image_destroy(&dec->refn[1], dec->edged_width, dec->edged_height); |
image_destroy(&dec->refn[1], dec->edged_width, dec->edged_height); |
173 |
image_destroy(&dec->refn[2], dec->edged_width, dec->edged_height); |
image_destroy(&dec->refn[2], dec->edged_width, dec->edged_height); |
174 |
|
image_destroy(&dec->refh, dec->edged_width, dec->edged_height); |
175 |
xvid_free(dec); |
xvid_free(dec); |
176 |
return XVID_ERR_MEMORY; |
return XVID_ERR_MEMORY; |
177 |
} |
} |
197 |
image_destroy(&dec->refn[0], dec->edged_width, dec->edged_height); |
image_destroy(&dec->refn[0], dec->edged_width, dec->edged_height); |
198 |
image_destroy(&dec->refn[1], dec->edged_width, dec->edged_height); |
image_destroy(&dec->refn[1], dec->edged_width, dec->edged_height); |
199 |
image_destroy(&dec->refn[2], dec->edged_width, dec->edged_height); |
image_destroy(&dec->refn[2], dec->edged_width, dec->edged_height); |
200 |
|
image_destroy(&dec->refh, dec->edged_width, dec->edged_height); |
201 |
image_destroy(&dec->cur, dec->edged_width, dec->edged_height); |
image_destroy(&dec->cur, dec->edged_width, dec->edged_height); |
202 |
xvid_free(dec); |
xvid_free(dec); |
203 |
|
|
280 |
start_timer(); |
start_timer(); |
281 |
if (cbp & (1 << (5 - i))) // coded |
if (cbp & (1 << (5 - i))) // coded |
282 |
{ |
{ |
283 |
get_intra_block(bs, &block[i * 64], pMB->acpred_directions[i], |
int direction = dec->alternate_vertical_scan ? |
284 |
start_coeff); |
2 : pMB->acpred_directions[i]; |
285 |
|
|
286 |
|
get_intra_block(bs, &block[i * 64], direction, start_coeff); |
287 |
} |
} |
288 |
stop_coding_timer(); |
stop_coding_timer(); |
289 |
|
|
362 |
uv_dx = pMB->mvs[0].x; |
uv_dx = pMB->mvs[0].x; |
363 |
uv_dy = pMB->mvs[0].y; |
uv_dy = pMB->mvs[0].y; |
364 |
|
|
365 |
|
if (dec->quarterpel) |
366 |
|
{ |
367 |
|
uv_dx = (uv_dx >> 1) | (uv_dx & 1); |
368 |
|
uv_dy = (uv_dy >> 1) | (uv_dy & 1); |
369 |
|
} |
370 |
|
|
371 |
uv_dx = (uv_dx & 3) ? (uv_dx >> 1) | 1 : uv_dx / 2; |
uv_dx = (uv_dx & 3) ? (uv_dx >> 1) | 1 : uv_dx / 2; |
372 |
uv_dy = (uv_dy & 3) ? (uv_dy >> 1) | 1 : uv_dy / 2; |
uv_dy = (uv_dy & 3) ? (uv_dy >> 1) | 1 : uv_dy / 2; |
373 |
|
|
374 |
|
start_timer(); |
375 |
|
if(dec->quarterpel) { |
376 |
|
interpolate16x16_quarterpel(dec->cur.y, dec->refn[0].y, dec->refh.y, dec->refh.y + 64, |
377 |
|
dec->refh.y + 128, 16*x_pos, 16*y_pos, |
378 |
|
pMB->mvs[0].x, pMB->mvs[0].y, stride, rounding); |
379 |
|
} |
380 |
|
else { |
381 |
|
interpolate8x8_switch(dec->cur.y, dec->refn[0].y, 16*x_pos, 16*y_pos, |
382 |
|
pMB->mvs[0].x, pMB->mvs[0].y, stride, rounding); |
383 |
|
interpolate8x8_switch(dec->cur.y, dec->refn[0].y, 16*x_pos + 8, 16*y_pos, |
384 |
|
pMB->mvs[1].x, pMB->mvs[1].y, stride, rounding); |
385 |
|
interpolate8x8_switch(dec->cur.y, dec->refn[0].y, 16*x_pos, 16*y_pos + 8, |
386 |
|
pMB->mvs[2].x, pMB->mvs[2].y, stride, rounding); |
387 |
|
interpolate8x8_switch(dec->cur.y, dec->refn[0].y, 16*x_pos + 8, 16*y_pos + 8, |
388 |
|
pMB->mvs[3].x, pMB->mvs[3].y, stride, rounding); |
389 |
|
} |
390 |
|
|
391 |
|
interpolate8x8_switch(dec->cur.u, dec->refn[0].u, 8 * x_pos, 8 * y_pos, |
392 |
|
uv_dx, uv_dy, stride2, rounding); |
393 |
|
interpolate8x8_switch(dec->cur.v, dec->refn[0].v, 8 * x_pos, 8 * y_pos, |
394 |
|
uv_dx, uv_dy, stride2, rounding); |
395 |
|
stop_comp_timer(); |
396 |
|
|
397 |
} else { |
} else { |
398 |
int sum; |
int sum; |
|
|
|
399 |
sum = pMB->mvs[0].x + pMB->mvs[1].x + pMB->mvs[2].x + pMB->mvs[3].x; |
sum = pMB->mvs[0].x + pMB->mvs[1].x + pMB->mvs[2].x + pMB->mvs[3].x; |
400 |
uv_dx = |
|
401 |
(sum == |
if (dec->quarterpel) |
402 |
0 ? 0 : SIGN(sum) * (roundtab[ABS(sum) % 16] + |
{ |
403 |
(ABS(sum) / 16) * 2)); |
sum /= 2; |
404 |
|
} |
405 |
|
|
406 |
|
uv_dx = (sum == 0 ? 0 : SIGN(sum) * (roundtab[ABS(sum) % 16] + (ABS(sum) / 16) * 2)); |
407 |
|
|
408 |
sum = pMB->mvs[0].y + pMB->mvs[1].y + pMB->mvs[2].y + pMB->mvs[3].y; |
sum = pMB->mvs[0].y + pMB->mvs[1].y + pMB->mvs[2].y + pMB->mvs[3].y; |
409 |
uv_dy = |
|
410 |
(sum == |
if (dec->quarterpel) |
411 |
0 ? 0 : SIGN(sum) * (roundtab[ABS(sum) % 16] + |
{ |
412 |
(ABS(sum) / 16) * 2)); |
sum /= 2; |
413 |
} |
} |
414 |
|
|
415 |
|
uv_dy = (sum == 0 ? 0 : SIGN(sum) * (roundtab[ABS(sum) % 16] + (ABS(sum) / 16) * 2)); |
416 |
|
|
417 |
start_timer(); |
start_timer(); |
418 |
|
if(dec->quarterpel) { |
419 |
|
interpolate8x8_quarterpel(dec->cur.y, dec->refn[0].y, dec->refh.y, dec->refh.y + 64, |
420 |
|
dec->refh.y + 128, 16*x_pos, 16*y_pos, |
421 |
|
pMB->mvs[0].x, pMB->mvs[0].y, stride, rounding); |
422 |
|
interpolate8x8_quarterpel(dec->cur.y, dec->refn[0].y, dec->refh.y, dec->refh.y + 64, |
423 |
|
dec->refh.y + 128, 16*x_pos + 8, 16*y_pos, |
424 |
|
pMB->mvs[1].x, pMB->mvs[1].y, stride, rounding); |
425 |
|
interpolate8x8_quarterpel(dec->cur.y, dec->refn[0].y, dec->refh.y, dec->refh.y + 64, |
426 |
|
dec->refh.y + 128, 16*x_pos, 16*y_pos + 8, |
427 |
|
pMB->mvs[2].x, pMB->mvs[2].y, stride, rounding); |
428 |
|
interpolate8x8_quarterpel(dec->cur.y, dec->refn[0].y, dec->refh.y, dec->refh.y + 64, |
429 |
|
dec->refh.y + 128, 16*x_pos + 8, 16*y_pos + 8, |
430 |
|
pMB->mvs[3].x, pMB->mvs[3].y, stride, rounding); |
431 |
|
} |
432 |
|
else { |
433 |
interpolate8x8_switch(dec->cur.y, dec->refn[0].y, 16 * x_pos, 16 * y_pos, |
interpolate8x8_switch(dec->cur.y, dec->refn[0].y, 16 * x_pos, 16 * y_pos, |
434 |
pMB->mvs[0].x, pMB->mvs[0].y, stride, rounding); |
pMB->mvs[0].x, pMB->mvs[0].y, stride, rounding); |
435 |
interpolate8x8_switch(dec->cur.y, dec->refn[0].y, 16 * x_pos + 8, |
interpolate8x8_switch(dec->cur.y, dec->refn[0].y, 16*x_pos + 8, 16*y_pos, |
436 |
16 * y_pos, pMB->mvs[1].x, pMB->mvs[1].y, stride, |
pMB->mvs[1].x, pMB->mvs[1].y, stride, rounding); |
437 |
rounding); |
interpolate8x8_switch(dec->cur.y, dec->refn[0].y, 16*x_pos, 16*y_pos + 8, |
438 |
interpolate8x8_switch(dec->cur.y, dec->refn[0].y, 16 * x_pos, |
pMB->mvs[2].x, pMB->mvs[2].y, stride, rounding); |
439 |
16 * y_pos + 8, pMB->mvs[2].x, pMB->mvs[2].y, stride, |
interpolate8x8_switch(dec->cur.y, dec->refn[0].y, 16*x_pos + 8, 16*y_pos + 8, |
440 |
rounding); |
pMB->mvs[3].x, pMB->mvs[3].y, stride, rounding); |
441 |
interpolate8x8_switch(dec->cur.y, dec->refn[0].y, 16 * x_pos + 8, |
} |
442 |
16 * y_pos + 8, pMB->mvs[3].x, pMB->mvs[3].y, stride, |
|
|
rounding); |
|
443 |
interpolate8x8_switch(dec->cur.u, dec->refn[0].u, 8 * x_pos, 8 * y_pos, |
interpolate8x8_switch(dec->cur.u, dec->refn[0].u, 8 * x_pos, 8 * y_pos, |
444 |
uv_dx, uv_dy, stride2, rounding); |
uv_dx, uv_dy, stride2, rounding); |
445 |
interpolate8x8_switch(dec->cur.v, dec->refn[0].v, 8 * x_pos, 8 * y_pos, |
interpolate8x8_switch(dec->cur.v, dec->refn[0].v, 8 * x_pos, 8 * y_pos, |
446 |
uv_dx, uv_dy, stride2, rounding); |
uv_dx, uv_dy, stride2, rounding); |
447 |
stop_comp_timer(); |
stop_comp_timer(); |
448 |
|
} |
449 |
|
|
450 |
for (i = 0; i < 6; i++) { |
for (i = 0; i < 6; i++) { |
451 |
|
int direction = dec->alternate_vertical_scan ? 2 : 0; |
452 |
|
|
453 |
if (cbp & (1 << (5 - i))) // coded |
if (cbp & (1 << (5 - i))) // coded |
454 |
{ |
{ |
455 |
memset(&block[i * 64], 0, 64 * sizeof(int16_t)); // clear |
memset(&block[i * 64], 0, 64 * sizeof(int16_t)); // clear |
456 |
|
|
457 |
start_timer(); |
start_timer(); |
458 |
get_inter_block(bs, &block[i * 64]); |
get_inter_block(bs, &block[i * 64], direction); |
459 |
stop_coding_timer(); |
stop_coding_timer(); |
460 |
|
|
461 |
start_timer(); |
start_timer(); |
545 |
} |
} |
546 |
} |
} |
547 |
mb->quant = quant; |
mb->quant = quant; |
548 |
|
mb->mvs[0].x = mb->mvs[0].y = |
549 |
|
mb->mvs[1].x = mb->mvs[1].y = |
550 |
|
mb->mvs[2].x = mb->mvs[2].y = |
551 |
|
mb->mvs[3].x = mb->mvs[3].y =0; |
552 |
|
|
553 |
if (dec->interlacing) { |
if (dec->interlacing) { |
554 |
mb->field_dct = BitstreamGetBit(bs); |
mb->field_dct = BitstreamGetBit(bs); |
558 |
decoder_mbintra(dec, mb, x, y, acpred_flag, cbp, bs, quant, |
decoder_mbintra(dec, mb, x, y, acpred_flag, cbp, bs, quant, |
559 |
intra_dc_threshold, bound); |
intra_dc_threshold, bound); |
560 |
} |
} |
561 |
|
if(dec->out_frm) |
562 |
|
output_slice(&dec->cur, dec->edged_width,dec->width,dec->out_frm,0,y,dec->mb_width); |
563 |
|
|
564 |
} |
} |
565 |
|
|
566 |
} |
} |
624 |
|
|
625 |
uint32_t x, y; |
uint32_t x, y; |
626 |
uint32_t bound; |
uint32_t bound; |
627 |
|
int cp_mb, st_mb; |
628 |
|
|
629 |
start_timer(); |
start_timer(); |
630 |
image_setedges(&dec->refn[0], dec->edged_width, dec->edged_height, |
image_setedges(&dec->refn[0], dec->edged_width, dec->edged_height, |
631 |
dec->width, dec->height, dec->interlacing); |
dec->width, dec->height); |
632 |
stop_edges_timer(); |
stop_edges_timer(); |
633 |
|
|
634 |
bound = 0; |
bound = 0; |
635 |
|
|
636 |
for (y = 0; y < dec->mb_height; y++) { |
for (y = 0; y < dec->mb_height; y++) { |
637 |
|
cp_mb = st_mb = 0; |
638 |
for (x = 0; x < dec->mb_width; x++) { |
for (x = 0; x < dec->mb_width; x++) { |
639 |
MACROBLOCK *mb; |
MACROBLOCK *mb; |
640 |
|
|
662 |
uint32_t cbp; |
uint32_t cbp; |
663 |
uint32_t intra; |
uint32_t intra; |
664 |
|
|
665 |
|
cp_mb++; |
666 |
mcbpc = get_mcbpc_inter(bs); |
mcbpc = get_mcbpc_inter(bs); |
667 |
mb->mode = mcbpc & 7; |
mb->mode = mcbpc & 7; |
668 |
cbpc = (mcbpc >> 4); |
cbpc = (mcbpc >> 4); |
696 |
mb->quant = quant; |
mb->quant = quant; |
697 |
|
|
698 |
if (dec->interlacing) { |
if (dec->interlacing) { |
699 |
|
if (cbp || intra) { |
700 |
mb->field_dct = BitstreamGetBit(bs); |
mb->field_dct = BitstreamGetBit(bs); |
701 |
DEBUG1("decp: field_dct: ", mb->field_dct); |
DEBUG1("decp: field_dct: ", mb->field_dct); |
702 |
|
} |
703 |
|
|
704 |
if (mb->mode == MODE_INTER || mb->mode == MODE_INTER_Q) { |
if (mb->mode == MODE_INTER || mb->mode == MODE_INTER_Q) { |
705 |
mb->field_pred = BitstreamGetBit(bs); |
mb->field_pred = BitstreamGetBit(bs); |
728 |
mb->mvs[1].y = mb->mvs[2].y = mb->mvs[3].y = |
mb->mvs[1].y = mb->mvs[2].y = mb->mvs[3].y = |
729 |
mb->mvs[0].y; |
mb->mvs[0].y; |
730 |
} |
} |
731 |
} else if (mb->mode == |
} else if (mb->mode == MODE_INTER4V ) { |
732 |
MODE_INTER4V /* || mb->mode == MODE_INTER4V_Q */ ) { |
|
733 |
get_motion_vector(dec, bs, x, y, 0, &mb->mvs[0], fcode, bound); |
get_motion_vector(dec, bs, x, y, 0, &mb->mvs[0], fcode, bound); |
734 |
get_motion_vector(dec, bs, x, y, 1, &mb->mvs[1], fcode, bound); |
get_motion_vector(dec, bs, x, y, 1, &mb->mvs[1], fcode, bound); |
735 |
get_motion_vector(dec, bs, x, y, 2, &mb->mvs[2], fcode, bound); |
get_motion_vector(dec, bs, x, y, 2, &mb->mvs[2], fcode, bound); |
749 |
rounding); |
rounding); |
750 |
} else // not coded |
} else // not coded |
751 |
{ |
{ |
752 |
//DEBUG2("P-frame MB at (X,Y)=",x,y); |
DEBUG2("P-frame MB at (X,Y)=",x,y); |
753 |
mb->mode = MODE_NOT_CODED; |
mb->mode = MODE_NOT_CODED; |
754 |
mb->mvs[0].x = mb->mvs[1].x = mb->mvs[2].x = mb->mvs[3].x = 0; |
mb->mvs[0].x = mb->mvs[1].x = mb->mvs[2].x = mb->mvs[3].x = 0; |
755 |
mb->mvs[0].y = mb->mvs[1].y = mb->mvs[2].y = mb->mvs[3].y = 0; |
mb->mvs[0].y = mb->mvs[1].y = mb->mvs[2].y = mb->mvs[3].y = 0; |
791 |
dec->refn[0].v + |
dec->refn[0].v + |
792 |
(8 * y) * dec->edged_width / 2 + (8 * x), |
(8 * y) * dec->edged_width / 2 + (8 * x), |
793 |
dec->edged_width / 2); |
dec->edged_width / 2); |
|
|
|
794 |
stop_transfer_timer(); |
stop_transfer_timer(); |
795 |
|
if(dec->out_frm && cp_mb > 0) { |
796 |
|
output_slice(&dec->cur, dec->edged_width,dec->width,dec->out_frm,st_mb,y,cp_mb); |
797 |
|
cp_mb = 0; |
798 |
|
} |
799 |
|
st_mb = x+1; |
800 |
} |
} |
801 |
} |
} |
802 |
|
if(dec->out_frm && cp_mb > 0) |
803 |
|
output_slice(&dec->cur, dec->edged_width,dec->width,dec->out_frm,st_mb,y,cp_mb); |
804 |
} |
} |
805 |
} |
} |
806 |
|
|
878 |
pU_Cur = dec->cur.u + (y_pos << 3) * stride2 + (x_pos << 3); |
pU_Cur = dec->cur.u + (y_pos << 3) * stride2 + (x_pos << 3); |
879 |
pV_Cur = dec->cur.v + (y_pos << 3) * stride2 + (x_pos << 3); |
pV_Cur = dec->cur.v + (y_pos << 3) * stride2 + (x_pos << 3); |
880 |
|
|
881 |
|
|
882 |
if (!(pMB->mode == MODE_INTER || pMB->mode == MODE_INTER_Q)) { |
if (!(pMB->mode == MODE_INTER || pMB->mode == MODE_INTER_Q)) { |
883 |
uv_dx = pMB->mvs[0].x; |
uv_dx = pMB->mvs[0].x; |
884 |
uv_dy = pMB->mvs[0].y; |
uv_dy = pMB->mvs[0].y; |
919 |
stop_comp_timer(); |
stop_comp_timer(); |
920 |
|
|
921 |
for (i = 0; i < 6; i++) { |
for (i = 0; i < 6; i++) { |
922 |
|
int direction = dec->alternate_vertical_scan ? 2 : 0; |
923 |
|
|
924 |
if (cbp & (1 << (5 - i))) // coded |
if (cbp & (1 << (5 - i))) // coded |
925 |
{ |
{ |
926 |
memset(&block[i * 64], 0, 64 * sizeof(int16_t)); // clear |
memset(&block[i * 64], 0, 64 * sizeof(int16_t)); // clear |
927 |
|
|
928 |
start_timer(); |
start_timer(); |
929 |
get_inter_block(bs, &block[i * 64]); |
get_inter_block(bs, &block[i * 64], direction); |
930 |
stop_coding_timer(); |
stop_coding_timer(); |
931 |
|
|
932 |
start_timer(); |
start_timer(); |
974 |
const MACROBLOCK * pMB, |
const MACROBLOCK * pMB, |
975 |
const uint32_t x_pos, |
const uint32_t x_pos, |
976 |
const uint32_t y_pos, |
const uint32_t y_pos, |
|
const uint32_t cbp, |
|
977 |
Bitstream * bs) |
Bitstream * bs) |
978 |
{ |
{ |
979 |
|
|
988 |
int b_uv_dx, b_uv_dy; |
int b_uv_dx, b_uv_dy; |
989 |
uint32_t i; |
uint32_t i; |
990 |
uint8_t *pY_Cur, *pU_Cur, *pV_Cur; |
uint8_t *pY_Cur, *pU_Cur, *pV_Cur; |
991 |
|
const uint32_t cbp = pMB->cbp; |
992 |
|
|
993 |
pY_Cur = dec->cur.y + (y_pos << 4) * stride + (x_pos << 4); |
pY_Cur = dec->cur.y + (y_pos << 4) * stride + (x_pos << 4); |
994 |
pU_Cur = dec->cur.u + (y_pos << 3) * stride2 + (x_pos << 3); |
pU_Cur = dec->cur.u + (y_pos << 3) * stride2 + (x_pos << 3); |
995 |
pV_Cur = dec->cur.v + (y_pos << 3) * stride2 + (x_pos << 3); |
pV_Cur = dec->cur.v + (y_pos << 3) * stride2 + (x_pos << 3); |
996 |
|
|
997 |
|
|
998 |
if ((pMB->mode == MODE_INTER || pMB->mode == MODE_INTER_Q)) { |
if ((pMB->mode == MODE_INTER || pMB->mode == MODE_INTER_Q)) { |
999 |
uv_dx = pMB->mvs[0].x; |
uv_dx = pMB->mvs[0].x; |
1000 |
uv_dy = pMB->mvs[0].y; |
uv_dy = pMB->mvs[0].y; |
1072 |
interpolate8x8_switch(dec->refn[2].v, backward.v, 8 * x_pos, 8 * y_pos, |
interpolate8x8_switch(dec->refn[2].v, backward.v, 8 * x_pos, 8 * y_pos, |
1073 |
b_uv_dx, b_uv_dy, stride2, 0); |
b_uv_dx, b_uv_dy, stride2, 0); |
1074 |
|
|
1075 |
interpolate8x8_c(dec->cur.y, dec->refn[2].y, 16 * x_pos, 16 * y_pos, |
interpolate8x8_avg2(dec->cur.y + (16 * y_pos * stride) + 16 * x_pos, |
1076 |
stride); |
dec->cur.y + (16 * y_pos * stride) + 16 * x_pos, |
1077 |
interpolate8x8_c(dec->cur.y, dec->refn[2].y, 16 * x_pos + 8, 16 * y_pos, |
dec->refn[2].y + (16 * y_pos * stride) + 16 * x_pos, |
1078 |
stride); |
stride, 0); |
1079 |
interpolate8x8_c(dec->cur.y, dec->refn[2].y, 16 * x_pos, 16 * y_pos + 8, |
|
1080 |
stride); |
interpolate8x8_avg2(dec->cur.y + (16 * y_pos * stride) + 16 * x_pos + 8, |
1081 |
interpolate8x8_c(dec->cur.y, dec->refn[2].y, 16 * x_pos + 8, |
dec->cur.y + (16 * y_pos * stride) + 16 * x_pos + 8, |
1082 |
16 * y_pos + 8, stride); |
dec->refn[2].y + (16 * y_pos * stride) + 16 * x_pos + 8, |
1083 |
interpolate8x8_c(dec->cur.u, dec->refn[2].u, 8 * x_pos, 8 * y_pos, |
stride, 0); |
1084 |
stride2); |
|
1085 |
interpolate8x8_c(dec->cur.v, dec->refn[2].v, 8 * x_pos, 8 * y_pos, |
interpolate8x8_avg2(dec->cur.y + (16 * (y_pos + 8) * stride) + 16 * x_pos, |
1086 |
stride2); |
dec->cur.y + (16 * (y_pos + 8) * stride) + 16 * x_pos, |
1087 |
|
dec->refn[2].y + (16 * (y_pos + 8) * stride) + 16 * x_pos, |
1088 |
|
stride, 0); |
1089 |
|
|
1090 |
|
interpolate8x8_avg2(dec->cur.y + (16 * (y_pos + 8) * stride) + 16 * x_pos + 8, |
1091 |
|
dec->cur.y + (16 * (y_pos + 8) * stride) + 16 * x_pos + 8, |
1092 |
|
dec->refn[2].y + (16 * (y_pos + 8) * stride) + 16 * x_pos + 8, |
1093 |
|
stride, 0); |
1094 |
|
|
1095 |
|
interpolate8x8_avg2(dec->cur.u + (8 * y_pos * stride) + 8 * x_pos, |
1096 |
|
dec->cur.u + (8 * y_pos * stride) + 8 * x_pos, |
1097 |
|
dec->refn[2].u + (8 * y_pos * stride) + 8 * x_pos, |
1098 |
|
stride2, 0); |
1099 |
|
|
1100 |
|
interpolate8x8_avg2(dec->cur.v + (8 * y_pos * stride) + 8 * x_pos, |
1101 |
|
dec->cur.v + (8 * y_pos * stride) + 8 * x_pos, |
1102 |
|
dec->refn[2].v + (8 * y_pos * stride) + 8 * x_pos, |
1103 |
|
stride2, 0); |
1104 |
|
|
1105 |
stop_comp_timer(); |
stop_comp_timer(); |
1106 |
|
|
1107 |
for (i = 0; i < 6; i++) { |
for (i = 0; i < 6; i++) { |
1108 |
|
int direction = dec->alternate_vertical_scan ? 2 : 0; |
1109 |
|
|
1110 |
if (cbp & (1 << (5 - i))) // coded |
if (cbp & (1 << (5 - i))) // coded |
1111 |
{ |
{ |
1112 |
memset(&block[i * 64], 0, 64 * sizeof(int16_t)); // clear |
memset(&block[i * 64], 0, 64 * sizeof(int16_t)); // clear |
1113 |
|
|
1114 |
start_timer(); |
start_timer(); |
1115 |
get_inter_block(bs, &block[i * 64]); |
get_inter_block(bs, &block[i * 64], direction); |
1116 |
stop_coding_timer(); |
stop_coding_timer(); |
1117 |
|
|
1118 |
start_timer(); |
start_timer(); |
1194 |
int fcode_forward, |
int fcode_forward, |
1195 |
int fcode_backward) |
int fcode_backward) |
1196 |
{ |
{ |
|
|
|
1197 |
uint32_t x, y; |
uint32_t x, y; |
1198 |
VECTOR mv, zeromv; |
VECTOR mv; |
1199 |
|
const VECTOR zeromv = {0,0}; |
1200 |
|
#ifdef BFRAMES_DEC_DEBUG |
1201 |
|
FILE *fp; |
1202 |
|
static char first=0; |
1203 |
|
#define BFRAME_DEBUG if (!first && fp){ \ |
1204 |
|
fprintf(fp,"Y=%3d X=%3d MB=%2d CBP=%02X\n",y,x,mb->mb_type,mb->cbp); \ |
1205 |
|
} |
1206 |
|
#endif |
1207 |
|
|
1208 |
start_timer(); |
start_timer(); |
1209 |
image_setedges(&dec->refn[0], dec->edged_width, dec->edged_height, |
image_setedges(&dec->refn[0], dec->edged_width, dec->edged_height, |
1210 |
dec->width, dec->height, dec->interlacing); |
dec->width, dec->height); |
1211 |
//image_setedges(&dec->refn[1], dec->edged_width, dec->edged_height, dec->width, dec->height, dec->interlacing); |
image_setedges(&dec->refn[1], dec->edged_width, dec->edged_height, |
1212 |
|
dec->width, dec->height); |
1213 |
stop_edges_timer(); |
stop_edges_timer(); |
1214 |
|
|
1215 |
|
#ifdef BFRAMES_DEC_DEBUG |
1216 |
|
if (!first){ |
1217 |
|
fp=fopen("C:\\XVIDDBG.TXT","w"); |
1218 |
|
} |
1219 |
|
#endif |
1220 |
|
|
1221 |
for (y = 0; y < dec->mb_height; y++) { |
for (y = 0; y < dec->mb_height; y++) { |
1222 |
// Initialize Pred Motion Vector |
// Initialize Pred Motion Vector |
1223 |
dec->p_fmv.x = dec->p_fmv.y = dec->p_bmv.x = dec->p_bmv.y = 0; |
dec->p_fmv = dec->p_bmv = zeromv; |
1224 |
for (x = 0; x < dec->mb_width; x++) { |
for (x = 0; x < dec->mb_width; x++) { |
1225 |
MACROBLOCK *mb = &dec->mbs[y * dec->mb_width + x]; |
MACROBLOCK *mb = &dec->mbs[y * dec->mb_width + x]; |
1226 |
MACROBLOCK *last_mb = &dec->last_mbs[y * dec->mb_width + x]; |
MACROBLOCK *last_mb = &dec->last_mbs[y * dec->mb_width + x]; |
1227 |
|
|
1228 |
mb->mvs[0].x = mb->mvs[0].y = zeromv.x = zeromv.y = mv.x = mv.y = |
mv = |
1229 |
0; |
mb->b_mvs[0] = mb->b_mvs[1] = mb->b_mvs[2] = mb->b_mvs[3] = |
1230 |
|
mb->mvs[0] = mb->mvs[1] = mb->mvs[2] = mb->mvs[3] = zeromv; |
1231 |
|
|
1232 |
// the last P_VOP is skip macroblock ? |
// the last P_VOP is skip macroblock ? |
1233 |
if (last_mb->mode == MODE_NOT_CODED) { |
if (last_mb->mode == MODE_NOT_CODED) { |
1234 |
//DEBUG2("Skip MB in B-frame at (X,Y)=!",x,y); |
//DEBUG2("Skip MB in B-frame at (X,Y)=!",x,y); |
|
mb->mb_type = MODE_FORWARD; |
|
1235 |
mb->cbp = 0; |
mb->cbp = 0; |
1236 |
mb->mvs[1].x = mb->mvs[2].x = mb->mvs[3].x = mb->mvs[0].x; |
#ifdef BFRAMES_DEC_DEBUG |
1237 |
mb->mvs[1].y = mb->mvs[2].y = mb->mvs[3].y = mb->mvs[0].y; |
mb->mb_type = MODE_NOT_CODED; |
1238 |
mb->quant = 8; |
BFRAME_DEBUG |
1239 |
|
#endif |
1240 |
|
mb->mb_type = MODE_FORWARD; |
1241 |
|
mb->quant = last_mb->quant; |
1242 |
|
//mb->mvs[1].x = mb->mvs[2].x = mb->mvs[3].x = mb->mvs[0].x; |
1243 |
|
//mb->mvs[1].y = mb->mvs[2].y = mb->mvs[3].y = mb->mvs[0].y; |
1244 |
|
|
1245 |
decoder_bf_mbinter(dec, mb, x, y, mb->cbp, bs, quant, 1); |
decoder_bf_mbinter(dec, mb, x, y, mb->cbp, bs, mb->quant, 1); |
1246 |
continue; |
continue; |
1247 |
} |
} |
|
//t=BitstreamShowBits(bs,32); |
|
1248 |
|
|
1249 |
if (!BitstreamGetBit(bs)) { // modb=='0' |
if (!BitstreamGetBit(bs)) { // modb=='0' |
1250 |
const uint8_t modb2 = BitstreamGetBit(bs); |
const uint8_t modb2 = BitstreamGetBit(bs); |
1264 |
} else if (quant < 1) { |
} else if (quant < 1) { |
1265 |
quant = 1; |
quant = 1; |
1266 |
} |
} |
|
} else { |
|
|
quant = 8; |
|
1267 |
} |
} |
|
mb->quant = quant; |
|
1268 |
} else { |
} else { |
1269 |
mb->mb_type = MODE_DIRECT_NONE_MV; |
mb->mb_type = MODE_DIRECT_NONE_MV; |
1270 |
mb->cbp = 0; |
mb->cbp = 0; |
1271 |
} |
} |
1272 |
|
|
1273 |
mb->mode = MODE_INTER; |
mb->quant = quant; |
1274 |
|
mb->mode = MODE_INTER4V; |
1275 |
//DEBUG1("Switch bm_type=",mb->mb_type); |
//DEBUG1("Switch bm_type=",mb->mb_type); |
1276 |
|
|
1277 |
|
#ifdef BFRAMES_DEC_DEBUG |
1278 |
|
BFRAME_DEBUG |
1279 |
|
#endif |
1280 |
|
|
1281 |
switch (mb->mb_type) { |
switch (mb->mb_type) { |
1282 |
case MODE_DIRECT: |
case MODE_DIRECT: |
1283 |
get_b_motion_vector(dec, bs, x, y, &mb->mvs[0], 1, zeromv); |
get_b_motion_vector(dec, bs, x, y, &mv, 1, zeromv); |
1284 |
|
|
1285 |
case MODE_DIRECT_NONE_MV: |
case MODE_DIRECT_NONE_MV: |
1286 |
{ // Because this file is a C file not C++ so I use '{' to define var |
{ |
1287 |
const int64_t TRB = dec->time_pp - dec->time_bp, TRD = |
const int64_t TRB = dec->time_pp - dec->time_bp, TRD = dec->time_pp; |
|
dec->time_pp; |
|
1288 |
int i; |
int i; |
1289 |
|
|
1290 |
for (i = 0; i < 4; i++) { |
for (i = 0; i < 4; i++) { |
1291 |
mb->mvs[i].x = |
mb->mvs[i].x = (int32_t) ((TRB * last_mb->mvs[i].x) |
1292 |
(int32_t) ((TRB * last_mb->mvs[i].x) / TRD + |
/ TRD + mv.x); |
1293 |
mb->mvs[0].x); |
mb->b_mvs[i].x = (int32_t) ((mv.x == 0) |
1294 |
mb->b_mvs[i].x = |
? ((TRB - TRD) * last_mb->mvs[i].x) |
1295 |
(int32_t) ((mb->mvs[0].x == |
/ TRD |
1296 |
0) ? ((TRB - |
: mb->mvs[i].x - last_mb->mvs[i].x); |
1297 |
TRD) * last_mb->mvs[i].x) / |
mb->mvs[i].y = (int32_t) ((TRB * last_mb->mvs[i].y) |
1298 |
TRD : mb->mvs[i].x - last_mb->mvs[i].x); |
/ TRD + mv.y); |
1299 |
mb->mvs[i].y = |
mb->b_mvs[i].y = (int32_t) ((mv.y == 0) |
1300 |
(int32_t) ((TRB * last_mb->mvs[i].y) / TRD + |
? ((TRB - TRD) * last_mb->mvs[i].y) |
1301 |
mb->mvs[0].y); |
/ TRD |
1302 |
mb->b_mvs[i].y = |
: mb->mvs[i].y - last_mb->mvs[i].y); |
|
(int32_t) ((mb->mvs[0].y == |
|
|
0) ? ((TRB - |
|
|
TRD) * last_mb->mvs[i].y) / |
|
|
TRD : mb->mvs[i].y - last_mb->mvs[i].y); |
|
1303 |
} |
} |
1304 |
//DEBUG("B-frame Direct!\n"); |
//DEBUG("B-frame Direct!\n"); |
1305 |
} |
} |
|
mb->mode = MODE_INTER4V; |
|
1306 |
decoder_bf_interpolate_mbinter(dec, dec->refn[1], dec->refn[0], |
decoder_bf_interpolate_mbinter(dec, dec->refn[1], dec->refn[0], |
1307 |
mb, x, y, mb->cbp, bs); |
mb, x, y, bs); |
1308 |
break; |
break; |
1309 |
|
|
1310 |
case MODE_INTERPOLATE: |
case MODE_INTERPOLATE: |
1311 |
get_b_motion_vector(dec, bs, x, y, &mb->mvs[0], fcode_forward, |
get_b_motion_vector(dec, bs, x, y, &mb->mvs[0], fcode_forward, |
1312 |
dec->p_fmv); |
dec->p_fmv); |
1313 |
dec->p_fmv.x = mb->mvs[1].x = mb->mvs[2].x = mb->mvs[3].x = |
dec->p_fmv = mb->mvs[1] = mb->mvs[2] = mb->mvs[3] = mb->mvs[0]; |
|
mb->mvs[0].x; |
|
|
dec->p_fmv.y = mb->mvs[1].y = mb->mvs[2].y = mb->mvs[3].y = |
|
|
mb->mvs[0].y; |
|
1314 |
|
|
1315 |
get_b_motion_vector(dec, bs, x, y, &mb->b_mvs[0], |
get_b_motion_vector(dec, bs, x, y, &mb->b_mvs[0], |
1316 |
fcode_backward, dec->p_bmv); |
fcode_backward, dec->p_bmv); |
1317 |
dec->p_bmv.x = mb->b_mvs[1].x = mb->b_mvs[2].x = |
dec->p_bmv = mb->b_mvs[1] = mb->b_mvs[2] = |
1318 |
mb->b_mvs[3].x = mb->b_mvs[0].x; |
mb->b_mvs[3] = mb->b_mvs[0]; |
|
dec->p_bmv.y = mb->b_mvs[1].y = mb->b_mvs[2].y = |
|
|
mb->b_mvs[3].y = mb->b_mvs[0].y; |
|
1319 |
|
|
1320 |
decoder_bf_interpolate_mbinter(dec, dec->refn[1], dec->refn[0], |
decoder_bf_interpolate_mbinter(dec, dec->refn[1], dec->refn[0], |
1321 |
mb, x, y, mb->cbp, bs); |
mb, x, y, bs); |
1322 |
//DEBUG("B-frame Bidir!\n"); |
//DEBUG("B-frame Bidir!\n"); |
1323 |
break; |
break; |
1324 |
|
|
1325 |
case MODE_BACKWARD: |
case MODE_BACKWARD: |
1326 |
get_b_motion_vector(dec, bs, x, y, &mb->mvs[0], fcode_backward, |
get_b_motion_vector(dec, bs, x, y, &mb->mvs[0], fcode_backward, |
1327 |
dec->p_bmv); |
dec->p_bmv); |
1328 |
dec->p_bmv.x = mb->mvs[1].x = mb->mvs[2].x = mb->mvs[3].x = |
dec->p_bmv = mb->mvs[1] = mb->mvs[2] = mb->mvs[3] = mb->mvs[0]; |
|
mb->mvs[0].x; |
|
|
dec->p_bmv.y = mb->mvs[1].y = mb->mvs[2].y = mb->mvs[3].y = |
|
|
mb->mvs[0].y; |
|
1329 |
|
|
1330 |
|
mb->mode = MODE_INTER; |
1331 |
decoder_bf_mbinter(dec, mb, x, y, mb->cbp, bs, quant, 0); |
decoder_bf_mbinter(dec, mb, x, y, mb->cbp, bs, quant, 0); |
1332 |
//DEBUG("B-frame Backward!\n"); |
//DEBUG("B-frame Backward!\n"); |
1333 |
break; |
break; |
1335 |
case MODE_FORWARD: |
case MODE_FORWARD: |
1336 |
get_b_motion_vector(dec, bs, x, y, &mb->mvs[0], fcode_forward, |
get_b_motion_vector(dec, bs, x, y, &mb->mvs[0], fcode_forward, |
1337 |
dec->p_fmv); |
dec->p_fmv); |
1338 |
dec->p_fmv.x = mb->mvs[1].x = mb->mvs[2].x = mb->mvs[3].x = |
dec->p_fmv = mb->mvs[1] = mb->mvs[2] = mb->mvs[3] = mb->mvs[0]; |
|
mb->mvs[0].x; |
|
|
dec->p_fmv.y = mb->mvs[1].y = mb->mvs[2].y = mb->mvs[3].y = |
|
|
mb->mvs[0].y; |
|
1339 |
|
|
1340 |
|
mb->mode = MODE_INTER; |
1341 |
decoder_bf_mbinter(dec, mb, x, y, mb->cbp, bs, quant, 1); |
decoder_bf_mbinter(dec, mb, x, y, mb->cbp, bs, quant, 1); |
1342 |
//DEBUG("B-frame Forward!\n"); |
//DEBUG("B-frame Forward!\n"); |
1343 |
break; |
break; |
1348 |
|
|
1349 |
} // end of FOR |
} // end of FOR |
1350 |
} |
} |
1351 |
|
#ifdef BFRAMES_DEC_DEBUG |
1352 |
|
if (!first){ |
1353 |
|
first=1; |
1354 |
|
if (fp) |
1355 |
|
fclose(fp); |
1356 |
|
} |
1357 |
|
#endif |
1358 |
} |
} |
1359 |
|
|
1360 |
// swap two MACROBLOCK array |
// swap two MACROBLOCK array |
1383 |
|
|
1384 |
start_global_timer(); |
start_global_timer(); |
1385 |
|
|
1386 |
|
dec->out_frm = (frame->colorspace == XVID_CSP_EXTERN) ? frame->image : NULL; |
1387 |
|
|
1388 |
BitstreamInit(&bs, frame->bitstream, frame->length); |
BitstreamInit(&bs, frame->bitstream, frame->length); |
1389 |
|
|
1390 |
// add by chenm001 <chenm001@163.com> |
// add by chenm001 <chenm001@163.com> |
1434 |
return XVID_ERR_FAIL; |
return XVID_ERR_FAIL; |
1435 |
} |
} |
1436 |
|
|
1437 |
|
#ifdef BFRAMES_DEC_DEBUG |
1438 |
|
if (frame->length != BitstreamPos(&bs) / 8){ |
1439 |
|
DEBUG2("InLen/UseLen",frame->length, BitstreamPos(&bs) / 8); |
1440 |
|
} |
1441 |
|
#endif |
1442 |
frame->length = BitstreamPos(&bs) / 8; |
frame->length = BitstreamPos(&bs) / 8; |
1443 |
|
|
1444 |
|
|
1445 |
#ifdef BFRAMES_DEC |
#ifdef BFRAMES_DEC |
1446 |
// test if no B_VOP |
// test if no B_VOP |
1447 |
if (dec->low_delay) { |
if (dec->low_delay || dec->frames == 0) { |
1448 |
#endif |
#endif |
1449 |
image_output(&dec->cur, dec->width, dec->height, dec->edged_width, |
image_output(&dec->cur, dec->width, dec->height, dec->edged_width, |
1450 |
frame->image, frame->stride, frame->colorspace); |
frame->image, frame->stride, frame->colorspace); |
1451 |
|
|
1452 |
#ifdef BFRAMES_DEC |
#ifdef BFRAMES_DEC |
1453 |
} else { |
} else { |
1454 |
if (dec->frames >= 1) { |
if (dec->frames >= 1) { |
1470 |
if (vop_type == I_VOP || vop_type == P_VOP) { |
if (vop_type == I_VOP || vop_type == P_VOP) { |
1471 |
image_swap(&dec->refn[0], &dec->refn[1]); |
image_swap(&dec->refn[0], &dec->refn[1]); |
1472 |
image_swap(&dec->cur, &dec->refn[0]); |
image_swap(&dec->cur, &dec->refn[0]); |
1473 |
|
|
1474 |
// swap MACROBLOCK |
// swap MACROBLOCK |
1475 |
if (dec->low_delay && vop_type == P_VOP) |
// DivX sometimes does not set the low_delay flag, |
1476 |
|
// so the following check would wrongly skip the swap in that case; |
1477 |
|
// this would break the bitstream, so I changed it. |
1478 |
|
// But that is not the best way! can anyone tell me how |
1479 |
|
// to do another way? |
1480 |
|
// 18-07-2002 MinChen<chenm001@163.com> |
1481 |
|
//if (!dec->low_delay && vop_type == P_VOP) |
1482 |
|
if (vop_type == P_VOP) |
1483 |
mb_swap(&dec->mbs, &dec->last_mbs); |
mb_swap(&dec->mbs, &dec->last_mbs); |
1484 |
} |
} |
1485 |
|
|