302 |
dev16 = dev16_c; |
dev16 = dev16_c; |
303 |
sad16v = sad16v_c; |
sad16v = sad16v_c; |
304 |
sse8_16bit = sse8_16bit_c; |
sse8_16bit = sse8_16bit_c; |
305 |
|
sse8_8bit = sse8_8bit_c; |
306 |
|
|
307 |
#if defined(ARCH_IS_IA32) |
#if defined(ARCH_IS_IA32) |
308 |
|
|
398 |
dev16 = dev16_mmx; |
dev16 = dev16_mmx; |
399 |
sad16v = sad16v_mmx; |
sad16v = sad16v_mmx; |
400 |
sse8_16bit = sse8_16bit_mmx; |
sse8_16bit = sse8_16bit_mmx; |
401 |
|
sse8_8bit = sse8_8bit_mmx; |
402 |
} |
} |
403 |
|
|
404 |
/* these 3dnow functions are faster than mmx, but slower than xmm. */ |
/* these 3dnow functions are faster than mmx, but slower than xmm. */ |
464 |
|
|
465 |
if ((cpu_flags & XVID_CPU_3DNOWEXT)) { |
if ((cpu_flags & XVID_CPU_3DNOWEXT)) { |
466 |
|
|
|
/* Inverse DCT */ |
|
|
idct = idct_3dne; |
|
|
|
|
467 |
/* Buffer transfer */ |
/* Buffer transfer */ |
468 |
transfer_8to16copy = transfer_8to16copy_3dne; |
transfer_8to16copy = transfer_8to16copy_3dne; |
469 |
transfer_16to8copy = transfer_16to8copy_3dne; |
transfer_16to8copy = transfer_16to8copy_3dne; |
470 |
transfer_8to16sub = transfer_8to16sub_3dne; |
transfer_8to16sub = transfer_8to16sub_3dne; |
471 |
transfer_8to16subro = transfer_8to16subro_3dne; |
transfer_8to16subro = transfer_8to16subro_3dne; |
|
transfer_8to16sub2 = transfer_8to16sub2_3dne; |
|
472 |
transfer_16to8add = transfer_16to8add_3dne; |
transfer_16to8add = transfer_16to8add_3dne; |
473 |
transfer8x8_copy = transfer8x8_copy_3dne; |
transfer8x8_copy = transfer8x8_copy_3dne; |
474 |
|
|
475 |
|
if ((cpu_flags & XVID_CPU_MMXEXT)) { |
476 |
|
/* Inverse DCT */ |
477 |
|
idct = idct_3dne; |
478 |
|
|
479 |
|
/* Buffer transfer */ |
480 |
|
transfer_8to16sub2 = transfer_8to16sub2_3dne; |
481 |
|
|
482 |
|
/* Interpolation */ |
483 |
|
interpolate8x8_halfpel_h = interpolate8x8_halfpel_h_3dne; |
484 |
|
interpolate8x8_halfpel_v = interpolate8x8_halfpel_v_3dne; |
485 |
|
interpolate8x8_halfpel_hv = interpolate8x8_halfpel_hv_3dne; |
486 |
|
|
487 |
/* Quantization */ |
/* Quantization */ |
488 |
quant_h263_intra = quant_h263_intra_3dne; |
quant_h263_intra = quant_h263_intra_3dne; /* cmov only */ |
489 |
quant_h263_inter = quant_h263_inter_3dne; |
quant_h263_inter = quant_h263_inter_3dne; |
490 |
dequant_mpeg_intra = dequant_mpeg_intra_3dne; |
dequant_mpeg_intra = dequant_mpeg_intra_3dne; /* cmov only */ |
491 |
dequant_mpeg_inter = dequant_mpeg_inter_3dne; |
dequant_mpeg_inter = dequant_mpeg_inter_3dne; |
492 |
dequant_h263_intra = dequant_h263_intra_3dne; |
dequant_h263_intra = dequant_h263_intra_3dne; |
493 |
dequant_h263_inter = dequant_h263_inter_3dne; |
dequant_h263_inter = dequant_h263_inter_3dne; |
494 |
|
|
495 |
/* ME functions */ |
/* ME functions */ |
496 |
calc_cbp = calc_cbp_3dne; |
calc_cbp = calc_cbp_3dne; |
497 |
|
|
498 |
sad16 = sad16_3dne; |
sad16 = sad16_3dne; |
499 |
sad8 = sad8_3dne; |
sad8 = sad8_3dne; |
500 |
sad16bi = sad16bi_3dne; |
sad16bi = sad16bi_3dne; |
501 |
sad8bi = sad8bi_3dne; |
sad8bi = sad8bi_3dne; |
502 |
dev16 = dev16_3dne; |
dev16 = dev16_3dne; |
503 |
|
} |
|
/* Interpolation */ |
|
|
interpolate8x8_halfpel_h = interpolate8x8_halfpel_h_3dne; |
|
|
interpolate8x8_halfpel_v = interpolate8x8_halfpel_v_3dne; |
|
|
interpolate8x8_halfpel_hv = interpolate8x8_halfpel_hv_3dne; |
|
504 |
} |
} |
505 |
|
|
506 |
if ((cpu_flags & XVID_CPU_SSE2)) { |
if ((cpu_flags & XVID_CPU_SSE2)) { |