35 |
/* forces second pass not to be bigger than first */ |
/* forces second pass not to be bigger than first */ |
36 |
#undef PASS_SMALLER |
#undef PASS_SMALLER |
37 |
|
|
38 |
/* automtically alters overflow controls (strength and improvement/degradation) |
/* automatically alters overflow controls (strength and improvement/degradation) |
39 |
to fight most common problems without user's knowladge */ |
to fight most common problems without user's knowledge */ |
40 |
#define SMART_OVERFLOW_SETTING |
#define SMART_OVERFLOW_SETTING |
41 |
|
|
177 |
twopass_stat_t * stats; |
twopass_stat_t * stats; |
178 |
|
|
179 |
/*---------------------------------- |
/*---------------------------------- |
180 |
* Histerysis helpers |
* Hysteresis helpers |
181 |
*--------------------------------*/ |
*--------------------------------*/ |
182 |
|
|
183 |
/* This field holds the int2float conversion errors of each quant per |
/* This field holds the int2float conversion errors of each quant per |
270 |
static void first_pass_stats_prepare_data(rc_2pass2_t * rc); |
static void first_pass_stats_prepare_data(rc_2pass2_t * rc); |
271 |
static void first_pass_scale_curve_internal(rc_2pass2_t *rc); |
static void first_pass_scale_curve_internal(rc_2pass2_t *rc); |
272 |
static void scaled_curve_apply_advanced_parameters(rc_2pass2_t * rc); |
static void scaled_curve_apply_advanced_parameters(rc_2pass2_t * rc); |
273 |
|
static int check_curve_for_vbv_compliancy(rc_2pass2_t * rc, const float fps); |
274 |
|
static int scale_curve_for_vbv_compliancy(rc_2pass2_t * rc, const float fps); |
275 |
#if 0 |
#if 0 |
276 |
static void stats_print(rc_2pass2_t * rc); |
static void stats_print(rc_2pass2_t * rc); |
277 |
#endif |
#endif |
290 |
if (rc == NULL) |
if (rc == NULL) |
291 |
return XVID_ERR_MEMORY; |
return XVID_ERR_MEMORY; |
292 |
|
|
293 |
rc->param = *param; |
/* v1.0.x */ |
294 |
|
rc->param.version = param->version; |
295 |
|
rc->param.bitrate = param->bitrate; |
296 |
|
rc->param.filename = param->filename; |
297 |
|
rc->param.keyframe_boost = param->keyframe_boost; |
298 |
|
rc->param.curve_compression_high = param->curve_compression_high; |
299 |
|
rc->param.curve_compression_low = param->curve_compression_low; |
300 |
|
rc->param.overflow_control_strength = param->overflow_control_strength; |
301 |
|
rc->param.max_overflow_improvement = param->max_overflow_improvement; |
302 |
|
rc->param.max_overflow_degradation = param->max_overflow_degradation; |
303 |
|
rc->param.kfreduction = param->kfreduction; |
304 |
|
rc->param.kfthreshold = param->kfthreshold; |
305 |
|
rc->param.container_frame_overhead = param->container_frame_overhead; |
306 |
|
|
307 |
|
if (XVID_VERSION_MINOR(param->version) >= 1) { |
308 |
|
rc->param.vbv_size = param->vbv_size; |
309 |
|
rc->param.vbv_initial = param->vbv_initial; |
310 |
|
rc->param.vbv_maxrate = param->vbv_maxrate; |
311 |
|
rc->param.vbv_peakrate = param->vbv_peakrate; |
312 |
|
}else{ |
313 |
|
rc->param.vbv_size = |
314 |
|
rc->param.vbv_initial = |
315 |
|
rc->param.vbv_maxrate = |
316 |
|
rc->param.vbv_peakrate = 0; |
317 |
|
} |
318 |
|
|
319 |
/* Initialize all defaults */ |
/* Initialize all defaults */ |
320 |
#define _INIT(a, b) if((a) <= 0) (a) = (b) |
#define _INIT(a, b) if((a) <= 0) (a) = (b) |
452 |
* shape the curve in the BEFORE/AFTER pair of functions */ |
* shape the curve in the BEFORE/AFTER pair of functions */ |
453 |
scaled_curve_apply_advanced_parameters(rc); |
scaled_curve_apply_advanced_parameters(rc); |
454 |
|
|
455 |
|
/* Check curve for VBV compliancy and rescale if necessary */ |
456 |
|
#ifdef VBV_FORCE |
457 |
|
if (rc->param.vbv_size==0) { |
458 |
|
rc->param.vbv_size = 3145728; |
459 |
|
rc->param.vbv_initial = 2359296; |
460 |
|
rc->param.vbv_maxrate = 4854000; |
461 |
|
rc->param.vbv_peakrate = 8000000; |
462 |
|
} |
463 |
|
#endif |
464 |
|
|
465 |
|
/* vbv_size==0 switches VBV check off */ |
466 |
|
if (rc->param.vbv_size > 0) { |
467 |
|
const double fps = (double)create->fbase/(double)create->fincr; |
468 |
|
int status = check_curve_for_vbv_compliancy(rc, fps); |
469 |
|
|
470 |
|
if (status) { |
471 |
|
DPRINTF(XVID_DEBUG_RC, "[xvid rc] Underflow detected - Scaling Curve for compliancy.\n"); |
472 |
|
} |
473 |
|
|
474 |
|
status = scale_curve_for_vbv_compliancy(rc, fps); |
475 |
|
|
476 |
|
if (status == 0) { |
477 |
|
DPRINTF(XVID_DEBUG_RC, "[xvid rc] VBV compliant curve scaling done.\n"); |
478 |
|
} else { |
479 |
|
DPRINTF(XVID_DEBUG_RC, "[xvid rc] VBV compliant curve scaling impossible.\n"); |
480 |
|
} |
481 |
|
} |
482 |
*handle = rc; |
*handle = rc; |
483 |
return(0); |
return(0); |
484 |
} |
} |
857 |
rc->KFoverflow -= rc->KFoverflow_partial; |
rc->KFoverflow -= rc->KFoverflow_partial; |
858 |
} |
} |
859 |
|
|
860 |
rc->overflow += (s->error = s->desired_length - data->length); |
s->error = s->desired_length - data->length; |
861 |
rc->real_total += data->length; |
rc->real_total += data->length; |
862 |
|
|
863 |
DPRINTF(XVID_DEBUG_RC, "[xvid rc] -- frame:%d type:%c quant:%d stats:%d scaled:%d desired:%d actual:%d error:%d overflow:%.2f\n", |
DPRINTF(XVID_DEBUG_RC, "[xvid rc] -- frame:%d type:%c quant:%d stats:%d scaled:%d desired:%d actual:%d error:%d overflow:%.2f\n", |
1434 |
} |
} |
1435 |
|
|
1436 |
/***************************************************************************** |
/***************************************************************************** |
1437 |
|
* VBV compliancy check and scale |
1438 |
|
* MPEG-4 standard specifies certain restrictions for bitrate/framesize in VBR |
1439 |
|
* to enable playback on devices with limited readspeed and memory (and which |
1440 |
|
* aren't...) |
1441 |
|
* |
1442 |
|
* DivX profiles have 2 criteria: VBV as in MPEG standard |
1443 |
|
* a limit on peak bitrate for any 3 seconds |
1444 |
|
* |
1445 |
|
* But if VBV is fulfilled, peakrate is automatically fulfilled in any profile |
1446 |
|
* defined so far, so we check for it (for completeness) but correct only VBV |
1447 |
|
* |
1448 |
|
*****************************************************************************/ |
1449 |
|
|
1450 |
|
#define VBV_COMPLIANT 0 |
1451 |
|
#define VBV_UNDERFLOW 1 /* video buffer runs empty */ |
1452 |
|
#define VBV_OVERFLOW 2 /* doesn't exist for VBR encoding */ |
1453 |
|
#define VBV_PEAKRATE 4 /* peak bitrate (within 3s) violated */ |
1454 |
|
|
1455 |
|
static int |
1456 |
|
check_curve_for_vbv_compliancy(rc_2pass2_t * rc, const float fps) |
1457 |
|
{ |
1458 |
|
/* We do all calculations in float, for higher accuracy, |
1459 |
|
* and in bytes for convenience. |
1460 |
|
* |
1461 |
|
* typical values from DivX Home Theater profile: |
1462 |
|
* vbv_size= 384*1024 (384kB) |
1463 |
|
* vbv_initial= 288*1024 (75% fill) |
1464 |
|
* maxrate= 4854000 (4.854MBps) |
1465 |
|
* peakrate= 8000000 (8MBps) |
1466 |
|
* |
1467 |
|
* PAL: offset3s = 75 (3 seconds of 25fps) |
1468 |
|
* NTSC: offset3s = 90 (3 seconds of 29.97fps) or 72 (3 seconds of 23.976fps) |
1469 |
|
*/ |
1470 |
|
|
1471 |
|
const float vbv_size = (float)rc->param.vbv_size/8.f; |
1472 |
|
float vbvfill = (float)rc->param.vbv_initial/8.f; |
1473 |
|
float vbvmin; |
1474 |
|
|
1475 |
|
const float maxrate = (float)rc->param.vbv_maxrate; |
1476 |
|
const float peakrate = (float)rc->param.vbv_peakrate; |
1477 |
|
const float r0 = (int)(maxrate/fps+0.5)/8.f; |
1478 |
|
|
1479 |
|
int bytes3s = 0; |
1480 |
|
int offset3s = (int)(3.f*fps+0.5); |
1481 |
|
int i; |
1482 |
|
|
1483 |
|
/* 1Gbit should be enough to inuitialize the vbvmin |
1484 |
|
* an arbitrary high value */ |
1485 |
|
vbvmin = 1000*1000*1000; |
1486 |
|
|
1487 |
|
for (i=0; i<rc->num_frames; i++) { |
1488 |
|
/* DivX 3s peak bitrate check */ |
1489 |
|
bytes3s += rc->stats[i].scaled_length; |
1490 |
|
if (i>=offset3s) |
1491 |
|
bytes3s -= rc->stats[i-offset3s].scaled_length; |
1492 |
|
|
1493 |
|
/* ignore peakrate constraint if peakrate is <= 0.f */ |
1494 |
|
if (peakrate>0.f && 8.f*bytes3s > 3*peakrate) |
1495 |
|
return(VBV_PEAKRATE); |
1496 |
|
|
1497 |
|
/* update vbv fill level */ |
1498 |
|
vbvfill += r0 - rc->stats[i].scaled_length; |
1499 |
|
|
1500 |
|
/* this check is _NOT_ an "overflow"! only reading from disk stops then */ |
1501 |
|
if (vbvfill > vbv_size) |
1502 |
|
vbvfill = vbv_size; |
1503 |
|
|
1504 |
|
/* but THIS would be an underflow. report it! */ |
1505 |
|
if (vbvfill < 0) |
1506 |
|
return(VBV_UNDERFLOW); |
1507 |
|
|
1508 |
|
/* Store the minimum buffer filling */ |
1509 |
|
if (vbvfill < vbvmin) |
1510 |
|
vbvmin = vbvfill; |
1511 |
|
} |
1512 |
|
|
1513 |
|
DPRINTF(XVID_DEBUG_RC, "[xvid rc] Minimum buffer fill: %f bytes\n", vbvmin); |
1514 |
|
|
1515 |
|
return(VBV_COMPLIANT); |
1516 |
|
} |
1517 |
|
|
1518 |
|
|
1519 |
|
static int |
1520 |
|
scale_curve_for_vbv_compliancy(rc_2pass2_t * rc, const float fps) |
1521 |
|
{ |
1522 |
|
/* correct any VBV violations. Peak bitrate violations disappears |
1523 |
|
* by this automatically |
1524 |
|
* |
1525 |
|
* This implementation follows |
1526 |
|
* |
1527 |
|
* Westerink, Rajagopalan, Gonzales "Two-pass MPEG-2 variable-bitrate encoding" |
1528 |
|
* IBM J. RES. DEVELOP. VOL 43, No. 4, July 1999, p.471--488 |
1529 |
|
* |
1530 |
|
* Thanks, guys! This paper rocks!!! */ |
1531 |
|
|
1532 |
|
/* For each scene of len N, we have to check up to N^2 possible buffer fills. |
1533 |
|
* This works well with MPEG-2 where N==12 or so, but for MPEG-4 it's a |
1534 |
|
* little slow... |
1535 |
|
* |
1536 |
|
* TODO: Better control on VBVfill between scenes */ |
1537 |
|
|
1538 |
|
const float vbv_size = (float)rc->param.vbv_size/8.f; |
1539 |
|
const float vbv_initial = (float)rc->param.vbv_initial/8.f; |
1540 |
|
|
1541 |
|
const float maxrate = 0.9*rc->param.vbv_maxrate; |
1542 |
|
const float vbv_low = 0.10f*vbv_size; |
1543 |
|
const float r0 = (int)(maxrate/fps+0.5)/8.f; |
1544 |
|
|
1545 |
|
int i,k,l,n,violation = 0; |
1546 |
|
float *scenefactor; |
1547 |
|
int *scenestart; |
1548 |
|
int *scenelength; |
1549 |
|
|
1550 |
|
/* first step: determine how many "scenes" there are and store their |
1551 |
|
* boundaries we could get all this from existing keyframe_positions, |
1552 |
|
* somehow, but there we don't have a min_scenelength, and it's no big |
1553 |
|
* deal to get it again. */ |
1554 |
|
|
1555 |
|
const int min_scenelength = (int)(fps+0.5); |
1556 |
|
int num_scenes = 0; |
1557 |
|
int last_scene = -999; |
1558 |
|
for (i=0; i<rc->num_frames; i++) { |
1559 |
|
if ((rc->stats[i].type == XVID_TYPE_IVOP) && (i-last_scene>min_scenelength)) { |
1560 |
|
last_scene = i; |
1561 |
|
num_scenes++; |
1562 |
|
} |
1563 |
|
} |
1564 |
|
|
1565 |
|
scenefactor = (float*)malloc(num_scenes*sizeof(float)); |
1566 |
|
scenestart = (int*)malloc(num_scenes*sizeof(int)); |
1567 |
|
scenelength = (int*)malloc(num_scenes*sizeof(int)); |
1568 |
|
|
1569 |
|
if ((!scenefactor) || (!scenestart) || (!scenelength) ) { |
1570 |
|
free(scenefactor); |
1571 |
|
free(scenestart); |
1572 |
|
free(scenelength); |
1573 |
|
/* remember: free(0) is valid and does exactly nothing. */ |
1574 |
|
return(-1); |
1575 |
|
} |
1576 |
|
|
1577 |
|
/* count again and safe the length/position */ |
1578 |
|
|
1579 |
|
num_scenes = 0; |
1580 |
|
last_scene = -999; |
1581 |
|
for (i=0; i<rc->num_frames; i++) { |
1582 |
|
if ((rc->stats[i].type == XVID_TYPE_IVOP) && (i-last_scene>min_scenelength)) { |
1583 |
|
if (num_scenes>0) { |
1584 |
|
scenelength[num_scenes-1]=i-last_scene; |
1585 |
|
} |
1586 |
|
scenestart[num_scenes]=i; |
1587 |
|
num_scenes++; |
1588 |
|
last_scene = i; |
1589 |
|
} |
1590 |
|
} |
1591 |
|
scenelength[num_scenes-1]=i-last_scene; |
1592 |
|
|
1593 |
|
/* second step: check for each scene, how much we can scale its frames up or |
1594 |
|
* down such that the VBV restriction is just fulfilled */ |
1595 |
|
#define R(k,n) (((n)+1-(k))*r0) /* how much enters the buffer between frame k and n */ |
1596 |
|
for (l=0; l<num_scenes;l++) { |
1597 |
|
const int start = scenestart[l]; |
1598 |
|
const int length = scenelength[l]; |
1599 |
|
twopass_stat_t * frames = &rc->stats[start]; |
1600 |
|
|
1601 |
|
float S0n,Skn; |
1602 |
|
float f,minf = 99999.f; |
1603 |
|
|
1604 |
|
S0n=0.; |
1605 |
|
for (n=0;n<=length-1;n++) { |
1606 |
|
S0n += frames[n].scaled_length; |
1607 |
|
|
1608 |
|
k = 0; |
1609 |
|
Skn = S0n; |
1610 |
|
f = (R(k,n-1) + (vbv_initial - vbv_low)) / Skn; |
1611 |
|
if (f < minf) |
1612 |
|
minf = f; |
1613 |
|
|
1614 |
|
for (k=1;k<=n;k++) { |
1615 |
|
Skn -= frames[k].scaled_length; |
1616 |
|
|
1617 |
|
f = (R(k,n-1) + (vbv_size - vbv_low)) / Skn; |
1618 |
|
if (f < minf) |
1619 |
|
minf = f; |
1620 |
|
} |
1621 |
|
} |
1622 |
|
|
1623 |
|
/* special case: at the end, fill buffer up to vbv_initial again |
1624 |
|
* |
1625 |
|
* TODO: Allow other values for buffer fill between scenes |
1626 |
|
* e.g. if n=N is smallest f-value, then check for better value */ |
1627 |
|
|
1628 |
|
n=length; |
1629 |
|
k=0; |
1630 |
|
Skn = S0n; |
1631 |
|
f = R(k,n-1)/Skn; |
1632 |
|
if (f < minf) |
1633 |
|
minf = f; |
1634 |
|
|
1635 |
|
for (k=1;k<=n-1;k++) { |
1636 |
|
Skn -= frames[k].scaled_length; |
1637 |
|
|
1638 |
|
f = (R(k,n-1) + (vbv_initial - vbv_low)) / Skn; |
1639 |
|
if (f < minf) |
1640 |
|
minf = f; |
1641 |
|
} |
1642 |
|
|
1643 |
|
DPRINTF(XVID_DEBUG_RC, "[xvid rc] Scene %d (Frames %d-%d): VBVfactor %f\n", |
1644 |
|
l, start, start+length-1 , minf); |
1645 |
|
|
1646 |
|
scenefactor[l] = minf; |
1647 |
|
} |
1648 |
|
#undef R |
1649 |
|
|
1650 |
|
/* last step: now we know of any scene how much it can be scaled up or down |
1651 |
|
* without violating VBV. Next, distribute bits from the evil scenes to the |
1652 |
|
* good ones */ |
1653 |
|
do { |
1654 |
|
float S_red = 0.f; /* how much to redistribute */ |
1655 |
|
float S_elig = 0.f; /* sum of bit for those scenes you can still swallow something*/ |
1656 |
|
float f_red; |
1657 |
|
int l; |
1658 |
|
|
1659 |
|
/* check how much is wrong */ |
1660 |
|
for (l=0;l<num_scenes;l++) { |
1661 |
|
const int start = scenestart[l]; |
1662 |
|
const int length = scenelength[l]; |
1663 |
|
twopass_stat_t * frames = &rc->stats[start]; |
1664 |
|
|
1665 |
|
/* exactly 1 means "don't touch this anymore!" */ |
1666 |
|
if (scenefactor[l] == 1.) |
1667 |
|
continue; |
1668 |
|
|
1669 |
|
/* within limits */ |
1670 |
|
if (scenefactor[l] > 1.) { |
1671 |
|
for (n= 0; n < length; n++) |
1672 |
|
S_elig += frames[n].scaled_length; |
1673 |
|
} else { |
1674 |
|
/* underflowing segment */ |
1675 |
|
for (n= 0; n < length; n++) { |
1676 |
|
float newbytes = (float)frames[n].scaled_length * scenefactor[l]; |
1677 |
|
S_red += (float)frames[n].scaled_length - (float)newbytes; |
1678 |
|
frames[n].scaled_length =(int)newbytes; |
1679 |
|
} |
1680 |
|
scenefactor[l] = 1.f; |
1681 |
|
} |
1682 |
|
} |
1683 |
|
|
1684 |
|
/* no more underflows */ |
1685 |
|
if (S_red < 1.f) |
1686 |
|
break; |
1687 |
|
|
1688 |
|
if (S_elig < 1.f) { |
1689 |
|
DPRINTF(XVID_DEBUG_RC, "[xvid rc] Everything underflowing.\n"); |
1690 |
|
free(scenefactor); |
1691 |
|
free(scenestart); |
1692 |
|
free(scenelength); |
1693 |
|
return(-2); |
1694 |
|
} |
1695 |
|
|
1696 |
|
f_red = (1.f + S_red/S_elig); |
1697 |
|
|
1698 |
|
DPRINTF(XVID_DEBUG_RC, "[xvid rc] Moving %.0f kB to avoid buffer underflow, correction factor: %.5f\n", |
1699 |
|
S_red/1024.f, f_red); |
1700 |
|
|
1701 |
|
violation=0; |
1702 |
|
/* scale remaining scenes up to meet total size */ |
1703 |
|
for (l=0; l<num_scenes; l++) { |
1704 |
|
const int start = scenestart[l]; |
1705 |
|
const int length = scenelength[l]; |
1706 |
|
twopass_stat_t * frames = &rc->stats[start]; |
1707 |
|
|
1708 |
|
if (scenefactor[l] == 1.) |
1709 |
|
continue; |
1710 |
|
|
1711 |
|
/* there shouldn't be any segments with factor<1 left, so all the rest is >1 */ |
1712 |
|
for (n= 0; n < length; n++) { |
1713 |
|
frames[n].scaled_length = (int)(frames[n].scaled_length * f_red + 0.5); |
1714 |
|
} |
1715 |
|
|
1716 |
|
scenefactor[l] /= f_red; |
1717 |
|
if (scenefactor[l] < 1.f) |
1718 |
|
violation=1; |
1719 |
|
} |
1720 |
|
|
1721 |
|
} while (violation); |
1722 |
|
|
1723 |
|
free(scenefactor); |
1724 |
|
free(scenestart); |
1725 |
|
free(scenelength); |
1726 |
|
return(0); |
1727 |
|
} |
1728 |
|
|
1729 |
|
|
1730 |
|
/***************************************************************************** |
1731 |
* Still more low level stuff (nothing to do with stats treatment) |
* Still more low level stuff (nothing to do with stats treatment) |
1732 |
****************************************************************************/ |
****************************************************************************/ |
1733 |
|
|