35 |
/* forces second pass not to be bigger than first */ |
/* forces second pass not to be bigger than first */ |
36 |
#undef PASS_SMALLER |
#undef PASS_SMALLER |
37 |
|
|
38 |
|
/* automatically alters overflow controls (strength and improvement/degradation) |
39 |
|
to fight most common problems without user's knowledge */ |
40 |
|
#define SMART_OVERFLOW_SETTING |
41 |
|
|
42 |
#include <stdio.h> |
#include <stdio.h> |
43 |
#include <math.h> |
#include <math.h> |
44 |
#include <limits.h> |
#include <limits.h> |
134 |
|
|
135 |
/*---------------------------------- |
/*---------------------------------- |
136 |
* Zones statistical data |
* Zones statistical data |
|
* |
|
|
* ToDo: Fix zones, current |
|
|
* implementation is buggy |
|
137 |
*--------------------------------*/ |
*--------------------------------*/ |
138 |
|
|
|
/* Average weight of the zones */ |
|
|
double avg_weight; |
|
|
|
|
139 |
/* Total length used by XVID_ZONE_QUANT zones */ |
/* Total length used by XVID_ZONE_QUANT zones */ |
140 |
uint64_t tot_quant; |
uint64_t tot_quant; |
141 |
uint64_t tot_quant_invariant; |
uint64_t tot_quant_invariant; |
142 |
|
|
143 |
|
/* Holds the total amount of frame bytes, zone weighted (only scalable |
144 |
|
* part of frame bytes) */ |
145 |
|
uint64_t tot_weighted; |
146 |
|
|
147 |
/*---------------------------------- |
/*---------------------------------- |
148 |
* Advanced settings helper ratios |
* Advanced settings helper ratios |
149 |
*--------------------------------*/ |
*--------------------------------*/ |
177 |
twopass_stat_t * stats; |
twopass_stat_t * stats; |
178 |
|
|
179 |
/*---------------------------------- |
/*---------------------------------- |
180 |
* Histerysis helpers |
* Hysteresis helpers |
181 |
*--------------------------------*/ |
*--------------------------------*/ |
182 |
|
|
183 |
/* This field holds the int2float conversion errors of each quant per |
/* This field holds the int2float conversion errors of each quant per |
212 |
* ToDo: description */ |
* ToDo: description */ |
213 |
double fq_error; |
double fq_error; |
214 |
|
|
215 |
|
int min_quant; /* internal minimal quant, prevents wrong quants from being used */ |
216 |
|
|
217 |
/*---------------------------------- |
/*---------------------------------- |
218 |
* Debug |
* Debug |
219 |
*--------------------------------*/ |
*--------------------------------*/ |
270 |
static void first_pass_stats_prepare_data(rc_2pass2_t * rc); |
static void first_pass_stats_prepare_data(rc_2pass2_t * rc); |
271 |
static void first_pass_scale_curve_internal(rc_2pass2_t *rc); |
static void first_pass_scale_curve_internal(rc_2pass2_t *rc); |
272 |
static void scaled_curve_apply_advanced_parameters(rc_2pass2_t * rc); |
static void scaled_curve_apply_advanced_parameters(rc_2pass2_t * rc); |
273 |
|
static int check_curve_for_vbv_compliancy(rc_2pass2_t * rc, const float fps); |
274 |
|
static int scale_curve_for_vbv_compliancy(rc_2pass2_t * rc, const float fps); |
275 |
#if 0 |
#if 0 |
276 |
static void stats_print(rc_2pass2_t * rc); |
static void stats_print(rc_2pass2_t * rc); |
277 |
#endif |
#endif |
290 |
if (rc == NULL) |
if (rc == NULL) |
291 |
return XVID_ERR_MEMORY; |
return XVID_ERR_MEMORY; |
292 |
|
|
293 |
rc->param = *param; |
/* v1.0.x */ |
294 |
|
rc->param.version = param->version; |
295 |
|
rc->param.bitrate = param->bitrate; |
296 |
|
rc->param.filename = param->filename; |
297 |
|
rc->param.keyframe_boost = param->keyframe_boost; |
298 |
|
rc->param.curve_compression_high = param->curve_compression_high; |
299 |
|
rc->param.curve_compression_low = param->curve_compression_low; |
300 |
|
rc->param.overflow_control_strength = param->overflow_control_strength; |
301 |
|
rc->param.max_overflow_improvement = param->max_overflow_improvement; |
302 |
|
rc->param.max_overflow_degradation = param->max_overflow_degradation; |
303 |
|
rc->param.kfreduction = param->kfreduction; |
304 |
|
rc->param.kfthreshold = param->kfthreshold; |
305 |
|
rc->param.container_frame_overhead = param->container_frame_overhead; |
306 |
|
|
307 |
|
if (XVID_VERSION_MINOR(param->version) >= 1) { |
308 |
|
rc->param.vbv_size = param->vbv_size; |
309 |
|
rc->param.vbv_initial = param->vbv_initial; |
310 |
|
rc->param.vbv_maxrate = param->vbv_maxrate; |
311 |
|
rc->param.vbv_peakrate = param->vbv_peakrate; |
312 |
|
}else{ |
313 |
|
rc->param.vbv_size = |
314 |
|
rc->param.vbv_initial = |
315 |
|
rc->param.vbv_maxrate = |
316 |
|
rc->param.vbv_peakrate = 0; |
317 |
|
} |
318 |
|
|
319 |
/* Initialize all defaults */ |
/* Initialize all defaults */ |
320 |
#define _INIT(a, b) if((a) <= 0) (a) = (b) |
#define _INIT(a, b) if((a) <= 0) (a) = (b) |
343 |
for (i=0; i<3; i++) rc->last_quant[i] = 0; |
for (i=0; i<3; i++) rc->last_quant[i] = 0; |
344 |
|
|
345 |
rc->fq_error = 0; |
rc->fq_error = 0; |
346 |
|
rc->min_quant = 1; |
347 |
|
|
348 |
/* Count frames (and intra frames) in the stats file, store the result into |
/* Count frames (and intra frames) in the stats file, store the result into |
349 |
* the rc structure */ |
* the rc structure */ |
406 |
if(rc->param.container_frame_overhead) |
if(rc->param.container_frame_overhead) |
407 |
DPRINTF(XVID_DEBUG_RC, "[xvid rc] -- New target filesize after container compensation: %lld\n", rc->target); |
DPRINTF(XVID_DEBUG_RC, "[xvid rc] -- New target filesize after container compensation: %lld\n", rc->target); |
408 |
|
|
409 |
|
/* When bitrate is not given it means it has been scaled by an external |
410 |
|
* application */ |
411 |
|
if (rc->param.bitrate) { |
412 |
|
/* Apply zone settings |
413 |
|
* - set rc->tot_quant which represents the total num of bytes spent in |
414 |
|
* fixed quant zones |
415 |
|
* - set rc->tot_weighted which represents the total amount of bytes |
416 |
|
* spent in normal or weighted zones in first pass (normal zones can |
417 |
|
* be considered weight=1) |
418 |
|
* - set rc->tot_quant_invariant which represents the total num of bytes |
419 |
|
* spent in fixed quant zones for headers */ |
420 |
|
zone_process(rc, create); |
421 |
|
} else { |
422 |
|
/* External scaling -- zones are ignored */ |
423 |
|
for (i=0;i<rc->num_frames;i++) { |
424 |
|
rc->stats[i].zone_mode = XVID_ZONE_WEIGHT; |
425 |
|
rc->stats[i].weight = 1.0; |
426 |
|
} |
427 |
|
rc->tot_quant = 0; |
428 |
|
} |
429 |
|
|
430 |
/* Gathers some information about first pass stats: |
/* Gathers some information about first pass stats: |
431 |
* - finds the minimum frame length for each frame type during 1st pass. |
* - finds the minimum frame length for each frame type during 1st pass. |
432 |
* rc->min_size[] |
* rc->min_size[] |
442 |
*/ |
*/ |
443 |
first_pass_stats_prepare_data(rc); |
first_pass_stats_prepare_data(rc); |
444 |
|
|
445 |
/* When bitrate is not given it means it has been scaled by an external |
/* If we have a user bitrate, it means it's an internal curve scaling */ |
|
* application */ |
|
446 |
if (rc->param.bitrate) { |
if (rc->param.bitrate) { |
|
/* Apply zone settings |
|
|
* - set rc->tot_quant which represents the total num of bytes spent in |
|
|
* fixed quant zones |
|
|
* - set rc->tot_quant_invariant which represents the total num of bytes spent |
|
|
* in fixed quant zones for headers */ |
|
|
zone_process(rc, create); |
|
447 |
/* Perform internal curve scaling */ |
/* Perform internal curve scaling */ |
448 |
first_pass_scale_curve_internal(rc); |
first_pass_scale_curve_internal(rc); |
|
} else { |
|
|
/* External scaling -- zones are ignored */ |
|
|
for (i=0;i<rc->num_frames;i++) { |
|
|
rc->stats[i].zone_mode = XVID_ZONE_WEIGHT; |
|
|
rc->stats[i].weight = 1.0; |
|
|
} |
|
|
rc->avg_weight = 1.0; |
|
|
rc->tot_quant = 0; |
|
449 |
} |
} |
450 |
|
|
451 |
/* Apply advanced curve options, and compute some parameters in order to |
/* Apply advanced curve options, and compute some parameters in order to |
452 |
* shape the curve in the BEFORE/AFTER pair of functions */ |
* shape the curve in the BEFORE/AFTER pair of functions */ |
453 |
scaled_curve_apply_advanced_parameters(rc); |
scaled_curve_apply_advanced_parameters(rc); |
454 |
|
|
455 |
|
/* Check curve for VBV compliancy and rescale if necessary */ |
456 |
|
#ifdef VBV_FORCE |
457 |
|
if (rc->param.vbv_size==0) { |
458 |
|
rc->param.vbv_size = 3145728; |
459 |
|
rc->param.vbv_initial = 2359296; |
460 |
|
rc->param.vbv_maxrate = 4854000; |
461 |
|
rc->param.vbv_peakrate = 8000000; |
462 |
|
} |
463 |
|
#endif |
464 |
|
|
465 |
|
/* vbv_size==0 switches VBV check off */ |
466 |
|
if (rc->param.vbv_size > 0) { |
467 |
|
const double fps = (double)create->fbase/(double)create->fincr; |
468 |
|
int status = check_curve_for_vbv_compliancy(rc, fps); |
469 |
|
|
470 |
|
if (status) { |
471 |
|
DPRINTF(XVID_DEBUG_RC, "[xvid rc] Underflow detected - Scaling Curve for compliancy.\n"); |
472 |
|
} |
473 |
|
|
474 |
|
status = scale_curve_for_vbv_compliancy(rc, fps); |
475 |
|
|
476 |
|
if (status == 0) { |
477 |
|
DPRINTF(XVID_DEBUG_RC, "[xvid rc] VBV compliant curve scaling done.\n"); |
478 |
|
} else { |
479 |
|
DPRINTF(XVID_DEBUG_RC, "[xvid rc] VBV compliant curve scaling impossible.\n"); |
480 |
|
} |
481 |
|
} |
482 |
*handle = rc; |
*handle = rc; |
483 |
return(0); |
return(0); |
484 |
} |
} |
521 |
if (data->quant > 0) |
if (data->quant > 0) |
522 |
return(0); |
return(0); |
523 |
|
|
524 |
/* Second case: insufficent stats data */ |
/* Second case: insufficent stats data |
525 |
|
* We can't guess much what we should do, let core decide all alone */ |
526 |
if (data->frame_num >= rc->num_frames) { |
if (data->frame_num >= rc->num_frames) { |
527 |
DPRINTF(XVID_DEBUG_RC,"[xvid rc] -- stats file too short (now processing frame %d)", |
DPRINTF(XVID_DEBUG_RC,"[xvid rc] -- stats file too short (now processing frame %d)", |
528 |
data->frame_num); |
data->frame_num); |
529 |
return(0); |
return(0); |
530 |
} |
} |
531 |
|
|
532 |
/* Third case: We are in a Quant zone */ |
/* Third case: We are in a Quant zone |
533 |
|
* Quant zones must just ensure we use the same settings as first pass |
534 |
|
* So set the quantizer and the type */ |
535 |
if (s->zone_mode == XVID_ZONE_QUANT) { |
if (s->zone_mode == XVID_ZONE_QUANT) { |
536 |
|
/* Quant stuff */ |
537 |
rc->fq_error += s->weight; |
rc->fq_error += s->weight; |
538 |
data->quant = (int)rc->fq_error; |
data->quant = (int)rc->fq_error; |
539 |
rc->fq_error -= data->quant; |
rc->fq_error -= data->quant; |
540 |
|
|
541 |
|
/* The type stuff */ |
542 |
|
data->type = s->type; |
543 |
|
|
544 |
|
/* The only required data for AFTER step is this one for the overflow |
545 |
|
* control */ |
546 |
s->desired_length = s->length; |
s->desired_length = s->length; |
547 |
|
|
548 |
return(0); |
return(0); |
677 |
#ifdef PASS_SMALLER |
#ifdef PASS_SMALLER |
678 |
if (dbytes > s->length) { |
if (dbytes > s->length) { |
679 |
dbytes = s->length; |
dbytes = s->length; |
680 |
} else |
} |
681 |
#endif |
#endif |
682 |
|
|
683 |
|
/* Prevent stupid desired sizes under logical values */ |
684 |
if (dbytes < rc->min_length[s->type-1]) { |
if (dbytes < rc->min_length[s->type-1]) { |
685 |
dbytes = rc->min_length[s->type-1]; |
dbytes = rc->min_length[s->type-1]; |
|
} else if (dbytes > rc->max_length) { |
|
|
/* ToDo: this condition is always wrong as max_length == maximum frame |
|
|
* length of first pass, so the first condition already caps the frame |
|
|
* size... */ |
|
|
capped_to_max_framesize = 1; |
|
|
dbytes = rc->max_length; |
|
|
DPRINTF(XVID_DEBUG_RC,"[xvid rc] -- frame:%d Capped to maximum frame size\n", |
|
|
data->frame_num); |
|
686 |
} |
} |
687 |
|
|
688 |
/*------------------------------------------------------------------------ |
/*------------------------------------------------------------------------ |
767 |
data->quant = data->max_quant[s->type-1]; |
data->quant = data->max_quant[s->type-1]; |
768 |
} |
} |
769 |
|
|
770 |
|
if (data->quant < rc->min_quant) data->quant = rc->min_quant; |
771 |
|
|
772 |
/* To avoid big quality jumps from frame to frame, we apply a "security" |
/* To avoid big quality jumps from frame to frame, we apply a "security" |
773 |
* rule that makes |last_quant - new_quant| <= 2. This rule only applies |
* rule that makes |last_quant - new_quant| <= 2. This rule only applies |
774 |
* to predicted frames (P and B) */ |
* to predicted frames (P and B) */ |
857 |
rc->KFoverflow -= rc->KFoverflow_partial; |
rc->KFoverflow -= rc->KFoverflow_partial; |
858 |
} |
} |
859 |
|
|
860 |
rc->overflow += (s->error = s->desired_length - data->length); |
s->error = s->desired_length - data->length; |
861 |
rc->real_total += data->length; |
rc->real_total += data->length; |
862 |
|
|
863 |
DPRINTF(XVID_DEBUG_RC, "[xvid rc] -- frame:%d type:%c quant:%d stats:%d scaled:%d desired:%d actual:%d error:%d overflow:%.2f\n", |
DPRINTF(XVID_DEBUG_RC, "[xvid rc] -- frame:%d type:%c quant:%d stats:%d scaled:%d desired:%d actual:%d error:%d overflow:%.2f\n", |
1044 |
|
|
1045 |
/* pre-process the statistics data |
/* pre-process the statistics data |
1046 |
* - for each type, count, tot_length, min_length, max_length |
* - for each type, count, tot_length, min_length, max_length |
1047 |
* - set keyframes_locations */ |
* - set keyframes_locations, tot_prescaled */ |
1048 |
static void |
static void |
1049 |
first_pass_stats_prepare_data(rc_2pass2_t * rc) |
first_pass_stats_prepare_data(rc_2pass2_t * rc) |
1050 |
{ |
{ |
1061 |
} |
} |
1062 |
|
|
1063 |
rc->max_length = INT_MIN; |
rc->max_length = INT_MIN; |
1064 |
|
rc->tot_weighted = 0; |
1065 |
|
|
1066 |
/* Loop through all frames and find/compute all the stuff this function |
/* Loop through all frames and find/compute all the stuff this function |
1067 |
* is supposed to do */ |
* is supposed to do */ |
1071 |
rc->count[s->type-1]++; |
rc->count[s->type-1]++; |
1072 |
rc->tot_length[s->type-1] += s->length; |
rc->tot_length[s->type-1] += s->length; |
1073 |
rc->tot_invariant[s->type-1] += s->invariant; |
rc->tot_invariant[s->type-1] += s->invariant; |
1074 |
|
if (s->zone_mode != XVID_ZONE_QUANT) |
1075 |
|
rc->tot_weighted += (int)(s->weight*(s->length - s->invariant)); |
1076 |
|
|
1077 |
if (s->length < rc->min_length[s->type-1]) { |
if (s->length < rc->min_length[s->type-1]) { |
1078 |
rc->min_length[s->type-1] = s->length; |
rc->min_length[s->type-1] = s->length; |
1107 |
int i,j; |
int i,j; |
1108 |
int n = 0; |
int n = 0; |
1109 |
|
|
|
rc->avg_weight = 0.0; |
|
1110 |
rc->tot_quant = 0; |
rc->tot_quant = 0; |
1111 |
rc->tot_quant_invariant = 0; |
rc->tot_quant_invariant = 0; |
1112 |
|
|
1115 |
rc->stats[j].zone_mode = XVID_ZONE_WEIGHT; |
rc->stats[j].zone_mode = XVID_ZONE_WEIGHT; |
1116 |
rc->stats[j].weight = 1.0; |
rc->stats[j].weight = 1.0; |
1117 |
} |
} |
|
rc->avg_weight += rc->num_frames * 1.0; |
|
1118 |
n += rc->num_frames; |
n += rc->num_frames; |
1119 |
} |
} |
1120 |
|
|
1123 |
|
|
1124 |
int next = (i+1<create->num_zones) ? create->zones[i+1].frame : rc->num_frames; |
int next = (i+1<create->num_zones) ? create->zones[i+1].frame : rc->num_frames; |
1125 |
|
|
1126 |
|
/* Zero weight make no sense */ |
1127 |
|
if (create->zones[i].increment == 0) create->zones[i].increment = 1; |
1128 |
|
/* And obviously an undetermined infinite makes even less sense */ |
1129 |
|
if (create->zones[i].base == 0) create->zones[i].base = 1; |
1130 |
|
|
1131 |
if (i==0 && create->zones[i].frame > 0) { |
if (i==0 && create->zones[i].frame > 0) { |
1132 |
for (j = 0; j < create->zones[i].frame && j < rc->num_frames; j++) { |
for (j = 0; j < create->zones[i].frame && j < rc->num_frames; j++) { |
1133 |
rc->stats[j].zone_mode = XVID_ZONE_WEIGHT; |
rc->stats[j].zone_mode = XVID_ZONE_WEIGHT; |
1134 |
rc->stats[j].weight = 1.0; |
rc->stats[j].weight = 1.0; |
1135 |
} |
} |
|
rc->avg_weight += create->zones[i].frame * 1.0; |
|
1136 |
n += create->zones[i].frame; |
n += create->zones[i].frame; |
1137 |
} |
} |
1138 |
|
|
1142 |
rc->stats[j].weight = (double)create->zones[i].increment / (double)create->zones[i].base; |
rc->stats[j].weight = (double)create->zones[i].increment / (double)create->zones[i].base; |
1143 |
} |
} |
1144 |
next -= create->zones[i].frame; |
next -= create->zones[i].frame; |
|
rc->avg_weight += (double)(next * create->zones[i].increment) / (double)create->zones[i].base; |
|
1145 |
n += next; |
n += next; |
1146 |
} else{ /* XVID_ZONE_QUANT */ |
} else{ /* XVID_ZONE_QUANT */ |
1147 |
for (j = create->zones[i].frame; j < next && j < rc->num_frames; j++ ) { |
for (j = create->zones[i].frame; j < next && j < rc->num_frames; j++ ) { |
1152 |
} |
} |
1153 |
} |
} |
1154 |
} |
} |
|
rc->avg_weight = n>0 ? rc->avg_weight/n : 1.0; |
|
|
|
|
|
DPRINTF(XVID_DEBUG_RC, "[xvid rc] -- center_weight:%f (for %d frames) fixed_bytes:%d\n", rc->avg_weight, n, rc->tot_quant); |
|
1155 |
} |
} |
1156 |
|
|
1157 |
|
|
1160 |
first_pass_scale_curve_internal(rc_2pass2_t *rc) |
first_pass_scale_curve_internal(rc_2pass2_t *rc) |
1161 |
{ |
{ |
1162 |
int64_t target; |
int64_t target; |
|
int64_t pass1_length; |
|
1163 |
int64_t total_invariant; |
int64_t total_invariant; |
1164 |
double scaler; |
double scaler; |
1165 |
int i, num_MBs; |
int i, num_MBs; |
1178 |
target = rc->target; |
target = rc->target; |
1179 |
target -= rc->tot_quant; |
target -= rc->tot_quant; |
1180 |
|
|
|
/* Do the same for the first pass data */ |
|
|
pass1_length = rc->tot_length[XVID_TYPE_IVOP-1]; |
|
|
pass1_length += rc->tot_length[XVID_TYPE_PVOP-1]; |
|
|
pass1_length += rc->tot_length[XVID_TYPE_BVOP-1]; |
|
|
pass1_length -= rc->tot_quant; |
|
|
|
|
1181 |
/* Let's compute a linear scaler in order to perform curve scaling */ |
/* Let's compute a linear scaler in order to perform curve scaling */ |
1182 |
scaler = (double)(target - total_invariant) / (double)(pass1_length - total_invariant); |
scaler = (double)(target - total_invariant) / (double)(rc->tot_weighted); |
1183 |
|
|
1184 |
#ifdef PASS_SMALLER |
#ifdef SMART_OVERFLOW_SETTING |
1185 |
if ((target - total_invariant) <= 0 || |
if (scaler > 0.9) { |
1186 |
(pass1_length - total_invariant) <= 0 || |
rc->param.max_overflow_degradation *= 5; |
1187 |
target >= pass1_length) { |
rc->param.max_overflow_improvement *= 5; |
1188 |
DPRINTF(XVID_DEBUG_RC, "[xvid rc] -- WARNING: Undersize detected before correction\n"); |
rc->param.overflow_control_strength *= 3; |
1189 |
scaler = 1.0; |
} else if (scaler > 0.6) { |
1190 |
|
rc->param.max_overflow_degradation *= 2; |
1191 |
|
rc->param.max_overflow_improvement *= 2; |
1192 |
|
rc->param.overflow_control_strength *= 2; |
1193 |
|
} else { |
1194 |
|
rc->min_quant = 2; |
1195 |
} |
} |
1196 |
#endif |
#endif |
1197 |
|
|
1198 |
/* Compute min frame lengths (for each frame type) according to the number |
/* Compute min frame lengths (for each frame type) according to the number |
1199 |
* of MBs. We sum all block type counters of frame 0, this gives us the |
* of MBs. We sum all block type counters of frame 0, this gives us the |
1200 |
* number of MBs. |
* number of MBs. |
1236 |
} |
} |
1237 |
|
|
1238 |
/* Compute the scaled length -- only non invariant data length is scaled */ |
/* Compute the scaled length -- only non invariant data length is scaled */ |
1239 |
len = s->invariant + (int)((double)(s->length-s->invariant) * scaler * s->weight / rc->avg_weight); |
len = s->invariant + (int)((double)(s->length-s->invariant) * scaler * s->weight); |
1240 |
|
|
1241 |
/* Compare with the computed minimum */ |
/* Compare with the computed minimum */ |
1242 |
if (len < rc->min_length[s->type-1]) { |
if (len < rc->min_length[s->type-1]) { |
1248 |
* total counters, as we prepare a second pass for 'regular' |
* total counters, as we prepare a second pass for 'regular' |
1249 |
* frames */ |
* frames */ |
1250 |
target -= s->scaled_length; |
target -= s->scaled_length; |
|
pass1_length -= s->length; |
|
1251 |
} else { |
} else { |
1252 |
/* Do nothing for now, we'll scale this later */ |
/* Do nothing for now, we'll scale this later */ |
1253 |
s->scaled_length = 0; |
s->scaled_length = 0; |
1258 |
* total counters. Now, it's possible to scale the 'regular' frames. */ |
* total counters. Now, it's possible to scale the 'regular' frames. */ |
1259 |
|
|
1260 |
/* Scaling factor for 'regular' frames */ |
/* Scaling factor for 'regular' frames */ |
1261 |
scaler = (double)(target - total_invariant) / (double)(pass1_length - total_invariant); |
scaler = (double)(target - total_invariant) / (double)(rc->tot_weighted); |
|
|
|
|
#ifdef PASS_SMALLER |
|
|
/* Detect undersizing */ |
|
|
if (target <= 0 || pass1_length <= 0 || target >= pass1_length) { |
|
|
DPRINTF(XVID_DEBUG_RC, "[xvid rc] -- WARNING: Undersize detected after correction\n"); |
|
|
scaler = 1.0; |
|
|
} |
|
|
#endif |
|
1262 |
|
|
1263 |
/* Do another pass with the new scaler */ |
/* Do another pass with the new scaler */ |
1264 |
for (i=0; i<rc->num_frames; i++) { |
for (i=0; i<rc->num_frames; i++) { |
1266 |
|
|
1267 |
/* Ignore frame with forced frame sizes */ |
/* Ignore frame with forced frame sizes */ |
1268 |
if (s->scaled_length == 0) |
if (s->scaled_length == 0) |
1269 |
s->scaled_length = s->invariant + (int)((double)(s->length-s->invariant) * scaler * s->weight / rc->avg_weight); |
s->scaled_length = s->invariant + (int)((double)(s->length-s->invariant) * scaler * s->weight); |
1270 |
} |
} |
1271 |
|
|
1272 |
/* Job done */ |
/* Job done */ |
1434 |
} |
} |
1435 |
|
|
1436 |
/***************************************************************************** |
/***************************************************************************** |
1437 |
|
* VBV compliancy check and scale |
1438 |
|
* MPEG-4 standard specifies certain restrictions for bitrate/framesize in VBR |
1439 |
|
* to enable playback on devices with limited readspeed and memory (and which |
1440 |
|
* aren't...) |
1441 |
|
* |
1442 |
|
* DivX profiles have 2 criteria: VBV as in MPEG standard |
1443 |
|
* a limit on peak bitrate for any 3 seconds |
1444 |
|
* |
1445 |
|
* But if VBV is fulfilled, peakrate is automatically fulfilled in any profile |
1446 |
|
* defined so far, so we check for it (for completeness) but correct only VBV |
1447 |
|
* |
1448 |
|
*****************************************************************************/ |
1449 |
|
|
1450 |
|
#define VBV_COMPLIANT 0 |
1451 |
|
#define VBV_UNDERFLOW 1 /* video buffer runs empty */ |
1452 |
|
#define VBV_OVERFLOW 2 /* doesn't exist for VBR encoding */ |
1453 |
|
#define VBV_PEAKRATE 4 /* peak bitrate (within 3s) violated */ |
1454 |
|
|
1455 |
|
static int |
1456 |
|
check_curve_for_vbv_compliancy(rc_2pass2_t * rc, const float fps) |
1457 |
|
{ |
1458 |
|
/* We do all calculations in float, for higher accuracy, |
1459 |
|
* and in bytes for convenience. |
1460 |
|
* |
1461 |
|
* typical values from DivX Home Theater profile: |
1462 |
|
* vbv_size= 384*1024 (384kB) |
1463 |
|
* vbv_initial= 288*1024 (75% fill) |
1464 |
|
* maxrate= 4854000 (4.854MBps) |
1465 |
|
* peakrate= 8000000 (8MBps) |
1466 |
|
* |
1467 |
|
* PAL: offset3s = 75 (3 seconds of 25fps) |
1468 |
|
* NTSC: offset3s = 90 (3 seconds of 29.97fps) or 72 (3 seconds of 23.976fps) |
1469 |
|
*/ |
1470 |
|
|
1471 |
|
const float vbv_size = (float)rc->param.vbv_size/8.f; |
1472 |
|
float vbvfill = (float)rc->param.vbv_initial/8.f; |
1473 |
|
float vbvmin; |
1474 |
|
|
1475 |
|
const float maxrate = (float)rc->param.vbv_maxrate; |
1476 |
|
const float peakrate = (float)rc->param.vbv_peakrate; |
1477 |
|
const float r0 = (int)(maxrate/fps+0.5)/8.f; |
1478 |
|
|
1479 |
|
int bytes3s = 0; |
1480 |
|
int offset3s = (int)(3.f*fps+0.5); |
1481 |
|
int i; |
1482 |
|
|
1483 |
|
/* 1Gbit should be enough to inuitialize the vbvmin |
1484 |
|
* an arbitrary high value */ |
1485 |
|
vbvmin = 1000*1000*1000; |
1486 |
|
|
1487 |
|
for (i=0; i<rc->num_frames; i++) { |
1488 |
|
/* DivX 3s peak bitrate check */ |
1489 |
|
bytes3s += rc->stats[i].scaled_length; |
1490 |
|
if (i>=offset3s) |
1491 |
|
bytes3s -= rc->stats[i-offset3s].scaled_length; |
1492 |
|
|
1493 |
|
/* ignore peakrate constraint if peakrate is <= 0.f */ |
1494 |
|
if (peakrate>0.f && 8.f*bytes3s > 3*peakrate) |
1495 |
|
return(VBV_PEAKRATE); |
1496 |
|
|
1497 |
|
/* update vbv fill level */ |
1498 |
|
vbvfill += r0 - rc->stats[i].scaled_length; |
1499 |
|
|
1500 |
|
/* this check is _NOT_ an "overflow"! only reading from disk stops then */ |
1501 |
|
if (vbvfill > vbv_size) |
1502 |
|
vbvfill = vbv_size; |
1503 |
|
|
1504 |
|
/* but THIS would be an underflow. report it! */ |
1505 |
|
if (vbvfill < 0) |
1506 |
|
return(VBV_UNDERFLOW); |
1507 |
|
|
1508 |
|
/* Store the minimum buffer filling */ |
1509 |
|
if (vbvfill < vbvmin) |
1510 |
|
vbvmin = vbvfill; |
1511 |
|
} |
1512 |
|
|
1513 |
|
DPRINTF(XVID_DEBUG_RC, "[xvid rc] Minimum buffer fill: %f bytes\n", vbvmin); |
1514 |
|
|
1515 |
|
return(VBV_COMPLIANT); |
1516 |
|
} |
1517 |
|
|
1518 |
|
|
1519 |
|
static int |
1520 |
|
scale_curve_for_vbv_compliancy(rc_2pass2_t * rc, const float fps) |
1521 |
|
{ |
1522 |
|
/* correct any VBV violations. Peak bitrate violations disappears |
1523 |
|
* by this automatically |
1524 |
|
* |
1525 |
|
* This implementation follows |
1526 |
|
* |
1527 |
|
* Westerink, Rajagopalan, Gonzales "Two-pass MPEG-2 variable-bitrate encoding" |
1528 |
|
* IBM J. RES. DEVELOP. VOL 43, No. 4, July 1999, p.471--488 |
1529 |
|
* |
1530 |
|
* Thanks, guys! This paper rocks!!! */ |
1531 |
|
|
1532 |
|
/* For each scene of len N, we have to check up to N^2 possible buffer fills. |
1533 |
|
* This works well with MPEG-2 where N==12 or so, but for MPEG-4 it's a |
1534 |
|
* little slow... |
1535 |
|
* |
1536 |
|
* TODO: Better control on VBVfill between scenes */ |
1537 |
|
|
1538 |
|
const float vbv_size = (float)rc->param.vbv_size/8.f; |
1539 |
|
const float vbv_initial = (float)rc->param.vbv_initial/8.f; |
1540 |
|
|
1541 |
|
const float maxrate = 0.9*rc->param.vbv_maxrate; |
1542 |
|
const float vbv_low = 0.10f*vbv_size; |
1543 |
|
const float r0 = (int)(maxrate/fps+0.5)/8.f; |
1544 |
|
|
1545 |
|
int i,k,l,n,violation = 0; |
1546 |
|
float *scenefactor; |
1547 |
|
int *scenestart; |
1548 |
|
int *scenelength; |
1549 |
|
|
1550 |
|
/* first step: determine how many "scenes" there are and store their |
1551 |
|
* boundaries we could get all this from existing keyframe_positions, |
1552 |
|
* somehow, but there we don't have a min_scenelength, and it's no big |
1553 |
|
* deal to get it again. */ |
1554 |
|
|
1555 |
|
const int min_scenelength = (int)(fps+0.5); |
1556 |
|
int num_scenes = 0; |
1557 |
|
int last_scene = -999; |
1558 |
|
for (i=0; i<rc->num_frames; i++) { |
1559 |
|
if ((rc->stats[i].type == XVID_TYPE_IVOP) && (i-last_scene>min_scenelength)) { |
1560 |
|
last_scene = i; |
1561 |
|
num_scenes++; |
1562 |
|
} |
1563 |
|
} |
1564 |
|
|
1565 |
|
scenefactor = (float*)malloc(num_scenes*sizeof(float)); |
1566 |
|
scenestart = (int*)malloc(num_scenes*sizeof(int)); |
1567 |
|
scenelength = (int*)malloc(num_scenes*sizeof(int)); |
1568 |
|
|
1569 |
|
if ((!scenefactor) || (!scenestart) || (!scenelength) ) { |
1570 |
|
free(scenefactor); |
1571 |
|
free(scenestart); |
1572 |
|
free(scenelength); |
1573 |
|
/* remember: free(0) is valid and does exactly nothing. */ |
1574 |
|
return(-1); |
1575 |
|
} |
1576 |
|
|
1577 |
|
/* count again and safe the length/position */ |
1578 |
|
|
1579 |
|
num_scenes = 0; |
1580 |
|
last_scene = -999; |
1581 |
|
for (i=0; i<rc->num_frames; i++) { |
1582 |
|
if ((rc->stats[i].type == XVID_TYPE_IVOP) && (i-last_scene>min_scenelength)) { |
1583 |
|
if (num_scenes>0) { |
1584 |
|
scenelength[num_scenes-1]=i-last_scene; |
1585 |
|
} |
1586 |
|
scenestart[num_scenes]=i; |
1587 |
|
num_scenes++; |
1588 |
|
last_scene = i; |
1589 |
|
} |
1590 |
|
} |
1591 |
|
scenelength[num_scenes-1]=i-last_scene; |
1592 |
|
|
1593 |
|
/* second step: check for each scene, how much we can scale its frames up or |
1594 |
|
* down such that the VBV restriction is just fulfilled */ |
1595 |
|
#define R(k,n) (((n)+1-(k))*r0) /* how much enters the buffer between frame k and n */ |
1596 |
|
for (l=0; l<num_scenes;l++) { |
1597 |
|
const int start = scenestart[l]; |
1598 |
|
const int length = scenelength[l]; |
1599 |
|
twopass_stat_t * frames = &rc->stats[start]; |
1600 |
|
|
1601 |
|
float S0n,Skn; |
1602 |
|
float f,minf = 99999.f; |
1603 |
|
|
1604 |
|
S0n=0.; |
1605 |
|
for (n=0;n<=length-1;n++) { |
1606 |
|
S0n += frames[n].scaled_length; |
1607 |
|
|
1608 |
|
k = 0; |
1609 |
|
Skn = S0n; |
1610 |
|
f = (R(k,n-1) + (vbv_initial - vbv_low)) / Skn; |
1611 |
|
if (f < minf) |
1612 |
|
minf = f; |
1613 |
|
|
1614 |
|
for (k=1;k<=n;k++) { |
1615 |
|
Skn -= frames[k].scaled_length; |
1616 |
|
|
1617 |
|
f = (R(k,n-1) + (vbv_size - vbv_low)) / Skn; |
1618 |
|
if (f < minf) |
1619 |
|
minf = f; |
1620 |
|
} |
1621 |
|
} |
1622 |
|
|
1623 |
|
/* special case: at the end, fill buffer up to vbv_initial again |
1624 |
|
* |
1625 |
|
* TODO: Allow other values for buffer fill between scenes |
1626 |
|
* e.g. if n=N is smallest f-value, then check for better value */ |
1627 |
|
|
1628 |
|
n=length; |
1629 |
|
k=0; |
1630 |
|
Skn = S0n; |
1631 |
|
f = R(k,n-1)/Skn; |
1632 |
|
if (f < minf) |
1633 |
|
minf = f; |
1634 |
|
|
1635 |
|
for (k=1;k<=n-1;k++) { |
1636 |
|
Skn -= frames[k].scaled_length; |
1637 |
|
|
1638 |
|
f = (R(k,n-1) + (vbv_initial - vbv_low)) / Skn; |
1639 |
|
if (f < minf) |
1640 |
|
minf = f; |
1641 |
|
} |
1642 |
|
|
1643 |
|
DPRINTF(XVID_DEBUG_RC, "[xvid rc] Scene %d (Frames %d-%d): VBVfactor %f\n", |
1644 |
|
l, start, start+length-1 , minf); |
1645 |
|
|
1646 |
|
scenefactor[l] = minf; |
1647 |
|
} |
1648 |
|
#undef R |
1649 |
|
|
1650 |
|
/* last step: now we know of any scene how much it can be scaled up or down |
1651 |
|
* without violating VBV. Next, distribute bits from the evil scenes to the |
1652 |
|
* good ones */ |
1653 |
|
do { |
1654 |
|
float S_red = 0.f; /* how much to redistribute */ |
1655 |
|
float S_elig = 0.f; /* sum of bit for those scenes you can still swallow something*/ |
1656 |
|
float f_red; |
1657 |
|
int l; |
1658 |
|
|
1659 |
|
/* check how much is wrong */ |
1660 |
|
for (l=0;l<num_scenes;l++) { |
1661 |
|
const int start = scenestart[l]; |
1662 |
|
const int length = scenelength[l]; |
1663 |
|
twopass_stat_t * frames = &rc->stats[start]; |
1664 |
|
|
1665 |
|
/* exactly 1 means "don't touch this anymore!" */ |
1666 |
|
if (scenefactor[l] == 1.) |
1667 |
|
continue; |
1668 |
|
|
1669 |
|
/* within limits */ |
1670 |
|
if (scenefactor[l] > 1.) { |
1671 |
|
for (n= 0; n < length; n++) |
1672 |
|
S_elig += frames[n].scaled_length; |
1673 |
|
} else { |
1674 |
|
/* underflowing segment */ |
1675 |
|
for (n= 0; n < length; n++) { |
1676 |
|
float newbytes = (float)frames[n].scaled_length * scenefactor[l]; |
1677 |
|
S_red += (float)frames[n].scaled_length - (float)newbytes; |
1678 |
|
frames[n].scaled_length =(int)newbytes; |
1679 |
|
} |
1680 |
|
scenefactor[l] = 1.f; |
1681 |
|
} |
1682 |
|
} |
1683 |
|
|
1684 |
|
/* no more underflows */ |
1685 |
|
if (S_red < 1.f) |
1686 |
|
break; |
1687 |
|
|
1688 |
|
if (S_elig < 1.f) { |
1689 |
|
DPRINTF(XVID_DEBUG_RC, "[xvid rc] Everything underflowing.\n"); |
1690 |
|
free(scenefactor); |
1691 |
|
free(scenestart); |
1692 |
|
free(scenelength); |
1693 |
|
return(-2); |
1694 |
|
} |
1695 |
|
|
1696 |
|
f_red = (1.f + S_red/S_elig); |
1697 |
|
|
1698 |
|
DPRINTF(XVID_DEBUG_RC, "[xvid rc] Moving %.0f kB to avoid buffer underflow, correction factor: %.5f\n", |
1699 |
|
S_red/1024.f, f_red); |
1700 |
|
|
1701 |
|
violation=0; |
1702 |
|
/* scale remaining scenes up to meet total size */ |
1703 |
|
for (l=0; l<num_scenes; l++) { |
1704 |
|
const int start = scenestart[l]; |
1705 |
|
const int length = scenelength[l]; |
1706 |
|
twopass_stat_t * frames = &rc->stats[start]; |
1707 |
|
|
1708 |
|
if (scenefactor[l] == 1.) |
1709 |
|
continue; |
1710 |
|
|
1711 |
|
/* there shouldn't be any segments with factor<1 left, so all the rest is >1 */ |
1712 |
|
for (n= 0; n < length; n++) { |
1713 |
|
frames[n].scaled_length = (int)(frames[n].scaled_length * f_red + 0.5); |
1714 |
|
} |
1715 |
|
|
1716 |
|
scenefactor[l] /= f_red; |
1717 |
|
if (scenefactor[l] < 1.f) |
1718 |
|
violation=1; |
1719 |
|
} |
1720 |
|
|
1721 |
|
} while (violation); |
1722 |
|
|
1723 |
|
free(scenefactor); |
1724 |
|
free(scenestart); |
1725 |
|
free(scenelength); |
1726 |
|
return(0); |
1727 |
|
} |
1728 |
|
|
1729 |
|
|
1730 |
|
/***************************************************************************** |
1731 |
* Still more low level stuff (nothing to do with stats treatment) |
* Still more low level stuff (nothing to do with stats treatment) |
1732 |
****************************************************************************/ |
****************************************************************************/ |
1733 |
|
|