📄 ratecontrol.c
字号:
/***************************************************-*- coding: iso-8859-1 -*- * ratecontrol.c: h264 encoder library (Rate Control) ***************************************************************************** * Copyright (C) 2005 x264 project * $Id: ratecontrol.c,v 1.1 2004/06/03 19:27:08 fenrir Exp $ * * Authors: Loren Merritt <lorenm@u.washington.edu> * Michael Niedermayer <michaelni@gmx.at> * M錸s Rullg錼d <mru@mru.ath.cx> * * This program is free software; you can redistribute it and/or modify * it under the terms of the GNU General Public License as published by * the Free Software Foundation; either version 2 of the License, or * (at your option) any later version. * * This program is distributed in the hope that it will be useful, * but WITHOUT ANY WARRANTY; without even the implied warranty of * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the * GNU General Public License for more details. * * You should have received a copy of the GNU General Public License * along with this program; if not, write to the Free Software * Foundation, Inc., 59 Temple Place - Suite 330, Boston, MA 02111, USA. *****************************************************************************/#define _ISOC99_SOURCE#undef NDEBUG // always check asserts, the speed effect is far too small to disable them#include <stdio.h>#include <string.h>#include <math.h>#include <limits.h>#include <assert.h>#include "include/common.h"#include "include/cpu.h"#include "include/ratecontrol.h"#if defined(SYS_FREEBSD) || defined(SYS_BEOS) || defined(SYS_NETBSD) || defined(SYS_OPENBSD)#define exp2f(x) powf( 2, (x) )#endif#if defined(SYS_MACOSX)#define exp2f(x) (float)pow( 2, (x) )#define sqrtf sqrt#endif#if defined(SYS_OPENBSD)#define isfinite finite#endif#if defined(_MSC_VER)#define isfinite _finite#endif#if defined(_MSC_VER) || defined(SYS_SunOS)#define exp2f(x) pow( 2, (x) )#define sqrtf sqrt#endif#ifdef WIN32 // POSIX says that rename() removes the destination, but win32 doesn't.#define rename(src,dst) (unlink(dst), rename(src,dst))#endif//typedef struct
//{
// int pict_type;
// int kept_as_ref;
// float qscale;
// int mv_bits;
// int i_tex_bits;
// int p_tex_bits;
// int misc_bits;
// uint64_t expected_bits;
// float new_qscale;
// int new_qp;
// int i_count;
// int p_count;
// int s_count;
// float blurred_complexity;
// char direct_mode;
//} ratecontrol_entry_t;
//typedef struct
//{
// double coeff;
// double count;
// double decay;
//} predictor_t;
//struct x264_ratecontrol_t
//{
// /* constants */
// int b_abr;
// int b_2pass;
// int b_vbv;
// double fps;
// double bitrate;
// double rate_tolerance;
// int nmb; /* number of macroblocks in a frame */
// int qp_constant[5];
// /* current frame */
// ratecontrol_entry_t *rce;
// int qp; /* qp for current frame */
// int qpm; /* qp for current macroblock */
// float qpa; /* average of macroblocks' qp */
// int slice_type;
// int qp_force;
// /* VBV stuff */
// double buffer_size;
// double buffer_fill;
// double buffer_rate; /* # of bits added to buffer_fill after each frame */
// predictor_t pred[5]; /* predict frame size from satd */
// /* ABR stuff */
// int last_satd;
// double last_rceq;
// double cplxr_sum; /* sum of bits*qscale/rceq */
// double expected_bits_sum; /* sum of qscale2bits after rceq, ratefactor, and overflow */
// double wanted_bits_window; /* target bitrate * window */
// double cbr_decay;
// double short_term_cplxsum;
// double short_term_cplxcount;
// double rate_factor_constant;
// double ip_offset;
// double pb_offset;
// /* 2pass stuff */
// FILE *p_stat_file_out;
// char *psz_stat_file_tmpname;
// int num_entries; /* number of ratecontrol_entry_ts */
// ratecontrol_entry_t *entry; /* FIXME: copy needed data and free this once init is done */
// double last_qscale;
// double last_qscale_for[5]; /* last qscale for a specific pict type, used for max_diff & ipb factor stuff */
// int last_non_b_pict_type;
// double accum_p_qp; /* for determining I-frame quant */
// double accum_p_norm;
// double last_accum_p_norm;
// double lmin[5]; /* min qscale by frame type */
// double lmax[5];
// double lstep; /* max change (multiply) in qscale per frame */
// double i_cplx_sum[5]; /* estimated total texture bits in intra MBs at qscale=1 */
// double p_cplx_sum[5];
// double mv_bits_sum[5];
// int frame_count[5]; /* number of frames of each type */
// /* MBRC stuff */
// double frame_size_planned;
// int first_row, last_row; /* region of the frame to be encoded by this thread */
// predictor_t *row_pred;
// predictor_t row_preds[5];
// predictor_t pred_b_from_p; /* predict B-frame size from P-frame satd */
// int bframes; /* # consecutive B-frames before this P-frame */
// int bframe_bits; /* total cost of those frames */
// int i_zones;
// x264_zone_t *zones;
//};
static int parse_zones( x264_t *h );static int init_pass2(x264_t *);static float rate_estimate_qscale( x264_t *h, int pict_type );static void update_vbv( x264_t *h, int bits );static double predict_size( predictor_t *p, double q, double var );static void update_predictor( predictor_t *p, double q, double var, double bits );int x264_rc_analyse_slice( x264_t *h );/* Terminology: * qp = h.264's quantizer * qscale = linearized quantizer = Lagrange multiplier */static inline double qp2qscale(double qp){ return 0.85 * pow(2.0, ( qp - 12.0 ) / 6.0);}static inline double qscale2qp(double qscale){ return 12.0 + 6.0 * log(qscale/0.85) / log(2.0);}/* Texture bitrate is not quite inversely proportional to qscale, * probably due the the changing number of SKIP blocks. * MV bits level off at about qp<=12, because the lambda used * for motion estimation is constant there. */static inline double qscale2bits(ratecontrol_entry_t *rce, double qscale){ if(qscale<0.1) qscale = 0.1; return (rce->i_tex_bits + rce->p_tex_bits + .1) * pow( rce->qscale / qscale, 1.1 ) + rce->mv_bits * pow( X264_MAX(rce->qscale, 1) / X264_MAX(qscale, 1), 0.5 ) + rce->misc_bits;}int x264_ratecontrol_new( x264_t *h ){ x264_ratecontrol_t *rc; int i; x264_cpu_restore( h->param.cpu ); h->rc = rc = x264_malloc( h->param.i_threads * sizeof(x264_ratecontrol_t) ); memset( rc, 0, h->param.i_threads * sizeof(x264_ratecontrol_t) ); rc->b_abr = h->param.rc.i_rc_method != X264_RC_CQP && !h->param.rc.b_stat_read; rc->b_2pass = h->param.rc.i_rc_method == X264_RC_ABR && h->param.rc.b_stat_read; /* FIXME: use integers */ if(h->param.i_fps_num > 0 && h->param.i_fps_den > 0) rc->fps = (float) h->param.i_fps_num / h->param.i_fps_den; else rc->fps = 25.0; rc->bitrate = h->param.rc.i_bitrate * 1000; rc->rate_tolerance = h->param.rc.f_rate_tolerance; rc->nmb = h->mb.i_mb_count; rc->last_non_b_pict_type = -1; rc->cbr_decay = 1.0; if( h->param.rc.i_rc_method == X264_RC_CRF && h->param.rc.b_stat_read ) { x264_log(h, X264_LOG_ERROR, "constant rate-factor is incompatible with 2pass.\n"); return -1; } if( h->param.rc.i_vbv_buffer_size ) { if( h->param.rc.i_rc_method == X264_RC_CQP ) x264_log(h, X264_LOG_WARNING, "VBV is incompatible with constant QP, ignored.\n"); else if( h->param.rc.i_vbv_max_bitrate == 0 ) { x264_log( h, X264_LOG_DEBUG, "VBV maxrate unspecified, assuming CBR\n" ); h->param.rc.i_vbv_max_bitrate = h->param.rc.i_bitrate; } } if( h->param.rc.i_vbv_max_bitrate < h->param.rc.i_bitrate && h->param.rc.i_vbv_max_bitrate > 0) x264_log(h, X264_LOG_WARNING, "max bitrate less than average bitrate, ignored.\n"); else if( h->param.rc.i_vbv_max_bitrate > 0 && h->param.rc.i_vbv_buffer_size > 0 ) { if( h->param.rc.i_vbv_buffer_size < 3 * h->param.rc.i_vbv_max_bitrate / rc->fps ) { h->param.rc.i_vbv_buffer_size = (int)(3 * h->param.rc.i_vbv_max_bitrate / rc->fps); x264_log( h, X264_LOG_WARNING, "VBV buffer size too small, using %d kbit\n", h->param.rc.i_vbv_buffer_size ); } rc->buffer_rate = h->param.rc.i_vbv_max_bitrate * 1000 / rc->fps; rc->buffer_size = h->param.rc.i_vbv_buffer_size * 1000; rc->buffer_fill = rc->buffer_size * h->param.rc.f_vbv_buffer_init; rc->cbr_decay = 1.0 - rc->buffer_rate / rc->buffer_size * 0.5 * X264_MAX(0, 1.5 - rc->buffer_rate * rc->fps / rc->bitrate); rc->b_vbv = 1; } else if( h->param.rc.i_vbv_max_bitrate ) x264_log(h, X264_LOG_WARNING, "VBV maxrate specified, but no bufsize.\n"); if(rc->rate_tolerance < 0.01) { x264_log(h, X264_LOG_WARNING, "bitrate tolerance too small, using .01\n"); rc->rate_tolerance = 0.01; } h->mb.b_variable_qp = rc->b_vbv && !rc->b_2pass; if( rc->b_abr ) { /* FIXME ABR_INIT_QP is actually used only in CRF */#define ABR_INIT_QP ( h->param.rc.i_rc_method == X264_RC_CRF ? h->param.rc.i_rf_constant : 24 ) rc->accum_p_norm = .01; rc->accum_p_qp = ABR_INIT_QP * rc->accum_p_norm; /* estimated ratio that produces a reasonable QP for the first I-frame */ rc->cplxr_sum = .01 * pow( 7.0e5, h->param.rc.f_qcompress ) * pow( h->mb.i_mb_count, 0.5 ); rc->wanted_bits_window = 1.0 * rc->bitrate / rc->fps; rc->last_non_b_pict_type = SLICE_TYPE_I; } if( h->param.rc.i_rc_method == X264_RC_CRF ) { /* arbitrary rescaling to make CRF somewhat similar to QP */ double base_cplx = h->mb.i_mb_count * (h->param.i_bframe ? 120 : 80); rc->rate_factor_constant = pow( base_cplx, 1 - h->param.rc.f_qcompress ) / qp2qscale( h->param.rc.i_rf_constant ); } rc->ip_offset = 6.0 * log(h->param.rc.f_ip_factor) / log(2.0); rc->pb_offset = 6.0 * log(h->param.rc.f_pb_factor) / log(2.0); rc->qp_constant[SLICE_TYPE_P] = h->param.rc.i_qp_constant; rc->qp_constant[SLICE_TYPE_I] = (x264_clip3( h->param.rc.i_qp_constant - rc->ip_offset + 0.5, 0, 51 )); rc->qp_constant[SLICE_TYPE_B] = (x264_clip3( h->param.rc.i_qp_constant + rc->pb_offset + 0.5, 0, 51 )); rc->lstep = exp2f(h->param.rc.i_qp_step / 6.0); rc->last_qscale = qp2qscale(26); for( i = 0; i < 5; i++ ) { rc->last_qscale_for[i] = qp2qscale( ABR_INIT_QP ); rc->lmin[i] = qp2qscale( h->param.rc.i_qp_min ); rc->lmax[i] = qp2qscale( h->param.rc.i_qp_max ); rc->pred[i].coeff= 2.0; rc->pred[i].count= 1.0; rc->pred[i].decay= 0.5; rc->row_preds[i].coeff= .25; rc->row_preds[i].count= 1.0; rc->row_preds[i].decay= 0.5; } rc->pred_b_from_p = rc->pred[0]; if( parse_zones( h ) < 0 ) return -1; /* Load stat file and init 2pass algo */ if( h->param.rc.b_stat_read ) { char *p, *stats_in, *stats_buf; /* read 1st pass stats */ assert( h->param.rc.psz_stat_in ); stats_buf = stats_in = x264_slurp_file( h->param.rc.psz_stat_in ); if( !stats_buf ) { x264_log(h, X264_LOG_ERROR, "ratecontrol_init: can't open stats file\n"); return -1; } /* check whether 1st pass options were compatible with current options */ if( !strncmp( stats_buf, "#options:", 9 ) ) { int i; char *opts = stats_buf; stats_in = strchr( stats_buf, '\n' ); if( !stats_in ) return -1; *stats_in = '\0'; stats_in++; if( ( p = strstr( opts, "bframes=" ) ) && sscanf( p, "bframes=%d", &i ) && h->param.i_bframe != i ) { x264_log( h, X264_LOG_ERROR, "different number of B-frames than 1st pass (%d vs %d)\n", h->param.i_bframe, i ); return -1; } /* since B-adapt doesn't (yet) take into account B-pyramid, * the converse is not a problem */ if( strstr( opts, "b_pyramid=1" ) && !h->param.b_bframe_pyramid ) x264_log( h, X264_LOG_WARNING, "1st pass used B-pyramid, 2nd doesn't\n" ); if( ( p = strstr( opts, "keyint=" ) ) && sscanf( p, "keyint=%d", &i ) && h->param.i_keyint_max != i ) x264_log( h, X264_LOG_WARNING, "different keyint than 1st pass (%d vs %d)\n", h->param.i_keyint_max, i ); if( strstr( opts, "qp=0" ) && h->param.rc.i_rc_method == X264_RC_ABR ) x264_log( h, X264_LOG_WARNING, "1st pass was lossless, bitrate prediction will be inaccurate\n" ); } /* find number of pics */ p = stats_in; for(i=-1; p; i++) p = strchr(p+1, ';'); if(i==0) { x264_log(h, X264_LOG_ERROR, "empty stats file\n"); return -1; } rc->num_entries = i; if( h->param.i_frame_total < rc->num_entries && h->param.i_frame_total > 0 ) { x264_log( h, X264_LOG_WARNING, "2nd pass has fewer frames than 1st pass (%d vs %d)\n", h->param.i_frame_total, rc->num_entries ); } if( h->param.i_frame_total > rc->num_entries + h->param.i_bframe ) { x264_log( h, X264_LOG_ERROR, "2nd pass has more frames than 1st pass (%d vs %d)\n", h->param.i_frame_total, rc->num_entries ); return -1; } /* FIXME: ugly padding because VfW drops delayed B-frames */ rc->num_entries += h->param.i_bframe; rc->entry = (ratecontrol_entry_t*) x264_malloc(rc->num_entries * sizeof(ratecontrol_entry_t)); memset(rc->entry, 0, rc->num_entries * sizeof(ratecontrol_entry_t)); /* init all to skipped p frames */ for(i=0; i<rc->num_entries; i++){ ratecontrol_entry_t *rce = &rc->entry[i]; rce->pict_type = SLICE_TYPE_P; rce->qscale = rce->new_qscale = (float)qp2qscale(20); rce->misc_bits = rc->nmb + 10;
⌨️ 快捷键说明
复制代码
Ctrl + C
搜索代码
Ctrl + F
全屏模式
F11
切换主题
Ctrl + Shift + D
显示快捷键
?
增大字号
Ctrl + =
减小字号
Ctrl + -