// vp9_ratectrl.h
  /*
   *  Copyright (c) 2010 The WebM project authors. All Rights Reserved.
   *
   *  Use of this source code is governed by a BSD-style license
   *  that can be found in the LICENSE file in the root of the source
   *  tree. An additional intellectual property rights grant can be found
   *  in the file PATENTS.  All contributing project authors may
   *  be found in the AUTHORS file in the root of the source tree.
   */
  10. #ifndef VPX_VP9_ENCODER_VP9_RATECTRL_H_
  11. #define VPX_VP9_ENCODER_VP9_RATECTRL_H_
  12. #include "vpx/vpx_codec.h"
  13. #include "vpx/vpx_integer.h"
  14. #include "vp9/common/vp9_blockd.h"
  15. #include "vp9/encoder/vp9_lookahead.h"
  16. #ifdef __cplusplus
  17. extern "C" {
  18. #endif
  // Compile-time constants shared by the rate control code.

  // Used to control aggressive VBR mode (left disabled here; uncomment to
  // define it).
  // #define AGGRESSIVE_VBR 1

  // Bits Per MB at different Q (Multiplied by 512, i.e. 1 << BPER_MB_NORMBITS)
  #define BPER_MB_NORMBITS 9

  #define MIN_GF_INTERVAL 4
  #define MAX_GF_INTERVAL 16
  #define FIXED_GF_INTERVAL 8  // Used in some testing modes only
  #define ONEHALFONLY_RESIZE 0

  #define FRAME_OVERHEAD_BITS 200

  // Threshold used to define a KF group as static (e.g. a slide show).
  // Essentially this means that no frame in the group has more than 1% of MBs
  // that are not marked as coded with 0,0 motion in the first pass.
  #define STATIC_KF_GROUP_THRESH 99

  // The maximum duration of a GF group that is static (for example a slide
  // show).
  #define MAX_STATIC_GF_GROUP_LENGTH 250
  // Rate factor levels. The values are used as array indices (RATE_CONTROL
  // sizes several per-level arrays with RATE_FACTOR_LEVELS), so the numeric
  // values must stay dense and start at 0.
  typedef enum {
    INTER_NORMAL = 0,
    INTER_HIGH = 1,
    GF_ARF_LOW = 2,
    GF_ARF_STD = 3,
    KF_STD = 4,
    RATE_FACTOR_LEVELS = 5  // Number of levels; not a level itself.
  } RATE_FACTOR_LEVEL;
  // Internal frame scaling level.
  typedef enum {
    UNSCALED = 0,     // Frame is unscaled.
    SCALE_STEP1 = 1,  // First-level down-scaling.
    FRAME_SCALE_STEPS  // Number of scaling levels (array dimension).
  } FRAME_SCALE_LEVEL;
  // Resize step to apply. Positive values scale down, negative values scale
  // back up, as described per enumerator.
  typedef enum {
    NO_RESIZE = 0,
    DOWN_THREEFOUR = 1,  // From orig to 3/4.
    DOWN_ONEHALF = 2,    // From orig or 3/4 to 1/2.
    UP_THREEFOUR = -1,   // From 1/2 to 3/4.
    UP_ORIG = -2         // From 1/2 or 3/4 to orig.
  } RESIZE_ACTION;
  // Resize states: original size, 3/4 and 1/2 (per the enumerator names).
  typedef enum {
    ORIG = 0,
    THREE_QUARTER = 1,
    ONE_HALF = 2
  } RESIZE_STATE;
  56. // Frame dimensions multiplier wrt the native frame size, in 1/16ths,
  57. // specified for the scale-up case.
  58. // e.g. 24 => 16/24 = 2/3 of native size. The restriction to 1/16th is
  59. // intended to match the capabilities of the normative scaling filters,
  60. // giving precedence to the up-scaling accuracy.
  61. static const int frame_scale_factor[FRAME_SCALE_STEPS] = { 16, 24 };
  62. // Multiplier of the target rate to be used as threshold for triggering scaling.
  63. static const double rate_thresh_mult[FRAME_SCALE_STEPS] = { 1.0, 2.0 };
  64. // Scale dependent Rate Correction Factor multipliers. Compensates for the
  65. // greater number of bits per pixel generated in down-scaled frames.
  66. static const double rcf_mult[FRAME_SCALE_STEPS] = { 1.0, 2.0 };
  67. typedef struct {
  68. // Rate targetting variables
  69. int base_frame_target; // A baseline frame target before adjustment
  70. // for previous under or over shoot.
  71. int this_frame_target; // Actual frame target after rc adjustment.
  72. int projected_frame_size;
  73. int sb64_target_rate;
  74. int last_q[FRAME_TYPES]; // Separate values for Intra/Inter
  75. int last_boosted_qindex; // Last boosted GF/KF/ARF q
  76. int last_kf_qindex; // Q index of the last key frame coded.
  77. int gfu_boost;
  78. int last_boost;
  79. int kf_boost;
  80. double rate_correction_factors[RATE_FACTOR_LEVELS];
  81. int frames_since_golden;
  82. int frames_till_gf_update_due;
  83. int min_gf_interval;
  84. int max_gf_interval;
  85. int static_scene_max_gf_interval;
  86. int baseline_gf_interval;
  87. int constrained_gf_group;
  88. int frames_to_key;
  89. int frames_since_key;
  90. int this_key_frame_forced;
  91. int next_key_frame_forced;
  92. int source_alt_ref_pending;
  93. int source_alt_ref_active;
  94. int is_src_frame_alt_ref;
  95. int avg_frame_bandwidth; // Average frame size target for clip
  96. int min_frame_bandwidth; // Minimum allocation used for any frame
  97. int max_frame_bandwidth; // Maximum burst rate allowed for a frame.
  98. int ni_av_qi;
  99. int ni_tot_qi;
  100. int ni_frames;
  101. int avg_frame_qindex[FRAME_TYPES];
  102. double tot_q;
  103. double avg_q;
  104. int64_t buffer_level;
  105. int64_t bits_off_target;
  106. int64_t vbr_bits_off_target;
  107. int64_t vbr_bits_off_target_fast;
  108. int decimation_factor;
  109. int decimation_count;
  110. int rolling_target_bits;
  111. int rolling_actual_bits;
  112. int long_rolling_target_bits;
  113. int long_rolling_actual_bits;
  114. int rate_error_estimate;
  115. int64_t total_actual_bits;
  116. int64_t total_target_bits;
  117. int64_t total_target_vs_actual;
  118. int worst_quality;
  119. int best_quality;
  120. int64_t starting_buffer_level;
  121. int64_t optimal_buffer_level;
  122. int64_t maximum_buffer_size;
  123. // rate control history for last frame(1) and the frame before(2).
  124. // -1: undershot
  125. // 1: overshoot
  126. // 0: not initialized.
  127. int rc_1_frame;
  128. int rc_2_frame;
  129. int q_1_frame;
  130. int q_2_frame;
  131. // Keep track of the last target average frame bandwidth.
  132. int last_avg_frame_bandwidth;
  133. // Auto frame-scaling variables.
  134. FRAME_SCALE_LEVEL frame_size_selector;
  135. FRAME_SCALE_LEVEL next_frame_size_selector;
  136. int frame_width[FRAME_SCALE_STEPS];
  137. int frame_height[FRAME_SCALE_STEPS];
  138. int rf_level_maxq[RATE_FACTOR_LEVELS];
  139. int fac_active_worst_inter;
  140. int fac_active_worst_gf;
  141. uint64_t avg_source_sad[MAX_LAG_BUFFERS];
  142. uint64_t prev_avg_source_sad_lag;
  143. int high_source_sad_lagindex;
  144. int high_num_blocks_with_motion;
  145. int alt_ref_gf_group;
  146. int last_frame_is_src_altref;
  147. int high_source_sad;
  148. int count_last_scene_change;
  149. int hybrid_intra_scene_change;
  150. int re_encode_maxq_scene_change;
  151. int avg_frame_low_motion;
  152. int af_ratio_onepass_vbr;
  153. int force_qpmin;
  154. int reset_high_source_sad;
  155. double perc_arf_usage;
  156. int force_max_q;
  157. // Last frame was dropped post encode on scene change.
  158. int last_post_encode_dropped_scene_change;
  159. // Enable post encode frame dropping for screen content. Only enabled when
  160. // ext_use_post_encode_drop is enabled by user.
  161. int use_post_encode_drop;
  162. // External flag to enable post encode frame dropping, controlled by user.
  163. int ext_use_post_encode_drop;
  164. int damped_adjustment[RATE_FACTOR_LEVELS];
  165. double arf_active_best_quality_adjustment_factor;
  166. int arf_active_best_quality_adjustment_window;
  167. int preserve_arf_as_gld;
  168. int preserve_next_arf_as_gld;
  169. int show_arf_as_gld;
  170. } RATE_CONTROL;
  171. struct VP9_COMP;
  172. struct VP9EncoderConfig;
  173. void vp9_rc_init(const struct VP9EncoderConfig *oxcf, int pass,
  174. RATE_CONTROL *rc);
  175. int vp9_estimate_bits_at_q(FRAME_TYPE frame_type, int q, int mbs,
  176. double correction_factor, vpx_bit_depth_t bit_depth);
  177. double vp9_convert_qindex_to_q(int qindex, vpx_bit_depth_t bit_depth);
  178. int vp9_convert_q_to_qindex(double q_val, vpx_bit_depth_t bit_depth);
  179. void vp9_rc_init_minq_luts(void);
  180. int vp9_rc_get_default_min_gf_interval(int width, int height, double framerate);
  181. // Note vp9_rc_get_default_max_gf_interval() requires the min_gf_interval to
  182. // be passed in to ensure that the max_gf_interval returned is at least as big
  183. // as that.
  184. int vp9_rc_get_default_max_gf_interval(double framerate, int min_gf_interval);
  // Generally at the high level, the following flow is expected
  // to be enforced for rate control:
  // First call per frame, one of:
  //   vp9_rc_get_one_pass_vbr_params()
  //   vp9_rc_get_one_pass_cbr_params()
  //   vp9_rc_get_svc_params()
  //   vp9_rc_get_first_pass_params()
  //   vp9_rc_get_second_pass_params()
  // depending on the usage to set the rate control encode parameters desired.
  //
  // Then, call encode_frame_to_data_rate() to perform the
  // actual encode. This function will in turn call encode_frame()
  // one or more times, followed by one of:
  //   vp9_rc_postencode_update()
  //   vp9_rc_postencode_update_drop_frame()
  //
  // The majority of rate control parameters are only expected
  // to be set in the vp9_rc_get_..._params() functions and
  // updated during the vp9_rc_postencode_update...() functions.
  // The only exceptions are vp9_rc_drop_frame() and
  // vp9_rc_update_rate_correction_factors() functions.

  // Functions to set parameters for encoding before the actual
  // encode_frame_to_data_rate() function.
  void vp9_rc_get_one_pass_vbr_params(struct VP9_COMP *cpi);
  void vp9_rc_get_one_pass_cbr_params(struct VP9_COMP *cpi);
  void vp9_rc_get_svc_params(struct VP9_COMP *cpi);

  // Post encode update of the rate control parameters based
  // on bytes used
  void vp9_rc_postencode_update(struct VP9_COMP *cpi, uint64_t bytes_used);
  // Post encode update of the rate control parameters for dropped frames
  void vp9_rc_postencode_update_drop_frame(struct VP9_COMP *cpi);

  // Updates rate correction factors
  // Changes only the rate correction factors in the rate control structure.
  void vp9_rc_update_rate_correction_factors(struct VP9_COMP *cpi);

  // Post encode drop for CBR mode.
  // NOTE(review): unlike its neighbours this name has no vp9_ prefix; it is
  // kept as-is because renaming would break existing callers.
  int post_encode_drop_cbr(struct VP9_COMP *cpi, size_t *size);

  // Decide if we should drop this frame: For 1-pass CBR.
  // Changes only the decimation count in the rate control structure
  int vp9_rc_drop_frame(struct VP9_COMP *cpi);
  224. // Computes frame size bounds.
  225. void vp9_rc_compute_frame_size_bounds(const struct VP9_COMP *cpi,
  226. int frame_target,
  227. int *frame_under_shoot_limit,
  228. int *frame_over_shoot_limit);
  229. // Picks q and q bounds given the target for bits
  230. int vp9_rc_pick_q_and_bounds(const struct VP9_COMP *cpi, int *bottom_index,
  231. int *top_index);
  232. // Estimates q to achieve a target bits per frame
  233. int vp9_rc_regulate_q(const struct VP9_COMP *cpi, int target_bits_per_frame,
  234. int active_best_quality, int active_worst_quality);
  235. // Estimates bits per mb for a given qindex and correction factor.
  236. int vp9_rc_bits_per_mb(FRAME_TYPE frame_type, int qindex,
  237. double correction_factor, vpx_bit_depth_t bit_depth);
  238. // Clamping utilities for bitrate targets for iframes and pframes.
  239. int vp9_rc_clamp_iframe_target_size(const struct VP9_COMP *const cpi,
  240. int target);
  241. int vp9_rc_clamp_pframe_target_size(const struct VP9_COMP *const cpi,
  242. int target);
  243. // Utility to set frame_target into the RATE_CONTROL structure
  244. // This function is called only from the vp9_rc_get_..._params() functions.
  245. void vp9_rc_set_frame_target(struct VP9_COMP *cpi, int target);
  246. // Computes a q delta (in "q index" terms) to get from a starting q value
  247. // to a target q value
  248. int vp9_compute_qdelta(const RATE_CONTROL *rc, double qstart, double qtarget,
  249. vpx_bit_depth_t bit_depth);
  250. // Computes a q delta (in "q index" terms) to get from a starting q value
  251. // to a value that should equate to the given rate ratio.
  252. int vp9_compute_qdelta_by_rate(const RATE_CONTROL *rc, FRAME_TYPE frame_type,
  253. int qindex, double rate_target_ratio,
  254. vpx_bit_depth_t bit_depth);
  255. int vp9_frame_type_qdelta(const struct VP9_COMP *cpi, int rf_level, int q);
  256. void vp9_rc_update_framerate(struct VP9_COMP *cpi);
  257. void vp9_rc_set_gf_interval_range(const struct VP9_COMP *const cpi,
  258. RATE_CONTROL *const rc);
  259. void vp9_set_target_rate(struct VP9_COMP *cpi);
  260. int vp9_resize_one_pass_cbr(struct VP9_COMP *cpi);
  261. void vp9_scene_detection_onepass(struct VP9_COMP *cpi);
  262. int vp9_encodedframe_overshoot(struct VP9_COMP *cpi, int frame_size, int *q);
  263. void vp9_configure_buffer_updates(struct VP9_COMP *cpi, int gf_group_index);
  264. void vp9_estimate_qp_gop(struct VP9_COMP *cpi);
  265. #ifdef __cplusplus
  266. } // extern "C"
  267. #endif
  268. #endif // VPX_VP9_ENCODER_VP9_RATECTRL_H_