AOMedia AV1 Codec
ratectrl.h
1 /*
2  * Copyright (c) 2016, Alliance for Open Media. All rights reserved
3  *
4  * This source code is subject to the terms of the BSD 2 Clause License and
5  * the Alliance for Open Media Patent License 1.0. If the BSD 2 Clause License
6  * was not distributed with this source code in the LICENSE file, you can
7  * obtain it at www.aomedia.org/license/software. If the Alliance for Open
8  * Media Patent License 1.0 was not distributed with this source code in the
9  * PATENTS file, you can obtain it at www.aomedia.org/license/patent.
10  */
11 
12 #ifndef AOM_AV1_ENCODER_RATECTRL_H_
13 #define AOM_AV1_ENCODER_RATECTRL_H_
14 
15 #include "aom/aom_codec.h"
16 #include "aom/aom_integer.h"
17 
18 #include "aom_ports/mem.h"
19 
20 #include "av1/common/av1_common_int.h"
21 #include "av1/common/blockd.h"
22 
23 #ifdef __cplusplus
24 extern "C" {
25 #endif
26 
29 // Bits Per MB at different Q (Multiplied by 512)
30 #define BPER_MB_NORMBITS 9  // Normalization shift: 1 << 9 == 512.
31 
32 // Use this macro to turn on/off use of alt-refs in one-pass mode.
33 #define USE_ALTREF_FOR_ONE_PASS 1
34 
35 // Threshold used to define if a KF group is static (e.g. a slide show).
36 // Essentially, this means that no frame in the group has more than 1% of MBs
37 // that are not marked as coded with 0,0 motion in the first pass.
38 #define STATIC_KF_GROUP_THRESH 99  // Threshold expressed as a percentage.
39 #define STATIC_KF_GROUP_FLOAT_THRESH 0.99  // Same threshold as a fraction.
40 
41 // The maximum duration of a GF group that is static (e.g. a slide show).
42 #define MAX_STATIC_GF_GROUP_LENGTH 250
43 
// NOTE(review): GF interval limits, presumably counted in frames; the _RT
// variants presumably apply to real-time mode. Confirm against ratectrl.c.
44 #define MIN_GF_INTERVAL 4
45 #define MAX_GF_INTERVAL 32
46 #define FIXED_GF_INTERVAL 16
47 #define MAX_GF_LENGTH_LAP 16
48 
49 #define FIXED_GF_INTERVAL_RT 80
50 #define MAX_GF_INTERVAL_RT 160
51 
52 #define MAX_NUM_GF_INTERVALS 15  // Capacity of the gf_intervals[] array.
53 
54 #define MAX_ARF_LAYERS 6  // active_best_quality[] has MAX_ARF_LAYERS + 1 slots.
55 // #define STRICT_RC
56 
57 #define DEFAULT_KF_BOOST_RT 2300
58 #define DEFAULT_GF_BOOST_RT 2000
59 
60 // A passive rate control strategy for screen content type in real-time mode.
61 // When it is turned on, the compression performance is improved by
62 // 7.8% (overall_psnr), 5.0% (VMAF) on average. Some clips see gains
63 // over 20% on metric.
64 // The downside is that it does not guarantee frame size.
65 // Since RT mode has a tight restriction on buffer overflow control, we
66 // turn it off by default.
67 #define RT_PASSIVE_STRATEGY 0
68 #define MAX_Q_HISTORY 1000  // Capacity of the q_history[] array.
69 
// Bundles a resize width/height pair with a super-resolution denominator.
// NOTE(review): units and valid ranges are not visible in this header -
// confirm against the code that fills this struct.
70 typedef struct {
71  int resize_width;
72  int resize_height;
73  uint8_t superres_denom;
74 } size_params_type;
75 
// Rate factor levels. The trailing RATE_FACTOR_LEVELS enumerator is the number
// of levels and sizes the rate_correction_factors[] style arrays in this file.
76 enum {
77  INTER_NORMAL,
78  GF_ARF_LOW,
79  GF_ARF_STD,
80  KF_STD,
81  RATE_FACTOR_LEVELS  // Count of levels; keep last.
82 } UENUM1BYTE(RATE_FACTOR_LEVEL);
83 
// Frame update types; passed as the frame_update_type argument of the
// P-frame target-size helpers declared in this header.
84 enum {
85  KF_UPDATE,
86  LF_UPDATE,
87  GF_UPDATE,
88  ARF_UPDATE,
89  OVERLAY_UPDATE,
90  INTNL_OVERLAY_UPDATE, // Internal Overlay Frame
91  INTNL_ARF_UPDATE, // Internal Altref Frame
92  FRAME_UPDATE_TYPES  // Count of update types; keep last.
93 } UENUM1BYTE(FRAME_UPDATE_TYPE);
94 
// Actions that can be applied to the reference frame buffer.
95 enum {
96  REFBUF_RESET, // Clear reference frame buffer
97  REFBUF_UPDATE, // Refresh reference frame buffer
98  REFBUF_STATES  // Count of states; keep last.
99 } UENUM1BYTE(REFBUF_STATE);
100 
// Resize steps between the original, 3/4 and 1/2 scales. Positive values
// scale down, negative values scale back up, and 0 means no change.
101 typedef enum {
102  NO_RESIZE = 0,
103  DOWN_THREEFOUR = 1, // From orig to 3/4.
104  DOWN_ONEHALF = 2, // From orig or 3/4 to 1/2.
105  UP_THREEFOUR = -1, // From 1/2 to 3/4.
106  UP_ORIG = -2, // From 1/2 or 3/4 to orig.
107 } RESIZE_ACTION;
108 
// Scale state stored in RATE_CONTROL::resize_state (dynamic resize, 1 pass
// cbr): original size, three quarters, or one half.
109 typedef enum { ORIG = 0, THREE_QUARTER = 1, ONE_HALF = 2 } RESIZE_STATE;
110 
// Capacity of the regions[] array declared later in this header.
111 #define MAX_FIRSTPASS_ANALYSIS_FRAMES 150
// Classification stored in REGIONS::type.
112 typedef enum region_types {
113  STABLE_REGION = 0,
114  HIGH_VAR_REGION = 1,
115  SCENECUT_REGION = 2,
116  BLENDING_REGION = 3,
117 } REGION_TYPES;
118 
// One analysed region: its bounds, averaged statistics and classification.
// NOTE(review): start/last look like inclusive frame indices - confirm
// against the first-pass analysis code that fills this struct.
119 typedef struct regions {
120  int start;
121  int last;
122  double avg_noise_var;
123  double avg_cor_coeff;
124  double avg_sr_fr_ratio;
125  double avg_intra_err;
126  double avg_coded_err;
127  REGION_TYPES type;  // One of the REGION_TYPES values.
128 } REGIONS;
129 
// Rate Control parameters and status.
134 typedef struct {
135  // Rate targeting variables
136 
145  int this_frame_target; // Actual frame target after rc adjustment.
146 
151 
156 
161 
166 
171 
176 
178  int min_gf_interval;
179  int max_gf_interval;
180  int static_scene_max_gf_interval;
187  int frames_since_key;
188  int frames_to_fwd_kf;
189  int is_src_frame_alt_ref;
190  int sframe_due;
191 
192  int high_source_sad;
193  uint64_t avg_source_sad;
194  uint64_t prev_avg_source_sad;
195  uint64_t frame_source_sad;
196 
197  int avg_frame_bandwidth; // Average frame size target for clip
198  int min_frame_bandwidth; // Minimum allocation used for any frame
199  int max_frame_bandwidth; // Maximum burst rate allowed for a frame.
200  int prev_avg_frame_bandwidth;
201 
202  int ni_av_qi;
203  int ni_tot_qi;
204 
205  int decimation_factor;
206  int decimation_count;
207  int prev_frame_is_dropped;
208  int drop_count_consec;
209  int max_consec_drop;
210 
215  unsigned int frame_number_encoded;
216 
226 
229  // rate control history for last frame(1) and the frame before(2).
230  // -1: overshoot
231  // 1: undershoot
232  // 0: not initialized.
233  int rc_1_frame;
234  int rc_2_frame;
235  int q_1_frame;
236  int q_2_frame;
237 
243 
245  // Track amount of low motion in scene
246  int avg_frame_low_motion;
247  int cnt_zeromv;
248 
249  // signals if number of blocks with motion is high
250  int percent_blocks_with_motion;
251 
252  // Maximum value of source sad across all blocks of frame.
253  uint64_t max_block_source_sad;
254 
255  // For dynamic resize, 1 pass cbr.
256  RESIZE_STATE resize_state;
257  int resize_avg_qp;
258  int resize_buffer_underflow;
259  int resize_count;
260 
261  // Flag to disable content related qp adjustment.
262  int rtc_external_ratectrl;
263 
264  // Stores fast_extra_bits of the current frame.
265  int frame_level_fast_extra_bits;
266 
// One correction factor per RATE_FACTOR_LEVEL value.
267  double frame_level_rate_correction_factors[RATE_FACTOR_LEVELS];
268 
269  int frame_num_last_gf_refresh;
270 
271  int prev_coded_width;
272  int prev_coded_height;
273 
274  // The ratio used for inter frames in bit estimation.
275  // TODO(yunqing): if golden frame is treated differently (e.g. gf_cbr_boost_
276  // pct > THR), consider to add bit_est_ratio_g for golden frames.
277  int bit_est_ratio;
278 
279  // Whether to use a fixed qp for the frame, bypassing internal rate control.
280  // This flag will reset to 0 after every frame.
281  int use_external_qp_one_pass;
283 } RATE_CONTROL;
284 
288 typedef struct {
289  // Sub-gop level Rate targeting variables
290 
294  int64_t gf_group_bits;
295 
299  int kf_boost;
300 
305 
309  int gf_intervals[MAX_NUM_GF_INTERVALS];
310 
315 
317  int num_regions;
318 
319  REGIONS regions[MAX_FIRSTPASS_ANALYSIS_FRAMES];
320  int regions_offset; // offset of regions from the last keyframe
321  int frames_till_regions_update;
322 
323  int baseline_gf_interval;
324 
325  int constrained_gf_group;
326 
327  int this_key_frame_forced;
328 
329  int next_key_frame_forced;
336 
341 
346 
350  int arf_q;
351 
353  float_t arf_boost_factor;
354 
355  int base_layer_qp;
356 
357  // Total number of stats used only for kf_boost calculation.
358  int num_stats_used_for_kf_boost;
359 
360  // Total number of stats used only for gfu_boost calculation.
361  int num_stats_used_for_gfu_boost;
362 
363  // Total number of stats required by gfu_boost calculation.
364  int num_stats_required_for_gfu_boost;
365 
366  int enable_scenecut_detection;
367 
368  int use_arf_in_this_kf_group;
369 
370  int ni_frames;
371 
372  double tot_q;
379 
383  int avg_frame_qindex[FRAME_TYPES];
384 
385 #if CONFIG_FPMT_TEST
390  int temp_active_best_quality[MAX_ARF_LAYERS + 1];
391 
396  int temp_last_boosted_qindex;
397 
402  double temp_avg_q;
403 
408  int temp_last_q[FRAME_TYPES];
409 
414  int temp_projected_frame_size;
415 
420  int64_t temp_total_actual_bits;
421 
426  int64_t temp_buffer_level;
427 
432  int64_t temp_vbr_bits_off_target;
433 
438  int64_t temp_vbr_bits_off_target_fast;
439 
444  double temp_rate_correction_factors[RATE_FACTOR_LEVELS];
445 
450  int temp_rate_error_estimate;
451 
456  int temp_rolling_arf_group_target_bits;
457 
462  int temp_rolling_arf_group_actual_bits;
463 
468  int64_t temp_bits_left;
469 
474  int temp_extend_minq;
475 
480  int temp_extend_maxq;
481 
482 #endif
486  int active_best_quality[MAX_ARF_LAYERS + 1];
487 
492 
496  double avg_q;
497 
501  int last_q[FRAME_TYPES];
502 
507  double rate_correction_factors[RATE_FACTOR_LEVELS];
508 
513 
518 
522  int64_t buffer_level;
523 
528 
533 
538 
544 
549 
555 
560  int q_history[MAX_Q_HISTORY];
562 
565 struct AV1_COMP;
566 struct AV1EncoderConfig;
567 struct GF_GROUP;
568 
569 void av1_primary_rc_init(const struct AV1EncoderConfig *oxcf,
570  PRIMARY_RATE_CONTROL *p_rc);
571 
572 void av1_rc_init(const struct AV1EncoderConfig *oxcf, RATE_CONTROL *rc);
573 
574 int av1_estimate_bits_at_q(const struct AV1_COMP *cpi, int q,
575  double correction_factor);
576 
577 double av1_convert_qindex_to_q(int qindex, aom_bit_depth_t bit_depth);
578 
579 void av1_rc_init_minq_luts(void);
580 
581 int av1_rc_get_default_min_gf_interval(int width, int height, double framerate);
582 // Note av1_rc_get_default_max_gf_interval() requires the min_gf_interval to
583 // be passed in to ensure that the max_gf_interval returned is at least as big
584 // as that.
585 int av1_rc_get_default_max_gf_interval(double framerate, int min_gf_interval);
586 
587 // Generally at the high level, the following flow is expected
588 // to be enforced for rate control:
589 // First call per frame, one of:
590 // av1_get_one_pass_rt_params()
591 // av1_get_second_pass_params()
592 // depending on the usage to set the rate control encode parameters desired.
593 //
594 // Then, call encode_frame_to_data_rate() to perform the
595 // actual encode. This function will in turn call encode_frame()
596 // one or more times, followed by:
597 // av1_rc_postencode_update_drop_frame()
598 //
599 // The majority of rate control parameters are only expected
600 // to be set in the av1_get_..._params() functions and
601 // updated during the av1_rc_postencode_update...() functions.
602 // The only exceptions are av1_rc_drop_frame() and
603 // av1_rc_update_rate_correction_factors() functions.
604 
605 // Functions to set parameters for encoding before the actual
606 // encode_frame_to_data_rate() function.
607 struct EncodeFrameInput;
608 
609 // Post encode update of the rate control parameters based
610 // on bytes used
611 void av1_rc_postencode_update(struct AV1_COMP *cpi, uint64_t bytes_used);
612 // Post encode update of the rate control parameters for dropped frames
613 void av1_rc_postencode_update_drop_frame(struct AV1_COMP *cpi);
614 
630  int is_encode_stage, int width,
631  int height);
634 // Decide if we should drop this frame: For 1-pass CBR.
635 // Changes only the decimation count in the rate control structure
636 int av1_rc_drop_frame(struct AV1_COMP *cpi);
637 
638 // Computes frame size bounds.
639 void av1_rc_compute_frame_size_bounds(const struct AV1_COMP *cpi,
640  int this_frame_target,
641  int *frame_under_shoot_limit,
642  int *frame_over_shoot_limit);
643 
// Picks q and q bounds given the rate control parameters in cpi->rc.
// NOTE(review): bottom_index / top_index look like output pointers for the
// chosen q bounds - confirm against the definition in ratectrl.c.
658 int av1_rc_pick_q_and_bounds(struct AV1_COMP *cpi, int width, int height,
659  int gf_index, int *bottom_index, int *top_index);
660 
// Estimates q to achieve a target bits per frame.
// NOTE(review): the result is presumably kept within
// [active_best_quality, active_worst_quality] - confirm in ratectrl.c.
673 int av1_rc_regulate_q(const struct AV1_COMP *cpi, int target_bits_per_frame,
674  int active_best_quality, int active_worst_quality,
675  int width, int height);
676 
678 // Gets the appropriate bpmb enumerator based on the frame and content type
679 int av1_get_bpmb_enumerator(FRAME_TYPE frame_type,
680  const int is_screen_content_type);
681 
682 // Estimates bits per mb for a given qindex and correction factor.
683 int av1_rc_bits_per_mb(const struct AV1_COMP *cpi, FRAME_TYPE frame_type,
684  int qindex, double correction_factor,
685  int accurate_estimate);
686 
687 // Clamping utilities for bitrate targets for iframes and pframes.
688 int av1_rc_clamp_iframe_target_size(const struct AV1_COMP *const cpi,
689  int64_t target);
690 int av1_rc_clamp_pframe_target_size(const struct AV1_COMP *const cpi,
691  int target, uint8_t frame_update_type);
692 
693 // Find q_index corresponding to desired_q, within [best_qindex, worst_qindex].
694 // To be precise, 'q_index' is the smallest integer, for which the corresponding
695 // q >= desired_q.
696 // If no such q index is found, returns 'worst_qindex'.
697 int av1_find_qindex(double desired_q, aom_bit_depth_t bit_depth,
698  int best_qindex, int worst_qindex);
699 
700 // Computes a q delta (in "q index" terms) to get from a starting q value
701 // to a target q value
702 int av1_compute_qdelta(const RATE_CONTROL *rc, double qstart, double qtarget,
703  aom_bit_depth_t bit_depth);
704 
705 // Computes a q delta (in "q index" terms) to get from a starting q value
706 // to a value that should equate to the given rate ratio.
707 int av1_compute_qdelta_by_rate(const struct AV1_COMP *cpi,
708  FRAME_TYPE frame_type, int qindex,
709  double rate_target_ratio);
710 
711 int av1_frame_type_qdelta(const struct AV1_COMP *cpi, int q);
712 
713 void av1_rc_update_framerate(struct AV1_COMP *cpi, int width, int height);
714 
715 void av1_rc_set_gf_interval_range(const struct AV1_COMP *const cpi,
716  RATE_CONTROL *const rc);
717 
718 void av1_set_target_rate(struct AV1_COMP *cpi, int width, int height);
719 
720 int av1_resize_one_pass_cbr(struct AV1_COMP *cpi);
721 
722 void av1_rc_set_frame_target(struct AV1_COMP *cpi, int target, int width,
723  int height);
724 
725 void av1_adjust_gf_refresh_qp_one_pass_rt(struct AV1_COMP *cpi);
726 
728  int gf_update);
729 
743  const struct AV1_COMP *const cpi, FRAME_UPDATE_TYPE frame_update_type);
744 
756 
769  const struct AV1_COMP *cpi, FRAME_UPDATE_TYPE frame_update_type);
770 
782 
802  FRAME_TYPE *const frame_type,
803  const struct EncodeFrameInput *frame_input,
804  unsigned int frame_flags);
805 
// Increase q on expected encoder overshoot, for CBR mode.
// NOTE(review): q is a non-const pointer, so it is presumably updated in
// place; the meaning of the return value is not visible here - confirm.
820 int av1_encodedframe_overshoot_cbr(struct AV1_COMP *cpi, int *q);
821 
833 int av1_q_mode_get_q_index(int base_q_index, int gf_update_type,
834  int gf_pyramid_level, int arf_q);
835 
845 int av1_get_arf_q_index(int base_q_index, int gfu_boost, int bit_depth,
846  double arf_boost_factor);
847 
848 #if !CONFIG_REALTIME_ONLY
849 struct TplDepFrame;
857 int av1_get_arf_q_index_q_mode(struct AV1_COMP *cpi,
858  struct TplDepFrame *tpl_frame);
859 #endif
860 #ifdef __cplusplus
861 } // extern "C"
862 #endif
863 
864 #endif // AOM_AV1_ENCODER_RATECTRL_H_
Describes the codec algorithm interface to applications.
enum aom_bit_depth aom_bit_depth_t
Bit depth for codec. This enumeration determines the bit depth of the codec.
int av1_calc_pframe_target_size_one_pass_vbr(const struct AV1_COMP *const cpi, FRAME_UPDATE_TYPE frame_update_type)
Calculates how many bits to use for a P frame in one pass vbr.
void av1_rc_update_rate_correction_factors(struct AV1_COMP *cpi, int is_encode_stage, int width, int height)
Updates the rate correction factor linking Q to output bits.
Definition: ratectrl.c:771
int av1_encodedframe_overshoot_cbr(struct AV1_COMP *cpi, int *q)
Increase q on expected encoder overshoot, for CBR mode.
Definition: ratectrl.c:3480
void av1_get_one_pass_rt_params(struct AV1_COMP *cpi, FRAME_TYPE *const frame_type, const struct EncodeFrameInput *frame_input, unsigned int frame_flags)
Setup the rate control parameters for 1 pass real-time mode.
int av1_calc_pframe_target_size_one_pass_cbr(const struct AV1_COMP *cpi, FRAME_UPDATE_TYPE frame_update_type)
Calculates how many bits to use for a P frame in one pass cbr.
int av1_rc_pick_q_and_bounds(struct AV1_COMP *cpi, int width, int height, int gf_index, int *bottom_index, int *top_index)
Picks q and q bounds given the rate control parameters in cpi->rc.
Definition: ratectrl.c:2139
int av1_calc_iframe_target_size_one_pass_cbr(const struct AV1_COMP *cpi)
Calculates how many bits to use for an i frame in one pass cbr.
int av1_calc_iframe_target_size_one_pass_vbr(const struct AV1_COMP *const cpi)
Calculates how many bits to use for an i frame in one pass vbr.
int av1_rc_regulate_q(const struct AV1_COMP *cpi, int target_bits_per_frame, int active_best_quality, int active_worst_quality, int width, int height)
Estimates q to achieve a target bits per frame.
void av1_set_rtc_reference_structure_one_layer(AV1_COMP *cpi, int gf_update)
Setup the reference prediction structure for 1 pass real-time.
Definition: ratectrl.c:2857
Main encoder configuration data structure.
Definition: encoder.h:915
Top level encoder structure.
Definition: encoder.h:2872
Input frames and last input frame.
Definition: encoder.h:3661
Data related to the current GF/ARF group and the individual frames within the group.
Definition: firstpass.h:354
Primary Rate Control parameters and status.
Definition: ratectrl.h:288
int64_t bits_off_target
Definition: ratectrl.h:543
int rate_error_estimate
Definition: ratectrl.h:527
double avg_q
Definition: ratectrl.h:496
int64_t maximum_buffer_size
Definition: ratectrl.h:345
int kf_boost
Definition: ratectrl.h:299
int64_t starting_buffer_level
Definition: ratectrl.h:335
int64_t total_actual_bits
Definition: ratectrl.h:512
int64_t vbr_bits_off_target_fast
Definition: ratectrl.h:537
int rolling_target_bits
Definition: ratectrl.h:548
int64_t buffer_level
Definition: ratectrl.h:522
int gfu_boost
Definition: ratectrl.h:304
int64_t optimal_buffer_level
Definition: ratectrl.h:340
int arf_q
Definition: ratectrl.h:350
int rolling_actual_bits
Definition: ratectrl.h:554
int last_boosted_qindex
Definition: ratectrl.h:491
int cur_gf_index
Definition: ratectrl.h:314
int64_t total_target_bits
Definition: ratectrl.h:517
int last_kf_qindex
Definition: ratectrl.h:378
int64_t gf_group_bits
Definition: ratectrl.h:294
int64_t vbr_bits_off_target
Definition: ratectrl.h:532
Rate Control parameters and status.
Definition: ratectrl.h:134
int best_quality
Definition: ratectrl.h:225
int intervals_till_gf_calculate_due
Definition: ratectrl.h:175
int this_frame_target
Definition: ratectrl.h:145
int frames_to_key
Definition: ratectrl.h:185
int base_frame_target
Definition: ratectrl.h:141
int projected_frame_size
Definition: ratectrl.h:150
int worst_quality
Definition: ratectrl.h:221
int sb64_target_rate
Definition: ratectrl.h:160
int coefficient_size
Definition: ratectrl.h:155
int active_worst_quality
Definition: ratectrl.h:242
int frames_since_golden
Definition: ratectrl.h:165
int frames_till_gf_update_due
Definition: ratectrl.h:170