AOMedia AV1 Codec
ratectrl.h
1 /*
2  * Copyright (c) 2016, Alliance for Open Media. All rights reserved
3  *
4  * This source code is subject to the terms of the BSD 2 Clause License and
5  * the Alliance for Open Media Patent License 1.0. If the BSD 2 Clause License
6  * was not distributed with this source code in the LICENSE file, you can
7  * obtain it at www.aomedia.org/license/software. If the Alliance for Open
8  * Media Patent License 1.0 was not distributed with this source code in the
9  * PATENTS file, you can obtain it at www.aomedia.org/license/patent.
10  */
11 
12 #ifndef AOM_AV1_ENCODER_RATECTRL_H_
13 #define AOM_AV1_ENCODER_RATECTRL_H_
14 
15 #include "aom/aom_codec.h"
16 #include "aom/aom_integer.h"
17 
18 #include "aom_ports/mem.h"
19 
20 #include "av1/common/av1_common_int.h"
21 #include "av1/common/blockd.h"
22 
23 #ifdef __cplusplus
24 extern "C" {
25 #endif
26 
29 // Bits Per MB at different Q (Multiplied by 512)
30 #define BPER_MB_NORMBITS 9
31 
32 // Use this macro to turn on/off use of alt-refs in one-pass mode.
33 #define USE_ALTREF_FOR_ONE_PASS 1
34 
35 // Threshold used to define if a KF group is static (e.g. a slide show).
36 // Essentially, this means that no frame in the group has more than 1% of MBs
37 // that are not marked as coded with 0,0 motion in the first pass.
38 #define STATIC_KF_GROUP_THRESH 99
39 #define STATIC_KF_GROUP_FLOAT_THRESH 0.99
40 
41 // The maximum duration of a GF group that is static (e.g. a slide show).
42 #define MAX_STATIC_GF_GROUP_LENGTH 250
43 
44 #define MIN_GF_INTERVAL 4
45 #define MAX_GF_INTERVAL 32
46 #define FIXED_GF_INTERVAL 16
47 #define MAX_GF_LENGTH_LAP 16
48 
49 #define MAX_NUM_GF_INTERVALS 15
50 
51 #define MAX_ARF_LAYERS 6
52 // #define STRICT_RC
53 
// Frame size parameters: a resize width/height pair and a super-resolution
// denominator.
// NOTE(review): units and valid ranges are not visible in this header --
// confirm against the code that fills this struct in.
54 typedef struct {
55  int resize_width;
56  int resize_height;
57  uint8_t superres_denom;
58 } size_params_type;
59 
// Rate factor levels. RATE_FACTOR_LEVELS is the trailing count entry and is
// used as the size of the rate_correction_factors[] array in RATE_CONTROL.
60 enum {
61  INTER_NORMAL,
62  GF_ARF_LOW,
63  GF_ARF_STD,
64  KF_STD,
65  RATE_FACTOR_LEVELS
66 } UENUM1BYTE(RATE_FACTOR_LEVEL);
67 
// Update type of a frame. FRAME_UPDATE_TYPES is the trailing entry and so
// equals the number of update types listed before it.
68 enum {
69  KF_UPDATE,
70  LF_UPDATE,
71  GF_UPDATE,
72  ARF_UPDATE,
73  OVERLAY_UPDATE,
74  INTNL_OVERLAY_UPDATE, // Internal Overlay Frame
75  INTNL_ARF_UPDATE, // Internal Altref Frame
76  FRAME_UPDATE_TYPES
77 } UENUM1BYTE(FRAME_UPDATE_TYPE);
78 
// Action applied to the reference frame buffer. REFBUF_STATES is the trailing
// entry and so equals the number of states listed before it.
79 enum {
80  REFBUF_RESET, // Clear reference frame buffer
81  REFBUF_UPDATE, // Refresh reference frame buffer
82  REFBUF_STATES
83 } UENUM1BYTE(REFBUF_STATE);
84 
// Resize step to apply. Positive values scale the frame down, negative values
// scale it back up, and NO_RESIZE (0) leaves the size unchanged.
85 typedef enum {
86  NO_RESIZE = 0,
87  DOWN_THREEFOUR = 1, // From orig to 3/4.
88  DOWN_ONEHALF = 2, // From orig or 3/4 to 1/2.
89  UP_THREEFOUR = -1, // From 1/2 to 3/4.
90  UP_ORIG = -2, // From 1/2 or 3/4 to orig.
91 } RESIZE_ACTION;
92 
// Current resize scale (original, 3/4 or 1/2); stored in
// RATE_CONTROL::resize_state for dynamic resize in 1 pass cbr.
93 typedef enum { ORIG = 0, THREE_QUARTER = 1, ONE_HALF = 2 } RESIZE_STATE;
94 
// Capacity of the regions[] and cor_coeff[] arrays in RATE_CONTROL.
95 #define MAX_FIRSTPASS_ANALYSIS_FRAMES 150
// Classification assigned to a REGIONS entry (see REGIONS::type).
96 typedef enum region_types {
97  STABLE_REGION = 0,
98  HIGH_VAR_REGION = 1,
99  SCENECUT_REGION = 2,
100  BLENDING_REGION = 3,
101 } REGION_TYPES;
102 
// One analysed region: its start/last bounds, per-region average statistics
// and its REGION_TYPES classification.
// NOTE(review): start/last look like frame indices relative to
// RATE_CONTROL::regions_offset -- confirm against the code that fills them in.
103 typedef struct regions {
104  int start;
105  int last;
106  double avg_noise_var;
107  double avg_cor_coeff;
108  double avg_sr_fr_ratio;
109  double avg_intra_err;
110  double avg_coded_err;
111  REGION_TYPES type;
112 } REGIONS;
113 
// Rate Control parameters and status.
118 typedef struct {
119  // Rate targeting variables
120 
129  int this_frame_target; // Actual frame target after rc adjustment.
130 
134  int64_t gf_group_bits;
135 
140 
145 
150 
154  int last_q[FRAME_TYPES];
155 
160 
165 
173  int kf_boost;
174 
179  double rate_correction_factors[RATE_FACTOR_LEVELS];
180 
185 
190 
195 
199  int gf_intervals[MAX_NUM_GF_INTERVALS];
200 
205 
207  int num_regions;
208  REGIONS regions[MAX_FIRSTPASS_ANALYSIS_FRAMES];
209  double cor_coeff[MAX_FIRSTPASS_ANALYSIS_FRAMES];
210  int regions_offset; // offset of regions from the last keyframe
211  int frames_till_regions_update;
212 
213  int min_gf_interval;
214  int max_gf_interval;
215  int static_scene_max_gf_interval;
216  int baseline_gf_interval;
217  int constrained_gf_group;
224  int frames_since_key;
225  int this_key_frame_forced;
226  int next_key_frame_forced;
227  int is_src_frame_alt_ref;
228  int sframe_due;
229 
230  int high_source_sad;
231  uint64_t avg_source_sad;
232  uint64_t prev_avg_source_sad;
233 
234  int avg_frame_bandwidth; // Average frame size target for clip
235  int min_frame_bandwidth; // Minimum allocation used for any frame
236  int max_frame_bandwidth; // Maximum burst rate allowed for a frame.
237  int prev_avg_frame_bandwidth;
238 
239  int ni_av_qi;
240  int ni_tot_qi;
241  int ni_frames;
242  int avg_frame_qindex[FRAME_TYPES];
243  double tot_q;
244  double avg_q;
245 
246  int64_t buffer_level;
247  int64_t bits_off_target;
248  int64_t vbr_bits_off_target;
249  int64_t vbr_bits_off_target_fast;
250 
251  int decimation_factor;
252  int decimation_count;
253 
254  int rolling_target_bits;
255  int rolling_actual_bits;
256 
257  int rate_error_estimate;
258 
259  int64_t total_actual_bits;
260  int64_t total_target_bits;
261 
271 
286  // Rate control history for the last frame (1) and the frame before (2).
287  // -1: undershoot
288  // 1: overshoot
289  // 0: not initialized.
290  int rc_1_frame;
291  int rc_2_frame;
292  int q_1_frame;
293  int q_2_frame;
294 
295  float_t arf_boost_factor;
296 
301  int arf_q;
309  int active_best_quality[MAX_ARF_LAYERS + 1];
310 
312  int base_layer_qp;
313 
314  // Total number of stats used only for kf_boost calculation.
315  int num_stats_used_for_kf_boost;
316  // Total number of stats used only for gfu_boost calculation.
317  int num_stats_used_for_gfu_boost;
318  // Total number of stats required by gfu_boost calculation.
319  int num_stats_required_for_gfu_boost;
320  int next_is_fwd_key;
321  int enable_scenecut_detection;
322  int use_arf_in_this_kf_group;
323  // Track amount of low motion in scene
324  int avg_frame_low_motion;
325 
326  // For dynamic resize, 1 pass cbr.
327  RESIZE_STATE resize_state;
328  int resize_avg_qp;
329  int resize_buffer_underflow;
330  int resize_count;
332 } RATE_CONTROL;
333 
336 struct AV1_COMP;
337 struct AV1EncoderConfig;
338 
339 void av1_rc_init(const struct AV1EncoderConfig *oxcf, int pass,
340  RATE_CONTROL *rc);
341 
342 int av1_estimate_bits_at_q(FRAME_TYPE frame_kind, int q, int mbs,
343  double correction_factor, aom_bit_depth_t bit_depth,
344  const int is_screen_content_type);
345 
346 double av1_convert_qindex_to_q(int qindex, aom_bit_depth_t bit_depth);
347 
348 void av1_rc_init_minq_luts(void);
349 
350 int av1_rc_get_default_min_gf_interval(int width, int height, double framerate);
351 // Note av1_rc_get_default_max_gf_interval() requires the min_gf_interval to
352 // be passed in to ensure that the max_gf_interval returned is at least as big
353 // as that.
354 int av1_rc_get_default_max_gf_interval(double framerate, int min_gf_interval);
355 
356 // Generally at the high level, the following flow is expected
357 // to be enforced for rate control:
358 // First call per frame, one of:
359 // av1_rc_get_first_pass_params()
360 // av1_rc_get_second_pass_params()
361 // depending on the usage to set the rate control encode parameters desired.
362 //
363 // Then, call encode_frame_to_data_rate() to perform the
364 // actual encode. This function will in turn call encode_frame()
365 // one or more times, followed by one of:
366 // av1_rc_postencode_update()
367 // av1_rc_postencode_update_drop_frame()
368 //
369 // The majority of rate control parameters are only expected
370 // to be set in the av1_rc_get_..._params() functions and
371 // updated during the av1_rc_postencode_update...() functions.
372 // The only exceptions are av1_rc_drop_frame() and
373 // av1_rc_update_rate_correction_factors() functions.
374 
375 // Functions to set parameters for encoding before the actual
376 // encode_frame_to_data_rate() function.
377 struct EncodeFrameParams;
378 
379 // Post encode update of the rate control parameters based
380 // on bytes used
381 void av1_rc_postencode_update(struct AV1_COMP *cpi, uint64_t bytes_used);
382 // Post encode update of the rate control parameters for dropped frames
383 void av1_rc_postencode_update_drop_frame(struct AV1_COMP *cpi);
384 
// Updates the rate correction factor linking Q to output bits.
398 void av1_rc_update_rate_correction_factors(struct AV1_COMP *cpi, int width,
399  int height);
402 // Decide if we should drop this frame: For 1-pass CBR.
403 // Changes only the decimation count in the rate control structure
404 int av1_rc_drop_frame(struct AV1_COMP *cpi);
405 
406 // Computes frame size bounds.
407 void av1_rc_compute_frame_size_bounds(const struct AV1_COMP *cpi,
408  int this_frame_target,
409  int *frame_under_shoot_limit,
410  int *frame_over_shoot_limit);
411 
// Picks q and q bounds given the rate control parameters in cpi->rc.
// NOTE(review): bottom_index/top_index are non-const pointers and look like
// outputs for the bounds, with the picked q as the return value -- confirm
// against the definition.
427 int av1_rc_pick_q_and_bounds(const struct AV1_COMP *cpi, RATE_CONTROL *rc,
428  int width, int height, int gf_index,
429  int *bottom_index, int *top_index);
430 
// Estimates q to achieve a target bits per frame.
443 int av1_rc_regulate_q(const struct AV1_COMP *cpi, int target_bits_per_frame,
444  int active_best_quality, int active_worst_quality,
445  int width, int height);
446 
448 // Estimates bits per mb for a given qindex and correction factor.
449 int av1_rc_bits_per_mb(FRAME_TYPE frame_type, int qindex,
450  double correction_factor, aom_bit_depth_t bit_depth,
451  const int is_screen_content_type);
452 
453 // Clamping utilities for bitrate targets for iframes and pframes.
454 int av1_rc_clamp_iframe_target_size(const struct AV1_COMP *const cpi,
455  int target);
456 int av1_rc_clamp_pframe_target_size(const struct AV1_COMP *const cpi,
457  int target, uint8_t frame_update_type);
458 
459 // Find q_index corresponding to desired_q, within [best_qindex, worst_qindex].
460 // To be precise, 'q_index' is the smallest integer, for which the corresponding
461 // q >= desired_q.
462 // If no such q index is found, returns 'worst_qindex'.
463 int av1_find_qindex(double desired_q, aom_bit_depth_t bit_depth,
464  int best_qindex, int worst_qindex);
465 
466 // Computes a q delta (in "q index" terms) to get from a starting q value
467 // to a target q value
468 int av1_compute_qdelta(const RATE_CONTROL *rc, double qstart, double qtarget,
469  aom_bit_depth_t bit_depth);
470 
471 // Computes a q delta (in "q index" terms) to get from a starting q value
472 // to a value that should equate to the given rate ratio.
473 int av1_compute_qdelta_by_rate(const RATE_CONTROL *rc, FRAME_TYPE frame_type,
474  int qindex, double rate_target_ratio,
475  const int is_screen_content_type,
476  aom_bit_depth_t bit_depth);
477 
478 int av1_frame_type_qdelta(const struct AV1_COMP *cpi, int q);
479 
480 void av1_rc_update_framerate(struct AV1_COMP *cpi, int width, int height);
481 
482 void av1_rc_set_gf_interval_range(const struct AV1_COMP *const cpi,
483  RATE_CONTROL *const rc);
484 
485 void av1_set_target_rate(struct AV1_COMP *cpi, int width, int height);
486 
487 int av1_resize_one_pass_cbr(struct AV1_COMP *cpi);
488 
489 void av1_rc_set_frame_target(struct AV1_COMP *cpi, int target, int width,
490  int height);
491 
493  int gf_update);
494 
508  const struct AV1_COMP *const cpi, FRAME_UPDATE_TYPE frame_update_type);
509 
521 
534  const struct AV1_COMP *cpi, FRAME_UPDATE_TYPE frame_update_type);
535 
547 
// Setup the rate control parameters for 1 pass real-time mode.
564 void av1_get_one_pass_rt_params(struct AV1_COMP *cpi,
565  struct EncodeFrameParams *const frame_params,
566  unsigned int frame_flags);
567 
// Increase q on expected encoder overshoot, for CBR mode.
// NOTE(review): q is a non-const pointer, so it is presumably updated in
// place; the meaning of the int return value is not visible here -- confirm
// against the definition.
582 int av1_encodedframe_overshoot_cbr(struct AV1_COMP *cpi, int *q);
583 
584 #ifdef __cplusplus
585 } // extern "C"
586 #endif
587 
588 #endif // AOM_AV1_ENCODER_RATECTRL_H_
Describes the codec algorithm interface to applications.
enum aom_bit_depth aom_bit_depth_t
Bit depth for codecThis enumeration determines the bit depth of the codec.
int av1_calc_pframe_target_size_one_pass_vbr(const struct AV1_COMP *const cpi, FRAME_UPDATE_TYPE frame_update_type)
Calculates how many bits to use for a P frame in one pass vbr.
int av1_rc_pick_q_and_bounds(const struct AV1_COMP *cpi, RATE_CONTROL *rc, int width, int height, int gf_index, int *bottom_index, int *top_index)
Picks q and q bounds given the rate control parameters in cpi->rc.
int av1_encodedframe_overshoot_cbr(struct AV1_COMP *cpi, int *q)
Increase q on expected encoder overshoot, for CBR mode.
Definition: ratectrl.c:2649
int av1_calc_pframe_target_size_one_pass_cbr(const struct AV1_COMP *cpi, FRAME_UPDATE_TYPE frame_update_type)
Calculates how many bits to use for a P frame in one pass cbr.
void av1_set_reference_structure_one_pass_rt(AV1_COMP *cpi, int gf_update)
Setup the reference prediction structure for 1 pass real-time.
Definition: ratectrl.c:2167
int av1_calc_iframe_target_size_one_pass_cbr(const struct AV1_COMP *cpi)
Calculates how many bits to use for an i frame in one pass cbr.
int av1_calc_iframe_target_size_one_pass_vbr(const struct AV1_COMP *const cpi)
Calculates how many bits to use for an i frame in one pass vbr.
int av1_rc_regulate_q(const struct AV1_COMP *cpi, int target_bits_per_frame, int active_best_quality, int active_worst_quality, int width, int height)
Estimates q to achieve a target bits per frame.
void av1_get_one_pass_rt_params(struct AV1_COMP *cpi, struct EncodeFrameParams *const frame_params, unsigned int frame_flags)
Setup the rate control parameters for 1 pass real-time mode.
Definition: ratectrl.c:2547
void av1_rc_update_rate_correction_factors(struct AV1_COMP *cpi, int width, int height)
Updates the rate correction factor linking Q to output bits.
Definition: ratectrl.c:541
Main encoder configuration data structure.
Definition: encoder.h:791
enum aom_enc_pass pass
Definition: encoder.h:916
Top level encoder structure.
Definition: encoder.h:2042
contains per-frame encoding parameters decided upon by av1_encode_strategy() and passed down to av1_e...
Definition: encoder.h:2675
FRAME_TYPE frame_type
Definition: encoder.h:2683
Rate Control parameters and status.
Definition: ratectrl.h:118
int best_quality
Definition: ratectrl.h:270
int64_t starting_buffer_level
Definition: ratectrl.h:275
int intervals_till_gf_calculate_due
Definition: ratectrl.h:194
int64_t gf_group_bits
Definition: ratectrl.h:134
int this_frame_target
Definition: ratectrl.h:129
int frames_to_key
Definition: ratectrl.h:222
int base_frame_target
Definition: ratectrl.h:125
int projected_frame_size
Definition: ratectrl.h:139
int worst_quality
Definition: ratectrl.h:266
int arf_q
Definition: ratectrl.h:301
int cur_gf_index
Definition: ratectrl.h:204
int sb64_target_rate
Definition: ratectrl.h:149
int last_kf_qindex
Definition: ratectrl.h:164
int gfu_boost
Definition: ratectrl.h:169
int coefficient_size
Definition: ratectrl.h:144
int64_t maximum_buffer_size
Definition: ratectrl.h:283
int64_t optimal_buffer_level
Definition: ratectrl.h:279
int active_worst_quality
Definition: ratectrl.h:305
int last_boosted_qindex
Definition: ratectrl.h:159
int frames_since_golden
Definition: ratectrl.h:184
int kf_boost
Definition: ratectrl.h:173
int frames_till_gf_update_due
Definition: ratectrl.h:189