12 #ifndef AOM_AV1_ENCODER_TPL_MODEL_H_
13 #define AOM_AV1_ENCODER_TPL_MODEL_H_
23 struct AV1_SEQ_CODING_TOOLS;
30 #include "config/aom_config.h"
32 #include "aom_scale/yv12config.h"
34 #include "av1/common/mv.h"
35 #include "av1/common/scale.h"
38 #include "av1/encoder/ratectrl.h"
/* Maps a square block edge length to the corresponding BLOCK_SIZE value.
 * The visible cases handle lengths 64, 32, 16, 8 and 4; any other value
 * reaches the assert carrying the "Invalid block size" message.
 * NOTE(review): this listing omits some original lines (the switch header,
 * the default label and whatever is returned after the assert), so the
 * result for an unsupported length in non-assert builds cannot be confirmed
 * from here. */
40 static INLINE BLOCK_SIZE convert_length_to_bsize(
int length) {
42 case 64:
return BLOCK_64X64;
43 case 32:
return BLOCK_32X32;
44 case 16:
return BLOCK_16X16;
45 case 8:
return BLOCK_8X8;
46 case 4:
return BLOCK_4X4;
/* Unsupported length: fail loudly in builds where assert is active. */
48 assert(0 &&
"Invalid block size for tpl model");
53 typedef struct AV1TplRowMultiThreadSync {
54 #if CONFIG_MULTITHREAD
56 pthread_mutex_t *mutex_;
57 pthread_cond_t *cond_;
62 int *num_finished_cols;
70 int num_threads_working;
71 } AV1TplRowMultiThreadSync;
73 typedef struct AV1TplRowMultiThreadInfo {
77 #if CONFIG_MULTITHREAD
79 pthread_mutex_t *mutex_;
82 void (*sync_read_ptr)(AV1TplRowMultiThreadSync *tpl_mt_sync,
int r,
int c);
83 void (*sync_write_ptr)(AV1TplRowMultiThreadSync *tpl_mt_sync,
int r,
int c,
85 } AV1TplRowMultiThreadInfo;
/* Upper bound on a TPL frame index: twice MAX_LAG_BUFFERS. */
98 #define MAX_TPL_FRAME_IDX (2 * MAX_LAG_BUFFERS)
/* Element count used to size per-frame arrays in this header (the RD_COMMAND
 * option/q_index/rdmult lists and the tpl_stats_buffer array): the index
 * bound above plus REF_FRAMES plus one. */
101 #define MAX_LENGTH_TPL_FRAME_STATS (MAX_TPL_FRAME_IDX + REF_FRAMES + 1)
/* Log2 of a scale applied to TPL dependency costs -- presumably a
 * fixed-point shift amount; TODO confirm against the users of this macro. */
102 #define TPL_DEP_COST_SCALE_LOG2 4
/* Very small double constant -- presumably used to guard against division
 * by zero or to compare against zero; TODO confirm against the users. */
104 #define TPL_EPSILON 0.0000001
106 typedef struct TplTxfmStats {
108 double abs_coeff_sum[256];
109 double abs_coeff_mean[256];
110 int txfm_block_count;
122 typedef struct TplDepStats {
129 int64_t cmp_recrf_dist[2];
132 int64_t pred_error[INTER_REFS_PER_FRAME];
138 int32_t cmp_recrf_rate[2];
139 int_mv mv[INTER_REFS_PER_FRAME];
140 int8_t ref_frame_index[2];
143 typedef struct TplDepFrame {
145 TplDepStats *tpl_stats_ptr;
148 int ref_map_index[REF_FRAMES];
155 uint32_t frame_display_index;
216 struct scale_factors
sf;
254 #if CONFIG_BITRATE_ACCURACY || CONFIG_RATECTRL_LOG
255 #define VBR_RC_INFO_MAX_FRAMES 500
258 #if CONFIG_BITRATE_ACCURACY
266 double total_bit_budget;
267 int show_frame_count;
269 int gop_showframe_count;
270 double gop_bit_budget;
271 double scale_factors[FRAME_UPDATE_TYPES];
273 double mv_scale_factors[FRAME_UPDATE_TYPES];
278 int q_index_list_ready;
279 int q_index_list[VBR_RC_INFO_MAX_FRAMES];
283 double qstep_ratio_list[VBR_RC_INFO_MAX_FRAMES];
285 #if CONFIG_THREE_PASS
286 TplTxfmStats txfm_stats_list[VBR_RC_INFO_MAX_FRAMES];
287 FRAME_UPDATE_TYPE update_type_list[VBR_RC_INFO_MAX_FRAMES];
288 int gop_start_idx_list[VBR_RC_INFO_MAX_FRAMES];
289 int gop_length_list[VBR_RC_INFO_MAX_FRAMES];
291 int total_frame_count;
/* Resets the per-GOP q-index state held in vbr_rc_info: clears the
 * q_index_list_ready flag and zeroes the whole q_index_list array.
 * No other member of the structure is touched by the visible code. */
296 static INLINE
void vbr_rc_reset_gop_data(VBR_RATECTRL_INFO *vbr_rc_info) {
/* Mark the list as not ready before wiping its contents. */
297 vbr_rc_info->q_index_list_ready = 0;
298 av1_zero(vbr_rc_info->q_index_list);
301 void av1_vbr_rc_init(VBR_RATECTRL_INFO *vbr_rc_info,
double total_bit_budget,
302 int show_frame_count);
304 int av1_vbr_rc_frame_coding_idx(
const VBR_RATECTRL_INFO *vbr_rc_info,
307 void av1_vbr_rc_append_tpl_info(VBR_RATECTRL_INFO *vbr_rc_info,
308 const struct TPL_INFO *tpl_info);
310 void av1_vbr_rc_set_gop_bit_budget(VBR_RATECTRL_INFO *vbr_rc_info,
311 int gop_showframe_count);
313 void av1_vbr_rc_compute_q_indices(
int base_q_index,
int frame_count,
314 const double *qstep_ratio_list,
325 void av1_vbr_rc_update_q_index_list(VBR_RATECTRL_INFO *vbr_rc_info,
351 double av1_vbr_rc_info_estimate_gop_bitrate(
353 const double *update_type_scale_factors,
int frame_count,
354 const FRAME_UPDATE_TYPE *update_type_list,
const double *qstep_ratio_list,
355 const TplTxfmStats *stats_list,
int *q_index_list,
356 double *estimated_bitrate_byframe);
379 int av1_vbr_rc_info_estimate_base_q(
381 const double *update_type_scale_factors,
int frame_count,
382 const FRAME_UPDATE_TYPE *update_type_list,
const double *qstep_ratio_list,
383 const TplTxfmStats *stats_list,
int *q_index_list,
384 double *estimated_bitrate_byframe);
388 #if CONFIG_RD_COMMAND
392 RD_OPTION_SET_Q_RDMULT
395 typedef struct RD_COMMAND {
396 RD_OPTION option_ls[MAX_LENGTH_TPL_FRAME_STATS];
397 int q_index_ls[MAX_LENGTH_TPL_FRAME_STATS];
398 int rdmult_ls[MAX_LENGTH_TPL_FRAME_STATS];
403 void av1_read_rd_command(
const char *filepath, RD_COMMAND *rd_command);
414 void av1_setup_tpl_buffers(
struct AV1_PRIMARY *
const ppi,
416 int height,
int byte_alignment,
int lag_in_frames);
/* Releases the five temporary TPL buffers (predictor8, src_diff, coeff,
 * qcoeff, dqcoeff) with aom_free and resets each pointer to NULL.
 * Because every pointer is cleared right after it is freed, the structure
 * is left with no dangling pointers; tpl_alloc_temp_buffers relies on this
 * function for cleanup when an allocation fails. */
418 static AOM_INLINE
void tpl_dealloc_temp_buffers(TplBuffers *tpl_tmp_buffers) {
419 aom_free(tpl_tmp_buffers->predictor8);
420 tpl_tmp_buffers->predictor8 = NULL;
421 aom_free(tpl_tmp_buffers->src_diff);
422 tpl_tmp_buffers->src_diff = NULL;
423 aom_free(tpl_tmp_buffers->coeff);
424 tpl_tmp_buffers->coeff = NULL;
425 aom_free(tpl_tmp_buffers->qcoeff);
426 tpl_tmp_buffers->qcoeff = NULL;
427 aom_free(tpl_tmp_buffers->dqcoeff);
428 tpl_tmp_buffers->dqcoeff = NULL;
/* Allocates the five temporary TPL buffers for a square block whose edge is
 * tpl_bsize_1d. Every buffer is requested through aom_memalign with 32 as
 * its first argument and holds tpl_bsize_1d * tpl_bsize_1d elements, except
 * predictor8, which is sized for twice that many elements.
 * If any of the five requests yields a null pointer, all buffers are
 * released again via tpl_dealloc_temp_buffers.
 * NOTE(review): the return statements are not part of this listing;
 * presumably the function returns false on the failure path and true
 * otherwise -- confirm against the full source. */
431 static AOM_INLINE
bool tpl_alloc_temp_buffers(TplBuffers *tpl_tmp_buffers,
432 uint8_t tpl_bsize_1d) {
/* Number of samples in one tpl_bsize_1d x tpl_bsize_1d block. */
434 const int tpl_block_pels = tpl_bsize_1d * tpl_bsize_1d;
/* predictor8 is the only buffer sized for 2 * tpl_block_pels elements. */
437 tpl_tmp_buffers->predictor8 = (uint8_t *)aom_memalign(
438 32, tpl_block_pels * 2 *
sizeof(*tpl_tmp_buffers->predictor8));
439 tpl_tmp_buffers->src_diff = (int16_t *)aom_memalign(
440 32, tpl_block_pels *
sizeof(*tpl_tmp_buffers->src_diff));
441 tpl_tmp_buffers->coeff = (tran_low_t *)aom_memalign(
442 32, tpl_block_pels *
sizeof(*tpl_tmp_buffers->coeff));
443 tpl_tmp_buffers->qcoeff = (tran_low_t *)aom_memalign(
444 32, tpl_block_pels *
sizeof(*tpl_tmp_buffers->qcoeff));
445 tpl_tmp_buffers->dqcoeff = (tran_low_t *)aom_memalign(
446 32, tpl_block_pels *
sizeof(*tpl_tmp_buffers->dqcoeff));
/* All allocations are attempted first and checked together, so a partial
 * failure is undone in one place. */
448 if (!(tpl_tmp_buffers->predictor8 && tpl_tmp_buffers->src_diff &&
449 tpl_tmp_buffers->coeff && tpl_tmp_buffers->qcoeff &&
450 tpl_tmp_buffers->dqcoeff)) {
451 tpl_dealloc_temp_buffers(tpl_tmp_buffers);
473 void av1_tpl_preload_rc_estimate(
476 int av1_tpl_ptr_pos(
int mi_row,
int mi_col,
int stride, uint8_t right_shift);
478 void av1_init_tpl_stats(
TplParams *
const tpl_data);
480 int av1_tpl_stats_ready(
const TplParams *tpl_data,
int gf_frame_index);
482 void av1_tpl_rdmult_setup(
struct AV1_COMP *cpi);
485 BLOCK_SIZE sb_size,
int mi_row,
int mi_col);
487 void av1_mc_flow_dispenser_row(
struct AV1_COMP *cpi,
488 TplTxfmStats *tpl_txfm_stats,
490 int mi_row, BLOCK_SIZE bsize, TX_SIZE tx_size);
504 double av1_exponential_entropy(
double q_step,
double b);
519 double av1_laplace_entropy(
double q_step,
double b,
double zero_bin_ratio);
538 double av1_laplace_estimate_frame_rate(
int q_index,
int block_count,
539 const double *abs_coeff_mean,
548 void av1_init_tpl_txfm_stats(TplTxfmStats *tpl_txfm_stats);
550 #if CONFIG_BITRATE_ACCURACY
559 void av1_accumulate_tpl_txfm_stats(
const TplTxfmStats *sub_stats,
560 TplTxfmStats *accumulated_stats);
570 void av1_record_tpl_txfm_block(TplTxfmStats *tpl_txfm_stats,
571 const tran_low_t *coeff);
581 void av1_tpl_txfm_stats_update_abs_coeff_mean(TplTxfmStats *txfm_stats);
599 double av1_estimate_coeff_entropy(
double q_step,
double b,
600 double zero_bin_ratio,
int qcoeff);
614 double av1_estimate_txfm_block_entropy(
int q_index,
615 const double *abs_coeff_mean,
616 int *qcoeff_arr,
int coeff_num);
619 int64_t av1_delta_rate_cost(int64_t delta_rate, int64_t recrf_dist,
620 int64_t srcrf_dist,
int pix_num);
637 int av1_get_overlap_area(
int row_a,
int col_a,
int row_b,
int col_b,
int width,
649 int av1_tpl_get_q_index(
const TplParams *tpl_data,
int gf_frame_index,
659 double av1_tpl_get_frame_importance(
const TplParams *tpl_data,
672 double av1_tpl_get_qstep_ratio(
const TplParams *tpl_data,
int gf_frame_index);
682 int av1_get_q_index_from_qstep_ratio(
int leaf_qindex,
double qstep_ratio,
699 int_mv av1_compute_mv_difference(
const TplDepFrame *tpl_frame,
int row,
int col,
700 int step,
int tpl_stride,
int right_shift);
709 double av1_tpl_compute_frame_mv_entropy(
const TplDepFrame *tpl_frame,
710 uint8_t right_shift);
712 #if CONFIG_RATECTRL_LOG
714 int coding_frame_count;
718 int q_index_list[VBR_RC_INFO_MAX_FRAMES];
719 double qstep_ratio_list[VBR_RC_INFO_MAX_FRAMES];
720 FRAME_UPDATE_TYPE update_type_list[VBR_RC_INFO_MAX_FRAMES];
723 TplTxfmStats txfm_stats_list[VBR_RC_INFO_MAX_FRAMES];
726 double est_coeff_rate_list[VBR_RC_INFO_MAX_FRAMES];
729 double act_rate_list[VBR_RC_INFO_MAX_FRAMES];
730 double act_coeff_rate_list[VBR_RC_INFO_MAX_FRAMES];
/* Initializes a rate-control log by zeroing the entire RATECTRL_LOG object
 * that rc_log points to. */
733 static INLINE
void rc_log_init(RATECTRL_LOG *rc_log) { av1_zero(*rc_log); }
/* Stores a copy of *txfm_stats in the log slot for coding_index.
 * The structure is copied by value, so the log does not keep a reference to
 * the caller's object. coding_index is used directly as an array index and
 * is not range-checked here. */
735 static INLINE
void rc_log_frame_stats(RATECTRL_LOG *rc_log,
int coding_index,
736 const TplTxfmStats *txfm_stats) {
737 rc_log->txfm_stats_list[coding_index] = *txfm_stats;
/* Records the encode parameters of one frame in the log and derives its
 * estimated coefficient rate.
 * Writes qstep_ratio, q_index and update_type into the slots selected by
 * coding_index. The estimated coefficient rate for that slot is first set to
 * 0 and is replaced by the result of av1_laplace_estimate_frame_rate only if
 * the transform stats already stored for the same slot are flagged ready.
 * NOTE(review): the coding_index parameter declaration is among the lines
 * omitted from this listing. */
740 static INLINE
void rc_log_frame_encode_param(RATECTRL_LOG *rc_log,
742 double qstep_ratio,
int q_index,
743 FRAME_UPDATE_TYPE update_type) {
744 rc_log->qstep_ratio_list[coding_index] = qstep_ratio;
745 rc_log->q_index_list[coding_index] = q_index;
746 rc_log->update_type_list[coding_index] = update_type;
/* The estimate uses the stats previously stored for this coding index. */
747 const TplTxfmStats *txfm_stats = &rc_log->txfm_stats_list[coding_index];
/* Default to 0 so the slot holds a defined value when stats are not ready. */
748 rc_log->est_coeff_rate_list[coding_index] = 0;
749 if (txfm_stats->ready) {
750 rc_log->est_coeff_rate_list[coding_index] = av1_laplace_estimate_frame_rate(
751 q_index, txfm_stats->txfm_block_count, txfm_stats->abs_coeff_mean,
752 txfm_stats->coeff_num);
/* Records the actual rate figures of one frame: act_rate goes into
 * act_rate_list and act_coeff_rate into act_coeff_rate_list, both at
 * coding_index.
 * NOTE(review): the act_rate parameter declaration is among the lines
 * omitted from this listing. */
756 static INLINE
void rc_log_frame_entropy(RATECTRL_LOG *rc_log,
int coding_index,
758 double act_coeff_rate) {
759 rc_log->act_rate_list[coding_index] = act_rate;
760 rc_log->act_coeff_rate_list[coding_index] = act_coeff_rate;
/* Stores the chunk-level values in the log: base_q_index and
 * coding_frame_count are copied into the members of the same name.
 * NOTE(review): the base_q_index parameter declaration is among the lines
 * omitted from this listing. */
763 static INLINE
void rc_log_record_chunk_info(RATECTRL_LOG *rc_log,
765 int coding_frame_count) {
766 rc_log->base_q_index = base_q_index;
767 rc_log->coding_frame_count = coding_frame_count;
/* Dumps the rate-control log to standard output with printf.
 * Output order: a fixed "= chunk 1" header, a line with coding_frame_count
 * and base_q_index, a "= frame" line that again prints coding_frame_count,
 * and then one line per coding index below coding_frame_count listing the
 * update type, q index, qstep ratio, estimated coefficient rate, actual
 * coefficient rate and actual rate.
 * The log itself is only read (rc_log is const). */
770 static INLINE
void rc_log_show(
const RATECTRL_LOG *rc_log) {
/* The chunk number is a literal in the format string, not a logged value. */
771 printf(
"= chunk 1\n");
772 printf(
"coding_frame_count %d base_q_index %d\n", rc_log->coding_frame_count,
773 rc_log->base_q_index);
774 printf(
"= frame %d\n", rc_log->coding_frame_count);
/* One output line per logged frame. */
775 for (
int coding_idx = 0; coding_idx < rc_log->coding_frame_count;
778 "coding_idx %d update_type %d q %d qstep_ratio %f est_coeff_rate %f "
779 "act_coeff_rate %f act_rate %f\n",
780 coding_idx, rc_log->update_type_list[coding_idx],
781 rc_log->q_index_list[coding_idx], rc_log->qstep_ratio_list[coding_idx],
782 rc_log->est_coeff_rate_list[coding_idx],
783 rc_log->act_coeff_rate_list[coding_idx],
784 rc_log->act_rate_list[coding_idx]);
enum aom_bit_depth aom_bit_depth_t
Bit depth for codec. This enumeration determines the bit depth of the codec.
int av1_tpl_setup_stats(struct AV1_COMP *cpi, int gop_eval, const struct EncodeFrameParams *const frame_params)
Implements temporal dependency modelling for a GOP (GF/ARF group) and selects between 16 and 32 frame...
Describes look ahead buffer operations.
Top level encoder structure.
Definition: encoder.h:2872
Top level primary encoder structure.
Definition: encoder.h:2576
Params related to MB_MODE_INFO arrays and related info.
Definition: av1_common_int.h:503
contains per-frame encoding parameters decided upon by av1_encode_strategy() and passed down to av1_e...
Definition: encoder.h:3673
Data related to the current GF/ARF group and the individual frames within the group.
Definition: firstpass.h:354
Params related to temporal dependency model.
Definition: tpl_model.h:164
const YV12_BUFFER_CONFIG * src_ref_frame[INTER_REFS_PER_FRAME]
Definition: tpl_model.h:228
struct scale_factors sf
Definition: tpl_model.h:216
int ready
Definition: tpl_model.h:168
TplDepFrame tpl_stats_buffer[MAX_LENGTH_TPL_FRAME_STATS]
Definition: tpl_model.h:185
uint8_t tpl_bsize_1d
Definition: tpl_model.h:178
AV1TplRowMultiThreadSync tpl_mt_sync
Definition: tpl_model.h:241
TplDepFrame * tpl_frame
Definition: tpl_model.h:211
int border_in_pixels
Definition: tpl_model.h:246
TplDepStats * tpl_stats_pool[MAX_LAG_BUFFERS]
Definition: tpl_model.h:192
TplTxfmStats * txfm_stats_list
Definition: tpl_model.h:200
YV12_BUFFER_CONFIG tpl_rec_pool[MAX_LAG_BUFFERS]
Definition: tpl_model.h:206
uint8_t tpl_stats_block_mis_log2
Definition: tpl_model.h:173
int frame_idx
Definition: tpl_model.h:221
double r0_adjust_factor
Definition: tpl_model.h:251
const YV12_BUFFER_CONFIG * ref_frame[INTER_REFS_PER_FRAME]
Definition: tpl_model.h:235
Encoder's parameters related to the current coding block.
Definition: block.h:878
YV12 frame buffer data structure.
Definition: yv12config.h:44