12 #ifndef AOM_AV1_ENCODER_TPL_MODEL_H_
13 #define AOM_AV1_ENCODER_TPL_MODEL_H_
23 struct AV1_SEQ_CODING_TOOLS;
28 #include "config/aom_config.h"
30 #include "aom_scale/yv12config.h"
32 #include "av1/common/mv.h"
33 #include "av1/common/scale.h"
36 #include "av1/encoder/ratectrl.h"
38 static INLINE BLOCK_SIZE convert_length_to_bsize(
int length) {
40 case 64:
return BLOCK_64X64;
41 case 32:
return BLOCK_32X32;
42 case 16:
return BLOCK_16X16;
43 case 8:
return BLOCK_8X8;
44 case 4:
return BLOCK_4X4;
46 assert(0 &&
"Invalid block size for tpl model");
51 typedef struct AV1TplRowMultiThreadSync {
52 #if CONFIG_MULTITHREAD
54 pthread_mutex_t *mutex_;
55 pthread_cond_t *cond_;
60 int *num_finished_cols;
68 int num_threads_working;
69 } AV1TplRowMultiThreadSync;
71 typedef struct AV1TplRowMultiThreadInfo {
73 void (*sync_read_ptr)(AV1TplRowMultiThreadSync *tpl_mt_sync,
int r,
int c);
74 void (*sync_write_ptr)(AV1TplRowMultiThreadSync *tpl_mt_sync,
int r,
int c,
76 } AV1TplRowMultiThreadInfo;
/* Twice MAX_LAG_BUFFERS (defined elsewhere). */
#define MAX_TPL_FRAME_IDX (2 * MAX_LAG_BUFFERS)
/* MAX_TPL_FRAME_IDX plus REF_FRAMES + 1 extra slots. Used as the length of
 * the per-frame arrays declared in this header (e.g. q_index_list). */
#define MAX_LENGTH_TPL_FRAME_STATS (MAX_TPL_FRAME_IDX + REF_FRAMES + 1)
/* NOTE(review): presumably the log2 of a fixed-point scale applied to
 * dependency costs; confirm against the users of this macro. */
#define TPL_DEP_COST_SCALE_LOG2 4
/* Small positive constant (1e-7). NOTE(review): presumably a guard against
 * zero in floating-point computations; confirm against the users. */
#define TPL_EPSILON 0.0000001
97 typedef struct TplTxfmStats {
98 double abs_coeff_sum[256];
103 typedef struct TplDepStats {
108 int64_t cmp_recrf_dist[2];
112 int64_t cmp_recrf_rate[2];
115 int_mv mv[INTER_REFS_PER_FRAME];
116 int ref_frame_index[2];
117 int64_t pred_error[INTER_REFS_PER_FRAME];
120 typedef struct TplDepFrame {
122 TplDepStats *tpl_stats_ptr;
125 int ref_map_index[REF_FRAMES];
132 uint32_t frame_display_index;
189 struct scale_factors
sf;
221 #if CONFIG_BITRATE_ACCURACY
225 double estimated_gop_bitrate;
226 double actual_gop_bitrate;
230 #if CONFIG_BITRATE_ACCURACY
236 double keyframe_bitrate;
237 double total_bit_budget;
238 int show_frame_count;
240 int gop_showframe_count;
241 double gop_bit_budget;
242 double scale_factors[FRAME_UPDATE_TYPES];
244 double mv_scale_factors[FRAME_UPDATE_TYPES];
249 int q_index_list_ready;
250 int q_index_list[MAX_LENGTH_TPL_FRAME_STATS];
253 double estimated_bitrate_byframe[MAX_LENGTH_TPL_FRAME_STATS];
254 double estimated_mv_bitrate_byframe[MAX_LENGTH_TPL_FRAME_STATS];
255 int actual_bitrate_byframe[MAX_LENGTH_TPL_FRAME_STATS];
256 int actual_mv_bitrate_byframe[MAX_LENGTH_TPL_FRAME_STATS];
257 int actual_coeff_bitrate_byframe[MAX_LENGTH_TPL_FRAME_STATS];
260 double qstep_ratio_list[MAX_LENGTH_TPL_FRAME_STATS];
263 static INLINE
void vbr_rc_reset_gop_data(VBR_RATECTRL_INFO *vbr_rc_info) {
264 vbr_rc_info->q_index_list_ready = 0;
265 av1_zero(vbr_rc_info->q_index_list);
266 av1_zero(vbr_rc_info->estimated_bitrate_byframe);
267 av1_zero(vbr_rc_info->estimated_mv_bitrate_byframe);
268 av1_zero(vbr_rc_info->actual_bitrate_byframe);
269 av1_zero(vbr_rc_info->actual_mv_bitrate_byframe);
270 av1_zero(vbr_rc_info->actual_coeff_bitrate_byframe);
273 static INLINE
void vbr_rc_init(VBR_RATECTRL_INFO *vbr_rc_info,
274 double total_bit_budget,
int show_frame_count) {
275 vbr_rc_info->total_bit_budget = total_bit_budget;
276 vbr_rc_info->show_frame_count = show_frame_count;
277 vbr_rc_info->keyframe_bitrate = 0;
278 const double scale_factors[FRAME_UPDATE_TYPES] = { 0.94559, 0.12040, 1,
281 const double mv_scale_factors[FRAME_UPDATE_TYPES] = { 3, 3, 3, 3, 3, 3, 3 };
282 memcpy(vbr_rc_info->scale_factors, scale_factors,
283 sizeof(scale_factors[0]) * FRAME_UPDATE_TYPES);
284 memcpy(vbr_rc_info->mv_scale_factors, mv_scale_factors,
285 sizeof(mv_scale_factors[0]) * FRAME_UPDATE_TYPES);
287 vbr_rc_reset_gop_data(vbr_rc_info);
290 static INLINE
void vbr_rc_set_gop_bit_budget(VBR_RATECTRL_INFO *vbr_rc_info,
291 int gop_showframe_count) {
292 vbr_rc_info->gop_showframe_count = gop_showframe_count;
293 vbr_rc_info->gop_bit_budget = vbr_rc_info->total_bit_budget *
294 gop_showframe_count /
295 vbr_rc_info->show_frame_count;
298 static INLINE
void vbr_rc_set_keyframe_bitrate(VBR_RATECTRL_INFO *vbr_rc_info,
299 double keyframe_bitrate) {
300 vbr_rc_info->keyframe_bitrate = keyframe_bitrate;
303 static INLINE
void vbr_rc_info_log(
const VBR_RATECTRL_INFO *vbr_rc_info,
304 int gf_frame_index,
int gf_group_size,
305 FRAME_UPDATE_TYPE *update_type) {
307 if (gf_frame_index + 2 >= gf_group_size) {
309 "\ni, \test_bitrate, \test_mv_bitrate, \tact_bitrate, "
310 "\tact_mv_bitrate, \tact_coeff_bitrate, \tq, \tupdate_type\n");
311 for (
int i = 0; i < gf_group_size; i++) {
312 printf(
"%d, \t%f, \t%f, \t%d, \t%d, \t%d, \t%d, \t%d\n", i,
313 vbr_rc_info->estimated_bitrate_byframe[i],
314 vbr_rc_info->estimated_mv_bitrate_byframe[i],
315 vbr_rc_info->actual_bitrate_byframe[i],
316 vbr_rc_info->actual_mv_bitrate_byframe[i],
317 vbr_rc_info->actual_coeff_bitrate_byframe[i],
318 vbr_rc_info->q_index_list[i], update_type[i]);
325 #if CONFIG_RD_COMMAND
329 RD_OPTION_SET_Q_RDMULT
332 typedef struct RD_COMMAND {
333 RD_OPTION option_ls[MAX_LENGTH_TPL_FRAME_STATS];
334 int q_index_ls[MAX_LENGTH_TPL_FRAME_STATS];
335 int rdmult_ls[MAX_LENGTH_TPL_FRAME_STATS];
340 void av1_read_rd_command(
const char *filepath, RD_COMMAND *rd_command);
351 void av1_setup_tpl_buffers(
struct AV1_PRIMARY *
const ppi,
353 int height,
int byte_alignment,
int lag_in_frames);
371 void av1_tpl_preload_rc_estimate(
/* Declaration only; the definition is not part of this header.
 * Takes a mode-info row/column pair, a stride and a right shift, and returns
 * an int. NOTE(review): presumably the offset of the matching entry in a TPL
 * stats array; confirm against the definition. */
int av1_tpl_ptr_pos(int mi_row, int mi_col, int stride, uint8_t right_shift);
376 void av1_init_tpl_stats(
TplParams *
const tpl_data);
378 int av1_tpl_stats_ready(
const TplParams *tpl_data,
int gf_frame_index);
/* Declaration only; the definition is not part of this header.
 * NOTE(review): presumably prepares TPL-based rdmult data on the encoder
 * instance; confirm against the definition. */
void av1_tpl_rdmult_setup(struct AV1_COMP *cpi);
383 BLOCK_SIZE sb_size,
int mi_row,
int mi_col);
385 void av1_mc_flow_dispenser_row(
struct AV1_COMP *cpi,
387 int mi_row, BLOCK_SIZE bsize, TX_SIZE tx_size);
/* Declaration only; the definition is not part of this header.
 * Takes a quantizer step and a parameter b, and returns a double.
 * NOTE(review): presumably the entropy of a quantized exponential
 * distribution with parameter b; confirm against the definition. */
double av1_exponential_entropy(double q_step, double b);
/* Declaration only; the definition is not part of this header.
 * Takes a quantizer step, a parameter b and a zero-bin ratio, and returns a
 * double. NOTE(review): presumably the entropy of a quantized Laplace
 * distribution; confirm against the definition. */
double av1_laplace_entropy(double q_step, double b, double zero_bin_ratio);
435 double av1_laplace_estimate_frame_rate(
int q_index,
int block_count,
436 const double *abs_coeff_mean,
452 double av1_estimate_gop_bitrate(
const int *q_index_list,
const int frame_count,
453 const TplTxfmStats *stats,
454 const int *stats_valid_list,
455 double *bitrate_byframe_list);
463 void av1_init_tpl_txfm_stats(TplTxfmStats *tpl_txfm_stats);
473 void av1_accumulate_tpl_txfm_stats(
const TplTxfmStats *sub_stats,
474 TplTxfmStats *accumulated_stats);
484 void av1_record_tpl_txfm_block(TplTxfmStats *tpl_txfm_stats,
485 const tran_low_t *coeff);
/* Declaration only; the definition is not part of this header.
 * Takes a quantizer step, a parameter b, a zero-bin ratio and a quantized
 * coefficient value, and returns a double. NOTE(review): presumably the
 * estimated entropy of that single coefficient; confirm against the
 * definition. */
double av1_estimate_coeff_entropy(double q_step, double b,
                                  double zero_bin_ratio, int qcoeff);
/* Declaration only; the definition is not part of this header.
 * abs_coeff_mean is read-only; qcoeff_arr is passed as a non-const pointer.
 * NOTE(review): presumably sums the estimated entropy over coeff_num
 * quantized coefficients; confirm array lengths against the definition. */
double av1_estimate_txfm_block_entropy(int q_index,
                                       const double *abs_coeff_mean,
                                       int *qcoeff_arr, int coeff_num);
/* Declaration only; the definition is not part of this header.
 * Takes a rate delta, two distortion values and a pixel count, and returns
 * an int64_t. NOTE(review): the exact cost formula is not visible here;
 * confirm against the definition. */
int64_t av1_delta_rate_cost(int64_t delta_rate, int64_t recrf_dist,
                            int64_t srcrf_dist, int pix_num);
540 int av1_get_overlap_area(
int row_a,
int col_a,
int row_b,
int col_b,
int width,
563 int av1_q_mode_estimate_base_q(
const struct GF_GROUP *gf_group,
564 const TplTxfmStats *txfm_stats_list,
565 const int *stats_valid_list,
double bit_budget,
568 const double *qstep_ratio_list,
570 double *estimated_bitrate_byframe);
581 int av1_tpl_get_q_index(
const TplParams *tpl_data,
int gf_frame_index,
591 double av1_tpl_get_frame_importance(
const TplParams *tpl_data,
604 double av1_tpl_get_qstep_ratio(
const TplParams *tpl_data,
int gf_frame_index);
615 int av1_get_q_index_from_qstep_ratio(
int leaf_qindex,
double qstep_ratio,
618 #if CONFIG_BITRATE_ACCURACY
628 void av1_vbr_rc_update_q_index_list(VBR_RATECTRL_INFO *vbr_rc_info,
644 double av1_tpl_compute_mv_bits(
const TplParams *tpl_data,
int gf_group_size,
645 int gf_frame_index,
int gf_update_type,
646 VBR_RATECTRL_INFO *vbr_rc_info);
661 int_mv av1_compute_mv_difference(
const TplDepFrame *tpl_frame,
int row,
int col,
662 int step,
int tpl_stride,
int right_shift);
671 double av1_tpl_compute_frame_mv_entropy(
const TplDepFrame *tpl_frame,
672 uint8_t right_shift);
enum aom_bit_depth aom_bit_depth_t
Bit depth for codec. This enumeration determines the bit depth of the codec.
int av1_tpl_setup_stats(struct AV1_COMP *cpi, int gop_eval, const struct EncodeFrameParams *const frame_params)
Implements temporal dependency modelling for a GOP (GF/ARF group) and selects between 16 and 32 frame GOP structure.
Describes look ahead buffer operations.
Top level encoder structure.
Definition: encoder.h:2632
Top level primary encoder structure.
Definition: encoder.h:2332
Params related to MB_MODE_INFO arrays and related info.
Definition: av1_common_int.h:505
Contains per-frame encoding parameters decided upon by av1_encode_strategy() and passed down to av1_encode().
Definition: encoder.h:3302
Data related to the current GF/ARF group and the individual frames within the group.
Definition: firstpass.h:344
Params related to temporal dependency model.
Definition: tpl_model.h:139
const YV12_BUFFER_CONFIG * src_ref_frame[INTER_REFS_PER_FRAME]
Definition: tpl_model.h:201
struct scale_factors sf
Definition: tpl_model.h:189
int ready
Definition: tpl_model.h:143
TplDepFrame tpl_stats_buffer[MAX_LENGTH_TPL_FRAME_STATS]
Definition: tpl_model.h:160
uint8_t tpl_bsize_1d
Definition: tpl_model.h:153
AV1TplRowMultiThreadSync tpl_mt_sync
Definition: tpl_model.h:214
TplDepFrame * tpl_frame
Definition: tpl_model.h:184
int border_in_pixels
Definition: tpl_model.h:219
TplDepStats * tpl_stats_pool[MAX_LAG_BUFFERS]
Definition: tpl_model.h:167
YV12_BUFFER_CONFIG tpl_rec_pool[MAX_LAG_BUFFERS]
Definition: tpl_model.h:179
uint8_t tpl_stats_block_mis_log2
Definition: tpl_model.h:148
int frame_idx
Definition: tpl_model.h:194
TplTxfmStats txfm_stats_list[MAX_LENGTH_TPL_FRAME_STATS]
Definition: tpl_model.h:173
const YV12_BUFFER_CONFIG * ref_frame[INTER_REFS_PER_FRAME]
Definition: tpl_model.h:208
Encoder's parameters related to the current coding block.
Definition: block.h:778
YV12 frame buffer data structure.
Definition: yv12config.h:39