/* * Copyright (c) 2016, Alliance for Open Media. All rights reserved * * This source code is subject to the terms of the BSD 2 Clause License and * the Alliance for Open Media Patent License 1.0. If the BSD 2 Clause License * was not distributed with this source code in the LICENSE file, you can * obtain it at www.aomedia.org/license/software. If the Alliance for Open * Media Patent License 1.0 was not distributed with this source code in the * PATENTS file, you can obtain it at www.aomedia.org/license/patent. */ #ifndef AV1_ENCODER_RD_H_ #define AV1_ENCODER_RD_H_ #include <limits.h> #if CONFIG_ANS #include "aom_dsp/ans.h" #endif // CONFIG_ANS #include "av1/common/blockd.h" #include "av1/encoder/block.h" #include "av1/encoder/context_tree.h" #include "av1/encoder/cost.h" #ifdef __cplusplus extern "C" { #endif #define RDDIV_BITS 7 #define RD_EPB_SHIFT 6 #define RDCOST(RM, DM, R, D) \ (ROUND_POWER_OF_TWO(((int64_t)R) * (RM), AV1_PROB_COST_SHIFT) + (D << DM)) #define RDCOST_DBL(RM, DM, R, D) \ (((((double)(R)) * (RM)) / (double)(1 << AV1_PROB_COST_SHIFT)) + \ ((double)(D) * (1 << (DM)))) #define QIDX_SKIP_THRESH 115 #define MV_COST_WEIGHT 108 #define MV_COST_WEIGHT_SUB 120 #define INVALID_MV 0x80008000 #if CONFIG_EXT_REFS #define MAX_REFS 15 #else #define MAX_REFS 6 #endif // CONFIG_EXT_REFS #define RD_THRESH_MAX_FACT 64 #define RD_THRESH_INC 1 // This enumerator type needs to be kept aligned with the mode order in // const MODE_DEFINITION av1_mode_order[MAX_MODES] used in the rd code. typedef enum { THR_NEARESTMV, #if CONFIG_EXT_REFS THR_NEARESTL2, THR_NEARESTL3, THR_NEARESTB, #endif // CONFIG_EXT_REFS THR_NEARESTA, THR_NEARESTG, THR_DC, THR_NEWMV, #if CONFIG_EXT_REFS THR_NEWL2, THR_NEWL3, THR_NEWB, #endif // CONFIG_EXT_REFS THR_NEWA, THR_NEWG, THR_NEARMV, #if CONFIG_EXT_REFS THR_NEARL2, THR_NEARL3, THR_NEARB, #endif // CONFIG_EXT_REFS THR_NEARA, THR_NEARG, THR_ZEROMV, #if CONFIG_EXT_REFS THR_ZEROL2, THR_ZEROL3, THR_ZEROB, #endif // CONFIG_EXT_REFS THR_ZEROG, THR_ZEROA, #if CONFIG_EXT_INTER THR_COMP_NEAREST_NEARESTLA, #if CONFIG_EXT_REFS THR_COMP_NEAREST_NEARESTL2A, THR_COMP_NEAREST_NEARESTL3A, #endif // CONFIG_EXT_REFS THR_COMP_NEAREST_NEARESTGA, #if CONFIG_EXT_REFS THR_COMP_NEAREST_NEARESTLB, THR_COMP_NEAREST_NEARESTL2B, THR_COMP_NEAREST_NEARESTL3B, THR_COMP_NEAREST_NEARESTGB, #endif // CONFIG_EXT_REFS #else // CONFIG_EXT_INTER THR_COMP_NEARESTLA, #if CONFIG_EXT_REFS THR_COMP_NEARESTL2A, THR_COMP_NEARESTL3A, #endif // CONFIG_EXT_REFS THR_COMP_NEARESTGA, #if CONFIG_EXT_REFS THR_COMP_NEARESTLB, THR_COMP_NEARESTL2B, THR_COMP_NEARESTL3B, THR_COMP_NEARESTGB, #endif // CONFIG_EXT_REFS #endif // CONFIG_EXT_INTER THR_TM, #if CONFIG_ALT_INTRA THR_SMOOTH, #endif // CONFIG_ALT_INTRA #if CONFIG_EXT_INTER THR_COMP_NEAR_NEARESTLA, THR_COMP_NEAREST_NEARLA, THR_COMP_NEAR_NEARLA, THR_COMP_NEW_NEARESTLA, THR_COMP_NEAREST_NEWLA, THR_COMP_NEW_NEARLA, THR_COMP_NEAR_NEWLA, THR_COMP_NEW_NEWLA, THR_COMP_ZERO_ZEROLA, #if CONFIG_EXT_REFS THR_COMP_NEAR_NEARESTL2A, THR_COMP_NEAREST_NEARL2A, THR_COMP_NEAR_NEARL2A, THR_COMP_NEW_NEARESTL2A, THR_COMP_NEAREST_NEWL2A, THR_COMP_NEW_NEARL2A, THR_COMP_NEAR_NEWL2A, THR_COMP_NEW_NEWL2A, THR_COMP_ZERO_ZEROL2A, THR_COMP_NEAR_NEARESTL3A, THR_COMP_NEAREST_NEARL3A, THR_COMP_NEAR_NEARL3A, THR_COMP_NEW_NEARESTL3A, THR_COMP_NEAREST_NEWL3A, THR_COMP_NEW_NEARL3A, THR_COMP_NEAR_NEWL3A, THR_COMP_NEW_NEWL3A, THR_COMP_ZERO_ZEROL3A, #endif // CONFIG_EXT_REFS THR_COMP_NEAR_NEARESTGA, THR_COMP_NEAREST_NEARGA, THR_COMP_NEAR_NEARGA, THR_COMP_NEW_NEARESTGA, THR_COMP_NEAREST_NEWGA, THR_COMP_NEW_NEARGA, THR_COMP_NEAR_NEWGA, THR_COMP_NEW_NEWGA, THR_COMP_ZERO_ZEROGA, #if CONFIG_EXT_REFS THR_COMP_NEAR_NEARESTLB, THR_COMP_NEAREST_NEARLB, THR_COMP_NEAR_NEARLB, THR_COMP_NEW_NEARESTLB, THR_COMP_NEAREST_NEWLB, THR_COMP_NEW_NEARLB, THR_COMP_NEAR_NEWLB, THR_COMP_NEW_NEWLB, THR_COMP_ZERO_ZEROLB, THR_COMP_NEAR_NEARESTL2B, THR_COMP_NEAREST_NEARL2B, THR_COMP_NEAR_NEARL2B, THR_COMP_NEW_NEARESTL2B, THR_COMP_NEAREST_NEWL2B, THR_COMP_NEW_NEARL2B, THR_COMP_NEAR_NEWL2B, THR_COMP_NEW_NEWL2B, THR_COMP_ZERO_ZEROL2B, THR_COMP_NEAR_NEARESTL3B, THR_COMP_NEAREST_NEARL3B, THR_COMP_NEAR_NEARL3B, THR_COMP_NEW_NEARESTL3B, THR_COMP_NEAREST_NEWL3B, THR_COMP_NEW_NEARL3B, THR_COMP_NEAR_NEWL3B, THR_COMP_NEW_NEWL3B, THR_COMP_ZERO_ZEROL3B, THR_COMP_NEAR_NEARESTGB, THR_COMP_NEAREST_NEARGB, THR_COMP_NEAR_NEARGB, THR_COMP_NEW_NEARESTGB, THR_COMP_NEAREST_NEWGB, THR_COMP_NEW_NEARGB, THR_COMP_NEAR_NEWGB, THR_COMP_NEW_NEWGB, THR_COMP_ZERO_ZEROGB, #endif // CONFIG_EXT_REFS #else // CONFIG_EXT_INTER THR_COMP_NEARLA, THR_COMP_NEWLA, #if CONFIG_EXT_REFS THR_COMP_NEARL2A, THR_COMP_NEWL2A, THR_COMP_NEARL3A, THR_COMP_NEWL3A, #endif // CONFIG_EXT_REFS THR_COMP_NEARGA, THR_COMP_NEWGA, #if CONFIG_EXT_REFS THR_COMP_NEARLB, THR_COMP_NEWLB, THR_COMP_NEARL2B, THR_COMP_NEWL2B, THR_COMP_NEARL3B, THR_COMP_NEWL3B, THR_COMP_NEARGB, THR_COMP_NEWGB, #endif // CONFIG_EXT_REFS THR_COMP_ZEROLA, #if CONFIG_EXT_REFS THR_COMP_ZEROL2A, THR_COMP_ZEROL3A, #endif // CONFIG_EXT_REFS THR_COMP_ZEROGA, #if CONFIG_EXT_REFS THR_COMP_ZEROLB, THR_COMP_ZEROL2B, THR_COMP_ZEROL3B, THR_COMP_ZEROGB, #endif // CONFIG_EXT_REFS #endif // CONFIG_EXT_INTER THR_H_PRED, THR_V_PRED, THR_D135_PRED, THR_D207_PRED, THR_D153_PRED, THR_D63_PRED, THR_D117_PRED, THR_D45_PRED, #if CONFIG_EXT_INTER THR_COMP_INTERINTRA_ZEROL, THR_COMP_INTERINTRA_NEARESTL, THR_COMP_INTERINTRA_NEARL, THR_COMP_INTERINTRA_NEWL, #if CONFIG_EXT_REFS THR_COMP_INTERINTRA_ZEROL2, THR_COMP_INTERINTRA_NEARESTL2, THR_COMP_INTERINTRA_NEARL2, THR_COMP_INTERINTRA_NEWL2, THR_COMP_INTERINTRA_ZEROL3, THR_COMP_INTERINTRA_NEARESTL3, THR_COMP_INTERINTRA_NEARL3, THR_COMP_INTERINTRA_NEWL3, #endif // CONFIG_EXT_REFS THR_COMP_INTERINTRA_ZEROG, THR_COMP_INTERINTRA_NEARESTG, THR_COMP_INTERINTRA_NEARG, THR_COMP_INTERINTRA_NEWG, #if CONFIG_EXT_REFS THR_COMP_INTERINTRA_ZEROB, THR_COMP_INTERINTRA_NEARESTB, THR_COMP_INTERINTRA_NEARB, THR_COMP_INTERINTRA_NEWB, #endif // CONFIG_EXT_REFS THR_COMP_INTERINTRA_ZEROA, THR_COMP_INTERINTRA_NEARESTA, THR_COMP_INTERINTRA_NEARA, THR_COMP_INTERINTRA_NEWA, #endif // CONFIG_EXT_INTER MAX_MODES } THR_MODES; typedef enum { THR_LAST, #if CONFIG_EXT_REFS THR_LAST2, THR_LAST3, THR_BWDR, #endif // CONFIG_EXT_REFS THR_GOLD, THR_ALTR, THR_COMP_LA, #if CONFIG_EXT_REFS THR_COMP_L2A, THR_COMP_L3A, #endif // CONFIG_EXT_REFS THR_COMP_GA, #if CONFIG_EXT_REFS THR_COMP_LB, THR_COMP_L2B, THR_COMP_L3B, THR_COMP_GB, #endif // CONFIG_EXT_REFS THR_INTRA, } THR_MODES_SUB8X8; typedef struct RD_OPT { // Thresh_mult is used to set a threshold for the rd score. A higher value // means that we will accept the best mode so far more often. This number // is used in combination with the current block size, and thresh_freq_fact // to pick a threshold. int thresh_mult[MAX_MODES]; int thresh_mult_sub8x8[MAX_REFS]; int threshes[MAX_SEGMENTS][BLOCK_SIZES][MAX_MODES]; int64_t prediction_type_threshes[TOTAL_REFS_PER_FRAME][REFERENCE_MODES]; int RDMULT; int RDDIV; } RD_OPT; static INLINE void av1_init_rd_stats(RD_STATS *rd_stats) { #if CONFIG_RD_DEBUG int plane; #endif rd_stats->rate = 0; rd_stats->dist = 0; rd_stats->rdcost = 0; rd_stats->sse = 0; rd_stats->skip = 1; #if CONFIG_RD_DEBUG for (plane = 0; plane < MAX_MB_PLANE; ++plane) { rd_stats->txb_coeff_cost[plane] = 0; #if CONFIG_VAR_TX { int r, c; for (r = 0; r < TXB_COEFF_COST_MAP_SIZE; ++r) for (c = 0; c < TXB_COEFF_COST_MAP_SIZE; ++c) rd_stats->txb_coeff_cost_map[plane][r][c] = 0; } #endif } #endif } static INLINE void av1_invalid_rd_stats(RD_STATS *rd_stats) { #if CONFIG_RD_DEBUG int plane; #endif rd_stats->rate = INT_MAX; rd_stats->dist = INT64_MAX; rd_stats->rdcost = INT64_MAX; rd_stats->sse = INT64_MAX; rd_stats->skip = 0; #if CONFIG_RD_DEBUG for (plane = 0; plane < MAX_MB_PLANE; ++plane) { rd_stats->txb_coeff_cost[plane] = INT_MAX; #if CONFIG_VAR_TX { int r, c; for (r = 0; r < TXB_COEFF_COST_MAP_SIZE; ++r) for (c = 0; c < TXB_COEFF_COST_MAP_SIZE; ++c) rd_stats->txb_coeff_cost_map[plane][r][c] = INT_MAX; } #endif } #endif } static INLINE void av1_merge_rd_stats(RD_STATS *rd_stats_dst, const RD_STATS *rd_stats_src) { #if CONFIG_RD_DEBUG int plane; #endif rd_stats_dst->rate += rd_stats_src->rate; rd_stats_dst->dist += rd_stats_src->dist; rd_stats_dst->sse += rd_stats_src->sse; rd_stats_dst->skip &= rd_stats_src->skip; #if CONFIG_RD_DEBUG for (plane = 0; plane < MAX_MB_PLANE; ++plane) { rd_stats_dst->txb_coeff_cost[plane] += rd_stats_src->txb_coeff_cost[plane]; #if CONFIG_VAR_TX { // TODO(angiebird): optimize this part int r, c; int ref_txb_coeff_cost = 0; for (r = 0; r < TXB_COEFF_COST_MAP_SIZE; ++r) for (c = 0; c < TXB_COEFF_COST_MAP_SIZE; ++c) { rd_stats_dst->txb_coeff_cost_map[plane][r][c] += rd_stats_src->txb_coeff_cost_map[plane][r][c]; ref_txb_coeff_cost += rd_stats_dst->txb_coeff_cost_map[plane][r][c]; } assert(ref_txb_coeff_cost == rd_stats_dst->txb_coeff_cost[plane]); } #endif } #endif } struct TileInfo; struct TileDataEnc; struct AV1_COMP; struct macroblock; int av1_compute_rd_mult(const struct AV1_COMP *cpi, int qindex); void av1_initialize_rd_consts(struct AV1_COMP *cpi); void av1_initialize_me_consts(const struct AV1_COMP *cpi, MACROBLOCK *x, int qindex); void av1_model_rd_from_var_lapndz(int64_t var, unsigned int n, unsigned int qstep, int *rate, int64_t *dist); int av1_get_switchable_rate(const struct AV1_COMP *cpi, const MACROBLOCKD *xd); int av1_raster_block_offset(BLOCK_SIZE plane_bsize, int raster_block, int stride); int16_t *av1_raster_block_offset_int16(BLOCK_SIZE plane_bsize, int raster_block, int16_t *base); YV12_BUFFER_CONFIG *av1_get_scaled_ref_frame(const struct AV1_COMP *cpi, int ref_frame); void av1_init_me_luts(void); #if CONFIG_REF_MV void av1_set_mvcost(MACROBLOCK *x, MV_REFERENCE_FRAME ref_frame, int ref, int ref_mv_idx); #endif void av1_get_entropy_contexts(BLOCK_SIZE bsize, TX_SIZE tx_size, const struct macroblockd_plane *pd, ENTROPY_CONTEXT t_above[2 * MAX_MIB_SIZE], ENTROPY_CONTEXT t_left[2 * MAX_MIB_SIZE]); void av1_set_rd_speed_thresholds(struct AV1_COMP *cpi); void av1_set_rd_speed_thresholds_sub8x8(struct AV1_COMP *cpi); void av1_update_rd_thresh_fact(const AV1_COMMON *const cm, int (*fact)[MAX_MODES], int rd_thresh, int bsize, int best_mode_index); void av1_fill_token_costs(av1_coeff_cost *c, av1_coeff_probs_model (*p)[PLANE_TYPES]); static INLINE int rd_less_than_thresh(int64_t best_rd, int thresh, int thresh_fact) { return best_rd < ((int64_t)thresh * thresh_fact >> 5) || thresh == INT_MAX; } void av1_mv_pred(const struct AV1_COMP *cpi, MACROBLOCK *x, uint8_t *ref_y_buffer, int ref_y_stride, int ref_frame, BLOCK_SIZE block_size); static INLINE void set_error_per_bit(MACROBLOCK *x, int rdmult) { x->errorperbit = rdmult >> RD_EPB_SHIFT; x->errorperbit += (x->errorperbit == 0); } void av1_setup_pred_block(const MACROBLOCKD *xd, struct buf_2d dst[MAX_MB_PLANE], const YV12_BUFFER_CONFIG *src, int mi_row, int mi_col, const struct scale_factors *scale, const struct scale_factors *scale_uv); int av1_get_intra_cost_penalty(int qindex, int qdelta, aom_bit_depth_t bit_depth); #ifdef __cplusplus } // extern "C" #endif #endif // AV1_ENCODER_RD_H_