/* * Copyright (c) 2016, Alliance for Open Media. All rights reserved * * This source code is subject to the terms of the BSD 2 Clause License and * the Alliance for Open Media Patent License 1.0. If the BSD 2 Clause License * was not distributed with this source code in the LICENSE file, you can * obtain it at www.aomedia.org/license/software. If the Alliance for Open * Media Patent License 1.0 was not distributed with this source code in the * PATENTS file, you can obtain it at www.aomedia.org/license/patent. */ #ifndef AV1_ENCODER_BLOCK_H_ #define AV1_ENCODER_BLOCK_H_ #include "av1/common/entropymv.h" #include "av1/common/entropy.h" #if CONFIG_PVQ #include "av1/encoder/encint.h" #endif #include "av1/common/mvref_common.h" #ifdef __cplusplus extern "C" { #endif #if CONFIG_PVQ // Maximum possible # of tx blocks in luma plane, which is currently 256, // since there can be 16x16 of 4x4 tx. #define MAX_PVQ_BLOCKS_IN_SB (MAX_SB_SQUARE >> 2 * OD_LOG_BSIZE0) #endif typedef struct { unsigned int sse; int sum; unsigned int var; } DIFF; typedef struct macroblock_plane { DECLARE_ALIGNED(16, int16_t, src_diff[MAX_SB_SQUARE]); #if CONFIG_PVQ DECLARE_ALIGNED(16, int16_t, src_int16[MAX_SB_SQUARE]); #endif tran_low_t *qcoeff; tran_low_t *coeff; uint16_t *eobs; #if CONFIG_LV_MAP uint8_t *txb_entropy_ctx; #endif struct buf_2d src; // Quantizer setings const int16_t *quant_fp; const int16_t *round_fp; const int16_t *quant; const int16_t *quant_shift; const int16_t *zbin; const int16_t *round; #if CONFIG_NEW_QUANT const cuml_bins_type_nuq *cuml_bins_nuq[QUANT_PROFILES]; #endif // CONFIG_NEW_QUANT } MACROBLOCK_PLANE; /* The [2] dimension is for whether we skip the EOB node (i.e. if previous * coefficient in this block was zero) or not. */ typedef unsigned int av1_coeff_cost[PLANE_TYPES][REF_TYPES][COEF_BANDS][2] [COEFF_CONTEXTS][ENTROPY_TOKENS]; typedef struct { int_mv ref_mvs[MODE_CTX_REF_FRAMES][MAX_MV_REF_CANDIDATES]; int16_t mode_context[MODE_CTX_REF_FRAMES]; #if CONFIG_LV_MAP // TODO(angiebird): Reduce the buffer size according to sb_type tran_low_t tcoeff[MAX_MB_PLANE][MAX_SB_SQUARE]; uint16_t eobs[MAX_MB_PLANE][MAX_SB_SQUARE / (TX_SIZE_W_MIN * TX_SIZE_H_MIN)]; uint8_t txb_skip_ctx[MAX_MB_PLANE] [MAX_SB_SQUARE / (TX_SIZE_W_MIN * TX_SIZE_H_MIN)]; int dc_sign_ctx[MAX_MB_PLANE] [MAX_SB_SQUARE / (TX_SIZE_W_MIN * TX_SIZE_H_MIN)]; #endif uint8_t ref_mv_count[MODE_CTX_REF_FRAMES]; CANDIDATE_MV ref_mv_stack[MODE_CTX_REF_FRAMES][MAX_REF_MV_STACK_SIZE]; #if CONFIG_EXT_INTER int16_t compound_mode_context[MODE_CTX_REF_FRAMES]; #endif // CONFIG_EXT_INTER } MB_MODE_INFO_EXT; typedef struct { int col_min; int col_max; int row_min; int row_max; } MvLimits; #if CONFIG_PALETTE typedef struct { uint8_t best_palette_color_map[MAX_SB_SQUARE]; float kmeans_data_buf[2 * MAX_SB_SQUARE]; } PALETTE_BUFFER; #endif // CONFIG_PALETTE typedef struct macroblock MACROBLOCK; struct macroblock { struct macroblock_plane plane[MAX_MB_PLANE]; MACROBLOCKD e_mbd; MB_MODE_INFO_EXT *mbmi_ext; int skip_block; int qindex; // The equivalent error at the current rdmult of one whole bit (not one // bitcost unit). int errorperbit; // The equivalend SAD error of one (whole) bit at the current quantizer // for large blocks. int sadperbit16; // The equivalend SAD error of one (whole) bit at the current quantizer // for sub-8x8 blocks. int sadperbit4; int rddiv; int rdmult; int mb_energy; int *m_search_count_ptr; int *ex_search_count_ptr; #if CONFIG_VAR_TX unsigned int txb_split_count; #endif // These are set to their default values at the beginning, and then adjusted // further in the encoding process. BLOCK_SIZE min_partition_size; BLOCK_SIZE max_partition_size; int mv_best_ref_index[TOTAL_REFS_PER_FRAME]; unsigned int max_mv_context[TOTAL_REFS_PER_FRAME]; unsigned int source_variance; unsigned int pred_sse[TOTAL_REFS_PER_FRAME]; int pred_mv_sad[TOTAL_REFS_PER_FRAME]; int *nmvjointcost; int nmv_vec_cost[NMV_CONTEXTS][MV_JOINTS]; int *nmvcost[NMV_CONTEXTS][2]; int *nmvcost_hp[NMV_CONTEXTS][2]; int **mv_cost_stack[NMV_CONTEXTS]; int **mvcost; #if CONFIG_MOTION_VAR int32_t *wsrc_buf; int32_t *mask_buf; uint8_t *above_pred_buf; uint8_t *left_pred_buf; #endif // CONFIG_MOTION_VAR #if CONFIG_PALETTE PALETTE_BUFFER *palette_buffer; #endif // CONFIG_PALETTE // These define limits to motion vector components to prevent them // from extending outside the UMV borders MvLimits mv_limits; #if CONFIG_VAR_TX uint8_t blk_skip[MAX_MB_PLANE][MAX_MIB_SIZE * MAX_MIB_SIZE * 8]; uint8_t blk_skip_drl[MAX_MB_PLANE][MAX_MIB_SIZE * MAX_MIB_SIZE * 8]; #endif int skip; #if CONFIG_CB4X4 int skip_chroma_rd; #endif // note that token_costs is the cost when eob node is skipped av1_coeff_cost token_costs[TX_SIZES]; int optimize; // Used to store sub partition's choices. MV pred_mv[TOTAL_REFS_PER_FRAME]; // Store the best motion vector during motion search int_mv best_mv; // Store the second best motion vector during full-pixel motion search int_mv second_best_mv; // use default transform and skip transform type search for intra modes int use_default_intra_tx_type; // use default transform and skip transform type search for inter modes int use_default_inter_tx_type; #if CONFIG_PVQ int rate; // 1 if neither AC nor DC is coded. Only used during RDO. int pvq_skip[MAX_MB_PLANE]; PVQ_QUEUE *pvq_q; // Storage for PVQ tx block encodings in a superblock. // There can be max 16x16 of 4x4 blocks (and YUV) encode by PVQ // 256 is the max # of 4x4 blocks in a SB (64x64), which comes from: // 1) Since PVQ is applied to each trasnform-ed block // 2) 4x4 is the smallest tx size in AV1 // 3) AV1 allows using smaller tx size than block (i.e. partition) size // TODO(yushin) : The memory usage could be improved a lot, since this has // storage for 10 bands and 128 coefficients for every 4x4 block, PVQ_INFO pvq[MAX_PVQ_BLOCKS_IN_SB][MAX_MB_PLANE]; daala_enc_ctx daala_enc; int pvq_speed; int pvq_coded; // Indicates whether pvq_info needs be stored to tokenize #endif #if CONFIG_DAALA_DIST // Keep rate of each 4x4 block in the current macroblock during RDO // This is needed when using the 8x8 Daala distortion metric during RDO, // because it evaluates distortion in a different order than the underlying // 4x4 blocks are coded. int rate_4x4[MAX_SB_SQUARE / (TX_SIZE_W_MIN * TX_SIZE_H_MIN)]; #if CONFIG_CB4X4 DECLARE_ALIGNED(16, uint8_t, decoded_8x8[8 * 8]); #endif // CONFIG_CB4X4 #endif // CONFIG_DAALA_DIST #if CONFIG_CFL // Whether luma needs to be stored during RDO. int cfl_store_y; #endif }; #ifdef __cplusplus } // extern "C" #endif #endif // AV1_ENCODER_BLOCK_H_