/* * Copyright (c) 2016, Alliance for Open Media. All rights reserved * * This source code is subject to the terms of the BSD 2 Clause License and * the Alliance for Open Media Patent License 1.0. If the BSD 2 Clause License * was not distributed with this source code in the LICENSE file, you can * obtain it at www.aomedia.org/license/software. If the Alliance for Open * Media Patent License 1.0 was not distributed with this source code in the * PATENTS file, you can obtain it at www.aomedia.org/license/patent. */ #include #include #include "./aom_config.h" #include "aom/aom_encoder.h" #include "aom_ports/aom_once.h" #include "aom_ports/system_state.h" #include "aom/internal/aom_codec_internal.h" #include "./aom_version.h" #include "av1/encoder/encoder.h" #include "aom/aomcx.h" #include "av1/encoder/firstpass.h" #include "av1/av1_iface_common.h" struct av1_extracfg { int cpu_used; // available cpu percentage in 1/16 unsigned int enable_auto_alt_ref; #if CONFIG_EXT_REFS unsigned int enable_auto_bwd_ref; #endif // CONFIG_EXT_REFS unsigned int noise_sensitivity; unsigned int sharpness; unsigned int static_thresh; unsigned int tile_columns; unsigned int tile_rows; #if CONFIG_DEPENDENT_HORZTILES unsigned int dependent_horz_tiles; #endif #if CONFIG_LOOPFILTERING_ACROSS_TILES unsigned int loop_filter_across_tiles_enabled; #endif // CONFIG_LOOPFILTERING_ACROSS_TILES unsigned int arnr_max_frames; unsigned int arnr_strength; unsigned int min_gf_interval; unsigned int max_gf_interval; aom_tune_metric tuning; unsigned int cq_level; // constrained quality level unsigned int rc_max_intra_bitrate_pct; unsigned int rc_max_inter_bitrate_pct; unsigned int gf_cbr_boost_pct; unsigned int lossless; #if CONFIG_AOM_QM unsigned int enable_qm; unsigned int qm_min; unsigned int qm_max; #endif unsigned int num_tg; unsigned int mtu_size; #if CONFIG_TEMPMV_SIGNALING unsigned int disable_tempmv; #endif unsigned int frame_parallel_decoding_mode; AQ_MODE aq_mode; #if CONFIG_EXT_DELTA_Q DELTAQ_MODE deltaq_mode; #endif unsigned int frame_periodic_boost; aom_bit_depth_t bit_depth; aom_tune_content content; aom_color_space_t color_space; #if CONFIG_COLORSPACE_HEADERS aom_transfer_function_t transfer_function; aom_chroma_sample_position_t chroma_sample_position; #endif int color_range; int render_width; int render_height; aom_superblock_size_t superblock_size; #if CONFIG_ANS && ANS_MAX_SYMBOLS int ans_window_size_log2; #endif #if CONFIG_EXT_TILE unsigned int single_tile_decoding; #endif // CONFIG_EXT_TILE unsigned int motion_vector_unit_test; }; static struct av1_extracfg default_extra_cfg = { 0, // cpu_used 1, // enable_auto_alt_ref #if CONFIG_EXT_REFS 0, // enable_auto_bwd_ref #endif // CONFIG_EXT_REFS 0, // noise_sensitivity 0, // sharpness 0, // static_thresh 0, // tile_columns 0, // tile_rows #if CONFIG_DEPENDENT_HORZTILES 0, // Dependent Horizontal tiles #endif #if CONFIG_LOOPFILTERING_ACROSS_TILES 1, // loop_filter_across_tiles_enabled #endif // CONFIG_LOOPFILTERING_ACROSS_TILES 7, // arnr_max_frames 5, // arnr_strength 0, // min_gf_interval; 0 -> default decision 0, // max_gf_interval; 0 -> default decision AOM_TUNE_PSNR, // tuning 10, // cq_level 0, // rc_max_intra_bitrate_pct 0, // rc_max_inter_bitrate_pct 0, // gf_cbr_boost_pct 0, // lossless #if CONFIG_AOM_QM 0, // enable_qm DEFAULT_QM_FIRST, // qm_min DEFAULT_QM_LAST, // qm_max #endif 1, // max number of tile groups 0, // mtu_size #if CONFIG_TEMPMV_SIGNALING 0, // disable temporal mv prediction #endif 1, // frame_parallel_decoding_mode NO_AQ, // aq_mode #if CONFIG_EXT_DELTA_Q NO_DELTA_Q, // deltaq_mode #endif CONFIG_XIPHRC, // frame_periodic_delta_q AOM_BITS_8, // Bit depth AOM_CONTENT_DEFAULT, // content AOM_CS_UNKNOWN, // color space #if CONFIG_COLORSPACE_HEADERS AOM_TF_UNKNOWN, // transfer function AOM_CSP_UNKNOWN, // chroma sample position #endif 0, // color range 0, // render width 0, // render height AOM_SUPERBLOCK_SIZE_DYNAMIC, // superblock_size #if CONFIG_ANS && ANS_MAX_SYMBOLS 23, // ans_window_size_log2 #endif #if CONFIG_EXT_TILE 0, // Single tile decoding is off by default. #endif // CONFIG_EXT_TILE 0, // motion_vector_unit_test }; struct aom_codec_alg_priv { aom_codec_priv_t base; aom_codec_enc_cfg_t cfg; struct av1_extracfg extra_cfg; AV1EncoderConfig oxcf; AV1_COMP *cpi; unsigned char *cx_data; size_t cx_data_sz; unsigned char *pending_cx_data; size_t pending_cx_data_sz; int pending_frame_count; size_t pending_frame_sizes[8]; aom_image_t preview_img; aom_enc_frame_flags_t next_frame_flags; aom_postproc_cfg_t preview_ppcfg; aom_codec_pkt_list_decl(256) pkt_list; unsigned int fixed_kf_cntr; // BufferPool that holds all reference frames. BufferPool *buffer_pool; }; static aom_codec_err_t update_error_state( aom_codec_alg_priv_t *ctx, const struct aom_internal_error_info *error) { const aom_codec_err_t res = error->error_code; if (res != AOM_CODEC_OK) ctx->base.err_detail = error->has_detail ? error->detail : NULL; return res; } #undef ERROR #define ERROR(str) \ do { \ ctx->base.err_detail = str; \ return AOM_CODEC_INVALID_PARAM; \ } while (0) #define RANGE_CHECK(p, memb, lo, hi) \ do { \ if (!((p)->memb >= (lo) && (p)->memb <= (hi))) \ ERROR(#memb " out of range [" #lo ".." #hi "]"); \ } while (0) #define RANGE_CHECK_HI(p, memb, hi) \ do { \ if (!((p)->memb <= (hi))) ERROR(#memb " out of range [.." #hi "]"); \ } while (0) #define RANGE_CHECK_LO(p, memb, lo) \ do { \ if (!((p)->memb >= (lo))) ERROR(#memb " out of range [" #lo "..]"); \ } while (0) #define RANGE_CHECK_BOOL(p, memb) \ do { \ if (!!((p)->memb) != (p)->memb) ERROR(#memb " expected boolean"); \ } while (0) static aom_codec_err_t validate_config(aom_codec_alg_priv_t *ctx, const aom_codec_enc_cfg_t *cfg, const struct av1_extracfg *extra_cfg) { RANGE_CHECK(cfg, g_w, 1, 65535); // 16 bits available RANGE_CHECK(cfg, g_h, 1, 65535); // 16 bits available RANGE_CHECK(cfg, g_timebase.den, 1, 1000000000); RANGE_CHECK(cfg, g_timebase.num, 1, cfg->g_timebase.den); RANGE_CHECK_HI(cfg, g_profile, 3); RANGE_CHECK_HI(cfg, rc_max_quantizer, 63); RANGE_CHECK_HI(cfg, rc_min_quantizer, cfg->rc_max_quantizer); RANGE_CHECK_BOOL(extra_cfg, lossless); RANGE_CHECK(extra_cfg, aq_mode, 0, AQ_MODE_COUNT - 1); #if CONFIG_EXT_DELTA_Q RANGE_CHECK(extra_cfg, deltaq_mode, 0, DELTAQ_MODE_COUNT - 1); #endif RANGE_CHECK_HI(extra_cfg, frame_periodic_boost, 1); RANGE_CHECK_HI(cfg, g_threads, 64); RANGE_CHECK_HI(cfg, g_lag_in_frames, MAX_LAG_BUFFERS); RANGE_CHECK(cfg, rc_end_usage, AOM_VBR, AOM_Q); RANGE_CHECK_HI(cfg, rc_undershoot_pct, 100); RANGE_CHECK_HI(cfg, rc_overshoot_pct, 100); RANGE_CHECK_HI(cfg, rc_2pass_vbr_bias_pct, 100); RANGE_CHECK(cfg, kf_mode, AOM_KF_DISABLED, AOM_KF_AUTO); RANGE_CHECK_HI(cfg, rc_dropframe_thresh, 100); RANGE_CHECK(cfg, g_pass, AOM_RC_ONE_PASS, AOM_RC_LAST_PASS); RANGE_CHECK_HI(extra_cfg, min_gf_interval, MAX_LAG_BUFFERS - 1); RANGE_CHECK_HI(extra_cfg, max_gf_interval, MAX_LAG_BUFFERS - 1); if (extra_cfg->max_gf_interval > 0) { RANGE_CHECK(extra_cfg, max_gf_interval, 2, (MAX_LAG_BUFFERS - 1)); } if (extra_cfg->min_gf_interval > 0 && extra_cfg->max_gf_interval > 0) { RANGE_CHECK(extra_cfg, max_gf_interval, extra_cfg->min_gf_interval, (MAX_LAG_BUFFERS - 1)); } RANGE_CHECK_HI(cfg, rc_resize_mode, RESIZE_DYNAMIC); RANGE_CHECK(cfg, rc_resize_numerator, SCALE_DENOMINATOR / 2, SCALE_DENOMINATOR); RANGE_CHECK(cfg, rc_resize_kf_numerator, SCALE_DENOMINATOR / 2, SCALE_DENOMINATOR); #if CONFIG_FRAME_SUPERRES RANGE_CHECK_HI(cfg, rc_superres_mode, SUPERRES_DYNAMIC); RANGE_CHECK(cfg, rc_superres_numerator, SCALE_DENOMINATOR / 2, SCALE_DENOMINATOR); RANGE_CHECK(cfg, rc_superres_kf_numerator, SCALE_DENOMINATOR / 2, SCALE_DENOMINATOR); #endif // CONFIG_FRAME_SUPERRES // AV1 does not support a lower bound on the keyframe interval in // automatic keyframe placement mode. if (cfg->kf_mode != AOM_KF_DISABLED && cfg->kf_min_dist != cfg->kf_max_dist && cfg->kf_min_dist > 0) ERROR( "kf_min_dist not supported in auto mode, use 0 " "or kf_max_dist instead."); RANGE_CHECK_HI(extra_cfg, motion_vector_unit_test, 2); RANGE_CHECK_HI(extra_cfg, enable_auto_alt_ref, 2); #if CONFIG_EXT_REFS RANGE_CHECK_HI(extra_cfg, enable_auto_bwd_ref, 2); #endif // CONFIG_EXT_REFS RANGE_CHECK(extra_cfg, cpu_used, 0, 8); RANGE_CHECK_HI(extra_cfg, noise_sensitivity, 6); RANGE_CHECK(extra_cfg, superblock_size, AOM_SUPERBLOCK_SIZE_64X64, AOM_SUPERBLOCK_SIZE_DYNAMIC); #if CONFIG_EXT_TILE RANGE_CHECK_HI(cfg, large_scale_tile, 1); RANGE_CHECK_HI(extra_cfg, single_tile_decoding, 1); if (cfg->large_scale_tile) { // TODO(any): Waring. If CONFIG_EXT_TILE is true, tile_columns really // means tile_width, and tile_rows really means tile_hight. The interface // should be sanitized. #if CONFIG_EXT_PARTITION if (extra_cfg->superblock_size != AOM_SUPERBLOCK_SIZE_64X64) { if (extra_cfg->tile_columns != 0) RANGE_CHECK(extra_cfg, tile_columns, 1, 32); if (extra_cfg->tile_rows != 0) RANGE_CHECK(extra_cfg, tile_rows, 1, 32); } else { #endif // CONFIG_EXT_PARTITION if (extra_cfg->tile_columns != 0) RANGE_CHECK(extra_cfg, tile_columns, 1, 64); if (extra_cfg->tile_rows != 0) RANGE_CHECK(extra_cfg, tile_rows, 1, 64); #if CONFIG_EXT_PARTITION } #endif // CONFIG_EXT_PARTITION } else { #endif // CONFIG_EXT_TILE RANGE_CHECK_HI(extra_cfg, tile_columns, 6); RANGE_CHECK_HI(extra_cfg, tile_rows, 2); #if CONFIG_EXT_TILE } #endif // CONFIG_EXT_TILE #if CONFIG_DEPENDENT_HORZTILES RANGE_CHECK_HI(extra_cfg, dependent_horz_tiles, 1); #endif #if CONFIG_LOOPFILTERING_ACROSS_TILES RANGE_CHECK_HI(extra_cfg, loop_filter_across_tiles_enabled, 1); #endif // CONFIG_LOOPFILTERING_ACROSS_TILES RANGE_CHECK_HI(extra_cfg, sharpness, 7); RANGE_CHECK_HI(extra_cfg, arnr_max_frames, 15); RANGE_CHECK_HI(extra_cfg, arnr_strength, 6); RANGE_CHECK_HI(extra_cfg, cq_level, 63); RANGE_CHECK(cfg, g_bit_depth, AOM_BITS_8, AOM_BITS_12); RANGE_CHECK(cfg, g_input_bit_depth, 8, 12); RANGE_CHECK(extra_cfg, content, AOM_CONTENT_DEFAULT, AOM_CONTENT_INVALID - 1); // TODO(yaowu): remove this when ssim tuning is implemented for av1 if (extra_cfg->tuning == AOM_TUNE_SSIM) ERROR("Option --tune=ssim is not currently supported in AV1."); if (cfg->g_pass == AOM_RC_LAST_PASS) { #if !CONFIG_XIPHRC const size_t packet_sz = sizeof(FIRSTPASS_STATS); const int n_packets = (int)(cfg->rc_twopass_stats_in.sz / packet_sz); const FIRSTPASS_STATS *stats; #endif if (cfg->rc_twopass_stats_in.buf == NULL) ERROR("rc_twopass_stats_in.buf not set."); #if !CONFIG_XIPHRC if (cfg->rc_twopass_stats_in.sz % packet_sz) ERROR("rc_twopass_stats_in.sz indicates truncated packet."); if (cfg->rc_twopass_stats_in.sz < 2 * packet_sz) ERROR("rc_twopass_stats_in requires at least two packets."); stats = (const FIRSTPASS_STATS *)cfg->rc_twopass_stats_in.buf + n_packets - 1; if ((int)(stats->count + 0.5) != n_packets - 1) ERROR("rc_twopass_stats_in missing EOS stats packet"); #endif } #if !CONFIG_HIGHBITDEPTH if (cfg->g_profile > (unsigned int)PROFILE_1) { ERROR("Profile > 1 not supported in this build configuration"); } #endif if (cfg->g_profile <= (unsigned int)PROFILE_1 && cfg->g_bit_depth > AOM_BITS_8) { ERROR("Codec high bit-depth not supported in profile < 2"); } if (cfg->g_profile <= (unsigned int)PROFILE_1 && cfg->g_input_bit_depth > 8) { ERROR("Source high bit-depth not supported in profile < 2"); } if (cfg->g_profile > (unsigned int)PROFILE_1 && cfg->g_bit_depth == AOM_BITS_8) { ERROR("Codec bit-depth 8 not supported in profile > 1"); } #if CONFIG_COLORSPACE_HEADERS RANGE_CHECK(extra_cfg, color_space, AOM_CS_UNKNOWN, AOM_CS_ICTCP); RANGE_CHECK(extra_cfg, transfer_function, AOM_TF_UNKNOWN, AOM_TF_HLG); RANGE_CHECK(extra_cfg, chroma_sample_position, AOM_CSP_UNKNOWN, AOM_CSP_COLOCATED); #else RANGE_CHECK(extra_cfg, color_space, AOM_CS_UNKNOWN, AOM_CS_SRGB); #endif RANGE_CHECK(extra_cfg, color_range, 0, 1); #if CONFIG_ANS && ANS_MAX_SYMBOLS RANGE_CHECK(extra_cfg, ans_window_size_log2, 8, 23); #endif return AOM_CODEC_OK; } static aom_codec_err_t validate_img(aom_codec_alg_priv_t *ctx, const aom_image_t *img) { switch (img->fmt) { case AOM_IMG_FMT_YV12: case AOM_IMG_FMT_I420: case AOM_IMG_FMT_I42016: break; case AOM_IMG_FMT_I422: case AOM_IMG_FMT_I444: case AOM_IMG_FMT_I440: if (ctx->cfg.g_profile != (unsigned int)PROFILE_1) { ERROR( "Invalid image format. I422, I444, I440 images are " "not supported in profile."); } break; case AOM_IMG_FMT_I42216: case AOM_IMG_FMT_I44416: case AOM_IMG_FMT_I44016: if (ctx->cfg.g_profile != (unsigned int)PROFILE_1 && ctx->cfg.g_profile != (unsigned int)PROFILE_3) { ERROR( "Invalid image format. 16-bit I422, I444, I440 images are " "not supported in profile."); } break; default: ERROR( "Invalid image format. Only YV12, I420, I422, I444 images are " "supported."); break; } if (img->d_w != ctx->cfg.g_w || img->d_h != ctx->cfg.g_h) ERROR("Image size must match encoder init configuration size"); return AOM_CODEC_OK; } static int get_image_bps(const aom_image_t *img) { switch (img->fmt) { case AOM_IMG_FMT_YV12: case AOM_IMG_FMT_I420: return 12; case AOM_IMG_FMT_I422: return 16; case AOM_IMG_FMT_I444: return 24; case AOM_IMG_FMT_I440: return 16; case AOM_IMG_FMT_I42016: return 24; case AOM_IMG_FMT_I42216: return 32; case AOM_IMG_FMT_I44416: return 48; case AOM_IMG_FMT_I44016: return 32; default: assert(0 && "Invalid image format"); break; } return 0; } static aom_codec_err_t set_encoder_config( AV1EncoderConfig *oxcf, const aom_codec_enc_cfg_t *cfg, const struct av1_extracfg *extra_cfg) { const int is_vbr = cfg->rc_end_usage == AOM_VBR; oxcf->profile = cfg->g_profile; oxcf->max_threads = (int)cfg->g_threads; oxcf->width = cfg->g_w; oxcf->height = cfg->g_h; oxcf->bit_depth = cfg->g_bit_depth; oxcf->input_bit_depth = cfg->g_input_bit_depth; // guess a frame rate if out of whack, use 30 oxcf->init_framerate = (double)cfg->g_timebase.den / cfg->g_timebase.num; if (oxcf->init_framerate > 180) oxcf->init_framerate = 30; oxcf->mode = GOOD; switch (cfg->g_pass) { case AOM_RC_ONE_PASS: oxcf->pass = 0; break; case AOM_RC_FIRST_PASS: oxcf->pass = 1; break; case AOM_RC_LAST_PASS: oxcf->pass = 2; break; } oxcf->lag_in_frames = cfg->g_pass == AOM_RC_FIRST_PASS ? 0 : cfg->g_lag_in_frames; oxcf->rc_mode = cfg->rc_end_usage; // Convert target bandwidth from Kbit/s to Bit/s oxcf->target_bandwidth = 1000 * cfg->rc_target_bitrate; oxcf->rc_max_intra_bitrate_pct = extra_cfg->rc_max_intra_bitrate_pct; oxcf->rc_max_inter_bitrate_pct = extra_cfg->rc_max_inter_bitrate_pct; oxcf->gf_cbr_boost_pct = extra_cfg->gf_cbr_boost_pct; oxcf->best_allowed_q = extra_cfg->lossless ? 0 : av1_quantizer_to_qindex(cfg->rc_min_quantizer); oxcf->worst_allowed_q = extra_cfg->lossless ? 0 : av1_quantizer_to_qindex(cfg->rc_max_quantizer); oxcf->cq_level = av1_quantizer_to_qindex(extra_cfg->cq_level); oxcf->fixed_q = -1; #if CONFIG_AOM_QM oxcf->using_qm = extra_cfg->enable_qm; oxcf->qm_minlevel = extra_cfg->qm_min; oxcf->qm_maxlevel = extra_cfg->qm_max; #endif oxcf->num_tile_groups = extra_cfg->num_tg; #if CONFIG_EXT_TILE // In large-scale tile encoding mode, num_tile_groups is always 1. if (cfg->large_scale_tile) oxcf->num_tile_groups = 1; #endif // CONFIG_EXT_TILE oxcf->mtu = extra_cfg->mtu_size; #if CONFIG_TEMPMV_SIGNALING oxcf->disable_tempmv = extra_cfg->disable_tempmv; #endif oxcf->under_shoot_pct = cfg->rc_undershoot_pct; oxcf->over_shoot_pct = cfg->rc_overshoot_pct; oxcf->resize_mode = (RESIZE_MODE)cfg->rc_resize_mode; oxcf->resize_scale_numerator = (uint8_t)cfg->rc_resize_numerator; oxcf->resize_kf_scale_numerator = (uint8_t)cfg->rc_resize_kf_numerator; if (oxcf->resize_mode == RESIZE_FIXED && oxcf->resize_scale_numerator == SCALE_DENOMINATOR && oxcf->resize_kf_scale_numerator == SCALE_DENOMINATOR) oxcf->resize_mode = RESIZE_NONE; #if CONFIG_FRAME_SUPERRES oxcf->superres_mode = (SUPERRES_MODE)cfg->rc_superres_mode; oxcf->superres_scale_numerator = (uint8_t)cfg->rc_superres_numerator; oxcf->superres_kf_scale_numerator = (uint8_t)cfg->rc_superres_kf_numerator; if (oxcf->superres_mode == SUPERRES_FIXED && oxcf->superres_scale_numerator == SCALE_DENOMINATOR && oxcf->superres_kf_scale_numerator == SCALE_DENOMINATOR) oxcf->superres_mode = SUPERRES_NONE; #endif // CONFIG_FRAME_SUPERRES oxcf->maximum_buffer_size_ms = is_vbr ? 240000 : cfg->rc_buf_sz; oxcf->starting_buffer_level_ms = is_vbr ? 60000 : cfg->rc_buf_initial_sz; oxcf->optimal_buffer_level_ms = is_vbr ? 60000 : cfg->rc_buf_optimal_sz; oxcf->drop_frames_water_mark = cfg->rc_dropframe_thresh; oxcf->two_pass_vbrbias = cfg->rc_2pass_vbr_bias_pct; oxcf->two_pass_vbrmin_section = cfg->rc_2pass_vbr_minsection_pct; oxcf->two_pass_vbrmax_section = cfg->rc_2pass_vbr_maxsection_pct; oxcf->auto_key = cfg->kf_mode == AOM_KF_AUTO && cfg->kf_min_dist != cfg->kf_max_dist; oxcf->key_freq = cfg->kf_max_dist; oxcf->speed = extra_cfg->cpu_used; oxcf->enable_auto_arf = extra_cfg->enable_auto_alt_ref; #if CONFIG_EXT_REFS oxcf->enable_auto_brf = extra_cfg->enable_auto_bwd_ref; #endif // CONFIG_EXT_REFS oxcf->noise_sensitivity = extra_cfg->noise_sensitivity; oxcf->sharpness = extra_cfg->sharpness; oxcf->two_pass_stats_in = cfg->rc_twopass_stats_in; #if CONFIG_FP_MB_STATS oxcf->firstpass_mb_stats_in = cfg->rc_firstpass_mb_stats_in; #endif oxcf->color_space = extra_cfg->color_space; #if CONFIG_COLORSPACE_HEADERS oxcf->transfer_function = extra_cfg->transfer_function; oxcf->chroma_sample_position = extra_cfg->chroma_sample_position; #endif oxcf->color_range = extra_cfg->color_range; oxcf->render_width = extra_cfg->render_width; oxcf->render_height = extra_cfg->render_height; oxcf->arnr_max_frames = extra_cfg->arnr_max_frames; oxcf->arnr_strength = extra_cfg->arnr_strength; oxcf->min_gf_interval = extra_cfg->min_gf_interval; oxcf->max_gf_interval = extra_cfg->max_gf_interval; oxcf->tuning = extra_cfg->tuning; oxcf->content = extra_cfg->content; #if CONFIG_EXT_PARTITION oxcf->superblock_size = extra_cfg->superblock_size; #endif // CONFIG_EXT_PARTITION #if CONFIG_ANS && ANS_MAX_SYMBOLS oxcf->ans_window_size_log2 = extra_cfg->ans_window_size_log2; #endif // CONFIG_ANS && ANS_MAX_SYMBOLS #if CONFIG_EXT_TILE oxcf->large_scale_tile = cfg->large_scale_tile; oxcf->single_tile_decoding = (oxcf->large_scale_tile) ? extra_cfg->single_tile_decoding : 0; if (oxcf->large_scale_tile) { #if CONFIG_EXT_PARTITION const unsigned int max = extra_cfg->superblock_size == AOM_SUPERBLOCK_SIZE_64X64 ? 64 : 32; #else const unsigned int max = 64; #endif // CONFIG_EXT_PARTITION // If tile size is not set, set it to the default value. const unsigned int tc = (!extra_cfg->tile_columns) ? UINT_MAX : extra_cfg->tile_columns; const unsigned int tr = (!extra_cfg->tile_rows) ? UINT_MAX : extra_cfg->tile_rows; oxcf->tile_columns = AOMMIN(tc, max); oxcf->tile_rows = AOMMIN(tr, max); } else { #endif // CONFIG_EXT_TILE oxcf->tile_columns = extra_cfg->tile_columns; oxcf->tile_rows = extra_cfg->tile_rows; #if CONFIG_EXT_TILE } #endif // CONFIG_EXT_TILE #if CONFIG_DEPENDENT_HORZTILES oxcf->dependent_horz_tiles = #if CONFIG_EXT_TILE (cfg->large_scale_tile) ? 0 : #endif // CONFIG_EXT_TILE extra_cfg->dependent_horz_tiles; #endif #if CONFIG_LOOPFILTERING_ACROSS_TILES oxcf->loop_filter_across_tiles_enabled = extra_cfg->loop_filter_across_tiles_enabled; #endif // CONFIG_LOOPFILTERING_ACROSS_TILES oxcf->error_resilient_mode = cfg->g_error_resilient; oxcf->frame_parallel_decoding_mode = extra_cfg->frame_parallel_decoding_mode; oxcf->aq_mode = extra_cfg->aq_mode; #if CONFIG_EXT_DELTA_Q oxcf->deltaq_mode = extra_cfg->deltaq_mode; #endif oxcf->frame_periodic_boost = extra_cfg->frame_periodic_boost; oxcf->motion_vector_unit_test = extra_cfg->motion_vector_unit_test; /* printf("Current AV1 Settings: \n"); printf("target_bandwidth: %d\n", oxcf->target_bandwidth); printf("noise_sensitivity: %d\n", oxcf->noise_sensitivity); printf("sharpness: %d\n", oxcf->sharpness); printf("cpu_used: %d\n", oxcf->cpu_used); printf("Mode: %d\n", oxcf->mode); printf("auto_key: %d\n", oxcf->auto_key); printf("key_freq: %d\n", oxcf->key_freq); printf("end_usage: %d\n", oxcf->end_usage); printf("under_shoot_pct: %d\n", oxcf->under_shoot_pct); printf("over_shoot_pct: %d\n", oxcf->over_shoot_pct); printf("starting_buffer_level: %d\n", oxcf->starting_buffer_level); printf("optimal_buffer_level: %d\n", oxcf->optimal_buffer_level); printf("maximum_buffer_size: %d\n", oxcf->maximum_buffer_size); printf("fixed_q: %d\n", oxcf->fixed_q); printf("worst_allowed_q: %d\n", oxcf->worst_allowed_q); printf("best_allowed_q: %d\n", oxcf->best_allowed_q); printf("allow_spatial_resampling: %d\n", oxcf->allow_spatial_resampling); printf("scaled_frame_width: %d\n", oxcf->scaled_frame_width); printf("scaled_frame_height: %d\n", oxcf->scaled_frame_height); printf("two_pass_vbrbias: %d\n", oxcf->two_pass_vbrbias); printf("two_pass_vbrmin_section: %d\n", oxcf->two_pass_vbrmin_section); printf("two_pass_vbrmax_section: %d\n", oxcf->two_pass_vbrmax_section); printf("lag_in_frames: %d\n", oxcf->lag_in_frames); printf("enable_auto_arf: %d\n", oxcf->enable_auto_arf); printf("Version: %d\n", oxcf->Version); printf("error resilient: %d\n", oxcf->error_resilient_mode); printf("frame parallel detokenization: %d\n", oxcf->frame_parallel_decoding_mode); */ return AOM_CODEC_OK; } static aom_codec_err_t encoder_set_config(aom_codec_alg_priv_t *ctx, const aom_codec_enc_cfg_t *cfg) { aom_codec_err_t res; int force_key = 0; if (cfg->g_w != ctx->cfg.g_w || cfg->g_h != ctx->cfg.g_h) { if (cfg->g_lag_in_frames > 1 || cfg->g_pass != AOM_RC_ONE_PASS) ERROR("Cannot change width or height after initialization"); if (!valid_ref_frame_size(ctx->cfg.g_w, ctx->cfg.g_h, cfg->g_w, cfg->g_h) || (ctx->cpi->initial_width && (int)cfg->g_w > ctx->cpi->initial_width) || (ctx->cpi->initial_height && (int)cfg->g_h > ctx->cpi->initial_height)) force_key = 1; } // Prevent increasing lag_in_frames. This check is stricter than it needs // to be -- the limit is not increasing past the first lag_in_frames // value, but we don't track the initial config, only the last successful // config. if (cfg->g_lag_in_frames > ctx->cfg.g_lag_in_frames) ERROR("Cannot increase lag_in_frames"); res = validate_config(ctx, cfg, &ctx->extra_cfg); if (res == AOM_CODEC_OK) { ctx->cfg = *cfg; set_encoder_config(&ctx->oxcf, &ctx->cfg, &ctx->extra_cfg); // On profile change, request a key frame force_key |= ctx->cpi->common.profile != ctx->oxcf.profile; av1_change_config(ctx->cpi, &ctx->oxcf); } if (force_key) ctx->next_frame_flags |= AOM_EFLAG_FORCE_KF; return res; } static aom_codec_err_t ctrl_get_quantizer(aom_codec_alg_priv_t *ctx, va_list args) { int *const arg = va_arg(args, int *); if (arg == NULL) return AOM_CODEC_INVALID_PARAM; *arg = av1_get_quantizer(ctx->cpi); return AOM_CODEC_OK; } static aom_codec_err_t ctrl_get_quantizer64(aom_codec_alg_priv_t *ctx, va_list args) { int *const arg = va_arg(args, int *); if (arg == NULL) return AOM_CODEC_INVALID_PARAM; *arg = av1_qindex_to_quantizer(av1_get_quantizer(ctx->cpi)); return AOM_CODEC_OK; } static aom_codec_err_t update_extra_cfg(aom_codec_alg_priv_t *ctx, const struct av1_extracfg *extra_cfg) { const aom_codec_err_t res = validate_config(ctx, &ctx->cfg, extra_cfg); if (res == AOM_CODEC_OK) { ctx->extra_cfg = *extra_cfg; set_encoder_config(&ctx->oxcf, &ctx->cfg, &ctx->extra_cfg); av1_change_config(ctx->cpi, &ctx->oxcf); } return res; } static aom_codec_err_t ctrl_set_cpuused(aom_codec_alg_priv_t *ctx, va_list args) { struct av1_extracfg extra_cfg = ctx->extra_cfg; extra_cfg.cpu_used = CAST(AOME_SET_CPUUSED, args); return update_extra_cfg(ctx, &extra_cfg); } static aom_codec_err_t ctrl_set_enable_auto_alt_ref(aom_codec_alg_priv_t *ctx, va_list args) { struct av1_extracfg extra_cfg = ctx->extra_cfg; extra_cfg.enable_auto_alt_ref = CAST(AOME_SET_ENABLEAUTOALTREF, args); return update_extra_cfg(ctx, &extra_cfg); } #if CONFIG_EXT_REFS static aom_codec_err_t ctrl_set_enable_auto_bwd_ref(aom_codec_alg_priv_t *ctx, va_list args) { struct av1_extracfg extra_cfg = ctx->extra_cfg; extra_cfg.enable_auto_bwd_ref = CAST(AOME_SET_ENABLEAUTOBWDREF, args); return update_extra_cfg(ctx, &extra_cfg); } #endif // CONFIG_EXT_REFS static aom_codec_err_t ctrl_set_noise_sensitivity(aom_codec_alg_priv_t *ctx, va_list args) { struct av1_extracfg extra_cfg = ctx->extra_cfg; extra_cfg.noise_sensitivity = CAST(AV1E_SET_NOISE_SENSITIVITY, args); return update_extra_cfg(ctx, &extra_cfg); } static aom_codec_err_t ctrl_set_sharpness(aom_codec_alg_priv_t *ctx, va_list args) { struct av1_extracfg extra_cfg = ctx->extra_cfg; extra_cfg.sharpness = CAST(AOME_SET_SHARPNESS, args); return update_extra_cfg(ctx, &extra_cfg); } static aom_codec_err_t ctrl_set_static_thresh(aom_codec_alg_priv_t *ctx, va_list args) { struct av1_extracfg extra_cfg = ctx->extra_cfg; extra_cfg.static_thresh = CAST(AOME_SET_STATIC_THRESHOLD, args); return update_extra_cfg(ctx, &extra_cfg); } static aom_codec_err_t ctrl_set_tile_columns(aom_codec_alg_priv_t *ctx, va_list args) { struct av1_extracfg extra_cfg = ctx->extra_cfg; extra_cfg.tile_columns = CAST(AV1E_SET_TILE_COLUMNS, args); return update_extra_cfg(ctx, &extra_cfg); } static aom_codec_err_t ctrl_set_tile_rows(aom_codec_alg_priv_t *ctx, va_list args) { struct av1_extracfg extra_cfg = ctx->extra_cfg; extra_cfg.tile_rows = CAST(AV1E_SET_TILE_ROWS, args); return update_extra_cfg(ctx, &extra_cfg); } #if CONFIG_DEPENDENT_HORZTILES static aom_codec_err_t ctrl_set_tile_dependent_rows(aom_codec_alg_priv_t *ctx, va_list args) { struct av1_extracfg extra_cfg = ctx->extra_cfg; extra_cfg.dependent_horz_tiles = CAST(AV1E_SET_TILE_DEPENDENT_ROWS, args); return update_extra_cfg(ctx, &extra_cfg); } #endif #if CONFIG_LOOPFILTERING_ACROSS_TILES static aom_codec_err_t ctrl_set_tile_loopfilter(aom_codec_alg_priv_t *ctx, va_list args) { struct av1_extracfg extra_cfg = ctx->extra_cfg; extra_cfg.loop_filter_across_tiles_enabled = CAST(AV1E_SET_TILE_LOOPFILTER, args); return update_extra_cfg(ctx, &extra_cfg); } #endif // CONFIG_LOOPFILTERING_ACROSS_TILES static aom_codec_err_t ctrl_set_arnr_max_frames(aom_codec_alg_priv_t *ctx, va_list args) { struct av1_extracfg extra_cfg = ctx->extra_cfg; extra_cfg.arnr_max_frames = CAST(AOME_SET_ARNR_MAXFRAMES, args); return update_extra_cfg(ctx, &extra_cfg); } static aom_codec_err_t ctrl_set_arnr_strength(aom_codec_alg_priv_t *ctx, va_list args) { struct av1_extracfg extra_cfg = ctx->extra_cfg; extra_cfg.arnr_strength = CAST(AOME_SET_ARNR_STRENGTH, args); return update_extra_cfg(ctx, &extra_cfg); } static aom_codec_err_t ctrl_set_tuning(aom_codec_alg_priv_t *ctx, va_list args) { struct av1_extracfg extra_cfg = ctx->extra_cfg; extra_cfg.tuning = CAST(AOME_SET_TUNING, args); return update_extra_cfg(ctx, &extra_cfg); } static aom_codec_err_t ctrl_set_cq_level(aom_codec_alg_priv_t *ctx, va_list args) { struct av1_extracfg extra_cfg = ctx->extra_cfg; extra_cfg.cq_level = CAST(AOME_SET_CQ_LEVEL, args); return update_extra_cfg(ctx, &extra_cfg); } static aom_codec_err_t ctrl_set_rc_max_intra_bitrate_pct( aom_codec_alg_priv_t *ctx, va_list args) { struct av1_extracfg extra_cfg = ctx->extra_cfg; extra_cfg.rc_max_intra_bitrate_pct = CAST(AOME_SET_MAX_INTRA_BITRATE_PCT, args); return update_extra_cfg(ctx, &extra_cfg); } static aom_codec_err_t ctrl_set_rc_max_inter_bitrate_pct( aom_codec_alg_priv_t *ctx, va_list args) { struct av1_extracfg extra_cfg = ctx->extra_cfg; extra_cfg.rc_max_inter_bitrate_pct = CAST(AOME_SET_MAX_INTER_BITRATE_PCT, args); return update_extra_cfg(ctx, &extra_cfg); } static aom_codec_err_t ctrl_set_rc_gf_cbr_boost_pct(aom_codec_alg_priv_t *ctx, va_list args) { struct av1_extracfg extra_cfg = ctx->extra_cfg; extra_cfg.gf_cbr_boost_pct = CAST(AV1E_SET_GF_CBR_BOOST_PCT, args); return update_extra_cfg(ctx, &extra_cfg); } static aom_codec_err_t ctrl_set_lossless(aom_codec_alg_priv_t *ctx, va_list args) { struct av1_extracfg extra_cfg = ctx->extra_cfg; extra_cfg.lossless = CAST(AV1E_SET_LOSSLESS, args); return update_extra_cfg(ctx, &extra_cfg); } #if CONFIG_AOM_QM static aom_codec_err_t ctrl_set_enable_qm(aom_codec_alg_priv_t *ctx, va_list args) { struct av1_extracfg extra_cfg = ctx->extra_cfg; extra_cfg.enable_qm = CAST(AV1E_SET_ENABLE_QM, args); return update_extra_cfg(ctx, &extra_cfg); } static aom_codec_err_t ctrl_set_qm_min(aom_codec_alg_priv_t *ctx, va_list args) { struct av1_extracfg extra_cfg = ctx->extra_cfg; extra_cfg.qm_min = CAST(AV1E_SET_QM_MIN, args); return update_extra_cfg(ctx, &extra_cfg); } static aom_codec_err_t ctrl_set_qm_max(aom_codec_alg_priv_t *ctx, va_list args) { struct av1_extracfg extra_cfg = ctx->extra_cfg; extra_cfg.qm_max = CAST(AV1E_SET_QM_MAX, args); return update_extra_cfg(ctx, &extra_cfg); } #endif static aom_codec_err_t ctrl_set_num_tg(aom_codec_alg_priv_t *ctx, va_list args) { struct av1_extracfg extra_cfg = ctx->extra_cfg; extra_cfg.num_tg = CAST(AV1E_SET_NUM_TG, args); return update_extra_cfg(ctx, &extra_cfg); } static aom_codec_err_t ctrl_set_mtu(aom_codec_alg_priv_t *ctx, va_list args) { struct av1_extracfg extra_cfg = ctx->extra_cfg; extra_cfg.mtu_size = CAST(AV1E_SET_MTU, args); return update_extra_cfg(ctx, &extra_cfg); } #if CONFIG_TEMPMV_SIGNALING static aom_codec_err_t ctrl_set_disable_tempmv(aom_codec_alg_priv_t *ctx, va_list args) { struct av1_extracfg extra_cfg = ctx->extra_cfg; extra_cfg.disable_tempmv = CAST(AV1E_SET_DISABLE_TEMPMV, args); return update_extra_cfg(ctx, &extra_cfg); } #endif static aom_codec_err_t ctrl_set_frame_parallel_decoding_mode( aom_codec_alg_priv_t *ctx, va_list args) { struct av1_extracfg extra_cfg = ctx->extra_cfg; extra_cfg.frame_parallel_decoding_mode = CAST(AV1E_SET_FRAME_PARALLEL_DECODING, args); return update_extra_cfg(ctx, &extra_cfg); } #if CONFIG_EXT_TILE static aom_codec_err_t ctrl_set_single_tile_decoding(aom_codec_alg_priv_t *ctx, va_list args) { struct av1_extracfg extra_cfg = ctx->extra_cfg; extra_cfg.single_tile_decoding = CAST(AV1E_SET_SINGLE_TILE_DECODING, args); return update_extra_cfg(ctx, &extra_cfg); } #endif // CONFIG_EXT_TILE static aom_codec_err_t ctrl_set_aq_mode(aom_codec_alg_priv_t *ctx, va_list args) { struct av1_extracfg extra_cfg = ctx->extra_cfg; extra_cfg.aq_mode = CAST(AV1E_SET_AQ_MODE, args); return update_extra_cfg(ctx, &extra_cfg); } #if CONFIG_EXT_DELTA_Q static aom_codec_err_t ctrl_set_deltaq_mode(aom_codec_alg_priv_t *ctx, va_list args) { struct av1_extracfg extra_cfg = ctx->extra_cfg; extra_cfg.deltaq_mode = CAST(AV1E_SET_DELTAQ_MODE, args); return update_extra_cfg(ctx, &extra_cfg); } #endif static aom_codec_err_t ctrl_set_min_gf_interval(aom_codec_alg_priv_t *ctx, va_list args) { struct av1_extracfg extra_cfg = ctx->extra_cfg; extra_cfg.min_gf_interval = CAST(AV1E_SET_MIN_GF_INTERVAL, args); return update_extra_cfg(ctx, &extra_cfg); } static aom_codec_err_t ctrl_set_max_gf_interval(aom_codec_alg_priv_t *ctx, va_list args) { struct av1_extracfg extra_cfg = ctx->extra_cfg; extra_cfg.max_gf_interval = CAST(AV1E_SET_MAX_GF_INTERVAL, args); return update_extra_cfg(ctx, &extra_cfg); } static aom_codec_err_t ctrl_set_frame_periodic_boost(aom_codec_alg_priv_t *ctx, va_list args) { struct av1_extracfg extra_cfg = ctx->extra_cfg; extra_cfg.frame_periodic_boost = CAST(AV1E_SET_FRAME_PERIODIC_BOOST, args); return update_extra_cfg(ctx, &extra_cfg); } static aom_codec_err_t ctrl_enable_motion_vector_unit_test( aom_codec_alg_priv_t *ctx, va_list args) { struct av1_extracfg extra_cfg = ctx->extra_cfg; extra_cfg.motion_vector_unit_test = CAST(AV1E_ENABLE_MOTION_VECTOR_UNIT_TEST, args); return update_extra_cfg(ctx, &extra_cfg); } static aom_codec_err_t encoder_init(aom_codec_ctx_t *ctx, aom_codec_priv_enc_mr_cfg_t *data) { aom_codec_err_t res = AOM_CODEC_OK; (void)data; if (ctx->priv == NULL) { aom_codec_alg_priv_t *const priv = aom_calloc(1, sizeof(*priv)); if (priv == NULL) return AOM_CODEC_MEM_ERROR; ctx->priv = (aom_codec_priv_t *)priv; ctx->priv->init_flags = ctx->init_flags; ctx->priv->enc.total_encoders = 1; priv->buffer_pool = (BufferPool *)aom_calloc(1, sizeof(BufferPool)); if (priv->buffer_pool == NULL) return AOM_CODEC_MEM_ERROR; #if CONFIG_MULTITHREAD if (pthread_mutex_init(&priv->buffer_pool->pool_mutex, NULL)) { return AOM_CODEC_MEM_ERROR; } #endif if (ctx->config.enc) { // Update the reference to the config structure to an internal copy. priv->cfg = *ctx->config.enc; ctx->config.enc = &priv->cfg; } priv->extra_cfg = default_extra_cfg; once(av1_initialize_enc); res = validate_config(priv, &priv->cfg, &priv->extra_cfg); if (res == AOM_CODEC_OK) { set_encoder_config(&priv->oxcf, &priv->cfg, &priv->extra_cfg); #if CONFIG_HIGHBITDEPTH priv->oxcf.use_highbitdepth = (ctx->init_flags & AOM_CODEC_USE_HIGHBITDEPTH) ? 1 : 0; #endif priv->cpi = av1_create_compressor(&priv->oxcf, priv->buffer_pool); if (priv->cpi == NULL) res = AOM_CODEC_MEM_ERROR; else priv->cpi->output_pkt_list = &priv->pkt_list.head; } } return res; } static aom_codec_err_t encoder_destroy(aom_codec_alg_priv_t *ctx) { free(ctx->cx_data); av1_remove_compressor(ctx->cpi); #if CONFIG_MULTITHREAD pthread_mutex_destroy(&ctx->buffer_pool->pool_mutex); #endif aom_free(ctx->buffer_pool); aom_free(ctx); return AOM_CODEC_OK; } static void pick_quickcompress_mode(aom_codec_alg_priv_t *ctx, unsigned long deadline) { MODE new_mode = GOOD; switch (ctx->cfg.g_pass) { case AOM_RC_ONE_PASS: switch (deadline) { default: new_mode = GOOD; break; } break; case AOM_RC_FIRST_PASS: break; case AOM_RC_LAST_PASS: new_mode = GOOD; } if (ctx->oxcf.mode != new_mode) { ctx->oxcf.mode = new_mode; av1_change_config(ctx->cpi, &ctx->oxcf); } } // Turn on to test if supplemental superframe data breaks decoding #define TEST_SUPPLEMENTAL_SUPERFRAME_DATA 0 static int write_superframe_index(aom_codec_alg_priv_t *ctx) { uint8_t marker = 0xc0; size_t max_frame_sz = 0; assert(ctx->pending_frame_count); assert(ctx->pending_frame_count <= 8); // Add the number of frames to the marker byte marker |= ctx->pending_frame_count - 1; for (int i = 0; i < ctx->pending_frame_count - 1; i++) { const size_t frame_sz = ctx->pending_frame_sizes[i] - 1; max_frame_sz = AOMMAX(frame_sz, max_frame_sz); } // Choose the magnitude int mag; unsigned int mask; for (mag = 0, mask = 0xff; mag < 4; mag++) { if (max_frame_sz <= mask) break; mask <<= 8; mask |= 0xff; } marker |= mag << 3; // Write the index uint8_t buffer[256]; uint8_t *x = buffer; if (TEST_SUPPLEMENTAL_SUPERFRAME_DATA) { uint8_t marker_test = 0xc0; int mag_test = 2; // 1 - 4 int frames_test = 4; // 1 - 8 marker_test |= frames_test - 1; marker_test |= (mag_test - 1) << 3; *x++ = marker_test; for (int i = 0; i < mag_test * frames_test; ++i) *x++ = 0; // fill up with arbitrary data *x++ = marker_test; printf("Added supplemental superframe data\n"); } *x++ = marker; for (int i = 0; i < ctx->pending_frame_count - 1; i++) { assert(ctx->pending_frame_sizes[i] > 0); unsigned int this_sz = (unsigned int)ctx->pending_frame_sizes[i] - 1; for (int j = 0; j <= mag; j++) { *x++ = this_sz & 0xff; this_sz >>= 8; } } *x++ = marker; const size_t index_sz = x - buffer; assert(ctx->pending_cx_data_sz + index_sz < ctx->cx_data_sz); // move the frame to make room for the index memmove(ctx->pending_cx_data + index_sz, ctx->pending_cx_data, ctx->pending_cx_data_sz); memcpy(ctx->pending_cx_data, buffer, index_sz); ctx->pending_cx_data_sz += index_sz; return (int)index_sz; } // av1 uses 10,000,000 ticks/second as time stamp #define TICKS_PER_SEC 10000000LL static int64_t timebase_units_to_ticks(const aom_rational_t *timebase, int64_t n) { return n * TICKS_PER_SEC * timebase->num / timebase->den; } static int64_t ticks_to_timebase_units(const aom_rational_t *timebase, int64_t n) { const int64_t round = TICKS_PER_SEC * timebase->num / 2 - 1; return (n * timebase->den + round) / timebase->num / TICKS_PER_SEC; } static aom_codec_frame_flags_t get_frame_pkt_flags(const AV1_COMP *cpi, unsigned int lib_flags) { aom_codec_frame_flags_t flags = lib_flags << 16; if (lib_flags & FRAMEFLAGS_KEY) flags |= AOM_FRAME_IS_KEY; if (cpi->droppable) flags |= AOM_FRAME_IS_DROPPABLE; return flags; } static aom_codec_err_t encoder_encode(aom_codec_alg_priv_t *ctx, const aom_image_t *img, aom_codec_pts_t pts, unsigned long duration, aom_enc_frame_flags_t enc_flags, unsigned long deadline) { const size_t kMinCompressedSize = 8192; volatile aom_codec_err_t res = AOM_CODEC_OK; AV1_COMP *const cpi = ctx->cpi; const aom_rational_t *const timebase = &ctx->cfg.g_timebase; if (cpi == NULL) return AOM_CODEC_INVALID_PARAM; if (img != NULL) { res = validate_img(ctx, img); // TODO(jzern) the checks related to cpi's validity should be treated as a // failure condition, encoder setup is done fully in init() currently. if (res == AOM_CODEC_OK) { #if CONFIG_EXT_REFS size_t data_sz = ALIGN_POWER_OF_TWO(ctx->cfg.g_w, 5) * ALIGN_POWER_OF_TWO(ctx->cfg.g_h, 5) * get_image_bps(img); #else // There's no codec control for multiple alt-refs so check the encoder // instance for its status to determine the compressed data size. size_t data_sz = ALIGN_POWER_OF_TWO(ctx->cfg.g_w, 5) * ALIGN_POWER_OF_TWO(ctx->cfg.g_h, 5) * get_image_bps(img) / 8 * (cpi->multi_arf_allowed ? 8 : 2); #endif // CONFIG_EXT_REFS if (data_sz < kMinCompressedSize) data_sz = kMinCompressedSize; if (ctx->cx_data == NULL || ctx->cx_data_sz < data_sz) { ctx->cx_data_sz = data_sz; free(ctx->cx_data); ctx->cx_data = (unsigned char *)malloc(ctx->cx_data_sz); if (ctx->cx_data == NULL) { return AOM_CODEC_MEM_ERROR; } } } } pick_quickcompress_mode(ctx, deadline); aom_codec_pkt_list_init(&ctx->pkt_list); volatile aom_enc_frame_flags_t flags = enc_flags; // Handle Flags if (((flags & AOM_EFLAG_NO_UPD_GF) && (flags & AOM_EFLAG_FORCE_GF)) || ((flags & AOM_EFLAG_NO_UPD_ARF) && (flags & AOM_EFLAG_FORCE_ARF))) { ctx->base.err_detail = "Conflicting flags."; return AOM_CODEC_INVALID_PARAM; } if (setjmp(cpi->common.error.jmp)) { cpi->common.error.setjmp = 0; res = update_error_state(ctx, &cpi->common.error); aom_clear_system_state(); return res; } cpi->common.error.setjmp = 1; av1_apply_encoding_flags(cpi, flags); // Handle fixed keyframe intervals if (ctx->cfg.kf_mode == AOM_KF_AUTO && ctx->cfg.kf_min_dist == ctx->cfg.kf_max_dist) { if (++ctx->fixed_kf_cntr > ctx->cfg.kf_min_dist) { flags |= AOM_EFLAG_FORCE_KF; ctx->fixed_kf_cntr = 1; } } if (res == AOM_CODEC_OK) { int64_t dst_time_stamp = timebase_units_to_ticks(timebase, pts); int64_t dst_end_time_stamp = timebase_units_to_ticks(timebase, pts + duration); // Set up internal flags if (ctx->base.init_flags & AOM_CODEC_USE_PSNR) cpi->b_calculate_psnr = 1; if (img != NULL) { YV12_BUFFER_CONFIG sd; res = image2yuvconfig(img, &sd); // Store the original flags in to the frame buffer. Will extract the // key frame flag when we actually encode this frame. if (av1_receive_raw_frame(cpi, flags | ctx->next_frame_flags, &sd, dst_time_stamp, dst_end_time_stamp)) { res = update_error_state(ctx, &cpi->common.error); } ctx->next_frame_flags = 0; } unsigned char *cx_data = ctx->cx_data; size_t cx_data_sz = ctx->cx_data_sz; /* Any pending invisible frames? */ if (ctx->pending_cx_data) { memmove(cx_data, ctx->pending_cx_data, ctx->pending_cx_data_sz); ctx->pending_cx_data = cx_data; cx_data += ctx->pending_cx_data_sz; cx_data_sz -= ctx->pending_cx_data_sz; /* TODO: this is a minimal check, the underlying codec doesn't respect * the buffer size anyway. */ if (cx_data_sz < ctx->cx_data_sz / 2) { aom_internal_error(&cpi->common.error, AOM_CODEC_ERROR, "Compressed data buffer too small"); return AOM_CODEC_ERROR; } } size_t frame_size; unsigned int lib_flags = 0; while (cx_data_sz >= ctx->cx_data_sz / 2 && -1 != av1_get_compressed_data(cpi, &lib_flags, &frame_size, cx_data, &dst_time_stamp, &dst_end_time_stamp, !img)) { #if CONFIG_REFERENCE_BUFFER if (cpi->common.invalid_delta_frame_id_minus1) { ctx->base.err_detail = "Invalid delta_frame_id_minus1"; return AOM_CODEC_ERROR; } #endif if (!frame_size) continue; if (ctx->pending_cx_data == 0) ctx->pending_cx_data = cx_data; ctx->pending_frame_sizes[ctx->pending_frame_count++] = frame_size; ctx->pending_cx_data_sz += frame_size; cx_data += frame_size; cx_data_sz -= frame_size; // invisible frames get packed with the next visible frame if (!cpi->common.show_frame) continue; // insert superframe index if needed if (ctx->pending_frame_count > 1) { const size_t index_size = write_superframe_index(ctx); cx_data += index_size; cx_data_sz -= index_size; } // Add the frame packet to the list of returned packets. aom_codec_cx_pkt_t pkt; pkt.kind = AOM_CODEC_CX_FRAME_PKT; pkt.data.frame.buf = ctx->pending_cx_data; pkt.data.frame.sz = ctx->pending_cx_data_sz; pkt.data.frame.partition_id = -1; pkt.data.frame.pts = ticks_to_timebase_units(timebase, dst_time_stamp); pkt.data.frame.flags = get_frame_pkt_flags(cpi, lib_flags); pkt.data.frame.duration = (uint32_t)ticks_to_timebase_units( timebase, dst_end_time_stamp - dst_time_stamp); aom_codec_pkt_list_add(&ctx->pkt_list.head, &pkt); ctx->pending_cx_data = NULL; ctx->pending_cx_data_sz = 0; ctx->pending_frame_count = 0; } } cpi->common.error.setjmp = 0; return res; } static const aom_codec_cx_pkt_t *encoder_get_cxdata(aom_codec_alg_priv_t *ctx, aom_codec_iter_t *iter) { return aom_codec_pkt_list_get(&ctx->pkt_list.head, iter); } static aom_codec_err_t ctrl_set_reference(aom_codec_alg_priv_t *ctx, va_list args) { aom_ref_frame_t *const frame = va_arg(args, aom_ref_frame_t *); if (frame != NULL) { YV12_BUFFER_CONFIG sd; image2yuvconfig(&frame->img, &sd); av1_set_reference_enc(ctx->cpi, ref_frame_to_av1_reframe(frame->frame_type), &sd); return AOM_CODEC_OK; } else { return AOM_CODEC_INVALID_PARAM; } } static aom_codec_err_t ctrl_copy_reference(aom_codec_alg_priv_t *ctx, va_list args) { aom_ref_frame_t *const frame = va_arg(args, aom_ref_frame_t *); if (frame != NULL) { YV12_BUFFER_CONFIG sd; image2yuvconfig(&frame->img, &sd); av1_copy_reference_enc(ctx->cpi, ref_frame_to_av1_reframe(frame->frame_type), &sd); return AOM_CODEC_OK; } else { return AOM_CODEC_INVALID_PARAM; } } static aom_codec_err_t ctrl_get_reference(aom_codec_alg_priv_t *ctx, va_list args) { av1_ref_frame_t *const frame = va_arg(args, av1_ref_frame_t *); if (frame != NULL) { YV12_BUFFER_CONFIG *fb = get_ref_frame(&ctx->cpi->common, frame->idx); if (fb == NULL) return AOM_CODEC_ERROR; yuvconfig2image(&frame->img, fb, NULL); return AOM_CODEC_OK; } else { return AOM_CODEC_INVALID_PARAM; } } static aom_codec_err_t ctrl_get_new_frame_image(aom_codec_alg_priv_t *ctx, va_list args) { aom_image_t *const new_img = va_arg(args, aom_image_t *); if (new_img != NULL) { YV12_BUFFER_CONFIG new_frame; if (av1_get_last_show_frame(ctx->cpi, &new_frame) == 0) { yuvconfig2image(new_img, &new_frame, NULL); return AOM_CODEC_OK; } else { return AOM_CODEC_ERROR; } } else { return AOM_CODEC_INVALID_PARAM; } } static aom_codec_err_t ctrl_set_previewpp(aom_codec_alg_priv_t *ctx, va_list args) { (void)ctx; (void)args; return AOM_CODEC_INCAPABLE; } static aom_image_t *encoder_get_preview(aom_codec_alg_priv_t *ctx) { YV12_BUFFER_CONFIG sd; if (av1_get_preview_raw_frame(ctx->cpi, &sd) == 0) { yuvconfig2image(&ctx->preview_img, &sd, NULL); return &ctx->preview_img; } else { return NULL; } } static aom_codec_err_t ctrl_use_reference(aom_codec_alg_priv_t *ctx, va_list args) { const int reference_flag = va_arg(args, int); av1_use_as_reference(ctx->cpi, reference_flag); return AOM_CODEC_OK; } static aom_codec_err_t ctrl_set_roi_map(aom_codec_alg_priv_t *ctx, va_list args) { (void)ctx; (void)args; // TODO(yaowu): Need to re-implement and test for AV1. return AOM_CODEC_INVALID_PARAM; } static aom_codec_err_t ctrl_set_active_map(aom_codec_alg_priv_t *ctx, va_list args) { aom_active_map_t *const map = va_arg(args, aom_active_map_t *); if (map) { if (!av1_set_active_map(ctx->cpi, map->active_map, (int)map->rows, (int)map->cols)) return AOM_CODEC_OK; else return AOM_CODEC_INVALID_PARAM; } else { return AOM_CODEC_INVALID_PARAM; } } static aom_codec_err_t ctrl_get_active_map(aom_codec_alg_priv_t *ctx, va_list args) { aom_active_map_t *const map = va_arg(args, aom_active_map_t *); if (map) { if (!av1_get_active_map(ctx->cpi, map->active_map, (int)map->rows, (int)map->cols)) return AOM_CODEC_OK; else return AOM_CODEC_INVALID_PARAM; } else { return AOM_CODEC_INVALID_PARAM; } } static aom_codec_err_t ctrl_set_scale_mode(aom_codec_alg_priv_t *ctx, va_list args) { aom_scaling_mode_t *const mode = va_arg(args, aom_scaling_mode_t *); if (mode) { const int res = av1_set_internal_size(ctx->cpi, (AOM_SCALING)mode->h_scaling_mode, (AOM_SCALING)mode->v_scaling_mode); return (res == 0) ? AOM_CODEC_OK : AOM_CODEC_INVALID_PARAM; } else { return AOM_CODEC_INVALID_PARAM; } } static aom_codec_err_t ctrl_set_tune_content(aom_codec_alg_priv_t *ctx, va_list args) { struct av1_extracfg extra_cfg = ctx->extra_cfg; extra_cfg.content = CAST(AV1E_SET_TUNE_CONTENT, args); return update_extra_cfg(ctx, &extra_cfg); } static aom_codec_err_t ctrl_set_color_space(aom_codec_alg_priv_t *ctx, va_list args) { struct av1_extracfg extra_cfg = ctx->extra_cfg; extra_cfg.color_space = CAST(AV1E_SET_COLOR_SPACE, args); return update_extra_cfg(ctx, &extra_cfg); } #if CONFIG_COLORSPACE_HEADERS static aom_codec_err_t ctrl_set_transfer_function(aom_codec_alg_priv_t *ctx, va_list args) { struct av1_extracfg extra_cfg = ctx->extra_cfg; extra_cfg.transfer_function = CAST(AV1E_SET_TRANSFER_FUNCTION, args); return update_extra_cfg(ctx, &extra_cfg); } static aom_codec_err_t ctrl_set_chroma_sample_position( aom_codec_alg_priv_t *ctx, va_list args) { struct av1_extracfg extra_cfg = ctx->extra_cfg; extra_cfg.chroma_sample_position = CAST(AV1E_SET_CHROMA_SAMPLE_POSITION, args); return update_extra_cfg(ctx, &extra_cfg); } #endif static aom_codec_err_t ctrl_set_color_range(aom_codec_alg_priv_t *ctx, va_list args) { struct av1_extracfg extra_cfg = ctx->extra_cfg; extra_cfg.color_range = CAST(AV1E_SET_COLOR_RANGE, args); return update_extra_cfg(ctx, &extra_cfg); } static aom_codec_err_t ctrl_set_render_size(aom_codec_alg_priv_t *ctx, va_list args) { struct av1_extracfg extra_cfg = ctx->extra_cfg; int *const render_size = va_arg(args, int *); extra_cfg.render_width = render_size[0]; extra_cfg.render_height = render_size[1]; return update_extra_cfg(ctx, &extra_cfg); } static aom_codec_err_t ctrl_set_superblock_size(aom_codec_alg_priv_t *ctx, va_list args) { struct av1_extracfg extra_cfg = ctx->extra_cfg; extra_cfg.superblock_size = CAST(AV1E_SET_SUPERBLOCK_SIZE, args); return update_extra_cfg(ctx, &extra_cfg); } #if CONFIG_ANS && ANS_MAX_SYMBOLS static aom_codec_err_t ctrl_set_ans_window_size_log2(aom_codec_alg_priv_t *ctx, va_list args) { struct av1_extracfg extra_cfg = ctx->extra_cfg; extra_cfg.ans_window_size_log2 = CAST(AV1E_SET_ANS_WINDOW_SIZE_LOG2, args); return update_extra_cfg(ctx, &extra_cfg); } #endif static aom_codec_ctrl_fn_map_t encoder_ctrl_maps[] = { { AOM_COPY_REFERENCE, ctrl_copy_reference }, { AOME_USE_REFERENCE, ctrl_use_reference }, // Setters { AOM_SET_REFERENCE, ctrl_set_reference }, { AOM_SET_POSTPROC, ctrl_set_previewpp }, { AOME_SET_ROI_MAP, ctrl_set_roi_map }, { AOME_SET_ACTIVEMAP, ctrl_set_active_map }, { AOME_SET_SCALEMODE, ctrl_set_scale_mode }, { AOME_SET_CPUUSED, ctrl_set_cpuused }, { AOME_SET_ENABLEAUTOALTREF, ctrl_set_enable_auto_alt_ref }, #if CONFIG_EXT_REFS { AOME_SET_ENABLEAUTOBWDREF, ctrl_set_enable_auto_bwd_ref }, #endif // CONFIG_EXT_REFS { AOME_SET_SHARPNESS, ctrl_set_sharpness }, { AOME_SET_STATIC_THRESHOLD, ctrl_set_static_thresh }, { AV1E_SET_TILE_COLUMNS, ctrl_set_tile_columns }, { AV1E_SET_TILE_ROWS, ctrl_set_tile_rows }, #if CONFIG_DEPENDENT_HORZTILES { AV1E_SET_TILE_DEPENDENT_ROWS, ctrl_set_tile_dependent_rows }, #endif #if CONFIG_LOOPFILTERING_ACROSS_TILES { AV1E_SET_TILE_LOOPFILTER, ctrl_set_tile_loopfilter }, #endif // CONFIG_LOOPFILTERING_ACROSS_TILES { AOME_SET_ARNR_MAXFRAMES, ctrl_set_arnr_max_frames }, { AOME_SET_ARNR_STRENGTH, ctrl_set_arnr_strength }, { AOME_SET_TUNING, ctrl_set_tuning }, { AOME_SET_CQ_LEVEL, ctrl_set_cq_level }, { AOME_SET_MAX_INTRA_BITRATE_PCT, ctrl_set_rc_max_intra_bitrate_pct }, { AV1E_SET_MAX_INTER_BITRATE_PCT, ctrl_set_rc_max_inter_bitrate_pct }, { AV1E_SET_GF_CBR_BOOST_PCT, ctrl_set_rc_gf_cbr_boost_pct }, { AV1E_SET_LOSSLESS, ctrl_set_lossless }, #if CONFIG_AOM_QM { AV1E_SET_ENABLE_QM, ctrl_set_enable_qm }, { AV1E_SET_QM_MIN, ctrl_set_qm_min }, { AV1E_SET_QM_MAX, ctrl_set_qm_max }, #endif { AV1E_SET_NUM_TG, ctrl_set_num_tg }, { AV1E_SET_MTU, ctrl_set_mtu }, #if CONFIG_TEMPMV_SIGNALING { AV1E_SET_DISABLE_TEMPMV, ctrl_set_disable_tempmv }, #endif { AV1E_SET_FRAME_PARALLEL_DECODING, ctrl_set_frame_parallel_decoding_mode }, { AV1E_SET_AQ_MODE, ctrl_set_aq_mode }, #if CONFIG_EXT_DELTA_Q { AV1E_SET_DELTAQ_MODE, ctrl_set_deltaq_mode }, #endif { AV1E_SET_FRAME_PERIODIC_BOOST, ctrl_set_frame_periodic_boost }, { AV1E_SET_TUNE_CONTENT, ctrl_set_tune_content }, { AV1E_SET_COLOR_SPACE, ctrl_set_color_space }, #if CONFIG_COLORSPACE_HEADERS { AV1E_SET_TRANSFER_FUNCTION, ctrl_set_transfer_function }, { AV1E_SET_CHROMA_SAMPLE_POSITION, ctrl_set_chroma_sample_position }, #endif { AV1E_SET_COLOR_RANGE, ctrl_set_color_range }, { AV1E_SET_NOISE_SENSITIVITY, ctrl_set_noise_sensitivity }, { AV1E_SET_MIN_GF_INTERVAL, ctrl_set_min_gf_interval }, { AV1E_SET_MAX_GF_INTERVAL, ctrl_set_max_gf_interval }, { AV1E_SET_RENDER_SIZE, ctrl_set_render_size }, { AV1E_SET_SUPERBLOCK_SIZE, ctrl_set_superblock_size }, #if CONFIG_ANS && ANS_MAX_SYMBOLS { AV1E_SET_ANS_WINDOW_SIZE_LOG2, ctrl_set_ans_window_size_log2 }, #endif #if CONFIG_EXT_TILE { AV1E_SET_SINGLE_TILE_DECODING, ctrl_set_single_tile_decoding }, #endif // CONFIG_EXT_TILE { AV1E_ENABLE_MOTION_VECTOR_UNIT_TEST, ctrl_enable_motion_vector_unit_test }, // Getters { AOME_GET_LAST_QUANTIZER, ctrl_get_quantizer }, { AOME_GET_LAST_QUANTIZER_64, ctrl_get_quantizer64 }, { AV1_GET_REFERENCE, ctrl_get_reference }, { AV1E_GET_ACTIVEMAP, ctrl_get_active_map }, { AV1_GET_NEW_FRAME_IMAGE, ctrl_get_new_frame_image }, { -1, NULL }, }; static aom_codec_enc_cfg_map_t encoder_usage_cfg_map[] = { { 0, { // NOLINT 0, // g_usage 8, // g_threads 0, // g_profile 320, // g_width 240, // g_height AOM_BITS_8, // g_bit_depth 8, // g_input_bit_depth { 1, 30 }, // g_timebase 0, // g_error_resilient AOM_RC_ONE_PASS, // g_pass 25, // g_lag_in_frames 0, // rc_dropframe_thresh RESIZE_NONE, // rc_resize_mode SCALE_DENOMINATOR, // rc_resize_numerator SCALE_DENOMINATOR, // rc_resize_kf_numerator 0, // rc_superres_mode SCALE_DENOMINATOR, // rc_superres_numerator SCALE_DENOMINATOR, // rc_superres_kf_numerator AOM_VBR, // rc_end_usage { NULL, 0 }, // rc_twopass_stats_in { NULL, 0 }, // rc_firstpass_mb_stats_in 256, // rc_target_bandwidth 0, // rc_min_quantizer 63, // rc_max_quantizer 25, // rc_undershoot_pct 25, // rc_overshoot_pct 6000, // rc_max_buffer_size 4000, // rc_buffer_initial_size 5000, // rc_buffer_optimal_size 50, // rc_two_pass_vbrbias 0, // rc_two_pass_vbrmin_section 2000, // rc_two_pass_vbrmax_section // keyframing settings (kf) AOM_KF_AUTO, // g_kfmode 0, // kf_min_dist 9999, // kf_max_dist 0, // large_scale_tile } }, }; #ifndef VERSION_STRING #define VERSION_STRING #endif CODEC_INTERFACE(aom_codec_av1_cx) = { "AOMedia Project AV1 Encoder" VERSION_STRING, AOM_CODEC_INTERNAL_ABI_VERSION, #if CONFIG_HIGHBITDEPTH AOM_CODEC_CAP_HIGHBITDEPTH | #endif AOM_CODEC_CAP_ENCODER | AOM_CODEC_CAP_PSNR, // aom_codec_caps_t encoder_init, // aom_codec_init_fn_t encoder_destroy, // aom_codec_destroy_fn_t encoder_ctrl_maps, // aom_codec_ctrl_fn_map_t { // NOLINT NULL, // aom_codec_peek_si_fn_t NULL, // aom_codec_get_si_fn_t NULL, // aom_codec_decode_fn_t NULL, // aom_codec_frame_get_fn_t NULL // aom_codec_set_fb_fn_t }, { // NOLINT 1, // 1 cfg map encoder_usage_cfg_map, // aom_codec_enc_cfg_map_t encoder_encode, // aom_codec_encode_fn_t encoder_get_cxdata, // aom_codec_get_cx_data_fn_t encoder_set_config, // aom_codec_enc_config_set_fn_t NULL, // aom_codec_get_global_headers_fn_t encoder_get_preview, // aom_codec_get_preview_frame_fn_t NULL // aom_codec_enc_mr_get_mem_loc_fn_t } };