encoder.c (225737B)
1 /* 2 * Copyright (c) 2016, Alliance for Open Media. All rights reserved. 3 * 4 * This source code is subject to the terms of the BSD 2 Clause License and 5 * the Alliance for Open Media Patent License 1.0. If the BSD 2 Clause License 6 * was not distributed with this source code in the LICENSE file, you can 7 * obtain it at www.aomedia.org/license/software. If the Alliance for Open 8 * Media Patent License 1.0 was not distributed with this source code in the 9 * PATENTS file, you can obtain it at www.aomedia.org/license/patent. 10 */ 11 12 #include <assert.h> 13 #include <float.h> 14 #include <inttypes.h> 15 #include <limits.h> 16 #include <math.h> 17 #include <stdbool.h> 18 #include <stdint.h> 19 #include <stdio.h> 20 #include <stdlib.h> 21 #include <time.h> 22 23 #include "av1/common/scale.h" 24 #include "config/aom_config.h" 25 #include "config/aom_dsp_rtcd.h" 26 27 #include "aom/aomcx.h" 28 29 #if CONFIG_DENOISE 30 #include "aom_dsp/grain_table.h" 31 #include "aom_dsp/noise_util.h" 32 #include "aom_dsp/noise_model.h" 33 #endif 34 #include "aom_dsp/flow_estimation/corner_detect.h" 35 #include "aom_dsp/psnr.h" 36 #if CONFIG_INTERNAL_STATS 37 #include "aom_dsp/ssim.h" 38 #endif 39 #include "aom_ports/aom_timer.h" 40 #include "aom_ports/mem.h" 41 #include "aom_util/aom_pthread.h" 42 #if CONFIG_BITSTREAM_DEBUG 43 #include "aom_util/debug_util.h" 44 #endif // CONFIG_BITSTREAM_DEBUG 45 46 #include "av1/common/alloccommon.h" 47 #include "av1/common/debugmodes.h" 48 #include "av1/common/filter.h" 49 #include "av1/common/idct.h" 50 #include "av1/common/reconinter.h" 51 #include "av1/common/reconintra.h" 52 #include "av1/common/resize.h" 53 #include "av1/common/tile_common.h" 54 55 #include "av1/encoder/allintra_vis.h" 56 #include "av1/encoder/aq_complexity.h" 57 #include "av1/encoder/aq_cyclicrefresh.h" 58 #include "av1/encoder/aq_variance.h" 59 #include "av1/encoder/bitstream.h" 60 #if CONFIG_INTERNAL_STATS 61 #include "av1/encoder/blockiness.h" 62 #endif 63 #include "av1/encoder/context_tree.h" 64 #include "av1/encoder/dwt.h" 65 #include "av1/encoder/encodeframe.h" 66 #include "av1/encoder/encodemv.h" 67 #include "av1/encoder/encode_strategy.h" 68 #include "av1/encoder/encoder.h" 69 #include "av1/encoder/encoder_alloc.h" 70 #include "av1/encoder/encoder_utils.h" 71 #include "av1/encoder/encodetxb.h" 72 #include "av1/encoder/ethread.h" 73 #include "av1/encoder/firstpass.h" 74 #include "av1/encoder/hash_motion.h" 75 #include "av1/encoder/hybrid_fwd_txfm.h" 76 #include "av1/encoder/intra_mode_search.h" 77 #include "av1/encoder/mv_prec.h" 78 #include "av1/encoder/pass2_strategy.h" 79 #include "av1/encoder/pickcdef.h" 80 #include "av1/encoder/picklpf.h" 81 #include "av1/encoder/pickrst.h" 82 #include "av1/encoder/random.h" 83 #include "av1/encoder/ratectrl.h" 84 #include "av1/encoder/rc_utils.h" 85 #include "av1/encoder/rd.h" 86 #include "av1/encoder/rdopt.h" 87 #if CONFIG_SALIENCY_MAP 88 #include "av1/encoder/saliency_map.h" 89 #endif 90 #include "av1/encoder/segmentation.h" 91 #include "av1/encoder/speed_features.h" 92 #include "av1/encoder/superres_scale.h" 93 #if CONFIG_THREE_PASS 94 #include "av1/encoder/thirdpass.h" 95 #endif 96 #include "av1/encoder/tpl_model.h" 97 #include "av1/encoder/reconinter_enc.h" 98 #include "av1/encoder/var_based_part.h" 99 100 #define DEFAULT_EXPLICIT_ORDER_HINT_BITS 7 101 102 // #define OUTPUT_YUV_REC 103 #ifdef OUTPUT_YUV_REC 104 FILE *yuv_rec_file; 105 #define FILE_NAME_LEN 100 106 #endif 107 108 #ifdef OUTPUT_YUV_DENOISED 109 FILE *yuv_denoised_file = NULL; 110 #endif 111 112 static inline void Scale2Ratio(AOM_SCALING_MODE mode, int *hr, int *hs) { 113 switch (mode) { 114 case AOME_NORMAL: 115 *hr = 1; 116 *hs = 1; 117 break; 118 case AOME_FOURFIVE: 119 *hr = 4; 120 *hs = 5; 121 break; 122 case AOME_THREEFIVE: 123 *hr = 3; 124 *hs = 5; 125 break; 126 case AOME_THREEFOUR: 127 *hr = 3; 128 *hs = 4; 129 break; 130 case AOME_ONEFOUR: 131 *hr = 1; 132 *hs = 4; 133 break; 134 case AOME_ONEEIGHT: 135 *hr = 1; 136 *hs = 8; 137 break; 138 case AOME_ONETWO: 139 *hr = 1; 140 *hs = 2; 141 break; 142 case AOME_TWOTHREE: 143 *hr = 2; 144 *hs = 3; 145 break; 146 case AOME_ONETHREE: 147 *hr = 1; 148 *hs = 3; 149 break; 150 default: 151 *hr = 1; 152 *hs = 1; 153 assert(0); 154 break; 155 } 156 } 157 158 static int check_seg_range(int seg_data[8], int range) { 159 for (int i = 0; i < 8; ++i) { 160 // Note abs() alone can't be used as the behavior of abs(INT_MIN) is 161 // undefined. 162 if (seg_data[i] > range || seg_data[i] < -range) { 163 return 0; 164 } 165 } 166 return 1; 167 } 168 169 int av1_set_roi_map(AV1_COMP *cpi, unsigned char *map, unsigned int rows, 170 unsigned int cols, int delta_q[8], int delta_lf[8], 171 int skip[8], int ref_frame[8]) { 172 AV1_COMMON *cm = &cpi->common; 173 aom_roi_map_t *roi = &cpi->roi; 174 const int range = 63; 175 const int ref_frame_range = REF_FRAMES; 176 const int skip_range = 1; 177 const int frame_rows = cpi->common.mi_params.mi_rows; 178 const int frame_cols = cpi->common.mi_params.mi_cols; 179 180 // Check number of rows and columns match 181 if (frame_rows != (int)rows || frame_cols != (int)cols) { 182 return AOM_CODEC_INVALID_PARAM; 183 } 184 185 if (!check_seg_range(delta_q, range) || !check_seg_range(delta_lf, range) || 186 !check_seg_range(ref_frame, ref_frame_range) || 187 !check_seg_range(skip, skip_range)) 188 return AOM_CODEC_INVALID_PARAM; 189 190 // Also disable segmentation if no deltas are specified. 191 if (!map || 192 (!(delta_q[0] | delta_q[1] | delta_q[2] | delta_q[3] | delta_q[4] | 193 delta_q[5] | delta_q[6] | delta_q[7] | delta_lf[0] | delta_lf[1] | 194 delta_lf[2] | delta_lf[3] | delta_lf[4] | delta_lf[5] | delta_lf[6] | 195 delta_lf[7] | skip[0] | skip[1] | skip[2] | skip[3] | skip[4] | 196 skip[5] | skip[6] | skip[7]) && 197 (ref_frame[0] == -1 && ref_frame[1] == -1 && ref_frame[2] == -1 && 198 ref_frame[3] == -1 && ref_frame[4] == -1 && ref_frame[5] == -1 && 199 ref_frame[6] == -1 && ref_frame[7] == -1))) { 200 av1_disable_segmentation(&cm->seg); 201 cpi->roi.enabled = 0; 202 return AOM_CODEC_OK; 203 } 204 205 if (roi->roi_map) { 206 aom_free(roi->roi_map); 207 roi->roi_map = NULL; 208 } 209 roi->roi_map = aom_malloc(rows * cols); 210 if (!roi->roi_map) return AOM_CODEC_MEM_ERROR; 211 212 // Copy to ROI structure in the compressor. 213 memcpy(roi->roi_map, map, rows * cols); 214 memcpy(&roi->delta_q, delta_q, MAX_SEGMENTS * sizeof(delta_q[0])); 215 memcpy(&roi->delta_lf, delta_lf, MAX_SEGMENTS * sizeof(delta_lf[0])); 216 memcpy(&roi->skip, skip, MAX_SEGMENTS * sizeof(skip[0])); 217 memcpy(&roi->ref_frame, ref_frame, MAX_SEGMENTS * sizeof(ref_frame[0])); 218 roi->enabled = 1; 219 roi->rows = rows; 220 roi->cols = cols; 221 222 return AOM_CODEC_OK; 223 } 224 225 int av1_set_active_map(AV1_COMP *cpi, unsigned char *new_map_16x16, int rows, 226 int cols) { 227 const CommonModeInfoParams *const mi_params = &cpi->common.mi_params; 228 if (rows == mi_params->mb_rows && cols == mi_params->mb_cols) { 229 unsigned char *const active_map_4x4 = cpi->active_map.map; 230 const int mi_rows = mi_params->mi_rows; 231 const int mi_cols = mi_params->mi_cols; 232 cpi->active_map.update = 0; 233 cpi->rc.percent_blocks_inactive = 0; 234 assert(mi_rows % 2 == 0 && mi_rows > 0); 235 assert(mi_cols % 2 == 0 && mi_cols > 0); 236 if (new_map_16x16) { 237 int num_samples = 0; 238 int num_blocks_inactive = 0; 239 for (int r = 0; r < mi_rows; r += 4) { 240 for (int c = 0; c < mi_cols; c += 4) { 241 const uint8_t val = new_map_16x16[(r >> 2) * cols + (c >> 2)] 242 ? AM_SEGMENT_ID_ACTIVE 243 : AM_SEGMENT_ID_INACTIVE; 244 num_samples++; 245 if (val == AM_SEGMENT_ID_INACTIVE) num_blocks_inactive++; 246 const int row_max = AOMMIN(4, mi_rows - r); 247 const int col_max = AOMMIN(4, mi_cols - c); 248 for (int x = 0; x < row_max; ++x) { 249 for (int y = 0; y < col_max; ++y) { 250 active_map_4x4[(r + x) * mi_cols + (c + y)] = val; 251 } 252 } 253 } 254 } 255 cpi->active_map.enabled = 1; 256 cpi->active_map.update = 1; 257 assert(num_samples); 258 cpi->rc.percent_blocks_inactive = 259 (num_blocks_inactive * 100) / num_samples; 260 } 261 return 0; 262 } 263 264 return -1; 265 } 266 267 int av1_get_active_map(AV1_COMP *cpi, unsigned char *new_map_16x16, int rows, 268 int cols) { 269 const CommonModeInfoParams *const mi_params = &cpi->common.mi_params; 270 if (rows == mi_params->mb_rows && cols == mi_params->mb_cols && 271 new_map_16x16) { 272 unsigned char *const seg_map_8x8 = cpi->enc_seg.map; 273 const int mi_rows = mi_params->mi_rows; 274 const int mi_cols = mi_params->mi_cols; 275 const int row_scale = mi_size_high_log2[BLOCK_16X16]; 276 const int col_scale = mi_size_wide_log2[BLOCK_16X16]; 277 assert(mi_rows % 2 == 0); 278 assert(mi_cols % 2 == 0); 279 280 memset(new_map_16x16, !cpi->active_map.enabled, rows * cols); 281 if (cpi->active_map.enabled) { 282 for (int r = 0; r < (mi_rows >> row_scale); ++r) { 283 for (int c = 0; c < (mi_cols >> col_scale); ++c) { 284 // Cyclic refresh segments are considered active despite not having 285 // AM_SEGMENT_ID_ACTIVE 286 uint8_t temp = 0; 287 temp |= seg_map_8x8[(2 * r + 0) * mi_cols + (2 * c + 0)] != 288 AM_SEGMENT_ID_INACTIVE; 289 temp |= seg_map_8x8[(2 * r + 0) * mi_cols + (2 * c + 1)] != 290 AM_SEGMENT_ID_INACTIVE; 291 temp |= seg_map_8x8[(2 * r + 1) * mi_cols + (2 * c + 0)] != 292 AM_SEGMENT_ID_INACTIVE; 293 temp |= seg_map_8x8[(2 * r + 1) * mi_cols + (2 * c + 1)] != 294 AM_SEGMENT_ID_INACTIVE; 295 new_map_16x16[r * cols + c] |= temp; 296 } 297 } 298 } 299 return 0; 300 } 301 302 return -1; 303 } 304 305 void av1_initialize_enc(unsigned int usage, enum aom_rc_mode end_usage) { 306 bool is_allintra = usage == ALLINTRA; 307 308 av1_rtcd(); 309 aom_dsp_rtcd(); 310 aom_scale_rtcd(); 311 av1_init_intra_predictors(); 312 av1_init_me_luts(); 313 if (!is_allintra) av1_init_wedge_masks(); 314 if (!is_allintra || end_usage != AOM_Q) av1_rc_init_minq_luts(); 315 } 316 317 void av1_new_framerate(AV1_COMP *cpi, double framerate) { 318 cpi->framerate = framerate < 0.1 ? 30 : framerate; 319 av1_rc_update_framerate(cpi, cpi->common.width, cpi->common.height); 320 } 321 322 double av1_get_compression_ratio(const AV1_COMMON *const cm, 323 size_t encoded_frame_size) { 324 const int upscaled_width = cm->superres_upscaled_width; 325 const int height = cm->height; 326 const int64_t luma_pic_size = (int64_t)upscaled_width * height; 327 const SequenceHeader *const seq_params = cm->seq_params; 328 const BITSTREAM_PROFILE profile = seq_params->profile; 329 const int pic_size_profile_factor = 330 profile == PROFILE_0 ? 15 : (profile == PROFILE_1 ? 30 : 36); 331 encoded_frame_size = 332 (encoded_frame_size > 129 ? encoded_frame_size - 128 : 1); 333 const int64_t uncompressed_frame_size = 334 (luma_pic_size * pic_size_profile_factor) >> 3; 335 return (double)uncompressed_frame_size / encoded_frame_size; 336 } 337 338 static void auto_tile_size_balancing(AV1_COMMON *const cm, int num_sbs, 339 int num_tiles_lg, int tile_col_row) { 340 CommonTileParams *const tiles = &cm->tiles; 341 int i, start_sb; 342 int size_sb = num_sbs >> num_tiles_lg; 343 int res_sbs = num_sbs - (size_sb << num_tiles_lg); 344 int num_tiles = 1 << num_tiles_lg; 345 int inc_index = num_tiles - res_sbs; 346 347 tiles->uniform_spacing = 0; 348 349 const int max_size_sb = 350 tile_col_row ? tiles->max_width_sb : tiles->max_height_sb; 351 for (i = 0, start_sb = 0; start_sb < num_sbs && i < MAX_TILE_COLS; ++i) { 352 if (i == inc_index) ++size_sb; 353 if (tile_col_row) 354 tiles->col_start_sb[i] = start_sb; 355 else 356 tiles->row_start_sb[i] = start_sb; 357 358 start_sb += AOMMIN(size_sb, max_size_sb); 359 } 360 361 if (tile_col_row) { 362 tiles->cols = i; 363 tiles->col_start_sb[i] = num_sbs; 364 } else { 365 tiles->rows = i; 366 tiles->row_start_sb[i] = num_sbs; 367 } 368 } 369 370 static void set_tile_info(AV1_COMMON *const cm, 371 const TileConfig *const tile_cfg) { 372 const CommonModeInfoParams *const mi_params = &cm->mi_params; 373 const SequenceHeader *const seq_params = cm->seq_params; 374 CommonTileParams *const tiles = &cm->tiles; 375 int i, start_sb; 376 377 av1_get_tile_limits(cm); 378 379 int sb_cols = 380 CEIL_POWER_OF_TWO(mi_params->mi_cols, seq_params->mib_size_log2); 381 // configure tile columns 382 if (tile_cfg->tile_width_count == 0 || tile_cfg->tile_height_count == 0) { 383 tiles->uniform_spacing = 1; 384 tiles->log2_cols = AOMMAX(tile_cfg->tile_columns, tiles->min_log2_cols); 385 // Add a special case to handle super resolution 386 sb_cols = coded_to_superres_mi(sb_cols, cm->superres_scale_denominator); 387 int min_log2_cols = 0; 388 for (; (tiles->max_width_sb << min_log2_cols) <= sb_cols; ++min_log2_cols) { 389 } 390 tiles->log2_cols = AOMMAX(tiles->log2_cols, min_log2_cols); 391 392 tiles->log2_cols = AOMMIN(tiles->log2_cols, tiles->max_log2_cols); 393 } else if (tile_cfg->tile_widths[0] < 0) { 394 auto_tile_size_balancing(cm, sb_cols, tile_cfg->tile_columns, 1); 395 } else { 396 int size_sb, j = 0; 397 tiles->uniform_spacing = 0; 398 for (i = 0, start_sb = 0; start_sb < sb_cols && i < MAX_TILE_COLS; i++) { 399 tiles->col_start_sb[i] = start_sb; 400 size_sb = tile_cfg->tile_widths[j++]; 401 if (j >= tile_cfg->tile_width_count) j = 0; 402 start_sb += AOMMIN(size_sb, tiles->max_width_sb); 403 } 404 tiles->cols = i; 405 tiles->col_start_sb[i] = sb_cols; 406 } 407 av1_calculate_tile_cols(seq_params, mi_params->mi_rows, mi_params->mi_cols, 408 tiles); 409 410 // configure tile rows 411 int sb_rows = 412 CEIL_POWER_OF_TWO(mi_params->mi_rows, seq_params->mib_size_log2); 413 if (tiles->uniform_spacing) { 414 tiles->log2_rows = AOMMAX(tile_cfg->tile_rows, tiles->min_log2_rows); 415 tiles->log2_rows = AOMMIN(tiles->log2_rows, tiles->max_log2_rows); 416 } else if (tile_cfg->tile_heights[0] < 0) { 417 auto_tile_size_balancing(cm, sb_rows, tile_cfg->tile_rows, 0); 418 } else { 419 int size_sb, j = 0; 420 for (i = 0, start_sb = 0; start_sb < sb_rows && i < MAX_TILE_ROWS; i++) { 421 tiles->row_start_sb[i] = start_sb; 422 size_sb = tile_cfg->tile_heights[j++]; 423 if (j >= tile_cfg->tile_height_count) j = 0; 424 start_sb += AOMMIN(size_sb, tiles->max_height_sb); 425 } 426 tiles->rows = i; 427 tiles->row_start_sb[i] = sb_rows; 428 } 429 av1_calculate_tile_rows(seq_params, mi_params->mi_rows, tiles); 430 } 431 432 void av1_update_frame_size(AV1_COMP *cpi) { 433 AV1_COMMON *const cm = &cpi->common; 434 MACROBLOCKD *const xd = &cpi->td.mb.e_mbd; 435 436 // Setup mi_params here in case we need more mi's. 437 CommonModeInfoParams *const mi_params = &cm->mi_params; 438 mi_params->set_mb_mi(mi_params, cm->width, cm->height, 439 cpi->sf.part_sf.default_min_partition_size); 440 441 av1_init_macroblockd(cm, xd); 442 443 if (!cpi->ppi->seq_params_locked) 444 set_sb_size(cm->seq_params, 445 av1_select_sb_size(&cpi->oxcf, cm->width, cm->height, 446 cpi->ppi->number_spatial_layers)); 447 448 set_tile_info(cm, &cpi->oxcf.tile_cfg); 449 } 450 451 static inline int does_level_match(int width, int height, double fps, 452 int lvl_width, int lvl_height, 453 double lvl_fps, int lvl_dim_mult) { 454 const int64_t lvl_luma_pels = (int64_t)lvl_width * lvl_height; 455 const double lvl_display_sample_rate = lvl_luma_pels * lvl_fps; 456 const int64_t luma_pels = (int64_t)width * height; 457 const double display_sample_rate = luma_pels * fps; 458 return luma_pels <= lvl_luma_pels && 459 display_sample_rate <= lvl_display_sample_rate && 460 width <= lvl_width * lvl_dim_mult && 461 height <= lvl_height * lvl_dim_mult; 462 } 463 464 static void set_bitstream_level_tier(AV1_PRIMARY *const ppi, int width, 465 int height, double init_framerate) { 466 SequenceHeader *const seq_params = &ppi->seq_params; 467 const AV1LevelParams *const level_params = &ppi->level_params; 468 // TODO(any): This is a placeholder function that only addresses dimensions 469 // and max display sample rates. 470 // Need to add checks for max bit rate, max decoded luma sample rate, header 471 // rate, etc. that are not covered by this function. 472 AV1_LEVEL level = SEQ_LEVEL_MAX; 473 if (does_level_match(width, height, init_framerate, 512, 288, 30.0, 4)) { 474 level = SEQ_LEVEL_2_0; 475 } else if (does_level_match(width, height, init_framerate, 704, 396, 30.0, 476 4)) { 477 level = SEQ_LEVEL_2_1; 478 } else if (does_level_match(width, height, init_framerate, 1088, 612, 30.0, 479 4)) { 480 level = SEQ_LEVEL_3_0; 481 } else if (does_level_match(width, height, init_framerate, 1376, 774, 30.0, 482 4)) { 483 level = SEQ_LEVEL_3_1; 484 } else if (does_level_match(width, height, init_framerate, 2048, 1152, 30.0, 485 3)) { 486 level = SEQ_LEVEL_4_0; 487 } else if (does_level_match(width, height, init_framerate, 2048, 1152, 60.0, 488 3)) { 489 level = SEQ_LEVEL_4_1; 490 } else if (does_level_match(width, height, init_framerate, 4096, 2176, 30.0, 491 2)) { 492 level = SEQ_LEVEL_5_0; 493 } else if (does_level_match(width, height, init_framerate, 4096, 2176, 60.0, 494 2)) { 495 level = SEQ_LEVEL_5_1; 496 } else if (does_level_match(width, height, init_framerate, 4096, 2176, 120.0, 497 2)) { 498 level = SEQ_LEVEL_5_2; 499 } else if (does_level_match(width, height, init_framerate, 8192, 4352, 30.0, 500 2)) { 501 level = SEQ_LEVEL_6_0; 502 } else if (does_level_match(width, height, init_framerate, 8192, 4352, 60.0, 503 2)) { 504 level = SEQ_LEVEL_6_1; 505 } else if (does_level_match(width, height, init_framerate, 8192, 4352, 120.0, 506 2)) { 507 level = SEQ_LEVEL_6_2; 508 } 509 #if CONFIG_CWG_C013 510 // TODO(bohanli): currently target level is only working for the 0th operating 511 // point, so scalable coding is not supported. 512 else if (level_params->target_seq_level_idx[0] >= SEQ_LEVEL_7_0 && 513 level_params->target_seq_level_idx[0] <= SEQ_LEVEL_8_3) { 514 // Only use level 7.x to 8.x when explicitly asked to. 515 if (does_level_match(width, height, init_framerate, 16384, 8704, 30.0, 2)) { 516 level = SEQ_LEVEL_7_0; 517 } else if (does_level_match(width, height, init_framerate, 16384, 8704, 518 60.0, 2)) { 519 level = SEQ_LEVEL_7_1; 520 } else if (does_level_match(width, height, init_framerate, 16384, 8704, 521 120.0, 2)) { 522 level = SEQ_LEVEL_7_2; 523 } else if (does_level_match(width, height, init_framerate, 32768, 17408, 524 30.0, 2)) { 525 level = SEQ_LEVEL_8_0; 526 } else if (does_level_match(width, height, init_framerate, 32768, 17408, 527 60.0, 2)) { 528 level = SEQ_LEVEL_8_1; 529 } else if (does_level_match(width, height, init_framerate, 32768, 17408, 530 120.0, 2)) { 531 level = SEQ_LEVEL_8_2; 532 } 533 } 534 #endif 535 536 for (int i = 0; i < MAX_NUM_OPERATING_POINTS; ++i) { 537 assert(is_valid_seq_level_idx(level_params->target_seq_level_idx[i]) || 538 level_params->target_seq_level_idx[i] == SEQ_LEVEL_KEEP_STATS); 539 // If a higher target level is specified, it is then used rather than the 540 // inferred one from resolution and framerate. 541 seq_params->seq_level_idx[i] = 542 level_params->target_seq_level_idx[i] < SEQ_LEVELS && 543 level_params->target_seq_level_idx[i] > level 544 ? level_params->target_seq_level_idx[i] 545 : level; 546 // Set the maximum parameters for bitrate and buffer size for this profile, 547 // level, and tier 548 seq_params->op_params[i].bitrate = av1_max_level_bitrate( 549 seq_params->profile, seq_params->seq_level_idx[i], seq_params->tier[i]); 550 // Level with seq_level_idx = 31 returns a high "dummy" bitrate to pass the 551 // check 552 if (seq_params->op_params[i].bitrate == 0) 553 aom_internal_error( 554 &ppi->error, AOM_CODEC_UNSUP_BITSTREAM, 555 "AV1 does not support this combination of profile, level, and tier."); 556 // Buffer size in bits/s is bitrate in bits/s * 1 s 557 seq_params->op_params[i].buffer_size = seq_params->op_params[i].bitrate; 558 } 559 } 560 561 void av1_set_svc_seq_params(AV1_PRIMARY *const ppi) { 562 SequenceHeader *const seq = &ppi->seq_params; 563 if (seq->operating_points_cnt_minus_1 == 0) { 564 seq->operating_point_idc[0] = 0; 565 seq->has_nonzero_operating_point_idc = false; 566 } else { 567 // Set operating_point_idc[] such that the i=0 point corresponds to the 568 // highest quality operating point (all layers), and subsequent 569 // operarting points (i > 0) are lower quality corresponding to 570 // skip decoding enhancement layers (temporal first). 571 int i = 0; 572 assert(seq->operating_points_cnt_minus_1 == 573 (int)(ppi->number_spatial_layers * ppi->number_temporal_layers - 1)); 574 for (unsigned int sl = 0; sl < ppi->number_spatial_layers; sl++) { 575 for (unsigned int tl = 0; tl < ppi->number_temporal_layers; tl++) { 576 seq->operating_point_idc[i] = 577 (~(~0u << (ppi->number_spatial_layers - sl)) << 8) | 578 ~(~0u << (ppi->number_temporal_layers - tl)); 579 assert(seq->operating_point_idc[i] != 0); 580 i++; 581 } 582 } 583 seq->has_nonzero_operating_point_idc = true; 584 } 585 } 586 587 static void init_seq_coding_tools(AV1_PRIMARY *const ppi, 588 const AV1EncoderConfig *oxcf, 589 int disable_frame_id_numbers) { 590 SequenceHeader *const seq = &ppi->seq_params; 591 const FrameDimensionCfg *const frm_dim_cfg = &oxcf->frm_dim_cfg; 592 const ToolCfg *const tool_cfg = &oxcf->tool_cfg; 593 594 seq->still_picture = 595 !tool_cfg->force_video_mode && (oxcf->input_cfg.limit == 1); 596 seq->reduced_still_picture_hdr = 597 seq->still_picture && !tool_cfg->full_still_picture_hdr; 598 seq->force_screen_content_tools = 2; 599 seq->force_integer_mv = 2; 600 seq->order_hint_info.enable_order_hint = tool_cfg->enable_order_hint; 601 seq->frame_id_numbers_present_flag = 602 !seq->reduced_still_picture_hdr && 603 !oxcf->tile_cfg.enable_large_scale_tile && 604 tool_cfg->error_resilient_mode && !disable_frame_id_numbers; 605 if (seq->reduced_still_picture_hdr) { 606 seq->order_hint_info.enable_order_hint = 0; 607 seq->force_screen_content_tools = 2; 608 seq->force_integer_mv = 2; 609 } 610 seq->order_hint_info.order_hint_bits_minus_1 = 611 seq->order_hint_info.enable_order_hint 612 ? DEFAULT_EXPLICIT_ORDER_HINT_BITS - 1 613 : -1; 614 615 seq->max_frame_width = frm_dim_cfg->forced_max_frame_width 616 ? frm_dim_cfg->forced_max_frame_width 617 : AOMMAX(seq->max_frame_width, frm_dim_cfg->width); 618 seq->max_frame_height = 619 frm_dim_cfg->forced_max_frame_height 620 ? frm_dim_cfg->forced_max_frame_height 621 : AOMMAX(seq->max_frame_height, frm_dim_cfg->height); 622 seq->num_bits_width = 623 (seq->max_frame_width > 1) ? get_msb(seq->max_frame_width - 1) + 1 : 1; 624 seq->num_bits_height = 625 (seq->max_frame_height > 1) ? get_msb(seq->max_frame_height - 1) + 1 : 1; 626 assert(seq->num_bits_width <= 16); 627 assert(seq->num_bits_height <= 16); 628 629 seq->frame_id_length = FRAME_ID_LENGTH; 630 seq->delta_frame_id_length = DELTA_FRAME_ID_LENGTH; 631 632 seq->enable_dual_filter = tool_cfg->enable_dual_filter; 633 seq->order_hint_info.enable_dist_wtd_comp = 634 oxcf->comp_type_cfg.enable_dist_wtd_comp; 635 seq->order_hint_info.enable_dist_wtd_comp &= 636 seq->order_hint_info.enable_order_hint; 637 seq->order_hint_info.enable_ref_frame_mvs = tool_cfg->ref_frame_mvs_present; 638 seq->order_hint_info.enable_ref_frame_mvs &= 639 seq->order_hint_info.enable_order_hint; 640 seq->enable_superres = oxcf->superres_cfg.enable_superres; 641 seq->enable_cdef = tool_cfg->cdef_control != CDEF_NONE ? 1 : 0; 642 seq->enable_restoration = tool_cfg->enable_restoration; 643 seq->enable_warped_motion = oxcf->motion_mode_cfg.enable_warped_motion; 644 seq->enable_interintra_compound = tool_cfg->enable_interintra_comp; 645 seq->enable_masked_compound = oxcf->comp_type_cfg.enable_masked_comp; 646 seq->enable_intra_edge_filter = oxcf->intra_mode_cfg.enable_intra_edge_filter; 647 seq->enable_filter_intra = oxcf->intra_mode_cfg.enable_filter_intra; 648 649 set_bitstream_level_tier(ppi, frm_dim_cfg->width, frm_dim_cfg->height, 650 oxcf->input_cfg.init_framerate); 651 av1_set_svc_seq_params(ppi); 652 } 653 654 static void init_config_sequence(struct AV1_PRIMARY *ppi, 655 const AV1EncoderConfig *oxcf) { 656 SequenceHeader *const seq_params = &ppi->seq_params; 657 const DecoderModelCfg *const dec_model_cfg = &oxcf->dec_model_cfg; 658 const ColorCfg *const color_cfg = &oxcf->color_cfg; 659 660 ppi->use_svc = 0; 661 ppi->number_spatial_layers = 1; 662 ppi->number_temporal_layers = 1; 663 664 seq_params->profile = oxcf->profile; 665 seq_params->bit_depth = oxcf->tool_cfg.bit_depth; 666 seq_params->use_highbitdepth = oxcf->use_highbitdepth; 667 seq_params->color_primaries = color_cfg->color_primaries; 668 seq_params->transfer_characteristics = color_cfg->transfer_characteristics; 669 seq_params->matrix_coefficients = color_cfg->matrix_coefficients; 670 seq_params->monochrome = oxcf->tool_cfg.enable_monochrome; 671 seq_params->chroma_sample_position = color_cfg->chroma_sample_position; 672 seq_params->color_range = color_cfg->color_range; 673 seq_params->timing_info_present = dec_model_cfg->timing_info_present; 674 seq_params->timing_info.num_units_in_display_tick = 675 dec_model_cfg->timing_info.num_units_in_display_tick; 676 seq_params->timing_info.time_scale = dec_model_cfg->timing_info.time_scale; 677 seq_params->timing_info.equal_picture_interval = 678 dec_model_cfg->timing_info.equal_picture_interval; 679 seq_params->timing_info.num_ticks_per_picture = 680 dec_model_cfg->timing_info.num_ticks_per_picture; 681 682 seq_params->display_model_info_present_flag = 683 dec_model_cfg->display_model_info_present_flag; 684 seq_params->decoder_model_info_present_flag = 685 dec_model_cfg->decoder_model_info_present_flag; 686 if (dec_model_cfg->decoder_model_info_present_flag) { 687 // set the decoder model parameters in schedule mode 688 seq_params->decoder_model_info.num_units_in_decoding_tick = 689 dec_model_cfg->num_units_in_decoding_tick; 690 ppi->buffer_removal_time_present = 1; 691 av1_set_aom_dec_model_info(&seq_params->decoder_model_info); 692 av1_set_dec_model_op_parameters(&seq_params->op_params[0]); 693 } else if (seq_params->timing_info_present && 694 seq_params->timing_info.equal_picture_interval && 695 !seq_params->decoder_model_info_present_flag) { 696 // set the decoder model parameters in resource availability mode 697 av1_set_resource_availability_parameters(&seq_params->op_params[0]); 698 } else { 699 seq_params->op_params[0].initial_display_delay = 700 10; // Default value (not signaled) 701 } 702 703 if (seq_params->monochrome) { 704 seq_params->subsampling_x = 1; 705 seq_params->subsampling_y = 1; 706 } else if (seq_params->color_primaries == AOM_CICP_CP_BT_709 && 707 seq_params->transfer_characteristics == AOM_CICP_TC_SRGB && 708 seq_params->matrix_coefficients == AOM_CICP_MC_IDENTITY) { 709 seq_params->subsampling_x = 0; 710 seq_params->subsampling_y = 0; 711 } else { 712 if (seq_params->profile == 0) { 713 seq_params->subsampling_x = 1; 714 seq_params->subsampling_y = 1; 715 } else if (seq_params->profile == 1) { 716 seq_params->subsampling_x = 0; 717 seq_params->subsampling_y = 0; 718 } else { 719 if (seq_params->bit_depth == AOM_BITS_12) { 720 seq_params->subsampling_x = oxcf->input_cfg.chroma_subsampling_x; 721 seq_params->subsampling_y = oxcf->input_cfg.chroma_subsampling_y; 722 } else { 723 seq_params->subsampling_x = 1; 724 seq_params->subsampling_y = 0; 725 } 726 } 727 } 728 av1_change_config_seq(ppi, oxcf, NULL); 729 } 730 731 static void init_config(struct AV1_COMP *cpi, const AV1EncoderConfig *oxcf) { 732 AV1_COMMON *const cm = &cpi->common; 733 ResizePendingParams *resize_pending_params = &cpi->resize_pending_params; 734 735 cpi->oxcf = *oxcf; 736 cpi->framerate = oxcf->input_cfg.init_framerate; 737 738 cm->width = oxcf->frm_dim_cfg.width; 739 cm->height = oxcf->frm_dim_cfg.height; 740 cpi->is_dropped_frame = false; 741 742 alloc_compressor_data(cpi); 743 744 cpi->data_alloc_width = cm->width; 745 cpi->data_alloc_height = cm->height; 746 cpi->frame_size_related_setup_done = false; 747 748 // Single thread case: use counts in common. 749 cpi->td.counts = &cpi->counts; 750 751 // Init SVC parameters. 752 cpi->svc.number_spatial_layers = 1; 753 cpi->svc.number_temporal_layers = 1; 754 cm->spatial_layer_id = 0; 755 cm->temporal_layer_id = 0; 756 // Init rtc_ref parameters. 757 cpi->ppi->rtc_ref.set_ref_frame_config = 0; 758 cpi->ppi->rtc_ref.non_reference_frame = 0; 759 cpi->ppi->rtc_ref.ref_frame_comp[0] = 0; 760 cpi->ppi->rtc_ref.ref_frame_comp[1] = 0; 761 cpi->ppi->rtc_ref.ref_frame_comp[2] = 0; 762 763 // change includes all joint functionality 764 av1_change_config(cpi, oxcf, false); 765 766 cpi->ref_frame_flags = 0; 767 768 // Reset resize pending flags 769 resize_pending_params->width = 0; 770 resize_pending_params->height = 0; 771 772 // Setup identity scale factor 773 av1_setup_scale_factors_for_frame(&cm->sf_identity, 1, 1, 1, 1); 774 775 init_buffer_indices(&cpi->force_intpel_info, cm->remapped_ref_idx); 776 777 av1_noise_estimate_init(&cpi->noise_estimate, cm->width, cm->height); 778 } 779 780 void av1_change_config_seq(struct AV1_PRIMARY *ppi, 781 const AV1EncoderConfig *oxcf, 782 bool *is_sb_size_changed) { 783 SequenceHeader *const seq_params = &ppi->seq_params; 784 const FrameDimensionCfg *const frm_dim_cfg = &oxcf->frm_dim_cfg; 785 const DecoderModelCfg *const dec_model_cfg = &oxcf->dec_model_cfg; 786 const ColorCfg *const color_cfg = &oxcf->color_cfg; 787 788 if (seq_params->profile != oxcf->profile) seq_params->profile = oxcf->profile; 789 seq_params->bit_depth = oxcf->tool_cfg.bit_depth; 790 seq_params->color_primaries = color_cfg->color_primaries; 791 seq_params->transfer_characteristics = color_cfg->transfer_characteristics; 792 seq_params->matrix_coefficients = color_cfg->matrix_coefficients; 793 seq_params->monochrome = oxcf->tool_cfg.enable_monochrome; 794 seq_params->chroma_sample_position = color_cfg->chroma_sample_position; 795 seq_params->color_range = color_cfg->color_range; 796 797 assert(IMPLIES(seq_params->profile <= PROFILE_1, 798 seq_params->bit_depth <= AOM_BITS_10)); 799 800 seq_params->timing_info_present = dec_model_cfg->timing_info_present; 801 seq_params->timing_info.num_units_in_display_tick = 802 dec_model_cfg->timing_info.num_units_in_display_tick; 803 seq_params->timing_info.time_scale = dec_model_cfg->timing_info.time_scale; 804 seq_params->timing_info.equal_picture_interval = 805 dec_model_cfg->timing_info.equal_picture_interval; 806 seq_params->timing_info.num_ticks_per_picture = 807 dec_model_cfg->timing_info.num_ticks_per_picture; 808 809 seq_params->display_model_info_present_flag = 810 dec_model_cfg->display_model_info_present_flag; 811 seq_params->decoder_model_info_present_flag = 812 dec_model_cfg->decoder_model_info_present_flag; 813 if (dec_model_cfg->decoder_model_info_present_flag) { 814 // set the decoder model parameters in schedule mode 815 seq_params->decoder_model_info.num_units_in_decoding_tick = 816 dec_model_cfg->num_units_in_decoding_tick; 817 ppi->buffer_removal_time_present = 1; 818 av1_set_aom_dec_model_info(&seq_params->decoder_model_info); 819 av1_set_dec_model_op_parameters(&seq_params->op_params[0]); 820 } else if (seq_params->timing_info_present && 821 seq_params->timing_info.equal_picture_interval && 822 !seq_params->decoder_model_info_present_flag) { 823 // set the decoder model parameters in resource availability mode 824 av1_set_resource_availability_parameters(&seq_params->op_params[0]); 825 } else { 826 seq_params->op_params[0].initial_display_delay = 827 10; // Default value (not signaled) 828 } 829 830 #if !CONFIG_REALTIME_ONLY 831 av1_update_film_grain_parameters_seq(ppi, oxcf); 832 #endif 833 834 int sb_size = seq_params->sb_size; 835 // Superblock size should not be updated after the first key frame. 836 if (!ppi->seq_params_locked) { 837 set_sb_size(seq_params, av1_select_sb_size(oxcf, frm_dim_cfg->width, 838 frm_dim_cfg->height, 839 ppi->number_spatial_layers)); 840 for (int i = 0; i < MAX_NUM_OPERATING_POINTS; ++i) 841 seq_params->tier[i] = (oxcf->tier_mask >> i) & 1; 842 } 843 if (is_sb_size_changed != NULL && sb_size != seq_params->sb_size) 844 *is_sb_size_changed = true; 845 846 // Init sequence level coding tools 847 // This should not be called after the first key frame. 848 // Note that for SVC encoding the sequence parameters 849 // (operating_points_cnt_minus_1, operating_point_idc[], 850 // has_nonzero_operating_point_idc) should be updated whenever the 851 // number of layers is changed. This is done in the 852 // ctrl_set_svc_params(). 853 if (!ppi->seq_params_locked) { 854 seq_params->operating_points_cnt_minus_1 = 855 (ppi->number_spatial_layers > 1 || ppi->number_temporal_layers > 1) 856 ? ppi->number_spatial_layers * ppi->number_temporal_layers - 1 857 : 0; 858 init_seq_coding_tools(ppi, oxcf, 859 ppi->use_svc || ppi->rtc_ref.set_ref_frame_config); 860 } 861 seq_params->timing_info_present &= !seq_params->reduced_still_picture_hdr; 862 863 #if CONFIG_AV1_HIGHBITDEPTH 864 highbd_set_var_fns(ppi); 865 #endif 866 867 set_primary_rc_buffer_sizes(oxcf, ppi); 868 } 869 870 void av1_change_config(struct AV1_COMP *cpi, const AV1EncoderConfig *oxcf, 871 bool is_sb_size_changed) { 872 AV1_COMMON *const cm = &cpi->common; 873 SequenceHeader *const seq_params = cm->seq_params; 874 RATE_CONTROL *const rc = &cpi->rc; 875 PRIMARY_RATE_CONTROL *const p_rc = &cpi->ppi->p_rc; 876 MACROBLOCK *const x = &cpi->td.mb; 877 AV1LevelParams *const level_params = &cpi->ppi->level_params; 878 RefreshFrameInfo *const refresh_frame = &cpi->refresh_frame; 879 const FrameDimensionCfg *const frm_dim_cfg = &cpi->oxcf.frm_dim_cfg; 880 const RateControlCfg *const rc_cfg = &oxcf->rc_cfg; 881 FeatureFlags *const features = &cm->features; 882 883 // in case of LAP, lag in frames is set according to number of lap buffers 884 // calculated at init time. This stores and restores LAP's lag in frames to 885 // prevent override by new cfg. 886 int lap_lag_in_frames = -1; 887 if (cpi->ppi->lap_enabled && cpi->compressor_stage == LAP_STAGE) { 888 lap_lag_in_frames = cpi->oxcf.gf_cfg.lag_in_frames; 889 } 890 891 cpi->oxcf = *oxcf; 892 893 #if !CONFIG_REALTIME_ONLY 894 av1_update_film_grain_parameters(cpi, oxcf); 895 #endif 896 897 // When user provides superres_mode = AOM_SUPERRES_AUTO, we still initialize 898 // superres mode for current encoding = AOM_SUPERRES_NONE. This is to ensure 899 // that any analysis (e.g. TPL) happening outside the main encoding loop still 900 // happens at full resolution. 901 // This value will later be set appropriately just before main encoding loop. 902 cpi->superres_mode = oxcf->superres_cfg.superres_mode == AOM_SUPERRES_AUTO 903 ? AOM_SUPERRES_NONE 904 : oxcf->superres_cfg.superres_mode; // default 905 x->e_mbd.bd = (int)seq_params->bit_depth; 906 x->e_mbd.global_motion = cm->global_motion; 907 908 memcpy(level_params->target_seq_level_idx, cpi->oxcf.target_seq_level_idx, 909 sizeof(level_params->target_seq_level_idx)); 910 level_params->keep_level_stats = 0; 911 for (int i = 0; i < MAX_NUM_OPERATING_POINTS; ++i) { 912 if (level_params->target_seq_level_idx[i] < SEQ_LEVELS || 913 level_params->target_seq_level_idx[i] == SEQ_LEVEL_KEEP_STATS) { 914 level_params->keep_level_stats |= 1u << i; 915 if (!level_params->level_info[i]) { 916 CHECK_MEM_ERROR(cm, level_params->level_info[i], 917 aom_calloc(1, sizeof(*level_params->level_info[i]))); 918 } 919 } 920 } 921 922 // TODO(huisu@): level targeting currently only works for the 0th operating 923 // point, so scalable coding is not supported yet. 924 if (level_params->target_seq_level_idx[0] < SEQ_LEVELS) { 925 // Adjust encoder config in order to meet target level. 926 config_target_level(cpi, level_params->target_seq_level_idx[0], 927 seq_params->tier[0]); 928 } 929 930 if (has_no_stats_stage(cpi) && (rc_cfg->mode == AOM_Q)) { 931 p_rc->baseline_gf_interval = FIXED_GF_INTERVAL; 932 } else if (!is_one_pass_rt_params(cpi) || 933 cm->current_frame.frame_number == 0) { 934 // For rtc mode: logic for setting the baseline_gf_interval is done 935 // in av1_get_one_pass_rt_params(), and it should not be reset here in 936 // change_config(), unless after init_config (first frame). 937 p_rc->baseline_gf_interval = (MIN_GF_INTERVAL + MAX_GF_INTERVAL) / 2; 938 } 939 940 refresh_frame->golden_frame = false; 941 refresh_frame->bwd_ref_frame = false; 942 943 features->refresh_frame_context = 944 (oxcf->tool_cfg.frame_parallel_decoding_mode) 945 ? REFRESH_FRAME_CONTEXT_DISABLED 946 : REFRESH_FRAME_CONTEXT_BACKWARD; 947 if (oxcf->tile_cfg.enable_large_scale_tile) 948 features->refresh_frame_context = REFRESH_FRAME_CONTEXT_DISABLED; 949 950 if (x->palette_buffer == NULL) { 951 CHECK_MEM_ERROR(cm, x->palette_buffer, 952 aom_memalign(16, sizeof(*x->palette_buffer))); 953 } 954 955 if (x->tmp_conv_dst == NULL) { 956 CHECK_MEM_ERROR( 957 cm, x->tmp_conv_dst, 958 aom_memalign(32, MAX_SB_SIZE * MAX_SB_SIZE * sizeof(*x->tmp_conv_dst))); 959 x->e_mbd.tmp_conv_dst = x->tmp_conv_dst; 960 } 961 // The buffers 'tmp_pred_bufs[]' and 'comp_rd_buffer' are used in inter frames 962 // to store intermediate inter mode prediction results and are not required 963 // for allintra encoding mode. Hence, the memory allocations for these buffers 964 // are avoided for allintra encoding mode. 965 if (cpi->oxcf.kf_cfg.key_freq_max != 0) { 966 if (x->comp_rd_buffer.pred0 == NULL) 967 alloc_compound_type_rd_buffers(cm->error, &x->comp_rd_buffer); 968 969 for (int i = 0; i < 2; ++i) { 970 if (x->tmp_pred_bufs[i] == NULL) { 971 CHECK_MEM_ERROR(cm, x->tmp_pred_bufs[i], 972 aom_memalign(32, 2 * MAX_MB_PLANE * MAX_SB_SQUARE * 973 sizeof(*x->tmp_pred_bufs[i]))); 974 x->e_mbd.tmp_obmc_bufs[i] = x->tmp_pred_bufs[i]; 975 } 976 } 977 } 978 979 av1_reset_segment_features(cm); 980 981 av1_set_high_precision_mv(cpi, 1, 0); 982 983 // Under a configuration change, where maximum_buffer_size may change, 984 // keep buffer level clipped to the maximum allowed buffer size. 985 p_rc->bits_off_target = 986 AOMMIN(p_rc->bits_off_target, p_rc->maximum_buffer_size); 987 p_rc->buffer_level = AOMMIN(p_rc->buffer_level, p_rc->maximum_buffer_size); 988 989 // Set up frame rate and related parameters rate control values. 990 av1_new_framerate(cpi, cpi->framerate); 991 992 // Set absolute upper and lower quality limits 993 rc->worst_quality = rc_cfg->worst_allowed_q; 994 rc->best_quality = rc_cfg->best_allowed_q; 995 996 // If lossless has been requested make sure average Q accumulators are reset. 997 if (is_lossless_requested(&cpi->oxcf.rc_cfg)) { 998 int i; 999 for (i = 0; i < FRAME_TYPES; ++i) { 1000 p_rc->avg_frame_qindex[i] = 0; 1001 } 1002 } 1003 1004 features->interp_filter = 1005 oxcf->tile_cfg.enable_large_scale_tile ? EIGHTTAP_REGULAR : SWITCHABLE; 1006 features->switchable_motion_mode = is_switchable_motion_mode_allowed( 1007 features->allow_warped_motion, oxcf->motion_mode_cfg.enable_obmc); 1008 1009 if (frm_dim_cfg->render_width > 0 && frm_dim_cfg->render_height > 0) { 1010 cm->render_width = frm_dim_cfg->render_width; 1011 cm->render_height = frm_dim_cfg->render_height; 1012 } else { 1013 cm->render_width = frm_dim_cfg->width; 1014 cm->render_height = frm_dim_cfg->height; 1015 } 1016 1017 int last_width = cm->width; 1018 int last_height = cm->height; 1019 cm->width = frm_dim_cfg->width; 1020 cm->height = frm_dim_cfg->height; 1021 1022 if (cm->width > cpi->data_alloc_width || 1023 cm->height > cpi->data_alloc_height || is_sb_size_changed) { 1024 av1_free_context_buffers(cm); 1025 av1_free_shared_coeff_buffer(&cpi->td.shared_coeff_buf); 1026 av1_free_sms_tree(&cpi->td); 1027 av1_free_pmc(cpi->td.firstpass_ctx, av1_num_planes(cm)); 1028 cpi->td.firstpass_ctx = NULL; 1029 alloc_compressor_data(cpi); 1030 realloc_segmentation_maps(cpi); 1031 cpi->data_alloc_width = cm->width; 1032 cpi->data_alloc_height = cm->height; 1033 cpi->frame_size_related_setup_done = false; 1034 } 1035 av1_update_frame_size(cpi); 1036 1037 if (cm->width != last_width || cm->height != last_height) { 1038 if (cpi->oxcf.q_cfg.aq_mode == CYCLIC_REFRESH_AQ) { 1039 int mi_rows = cpi->common.mi_params.mi_rows; 1040 int mi_cols = cpi->common.mi_params.mi_cols; 1041 aom_free(cpi->cyclic_refresh->map); 1042 CHECK_MEM_ERROR( 1043 cm, cpi->cyclic_refresh->map, 1044 aom_calloc(mi_rows * mi_cols, sizeof(*cpi->cyclic_refresh->map))); 1045 if (cpi->svc.number_spatial_layers > 1) { 1046 for (int sl = 0; sl < cpi->svc.number_spatial_layers; ++sl) { 1047 const int layer = 1048 LAYER_IDS_TO_IDX(sl, 0, cpi->svc.number_temporal_layers); 1049 LAYER_CONTEXT *const lc = &cpi->svc.layer_context[layer]; 1050 lc->sb_index = 0; 1051 lc->actual_num_seg1_blocks = 0; 1052 lc->actual_num_seg2_blocks = 0; 1053 lc->counter_encode_maxq_scene_change = 0; 1054 aom_free(lc->map); 1055 CHECK_MEM_ERROR(cm, lc->map, 1056 aom_calloc(mi_rows * mi_cols, sizeof(*lc->map))); 1057 } 1058 } 1059 } 1060 } 1061 1062 rc->is_src_frame_alt_ref = 0; 1063 1064 if (!cpi->ppi->rtc_ref.set_ref_frame_config) 1065 cpi->ext_flags.refresh_frame.update_pending = 0; 1066 cpi->ext_flags.refresh_frame_context_pending = 0; 1067 1068 if (cpi->ppi->use_svc) 1069 av1_update_layer_context_change_config(cpi, rc_cfg->target_bandwidth); 1070 1071 check_reset_rc_flag(cpi); 1072 1073 // restore the value of lag_in_frame for LAP stage. 1074 if (lap_lag_in_frames != -1) { 1075 cpi->oxcf.gf_cfg.lag_in_frames = lap_lag_in_frames; 1076 } 1077 1078 #if CONFIG_REALTIME_ONLY 1079 assert(!oxcf->tool_cfg.enable_global_motion); 1080 cpi->alloc_pyramid = false; 1081 #else 1082 cpi->alloc_pyramid = oxcf->tool_cfg.enable_global_motion; 1083 #endif // CONFIG_REALTIME_ONLY 1084 } 1085 1086 static inline void init_frame_info(FRAME_INFO *frame_info, 1087 const AV1_COMMON *const cm) { 1088 const CommonModeInfoParams *const mi_params = &cm->mi_params; 1089 const SequenceHeader *const seq_params = cm->seq_params; 1090 frame_info->frame_width = cm->width; 1091 frame_info->frame_height = cm->height; 1092 frame_info->mi_cols = mi_params->mi_cols; 1093 frame_info->mi_rows = mi_params->mi_rows; 1094 frame_info->mb_cols = mi_params->mb_cols; 1095 frame_info->mb_rows = mi_params->mb_rows; 1096 frame_info->num_mbs = mi_params->MBs; 1097 frame_info->bit_depth = seq_params->bit_depth; 1098 frame_info->subsampling_x = seq_params->subsampling_x; 1099 frame_info->subsampling_y = seq_params->subsampling_y; 1100 } 1101 1102 static inline void init_frame_index_set(FRAME_INDEX_SET *frame_index_set) { 1103 frame_index_set->show_frame_count = 0; 1104 } 1105 1106 static inline void update_counters_for_show_frame(AV1_COMP *const cpi) { 1107 assert(cpi->common.show_frame); 1108 cpi->frame_index_set.show_frame_count++; 1109 cpi->common.current_frame.frame_number++; 1110 } 1111 1112 AV1_PRIMARY *av1_create_primary_compressor( 1113 struct aom_codec_pkt_list *pkt_list_head, int num_lap_buffers, 1114 const AV1EncoderConfig *oxcf) { 1115 AV1_PRIMARY *volatile const ppi = aom_memalign(32, sizeof(AV1_PRIMARY)); 1116 if (!ppi) return NULL; 1117 av1_zero(*ppi); 1118 1119 // The jmp_buf is valid only for the duration of the function that calls 1120 // setjmp(). Therefore, this function must reset the 'setjmp' field to 0 1121 // before it returns. 1122 if (setjmp(ppi->error.jmp)) { 1123 ppi->error.setjmp = 0; 1124 av1_remove_primary_compressor(ppi); 1125 return 0; 1126 } 1127 ppi->error.setjmp = 1; 1128 1129 ppi->seq_params_locked = 0; 1130 ppi->lap_enabled = num_lap_buffers > 0; 1131 ppi->output_pkt_list = pkt_list_head; 1132 ppi->b_calculate_psnr = CONFIG_INTERNAL_STATS; 1133 ppi->frames_left = oxcf->input_cfg.limit; 1134 ppi->num_fp_contexts = 1; 1135 1136 init_config_sequence(ppi, oxcf); 1137 1138 #if CONFIG_ENTROPY_STATS 1139 av1_zero(ppi->aggregate_fc); 1140 #endif // CONFIG_ENTROPY_STATS 1141 1142 av1_primary_rc_init(oxcf, &ppi->p_rc); 1143 1144 // For two pass and lag_in_frames > 33 in LAP. 1145 ppi->p_rc.enable_scenecut_detection = ENABLE_SCENECUT_MODE_2; 1146 if (ppi->lap_enabled) { 1147 if ((num_lap_buffers < 1148 (MAX_GF_LENGTH_LAP + SCENE_CUT_KEY_TEST_INTERVAL + 1)) && 1149 num_lap_buffers >= (MAX_GF_LENGTH_LAP + 3)) { 1150 /* 1151 * For lag in frames >= 19 and <33, enable scenecut 1152 * with limited future frame prediction. 1153 */ 1154 ppi->p_rc.enable_scenecut_detection = ENABLE_SCENECUT_MODE_1; 1155 } else if (num_lap_buffers < (MAX_GF_LENGTH_LAP + 3)) { 1156 // Disable scenecut when lag_in_frames < 19. 1157 ppi->p_rc.enable_scenecut_detection = DISABLE_SCENECUT; 1158 } 1159 } 1160 1161 #define BFP(BT, SDF, SDAF, VF, SVF, SVAF, SDX4DF, SDX3DF) \ 1162 ppi->fn_ptr[BT].sdf = SDF; \ 1163 ppi->fn_ptr[BT].sdaf = SDAF; \ 1164 ppi->fn_ptr[BT].vf = VF; \ 1165 ppi->fn_ptr[BT].svf = SVF; \ 1166 ppi->fn_ptr[BT].svaf = SVAF; \ 1167 ppi->fn_ptr[BT].sdx4df = SDX4DF; \ 1168 ppi->fn_ptr[BT].sdx3df = SDX3DF; 1169 1170 // Realtime mode doesn't use 4x rectangular blocks. 1171 #if !CONFIG_REALTIME_ONLY 1172 // sdaf (used in compound prediction, get_mvpred_compound_sad()) is unused 1173 // for 4xN and Nx4 blocks. 1174 BFP(BLOCK_4X16, aom_sad4x16, /*SDAF=*/NULL, aom_variance4x16, 1175 aom_sub_pixel_variance4x16, aom_sub_pixel_avg_variance4x16, 1176 aom_sad4x16x4d, aom_sad4x16x3d) 1177 1178 // sdaf (used in compound prediction, get_mvpred_compound_sad()) is unused 1179 // for 4xN and Nx4 blocks. 1180 BFP(BLOCK_16X4, aom_sad16x4, /*SDAF=*/NULL, aom_variance16x4, 1181 aom_sub_pixel_variance16x4, aom_sub_pixel_avg_variance16x4, 1182 aom_sad16x4x4d, aom_sad16x4x3d) 1183 1184 BFP(BLOCK_8X32, aom_sad8x32, aom_sad8x32_avg, aom_variance8x32, 1185 aom_sub_pixel_variance8x32, aom_sub_pixel_avg_variance8x32, 1186 aom_sad8x32x4d, aom_sad8x32x3d) 1187 1188 BFP(BLOCK_32X8, aom_sad32x8, aom_sad32x8_avg, aom_variance32x8, 1189 aom_sub_pixel_variance32x8, aom_sub_pixel_avg_variance32x8, 1190 aom_sad32x8x4d, aom_sad32x8x3d) 1191 1192 BFP(BLOCK_16X64, aom_sad16x64, aom_sad16x64_avg, aom_variance16x64, 1193 aom_sub_pixel_variance16x64, aom_sub_pixel_avg_variance16x64, 1194 aom_sad16x64x4d, aom_sad16x64x3d) 1195 1196 BFP(BLOCK_64X16, aom_sad64x16, aom_sad64x16_avg, aom_variance64x16, 1197 aom_sub_pixel_variance64x16, aom_sub_pixel_avg_variance64x16, 1198 aom_sad64x16x4d, aom_sad64x16x3d) 1199 #endif // !CONFIG_REALTIME_ONLY 1200 1201 BFP(BLOCK_128X128, aom_sad128x128, aom_sad128x128_avg, aom_variance128x128, 1202 aom_sub_pixel_variance128x128, aom_sub_pixel_avg_variance128x128, 1203 aom_sad128x128x4d, aom_sad128x128x3d) 1204 1205 BFP(BLOCK_128X64, aom_sad128x64, aom_sad128x64_avg, aom_variance128x64, 1206 aom_sub_pixel_variance128x64, aom_sub_pixel_avg_variance128x64, 1207 aom_sad128x64x4d, aom_sad128x64x3d) 1208 1209 BFP(BLOCK_64X128, aom_sad64x128, aom_sad64x128_avg, aom_variance64x128, 1210 aom_sub_pixel_variance64x128, aom_sub_pixel_avg_variance64x128, 1211 aom_sad64x128x4d, aom_sad64x128x3d) 1212 1213 BFP(BLOCK_32X16, aom_sad32x16, aom_sad32x16_avg, aom_variance32x16, 1214 aom_sub_pixel_variance32x16, aom_sub_pixel_avg_variance32x16, 1215 aom_sad32x16x4d, aom_sad32x16x3d) 1216 1217 BFP(BLOCK_16X32, aom_sad16x32, aom_sad16x32_avg, aom_variance16x32, 1218 aom_sub_pixel_variance16x32, aom_sub_pixel_avg_variance16x32, 1219 aom_sad16x32x4d, aom_sad16x32x3d) 1220 1221 BFP(BLOCK_64X32, aom_sad64x32, aom_sad64x32_avg, aom_variance64x32, 1222 aom_sub_pixel_variance64x32, aom_sub_pixel_avg_variance64x32, 1223 aom_sad64x32x4d, aom_sad64x32x3d) 1224 1225 BFP(BLOCK_32X64, aom_sad32x64, aom_sad32x64_avg, aom_variance32x64, 1226 aom_sub_pixel_variance32x64, aom_sub_pixel_avg_variance32x64, 1227 aom_sad32x64x4d, aom_sad32x64x3d) 1228 1229 BFP(BLOCK_32X32, aom_sad32x32, aom_sad32x32_avg, aom_variance32x32, 1230 aom_sub_pixel_variance32x32, aom_sub_pixel_avg_variance32x32, 1231 aom_sad32x32x4d, aom_sad32x32x3d) 1232 1233 BFP(BLOCK_64X64, aom_sad64x64, aom_sad64x64_avg, aom_variance64x64, 1234 aom_sub_pixel_variance64x64, aom_sub_pixel_avg_variance64x64, 1235 aom_sad64x64x4d, aom_sad64x64x3d) 1236 1237 BFP(BLOCK_16X16, aom_sad16x16, aom_sad16x16_avg, aom_variance16x16, 1238 aom_sub_pixel_variance16x16, aom_sub_pixel_avg_variance16x16, 1239 aom_sad16x16x4d, aom_sad16x16x3d) 1240 1241 BFP(BLOCK_16X8, aom_sad16x8, aom_sad16x8_avg, aom_variance16x8, 1242 aom_sub_pixel_variance16x8, aom_sub_pixel_avg_variance16x8, 1243 aom_sad16x8x4d, aom_sad16x8x3d) 1244 1245 BFP(BLOCK_8X16, aom_sad8x16, aom_sad8x16_avg, aom_variance8x16, 1246 aom_sub_pixel_variance8x16, aom_sub_pixel_avg_variance8x16, 1247 aom_sad8x16x4d, aom_sad8x16x3d) 1248 1249 BFP(BLOCK_8X8, aom_sad8x8, aom_sad8x8_avg, aom_variance8x8, 1250 aom_sub_pixel_variance8x8, aom_sub_pixel_avg_variance8x8, aom_sad8x8x4d, 1251 aom_sad8x8x3d) 1252 1253 // sdaf (used in compound prediction, get_mvpred_compound_sad()) is unused 1254 // for 4xN and Nx4 blocks. 1255 BFP(BLOCK_8X4, aom_sad8x4, /*SDAF=*/NULL, aom_variance8x4, 1256 aom_sub_pixel_variance8x4, aom_sub_pixel_avg_variance8x4, aom_sad8x4x4d, 1257 aom_sad8x4x3d) 1258 1259 // sdaf (used in compound prediction, get_mvpred_compound_sad()) is unused 1260 // for 4xN and Nx4 blocks. 1261 BFP(BLOCK_4X8, aom_sad4x8, /*SDAF=*/NULL, aom_variance4x8, 1262 aom_sub_pixel_variance4x8, aom_sub_pixel_avg_variance4x8, aom_sad4x8x4d, 1263 aom_sad4x8x3d) 1264 1265 // sdaf (used in compound prediction, get_mvpred_compound_sad()) is unused 1266 // for 4xN and Nx4 blocks. 1267 BFP(BLOCK_4X4, aom_sad4x4, /*SDAF=*/NULL, aom_variance4x4, 1268 aom_sub_pixel_variance4x4, aom_sub_pixel_avg_variance4x4, aom_sad4x4x4d, 1269 aom_sad4x4x3d) 1270 1271 #if !CONFIG_REALTIME_ONLY 1272 #define OBFP(BT, OSDF, OVF, OSVF) \ 1273 ppi->fn_ptr[BT].osdf = OSDF; \ 1274 ppi->fn_ptr[BT].ovf = OVF; \ 1275 ppi->fn_ptr[BT].osvf = OSVF; 1276 1277 OBFP(BLOCK_128X128, aom_obmc_sad128x128, aom_obmc_variance128x128, 1278 aom_obmc_sub_pixel_variance128x128) 1279 OBFP(BLOCK_128X64, aom_obmc_sad128x64, aom_obmc_variance128x64, 1280 aom_obmc_sub_pixel_variance128x64) 1281 OBFP(BLOCK_64X128, aom_obmc_sad64x128, aom_obmc_variance64x128, 1282 aom_obmc_sub_pixel_variance64x128) 1283 OBFP(BLOCK_64X64, aom_obmc_sad64x64, aom_obmc_variance64x64, 1284 aom_obmc_sub_pixel_variance64x64) 1285 OBFP(BLOCK_64X32, aom_obmc_sad64x32, aom_obmc_variance64x32, 1286 aom_obmc_sub_pixel_variance64x32) 1287 OBFP(BLOCK_32X64, aom_obmc_sad32x64, aom_obmc_variance32x64, 1288 aom_obmc_sub_pixel_variance32x64) 1289 OBFP(BLOCK_32X32, aom_obmc_sad32x32, aom_obmc_variance32x32, 1290 aom_obmc_sub_pixel_variance32x32) 1291 OBFP(BLOCK_32X16, aom_obmc_sad32x16, aom_obmc_variance32x16, 1292 aom_obmc_sub_pixel_variance32x16) 1293 OBFP(BLOCK_16X32, aom_obmc_sad16x32, aom_obmc_variance16x32, 1294 aom_obmc_sub_pixel_variance16x32) 1295 OBFP(BLOCK_16X16, aom_obmc_sad16x16, aom_obmc_variance16x16, 1296 aom_obmc_sub_pixel_variance16x16) 1297 OBFP(BLOCK_16X8, aom_obmc_sad16x8, aom_obmc_variance16x8, 1298 aom_obmc_sub_pixel_variance16x8) 1299 OBFP(BLOCK_8X16, aom_obmc_sad8x16, aom_obmc_variance8x16, 1300 aom_obmc_sub_pixel_variance8x16) 1301 OBFP(BLOCK_8X8, aom_obmc_sad8x8, aom_obmc_variance8x8, 1302 aom_obmc_sub_pixel_variance8x8) 1303 OBFP(BLOCK_4X8, aom_obmc_sad4x8, aom_obmc_variance4x8, 1304 aom_obmc_sub_pixel_variance4x8) 1305 OBFP(BLOCK_8X4, aom_obmc_sad8x4, aom_obmc_variance8x4, 1306 aom_obmc_sub_pixel_variance8x4) 1307 OBFP(BLOCK_4X4, aom_obmc_sad4x4, aom_obmc_variance4x4, 1308 aom_obmc_sub_pixel_variance4x4) 1309 OBFP(BLOCK_4X16, aom_obmc_sad4x16, aom_obmc_variance4x16, 1310 aom_obmc_sub_pixel_variance4x16) 1311 OBFP(BLOCK_16X4, aom_obmc_sad16x4, aom_obmc_variance16x4, 1312 aom_obmc_sub_pixel_variance16x4) 1313 OBFP(BLOCK_8X32, aom_obmc_sad8x32, aom_obmc_variance8x32, 1314 aom_obmc_sub_pixel_variance8x32) 1315 OBFP(BLOCK_32X8, aom_obmc_sad32x8, aom_obmc_variance32x8, 1316 aom_obmc_sub_pixel_variance32x8) 1317 OBFP(BLOCK_16X64, aom_obmc_sad16x64, aom_obmc_variance16x64, 1318 aom_obmc_sub_pixel_variance16x64) 1319 OBFP(BLOCK_64X16, aom_obmc_sad64x16, aom_obmc_variance64x16, 1320 aom_obmc_sub_pixel_variance64x16) 1321 #endif // !CONFIG_REALTIME_ONLY 1322 1323 #define MBFP(BT, MCSDF, MCSVF) \ 1324 ppi->fn_ptr[BT].msdf = MCSDF; \ 1325 ppi->fn_ptr[BT].msvf = MCSVF; 1326 1327 MBFP(BLOCK_128X128, aom_masked_sad128x128, 1328 aom_masked_sub_pixel_variance128x128) 1329 MBFP(BLOCK_128X64, aom_masked_sad128x64, aom_masked_sub_pixel_variance128x64) 1330 MBFP(BLOCK_64X128, aom_masked_sad64x128, aom_masked_sub_pixel_variance64x128) 1331 MBFP(BLOCK_64X64, aom_masked_sad64x64, aom_masked_sub_pixel_variance64x64) 1332 MBFP(BLOCK_64X32, aom_masked_sad64x32, aom_masked_sub_pixel_variance64x32) 1333 MBFP(BLOCK_32X64, aom_masked_sad32x64, aom_masked_sub_pixel_variance32x64) 1334 MBFP(BLOCK_32X32, aom_masked_sad32x32, aom_masked_sub_pixel_variance32x32) 1335 MBFP(BLOCK_32X16, aom_masked_sad32x16, aom_masked_sub_pixel_variance32x16) 1336 MBFP(BLOCK_16X32, aom_masked_sad16x32, aom_masked_sub_pixel_variance16x32) 1337 MBFP(BLOCK_16X16, aom_masked_sad16x16, aom_masked_sub_pixel_variance16x16) 1338 MBFP(BLOCK_16X8, aom_masked_sad16x8, aom_masked_sub_pixel_variance16x8) 1339 MBFP(BLOCK_8X16, aom_masked_sad8x16, aom_masked_sub_pixel_variance8x16) 1340 MBFP(BLOCK_8X8, aom_masked_sad8x8, aom_masked_sub_pixel_variance8x8) 1341 MBFP(BLOCK_4X8, aom_masked_sad4x8, aom_masked_sub_pixel_variance4x8) 1342 MBFP(BLOCK_8X4, aom_masked_sad8x4, aom_masked_sub_pixel_variance8x4) 1343 MBFP(BLOCK_4X4, aom_masked_sad4x4, aom_masked_sub_pixel_variance4x4) 1344 1345 #if !CONFIG_REALTIME_ONLY 1346 MBFP(BLOCK_4X16, aom_masked_sad4x16, aom_masked_sub_pixel_variance4x16) 1347 MBFP(BLOCK_16X4, aom_masked_sad16x4, aom_masked_sub_pixel_variance16x4) 1348 MBFP(BLOCK_8X32, aom_masked_sad8x32, aom_masked_sub_pixel_variance8x32) 1349 MBFP(BLOCK_32X8, aom_masked_sad32x8, aom_masked_sub_pixel_variance32x8) 1350 MBFP(BLOCK_16X64, aom_masked_sad16x64, aom_masked_sub_pixel_variance16x64) 1351 MBFP(BLOCK_64X16, aom_masked_sad64x16, aom_masked_sub_pixel_variance64x16) 1352 #endif 1353 1354 #define SDSFP(BT, SDSF, SDSX4DF) \ 1355 ppi->fn_ptr[BT].sdsf = SDSF; \ 1356 ppi->fn_ptr[BT].sdsx4df = SDSX4DF; 1357 1358 SDSFP(BLOCK_128X128, aom_sad_skip_128x128, aom_sad_skip_128x128x4d) 1359 SDSFP(BLOCK_128X64, aom_sad_skip_128x64, aom_sad_skip_128x64x4d) 1360 SDSFP(BLOCK_64X128, aom_sad_skip_64x128, aom_sad_skip_64x128x4d) 1361 SDSFP(BLOCK_64X64, aom_sad_skip_64x64, aom_sad_skip_64x64x4d) 1362 SDSFP(BLOCK_64X32, aom_sad_skip_64x32, aom_sad_skip_64x32x4d) 1363 1364 SDSFP(BLOCK_32X64, aom_sad_skip_32x64, aom_sad_skip_32x64x4d) 1365 SDSFP(BLOCK_32X32, aom_sad_skip_32x32, aom_sad_skip_32x32x4d) 1366 SDSFP(BLOCK_32X16, aom_sad_skip_32x16, aom_sad_skip_32x16x4d) 1367 1368 SDSFP(BLOCK_16X32, aom_sad_skip_16x32, aom_sad_skip_16x32x4d) 1369 SDSFP(BLOCK_16X16, aom_sad_skip_16x16, aom_sad_skip_16x16x4d) 1370 SDSFP(BLOCK_8X16, aom_sad_skip_8x16, aom_sad_skip_8x16x4d) 1371 1372 #if !CONFIG_REALTIME_ONLY 1373 SDSFP(BLOCK_64X16, aom_sad_skip_64x16, aom_sad_skip_64x16x4d) 1374 SDSFP(BLOCK_16X64, aom_sad_skip_16x64, aom_sad_skip_16x64x4d) 1375 SDSFP(BLOCK_8X32, aom_sad_skip_8x32, aom_sad_skip_8x32x4d) 1376 SDSFP(BLOCK_4X16, aom_sad_skip_4x16, aom_sad_skip_4x16x4d) 1377 #endif 1378 #undef SDSFP 1379 1380 #if CONFIG_AV1_HIGHBITDEPTH 1381 highbd_set_var_fns(ppi); 1382 #endif 1383 1384 { 1385 // As cm->mi_params is a part of the frame level context (cpi), it is 1386 // unavailable at this point. mi_params is created as a local temporary 1387 // variable, to be passed into the functions used for allocating tpl 1388 // buffers. The values in this variable are populated according to initial 1389 // width and height of the frame. 1390 CommonModeInfoParams mi_params; 1391 enc_set_mb_mi(&mi_params, oxcf->frm_dim_cfg.width, oxcf->frm_dim_cfg.height, 1392 BLOCK_4X4); 1393 1394 const BLOCK_SIZE bsize = BLOCK_16X16; 1395 const int w = mi_size_wide[bsize]; 1396 const int h = mi_size_high[bsize]; 1397 const int num_cols = (mi_params.mi_cols + w - 1) / w; 1398 const int num_rows = (mi_params.mi_rows + h - 1) / h; 1399 AOM_CHECK_MEM_ERROR( 1400 &ppi->error, ppi->tpl_sb_rdmult_scaling_factors, 1401 aom_calloc(num_rows * num_cols, 1402 sizeof(*ppi->tpl_sb_rdmult_scaling_factors))); 1403 1404 #if CONFIG_INTERNAL_STATS 1405 ppi->b_calculate_blockiness = 1; 1406 ppi->b_calculate_consistency = 1; 1407 1408 for (int i = 0; i <= STAT_ALL; i++) { 1409 ppi->psnr[0].stat[i] = 0; 1410 ppi->psnr[1].stat[i] = 0; 1411 1412 ppi->fastssim.stat[i] = 0; 1413 ppi->psnrhvs.stat[i] = 0; 1414 } 1415 1416 ppi->psnr[0].worst = 100.0; 1417 ppi->psnr[1].worst = 100.0; 1418 ppi->worst_ssim = 100.0; 1419 ppi->worst_ssim_hbd = 100.0; 1420 1421 ppi->count[0] = 0; 1422 ppi->count[1] = 0; 1423 ppi->total_bytes = 0; 1424 1425 if (ppi->b_calculate_psnr) { 1426 ppi->total_sq_error[0] = 0; 1427 ppi->total_samples[0] = 0; 1428 ppi->total_sq_error[1] = 0; 1429 ppi->total_samples[1] = 0; 1430 ppi->total_recode_hits = 0; 1431 ppi->summed_quality = 0; 1432 ppi->summed_weights = 0; 1433 ppi->summed_quality_hbd = 0; 1434 ppi->summed_weights_hbd = 0; 1435 } 1436 1437 ppi->fastssim.worst = 100.0; 1438 ppi->psnrhvs.worst = 100.0; 1439 1440 if (ppi->b_calculate_blockiness) { 1441 ppi->total_blockiness = 0; 1442 ppi->worst_blockiness = 0.0; 1443 } 1444 1445 ppi->total_inconsistency = 0; 1446 ppi->worst_consistency = 100.0; 1447 if (ppi->b_calculate_consistency) { 1448 AOM_CHECK_MEM_ERROR(&ppi->error, ppi->ssim_vars, 1449 aom_malloc(sizeof(*ppi->ssim_vars) * 4 * 1450 mi_params.mi_rows * mi_params.mi_cols)); 1451 } 1452 #endif 1453 } 1454 1455 ppi->error.setjmp = 0; 1456 return ppi; 1457 } 1458 1459 AV1_COMP *av1_create_compressor(AV1_PRIMARY *ppi, const AV1EncoderConfig *oxcf, 1460 BufferPool *const pool, COMPRESSOR_STAGE stage, 1461 int lap_lag_in_frames) { 1462 AV1_COMP *volatile const cpi = aom_memalign(32, sizeof(AV1_COMP)); 1463 1464 if (!cpi) return NULL; 1465 1466 av1_zero(*cpi); 1467 1468 cpi->ppi = ppi; 1469 1470 AV1_COMMON *volatile const cm = &cpi->common; 1471 cm->seq_params = &ppi->seq_params; 1472 cm->error = 1473 (struct aom_internal_error_info *)aom_calloc(1, sizeof(*cm->error)); 1474 if (!cm->error) { 1475 aom_free(cpi); 1476 return NULL; 1477 } 1478 1479 // The jmp_buf is valid only for the duration of the function that calls 1480 // setjmp(). Therefore, this function must reset the 'setjmp' field to 0 1481 // before it returns. 1482 if (setjmp(cm->error->jmp)) { 1483 cm->error->setjmp = 0; 1484 av1_remove_compressor(cpi); 1485 return NULL; 1486 } 1487 1488 cm->error->setjmp = 1; 1489 cpi->compressor_stage = stage; 1490 1491 cpi->do_frame_data_update = true; 1492 1493 CommonModeInfoParams *const mi_params = &cm->mi_params; 1494 mi_params->free_mi = enc_free_mi; 1495 mi_params->setup_mi = enc_setup_mi; 1496 mi_params->set_mb_mi = 1497 (oxcf->pass == AOM_RC_FIRST_PASS || cpi->compressor_stage == LAP_STAGE) 1498 ? stat_stage_set_mb_mi 1499 : enc_set_mb_mi; 1500 1501 mi_params->mi_alloc_bsize = BLOCK_4X4; 1502 1503 CHECK_MEM_ERROR(cm, cm->fc, 1504 (FRAME_CONTEXT *)aom_memalign(32, sizeof(*cm->fc))); 1505 CHECK_MEM_ERROR( 1506 cm, cm->default_frame_context, 1507 (FRAME_CONTEXT *)aom_memalign(32, sizeof(*cm->default_frame_context))); 1508 memset(cm->fc, 0, sizeof(*cm->fc)); 1509 memset(cm->default_frame_context, 0, sizeof(*cm->default_frame_context)); 1510 1511 cpi->common.buffer_pool = pool; 1512 1513 init_config(cpi, oxcf); 1514 if (cpi->compressor_stage == LAP_STAGE) { 1515 cpi->oxcf.gf_cfg.lag_in_frames = lap_lag_in_frames; 1516 } 1517 1518 av1_rc_init(&cpi->oxcf, &cpi->rc); 1519 1520 init_frame_info(&cpi->frame_info, cm); 1521 init_frame_index_set(&cpi->frame_index_set); 1522 1523 cm->current_frame.frame_number = 0; 1524 cpi->rc.frame_number_encoded = 0; 1525 cpi->rc.prev_frame_is_dropped = 0; 1526 cpi->rc.max_consec_drop = INT_MAX; 1527 cpi->rc.drop_count_consec = 0; 1528 cm->current_frame_id = -1; 1529 cpi->tile_data = NULL; 1530 cpi->last_show_frame_buf = NULL; 1531 realloc_segmentation_maps(cpi); 1532 1533 cpi->refresh_frame.alt_ref_frame = false; 1534 1535 #if CONFIG_SPEED_STATS 1536 cpi->tx_search_count = 0; 1537 #endif // CONFIG_SPEED_STATS 1538 1539 cpi->time_stamps.first_ts_start = INT64_MAX; 1540 1541 #ifdef OUTPUT_YUV_REC 1542 yuv_rec_file = fopen("rec.yuv", "wb"); 1543 #endif 1544 #ifdef OUTPUT_YUV_DENOISED 1545 yuv_denoised_file = fopen("denoised.yuv", "wb"); 1546 #endif 1547 1548 #if !CONFIG_REALTIME_ONLY 1549 if (is_stat_consumption_stage(cpi)) { 1550 const size_t packet_sz = sizeof(FIRSTPASS_STATS); 1551 const int packets = (int)(oxcf->twopass_stats_in.sz / packet_sz); 1552 1553 if (!cpi->ppi->lap_enabled) { 1554 /*Re-initialize to stats buffer, populated by application in the case of 1555 * two pass*/ 1556 cpi->ppi->twopass.stats_buf_ctx->stats_in_start = 1557 oxcf->twopass_stats_in.buf; 1558 cpi->twopass_frame.stats_in = 1559 cpi->ppi->twopass.stats_buf_ctx->stats_in_start; 1560 cpi->ppi->twopass.stats_buf_ctx->stats_in_end = 1561 &cpi->ppi->twopass.stats_buf_ctx->stats_in_start[packets - 1]; 1562 1563 // The buffer size is packets - 1 because the last packet is total_stats. 1564 av1_firstpass_info_init(&cpi->ppi->twopass.firstpass_info, 1565 oxcf->twopass_stats_in.buf, packets - 1); 1566 av1_init_second_pass(cpi); 1567 } else { 1568 av1_firstpass_info_init(&cpi->ppi->twopass.firstpass_info, NULL, 0); 1569 av1_init_single_pass_lap(cpi); 1570 } 1571 } 1572 #endif 1573 1574 // The buffer "obmc_buffer" is used in inter frames for fast obmc search. 1575 // Hence, the memory allocation for the same is avoided for allintra encoding 1576 // mode. 1577 if (cpi->oxcf.kf_cfg.key_freq_max != 0) 1578 alloc_obmc_buffers(&cpi->td.mb.obmc_buffer, cm->error); 1579 1580 for (int x = 0; x < 2; x++) { 1581 CHECK_MEM_ERROR( 1582 cm, cpi->td.mb.intrabc_hash_info.hash_value_buffer[x], 1583 (uint32_t *)aom_malloc( 1584 AOM_BUFFER_SIZE_FOR_BLOCK_HASH * 1585 sizeof(*cpi->td.mb.intrabc_hash_info.hash_value_buffer[x]))); 1586 } 1587 1588 cpi->td.mb.intrabc_hash_info.crc_initialized = 0; 1589 1590 av1_set_speed_features_framesize_independent(cpi, oxcf->speed); 1591 av1_set_speed_features_framesize_dependent(cpi, oxcf->speed); 1592 1593 int max_mi_cols = mi_params->mi_cols; 1594 int max_mi_rows = mi_params->mi_rows; 1595 if (oxcf->frm_dim_cfg.forced_max_frame_width) { 1596 max_mi_cols = size_in_mi(oxcf->frm_dim_cfg.forced_max_frame_width); 1597 } 1598 if (oxcf->frm_dim_cfg.forced_max_frame_height) { 1599 max_mi_rows = size_in_mi(oxcf->frm_dim_cfg.forced_max_frame_height); 1600 } 1601 1602 const int consec_zero_mv_alloc_size = (max_mi_rows * max_mi_cols) >> 2; 1603 CHECK_MEM_ERROR( 1604 cm, cpi->consec_zero_mv, 1605 aom_calloc(consec_zero_mv_alloc_size, sizeof(*cpi->consec_zero_mv))); 1606 cpi->consec_zero_mv_alloc_size = consec_zero_mv_alloc_size; 1607 1608 cpi->mb_weber_stats = NULL; 1609 cpi->mb_delta_q = NULL; 1610 cpi->palette_pixel_num = 0; 1611 cpi->scaled_last_source_available = 0; 1612 1613 { 1614 const BLOCK_SIZE bsize = BLOCK_16X16; 1615 const int w = mi_size_wide[bsize]; 1616 const int h = mi_size_high[bsize]; 1617 const int num_cols = (max_mi_cols + w - 1) / w; 1618 const int num_rows = (max_mi_rows + h - 1) / h; 1619 CHECK_MEM_ERROR(cm, cpi->ssim_rdmult_scaling_factors, 1620 aom_calloc(num_rows * num_cols, 1621 sizeof(*cpi->ssim_rdmult_scaling_factors))); 1622 CHECK_MEM_ERROR(cm, cpi->tpl_rdmult_scaling_factors, 1623 aom_calloc(num_rows * num_cols, 1624 sizeof(*cpi->tpl_rdmult_scaling_factors))); 1625 } 1626 1627 #if CONFIG_TUNE_VMAF 1628 { 1629 const BLOCK_SIZE bsize = BLOCK_64X64; 1630 const int w = mi_size_wide[bsize]; 1631 const int h = mi_size_high[bsize]; 1632 const int num_cols = (mi_params->mi_cols + w - 1) / w; 1633 const int num_rows = (mi_params->mi_rows + h - 1) / h; 1634 CHECK_MEM_ERROR(cm, cpi->vmaf_info.rdmult_scaling_factors, 1635 aom_calloc(num_rows * num_cols, 1636 sizeof(*cpi->vmaf_info.rdmult_scaling_factors))); 1637 for (int i = 0; i < MAX_ARF_LAYERS; i++) { 1638 cpi->vmaf_info.last_frame_unsharp_amount[i] = -1.0; 1639 cpi->vmaf_info.last_frame_ysse[i] = -1.0; 1640 cpi->vmaf_info.last_frame_vmaf[i] = -1.0; 1641 } 1642 cpi->vmaf_info.original_qindex = -1; 1643 cpi->vmaf_info.vmaf_model = NULL; 1644 } 1645 #endif 1646 1647 #if CONFIG_TUNE_BUTTERAUGLI 1648 { 1649 const int w = mi_size_wide[butteraugli_rdo_bsize]; 1650 const int h = mi_size_high[butteraugli_rdo_bsize]; 1651 const int num_cols = (mi_params->mi_cols + w - 1) / w; 1652 const int num_rows = (mi_params->mi_rows + h - 1) / h; 1653 CHECK_MEM_ERROR( 1654 cm, cpi->butteraugli_info.rdmult_scaling_factors, 1655 aom_malloc(num_rows * num_cols * 1656 sizeof(*cpi->butteraugli_info.rdmult_scaling_factors))); 1657 memset(&cpi->butteraugli_info.source, 0, 1658 sizeof(cpi->butteraugli_info.source)); 1659 memset(&cpi->butteraugli_info.resized_source, 0, 1660 sizeof(cpi->butteraugli_info.resized_source)); 1661 cpi->butteraugli_info.recon_set = false; 1662 } 1663 #endif 1664 1665 #if CONFIG_SALIENCY_MAP 1666 { 1667 CHECK_MEM_ERROR(cm, cpi->saliency_map, 1668 (uint8_t *)aom_calloc(cm->height * cm->width, 1669 sizeof(*cpi->saliency_map))); 1670 // Buffer initialization based on MIN_MIB_SIZE_LOG2 to ensure that 1671 // cpi->sm_scaling_factor buffer is allocated big enough, since we have no 1672 // idea of the actual superblock size we are going to use yet. 1673 const int min_mi_w_sb = (1 << MIN_MIB_SIZE_LOG2); 1674 const int min_mi_h_sb = (1 << MIN_MIB_SIZE_LOG2); 1675 const int max_sb_cols = 1676 (cm->mi_params.mi_cols + min_mi_w_sb - 1) / min_mi_w_sb; 1677 const int max_sb_rows = 1678 (cm->mi_params.mi_rows + min_mi_h_sb - 1) / min_mi_h_sb; 1679 CHECK_MEM_ERROR(cm, cpi->sm_scaling_factor, 1680 (double *)aom_calloc(max_sb_rows * max_sb_cols, 1681 sizeof(*cpi->sm_scaling_factor))); 1682 } 1683 #endif 1684 1685 #if CONFIG_COLLECT_PARTITION_STATS 1686 av1_zero(cpi->partition_stats); 1687 #endif // CONFIG_COLLECT_PARTITION_STATS 1688 1689 // Initialize the members of DeltaQuantParams with INT_MAX to ensure that 1690 // the quantizer tables are correctly initialized using the default deltaq 1691 // parameters when av1_init_quantizer is called for the first time. 1692 DeltaQuantParams *const prev_deltaq_params = 1693 &cpi->enc_quant_dequant_params.prev_deltaq_params; 1694 prev_deltaq_params->y_dc_delta_q = INT_MAX; 1695 prev_deltaq_params->u_dc_delta_q = INT_MAX; 1696 prev_deltaq_params->v_dc_delta_q = INT_MAX; 1697 prev_deltaq_params->u_ac_delta_q = INT_MAX; 1698 prev_deltaq_params->v_ac_delta_q = INT_MAX; 1699 1700 av1_init_quantizer(&cpi->enc_quant_dequant_params, &cm->quant_params, 1701 cm->seq_params->bit_depth, cpi->oxcf.algo_cfg.sharpness); 1702 av1_qm_init(&cm->quant_params, av1_num_planes(cm)); 1703 1704 av1_loop_filter_init(cm); 1705 cm->superres_scale_denominator = SCALE_NUMERATOR; 1706 cm->superres_upscaled_width = oxcf->frm_dim_cfg.width; 1707 cm->superres_upscaled_height = oxcf->frm_dim_cfg.height; 1708 #if !CONFIG_REALTIME_ONLY 1709 av1_loop_restoration_precal(); 1710 #endif 1711 1712 #if CONFIG_THREE_PASS 1713 cpi->third_pass_ctx = NULL; 1714 if (cpi->oxcf.pass == AOM_RC_THIRD_PASS) { 1715 av1_init_thirdpass_ctx(cm, &cpi->third_pass_ctx, NULL); 1716 } 1717 #endif 1718 1719 cpi->second_pass_log_stream = NULL; 1720 cpi->use_ducky_encode = 0; 1721 1722 cm->error->setjmp = 0; 1723 return cpi; 1724 } 1725 1726 #if CONFIG_INTERNAL_STATS 1727 #define SNPRINT(H, T) snprintf((H) + strlen(H), sizeof(H) - strlen(H), (T)) 1728 1729 #define SNPRINT2(H, T, V) \ 1730 snprintf((H) + strlen(H), sizeof(H) - strlen(H), (T), (V)) 1731 #endif // CONFIG_INTERNAL_STATS 1732 1733 void av1_remove_primary_compressor(AV1_PRIMARY *ppi) { 1734 if (!ppi) return; 1735 #if !CONFIG_REALTIME_ONLY 1736 av1_tf_info_free(&ppi->tf_info); 1737 #endif // !CONFIG_REALTIME_ONLY 1738 1739 for (int i = 0; i < MAX_NUM_OPERATING_POINTS; ++i) { 1740 aom_free(ppi->level_params.level_info[i]); 1741 } 1742 av1_lookahead_destroy(ppi->lookahead); 1743 1744 aom_free(ppi->tpl_sb_rdmult_scaling_factors); 1745 ppi->tpl_sb_rdmult_scaling_factors = NULL; 1746 1747 TplParams *const tpl_data = &ppi->tpl_data; 1748 aom_free(tpl_data->txfm_stats_list); 1749 1750 for (int frame = 0; frame < MAX_LAG_BUFFERS; ++frame) { 1751 aom_free(tpl_data->tpl_stats_pool[frame]); 1752 aom_free_frame_buffer(&tpl_data->tpl_rec_pool[frame]); 1753 tpl_data->tpl_stats_pool[frame] = NULL; 1754 } 1755 1756 #if !CONFIG_REALTIME_ONLY 1757 av1_tpl_dealloc(&tpl_data->tpl_mt_sync); 1758 #endif 1759 1760 av1_terminate_workers(ppi); 1761 free_thread_data(ppi); 1762 1763 aom_free(ppi->p_mt_info.tile_thr_data); 1764 ppi->p_mt_info.tile_thr_data = NULL; 1765 aom_free(ppi->p_mt_info.workers); 1766 ppi->p_mt_info.workers = NULL; 1767 ppi->p_mt_info.num_workers = 0; 1768 1769 aom_free(ppi); 1770 } 1771 1772 void av1_remove_compressor(AV1_COMP *cpi) { 1773 if (!cpi) return; 1774 #if CONFIG_RATECTRL_LOG 1775 if (cpi->oxcf.pass == 3) { 1776 rc_log_show(&cpi->rc_log); 1777 } 1778 #endif // CONFIG_RATECTRL_LOG 1779 1780 AV1_COMMON *cm = &cpi->common; 1781 if (cm->current_frame.frame_number > 0) { 1782 #if CONFIG_SPEED_STATS 1783 if (!is_stat_generation_stage(cpi)) { 1784 fprintf(stdout, "tx_search_count = %d\n", cpi->tx_search_count); 1785 } 1786 #endif // CONFIG_SPEED_STATS 1787 1788 #if CONFIG_COLLECT_PARTITION_STATS == 2 1789 if (!is_stat_generation_stage(cpi)) { 1790 av1_print_fr_partition_timing_stats(&cpi->partition_stats, 1791 "fr_part_timing_data.csv"); 1792 } 1793 #endif 1794 } 1795 1796 #if CONFIG_AV1_TEMPORAL_DENOISING 1797 av1_denoiser_free(&(cpi->denoiser)); 1798 #endif 1799 1800 if (cm->error) { 1801 // Help detect use after free of the error detail string. 1802 memset(cm->error->detail, 'A', sizeof(cm->error->detail) - 1); 1803 cm->error->detail[sizeof(cm->error->detail) - 1] = '\0'; 1804 aom_free(cm->error); 1805 } 1806 aom_free(cpi->td.tctx); 1807 MultiThreadInfo *const mt_info = &cpi->mt_info; 1808 #if CONFIG_MULTITHREAD 1809 pthread_mutex_t *const enc_row_mt_mutex_ = mt_info->enc_row_mt.mutex_; 1810 pthread_cond_t *const enc_row_mt_cond_ = mt_info->enc_row_mt.cond_; 1811 pthread_mutex_t *const gm_mt_mutex_ = mt_info->gm_sync.mutex_; 1812 pthread_mutex_t *const tpl_error_mutex_ = mt_info->tpl_row_mt.mutex_; 1813 pthread_mutex_t *const pack_bs_mt_mutex_ = mt_info->pack_bs_sync.mutex_; 1814 if (enc_row_mt_mutex_ != NULL) { 1815 pthread_mutex_destroy(enc_row_mt_mutex_); 1816 aom_free(enc_row_mt_mutex_); 1817 } 1818 if (enc_row_mt_cond_ != NULL) { 1819 pthread_cond_destroy(enc_row_mt_cond_); 1820 aom_free(enc_row_mt_cond_); 1821 } 1822 if (gm_mt_mutex_ != NULL) { 1823 pthread_mutex_destroy(gm_mt_mutex_); 1824 aom_free(gm_mt_mutex_); 1825 } 1826 if (tpl_error_mutex_ != NULL) { 1827 pthread_mutex_destroy(tpl_error_mutex_); 1828 aom_free(tpl_error_mutex_); 1829 } 1830 if (pack_bs_mt_mutex_ != NULL) { 1831 pthread_mutex_destroy(pack_bs_mt_mutex_); 1832 aom_free(pack_bs_mt_mutex_); 1833 } 1834 #endif 1835 av1_row_mt_mem_dealloc(cpi); 1836 1837 if (mt_info->num_workers > 1) { 1838 av1_row_mt_sync_mem_dealloc(&cpi->ppi->intra_row_mt_sync); 1839 av1_loop_filter_dealloc(&mt_info->lf_row_sync); 1840 av1_cdef_mt_dealloc(&mt_info->cdef_sync); 1841 #if !CONFIG_REALTIME_ONLY 1842 av1_loop_restoration_dealloc(&mt_info->lr_row_sync); 1843 av1_tf_mt_dealloc(&mt_info->tf_sync); 1844 #endif 1845 } 1846 1847 #if CONFIG_THREE_PASS 1848 av1_free_thirdpass_ctx(cpi->third_pass_ctx); 1849 1850 av1_close_second_pass_log(cpi); 1851 #endif 1852 1853 dealloc_compressor_data(cpi); 1854 1855 av1_ext_part_delete(&cpi->ext_part_controller); 1856 1857 av1_remove_common(cm); 1858 1859 aom_free(cpi); 1860 1861 #ifdef OUTPUT_YUV_REC 1862 fclose(yuv_rec_file); 1863 #endif 1864 1865 #ifdef OUTPUT_YUV_DENOISED 1866 fclose(yuv_denoised_file); 1867 #endif 1868 } 1869 1870 static void generate_psnr_packet(AV1_COMP *cpi) { 1871 struct aom_codec_cx_pkt pkt; 1872 int i; 1873 PSNR_STATS psnr; 1874 #if CONFIG_AV1_HIGHBITDEPTH 1875 const uint32_t in_bit_depth = cpi->oxcf.input_cfg.input_bit_depth; 1876 const uint32_t bit_depth = cpi->td.mb.e_mbd.bd; 1877 aom_calc_highbd_psnr(cpi->source, &cpi->common.cur_frame->buf, &psnr, 1878 bit_depth, in_bit_depth); 1879 #else 1880 aom_calc_psnr(cpi->source, &cpi->common.cur_frame->buf, &psnr); 1881 #endif 1882 1883 for (i = 0; i < 4; ++i) { 1884 pkt.data.psnr.samples[i] = psnr.samples[i]; 1885 pkt.data.psnr.sse[i] = psnr.sse[i]; 1886 pkt.data.psnr.psnr[i] = psnr.psnr[i]; 1887 } 1888 1889 #if CONFIG_AV1_HIGHBITDEPTH 1890 if ((cpi->source->flags & YV12_FLAG_HIGHBITDEPTH) && 1891 (in_bit_depth < bit_depth)) { 1892 for (i = 0; i < 4; ++i) { 1893 pkt.data.psnr.samples_hbd[i] = psnr.samples_hbd[i]; 1894 pkt.data.psnr.sse_hbd[i] = psnr.sse_hbd[i]; 1895 pkt.data.psnr.psnr_hbd[i] = psnr.psnr_hbd[i]; 1896 } 1897 } 1898 #endif 1899 1900 pkt.kind = AOM_CODEC_PSNR_PKT; 1901 aom_codec_pkt_list_add(cpi->ppi->output_pkt_list, &pkt); 1902 } 1903 1904 int av1_use_as_reference(int *ext_ref_frame_flags, int ref_frame_flags) { 1905 if (ref_frame_flags > ((1 << INTER_REFS_PER_FRAME) - 1)) return -1; 1906 1907 *ext_ref_frame_flags = ref_frame_flags; 1908 return 0; 1909 } 1910 1911 int av1_copy_reference_enc(AV1_COMP *cpi, int idx, YV12_BUFFER_CONFIG *sd) { 1912 AV1_COMMON *const cm = &cpi->common; 1913 const int num_planes = av1_num_planes(cm); 1914 YV12_BUFFER_CONFIG *cfg = get_ref_frame(cm, idx); 1915 if (cfg) { 1916 aom_yv12_copy_frame(cfg, sd, num_planes); 1917 return 0; 1918 } else { 1919 return -1; 1920 } 1921 } 1922 1923 int av1_set_reference_enc(AV1_COMP *cpi, int idx, YV12_BUFFER_CONFIG *sd) { 1924 AV1_COMMON *const cm = &cpi->common; 1925 const int num_planes = av1_num_planes(cm); 1926 YV12_BUFFER_CONFIG *cfg = get_ref_frame(cm, idx); 1927 if (cfg) { 1928 aom_yv12_copy_frame(sd, cfg, num_planes); 1929 return 0; 1930 } else { 1931 return -1; 1932 } 1933 } 1934 1935 #ifdef OUTPUT_YUV_REC 1936 static void aom_write_one_yuv_frame(AV1_COMMON *cm, YV12_BUFFER_CONFIG *s) { 1937 uint8_t *src = s->y_buffer; 1938 int h = cm->height; 1939 if (yuv_rec_file == NULL) return; 1940 if (s->flags & YV12_FLAG_HIGHBITDEPTH) { 1941 uint16_t *src16 = CONVERT_TO_SHORTPTR(s->y_buffer); 1942 1943 do { 1944 fwrite(src16, s->y_width, 2, yuv_rec_file); 1945 src16 += s->y_stride; 1946 } while (--h); 1947 1948 src16 = CONVERT_TO_SHORTPTR(s->u_buffer); 1949 h = s->uv_height; 1950 1951 do { 1952 fwrite(src16, s->uv_width, 2, yuv_rec_file); 1953 src16 += s->uv_stride; 1954 } while (--h); 1955 1956 src16 = CONVERT_TO_SHORTPTR(s->v_buffer); 1957 h = s->uv_height; 1958 1959 do { 1960 fwrite(src16, s->uv_width, 2, yuv_rec_file); 1961 src16 += s->uv_stride; 1962 } while (--h); 1963 1964 fflush(yuv_rec_file); 1965 return; 1966 } 1967 1968 do { 1969 fwrite(src, s->y_width, 1, yuv_rec_file); 1970 src += s->y_stride; 1971 } while (--h); 1972 1973 src = s->u_buffer; 1974 h = s->uv_height; 1975 1976 do { 1977 fwrite(src, s->uv_width, 1, yuv_rec_file); 1978 src += s->uv_stride; 1979 } while (--h); 1980 1981 src = s->v_buffer; 1982 h = s->uv_height; 1983 1984 do { 1985 fwrite(src, s->uv_width, 1, yuv_rec_file); 1986 src += s->uv_stride; 1987 } while (--h); 1988 1989 fflush(yuv_rec_file); 1990 } 1991 #endif // OUTPUT_YUV_REC 1992 1993 void av1_set_mv_search_params(AV1_COMP *cpi) { 1994 const AV1_COMMON *const cm = &cpi->common; 1995 MotionVectorSearchParams *const mv_search_params = &cpi->mv_search_params; 1996 const int max_mv_def = AOMMAX(cm->width, cm->height); 1997 1998 // Default based on max resolution. 1999 mv_search_params->mv_step_param = av1_init_search_range(max_mv_def); 2000 2001 if (cpi->sf.mv_sf.auto_mv_step_size) { 2002 if (frame_is_intra_only(cm)) { 2003 // Initialize max_mv_magnitude for use in the first INTER frame 2004 // after a key/intra-only frame. 2005 mv_search_params->max_mv_magnitude = max_mv_def; 2006 } else { 2007 // Use adaptive mv steps based on previous frame stats for show frames and 2008 // internal arfs. 2009 FRAME_UPDATE_TYPE cur_update_type = 2010 cpi->ppi->gf_group.update_type[cpi->gf_frame_index]; 2011 int use_auto_mv_step = 2012 (cm->show_frame || cur_update_type == INTNL_ARF_UPDATE) && 2013 mv_search_params->max_mv_magnitude != -1 && 2014 cpi->sf.mv_sf.auto_mv_step_size >= 2; 2015 if (use_auto_mv_step) { 2016 // Allow mv_steps to correspond to twice the max mv magnitude found 2017 // in the previous frame, capped by the default max_mv_magnitude based 2018 // on resolution. 2019 mv_search_params->mv_step_param = av1_init_search_range( 2020 AOMMIN(max_mv_def, 2 * mv_search_params->max_mv_magnitude)); 2021 } 2022 // Reset max_mv_magnitude based on update flag. 2023 if (cpi->do_frame_data_update) mv_search_params->max_mv_magnitude = -1; 2024 } 2025 } 2026 } 2027 2028 // Estimate if the source frame is screen content, based on the portion of 2029 // blocks that have few luma colors. 2030 static void estimate_screen_content(AV1_COMP *cpi, FeatureFlags *features) { 2031 const AV1_COMMON *const cm = &cpi->common; 2032 const MACROBLOCKD *const xd = &cpi->td.mb.e_mbd; 2033 const uint8_t *src = cpi->unfiltered_source->y_buffer; 2034 assert(src != NULL); 2035 const int use_hbd = cpi->unfiltered_source->flags & YV12_FLAG_HIGHBITDEPTH; 2036 const int stride = cpi->unfiltered_source->y_stride; 2037 const int width = cpi->unfiltered_source->y_width; 2038 const int height = cpi->unfiltered_source->y_height; 2039 const int64_t area = (int64_t)width * height; 2040 const int bd = cm->seq_params->bit_depth; 2041 const int kBlockWidth = 16; 2042 const int kBlockHeight = 16; 2043 const int kBlockArea = kBlockWidth * kBlockHeight; 2044 // These threshold values are selected experimentally. 2045 const int kColorThresh = 4; 2046 const unsigned int kVarThresh = 0; 2047 // Counts of blocks with no more than kColorThresh colors. 2048 int64_t counts_1 = 0; 2049 // Counts of blocks with no more than kColorThresh colors and variance larger 2050 // than kVarThresh. 2051 int64_t counts_2 = 0; 2052 2053 for (int r = 0; r + kBlockHeight <= height; r += kBlockHeight) { 2054 for (int c = 0; c + kBlockWidth <= width; c += kBlockWidth) { 2055 int count_buf[1 << 8]; // Maximum (1 << 8) bins for hbd path. 2056 const uint8_t *const this_src = src + r * stride + c; 2057 int n_colors; 2058 if (use_hbd) { 2059 av1_count_colors_highbd(this_src, stride, /*rows=*/kBlockHeight, 2060 /*cols=*/kBlockWidth, bd, NULL, count_buf, 2061 &n_colors, NULL); 2062 } else { 2063 av1_count_colors(this_src, stride, /*rows=*/kBlockHeight, 2064 /*cols=*/kBlockWidth, count_buf, &n_colors); 2065 } 2066 if (n_colors > 1 && n_colors <= kColorThresh) { 2067 ++counts_1; 2068 struct buf_2d buf; 2069 buf.stride = stride; 2070 buf.buf = (uint8_t *)this_src; 2071 const unsigned int var = av1_get_perpixel_variance( 2072 cpi, xd, &buf, BLOCK_16X16, AOM_PLANE_Y, use_hbd); 2073 if (var > kVarThresh) ++counts_2; 2074 } 2075 } 2076 } 2077 2078 // The threshold values are selected experimentally. 2079 features->allow_screen_content_tools = counts_1 * kBlockArea * 10 > area; 2080 // IntraBC would force loop filters off, so we use more strict rules that also 2081 // requires that the block has high variance. 2082 features->allow_intrabc = 2083 features->allow_screen_content_tools && counts_2 * kBlockArea * 12 > area; 2084 cpi->use_screen_content_tools = features->allow_screen_content_tools; 2085 cpi->is_screen_content_type = 2086 features->allow_intrabc || (counts_1 * kBlockArea * 10 > area * 4 && 2087 counts_2 * kBlockArea * 30 > area); 2088 } 2089 2090 // Macro that helps debug the screen content mode 2 mechanism 2091 // #define OUTPUT_SCR_DET_MODE2_STATS 2092 2093 /*!\brief Helper function that finds the dominant value of a block. 2094 * 2095 * This function builds a histogram of all 256 possible (8 bit) values, and 2096 * returns with the value with the greatest count (i.e. the dominant value). 2097 */ 2098 uint8_t av1_find_dominant_value(const uint8_t *src, int stride, int rows, 2099 int cols) { 2100 uint32_t value_count[1 << 8] = { 0 }; // Maximum (1 << 8) value levels. 2101 uint32_t dominant_value_count = 0; 2102 uint8_t dominant_value = 0; 2103 2104 for (int r = 0; r < rows; ++r) { 2105 for (int c = 0; c < cols; ++c) { 2106 const uint8_t value = src[r * (ptrdiff_t)stride + c]; 2107 2108 value_count[value]++; 2109 2110 if (value_count[value] > dominant_value_count) { 2111 dominant_value = value; 2112 dominant_value_count = value_count[value]; 2113 } 2114 } 2115 } 2116 2117 return dominant_value; 2118 } 2119 2120 /*!\brief Helper function that performs one round of image dilation on a block. 2121 * 2122 * This function finds the dominant value (i.e. the value that appears most 2123 * often within a block), then performs a round of dilation by "extending" all 2124 * occurrences of the dominant value outwards in all 8 directions (4 sides + 4 2125 * corners). 2126 * 2127 * For a visual example, let: 2128 * - D: the dominant value 2129 * - [a-p]: different non-dominant values (usually anti-aliased pixels) 2130 * - .: the most common non-dominant value 2131 * 2132 * Before dilation: After dilation: 2133 * . . a b D c d . . . . D D D D D . . 2134 * . e f D D D g h . D D D D D D D D D 2135 * . D D D D D D D . D D D D D D D D D 2136 * . D D D D D D D . D D D D D D D D D 2137 * . i j D D D k l . D D D D D D D D D 2138 * . . m n D o p . . . . D D D D D . . 2139 */ 2140 void av1_dilate_block(const uint8_t *src, int src_stride, uint8_t *dilated, 2141 int dilated_stride, int rows, int cols) { 2142 uint8_t dominant_value = av1_find_dominant_value(src, src_stride, rows, cols); 2143 2144 for (int r = 0; r < rows; ++r) { 2145 for (int c = 0; c < cols; ++c) { 2146 const uint8_t value = src[r * (ptrdiff_t)src_stride + c]; 2147 2148 dilated[r * (ptrdiff_t)dilated_stride + c] = value; 2149 } 2150 } 2151 2152 for (int r = 0; r < rows; ++r) { 2153 for (int c = 0; c < cols; ++c) { 2154 const uint8_t value = src[r * (ptrdiff_t)src_stride + c]; 2155 2156 if (value == dominant_value) { 2157 // Dilate up 2158 if (r != 0) { 2159 dilated[(r - 1) * (ptrdiff_t)dilated_stride + c] = value; 2160 } 2161 // Dilate down 2162 if (r != rows - 1) { 2163 dilated[(r + 1) * (ptrdiff_t)dilated_stride + c] = value; 2164 } 2165 // Dilate left 2166 if (c != 0) { 2167 dilated[r * (ptrdiff_t)dilated_stride + (c - 1)] = value; 2168 } 2169 // Dilate right 2170 if (c != cols - 1) { 2171 dilated[r * (ptrdiff_t)dilated_stride + (c + 1)] = value; 2172 } 2173 // Dilate upper-left corner 2174 if (r != 0 && c != 0) { 2175 dilated[(r - 1) * (ptrdiff_t)dilated_stride + (c - 1)] = value; 2176 } 2177 // Dilate upper-right corner 2178 if (r != 0 && c != cols - 1) { 2179 dilated[(r - 1) * (ptrdiff_t)dilated_stride + (c + 1)] = value; 2180 } 2181 // Dilate lower-left corner 2182 if (r != rows - 1 && c != 0) { 2183 dilated[(r + 1) * (ptrdiff_t)dilated_stride + (c - 1)] = value; 2184 } 2185 // Dilate lower-right corner 2186 if (r != rows - 1 && c != cols - 1) { 2187 dilated[(r + 1) * (ptrdiff_t)dilated_stride + (c + 1)] = value; 2188 } 2189 } 2190 } 2191 } 2192 } 2193 2194 /*!\brief Estimates if the source frame is a candidate to enable palette mode 2195 * and intra block copy, with an accurate detection of anti-aliased text and 2196 * graphics. 2197 * 2198 * Screen content detection is done by dividing frame's luma plane (Y) into 2199 * small blocks, counting how many unique colors each block contains and 2200 * their per-pixel variance, and classifying these blocks into three main 2201 * categories: 2202 * 1. Palettizable blocks, low variance (can use palette mode) 2203 * 2. Palettizable blocks, high variance (can use palette mode and IntraBC) 2204 * 3. Non palettizable, photo-like blocks (can neither use palette mode nor 2205 * IntraBC) 2206 * Finally, this function decides whether the frame could benefit from 2207 * enabling palette mode with or without IntraBC, based on the ratio of the 2208 * three categories mentioned above. 2209 */ 2210 static void estimate_screen_content_antialiasing_aware(AV1_COMP *cpi, 2211 FeatureFlags *features) { 2212 enum { 2213 kBlockWidth = 16, 2214 kBlockHeight = 16, 2215 kBlockArea = kBlockWidth * kBlockHeight 2216 }; 2217 2218 const bool fast_detection = 2219 cpi->sf.hl_sf.screen_detection_mode2_fast_detection; 2220 const AV1_COMMON *const cm = &cpi->common; 2221 const MACROBLOCKD *const xd = &cpi->td.mb.e_mbd; 2222 const uint8_t *src = cpi->unfiltered_source->y_buffer; 2223 assert(src != NULL); 2224 const int use_hbd = cpi->unfiltered_source->flags & YV12_FLAG_HIGHBITDEPTH; 2225 const int stride = cpi->unfiltered_source->y_stride; 2226 const int width = cpi->unfiltered_source->y_width; 2227 const int height = cpi->unfiltered_source->y_height; 2228 const int64_t area = (int64_t)width * height; 2229 const int bd = cm->seq_params->bit_depth; 2230 // Holds the down-converted block to 8 bit (if source is HBD) 2231 uint8_t downconv_blk[kBlockArea]; 2232 // Holds the block after a round of dilation 2233 uint8_t dilated_blk[kBlockArea]; 2234 2235 // These threshold values are selected experimentally 2236 // Detects text and glyphs without anti-aliasing, and graphics with a 4-color 2237 // palette 2238 const int kSimpleColorThresh = 4; 2239 // Detects potential text and glyphs with anti-aliasing, and graphics with a 2240 // more extended color palette 2241 const int kComplexInitialColorThresh = 40; 2242 // Detects text and glyphs with anti-aliasing, and graphics with a more 2243 // extended color palette 2244 const int kComplexFinalColorThresh = 6; 2245 // Threshold used to classify low-variance and high-variance blocks 2246 const int kVarThresh = 5; 2247 // Count of blocks that are candidates for using palette mode 2248 int64_t count_palette = 0; 2249 // Count of blocks that are candidates for using IntraBC 2250 int64_t count_intrabc = 0; 2251 // Count of "photo-like" blocks (i.e. can't use palette mode or IntraBC) 2252 int64_t count_photo = 0; 2253 2254 #ifdef OUTPUT_SCR_DET_MODE2_STATS 2255 FILE *stats_file; 2256 stats_file = fopen("scrdetm2.stt", "a"); 2257 2258 fprintf(stats_file, "\n"); 2259 fprintf(stats_file, "Screen detection mode 2 image map legend\n"); 2260 if (fast_detection) { 2261 fprintf(stats_file, "Fast detection enabled\n"); 2262 } 2263 fprintf(stats_file, 2264 "-------------------------------------------------------\n"); 2265 fprintf(stats_file, 2266 "S: simple block, high var C: complex block, high var\n"); 2267 fprintf(stats_file, 2268 "-: simple block, low var =: complex block, low var \n"); 2269 fprintf(stats_file, 2270 "x: photo-like block .: non-palettizable block \n"); 2271 fprintf(stats_file, 2272 "(whitespace): solid block \n"); 2273 fprintf(stats_file, 2274 "-------------------------------------------------------\n"); 2275 #endif 2276 2277 // Skip every other block and weigh each block twice as much when performing 2278 // fast detection 2279 const int multiplier = fast_detection ? 2 : 1; 2280 2281 for (int r = 0; r + kBlockHeight <= height; r += kBlockHeight) { 2282 // Alternate skipping in a "checkerboard" pattern when performing fast 2283 // detection 2284 const int initial_col = 2285 (fast_detection && (r / kBlockHeight) % 2) ? kBlockWidth : 0; 2286 2287 for (int c = initial_col; c + kBlockWidth <= width; 2288 c += kBlockWidth * multiplier) { 2289 const uint8_t *blk_src = src + r * (ptrdiff_t)stride + c; 2290 const uint8_t *blk = blk_src; 2291 int blk_stride = stride; 2292 2293 // Down-convert pixels to 8-bit domain if source is HBD 2294 if (use_hbd) { 2295 const uint16_t *blk_src_hbd = CONVERT_TO_SHORTPTR(blk_src); 2296 2297 for (int blk_r = 0; blk_r < kBlockHeight; ++blk_r) { 2298 for (int blk_c = 0; blk_c < kBlockWidth; ++blk_c) { 2299 const int downconv_val = 2300 (blk_src_hbd[blk_r * (ptrdiff_t)stride + blk_c]) >> (bd - 8); 2301 2302 // Ensure down-converted value is 8-bit 2303 assert(downconv_val < (1 << 8)); 2304 downconv_blk[blk_r * (ptrdiff_t)kBlockWidth + blk_c] = downconv_val; 2305 } 2306 } 2307 2308 // Switch block source and stride to down-converted buffer and its width 2309 blk = downconv_blk; 2310 blk_stride = kBlockWidth; 2311 } 2312 2313 // First, find if the block could be palettized 2314 int number_of_colors; 2315 bool under_threshold = av1_count_colors_with_threshold( 2316 blk, blk_stride, /*rows=*/kBlockHeight, 2317 /*cols=*/kBlockWidth, kComplexInitialColorThresh, &number_of_colors); 2318 if (number_of_colors > 1 && under_threshold) { 2319 struct buf_2d buf; 2320 buf.stride = stride; 2321 buf.buf = (uint8_t *)blk_src; 2322 2323 if (number_of_colors <= kSimpleColorThresh) { 2324 // Simple block detected, add to block count with no further 2325 // processing required 2326 ++count_palette; 2327 // Variance always comes from the source image with no down-conversion 2328 int var = av1_get_perpixel_variance(cpi, xd, &buf, BLOCK_16X16, 2329 AOM_PLANE_Y, use_hbd); 2330 2331 if (var > kVarThresh) { 2332 ++count_intrabc; 2333 #ifdef OUTPUT_SCR_DET_MODE2_STATS 2334 fprintf(stats_file, "S"); 2335 } else { 2336 fprintf(stats_file, "-"); 2337 #endif 2338 } 2339 } else { 2340 // Complex block detected, try to find if it's palettizable 2341 // Dilate block with dominant color, to exclude anti-aliased pixels 2342 // from final palette count 2343 av1_dilate_block(blk, blk_stride, dilated_blk, kBlockWidth, 2344 /*rows=*/kBlockHeight, /*cols=*/kBlockWidth); 2345 under_threshold = av1_count_colors_with_threshold( 2346 dilated_blk, kBlockWidth, /*rows=*/kBlockHeight, 2347 /*cols=*/kBlockWidth, kComplexFinalColorThresh, 2348 &number_of_colors); 2349 2350 if (under_threshold) { 2351 // Variance always comes from the source image with no 2352 // down-conversion 2353 int var = av1_get_perpixel_variance(cpi, xd, &buf, BLOCK_16X16, 2354 AOM_PLANE_Y, use_hbd); 2355 2356 if (var > kVarThresh) { 2357 ++count_palette; 2358 ++count_intrabc; 2359 #ifdef OUTPUT_SCR_DET_MODE2_STATS 2360 fprintf(stats_file, "C"); 2361 } else { 2362 fprintf(stats_file, "="); 2363 #endif 2364 } 2365 #ifdef OUTPUT_SCR_DET_MODE2_STATS 2366 } else { 2367 fprintf(stats_file, "."); 2368 #endif 2369 } 2370 } 2371 } else { 2372 if (number_of_colors > kComplexInitialColorThresh) { 2373 ++count_photo; 2374 #ifdef OUTPUT_SCR_DET_MODE2_STATS 2375 fprintf(stats_file, "x"); 2376 } else { 2377 fprintf(stats_file, " "); // Solid block (1 color) 2378 #endif 2379 } 2380 } 2381 } 2382 #ifdef OUTPUT_SCR_DET_MODE2_STATS 2383 fprintf(stats_file, "\n"); 2384 #endif 2385 } 2386 2387 // Normalize counts to account for the blocks that were skipped 2388 if (fast_detection) { 2389 count_photo *= multiplier; 2390 count_palette *= multiplier; 2391 count_intrabc *= multiplier; 2392 } 2393 2394 // The threshold values are selected experimentally. 2395 // Penalize presence of photo-like blocks (1/16th the weight of a palettizable 2396 // block) 2397 features->allow_screen_content_tools = 2398 ((count_palette - count_photo / 16) * kBlockArea * 10 > area); 2399 2400 // IntraBC would force loop filters off, so we use more strict rules that also 2401 // requires that the block has high variance. 2402 // Penalize presence of photo-like blocks (1/16th the weight of a palettizable 2403 // block) 2404 features->allow_intrabc = 2405 features->allow_screen_content_tools && 2406 ((count_intrabc - count_photo / 16) * kBlockArea * 12 > area); 2407 cpi->use_screen_content_tools = features->allow_screen_content_tools; 2408 cpi->is_screen_content_type = 2409 features->allow_intrabc || (count_palette * kBlockArea * 15 > area * 4 && 2410 count_intrabc * kBlockArea * 30 > area); 2411 2412 #ifdef OUTPUT_SCR_DET_MODE2_STATS 2413 fprintf(stats_file, 2414 "block count palette: %" PRId64 ", count intrabc: %" PRId64 2415 ", count photo: %" PRId64 ", total: %d\n", 2416 count_palette, count_intrabc, count_photo, 2417 (int)(ceil(width / kBlockWidth) * ceil(height / kBlockHeight))); 2418 fprintf(stats_file, "sc palette value: %" PRId64 ", threshold %" PRId64 "\n", 2419 (count_palette - count_photo / 16) * kBlockArea * 10, area); 2420 fprintf(stats_file, "sc ibc value: %" PRId64 ", threshold %" PRId64 "\n", 2421 (count_intrabc - count_photo / 16) * kBlockArea * 12, area); 2422 fprintf(stats_file, "allow sct: %d, allow ibc: %d\n", 2423 features->allow_screen_content_tools, features->allow_intrabc); 2424 #endif 2425 } 2426 2427 void av1_set_screen_content_options(AV1_COMP *cpi, FeatureFlags *features) { 2428 const AV1_COMMON *const cm = &cpi->common; 2429 2430 if (cm->seq_params->force_screen_content_tools != 2) { 2431 features->allow_screen_content_tools = features->allow_intrabc = 2432 cm->seq_params->force_screen_content_tools; 2433 return; 2434 } 2435 2436 if (cpi->oxcf.tune_cfg.content == AOM_CONTENT_SCREEN) { 2437 features->allow_screen_content_tools = 1; 2438 features->allow_intrabc = cpi->oxcf.mode == REALTIME ? 0 : 1; 2439 cpi->is_screen_content_type = 1; 2440 cpi->use_screen_content_tools = 1; 2441 return; 2442 } 2443 2444 if (cpi->oxcf.mode == REALTIME) { 2445 features->allow_screen_content_tools = features->allow_intrabc = 0; 2446 return; 2447 } 2448 2449 // Screen content tools are not evaluated in non-RD encoding mode unless 2450 // content type is not set explicitly, i.e., when 2451 // cpi->oxcf.tune_cfg.content != AOM_CONTENT_SCREEN, use_nonrd_pick_mode = 1 2452 // and hybrid_intra_pickmode = 0. Hence, screen content detection is 2453 // disabled. 2454 if (cpi->sf.rt_sf.use_nonrd_pick_mode && 2455 !cpi->sf.rt_sf.hybrid_intra_pickmode) { 2456 features->allow_screen_content_tools = features->allow_intrabc = 0; 2457 return; 2458 } 2459 2460 if (cpi->oxcf.algo_cfg.screen_detection_mode == 2461 AOM_SCREEN_DETECTION_ANTIALIASING_AWARE) { 2462 estimate_screen_content_antialiasing_aware(cpi, features); 2463 } else { 2464 estimate_screen_content(cpi, features); 2465 } 2466 } 2467 2468 static void init_motion_estimation(AV1_COMP *cpi) { 2469 AV1_COMMON *const cm = &cpi->common; 2470 MotionVectorSearchParams *const mv_search_params = &cpi->mv_search_params; 2471 const int aligned_width = (cm->width + 7) & ~7; 2472 const int y_stride = 2473 aom_calc_y_stride(aligned_width, cpi->oxcf.border_in_pixels); 2474 const int y_stride_src = ((cpi->oxcf.frm_dim_cfg.width != cm->width || 2475 cpi->oxcf.frm_dim_cfg.height != cm->height) || 2476 av1_superres_scaled(cm)) 2477 ? y_stride 2478 : cpi->ppi->lookahead->buf->img.y_stride; 2479 int fpf_y_stride = 2480 cm->cur_frame != NULL ? cm->cur_frame->buf.y_stride : y_stride; 2481 2482 // Update if search_site_cfg is uninitialized or the current frame has a new 2483 // stride 2484 const int should_update = 2485 !mv_search_params->search_site_cfg[SS_CFG_SRC][DIAMOND].stride || 2486 !mv_search_params->search_site_cfg[SS_CFG_LOOKAHEAD][DIAMOND].stride || 2487 (y_stride != 2488 mv_search_params->search_site_cfg[SS_CFG_SRC][DIAMOND].stride); 2489 2490 if (!should_update) { 2491 return; 2492 } 2493 2494 // Initialization of search_site_cfg for NUM_DISTINCT_SEARCH_METHODS. 2495 for (SEARCH_METHODS i = DIAMOND; i < NUM_DISTINCT_SEARCH_METHODS; i++) { 2496 const int level = ((i == NSTEP_8PT) || (i == CLAMPED_DIAMOND)) ? 1 : 0; 2497 av1_init_motion_compensation[i]( 2498 &mv_search_params->search_site_cfg[SS_CFG_SRC][i], y_stride, level); 2499 av1_init_motion_compensation[i]( 2500 &mv_search_params->search_site_cfg[SS_CFG_LOOKAHEAD][i], y_stride_src, 2501 level); 2502 } 2503 2504 // First pass search site config initialization. 2505 av1_init_motion_fpf(&mv_search_params->search_site_cfg[SS_CFG_FPF][DIAMOND], 2506 fpf_y_stride); 2507 for (SEARCH_METHODS i = NSTEP; i < NUM_DISTINCT_SEARCH_METHODS; i++) { 2508 memcpy(&mv_search_params->search_site_cfg[SS_CFG_FPF][i], 2509 &mv_search_params->search_site_cfg[SS_CFG_FPF][DIAMOND], 2510 sizeof(search_site_config)); 2511 } 2512 } 2513 2514 static void init_ref_frame_bufs(AV1_COMP *cpi) { 2515 AV1_COMMON *const cm = &cpi->common; 2516 int i; 2517 if (cm->cur_frame) { 2518 cm->cur_frame->ref_count--; 2519 cm->cur_frame = NULL; 2520 } 2521 for (i = 0; i < REF_FRAMES; ++i) { 2522 if (cm->ref_frame_map[i]) { 2523 cm->ref_frame_map[i]->ref_count--; 2524 cm->ref_frame_map[i] = NULL; 2525 } 2526 } 2527 #ifndef NDEBUG 2528 BufferPool *const pool = cm->buffer_pool; 2529 for (i = 0; i < pool->num_frame_bufs; ++i) { 2530 assert(pool->frame_bufs[i].ref_count == 0); 2531 } 2532 #endif 2533 } 2534 2535 // TODO(chengchen): consider renaming this function as it is necessary 2536 // for the encoder to setup critical parameters, and it does not 2537 // deal with initial width any longer. 2538 aom_codec_err_t av1_check_initial_width(AV1_COMP *cpi, int use_highbitdepth, 2539 int subsampling_x, int subsampling_y) { 2540 AV1_COMMON *const cm = &cpi->common; 2541 SequenceHeader *const seq_params = cm->seq_params; 2542 2543 if (!cpi->frame_size_related_setup_done || 2544 seq_params->use_highbitdepth != use_highbitdepth || 2545 seq_params->subsampling_x != subsampling_x || 2546 seq_params->subsampling_y != subsampling_y) { 2547 seq_params->subsampling_x = subsampling_x; 2548 seq_params->subsampling_y = subsampling_y; 2549 seq_params->use_highbitdepth = use_highbitdepth; 2550 2551 av1_set_speed_features_framesize_independent(cpi, cpi->oxcf.speed); 2552 av1_set_speed_features_framesize_dependent(cpi, cpi->oxcf.speed); 2553 2554 if (!is_stat_generation_stage(cpi)) { 2555 #if !CONFIG_REALTIME_ONLY 2556 if (!av1_tf_info_alloc(&cpi->ppi->tf_info, cpi)) 2557 return AOM_CODEC_MEM_ERROR; 2558 #endif // !CONFIG_REALTIME_ONLY 2559 } 2560 init_ref_frame_bufs(cpi); 2561 2562 init_motion_estimation(cpi); // TODO(agrange) This can be removed. 2563 2564 cpi->initial_mbs = cm->mi_params.MBs; 2565 cpi->frame_size_related_setup_done = true; 2566 } 2567 return AOM_CODEC_OK; 2568 } 2569 2570 #if CONFIG_AV1_TEMPORAL_DENOISING 2571 static void setup_denoiser_buffer(AV1_COMP *cpi) { 2572 AV1_COMMON *const cm = &cpi->common; 2573 if (cpi->oxcf.noise_sensitivity > 0 && 2574 !cpi->denoiser.frame_buffer_initialized) { 2575 if (av1_denoiser_alloc( 2576 cm, &cpi->svc, &cpi->denoiser, cpi->ppi->use_svc, 2577 cpi->oxcf.noise_sensitivity, cm->width, cm->height, 2578 cm->seq_params->subsampling_x, cm->seq_params->subsampling_y, 2579 cm->seq_params->use_highbitdepth, AOM_BORDER_IN_PIXELS)) 2580 aom_internal_error(cm->error, AOM_CODEC_MEM_ERROR, 2581 "Failed to allocate denoiser"); 2582 } 2583 } 2584 #endif 2585 2586 // Returns 1 if the assigned width or height was <= 0. 2587 static int set_size_literal(AV1_COMP *cpi, int width, int height) { 2588 AV1_COMMON *cm = &cpi->common; 2589 aom_codec_err_t err = av1_check_initial_width( 2590 cpi, cm->seq_params->use_highbitdepth, cm->seq_params->subsampling_x, 2591 cm->seq_params->subsampling_y); 2592 if (err != AOM_CODEC_OK) { 2593 aom_internal_error(cm->error, err, "av1_check_initial_width() failed"); 2594 } 2595 2596 if (width <= 0 || height <= 0) return 1; 2597 2598 cm->width = width; 2599 cm->height = height; 2600 2601 #if CONFIG_AV1_TEMPORAL_DENOISING 2602 setup_denoiser_buffer(cpi); 2603 #endif 2604 2605 if (cm->width > cpi->data_alloc_width || 2606 cm->height > cpi->data_alloc_height) { 2607 av1_free_context_buffers(cm); 2608 av1_free_shared_coeff_buffer(&cpi->td.shared_coeff_buf); 2609 av1_free_sms_tree(&cpi->td); 2610 av1_free_pmc(cpi->td.firstpass_ctx, av1_num_planes(cm)); 2611 cpi->td.firstpass_ctx = NULL; 2612 alloc_compressor_data(cpi); 2613 realloc_segmentation_maps(cpi); 2614 cpi->data_alloc_width = cm->width; 2615 cpi->data_alloc_height = cm->height; 2616 cpi->frame_size_related_setup_done = false; 2617 } 2618 alloc_mb_mode_info_buffers(cpi); 2619 av1_update_frame_size(cpi); 2620 2621 return 0; 2622 } 2623 2624 void av1_set_frame_size(AV1_COMP *cpi, int width, int height) { 2625 AV1_COMMON *const cm = &cpi->common; 2626 const SequenceHeader *const seq_params = cm->seq_params; 2627 const int num_planes = av1_num_planes(cm); 2628 MACROBLOCKD *const xd = &cpi->td.mb.e_mbd; 2629 int ref_frame; 2630 2631 if (width != cm->width || height != cm->height) { 2632 // There has been a change in the encoded frame size 2633 set_size_literal(cpi, width, height); 2634 // Recalculate 'all_lossless' in case super-resolution was (un)selected. 2635 cm->features.all_lossless = 2636 cm->features.coded_lossless && !av1_superres_scaled(cm); 2637 2638 av1_noise_estimate_init(&cpi->noise_estimate, cm->width, cm->height); 2639 #if CONFIG_AV1_TEMPORAL_DENOISING 2640 // Reset the denoiser on the resized frame. 2641 if (cpi->oxcf.noise_sensitivity > 0) { 2642 av1_denoiser_free(&(cpi->denoiser)); 2643 setup_denoiser_buffer(cpi); 2644 } 2645 #endif 2646 } 2647 if (is_stat_consumption_stage(cpi)) { 2648 av1_set_target_rate(cpi, cm->width, cm->height); 2649 } 2650 2651 alloc_frame_mvs(cm, cm->cur_frame); 2652 2653 // Allocate above context buffers 2654 CommonContexts *const above_contexts = &cm->above_contexts; 2655 if (above_contexts->num_planes < av1_num_planes(cm) || 2656 above_contexts->num_mi_cols < cm->mi_params.mi_cols || 2657 above_contexts->num_tile_rows < cm->tiles.rows) { 2658 av1_free_above_context_buffers(above_contexts); 2659 if (av1_alloc_above_context_buffers(above_contexts, cm->tiles.rows, 2660 cm->mi_params.mi_cols, 2661 av1_num_planes(cm))) 2662 aom_internal_error(cm->error, AOM_CODEC_MEM_ERROR, 2663 "Failed to allocate context buffers"); 2664 } 2665 2666 AV1EncoderConfig *oxcf = &cpi->oxcf; 2667 oxcf->border_in_pixels = av1_get_enc_border_size( 2668 av1_is_resize_needed(oxcf), oxcf->kf_cfg.key_freq_max == 0, 2669 cm->seq_params->sb_size); 2670 2671 // Reset the frame pointers to the current frame size. 2672 if (aom_realloc_frame_buffer( 2673 &cm->cur_frame->buf, cm->width, cm->height, seq_params->subsampling_x, 2674 seq_params->subsampling_y, seq_params->use_highbitdepth, 2675 cpi->oxcf.border_in_pixels, cm->features.byte_alignment, NULL, NULL, 2676 NULL, cpi->alloc_pyramid, 0)) 2677 aom_internal_error(cm->error, AOM_CODEC_MEM_ERROR, 2678 "Failed to allocate frame buffer"); 2679 2680 if (!is_stat_generation_stage(cpi)) av1_init_cdef_worker(cpi); 2681 2682 #if !CONFIG_REALTIME_ONLY 2683 if (is_restoration_used(cm)) { 2684 for (int i = 0; i < num_planes; ++i) 2685 cm->rst_info[i].frame_restoration_type = RESTORE_NONE; 2686 2687 const bool is_sgr_enabled = !cpi->sf.lpf_sf.disable_sgr_filter; 2688 av1_alloc_restoration_buffers(cm, is_sgr_enabled); 2689 // Store the allocated restoration buffers in MT object. 2690 if (cpi->ppi->p_mt_info.num_workers > 1) { 2691 av1_init_lr_mt_buffers(cpi); 2692 } 2693 } 2694 #endif 2695 2696 init_motion_estimation(cpi); 2697 2698 int has_valid_ref_frame = 0; 2699 for (ref_frame = LAST_FRAME; ref_frame <= ALTREF_FRAME; ++ref_frame) { 2700 RefCntBuffer *const buf = get_ref_frame_buf(cm, ref_frame); 2701 if (buf != NULL) { 2702 struct scale_factors *sf = get_ref_scale_factors(cm, ref_frame); 2703 av1_setup_scale_factors_for_frame(sf, buf->buf.y_crop_width, 2704 buf->buf.y_crop_height, cm->width, 2705 cm->height); 2706 has_valid_ref_frame |= av1_is_valid_scale(sf); 2707 if (av1_is_scaled(sf)) aom_extend_frame_borders(&buf->buf, num_planes); 2708 } 2709 } 2710 // For 1 pass CBR mode: we can skip this check for spatial enhancement 2711 // layer if the target_bandwidth is zero, since it will be dropped. 2712 const bool dropped_frame = 2713 has_no_stats_stage(cpi) && cpi->oxcf.rc_cfg.mode == AOM_CBR && 2714 cpi->svc.spatial_layer_id > 0 && cpi->oxcf.rc_cfg.target_bandwidth == 0; 2715 if (!frame_is_intra_only(cm) && !has_valid_ref_frame && !dropped_frame) { 2716 aom_internal_error( 2717 cm->error, AOM_CODEC_CORRUPT_FRAME, 2718 "Can't find at least one reference frame with valid size"); 2719 } 2720 2721 av1_setup_scale_factors_for_frame(&cm->sf_identity, cm->width, cm->height, 2722 cm->width, cm->height); 2723 2724 set_ref_ptrs(cm, xd, LAST_FRAME, LAST_FRAME); 2725 } 2726 2727 static inline int extend_borders_mt(const AV1_COMP *cpi, 2728 MULTI_THREADED_MODULES stage, int plane) { 2729 const AV1_COMMON *const cm = &cpi->common; 2730 if (cpi->mt_info.num_mod_workers[stage] < 2) return 0; 2731 switch (stage) { 2732 // TODO(deepa.kg@ittiam.com): When cdef and loop-restoration are disabled, 2733 // multi-thread frame border extension along with loop filter frame. 2734 // As loop-filtering of a superblock row modifies the pixels of the 2735 // above superblock row, border extension requires that loop filtering 2736 // of the current and above superblock row is complete. 2737 case MOD_LPF: return 0; 2738 case MOD_CDEF: 2739 return is_cdef_used(cm) && !cpi->ppi->rtc_ref.non_reference_frame && 2740 !is_restoration_used(cm) && !av1_superres_scaled(cm); 2741 case MOD_LR: 2742 return is_restoration_used(cm) && 2743 (cm->rst_info[plane].frame_restoration_type != RESTORE_NONE); 2744 default: assert(0); 2745 } 2746 return 0; 2747 } 2748 2749 /*!\brief Select and apply cdef filters and switchable restoration filters 2750 * 2751 * \ingroup high_level_algo 2752 */ 2753 static void cdef_restoration_frame(AV1_COMP *cpi, AV1_COMMON *cm, 2754 MACROBLOCKD *xd, int use_restoration, 2755 int use_cdef, 2756 unsigned int skip_apply_postproc_filters) { 2757 #if !CONFIG_REALTIME_ONLY 2758 if (use_restoration) 2759 av1_loop_restoration_save_boundary_lines(&cm->cur_frame->buf, cm, 0); 2760 #else 2761 (void)use_restoration; 2762 #endif 2763 2764 if (use_cdef) { 2765 #if CONFIG_COLLECT_COMPONENT_TIMING 2766 start_timing(cpi, cdef_time); 2767 #endif 2768 const int num_workers = cpi->mt_info.num_mod_workers[MOD_CDEF]; 2769 // Find CDEF parameters 2770 av1_cdef_search(cpi); 2771 2772 // Apply the filter 2773 if ((skip_apply_postproc_filters & SKIP_APPLY_CDEF) == 0) { 2774 assert(!cpi->ppi->rtc_ref.non_reference_frame); 2775 if (num_workers > 1) { 2776 // Extension of frame borders is multi-threaded along with cdef. 2777 const int do_extend_border = 2778 extend_borders_mt(cpi, MOD_CDEF, /* plane */ 0); 2779 av1_cdef_frame_mt(cm, xd, cpi->mt_info.cdef_worker, 2780 cpi->mt_info.workers, &cpi->mt_info.cdef_sync, 2781 num_workers, av1_cdef_init_fb_row_mt, 2782 do_extend_border); 2783 } else { 2784 av1_cdef_frame(&cm->cur_frame->buf, cm, xd, av1_cdef_init_fb_row); 2785 } 2786 } 2787 #if CONFIG_COLLECT_COMPONENT_TIMING 2788 end_timing(cpi, cdef_time); 2789 #endif 2790 } 2791 2792 const int use_superres = av1_superres_scaled(cm); 2793 if (use_superres) { 2794 if ((skip_apply_postproc_filters & SKIP_APPLY_SUPERRES) == 0) { 2795 av1_superres_post_encode(cpi); 2796 } 2797 } 2798 2799 #if !CONFIG_REALTIME_ONLY 2800 #if CONFIG_COLLECT_COMPONENT_TIMING 2801 start_timing(cpi, loop_restoration_time); 2802 #endif 2803 if (use_restoration) { 2804 MultiThreadInfo *const mt_info = &cpi->mt_info; 2805 const int num_workers = mt_info->num_mod_workers[MOD_LR]; 2806 av1_loop_restoration_save_boundary_lines(&cm->cur_frame->buf, cm, 1); 2807 av1_pick_filter_restoration(cpi->source, cpi); 2808 if ((skip_apply_postproc_filters & SKIP_APPLY_RESTORATION) == 0 && 2809 (cm->rst_info[0].frame_restoration_type != RESTORE_NONE || 2810 cm->rst_info[1].frame_restoration_type != RESTORE_NONE || 2811 cm->rst_info[2].frame_restoration_type != RESTORE_NONE)) { 2812 if (num_workers > 1) { 2813 // Extension of frame borders is multi-threaded along with loop 2814 // restoration filter. 2815 const int do_extend_border = 1; 2816 av1_loop_restoration_filter_frame_mt( 2817 &cm->cur_frame->buf, cm, 0, mt_info->workers, num_workers, 2818 &mt_info->lr_row_sync, &cpi->lr_ctxt, do_extend_border); 2819 } else { 2820 av1_loop_restoration_filter_frame(&cm->cur_frame->buf, cm, 0, 2821 &cpi->lr_ctxt); 2822 } 2823 } 2824 } 2825 #if CONFIG_COLLECT_COMPONENT_TIMING 2826 end_timing(cpi, loop_restoration_time); 2827 #endif 2828 #endif // !CONFIG_REALTIME_ONLY 2829 } 2830 2831 static void extend_frame_borders(AV1_COMP *cpi) { 2832 const AV1_COMMON *const cm = &cpi->common; 2833 // TODO(debargha): Fix mv search range on encoder side 2834 for (int plane = 0; plane < av1_num_planes(cm); ++plane) { 2835 const bool extend_border_done = extend_borders_mt(cpi, MOD_CDEF, plane) || 2836 extend_borders_mt(cpi, MOD_LR, plane); 2837 if (!extend_border_done) { 2838 const YV12_BUFFER_CONFIG *const ybf = &cm->cur_frame->buf; 2839 aom_extend_frame_borders_plane_row(ybf, plane, 0, 2840 ybf->crop_heights[plane > 0]); 2841 } 2842 } 2843 } 2844 2845 /*!\brief Select and apply deblocking filters, cdef filters, and restoration 2846 * filters. 2847 * 2848 * \ingroup high_level_algo 2849 */ 2850 static void loopfilter_frame(AV1_COMP *cpi, AV1_COMMON *cm) { 2851 MultiThreadInfo *const mt_info = &cpi->mt_info; 2852 const int num_workers = mt_info->num_mod_workers[MOD_LPF]; 2853 const int num_planes = av1_num_planes(cm); 2854 MACROBLOCKD *xd = &cpi->td.mb.e_mbd; 2855 cpi->td.mb.rdmult = cpi->rd.RDMULT; 2856 2857 assert(IMPLIES(is_lossless_requested(&cpi->oxcf.rc_cfg), 2858 cm->features.coded_lossless && cm->features.all_lossless)); 2859 2860 const int use_loopfilter = 2861 is_loopfilter_used(cm) && !cpi->mt_info.pipeline_lpf_mt_with_enc; 2862 const int use_cdef = is_cdef_used(cm); 2863 const int use_superres = av1_superres_scaled(cm); 2864 const int use_restoration = is_restoration_used(cm); 2865 2866 const unsigned int skip_apply_postproc_filters = 2867 derive_skip_apply_postproc_filters(cpi, use_loopfilter, use_cdef, 2868 use_superres, use_restoration); 2869 2870 #if CONFIG_COLLECT_COMPONENT_TIMING 2871 start_timing(cpi, loop_filter_time); 2872 #endif 2873 if (use_loopfilter) { 2874 av1_pick_filter_level(cpi->source, cpi, cpi->sf.lpf_sf.lpf_pick); 2875 struct loopfilter *lf = &cm->lf; 2876 if ((lf->filter_level[0] || lf->filter_level[1]) && 2877 (skip_apply_postproc_filters & SKIP_APPLY_LOOPFILTER) == 0) { 2878 assert(!cpi->ppi->rtc_ref.non_reference_frame); 2879 // lpf_opt_level = 1 : Enables dual/quad loop-filtering. 2880 // lpf_opt_level is set to 1 if transform size search depth in inter 2881 // blocks is limited to one as quad loop filtering assumes that all the 2882 // transform blocks within a 16x8/8x16/16x16 prediction block are of the 2883 // same size. lpf_opt_level = 2 : Filters both chroma planes together, in 2884 // addition to enabling dual/quad loop-filtering. This is enabled when lpf 2885 // pick method is LPF_PICK_FROM_Q as u and v plane filter levels are 2886 // equal. 2887 int lpf_opt_level = get_lpf_opt_level(&cpi->sf); 2888 av1_loop_filter_frame_mt(&cm->cur_frame->buf, cm, xd, 0, num_planes, 0, 2889 mt_info->workers, num_workers, 2890 &mt_info->lf_row_sync, lpf_opt_level); 2891 } 2892 } 2893 2894 #if CONFIG_COLLECT_COMPONENT_TIMING 2895 end_timing(cpi, loop_filter_time); 2896 #endif 2897 2898 cdef_restoration_frame(cpi, cm, xd, use_restoration, use_cdef, 2899 skip_apply_postproc_filters); 2900 } 2901 2902 static void update_motion_stat(AV1_COMP *const cpi) { 2903 AV1_COMMON *const cm = &cpi->common; 2904 const CommonModeInfoParams *const mi_params = &cm->mi_params; 2905 RATE_CONTROL *const rc = &cpi->rc; 2906 SVC *const svc = &cpi->svc; 2907 const int avg_cnt_zeromv = 2908 100 * cpi->rc.cnt_zeromv / (mi_params->mi_rows * mi_params->mi_cols); 2909 if (!cpi->ppi->use_svc || 2910 (cpi->ppi->use_svc && 2911 !cpi->svc.layer_context[cpi->svc.temporal_layer_id].is_key_frame && 2912 cpi->svc.spatial_layer_id == cpi->svc.number_spatial_layers - 1)) { 2913 rc->avg_frame_low_motion = 2914 (rc->avg_frame_low_motion == 0) 2915 ? avg_cnt_zeromv 2916 : (3 * rc->avg_frame_low_motion + avg_cnt_zeromv) / 4; 2917 // For SVC: set avg_frame_low_motion (only computed on top spatial layer) 2918 // to all lower spatial layers. 2919 if (cpi->ppi->use_svc && 2920 svc->spatial_layer_id == svc->number_spatial_layers - 1) { 2921 for (int i = 0; i < svc->number_spatial_layers - 1; ++i) { 2922 const int layer = LAYER_IDS_TO_IDX(i, svc->temporal_layer_id, 2923 svc->number_temporal_layers); 2924 LAYER_CONTEXT *const lc = &svc->layer_context[layer]; 2925 RATE_CONTROL *const lrc = &lc->rc; 2926 lrc->avg_frame_low_motion = rc->avg_frame_low_motion; 2927 } 2928 } 2929 } 2930 } 2931 2932 /*!\brief Encode a frame without the recode loop, usually used in one-pass 2933 * encoding and realtime coding. 2934 * 2935 * \ingroup high_level_algo 2936 * 2937 * \param[in] cpi Top-level encoder structure 2938 * 2939 * \return Returns a value to indicate if the encoding is done successfully. 2940 * \retval #AOM_CODEC_OK 2941 * \retval #AOM_CODEC_ERROR 2942 */ 2943 static int encode_without_recode(AV1_COMP *cpi) { 2944 AV1_COMMON *const cm = &cpi->common; 2945 const QuantizationCfg *const q_cfg = &cpi->oxcf.q_cfg; 2946 SVC *const svc = &cpi->svc; 2947 const int resize_pending = is_frame_resize_pending(cpi); 2948 int top_index = 0, bottom_index = 0, q = 0; 2949 YV12_BUFFER_CONFIG *unscaled = cpi->unscaled_source; 2950 InterpFilter filter_scaler = 2951 cpi->ppi->use_svc ? svc->downsample_filter_type[svc->spatial_layer_id] 2952 : EIGHTTAP_SMOOTH; 2953 int phase_scaler = cpi->ppi->use_svc 2954 ? svc->downsample_filter_phase[svc->spatial_layer_id] 2955 : 0; 2956 2957 if (cpi->rc.postencode_drop && allow_postencode_drop_rtc(cpi)) 2958 av1_save_all_coding_context(cpi); 2959 2960 set_size_independent_vars(cpi); 2961 av1_setup_frame_size(cpi); 2962 cm->prev_frame = get_primary_ref_frame_buf(cm); 2963 av1_set_size_dependent_vars(cpi, &q, &bottom_index, &top_index); 2964 av1_set_mv_search_params(cpi); 2965 2966 if (cm->current_frame.frame_number == 0 && 2967 (cpi->ppi->use_svc || cpi->oxcf.rc_cfg.drop_frames_water_mark > 0) && 2968 cpi->svc.temporal_layer_id == 0) { 2969 const SequenceHeader *seq_params = cm->seq_params; 2970 if (aom_alloc_frame_buffer( 2971 &cpi->svc.source_last_TL0, cpi->oxcf.frm_dim_cfg.width, 2972 cpi->oxcf.frm_dim_cfg.height, seq_params->subsampling_x, 2973 seq_params->subsampling_y, seq_params->use_highbitdepth, 2974 cpi->oxcf.border_in_pixels, cm->features.byte_alignment, false, 2975 0)) { 2976 aom_internal_error(cm->error, AOM_CODEC_MEM_ERROR, 2977 "Failed to allocate buffer for source_last_TL0"); 2978 } 2979 } 2980 2981 if (!cpi->ppi->use_svc) { 2982 phase_scaler = 8; 2983 // 2:1 scaling. 2984 if ((cm->width << 1) == unscaled->y_crop_width && 2985 (cm->height << 1) == unscaled->y_crop_height) { 2986 filter_scaler = BILINEAR; 2987 // For lower resolutions use eighttap_smooth. 2988 if (cm->width * cm->height <= 320 * 180) filter_scaler = EIGHTTAP_SMOOTH; 2989 } else if ((cm->width << 2) == unscaled->y_crop_width && 2990 (cm->height << 2) == unscaled->y_crop_height) { 2991 // 4:1 scaling. 2992 filter_scaler = EIGHTTAP_SMOOTH; 2993 } else if ((cm->width << 2) == 3 * unscaled->y_crop_width && 2994 (cm->height << 2) == 3 * unscaled->y_crop_height) { 2995 // 4:3 scaling. 2996 filter_scaler = EIGHTTAP_REGULAR; 2997 } 2998 } 2999 3000 allocate_gradient_info_for_hog(cpi); 3001 3002 allocate_src_var_of_4x4_sub_block_buf(cpi); 3003 3004 const SPEED_FEATURES *sf = &cpi->sf; 3005 if (sf->part_sf.partition_search_type == VAR_BASED_PARTITION) 3006 variance_partition_alloc(cpi); 3007 3008 if (cm->current_frame.frame_type == KEY_FRAME || 3009 ((sf->inter_sf.extra_prune_warped && cpi->refresh_frame.golden_frame))) 3010 copy_frame_prob_info(cpi); 3011 3012 #if CONFIG_COLLECT_COMPONENT_TIMING 3013 printf("\n Encoding a frame: \n"); 3014 #endif 3015 3016 #if CONFIG_TUNE_BUTTERAUGLI 3017 if (cpi->oxcf.tune_cfg.tuning == AOM_TUNE_BUTTERAUGLI) { 3018 av1_setup_butteraugli_rdmult(cpi); 3019 } 3020 #endif 3021 3022 cpi->source = av1_realloc_and_scale_if_required( 3023 cm, unscaled, &cpi->scaled_source, filter_scaler, phase_scaler, true, 3024 false, cpi->oxcf.border_in_pixels, cpi->alloc_pyramid); 3025 if (frame_is_intra_only(cm) || resize_pending != 0) { 3026 const int current_size = 3027 (cm->mi_params.mi_rows * cm->mi_params.mi_cols) >> 2; 3028 if (cpi->consec_zero_mv && 3029 (cpi->consec_zero_mv_alloc_size < current_size)) { 3030 aom_free(cpi->consec_zero_mv); 3031 cpi->consec_zero_mv_alloc_size = 0; 3032 CHECK_MEM_ERROR(cm, cpi->consec_zero_mv, 3033 aom_malloc(current_size * sizeof(*cpi->consec_zero_mv))); 3034 cpi->consec_zero_mv_alloc_size = current_size; 3035 } 3036 assert(cpi->consec_zero_mv != NULL); 3037 memset(cpi->consec_zero_mv, 0, current_size * sizeof(*cpi->consec_zero_mv)); 3038 } 3039 3040 if (cpi->scaled_last_source_available) { 3041 cpi->last_source = &cpi->scaled_last_source; 3042 cpi->scaled_last_source_available = 0; 3043 } else if (cpi->unscaled_last_source != NULL) { 3044 cpi->last_source = av1_realloc_and_scale_if_required( 3045 cm, cpi->unscaled_last_source, &cpi->scaled_last_source, filter_scaler, 3046 phase_scaler, true, false, cpi->oxcf.border_in_pixels, 3047 cpi->alloc_pyramid); 3048 } 3049 3050 if (cpi->sf.rt_sf.use_temporal_noise_estimate) { 3051 av1_update_noise_estimate(cpi); 3052 } 3053 3054 #if CONFIG_AV1_TEMPORAL_DENOISING 3055 if (cpi->oxcf.noise_sensitivity > 0 && cpi->ppi->use_svc) 3056 av1_denoiser_reset_on_first_frame(cpi); 3057 #endif 3058 3059 // For 1 spatial layer encoding: if the (non-LAST) reference has different 3060 // resolution from the source then disable that reference. This is to avoid 3061 // significant increase in encode time from scaling the references in 3062 // av1_scale_references. Note GOLDEN is forced to update on the (first/tigger) 3063 // resized frame and ALTREF will be refreshed ~4 frames later, so both 3064 // references become available again after few frames. 3065 // For superres: don't disable golden reference. 3066 if (svc->number_spatial_layers == 1) { 3067 if (!cpi->oxcf.superres_cfg.enable_superres) { 3068 if (cpi->ref_frame_flags & av1_ref_frame_flag_list[GOLDEN_FRAME]) { 3069 const YV12_BUFFER_CONFIG *const ref = 3070 get_ref_frame_yv12_buf(cm, GOLDEN_FRAME); 3071 if (ref == NULL || ref->y_crop_width != cm->width || 3072 ref->y_crop_height != cm->height) { 3073 cpi->ref_frame_flags ^= AOM_GOLD_FLAG; 3074 } 3075 } 3076 } 3077 if (cpi->ref_frame_flags & av1_ref_frame_flag_list[ALTREF_FRAME]) { 3078 const YV12_BUFFER_CONFIG *const ref = 3079 get_ref_frame_yv12_buf(cm, ALTREF_FRAME); 3080 if (ref == NULL || ref->y_crop_width != cm->width || 3081 ref->y_crop_height != cm->height) { 3082 cpi->ref_frame_flags ^= AOM_ALT_FLAG; 3083 } 3084 } 3085 } 3086 3087 int scale_references = 0; 3088 #if CONFIG_FPMT_TEST 3089 scale_references = 3090 cpi->ppi->fpmt_unit_test_cfg == PARALLEL_SIMULATION_ENCODE ? 1 : 0; 3091 #endif // CONFIG_FPMT_TEST 3092 if (scale_references || 3093 cpi->ppi->gf_group.frame_parallel_level[cpi->gf_frame_index] == 0) { 3094 if (!frame_is_intra_only(cm)) { 3095 av1_scale_references(cpi, filter_scaler, phase_scaler, 1); 3096 } 3097 } 3098 3099 av1_set_quantizer(cm, q_cfg->qm_minlevel, q_cfg->qm_maxlevel, q, 3100 q_cfg->enable_chroma_deltaq, q_cfg->enable_hdr_deltaq, 3101 cpi->oxcf.mode == ALLINTRA, cpi->oxcf.tune_cfg.tuning); 3102 av1_set_speed_features_qindex_dependent(cpi, cpi->oxcf.speed); 3103 av1_init_quantizer(&cpi->enc_quant_dequant_params, &cm->quant_params, 3104 cm->seq_params->bit_depth, cpi->oxcf.algo_cfg.sharpness); 3105 av1_set_variance_partition_thresholds(cpi, q, 0); 3106 av1_setup_frame(cpi); 3107 3108 // Check if this high_source_sad (scene/slide change) frame should be 3109 // encoded at high/max QP, and if so, set the q and adjust some rate 3110 // control parameters. 3111 if (cpi->sf.rt_sf.overshoot_detection_cbr == FAST_DETECTION_MAXQ && 3112 cpi->rc.high_source_sad) { 3113 if (av1_encodedframe_overshoot_cbr(cpi, &q)) { 3114 av1_set_quantizer(cm, q_cfg->qm_minlevel, q_cfg->qm_maxlevel, q, 3115 q_cfg->enable_chroma_deltaq, q_cfg->enable_hdr_deltaq, 3116 cpi->oxcf.mode == ALLINTRA, cpi->oxcf.tune_cfg.tuning); 3117 av1_set_speed_features_qindex_dependent(cpi, cpi->oxcf.speed); 3118 av1_init_quantizer(&cpi->enc_quant_dequant_params, &cm->quant_params, 3119 cm->seq_params->bit_depth, 3120 cpi->oxcf.algo_cfg.sharpness); 3121 av1_set_variance_partition_thresholds(cpi, q, 0); 3122 if (frame_is_intra_only(cm) || cm->features.error_resilient_mode || 3123 cm->features.primary_ref_frame == PRIMARY_REF_NONE) 3124 av1_setup_frame(cpi); 3125 } 3126 } 3127 av1_apply_active_map(cpi); 3128 if (cpi->roi.enabled) { 3129 // For now if roi map is used: don't setup cyclic refresh. 3130 av1_apply_roi_map(cpi); 3131 } else if (q_cfg->aq_mode == CYCLIC_REFRESH_AQ) { 3132 av1_cyclic_refresh_setup(cpi); 3133 } 3134 if (cm->seg.enabled) { 3135 if (!cm->seg.update_data && cm->prev_frame) { 3136 segfeatures_copy(&cm->seg, &cm->prev_frame->seg); 3137 cm->seg.enabled = cm->prev_frame->seg.enabled; 3138 } else { 3139 av1_calculate_segdata(&cm->seg); 3140 } 3141 } else { 3142 memset(&cm->seg, 0, sizeof(cm->seg)); 3143 } 3144 segfeatures_copy(&cm->cur_frame->seg, &cm->seg); 3145 cm->cur_frame->seg.enabled = cm->seg.enabled; 3146 3147 // This is for rtc temporal filtering case. 3148 if (is_psnr_calc_enabled(cpi) && cpi->sf.rt_sf.use_rtc_tf) { 3149 const SequenceHeader *seq_params = cm->seq_params; 3150 3151 if (cpi->orig_source.buffer_alloc_sz == 0 || 3152 cpi->rc.prev_coded_width != cpi->oxcf.frm_dim_cfg.width || 3153 cpi->rc.prev_coded_height != cpi->oxcf.frm_dim_cfg.height) { 3154 // Allocate a source buffer to store the true source for psnr calculation. 3155 if (aom_alloc_frame_buffer( 3156 &cpi->orig_source, cpi->oxcf.frm_dim_cfg.width, 3157 cpi->oxcf.frm_dim_cfg.height, seq_params->subsampling_x, 3158 seq_params->subsampling_y, seq_params->use_highbitdepth, 3159 cpi->oxcf.border_in_pixels, cm->features.byte_alignment, false, 3160 0)) 3161 aom_internal_error(cm->error, AOM_CODEC_MEM_ERROR, 3162 "Failed to allocate scaled buffer"); 3163 } 3164 3165 aom_yv12_copy_y(cpi->source, &cpi->orig_source, 1); 3166 aom_yv12_copy_u(cpi->source, &cpi->orig_source, 1); 3167 aom_yv12_copy_v(cpi->source, &cpi->orig_source, 1); 3168 } 3169 3170 #if CONFIG_COLLECT_COMPONENT_TIMING 3171 start_timing(cpi, av1_encode_frame_time); 3172 #endif 3173 3174 // Set the motion vector precision based on mv stats from the last coded 3175 // frame. 3176 if (!frame_is_intra_only(cm)) av1_pick_and_set_high_precision_mv(cpi, q); 3177 3178 // transform / motion compensation build reconstruction frame 3179 av1_encode_frame(cpi); 3180 3181 if (!cpi->rc.rtc_external_ratectrl && !frame_is_intra_only(cm)) 3182 update_motion_stat(cpi); 3183 3184 // Adjust the refresh of the golden (longer-term) reference based on QP 3185 // selected for this frame. This is for CBR real-time mode, and only 3186 // for single layer without usage of the set_ref_frame_config (so 3187 // reference structure for 1 layer is set internally). 3188 if (!frame_is_intra_only(cm) && cpi->oxcf.rc_cfg.mode == AOM_CBR && 3189 cpi->oxcf.mode == REALTIME && svc->number_spatial_layers == 1 && 3190 svc->number_temporal_layers == 1 && !cpi->rc.rtc_external_ratectrl && 3191 !cpi->ppi->rtc_ref.set_ref_frame_config && 3192 sf->rt_sf.gf_refresh_based_on_qp) 3193 av1_adjust_gf_refresh_qp_one_pass_rt(cpi); 3194 3195 // For non-svc: if scaling is required, copy scaled_source 3196 // into scaled_last_source. 3197 if (cm->current_frame.frame_number > 1 && !cpi->ppi->use_svc && 3198 cpi->scaled_source.y_buffer != NULL && 3199 cpi->scaled_last_source.y_buffer != NULL && 3200 cpi->scaled_source.y_crop_width == cpi->scaled_last_source.y_crop_width && 3201 cpi->scaled_source.y_crop_height == 3202 cpi->scaled_last_source.y_crop_height && 3203 (cm->width != cpi->unscaled_source->y_crop_width || 3204 cm->height != cpi->unscaled_source->y_crop_height)) { 3205 cpi->scaled_last_source_available = 1; 3206 aom_yv12_copy_y(&cpi->scaled_source, &cpi->scaled_last_source, 1); 3207 aom_yv12_copy_u(&cpi->scaled_source, &cpi->scaled_last_source, 1); 3208 aom_yv12_copy_v(&cpi->scaled_source, &cpi->scaled_last_source, 1); 3209 } 3210 3211 #if CONFIG_COLLECT_COMPONENT_TIMING 3212 end_timing(cpi, av1_encode_frame_time); 3213 #endif 3214 #if CONFIG_INTERNAL_STATS 3215 ++cpi->frame_recode_hits; 3216 #endif 3217 3218 return AOM_CODEC_OK; 3219 } 3220 3221 #if !CONFIG_REALTIME_ONLY 3222 3223 /*!\brief Recode loop for encoding one frame. the purpose of encoding one frame 3224 * for multiple times can be approaching a target bitrate or adjusting the usage 3225 * of global motions. 3226 * 3227 * \ingroup high_level_algo 3228 * 3229 * \param[in] cpi Top-level encoder structure 3230 * \param[in] size Bitstream size 3231 * \param[out] dest Bitstream output buffer 3232 * \param[in] dest_size Bitstream output buffer size 3233 * 3234 * \return Returns a value to indicate if the encoding is done successfully. 3235 * \retval #AOM_CODEC_OK 3236 * \retval -1 3237 * \retval #AOM_CODEC_ERROR 3238 */ 3239 static int encode_with_recode_loop(AV1_COMP *cpi, size_t *size, uint8_t *dest, 3240 size_t dest_size) { 3241 AV1_COMMON *const cm = &cpi->common; 3242 RATE_CONTROL *const rc = &cpi->rc; 3243 GlobalMotionInfo *const gm_info = &cpi->gm_info; 3244 const AV1EncoderConfig *const oxcf = &cpi->oxcf; 3245 const QuantizationCfg *const q_cfg = &oxcf->q_cfg; 3246 const int allow_recode = (cpi->sf.hl_sf.recode_loop != DISALLOW_RECODE); 3247 // Must allow recode if minimum compression ratio is set. 3248 assert(IMPLIES(oxcf->rc_cfg.min_cr > 0, allow_recode)); 3249 3250 set_size_independent_vars(cpi); 3251 if (is_stat_consumption_stage_twopass(cpi) && 3252 cpi->sf.interp_sf.adaptive_interp_filter_search) 3253 cpi->interp_search_flags.interp_filter_search_mask = 3254 av1_setup_interp_filter_search_mask(cpi); 3255 3256 av1_setup_frame_size(cpi); 3257 3258 if (av1_superres_in_recode_allowed(cpi) && 3259 cpi->superres_mode != AOM_SUPERRES_NONE && 3260 cm->superres_scale_denominator == SCALE_NUMERATOR) { 3261 // Superres mode is currently enabled, but the denominator selected will 3262 // disable superres. So no need to continue, as we will go through another 3263 // recode loop for full-resolution after this anyway. 3264 return -1; 3265 } 3266 3267 int top_index = 0, bottom_index = 0; 3268 int q = 0, q_low = 0, q_high = 0; 3269 av1_set_size_dependent_vars(cpi, &q, &bottom_index, &top_index); 3270 q_low = bottom_index; 3271 q_high = top_index; 3272 3273 av1_set_mv_search_params(cpi); 3274 3275 allocate_gradient_info_for_hog(cpi); 3276 3277 allocate_src_var_of_4x4_sub_block_buf(cpi); 3278 3279 if (cpi->sf.part_sf.partition_search_type == VAR_BASED_PARTITION) 3280 variance_partition_alloc(cpi); 3281 3282 if (cm->current_frame.frame_type == KEY_FRAME) copy_frame_prob_info(cpi); 3283 3284 #if CONFIG_COLLECT_COMPONENT_TIMING 3285 printf("\n Encoding a frame: \n"); 3286 #endif 3287 3288 #if !CONFIG_RD_COMMAND 3289 // Determine whether to use screen content tools using two fast encoding. 3290 if (!cpi->sf.hl_sf.disable_extra_sc_testing && !cpi->use_ducky_encode) 3291 av1_determine_sc_tools_with_encoding(cpi, q); 3292 #endif // !CONFIG_RD_COMMAND 3293 3294 #if CONFIG_TUNE_VMAF 3295 if (oxcf->tune_cfg.tuning == AOM_TUNE_VMAF_NEG_MAX_GAIN) { 3296 av1_vmaf_neg_preprocessing(cpi, cpi->unscaled_source); 3297 } 3298 #endif 3299 3300 #if CONFIG_TUNE_BUTTERAUGLI 3301 cpi->butteraugli_info.recon_set = false; 3302 int original_q = 0; 3303 #endif 3304 3305 cpi->num_frame_recode = 0; 3306 3307 // Loop variables 3308 int loop = 0; 3309 int loop_count = 0; 3310 int overshoot_seen = 0; 3311 int undershoot_seen = 0; 3312 int low_cr_seen = 0; 3313 int last_loop_allow_hp = 0; 3314 3315 do { 3316 loop = 0; 3317 int do_mv_stats_collection = 1; 3318 3319 // if frame was scaled calculate global_motion_search again if already 3320 // done 3321 if (loop_count > 0 && cpi->source && gm_info->search_done) { 3322 if (cpi->source->y_crop_width != cm->width || 3323 cpi->source->y_crop_height != cm->height) { 3324 gm_info->search_done = 0; 3325 } 3326 } 3327 cpi->source = av1_realloc_and_scale_if_required( 3328 cm, cpi->unscaled_source, &cpi->scaled_source, EIGHTTAP_REGULAR, 0, 3329 false, false, cpi->oxcf.border_in_pixels, cpi->alloc_pyramid); 3330 3331 #if CONFIG_TUNE_BUTTERAUGLI 3332 if (oxcf->tune_cfg.tuning == AOM_TUNE_BUTTERAUGLI) { 3333 if (loop_count == 0) { 3334 original_q = q; 3335 // TODO(sdeng): different q here does not make big difference. Use a 3336 // faster pass instead. 3337 q = 96; 3338 av1_setup_butteraugli_source(cpi); 3339 } else { 3340 q = original_q; 3341 } 3342 } 3343 #endif 3344 3345 if (cpi->unscaled_last_source != NULL) { 3346 cpi->last_source = av1_realloc_and_scale_if_required( 3347 cm, cpi->unscaled_last_source, &cpi->scaled_last_source, 3348 EIGHTTAP_REGULAR, 0, false, false, cpi->oxcf.border_in_pixels, 3349 cpi->alloc_pyramid); 3350 } 3351 3352 int scale_references = 0; 3353 #if CONFIG_FPMT_TEST 3354 scale_references = 3355 cpi->ppi->fpmt_unit_test_cfg == PARALLEL_SIMULATION_ENCODE ? 1 : 0; 3356 #endif // CONFIG_FPMT_TEST 3357 if (scale_references || 3358 cpi->ppi->gf_group.frame_parallel_level[cpi->gf_frame_index] == 0) { 3359 if (!frame_is_intra_only(cm)) { 3360 if (loop_count > 0) { 3361 release_scaled_references(cpi); 3362 } 3363 av1_scale_references(cpi, EIGHTTAP_REGULAR, 0, 0); 3364 } 3365 } 3366 3367 #if CONFIG_TUNE_VMAF 3368 if (oxcf->tune_cfg.tuning >= AOM_TUNE_VMAF_WITH_PREPROCESSING && 3369 oxcf->tune_cfg.tuning <= AOM_TUNE_VMAF_NEG_MAX_GAIN) { 3370 cpi->vmaf_info.original_qindex = q; 3371 q = av1_get_vmaf_base_qindex(cpi, q); 3372 } 3373 #endif 3374 3375 #if CONFIG_RD_COMMAND 3376 RD_COMMAND *rd_command = &cpi->rd_command; 3377 RD_OPTION option = rd_command->option_ls[rd_command->frame_index]; 3378 if (option == RD_OPTION_SET_Q || option == RD_OPTION_SET_Q_RDMULT) { 3379 q = rd_command->q_index_ls[rd_command->frame_index]; 3380 } 3381 #endif // CONFIG_RD_COMMAND 3382 3383 #if CONFIG_BITRATE_ACCURACY 3384 #if CONFIG_THREE_PASS 3385 if (oxcf->pass == AOM_RC_THIRD_PASS && cpi->vbr_rc_info.ready == 1) { 3386 int frame_coding_idx = 3387 av1_vbr_rc_frame_coding_idx(&cpi->vbr_rc_info, cpi->gf_frame_index); 3388 if (frame_coding_idx < cpi->vbr_rc_info.total_frame_count) { 3389 q = cpi->vbr_rc_info.q_index_list[frame_coding_idx]; 3390 } else { 3391 // TODO(angiebird): Investigate why sometimes there is an extra frame 3392 // after the last GOP. 3393 q = cpi->vbr_rc_info.base_q_index; 3394 } 3395 } 3396 #else 3397 if (cpi->vbr_rc_info.q_index_list_ready) { 3398 q = cpi->vbr_rc_info.q_index_list[cpi->gf_frame_index]; 3399 } 3400 #endif // CONFIG_THREE_PASS 3401 #endif // CONFIG_BITRATE_ACCURACY 3402 3403 #if CONFIG_RATECTRL_LOG && CONFIG_THREE_PASS && CONFIG_BITRATE_ACCURACY 3404 // TODO(angiebird): Move this into a function. 3405 if (oxcf->pass == AOM_RC_THIRD_PASS) { 3406 int frame_coding_idx = 3407 av1_vbr_rc_frame_coding_idx(&cpi->vbr_rc_info, cpi->gf_frame_index); 3408 double qstep_ratio = cpi->vbr_rc_info.qstep_ratio_list[frame_coding_idx]; 3409 FRAME_UPDATE_TYPE update_type = 3410 cpi->vbr_rc_info.update_type_list[frame_coding_idx]; 3411 rc_log_frame_encode_param(&cpi->rc_log, frame_coding_idx, qstep_ratio, q, 3412 update_type); 3413 } 3414 #endif // CONFIG_RATECTRL_LOG && CONFIG_THREE_PASS && CONFIG_BITRATE_ACCURACY 3415 3416 if (cpi->use_ducky_encode) { 3417 const DuckyEncodeFrameInfo *frame_info = 3418 &cpi->ducky_encode_info.frame_info; 3419 if (frame_info->qp_mode == DUCKY_ENCODE_FRAME_MODE_QINDEX) { 3420 q = frame_info->q_index; 3421 cm->delta_q_info.delta_q_present_flag = frame_info->delta_q_enabled; 3422 } 3423 } 3424 3425 av1_set_quantizer(cm, q_cfg->qm_minlevel, q_cfg->qm_maxlevel, q, 3426 q_cfg->enable_chroma_deltaq, q_cfg->enable_hdr_deltaq, 3427 oxcf->mode == ALLINTRA, oxcf->tune_cfg.tuning); 3428 av1_set_speed_features_qindex_dependent(cpi, oxcf->speed); 3429 av1_init_quantizer(&cpi->enc_quant_dequant_params, &cm->quant_params, 3430 cm->seq_params->bit_depth, cpi->oxcf.algo_cfg.sharpness); 3431 3432 av1_set_variance_partition_thresholds(cpi, q, 0); 3433 3434 if (loop_count == 0) { 3435 av1_setup_frame(cpi); 3436 } else if (get_primary_ref_frame_buf(cm) == NULL) { 3437 // Base q-index may have changed, so we need to assign proper default coef 3438 // probs before every iteration. 3439 av1_default_coef_probs(cm); 3440 av1_setup_frame_contexts(cm); 3441 } 3442 3443 if (q_cfg->aq_mode == VARIANCE_AQ) { 3444 av1_vaq_frame_setup(cpi); 3445 } else if (q_cfg->aq_mode == COMPLEXITY_AQ) { 3446 av1_setup_in_frame_q_adj(cpi); 3447 } 3448 3449 if (cm->seg.enabled) { 3450 if (!cm->seg.update_data && cm->prev_frame) { 3451 segfeatures_copy(&cm->seg, &cm->prev_frame->seg); 3452 cm->seg.enabled = cm->prev_frame->seg.enabled; 3453 } else { 3454 av1_calculate_segdata(&cm->seg); 3455 } 3456 } else { 3457 memset(&cm->seg, 0, sizeof(cm->seg)); 3458 } 3459 segfeatures_copy(&cm->cur_frame->seg, &cm->seg); 3460 cm->cur_frame->seg.enabled = cm->seg.enabled; 3461 3462 #if CONFIG_COLLECT_COMPONENT_TIMING 3463 start_timing(cpi, av1_encode_frame_time); 3464 #endif 3465 // Set the motion vector precision based on mv stats from the last coded 3466 // frame. 3467 if (!frame_is_intra_only(cm)) { 3468 av1_pick_and_set_high_precision_mv(cpi, q); 3469 3470 // If the precision has changed during different iteration of the loop, 3471 // then we need to reset the global motion vectors 3472 if (loop_count > 0 && 3473 cm->features.allow_high_precision_mv != last_loop_allow_hp) { 3474 gm_info->search_done = 0; 3475 } 3476 last_loop_allow_hp = cm->features.allow_high_precision_mv; 3477 } 3478 3479 // transform / motion compensation build reconstruction frame 3480 av1_encode_frame(cpi); 3481 3482 // Disable mv_stats collection for parallel frames based on update flag. 3483 if (!cpi->do_frame_data_update) do_mv_stats_collection = 0; 3484 3485 // Reset the mv_stats in case we are interrupted by an intraframe or an 3486 // overlay frame. 3487 if (cpi->mv_stats.valid && do_mv_stats_collection) av1_zero(cpi->mv_stats); 3488 3489 // Gather the mv_stats for the next frame 3490 if (cpi->sf.hl_sf.high_precision_mv_usage == LAST_MV_DATA && 3491 av1_frame_allows_smart_mv(cpi) && do_mv_stats_collection) { 3492 av1_collect_mv_stats(cpi, q); 3493 } 3494 3495 #if CONFIG_COLLECT_COMPONENT_TIMING 3496 end_timing(cpi, av1_encode_frame_time); 3497 #endif 3498 3499 #if CONFIG_BITRATE_ACCURACY || CONFIG_RD_COMMAND 3500 const int do_dummy_pack = 1; 3501 #else // CONFIG_BITRATE_ACCURACY 3502 // Dummy pack of the bitstream using up to date stats to get an 3503 // accurate estimate of output frame size to determine if we need 3504 // to recode. 3505 const int do_dummy_pack = 3506 (cpi->sf.hl_sf.recode_loop >= ALLOW_RECODE_KFARFGF && 3507 oxcf->rc_cfg.mode != AOM_Q) || 3508 oxcf->rc_cfg.min_cr > 0; 3509 #endif // CONFIG_BITRATE_ACCURACY 3510 if (do_dummy_pack) { 3511 av1_finalize_encoded_frame(cpi); 3512 int largest_tile_id = 0; // Output from bitstream: unused here 3513 rc->coefficient_size = 0; 3514 if (av1_pack_bitstream(cpi, dest, dest_size, size, &largest_tile_id) != 3515 AOM_CODEC_OK) { 3516 return AOM_CODEC_ERROR; 3517 } 3518 3519 // bits used for this frame 3520 rc->projected_frame_size = (int)(*size) << 3; 3521 #if CONFIG_RD_COMMAND 3522 PSNR_STATS psnr; 3523 aom_calc_psnr(cpi->source, &cpi->common.cur_frame->buf, &psnr); 3524 printf("q %d rdmult %d rate %d dist %" PRIu64 "\n", q, cpi->rd.RDMULT, 3525 rc->projected_frame_size, psnr.sse[0]); 3526 ++rd_command->frame_index; 3527 if (rd_command->frame_index == rd_command->frame_count) { 3528 return AOM_CODEC_ERROR; 3529 } 3530 #endif // CONFIG_RD_COMMAND 3531 3532 #if CONFIG_RATECTRL_LOG && CONFIG_THREE_PASS && CONFIG_BITRATE_ACCURACY 3533 if (oxcf->pass == AOM_RC_THIRD_PASS) { 3534 int frame_coding_idx = 3535 av1_vbr_rc_frame_coding_idx(&cpi->vbr_rc_info, cpi->gf_frame_index); 3536 rc_log_frame_entropy(&cpi->rc_log, frame_coding_idx, 3537 rc->projected_frame_size, rc->coefficient_size); 3538 } 3539 #endif // CONFIG_RATECTRL_LOG && CONFIG_THREE_PASS && CONFIG_BITRATE_ACCURACY 3540 } 3541 3542 #if CONFIG_TUNE_VMAF 3543 if (oxcf->tune_cfg.tuning >= AOM_TUNE_VMAF_WITH_PREPROCESSING && 3544 oxcf->tune_cfg.tuning <= AOM_TUNE_VMAF_NEG_MAX_GAIN) { 3545 q = cpi->vmaf_info.original_qindex; 3546 } 3547 #endif 3548 if (allow_recode) { 3549 // Update q and decide whether to do a recode loop 3550 recode_loop_update_q(cpi, &loop, &q, &q_low, &q_high, top_index, 3551 bottom_index, &undershoot_seen, &overshoot_seen, 3552 &low_cr_seen, loop_count); 3553 } 3554 3555 #if CONFIG_TUNE_BUTTERAUGLI 3556 if (loop_count == 0 && oxcf->tune_cfg.tuning == AOM_TUNE_BUTTERAUGLI) { 3557 loop = 1; 3558 av1_setup_butteraugli_rdmult_and_restore_source(cpi, 0.4); 3559 } 3560 #endif 3561 3562 if (cpi->use_ducky_encode) { 3563 // Ducky encode currently does not support recode loop. 3564 loop = 0; 3565 } 3566 #if CONFIG_BITRATE_ACCURACY || CONFIG_RD_COMMAND 3567 loop = 0; // turn off recode loop when CONFIG_BITRATE_ACCURACY is on 3568 #endif // CONFIG_BITRATE_ACCURACY || CONFIG_RD_COMMAND 3569 3570 if (loop) { 3571 ++loop_count; 3572 cpi->num_frame_recode = 3573 (cpi->num_frame_recode < (NUM_RECODES_PER_FRAME - 1)) 3574 ? (cpi->num_frame_recode + 1) 3575 : (NUM_RECODES_PER_FRAME - 1); 3576 #if CONFIG_INTERNAL_STATS 3577 ++cpi->frame_recode_hits; 3578 #endif 3579 } 3580 #if CONFIG_COLLECT_COMPONENT_TIMING 3581 if (loop) printf("\n Recoding:"); 3582 #endif 3583 } while (loop); 3584 3585 return AOM_CODEC_OK; 3586 } 3587 #endif // !CONFIG_REALTIME_ONLY 3588 3589 // TODO(jingning, paulwilkins): Set up high grain level to test 3590 // hardware decoders. Need to adapt the actual noise variance 3591 // according to the difference between reconstructed frame and the 3592 // source signal. 3593 static void set_grain_syn_params(AV1_COMMON *cm) { 3594 aom_film_grain_t *film_grain_params = &cm->film_grain_params; 3595 film_grain_params->apply_grain = 1; 3596 film_grain_params->update_parameters = 1; 3597 film_grain_params->random_seed = rand() & 0xffff; 3598 3599 film_grain_params->num_y_points = 1; 3600 film_grain_params->scaling_points_y[0][0] = 128; 3601 film_grain_params->scaling_points_y[0][1] = 100; 3602 3603 if (!cm->seq_params->monochrome) { 3604 film_grain_params->num_cb_points = 1; 3605 film_grain_params->scaling_points_cb[0][0] = 128; 3606 film_grain_params->scaling_points_cb[0][1] = 100; 3607 3608 film_grain_params->num_cr_points = 1; 3609 film_grain_params->scaling_points_cr[0][0] = 128; 3610 film_grain_params->scaling_points_cr[0][1] = 100; 3611 } else { 3612 film_grain_params->num_cb_points = 0; 3613 film_grain_params->num_cr_points = 0; 3614 } 3615 3616 film_grain_params->chroma_scaling_from_luma = 0; 3617 3618 film_grain_params->scaling_shift = 1; 3619 film_grain_params->ar_coeff_lag = 0; 3620 film_grain_params->ar_coeff_shift = 1; 3621 film_grain_params->overlap_flag = 1; 3622 film_grain_params->grain_scale_shift = 0; 3623 } 3624 3625 /*!\brief Recode loop or a single loop for encoding one frame, followed by 3626 * in-loop deblocking filters, CDEF filters, and restoration filters. 3627 * 3628 * \ingroup high_level_algo 3629 * \callgraph 3630 * \callergraph 3631 * 3632 * \param[in] cpi Top-level encoder structure 3633 * \param[in] size Bitstream size 3634 * \param[out] dest Bitstream output buffer 3635 * \param[in] dest_size Bitstream output buffer size 3636 * \param[in] sse Total distortion of the frame 3637 * \param[in] rate Total rate of the frame 3638 * \param[in] largest_tile_id Tile id of the last tile 3639 * 3640 * \return Returns a value to indicate if the encoding is done successfully. 3641 * \retval #AOM_CODEC_OK 3642 * \retval #AOM_CODEC_ERROR 3643 */ 3644 static int encode_with_recode_loop_and_filter(AV1_COMP *cpi, size_t *size, 3645 uint8_t *dest, size_t dest_size, 3646 int64_t *sse, int64_t *rate, 3647 int *largest_tile_id) { 3648 #if CONFIG_COLLECT_COMPONENT_TIMING 3649 start_timing(cpi, encode_with_or_without_recode_time); 3650 #endif 3651 for (int i = 0; i < NUM_RECODES_PER_FRAME; i++) { 3652 cpi->do_update_frame_probs_txtype[i] = 0; 3653 cpi->do_update_frame_probs_obmc[i] = 0; 3654 cpi->do_update_frame_probs_warp[i] = 0; 3655 cpi->do_update_frame_probs_interpfilter[i] = 0; 3656 } 3657 3658 cpi->do_update_vbr_bits_off_target_fast = 0; 3659 int err; 3660 #if CONFIG_REALTIME_ONLY 3661 err = encode_without_recode(cpi); 3662 #else 3663 if (cpi->sf.hl_sf.recode_loop == DISALLOW_RECODE) 3664 err = encode_without_recode(cpi); 3665 else 3666 err = encode_with_recode_loop(cpi, size, dest, dest_size); 3667 #endif 3668 #if CONFIG_COLLECT_COMPONENT_TIMING 3669 end_timing(cpi, encode_with_or_without_recode_time); 3670 #endif 3671 if (err != AOM_CODEC_OK) { 3672 if (err == -1) { 3673 // special case as described in encode_with_recode_loop(). 3674 // Encoding was skipped. 3675 err = AOM_CODEC_OK; 3676 if (sse != NULL) *sse = INT64_MAX; 3677 if (rate != NULL) *rate = INT64_MAX; 3678 *largest_tile_id = 0; 3679 } 3680 return err; 3681 } 3682 3683 #ifdef OUTPUT_YUV_DENOISED 3684 const AV1EncoderConfig *const oxcf = &cpi->oxcf; 3685 if (oxcf->noise_sensitivity > 0 && denoise_svc(cpi)) { 3686 aom_write_yuv_frame(yuv_denoised_file, 3687 &cpi->denoiser.running_avg_y[INTRA_FRAME]); 3688 } 3689 #endif 3690 3691 AV1_COMMON *const cm = &cpi->common; 3692 SequenceHeader *const seq_params = cm->seq_params; 3693 3694 // Special case code to reduce pulsing when key frames are forced at a 3695 // fixed interval. Note the reconstruction error if it is the frame before 3696 // the force key frame 3697 if (cpi->ppi->p_rc.next_key_frame_forced && cpi->rc.frames_to_key == 1) { 3698 #if CONFIG_AV1_HIGHBITDEPTH 3699 if (seq_params->use_highbitdepth) { 3700 cpi->ambient_err = aom_highbd_get_y_sse(cpi->source, &cm->cur_frame->buf); 3701 } else { 3702 cpi->ambient_err = aom_get_y_sse(cpi->source, &cm->cur_frame->buf); 3703 } 3704 #else 3705 cpi->ambient_err = aom_get_y_sse(cpi->source, &cm->cur_frame->buf); 3706 #endif 3707 } 3708 3709 cm->cur_frame->buf.color_primaries = seq_params->color_primaries; 3710 cm->cur_frame->buf.transfer_characteristics = 3711 seq_params->transfer_characteristics; 3712 cm->cur_frame->buf.matrix_coefficients = seq_params->matrix_coefficients; 3713 cm->cur_frame->buf.monochrome = seq_params->monochrome; 3714 cm->cur_frame->buf.chroma_sample_position = 3715 seq_params->chroma_sample_position; 3716 cm->cur_frame->buf.color_range = seq_params->color_range; 3717 cm->cur_frame->buf.render_width = cm->render_width; 3718 cm->cur_frame->buf.render_height = cm->render_height; 3719 3720 if (!cpi->mt_info.pipeline_lpf_mt_with_enc) 3721 set_postproc_filter_default_params(&cpi->common); 3722 3723 if (!cm->features.allow_intrabc) { 3724 loopfilter_frame(cpi, cm); 3725 } 3726 3727 if (cpi->oxcf.mode != ALLINTRA && !cpi->ppi->rtc_ref.non_reference_frame) { 3728 extend_frame_borders(cpi); 3729 } 3730 3731 #ifdef OUTPUT_YUV_REC 3732 aom_write_one_yuv_frame(cm, &cm->cur_frame->buf); 3733 #endif 3734 3735 if (cpi->oxcf.tune_cfg.content == AOM_CONTENT_FILM) { 3736 set_grain_syn_params(cm); 3737 } 3738 3739 av1_finalize_encoded_frame(cpi); 3740 // Build the bitstream 3741 #if CONFIG_COLLECT_COMPONENT_TIMING 3742 start_timing(cpi, av1_pack_bitstream_final_time); 3743 #endif 3744 cpi->rc.coefficient_size = 0; 3745 if (av1_pack_bitstream(cpi, dest, dest_size, size, largest_tile_id) != 3746 AOM_CODEC_OK) 3747 return AOM_CODEC_ERROR; 3748 #if CONFIG_COLLECT_COMPONENT_TIMING 3749 end_timing(cpi, av1_pack_bitstream_final_time); 3750 #endif 3751 3752 if (cpi->rc.postencode_drop && allow_postencode_drop_rtc(cpi) && 3753 av1_postencode_drop_cbr(cpi, size)) { 3754 return AOM_CODEC_OK; 3755 } 3756 3757 // Compute sse and rate. 3758 if (sse != NULL) { 3759 #if CONFIG_AV1_HIGHBITDEPTH 3760 *sse = (seq_params->use_highbitdepth) 3761 ? aom_highbd_get_y_sse(cpi->source, &cm->cur_frame->buf) 3762 : aom_get_y_sse(cpi->source, &cm->cur_frame->buf); 3763 #else 3764 *sse = aom_get_y_sse(cpi->source, &cm->cur_frame->buf); 3765 #endif 3766 } 3767 if (rate != NULL) { 3768 const int64_t bits = (*size << 3); 3769 *rate = (bits << 5); // To match scale. 3770 } 3771 3772 #if !CONFIG_REALTIME_ONLY 3773 if (cpi->use_ducky_encode) { 3774 PSNR_STATS psnr; 3775 aom_calc_psnr(cpi->source, &cpi->common.cur_frame->buf, &psnr); 3776 DuckyEncodeFrameResult *frame_result = &cpi->ducky_encode_info.frame_result; 3777 frame_result->global_order_idx = cm->cur_frame->display_order_hint; 3778 frame_result->q_index = cm->quant_params.base_qindex; 3779 frame_result->rdmult = cpi->rd.RDMULT; 3780 frame_result->rate = (int)(*size) * 8; 3781 frame_result->dist = psnr.sse[0]; 3782 frame_result->psnr = psnr.psnr[0]; 3783 } 3784 #endif // !CONFIG_REALTIME_ONLY 3785 3786 return AOM_CODEC_OK; 3787 } 3788 3789 static int encode_with_and_without_superres(AV1_COMP *cpi, size_t *size, 3790 uint8_t *dest, size_t dest_size, 3791 int *largest_tile_id) { 3792 const AV1_COMMON *const cm = &cpi->common; 3793 assert(cm->seq_params->enable_superres); 3794 assert(av1_superres_in_recode_allowed(cpi)); 3795 aom_codec_err_t err = AOM_CODEC_OK; 3796 av1_save_all_coding_context(cpi); 3797 3798 int64_t sse1 = INT64_MAX; 3799 int64_t rate1 = INT64_MAX; 3800 int largest_tile_id1 = 0; 3801 int64_t sse2 = INT64_MAX; 3802 int64_t rate2 = INT64_MAX; 3803 int largest_tile_id2; 3804 double proj_rdcost1 = DBL_MAX; 3805 const GF_GROUP *const gf_group = &cpi->ppi->gf_group; 3806 const FRAME_UPDATE_TYPE update_type = 3807 gf_group->update_type[cpi->gf_frame_index]; 3808 const aom_bit_depth_t bit_depth = cm->seq_params->bit_depth; 3809 3810 // Encode with superres. 3811 if (cpi->sf.hl_sf.superres_auto_search_type == SUPERRES_AUTO_ALL) { 3812 SuperResCfg *const superres_cfg = &cpi->oxcf.superres_cfg; 3813 int64_t superres_sses[SCALE_NUMERATOR]; 3814 int64_t superres_rates[SCALE_NUMERATOR]; 3815 int superres_largest_tile_ids[SCALE_NUMERATOR]; 3816 // Use superres for Key-frames and Alt-ref frames only. 3817 if (update_type != OVERLAY_UPDATE && update_type != INTNL_OVERLAY_UPDATE) { 3818 for (int denom = SCALE_NUMERATOR + 1; denom <= 2 * SCALE_NUMERATOR; 3819 ++denom) { 3820 superres_cfg->superres_scale_denominator = denom; 3821 superres_cfg->superres_kf_scale_denominator = denom; 3822 const int this_index = denom - (SCALE_NUMERATOR + 1); 3823 3824 cpi->superres_mode = AOM_SUPERRES_AUTO; // Super-res on for this loop. 3825 err = encode_with_recode_loop_and_filter( 3826 cpi, size, dest, dest_size, &superres_sses[this_index], 3827 &superres_rates[this_index], 3828 &superres_largest_tile_ids[this_index]); 3829 cpi->superres_mode = AOM_SUPERRES_NONE; // Reset to default (full-res). 3830 if (err != AOM_CODEC_OK) return err; 3831 restore_all_coding_context(cpi); 3832 } 3833 // Reset. 3834 superres_cfg->superres_scale_denominator = SCALE_NUMERATOR; 3835 superres_cfg->superres_kf_scale_denominator = SCALE_NUMERATOR; 3836 } else { 3837 for (int denom = SCALE_NUMERATOR + 1; denom <= 2 * SCALE_NUMERATOR; 3838 ++denom) { 3839 const int this_index = denom - (SCALE_NUMERATOR + 1); 3840 superres_sses[this_index] = INT64_MAX; 3841 superres_rates[this_index] = INT64_MAX; 3842 superres_largest_tile_ids[this_index] = 0; 3843 } 3844 } 3845 // Encode without superres. 3846 assert(cpi->superres_mode == AOM_SUPERRES_NONE); 3847 err = encode_with_recode_loop_and_filter(cpi, size, dest, dest_size, &sse2, 3848 &rate2, &largest_tile_id2); 3849 if (err != AOM_CODEC_OK) return err; 3850 3851 // Note: Both use common rdmult based on base qindex of fullres. 3852 const int64_t rdmult = av1_compute_rd_mult_based_on_qindex( 3853 bit_depth, update_type, cm->quant_params.base_qindex, 3854 cpi->oxcf.tune_cfg.tuning); 3855 3856 // Find the best rdcost among all superres denoms. 3857 int best_denom = -1; 3858 for (int denom = SCALE_NUMERATOR + 1; denom <= 2 * SCALE_NUMERATOR; 3859 ++denom) { 3860 const int this_index = denom - (SCALE_NUMERATOR + 1); 3861 const int64_t this_sse = superres_sses[this_index]; 3862 const int64_t this_rate = superres_rates[this_index]; 3863 const int this_largest_tile_id = superres_largest_tile_ids[this_index]; 3864 const double this_rdcost = RDCOST_DBL_WITH_NATIVE_BD_DIST( 3865 rdmult, this_rate, this_sse, bit_depth); 3866 if (this_rdcost < proj_rdcost1) { 3867 sse1 = this_sse; 3868 rate1 = this_rate; 3869 largest_tile_id1 = this_largest_tile_id; 3870 proj_rdcost1 = this_rdcost; 3871 best_denom = denom; 3872 } 3873 } 3874 const double proj_rdcost2 = 3875 RDCOST_DBL_WITH_NATIVE_BD_DIST(rdmult, rate2, sse2, bit_depth); 3876 // Re-encode with superres if it's better. 3877 if (proj_rdcost1 < proj_rdcost2) { 3878 restore_all_coding_context(cpi); 3879 // TODO(urvang): We should avoid rerunning the recode loop by saving 3880 // previous output+state, or running encode only for the selected 'q' in 3881 // previous step. 3882 // Again, temporarily force the best denom. 3883 superres_cfg->superres_scale_denominator = best_denom; 3884 superres_cfg->superres_kf_scale_denominator = best_denom; 3885 int64_t sse3 = INT64_MAX; 3886 int64_t rate3 = INT64_MAX; 3887 cpi->superres_mode = 3888 AOM_SUPERRES_AUTO; // Super-res on for this recode loop. 3889 err = encode_with_recode_loop_and_filter(cpi, size, dest, dest_size, 3890 &sse3, &rate3, largest_tile_id); 3891 cpi->superres_mode = AOM_SUPERRES_NONE; // Reset to default (full-res). 3892 assert(sse1 == sse3); 3893 assert(rate1 == rate3); 3894 assert(largest_tile_id1 == *largest_tile_id); 3895 // Reset. 3896 superres_cfg->superres_scale_denominator = SCALE_NUMERATOR; 3897 superres_cfg->superres_kf_scale_denominator = SCALE_NUMERATOR; 3898 } else { 3899 *largest_tile_id = largest_tile_id2; 3900 } 3901 } else { 3902 assert(cpi->sf.hl_sf.superres_auto_search_type == SUPERRES_AUTO_DUAL); 3903 cpi->superres_mode = 3904 AOM_SUPERRES_AUTO; // Super-res on for this recode loop. 3905 err = encode_with_recode_loop_and_filter(cpi, size, dest, dest_size, &sse1, 3906 &rate1, &largest_tile_id1); 3907 cpi->superres_mode = AOM_SUPERRES_NONE; // Reset to default (full-res). 3908 if (err != AOM_CODEC_OK) return err; 3909 restore_all_coding_context(cpi); 3910 // Encode without superres. 3911 assert(cpi->superres_mode == AOM_SUPERRES_NONE); 3912 err = encode_with_recode_loop_and_filter(cpi, size, dest, dest_size, &sse2, 3913 &rate2, &largest_tile_id2); 3914 if (err != AOM_CODEC_OK) return err; 3915 3916 // Note: Both use common rdmult based on base qindex of fullres. 3917 const int64_t rdmult = av1_compute_rd_mult_based_on_qindex( 3918 bit_depth, update_type, cm->quant_params.base_qindex, 3919 cpi->oxcf.tune_cfg.tuning); 3920 proj_rdcost1 = 3921 RDCOST_DBL_WITH_NATIVE_BD_DIST(rdmult, rate1, sse1, bit_depth); 3922 const double proj_rdcost2 = 3923 RDCOST_DBL_WITH_NATIVE_BD_DIST(rdmult, rate2, sse2, bit_depth); 3924 // Re-encode with superres if it's better. 3925 if (proj_rdcost1 < proj_rdcost2) { 3926 restore_all_coding_context(cpi); 3927 // TODO(urvang): We should avoid rerunning the recode loop by saving 3928 // previous output+state, or running encode only for the selected 'q' in 3929 // previous step. 3930 int64_t sse3 = INT64_MAX; 3931 int64_t rate3 = INT64_MAX; 3932 cpi->superres_mode = 3933 AOM_SUPERRES_AUTO; // Super-res on for this recode loop. 3934 err = encode_with_recode_loop_and_filter(cpi, size, dest, dest_size, 3935 &sse3, &rate3, largest_tile_id); 3936 cpi->superres_mode = AOM_SUPERRES_NONE; // Reset to default (full-res). 3937 assert(sse1 == sse3); 3938 assert(rate1 == rate3); 3939 assert(largest_tile_id1 == *largest_tile_id); 3940 } else { 3941 *largest_tile_id = largest_tile_id2; 3942 } 3943 } 3944 3945 return err; 3946 } 3947 3948 // Conditions to disable cdf_update mode in selective mode for real-time. 3949 // Handle case for layers, scene change, and resizing. 3950 static inline int selective_disable_cdf_rtc(const AV1_COMP *cpi) { 3951 const AV1_COMMON *const cm = &cpi->common; 3952 const RATE_CONTROL *const rc = &cpi->rc; 3953 // For single layer. 3954 if (cpi->svc.number_spatial_layers == 1 && 3955 cpi->svc.number_temporal_layers == 1) { 3956 // Don't disable on intra_only, scene change (high_source_sad = 1), 3957 // or resized frame. To avoid quality loss force enable at 3958 // for ~30 frames after key or scene/slide change, and 3959 // after 8 frames since last update if frame_source_sad > 0. 3960 if (frame_is_intra_only(cm) || is_frame_resize_pending(cpi) || 3961 rc->high_source_sad || rc->frames_since_key < 30 || 3962 (cpi->oxcf.q_cfg.aq_mode == CYCLIC_REFRESH_AQ && 3963 cpi->cyclic_refresh->counter_encode_maxq_scene_change < 30) || 3964 (cpi->frames_since_last_update > 8 && cpi->rc.frame_source_sad > 0)) 3965 return 0; 3966 else 3967 return 1; 3968 } else if (cpi->svc.number_temporal_layers > 1) { 3969 // Disable only on top temporal enhancement layer for now. 3970 return cpi->svc.temporal_layer_id == cpi->svc.number_temporal_layers - 1; 3971 } 3972 return 1; 3973 } 3974 3975 #if !CONFIG_REALTIME_ONLY 3976 static void subtract_stats(FIRSTPASS_STATS *section, 3977 const FIRSTPASS_STATS *frame) { 3978 section->frame -= frame->frame; 3979 section->weight -= frame->weight; 3980 section->intra_error -= frame->intra_error; 3981 section->frame_avg_wavelet_energy -= frame->frame_avg_wavelet_energy; 3982 section->coded_error -= frame->coded_error; 3983 section->sr_coded_error -= frame->sr_coded_error; 3984 section->pcnt_inter -= frame->pcnt_inter; 3985 section->pcnt_motion -= frame->pcnt_motion; 3986 section->pcnt_second_ref -= frame->pcnt_second_ref; 3987 section->pcnt_neutral -= frame->pcnt_neutral; 3988 section->intra_skip_pct -= frame->intra_skip_pct; 3989 section->inactive_zone_rows -= frame->inactive_zone_rows; 3990 section->inactive_zone_cols -= frame->inactive_zone_cols; 3991 section->MVr -= frame->MVr; 3992 section->mvr_abs -= frame->mvr_abs; 3993 section->MVc -= frame->MVc; 3994 section->mvc_abs -= frame->mvc_abs; 3995 section->MVrv -= frame->MVrv; 3996 section->MVcv -= frame->MVcv; 3997 section->mv_in_out_count -= frame->mv_in_out_count; 3998 section->new_mv_count -= frame->new_mv_count; 3999 section->count -= frame->count; 4000 section->duration -= frame->duration; 4001 } 4002 4003 static void calculate_frame_avg_haar_energy(AV1_COMP *cpi) { 4004 TWO_PASS *const twopass = &cpi->ppi->twopass; 4005 const FIRSTPASS_STATS *const total_stats = 4006 twopass->stats_buf_ctx->total_stats; 4007 4008 if (is_one_pass_rt_params(cpi) || 4009 (cpi->oxcf.q_cfg.deltaq_mode != DELTA_Q_PERCEPTUAL) || 4010 (is_fp_wavelet_energy_invalid(total_stats) == 0)) 4011 return; 4012 4013 const int num_mbs = (cpi->oxcf.resize_cfg.resize_mode != RESIZE_NONE) 4014 ? cpi->initial_mbs 4015 : cpi->common.mi_params.MBs; 4016 const YV12_BUFFER_CONFIG *const unfiltered_source = cpi->unfiltered_source; 4017 const uint8_t *const src = unfiltered_source->y_buffer; 4018 const int hbd = unfiltered_source->flags & YV12_FLAG_HIGHBITDEPTH; 4019 const int stride = unfiltered_source->y_stride; 4020 const BLOCK_SIZE fp_block_size = 4021 get_fp_block_size(cpi->is_screen_content_type); 4022 const int fp_block_size_width = block_size_wide[fp_block_size]; 4023 const int fp_block_size_height = block_size_high[fp_block_size]; 4024 const int num_unit_cols = 4025 get_num_blocks(unfiltered_source->y_crop_width, fp_block_size_width); 4026 const int num_unit_rows = 4027 get_num_blocks(unfiltered_source->y_crop_height, fp_block_size_height); 4028 const int num_8x8_cols = num_unit_cols * (fp_block_size_width / 8); 4029 const int num_8x8_rows = num_unit_rows * (fp_block_size_height / 8); 4030 int64_t frame_avg_wavelet_energy = av1_haar_ac_sad_mxn_uint8_input( 4031 src, stride, hbd, num_8x8_rows, num_8x8_cols); 4032 4033 cpi->twopass_frame.frame_avg_haar_energy = 4034 log1p((double)frame_avg_wavelet_energy / num_mbs); 4035 } 4036 #endif 4037 4038 /*!\brief Run the final pass encoding for 1-pass/2-pass encoding mode, and pack 4039 * the bitstream 4040 * 4041 * \ingroup high_level_algo 4042 * \callgraph 4043 * \callergraph 4044 * 4045 * \param[in] cpi Top-level encoder structure 4046 * \param[in] size Bitstream size 4047 * \param[out] dest Bitstream output buffer 4048 * \param[in] dest_size Bitstream output buffer size 4049 * 4050 * \return Returns a value to indicate if the encoding is done successfully. 4051 * \retval #AOM_CODEC_OK 4052 * \retval #AOM_CODEC_ERROR 4053 */ 4054 static int encode_frame_to_data_rate(AV1_COMP *cpi, size_t *size, uint8_t *dest, 4055 size_t dest_size) { 4056 AV1_COMMON *const cm = &cpi->common; 4057 SequenceHeader *const seq_params = cm->seq_params; 4058 CurrentFrame *const current_frame = &cm->current_frame; 4059 const AV1EncoderConfig *const oxcf = &cpi->oxcf; 4060 struct segmentation *const seg = &cm->seg; 4061 FeatureFlags *const features = &cm->features; 4062 const TileConfig *const tile_cfg = &oxcf->tile_cfg; 4063 assert(cpi->source != NULL); 4064 cpi->td.mb.e_mbd.cur_buf = cpi->source; 4065 4066 #if CONFIG_COLLECT_COMPONENT_TIMING 4067 start_timing(cpi, encode_frame_to_data_rate_time); 4068 #endif 4069 4070 #if !CONFIG_REALTIME_ONLY 4071 calculate_frame_avg_haar_energy(cpi); 4072 #endif 4073 4074 // frame type has been decided outside of this function call 4075 cm->cur_frame->frame_type = current_frame->frame_type; 4076 4077 cm->tiles.large_scale = tile_cfg->enable_large_scale_tile; 4078 cm->tiles.single_tile_decoding = tile_cfg->enable_single_tile_decoding; 4079 4080 features->allow_ref_frame_mvs &= frame_might_allow_ref_frame_mvs(cm); 4081 // features->allow_ref_frame_mvs needs to be written into the frame header 4082 // while cm->tiles.large_scale is 1, therefore, "cm->tiles.large_scale=1" case 4083 // is separated from frame_might_allow_ref_frame_mvs(). 4084 features->allow_ref_frame_mvs &= !cm->tiles.large_scale; 4085 4086 features->allow_warped_motion = oxcf->motion_mode_cfg.allow_warped_motion && 4087 frame_might_allow_warped_motion(cm); 4088 4089 cpi->last_frame_type = current_frame->frame_type; 4090 4091 if (frame_is_intra_only(cm)) { 4092 cpi->frames_since_last_update = 0; 4093 } 4094 4095 if (frame_is_sframe(cm)) { 4096 GF_GROUP *gf_group = &cpi->ppi->gf_group; 4097 // S frame will wipe out any previously encoded altref so we cannot place 4098 // an overlay frame 4099 gf_group->update_type[gf_group->size] = GF_UPDATE; 4100 } 4101 4102 if (encode_show_existing_frame(cm)) { 4103 #if CONFIG_RATECTRL_LOG && CONFIG_THREE_PASS && CONFIG_BITRATE_ACCURACY 4104 // TODO(angiebird): Move this into a function. 4105 if (oxcf->pass == AOM_RC_THIRD_PASS) { 4106 int frame_coding_idx = 4107 av1_vbr_rc_frame_coding_idx(&cpi->vbr_rc_info, cpi->gf_frame_index); 4108 rc_log_frame_encode_param( 4109 &cpi->rc_log, frame_coding_idx, 1, 255, 4110 cpi->ppi->gf_group.update_type[cpi->gf_frame_index]); 4111 } 4112 #endif 4113 av1_finalize_encoded_frame(cpi); 4114 // Build the bitstream 4115 int largest_tile_id = 0; // Output from bitstream: unused here 4116 cpi->rc.coefficient_size = 0; 4117 if (av1_pack_bitstream(cpi, dest, dest_size, size, &largest_tile_id) != 4118 AOM_CODEC_OK) 4119 return AOM_CODEC_ERROR; 4120 4121 if (seq_params->frame_id_numbers_present_flag && 4122 current_frame->frame_type == KEY_FRAME) { 4123 // Displaying a forward key-frame, so reset the ref buffer IDs 4124 int display_frame_id = cm->ref_frame_id[cpi->existing_fb_idx_to_show]; 4125 for (int i = 0; i < REF_FRAMES; i++) 4126 cm->ref_frame_id[i] = display_frame_id; 4127 } 4128 4129 #if DUMP_RECON_FRAMES == 1 4130 // NOTE(zoeliu): For debug - Output the filtered reconstructed video. 4131 av1_dump_filtered_recon_frames(cpi); 4132 #endif // DUMP_RECON_FRAMES 4133 4134 // NOTE: Save the new show frame buffer index for --test-code=warn, i.e., 4135 // for the purpose to verify no mismatch between encoder and decoder. 4136 if (cm->show_frame) cpi->last_show_frame_buf = cm->cur_frame; 4137 4138 #if CONFIG_AV1_TEMPORAL_DENOISING 4139 av1_denoiser_update_ref_frame(cpi); 4140 #endif 4141 4142 // Since we allocate a spot for the OVERLAY frame in the gf group, we need 4143 // to do post-encoding update accordingly. 4144 av1_set_target_rate(cpi, cm->width, cm->height); 4145 4146 if (is_psnr_calc_enabled(cpi)) { 4147 cpi->source = 4148 realloc_and_scale_source(cpi, cm->cur_frame->buf.y_crop_width, 4149 cm->cur_frame->buf.y_crop_height); 4150 } 4151 4152 #if !CONFIG_REALTIME_ONLY 4153 if (cpi->use_ducky_encode) { 4154 PSNR_STATS psnr; 4155 aom_calc_psnr(cpi->source, &cpi->common.cur_frame->buf, &psnr); 4156 DuckyEncodeFrameResult *frame_result = 4157 &cpi->ducky_encode_info.frame_result; 4158 frame_result->global_order_idx = cm->cur_frame->display_order_hint; 4159 frame_result->q_index = cm->quant_params.base_qindex; 4160 frame_result->rdmult = cpi->rd.RDMULT; 4161 frame_result->rate = (int)(*size) * 8; 4162 frame_result->dist = psnr.sse[0]; 4163 frame_result->psnr = psnr.psnr[0]; 4164 } 4165 #endif // !CONFIG_REALTIME_ONLY 4166 4167 update_counters_for_show_frame(cpi); 4168 return AOM_CODEC_OK; 4169 } 4170 4171 // Work out whether to force_integer_mv this frame 4172 if (!is_stat_generation_stage(cpi) && 4173 cpi->common.features.allow_screen_content_tools && 4174 !frame_is_intra_only(cm) && !cpi->sf.rt_sf.use_nonrd_pick_mode) { 4175 if (cpi->common.seq_params->force_integer_mv == 2) { 4176 // Adaptive mode: see what previous frame encoded did 4177 if (cpi->unscaled_last_source != NULL) { 4178 features->cur_frame_force_integer_mv = av1_is_integer_mv( 4179 cpi->source, cpi->unscaled_last_source, &cpi->force_intpel_info); 4180 } else { 4181 cpi->common.features.cur_frame_force_integer_mv = 0; 4182 } 4183 } else { 4184 cpi->common.features.cur_frame_force_integer_mv = 4185 cpi->common.seq_params->force_integer_mv; 4186 } 4187 } else { 4188 cpi->common.features.cur_frame_force_integer_mv = 0; 4189 } 4190 4191 // This is used by av1_pack_bitstream. So this needs to be set in case of 4192 // row-mt where the encoding code will use a temporary structure. 4193 cpi->td.mb.e_mbd.cur_frame_force_integer_mv = 4194 cpi->common.features.cur_frame_force_integer_mv; 4195 4196 // Set default state for segment based loop filter update flags. 4197 cm->lf.mode_ref_delta_update = 0; 4198 4199 // Set various flags etc to special state if it is a key frame. 4200 if (frame_is_intra_only(cm) || frame_is_sframe(cm)) { 4201 // Reset the loop filter deltas and segmentation map. 4202 av1_reset_segment_features(cm); 4203 4204 // If segmentation is enabled force a map update for key frames. 4205 if (seg->enabled) { 4206 seg->update_map = 1; 4207 seg->update_data = 1; 4208 } 4209 } 4210 if (tile_cfg->mtu == 0) { 4211 cpi->num_tg = tile_cfg->num_tile_groups; 4212 } else { 4213 // Use a default value for the purposes of weighting costs in probability 4214 // updates 4215 cpi->num_tg = DEFAULT_MAX_NUM_TG; 4216 } 4217 4218 // For 1 pass CBR mode: check if we are dropping this frame. 4219 if (has_no_stats_stage(cpi) && oxcf->rc_cfg.mode == AOM_CBR) { 4220 // Always drop for spatial enhancement layer if layer bandwidth is 0. 4221 // Otherwise check for frame-dropping based on buffer level in 4222 // av1_rc_drop_frame(). 4223 if ((cpi->svc.spatial_layer_id > 0 && 4224 cpi->oxcf.rc_cfg.target_bandwidth == 0) || 4225 av1_rc_drop_frame(cpi)) { 4226 cpi->is_dropped_frame = true; 4227 } 4228 if (cpi->is_dropped_frame) { 4229 av1_setup_frame_size(cpi); 4230 av1_set_mv_search_params(cpi); 4231 av1_rc_postencode_update_drop_frame(cpi); 4232 release_scaled_references(cpi); 4233 cpi->ppi->gf_group.is_frame_dropped[cpi->gf_frame_index] = true; 4234 // A dropped frame might not be shown but it always takes a slot in the gf 4235 // group. Therefore, even when it is not shown, we still need to update 4236 // the relevant frame counters. 4237 if (cm->show_frame) { 4238 update_counters_for_show_frame(cpi); 4239 } 4240 return AOM_CODEC_OK; 4241 } 4242 } 4243 4244 if (oxcf->tune_cfg.tuning == AOM_TUNE_SSIM || 4245 oxcf->tune_cfg.tuning == AOM_TUNE_IQ || 4246 oxcf->tune_cfg.tuning == AOM_TUNE_SSIMULACRA2) { 4247 av1_set_mb_ssim_rdmult_scaling(cpi); 4248 } 4249 #if CONFIG_SALIENCY_MAP 4250 else if (oxcf->tune_cfg.tuning == AOM_TUNE_VMAF_SALIENCY_MAP && 4251 !(cpi->source->flags & YV12_FLAG_HIGHBITDEPTH)) { 4252 if (av1_set_saliency_map(cpi) == 0) { 4253 return AOM_CODEC_MEM_ERROR; 4254 } 4255 #if !CONFIG_REALTIME_ONLY 4256 double motion_ratio = av1_setup_motion_ratio(cpi); 4257 #else 4258 double motion_ratio = 1.0; 4259 #endif 4260 if (av1_setup_sm_rdmult_scaling_factor(cpi, motion_ratio) == 0) { 4261 return AOM_CODEC_MEM_ERROR; 4262 } 4263 } 4264 #endif 4265 #if CONFIG_TUNE_VMAF 4266 else if (oxcf->tune_cfg.tuning == AOM_TUNE_VMAF_WITHOUT_PREPROCESSING || 4267 oxcf->tune_cfg.tuning == AOM_TUNE_VMAF_MAX_GAIN || 4268 oxcf->tune_cfg.tuning == AOM_TUNE_VMAF_NEG_MAX_GAIN) { 4269 av1_set_mb_vmaf_rdmult_scaling(cpi); 4270 } 4271 #endif 4272 4273 if (cpi->oxcf.q_cfg.deltaq_mode == DELTA_Q_PERCEPTUAL_AI && 4274 cpi->sf.rt_sf.use_nonrd_pick_mode == 0) { 4275 av1_init_mb_wiener_var_buffer(cpi); 4276 av1_set_mb_wiener_variance(cpi); 4277 } 4278 4279 if (cpi->oxcf.q_cfg.deltaq_mode == DELTA_Q_USER_RATING_BASED) { 4280 av1_init_mb_ur_var_buffer(cpi); 4281 av1_set_mb_ur_variance(cpi); 4282 } 4283 4284 #if CONFIG_INTERNAL_STATS 4285 memset(cpi->mode_chosen_counts, 0, 4286 MAX_MODES * sizeof(*cpi->mode_chosen_counts)); 4287 #endif 4288 4289 if (seq_params->frame_id_numbers_present_flag) { 4290 /* Non-normative definition of current_frame_id ("frame counter" with 4291 * wraparound) */ 4292 if (cm->current_frame_id == -1) { 4293 int lsb, msb; 4294 /* quasi-random initialization of current_frame_id for a key frame */ 4295 if (cpi->source->flags & YV12_FLAG_HIGHBITDEPTH) { 4296 lsb = CONVERT_TO_SHORTPTR(cpi->source->y_buffer)[0] & 0xff; 4297 msb = CONVERT_TO_SHORTPTR(cpi->source->y_buffer)[1] & 0xff; 4298 } else { 4299 lsb = cpi->source->y_buffer[0] & 0xff; 4300 msb = cpi->source->y_buffer[1] & 0xff; 4301 } 4302 cm->current_frame_id = 4303 ((msb << 8) + lsb) % (1 << seq_params->frame_id_length); 4304 4305 // S_frame is meant for stitching different streams of different 4306 // resolutions together, so current_frame_id must be the 4307 // same across different streams of the same content current_frame_id 4308 // should be the same and not random. 0x37 is a chosen number as start 4309 // point 4310 if (oxcf->kf_cfg.sframe_dist != 0) cm->current_frame_id = 0x37; 4311 } else { 4312 cm->current_frame_id = 4313 (cm->current_frame_id + 1 + (1 << seq_params->frame_id_length)) % 4314 (1 << seq_params->frame_id_length); 4315 } 4316 } 4317 4318 switch (oxcf->algo_cfg.cdf_update_mode) { 4319 case 0: // No CDF update for any frames(4~6% compression loss). 4320 features->disable_cdf_update = 1; 4321 break; 4322 case 1: // Enable CDF update for all frames. 4323 if (cpi->sf.rt_sf.disable_cdf_update_non_reference_frame && 4324 cpi->ppi->rtc_ref.non_reference_frame && cpi->rc.frames_since_key > 2) 4325 features->disable_cdf_update = 1; 4326 else if (cpi->sf.rt_sf.selective_cdf_update) 4327 features->disable_cdf_update = selective_disable_cdf_rtc(cpi); 4328 else 4329 features->disable_cdf_update = 0; 4330 break; 4331 case 2: 4332 // Strategically determine at which frames to do CDF update. 4333 // Currently only enable CDF update for all-intra and no-show frames(1.5% 4334 // compression loss) for good qualiy or allintra mode. 4335 if (oxcf->mode == GOOD || oxcf->mode == ALLINTRA) { 4336 features->disable_cdf_update = 4337 (frame_is_intra_only(cm) || !cm->show_frame) ? 0 : 1; 4338 } else { 4339 features->disable_cdf_update = selective_disable_cdf_rtc(cpi); 4340 } 4341 break; 4342 } 4343 4344 // Disable cdf update for the INTNL_ARF_UPDATE frame with 4345 // frame_parallel_level 1. 4346 if (!cpi->do_frame_data_update && 4347 cpi->ppi->gf_group.update_type[cpi->gf_frame_index] == INTNL_ARF_UPDATE) { 4348 assert(cpi->ppi->gf_group.frame_parallel_level[cpi->gf_frame_index] == 1); 4349 features->disable_cdf_update = 1; 4350 } 4351 4352 #if !CONFIG_REALTIME_ONLY 4353 if (cpi->oxcf.tool_cfg.enable_global_motion && !frame_is_intra_only(cm)) { 4354 // Flush any stale global motion information, which may be left over 4355 // from a previous frame 4356 aom_invalidate_pyramid(cpi->source->y_pyramid); 4357 av1_invalidate_corner_list(cpi->source->corners); 4358 } 4359 #endif // !CONFIG_REALTIME_ONLY 4360 4361 int largest_tile_id = 0; 4362 if (av1_superres_in_recode_allowed(cpi)) { 4363 if (encode_with_and_without_superres(cpi, size, dest, dest_size, 4364 &largest_tile_id) != AOM_CODEC_OK) { 4365 return AOM_CODEC_ERROR; 4366 } 4367 } else { 4368 const aom_superres_mode orig_superres_mode = cpi->superres_mode; // save 4369 cpi->superres_mode = cpi->oxcf.superres_cfg.superres_mode; 4370 if (encode_with_recode_loop_and_filter(cpi, size, dest, dest_size, NULL, 4371 NULL, 4372 &largest_tile_id) != AOM_CODEC_OK) { 4373 return AOM_CODEC_ERROR; 4374 } 4375 cpi->superres_mode = orig_superres_mode; // restore 4376 } 4377 4378 // Update reference frame ids for reference frames this frame will overwrite 4379 if (seq_params->frame_id_numbers_present_flag) { 4380 for (int i = 0; i < REF_FRAMES; i++) { 4381 if ((current_frame->refresh_frame_flags >> i) & 1) { 4382 cm->ref_frame_id[i] = cm->current_frame_id; 4383 } 4384 } 4385 } 4386 4387 if (cpi->svc.spatial_layer_id == cpi->svc.number_spatial_layers - 1) 4388 cpi->svc.num_encoded_top_layer++; 4389 4390 #if DUMP_RECON_FRAMES == 1 4391 // NOTE(zoeliu): For debug - Output the filtered reconstructed video. 4392 av1_dump_filtered_recon_frames(cpi); 4393 #endif // DUMP_RECON_FRAMES 4394 4395 if (cm->seg.enabled) { 4396 if (cm->seg.update_map == 0 && cm->last_frame_seg_map) { 4397 memcpy(cm->cur_frame->seg_map, cm->last_frame_seg_map, 4398 cm->cur_frame->mi_cols * cm->cur_frame->mi_rows * 4399 sizeof(*cm->cur_frame->seg_map)); 4400 } 4401 } 4402 4403 int release_scaled_refs = 0; 4404 #if CONFIG_FPMT_TEST 4405 release_scaled_refs = 4406 (cpi->ppi->fpmt_unit_test_cfg == PARALLEL_SIMULATION_ENCODE) ? 1 : 0; 4407 #endif // CONFIG_FPMT_TEST 4408 if (release_scaled_refs || 4409 cpi->ppi->gf_group.frame_parallel_level[cpi->gf_frame_index] == 0) { 4410 if (frame_is_intra_only(cm) == 0) { 4411 release_scaled_references(cpi); 4412 } 4413 } 4414 #if CONFIG_AV1_TEMPORAL_DENOISING 4415 av1_denoiser_update_ref_frame(cpi); 4416 #endif 4417 4418 // NOTE: Save the new show frame buffer index for --test-code=warn, i.e., 4419 // for the purpose to verify no mismatch between encoder and decoder. 4420 if (cm->show_frame) cpi->last_show_frame_buf = cm->cur_frame; 4421 4422 if (features->refresh_frame_context == REFRESH_FRAME_CONTEXT_BACKWARD) { 4423 *cm->fc = cpi->tile_data[largest_tile_id].tctx; 4424 av1_reset_cdf_symbol_counters(cm->fc); 4425 } 4426 if (!cm->tiles.large_scale) { 4427 cm->cur_frame->frame_context = *cm->fc; 4428 } 4429 4430 if (tile_cfg->enable_ext_tile_debug) { 4431 // (yunqing) This test ensures the correctness of large scale tile coding. 4432 if (cm->tiles.large_scale && is_stat_consumption_stage(cpi)) { 4433 char fn[20] = "./fc"; 4434 fn[4] = current_frame->frame_number / 100 + '0'; 4435 fn[5] = (current_frame->frame_number % 100) / 10 + '0'; 4436 fn[6] = (current_frame->frame_number % 10) + '0'; 4437 fn[7] = '\0'; 4438 av1_print_frame_contexts(cm->fc, fn); 4439 } 4440 } 4441 4442 cpi->last_frame_type = current_frame->frame_type; 4443 4444 if (cm->features.disable_cdf_update) { 4445 cpi->frames_since_last_update++; 4446 } else { 4447 cpi->frames_since_last_update = 1; 4448 } 4449 4450 if (cpi->svc.spatial_layer_id == cpi->svc.number_spatial_layers - 1) { 4451 cpi->svc.prev_number_spatial_layers = cpi->svc.number_spatial_layers; 4452 } 4453 cpi->svc.prev_number_temporal_layers = cpi->svc.number_temporal_layers; 4454 4455 // Clear the one shot update flags for segmentation map and mode/ref loop 4456 // filter deltas. 4457 cm->seg.update_map = 0; 4458 cm->seg.update_data = 0; 4459 cm->lf.mode_ref_delta_update = 0; 4460 4461 if (cm->show_frame) { 4462 update_counters_for_show_frame(cpi); 4463 } 4464 4465 #if CONFIG_COLLECT_COMPONENT_TIMING 4466 end_timing(cpi, encode_frame_to_data_rate_time); 4467 #endif 4468 4469 return AOM_CODEC_OK; 4470 } 4471 4472 int av1_encode(AV1_COMP *const cpi, uint8_t *const dest, size_t dest_size, 4473 const EncodeFrameInput *const frame_input, 4474 const EncodeFrameParams *const frame_params, 4475 size_t *const frame_size) { 4476 AV1_COMMON *const cm = &cpi->common; 4477 CurrentFrame *const current_frame = &cm->current_frame; 4478 4479 cpi->unscaled_source = frame_input->source; 4480 cpi->source = frame_input->source; 4481 cpi->unscaled_last_source = frame_input->last_source; 4482 4483 current_frame->refresh_frame_flags = frame_params->refresh_frame_flags; 4484 cm->features.error_resilient_mode = frame_params->error_resilient_mode; 4485 cm->features.primary_ref_frame = frame_params->primary_ref_frame; 4486 cm->current_frame.frame_type = frame_params->frame_type; 4487 cm->show_frame = frame_params->show_frame; 4488 cpi->ref_frame_flags = frame_params->ref_frame_flags; 4489 cpi->speed = frame_params->speed; 4490 cm->show_existing_frame = frame_params->show_existing_frame; 4491 cpi->existing_fb_idx_to_show = frame_params->existing_fb_idx_to_show; 4492 4493 memcpy(cm->remapped_ref_idx, frame_params->remapped_ref_idx, 4494 REF_FRAMES * sizeof(*cm->remapped_ref_idx)); 4495 4496 memcpy(&cpi->refresh_frame, &frame_params->refresh_frame, 4497 sizeof(cpi->refresh_frame)); 4498 4499 if (current_frame->frame_type == KEY_FRAME && 4500 cpi->ppi->gf_group.refbuf_state[cpi->gf_frame_index] == REFBUF_RESET) { 4501 current_frame->frame_number = 0; 4502 } 4503 4504 current_frame->order_hint = 4505 current_frame->frame_number + frame_params->order_offset; 4506 4507 current_frame->display_order_hint = current_frame->order_hint; 4508 current_frame->order_hint %= 4509 (1 << (cm->seq_params->order_hint_info.order_hint_bits_minus_1 + 1)); 4510 4511 current_frame->pyramid_level = get_true_pyr_level( 4512 cpi->ppi->gf_group.layer_depth[cpi->gf_frame_index], 4513 current_frame->display_order_hint, cpi->ppi->gf_group.max_layer_depth); 4514 4515 if (is_stat_generation_stage(cpi)) { 4516 #if !CONFIG_REALTIME_ONLY 4517 if (cpi->oxcf.q_cfg.use_fixed_qp_offsets) 4518 av1_noop_first_pass_frame(cpi, frame_input->ts_duration); 4519 else 4520 av1_first_pass(cpi, frame_input->ts_duration); 4521 #endif 4522 } else if (cpi->oxcf.pass == AOM_RC_ONE_PASS || 4523 cpi->oxcf.pass >= AOM_RC_SECOND_PASS) { 4524 if (encode_frame_to_data_rate(cpi, frame_size, dest, dest_size) != 4525 AOM_CODEC_OK) { 4526 return AOM_CODEC_ERROR; 4527 } 4528 } else { 4529 return AOM_CODEC_ERROR; 4530 } 4531 4532 return AOM_CODEC_OK; 4533 } 4534 4535 #if CONFIG_DENOISE && !CONFIG_REALTIME_ONLY 4536 static int apply_denoise_2d(AV1_COMP *cpi, const YV12_BUFFER_CONFIG *sd, 4537 int block_size, float noise_level, 4538 int64_t time_stamp, int64_t end_time) { 4539 AV1_COMMON *const cm = &cpi->common; 4540 if (!cpi->denoise_and_model) { 4541 cpi->denoise_and_model = aom_denoise_and_model_alloc( 4542 cm->seq_params->bit_depth, block_size, noise_level); 4543 if (!cpi->denoise_and_model) { 4544 aom_set_error(cm->error, AOM_CODEC_MEM_ERROR, 4545 "Error allocating denoise and model"); 4546 return -1; 4547 } 4548 } 4549 if (!cpi->film_grain_table) { 4550 cpi->film_grain_table = aom_malloc(sizeof(*cpi->film_grain_table)); 4551 if (!cpi->film_grain_table) { 4552 aom_set_error(cm->error, AOM_CODEC_MEM_ERROR, 4553 "Error allocating grain table"); 4554 return -1; 4555 } 4556 memset(cpi->film_grain_table, 0, sizeof(*cpi->film_grain_table)); 4557 } 4558 if (aom_denoise_and_model_run(cpi->denoise_and_model, sd, 4559 &cm->film_grain_params, 4560 cpi->oxcf.enable_dnl_denoising)) { 4561 if (cm->film_grain_params.apply_grain) { 4562 aom_film_grain_table_append(cpi->film_grain_table, time_stamp, end_time, 4563 &cm->film_grain_params); 4564 } 4565 } 4566 return 0; 4567 } 4568 #endif 4569 4570 int av1_receive_raw_frame(AV1_COMP *cpi, aom_enc_frame_flags_t frame_flags, 4571 const YV12_BUFFER_CONFIG *sd, int64_t time_stamp, 4572 int64_t end_time) { 4573 AV1_COMMON *const cm = &cpi->common; 4574 const SequenceHeader *const seq_params = cm->seq_params; 4575 int res = 0; 4576 const int subsampling_x = sd->subsampling_x; 4577 const int subsampling_y = sd->subsampling_y; 4578 const int use_highbitdepth = (sd->flags & YV12_FLAG_HIGHBITDEPTH) != 0; 4579 4580 #if CONFIG_TUNE_VMAF 4581 if (!is_stat_generation_stage(cpi) && 4582 cpi->oxcf.tune_cfg.tuning == AOM_TUNE_VMAF_WITH_PREPROCESSING) { 4583 av1_vmaf_frame_preprocessing(cpi, sd); 4584 } 4585 if (!is_stat_generation_stage(cpi) && 4586 cpi->oxcf.tune_cfg.tuning == AOM_TUNE_VMAF_MAX_GAIN) { 4587 av1_vmaf_blk_preprocessing(cpi, sd); 4588 } 4589 #endif 4590 4591 #if CONFIG_INTERNAL_STATS 4592 struct aom_usec_timer timer; 4593 aom_usec_timer_start(&timer); 4594 #endif 4595 4596 #if CONFIG_AV1_TEMPORAL_DENOISING 4597 setup_denoiser_buffer(cpi); 4598 #endif 4599 4600 #if CONFIG_DENOISE 4601 // even if denoise_noise_level is > 0, we don't need need to denoise on pass 4602 // 1 of 2 if enable_dnl_denoising is disabled since the 2nd pass will be 4603 // encoding the original (non-denoised) frame 4604 if (cpi->oxcf.noise_level > 0 && !(cpi->oxcf.pass == AOM_RC_FIRST_PASS && 4605 !cpi->oxcf.enable_dnl_denoising)) { 4606 #if !CONFIG_REALTIME_ONLY 4607 // Choose a synthetic noise level for still images for enhanced perceptual 4608 // quality based on an estimated noise level in the source, but only if 4609 // the noise level is set on the command line to > 0. 4610 if (cpi->oxcf.mode == ALLINTRA) { 4611 // No noise synthesis if source is very clean. 4612 // Uses a low edge threshold to focus on smooth areas. 4613 // Increase output noise setting a little compared to measured value. 4614 double y_noise_level = 0.0; 4615 av1_estimate_noise_level(sd, &y_noise_level, AOM_PLANE_Y, AOM_PLANE_Y, 4616 cm->seq_params->bit_depth, 16); 4617 cpi->oxcf.noise_level = (float)(y_noise_level - 0.1); 4618 cpi->oxcf.noise_level = (float)AOMMAX(0.0, cpi->oxcf.noise_level); 4619 if (cpi->oxcf.noise_level > 0.0) { 4620 cpi->oxcf.noise_level += (float)0.5; 4621 } 4622 cpi->oxcf.noise_level = (float)AOMMIN(5.0, cpi->oxcf.noise_level); 4623 } 4624 4625 if (apply_denoise_2d(cpi, sd, cpi->oxcf.noise_block_size, 4626 cpi->oxcf.noise_level, time_stamp, end_time) < 0) 4627 res = -1; 4628 #endif // !CONFIG_REALTIME_ONLY 4629 } 4630 #endif // CONFIG_DENOISE 4631 4632 if (av1_lookahead_push(cpi->ppi->lookahead, sd, time_stamp, end_time, 4633 use_highbitdepth, cpi->alloc_pyramid, frame_flags)) { 4634 aom_set_error(cm->error, AOM_CODEC_ERROR, "av1_lookahead_push() failed"); 4635 res = -1; 4636 } 4637 #if CONFIG_INTERNAL_STATS 4638 aom_usec_timer_mark(&timer); 4639 cpi->ppi->total_time_receive_data += aom_usec_timer_elapsed(&timer); 4640 #endif 4641 4642 // Note: Regarding profile setting, the following checks are added to help 4643 // choose a proper profile for the input video. The criterion is that all 4644 // bitstreams must be designated as the lowest profile that match its content. 4645 // E.G. A bitstream that contains 4:4:4 video must be designated as High 4646 // Profile in the seq header, and likewise a bitstream that contains 4:2:2 4647 // bitstream must be designated as Professional Profile in the sequence 4648 // header. 4649 if ((seq_params->profile == PROFILE_0) && !seq_params->monochrome && 4650 (subsampling_x != 1 || subsampling_y != 1)) { 4651 aom_set_error(cm->error, AOM_CODEC_INVALID_PARAM, 4652 "Non-4:2:0 color format requires profile 1 or 2"); 4653 res = -1; 4654 } 4655 if ((seq_params->profile == PROFILE_1) && 4656 !(subsampling_x == 0 && subsampling_y == 0)) { 4657 aom_set_error(cm->error, AOM_CODEC_INVALID_PARAM, 4658 "Profile 1 requires 4:4:4 color format"); 4659 res = -1; 4660 } 4661 if ((seq_params->profile == PROFILE_2) && 4662 (seq_params->bit_depth <= AOM_BITS_10) && 4663 !(subsampling_x == 1 && subsampling_y == 0)) { 4664 aom_set_error(cm->error, AOM_CODEC_INVALID_PARAM, 4665 "Profile 2 bit-depth <= 10 requires 4:2:2 color format"); 4666 res = -1; 4667 } 4668 4669 return res; 4670 } 4671 4672 #if CONFIG_ENTROPY_STATS 4673 void print_entropy_stats(AV1_PRIMARY *const ppi) { 4674 if (!ppi->cpi) return; 4675 4676 if (ppi->cpi->oxcf.pass != 1 && 4677 ppi->cpi->common.current_frame.frame_number > 0) { 4678 fprintf(stderr, "Writing counts.stt\n"); 4679 FILE *f = fopen("counts.stt", "wb"); 4680 fwrite(&ppi->aggregate_fc, sizeof(ppi->aggregate_fc), 1, f); 4681 fclose(f); 4682 } 4683 } 4684 #endif // CONFIG_ENTROPY_STATS 4685 4686 #if CONFIG_INTERNAL_STATS 4687 static void adjust_image_stat(double y, double u, double v, double all, 4688 ImageStat *s) { 4689 s->stat[STAT_Y] += y; 4690 s->stat[STAT_U] += u; 4691 s->stat[STAT_V] += v; 4692 s->stat[STAT_ALL] += all; 4693 s->worst = AOMMIN(s->worst, all); 4694 } 4695 4696 static void compute_internal_stats(AV1_COMP *cpi, int frame_bytes) { 4697 AV1_PRIMARY *const ppi = cpi->ppi; 4698 AV1_COMMON *const cm = &cpi->common; 4699 double samples = 0.0; 4700 const uint32_t in_bit_depth = cpi->oxcf.input_cfg.input_bit_depth; 4701 const uint32_t bit_depth = cpi->td.mb.e_mbd.bd; 4702 4703 if (cpi->ppi->use_svc && 4704 cpi->svc.spatial_layer_id < cpi->svc.number_spatial_layers - 1) 4705 return; 4706 4707 #if CONFIG_INTER_STATS_ONLY 4708 if (cm->current_frame.frame_type == KEY_FRAME) return; // skip key frame 4709 #endif 4710 cpi->bytes += frame_bytes; 4711 if (cm->show_frame) { 4712 const YV12_BUFFER_CONFIG *orig = cpi->source; 4713 const YV12_BUFFER_CONFIG *recon = &cpi->common.cur_frame->buf; 4714 double y, u, v, frame_all; 4715 4716 ppi->count[0]++; 4717 ppi->count[1]++; 4718 if (cpi->ppi->b_calculate_psnr) { 4719 PSNR_STATS psnr; 4720 double weight[2] = { 0.0, 0.0 }; 4721 double frame_ssim2[2] = { 0.0, 0.0 }; 4722 #if CONFIG_AV1_HIGHBITDEPTH 4723 aom_calc_highbd_psnr(orig, recon, &psnr, bit_depth, in_bit_depth); 4724 #else 4725 aom_calc_psnr(orig, recon, &psnr); 4726 #endif 4727 adjust_image_stat(psnr.psnr[1], psnr.psnr[2], psnr.psnr[3], psnr.psnr[0], 4728 &(ppi->psnr[0])); 4729 ppi->total_sq_error[0] += psnr.sse[0]; 4730 ppi->total_samples[0] += psnr.samples[0]; 4731 samples = psnr.samples[0]; 4732 4733 aom_calc_ssim(orig, recon, bit_depth, in_bit_depth, 4734 cm->seq_params->use_highbitdepth, weight, frame_ssim2); 4735 4736 ppi->worst_ssim = AOMMIN(ppi->worst_ssim, frame_ssim2[0]); 4737 ppi->summed_quality += frame_ssim2[0] * weight[0]; 4738 ppi->summed_weights += weight[0]; 4739 4740 #if CONFIG_AV1_HIGHBITDEPTH 4741 // Compute PSNR based on stream bit depth 4742 if ((cpi->source->flags & YV12_FLAG_HIGHBITDEPTH) && 4743 (in_bit_depth < bit_depth)) { 4744 adjust_image_stat(psnr.psnr_hbd[1], psnr.psnr_hbd[2], psnr.psnr_hbd[3], 4745 psnr.psnr_hbd[0], &ppi->psnr[1]); 4746 ppi->total_sq_error[1] += psnr.sse_hbd[0]; 4747 ppi->total_samples[1] += psnr.samples_hbd[0]; 4748 4749 ppi->worst_ssim_hbd = AOMMIN(ppi->worst_ssim_hbd, frame_ssim2[1]); 4750 ppi->summed_quality_hbd += frame_ssim2[1] * weight[1]; 4751 ppi->summed_weights_hbd += weight[1]; 4752 } 4753 #endif 4754 4755 #if 0 4756 { 4757 FILE *f = fopen("q_used.stt", "a"); 4758 double y2 = psnr.psnr[1]; 4759 double u2 = psnr.psnr[2]; 4760 double v2 = psnr.psnr[3]; 4761 double frame_psnr2 = psnr.psnr[0]; 4762 fprintf(f, "%5d : Y%f7.3:U%f7.3:V%f7.3:F%f7.3:S%7.3f\n", 4763 cm->current_frame.frame_number, y2, u2, v2, 4764 frame_psnr2, frame_ssim2); 4765 fclose(f); 4766 } 4767 #endif 4768 } 4769 if (ppi->b_calculate_blockiness) { 4770 if (!cm->seq_params->use_highbitdepth) { 4771 const double frame_blockiness = 4772 av1_get_blockiness(orig->y_buffer, orig->y_stride, recon->y_buffer, 4773 recon->y_stride, orig->y_width, orig->y_height); 4774 ppi->worst_blockiness = AOMMAX(ppi->worst_blockiness, frame_blockiness); 4775 ppi->total_blockiness += frame_blockiness; 4776 } 4777 4778 if (ppi->b_calculate_consistency) { 4779 if (!cm->seq_params->use_highbitdepth) { 4780 const double this_inconsistency = aom_get_ssim_metrics( 4781 orig->y_buffer, orig->y_stride, recon->y_buffer, recon->y_stride, 4782 orig->y_width, orig->y_height, ppi->ssim_vars, &ppi->metrics, 1); 4783 4784 const double peak = (double)((1 << in_bit_depth) - 1); 4785 const double consistency = 4786 aom_sse_to_psnr(samples, peak, ppi->total_inconsistency); 4787 if (consistency > 0.0) 4788 ppi->worst_consistency = 4789 AOMMIN(ppi->worst_consistency, consistency); 4790 ppi->total_inconsistency += this_inconsistency; 4791 } 4792 } 4793 } 4794 4795 frame_all = 4796 aom_calc_fastssim(orig, recon, &y, &u, &v, bit_depth, in_bit_depth); 4797 adjust_image_stat(y, u, v, frame_all, &ppi->fastssim); 4798 frame_all = aom_psnrhvs(orig, recon, &y, &u, &v, bit_depth, in_bit_depth); 4799 adjust_image_stat(y, u, v, frame_all, &ppi->psnrhvs); 4800 } 4801 } 4802 4803 void print_internal_stats(AV1_PRIMARY *ppi) { 4804 if (!ppi->cpi) return; 4805 AV1_COMP *const cpi = ppi->cpi; 4806 4807 if (ppi->cpi->oxcf.pass != 1 && 4808 ppi->cpi->common.current_frame.frame_number > 0) { 4809 char headings[512] = { 0 }; 4810 char results[512] = { 0 }; 4811 FILE *f = fopen("opsnr.stt", "a"); 4812 double time_encoded = 4813 (cpi->time_stamps.prev_ts_end - cpi->time_stamps.first_ts_start) / 4814 10000000.000; 4815 double total_encode_time = 4816 (ppi->total_time_receive_data + ppi->total_time_compress_data) / 4817 1000.000; 4818 const double dr = 4819 (double)ppi->total_bytes * (double)8 / (double)1000 / time_encoded; 4820 const double peak = 4821 (double)((1 << ppi->cpi->oxcf.input_cfg.input_bit_depth) - 1); 4822 const double target_rate = 4823 (double)ppi->cpi->oxcf.rc_cfg.target_bandwidth / 1000; 4824 const double rate_err = ((100.0 * (dr - target_rate)) / target_rate); 4825 4826 if (ppi->b_calculate_psnr) { 4827 const double total_psnr = aom_sse_to_psnr( 4828 (double)ppi->total_samples[0], peak, (double)ppi->total_sq_error[0]); 4829 const double total_ssim = 4830 100 * pow(ppi->summed_quality / ppi->summed_weights, 8.0); 4831 snprintf(headings, sizeof(headings), 4832 "Bitrate\tAVGPsnr\tGLBPsnr\tAVPsnrP\tGLPsnrP\t" 4833 "AOMSSIM\tVPSSIMP\tFASTSIM\tPSNRHVS\t" 4834 "WstPsnr\tWstSsim\tWstFast\tWstHVS\t" 4835 "AVPsrnY\tAPsnrCb\tAPsnrCr"); 4836 snprintf(results, sizeof(results), 4837 "%7.2f\t%7.3f\t%7.3f\t%7.3f\t%7.3f\t" 4838 "%7.3f\t%7.3f\t%7.3f\t%7.3f\t" 4839 "%7.3f\t%7.3f\t%7.3f\t%7.3f\t" 4840 "%7.3f\t%7.3f\t%7.3f", 4841 dr, ppi->psnr[0].stat[STAT_ALL] / ppi->count[0], total_psnr, 4842 ppi->psnr[0].stat[STAT_ALL] / ppi->count[0], total_psnr, 4843 total_ssim, total_ssim, 4844 ppi->fastssim.stat[STAT_ALL] / ppi->count[0], 4845 ppi->psnrhvs.stat[STAT_ALL] / ppi->count[0], ppi->psnr[0].worst, 4846 ppi->worst_ssim, ppi->fastssim.worst, ppi->psnrhvs.worst, 4847 ppi->psnr[0].stat[STAT_Y] / ppi->count[0], 4848 ppi->psnr[0].stat[STAT_U] / ppi->count[0], 4849 ppi->psnr[0].stat[STAT_V] / ppi->count[0]); 4850 4851 if (ppi->b_calculate_blockiness) { 4852 SNPRINT(headings, "\t Block\tWstBlck"); 4853 SNPRINT2(results, "\t%7.3f", ppi->total_blockiness / ppi->count[0]); 4854 SNPRINT2(results, "\t%7.3f", ppi->worst_blockiness); 4855 } 4856 4857 if (ppi->b_calculate_consistency) { 4858 double consistency = 4859 aom_sse_to_psnr((double)ppi->total_samples[0], peak, 4860 (double)ppi->total_inconsistency); 4861 4862 SNPRINT(headings, "\tConsist\tWstCons"); 4863 SNPRINT2(results, "\t%7.3f", consistency); 4864 SNPRINT2(results, "\t%7.3f", ppi->worst_consistency); 4865 } 4866 4867 SNPRINT(headings, "\t Time\tRcErr\tAbsErr"); 4868 SNPRINT2(results, "\t%8.0f", total_encode_time); 4869 SNPRINT2(results, " %7.2f", rate_err); 4870 SNPRINT2(results, " %7.2f", fabs(rate_err)); 4871 4872 SNPRINT(headings, "\tAPsnr611"); 4873 SNPRINT2(results, " %7.3f", 4874 (6 * ppi->psnr[0].stat[STAT_Y] + ppi->psnr[0].stat[STAT_U] + 4875 ppi->psnr[0].stat[STAT_V]) / 4876 (ppi->count[0] * 8)); 4877 4878 #if CONFIG_AV1_HIGHBITDEPTH 4879 const uint32_t in_bit_depth = ppi->cpi->oxcf.input_cfg.input_bit_depth; 4880 const uint32_t bit_depth = ppi->seq_params.bit_depth; 4881 // Since cpi->source->flags is not available here, but total_samples[1] 4882 // will be non-zero if cpi->source->flags & YV12_FLAG_HIGHBITDEPTH was 4883 // true in compute_internal_stats 4884 if ((ppi->total_samples[1] > 0) && (in_bit_depth < bit_depth)) { 4885 const double peak_hbd = (double)((1 << bit_depth) - 1); 4886 const double total_psnr_hbd = 4887 aom_sse_to_psnr((double)ppi->total_samples[1], peak_hbd, 4888 (double)ppi->total_sq_error[1]); 4889 const double total_ssim_hbd = 4890 100 * pow(ppi->summed_quality_hbd / ppi->summed_weights_hbd, 8.0); 4891 SNPRINT(headings, 4892 "\t AVGPsnrH GLBPsnrH AVPsnrPH GLPsnrPH" 4893 " AVPsnrYH APsnrCbH APsnrCrH WstPsnrH" 4894 " AOMSSIMH VPSSIMPH WstSsimH"); 4895 SNPRINT2(results, "\t%7.3f", 4896 ppi->psnr[1].stat[STAT_ALL] / ppi->count[1]); 4897 SNPRINT2(results, " %7.3f", total_psnr_hbd); 4898 SNPRINT2(results, " %7.3f", 4899 ppi->psnr[1].stat[STAT_ALL] / ppi->count[1]); 4900 SNPRINT2(results, " %7.3f", total_psnr_hbd); 4901 SNPRINT2(results, " %7.3f", ppi->psnr[1].stat[STAT_Y] / ppi->count[1]); 4902 SNPRINT2(results, " %7.3f", ppi->psnr[1].stat[STAT_U] / ppi->count[1]); 4903 SNPRINT2(results, " %7.3f", ppi->psnr[1].stat[STAT_V] / ppi->count[1]); 4904 SNPRINT2(results, " %7.3f", ppi->psnr[1].worst); 4905 SNPRINT2(results, " %7.3f", total_ssim_hbd); 4906 SNPRINT2(results, " %7.3f", total_ssim_hbd); 4907 SNPRINT2(results, " %7.3f", ppi->worst_ssim_hbd); 4908 } 4909 #endif 4910 fprintf(f, "%s\n", headings); 4911 fprintf(f, "%s\n", results); 4912 } 4913 4914 fclose(f); 4915 4916 aom_free(ppi->ssim_vars); 4917 ppi->ssim_vars = NULL; 4918 } 4919 } 4920 #endif // CONFIG_INTERNAL_STATS 4921 4922 static inline void update_keyframe_counters(AV1_COMP *cpi) { 4923 if (cpi->common.show_frame && cpi->rc.frames_to_key) { 4924 #if !CONFIG_REALTIME_ONLY 4925 FIRSTPASS_INFO *firstpass_info = &cpi->ppi->twopass.firstpass_info; 4926 if (firstpass_info->past_stats_count > FIRSTPASS_INFO_STATS_PAST_MIN) { 4927 av1_firstpass_info_move_cur_index_and_pop(firstpass_info); 4928 } else { 4929 // When there is not enough past stats, we move the current 4930 // index without popping the past stats 4931 av1_firstpass_info_move_cur_index(firstpass_info); 4932 } 4933 #endif 4934 if (cpi->svc.spatial_layer_id == cpi->svc.number_spatial_layers - 1) { 4935 cpi->rc.frames_since_key++; 4936 cpi->rc.frames_to_key--; 4937 cpi->rc.frames_to_fwd_kf--; 4938 cpi->rc.frames_since_scene_change++; 4939 } 4940 } 4941 } 4942 4943 static inline void update_frames_till_gf_update(AV1_COMP *cpi) { 4944 // TODO(weitinglin): Updating this counter for is_frame_droppable 4945 // is a work-around to handle the condition when a frame is drop. 4946 // We should fix the cpi->common.show_frame flag 4947 // instead of checking the other condition to update the counter properly. 4948 if (cpi->common.show_frame || 4949 is_frame_droppable(&cpi->ppi->rtc_ref, &cpi->ext_flags.refresh_frame)) { 4950 // Decrement count down till next gf 4951 if (cpi->rc.frames_till_gf_update_due > 0) 4952 cpi->rc.frames_till_gf_update_due--; 4953 } 4954 } 4955 4956 static inline void update_gf_group_index(AV1_COMP *cpi) { 4957 // Increment the gf group index ready for the next frame. 4958 if (is_one_pass_rt_params(cpi) && 4959 cpi->svc.spatial_layer_id == cpi->svc.number_spatial_layers - 1) { 4960 ++cpi->gf_frame_index; 4961 // Reset gf_frame_index in case it reaches MAX_STATIC_GF_GROUP_LENGTH 4962 // for real time encoding. 4963 if (cpi->gf_frame_index == MAX_STATIC_GF_GROUP_LENGTH) 4964 cpi->gf_frame_index = 0; 4965 } else { 4966 ++cpi->gf_frame_index; 4967 } 4968 } 4969 4970 static void update_fb_of_context_type(const AV1_COMP *const cpi, 4971 int *const fb_of_context_type) { 4972 const AV1_COMMON *const cm = &cpi->common; 4973 const int current_frame_ref_type = get_current_frame_ref_type(cpi); 4974 4975 if (frame_is_intra_only(cm) || cm->features.error_resilient_mode || 4976 cpi->ext_flags.use_primary_ref_none) { 4977 for (int i = 0; i < REF_FRAMES; i++) { 4978 fb_of_context_type[i] = -1; 4979 } 4980 fb_of_context_type[current_frame_ref_type] = 4981 cm->show_frame ? get_ref_frame_map_idx(cm, GOLDEN_FRAME) 4982 : get_ref_frame_map_idx(cm, ALTREF_FRAME); 4983 } 4984 4985 if (!encode_show_existing_frame(cm)) { 4986 // Refresh fb_of_context_type[]: see encoder.h for explanation 4987 if (cm->current_frame.frame_type == KEY_FRAME) { 4988 // All ref frames are refreshed, pick one that will live long enough 4989 fb_of_context_type[current_frame_ref_type] = 0; 4990 } else { 4991 // If more than one frame is refreshed, it doesn't matter which one we 4992 // pick so pick the first. LST sometimes doesn't refresh any: this is ok 4993 4994 for (int i = 0; i < REF_FRAMES; i++) { 4995 if (cm->current_frame.refresh_frame_flags & (1 << i)) { 4996 fb_of_context_type[current_frame_ref_type] = i; 4997 break; 4998 } 4999 } 5000 } 5001 } 5002 } 5003 5004 static void update_rc_counts(AV1_COMP *cpi) { 5005 update_keyframe_counters(cpi); 5006 update_frames_till_gf_update(cpi); 5007 update_gf_group_index(cpi); 5008 } 5009 5010 static void update_end_of_frame_stats(AV1_COMP *cpi) { 5011 if (cpi->do_frame_data_update) { 5012 // Store current frame loopfilter levels in ppi, if update flag is set. 5013 if (!cpi->common.show_existing_frame) { 5014 AV1_COMMON *const cm = &cpi->common; 5015 struct loopfilter *const lf = &cm->lf; 5016 cpi->ppi->filter_level[0] = lf->backup_filter_level[0]; 5017 cpi->ppi->filter_level[1] = lf->backup_filter_level[1]; 5018 cpi->ppi->filter_level_u = lf->backup_filter_level_u; 5019 cpi->ppi->filter_level_v = lf->backup_filter_level_v; 5020 } 5021 } 5022 // Store frame level mv_stats from cpi to ppi. 5023 cpi->ppi->mv_stats = cpi->mv_stats; 5024 } 5025 5026 // Updates frame level stats related to global motion 5027 static inline void update_gm_stats(AV1_COMP *cpi) { 5028 FRAME_UPDATE_TYPE update_type = 5029 cpi->ppi->gf_group.update_type[cpi->gf_frame_index]; 5030 int i, is_gm_present = 0; 5031 5032 // Check if the current frame has any valid global motion model across its 5033 // reference frames 5034 for (i = 0; i < REF_FRAMES; i++) { 5035 if (cpi->common.global_motion[i].wmtype != IDENTITY) { 5036 is_gm_present = 1; 5037 break; 5038 } 5039 } 5040 int update_actual_stats = 1; 5041 #if CONFIG_FPMT_TEST 5042 update_actual_stats = 5043 (cpi->ppi->fpmt_unit_test_cfg == PARALLEL_SIMULATION_ENCODE) ? 0 : 1; 5044 if (!update_actual_stats) { 5045 if (cpi->ppi->temp_valid_gm_model_found[update_type] == INT32_MAX) { 5046 cpi->ppi->temp_valid_gm_model_found[update_type] = is_gm_present; 5047 } else { 5048 cpi->ppi->temp_valid_gm_model_found[update_type] |= is_gm_present; 5049 } 5050 int show_existing_between_parallel_frames = 5051 (cpi->ppi->gf_group.update_type[cpi->gf_frame_index] == 5052 INTNL_OVERLAY_UPDATE && 5053 cpi->ppi->gf_group.frame_parallel_level[cpi->gf_frame_index + 1] == 2); 5054 if (cpi->do_frame_data_update == 1 && 5055 !show_existing_between_parallel_frames) { 5056 for (i = 0; i < FRAME_UPDATE_TYPES; i++) { 5057 cpi->ppi->valid_gm_model_found[i] = 5058 cpi->ppi->temp_valid_gm_model_found[i]; 5059 } 5060 } 5061 } 5062 #endif 5063 if (update_actual_stats) { 5064 if (cpi->ppi->valid_gm_model_found[update_type] == INT32_MAX) { 5065 cpi->ppi->valid_gm_model_found[update_type] = is_gm_present; 5066 } else { 5067 cpi->ppi->valid_gm_model_found[update_type] |= is_gm_present; 5068 } 5069 } 5070 } 5071 5072 void av1_post_encode_updates(AV1_COMP *const cpi, 5073 const AV1_COMP_DATA *const cpi_data) { 5074 AV1_PRIMARY *const ppi = cpi->ppi; 5075 AV1_COMMON *const cm = &cpi->common; 5076 5077 update_gm_stats(cpi); 5078 5079 #if !CONFIG_REALTIME_ONLY 5080 // Update the total stats remaining structure. 5081 if (cpi->twopass_frame.this_frame != NULL && 5082 ppi->twopass.stats_buf_ctx->total_left_stats) { 5083 subtract_stats(ppi->twopass.stats_buf_ctx->total_left_stats, 5084 cpi->twopass_frame.this_frame); 5085 } 5086 #endif 5087 5088 #if CONFIG_OUTPUT_FRAME_SIZE 5089 FILE *f = fopen("frame_sizes.csv", "a"); 5090 fprintf(f, "%d,", 8 * (int)cpi_data->frame_size); 5091 fprintf(f, "%d\n", cm->quant_params.base_qindex); 5092 fclose(f); 5093 #endif // CONFIG_OUTPUT_FRAME_SIZE 5094 5095 if (!is_stat_generation_stage(cpi) && !cpi->is_dropped_frame) { 5096 // Before calling refresh_reference_frames(), copy ppi->ref_frame_map_copy 5097 // to cm->ref_frame_map for frame_parallel_level 2 frame in a parallel 5098 // encode set of lower layer frames. 5099 // TODO(Remya): Move ref_frame_map from AV1_COMMON to AV1_PRIMARY to avoid 5100 // copy. 5101 if (ppi->gf_group.frame_parallel_level[cpi->gf_frame_index] == 2 && 5102 ppi->gf_group.frame_parallel_level[cpi->gf_frame_index - 1] == 1 && 5103 ppi->gf_group.update_type[cpi->gf_frame_index - 1] == 5104 INTNL_ARF_UPDATE) { 5105 memcpy(cm->ref_frame_map, ppi->ref_frame_map_copy, 5106 sizeof(cm->ref_frame_map)); 5107 } 5108 refresh_reference_frames(cpi); 5109 // For frame_parallel_level 1 frame in a parallel encode set of lower layer 5110 // frames, store the updated cm->ref_frame_map in ppi->ref_frame_map_copy. 5111 if (ppi->gf_group.frame_parallel_level[cpi->gf_frame_index] == 1 && 5112 ppi->gf_group.update_type[cpi->gf_frame_index] == INTNL_ARF_UPDATE) { 5113 memcpy(ppi->ref_frame_map_copy, cm->ref_frame_map, 5114 sizeof(cm->ref_frame_map)); 5115 } 5116 av1_rc_postencode_update(cpi, cpi_data->frame_size); 5117 } 5118 5119 if (cpi_data->pop_lookahead == 1) { 5120 av1_lookahead_pop(cpi->ppi->lookahead, cpi_data->flush, 5121 cpi->compressor_stage); 5122 } 5123 if (cpi->common.show_frame) { 5124 cpi->ppi->ts_start_last_show_frame = cpi_data->ts_frame_start; 5125 cpi->ppi->ts_end_last_show_frame = cpi_data->ts_frame_end; 5126 } 5127 if (ppi->level_params.keep_level_stats && !is_stat_generation_stage(cpi)) { 5128 // Initialize level info. at the beginning of each sequence. 5129 if (cm->current_frame.frame_type == KEY_FRAME && 5130 ppi->gf_group.refbuf_state[cpi->gf_frame_index] == REFBUF_RESET) { 5131 av1_init_level_info(cpi); 5132 } 5133 av1_update_level_info(cpi, cpi_data->frame_size, cpi_data->ts_frame_start, 5134 cpi_data->ts_frame_end); 5135 } 5136 5137 if (!is_stat_generation_stage(cpi)) { 5138 #if !CONFIG_REALTIME_ONLY 5139 if (!has_no_stats_stage(cpi)) av1_twopass_postencode_update(cpi); 5140 #endif 5141 update_fb_of_context_type(cpi, ppi->fb_of_context_type); 5142 update_rc_counts(cpi); 5143 update_end_of_frame_stats(cpi); 5144 } 5145 5146 #if CONFIG_THREE_PASS 5147 if (cpi->oxcf.pass == AOM_RC_THIRD_PASS && cpi->third_pass_ctx) { 5148 av1_pop_third_pass_info(cpi->third_pass_ctx); 5149 } 5150 #endif 5151 5152 if (ppi->rtc_ref.set_ref_frame_config && !cpi->is_dropped_frame) { 5153 av1_svc_update_buffer_slot_refreshed(cpi); 5154 av1_svc_set_reference_was_previous(cpi); 5155 } 5156 5157 if (ppi->use_svc) av1_save_layer_context(cpi); 5158 5159 // Note *size = 0 indicates a dropped frame for which psnr is not calculated 5160 if (ppi->b_calculate_psnr && cpi_data->frame_size > 0) { 5161 if (cm->show_existing_frame || 5162 (!is_stat_generation_stage(cpi) && cm->show_frame)) { 5163 generate_psnr_packet(cpi); 5164 } 5165 } 5166 5167 #if CONFIG_INTERNAL_STATS 5168 if (!is_stat_generation_stage(cpi)) { 5169 compute_internal_stats(cpi, (int)cpi_data->frame_size); 5170 } 5171 #endif // CONFIG_INTERNAL_STATS 5172 5173 #if CONFIG_THREE_PASS 5174 // Write frame info. Subtract 1 from frame index since if was incremented in 5175 // update_rc_counts. 5176 av1_write_second_pass_per_frame_info(cpi, cpi->gf_frame_index - 1); 5177 #endif 5178 } 5179 5180 int av1_get_compressed_data(AV1_COMP *cpi, AV1_COMP_DATA *const cpi_data) { 5181 const AV1EncoderConfig *const oxcf = &cpi->oxcf; 5182 AV1_COMMON *const cm = &cpi->common; 5183 5184 // The jmp_buf is valid only for the duration of the function that calls 5185 // setjmp(). Therefore, this function must reset the 'setjmp' field to 0 5186 // before it returns. 5187 if (setjmp(cm->error->jmp)) { 5188 cm->error->setjmp = 0; 5189 return cm->error->error_code; 5190 } 5191 cm->error->setjmp = 1; 5192 5193 #if CONFIG_INTERNAL_STATS 5194 cpi->frame_recode_hits = 0; 5195 cpi->time_compress_data = 0; 5196 cpi->bytes = 0; 5197 #endif 5198 #if CONFIG_ENTROPY_STATS 5199 if (cpi->compressor_stage == ENCODE_STAGE) { 5200 av1_zero(cpi->counts); 5201 } 5202 #endif 5203 5204 #if CONFIG_BITSTREAM_DEBUG 5205 assert(cpi->oxcf.max_threads <= 1 && 5206 "bitstream debug tool does not support multithreading"); 5207 bitstream_queue_record_write(); 5208 5209 if (cm->seq_params->order_hint_info.enable_order_hint) { 5210 aom_bitstream_queue_set_frame_write(cm->current_frame.order_hint * 2 + 5211 cm->show_frame); 5212 } else { 5213 // This is currently used in RTC encoding. cm->show_frame is always 1. 5214 aom_bitstream_queue_set_frame_write(cm->current_frame.frame_number); 5215 } 5216 #endif 5217 if (cpi->ppi->use_svc) { 5218 av1_one_pass_cbr_svc_start_layer(cpi); 5219 } 5220 5221 cpi->is_dropped_frame = false; 5222 cm->showable_frame = 0; 5223 cpi_data->frame_size = 0; 5224 cpi->available_bs_size = cpi_data->cx_data_sz; 5225 #if CONFIG_INTERNAL_STATS 5226 struct aom_usec_timer cmptimer; 5227 aom_usec_timer_start(&cmptimer); 5228 #endif 5229 av1_set_high_precision_mv(cpi, 1, 0); 5230 5231 // Normal defaults 5232 cm->features.refresh_frame_context = 5233 oxcf->tool_cfg.frame_parallel_decoding_mode 5234 ? REFRESH_FRAME_CONTEXT_DISABLED 5235 : REFRESH_FRAME_CONTEXT_BACKWARD; 5236 if (oxcf->tile_cfg.enable_large_scale_tile) 5237 cm->features.refresh_frame_context = REFRESH_FRAME_CONTEXT_DISABLED; 5238 5239 if (assign_cur_frame_new_fb(cm) == NULL) { 5240 aom_internal_error(cpi->common.error, AOM_CODEC_ERROR, 5241 "Failed to allocate new cur_frame"); 5242 } 5243 5244 #if CONFIG_COLLECT_COMPONENT_TIMING 5245 // Accumulate 2nd pass time in 2-pass case or 1 pass time in 1-pass case. 5246 if (cpi->oxcf.pass == 2 || cpi->oxcf.pass == 0) 5247 start_timing(cpi, av1_encode_strategy_time); 5248 #endif 5249 5250 const int result = av1_encode_strategy( 5251 cpi, &cpi_data->frame_size, cpi_data->cx_data, cpi_data->cx_data_sz, 5252 &cpi_data->lib_flags, &cpi_data->ts_frame_start, &cpi_data->ts_frame_end, 5253 cpi_data->timestamp_ratio, &cpi_data->pop_lookahead, cpi_data->flush); 5254 5255 #if CONFIG_COLLECT_COMPONENT_TIMING 5256 if (cpi->oxcf.pass == 2 || cpi->oxcf.pass == 0) 5257 end_timing(cpi, av1_encode_strategy_time); 5258 5259 // Print out timing information. 5260 // Note: Use "cpi->frame_component_time[0] > 100 us" to avoid showing of 5261 // show_existing_frame and lag-in-frames. 5262 if ((cpi->oxcf.pass == 2 || cpi->oxcf.pass == 0) && 5263 cpi->frame_component_time[0] > 100) { 5264 int i; 5265 uint64_t frame_total = 0, total = 0; 5266 const GF_GROUP *const gf_group = &cpi->ppi->gf_group; 5267 FRAME_UPDATE_TYPE frame_update_type = 5268 get_frame_update_type(gf_group, cpi->gf_frame_index); 5269 5270 fprintf(stderr, 5271 "\n Frame number: %d, Frame type: %s, Show Frame: %d, Frame Update " 5272 "Type: %d, Q: %d\n", 5273 cm->current_frame.frame_number, 5274 get_frame_type_enum(cm->current_frame.frame_type), cm->show_frame, 5275 frame_update_type, cm->quant_params.base_qindex); 5276 for (i = 0; i < kTimingComponents; i++) { 5277 cpi->component_time[i] += cpi->frame_component_time[i]; 5278 // Use av1_encode_strategy_time (i = 0) as the total time. 5279 if (i == 0) { 5280 frame_total = cpi->frame_component_time[0]; 5281 total = cpi->component_time[0]; 5282 } 5283 fprintf(stderr, 5284 " %50s: %15" PRId64 " us [%6.2f%%] (total: %15" PRId64 5285 " us [%6.2f%%])\n", 5286 get_component_name(i), cpi->frame_component_time[i], 5287 (float)((float)cpi->frame_component_time[i] * 100.0 / 5288 (float)frame_total), 5289 cpi->component_time[i], 5290 (float)((float)cpi->component_time[i] * 100.0 / (float)total)); 5291 cpi->frame_component_time[i] = 0; 5292 } 5293 } 5294 #endif 5295 5296 // Reset the flag to 0 afer encoding. 5297 cpi->rc.use_external_qp_one_pass = 0; 5298 5299 if (result == -1) { 5300 cm->error->setjmp = 0; 5301 // Returning -1 indicates no frame encoded; more input is required 5302 return -1; 5303 } 5304 if (result != AOM_CODEC_OK) { 5305 aom_internal_error(cpi->common.error, AOM_CODEC_ERROR, 5306 "Failed to encode frame"); 5307 } 5308 #if CONFIG_INTERNAL_STATS 5309 aom_usec_timer_mark(&cmptimer); 5310 cpi->time_compress_data += aom_usec_timer_elapsed(&cmptimer); 5311 #endif // CONFIG_INTERNAL_STATS 5312 5313 #if CONFIG_SPEED_STATS 5314 if (!is_stat_generation_stage(cpi) && !cm->show_existing_frame) { 5315 cpi->tx_search_count += cpi->td.mb.txfm_search_info.tx_search_count; 5316 cpi->td.mb.txfm_search_info.tx_search_count = 0; 5317 } 5318 #endif // CONFIG_SPEED_STATS 5319 5320 cm->error->setjmp = 0; 5321 return AOM_CODEC_OK; 5322 } 5323 5324 // Populates cpi->scaled_ref_buf corresponding to frames in a parallel encode 5325 // set. Also sets the bitmask 'ref_buffers_used_map'. 5326 static void scale_references_fpmt(AV1_COMP *cpi, int *ref_buffers_used_map) { 5327 AV1_COMMON *cm = &cpi->common; 5328 MV_REFERENCE_FRAME ref_frame; 5329 5330 for (ref_frame = LAST_FRAME; ref_frame <= ALTREF_FRAME; ++ref_frame) { 5331 // Need to convert from AOM_REFFRAME to index into ref_mask (subtract 1). 5332 if (cpi->ref_frame_flags & av1_ref_frame_flag_list[ref_frame]) { 5333 const YV12_BUFFER_CONFIG *const ref = 5334 get_ref_frame_yv12_buf(cm, ref_frame); 5335 5336 if (ref == NULL) { 5337 cpi->scaled_ref_buf[ref_frame - 1] = NULL; 5338 continue; 5339 } 5340 5341 // FPMT does not support scaling yet. 5342 assert(ref->y_crop_width == cm->width && 5343 ref->y_crop_height == cm->height); 5344 5345 RefCntBuffer *buf = get_ref_frame_buf(cm, ref_frame); 5346 cpi->scaled_ref_buf[ref_frame - 1] = buf; 5347 for (int i = 0; i < cm->buffer_pool->num_frame_bufs; ++i) { 5348 if (&cm->buffer_pool->frame_bufs[i] == buf) { 5349 *ref_buffers_used_map |= (1 << i); 5350 } 5351 } 5352 } else { 5353 if (!has_no_stats_stage(cpi)) cpi->scaled_ref_buf[ref_frame - 1] = NULL; 5354 } 5355 } 5356 } 5357 5358 // Increments the ref_count of frame buffers referenced by cpi->scaled_ref_buf 5359 // corresponding to frames in a parallel encode set. 5360 static void increment_scaled_ref_counts_fpmt(BufferPool *buffer_pool, 5361 int ref_buffers_used_map) { 5362 for (int i = 0; i < buffer_pool->num_frame_bufs; ++i) { 5363 if (ref_buffers_used_map & (1 << i)) { 5364 ++buffer_pool->frame_bufs[i].ref_count; 5365 } 5366 } 5367 } 5368 5369 // Releases cpi->scaled_ref_buf corresponding to frames in a parallel encode 5370 // set. 5371 void av1_release_scaled_references_fpmt(AV1_COMP *cpi) { 5372 // TODO(isbs): only refresh the necessary frames, rather than all of them 5373 for (int i = 0; i < INTER_REFS_PER_FRAME; ++i) { 5374 RefCntBuffer *const buf = cpi->scaled_ref_buf[i]; 5375 if (buf != NULL) { 5376 cpi->scaled_ref_buf[i] = NULL; 5377 } 5378 } 5379 } 5380 5381 // Decrements the ref_count of frame buffers referenced by cpi->scaled_ref_buf 5382 // corresponding to frames in a parallel encode set. 5383 void av1_decrement_ref_counts_fpmt(BufferPool *buffer_pool, 5384 int ref_buffers_used_map) { 5385 for (int i = 0; i < buffer_pool->num_frame_bufs; ++i) { 5386 if (ref_buffers_used_map & (1 << i)) { 5387 --buffer_pool->frame_bufs[i].ref_count; 5388 } 5389 } 5390 } 5391 5392 // Initialize parallel frame contexts with screen content decisions. 5393 void av1_init_sc_decisions(AV1_PRIMARY *const ppi) { 5394 AV1_COMP *const first_cpi = ppi->cpi; 5395 for (int i = 1; i < ppi->num_fp_contexts; ++i) { 5396 AV1_COMP *cur_cpi = ppi->parallel_cpi[i]; 5397 cur_cpi->common.features.allow_screen_content_tools = 5398 first_cpi->common.features.allow_screen_content_tools; 5399 cur_cpi->common.features.allow_intrabc = 5400 first_cpi->common.features.allow_intrabc; 5401 cur_cpi->use_screen_content_tools = first_cpi->use_screen_content_tools; 5402 cur_cpi->is_screen_content_type = first_cpi->is_screen_content_type; 5403 } 5404 } 5405 5406 AV1_COMP *av1_get_parallel_frame_enc_data(AV1_PRIMARY *const ppi, 5407 AV1_COMP_DATA *const first_cpi_data) { 5408 int cpi_idx = 0; 5409 5410 // Loop over parallel_cpi to find the cpi that processed the current 5411 // gf_frame_index ahead of time. 5412 for (int i = 1; i < ppi->num_fp_contexts; i++) { 5413 if (ppi->cpi->gf_frame_index == ppi->parallel_cpi[i]->gf_frame_index) { 5414 cpi_idx = i; 5415 break; 5416 } 5417 } 5418 5419 assert(cpi_idx > 0); 5420 assert(!ppi->parallel_cpi[cpi_idx]->common.show_existing_frame); 5421 5422 // Release the previously-used frame-buffer. 5423 if (ppi->cpi->common.cur_frame != NULL) { 5424 --ppi->cpi->common.cur_frame->ref_count; 5425 ppi->cpi->common.cur_frame = NULL; 5426 } 5427 5428 // Swap the appropriate parallel_cpi with the parallel_cpi[0]. 5429 ppi->cpi = ppi->parallel_cpi[cpi_idx]; 5430 ppi->parallel_cpi[cpi_idx] = ppi->parallel_cpi[0]; 5431 ppi->parallel_cpi[0] = ppi->cpi; 5432 5433 // Copy appropriate parallel_frames_data to local data. 5434 { 5435 AV1_COMP_DATA *data = &ppi->parallel_frames_data[cpi_idx - 1]; 5436 assert(data->frame_size > 0); 5437 if (data->frame_size > first_cpi_data->cx_data_sz) { 5438 aom_internal_error(&ppi->error, AOM_CODEC_ERROR, 5439 "first_cpi_data->cx_data buffer full"); 5440 } 5441 5442 first_cpi_data->lib_flags = data->lib_flags; 5443 first_cpi_data->ts_frame_start = data->ts_frame_start; 5444 first_cpi_data->ts_frame_end = data->ts_frame_end; 5445 memcpy(first_cpi_data->cx_data, data->cx_data, data->frame_size); 5446 first_cpi_data->frame_size = data->frame_size; 5447 if (ppi->cpi->common.show_frame) { 5448 first_cpi_data->pop_lookahead = 1; 5449 } 5450 } 5451 5452 return ppi->cpi; 5453 } 5454 5455 // Initialises frames belonging to a parallel encode set. 5456 int av1_init_parallel_frame_context(const AV1_COMP_DATA *const first_cpi_data, 5457 AV1_PRIMARY *const ppi, 5458 int *ref_buffers_used_map) { 5459 AV1_COMP *const first_cpi = ppi->cpi; 5460 GF_GROUP *const gf_group = &ppi->gf_group; 5461 int gf_index_start = first_cpi->gf_frame_index; 5462 assert(gf_group->frame_parallel_level[gf_index_start] == 1); 5463 int parallel_frame_count = 0; 5464 int cur_frame_num = first_cpi->common.current_frame.frame_number; 5465 int show_frame_count = first_cpi->frame_index_set.show_frame_count; 5466 int frames_since_key = first_cpi->rc.frames_since_key; 5467 int frames_to_key = first_cpi->rc.frames_to_key; 5468 int frames_to_fwd_kf = first_cpi->rc.frames_to_fwd_kf; 5469 int cur_frame_disp = cur_frame_num + gf_group->arf_src_offset[gf_index_start]; 5470 const FIRSTPASS_STATS *stats_in = first_cpi->twopass_frame.stats_in; 5471 5472 assert(*ref_buffers_used_map == 0); 5473 5474 // Release the previously used frame-buffer by a frame_parallel_level 1 frame. 5475 if (first_cpi->common.cur_frame != NULL) { 5476 --first_cpi->common.cur_frame->ref_count; 5477 first_cpi->common.cur_frame = NULL; 5478 } 5479 5480 RefFrameMapPair ref_frame_map_pairs[REF_FRAMES]; 5481 RefFrameMapPair first_ref_frame_map_pairs[REF_FRAMES]; 5482 init_ref_map_pair(first_cpi, first_ref_frame_map_pairs); 5483 memcpy(ref_frame_map_pairs, first_ref_frame_map_pairs, 5484 sizeof(RefFrameMapPair) * REF_FRAMES); 5485 5486 // Store the reference refresh index of frame_parallel_level 1 frame in a 5487 // parallel encode set of lower layer frames. 5488 if (gf_group->update_type[gf_index_start] == INTNL_ARF_UPDATE) { 5489 first_cpi->ref_refresh_index = av1_calc_refresh_idx_for_intnl_arf( 5490 first_cpi, ref_frame_map_pairs, gf_index_start); 5491 assert(first_cpi->ref_refresh_index != INVALID_IDX && 5492 first_cpi->ref_refresh_index < REF_FRAMES); 5493 first_cpi->refresh_idx_available = true; 5494 // Update ref_frame_map_pairs. 5495 ref_frame_map_pairs[first_cpi->ref_refresh_index].disp_order = 5496 gf_group->display_idx[gf_index_start]; 5497 ref_frame_map_pairs[first_cpi->ref_refresh_index].pyr_level = 5498 gf_group->layer_depth[gf_index_start]; 5499 } 5500 5501 // Set do_frame_data_update flag as false for frame_parallel_level 1 frame. 5502 first_cpi->do_frame_data_update = false; 5503 if (gf_group->arf_src_offset[gf_index_start] == 0) { 5504 first_cpi->time_stamps.prev_ts_start = ppi->ts_start_last_show_frame; 5505 first_cpi->time_stamps.prev_ts_end = ppi->ts_end_last_show_frame; 5506 } 5507 5508 av1_get_ref_frames(first_ref_frame_map_pairs, cur_frame_disp, first_cpi, 5509 gf_index_start, 1, first_cpi->common.remapped_ref_idx); 5510 5511 scale_references_fpmt(first_cpi, ref_buffers_used_map); 5512 parallel_frame_count++; 5513 5514 // Iterate through the GF_GROUP to find the remaining frame_parallel_level 2 5515 // frames which are part of the current parallel encode set and initialize the 5516 // required cpi elements. 5517 for (int i = gf_index_start + 1; i < gf_group->size; i++) { 5518 // Update frame counters if previous frame was show frame or show existing 5519 // frame. 5520 if (gf_group->arf_src_offset[i - 1] == 0) { 5521 cur_frame_num++; 5522 show_frame_count++; 5523 if (frames_to_fwd_kf <= 0) 5524 frames_to_fwd_kf = first_cpi->oxcf.kf_cfg.fwd_kf_dist; 5525 if (frames_to_key) { 5526 frames_since_key++; 5527 frames_to_key--; 5528 frames_to_fwd_kf--; 5529 } 5530 stats_in++; 5531 } 5532 cur_frame_disp = cur_frame_num + gf_group->arf_src_offset[i]; 5533 if (gf_group->frame_parallel_level[i] == 2) { 5534 AV1_COMP *cur_cpi = ppi->parallel_cpi[parallel_frame_count]; 5535 AV1_COMP_DATA *cur_cpi_data = 5536 &ppi->parallel_frames_data[parallel_frame_count - 1]; 5537 cur_cpi->gf_frame_index = i; 5538 cur_cpi->framerate = first_cpi->framerate; 5539 cur_cpi->common.current_frame.frame_number = cur_frame_num; 5540 cur_cpi->common.current_frame.frame_type = gf_group->frame_type[i]; 5541 cur_cpi->frame_index_set.show_frame_count = show_frame_count; 5542 cur_cpi->rc.frames_since_key = frames_since_key; 5543 cur_cpi->rc.frames_to_key = frames_to_key; 5544 cur_cpi->rc.frames_to_fwd_kf = frames_to_fwd_kf; 5545 cur_cpi->rc.active_worst_quality = first_cpi->rc.active_worst_quality; 5546 cur_cpi->rc.avg_frame_bandwidth = first_cpi->rc.avg_frame_bandwidth; 5547 cur_cpi->rc.max_frame_bandwidth = first_cpi->rc.max_frame_bandwidth; 5548 cur_cpi->rc.min_frame_bandwidth = first_cpi->rc.min_frame_bandwidth; 5549 cur_cpi->rc.intervals_till_gf_calculate_due = 5550 first_cpi->rc.intervals_till_gf_calculate_due; 5551 cur_cpi->mv_search_params.max_mv_magnitude = 5552 first_cpi->mv_search_params.max_mv_magnitude; 5553 if (gf_group->update_type[cur_cpi->gf_frame_index] == INTNL_ARF_UPDATE) { 5554 cur_cpi->common.lf.mode_ref_delta_enabled = 1; 5555 } 5556 cur_cpi->do_frame_data_update = false; 5557 // Initialize prev_ts_start and prev_ts_end for show frame(s) and show 5558 // existing frame(s). 5559 if (gf_group->arf_src_offset[i] == 0) { 5560 // Choose source of prev frame. 5561 int src_index = gf_group->src_offset[i]; 5562 struct lookahead_entry *prev_source = av1_lookahead_peek( 5563 ppi->lookahead, src_index - 1, cur_cpi->compressor_stage); 5564 // Save timestamps of prev frame. 5565 cur_cpi->time_stamps.prev_ts_start = prev_source->ts_start; 5566 cur_cpi->time_stamps.prev_ts_end = prev_source->ts_end; 5567 } 5568 cur_cpi->time_stamps.first_ts_start = 5569 first_cpi->time_stamps.first_ts_start; 5570 5571 memcpy(cur_cpi->common.ref_frame_map, first_cpi->common.ref_frame_map, 5572 sizeof(first_cpi->common.ref_frame_map)); 5573 cur_cpi_data->lib_flags = 0; 5574 cur_cpi_data->timestamp_ratio = first_cpi_data->timestamp_ratio; 5575 cur_cpi_data->flush = first_cpi_data->flush; 5576 cur_cpi_data->frame_size = 0; 5577 if (gf_group->update_type[gf_index_start] == INTNL_ARF_UPDATE) { 5578 // If the first frame in a parallel encode set is INTNL_ARF_UPDATE 5579 // frame, initialize lib_flags of frame_parallel_level 2 frame in the 5580 // set with that of frame_parallel_level 1 frame. 5581 cur_cpi_data->lib_flags = first_cpi_data->lib_flags; 5582 // Store the reference refresh index of frame_parallel_level 2 frame in 5583 // a parallel encode set of lower layer frames. 5584 cur_cpi->ref_refresh_index = 5585 av1_calc_refresh_idx_for_intnl_arf(cur_cpi, ref_frame_map_pairs, i); 5586 cur_cpi->refresh_idx_available = true; 5587 // Skip the reference frame which will be refreshed by 5588 // frame_parallel_level 1 frame in a parallel encode set of lower layer 5589 // frames. 5590 cur_cpi->ref_idx_to_skip = first_cpi->ref_refresh_index; 5591 } else { 5592 cur_cpi->ref_idx_to_skip = INVALID_IDX; 5593 cur_cpi->ref_refresh_index = INVALID_IDX; 5594 cur_cpi->refresh_idx_available = false; 5595 } 5596 cur_cpi->twopass_frame.stats_in = stats_in; 5597 5598 av1_get_ref_frames(first_ref_frame_map_pairs, cur_frame_disp, cur_cpi, i, 5599 1, cur_cpi->common.remapped_ref_idx); 5600 scale_references_fpmt(cur_cpi, ref_buffers_used_map); 5601 parallel_frame_count++; 5602 } 5603 5604 // Set do_frame_data_update to true for the last frame_parallel_level 2 5605 // frame in the current parallel encode set. 5606 if (i == (gf_group->size - 1) || 5607 (gf_group->frame_parallel_level[i + 1] == 0 && 5608 (gf_group->update_type[i + 1] == ARF_UPDATE || 5609 gf_group->update_type[i + 1] == INTNL_ARF_UPDATE)) || 5610 gf_group->frame_parallel_level[i + 1] == 1) { 5611 ppi->parallel_cpi[parallel_frame_count - 1]->do_frame_data_update = true; 5612 break; 5613 } 5614 } 5615 5616 increment_scaled_ref_counts_fpmt(first_cpi->common.buffer_pool, 5617 *ref_buffers_used_map); 5618 5619 // Return the number of frames in the parallel encode set. 5620 return parallel_frame_count; 5621 } 5622 5623 int av1_get_preview_raw_frame(AV1_COMP *cpi, YV12_BUFFER_CONFIG *dest) { 5624 AV1_COMMON *cm = &cpi->common; 5625 if (!cm->show_frame) { 5626 return -1; 5627 } else { 5628 int ret; 5629 if (cm->cur_frame != NULL && !cpi->oxcf.algo_cfg.skip_postproc_filtering) { 5630 *dest = cm->cur_frame->buf; 5631 dest->y_width = cm->width; 5632 dest->y_height = cm->height; 5633 dest->uv_width = cm->width >> cm->seq_params->subsampling_x; 5634 dest->uv_height = cm->height >> cm->seq_params->subsampling_y; 5635 ret = 0; 5636 } else { 5637 ret = -1; 5638 } 5639 return ret; 5640 } 5641 } 5642 5643 int av1_get_last_show_frame(AV1_COMP *cpi, YV12_BUFFER_CONFIG *frame) { 5644 if (cpi->last_show_frame_buf == NULL || 5645 cpi->oxcf.algo_cfg.skip_postproc_filtering) 5646 return -1; 5647 5648 *frame = cpi->last_show_frame_buf->buf; 5649 return 0; 5650 } 5651 5652 aom_codec_err_t av1_copy_new_frame_enc(AV1_COMMON *cm, 5653 YV12_BUFFER_CONFIG *new_frame, 5654 YV12_BUFFER_CONFIG *sd) { 5655 const int num_planes = av1_num_planes(cm); 5656 if (!equal_dimensions_and_border(new_frame, sd)) 5657 aom_internal_error(cm->error, AOM_CODEC_ERROR, 5658 "Incorrect buffer dimensions"); 5659 else 5660 aom_yv12_copy_frame(new_frame, sd, num_planes); 5661 5662 return cm->error->error_code; 5663 } 5664 5665 int av1_set_internal_size(AV1EncoderConfig *const oxcf, 5666 ResizePendingParams *resize_pending_params, 5667 AOM_SCALING_MODE horiz_mode, 5668 AOM_SCALING_MODE vert_mode) { 5669 int hr = 0, hs = 0, vr = 0, vs = 0; 5670 5671 // Checks for invalid AOM_SCALING_MODE values. 5672 if (horiz_mode > AOME_ONETHREE || vert_mode > AOME_ONETHREE) return -1; 5673 5674 Scale2Ratio(horiz_mode, &hr, &hs); 5675 Scale2Ratio(vert_mode, &vr, &vs); 5676 5677 // always go to the next whole number 5678 resize_pending_params->width = (hs - 1 + oxcf->frm_dim_cfg.width * hr) / hs; 5679 resize_pending_params->height = (vs - 1 + oxcf->frm_dim_cfg.height * vr) / vs; 5680 5681 if (horiz_mode != AOME_NORMAL || vert_mode != AOME_NORMAL) { 5682 oxcf->resize_cfg.resize_mode = RESIZE_FIXED; 5683 oxcf->algo_cfg.enable_tpl_model = 0; 5684 } 5685 return 0; 5686 } 5687 5688 int av1_get_quantizer(AV1_COMP *cpi) { 5689 return cpi->common.quant_params.base_qindex; 5690 } 5691 5692 int av1_convert_sect5obus_to_annexb(uint8_t *buffer, size_t buffer_size, 5693 size_t *frame_size) { 5694 assert(*frame_size <= buffer_size); 5695 size_t output_size = 0; 5696 size_t remaining_size = *frame_size; 5697 uint8_t *buff_ptr = buffer; 5698 5699 // go through each OBUs 5700 while (remaining_size > 0) { 5701 uint8_t saved_obu_header[2]; 5702 uint64_t obu_payload_size; 5703 size_t length_of_payload_size; 5704 size_t length_of_obu_size; 5705 const uint32_t obu_header_size = (buff_ptr[0] >> 2) & 0x1 ? 2 : 1; 5706 size_t obu_bytes_read = obu_header_size; // bytes read for current obu 5707 5708 // save the obu header (1 or 2 bytes) 5709 memcpy(saved_obu_header, buff_ptr, obu_header_size); 5710 // clear the obu_has_size_field 5711 saved_obu_header[0] &= ~0x2; 5712 5713 // get the payload_size and length of payload_size 5714 if (aom_uleb_decode(buff_ptr + obu_header_size, 5715 remaining_size - obu_header_size, &obu_payload_size, 5716 &length_of_payload_size) != 0) { 5717 return AOM_CODEC_ERROR; 5718 } 5719 obu_bytes_read += length_of_payload_size; 5720 5721 // calculate the length of size of the obu header plus payload 5722 const uint64_t obu_size = obu_header_size + obu_payload_size; 5723 length_of_obu_size = aom_uleb_size_in_bytes(obu_size); 5724 5725 if (length_of_obu_size + obu_header_size > 5726 buffer_size - output_size - (remaining_size - obu_bytes_read)) { 5727 return AOM_CODEC_ERROR; 5728 } 5729 // move the rest of data to new location 5730 memmove(buff_ptr + length_of_obu_size + obu_header_size, 5731 buff_ptr + obu_bytes_read, remaining_size - obu_bytes_read); 5732 obu_bytes_read += (size_t)obu_payload_size; 5733 5734 // write the new obu size 5735 size_t coded_obu_size; 5736 if (aom_uleb_encode(obu_size, length_of_obu_size, buff_ptr, 5737 &coded_obu_size) != 0 || 5738 coded_obu_size != length_of_obu_size) { 5739 return AOM_CODEC_ERROR; 5740 } 5741 5742 // write the saved (modified) obu_header following obu size 5743 memcpy(buff_ptr + length_of_obu_size, saved_obu_header, obu_header_size); 5744 5745 remaining_size -= obu_bytes_read; 5746 buff_ptr += length_of_obu_size + (size_t)obu_size; 5747 output_size += length_of_obu_size + (size_t)obu_size; 5748 } 5749 5750 *frame_size = output_size; 5751 return AOM_CODEC_OK; 5752 } 5753 5754 static void rtc_set_updates_ref_frame_config( 5755 ExtRefreshFrameFlagsInfo *const ext_refresh_frame_flags, 5756 RTC_REF *const rtc_ref) { 5757 ext_refresh_frame_flags->update_pending = 1; 5758 ext_refresh_frame_flags->last_frame = rtc_ref->refresh[rtc_ref->ref_idx[0]]; 5759 ext_refresh_frame_flags->golden_frame = rtc_ref->refresh[rtc_ref->ref_idx[3]]; 5760 ext_refresh_frame_flags->bwd_ref_frame = 5761 rtc_ref->refresh[rtc_ref->ref_idx[4]]; 5762 ext_refresh_frame_flags->alt2_ref_frame = 5763 rtc_ref->refresh[rtc_ref->ref_idx[5]]; 5764 ext_refresh_frame_flags->alt_ref_frame = 5765 rtc_ref->refresh[rtc_ref->ref_idx[6]]; 5766 rtc_ref->non_reference_frame = 1; 5767 for (int i = 0; i < REF_FRAMES; i++) { 5768 if (rtc_ref->refresh[i] == 1) { 5769 rtc_ref->non_reference_frame = 0; 5770 break; 5771 } 5772 } 5773 } 5774 5775 static int rtc_set_references_external_ref_frame_config(AV1_COMP *cpi) { 5776 // LAST_FRAME (0), LAST2_FRAME(1), LAST3_FRAME(2), GOLDEN_FRAME(3), 5777 // BWDREF_FRAME(4), ALTREF2_FRAME(5), ALTREF_FRAME(6). 5778 int ref = AOM_REFFRAME_ALL; 5779 for (int i = 0; i < INTER_REFS_PER_FRAME; i++) { 5780 if (!cpi->ppi->rtc_ref.reference[i]) ref ^= (1 << i); 5781 } 5782 return ref; 5783 } 5784 5785 void av1_apply_encoding_flags(AV1_COMP *cpi, aom_enc_frame_flags_t flags) { 5786 // TODO(yunqingwang): For what references to use, external encoding flags 5787 // should be consistent with internal reference frame selection. Need to 5788 // ensure that there is not conflict between the two. In AV1 encoder, the 5789 // priority rank for 7 reference frames are: LAST, ALTREF, LAST2, LAST3, 5790 // GOLDEN, BWDREF, ALTREF2. 5791 5792 ExternalFlags *const ext_flags = &cpi->ext_flags; 5793 ExtRefreshFrameFlagsInfo *const ext_refresh_frame_flags = 5794 &ext_flags->refresh_frame; 5795 ext_flags->ref_frame_flags = AOM_REFFRAME_ALL; 5796 if (flags & 5797 (AOM_EFLAG_NO_REF_LAST | AOM_EFLAG_NO_REF_LAST2 | AOM_EFLAG_NO_REF_LAST3 | 5798 AOM_EFLAG_NO_REF_GF | AOM_EFLAG_NO_REF_ARF | AOM_EFLAG_NO_REF_BWD | 5799 AOM_EFLAG_NO_REF_ARF2)) { 5800 int ref = AOM_REFFRAME_ALL; 5801 5802 if (flags & AOM_EFLAG_NO_REF_LAST) ref ^= AOM_LAST_FLAG; 5803 if (flags & AOM_EFLAG_NO_REF_LAST2) ref ^= AOM_LAST2_FLAG; 5804 if (flags & AOM_EFLAG_NO_REF_LAST3) ref ^= AOM_LAST3_FLAG; 5805 5806 if (flags & AOM_EFLAG_NO_REF_GF) ref ^= AOM_GOLD_FLAG; 5807 5808 if (flags & AOM_EFLAG_NO_REF_ARF) { 5809 ref ^= AOM_ALT_FLAG; 5810 ref ^= AOM_BWD_FLAG; 5811 ref ^= AOM_ALT2_FLAG; 5812 } else { 5813 if (flags & AOM_EFLAG_NO_REF_BWD) ref ^= AOM_BWD_FLAG; 5814 if (flags & AOM_EFLAG_NO_REF_ARF2) ref ^= AOM_ALT2_FLAG; 5815 } 5816 5817 av1_use_as_reference(&ext_flags->ref_frame_flags, ref); 5818 } else { 5819 if (cpi->ppi->rtc_ref.set_ref_frame_config) { 5820 int ref = rtc_set_references_external_ref_frame_config(cpi); 5821 av1_use_as_reference(&ext_flags->ref_frame_flags, ref); 5822 } 5823 } 5824 5825 if (flags & 5826 (AOM_EFLAG_NO_UPD_LAST | AOM_EFLAG_NO_UPD_GF | AOM_EFLAG_NO_UPD_ARF)) { 5827 int upd = AOM_REFFRAME_ALL; 5828 5829 // Refreshing LAST/LAST2/LAST3 is handled by 1 common flag. 5830 if (flags & AOM_EFLAG_NO_UPD_LAST) upd ^= AOM_LAST_FLAG; 5831 5832 if (flags & AOM_EFLAG_NO_UPD_GF) upd ^= AOM_GOLD_FLAG; 5833 5834 if (flags & AOM_EFLAG_NO_UPD_ARF) { 5835 upd ^= AOM_ALT_FLAG; 5836 upd ^= AOM_BWD_FLAG; 5837 upd ^= AOM_ALT2_FLAG; 5838 } 5839 5840 ext_refresh_frame_flags->last_frame = (upd & AOM_LAST_FLAG) != 0; 5841 ext_refresh_frame_flags->golden_frame = (upd & AOM_GOLD_FLAG) != 0; 5842 ext_refresh_frame_flags->alt_ref_frame = (upd & AOM_ALT_FLAG) != 0; 5843 ext_refresh_frame_flags->bwd_ref_frame = (upd & AOM_BWD_FLAG) != 0; 5844 ext_refresh_frame_flags->alt2_ref_frame = (upd & AOM_ALT2_FLAG) != 0; 5845 ext_refresh_frame_flags->update_pending = 1; 5846 } else { 5847 if (cpi->ppi->rtc_ref.set_ref_frame_config) 5848 rtc_set_updates_ref_frame_config(ext_refresh_frame_flags, 5849 &cpi->ppi->rtc_ref); 5850 else 5851 ext_refresh_frame_flags->update_pending = 0; 5852 } 5853 5854 ext_flags->use_ref_frame_mvs = cpi->oxcf.tool_cfg.enable_ref_frame_mvs & 5855 ((flags & AOM_EFLAG_NO_REF_FRAME_MVS) == 0); 5856 ext_flags->use_error_resilient = cpi->oxcf.tool_cfg.error_resilient_mode | 5857 ((flags & AOM_EFLAG_ERROR_RESILIENT) != 0); 5858 ext_flags->use_s_frame = 5859 cpi->oxcf.kf_cfg.enable_sframe | ((flags & AOM_EFLAG_SET_S_FRAME) != 0); 5860 ext_flags->use_primary_ref_none = 5861 (flags & AOM_EFLAG_SET_PRIMARY_REF_NONE) != 0; 5862 5863 if (flags & AOM_EFLAG_NO_UPD_ENTROPY) { 5864 update_entropy(&ext_flags->refresh_frame_context, 5865 &ext_flags->refresh_frame_context_pending, 0); 5866 } 5867 } 5868 5869 aom_fixed_buf_t *av1_get_global_headers(AV1_PRIMARY *ppi) { 5870 if (!ppi) return NULL; 5871 5872 uint8_t header_buf[512] = { 0 }; 5873 const uint32_t sequence_header_size = av1_write_sequence_header_obu( 5874 &ppi->seq_params, &header_buf[0], sizeof(header_buf)); 5875 assert(sequence_header_size <= sizeof(header_buf)); 5876 if (sequence_header_size == 0) return NULL; 5877 5878 const size_t obu_header_size = 1; 5879 const size_t size_field_size = aom_uleb_size_in_bytes(sequence_header_size); 5880 const size_t payload_offset = obu_header_size + size_field_size; 5881 5882 if (payload_offset + sequence_header_size > sizeof(header_buf)) return NULL; 5883 memmove(&header_buf[payload_offset], &header_buf[0], sequence_header_size); 5884 5885 if (av1_write_obu_header(&ppi->level_params, &ppi->cpi->frame_header_count, 5886 OBU_SEQUENCE_HEADER, 5887 ppi->seq_params.has_nonzero_operating_point_idc, 5888 /*is_layer_specific_obu=*/false, 0, 5889 &header_buf[0]) != obu_header_size) { 5890 return NULL; 5891 } 5892 5893 size_t coded_size_field_size = 0; 5894 if (aom_uleb_encode(sequence_header_size, size_field_size, 5895 &header_buf[obu_header_size], 5896 &coded_size_field_size) != 0) { 5897 return NULL; 5898 } 5899 assert(coded_size_field_size == size_field_size); 5900 5901 aom_fixed_buf_t *global_headers = 5902 (aom_fixed_buf_t *)malloc(sizeof(*global_headers)); 5903 if (!global_headers) return NULL; 5904 5905 const size_t global_header_buf_size = 5906 obu_header_size + size_field_size + sequence_header_size; 5907 5908 global_headers->buf = malloc(global_header_buf_size); 5909 if (!global_headers->buf) { 5910 free(global_headers); 5911 return NULL; 5912 } 5913 5914 memcpy(global_headers->buf, &header_buf[0], global_header_buf_size); 5915 global_headers->sz = global_header_buf_size; 5916 return global_headers; 5917 }