AOMedia AV1 Codec
speed_features.h
Go to the documentation of this file.
1 /*
2  * Copyright (c) 2016, Alliance for Open Media. All rights reserved.
3  *
4  * This source code is subject to the terms of the BSD 2 Clause License and
5  * the Alliance for Open Media Patent License 1.0. If the BSD 2 Clause License
6  * was not distributed with this source code in the LICENSE file, you can
7  * obtain it at www.aomedia.org/license/software. If the Alliance for Open
8  * Media Patent License 1.0 was not distributed with this source code in the
9  * PATENTS file, you can obtain it at www.aomedia.org/license/patent.
10  */
11 
12 #ifndef AOM_AV1_ENCODER_SPEED_FEATURES_H_
13 #define AOM_AV1_ENCODER_SPEED_FEATURES_H_
14 
15 #include "av1/common/enums.h"
16 #include "av1/encoder/enc_enums.h"
17 #include "av1/encoder/mcomp.h"
18 #include "av1/encoder/encodemb.h"
19 
20 #ifdef __cplusplus
21 extern "C" {
22 #endif
23 
27 #define MAX_MESH_STEP 4
28 
29 typedef struct MESH_PATTERN {
30  int range;
31  int interval;
32 } MESH_PATTERN;
33 
34 enum {
35  GM_FULL_SEARCH,
36  GM_REDUCED_REF_SEARCH_SKIP_L2_L3,
37  GM_REDUCED_REF_SEARCH_SKIP_L2_L3_ARF2,
38 
39  // Same as GM_REDUCED_REF_SEARCH_SKIP_L2_L3_ARF2 but with extra filtering
40  // to keep at most two ref frames
41  GM_SEARCH_CLOSEST_REFS_ONLY,
42 
43  GM_DISABLE_SEARCH
44 } UENUM1BYTE(GM_SEARCH_TYPE);
45 
46 enum {
47  DIST_WTD_COMP_ENABLED,
48  DIST_WTD_COMP_SKIP_MV_SEARCH,
49  DIST_WTD_COMP_DISABLED,
50 } UENUM1BYTE(DIST_WTD_COMP_FLAG);
51 
52 enum {
53  INTRA_ALL = (1 << DC_PRED) | (1 << V_PRED) | (1 << H_PRED) | (1 << D45_PRED) |
54  (1 << D135_PRED) | (1 << D113_PRED) | (1 << D157_PRED) |
55  (1 << D203_PRED) | (1 << D67_PRED) | (1 << SMOOTH_PRED) |
56  (1 << SMOOTH_V_PRED) | (1 << SMOOTH_H_PRED) | (1 << PAETH_PRED),
57  UV_INTRA_ALL =
58  (1 << UV_DC_PRED) | (1 << UV_V_PRED) | (1 << UV_H_PRED) |
59  (1 << UV_D45_PRED) | (1 << UV_D135_PRED) | (1 << UV_D113_PRED) |
60  (1 << UV_D157_PRED) | (1 << UV_D203_PRED) | (1 << UV_D67_PRED) |
61  (1 << UV_SMOOTH_PRED) | (1 << UV_SMOOTH_V_PRED) |
62  (1 << UV_SMOOTH_H_PRED) | (1 << UV_PAETH_PRED) | (1 << UV_CFL_PRED),
63  UV_INTRA_DC = (1 << UV_DC_PRED),
64  UV_INTRA_DC_CFL = (1 << UV_DC_PRED) | (1 << UV_CFL_PRED),
65  UV_INTRA_DC_TM = (1 << UV_DC_PRED) | (1 << UV_PAETH_PRED),
66  UV_INTRA_DC_PAETH_CFL =
67  (1 << UV_DC_PRED) | (1 << UV_PAETH_PRED) | (1 << UV_CFL_PRED),
68  UV_INTRA_DC_H_V = (1 << UV_DC_PRED) | (1 << UV_V_PRED) | (1 << UV_H_PRED),
69  UV_INTRA_DC_H_V_CFL = (1 << UV_DC_PRED) | (1 << UV_V_PRED) |
70  (1 << UV_H_PRED) | (1 << UV_CFL_PRED),
71  UV_INTRA_DC_PAETH_H_V = (1 << UV_DC_PRED) | (1 << UV_PAETH_PRED) |
72  (1 << UV_V_PRED) | (1 << UV_H_PRED),
73  UV_INTRA_DC_PAETH_H_V_CFL = (1 << UV_DC_PRED) | (1 << UV_PAETH_PRED) |
74  (1 << UV_V_PRED) | (1 << UV_H_PRED) |
75  (1 << UV_CFL_PRED),
76  INTRA_DC = (1 << DC_PRED),
77  INTRA_DC_TM = (1 << DC_PRED) | (1 << PAETH_PRED),
78  INTRA_DC_H_V = (1 << DC_PRED) | (1 << V_PRED) | (1 << H_PRED),
79  INTRA_DC_H_V_SMOOTH =
80  (1 << DC_PRED) | (1 << V_PRED) | (1 << H_PRED) | (1 << SMOOTH_PRED),
81  INTRA_DC_PAETH_H_V =
82  (1 << DC_PRED) | (1 << PAETH_PRED) | (1 << V_PRED) | (1 << H_PRED)
83 };
84 
85 enum {
86  INTER_ALL = (1 << NEARESTMV) | (1 << NEARMV) | (1 << GLOBALMV) |
87  (1 << NEWMV) | (1 << NEAREST_NEARESTMV) | (1 << NEAR_NEARMV) |
88  (1 << NEW_NEWMV) | (1 << NEAREST_NEWMV) | (1 << NEAR_NEWMV) |
89  (1 << NEW_NEARMV) | (1 << NEW_NEARESTMV) | (1 << GLOBAL_GLOBALMV),
90  INTER_NEAREST_NEAR_ZERO = (1 << NEARESTMV) | (1 << NEARMV) | (1 << GLOBALMV) |
91  (1 << NEAREST_NEARESTMV) | (1 << GLOBAL_GLOBALMV) |
92  (1 << NEAREST_NEWMV) | (1 << NEW_NEARESTMV) |
93  (1 << NEW_NEARMV) | (1 << NEAR_NEWMV) |
94  (1 << NEAR_NEARMV),
95  INTER_SINGLE_ALL =
96  (1 << NEARESTMV) | (1 << NEARMV) | (1 << GLOBALMV) | (1 << NEWMV),
97 };
98 
99 enum {
100  DISABLE_ALL_INTER_SPLIT = (1 << THR_COMP_GA) | (1 << THR_COMP_LA) |
101  (1 << THR_ALTR) | (1 << THR_GOLD) | (1 << THR_LAST),
102 
103  DISABLE_ALL_SPLIT = (1 << THR_INTRA) | DISABLE_ALL_INTER_SPLIT,
104 
105  DISABLE_COMPOUND_SPLIT = (1 << THR_COMP_GA) | (1 << THR_COMP_LA),
106 
107  LAST_AND_INTRA_SPLIT_ONLY = (1 << THR_COMP_GA) | (1 << THR_COMP_LA) |
108  (1 << THR_ALTR) | (1 << THR_GOLD)
109 };
110 
111 enum {
112  TXFM_CODING_SF = 1,
113  INTER_PRED_SF = 2,
114  INTRA_PRED_SF = 4,
115  PARTITION_SF = 8,
116  LOOP_FILTER_SF = 16,
117  RD_SKIP_SF = 32,
118  RESERVE_2_SF = 64,
119  RESERVE_3_SF = 128,
120 } UENUM1BYTE(DEV_SPEED_FEATURES);
121 
122 /* This enumeration defines when the rate control recode loop will be
123  * enabled.
124  */
125 enum {
126  /*
127  * No recodes allowed
128  */
129  DISALLOW_RECODE = 0,
130  /*
131  * Allow recode only for KF/ARF/GF frames
132  */
133  ALLOW_RECODE_KFARFGF = 1,
134  /*
135  * Allow recode for all frame types based on bitrate constraints.
136  */
137  ALLOW_RECODE = 2,
138 } UENUM1BYTE(RECODE_LOOP_TYPE);
139 
140 enum {
141  SUBPEL_TREE = 0,
142  SUBPEL_TREE_PRUNED = 1, // Prunes 1/2-pel searches
143  SUBPEL_TREE_PRUNED_MORE = 2, // Prunes 1/2-pel searches more aggressively
144  SUBPEL_SEARCH_METHODS
145 } UENUM1BYTE(SUBPEL_SEARCH_METHOD);
146 
147 enum {
148  // Try the full image with different values.
149  LPF_PICK_FROM_FULL_IMAGE,
150  // Try the full image filter search with non-dual filter only.
151  LPF_PICK_FROM_FULL_IMAGE_NON_DUAL,
152  // Try a small portion of the image with different values.
153  LPF_PICK_FROM_SUBIMAGE,
154  // Estimate the level based on quantizer and frame type
155  LPF_PICK_FROM_Q,
156  // Pick 0 to disable LPF if LPF was enabled last frame
157  LPF_PICK_MINIMAL_LPF
158 } UENUM1BYTE(LPF_PICK_METHOD);
164 typedef enum {
173  CDEF_PICK_METHODS
175 
177 enum {
178  // Terminate search early based on distortion so far compared to
179  // qp step, distortion in the neighborhood of the frame, etc.
180  FLAG_EARLY_TERMINATE = 1 << 0,
181 
182  // Skips comp inter modes if the best so far is an intra mode.
183  FLAG_SKIP_COMP_BESTINTRA = 1 << 1,
184 
185  // Skips oblique intra modes if the best so far is an inter mode.
186  FLAG_SKIP_INTRA_BESTINTER = 1 << 3,
187 
188  // Skips oblique intra modes at angles 27, 63, 117, 153 if the best
189  // intra so far is not one of the neighboring directions.
190  FLAG_SKIP_INTRA_DIRMISMATCH = 1 << 4,
191 
192  // Skips intra modes other than DC_PRED if the source variance is small
193  FLAG_SKIP_INTRA_LOWVAR = 1 << 5,
194 } UENUM1BYTE(MODE_SEARCH_SKIP_LOGIC);
195 
196 enum {
197  // No tx type pruning
198  TX_TYPE_PRUNE_0 = 0,
199  // adaptively prunes the least perspective tx types out of all 16
200  // (tuned to provide negligible quality loss)
201  TX_TYPE_PRUNE_1 = 1,
202  // similar, but applies much more aggressive pruning to get better speed-up
203  TX_TYPE_PRUNE_2 = 2,
204  TX_TYPE_PRUNE_3 = 3,
205  // More aggressive pruning based on tx type score and allowed tx count
206  TX_TYPE_PRUNE_4 = 4,
207  TX_TYPE_PRUNE_5 = 5,
208 } UENUM1BYTE(TX_TYPE_PRUNE_MODE);
209 
210 enum {
211  // No reaction to rate control on a detected slide/scene change.
212  NO_DETECTION = 0,
213 
214  // Set to larger Q based only on the detected slide/scene change and
215  // current/past Q.
216  FAST_DETECTION_MAXQ = 1,
217 } UENUM1BYTE(OVERSHOOT_DETECTION_CBR);
218 
219 enum {
220  // Turns off multi-winner mode. So we will do txfm search on either all modes
221  // if winner mode is off, or we will only on txfm search on a single winner
222  // mode.
223  MULTI_WINNER_MODE_OFF = 0,
224 
225  // Limits the number of winner modes to at most 2
226  MULTI_WINNER_MODE_FAST = 1,
227 
228  // Uses the default number of winner modes, which is 3 for intra mode, and 1
229  // for inter mode.
230  MULTI_WINNER_MODE_DEFAULT = 2,
231 
232  // Maximum number of winner modes allowed.
233  MULTI_WINNER_MODE_LEVELS,
234 } UENUM1BYTE(MULTI_WINNER_MODE_TYPE);
235 
236 enum {
237  PRUNE_NEARMV_OFF = 0, // Turn off nearmv pruning
238  PRUNE_NEARMV_LEVEL1 = 1, // Prune nearmv for qindex (0-85)
239  PRUNE_NEARMV_LEVEL2 = 2, // Prune nearmv for qindex (0-170)
240  PRUNE_NEARMV_LEVEL3 = 3, // Prune nearmv more aggressively for qindex (0-170)
241  PRUNE_NEARMV_MAX = PRUNE_NEARMV_LEVEL3,
242 } UENUM1BYTE(PRUNE_NEARMV_LEVEL);
243 
244 enum {
245  // Default transform search used in evaluation of best inter candidates
246  // (MODE_EVAL stage) and motion mode winner processing (WINNER_MODE_EVAL
247  // stage).
248  TX_SEARCH_DEFAULT = 0,
249  // Transform search in motion mode rd during MODE_EVAL stage.
250  TX_SEARCH_MOTION_MODE,
251  // Transform search in compound type mode rd during MODE_EVAL stage.
252  TX_SEARCH_COMP_TYPE_MODE,
253  // All transform search cases
254  TX_SEARCH_CASES
255 } UENUM1BYTE(TX_SEARCH_CASE);
256 
257 typedef struct {
258  TX_TYPE_PRUNE_MODE prune_2d_txfm_mode;
259 
260  // Limit the intra transform search type.
261  // 1 : Limit the intra transform search type to the ones in the table
262  // av1_derived_intra_tx_used_flag[INTRA_MODES].
263  // 2 : Limit the intra transform search type to the default transform.
264  int fast_intra_tx_type_search;
265 
266  // INT_MAX: Disable fast search.
267  // 1 - 1024: Probability threshold used for conditionally forcing tx type,
268  // during mode search.
269  // 0: Force tx type to be DCT_DCT unconditionally, during
270  // mode search.
271  int fast_inter_tx_type_prob_thresh;
272 
273  // Prune less likely chosen transforms for each intra mode. The speed
274  // feature ranges from 0 to 2, for different speed / compression trade offs.
275  int use_reduced_intra_txset;
276 
277  // Use a skip flag prediction model to detect blocks with skip = 1 early
278  // and avoid doing full TX type search for such blocks.
279  int use_skip_flag_prediction;
280 
281  // Threshold used by the ML based method to predict TX block split decisions.
282  int ml_tx_split_thresh;
283 
284  // skip remaining transform type search when we found the rdcost of skip is
285  // better than applying transform
286  int skip_tx_search;
287 
288  // Prune tx type search using previous frame stats.
289  int prune_tx_type_using_stats;
290  // Prune tx type search using estimated RDcost
291  int prune_tx_type_est_rd;
292 
293  // Flag used to control the winner mode processing for tx type pruning for
294  // inter blocks. It enables further tx type mode pruning based on ML model for
295  // mode evaluation and disables tx type mode pruning for winner mode
296  // processing.
297  int winner_mode_tx_type_pruning;
298 } TX_TYPE_SEARCH;
299 
300 enum {
301  // Search partitions using RD criterion
302  SEARCH_PARTITION,
303 
304  // Always use a fixed size partition
305  FIXED_PARTITION,
306 
307  // Partition using source variance
308  VAR_BASED_PARTITION,
309 
310 #if CONFIG_RT_ML_PARTITIONING
311  // Partition using ML model
312  ML_BASED_PARTITION
313 #endif
314 } UENUM1BYTE(PARTITION_SEARCH_TYPE);
315 
316 enum {
317  NOT_IN_USE,
318  DIRECT_PRED,
319  RELAXED_PRED,
320  ADAPT_PRED
321 } UENUM1BYTE(MAX_PART_PRED_MODE);
322 
323 enum {
324  LAST_MV_DATA,
325  CURRENT_Q,
326  QTR_ONLY,
327 } UENUM1BYTE(MV_PREC_LOGIC);
328 
329 enum {
330  SUPERRES_AUTO_ALL, // Tries all possible superres ratios
331  SUPERRES_AUTO_DUAL, // Tries no superres and q-based superres ratios
332  SUPERRES_AUTO_SOLO, // Only apply the q-based superres ratio
333 } UENUM1BYTE(SUPERRES_AUTO_SEARCH_TYPE);
351 typedef enum {
358 
363 typedef enum {
364  NO_PRUNING = -1,
383 
387 typedef enum {
392 
397 typedef enum {
399  0,
401  1,
403  2,
405  3,
407  4,
410 
417 
421  RECODE_LOOP_TYPE recode_loop;
422 
428 
435  MV_PREC_LOGIC high_precision_mv_usage;
436 
445 
449  SUPERRES_AUTO_SEARCH_TYPE superres_auto_search_type;
450 
455 
460 
470 
477 
484 
492 
500 
508 
520 
525 
530 
536 
538 typedef struct TPL_SPEED_FEATURES {
539  // GOP length adaptive decision.
540  // If set to 0, tpl model decides whether a shorter gf interval is better.
541  // If set to 1, tpl stats of ARFs from base layer, (base+1) layer and
542  // (base+2) layer decide whether a shorter gf interval is better.
543  // If set to 2, tpl stats of ARFs from base layer, (base+1) layer and GF boost
544  // decide whether a shorter gf interval is better.
545  // If set to 3, gop length adaptive decision is disabled.
546  int gop_length_decision_method;
547  // Prune the intra modes search by tpl.
548  // If set to 0, we will search all intra modes from DC_PRED to PAETH_PRED.
549  // If set to 1, we only search DC_PRED, V_PRED, and H_PRED.
550  int prune_intra_modes;
551  // This parameter controls which step in the n-step process we start at.
552  int reduce_first_step_size;
553  // Skip motion estimation based on the precision of center MVs and the
554  // difference between center MVs.
555  // If set to 0, motion estimation is skipped for duplicate center MVs
556  // (default). If set to 1, motion estimation is skipped for duplicate
557  // full-pixel center MVs. If set to 2, motion estimation is skipped if the
558  // difference between center MVs is less than the threshold.
559  int skip_alike_starting_mv;
560 
561  // When to stop subpel search.
562  SUBPEL_FORCE_STOP subpel_force_stop;
563 
564  // Which search method to use.
565  SEARCH_METHODS search_method;
566 
567  // Prune starting mvs in TPL based on sad scores.
568  int prune_starting_mv;
569 
570  // Prune reference frames in TPL.
571  int prune_ref_frames_in_tpl;
572 
573  // Support compound predictions.
574  int allow_compound_pred;
575 
576  // Calculate rate and distortion based on Y plane only.
577  int use_y_only_rate_distortion;
578 
579  // Use SAD instead of SATD during intra/inter mode search.
580  // If set to 0, use SATD always.
581  // If set to 1, use SAD during intra/inter mode search for frames in the
582  // higher temporal layers of the hierarchical prediction structure.
583  // If set to 2, use SAD during intra/inter mode search for all frames.
584  // This sf is disabled for the first GF group of the key-frame interval,
585  // i.e., SATD is used during intra/inter mode search of the first GF group.
586  int use_sad_for_mode_decision;
587 
588  // Skip tpl processing for frames of type LF_UPDATE.
589  // This sf is disabled for the first GF group of the key-frame interval.
590  int reduce_num_frames;
591 } TPL_SPEED_FEATURES;
592 
593 typedef struct GLOBAL_MOTION_SPEED_FEATURES {
594  GM_SEARCH_TYPE gm_search_type;
595 
596  // During global motion estimation, prune remaining reference frames in a
597  // given direction(past/future), if the evaluated ref_frame in that direction
598  // yields gm_type as INVALID/TRANSLATION/IDENTITY
599  int prune_ref_frame_for_gm_search;
600 
601  // When the current GM type is set to ZEROMV, prune ZEROMV if its performance
602  // is worse than NEWMV under SSE metric.
603  // 0 : no pruning
604  // 1 : conservative pruning
605  // 2 : aggressive pruning
607 
608  // Disable global motion estimation based on stats of previous frames in the
609  // GF group
610  int disable_gm_search_based_on_stats;
611 
612  // Downsampling pyramid level to use for global motion estimation
613  int downsample_level;
614 
615  // Number of refinement steps to apply after initial model generation
616  int num_refinement_steps;
617 
618  // Error advantage threshold level used to determine whether global motion
619  // compensation should be enabled
620  int gm_erroradv_tr_level;
621 } GLOBAL_MOTION_SPEED_FEATURES;
622 
623 typedef struct PARTITION_SPEED_FEATURES {
624  PARTITION_SEARCH_TYPE partition_search_type;
625 
626  // Used if partition_search_type = FIXED_PARTITION
627  BLOCK_SIZE fixed_partition_size;
628 
629  // Prune extended partition types search based on the current best partition
630  // and the combined rdcost of the subblocks estimated from previous
631  // partitions. Can take values 0 - 2, 0 referring to no pruning, and 1 - 2
632  // increasing aggressiveness of pruning in order.
633  int prune_ext_partition_types_search_level;
634 
635  // Prune part4 based on block size
636  int prune_part4_search;
637 
638  // Use a ML model to prune rectangular, ab and 4-way horz
639  // and vert partitions
640  int ml_prune_partition;
641 
642  // Use a ML model to adaptively terminate partition search after trying
643  // PARTITION_SPLIT. Can take values 0 - 2, 0 meaning not being enabled, and
644  // 1 - 2 increasing aggressiveness in order.
645  int ml_early_term_after_part_split_level;
646 
647  // Skip rectangular partition test when partition type none gives better
648  // rd than partition type split. Can take values 0 - 2, 0 referring to no
649  // skipping, and 1 - 2 increasing aggressiveness of skipping in order.
650  int less_rectangular_check_level;
651 
652  // Use square partition only beyond this block size.
653  BLOCK_SIZE use_square_partition_only_threshold;
654 
655  // Sets max square partition levels for this superblock based on
656  // motion vector and prediction error distribution produced from 16x16
657  // simple motion search
658  MAX_PART_PRED_MODE auto_max_partition_based_on_simple_motion;
659 
660  // Min and max square partition size we enable (block_size) as per auto
661  // min max, but also used by adjust partitioning, and pick_partitioning.
662  BLOCK_SIZE default_min_partition_size;
663  BLOCK_SIZE default_max_partition_size;
664 
665  // Sets level of adjustment of variance-based partitioning during
666  // rd_use_partition 0 - no partition adjustment, 1 - try to merge partitions
667  // for small blocks and high QP, 2 - try to merge partitions, 3 - try to merge
668  // and split leaf partitions and 0 - 3 decreasing aggressiveness in order.
669  int adjust_var_based_rd_partitioning;
670 
671  // Partition search early breakout thresholds.
672  int64_t partition_search_breakout_dist_thr;
673  int partition_search_breakout_rate_thr;
674 
675  // Thresholds for ML based partition search breakout.
676  float ml_partition_search_breakout_thresh[PARTITION_BLOCK_SIZES];
677 
678  // ML based partition search breakout model index
679  int ml_partition_search_breakout_model_index;
680 
681  // ML based partition search breakout model index
682  int ml_4_partition_search_level_index;
683 
684  // Aggressiveness levels for pruning split and rectangular partitions based on
685  // simple_motion_search. SIMPLE_AGG_LVL0 to SIMPLE_AGG_LVL5 correspond to
686  // simple motion search based pruning. QIDX_BASED_AGG_LVL1 corresponds to
687  // qindex based and simple motion search based pruning.
688  int simple_motion_search_prune_agg;
689 
690  // Perform simple_motion_search on each possible subblock and use it to prune
691  // PARTITION_HORZ and PARTITION_VERT.
692  int simple_motion_search_prune_rect;
693 
694  // Perform simple motion search before none_partition to decide if we
695  // want to remove all partitions other than PARTITION_SPLIT. If set to 0, this
696  // model is disabled. If set to 1, the model attempts to perform
697  // PARTITION_SPLIT only. If set to 2, the model also attempts to prune
698  // PARTITION_SPLIT.
699  int simple_motion_search_split;
700 
701  // Use features from simple_motion_search to terminate prediction block
702  // partition after PARTITION_NONE
703  int simple_motion_search_early_term_none;
704 
705  // Controls whether to reduce the number of motion search steps. If this is 0,
706  // then simple_motion_search has the same number of steps as
707  // single_motion_search (assuming no other speed features). Otherwise, reduce
708  // the number of steps by the value contained in this variable.
709  int simple_motion_search_reduce_search_steps;
710 
711  // This variable controls the maximum block size where intra blocks can be
712  // used in inter frames.
713  // TODO(aconverse): Fold this into one of the other many mode skips
714  BLOCK_SIZE max_intra_bsize;
715 
716  // Use CNN with luma pixels on source frame on each of the 64x64 subblock to
717  // perform partition pruning in intra frames.
718  // 0: No Pruning
719  // 1: Prune split and rectangular partitions only
720  // 2: Prune none, split and rectangular partitions
721  int intra_cnn_based_part_prune_level;
722 
723  // Disable extended partition search if the current bsize is greater than the
724  // threshold. Must be a square block size BLOCK_8X8 or higher.
725  BLOCK_SIZE ext_partition_eval_thresh;
726 
727  // Use best partition decision so far to tune 'ext_partition_eval_thresh'
728  int ext_part_eval_based_on_cur_best;
729 
730  // Disable rectangular partitions for larger block sizes.
731  int rect_partition_eval_thresh;
732 
733  // Prune extended partition search based on whether the split/rect partitions
734  // provided an improvement in the previous search.
735  // 0 : no pruning
736  // 1 : prune 1:4 partition search using winner info from split partitions
737  // 2 : prune 1:4 and AB partition search using split and HORZ/VERT info
738  int prune_ext_part_using_split_info;
739 
740  // Prunt rectangular, AB and 4-way partition based on q index and block size
741  // 0 : no pruning
742  // 1 : prune sub_8x8 at very low quantizers
743  // 2 : prune all block size based on qindex
744  int prune_rectangular_split_based_on_qidx;
745 
746  // Prune rectangular partitions based on 4x4 sub-block variance
747  // false : no pruning
748  // true : prune rectangular partitions based on 4x4 sub-block variance
749  // deviation
750  //
751  // For allintra encode, this speed feature reduces instruction count by 6.4%
752  // for speed=6 with coding performance change less than 0.24%. For AVIF image
753  // encode, this speed feature reduces encode time by 8.14% for speed 6 on a
754  // typical image dataset with coding performance change less than 0.16%. This
755  // speed feature is not applicable to speed >= 7.
756  bool prune_rect_part_using_4x4_var_deviation;
757 
758  // Prune rectangular partitions based on prediction mode chosen by NONE
759  // partition.
760  // false : no pruning
761  // true : prunes rectangular partition as described below
762  // If prediction mode chosen by NONE partition is
763  // DC_PRED or SMOOTH_PRED: Prunes both horizontal and vertical partitions if
764  // at least one of the left and top neighbor blocks is larger than the
765  // current block.
766  // Directional Mode: Prunes either of the horizontal and vertical partition
767  // based on center angle of the prediction mode chosen by NONE partition. For
768  // example, vertical partition is pruned if center angle of the prediction
769  // mode chosen by NONE partition is close to 180 degrees (i.e. horizontal
770  // direction) and vice versa.
771  // For allintra encode, this speed feature reduces instruction count by 5.1%
772  // for speed=6 with coding performance change less than 0.22%. For AVIF image
773  // encode, this speed feature reduces encode time by 4.44% for speed 6 on a
774  // typical image dataset with coding performance change less than 0.15%.
775  // For speed >= 7, variance-based logic is used to determine the partition
776  // structure instead of recursive partition search. Therefore, this speed
777  // feature is not applicable in such cases.
778  bool prune_rect_part_using_none_pred_mode;
779 
780  // Terminate partition search for child partition,
781  // when NONE and SPLIT partition rd_costs are INT64_MAX.
782  int early_term_after_none_split;
783 
784  // Level used to adjust threshold for av1_ml_predict_breakout(). At lower
785  // levels, more conservative threshold is used, and value of 0 indicates
786  // av1_ml_predict_breakout() is disabled. Value of 3 corresponds to default
787  // case with no adjustment to lbd thresholds.
788  int ml_predict_breakout_level;
789 
790  // Prune sub_8x8 (BLOCK_4X4, BLOCK_4X8 and BLOCK_8X4) partitions.
791  // 0 : no pruning
792  // 1 : pruning based on neighbour block information
793  // 2 : prune always
794  int prune_sub_8x8_partition_level;
795 
796  // Prune rectangular split based on simple motion search split/no_split score.
797  // 0: disable pruning, 1: enable pruning
798  int simple_motion_search_rect_split;
799 
800  // The current encoder adopts a DFS search for block partitions.
801  // Therefore the mode selection and associated rdcost is ready for smaller
802  // blocks before the mode selection for some partition types.
803  // AB partition could use previous rd information and skip mode search.
804  // An example is:
805  //
806  // current block
807  // +---+---+
808  // | |
809  // + +
810  // | |
811  // +-------+
812  //
813  // SPLIT partition has been searched first before trying HORZ_A
814  // +---+---+
815  // | R | R |
816  // +---+---+
817  // | R | R |
818  // +---+---+
819  //
820  // HORZ_A
821  // +---+---+
822  // | | |
823  // +---+---+
824  // | |
825  // +-------+
826  //
827  // With this speed feature, the top two sub blocks can directly use rdcost
828  // searched in split partition, and the mode info is also copied from
829  // saved info. Similarly, the bottom rectangular block can also use
830  // the available information from previous rectangular search.
831  int reuse_prev_rd_results_for_part_ab;
832 
833  // Reuse the best prediction modes found in PARTITION_SPLIT and PARTITION_RECT
834  // when encoding PARTITION_AB.
835  int reuse_best_prediction_for_part_ab;
836 
837  // The current partition search records the best rdcost so far and uses it
838  // in mode search and transform search to early skip when some criteria is
839  // met. For example, when the current rdcost is larger than the best rdcost,
840  // or the model rdcost is larger than the best rdcost times some thresholds.
841  // By default, this feature is turned on to speed up the encoder partition
842  // search.
843  // If disabling it, at speed 0, 30 frames, we could get
844  // about -0.25% quality gain (psnr, ssim, vmaf), with about 13% slowdown.
845  int use_best_rd_for_pruning;
846 
847  // Skip evaluation of non-square partitions based on the corresponding NONE
848  // partition.
849  // 0: no pruning
850  // 1: prune extended partitions if NONE is skippable
851  // 2: on top of 1, prune rectangular partitions if NONE is inter, not a newmv
852  // mode and skippable
853  int skip_non_sq_part_based_on_none;
854 
855  // Disables 8x8 and below partitions for low quantizers.
856  int disable_8x8_part_based_on_qidx;
857 
858  // Disables either of PARTITION_HORZ_4 or PARTITION_VERT_4 using SSE from
859  // simple motion search.
860  bool prune_h_or_v_4part_using_sms_info;
861 
862  // Decoder side speed feature to add penalty for use of smaller partitions.
863  // Takes values 0 - 2, 0 indicating no penalty and higher level indicating
864  // increased penalty.
865  int split_partition_penalty_level;
866 } PARTITION_SPEED_FEATURES;
867 
868 typedef struct MV_SPEED_FEATURES {
869  // Motion search method (Diamond, NSTEP, Hex, Big Diamond, Square, etc).
870  SEARCH_METHODS search_method;
871 
872  // Enable the use of faster, less accurate mv search method
873  // 0: Disable
874  // 1 - 3: Disable for larger bsize
875  // 4: Based on bsize, SAD and qp
876  // TODO(chiyotsai@google.com): Take the clip's resolution and mv activity into
877  // account.
878  int use_bsize_dependent_search_method;
879 
880  // If this is set to 1, we limit the motion search range to 2 times the
881  // largest motion vector found in the last frame.
882  int auto_mv_step_size;
883 
884  // Subpel_search_method can only be subpel_tree which does a subpixel
885  // logarithmic search that keeps stepping at 1/2 pixel units until
886  // you stop getting a gain, and then goes on to 1/4 and repeats
887  // the same process. Along the way it skips many diagonals.
888  SUBPEL_SEARCH_METHOD subpel_search_method;
889 
890  // Maximum number of steps in logarithmic subpel search before giving up.
891  int subpel_iters_per_step;
892 
893  // When to stop subpel search.
894  SUBPEL_FORCE_STOP subpel_force_stop;
895 
896  // When to stop subpel search in simple motion search.
897  SUBPEL_FORCE_STOP simple_motion_subpel_force_stop;
898 
899  // If true, sub-pixel search uses the exact convolve function used for final
900  // encoding and decoding; otherwise, it uses bilinear interpolation.
901  SUBPEL_SEARCH_TYPE use_accurate_subpel_search;
902 
903  // Threshold for allowing exhaustive motion search.
904  int exhaustive_searches_thresh;
905 
906  // Pattern to be used for any exhaustive mesh searches (except intraBC ME).
907  MESH_PATTERN mesh_patterns[MAX_MESH_STEP];
908 
909  // Pattern to be used for exhaustive mesh searches of intraBC ME.
910  MESH_PATTERN intrabc_mesh_patterns[MAX_MESH_STEP];
911 
912  // Reduce single motion search range based on MV result of prior ref_mv_idx.
913  int reduce_search_range;
914 
915  // Prune mesh search.
916  PRUNE_MESH_SEARCH_LEVEL prune_mesh_search;
917 
918  // Use the rd cost around the best FULLPEL_MV to speed up subpel search
919  int use_fullpel_costlist;
920 
921  // Set the full pixel search level of obmc
922  // 0: obmc_full_pixel_diamond
923  // 1: obmc_refining_search_sad (faster)
924  int obmc_full_pixel_search_level;
925 
926  // Accurate full pixel motion search based on TPL stats.
927  int full_pixel_search_level;
928 
929  // Allow intrabc motion search
930  int use_intrabc;
931 
932  // Prune intrabc candidate block hash search
933  // 0: check every block hash candidate
934  // 1: check the first 64 block hash candidates only
935  int prune_intrabc_candidate_block_hash_search;
936 
937  // Intrabc search level
938  // 0: top + left search, all block sizes, always hash plus pixel search
939  // 1: top search only, 4x4, 8x8 and 16x16 block sizes only, perform pixel
940  // search if and only if hash search failed to find a candidate
941  int intrabc_search_level;
942 
943  // Whether the maximum intrabc block size to hash is 8x8
944  // 0: Hash from 4x4 up to superblock size
945  // 1: Hash 4x4 and 8x8 only
946  int hash_max_8x8_intrabc_blocks;
947 
948  // Whether to downsample the rows in sad calculation during motion search.
949  // This is only active when there are at least 16 rows. When this sf is
950  // active, if there is a large discrepancy in the SAD values for the final
951  // motion vector between skipping vs not skipping, motion search is redone
952  // with skip row features off.
953  // 0: Disabled (do not downsample rows)
954  // 1: Skip SAD calculation of odd rows if the SAD deviation of the even and
955  // odd rows for the starting MV is small. Redo motion search with sf off
956  // when SAD deviation is high for the final motion vector.
957  // 2: Skip SAD calculation of odd rows. SAD deviation is not tested for the
958  // start MV and tested only for the final MV.
959  int use_downsampled_sad;
960 
961  // Enable/disable extensive joint motion search.
962  int disable_extensive_joint_motion_search;
963 
964  // Enable second best mv check in joint mv search.
965  // 0: allow second MV (use rd cost as the metric)
966  // 1: use var as the metric
967  // 2: disable second MV
968  int disable_second_mv;
969 
970  // Skips full pixel search based on closeness of start mv and ref mv
971  // of previous search.
972  // 0: Disabled
973  // 1: Skips the full pixel search upto 4 neighbor full-pel start MV and ref MV
974  // positions.
975  // 2: Skips the full pixel search upto 8 neighbor full-pel start MV and ref MV
976  // positions.
977  int skip_fullpel_search_using_startmv_refmv;
978 
979  // Method to use for refining WARPED_CAUSAL motion vectors
980  // TODO(rachelbarker): Can this be unified with OBMC in some way?
981  WARP_SEARCH_METHOD warp_search_method;
982 
983  // Maximum number of iterations in WARPED_CAUSAL refinement search
984  int warp_search_iters;
985 } MV_SPEED_FEATURES;
986 
987 typedef struct INTER_MODE_SPEED_FEATURES {
988  // 2-pass inter mode model estimation where the preliminary pass skips
989  // transform search and uses a model to estimate rd, while the final pass
990  // computes the full transform search. Two types of models are supported:
991  // 0: not used
992  // 1: used with online dynamic rd model
993  // 2: used with static rd model
994  int inter_mode_rd_model_estimation;
995 
996  // Bypass transform search based on skip rd at following stages
997  // i. Compound type mode search
998  // ii. Motion mode search (mode evaluation and winner motion mode stage)
999  // iii. Transform search for best inter candidates
1000  int txfm_rd_gate_level[TX_SEARCH_CASES];
1001 
1002  // Limit the inter mode tested in the RD loop
1003  int reduce_inter_modes;
1004 
1005  // This variable is used to cap the maximum number of times we skip testing a
1006  // mode to be evaluated. A high value means we will be faster.
1007  int adaptive_rd_thresh;
1008 
1009  // Aggressively prune inter modes when best mode is skippable.
1010  int prune_inter_modes_if_skippable;
1011 
1012  // Drop less likely to be picked reference frames in the RD search.
1013  // Has seven levels for now: 0, 1, 2, 3, 4, 5 and 6 where higher levels prune
1014  // more aggressively than lower ones. (0 means no pruning).
1015  int selective_ref_frame;
1016 
1017  // Prune reference frames for rectangular partitions.
1018  // 0 implies no pruning
1019  // 1 implies prune for extended partition
1020  // 2 implies prune horiz, vert and extended partition
1021  int prune_ref_frame_for_rect_partitions;
1022 
1023  // Prune inter modes w.r.t past reference frames
1024  // 0 no pruning
1025  // 1 prune inter modes w.r.t ALTREF2 and ALTREF reference frames
1026  // 2 prune inter modes w.r.t BWDREF, ALTREF2 and ALTREF reference frames
1027  int alt_ref_search_fp;
1028 
1029  // Prune reference frames for single prediction modes based on temporal
1030  // distance and pred MV SAD. Feasible values are 0-4. The feature is
1031  // disabled for 0. An increasing value indicates more aggressive pruning
1032  // threshold.
1033  int prune_single_ref;
1034 
1035  // Prune compound reference frames
1036  // 0 no pruning
1037  // 1 prune based on temporal distance and pred_mv_sad. However, disallow
1038  // pruning of important reference frame pairs decided based on temporal
1039  // distance and quality.
1040  // 2 prune compound references which do not satisfy the two conditions:
1041  // a) The references are at a nearest distance from the current frame in
1042  // both past and future direction.
1043  // b) The references have minimum pred_mv_sad in both past and future
1044  // direction.
1045  // 3 prune compound references except the one with nearest distance from the
1046  // current frame in both past and future direction.
1047  int prune_comp_ref_frames;
1048 
1049  // Skip the current ref_mv in NEW_MV mode based on mv, rate cost, etc.
1050  // This speed feature equaling 0 means no skipping.
1051  // If the speed feature equals 1 or 2, skip the current ref_mv in NEW_MV mode
1052  // if we have already encountered ref_mv in the drl such that:
1053  // 1. The other drl has the same mv during the SIMPLE_TRANSLATION search
1054  // process as the current mv.
1055  // 2. The rate needed to encode the current mv is larger than that for the
1056  // other ref_mv.
1057  // The speed feature equaling 1 means using subpel mv in the comparison.
1058  // The speed feature equaling 2 means using fullpel mv in the comparison.
1059  // If the speed feature >= 3, skip the current ref_mv in NEW_MV mode based on
1060  // known full_mv bestsme and drl cost.
1061  int skip_newmv_in_drl;
1062 
1063  // This speed feature checks duplicate ref MVs among NEARESTMV, NEARMV,
1064  // GLOBALMV and skips NEARMV or GLOBALMV (in order) if a duplicate is found
1065  // TODO(any): Instead of skipping repeated ref mv, use the recalculated
1066  // rd-cost based on mode rate and skip the mode evaluation
1067  int skip_repeated_ref_mv;
1068 
1069  // Flag used to control the ref_best_rd based gating for chroma
1070  int perform_best_rd_based_gating_for_chroma;
1071 
1072  // Reuse the inter_intra_mode search result from NEARESTMV mode to other
1073  // single ref modes
1074  int reuse_inter_intra_mode;
1075 
1076  // prune wedge and compound segment approximate rd evaluation based on
1077  // compound average modeled rd
1078  int prune_comp_type_by_model_rd;
1079 
1080  // prune wedge and compound segment approximate rd evaluation based on
1081  // compound average rd/ref_best_rd
1082  int prune_comp_type_by_comp_avg;
1083 
1084  // Skip some ref frames in compound motion search by single motion search
1085  // result. Has three levels for now: 0 referring to no skipping, and 1 - 3
1086  // increasing aggressiveness of skipping in order.
1087  // Note: The search order might affect the result. It assumes that the single
1088  // reference modes are searched before compound modes. It is better to search
1089  // same single inter mode as a group.
1090  int prune_comp_search_by_single_result;
1091 
1092  // Instead of performing a full MV search, do a simple translation first
1093  // and only perform a full MV search on the motion vectors that performed
1094  // well.
1095  int prune_mode_search_simple_translation;
1096 
1097  // Only search compound modes with at least one "good" reference frame.
1098  // A reference frame is good if, after looking at its performance among
1099  // the single reference modes, it is one of the two best performers.
1100  int prune_compound_using_single_ref;
1101 
1102  // Skip extended compound mode (NEAREST_NEWMV, NEW_NEARESTMV, NEAR_NEWMV,
1103  // NEW_NEARMV) using ref frames of above and left neighbor
1104  // blocks.
1105  // 0 : no pruning
1106  // 1 : prune ext compound modes using neighbor blocks (less aggressiveness)
1107  // 2 : prune ext compound modes using neighbor blocks (high aggressiveness)
1108  // 3 : prune ext compound modes unconditionally (highest aggressiveness)
1109  int prune_ext_comp_using_neighbors;
1110 
1111  // Skip NEW_NEARMV and NEAR_NEWMV extended compound modes
1112  int skip_ext_comp_nearmv_mode;
1113 
1114  // Skip extended compound mode when ref frame corresponding to NEWMV does not
1115  // have NEWMV as single mode winner.
1116  // 0 : no pruning
1117  // 1 : prune extended compound mode (less aggressiveness)
1118  // 2 : prune extended compound mode (high aggressiveness)
1119  int prune_comp_using_best_single_mode_ref;
1120 
1121  // Skip NEARESTMV and NEARMV using weight computed in ref mv list population
1122  //
1123  // Pruning is enabled only when both the top and left neighbor blocks are
1124  // available and when the current block already has a valid inter prediction.
1125  int prune_nearest_near_mv_using_refmv_weight;
1126 
1127  // Based on previous ref_mv_idx search result, prune the following search.
1128  int prune_ref_mv_idx_search;
1129 
1130  // Disable one sided compound modes.
1131  int disable_onesided_comp;
1132 
1133  // Prune obmc search using previous frame stats.
1134  // INT_MAX : disable obmc search
1135  int prune_obmc_prob_thresh;
1136 
1137  // Prune warped motion search using previous frame stats.
1138  int prune_warped_prob_thresh;
1139 
1140  // Variance threshold to enable/disable Interintra wedge search
1141  unsigned int disable_interintra_wedge_var_thresh;
1142 
1143  // Variance threshold to enable/disable Interinter wedge search
1144  unsigned int disable_interinter_wedge_var_thresh;
1145 
1146  // De-couple wedge and mode search during interintra RDO.
1147  int fast_interintra_wedge_search;
1148 
1149  // Whether fast wedge sign estimate is used
1150  int fast_wedge_sign_estimate;
1151 
1152  // Enable/disable ME for interinter wedge search.
1153  int disable_interinter_wedge_newmv_search;
1154 
1155  // Decide when and how to use joint_comp.
1156  DIST_WTD_COMP_FLAG use_dist_wtd_comp_flag;
1157 
1158  // Clip the frequency of updating the mv cost.
1159  INTERNAL_COST_UPDATE_TYPE mv_cost_upd_level;
1160 
1161  // Clip the frequency of updating the coeff cost.
1162  INTERNAL_COST_UPDATE_TYPE coeff_cost_upd_level;
1163 
1164  // Clip the frequency of updating the mode cost.
1165  INTERNAL_COST_UPDATE_TYPE mode_cost_upd_level;
1166 
1167  // Prune inter modes based on tpl stats
1168  // 0 : no pruning
1169  // 1 : Allow pruning of LAST2 frame
1170  // 2 - 4: Allow pruning of all reference frames with increased aggressiveness
1171  // of pruning in order
1172  int prune_inter_modes_based_on_tpl;
1173 
1174  // Skip NEARMV and NEAR_NEARMV modes using ref frames of above and left
1175  // neighbor blocks and qindex.
1176  PRUNE_NEARMV_LEVEL prune_nearmv_using_neighbors;
1177 
1178  // Model based breakout after interpolation filter search
1179  // 0: no breakout
1180  // 1: use model based rd breakout
1181  int model_based_post_interp_filter_breakout;
1182 
1183  // Reuse compound type rd decision when exact match is found
1184  // 0: No reuse
1185  // 1: Reuse the compound type decision
1186  int reuse_compound_type_decision;
1187 
1188  // Enable/disable masked compound.
1189  int disable_masked_comp;
1190 
1191  // Enable/disable MV refinement for compound modes corresponds to compound
1192  // types COMPOUND_AVERAGE, COMPOUND_DISTWTD (currently, this compound type
1193  // is disabled for speeds >= 2 using the sf 'use_dist_wtd_comp_flag') and
1194  // COMPOUND_DIFFWTD based on the availability. Levels 0 to 3 indicate
1195  // increasing order of aggressiveness to disable MV refinement.
1196  // 0: MV Refinement is enabled and for NEW_NEWMV mode used two iterations of
1197  // refinement in av1_joint_motion_search().
1198  // 1: MV Refinement is disabled for COMPOUND_DIFFWTD and enabled for
1199  // COMPOUND_AVERAGE & COMPOUND_DISTWTD.
1200  // 2: MV Refinement is enabled for COMPOUND_AVERAGE & COMPOUND_DISTWTD for
1201  // NEW_NEWMV mode with one iteration of refinement in
1202  // av1_joint_motion_search() and MV Refinement is disabled for other compound
1203  // type modes.
1204  // 3: MV Refinement is disabled.
1205  int enable_fast_compound_mode_search;
1206 
1207  // Reuse masked compound type search results
1208  int reuse_mask_search_results;
1209 
1210  // Enable/disable fast search for wedge masks
1211  int enable_fast_wedge_mask_search;
1212 
1213  // Early breakout from transform search of inter modes
1214  int inter_mode_txfm_breakout;
1215 
1216  // Limit number of inter modes for txfm search if a newmv mode gets
1217  // evaluated among the top modes.
1218  // 0: no pruning
1219  // 1 to 3 indicate increasing order of aggressiveness
1220  int limit_inter_mode_cands;
1221 
1222  // Cap the no. of txfm searches for a given prediction mode.
1223  // 0: no cap, 1: cap beyond first 4 searches, 2: cap beyond first 3 searches.
1224  int limit_txfm_eval_per_mode;
1225 
1226  // Prune warped motion search based on block size.
1227  int extra_prune_warped;
1228 
1229  // Do not search compound modes for ARF.
1230  // The intuition is that ARF is predicted by frames far away from it,
1231  // whose temporal correlations with the ARF are likely low.
1232  // It is therefore likely that compound modes do not work as well for ARF
1233  // as other inter frames.
1234  // Speed/quality impact:
1235  // Speed 1: 12% faster, 0.1% psnr loss.
1236  // Speed 2: 2% faster, 0.05% psnr loss.
1237  // No change for speed 3 and up, because |disable_onesided_comp| is true.
1238  int skip_arf_compound;
1239 
1240  // Percentage of scaling used to increase the rd cost of warp mode so that
1241  // encoder decisions are biased against local warp, favoring low complexity
1242  // modes.
1243  int bias_warp_mode_rd_scale_pct;
1244 
1245  // Percentage of scaling used to increase the rd cost of obmc motion mode so
1246  // that encoder decisions are biased against local obmc, favoring low
1247  // complexity modes.
1248  float bias_obmc_mode_rd_scale_pct;
1249 
1250  // Avoid further evaluation of compound modes using top estimate RD Costs of
1251  // compound average.
1252  // Values are 0 (not used),1 - 3 with progressively increasing
1253  // aggressiveness, i.e., decreasing number of top candidates.
1254  int skip_cmp_using_top_cmp_avg_est_rd_lvl;
1255 
1256  // Skip interinter wedge search based on MSE between the two predictors.
1257  int skip_interinter_wedge_search_based_on_mse;
1258 } INTER_MODE_SPEED_FEATURES;
1259 
1260 typedef struct INTERP_FILTER_SPEED_FEATURES {
1261  // Do limited interpolation filter search for dual filters, since best choice
1262  // usually includes EIGHTTAP_REGULAR.
1263  int use_fast_interpolation_filter_search;
1264 
1265  // Disable dual filter
1266  int disable_dual_filter;
1267 
1268  // Save results of av1_interpolation_filter_search for a block
1269  // Check mv and ref_frames before search, if they are very close with previous
1270  // saved results, filter search can be skipped.
1271  int use_interp_filter;
1272 
1273  // skip sharp_filter evaluation based on regular and smooth filter rd for
1274  // dual_filter=0 case
1275  int skip_sharp_interp_filter_search;
1276 
1277  // skip interpolation filter search for a block in chessboard pattern
1278  int cb_pred_filter_search;
1279 
1280  // adaptive interp_filter search to allow skip of certain filter types.
1281  int adaptive_interp_filter_search;
1282 
1283  // Forces interpolation filter to EIGHTTAP_REGULAR and skips interpolation
1284  // filter search.
1285  int skip_interp_filter_search;
1286 
1287  // Bias towards sharp filter
1288  int use_more_sharp_interp;
1289 
1290  // Skip model RD evaluation of chroma planes during interpolation filter
1291  // search.
1292  int skip_model_rd_uv;
1293 } INTERP_FILTER_SPEED_FEATURES;
1294 
1295 typedef struct INTRA_MODE_SPEED_FEATURES {
1296  // These bit masks allow you to enable or disable intra modes for each
1297  // transform size separately.
1298  int intra_y_mode_mask[TX_SIZES];
1299  int intra_uv_mode_mask[TX_SIZES];
1300 
1301  // flag to allow skipping intra mode for inter frame prediction
1302  int skip_intra_in_interframe;
1303 
1304  // Prune intra mode candidates based on source block histogram of gradient.
1305  // Applies to luma plane only.
1306  // Feasible values are 0..4. The feature is disabled for 0. An increasing
1307  // value indicates more aggressive pruning threshold.
1308  int intra_pruning_with_hog;
1309 
1310  // Prune intra mode candidates based on source block histogram of gradient.
1311  // Applies to chroma plane only.
1312  // Feasible values are 0..4. The feature is disabled for 0. An increasing
1313  // value indicates more aggressive pruning threshold.
1314  int chroma_intra_pruning_with_hog;
1315 
1316  // Enable/disable smooth intra modes.
1317  int disable_smooth_intra;
1318 
1319  // Prune UV_SMOOTH_PRED mode for chroma based on chroma source variance.
1320  // false : No pruning
1321  // true : Prune UV_SMOOTH_PRED mode based on chroma source variance
1322  //
1323  // For allintra encode, this speed feature reduces instruction count
1324  // by 1.90%, 2.21% and 1.97% for speed 6, 7 and 8 with coding performance
1325  // change less than 0.04%. For AVIF image encode, this speed feature reduces
1326  // encode time by 1.56%, 2.14% and 0.90% for speed 6, 7 and 8 on a typical
1327  // image dataset with coding performance change less than 0.05%.
1328  bool prune_smooth_intra_mode_for_chroma;
1329 
1330  // Prune filter intra modes in intra frames.
1331  // 0 : No pruning
1332  // 1 : Evaluate applicable filter intra modes based on best intra mode so far
1333  // 2 : Do not evaluate filter intra modes
1334  int prune_filter_intra_level;
1335 
1336  // prune palette search
1337  // 0: No pruning
1338  // 1: Perform coarse search to prune the palette colors. For winner colors,
1339  // neighbors are also evaluated using a finer search.
1340  // 2: Perform 2 way palette search from max colors to min colors (and min
1341  // colors to remaining colors) and terminate the search if current number of
1342  // palette colors is not the winner.
1343  int prune_palette_search_level;
1344 
1345  // Terminate early in luma palette_size search. Speed feature values indicate
1346  // increasing level of pruning.
1347  // 0: No early termination
1348  // 1: Terminate early for higher luma palette_size, if header rd cost of lower
1349  // palette_size is more than 2 * best_rd. This level of pruning is more
1350  // conservative when compared to sf level 2 as the cases which will get pruned
1351  // with sf level 1 is a subset of the cases which will get pruned with sf
1352  // level 2.
1353  // 2: Terminate early for higher luma palette_size, if header rd cost of lower
1354  // palette_size is more than best_rd.
1355  // For allintra encode, this sf reduces instruction count by 2.49%, 1.07%,
1356  // 2.76%, 2.30%, 1.84%, 2.69%, 2.04%, 2.05% and 1.44% for speed 0, 1, 2, 3, 4,
1357  // 5, 6, 7 and 8 on screen content set with coding performance change less
1358  // than 0.01% for speed <= 2 and less than 0.03% for speed >= 3. For AVIF
1359  // image encode, this sf reduces instruction count by 1.94%, 1.13%, 1.29%,
1360  // 0.93%, 0.89%, 1.03%, 1.07%, 1.20% and 0.18% for speed 0, 1, 2, 3, 4, 5, 6,
1361  // 7 and 8 on a typical image dataset with coding performance change less than
1362  // 0.01%.
1363  int prune_luma_palette_size_search_level;
1364 
1365  // Prune chroma intra modes based on luma intra mode winner.
1366  // 0: No pruning
1367  // 1: Prune chroma intra modes other than UV_DC_PRED, UV_SMOOTH_PRED,
1368  // UV_CFL_PRED and the mode that corresponds to luma intra mode winner.
1369  int prune_chroma_modes_using_luma_winner;
1370 
1371  // Clip the frequency of updating the mv cost for intrabc.
1372  INTERNAL_COST_UPDATE_TYPE dv_cost_upd_level;
1373 
1374  // We use DCT_DCT transform followed by computing SATD (Sum of Absolute
1375  // Transformed Differences) as an estimation of RD score to quickly find the
1376  // best possible Chroma from Luma (CFL) parameter. Then we do a full RD search
1377  // near the best possible parameter. The search range is set here.
1378  // The range of cfl_searh_range should be [1, 33], and the following are the
1379  // recommended values.
1380  // 1: Fastest mode.
1381  // 3: Default mode that provides good speedup without losing compression
1382  // performance at speed 0.
1383  // 33: Exhaustive rd search (33 == CFL_MAGS_SIZE). This mode should only
1384  // be used for debugging purpose.
1385  int cfl_search_range;
1386 
1387  // TOP_INTRA_MODEL_COUNT is 4 that is the number of top model rd to store in
1388  // intra mode decision. Here, add a speed feature to reduce this number for
1389  // higher speeds.
1390  int top_intra_model_count_allowed;
1391 
1392  // Adapt top_intra_model_count_allowed locally to prune luma intra modes using
1393  // neighbor block and quantizer information.
1394  int adapt_top_model_rd_count_using_neighbors;
1395 
1396  // Prune the evaluation of odd delta angles of directional luma intra modes by
1397  // using the rdcosts of neighbouring delta angles.
1398  // For allintra encode, this speed feature reduces instruction count
1399  // by 4.461%, 3.699% and 3.536% for speed 6, 7 and 8 on a typical video
1400  // dataset with coding performance change less than 0.26%. For AVIF image
1401  // encode, this speed feature reduces encode time by 2.849%, 2.471%,
1402  // and 2.051% for speed 6, 7 and 8 on a typical image dataset with coding
1403  // performance change less than 0.27%.
1404  int prune_luma_odd_delta_angles_in_intra;
1405 
1406  // Terminate early in chroma palette_size search.
1407  // 0: No early termination
1408  // 1: Terminate early for higher palette_size, if header rd cost of lower
1409  // palette_size is more than best_rd.
1410  // For allintra encode, this sf reduces instruction count by 0.45%,
1411  // 0.62%, 1.73%, 2.50%, 2.89%, 3.09% and 3.86% for speed 0 to 6 on screen
1412  // content set with coding performance change less than 0.01%.
1413  // For AVIF image encode, this sf reduces instruction count by 0.45%, 0.81%,
1414  // 0.85%, 1.05%, 1.45%, 1.66% and 1.95% for speed 0 to 6 on a typical image
1415  // dataset with no quality drop.
1416  int early_term_chroma_palette_size_search;
1417 
1418  // Skips the evaluation of filter intra modes in inter frames if rd evaluation
1419  // of luma intra dc mode results in invalid rd stats.
1420  int skip_filter_intra_in_inter_frames;
1421 } INTRA_MODE_SPEED_FEATURES;
1422 
1423 typedef struct TX_SPEED_FEATURES {
1424  // Init search depth for square and rectangular transform partitions.
1425  // Values:
1426  // 0 - search full tree, 1: search 1 level, 2: search the highest level only
1427  int inter_tx_size_search_init_depth_sqr;
1428  int inter_tx_size_search_init_depth_rect;
1429  int intra_tx_size_search_init_depth_sqr;
1430  int intra_tx_size_search_init_depth_rect;
1431 
1432  // If any dimension of a coding block size above 64, always search the
1433  // largest transform only, since the largest transform block size is 64x64.
1434  int tx_size_search_lgr_block;
1435 
1436  TX_TYPE_SEARCH tx_type_search;
1437 
1438  // Skip split transform block partition when the collocated bigger block
1439  // is selected as all zero coefficients.
1440  int txb_split_cap;
1441 
1442  // Shortcut the transform block partition and type search when the target
1443  // rdcost is relatively lower.
1444  // Values are 0 (not used) , or 1 - 2 with progressively increasing
1445  // aggressiveness
1446  int adaptive_txb_search_level;
1447 
1448  // Prune level for tx_size_type search for inter based on rd model
1449  // 0: no pruning
1450  // 1-2: progressively increasing aggressiveness of pruning
1451  int model_based_prune_tx_search_level;
1452 
1453  // Refine TX type after fast TX search.
1454  int refine_fast_tx_search_results;
1455 
1456  // Prune transform split/no_split eval based on residual properties. A value
1457  // of 0 indicates no pruning, and the aggressiveness of pruning progressively
1458  // increases from levels 1 to 3.
1459  int prune_tx_size_level;
1460 
1461  // Prune the evaluation of transform depths as decided by the NN model.
1462  // false: No pruning.
1463  // true : Avoid the evaluation of specific transform depths using NN model.
1464  //
1465  // For allintra encode, this speed feature reduces instruction count
1466  // by 4.76%, 8.92% and 11.28% for speed 6, 7 and 8 with coding performance
1467  // change less than 0.32%. For AVIF image encode, this speed feature reduces
1468  // encode time by 4.65%, 9.16% and 10.45% for speed 6, 7 and 8 on a typical
1469  // image dataset with coding performance change less than 0.19%.
1470  bool prune_intra_tx_depths_using_nn;
1471 
1472  // Enable/disable early breakout during transform search of intra modes, by
1473  // using the minimum rd cost possible. By using this approach, the rd
1474  // evaluation of applicable transform blocks (in the current block) can be
1475  // avoided as
1476  // 1) best_rd evolves during the search in choose_tx_size_type_from_rd()
1477  // 2) appropriate ref_best_rd is passed in intra_block_yrd()
1478  //
1479  // For allintra encode, this speed feature reduces instruction count
1480  // by 1.11%, 1.08%, 1.02% and 0.93% for speed 3, 6, 7 and 8 with coding
1481  // performance change less than 0.02%. For AVIF image encode, this speed
1482  // feature reduces encode time by 0.93%, 1.46%, 1.07%, 0.84%, 0.99% and 0.73%
1483  // for speed 3, 4, 5, 6, 7 and 8 on a typical image dataset with coding
1484  // performance change less than 0.004%.
1485  bool use_rd_based_breakout_for_intra_tx_search;
1486 
1487  // Prune RD evaluation of transform split using RD Costs of transform no-split
1488  // of inter modes that are evaluated so far.
1489  // Values are 0 (not used), 1 - 2 with progressively increasing
1490  // aggressiveness, i.e., decreasing number of top candidates
1491  int prune_inter_tx_split_rd_eval_lvl;
1492 
1493  // If 1, use a trellis rd multiplier that favors chroma plane more.
1494  int use_chroma_trellis_rd_mult;
1495 } TX_SPEED_FEATURES;
1496 
1497 typedef struct RD_CALC_SPEED_FEATURES {
1498  // Fast approximation of av1_model_rd_from_var_lapndz
1499  int simple_model_rd_from_var;
1500 
1501  // Perform faster distortion computation during the R-D evaluation by trying
1502  // to approximate the prediction error with transform coefficients (faster but
1503  // less accurate) rather than computing distortion in the pixel domain (slower
1504  // but more accurate). The following methods are used for distortion
1505  // computation:
1506  // Method 0: Always compute distortion in the pixel domain
1507  // Method 1: Based on block error, try using transform domain distortion for
1508  // tx_type search and compute distortion in pixel domain for final RD_STATS
1509  // Method 2: Based on block error, try to compute distortion in transform
1510  // domain
1511  // Methods 1 and 2 may fallback to computing distortion in the pixel domain in
1512  // case the block error is less than the threshold, which is controlled by the
1513  // speed feature tx_domain_dist_thres_level.
1514  //
1515  // The speed feature tx_domain_dist_level decides which of the above methods
1516  // needs to be used across different mode evaluation stages as described
1517  // below:
1518  // Eval type: Default Mode Winner
1519  // Level 0 : Method 0 Method 2 Method 0
1520  // Level 1 : Method 1 Method 2 Method 0
1521  // Level 2 : Method 2 Method 2 Method 0
1522  // Level 3 : Method 2 Method 2 Method 2
1523  int tx_domain_dist_level;
1524 
1525  // Transform domain distortion threshold level
1526  int tx_domain_dist_thres_level;
1527 
1528  // Trellis (dynamic programming) optimization of quantized values
1529  TRELLIS_OPT_TYPE optimize_coefficients;
1530 
1531  // Use hash table to store macroblock RD search results
1532  // to avoid repeated search on the same residue signal.
1533  int use_mb_rd_hash;
1534 
1535  // Flag used to control the extent of coeff R-D optimization
1536  int perform_coeff_opt;
1537 } RD_CALC_SPEED_FEATURES;
1538 
1539 typedef struct WINNER_MODE_SPEED_FEATURES {
1540  // Flag used to control the winner mode processing for better R-D optimization
1541  // of quantized coeffs
1542  int enable_winner_mode_for_coeff_opt;
1543 
1544  // Flag used to control the winner mode processing for transform size
1545  // search method
1546  int enable_winner_mode_for_tx_size_srch;
1547 
1548  // Control transform size search level
1549  // Eval type: Default Mode Winner
1550  // Level 0 : FULL RD LARGEST ALL FULL RD
1551  // Level 1 : FAST RD LARGEST ALL FULL RD
1552  // Level 2 : LARGEST ALL LARGEST ALL FULL RD
1553  // Level 3 : LARGEST ALL LARGEST ALL LARGEST ALL
1554  int tx_size_search_level;
1555 
1556  // Flag used to control the winner mode processing for use transform
1557  // domain distortion
1558  int enable_winner_mode_for_use_tx_domain_dist;
1559 
1560  // Flag used to enable processing of multiple winner modes
1561  MULTI_WINNER_MODE_TYPE multi_winner_mode_type;
1562 
1563  // Motion mode for winner candidates:
1564  // 0: speed feature OFF
1565  // 1 / 2 : Use configured number of winner candidates
1566  int motion_mode_for_winner_cand;
1567 
1568  // Controls the prediction of transform skip block or DC only block.
1569  //
1570  // Different speed feature values (0 to 3) decide the aggressiveness of
1571  // prediction (refer to predict_dc_levels[][] in speed_features.c) to be used
1572  // during different mode evaluation stages.
1573  int dc_blk_pred_level;
1574 
1575  // If on, disables interpolation filter search in handle_inter_mode loop, and
1576  // performs it during winner mode processing by \ref
1577  // tx_search_best_inter_candidates.
1578  int winner_mode_ifs;
1579 
1580  // Controls the disabling of winner mode processing. Speed feature levels
1581  // are ordered in increasing aggressiveness of pruning. The method considered
1582  // for disabling, depends on the sf level value and it is described as below.
1583  // 0: Do not disable
1584  // 1: Disable for blocks with low source variance.
1585  // 2: Disable for blocks which turn out to be transform skip (skipped based on
1586  // eob) during MODE_EVAL stage except NEWMV mode.
1587  // 3: Disable for blocks which turn out to be transform skip during MODE_EVAL
1588  // stage except NEWMV mode. For high quantizers, prune conservatively based on
1589  // transform skip (skipped based on eob) except for NEWMV mode.
1590  // 4: Disable for blocks which turn out to be transform skip during MODE_EVAL
1591  // stage.
1592  int prune_winner_mode_eval_level;
1593 } WINNER_MODE_SPEED_FEATURES;
1594 
1595 typedef struct LOOP_FILTER_SPEED_FEATURES {
1596  // This feature controls how the loop filter level is determined.
1597  LPF_PICK_METHOD lpf_pick;
1598 
1599  // Skip some final iterations in the determination of the best loop filter
1600  // level.
1601  int use_coarse_filter_level_search;
1602 
1603  // Reset luma filter levels to zero based on minimum filter levels of
1604  // reference frames and current frame's pyramid level.
1605  int adaptive_luma_loop_filter_skip;
1606 
1607  // Reset luma filter levels to zero when the percentage of SSE difference
1608  // between the unfiltered and filtered versions of the current frame is below
1609  // a threshold.
1610  int skip_loop_filter_using_filt_error;
1611 
1612  // Control how the CDEF strength is determined.
1613  CDEF_PICK_METHOD cdef_pick_method;
1614 
1615  // Decoder side speed feature for adaptive CDEF with strength reduction.
1616  // Zero out values with low CDEF strengths (luma and/or chroma). This is
1617  // done as CDEF is a relatively-expensive filter to compute during decode.
1618  // This speed feature is only enabled in all intra mode.
1619  bool zero_low_cdef_strengths;
1620 
1621  // Decoder side speed feature for adaptive CDEF control based on MSE
1622  // 0 : Enable CDEF for all planes
1623  // 1 : Disable CDEF for chroma planes and disable for luma adaptively based on
1624  // current frame's pyramid level and improvement in MSE after CDEF
1625  // filtering.
1626  int adaptive_cdef_mode;
1627 
1628  // Decoder side speed feature to add penalty for use of dual-sgr filters.
1629  // Takes values 0 - 10, 0 indicating no penalty and each additional level
1630  // adding a penalty of 1%
1631  int dual_sgr_penalty_level;
1632 
1633  // Restricts loop restoration to RESTORE_SWITCHABLE by skipping RD cost
1634  // comparisons for RESTORE_WIENER and RESTORE_SGRPROJ. Also applies a bias
1635  // during switchable restoration search: each level adds a 0.5% penalty to
1636  // Wiener and SGR selection.
1637  // 0 : No restriction or bias (all restoration types allowed)
1638  // 1+: Skip WIENER/SGRPROJ and apply (level x 0.5%) penalty in
1639  // search_switchable()
1640  int switchable_lr_with_bias_level;
1641 
1642  // Enable fast search in self guided restoration
1643  // 0 : Search over all 16 SGR projection parameters listed
1644  // in av1_sgr_params[SGRPROJ_PARAMS].
1645  // 1 : Approximate search using binary search like mechanism,
1646  // a total of 8 SGR projection parameters are searched.
1647  // 2 : Search only 'ep' values in
1648  // sgproj_ep_grp1_seed[SGRPROJ_EP_GRP1_SEARCH_COUNT],
1649  // a total of 4 SGR projection parameters are searched.
1650  int enable_sgr_ep_pruning;
1651 
1652  // Disable loop restoration for Chroma plane
1653  int disable_loop_restoration_chroma;
1654 
1655  // Disable loop restoration for luma plane
1656  int disable_loop_restoration_luma;
1657 
1658  // Range of loop restoration unit sizes to search
1659  // The minimum size is clamped against the superblock size in
1660  // av1_pick_filter_restoration, so that the code which sets this value does
1661  // not need to know the superblock size ahead of time.
1662  int min_lr_unit_size;
1663  int max_lr_unit_size;
1664 
1665  // Prune RESTORE_WIENER evaluation based on source variance
1666  // 0 : no pruning
1667  // 1 : conservative pruning
1668  // 2 : aggressive pruning
1669  int prune_wiener_based_on_src_var;
1670 
1671  // Prune self-guided loop restoration based on wiener search results
1672  // 0 : no pruning
1673  // 1 : pruning based on rdcost ratio of RESTORE_WIENER and RESTORE_NONE
1674  // 2 : pruning based on winner restoration type among RESTORE_WIENER and
1675  // RESTORE_NONE
1676  int prune_sgr_based_on_wiener;
1677 
1678  // Reduce the wiener filter win size for luma
1679  int reduce_wiener_window_size;
1680 
1681  // Flag to disable Wiener Loop restoration filter.
1682  bool disable_wiener_filter;
1683 
1684  // Flag to disable Self-guided Loop restoration filter.
1685  bool disable_sgr_filter;
1686 
1687  // Disable the refinement search around the wiener filter coefficients.
1688  bool disable_wiener_coeff_refine_search;
1689 
1690  // Whether to downsample the rows in computation of wiener stats.
1691  int use_downsampled_wiener_stats;
1692 } LOOP_FILTER_SPEED_FEATURES;
1693 
1694 typedef struct REAL_TIME_SPEED_FEATURES {
1695  // check intra prediction for non-RD mode.
1696  int check_intra_pred_nonrd;
1697 
1698  // Skip checking intra prediction.
1699  // 0 - don't skip
1700  // 1 - skip if TX is skipped and best mode is not NEWMV
1701  // 2 - skip if TX is skipped
1702  // Skipping aggressiveness increases from level 1 to 2.
1703  int skip_intra_pred;
1704 
1705  // Estimate motion before calculating variance in variance-based partition
1706  // 0 - Only use zero MV
1707  // 1 - perform coarse ME
1708  // 2 - perform coarse ME, and also use neighbours' MVs
1709  // 3 - use neighbours' MVs without performing coarse ME
1710  int estimate_motion_for_var_based_partition;
1711 
1712  // For nonrd_use_partition: mode of extra check of leaf partition
1713  // 0 - don't check merge
1714  // 1 - always check merge
1715  // 2 - check merge and prune checking final split
1716  // 3 - check merge and prune checking final split based on bsize and qindex
1717  int nonrd_check_partition_merge_mode;
1718 
1719  // For nonrd_use_partition: check of leaf partition extra split
1720  int nonrd_check_partition_split;
1721 
1722  // Implements various heuristics to skip searching modes
1723  // The heuristics selected are based on flags
1724  // defined in the MODE_SEARCH_SKIP_HEURISTICS enum
1725  unsigned int mode_search_skip_flags;
1726 
1727  // For nonrd: Reduces ref frame search.
1728  // 0 - low level of search prune in non last frames
1729  // 1 - pruned search in non last frames
1730  // 2 - more pruned search in non last frames
1731  int nonrd_prune_ref_frame_search;
1732 
1733  // This flag controls the use of non-RD mode decision.
1734  int use_nonrd_pick_mode;
1735 
1736  // Flag that controls discounting for color map cost during palette search.
1737  // This saves about 5% of CPU and in non-RD speeds delivers better results
1738  // across rtc_screen set (on speed 10 overall BDRate growth is 13%)
1739  int discount_color_cost;
1740 
1741  // Use ALTREF frame in non-RD mode decision.
1742  int use_nonrd_altref_frame;
1743 
1744  // Use compound reference for non-RD mode.
1745  int use_comp_ref_nonrd;
1746 
1747  // Reference frames for compound prediction for nonrd pickmode:
1748  // LAST_GOLDEN (0), LAST_LAST2 (1), or LAST_ALTREF (2).
1749  int ref_frame_comp_nonrd[3];
1750 
1751  // use reduced ref set for real-time mode
1752  int use_real_time_ref_set;
1753 
1754  // Skip a number of expensive mode evaluations for blocks with very low
1755  // temporal variance.
1756  int short_circuit_low_temp_var;
1757 
1758  // Reuse inter prediction in fast non-rd mode.
1759  int reuse_inter_pred_nonrd;
1760 
1761  // Number of best inter modes to search transform. INT_MAX - search all.
1762  int num_inter_modes_for_tx_search;
1763 
1764  // Use interpolation filter search in non-RD mode decision.
1765  int use_nonrd_filter_search;
1766 
1767  // Use simplified RD model for interpolation search and Intra
1768  int use_simple_rd_model;
1769 
1770  // For nonrd mode: use hybrid intra mode search for intra only frames based on
1771  // block properties.
1772  // 0 : use nonrd pick intra for all blocks
1773  // 1 : use rd for bsize < 16x16, nonrd otherwise
1774  // 2 : use rd for bsize < 16x16 and src var >= 101, nonrd otherwise
1775  int hybrid_intra_pickmode;
1776 
1777  // Filter blocks by certain criteria such as SAD, source variance, such that
1778  // fewer blocks will go through the palette search.
1779  // For nonrd encoding path, enable this feature reduces encoding time when
1780  // palette mode is used. Disabling it leads to better compression efficiency.
1781  // 0: off
1782  // 1: less aggressive pruning mode
1783  // 2, 3: more aggressive pruning mode
1784  int prune_palette_search_nonrd;
1785 
1786  // Compute variance/sse on source difference, prior to encoding superblock.
1787  int source_metrics_sb_nonrd;
1788 
1789  // Flag to indicate process for handling overshoot on slide/scene change,
1790  // for real-time CBR mode.
1791  OVERSHOOT_DETECTION_CBR overshoot_detection_cbr;
1792 
1793  // Check for scene/content change detection on every frame before encoding.
1794  int check_scene_detection;
1795 
1796  // For keyframes in rtc: adjust the rc_bits_per_mb, to reduce overshoot.
1797  int rc_adjust_keyframe;
1798 
1799  // On scene change or keyframe: compute spatial variance.
1800  int rc_compute_spatial_var_sc_kf;
1801 
1802  // For nonrd mode: Prefer larger partition blks in variance based partitioning
1803  // 0: disabled, 1-3: increasing aggressiveness
1804  int prefer_large_partition_blocks;
1805 
1806  // uses results of temporal noise estimate
1807  int use_temporal_noise_estimate;
1808 
1809  // Parameter indicating initial search window to be used in full-pixel search
1810  // for nonrd_pickmode. Range [0, MAX_MVSEARCH_STEPS - 1]. Lower value
1811  // indicates larger window. If set to 0, step_param is set based on internal
1812  // logic in set_mv_search_params().
1813  int fullpel_search_step_param;
1814 
1815  // Bit mask to enable or disable intra modes for each prediction block size
1816  // separately, for nonrd_pickmode. Currently, the sf is not respected when
1817  // 'force_intra_check' is true in 'av1_estimate_intra_mode()' function. Also,
1818  // H and V pred modes allowed through this sf can be further pruned when
1819  //'prune_hv_pred_modes_using_src_sad' sf is true.
1820  int intra_y_mode_bsize_mask_nrd[BLOCK_SIZES];
1821 
1822  // Prune H and V intra predition modes evalution in inter frame.
1823  // The sf does not have any impact.
1824  // i. when frame_source_sad is 1.1 times greater than avg_source_sad
1825  // ii. when cyclic_refresh_segment_id_boosted is enabled
1826  // iii. when SB level source sad is greater than kMedSad
1827  // iv. when color sensitivity is non zero for both the chroma channels
1828  bool prune_hv_pred_modes_using_src_sad;
1829 
1830  // Skips mode checks more aggressively in nonRD mode
1831  int nonrd_aggressive_skip;
1832 
1833  // Skip cdef on 64x64 blocks/
1834  // 0: disabled
1835  // 1: skip when NEWMV or INTRA is not picked or color sensitivity is off.
1836  // When color sensitivity is on for a superblock, all 64x64 blocks within
1837  // will not skip.
1838  // 2: more aggressive mode where skip is done for all frames where
1839  // rc->high_source_sad = 0 (non slide-changes), and color sensitivity off.
1840  int skip_cdef_sb;
1841 
1842  // Force selective cdf update.
1843  int selective_cdf_update;
1844 
1845  // Force only single reference (LAST) for prediction.
1846  int force_only_last_ref;
1847 
1848  // Forces larger partition blocks in variance based partitioning for intra
1849  // frames
1850  int force_large_partition_blocks_intra;
1851 
1852  // Use fixed partition for superblocks based on source_sad.
1853  // 0: disabled
1854  // 1: enabled
1855  int use_fast_fixed_part;
1856 
1857  // Increase source_sad thresholds in nonrd pickmode.
1858  int increase_source_sad_thresh;
1859 
1860  // Skip evaluation of no split in tx size selection for merge partition
1861  int skip_tx_no_split_var_based_partition;
1862 
1863  // Intermediate termination of newMV mode evaluation based on so far best mode
1864  // sse
1865  int skip_newmv_mode_based_on_sse;
1866 
1867  // Define gf length multiplier.
1868  // Level 0: use large multiplier, level 1: use medium multiplier.
1869  int gf_length_lvl;
1870 
1871  // Prune inter modes with golden frame as reference for NEARMV and NEWMV modes
1872  int prune_inter_modes_with_golden_ref;
1873 
1874  // Prune inter modes w.r.t golden or alt-ref frame based on sad
1875  int prune_inter_modes_wrt_gf_arf_based_on_sad;
1876 
1877  // Prune inter mode search in rd path based on current block's temporal
1878  // variance wrt LAST reference.
1879  int prune_inter_modes_using_temp_var;
1880 
1881  // Reduce MV precision to halfpel for higher int MV value & frame-level motion
1882  // 0: disabled
1883  // 1-2: Reduce precision to halfpel, fullpel based on conservative
1884  // thresholds, aggressiveness increases with increase in level
1885  // 3: Reduce precision to halfpel using more aggressive thresholds
1886  int reduce_mv_pel_precision_highmotion;
1887 
1888  // Reduce MV precision for low complexity blocks
1889  // 0: disabled
1890  // 1: Reduce the mv resolution for zero mv if the variance is low
1891  // 2: Switch to halfpel, fullpel based on low block spatial-temporal
1892  // complexity.
1893  int reduce_mv_pel_precision_lowcomplex;
1894 
1895  // Prune intra mode evaluation in inter frames based on mv range.
1896  BLOCK_SIZE prune_intra_mode_based_on_mv_range;
1897  // The number of times to left shift the splitting thresholds in variance
1898  // based partitioning. The minimum values should be 7 to avoid left shifting
1899  // by a negative number.
1900  int var_part_split_threshold_shift;
1901 
1902  // Qindex based variance partition threshold index, which determines
1903  // the aggressiveness of partition pruning
1904  // 0: disabled for speeds 9,10
1905  // 1,2: (rd-path) lowers qindex thresholds conditionally (for low SAD sb)
1906  // 3,4: (non-rd path) uses pre-tuned qindex thresholds
1907  int var_part_based_on_qidx;
1908 
1909  // Enable GF refresh based on Q value.
1910  int gf_refresh_based_on_qp;
1911 
1912  // Temporal filtering
1913  // The value can be 1 or 2, which indicates the threshold to use.
1914  // Must be off for lossless mode.
1915  int use_rtc_tf;
1916 
1917  // Use of the identity transform in nonrd_pickmode,
1918  int use_idtx_nonrd;
1919 
1920  // Prune the use of the identity transform in nonrd_pickmode:
1921  // only for smaller blocks and higher spatial variance, and when skip_txfm
1922  // is not already set.
1923  int prune_idtx_nonrd;
1924 
1925  // Force to only use dct for palette search in nonrd pickmode.
1926  int dct_only_palette_nonrd;
1927 
1928  // Skip loopfilter, for static content after slide change
1929  // or key frame, once quality has ramped up.
1930  // 0: disabled
1931  // 1: skip only after quality is ramped up.
1932  // 2: aggrssive mode, where skip is done for all frames that
1933  // where rc->high_source_sad = 0 (no slide-changes).
1934  int skip_lf_screen;
1935 
1936  // Threshold on the active/inactive region percent to disable
1937  // the loopfilter and cdef. Setting to 100 disables this feature.
1938  int thresh_active_maps_skip_lf_cdef;
1939 
1940  // For nonrd: early exit out of variance partition that sets the
1941  // block size to superblock size, and sets mode to zeromv-last skip.
1942  // 0: disabled
1943  // 1: zeromv-skip is enabled at SB level only
1944  // 2: zeromv-skip is enabled at SB level and coding block level
1945  int part_early_exit_zeromv;
1946 
1947  // Early terminate inter mode search based on sse in non-rd path.
1948  INTER_SEARCH_EARLY_TERM_IDX sse_early_term_inter_search;
1949 
1950  // SAD based adaptive altref selection
1951  int sad_based_adp_altref_lag;
1952 
1953  // Enable/disable partition direct merging.
1954  int partition_direct_merging;
1955 
1956  // Level of aggressiveness for obtaining tx size based on qstep
1957  int tx_size_level_based_on_qstep;
1958 
1959  // Avoid the partitioning of a 16x16 block in variance based partitioning
1960  // (VBP) by making use of minimum and maximum sub-block variances.
1961  // For allintra encode, this speed feature reduces instruction count by 5.39%
1962  // for speed 9 on a typical video dataset with coding performance gain
1963  // of 1.44%.
1964  // For AVIF image encode, this speed feature reduces encode time
1965  // by 8.44% for speed 9 on a typical image dataset with coding performance
1966  // gain of 0.78%.
1967  bool vbp_prune_16x16_split_using_min_max_sub_blk_var;
1968 
1969  // A qindex threshold that determines whether to use qindex based CDEF filter
1970  // strength estimation for screen content types. The strength estimation model
1971  // used for screen contents prefers to allow cdef filtering for more frames.
1972  // This sf is used to limit the frames which go through cdef filtering and
1973  // following explains the setting of the same.
1974  // MAXQ (255): This disables the usage of this sf. Here, frame does not use a
1975  // screen content model thus reduces the number of frames that go through cdef
1976  // filtering.
1977  // MINQ (0): Frames always use screen content model thus increasing the number
1978  // of frames that go through cdef filtering.
1979  // This speed feature has a substantial gain on coding metrics, with moderate
1980  // increase encoding time. Select threshold based on speed vs quality
1981  // trade-off.
1982  int screen_content_cdef_filter_qindex_thresh;
1983 
1984  // Prune compound mode if its variance is higher than the variance of single
1985  // modes.
1986  bool prune_compoundmode_with_singlecompound_var;
1987 
1988  // Allow mode cost update at frame level every couple frames. This
1989  // overrides the command line setting --mode-cost-upd-freq=3 (never update
1990  // except on key frame and first delta).
1991  bool frame_level_mode_cost_update;
1992 
1993  // Prune H_PRED during intra mode evaluation in the nonrd path based on best
1994  // mode so far.
1995  //
1996  // For allintra encode, this speed feature reduces instruction count by 1.10%
1997  // for speed 9 with coding performance change less than 0.04%.
1998  // For AVIF image encode, this speed feature reduces encode time by 1.03% for
1999  // speed 9 on a typical image dataset with coding performance change less than
2000  // 0.08%.
2001  bool prune_h_pred_using_best_mode_so_far;
2002 
2003  // Enable pruning of intra mode evaluations in nonrd path based on source
2004  // variance and best mode so far. The pruning logic is enabled only if the
2005  // mode is not a winner mode of both the neighboring blocks (left/top).
2006  //
2007  // For allintra encode, this speed feature reduces instruction count by 3.96%
2008  // for speed 9 with coding performance change less than 0.38%.
2009  // For AVIF image encode, this speed feature reduces encode time by 3.46% for
2010  // speed 9 on a typical image dataset with coding performance change less than
2011  // -0.06%.
2012  bool enable_intra_mode_pruning_using_neighbors;
2013 
2014  // Prune intra mode evaluations in nonrd path based on best sad so far.
2015  //
2016  // For allintra encode, this speed feature reduces instruction count by 3.05%
2017  // for speed 9 with coding performance change less than 0.24%.
2018  // For AVIF image encode, this speed feature reduces encode time by 1.87% for
2019  // speed 9 on a typical image dataset with coding performance change less than
2020  // 0.16%.
2021  bool prune_intra_mode_using_best_sad_so_far;
2022 
2023  // If compound is enabled, and the current block size is \geq BLOCK_16X16,
2024  // limit the compound modes to GLOBAL_GLOBALMV. This does not apply to the
2025  // base layer of svc.
2026  bool check_only_zero_zeromv_on_large_blocks;
2027 
2028  // Allow for disabling cdf update for non reference frames in svc mode.
2029  bool disable_cdf_update_non_reference_frame;
2030 
2031  // Prune compound modes if the single modes variances do not perform well.
2032  bool prune_compoundmode_with_singlemode_var;
2033 
2034  // Skip searching all compound mode if the variance of single_mode residue is
2035  // sufficiently low.
2036  bool skip_compound_based_on_var;
2037 
2038  // Sets force_zeromv_skip based on the source sad available. Aggressiveness
2039  // increases with increase in the level set for speed feature.
2040  // 0: No setting
2041  // 1: If source sad is kZeroSad
2042  // 2: If source sad <= kVeryLowSad
2043  int set_zeromv_skip_based_on_source_sad;
2044 
2045  // Downgrades the block-level subpel motion search to
2046  // av1_find_best_sub_pixel_tree_pruned_more for higher QP and when fullpel
2047  // search performed well, zeromv has low sad or low source_var
2048  bool use_adaptive_subpel_search;
2049 
2050  // A flag used in RTC case to control frame_refs_short_signaling. Note that
2051  // the final decision is made in check_frame_refs_short_signaling(). The flag
2052  // can only be turned on when res < 360p and speed >= 9, in which case only
2053  // LAST and GOLDEN ref frames are used now.
2054  bool enable_ref_short_signaling;
2055 
2056  // A flag that controls if we check or bypass GLOBALMV in rtc single ref frame
2057  // case.
2058  bool check_globalmv_on_single_ref;
2059 
2060  // Allows for increasing the color_threshold for palette prediction.
2061  // This generally leads to better coding efficiency but with some speed loss.
2062  // Only used for screen content and for nonrd_pickmode.
2063  bool increase_color_thresh_palette;
2064 
2065  // Flag to indicate selecting of higher threshold for scenee change detection.
2066  int higher_thresh_scene_detection;
2067 
2068  // FLag to indicate skip testing of NEWMV for flat blocks.
2069  int skip_newmv_flat_blocks_screen;
2070 
2071  // Flag to force skip encoding for non_reference_frame on slide/scene changes.
2072  int skip_encoding_non_reference_slide_change;
2073 
2074  // Flag to indicate more aggressive QP downward adjustment for screen static
2075  // content, to make convergence to min_qp faster.
2076  int rc_faster_convergence_static;
2077 
2078  // Skip NEWMV mode evaluation based on sad for screen content.
2079  int skip_newmv_mode_sad_screen;
2080 } REAL_TIME_SPEED_FEATURES;
2081 
2087 typedef struct SPEED_FEATURES {
2092 
2097 
2101  TPL_SPEED_FEATURES tpl_sf;
2102 
2106  GLOBAL_MOTION_SPEED_FEATURES gm_sf;
2107 
2111  PARTITION_SPEED_FEATURES part_sf;
2112 
2116  MV_SPEED_FEATURES mv_sf;
2117 
2121  INTER_MODE_SPEED_FEATURES inter_sf;
2122 
2126  INTERP_FILTER_SPEED_FEATURES interp_sf;
2127 
2131  INTRA_MODE_SPEED_FEATURES intra_sf;
2132 
2136  TX_SPEED_FEATURES tx_sf;
2137 
2141  RD_CALC_SPEED_FEATURES rd_sf;
2142 
2146  WINNER_MODE_SPEED_FEATURES winner_mode_sf;
2147 
2151  LOOP_FILTER_SPEED_FEATURES lpf_sf;
2152 
2156  REAL_TIME_SPEED_FEATURES rt_sf;
2157 } SPEED_FEATURES;
2160 struct AV1_COMP;
2161 
2175  int speed);
2176 
2189  int speed);
2202 
2203 #ifdef __cplusplus
2204 } // extern "C"
2205 #endif
2206 
2207 #endif // AOM_AV1_ENCODER_SPEED_FEATURES_H_
Definition: speed_features.h:390
void av1_set_speed_features_framesize_independent(struct AV1_COMP *cpi, int speed)
Frame size independent speed vs quality trade off flags.
int accurate_bit_estimate
Definition: speed_features.h:476
MV_SPEED_FEATURES mv_sf
Definition: speed_features.h:2116
int allow_sub_blk_me_in_tf
Definition: speed_features.h:491
int recode_tolerance
Definition: speed_features.h:427
INTER_SEARCH_EARLY_TERM_IDX
This enumeration defines inter search early termination index in non-rd path based on sse value...
Definition: speed_features.h:397
Definition: speed_features.h:170
RD_CALC_SPEED_FEATURES rd_sf
Definition: speed_features.h:2141
Definition: speed_features.h:365
Definition: speed_features.h:371
int disable_extra_sc_testing
Definition: speed_features.h:454
CDEF_PICK_METHOD
This enumeration defines a variety of CDEF pick methods.
Definition: speed_features.h:164
PARTITION_SPEED_FEATURES part_sf
Definition: speed_features.h:2111
struct HIGH_LEVEL_SPEED_FEATURES HIGH_LEVEL_SPEED_FEATURES
Sequence/frame level speed vs quality features.
int skip_zeromv_motion_search
Skips the motion search centered on 0,0 mv.
Definition: speed_features.h:534
Definition: speed_features.h:370
Definition: speed_features.h:398
int screen_detection_mode2_fast_detection
Definition: speed_features.h:506
Definition: speed_features.h:353
int static_segmentation
Definition: speed_features.h:444
struct FIRST_PASS_SPEED_FEATURES FIRST_PASS_SPEED_FEATURES
Definition: speed_features.h:402
Definition: speed_features.h:171
Definition: speed_features.h:406
int reduce_mv_step_param
Reduces the mv search window. By default, the initial search window is around MIN(MIN(dims), MAX_FULL_PEL_VAL) = MIN(MIN(dims), 1023). Each step reduction decrease the window size by about a factor of 2.
Definition: speed_features.h:519
int adjust_num_frames_for_arf_filtering
Definition: speed_features.h:469
MV_PREC_LOGIC high_precision_mv_usage
Definition: speed_features.h:435
int frame_parameter_update
Definition: speed_features.h:416
SUPERRES_AUTO_SEARCH_TYPE superres_auto_search_type
Definition: speed_features.h:449
Definition: speed_features.h:355
Definition: speed_features.h:376
Definition: speed_features.h:366
PRUNE_MESH_SEARCH_LEVEL
This enumeration defines a variety of mesh search prune levels.
Definition: speed_features.h:387
Top level speed vs quality trade off data struture.
Definition: speed_features.h:2087
Definition: speed_features.h:167
TX_SPEED_FEATURES tx_sf
Definition: speed_features.h:2136
Definition: speed_features.h:172
LOOP_FILTER_SPEED_FEATURES lpf_sf
Definition: speed_features.h:2151
Definition: speed_features.h:380
WINNER_MODE_SPEED_FEATURES winner_mode_sf
Definition: speed_features.h:2146
HIGH_LEVEL_SPEED_FEATURES hl_sf
Definition: speed_features.h:2091
Definition: speed_features.h:165
INTRA_MODE_SPEED_FEATURES intra_sf
Definition: speed_features.h:2131
static int prune_zero_mv_with_sse(const aom_variance_fn_ptr_t *fn_ptr, const MACROBLOCK *x, BLOCK_SIZE bsize, const HandleInterModeArgs *args, int prune_zero_mv_with_sse)
Prunes ZeroMV Search Using Best NEWMV's SSE.
Definition: rdopt.c:2809
Definition: speed_features.h:404
INTER_MODE_SPEED_FEATURES inter_sf
Definition: speed_features.h:2121
Definition: speed_features.h:512
Definition: speed_features.h:367
SIMPLE_MOTION_SEARCH_PRUNE_LEVEL
This enumeration defines a variety of simple motion search based partition prune levels.
Definition: speed_features.h:363
Definition: speed_features.h:408
FIRST_PASS_SPEED_FEATURES fp_sf
Definition: speed_features.h:2096
Sequence/frame level speed vs quality features.
Definition: speed_features.h:414
Definition: speed_features.h:352
void av1_set_speed_features_framesize_dependent(struct AV1_COMP *cpi, int speed)
Frame size dependent speed vs quality trade off flags.
Definition: speed_features.h:356
int second_alt_ref_filtering
Definition: speed_features.h:459
int disable_recon
Skips reconstruction by using source buffers for prediction.
Definition: speed_features.h:529
struct SPEED_FEATURES SPEED_FEATURES
Top level speed vs quality trade off data struture.
Definition: speed_features.h:400
Top level encoder structure.
Definition: encoder.h:2897
Definition: speed_features.h:369
Definition: speed_features.h:374
INTERNAL_COST_UPDATE_TYPE
This enum decides internally how often to update the entropy costs.
Definition: speed_features.h:351
REAL_TIME_SPEED_FEATURES rt_sf
Definition: speed_features.h:2156
Definition: speed_features.h:368
RECODE_LOOP_TYPE recode_loop
Definition: speed_features.h:421
int speed
Definition: encoder.h:3119
Definition: speed_features.h:388
int ref_frame_mvs_lvl
Definition: speed_features.h:499
Definition: speed_features.h:166
GLOBAL_MOTION_SPEED_FEATURES gm_sf
Definition: speed_features.h:2106
TPL_SPEED_FEATURES tpl_sf
Definition: speed_features.h:2101
Definition: speed_features.h:168
Definition: speed_features.h:354
int weight_calc_level_in_tf
Definition: speed_features.h:483
int skip_motion_search_threshold
Skips the motion search when the zero mv has small sse.
Definition: speed_features.h:524
INTERP_FILTER_SPEED_FEATURES interp_sf
Definition: speed_features.h:2126
void av1_set_speed_features_qindex_dependent(struct AV1_COMP *cpi, int speed)
Q index dependent speed vs quality trade off flags.
Definition: speed_features.h:389