1 /*
2 * Copyright (c) 2016, Alliance for Open Media. All rights reserved.
3 *
4 * This source code is subject to the terms of the BSD 2 Clause License and
5 * the Alliance for Open Media Patent License 1.0. If the BSD 2 Clause License
6 * was not distributed with this source code in the LICENSE file, you can
7 * obtain it at www.aomedia.org/license/software. If the Alliance for Open
8 * Media Patent License 1.0 was not distributed with this source code in the
9 * PATENTS file, you can obtain it at www.aomedia.org/license/patent.
10 */
11
12 /*! \file
13 * Declares various structs used to encode the current partition block.
14 */
15 #ifndef AOM_AV1_ENCODER_BLOCK_H_
16 #define AOM_AV1_ENCODER_BLOCK_H_
17
18 #include "av1/common/blockd.h"
19 #include "av1/common/entropymv.h"
20 #include "av1/common/entropy.h"
21 #include "av1/common/enums.h"
22 #include "av1/common/mvref_common.h"
23
24 #include "av1/encoder/enc_enums.h"
25 #include "av1/encoder/mcomp_structs.h"
26 #if !CONFIG_REALTIME_ONLY
27 #include "av1/encoder/partition_cnn_weights.h"
28 #endif
29
30 #include "av1/encoder/hash_motion.h"
31
32 #ifdef __cplusplus
33 extern "C" {
34 #endif
35
36 //! Minimum linear dimension of a tpl block
37 #define MIN_TPL_BSIZE_1D 16
38 //! Maximum number of tpl block in a super block
39 #define MAX_TPL_BLK_IN_SB (MAX_SB_SIZE / MIN_TPL_BSIZE_1D)
40 //! Number of txfm hash records kept for the partition block.
41 #define RD_RECORD_BUFFER_LEN 8
42
43 /*! Maximum value taken by transform type probabilities */
44 #define MAX_TX_TYPE_PROB 1024
45
46 //! Compute color sensitivity index for given plane
47 #define COLOR_SENS_IDX(plane) ((plane)-1)
48
49 //! Enable timer statistics of mode search in non-rd
50 #define COLLECT_NONRD_PICK_MODE_STAT 0
51
52 /*!\cond */
53 #if COLLECT_NONRD_PICK_MODE_STAT
54 #include "aom_ports/aom_timer.h"
55
56 typedef struct _mode_search_stat_nonrd {
57 int32_t num_blocks[BLOCK_SIZES];
58 int64_t total_block_times[BLOCK_SIZES];
59 int32_t num_searches[BLOCK_SIZES][MB_MODE_COUNT];
60 int32_t num_nonskipped_searches[BLOCK_SIZES][MB_MODE_COUNT];
61 int64_t search_times[BLOCK_SIZES][MB_MODE_COUNT];
62 int64_t nonskipped_search_times[BLOCK_SIZES][MB_MODE_COUNT];
63 int64_t ms_time[BLOCK_SIZES][MB_MODE_COUNT];
64 int64_t ifs_time[BLOCK_SIZES][MB_MODE_COUNT];
65 int64_t model_rd_time[BLOCK_SIZES][MB_MODE_COUNT];
66 int64_t txfm_time[BLOCK_SIZES][MB_MODE_COUNT];
67 struct aom_usec_timer timer1;
68 struct aom_usec_timer timer2;
69 struct aom_usec_timer bsize_timer;
70 } mode_search_stat_nonrd;
71 #endif // COLLECT_NONRD_PICK_MODE_STAT
72 /*!\endcond */
73
74 /*! \brief Superblock level encoder info
75 *
76 * SuperblockEnc stores superblock level information used by the encoder for
77 * more efficient encoding. Currently this is mostly used to store TPL data
78 * for the current superblock.
79 */
80 typedef struct {
81 //! Maximum partition size for the sb.
82 BLOCK_SIZE min_partition_size;
83 //! Minimum partition size for the sb.
84 BLOCK_SIZE max_partition_size;
85
86 /*****************************************************************************
87 * \name TPL Info
88 *
89 * Information gathered from tpl_model at tpl block precision for the
90 * superblock to speed up the encoding process..
91 ****************************************************************************/
92 /**@{*/
93 //! Number of TPL blocks in this superblock.
94 int tpl_data_count;
95 //! TPL's estimate of inter cost for each tpl block.
96 int64_t tpl_inter_cost[MAX_TPL_BLK_IN_SB * MAX_TPL_BLK_IN_SB];
97 //! TPL's estimate of tpl cost for each tpl block.
98 int64_t tpl_intra_cost[MAX_TPL_BLK_IN_SB * MAX_TPL_BLK_IN_SB];
99 //! Motion vectors found by TPL model for each tpl block.
100 int_mv tpl_mv[MAX_TPL_BLK_IN_SB * MAX_TPL_BLK_IN_SB][INTER_REFS_PER_FRAME];
101 //! TPL's stride for the arrays in this struct.
102 int tpl_stride;
103 /**@}*/
104 } SuperBlockEnc;
105
106 /*! \brief Stores the best performing modes.
107 */
108 typedef struct {
109 //! The mbmi used to reconstruct the winner mode.
110 MB_MODE_INFO mbmi;
111 //! Rdstats of the winner mode.
112 RD_STATS rd_cost;
113 //! Rdcost of the winner mode
114 int64_t rd;
115 //! Luma rate of the winner mode.
116 int rate_y;
117 //! Chroma rate of the winner mode.
118 int rate_uv;
119 //! The color map needed to reconstruct palette mode.
120 uint8_t color_index_map[MAX_SB_SQUARE];
121 //! The current winner mode.
122 THR_MODES mode_index;
123 } WinnerModeStats;
124
125 /*! \brief Each source plane of the current macroblock
126 *
127 * This struct also stores the txfm buffers and quantizer settings.
128 */
129 typedef struct macroblock_plane {
130 //! Stores source - pred so the txfm can be computed later
131 int16_t *src_diff;
132 //! Dequantized coefficients
133 tran_low_t *dqcoeff;
134 //! Quantized coefficients
135 tran_low_t *qcoeff;
136 //! Transformed coefficients
137 tran_low_t *coeff;
138 //! Location of the end of qcoeff (end of block).
139 uint16_t *eobs;
140 //! Contexts used to code the transform coefficients.
141 uint8_t *txb_entropy_ctx;
142 //! A buffer containing the source frame.
143 struct buf_2d src;
144
145 /*! \name Quantizer Settings
146 *
147 * \attention These are used/accessed only in the quantization process.
148 * RDO does not and *must not* depend on any of these values.
149 * All values below share the coefficient scale/shift used in TX.
150 */
151 /**@{*/
152 //! Quantization step size used by AV1_XFORM_QUANT_FP.
153 const int16_t *quant_fp_QTX;
154 //! Offset used for rounding in the quantizer process by AV1_XFORM_QUANT_FP.
155 const int16_t *round_fp_QTX;
156 //! Quantization step size used by AV1_XFORM_QUANT_B.
157 const int16_t *quant_QTX;
158 //! Offset used for rounding in the quantizer process by AV1_XFORM_QUANT_B.
159 const int16_t *round_QTX;
160 //! Scale factor to shift coefficients toward zero. Only used by QUANT_B.
161 const int16_t *quant_shift_QTX;
162 //! Size of the quantization bin around 0. Only Used by QUANT_B
163 const int16_t *zbin_QTX;
164 //! Dequantizer
165 const int16_t *dequant_QTX;
166 /**@}*/
167 } MACROBLOCK_PLANE;
168
169 /*! \brief Costs for encoding the coefficients within a level.
170 *
171 * Covers everything including txb_skip, eob, dc_sign,
172 */
173 typedef struct {
174 //! Cost to skip txfm for the current txfm block.
175 int txb_skip_cost[TXB_SKIP_CONTEXTS][2];
176 /*! \brief Cost for encoding the base_eob of a level.
177 *
178 * Decoder uses base_eob to derive the base_level as base_eob := base_eob+1.
179 */
180 int base_eob_cost[SIG_COEF_CONTEXTS_EOB][3];
181 /*! \brief Cost for encoding the base level of a coefficient.
182 *
183 * Decoder derives coeff_base as coeff_base := base_eob + 1.
184 */
185 int base_cost[SIG_COEF_CONTEXTS][8];
186 /*! \brief Cost for encoding the last non-zero coefficient.
187 *
188 * Eob is derived from eob_extra at the decoder as eob := eob_extra + 1
189 */
190 int eob_extra_cost[EOB_COEF_CONTEXTS][2];
191 //! Cost for encoding the dc_sign
192 int dc_sign_cost[DC_SIGN_CONTEXTS][2];
193 //! Cost for encoding an increment to the coefficient
194 int lps_cost[LEVEL_CONTEXTS][COEFF_BASE_RANGE + 1 + COEFF_BASE_RANGE + 1];
195 } LV_MAP_COEFF_COST;
196
197 /*! \brief Costs for encoding the eob.
198 */
199 typedef struct {
200 //! eob_cost.
201 int eob_cost[2][11];
202 } LV_MAP_EOB_COST;
203
204 /*! \brief Stores the transforms coefficients for the whole superblock.
205 */
206 typedef struct {
207 //! The transformed coefficients.
208 tran_low_t *tcoeff[MAX_MB_PLANE];
209 //! Where the transformed coefficients end.
210 uint16_t *eobs[MAX_MB_PLANE];
211 /*! \brief Transform block entropy contexts.
212 *
213 * Each element is used as a bit field.
214 * - Bits 0~3: txb_skip_ctx
215 * - Bits 4~5: dc_sign_ctx.
216 */
217 uint8_t *entropy_ctx[MAX_MB_PLANE];
218 } CB_COEFF_BUFFER;
219
220 /*! \brief Extended mode info derived from mbmi.
221 */
222 typedef struct {
223 // TODO(angiebird): Reduce the buffer size according to sb_type
224 //! The reference mv list for the current block.
225 CANDIDATE_MV ref_mv_stack[MODE_CTX_REF_FRAMES][USABLE_REF_MV_STACK_SIZE];
226 //! The weights used to compute the ref mvs.
227 uint16_t weight[MODE_CTX_REF_FRAMES][USABLE_REF_MV_STACK_SIZE];
228 //! Number of ref mvs in the drl.
229 uint8_t ref_mv_count[MODE_CTX_REF_FRAMES];
230 //! Global mvs
231 int_mv global_mvs[REF_FRAMES];
232 //! Context used to encode the current mode.
233 int16_t mode_context[MODE_CTX_REF_FRAMES];
234 } MB_MODE_INFO_EXT;
235
236 /*! \brief Stores best extended mode information at frame level.
237 *
238 * The frame level in here is used in bitstream preparation stage. The
239 * information in \ref MB_MODE_INFO_EXT are copied to this struct to save
240 * memory.
241 */
242 typedef struct {
243 //! \copydoc MB_MODE_INFO_EXT::ref_mv_stack
244 CANDIDATE_MV ref_mv_stack[USABLE_REF_MV_STACK_SIZE];
245 //! \copydoc MB_MODE_INFO_EXT::weight
246 uint16_t weight[USABLE_REF_MV_STACK_SIZE];
247 //! \copydoc MB_MODE_INFO_EXT::ref_mv_count
248 uint8_t ref_mv_count;
249 // TODO(Ravi/Remya): Reduce the buffer size of global_mvs
250 //! \copydoc MB_MODE_INFO_EXT::global_mvs
251 int_mv global_mvs[REF_FRAMES];
252 //! \copydoc MB_MODE_INFO_EXT::mode_context
253 int16_t mode_context;
254 //! Offset of current coding block's coeff buffer relative to the sb.
255 uint16_t cb_offset[PLANE_TYPES];
256 } MB_MODE_INFO_EXT_FRAME;
257
258 /*! \brief Inter-mode txfm results for a partition block.
259 */
260 typedef struct {
261 //! Txfm size used if the current mode is intra mode.
262 TX_SIZE tx_size;
263 //! Txfm sizes used if the current mode is inter mode.
264 TX_SIZE inter_tx_size[INTER_TX_SIZE_BUF_LEN];
265 //! Map showing which txfm block skips the txfm process.
266 uint8_t blk_skip[MAX_MIB_SIZE * MAX_MIB_SIZE];
267 //! Map showing the txfm types for each block.
268 uint8_t tx_type_map[MAX_MIB_SIZE * MAX_MIB_SIZE];
269 //! Rd_stats for the whole partition block.
270 RD_STATS rd_stats;
271 //! Hash value of the current record.
272 uint32_t hash_value;
273 } MB_RD_INFO;
274
275 /*! \brief Hash records of the inter-mode transform results
276 *
277 * Hash records of the inter-mode transform results for a whole partition block
278 * based on the residue. Since this operates on the partition block level, this
279 * can give us a whole txfm partition tree.
280 */
281 typedef struct {
282 /*! Circular buffer that stores the inter-mode txfm results of a partition
283 * block.
284 */
285 MB_RD_INFO mb_rd_info[RD_RECORD_BUFFER_LEN];
286 //! Index to insert the newest rd record.
287 int index_start;
288 //! Number of info stored in this record.
289 int num;
290 //! Hash function
291 CRC32C crc_calculator;
292 } MB_RD_RECORD;
293
294 //! Number of compound rd stats
295 #define MAX_COMP_RD_STATS 64
296 /*! \brief Rdcost stats in compound mode.
297 */
298 typedef struct {
299 //! Rate of the compound modes.
300 int32_t rate[COMPOUND_TYPES];
301 //! Distortion of the compound modes.
302 int64_t dist[COMPOUND_TYPES];
303 //! Estimated rate of the compound modes.
304 int32_t model_rate[COMPOUND_TYPES];
305 //! Estimated distortion of the compound modes.
306 int64_t model_dist[COMPOUND_TYPES];
307 //! Rate need to send the mask type.
308 int comp_rs2[COMPOUND_TYPES];
309 //! Motion vector for each predictor.
310 int_mv mv[2];
311 //! Ref frame for each predictor.
312 MV_REFERENCE_FRAME ref_frames[2];
313 //! Current prediction mode.
314 PREDICTION_MODE mode;
315 //! Current interpolation filter.
316 int_interpfilters filter;
317 //! Refmv index in the drl.
318 int ref_mv_idx;
319 //! Whether the predictors are GLOBALMV.
320 int is_global[2];
321 //! Current parameters for interinter mode.
322 INTERINTER_COMPOUND_DATA interinter_comp;
323 } COMP_RD_STATS;
324
325 /*! \brief Contains buffers used to speed up rdopt for obmc.
326 *
327 * See the comments for calc_target_weighted_pred for details.
328 */
329 typedef struct {
330 /*! \brief A new source weighted with the above and left predictors.
331 *
332 * Used to efficiently construct multiple obmc predictors during rdopt.
333 */
334 int32_t *wsrc;
335 /*! \brief A new mask constructed from the original horz/vert mask.
336 *
337 * \copydetails wsrc
338 */
339 int32_t *mask;
340 /*! \brief Prediction from the up predictor.
341 *
342 * Used to build the obmc predictor.
343 */
344 uint8_t *above_pred;
345 /*! \brief Prediction from the up predictor.
346 *
347 * \copydetails above_pred
348 */
349 uint8_t *left_pred;
350 } OBMCBuffer;
351
352 /*! \brief Contains color maps used in palette mode.
353 */
354 typedef struct {
355 //! The best color map found.
356 uint8_t best_palette_color_map[MAX_PALETTE_SQUARE];
357 //! A temporary buffer used for k-means clustering.
358 int16_t kmeans_data_buf[2 * MAX_PALETTE_SQUARE];
359 } PALETTE_BUFFER;
360
361 /*! \brief Contains buffers used by av1_compound_type_rd()
362 *
363 * For sizes and alignment of these arrays, refer to
364 * alloc_compound_type_rd_buffers() function.
365 */
366 typedef struct {
367 //! First prediction.
368 uint8_t *pred0;
369 //! Second prediction.
370 uint8_t *pred1;
371 //! Source - first prediction.
372 int16_t *residual1;
373 //! Second prediction - first prediction.
374 int16_t *diff10;
375 //! Backup of the best segmentation mask.
376 uint8_t *tmp_best_mask_buf;
377 } CompoundTypeRdBuffers;
378
379 /*! \brief Holds some parameters related to partitioning schemes in AV1.
380 */
381 // TODO([email protected]): Consolidate this with SIMPLE_MOTION_DATA_TREE
382 typedef struct {
383 #if !CONFIG_REALTIME_ONLY
384 // The following 4 parameters are used for cnn-based partitioning on intra
385 // frame.
386 /*! \brief Current index on the partition block quad tree.
387 *
388 * Used to index into the cnn buffer for partition decision.
389 */
390 int quad_tree_idx;
391 //! Whether the CNN buffer contains valid output.
392 int cnn_output_valid;
393 //! A buffer used by our segmentation CNN for intra-frame partitioning.
394 float cnn_buffer[CNN_OUT_BUF_SIZE];
395 //! log of the quantization parameter of the ancestor BLOCK_64X64.
396 float log_q;
397 #endif
398
399 /*! \brief Variance of the subblocks in the superblock.
400 *
401 * This is used by rt mode for variance based partitioning.
402 * The indices corresponds to the following block sizes:
403 * - 0 - 128x128
404 * - 1-2 - 128x64
405 * - 3-4 - 64x128
406 * - 5-8 - 64x64
407 * - 9-16 - 64x32
408 * - 17-24 - 32x64
409 * - 25-40 - 32x32
410 * - 41-104 - 16x16
411 */
412 uint8_t variance_low[105];
413 } PartitionSearchInfo;
414
415 /*!\cond */
416 enum {
417 /**
418 * Do not prune transform depths.
419 */
420 TX_PRUNE_NONE = 0,
421 /**
422 * Prune largest transform (depth 0) based on NN model.
423 */
424 TX_PRUNE_LARGEST = 1,
425 /**
426 * Prune split transforms (depth>=1) based on NN model.
427 */
428 TX_PRUNE_SPLIT = 2,
429 } UENUM1BYTE(TX_PRUNE_TYPE);
430 /*!\endcond */
431
432 /*! \brief Defines the parameters used to perform txfm search.
433 *
434 * For the most part, this determines how various speed features are used.
435 */
436 typedef struct {
437 /*! \brief Whether to limit the intra txfm search type to the default txfm.
438 *
439 * This could either be a result of either sequence parameter or speed
440 * features.
441 */
442 int use_default_intra_tx_type;
443
444 /*! Probability threshold used for conditionally forcing tx type*/
445 int default_inter_tx_type_prob_thresh;
446
447 //! Whether to prune 2d transforms based on 1d transform results.
448 int prune_2d_txfm_mode;
449
450 /*! \brief Variable from \ref WinnerModeParams based on current eval mode.
451 *
452 * See the documentation for \ref WinnerModeParams for more detail.
453 */
454 unsigned int coeff_opt_thresholds[2];
455 /*! \copydoc coeff_opt_thresholds */
456 unsigned int tx_domain_dist_threshold;
457 /*! \copydoc coeff_opt_thresholds */
458 TX_SIZE_SEARCH_METHOD tx_size_search_method;
459 /*! \copydoc coeff_opt_thresholds */
460 unsigned int use_transform_domain_distortion;
461 /*! \copydoc coeff_opt_thresholds */
462 unsigned int skip_txfm_level;
463
464 /*! \brief How to search for the optimal tx_size
465 *
466 * If ONLY_4X4, use TX_4X4; if TX_MODE_LARGEST, use the largest tx_size for
467 * the current partition block; if TX_MODE_SELECT, search through the whole
468 * tree.
469 *
470 * \attention
471 * Although this looks suspicious similar to a bitstream element, this
472 * tx_mode_search_type is only used internally by the encoder, and is *not*
473 * written to the bitstream. It determines what kind of tx_mode would be
474 * searched. For example, we might set it to TX_MODE_LARGEST to find a good
475 * candidate, then code it as TX_MODE_SELECT.
476 */
477 TX_MODE tx_mode_search_type;
478
479 /*!
480 * Determines whether a block can be predicted as transform skip or DC only
481 * based on residual mean and variance.
482 * Type 0 : No skip block or DC only block prediction
483 * Type 1 : Prediction of skip block based on residual mean and variance
484 * Type 2 : Prediction of skip block or DC only block based on residual mean
485 * and variance
486 */
487 unsigned int predict_dc_level;
488
489 /*!
490 * Whether or not we should use the quantization matrix as weights for PSNR
491 * during RD search.
492 */
493 int use_qm_dist_metric;
494
495 /*!
496 * Keep track of previous mode evaluation stage type. This will be used to
497 * reset mb rd hash record when mode evaluation type changes.
498 */
499 int mode_eval_type;
500
501 #if !CONFIG_REALTIME_ONLY
502 //! Indicates the transform depths for which RD evaluation is skipped.
503 TX_PRUNE_TYPE nn_prune_depths_for_intra_tx;
504
505 /*! \brief Indicates if NN model should be invoked to prune transform depths.
506 *
507 * Used to signal whether NN model should be evaluated to prune the R-D
508 * evaluation of specific transform depths.
509 */
510 bool enable_nn_prune_intra_tx_depths;
511 #endif
512 } TxfmSearchParams;
513
514 /*!\cond */
515 #define MAX_NUM_8X8_TXBS ((MAX_MIB_SIZE >> 1) * (MAX_MIB_SIZE >> 1))
516 #define MAX_NUM_16X16_TXBS ((MAX_MIB_SIZE >> 2) * (MAX_MIB_SIZE >> 2))
517 #define MAX_NUM_32X32_TXBS ((MAX_MIB_SIZE >> 3) * (MAX_MIB_SIZE >> 3))
518 #define MAX_NUM_64X64_TXBS ((MAX_MIB_SIZE >> 4) * (MAX_MIB_SIZE >> 4))
519 /*!\endcond */
520
521 /*! \brief Stores various encoding/search decisions related to txfm search.
522 *
523 * This struct contains a cache of previous txfm results, and some buffers for
524 * the current txfm decision.
525 */
526 typedef struct {
527 //! Whether to skip transform and quantization on a partition block level.
528 uint8_t skip_txfm;
529
530 /*! \brief Whether to skip transform and quantization on a txfm block level.
531 *
532 * Skips transform and quantization on a transform block level inside the
533 * current partition block. Each element of this array is used as a bit-field.
534 * So for example, the we are skipping on the luma plane, then the last bit
535 * would be set to 1.
536 */
537 uint8_t blk_skip[MAX_MIB_SIZE * MAX_MIB_SIZE];
538
539 /*! \brief Transform types inside the partition block
540 *
541 * Keeps a record of what kind of transform to use for each of the transform
542 * block inside the partition block.
543 * \attention The buffer here is *never* directly used. Instead, this just
544 * allocates the memory for MACROBLOCKD::tx_type_map during rdopt on the
545 * partition block. So if we need to save memory, we could move the allocation
546 * to pick_sb_mode instead.
547 */
548 uint8_t tx_type_map_[MAX_MIB_SIZE * MAX_MIB_SIZE];
549
550 //! Txfm hash records of inter-modes.
551 MB_RD_RECORD *mb_rd_record;
552
553 /*! \brief Number of txb splits.
554 *
555 * Keep track of how many times we've used split tx partition for transform
556 * blocks. Somewhat misleadingly, this parameter doesn't actually keep track
557 * of the count of the current block. Instead, it's a cumulative count across
558 * of the whole frame. The main usage is that if txb_split_count is zero, then
559 * we can signal TX_MODE_LARGEST at frame level.
560 */
561 // TODO([email protected]): Move this to a more appropriate location such
562 // as ThreadData.
563 unsigned int txb_split_count;
564 #if CONFIG_SPEED_STATS
565 //! For debugging. Used to check how many txfm searches we are doing.
566 unsigned int tx_search_count;
567 #endif // CONFIG_SPEED_STATS
568 } TxfmSearchInfo;
569 #undef MAX_NUM_8X8_TXBS
570 #undef MAX_NUM_16X16_TXBS
571 #undef MAX_NUM_32X32_TXBS
572 #undef MAX_NUM_64X64_TXBS
573
574 /*! \brief Holds the entropy costs for various modes sent to the bitstream.
575 *
576 * \attention This does not include the costs for mv and transformed
577 * coefficients.
578 */
579 typedef struct {
580 /*****************************************************************************
581 * \name Partition Costs
582 ****************************************************************************/
583 /**@{*/
584 //! Cost for coding the partition.
585 int partition_cost[PARTITION_CONTEXTS][EXT_PARTITION_TYPES];
586 /**@}*/
587
588 /*****************************************************************************
589 * \name Intra Costs: General
590 ****************************************************************************/
591 /**@{*/
592 //! Luma mode cost for inter frame.
593 int mbmode_cost[BLOCK_SIZE_GROUPS][INTRA_MODES];
594 //! Luma mode cost for intra frame.
595 int y_mode_costs[INTRA_MODES][INTRA_MODES][INTRA_MODES];
596 //! Chroma mode cost
597 int intra_uv_mode_cost[CFL_ALLOWED_TYPES][INTRA_MODES][UV_INTRA_MODES];
598 //! filter_intra_cost
599 int filter_intra_cost[BLOCK_SIZES_ALL][2];
600 //! filter_intra_mode_cost
601 int filter_intra_mode_cost[FILTER_INTRA_MODES];
602 //! angle_delta_cost
603 int angle_delta_cost[DIRECTIONAL_MODES][2 * MAX_ANGLE_DELTA + 1];
604
605 //! Rate rate associated with each alpha codeword
606 int cfl_cost[CFL_JOINT_SIGNS][CFL_PRED_PLANES][CFL_ALPHABET_SIZE];
607 /**@}*/
608
609 /*****************************************************************************
610 * \name Intra Costs: Screen Contents
611 ****************************************************************************/
612 /**@{*/
613 //! intrabc_cost
614 int intrabc_cost[2];
615
616 //! palette_y_size_cost
617 int palette_y_size_cost[PALATTE_BSIZE_CTXS][PALETTE_SIZES];
618 //! palette_uv_size_cost
619 int palette_uv_size_cost[PALATTE_BSIZE_CTXS][PALETTE_SIZES];
620 //! palette_y_color_cost
621 int palette_y_color_cost[PALETTE_SIZES][PALETTE_COLOR_INDEX_CONTEXTS]
622 [PALETTE_COLORS];
623 //! palette_uv_color_cost
624 int palette_uv_color_cost[PALETTE_SIZES][PALETTE_COLOR_INDEX_CONTEXTS]
625 [PALETTE_COLORS];
626 //! palette_y_mode_cost
627 int palette_y_mode_cost[PALATTE_BSIZE_CTXS][PALETTE_Y_MODE_CONTEXTS][2];
628 //! palette_uv_mode_cost
629 int palette_uv_mode_cost[PALETTE_UV_MODE_CONTEXTS][2];
630 /**@}*/
631
632 /*****************************************************************************
633 * \name Inter Costs: MV Modes
634 ****************************************************************************/
635 /**@{*/
636 //! skip_mode_cost
637 int skip_mode_cost[SKIP_MODE_CONTEXTS][2];
638 //! newmv_mode_cost
639 int newmv_mode_cost[NEWMV_MODE_CONTEXTS][2];
640 //! zeromv_mode_cost
641 int zeromv_mode_cost[GLOBALMV_MODE_CONTEXTS][2];
642 //! refmv_mode_cost
643 int refmv_mode_cost[REFMV_MODE_CONTEXTS][2];
644 //! drl_mode_cost0
645 int drl_mode_cost0[DRL_MODE_CONTEXTS][2];
646 /**@}*/
647
648 /*****************************************************************************
649 * \name Inter Costs: Ref Frame Types
650 ****************************************************************************/
651 /**@{*/
652 //! single_ref_cost
653 int single_ref_cost[REF_CONTEXTS][SINGLE_REFS - 1][2];
654 //! comp_inter_cost
655 int comp_inter_cost[COMP_INTER_CONTEXTS][2];
656 //! comp_ref_type_cost
657 int comp_ref_type_cost[COMP_REF_TYPE_CONTEXTS]
658 [CDF_SIZE(COMP_REFERENCE_TYPES)];
659 //! uni_comp_ref_cost
660 int uni_comp_ref_cost[UNI_COMP_REF_CONTEXTS][UNIDIR_COMP_REFS - 1]
661 [CDF_SIZE(2)];
662 /*! \brief Cost for signaling ref_frame[0] in bidir-comp mode
663 *
664 * Includes LAST_FRAME, LAST2_FRAME, LAST3_FRAME, and GOLDEN_FRAME.
665 */
666 int comp_ref_cost[REF_CONTEXTS][FWD_REFS - 1][2];
667 /*! \brief Cost for signaling ref_frame[1] in bidir-comp mode
668 *
669 * Includes ALTREF_FRAME, ALTREF2_FRAME, and BWDREF_FRAME.
670 */
671 int comp_bwdref_cost[REF_CONTEXTS][BWD_REFS - 1][2];
672 /**@}*/
673
674 /*****************************************************************************
675 * \name Inter Costs: Compound Types
676 ****************************************************************************/
677 /**@{*/
678 //! intra_inter_cost
679 int intra_inter_cost[INTRA_INTER_CONTEXTS][2];
680 //! inter_compound_mode_cost
681 int inter_compound_mode_cost[INTER_MODE_CONTEXTS][INTER_COMPOUND_MODES];
682 //! compound_type_cost
683 int compound_type_cost[BLOCK_SIZES_ALL][MASKED_COMPOUND_TYPES];
684 //! wedge_idx_cost
685 int wedge_idx_cost[BLOCK_SIZES_ALL][16];
686 //! interintra_cost
687 int interintra_cost[BLOCK_SIZE_GROUPS][2];
688 //! wedge_interintra_cost
689 int wedge_interintra_cost[BLOCK_SIZES_ALL][2];
690 //! interintra_mode_cost
691 int interintra_mode_cost[BLOCK_SIZE_GROUPS][INTERINTRA_MODES];
692 /**@}*/
693
694 /*****************************************************************************
695 * \name Inter Costs: Compound Masks
696 ****************************************************************************/
697 /**@{*/
698 //! comp_idx_cost
699 int comp_idx_cost[COMP_INDEX_CONTEXTS][2];
700 //! comp_group_idx_cost
701 int comp_group_idx_cost[COMP_GROUP_IDX_CONTEXTS][2];
702 /**@}*/
703
704 /*****************************************************************************
705 * \name Inter Costs: Motion Modes/Filters
706 ****************************************************************************/
707 /**@{*/
708 //! motion_mode_cost
709 int motion_mode_cost[BLOCK_SIZES_ALL][MOTION_MODES];
710 //! motion_mode_cost1
711 int motion_mode_cost1[BLOCK_SIZES_ALL][2];
712 //! switchable_interp_costs
713 int switchable_interp_costs[SWITCHABLE_FILTER_CONTEXTS][SWITCHABLE_FILTERS];
714 /**@}*/
715
716 /*****************************************************************************
717 * \name Txfm Mode Costs
718 ****************************************************************************/
719 /**@{*/
720 //! skip_txfm_cost
721 int skip_txfm_cost[SKIP_CONTEXTS][2];
722 //! tx_size_cost
723 int tx_size_cost[TX_SIZES - 1][TX_SIZE_CONTEXTS][TX_SIZES];
724 //! txfm_partition_cost
725 int txfm_partition_cost[TXFM_PARTITION_CONTEXTS][2];
726 //! inter_tx_type_costs
727 int inter_tx_type_costs[EXT_TX_SETS_INTER][EXT_TX_SIZES][TX_TYPES];
728 //! intra_tx_type_costs
729 int intra_tx_type_costs[EXT_TX_SETS_INTRA][EXT_TX_SIZES][INTRA_MODES]
730 [TX_TYPES];
731 /**@}*/
732
733 /*****************************************************************************
734 * \name Restoration Mode Costs
735 ****************************************************************************/
736 /**@{*/
737 //! switchable_restore_cost
738 int switchable_restore_cost[RESTORE_SWITCHABLE_TYPES];
739 //! wiener_restore_cost
740 int wiener_restore_cost[2];
741 //! sgrproj_restore_cost
742 int sgrproj_restore_cost[2];
743 /**@}*/
744
745 /*****************************************************************************
746 * \name Segmentation Mode Costs
747 ****************************************************************************/
748 /**@{*/
749 //! tmp_pred_cost
750 int tmp_pred_cost[SEG_TEMPORAL_PRED_CTXS][2];
751 //! spatial_pred_cost
752 int spatial_pred_cost[SPATIAL_PREDICTION_PROBS][MAX_SEGMENTS];
753 /**@}*/
754 } ModeCosts;
755
756 /*! \brief Holds mv costs for encoding and motion search.
757 */
758 typedef struct {
759 /*****************************************************************************
760 * \name Encoding Costs
761 * Here are the entropy costs needed to encode a given mv.
762 * \ref nmv_cost_alloc and \ref nmv_cost_hp_alloc are two arrays that holds
763 * the memory for holding the mv cost. But since the motion vectors can be
764 * negative, we shift them to the middle and store the resulting pointer in
765 * \ref nmv_cost and \ref nmv_cost_hp for easier referencing. Finally, \ref
766 * mv_cost_stack points to the \ref nmv_cost with the mv precision we are
767 * currently working with. In essence, only \ref mv_cost_stack is needed for
768 * motion search, the other can be considered private.
769 ****************************************************************************/
770 /**@{*/
771 //! Costs for coding the zero components.
772 int nmv_joint_cost[MV_JOINTS];
773
774 //! Allocates memory for 1/4-pel motion vector costs.
775 int nmv_cost_alloc[2][MV_VALS];
776 //! Allocates memory for 1/8-pel motion vector costs.
777 int nmv_cost_hp_alloc[2][MV_VALS];
778 //! Points to the middle of \ref nmv_cost_alloc
779 int *nmv_cost[2];
780 //! Points to the middle of \ref nmv_cost_hp_alloc
781 int *nmv_cost_hp[2];
782 //! Points to the nmv_cost_hp in use.
783 int **mv_cost_stack;
784 /**@}*/
785 } MvCosts;
786
787 /*! \brief Holds mv costs for intrabc.
788 */
789 typedef struct {
790 /*! Costs for coding the joint mv. */
791 int joint_mv[MV_JOINTS];
792
793 /*! \brief Cost of transmitting the actual motion vector.
794 * dv_costs_alloc[0][i] is the cost of motion vector with horizontal
795 * component (mv_row) equal to i - MV_MAX. dv_costs_alloc[1][i] is the cost of
796 * motion vector with vertical component (mv_col) equal to i - MV_MAX.
797 */
798 int dv_costs_alloc[2][MV_VALS];
799
800 /*! Points to the middle of \ref dv_costs_alloc. */
801 int *dv_costs[2];
802 } IntraBCMVCosts;
803
804 /*! \brief Holds the costs needed to encode the coefficients
805 */
806 typedef struct {
807 //! Costs for coding the coefficients.
808 LV_MAP_COEFF_COST coeff_costs[TX_SIZES][PLANE_TYPES];
809 //! Costs for coding the eobs.
810 LV_MAP_EOB_COST eob_costs[7][2];
811 } CoeffCosts;
812
813 /*!\cond */
814 // 4: NEAREST, NEW, NEAR, GLOBAL
815 #define SINGLE_REF_MODES ((REF_FRAMES - 1) * 4)
816 /*!\endcond */
817 struct inter_modes_info;
818
819 /*! \brief Holds the motion samples for warp motion model estimation
820 */
821 typedef struct {
822 //! Number of samples.
823 int num;
824 //! Sample locations in current frame.
825 int pts[16];
826 //! Sample location in the reference frame.
827 int pts_inref[16];
828 } WARP_SAMPLE_INFO;
829
830 /*!\cond */
831 typedef enum {
832 kZeroSad = 0,
833 kVeryLowSad = 1,
834 kLowSad = 2,
835 kMedSad = 3,
836 kHighSad = 4
837 } SOURCE_SAD;
838
839 typedef struct {
840 //! SAD levels in non-rd path
841 SOURCE_SAD source_sad_nonrd;
842 //! SAD levels in rd-path for var-based part qindex thresholds
843 SOURCE_SAD source_sad_rd;
844 int lighting_change;
845 int low_sumdiff;
846 } CONTENT_STATE_SB;
847
848 // Structure to hold pixel level gradient info.
849 typedef struct {
850 uint16_t abs_dx_abs_dy_sum;
851 int8_t hist_bin_idx;
852 bool is_dx_zero;
853 } PixelLevelGradientInfo;
854
855 // Structure to hold the variance and log(1 + variance) for 4x4 sub-blocks.
856 typedef struct {
857 double log_var;
858 int var;
859 } Block4x4VarInfo;
860
861 #ifndef NDEBUG
862 typedef struct SetOffsetsLoc {
863 int mi_row;
864 int mi_col;
865 BLOCK_SIZE bsize;
866 } SetOffsetsLoc;
867 #endif // NDEBUG
868
869 /*!\endcond */
870
871 /*! \brief Encoder's parameters related to the current coding block.
872 *
873 * This struct contains most of the information the encoder needs to encode the
874 * current coding block. This includes the src and pred buffer, a copy of the
875 * decoder's view of the current block, the txfm coefficients. This struct also
876 * contains various buffers and data used to speed up the encoding process.
877 */
878 typedef struct macroblock {
879 /*****************************************************************************
880 * \name Source, Buffers and Decoder
881 ****************************************************************************/
882 /**@{*/
883 /*! \brief Each of the encoding plane.
884 *
885 * An array holding the src buffer for each of plane of the current block. It
886 * also contains the txfm and quantized txfm coefficients.
887 */
888 struct macroblock_plane plane[MAX_MB_PLANE];
889
890 /*! \brief Decoder's view of current coding block.
891 *
892 * Contains the encoder's copy of what the decoder sees in the current block.
893 * Most importantly, this struct contains pointers to mbmi that is used in
894 * final bitstream packing.
895 */
896 MACROBLOCKD e_mbd;
897
898 /*! \brief Derived coding information.
899 *
900 * Contains extra information not transmitted in the bitstream but are
901 * derived. For example, this contains the stack of ref_mvs.
902 */
903 MB_MODE_INFO_EXT mbmi_ext;
904
905 /*! \brief Finalized mbmi_ext for the whole frame.
906 *
907 * Contains the finalized info in mbmi_ext that gets used at the frame level
908 * for bitstream packing.
909 */
910 MB_MODE_INFO_EXT_FRAME *mbmi_ext_frame;
911
912 //! Entropy context for the current row.
913 FRAME_CONTEXT *row_ctx;
914 /*! \brief Entropy context for the current tile.
915 *
916 * This context will be used to update color_map_cdf pointer which would be
917 * used during pack bitstream. For single thread and tile-multithreading case
918 * this pointer will be same as xd->tile_ctx, but for the case of row-mt:
919 * xd->tile_ctx will point to a temporary context while tile_pb_ctx will point
920 * to the accurate tile context.
921 */
922 FRAME_CONTEXT *tile_pb_ctx;
923
924 /*! \brief Buffer of transformed coefficients
925 *
926 * Points to cb_coef_buff in the AV1_COMP struct, which contains the finalized
927 * coefficients. This is here to conveniently copy the best coefficients to
928 * frame level for bitstream packing. Since CB_COEFF_BUFFER is allocated on a
929 * superblock level, we need to combine it with cb_offset to get the proper
930 * position for the current coding block.
931 */
932 CB_COEFF_BUFFER *cb_coef_buff;
933 //! Offset of current coding block's coeff buffer relative to the sb.
934 uint16_t cb_offset[PLANE_TYPES];
935
936 //! Modified source and masks used for fast OBMC search.
937 OBMCBuffer obmc_buffer;
938 //! Buffer to store the best palette map.
939 PALETTE_BUFFER *palette_buffer;
940 //! Buffer used for compound_type_rd().
941 CompoundTypeRdBuffers comp_rd_buffer;
942 //! Buffer to store convolution during averaging process in compound mode.
943 CONV_BUF_TYPE *tmp_conv_dst;
944
945 /*! \brief Temporary buffer to hold prediction.
946 *
947 * Points to a buffer that is used to hold temporary prediction results. This
948 * is used in two ways:
949 * - This is a temporary buffer used to ping-pong the prediction in
950 * handle_inter_mode.
951 * - xd->tmp_obmc_bufs also points to this buffer, and is used in ombc
952 * prediction.
953 */
954 uint8_t *tmp_pred_bufs[2];
955 /**@}*/
956
957 /*****************************************************************************
958 * \name Rdopt Costs
959 ****************************************************************************/
960 /**@{*/
961 /*! \brief Quantization index for the current partition block.
962 *
963 * This is used to as the index to find quantization parameter for luma and
964 * chroma transformed coefficients.
965 */
966 int qindex;
967
968 /*! \brief Difference between frame-level qindex and current qindex.
969 *
970 * This is used to track whether a non-zero delta for qindex is used at least
971 * once in the current frame.
972 */
973 int delta_qindex;
974
975 /*! \brief Difference between frame-level qindex and qindex used to
976 * compute rdmult (lambda).
977 *
978 * rdmult_delta_qindex is assigned the same as delta_qindex before qp sweep.
979 * During qp sweep, delta_qindex is changed and used to calculate the actual
980 * quant params, while rdmult_delta_qindex remains the same, and is used to
981 * calculate the rdmult in "set_deltaq_rdmult".
982 */
983 int rdmult_delta_qindex;
984
985 /*! \brief Current qindex (before being adjusted by delta_q_res) used to
986 * derive rdmult_delta_qindex.
987 */
988 int rdmult_cur_qindex;
989
990 /*! \brief Rate-distortion multiplier.
991 *
992 * The rd multiplier used to determine the rate-distortion trade-off. This is
993 * roughly proportional to the inverse of q-index for a given frame, but this
994 * can be manipulated for better rate-control. For example, in tune_ssim
995 * mode, this is scaled by a factor related to the variance of the current
996 * block.
997 */
998 int rdmult;
999
1000 //! Intra only, per sb rd adjustment.
1001 int intra_sb_rdmult_modifier;
1002
1003 //! Superblock level distortion propagation factor.
1004 double rb;
1005
1006 //! Energy in the current source coding block. Used to calculate \ref rdmult
1007 int mb_energy;
1008 //! Energy in the current source superblock. Used to calculate \ref rdmult
1009 int sb_energy_level;
1010
1011 //! The rate needed to signal a mode to the bitstream.
1012 ModeCosts mode_costs;
1013
1014 //! The rate needed to encode a new motion vector to the bitstream and some
1015 //! multipliers for motion search.
1016 MvCosts *mv_costs;
1017
1018 /*! The rate needed to encode a new motion vector to the bitstream in intrabc
1019 * mode.
1020 */
1021 IntraBCMVCosts *dv_costs;
1022
1023 //! The rate needed to signal the txfm coefficients to the bitstream.
1024 CoeffCosts coeff_costs;
1025 /**@}*/
1026
1027 /*****************************************************************************
1028 * \name Rate to Distortion Multipliers
1029 ****************************************************************************/
1030 /**@{*/
1031 //! A multiplier that converts mv cost to l2 error.
1032 int errorperbit;
1033 //! A multiplier that converts mv cost to l1 error.
1034 int sadperbit;
1035 /**@}*/
1036
1037 /******************************************************************************
1038 * \name Segmentation
1039 *****************************************************************************/
1040 /**@{*/
1041 /*! \brief Skip mode for the segment
1042 *
1043 * A syntax element of the segmentation mode. In skip_block mode, all mvs are
1044 * set 0 and all txfms are skipped.
1045 */
1046 int seg_skip_block;
1047
1048 /*! \brief Number of segment 1 blocks
1049 * Actual number of (4x4) blocks that were applied delta-q,
1050 * for segment 1.
1051 */
1052 int actual_num_seg1_blocks;
1053
1054 /*!\brief Number of segment 2 blocks
1055 * Actual number of (4x4) blocks that were applied delta-q,
1056 * for segment 2.
1057 */
1058 int actual_num_seg2_blocks;
1059
1060 /*!\brief Number of zero motion vectors
1061 */
1062 int cnt_zeromv;
1063
1064 /*!\brief Flag to force zeromv-skip at superblock level, for nonrd path.
1065 *
1066 * 0/1 imply zeromv-skip is disabled/enabled. 2 implies that the blocks
1067 * in the superblock may be marked as zeromv-skip at block level.
1068 */
1069 int force_zeromv_skip_for_sb;
1070
1071 /*!\brief Flag to force zeromv-skip at block level, for nonrd path.
1072 */
1073 int force_zeromv_skip_for_blk;
1074
1075 /*! \brief Previous segment id for which qmatrices were updated.
1076 * This is used to bypass setting of qmatrices if no change in qindex.
1077 */
1078 int prev_segment_id;
1079 /**@}*/
1080
1081 /*****************************************************************************
1082 * \name Superblock
1083 ****************************************************************************/
1084 /**@{*/
1085 //! Information on a whole superblock level.
1086 // TODO([email protected]): Refactor this out of macroblock
1087 SuperBlockEnc sb_enc;
1088
1089 /*! \brief Characteristics of the current superblock.
1090 *
1091 * Characteristics like whether the block has high sad, low sad, etc. This is
1092 * only used by av1 realtime mode.
1093 */
1094 CONTENT_STATE_SB content_state_sb;
1095 /**@}*/
1096
1097 /*****************************************************************************
1098 * \name Reference Frame Search
1099 ****************************************************************************/
1100 /**@{*/
1101 /*! \brief Sum absolute distortion of the predicted mv for each ref frame.
1102 *
1103 * This is used to measure how viable a reference frame is.
1104 */
1105 int pred_mv_sad[REF_FRAMES];
1106 /*! \brief The minimum of \ref pred_mv_sad.
1107 *
1108 * Index 0 stores the minimum \ref pred_mv_sad across past reference frames.
1109 * Index 1 stores the minimum \ref pred_mv_sad across future reference frames.
1110 */
1111 int best_pred_mv_sad[2];
1112 //! The sad of the 1st mv ref (nearest).
1113 int pred_mv0_sad[REF_FRAMES];
1114 //! The sad of the 2nd mv ref (near).
1115 int pred_mv1_sad[REF_FRAMES];
1116
1117 /*! \brief Disables certain ref frame pruning based on tpl.
1118 *
1119 * Determines whether a given ref frame is "good" based on data from the TPL
1120 * model. If so, this stops selective_ref frame from pruning the given ref
1121 * frame at block level.
1122 */
1123 uint8_t tpl_keep_ref_frame[REF_FRAMES];
1124
1125 /*! \brief Warp motion samples buffer.
1126 *
1127 * Store the motion samples used for warp motion.
1128 */
1129 WARP_SAMPLE_INFO warp_sample_info[REF_FRAMES];
1130
1131 /*! \brief Reference frames picked by the square subblocks in a superblock.
1132 *
1133 * Keeps track of ref frames that are selected by square partition blocks
1134 * within a superblock, in MI resolution. They can be used to prune ref frames
1135 * for rectangular blocks.
1136 */
1137 int picked_ref_frames_mask[MAX_MIB_SIZE * MAX_MIB_SIZE];
1138
1139 /*! \brief Prune ref frames in real-time mode.
1140 *
1141 * Determines whether to prune reference frames in real-time mode. For the
1142 * most part, this is the same as nonrd_prune_ref_frame_search in
1143 * cpi->sf.rt_sf.nonrd_prune_ref_frame_search, but this can be selectively
1144 * turned off if the only frame available is GOLDEN_FRAME.
1145 */
1146 int nonrd_prune_ref_frame_search;
1147 /**@}*/
1148
1149 /*****************************************************************************
1150 * \name Partition Search
1151 ****************************************************************************/
1152 /**@{*/
1153 //! Stores some partition-search related buffers.
1154 PartitionSearchInfo part_search_info;
1155
1156 /*! \brief Whether to disable some features to force a mode in current block.
1157 *
1158 * In some cases, our speed features can be overly aggressive and remove all
1159 * modes search in the superblock. When this happens, we set
1160 * must_find_valid_partition to 1 to reduce the number of speed features, and
1161 * recode the superblock again.
1162 */
1163 int must_find_valid_partition;
1164 /**@}*/
1165
1166 /*****************************************************************************
1167 * \name Prediction Mode Search
1168 ****************************************************************************/
1169 /**@{*/
1170 /*! \brief Inter skip mode.
1171 *
1172 * Skip mode tries to use the closest forward and backward references for
1173 * inter prediction. Skip here means to skip transmitting the reference
1174 * frames, not to be confused with skip_txfm.
1175 */
1176 int skip_mode;
1177
1178 /*! \brief Factors used for rd-thresholding.
1179 *
1180 * Determines a rd threshold to determine whether to continue searching the
1181 * current mode. If the current best rd is already <= threshold, then we skip
1182 * the current mode.
1183 */
1184 int thresh_freq_fact[BLOCK_SIZES_ALL][MAX_MODES];
1185
1186 /*! \brief Tracks the winner modes in the current coding block.
1187 *
1188 * Winner mode is a two-pass strategy to find the best prediction mode. In the
1189 * first pass, we search the prediction modes with a limited set of txfm
1190 * options, and keep the top modes. These modes are called the winner modes.
1191 * In the second pass, we retry the winner modes with more thorough txfm
1192 * options.
1193 */
1194 WinnerModeStats *winner_mode_stats;
1195 //! Tracks how many winner modes there are.
1196 int winner_mode_count;
1197
1198 /*! \brief The model used for rd-estimation to avoid txfm
1199 *
1200 * These are for inter_mode_rd_model_estimation, which is another two pass
1201 * approach. In this speed feature, we collect data in the first couple frames
1202 * to build an rd model to estimate the rdcost of a prediction model based on
1203 * the residue error. Once enough data is collected, this speed feature uses
1204 * the estimated rdcost to find the most performant prediction mode. Then we
1205 * follow up with a second pass find the best transform for the mode.
1206 * Determines if one would go with reduced complexity transform block
1207 * search model to select prediction modes, or full complexity model
1208 * to select transform kernel.
1209 */
1210 TXFM_RD_MODEL rd_model;
1211
1212 /*! \brief Stores the inter mode information needed to build an rd model.
1213 *
1214 * These are for inter_mode_rd_model_estimation, which is another two pass
1215 * approach. In this speed feature, we collect data in the first couple frames
1216 * to build an rd model to estimate the rdcost of a prediction model based on
1217 * the residue error. Once enough data is collected, this speed feature uses
1218 * the estimated rdcost to find the most performant prediction mode. Then we
1219 * follow up with a second pass find the best transform for the mode.
1220 */
1221 // TODO(any): try to consolidate this speed feature with winner mode
1222 // processing.
1223 struct inter_modes_info *inter_modes_info;
1224
1225 //! How to blend the compound predictions.
1226 uint8_t compound_idx;
1227
1228 //! A caches of results of compound type search so they can be reused later.
1229 COMP_RD_STATS comp_rd_stats[MAX_COMP_RD_STATS];
1230 //! The idx for the latest compound mode in the cache \ref comp_rd_stats.
1231 int comp_rd_stats_idx;
1232
1233 /*! \brief Whether to recompute the luma prediction.
1234 *
1235 * In interpolation search, we can usually skip recalculating the luma
1236 * prediction because it is already calculated by a previous predictor. This
1237 * flag signifies that some modes might have been skipped, so we need to
1238 * rebuild the prediction.
1239 */
1240 int recalc_luma_mc_data;
1241
1242 /*! \brief Data structure to speed up intrabc search.
1243 *
1244 * Contains the hash table, hash function, and buffer used for intrabc.
1245 */
1246 IntraBCHashInfo intrabc_hash_info;
1247
1248 /*! \brief Whether to reuse the mode stored in mb_mode_cache. */
1249 int use_mb_mode_cache;
1250 /*! \brief The mode to reuse during \ref av1_rd_pick_intra_mode_sb and
1251 * \ref av1_rd_pick_inter_mode. */
1252 const MB_MODE_INFO *mb_mode_cache;
1253 /*! \brief Pointer to the buffer which caches gradient information.
1254 *
1255 * Pointer to the array of structures to store gradient information of each
1256 * pixel in a superblock. The buffer constitutes of MAX_SB_SQUARE pixel level
1257 * structures for each of the plane types (PLANE_TYPE_Y and PLANE_TYPE_UV).
1258 */
1259 PixelLevelGradientInfo *pixel_gradient_info;
1260 /*! \brief Flags indicating the availability of cached gradient info. */
1261 bool is_sb_gradient_cached[PLANE_TYPES];
1262
1263 /*! \brief Flag to reuse predicted samples of inter block. */
1264 bool reuse_inter_pred;
1265 /**@}*/
1266
1267 /*****************************************************************************
1268 * \name MV Search
1269 ****************************************************************************/
1270 /**@{*/
1271 /*! \brief Context used to determine the initial step size in motion search.
1272 *
1273 * This context is defined as the \f$l_\inf\f$ norm of the best ref_mvs for
1274 * each frame.
1275 */
1276 unsigned int max_mv_context[REF_FRAMES];
1277
1278 /*! \brief Limit for the range of motion vectors.
1279 *
1280 * These define limits to motion vector components to prevent them from
1281 * extending outside the UMV borders
1282 */
1283 FullMvLimits mv_limits;
1284
1285 /*! \brief Buffer for storing the search site config.
1286 *
1287 * When resize mode or super resolution mode is on, the stride of the
1288 * reference frame does not always match what's specified in \ref
1289 * MotionVectorSearchParams::search_site_cfg. When his happens, we update the
1290 * search_sine_config buffer here and use it for motion search.
1291 */
1292 search_site_config search_site_cfg_buf[NUM_DISTINCT_SEARCH_METHODS];
1293 /**@}*/
1294
1295 /*****************************************************************************
1296 * \name Txfm Search
1297 ****************************************************************************/
1298 /**@{*/
1299 /*! \brief Parameters that control how motion search is done.
1300 *
1301 * Stores various txfm search related parameters such as txfm_type, txfm_size,
1302 * trellis eob search, etc.
1303 */
1304 TxfmSearchParams txfm_search_params;
1305
1306 /*! \brief Results of the txfm searches that have been done.
1307 *
1308 * Caches old txfm search results and keeps the current txfm decisions to
1309 * facilitate rdopt.
1310 */
1311 TxfmSearchInfo txfm_search_info;
1312
1313 /*! \brief Whether there is a strong color activity.
1314 *
1315 * Used in REALTIME coding mode to enhance the visual quality at the boundary
1316 * of moving color objects.
1317 */
1318 uint8_t color_sensitivity_sb[MAX_MB_PLANE - 1];
1319 //! Color sensitivity flag for the superblock for golden reference.
1320 uint8_t color_sensitivity_sb_g[MAX_MB_PLANE - 1];
1321 //! Color sensitivity flag for the superblock for altref reference.
1322 uint8_t color_sensitivity_sb_alt[MAX_MB_PLANE - 1];
1323 //! Color sensitivity flag for the coding block.
1324 uint8_t color_sensitivity[MAX_MB_PLANE - 1];
1325 //! Coding block distortion value for uv/color, minimum over the inter modes.
1326 int64_t min_dist_inter_uv;
1327
1328 //! Threshold on the number of colors for testing palette mode.
1329 int color_palette_thresh;
1330
1331 //! The buffer used by search_tx_type() to swap dqcoeff in macroblockd_plane
1332 // so we can keep dqcoeff of the best tx_type.
1333 tran_low_t *dqcoeff_buf;
1334 /**@}*/
1335
1336 /*****************************************************************************
1337 * \name Misc
1338 ****************************************************************************/
1339 /**@{*/
1340 //! Variance of the source frame.
1341 unsigned int source_variance;
1342 //! Flag to indicate coding block is zero sad.
1343 int block_is_zero_sad;
1344 //! Flag to indicate superblock ME in variance partition is determined to be
1345 // good/reliable, and so the superblock MV will be tested in the
1346 // nonrd_pickmode. This is only used for LAST_FRAME.
1347 int sb_me_partition;
1348 //! Flag to indicate to test the superblock MV for the coding block in the
1349 // nonrd_pickmode.
1350 int sb_me_block;
1351 //! Motion vector from superblock MV derived from int_pro_motion() in
1352 // the variance_partitioning.
1353 int_mv sb_me_mv;
1354 //! Flag to indicate if a fixed partition should be used, only if the
1355 // speed feature rt_sf->use_fast_fixed_part is enabled.
1356 int sb_force_fixed_part;
1357 //! SSE of the current predictor.
1358 unsigned int pred_sse[REF_FRAMES];
1359 //! Prediction for ML based partition.
1360 #if CONFIG_RT_ML_PARTITIONING
1361 DECLARE_ALIGNED(16, uint8_t, est_pred[128 * 128]);
1362 #endif
1363 /**@}*/
1364
1365 /*! \brief NONE partition evaluated for merge.
1366 *
1367 * In variance based partitioning scheme, NONE & SPLIT partitions are
1368 * evaluated to check the SPLIT can be merged as NONE. This flag signifies the
1369 * partition is evaluated in the scheme.
1370 */
1371 int try_merge_partition;
1372
1373 /*! \brief Pointer to buffer which caches sub-block variances in a superblock.
1374 *
1375 * Pointer to the array of structures to store source variance information of
1376 * each 4x4 sub-block in a superblock. Block4x4VarInfo structure is used to
1377 * store source variance and log of source variance of each 4x4 sub-block.
1378 */
1379 Block4x4VarInfo *src_var_info_of_4x4_sub_blocks;
1380 #ifndef NDEBUG
1381 /*! \brief A hash to make sure av1_set_offsets is called */
1382 SetOffsetsLoc last_set_offsets_loc;
1383 #endif // NDEBUG
1384
1385 #if COLLECT_NONRD_PICK_MODE_STAT
1386 mode_search_stat_nonrd ms_stat_nonrd;
1387 #endif // COLLECT_NONRD_PICK_MODE_STAT
1388
1389 /*!\brief Number of pixels in current thread that choose palette mode in the
1390 * fast encoding stage for screen content tool detemination.
1391 */
1392 int palette_pixels;
1393
1394 /*!\brief Pointer to the structure which stores the statistics used by
1395 * sb-level multi-pass encoding.
1396 */
1397 struct SB_FIRST_PASS_STATS *sb_stats_cache;
1398
1399 /*!\brief Pointer to the structure which stores the statistics used by
1400 * first-pass when superblock is searched twice consecutively.
1401 */
1402 struct SB_FIRST_PASS_STATS *sb_fp_stats;
1403
1404 #if CONFIG_PARTITION_SEARCH_ORDER
1405 /*!\brief Pointer to RD_STATS structure to be used in
1406 * av1_rd_partition_search().
1407 */
1408 RD_STATS *rdcost;
1409 #endif // CONFIG_PARTITION_SEARCH_ORDER
1410 } MACROBLOCK;
1411 #undef SINGLE_REF_MODES
1412
1413 /*!\cond */
1414 // Zeroes out 'n_stats' elements in the array x->winner_mode_stats.
1415 // It only zeroes out what is necessary in 'color_index_map' (just the block
1416 // size, not the whole array).
zero_winner_mode_stats(BLOCK_SIZE bsize,int n_stats,WinnerModeStats * stats)1417 static inline void zero_winner_mode_stats(BLOCK_SIZE bsize, int n_stats,
1418 WinnerModeStats *stats) {
1419 // When winner mode stats are not required, the memory allocation is avoided
1420 // for x->winner_mode_stats. The stats pointer will be NULL in such cases.
1421 if (stats == NULL) return;
1422
1423 const int block_height = block_size_high[bsize];
1424 const int block_width = block_size_wide[bsize];
1425 for (int i = 0; i < n_stats; ++i) {
1426 WinnerModeStats *const stat = &stats[i];
1427 memset(&stat->mbmi, 0, sizeof(stat->mbmi));
1428 memset(&stat->rd_cost, 0, sizeof(stat->rd_cost));
1429 memset(&stat->rd, 0, sizeof(stat->rd));
1430 memset(&stat->rate_y, 0, sizeof(stat->rate_y));
1431 memset(&stat->rate_uv, 0, sizeof(stat->rate_uv));
1432 // Do not reset the whole array as it is CPU intensive.
1433 memset(&stat->color_index_map, 0,
1434 block_width * block_height * sizeof(stat->color_index_map[0]));
1435 memset(&stat->mode_index, 0, sizeof(stat->mode_index));
1436 }
1437 }
1438
is_rect_tx_allowed_bsize(BLOCK_SIZE bsize)1439 static inline int is_rect_tx_allowed_bsize(BLOCK_SIZE bsize) {
1440 static const char LUT[BLOCK_SIZES_ALL] = {
1441 0, // BLOCK_4X4
1442 1, // BLOCK_4X8
1443 1, // BLOCK_8X4
1444 0, // BLOCK_8X8
1445 1, // BLOCK_8X16
1446 1, // BLOCK_16X8
1447 0, // BLOCK_16X16
1448 1, // BLOCK_16X32
1449 1, // BLOCK_32X16
1450 0, // BLOCK_32X32
1451 1, // BLOCK_32X64
1452 1, // BLOCK_64X32
1453 0, // BLOCK_64X64
1454 0, // BLOCK_64X128
1455 0, // BLOCK_128X64
1456 0, // BLOCK_128X128
1457 1, // BLOCK_4X16
1458 1, // BLOCK_16X4
1459 1, // BLOCK_8X32
1460 1, // BLOCK_32X8
1461 1, // BLOCK_16X64
1462 1, // BLOCK_64X16
1463 };
1464
1465 return LUT[bsize];
1466 }
1467
is_rect_tx_allowed(const MACROBLOCKD * xd,const MB_MODE_INFO * mbmi)1468 static inline int is_rect_tx_allowed(const MACROBLOCKD *xd,
1469 const MB_MODE_INFO *mbmi) {
1470 return is_rect_tx_allowed_bsize(mbmi->bsize) &&
1471 !xd->lossless[mbmi->segment_id];
1472 }
1473
tx_size_to_depth(TX_SIZE tx_size,BLOCK_SIZE bsize)1474 static inline int tx_size_to_depth(TX_SIZE tx_size, BLOCK_SIZE bsize) {
1475 TX_SIZE ctx_size = max_txsize_rect_lookup[bsize];
1476 int depth = 0;
1477 while (tx_size != ctx_size) {
1478 depth++;
1479 ctx_size = sub_tx_size_map[ctx_size];
1480 assert(depth <= MAX_TX_DEPTH);
1481 }
1482 return depth;
1483 }
1484
set_blk_skip(uint8_t txb_skip[],int plane,int blk_idx,int skip)1485 static inline void set_blk_skip(uint8_t txb_skip[], int plane, int blk_idx,
1486 int skip) {
1487 if (skip)
1488 txb_skip[blk_idx] |= 1UL << plane;
1489 else
1490 txb_skip[blk_idx] &= ~(1UL << plane);
1491 #ifndef NDEBUG
1492 // Set chroma planes to uninitialized states when luma is set to check if
1493 // it will be set later
1494 if (plane == 0) {
1495 txb_skip[blk_idx] |= 1UL << (1 + 4);
1496 txb_skip[blk_idx] |= 1UL << (2 + 4);
1497 }
1498
1499 // Clear the initialization checking bit
1500 txb_skip[blk_idx] &= ~(1UL << (plane + 4));
1501 #endif
1502 }
1503
is_blk_skip(uint8_t * txb_skip,int plane,int blk_idx)1504 static inline int is_blk_skip(uint8_t *txb_skip, int plane, int blk_idx) {
1505 #ifndef NDEBUG
1506 // Check if this is initialized
1507 assert(!(txb_skip[blk_idx] & (1UL << (plane + 4))));
1508
1509 // The magic number is 0x77, this is to test if there is garbage data
1510 assert((txb_skip[blk_idx] & 0x88) == 0);
1511 #endif
1512 return (txb_skip[blk_idx] >> plane) & 1;
1513 }
1514
1515 /*!\endcond */
1516
1517 #ifdef __cplusplus
1518 } // extern "C"
1519 #endif
1520
1521 #endif // AOM_AV1_ENCODER_BLOCK_H_
1522