2 * Copyright (c) 2021, Alliance for Open Media. All rights reserved
4 * This source code is subject to the terms of the BSD 2 Clause License and
5 * the Alliance for Open Media Patent License 1.0. If the BSD 2 Clause License
6 * was not distributed with this source code in the LICENSE file, you can
7 * obtain it at www.aomedia.org/license/software. If the Alliance for Open
8 * Media Patent License 1.0 was not distributed with this source code in the
9 * PATENTS file, you can obtain it at www.aomedia.org/license/patent.
11 #ifndef AOM_AOM_AOM_EXTERNAL_PARTITION_H_
12 #define AOM_AOM_AOM_EXTERNAL_PARTITION_H_
14 /*!\defgroup aom_encoder AOMedia AOM/AV1 Encoder
22 * \brief Provides function pointer definitions for the external partition.
25 /*!\brief Current ABI version number
28 * If this file is altered in any way that changes the ABI, this value
29 * must be bumped. Examples include, but are not limited to, changing
30 * types, removing or reassigning enums, adding/removing/rearranging
31 * fields to structures.
33 #define AOM_EXT_PART_ABI_VERSION 8
39 /*!\brief Abstract external partition model handler
41 typedef void *aom_ext_part_model_t
;
43 /*!\brief Number of features to determine whether to skip partition none and
44 * do partition split directly. The same as "FEATURE_SIZE_SMS_SPLIT".
46 #define AOM_EXT_PART_SIZE_DIRECT_SPLIT 17
48 /*!\brief Number of features to use simple motion search to prune out
49 * rectangular partition in some direction. The same as
50 * "FEATURE_SIZE_SMS_PRUNE_PART".
52 #define AOM_EXT_PART_SIZE_PRUNE_PART 25
54 /*!\brief Number of features to prune split and rectangular partition
55 * after PARTITION_NONE.
57 #define AOM_EXT_PART_SIZE_PRUNE_NONE 4
59 /*!\brief Number of features to terminates partition after partition none using
60 * simple_motion_search features and the rate, distortion, and rdcost of
61 * PARTITION_NONE. The same as "FEATURE_SIZE_SMS_TERM_NONE".
63 #define AOM_EXT_PART_SIZE_TERM_NONE 28
65 /*!\brief Number of features to terminates partition after partition split.
67 #define AOM_EXT_PART_SIZE_TERM_SPLIT 31
69 /*!\brief Number of features to prune rectangular partition using stats
70 * collected after partition split.
72 #define AOM_EXT_PART_SIZE_PRUNE_RECT 9
74 /*!\brief Number of features to prune AB partition using stats
75 * collected after rectangular partition..
77 #define AOM_EXT_PART_SIZE_PRUNE_AB 10
79 /*!\brief Number of features to prune 4-way partition using stats
80 * collected after AB partition.
82 #define AOM_EXT_PART_SIZE_PRUNE_4_WAY 18
84 /*!\brief Decision mode of the external partition model.
85 * AOM_EXT_PART_WHOLE_TREE: the external partition model should provide the
86 * whole partition tree for the superblock.
88 * AOM_EXT_PART_RECURSIVE: the external partition model provides the partition
89 * decision of the current block only. The decision process starts from
90 * the superblock size, down to the smallest block size (4x4) recursively.
92 typedef enum aom_ext_part_decision_mode
{
93 AOM_EXT_PART_WHOLE_TREE
= 0,
94 AOM_EXT_PART_RECURSIVE
= 1,
95 } aom_ext_part_decision_mode_t
;
97 /*!\brief Config information sent to the external partition model.
99 * For example, the maximum superblock size determined by the sequence header.
101 typedef struct aom_ext_part_config
{
102 int superblock_size
; ///< super block size (either 64x64 or 128x128)
103 } aom_ext_part_config_t
;
105 /*!\brief Features pass to the external model to make partition decisions.
106 * Specifically, features collected before NONE partition.
107 * Features "f" are used to determine:
108 * partition_none_allowed, partition_horz_allowed, partition_vert_allowed,
109 * do_rectangular_split, do_square_split
110 * Features "f_part2" are used to determine:
111 * prune_horz, prune_vert.
113 typedef struct aom_partition_features_before_none
{
114 /*! features to determine whether skip partition none and do split directly */
115 float f
[AOM_EXT_PART_SIZE_DIRECT_SPLIT
];
116 /*! features to determine whether to prune rectangular partition */
117 float f_part2
[AOM_EXT_PART_SIZE_PRUNE_PART
];
118 } aom_partition_features_before_none_t
;
120 /*!\brief Features pass to the external model to make partition decisions.
121 * Specifically, features collected after NONE partition.
123 typedef struct aom_partition_features_none
{
124 /*! features to prune split and rectangular partition */
125 float f
[AOM_EXT_PART_SIZE_PRUNE_NONE
];
126 /*! features to determine termination of partition */
127 float f_terminate
[AOM_EXT_PART_SIZE_TERM_NONE
];
128 } aom_partition_features_none_t
;
130 /*!\brief Features pass to the external model to make partition decisions.
131 * Specifically, features collected after SPLIT partition.
133 typedef struct aom_partition_features_split
{
134 /*! features to determine termination of partition */
135 float f_terminate
[AOM_EXT_PART_SIZE_TERM_SPLIT
];
136 /*! features to determine pruning rect partition */
137 float f_prune_rect
[AOM_EXT_PART_SIZE_PRUNE_RECT
];
138 } aom_partition_features_split_t
;
140 /*!\brief Features pass to the external model to make partition decisions.
141 * Specifically, features collected after RECTANGULAR partition.
143 typedef struct aom_partition_features_rect
{
144 /*! features to determine pruning AB partition */
145 float f
[AOM_EXT_PART_SIZE_PRUNE_AB
];
146 } aom_partition_features_rect_t
;
148 /*!\brief Features pass to the external model to make partition decisions.
149 * Specifically, features collected after AB partition: HORZ_A, HORZ_B, VERT_A,
152 typedef struct aom_partition_features_ab
{
153 /*! features to determine pruning 4-way partition */
154 float f
[AOM_EXT_PART_SIZE_PRUNE_4_WAY
];
155 } aom_partition_features_ab_t
;
157 /*!\brief Feature id to tell the external model the current stage in partition
158 * pruning and what features to use to make decisions accordingly.
161 AOM_EXT_PART_FEATURE_BEFORE_NONE
,
162 AOM_EXT_PART_FEATURE_BEFORE_NONE_PART2
,
163 AOM_EXT_PART_FEATURE_AFTER_NONE
,
164 AOM_EXT_PART_FEATURE_AFTER_NONE_PART2
,
165 AOM_EXT_PART_FEATURE_AFTER_SPLIT
,
166 AOM_EXT_PART_FEATURE_AFTER_SPLIT_PART2
,
167 AOM_EXT_PART_FEATURE_AFTER_RECT
,
168 AOM_EXT_PART_FEATURE_AFTER_AB
169 } AOM_EXT_PART_FEATURE_ID
;
171 /*!\brief Features collected from the tpl process.
173 * The tpl process collects information that help measure the inter-frame
175 * The tpl process is computed in the unit of tpl_bsize_1d (16x16).
176 * Therefore, the max number of units inside a superblock is
177 * 128x128 / (16x16) = 64. Change it if the tpl process changes.
179 typedef struct aom_sb_tpl_features
{
180 int available
; ///< If tpl stats are available
181 int tpl_unit_length
; ///< The block length of tpl process
182 int num_units
; ///< The number of units inside the current superblock
183 int64_t intra_cost
[64]; ///< The intra cost of each unit
184 int64_t inter_cost
[64]; ///< The inter cost of each unit
185 int64_t mc_dep_cost
[64]; ///< The motion compensated dependency cost
186 } aom_sb_tpl_features_t
;
188 /*!\brief Features collected from the simple motion process.
190 * The simple motion process collects information by applying motion compensated
191 * prediction on each block.
192 * The block size is 16x16, which could be changed. If it is changed, update
193 * comments and the array size here.
195 typedef struct aom_sb_simple_motion_features
{
196 int unit_length
; ///< The block length of the simple motion process
197 int num_units
; ///< The number of units inside the current superblock
198 int block_sse
[64]; ///< Sum of squared error of each unit
199 int block_var
[64]; ///< Variance of each unit
200 } aom_sb_simple_motion_features_t
;
202 /*!\brief Features of each super block.
204 * Features collected for each super block before partition search.
206 typedef struct aom_sb_features
{
207 /*! Features from motion search */
208 aom_sb_simple_motion_features_t motion_features
;
209 /*! Features from tpl process */
210 aom_sb_tpl_features_t tpl_features
;
213 /*!\brief Features pass to the external model to make partition decisions.
215 * The encoder sends these features to the external model through
216 * "func()" defined in .....
218 * NOTE: new member variables may be added to this structure in the future.
219 * Once new features are finalized, bump the major version of libaom.
221 typedef struct aom_partition_features
{
222 // Features for the current supervised multi-stage ML model.
223 /*! Feature ID to indicate active features */
224 AOM_EXT_PART_FEATURE_ID id
;
225 /*! Features collected before NONE partition */
226 aom_partition_features_before_none_t before_part_none
;
227 /*! Features collected after NONE partition */
228 aom_partition_features_none_t after_part_none
;
229 /*! Features collected after SPLIT partition */
230 aom_partition_features_split_t after_part_split
;
231 /*! Features collected after RECTANGULAR partition */
232 aom_partition_features_rect_t after_part_rect
;
233 /*! Features collected after AB partition */
234 aom_partition_features_ab_t after_part_ab
;
236 // Features for a new ML model.
237 aom_sb_features_t sb_features
; ///< Features collected for the super block
238 int mi_row
; ///< Mi_row position of the block
239 int mi_col
; ///< Mi_col position of the block
240 int frame_width
; ///< Frame width
241 int frame_height
; ///< Frame height
242 int block_size
; ///< As "BLOCK_SIZE" in av1/common/enums.h
244 * Valid partition types. A bitmask is used. "1" represents the
245 * corresponding type is vaild. The bitmask follows the enum order for
246 * PARTITION_TYPE in "enums.h" to represent one partition type at a bit.
247 * For example, 0x01 stands for only PARTITION_NONE is valid,
248 * 0x09 (00...001001) stands for PARTITION_NONE and PARTITION_SPLIT are valid.
250 int valid_partition_types
;
251 int update_type
; ///< Frame update type, defined in ratectrl.h
252 int qindex
; ///< Quantization index, range: [0, 255]
253 int rdmult
; ///< Rate-distortion multiplier
254 int pyramid_level
; ///< The level of this frame in the hierarchical structure
255 int has_above_block
; ///< Has above neighbor block
256 int above_block_width
; ///< Width of the above block, -1 if not exist
257 int above_block_height
; ///< Height of the above block, -1 if not exist
258 int has_left_block
; ///< Has left neighbor block
259 int left_block_width
; ///< Width of the left block, -1 if not exist
260 int left_block_height
; ///< Height of the left block, -1 if not exist
262 * The following parameters are collected from applying simple motion search.
263 * Sum of squared error (SSE) and variance of motion compensated residual
264 * are good indicators of block partitioning.
265 * If a block is a square, we also apply motion search for its 4 sub blocks.
266 * If not a square, their values are -1.
267 * If a block is able to split horizontally, we apply motion search and get
268 * stats for horizontal blocks. If not, their values are -1.
269 * If a block is able to split vertically, we apply motion search and get
270 * stats for vertical blocks. If not, their values are -1.
272 unsigned int block_sse
; ///< SSE of motion compensated residual
273 unsigned int block_var
; ///< Variance of motion compensated residual
274 unsigned int sub_block_sse
[4]; ///< SSE of sub blocks.
275 unsigned int sub_block_var
[4]; ///< Variance of sub blocks.
276 unsigned int horz_block_sse
[2]; ///< SSE of horz sub blocks
277 unsigned int horz_block_var
[2]; ///< Variance of horz sub blocks
278 unsigned int vert_block_sse
[2]; ///< SSE of vert sub blocks
279 unsigned int vert_block_var
[2]; ///< Variance of vert sub blocks
281 * The following parameters are calculated from tpl model.
282 * If tpl model is not available, their values are -1.
284 int64_t tpl_intra_cost
; ///< Intra cost, ref to "TplDepStats" in tpl_model.h
285 int64_t tpl_inter_cost
; ///< Inter cost in tpl model
286 int64_t tpl_mc_dep_cost
; ///< Motion compensated dependency cost in tpl model
287 } aom_partition_features_t
;
289 /*!\brief Partition decisions received from the external model.
291 * The encoder receives partition decisions and encodes the superblock
292 * with the given partition type.
293 * The encoder receives it from "func()" define in ....
295 * NOTE: new member variables may be added to this structure in the future.
296 * Once new features are finalized, bump the major version of libaom.
298 typedef struct aom_partition_decision
{
299 // Decisions for directly set partition types
300 int is_final_decision
; ///< The flag whether it's the final decision
301 int num_nodes
; ///< The number of leaf nodes
302 int partition_decision
[2048]; ///< Partition decisions
303 int current_decision
; ///< Partition decision for the current block
305 // Decisions for partition type pruning
306 int terminate_partition_search
; ///< Terminate further partition search
307 int partition_none_allowed
; ///< Allow partition none type
308 int partition_rect_allowed
[2]; ///< Allow rectangular partitions
309 int do_rectangular_split
; ///< Try rectangular split partition
310 int do_square_split
; ///< Try square split partition
311 int prune_rect_part
[2]; ///< Prune rectangular partition
312 int horza_partition_allowed
; ///< Allow HORZ_A partitioin
313 int horzb_partition_allowed
; ///< Allow HORZ_B partitioin
314 int verta_partition_allowed
; ///< Allow VERT_A partitioin
315 int vertb_partition_allowed
; ///< Allow VERT_B partitioin
316 int partition_horz4_allowed
; ///< Allow HORZ4 partition
317 int partition_vert4_allowed
; ///< Allow VERT4 partition
318 } aom_partition_decision_t
;
320 /*!\brief Encoding stats for the given partition decision.
322 * The encoding stats collected by encoding the superblock with the
323 * given partition types.
324 * The encoder sends the stats to the external model for training
325 * or inference though "func()" defined in ....
327 typedef struct aom_partition_stats
{
328 int rate
; ///< Rate cost of the block
329 int64_t dist
; ///< Distortion of the block
330 int64_t rdcost
; ///< Rate-distortion cost of the block
331 } aom_partition_stats_t
;
333 /*!\brief Enum for return status.
335 typedef enum aom_ext_part_status
{
336 AOM_EXT_PART_OK
= 0, ///< Status of success
337 AOM_EXT_PART_ERROR
= 1, ///< Status of failure
338 AOM_EXT_PART_TEST
= 2, ///< Status used for tests
339 } aom_ext_part_status_t
;
341 /*!\brief Callback of creating an external partition model.
343 * The callback is invoked by the encoder to create an external partition
346 * \param[in] priv Callback's private data
347 * \param[in] part_config Config information pointer for model creation
348 * \param[out] ext_part_model Pointer to the model
350 typedef aom_ext_part_status_t (*aom_ext_part_create_model_fn_t
)(
351 void *priv
, const aom_ext_part_config_t
*part_config
,
352 aom_ext_part_model_t
*ext_part_model
);
354 /*!\brief Callback of sending features to the external partition model.
356 * The callback is invoked by the encoder to send features to the external
359 * \param[in] ext_part_model The external model
360 * \param[in] part_features Pointer to the features
362 typedef aom_ext_part_status_t (*aom_ext_part_send_features_fn_t
)(
363 aom_ext_part_model_t ext_part_model
,
364 const aom_partition_features_t
*part_features
);
366 /*!\brief Callback of receiving partition decisions from the external
369 * The callback is invoked by the encoder to receive partition decisions from
370 * the external partition model.
372 * \param[in] ext_part_model The external model
373 * \param[in] ext_part_decision Pointer to the partition decisions
375 typedef aom_ext_part_status_t (*aom_ext_part_get_decision_fn_t
)(
376 aom_ext_part_model_t ext_part_model
,
377 aom_partition_decision_t
*ext_part_decision
);
379 /*!\brief Callback of sending stats to the external partition model.
381 * The callback is invoked by the encoder to send encoding stats to
382 * the external partition model.
384 * \param[in] ext_part_model The external model
385 * \param[in] ext_part_stats Pointer to the encoding stats
387 typedef aom_ext_part_status_t (*aom_ext_part_send_partition_stats_fn_t
)(
388 aom_ext_part_model_t ext_part_model
,
389 const aom_partition_stats_t
*ext_part_stats
);
391 /*!\brief Callback of deleting the external partition model.
393 * The callback is invoked by the encoder to delete the external partition
396 * \param[in] ext_part_model The external model
398 typedef aom_ext_part_status_t (*aom_ext_part_delete_model_fn_t
)(
399 aom_ext_part_model_t ext_part_model
);
401 /*!\brief Callback function set for external partition model.
403 * Uses can enable external partition model by registering a set of
404 * callback functions with the flag: AV1E_SET_EXTERNAL_PARTITION_MODEL
406 typedef struct aom_ext_part_funcs
{
408 * Create an external partition model.
410 aom_ext_part_create_model_fn_t create_model
;
413 * Send features to the external partition model to make partition decisions.
415 aom_ext_part_send_features_fn_t send_features
;
418 * Get partition decisions from the external partition model.
420 aom_ext_part_get_decision_fn_t get_partition_decision
;
423 * Send stats of the current partition to the external model.
425 aom_ext_part_send_partition_stats_fn_t send_partition_stats
;
428 * Delete the external partition model.
430 aom_ext_part_delete_model_fn_t delete_model
;
433 * The decision mode of the model.
435 aom_ext_part_decision_mode_t decision_mode
;
438 * Private data for the external partition model.
441 } aom_ext_part_funcs_t
;
443 /*!@} - end defgroup aom_encoder*/
448 #endif // AOM_AOM_AOM_EXTERNAL_PARTITION_H_