AOMedia AV1 Codec
encoder.h
Go to the documentation of this file.
1/*
2 * Copyright (c) 2016, Alliance for Open Media. All rights reserved
3 *
4 * This source code is subject to the terms of the BSD 2 Clause License and
5 * the Alliance for Open Media Patent License 1.0. If the BSD 2 Clause License
6 * was not distributed with this source code in the LICENSE file, you can
7 * obtain it at www.aomedia.org/license/software. If the Alliance for Open
8 * Media Patent License 1.0 was not distributed with this source code in the
9 * PATENTS file, you can obtain it at www.aomedia.org/license/patent.
10 */
11
15#ifndef AOM_AV1_ENCODER_ENCODER_H_
16#define AOM_AV1_ENCODER_ENCODER_H_
17
18#include <stdbool.h>
19#include <stdio.h>
20
21#include "config/aom_config.h"
22
23#include "aom/aomcx.h"
24
25#include "av1/common/alloccommon.h"
26#include "av1/common/av1_common_int.h"
27#include "av1/common/blockd.h"
28#include "av1/common/entropymode.h"
29#include "av1/common/enums.h"
30#include "av1/common/reconintra.h"
31#include "av1/common/resize.h"
32#include "av1/common/thread_common.h"
33#include "av1/common/timing.h"
34
35#include "av1/encoder/aq_cyclicrefresh.h"
36#include "av1/encoder/av1_quantize.h"
37#include "av1/encoder/block.h"
38#include "av1/encoder/context_tree.h"
39#include "av1/encoder/encodemb.h"
40#include "av1/encoder/external_partition.h"
41#include "av1/encoder/firstpass.h"
42#include "av1/encoder/global_motion.h"
43#include "av1/encoder/level.h"
45#include "av1/encoder/mcomp.h"
46#include "av1/encoder/pickcdef.h"
47#include "av1/encoder/ratectrl.h"
48#include "av1/encoder/rd.h"
50#include "av1/encoder/svc_layercontext.h"
51#include "av1/encoder/temporal_filter.h"
52#include "av1/encoder/thirdpass.h"
53#include "av1/encoder/tokenize.h"
54#include "av1/encoder/tpl_model.h"
55#include "av1/encoder/av1_noise_estimate.h"
56#include "av1/encoder/bitstream.h"
57
58#if CONFIG_INTERNAL_STATS
59#include "aom_dsp/ssim.h"
60#endif
61#include "aom_dsp/variance.h"
62#if CONFIG_DENOISE
63#include "aom_dsp/noise_model.h"
64#endif
65#if CONFIG_TUNE_VMAF
66#include "av1/encoder/tune_vmaf.h"
67#endif
68#if CONFIG_AV1_TEMPORAL_DENOISING
69#include "av1/encoder/av1_temporal_denoiser.h"
70#endif
71#if CONFIG_TUNE_BUTTERAUGLI
72#include "av1/encoder/tune_butteraugli.h"
73#endif
74
75#include "aom/internal/aom_codec_internal.h"
76#include "aom_util/aom_thread.h"
77
78#ifdef __cplusplus
79extern "C" {
80#endif
81
82// TODO(yunqing, any): Added suppression tag to quiet Doxygen warnings. Need to
83// adjust it while we work on documentation.
// Number of frames required to test for scene cut detection
#define SCENE_CUT_KEY_TEST_INTERVAL 16

// Lookahead index threshold to enable temporal filtering for second arf.
#define TF_LOOKAHEAD_IDX_THR 7

// Tuning constants for HDR / chroma QP handling.
// NOTE(review): the formulas that consume these constants are not visible in
// this header -- confirm their exact meaning at the point of use.
#define HDR_QP_LEVELS 10
#define CHROMA_CB_QP_SCALE 1.04
#define CHROMA_CR_QP_SCALE 1.04
// Parenthesized so the leading minus cannot interact with a neighbouring
// operator when the macro is expanded inside a larger expression.
#define CHROMA_QP_SCALE (-0.46)
#define CHROMA_QP_OFFSET 9.26
#define QP_SCALE_FACTOR 2.0
#define DISABLE_HDR_LUMA_DELTAQ 1
98
// Rational number with an int64 numerator.
// This structure holds a fractional value: num / den.
typedef struct aom_rational64 {
  int64_t num;       // fraction numerator
  int den;           // fraction denominator
} aom_rational64_t;  // alias for struct aom_rational64
105
// Scaling selectors, numbered 0..6.
// NOTE(review): the names presumably spell a numerator/denominator pair
// (e.g. FOURFIVE = 4/5); the ratio each value maps to is not visible here.
enum {
  NORMAL = 0,
  FOURFIVE = 1,
  THREEFIVE = 2,
  THREEFOUR = 3,
  ONEFOUR = 4,
  ONEEIGHT = 5,
  ONETWO = 6
} UENUM1BYTE(AOM_SCALING);
115
// Top-level encoding mode.
enum {
  // Good Quality Fast Encoding. The encoder balances quality with the amount of
  // time it takes to encode the output. Speed setting controls how fast.
  GOOD,
  // Realtime Fast Encoding. Will force some restrictions on bitrate
  // constraints.
  REALTIME,
  // All intra mode. All the frames are coded as intra frames.
  ALLINTRA
} UENUM1BYTE(MODE);
126
// Frame flags. Each enumerator occupies its own bit (bits 0..6), so values can
// be OR-ed together into a single mask.
enum {
  FRAMEFLAGS_KEY = 1 << 0,
  FRAMEFLAGS_GOLDEN = 1 << 1,
  FRAMEFLAGS_BWDREF = 1 << 2,
  // TODO(zoeliu): To determine whether a frame flag is needed for ALTREF2_FRAME
  FRAMEFLAGS_ALTREF = 1 << 3,
  FRAMEFLAGS_INTRAONLY = 1 << 4,
  FRAMEFLAGS_SWITCH = 1 << 5,
  FRAMEFLAGS_ERROR_RESILIENT = 1 << 6,
} UENUM1BYTE(FRAMETYPE_FLAGS);
137
#if CONFIG_FRAME_PARALLEL_ENCODE && CONFIG_FPMT_TEST
// Encode configurations available to the frame-parallel multi-thread test
// build. NUM_FPMT_TEST_ENCODES is the number of configurations and must stay
// last.
enum {
  PARALLEL_ENCODE = 0,
  PARALLEL_SIMULATION_ENCODE,
  NUM_FPMT_TEST_ENCODES
} UENUM1BYTE(FPMT_TEST_ENC_CFG);
#endif  // CONFIG_FRAME_PARALLEL_ENCODE && CONFIG_FPMT_TEST
145// 0 level frames are sometimes used for rate control purposes, but for
146// reference mapping purposes, the minimum level should be 1.
147#define MIN_PYR_LEVEL 1
148static INLINE int get_true_pyr_level(int frame_level, int frame_order,
149 int max_layer_depth) {
150 if (frame_order == 0) {
151 // Keyframe case
152 return MIN_PYR_LEVEL;
153 } else if (frame_level == MAX_ARF_LAYERS) {
154 // Leaves
155 return max_layer_depth;
156 } else if (frame_level == (MAX_ARF_LAYERS + 1)) {
157 // Altrefs
158 return MIN_PYR_LEVEL;
159 }
160 return AOMMAX(MIN_PYR_LEVEL, frame_level);
161}
162
// Adaptive quantization (AQ) mode selector.
enum {
  NO_AQ = 0,
  VARIANCE_AQ = 1,
  COMPLEXITY_AQ = 2,
  CYCLIC_REFRESH_AQ = 3,
  AQ_MODE_COUNT  // This should always be the last member of the enum
} UENUM1BYTE(AQ_MODE);
// Delta-q mode selector.
enum {
  NO_DELTA_Q = 0,
  DELTA_Q_OBJECTIVE = 1,          // Modulation to improve objective quality
  DELTA_Q_PERCEPTUAL = 2,         // Modulation to improve video perceptual quality
  DELTA_Q_PERCEPTUAL_AI = 3,      // Perceptual quality opt for all intra mode
  DELTA_Q_USER_RATING_BASED = 4,  // User rating based delta q mode
  DELTA_Q_HDR = 5,     // QP adjustment based on HDR block pixel average
  DELTA_Q_MODE_COUNT   // This should always be the last member of the enum
} UENUM1BYTE(DELTAQ_MODE);
179
// Frame resize mode selector. RESIZE_MODES is the number of modes and must
// stay last.
enum {
  RESIZE_NONE = 0,     // No frame resizing allowed.
  RESIZE_FIXED = 1,    // All frames are coded at the specified scale.
  RESIZE_RANDOM = 2,   // All frames are coded at a random scale.
  RESIZE_DYNAMIC = 3,  // Frames coded at lower scale based on rate control.
  RESIZE_MODES
} UENUM1BYTE(RESIZE_MODE);
187
// Offsets numbered 0..2, with SS_CFG_TOTAL giving the count.
// NOTE(review): presumably indexes a per-purpose array of subsampling
// configurations (source / lookahead / first-pass) -- confirm at the use site.
enum {
  SS_CFG_SRC = 0,
  SS_CFG_LOOKAHEAD = 1,
  SS_CFG_FPF = 2,
  SS_CFG_TOTAL = 3
} UENUM1BYTE(SS_CFG_OFFSET);
194
// Scene-cut detection mode, chosen from the lag_in_frames ranges noted on each
// enumerator.
enum {
  DISABLE_SCENECUT,        // For LAP, lag_in_frames < 19
  ENABLE_SCENECUT_MODE_1,  // For LAP, lag_in_frames >=19 and < 33
  ENABLE_SCENECUT_MODE_2   // For twopass and LAP - lag_in_frames >=33
} UENUM1BYTE(SCENECUT_MODE);
200
// Upper bound for the VBR corpus complexity setting.
// NOTE(review): presumably bounds RateControlCfg::vbr_corpus_complexity_lap --
// confirm where the range check is performed.
#define MAX_VBR_CORPUS_COMPLEXITY 10000
202
// Encoder modules that can run multi-threaded. Enumerators are numbered from 0;
// NUM_MT_MODULES is the number of modules and must stay last.
typedef enum {
  MOD_FP,           // First pass
  MOD_TF,           // Temporal filtering
  MOD_TPL,          // TPL
  MOD_GME,          // Global motion estimation
  MOD_ENC,          // Encode stage
  MOD_LPF,          // Deblocking loop filter
  MOD_CDEF_SEARCH,  // CDEF search
  MOD_CDEF,         // CDEF frame
  MOD_LR,           // Loop restoration filtering
  MOD_PACK_BS,      // Pack bitstream
  MOD_FRAME_ENC,    // Frame Parallel encode
  NUM_MT_MODULES
} MULTI_THREADED_MODULES;
219
// Cost update granularity. NUM_COST_UPDATE_TYPES is the number of types and
// must stay last.
// NOTE(review): presumably SB = per superblock, SBROW = per superblock row,
// TILE = per tile, OFF = no update -- confirm at the use site.
typedef enum {
  COST_UPD_SB,
  COST_UPD_SBROW,
  COST_UPD_TILE,
  COST_UPD_OFF,
  NUM_COST_UPDATE_TYPES,
} COST_UPDATE_TYPE;
235
// Loop filter control selector.
// NOTE(review): presumably NONE = off, ALL = every frame, REFERENCE =
// reference frames only, SELECTIVELY = decided by the encoder -- confirm.
typedef enum {
  LOOPFILTER_NONE = 0,
  LOOPFILTER_ALL = 1,
  LOOPFILTER_REFERENCE = 2,
  LOOPFILTER_SELECTIVELY = 3,
} LOOPFILTER_CONTROL;
246
250typedef struct {
254 RESIZE_MODE resize_mode;
259 uint8_t resize_scale_denominator;
264 uint8_t resize_kf_scale_denominator;
265} ResizeCfg;
266
270typedef struct {
274 bool enable_rect_partitions;
278 bool enable_ab_partitions;
282 bool enable_1to4_partitions;
287 BLOCK_SIZE min_partition_size;
292 BLOCK_SIZE max_partition_size;
293} PartitionCfg;
294
// Intra-mode tool switches; every field is an independent boolean flag.
// NOTE(review): field meanings are read off the names -- confirm.
typedef struct {
  // Enables the intra edge filter.
  bool enable_intra_edge_filter;
  // Enables filter-intra prediction.
  bool enable_filter_intra;
  // Enables smooth intra prediction modes.
  bool enable_smooth_intra;
  // Enables Paeth intra prediction.
  bool enable_paeth_intra;
  // Enables chroma-from-luma (CfL) intra prediction.
  bool enable_cfl_intra;
  // Enables directional intra prediction modes.
  bool enable_directional_intra;
  // Enables diagonal intra prediction modes.
  bool enable_diagonal_intra;
  // Enables angle deltas for directional intra prediction.
  bool enable_angle_delta;
  // Presumably lets the encoder switch some intra tools off automatically;
  // which tools and under what conditions is not visible here.
  bool auto_intra_tools_off;
} IntraModeCfg;
349
// Transform size/type switches; every field is an independent boolean flag.
// NOTE(review): field meanings are read off the names -- confirm.
typedef struct {
  // Enables 64-length transforms.
  bool enable_tx64;
  // Enables flip and identity transform types.
  bool enable_flip_idtx;
  // Enables rectangular transforms.
  bool enable_rect_tx;
  // Restricts the search to a reduced transform type set.
  bool reduced_tx_type_set;
  // Restricts intra blocks to DCT only.
  bool use_intra_dct_only;
  // Restricts inter blocks to DCT only.
  bool use_inter_dct_only;
  // Restricts intra blocks to the default transform type only.
  bool use_intra_default_tx_only;
  // Enables the transform size search.
  bool enable_tx_size_search;
} TxfmSizeTypeCfg;
391
// Compound prediction switches; every field is an independent boolean flag.
// NOTE(review): field meanings are read off the names -- confirm.
typedef struct {
  // Enables distance-weighted compound.
  bool enable_dist_wtd_comp;
  // Enables masked compound.
  bool enable_masked_comp;
  // Enables smooth inter-intra.
  bool enable_smooth_interintra;
  // Enables difference-weighted compound.
  bool enable_diff_wtd_comp;
  // Enables the inter-inter wedge.
  bool enable_interinter_wedge;
  // Enables the inter-intra wedge.
  bool enable_interintra_wedge;
} CompoundTypeCfg;
422
426typedef struct {
431 int superres_qthresh;
436 int superres_kf_qthresh;
442 uint8_t superres_scale_denominator;
448 uint8_t superres_kf_scale_denominator;
452 aom_superres_mode superres_mode;
456 bool enable_superres;
457} SuperResCfg;
458
// Key-frame and S-frame settings.
// NOTE(review): field meanings are read off the names; units (frames) and the
// sframe_mode values are not visible in this header -- confirm.
typedef struct {
  // Presumably the minimum key-frame interval.
  int key_freq_min;

  // Presumably the maximum key-frame interval.
  int key_freq_max;

  // Key-frame filtering setting; an int, so possibly more than on/off.
  int enable_keyframe_filtering;

  // Presumably the distance between S-frames.
  int sframe_dist;

  // S-frame insertion mode.
  int sframe_mode;

  // Enables automatic key-frame placement.
  bool auto_key;

  // Presumably the distance between forward key frames.
  int fwd_kf_dist;

  // Enables forward key frames.
  bool fwd_kf_enabled;

  // Enables S-frames.
  bool enable_sframe;

  // Enables intra block copy.
  bool enable_intrabc;
} KeyFrameCfg;
516
520typedef struct {
522 // BUFFERING PARAMETERS
529 int64_t starting_buffer_level_ms;
534 int64_t optimal_buffer_level_ms;
539 int64_t maximum_buffer_size_ms;
540
544 int64_t target_bandwidth;
545
550 unsigned int vbr_corpus_complexity_lap;
555 unsigned int max_intra_bitrate_pct;
560 unsigned int max_inter_bitrate_pct;
564 unsigned int gf_cbr_boost_pct;
569 unsigned int min_cr;
573 int drop_frames_water_mark;
579 int under_shoot_pct;
585 int over_shoot_pct;
590 int worst_allowed_q;
595 int best_allowed_q;
599 int cq_level;
604 enum aom_rc_mode mode;
611 int vbrbias;
616 int vbrmin_section;
621 int vbrmax_section;
622} RateControlCfg;
623
// Golden-frame (GF) group settings.
typedef struct {
  // Indicates the number of frames lag before encoding is started.
  int lag_in_frames;
  // Indicates the minimum gf/arf interval to be used.
  int min_gf_interval;
  // Indicates the maximum gf/arf interval to be used.
  int max_gf_interval;
  // Indicates the minimum height for GF group pyramid structure to be used.
  int gf_min_pyr_height;
  // Indicates the maximum height for GF group pyramid structure to be used.
  int gf_max_pyr_height;
  // Indicates if automatic set and use of altref frames should be enabled.
  bool enable_auto_arf;
  // Indicates if automatic set and use of (b)ackward (r)ef (f)rames should be
  // enabled.
  bool enable_auto_brf;
} GFConfig;
642
643typedef struct {
644 // Indicates the number of tile groups.
645 unsigned int num_tile_groups;
646 // Indicates the MTU size for a tile group. If mtu is non-zero,
647 // num_tile_groups is set to DEFAULT_MAX_NUM_TG.
648 unsigned int mtu;
649 // Indicates the number of tile columns in log2.
650 int tile_columns;
651 // Indicates the number of tile rows in log2.
652 int tile_rows;
653 // Indicates the number of widths in the tile_widths[] array.
654 int tile_width_count;
655 // Indicates the number of heights in the tile_heights[] array.
656 int tile_height_count;
657 // Indicates the tile widths, and may be empty.
658 int tile_widths[MAX_TILE_COLS];
659 // Indicates the tile heights, and may be empty.
660 int tile_heights[MAX_TILE_ROWS];
661 // Indicates if large scale tile coding should be used.
662 bool enable_large_scale_tile;
663 // Indicates if single tile decoding mode should be enabled.
664 bool enable_single_tile_decoding;
665 // Indicates if EXT_TILE_DEBUG should be enabled.
666 bool enable_ext_tile_debug;
667} TileConfig;
668
// Frame dimension settings.
typedef struct {
  // Indicates the width of the input frame.
  int width;
  // Indicates the height of the input frame.
  int height;
  // If forced_max_frame_width is non-zero then it is used to force the maximum
  // frame width written in write_sequence_header().
  int forced_max_frame_width;
  // If forced_max_frame_height is non-zero then it is used to force the maximum
  // frame height written in write_sequence_header().
  int forced_max_frame_height;
  // Indicates the frame width after applying both super-resolution and resize
  // to the coded frame.
  int render_width;
  // Indicates the frame height after applying both super-resolution and resize
  // to the coded frame.
  int render_height;
} FrameDimensionCfg;
687
// Motion-mode switches.
typedef struct {
  // Indicates if warped motion should be enabled.
  bool enable_warped_motion;
  // Indicates if warped motion should be evaluated or not.
  bool allow_warped_motion;
  // Indicates if OBMC motion should be enabled.
  bool enable_obmc;
} MotionModeCfg;
696
697typedef struct {
698 // Timing info for each frame.
699 aom_timing_info_t timing_info;
700 // Indicates the number of time units of a decoding clock.
701 uint32_t num_units_in_decoding_tick;
702 // Indicates if decoder model information is present in the coded sequence
703 // header.
704 bool decoder_model_info_present_flag;
705 // Indicates if display model information is present in the coded sequence
706 // header.
707 bool display_model_info_present_flag;
708 // Indicates if timing info for each frame is present.
709 bool timing_info_present;
710} DecoderModelCfg;
711
712typedef struct {
713 // Indicates the update frequency for coeff costs.
714 COST_UPDATE_TYPE coeff;
715 // Indicates the update frequency for mode costs.
716 COST_UPDATE_TYPE mode;
717 // Indicates the update frequency for mv costs.
718 COST_UPDATE_TYPE mv;
719 // Indicates the update frequency for dv costs.
720 COST_UPDATE_TYPE dv;
721} CostUpdateFreq;
722
// Reference frame settings.
typedef struct {
  // Indicates the maximum number of reference frames allowed per frame.
  unsigned int max_reference_frames;
  // Indicates if the reduced set of references should be enabled.
  bool enable_reduced_reference_set;
  // Indicates if one-sided compound should be enabled.
  bool enable_onesided_comp;
} RefFrameCfg;
731
732typedef struct {
733 // Indicates the color space that should be used.
734 aom_color_primaries_t color_primaries;
735 // Indicates the characteristics of transfer function to be used.
736 aom_transfer_characteristics_t transfer_characteristics;
737 // Indicates the matrix coefficients to be used for the transfer function.
738 aom_matrix_coefficients_t matrix_coefficients;
739 // Indicates the chroma 4:2:0 sample position info.
740 aom_chroma_sample_position_t chroma_sample_position;
741 // Indicates if a limited color range or full color range should be used.
742 aom_color_range_t color_range;
743} ColorCfg;
744
// Switches used only by unit tests.
typedef struct {
  // Indicates if extreme motion vector unit test should be enabled or not.
  unsigned int motion_vector_unit_test;
  // Indicates if superblock multipass unit test should be enabled or not.
  unsigned int sb_multipass_unit_test;
} UnitTestCfg;
751
752typedef struct {
753 // Indicates the file path to the VMAF model.
754 const char *vmaf_model_path;
755 // Indicates the path to the film grain parameters.
756 const char *film_grain_table_filename;
757 // Indicates the visual tuning metric.
758 aom_tune_metric tuning;
759 // Indicates if the current content is screen or default type.
760 aom_tune_content content;
761 // Indicates the film grain parameters.
762 int film_grain_test_vector;
763 // Indicates the in-block distortion metric to use.
764 aom_dist_metric dist_metric;
765} TuneCfg;
766
// Properties of the input video.
typedef struct {
  // Indicates the framerate of the input video.
  double init_framerate;
  // Indicates the bit-depth of the input video.
  unsigned int input_bit_depth;
  // Indicates the maximum number of frames to be encoded.
  unsigned int limit;
  // Indicates the chroma subsampling x value.
  unsigned int chroma_subsampling_x;
  // Indicates the chroma subsampling y value.
  unsigned int chroma_subsampling_y;
} InputCfg;
779
780typedef struct {
781 // If true, encoder will use fixed QP offsets, that are either:
782 // - Given by the user, and stored in 'fixed_qp_offsets' array, OR
783 // - Picked automatically from cq_level.
784 int use_fixed_qp_offsets;
785 // Indicates the minimum flatness of the quantization matrix.
786 int qm_minlevel;
787 // Indicates the maximum flatness of the quantization matrix.
788 int qm_maxlevel;
789 // Indicates if adaptive quantize_b should be enabled.
790 int quant_b_adapt;
791 // Indicates the Adaptive Quantization mode to be used.
792 AQ_MODE aq_mode;
793 // Indicates the delta q mode to be used.
794 DELTAQ_MODE deltaq_mode;
795 // Indicates the delta q mode strength.
796 DELTAQ_MODE deltaq_strength;
797 // Indicates if delta quantization should be enabled in chroma planes.
798 bool enable_chroma_deltaq;
799 // Indicates if delta quantization should be enabled for hdr video
800 bool enable_hdr_deltaq;
801 // Indicates if encoding with quantization matrices should be enabled.
802 bool using_qm;
803} QuantizationCfg;
804
809typedef struct {
816 int sharpness;
817
825 int disable_trellis_quant;
826
830 int arnr_max_frames;
831
835 int arnr_strength;
836
843 uint8_t cdf_update_mode;
844
848 bool enable_tpl_model;
849
854 bool enable_overlay;
855
863 LOOPFILTER_CONTROL loopfilter_control;
864} AlgoCfg;
867typedef struct {
868 // Indicates the codec bit-depth.
869 aom_bit_depth_t bit_depth;
870 // Indicates the superblock size that should be used by the encoder.
871 aom_superblock_size_t superblock_size;
872 // Indicates if loopfilter modulation should be enabled.
873 bool enable_deltalf_mode;
874 // Indicates how CDEF should be applied.
875 CDEF_CONTROL cdef_control;
876 // Indicates if loop restoration filter should be enabled.
877 bool enable_restoration;
878 // When enabled, video mode should be used even for single frame input.
879 bool force_video_mode;
880 // Indicates if the error resiliency features should be enabled.
881 bool error_resilient_mode;
882 // Indicates if frame parallel decoding feature should be enabled.
883 bool frame_parallel_decoding_mode;
884 // Indicates if the input should be encoded as monochrome.
885 bool enable_monochrome;
886 // When enabled, the encoder will use a full header even for still pictures.
887 // When disabled, a reduced header is used for still pictures.
888 bool full_still_picture_hdr;
889 // Indicates if dual interpolation filters should be enabled.
890 bool enable_dual_filter;
891 // Indicates if frame order hint should be enabled or not.
892 bool enable_order_hint;
893 // Indicates if ref_frame_mvs should be enabled at the sequence level.
894 bool ref_frame_mvs_present;
895 // Indicates if ref_frame_mvs should be enabled at the frame level.
896 bool enable_ref_frame_mvs;
897 // Indicates if interintra compound mode is enabled.
898 bool enable_interintra_comp;
899 // Indicates if global motion should be enabled.
900 bool enable_global_motion;
901 // Indicates if palette should be enabled.
902 bool enable_palette;
903} ToolCfg;
904
909typedef struct AV1EncoderConfig {
911 // Configuration related to the input video.
912 InputCfg input_cfg;
913
914 // Configuration related to frame-dimensions.
915 FrameDimensionCfg frm_dim_cfg;
916
921 AlgoCfg algo_cfg;
922
926 KeyFrameCfg kf_cfg;
927
931 RateControlCfg rc_cfg;
934 // Configuration related to Quantization.
935 QuantizationCfg q_cfg;
936
937 // Internal frame size scaling.
938 ResizeCfg resize_cfg;
939
940 // Frame Super-Resolution size scaling.
941 SuperResCfg superres_cfg;
942
948 aom_fixed_buf_t twopass_stats_in;
951 // Configuration related to encoder toolsets.
952 ToolCfg tool_cfg;
953
954 // Configuration related to Group of frames.
955 GFConfig gf_cfg;
956
957 // Tile related configuration parameters.
958 TileConfig tile_cfg;
959
960 // Configuration related to Tune.
961 TuneCfg tune_cfg;
962
963 // Configuration related to color.
964 ColorCfg color_cfg;
965
966 // Configuration related to decoder model.
967 DecoderModelCfg dec_model_cfg;
968
969 // Configuration related to reference frames.
970 RefFrameCfg ref_frm_cfg;
971
972 // Configuration related to unit tests.
973 UnitTestCfg unit_test_cfg;
974
975 // Flags related to motion mode.
976 MotionModeCfg motion_mode_cfg;
977
978 // Flags related to intra mode search.
979 IntraModeCfg intra_mode_cfg;
980
981 // Flags related to transform size/type.
982 TxfmSizeTypeCfg txfm_cfg;
983
984 // Flags related to compound type.
985 CompoundTypeCfg comp_type_cfg;
986
987 // Partition related information.
988 PartitionCfg part_cfg;
989
990 // Configuration related to frequency of cost update.
991 CostUpdateFreq cost_upd_freq;
992
993#if CONFIG_DENOISE
994 // Indicates the noise level.
995 float noise_level;
996 // Indicates the the denoisers block size.
997 int noise_block_size;
998 // Indicates whether to apply denoising to the frame to be encoded
999 int enable_dnl_denoising;
1000#endif
1001
1002#if CONFIG_AV1_TEMPORAL_DENOISING
1003 // Noise sensitivity.
1004 int noise_sensitivity;
1005#endif
1006 // Bit mask to specify which tier each of the 32 possible operating points
1007 // conforms to.
1008 unsigned int tier_mask;
1009
1010 // Indicates the number of pixels off the edge of a reference frame we're
1011 // allowed to go when forming an inter prediction.
1012 int border_in_pixels;
1013
1014 // Indicates the maximum number of threads that may be used by the encoder.
1015 int max_threads;
1016
1017 // Indicates the speed preset to be used.
1018 int speed;
1019
1020 // Indicates the target sequence level index for each operating point(OP).
1021 AV1_LEVEL target_seq_level_idx[MAX_NUM_OPERATING_POINTS];
1022
1023 // Indicates the bitstream profile to be used.
1024 BITSTREAM_PROFILE profile;
1025
1034 enum aom_enc_pass pass;
1037 // Total number of encoding passes.
1038 int passes;
1039
1040 // the name of the second pass output file when passes > 2
1041 const char *two_pass_output;
1042
1043 // the name of the second pass log file when passes > 2
1044 const char *second_pass_log;
1045
1046 // Indicates if the encoding is GOOD or REALTIME.
1047 MODE mode;
1048
1049 // Indicates if row-based multi-threading should be enabled or not.
1050 bool row_mt;
1051
1052 // Indicates if frame parallel multi-threading should be enabled or not.
1053 bool fp_mt;
1054
1055 // Indicates if 16bit frame buffers are to be used i.e., the content is >
1056 // 8-bit.
1057 bool use_highbitdepth;
1058
1059 // Indicates the bitstream syntax mode. 0 indicates bitstream is saved as
1060 // Section 5 bitstream, while 1 indicates the bitstream is saved in Annex - B
1061 // format.
1062 bool save_as_annexb;
1063
1064 // The path for partition stats reading and writing, used in the experiment
1065 // CONFIG_PARTITION_SEARCH_ORDER.
1066 const char *partition_info_path;
1067
1068 // Exit the encoder when it fails to encode to a given level.
1069 int strict_level_conformance;
1071} AV1EncoderConfig;
1072
1074static INLINE int is_lossless_requested(const RateControlCfg *const rc_cfg) {
1075 return rc_cfg->best_allowed_q == 0 && rc_cfg->worst_allowed_q == 0;
1076}
1082typedef struct {
1088 int obmc_probs[FRAME_UPDATE_TYPES][BLOCK_SIZES_ALL];
1089
1095 int warped_probs[FRAME_UPDATE_TYPES];
1096
1103 int tx_type_probs[FRAME_UPDATE_TYPES][TX_SIZES_ALL][TX_TYPES];
1104
1111 int switchable_interp_probs[FRAME_UPDATE_TYPES][SWITCHABLE_FILTER_CONTEXTS]
1112 [SWITCHABLE_FILTERS];
1113} FrameProbInfo;
1114
1117typedef struct FRAME_COUNTS {
1118// Note: This structure should only contain 'unsigned int' fields, or
1119// aggregates built solely from 'unsigned int' fields/elements
1120#if CONFIG_ENTROPY_STATS
1121 unsigned int kf_y_mode[KF_MODE_CONTEXTS][KF_MODE_CONTEXTS][INTRA_MODES];
1122 unsigned int angle_delta[DIRECTIONAL_MODES][2 * MAX_ANGLE_DELTA + 1];
1123 unsigned int y_mode[BLOCK_SIZE_GROUPS][INTRA_MODES];
1124 unsigned int uv_mode[CFL_ALLOWED_TYPES][INTRA_MODES][UV_INTRA_MODES];
1125 unsigned int cfl_sign[CFL_JOINT_SIGNS];
1126 unsigned int cfl_alpha[CFL_ALPHA_CONTEXTS][CFL_ALPHABET_SIZE];
1127 unsigned int palette_y_mode[PALATTE_BSIZE_CTXS][PALETTE_Y_MODE_CONTEXTS][2];
1128 unsigned int palette_uv_mode[PALETTE_UV_MODE_CONTEXTS][2];
1129 unsigned int palette_y_size[PALATTE_BSIZE_CTXS][PALETTE_SIZES];
1130 unsigned int palette_uv_size[PALATTE_BSIZE_CTXS][PALETTE_SIZES];
1131 unsigned int palette_y_color_index[PALETTE_SIZES]
1132 [PALETTE_COLOR_INDEX_CONTEXTS]
1133 [PALETTE_COLORS];
1134 unsigned int palette_uv_color_index[PALETTE_SIZES]
1135 [PALETTE_COLOR_INDEX_CONTEXTS]
1136 [PALETTE_COLORS];
1137 unsigned int partition[PARTITION_CONTEXTS][EXT_PARTITION_TYPES];
1138 unsigned int txb_skip[TOKEN_CDF_Q_CTXS][TX_SIZES][TXB_SKIP_CONTEXTS][2];
1139 unsigned int eob_extra[TOKEN_CDF_Q_CTXS][TX_SIZES][PLANE_TYPES]
1140 [EOB_COEF_CONTEXTS][2];
1141 unsigned int dc_sign[PLANE_TYPES][DC_SIGN_CONTEXTS][2];
1142 unsigned int coeff_lps[TX_SIZES][PLANE_TYPES][BR_CDF_SIZE - 1][LEVEL_CONTEXTS]
1143 [2];
1144 unsigned int eob_flag[TX_SIZES][PLANE_TYPES][EOB_COEF_CONTEXTS][2];
1145 unsigned int eob_multi16[TOKEN_CDF_Q_CTXS][PLANE_TYPES][2][5];
1146 unsigned int eob_multi32[TOKEN_CDF_Q_CTXS][PLANE_TYPES][2][6];
1147 unsigned int eob_multi64[TOKEN_CDF_Q_CTXS][PLANE_TYPES][2][7];
1148 unsigned int eob_multi128[TOKEN_CDF_Q_CTXS][PLANE_TYPES][2][8];
1149 unsigned int eob_multi256[TOKEN_CDF_Q_CTXS][PLANE_TYPES][2][9];
1150 unsigned int eob_multi512[TOKEN_CDF_Q_CTXS][PLANE_TYPES][2][10];
1151 unsigned int eob_multi1024[TOKEN_CDF_Q_CTXS][PLANE_TYPES][2][11];
1152 unsigned int coeff_lps_multi[TOKEN_CDF_Q_CTXS][TX_SIZES][PLANE_TYPES]
1153 [LEVEL_CONTEXTS][BR_CDF_SIZE];
1154 unsigned int coeff_base_multi[TOKEN_CDF_Q_CTXS][TX_SIZES][PLANE_TYPES]
1155 [SIG_COEF_CONTEXTS][NUM_BASE_LEVELS + 2];
1156 unsigned int coeff_base_eob_multi[TOKEN_CDF_Q_CTXS][TX_SIZES][PLANE_TYPES]
1157 [SIG_COEF_CONTEXTS_EOB][NUM_BASE_LEVELS + 1];
1158 unsigned int newmv_mode[NEWMV_MODE_CONTEXTS][2];
1159 unsigned int zeromv_mode[GLOBALMV_MODE_CONTEXTS][2];
1160 unsigned int refmv_mode[REFMV_MODE_CONTEXTS][2];
1161 unsigned int drl_mode[DRL_MODE_CONTEXTS][2];
1162 unsigned int inter_compound_mode[INTER_MODE_CONTEXTS][INTER_COMPOUND_MODES];
1163 unsigned int wedge_idx[BLOCK_SIZES_ALL][16];
1164 unsigned int interintra[BLOCK_SIZE_GROUPS][2];
1165 unsigned int interintra_mode[BLOCK_SIZE_GROUPS][INTERINTRA_MODES];
1166 unsigned int wedge_interintra[BLOCK_SIZES_ALL][2];
1167 unsigned int compound_type[BLOCK_SIZES_ALL][MASKED_COMPOUND_TYPES];
1168 unsigned int motion_mode[BLOCK_SIZES_ALL][MOTION_MODES];
1169 unsigned int obmc[BLOCK_SIZES_ALL][2];
1170 unsigned int intra_inter[INTRA_INTER_CONTEXTS][2];
1171 unsigned int comp_inter[COMP_INTER_CONTEXTS][2];
1172 unsigned int comp_ref_type[COMP_REF_TYPE_CONTEXTS][2];
1173 unsigned int uni_comp_ref[UNI_COMP_REF_CONTEXTS][UNIDIR_COMP_REFS - 1][2];
1174 unsigned int single_ref[REF_CONTEXTS][SINGLE_REFS - 1][2];
1175 unsigned int comp_ref[REF_CONTEXTS][FWD_REFS - 1][2];
1176 unsigned int comp_bwdref[REF_CONTEXTS][BWD_REFS - 1][2];
1177 unsigned int intrabc[2];
1178
1179 unsigned int txfm_partition[TXFM_PARTITION_CONTEXTS][2];
1180 unsigned int intra_tx_size[MAX_TX_CATS][TX_SIZE_CONTEXTS][MAX_TX_DEPTH + 1];
1181 unsigned int skip_mode[SKIP_MODE_CONTEXTS][2];
1182 unsigned int skip_txfm[SKIP_CONTEXTS][2];
1183 unsigned int compound_index[COMP_INDEX_CONTEXTS][2];
1184 unsigned int comp_group_idx[COMP_GROUP_IDX_CONTEXTS][2];
1185 unsigned int delta_q[DELTA_Q_PROBS][2];
1186 unsigned int delta_lf_multi[FRAME_LF_COUNT][DELTA_LF_PROBS][2];
1187 unsigned int delta_lf[DELTA_LF_PROBS][2];
1188
1189 unsigned int inter_ext_tx[EXT_TX_SETS_INTER][EXT_TX_SIZES][TX_TYPES];
1190 unsigned int intra_ext_tx[EXT_TX_SETS_INTRA][EXT_TX_SIZES][INTRA_MODES]
1191 [TX_TYPES];
1192 unsigned int filter_intra_mode[FILTER_INTRA_MODES];
1193 unsigned int filter_intra[BLOCK_SIZES_ALL][2];
1194 unsigned int switchable_restore[RESTORE_SWITCHABLE_TYPES];
1195 unsigned int wiener_restore[2];
1196 unsigned int sgrproj_restore[2];
1197#endif // CONFIG_ENTROPY_STATS
1198
1199 unsigned int switchable_interp[SWITCHABLE_FILTER_CONTEXTS]
1200 [SWITCHABLE_FILTERS];
1201} FRAME_COUNTS;
1202
#define INTER_MODE_RD_DATA_OVERALL_SIZE 6400

// State of an inter-mode RD model: a readiness flag, two coefficients, running
// means, a sample count and running sums.
// NOTE(review): presumably a linear model fitted from the accumulated sums
// (a, b being its coefficients; "ld" and "sse" naming the regressed
// quantities) -- the fitting code is not visible here; confirm.
typedef struct {
  int ready;  // Non-zero once the model can be used (presumed).
  double a;
  double b;
  double dist_mean;
  double ld_mean;
  double sse_mean;
  double sse_sse_mean;
  double sse_ld_mean;
  int num;  // Sample count (presumed).
  double dist_sum;
  double ld_sum;
  double sse_sum;
  double sse_sse_sum;
  double sse_ld_sum;
} InterModeRdModel;
1221
// Pairs an index with a 64-bit RD value.
typedef struct {
  int idx;
  int64_t rd;
} RdIdxPair;
1226// TODO(angiebird): This is an estimated size. We still need to figure what is
1227// the maximum number of modes.
1228#define MAX_INTER_MODES 1024
1229// TODO(any): rename this struct to something else. There is already another
1230// struct called inter_mode_info, which makes this terribly confusing.
1238typedef struct inter_modes_info {
1243 int num;
1247 MB_MODE_INFO mbmi_arr[MAX_INTER_MODES];
1251 int mode_rate_arr[MAX_INTER_MODES];
1255 int64_t sse_arr[MAX_INTER_MODES];
1259 int64_t est_rd_arr[MAX_INTER_MODES];
1263 RdIdxPair rd_idx_pair_arr[MAX_INTER_MODES];
1267 RD_STATS rd_cost_arr[MAX_INTER_MODES];
1271 RD_STATS rd_cost_y_arr[MAX_INTER_MODES];
1275 RD_STATS rd_cost_uv_arr[MAX_INTER_MODES];
1276} InterModesInfo;
1277
// Variance accumulator for one partition node.
typedef struct {
  // TODO(kyslov): consider changing to 64bit

  // This struct is used for computing variance in choose_partitioning(), where
  // the max number of samples within a superblock is 32x32 (with 4x4 avg).
  // With 8bit bitdepth, uint32_t is enough for sum_square_error (2^8 * 2^8 * 32
  // * 32 = 2^26). For high bitdepth we need to consider changing this to 64 bit
  uint32_t sum_square_error;
  int32_t sum_error;
  int log2_count;
  int variance;
} VPartVar;
1291
1292typedef struct {
1293 VPartVar none;
1294 VPartVar horz[2];
1295 VPartVar vert[2];
1296} VPVariance;
1297
1298typedef struct {
1299 VPVariance part_variances;
1300 VPartVar split[4];
1301} VP4x4;
1302
1303typedef struct {
1304 VPVariance part_variances;
1305 VP4x4 split[4];
1306} VP8x8;
1307
1308typedef struct {
1309 VPVariance part_variances;
1310 VP8x8 split[4];
1311} VP16x16;
1312
1313typedef struct {
1314 VPVariance part_variances;
1315 VP16x16 split[4];
1316} VP32x32;
1317
1318typedef struct {
1319 VPVariance part_variances;
1320 VP32x32 split[4];
1321} VP64x64;
1322
1323typedef struct {
1324 VPVariance part_variances;
1325 VP64x64 *split;
1326} VP128x128;
1327
// Thresholds used by variance-based partitioning.
// NOTE(review): which block size each of the five entries applies to is not
// visible in this header -- confirm.
typedef struct {
  // Five variance thresholds.
  int64_t thresholds[5];

  // Threshold applied to a min/max measure.
  int64_t threshold_minmax;
} VarBasedPartitionInfo;
1350
// Synchronization state for row-based multi-threaded encoding.
// NOTE(review): field meanings are read off the names; the locking protocol is
// not visible in this header -- confirm.
typedef struct {
#if CONFIG_MULTITHREAD
  // Mutex and condition variable; only present in multi-threaded builds.
  pthread_mutex_t *mutex_;
  pthread_cond_t *cond_;
#endif  // CONFIG_MULTITHREAD
  // Presumably the number of finished columns, one entry per row.
  int *num_finished_cols;
  // Synchronization range; presumably in columns.
  int sync_range;
  // Number of rows.
  int rows;
  // Next mi row to process.
  int next_mi_row;
  // Number of threads currently working.
  int num_threads_working;
} AV1EncRowMultiThreadSync;
1389
1392// TODO(jingning) All spatially adaptive variables should go to TileDataEnc.
1393typedef struct TileDataEnc {
1394 TileInfo tile_info;
1395 DECLARE_ALIGNED(16, FRAME_CONTEXT, tctx);
1396 FRAME_CONTEXT *row_ctx;
1397 uint64_t abs_sum_level;
1398 uint8_t allow_update_cdf;
1399 InterModeRdModel inter_mode_rd_models[BLOCK_SIZES_ALL];
1400 AV1EncRowMultiThreadSync row_mt_sync;
1401 MV firstpass_top_mv;
1402} TileDataEnc;
1403
1404typedef struct RD_COUNTS {
1405 int compound_ref_used_flag;
1406 int skip_mode_used_flag;
1407 int tx_type_used[TX_SIZES_ALL][TX_TYPES];
1408 int obmc_used[BLOCK_SIZES_ALL][2];
1409 int warped_used[2];
1410 int newmv_or_intra_blocks;
1411 uint64_t seg_tmp_pred_cost[2];
1412} RD_COUNTS;
1413
// Working data bundled for one encoding thread: the MACROBLOCK being coded,
// its counters, and scratch buffers. AV1_COMP embeds one instance as `td`.
// Most members are pointers; their allocation and lifetime are handled outside
// this header.
1414typedef struct ThreadData {
1415 MACROBLOCK mb;
1416 RD_COUNTS rd_counts;
1417 FRAME_COUNTS *counts;
1418 PC_TREE_SHARED_BUFFERS shared_coeff_buf;
1419 SIMPLE_MOTION_DATA_TREE *sms_tree;
1420 SIMPLE_MOTION_DATA_TREE *sms_root;
1421 uint32_t *hash_value_buffer[2][2];
1422 OBMCBuffer obmc_buffer;
1423 PALETTE_BUFFER *palette_buffer;
1424 CompoundTypeRdBuffers comp_rd_buffer;
1425 CONV_BUF_TYPE *tmp_conv_dst;
1426 uint64_t abs_sum_level;
1427 uint8_t *tmp_pred_bufs[2];
1428 int intrabc_used;
1429 int deltaq_used;
1430 int coefficient_size;
1431 int max_mv_magnitude;
1432 int interp_filter_selected[SWITCHABLE];
1433 FRAME_CONTEXT *tctx;
// Array of 64x64 variance-tree nodes together with its element count.
1434 VP64x64 *vt64x64;
1435 int32_t num_64x64_blocks;
1436 PICK_MODE_CONTEXT *firstpass_ctx;
1437 TemporalFilterData tf_data;
1438 TplTxfmStats tpl_txfm_stats;
1439 // Pointer to the array of structures to store gradient information of each
1440 // pixel in a superblock. The buffer constitutes of MAX_SB_SQUARE pixel level
1441 // structures for each of the plane types (PLANE_TYPE_Y and PLANE_TYPE_UV).
1442 PixelLevelGradientInfo *pixel_gradient_info;
1443 // Pointer to the array of structures to store source variance information of
1444 // each 4x4 sub-block in a superblock. Block4x4VarInfo structure is used to
1445 // store source variance and log of source variance of each 4x4 sub-block
1446 // for subsequent retrieval.
1447 Block4x4VarInfo *src_var_info_of_4x4_sub_blocks;
1448} ThreadData;
1449
1450struct EncWorkerData;
1451
// Frame-level bookkeeping for row multi-threaded encoding; stored in
// MultiThreadInfo as `enc_row_mt`.
1457typedef struct {
// Dimensions for which row-MT storage has been allocated.
// NOTE(review): presumably compared against the current frame/tile layout to
// decide on reallocation — confirm in the allocator.
1461 int allocated_tile_rows;
1465 int allocated_tile_cols;
1472 int allocated_rows;
1479 int allocated_cols;
1480
// Lookup table indexed by thread id, giving a tile id.
1484 int thread_id_to_tile_id[MAX_NUM_THREADS];
1485
1486#if CONFIG_MULTITHREAD
1490 pthread_mutex_t *mutex_;
1491#endif
1492
// Hooks taking an AV1EncRowMultiThreadSync plus integer coordinates; held as
// function pointers so the implementation can be chosen at run time.
1500 void (*sync_read_ptr)(AV1EncRowMultiThreadSync *const, int, int);
1504 void (*sync_write_ptr)(AV1EncRowMultiThreadSync *const, int, int, int);
1506} AV1EncRowMultiThreadInfo;
1507
1511#define NUM_RECODES_PER_FRAME 10
1512
1513#if CONFIG_FRAME_PARALLEL_ENCODE
1517#define MAX_PARALLEL_FRAMES 4
1518
// Set of CDEF / loop-restoration buffer pointers. Only defined when
// CONFIG_FRAME_PARALLEL_ENCODE is set; MultiThreadInfo keeps one instance as
// `restore_state_buf`.
// NOTE(review): judging by the type name these are saved copies to be restored
// later — confirm with the frame-parallel code that fills them.
1523typedef struct RestoreStateBuffers {
1527 uint16_t *cdef_srcbuf;
1528
// One column buffer pointer per plane.
1532 uint16_t *cdef_colbuf[MAX_MB_PLANE];
1533
1537 int32_t *rst_tmpbuf;
1538
1542 RestorationLineBuffers *rlbs;
1543} RestoreStateBuffers;
1544#endif // CONFIG_FRAME_PARALLEL_ENCODE
1545
// Multi-threading state kept at the AV1_PRIMARY level (member `p_mt_info`).
// Mirrors the leading members of MultiThreadInfo: worker count, per-module
// worker counts, the worker array and per-thread data.
1549typedef struct PrimaryMultiThreadInfo {
1553 int num_workers;
1554
// Worker count for each multi-threaded module, indexed by module id.
1558 int num_mod_workers[NUM_MT_MODULES];
1559
1563 AVxWorker *workers;
1564
1569 struct EncWorkerData *tile_thr_data;
1570
1574 AV1CdefWorkerData *cdef_worker;
1575
1576#if CONFIG_FRAME_PARALLEL_ENCODE
// Worker pointers and count used only with frame-parallel encoding.
1581 AVxWorker *p_workers[MAX_PARALLEL_FRAMES];
1582
1586 int p_num_workers;
1587#endif // CONFIG_FRAME_PARALLEL_ENCODE
1588} PrimaryMultiThreadInfo;
1589
// Multi-threading state kept per AV1_COMP (member `mt_info`): worker pool
// description, enable flags, and one synchronization object per
// multi-threaded stage.
1593typedef struct MultiThreadInfo {
1597 int num_workers;
1598
// Worker count for each multi-threaded module, indexed by module id.
1602 int num_mod_workers[NUM_MT_MODULES];
1603
1607 AVxWorker *workers;
1608
1613 struct EncWorkerData *tile_thr_data;
1614
// Feature switches for row-based encoding MT and bitstream-packing MT.
1619 bool row_mt_enabled;
1620
1624 bool pack_bs_mt_enabled;
1625
// Per-stage synchronization / bookkeeping objects.
1629 AV1EncRowMultiThreadInfo enc_row_mt;
1630
1634 AV1TplRowMultiThreadInfo tpl_row_mt;
1635
1639 AV1LfSync lf_row_sync;
1640
1644 AV1LrSync lr_row_sync;
1645
1649 AV1EncPackBSSync pack_bs_sync;
1650
1654 AV1GlobalMotionSync gm_sync;
1655
1659 AV1TemporalFilterSync tf_sync;
1660
1664 AV1CdefSync cdef_sync;
1665
1669 AV1CdefWorkerData *cdef_worker;
1670
1671#if CONFIG_FRAME_PARALLEL_ENCODE
1675 RestoreStateBuffers restore_state_buf;
1676#endif // CONFIG_FRAME_PARALLEL_ENCODE
1677} MultiThreadInfo;
1678
// Active-map state: two integer flags and a byte map (AV1_COMP member
// `active_map`).
// NOTE(review): the map's dimensions and per-byte encoding are not visible
// here; see av1_set_active_map() / av1_get_active_map() for the rows x cols
// interface.
1681typedef struct ActiveMap {
1682 int enabled;
1683 int update;
1684 unsigned char *map;
1685} ActiveMap;
1686
// Rate history used for the force-integer-MV decision (AV1_COMP member
// `force_intpel_info`): a fixed 32-entry array plus an index and a size.
// NOTE(review): the index/size pair suggests a ring buffer over
// `cs_rate_array` — confirm in the code that updates it.
1692typedef struct {
1697 double cs_rate_array[32];
1701 int rate_index;
1705 int rate_size;
1706} ForceIntegerMVInfo;
1707
1710#if CONFIG_INTERNAL_STATS
1711// types of stats
// Index into ImageStat::stat: one slot per plane (Y, U, V) and one combined
// slot. NUM_STAT_TYPES doubles as the array length, so it must remain last.
1712enum {
1713 STAT_Y,
1714 STAT_U,
1715 STAT_V,
1716 STAT_ALL,
1717 NUM_STAT_TYPES // This should always be the last member of the enum
1718} UENUM1BYTE(StatType);
1719
// One quality metric broken down by StatType, plus a separately tracked
// `worst` value. Only available with CONFIG_INTERNAL_STATS.
1720typedef struct IMAGE_STAT {
1721 double stat[NUM_STAT_TYPES];
1722 double worst;
1723} ImageStat;
1724#endif // CONFIG_INTERNAL_STATS
1725
// Minimal encoder-side record that carries only a reference count.
1726typedef struct {
1727 int ref_count;
1729} EncRefCntBuffer;
1730
// Describes the frame-level array of MB_MODE_INFO_EXT_FRAME entries (AV1_COMP
// member `mbmi_ext_info`): base pointer, allocated size and row stride.
// NOTE(review): whether `alloc_size` counts elements or bytes is not visible
// here — confirm at the allocation site.
1738typedef struct {
1743 MB_MODE_INFO_EXT_FRAME *frame_base;
1747 int alloc_size;
1751 int stride;
1752} MBMIExtFrameBufferInfo;
1753
1756#if CONFIG_COLLECT_PARTITION_STATS
// Per-frame partition-search statistics, compiled in only with
// CONFIG_COLLECT_PARTITION_STATS. Each table is [6][EXT_PARTITION_TYPES].
// NOTE(review): the first dimension (6) presumably indexes block-size class —
// confirm where the tables are filled.
1757typedef struct FramePartitionTimingStats {
1758 int partition_decisions[6][EXT_PARTITION_TYPES];
1759 int partition_attempts[6][EXT_PARTITION_TYPES];
1760 int64_t partition_times[6][EXT_PARTITION_TYPES];
1761
1762 int partition_redo;
1763} FramePartitionTimingStats;
1764#endif // CONFIG_COLLECT_PARTITION_STATS
1765
1766#if CONFIG_COLLECT_COMPONENT_TIMING
1767#include "aom_ports/aom_timer.h"
1768// Adjust the following to add new components.
// Identifiers for the encoder stages that can be timed when
// CONFIG_COLLECT_COMPONENT_TIMING is enabled. kTimingComponents is the count
// and is used as an array length in AV1_COMP, so it must stay last. Every
// enumerator added here also needs a matching case in get_component_name().
1769enum {
1770 av1_encode_strategy_time,
1771 av1_get_one_pass_rt_params_time,
1772 av1_get_second_pass_params_time,
1773 denoise_and_encode_time,
1774 apply_filtering_time,
1775 av1_tpl_setup_stats_time,
1776 encode_frame_to_data_rate_time,
1777 encode_with_or_without_recode_time,
1778 loop_filter_time,
1779 cdef_time,
1780 loop_restoration_time,
1781 av1_pack_bitstream_final_time,
1782 av1_encode_frame_time,
1783 av1_compute_global_motion_time,
1784 av1_setup_motion_field_time,
1785 encode_sb_row_time,
1786
1787 rd_pick_partition_time,
1788 rd_use_partition_time,
1789 choose_var_based_partitioning_time,
1790 av1_prune_partitions_time,
1791 none_partition_search_time,
1792 split_partition_search_time,
1793 rectangular_partition_search_time,
1794 ab_partitions_search_time,
1795 rd_pick_4partition_time,
1796 encode_sb_time,
1797
1798 rd_pick_sb_modes_time,
1799 av1_rd_pick_intra_mode_sb_time,
1800 av1_rd_pick_inter_mode_sb_time,
1801 set_params_rd_pick_inter_mode_time,
1802 skip_inter_mode_time,
1803 handle_inter_mode_time,
1804 evaluate_motion_mode_for_winner_candidates_time,
1805 do_tx_search_time,
1806 handle_intra_mode_time,
1807 refine_winner_mode_tx_time,
1808 av1_search_palette_mode_time,
1809 handle_newmv_time,
1810 compound_type_rd_time,
1811 interpolation_filter_search_time,
1812 motion_mode_rd_time,
1813
1814 nonrd_use_partition_time,
1815 pick_sb_modes_nonrd_time,
1816 hybrid_intra_mode_search_time,
1817 nonrd_pick_inter_mode_sb_time,
1818 encode_b_nonrd_time,
1819
1820 kTimingComponents,
1821} UENUM1BYTE(TIMING_COMPONENT);
1822
1823static INLINE char const *get_component_name(int index) {
1824 switch (index) {
1825 case av1_encode_strategy_time: return "av1_encode_strategy_time";
1826 case av1_get_one_pass_rt_params_time:
1827 return "av1_get_one_pass_rt_params_time";
1828 case av1_get_second_pass_params_time:
1829 return "av1_get_second_pass_params_time";
1830 case denoise_and_encode_time: return "denoise_and_encode_time";
1831 case apply_filtering_time: return "apply_filtering_time";
1832 case av1_tpl_setup_stats_time: return "av1_tpl_setup_stats_time";
1833 case encode_frame_to_data_rate_time:
1834 return "encode_frame_to_data_rate_time";
1835 case encode_with_or_without_recode_time:
1836 return "encode_with_or_without_recode_time";
1837 case loop_filter_time: return "loop_filter_time";
1838 case cdef_time: return "cdef_time";
1839 case loop_restoration_time: return "loop_restoration_time";
1840 case av1_pack_bitstream_final_time: return "av1_pack_bitstream_final_time";
1841 case av1_encode_frame_time: return "av1_encode_frame_time";
1842 case av1_compute_global_motion_time:
1843 return "av1_compute_global_motion_time";
1844 case av1_setup_motion_field_time: return "av1_setup_motion_field_time";
1845 case encode_sb_row_time: return "encode_sb_row_time";
1846
1847 case rd_pick_partition_time: return "rd_pick_partition_time";
1848 case rd_use_partition_time: return "rd_use_partition_time";
1849 case choose_var_based_partitioning_time:
1850 return "choose_var_based_partitioning_time";
1851 case av1_prune_partitions_time: return "av1_prune_partitions_time";
1852 case none_partition_search_time: return "none_partition_search_time";
1853 case split_partition_search_time: return "split_partition_search_time";
1854 case rectangular_partition_search_time:
1855 return "rectangular_partition_search_time";
1856 case ab_partitions_search_time: return "ab_partitions_search_time";
1857 case rd_pick_4partition_time: return "rd_pick_4partition_time";
1858 case encode_sb_time: return "encode_sb_time";
1859
1860 case rd_pick_sb_modes_time: return "rd_pick_sb_modes_time";
1861 case av1_rd_pick_intra_mode_sb_time:
1862 return "av1_rd_pick_intra_mode_sb_time";
1863 case av1_rd_pick_inter_mode_sb_time:
1864 return "av1_rd_pick_inter_mode_sb_time";
1865 case set_params_rd_pick_inter_mode_time:
1866 return "set_params_rd_pick_inter_mode_time";
1867 case skip_inter_mode_time: return "skip_inter_mode_time";
1868 case handle_inter_mode_time: return "handle_inter_mode_time";
1869 case evaluate_motion_mode_for_winner_candidates_time:
1870 return "evaluate_motion_mode_for_winner_candidates_time";
1871 case do_tx_search_time: return "do_tx_search_time";
1872 case handle_intra_mode_time: return "handle_intra_mode_time";
1873 case refine_winner_mode_tx_time: return "refine_winner_mode_tx_time";
1874 case av1_search_palette_mode_time: return "av1_search_palette_mode_time";
1875 case handle_newmv_time: return "handle_newmv_time";
1876 case compound_type_rd_time: return "compound_type_rd_time";
1877 case interpolation_filter_search_time:
1878 return "interpolation_filter_search_time";
1879 case motion_mode_rd_time: return "motion_mode_rd_time";
1880
1881 case nonrd_use_partition_time: return "nonrd_use_partition_time";
1882 case pick_sb_modes_nonrd_time: return "pick_sb_modes_nonrd_time";
1883 case hybrid_intra_mode_search_time: return "hybrid_intra_mode_search_time";
1884 case nonrd_pick_inter_mode_sb_time: return "nonrd_pick_inter_mode_sb_time";
1885 case encode_b_nonrd_time: return "encode_b_nonrd_time";
1886
1887 default: assert(0);
1888 }
1889 return "error";
1890}
1891#endif
1892
1893// The maximum number of internal ARFs except ALTREF_FRAME
1894#define MAX_INTERNAL_ARFS (REF_FRAMES - BWDREF_FRAME - 1)
1895
// State kept for global-motion estimation (AV1_COMP member `gm_info`):
// a completion flag, the reference buffers considered, and source-frame
// feature data.
1901typedef struct {
1905 bool search_done;
1906
// One buffer pointer per reference slot.
1912 YV12_BUFFER_CONFIG *ref_buf[REF_FRAMES];
1913
1917 unsigned char *src_buffer;
1918
// Per-direction reference count and the corresponding list of references.
1924 int num_ref_frames[MAX_DIRECTIONS];
1925
1932 FrameDistPair reference_frames[MAX_DIRECTIONS][REF_FRAMES - 1];
1933
1938 int segment_map_w;
1939 int segment_map_h;
1945 int num_src_corners;
1946
// Sized 2 * MAX_CORNERS, i.e. two ints per corner.
// NOTE(review): presumably interleaved x,y coordinates — confirm with the
// corner detector.
1952 int src_corners[2 * MAX_CORNERS];
1953} GlobalMotionInfo;
1954
// Width/height pair stored in AV1_COMP as `initial_dimensions`.
// NOTE(review): units (pixels) and when the pair is captured are not visible
// in this chunk.
1964typedef struct {
1965 int width;
1966 int height;
1967} InitialDimensions;
1968
// Controls for the interpolation-filter search (AV1_COMP member
// `interp_search_flags`): a default skip-flag word and a 16-bit filter mask.
// NOTE(review): bit assignments of both fields are defined elsewhere.
1972typedef struct {
1977 int default_interp_skip_flags;
1981 uint16_t interp_filter_search_mask;
1982} InterpSearchFlags;
1983
// Motion-vector search configuration (AV1_COMP member `mv_search_params`).
1987typedef struct {
1993 int max_mv_magnitude;
1998 int mv_step_param;
// Function pointer selecting the sub-pel refinement routine.
2007 fractional_mv_step_fp *find_fractional_mv_step;
// Search-site tables, one per (SS_CFG_* kind, distinct search method) pair.
2014 search_site_config search_site_cfg[SS_CFG_TOTAL][NUM_DISTINCT_SEARCH_METHODS];
2015} MotionVectorSearchParams;
2016
// Refresh flags for the golden, backward and alt-ref reference frames. Used
// both in AV1_COMP (`refresh_frame`) and in EncodeFrameParams.
2025typedef struct {
2026 bool golden_frame;
2027 bool bwd_ref_frame;
2028 bool alt_ref_frame;
2029} RefreshFrameInfo;
2030
// Width/height pair for a pending resize (AV1_COMP member
// `resize_pending_params`); av1_set_internal_size() receives a pointer to one.
// NOTE(review): which values mean "no resize pending" is not visible here.
2038typedef struct {
2039 int width;
2040 int height;
2041} ResizePendingParams;
2042
// Distance information for the inter reference frames (AV1_COMP member
// `ref_frame_dist_info`): one relative distance per inter reference plus the
// identifiers of the nearest past and nearest future references.
// NOTE(review): the sign convention of `ref_relative_dist` and the sentinel
// used when no past/future reference exists are not visible here.
2046typedef struct {
2050 int ref_relative_dist[INTER_REFS_PER_FRAME];
2054 int8_t nearest_past_ref;
2058 int8_t nearest_future_ref;
2059} RefFrameDistanceInfo;
2060
// Transform-search tuning values, each stored once per mode-evaluation type
// (arrays are indexed by MODE_EVAL_TYPES). AV1_COMP member
// `winner_mode_params`.
2076typedef struct {
// Two threshold values per evaluation type.
2084 unsigned int coeff_opt_thresholds[MODE_EVAL_TYPES][2];
2085
2090 TX_SIZE_SEARCH_METHOD tx_size_search_methods[MODE_EVAL_TYPES];
2091
2098 unsigned int use_transform_domain_distortion[MODE_EVAL_TYPES];
2099
2105 unsigned int tx_domain_dist_threshold[MODE_EVAL_TYPES];
2106
2112 unsigned int skip_txfm_level[MODE_EVAL_TYPES];
2113
2119 unsigned int predict_dc_level[MODE_EVAL_TYPES];
2120} WinnerModeParams;
2121
// Refresh flags for five reference frames plus an `update_pending` marker;
// embedded in ExternalFlags as `refresh_frame`.
// NOTE(review): presumably `update_pending` says whether the other flags hold
// a not-yet-applied external request — confirm in av1_apply_encoding_flags().
2129typedef struct {
2130 bool last_frame;
2131 bool golden_frame;
2132 bool bwd_ref_frame;
2133 bool alt2_ref_frame;
2134 bool alt_ref_frame;
2138 bool update_pending;
2139} ExtRefreshFrameFlagsInfo;
2140
// Flags stored in AV1_COMP as `ext_flags`. Going by the type name they carry
// settings supplied from outside the encoder core.
2144typedef struct {
// Bit mask of reference frames.
// NOTE(review): bit layout is defined elsewhere.
2148 int ref_frame_flags;
2149
2153 ExtRefreshFrameFlagsInfo refresh_frame;
2154
// Value / pending pair for the frame-context refresh setting.
2158 bool refresh_frame_context;
2159
2164 bool refresh_frame_context_pending;
2165
2169 bool use_ref_frame_mvs;
2170
2174 bool use_error_resilient;
2175
2179 bool use_s_frame;
2180
2185 bool use_primary_ref_none;
2186} ExternalFlags;
2187
// Motion-vector statistics for one frame. Instances appear in AV1_PRIMARY,
// AV1_COMP and CODING_CONTEXT. The `valid` field tells whether the remaining
// fields hold usable data.
2190typedef struct {
2191 // Some misc info
2192 int high_prec;
2193 int q;
2194 int order;
2195
2196 // MV counters
2197 int inter_count;
2198 int intra_count;
2199 int default_mvs;
2200 int mv_joint_count[4];
2201 int last_bit_zero;
2202 int last_bit_nonzero;
2203
2204 // Keep track of the rates
2205 int total_mv_rate;
2206 int hp_total_mv_rate;
2207 int lp_total_mv_rate;
2208
2209 // Texture info
2210 int horz_text;
2211 int vert_text;
2212 int diag_text;
2213
2214 // Whether the current struct contains valid data
2215 int valid;
2216} MV_STATS;
2217
// Per-block statistics record; AV1_COMP::mb_weber_stats points to an array of
// these. It holds variance figures for source and reconstruction, their
// maximum pixel values, and distortion / SATD numbers.
// NOTE(review): the block size each record covers is presumably
// AV1_COMP::weber_bsize — confirm where the array is filled.
2218typedef struct WeberStats {
2219 int64_t mb_wiener_variance;
2220 int64_t src_variance;
2221 int64_t rec_variance;
2222 int16_t src_pix_max;
2223 int16_t rec_pix_max;
2224 int64_t distortion;
2225 int64_t satd;
2226 double max_scale;
2227} WeberStats;
2228
// Bundle of by-value copies of encoder state: loop-filter and CDEF settings,
// a frame buffer, rate control and MV stats. AV1_COMP keeps one as
// `coding_context`.
// NOTE(review): presumably a snapshot taken so state can be restored after a
// trial encode — confirm with the save/restore helpers.
2229typedef struct {
2230 struct loopfilter lf;
2231 CdefInfo cdef_info;
2232 YV12_BUFFER_CONFIG copy_buffer;
2233 RATE_CONTROL rc;
2234 MV_STATS mv_stats;
2235} CODING_CONTEXT;
2236
// Frame geometry and format summary (AV1_COMP member `frame_info`):
// dimensions expressed as width/height, as mi units and as macroblocks, plus
// bit depth and chroma subsampling.
2237typedef struct {
2238 int frame_width;
2239 int frame_height;
2240 int mi_rows;
2241 int mi_cols;
2242 int mb_rows;
2243 int mb_cols;
2244 int num_mbs;
2245 aom_bit_depth_t bit_depth;
2246 int subsampling_x;
2247 int subsampling_y;
2248} FRAME_INFO;
2249
// Frame counters kept per AV1_COMP (`frame_index_set`); currently holds only
// the count of shown frames.
2253typedef struct {
2254 int show_frame_count;
2255} FRAME_INDEX_SET;
2256
// Encoder-side segmentation data (AV1_COMP member `enc_seg`): a byte map and
// a flag recording whether any segment is lossless.
// NOTE(review): the map's dimensions and granularity are not visible here.
2262typedef struct {
2268 uint8_t *map;
2274 bool has_lossless_segment;
2275} EncSegmentationInfo;
2276
// Timestamp bookkeeping (AV1_COMP member `time_stamps`): start/end of the
// previous frame and the start of the first one.
// NOTE(review): presumably expressed in TICKS_PER_SEC units — confirm where
// these are assigned.
2280typedef struct {
2284 int64_t prev_ts_start;
2288 int64_t prev_ts_end;
2292 int64_t first_ts_start;
2293} TimeStamps;
2294
// Three parallel storage pointers for coefficient data (AV1_COMP member
// `coeff_buffer_pool`): transform coefficients, end-of-block positions and
// entropy contexts.
// NOTE(review): sizes and how CB_COEFF_BUFFER entries point into this pool
// are not visible in this chunk.
2299typedef struct {
2303 tran_low_t *tcoeff;
2307 uint16_t *eobs;
2311 uint8_t *entropy_ctx;
2312} CoeffBufferPool;
2313
// Input/output parameter block passed to av1_get_compressed_data() and
// av1_post_encode_updates(): the output bitstream buffer, resulting frame
// size and flags, frame timestamps, and a few control values.
2317typedef struct AV1_COMP_DATA {
// Output buffer and its capacity.
2321 unsigned char *cx_data;
2322
2326 size_t cx_data_sz;
2327
2331 size_t frame_size;
2332
2336 unsigned int lib_flags;
2337
2341 int64_t ts_frame_start;
2342
2346 int64_t ts_frame_end;
2347
2351 int flush;
2352
// Ratio used by timebase_units_to_ticks() / ticks_to_timebase_units().
2356 const aom_rational64_t *timestamp_ratio;
2357
2361 int pop_lookahead;
2362#if CONFIG_FRAME_PARALLEL_ENCODE
2366 int frame_display_order_hint;
2367#endif
2368} AV1_COMP_DATA;
2369
// Top-level encoder object. It points at the AV1_COMP instances (`cpi`,
// `cpi_lap`, and `parallel_cpi` under CONFIG_FRAME_PARALLEL_ENCODE) and holds
// state that is stored once rather than per AV1_COMP: sequence header, GF
// group, two-pass data, TPL data, level parameters and so on. Each AV1_COMP
// points back here through its `ppi` member.
2373typedef struct AV1_PRIMARY {
2374#if CONFIG_FRAME_PARALLEL_ENCODE
2378 struct AV1_COMP *parallel_cpi[MAX_PARALLEL_FRAMES];
2379
// Note: one entry fewer than `parallel_cpi`.
2384 struct AV1_COMP_DATA parallel_frames_data[MAX_PARALLEL_FRAMES - 1];
2385
2386#if CONFIG_FPMT_TEST
// Members below exist only for the frame-parallel unit-test configuration.
2392 FPMT_TEST_ENC_CFG fpmt_unit_test_cfg;
2393
2397 FrameProbInfo temp_frame_probs;
2398
2404 FrameProbInfo temp_frame_probs_simulation;
2405
2410 int temp_valid_gm_model_found[FRAME_UPDATE_TYPES];
2411#endif
2412#if CONFIG_FRAME_PARALLEL_ENCODE_2
2418 RefCntBuffer *ref_frame_map_copy[REF_FRAMES];
2419#endif // CONFIG_FRAME_PARALLEL_ENCODE_2
2420#endif // CONFIG_FRAME_PARALLEL_ENCODE
2421
2425 int64_t ts_start_last_show_frame;
2426
2430 int64_t ts_end_last_show_frame;
2431
2435 int num_fp_contexts;
2436
// Loop-filter levels: two luma values, then one each for U and V.
2440 int filter_level[2];
2441
2445 int filter_level_u;
2446
2450 int filter_level_v;
2451
2457 struct AV1_COMP *cpi;
2458
2462 struct AV1_COMP *cpi_lap;
2463
2467 struct lookahead_ctx *lookahead;
2468
2474 int seq_params_locked;
2475
2480 struct aom_codec_pkt_list *output_pkt_list;
2481
2485 int internal_altref_allowed;
2486
2490 int show_existing_alt_ref;
2491
2495 GF_GROUP gf_group;
2496
2500 GF_STATE gf_state;
2501
2505 int lap_enabled;
2506
2510 AV1LevelParams level_params;
2511
2515 int b_calculate_psnr;
2516
2520 int frames_left;
2521
2525 TWO_PASS twopass;
2526
2531
2535 TEMPORAL_FILTER_INFO tf_info;
2540 SequenceHeader seq_params;
2541
2545 int use_svc;
2546
2550 bool buffer_removal_time_present;
2551
2555 unsigned int number_temporal_layers;
2556
2560 unsigned int number_spatial_layers;
2561
2565 struct aom_internal_error_info error;
2566
// One variance/SAD function table entry per block size.
2572 aom_variance_fn_ptr_t fn_ptr[BLOCK_SIZES_ALL];
2573
2578 double *tpl_sb_rdmult_scaling_factors;
2579
2583 TplParams tpl_data;
2584
2588 MV_STATS mv_stats;
2589
2590#if CONFIG_INTERNAL_STATS
// Accumulated quality/timing statistics; present only with
// CONFIG_INTERNAL_STATS.
2592 uint64_t total_time_receive_data;
2593 uint64_t total_time_compress_data;
2594
2595 unsigned int total_mode_chosen_counts[MAX_MODES];
2596
2597 int count[2];
2598 uint64_t total_sq_error[2];
2599 uint64_t total_samples[2];
2600 ImageStat psnr[2];
2601
2602 double total_blockiness;
2603 double worst_blockiness;
2604
2605 int total_bytes;
2606 double summed_quality;
2607 double summed_weights;
2608 double summed_quality_hbd;
2609 double summed_weights_hbd;
2610 unsigned int total_recode_hits;
2611 double worst_ssim;
2612 double worst_ssim_hbd;
2613
2614 ImageStat fastssim;
2615 ImageStat psnrhvs;
2616
2617 int b_calculate_blockiness;
2618 int b_calculate_consistency;
2619
2620 double total_inconsistency;
2621 double worst_consistency;
2622 Ssimv *ssim_vars;
2623 Metrics metrics;
2625#endif
2626
2627#if CONFIG_ENTROPY_STATS
2631 FRAME_COUNTS aggregate_fc;
2632#endif // CONFIG_ENTROPY_STATS
2633
2640 int fb_of_context_type[REF_FRAMES];
2641
2645 PrimaryMultiThreadInfo p_mt_info;
2646
2650 FrameProbInfo frame_probs;
2651
2658 int valid_gm_model_found[FRAME_UPDATE_TYPES];
2659} AV1_PRIMARY;
2660
// Main encoder context for one encoder instance. `ppi` points to the
// AV1_PRIMARY this instance belongs to; `common` embeds the AV1_COMMON codec
// state; `oxcf` is the encoder configuration. Most remaining members are
// per-frame working state, speed features, rate control and optional
// statistics guarded by CONFIG_* macros. Members that are pointers are
// allocated and released outside this header.
2664typedef struct AV1_COMP {
2668 AV1_PRIMARY *ppi;
2669
2674 EncQuantDequantParams enc_quant_dequant_params;
2675
2679 ThreadData td;
2680
2684 FRAME_COUNTS counts;
2685
2689 MBMIExtFrameBufferInfo mbmi_ext_info;
2690
2696 CB_COEFF_BUFFER *coeff_buffer_base;
2697
2702 CoeffBufferPool coeff_buffer_pool;
2703
2707 AV1_COMMON common;
2708
2712 AV1EncoderConfig oxcf;
2713
2718 TRELLIS_OPT_TYPE optimize_seg_arr[MAX_SEGMENTS];
2719
// Source-frame buffers. Members declared as pointers refer to buffers stored
// elsewhere; the `scaled_*` and `orig_source` members are embedded buffers.
2725 YV12_BUFFER_CONFIG *source;
2726
2734 YV12_BUFFER_CONFIG *last_source;
2735
2740 YV12_BUFFER_CONFIG *unscaled_source;
2741
2745 YV12_BUFFER_CONFIG scaled_source;
2746
2750 YV12_BUFFER_CONFIG *unscaled_last_source;
2751
2755 YV12_BUFFER_CONFIG scaled_last_source;
2756
2761 YV12_BUFFER_CONFIG *unfiltered_source;
2762
2767 YV12_BUFFER_CONFIG orig_source;
2768
2772 int skip_tpl_setup_stats;
2773
2782 double *tpl_rdmult_scaling_factors;
2783
2787 TemporalFilterCtx tf_ctx;
2788
2792 ForceIntegerMVInfo force_intpel_info;
2793
2798 RefCntBuffer *scaled_ref_buf[INTER_REFS_PER_FRAME];
2799
2803 RefCntBuffer *last_show_frame_buf;
2804
2808 RefreshFrameInfo refresh_frame;
2809
2813 ExternalFlags ext_flags;
2814
2819 YV12_BUFFER_CONFIG last_frame_uf;
2820
2825 YV12_BUFFER_CONFIG trial_frame_rst;
2826
2830 int64_t ambient_err;
2831
2835 RD_OPT rd;
2836
2841 CODING_CONTEXT coding_context;
2842
2846 GlobalMotionInfo gm_info;
2847
2851 WinnerModeParams winner_mode_params;
2852
2856 TimeStamps time_stamps;
2857
2861 RATE_CONTROL rc;
2862
2866 double framerate;
2867
2871 int ref_frame_flags;
2872
2876 int speed;
2877
2881 SPEED_FEATURES sf;
2882
2886 MotionVectorSearchParams mv_search_params;
2887
2892 int all_one_sided_refs;
2893
2897 EncSegmentationInfo enc_seg;
2898
2902 CYCLIC_REFRESH *cyclic_refresh;
2907 ActiveMap active_map;
2908
// Index of the current frame within ppi->gf_group (see frame_is_kf_gf_arf()
// and init_ref_map_pair(), which use it to index gf_group.update_type).
2912 unsigned char gf_frame_index;
2913
2914#if CONFIG_INTERNAL_STATS
2916 uint64_t time_compress_data;
2917
2918 unsigned int mode_chosen_counts[MAX_MODES];
2919 int bytes;
2920 unsigned int frame_recode_hits;
2922#endif
2923
2924#if CONFIG_SPEED_STATS
2928 unsigned int tx_search_count;
2929#endif // CONFIG_SPEED_STATS
2930
2935 int droppable;
2936
2940 FRAME_INFO frame_info;
2941
2945 FRAME_INDEX_SET frame_index_set;
2946
2950 InitialDimensions initial_dimensions;
2951
2958 int initial_mbs;
2959
2963 ResizePendingParams resize_pending_params;
2964
// Per-tile encoder data, indexed as tile_row * tile_cols + tile_col (see
// get_start_tok()), with the number of entries allocated.
2969 TileDataEnc *tile_data;
2973 int allocated_tiles;
2974
2978 TokenInfo token_info;
2979
2983 int vaq_refresh;
2984
2988 VarBasedPartitionInfo vbp_info;
2989
2993 int num_frame_recode;
2994
// Arrays below hold one entry per recode attempt (NUM_RECODES_PER_FRAME).
2998 FrameProbInfo frame_new_probs[NUM_RECODES_PER_FRAME];
2999
3003 int do_update_frame_probs_txtype[NUM_RECODES_PER_FRAME];
3004
3008 int do_update_frame_probs_obmc[NUM_RECODES_PER_FRAME];
3009
3013 int do_update_frame_probs_warp[NUM_RECODES_PER_FRAME];
3014
3018 int do_update_frame_probs_interpfilter[NUM_RECODES_PER_FRAME];
3019
3020#if CONFIG_FRAME_PARALLEL_ENCODE && CONFIG_FPMT_TEST
3025 double temp_framerate;
3026#endif
3032 double new_framerate;
3033
3037 int do_update_vbr_bits_off_target_fast;
3038
3042 MultiThreadInfo mt_info;
3043
3049 int existing_fb_idx_to_show;
3050
3054 int intrabc_used;
3055
3059 int prune_ref_frame_mask;
3060
3064 AV1LrStruct lr_ctxt;
3065
3069 aom_film_grain_table_t *film_grain_table;
3070
3071#if CONFIG_DENOISE
3076 struct aom_denoise_and_model_t *denoise_and_model;
3077#endif
3078
3082 InterpSearchFlags interp_search_flags;
3083
// Screen-content decisions; both are written by
// av1_set_screen_content_options() according to the comment on its prototype.
3091 int use_screen_content_tools;
3092
3099 int is_screen_content_type;
3100
3101#if CONFIG_COLLECT_PARTITION_STATS
3105 FramePartitionTimingStats partition_stats;
3106#endif // CONFIG_COLLECT_PARTITION_STATS
3107
3108#if CONFIG_COLLECT_COMPONENT_TIMING
// Timing tables indexed by TIMING_COMPONENT.
3112 uint64_t component_time[kTimingComponents];
3117 struct aom_usec_timer component_timer[kTimingComponents];
3121 uint64_t frame_component_time[kTimingComponents];
3122#endif
3123
3127 int frame_header_count;
3128
3132 int deltaq_used;
3133
3137 RefFrameDistanceInfo ref_frame_dist_info;
3138
3144 double *ssim_rdmult_scaling_factors;
3145
3146#if CONFIG_TUNE_VMAF
3150 TuneVMAFInfo vmaf_info;
3151#endif
3152
3153#if CONFIG_TUNE_BUTTERAUGLI
3157 TuneButteraugliInfo butteraugli_info;
3158#endif
3159
3163 SVC svc;
3164
3168 COMPRESSOR_STAGE compressor_stage;
3169
3174 FRAME_TYPE last_frame_type;
3175
3179 int num_tg;
3180
3186 aom_superres_mode superres_mode;
3187
3191 FirstPassData firstpass_data;
3192
3196 NOISE_ESTIMATE noise_estimate;
3197
3198#if CONFIG_AV1_TEMPORAL_DENOISING
3202 AV1_DENOISER denoiser;
3203#endif
3204
3209 uint8_t *consec_zero_mv;
3210
3214 BLOCK_SIZE fp_block_size;
3215
3220 int sb_counter;
3221
3225 size_t available_bs_size;
3226
3231 ExtPartController ext_part_controller;
3232
3237 MV_STATS mv_stats;
3238#if CONFIG_FRAME_PARALLEL_ENCODE && CONFIG_FRAME_PARALLEL_ENCODE_2
3242 int ref_refresh_index;
3243
3248 bool refresh_idx_available;
3249
3255 int ref_idx_to_skip;
3256#if CONFIG_FPMT_TEST
3263 int wanted_fb;
3264#endif
3265#endif // CONFIG_FRAME_PARALLEL_ENCODE && CONFIG_FRAME_PARALLEL_ENCODE_2
3266
3272 bool do_frame_data_update;
3273
3274#if CONFIG_RD_COMMAND
3278 RD_COMMAND rd_command;
3279#endif // CONFIG_RD_COMMAND
3280
3284 WeberStats *mb_weber_stats;
3285
3289 BLOCK_SIZE weber_bsize;
3290
3294 int64_t norm_wiener_variance;
3295
3299 int *mb_delta_q;
3300
3304 bool is_dropped_frame;
3305
3306#if CONFIG_BITRATE_ACCURACY
3310 VBR_RATECTRL_INFO vbr_rc_info;
3311#endif
3312
3313#if CONFIG_RATECTRL_LOG
3317 RATECTRL_LOG rc_log;
3318#endif // CONFIG_RATECTRL_LOG
3319
3323 TWO_PASS_FRAME twopass_frame;
3324
3328 THIRD_PASS_DEC_CTX *third_pass_ctx;
3329
3333 FILE *second_pass_log_stream;
3334
3338 uint64_t *src_sad_blk_64x64;
3339} AV1_COMP;
3340
// Input bundle for av1_encode(): the frame to encode, the previous source
// frame, and a duration value.
// NOTE(review): the unit of `ts_duration` is not visible here; presumably
// encoder ticks — confirm at the caller.
3344typedef struct EncodeFrameInput {
3346 YV12_BUFFER_CONFIG *source;
3347 YV12_BUFFER_CONFIG *last_source;
3348 int64_t ts_duration;
3350} EncodeFrameInput;
3351
// Per-frame coding decisions handed to av1_encode() alongside the input
// frame: frame type, reference handling, visibility and speed.
3356typedef struct EncodeFrameParams {
3360 int error_resilient_mode;
3364 FRAME_TYPE frame_type;
3365
3367 int primary_ref_frame;
3368 int order_offset;
3369
3374 int show_frame;
3375
// Bit mask selecting which reference slots are refreshed.
// NOTE(review): bit-to-slot mapping is defined elsewhere.
3377 int refresh_frame_flags;
3378
3379 int show_existing_frame;
3380 int existing_fb_idx_to_show;
3381
3386 int ref_frame_flags;
3387
3391 int remapped_ref_idx[REF_FRAMES];
3392
3397 RefreshFrameInfo refresh_frame;
3398
3402 int speed;
3403} EncodeFrameParams;
3404
3407// EncodeFrameResults contains information about the result of encoding a
3408// single frame
// It is the output parameter of av1_encode().
3409typedef struct {
3410 size_t size; // Size of resulting bitstream
3411} EncodeFrameResults;
3412
3413void av1_initialize_enc(unsigned int usage, enum aom_rc_mode end_usage);
3414
3415struct AV1_COMP *av1_create_compressor(AV1_PRIMARY *ppi,
3416 const AV1EncoderConfig *oxcf,
3417 BufferPool *const pool,
3418 COMPRESSOR_STAGE stage,
3419 int lap_lag_in_frames);
3420
3421struct AV1_PRIMARY *av1_create_primary_compressor(
3422 struct aom_codec_pkt_list *pkt_list_head, int num_lap_buffers,
3423 const AV1EncoderConfig *oxcf);
3424
3425void av1_remove_compressor(AV1_COMP *cpi);
3426
3427void av1_remove_primary_compressor(AV1_PRIMARY *ppi);
3428
3429#if CONFIG_ENTROPY_STATS
3430void print_entropy_stats(AV1_PRIMARY *const ppi);
3431#endif
3432#if CONFIG_INTERNAL_STATS
3433void print_internal_stats(AV1_PRIMARY *ppi);
3434#endif
3435
3436void av1_change_config_seq(AV1_PRIMARY *ppi, const AV1EncoderConfig *oxcf,
3437 bool *sb_size_changed);
3438
3439void av1_change_config(AV1_COMP *cpi, const AV1EncoderConfig *oxcf,
3440 bool sb_size_changed);
3441
3442void av1_check_initial_width(AV1_COMP *cpi, int use_highbitdepth,
3443 int subsampling_x, int subsampling_y);
3444
3445void av1_init_seq_coding_tools(AV1_PRIMARY *const ppi,
3446 const AV1EncoderConfig *oxcf, int use_svc);
3447
3448void av1_post_encode_updates(AV1_COMP *const cpi,
3449 const AV1_COMP_DATA *const cpi_data);
3450
3451#if CONFIG_FRAME_PARALLEL_ENCODE
3452void av1_scale_references_fpmt(AV1_COMP *cpi, int *ref_buffers_used_map);
3453
3454void av1_increment_scaled_ref_counts_fpmt(BufferPool *buffer_pool,
3455 int ref_buffers_used_map);
3456
3457void av1_release_scaled_references_fpmt(AV1_COMP *cpi);
3458
3459void av1_decrement_ref_counts_fpmt(BufferPool *buffer_pool,
3460 int ref_buffers_used_map);
3461
3462void av1_init_sc_decisions(AV1_PRIMARY *const ppi);
3463
3464AV1_COMP *av1_get_parallel_frame_enc_data(AV1_PRIMARY *const ppi,
3465 AV1_COMP_DATA *const first_cpi_data);
3466
3467int av1_init_parallel_frame_context(const AV1_COMP_DATA *const first_cpi_data,
3468 AV1_PRIMARY *const ppi,
3469 int *ref_buffers_used_map);
3470#endif // CONFIG_FRAME_PARALLEL_ENCODE
3471
3490int av1_receive_raw_frame(AV1_COMP *cpi, aom_enc_frame_flags_t frame_flags,
3491 YV12_BUFFER_CONFIG *sd, int64_t time_stamp,
3492 int64_t end_time_stamp);
3493
3513int av1_get_compressed_data(AV1_COMP *cpi, AV1_COMP_DATA *const cpi_data);
3514
3521int av1_encode(AV1_COMP *const cpi, uint8_t *const dest,
3522 const EncodeFrameInput *const frame_input,
3523 const EncodeFrameParams *const frame_params,
3524 EncodeFrameResults *const frame_results);
3525
3527int av1_get_preview_raw_frame(AV1_COMP *cpi, YV12_BUFFER_CONFIG *dest);
3528
3529int av1_get_last_show_frame(AV1_COMP *cpi, YV12_BUFFER_CONFIG *frame);
3530
3531aom_codec_err_t av1_copy_new_frame_enc(AV1_COMMON *cm,
3532 YV12_BUFFER_CONFIG *new_frame,
3533 YV12_BUFFER_CONFIG *sd);
3534
3535int av1_use_as_reference(int *ext_ref_frame_flags, int ref_frame_flags);
3536
3537int av1_copy_reference_enc(AV1_COMP *cpi, int idx, YV12_BUFFER_CONFIG *sd);
3538
3539int av1_set_reference_enc(AV1_COMP *cpi, int idx, YV12_BUFFER_CONFIG *sd);
3540
3541int av1_set_size_literal(AV1_COMP *cpi, int width, int height);
3542
3543void av1_set_frame_size(AV1_COMP *cpi, int width, int height);
3544
3545void av1_set_mv_search_params(AV1_COMP *cpi);
3546
3547int av1_set_active_map(AV1_COMP *cpi, unsigned char *map, int rows, int cols);
3548
3549int av1_get_active_map(AV1_COMP *cpi, unsigned char *map, int rows, int cols);
3550
3551int av1_set_internal_size(AV1EncoderConfig *const oxcf,
3552 ResizePendingParams *resize_pending_params,
3553 AOM_SCALING horiz_mode, AOM_SCALING vert_mode);
3554
3555int av1_get_quantizer(struct AV1_COMP *cpi);
3556
3557int av1_convert_sect5obus_to_annexb(uint8_t *buffer, size_t *input_size);
3558
3559// Set screen content options.
3560// This function estimates whether to use screen content tools, by counting
3561// the portion of blocks that have few luma colors.
3562// Modifies:
3563// cpi->common.features.allow_screen_content_tools
3564// cpi->common.features.allow_intrabc
3565// cpi->use_screen_content_tools
3566// cpi->is_screen_content_type
3567// However, the estimation is not accurate and may misclassify videos.
3568// A slower but more accurate approach that determines whether to use screen
3569// content tools is employed later. See av1_determine_sc_tools_with_encoding().
3570void av1_set_screen_content_options(struct AV1_COMP *cpi,
3571 FeatureFlags *features);
3572
3573void av1_update_frame_size(AV1_COMP *cpi);
3574
// Summary of one reference-map slot as produced by init_ref_map_pair():
// the buffer's pyramid level and display order. Both fields are set to -1 for
// a slot that is empty or that duplicates an earlier slot.
3575typedef struct {
3576 int pyr_level;
3577 int disp_order;
3578} RefFrameMapPair;
3579
3580static INLINE void init_ref_map_pair(
3581 AV1_COMP *cpi, RefFrameMapPair ref_frame_map_pairs[REF_FRAMES]) {
3582 if (cpi->ppi->gf_group.update_type[cpi->gf_frame_index] == KF_UPDATE) {
3583 memset(ref_frame_map_pairs, -1, sizeof(*ref_frame_map_pairs) * REF_FRAMES);
3584 return;
3585 }
3586 memset(ref_frame_map_pairs, 0, sizeof(*ref_frame_map_pairs) * REF_FRAMES);
3587 for (int map_idx = 0; map_idx < REF_FRAMES; map_idx++) {
3588 // Get reference frame buffer.
3589 const RefCntBuffer *const buf = cpi->common.ref_frame_map[map_idx];
3590 if (ref_frame_map_pairs[map_idx].disp_order == -1) continue;
3591 if (buf == NULL) {
3592 ref_frame_map_pairs[map_idx].disp_order = -1;
3593 ref_frame_map_pairs[map_idx].pyr_level = -1;
3594 continue;
3595 } else if (buf->ref_count > 1) {
3596 // Once the keyframe is coded, the slots in ref_frame_map will all
3597 // point to the same frame. In that case, all subsequent pointers
3598 // matching the current are considered "free" slots. This will find
3599 // the next occurrence of the current pointer if ref_count indicates
3600 // there are multiple instances of it and mark it as free.
3601 for (int idx2 = map_idx + 1; idx2 < REF_FRAMES; ++idx2) {
3602 const RefCntBuffer *const buf2 = cpi->common.ref_frame_map[idx2];
3603 if (buf2 == buf) {
3604 ref_frame_map_pairs[idx2].disp_order = -1;
3605 ref_frame_map_pairs[idx2].pyr_level = -1;
3606 }
3607 }
3608 }
3609 ref_frame_map_pairs[map_idx].disp_order = (int)buf->display_order_hint;
3610 ref_frame_map_pairs[map_idx].pyr_level = buf->pyramid_level;
3611 }
3612}
3613
3614#if CONFIG_FRAME_PARALLEL_ENCODE && CONFIG_FPMT_TEST
3615static AOM_INLINE void calc_frame_data_update_flag(
3616 GF_GROUP *const gf_group, int gf_frame_index,
3617 bool *const do_frame_data_update) {
3618 *do_frame_data_update = true;
3619 // Set the flag to false for all frames in a given parallel encode set except
3620 // the last frame in the set with frame_parallel_level = 2.
3621 if (gf_group->frame_parallel_level[gf_frame_index] == 1) {
3622 *do_frame_data_update = false;
3623 } else if (gf_group->frame_parallel_level[gf_frame_index] == 2) {
3624 // Check if this is the last frame in the set with frame_parallel_level = 2.
3625 for (int i = gf_frame_index + 1; i < gf_group->size; i++) {
3626 if ((gf_group->frame_parallel_level[i] == 0 &&
3627 (gf_group->update_type[i] == ARF_UPDATE ||
3628 gf_group->update_type[i] == INTNL_ARF_UPDATE)) ||
3629 gf_group->frame_parallel_level[i] == 1) {
3630 break;
3631 } else if (gf_group->frame_parallel_level[i] == 2) {
3632 *do_frame_data_update = false;
3633 break;
3634 }
3635 }
3636 }
3637}
3638#endif
3639
3640// av1 uses 10,000,000 ticks/second as time stamp
3641#define TICKS_PER_SEC 10000000LL
3642
3643static INLINE int64_t
3644timebase_units_to_ticks(const aom_rational64_t *timestamp_ratio, int64_t n) {
3645 return n * timestamp_ratio->num / timestamp_ratio->den;
3646}
3647
3648static INLINE int64_t
3649ticks_to_timebase_units(const aom_rational64_t *timestamp_ratio, int64_t n) {
3650 int64_t round = timestamp_ratio->num / 2;
3651 if (round > 0) --round;
3652 return (n * timestamp_ratio->den + round) / timestamp_ratio->num;
3653}
3654
3655static INLINE int frame_is_kf_gf_arf(const AV1_COMP *cpi) {
3656 const GF_GROUP *const gf_group = &cpi->ppi->gf_group;
3657 const FRAME_UPDATE_TYPE update_type =
3658 gf_group->update_type[cpi->gf_frame_index];
3659
3660 return frame_is_intra_only(&cpi->common) || update_type == ARF_UPDATE ||
3661 update_type == GF_UPDATE;
3662}
3663
3664// TODO(huisu@google.com, youzhou@microsoft.com): enable hash-me for HBD.
3665static INLINE int av1_use_hash_me(const AV1_COMP *const cpi) {
3666 return (cpi->common.features.allow_screen_content_tools &&
3667 cpi->common.features.allow_intrabc &&
3668 frame_is_intra_only(&cpi->common));
3669}
3670
3671static INLINE const YV12_BUFFER_CONFIG *get_ref_frame_yv12_buf(
3672 const AV1_COMMON *const cm, MV_REFERENCE_FRAME ref_frame) {
3673 const RefCntBuffer *const buf = get_ref_frame_buf(cm, ref_frame);
3674 return buf != NULL ? &buf->buf : NULL;
3675}
3676
3677static INLINE void alloc_frame_mvs(AV1_COMMON *const cm, RefCntBuffer *buf) {
3678 assert(buf != NULL);
3679 ensure_mv_buffer(buf, cm);
3680 buf->width = cm->width;
3681 buf->height = cm->height;
3682}
3683
3684// Get the allocated token size for a tile. It does the same calculation as in
3685// the frame token allocation.
3686static INLINE unsigned int allocated_tokens(const TileInfo *tile,
3687 int sb_size_log2, int num_planes) {
3688 int tile_mb_rows = (tile->mi_row_end - tile->mi_row_start + 2) >> 2;
3689 int tile_mb_cols = (tile->mi_col_end - tile->mi_col_start + 2) >> 2;
3690
3691 return get_token_alloc(tile_mb_rows, tile_mb_cols, sb_size_log2, num_planes);
3692}
3693
3694static INLINE void get_start_tok(AV1_COMP *cpi, int tile_row, int tile_col,
3695 int mi_row, TokenExtra **tok, int sb_size_log2,
3696 int num_planes) {
3697 AV1_COMMON *const cm = &cpi->common;
3698 const int tile_cols = cm->tiles.cols;
3699 TileDataEnc *this_tile = &cpi->tile_data[tile_row * tile_cols + tile_col];
3700 const TileInfo *const tile_info = &this_tile->tile_info;
3701
3702 const int tile_mb_cols =
3703 (tile_info->mi_col_end - tile_info->mi_col_start + 2) >> 2;
3704 const int tile_mb_row = (mi_row - tile_info->mi_row_start + 2) >> 2;
3705
3706 *tok = cpi->token_info.tile_tok[tile_row][tile_col] +
3707 get_token_alloc(tile_mb_row, tile_mb_cols, sb_size_log2, num_planes);
3708}
3709
3710void av1_apply_encoding_flags(AV1_COMP *cpi, aom_enc_frame_flags_t flags);
3711
// Minimum value of lag_in_frames for which alt-ref is considered enabled.
#define ALT_MIN_LAG 3
// Returns 1 when 'lag_in_frames' is at least ALT_MIN_LAG and automatic ARF
// is enabled, 0 otherwise.
static INLINE int is_altref_enabled(int lag_in_frames, bool enable_auto_arf) {
  if (lag_in_frames < ALT_MIN_LAG) return 0;
  return enable_auto_arf;
}
3716
3717static AOM_INLINE int can_disable_altref(const GFConfig *gf_cfg) {
3718 return is_altref_enabled(gf_cfg->lag_in_frames, gf_cfg->enable_auto_arf) &&
3719 (gf_cfg->gf_min_pyr_height == 0);
3720}
3721
// Returns how many blocks of size 'mb_length' are needed to span
// 'frame_length', i.e. frame_length / mb_length rounded up.
static INLINE int get_num_blocks(const int frame_length, const int mb_length) {
  const int padded_length = frame_length + mb_length - 1;
  return padded_length / mb_length;
}
3726
3727// Check if statistics generation stage
3728static INLINE int is_stat_generation_stage(const AV1_COMP *const cpi) {
3729 assert(IMPLIES(cpi->compressor_stage == LAP_STAGE,
3730 cpi->oxcf.pass == AOM_RC_ONE_PASS && cpi->ppi->lap_enabled));
3731 return (cpi->oxcf.pass == AOM_RC_FIRST_PASS ||
3732 (cpi->compressor_stage == LAP_STAGE));
3733}
3734// Check if statistics consumption stage
3735static INLINE int is_stat_consumption_stage_twopass(const AV1_COMP *const cpi) {
3736 return (cpi->oxcf.pass >= AOM_RC_SECOND_PASS);
3737}
3738
3739// Check if statistics consumption stage
3740static INLINE int is_stat_consumption_stage(const AV1_COMP *const cpi) {
3741 return (is_stat_consumption_stage_twopass(cpi) ||
3742 (cpi->oxcf.pass == AOM_RC_ONE_PASS &&
3743 (cpi->compressor_stage == ENCODE_STAGE) && cpi->ppi->lap_enabled));
3744}
3745
3746// Decide whether 'dv_costs' need to be allocated/stored during the encoding.
3747static AOM_INLINE bool av1_need_dv_costs(const AV1_COMP *const cpi) {
3748 return !cpi->sf.rt_sf.use_nonrd_pick_mode &&
3749 av1_allow_intrabc(&cpi->common) && !is_stat_generation_stage(cpi);
3750}
3751
3761static INLINE int has_no_stats_stage(const AV1_COMP *const cpi) {
3762 assert(
3763 IMPLIES(!cpi->ppi->lap_enabled, cpi->compressor_stage == ENCODE_STAGE));
3764 return (cpi->oxcf.pass == AOM_RC_ONE_PASS && !cpi->ppi->lap_enabled);
3765}
3766
3769static INLINE int is_one_pass_rt_params(const AV1_COMP *cpi) {
3770 return has_no_stats_stage(cpi) && cpi->oxcf.mode == REALTIME &&
3771 cpi->oxcf.gf_cfg.lag_in_frames == 0;
3772}
3773
// Returns the size of the frame stats buffer: 'num_lap_buffer' + 1 when
// look-ahead buffers are in use (num_lap_buffer > 0), otherwise
// 'num_lag_buffer'.
static INLINE int get_stats_buf_size(int num_lap_buffer, int num_lag_buffer) {
  if (num_lap_buffer > 0) {
    return num_lap_buffer + 1;
  }
  return num_lag_buffer;
}
3779
3780// TODO(zoeliu): To set up cpi->oxcf.gf_cfg.enable_auto_brf
3781
3782static INLINE void set_ref_ptrs(const AV1_COMMON *cm, MACROBLOCKD *xd,
3783 MV_REFERENCE_FRAME ref0,
3784 MV_REFERENCE_FRAME ref1) {
3786 get_ref_scale_factors_const(cm, ref0 >= LAST_FRAME ? ref0 : 1);
3788 get_ref_scale_factors_const(cm, ref1 >= LAST_FRAME ? ref1 : 1);
3789}
3790
// Returns the lowest bit of 'frame_index' (0 or 1), so the result alternates
// on consecutive frame indices.
static INLINE int get_chessboard_index(int frame_index) {
  const int lowest_bit_mask = 0x1;
  return frame_index & lowest_bit_mask;
}
3794
3795static INLINE const int *cond_cost_list_const(const struct AV1_COMP *cpi,
3796 const int *cost_list) {
3797 const int use_cost_list = cpi->sf.mv_sf.subpel_search_method != SUBPEL_TREE &&
3798 cpi->sf.mv_sf.use_fullpel_costlist;
3799 return use_cost_list ? cost_list : NULL;
3800}
3801
3802static INLINE int *cond_cost_list(const struct AV1_COMP *cpi, int *cost_list) {
3803 const int use_cost_list = cpi->sf.mv_sf.subpel_search_method != SUBPEL_TREE &&
3804 cpi->sf.mv_sf.use_fullpel_costlist;
3805 return use_cost_list ? cost_list : NULL;
3806}
3807
3808// Compression ratio of current frame.
3809double av1_get_compression_ratio(const AV1_COMMON *const cm,
3810 size_t encoded_frame_size);
3811
3812void av1_new_framerate(AV1_COMP *cpi, double framerate);
3813
3814void av1_setup_frame_size(AV1_COMP *cpi);
3815
3816#define LAYER_IDS_TO_IDX(sl, tl, num_tl) ((sl) * (num_tl) + (tl))
3817
3818// Returns 1 if a frame is scaled and 0 otherwise.
3819static INLINE int av1_resize_scaled(const AV1_COMMON *cm) {
3820 return !(cm->superres_upscaled_width == cm->render_width &&
3822}
3823
3824static INLINE int av1_frame_scaled(const AV1_COMMON *cm) {
3825 return !av1_superres_scaled(cm) && av1_resize_scaled(cm);
3826}
3827
3828// Don't allow a show_existing_frame to coincide with an error resilient
3829// frame. An exception can be made for a forward keyframe since it has no
3830// previous dependencies.
3831static INLINE int encode_show_existing_frame(const AV1_COMMON *cm) {
3833 cm->current_frame.frame_type == KEY_FRAME);
3834}
3835
3836// Get index into the 'cpi->mbmi_ext_info.frame_base' array for the given
3837// 'mi_row' and 'mi_col'.
3838static INLINE int get_mi_ext_idx(const int mi_row, const int mi_col,
3839 const BLOCK_SIZE mi_alloc_bsize,
3840 const int mbmi_ext_stride) {
3841 const int mi_ext_size_1d = mi_size_wide[mi_alloc_bsize];
3842 const int mi_ext_row = mi_row / mi_ext_size_1d;
3843 const int mi_ext_col = mi_col / mi_ext_size_1d;
3844 return mi_ext_row * mbmi_ext_stride + mi_ext_col;
3845}
3846
3847// Lighter version of set_offsets that only sets the mode info
3848// pointers.
3849static INLINE void set_mode_info_offsets(
3850 const CommonModeInfoParams *const mi_params,
3851 const MBMIExtFrameBufferInfo *const mbmi_ext_info, MACROBLOCK *const x,
3852 MACROBLOCKD *const xd, int mi_row, int mi_col) {
3853 set_mi_offsets(mi_params, xd, mi_row, mi_col);
3854 const int ext_idx = get_mi_ext_idx(mi_row, mi_col, mi_params->mi_alloc_bsize,
3855 mbmi_ext_info->stride);
3856 x->mbmi_ext_frame = mbmi_ext_info->frame_base + ext_idx;
3857}
3858
3859// Check to see if the given partition size is allowed for a specified number
3860// of mi block rows and columns remaining in the image.
3861// If not then return the largest allowed partition size
3862static INLINE BLOCK_SIZE find_partition_size(BLOCK_SIZE bsize, int rows_left,
3863 int cols_left, int *bh, int *bw) {
3864 int int_size = (int)bsize;
3865 if (rows_left <= 0 || cols_left <= 0) {
3866 return AOMMIN(bsize, BLOCK_8X8);
3867 } else {
3868 for (; int_size > 0; int_size -= 3) {
3869 *bh = mi_size_high[int_size];
3870 *bw = mi_size_wide[int_size];
3871 if ((*bh <= rows_left) && (*bw <= cols_left)) {
3872 break;
3873 }
3874 }
3875 }
3876 return (BLOCK_SIZE)int_size;
3877}
3878
3879static const uint8_t av1_ref_frame_flag_list[REF_FRAMES] = { 0,
3880 AOM_LAST_FLAG,
3881 AOM_LAST2_FLAG,
3882 AOM_LAST3_FLAG,
3883 AOM_GOLD_FLAG,
3884 AOM_BWD_FLAG,
3885 AOM_ALT2_FLAG,
3886 AOM_ALT_FLAG };
3887
3888// When more than 'max_allowed_refs' are available, we reduce the number of
3889// reference frames one at a time based on this order.
3890static const MV_REFERENCE_FRAME disable_order[] = {
3891 LAST3_FRAME,
3892 LAST2_FRAME,
3893 ALTREF2_FRAME,
3894 BWDREF_FRAME,
3895};
3896
3897static const MV_REFERENCE_FRAME
3898 ref_frame_priority_order[INTER_REFS_PER_FRAME] = {
3899 LAST_FRAME, ALTREF_FRAME, BWDREF_FRAME, GOLDEN_FRAME,
3900 ALTREF2_FRAME, LAST2_FRAME, LAST3_FRAME,
3901 };
3902
3903static INLINE int get_ref_frame_flags(const SPEED_FEATURES *const sf,
3904 const int use_one_pass_rt_params,
3905 const YV12_BUFFER_CONFIG **ref_frames,
3906 const int ext_ref_frame_flags) {
3907 // cpi->ext_flags.ref_frame_flags allows certain reference types to be
3908 // disabled by the external interface. These are set by
3909 // av1_apply_encoding_flags(). Start with what the external interface allows,
3910 // then suppress any reference types which we have found to be duplicates.
3911 int flags = ext_ref_frame_flags;
3912
3913 for (int i = 1; i < INTER_REFS_PER_FRAME; ++i) {
3914 const YV12_BUFFER_CONFIG *const this_ref = ref_frames[i];
3915 // If this_ref has appeared before, mark the corresponding ref frame as
3916 // invalid. For one_pass_rt mode, only disable GOLDEN_FRAME if it's the
3917 // same as LAST_FRAME or ALTREF_FRAME (if ALTREF is being used in nonrd).
3918 int index =
3919 (use_one_pass_rt_params && ref_frame_priority_order[i] == GOLDEN_FRAME)
3920 ? (1 + sf->rt_sf.use_nonrd_altref_frame)
3921 : i;
3922 for (int j = 0; j < index; ++j) {
3923 // If this_ref has appeared before (same as the reference corresponding
3924 // to lower index j), remove it as a reference only if that reference
3925 // (for index j) is actually used as a reference.
3926 if (this_ref == ref_frames[j] &&
3927 (flags & (1 << (ref_frame_priority_order[j] - 1)))) {
3928 flags &= ~(1 << (ref_frame_priority_order[i] - 1));
3929 break;
3930 }
3931 }
3932 }
3933 return flags;
3934}
3935
3936// Returns a Sequence Header OBU stored in an aom_fixed_buf_t, or NULL upon
3937// failure. When a non-NULL aom_fixed_buf_t pointer is returned by this
3938// function, the memory must be freed by the caller. Both the buf member of the
3939// aom_fixed_buf_t, and the aom_fixed_buf_t pointer itself must be freed. Memory
3940// returned must be freed via call to free().
3941//
3942// Note: The OBU returned is in Low Overhead Bitstream Format. Specifically,
3943// the obu_has_size_field bit is set, and the buffer contains the obu_size
3944// field.
3945aom_fixed_buf_t *av1_get_global_headers(AV1_PRIMARY *ppi);
3946
3947#define MAX_GFUBOOST_FACTOR 10.0
3948#define MIN_GFUBOOST_FACTOR 4.0
3949
3950static INLINE int is_frame_tpl_eligible(const GF_GROUP *const gf_group,
3951 uint8_t index) {
3952 const FRAME_UPDATE_TYPE update_type = gf_group->update_type[index];
3953 return update_type == ARF_UPDATE || update_type == GF_UPDATE ||
3954 update_type == KF_UPDATE;
3955}
3956
3957static INLINE int is_frame_eligible_for_ref_pruning(const GF_GROUP *gf_group,
3958 int selective_ref_frame,
3959 int prune_ref_frames,
3960 int gf_index) {
3961 return (selective_ref_frame > 0) && (prune_ref_frames > 0) &&
3962 !is_frame_tpl_eligible(gf_group, gf_index);
3963}
3964
3965// Get update type of the current frame.
3966static INLINE FRAME_UPDATE_TYPE get_frame_update_type(const GF_GROUP *gf_group,
3967 int gf_frame_index) {
3968 return gf_group->update_type[gf_frame_index];
3969}
3970
3971static INLINE int av1_pixels_to_mi(int pixels) {
3972 return ALIGN_POWER_OF_TWO(pixels, 3) >> MI_SIZE_LOG2;
3973}
3974
3975static AOM_INLINE int is_psnr_calc_enabled(const AV1_COMP *cpi) {
3976 const AV1_COMMON *const cm = &cpi->common;
3977
3978 return cpi->ppi->b_calculate_psnr && !is_stat_generation_stage(cpi) &&
3979 cm->show_frame;
3980}
3981
3982static INLINE int is_frame_resize_pending(AV1_COMP *const cpi) {
3983 ResizePendingParams *const resize_pending_params =
3984 &cpi->resize_pending_params;
3985 return (resize_pending_params->width && resize_pending_params->height &&
3986 (cpi->common.width != resize_pending_params->width ||
3987 cpi->common.height != resize_pending_params->height));
3988}
3989
3990// Check if loop restoration filter is used.
3991static INLINE int is_restoration_used(const AV1_COMMON *const cm) {
3992 return cm->seq_params->enable_restoration && !cm->features.all_lossless &&
3993 !cm->tiles.large_scale;
3994}
3995
3996static INLINE int is_inter_tx_size_search_level_one(
3997 const TX_SPEED_FEATURES *tx_sf) {
3998 return (tx_sf->inter_tx_size_search_init_depth_rect >= 1 &&
3999 tx_sf->inter_tx_size_search_init_depth_sqr >= 1);
4000}
4001
4002#if CONFIG_AV1_TEMPORAL_DENOISING
4003static INLINE int denoise_svc(const struct AV1_COMP *const cpi) {
4004 return (!cpi->ppi->use_svc ||
4005 (cpi->ppi->use_svc &&
4006 cpi->svc.spatial_layer_id >= cpi->svc.first_layer_denoise));
4007}
4008#endif
4009
4010#if CONFIG_COLLECT_PARTITION_STATS == 2
4011static INLINE void av1_print_fr_partition_timing_stats(
4012 const FramePartitionTimingStats *part_stats, const char *filename) {
4013 FILE *f = fopen(filename, "w");
4014 if (!f) {
4015 return;
4016 }
4017
4018 fprintf(f, "bsize,redo,");
4019 for (int part = 0; part < EXT_PARTITION_TYPES; part++) {
4020 fprintf(f, "decision_%d,", part);
4021 }
4022 for (int part = 0; part < EXT_PARTITION_TYPES; part++) {
4023 fprintf(f, "attempt_%d,", part);
4024 }
4025 for (int part = 0; part < EXT_PARTITION_TYPES; part++) {
4026 fprintf(f, "time_%d,", part);
4027 }
4028 fprintf(f, "\n");
4029
4030 static const int bsizes[6] = { 128, 64, 32, 16, 8, 4 };
4031
4032 for (int bsize_idx = 0; bsize_idx < 6; bsize_idx++) {
4033 fprintf(f, "%d,%d,", bsizes[bsize_idx], part_stats->partition_redo);
4034 for (int part = 0; part < EXT_PARTITION_TYPES; part++) {
4035 fprintf(f, "%d,", part_stats->partition_decisions[bsize_idx][part]);
4036 }
4037 for (int part = 0; part < EXT_PARTITION_TYPES; part++) {
4038 fprintf(f, "%d,", part_stats->partition_attempts[bsize_idx][part]);
4039 }
4040 for (int part = 0; part < EXT_PARTITION_TYPES; part++) {
4041 fprintf(f, "%ld,", part_stats->partition_times[bsize_idx][part]);
4042 }
4043 fprintf(f, "\n");
4044 }
4045 fclose(f);
4046}
4047#endif // CONFIG_COLLECT_PARTITION_STATS == 2
4048
4049#if CONFIG_COLLECT_PARTITION_STATS
4050static INLINE int av1_get_bsize_idx_for_part_stats(BLOCK_SIZE bsize) {
4051 assert(bsize == BLOCK_128X128 || bsize == BLOCK_64X64 ||
4052 bsize == BLOCK_32X32 || bsize == BLOCK_16X16 || bsize == BLOCK_8X8 ||
4053 bsize == BLOCK_4X4);
4054 switch (bsize) {
4055 case BLOCK_128X128: return 0;
4056 case BLOCK_64X64: return 1;
4057 case BLOCK_32X32: return 2;
4058 case BLOCK_16X16: return 3;
4059 case BLOCK_8X8: return 4;
4060 case BLOCK_4X4: return 5;
4061 default: assert(0 && "Invalid bsize for partition_stats."); return -1;
4062 }
4063}
4064#endif // CONFIG_COLLECT_PARTITION_STATS
4065
4066#if CONFIG_COLLECT_COMPONENT_TIMING
4067static INLINE void start_timing(AV1_COMP *cpi, int component) {
4068 aom_usec_timer_start(&cpi->component_timer[component]);
4069}
4070static INLINE void end_timing(AV1_COMP *cpi, int component) {
4071 aom_usec_timer_mark(&cpi->component_timer[component]);
4072 cpi->frame_component_time[component] +=
4073 aom_usec_timer_elapsed(&cpi->component_timer[component]);
4074}
// Returns the printable name for frame type values 0..3. Any other value
// trips an assert; without asserts the string "error" is returned.
static INLINE char const *get_frame_type_enum(int type) {
  static const char *const frame_type_names[] = {
    "KEY_FRAME",
    "INTER_FRAME",
    "INTRA_ONLY_FRAME",
    "S_FRAME",
  };
  if (type >= 0 && type <= 3) return frame_type_names[type];

  assert(0);
  return "error";
}
4085#endif
4086
4089#ifdef __cplusplus
4090} // extern "C"
4091#endif
4092
4093#endif // AOM_AV1_ENCODER_ENCODER_H_
enum aom_chroma_sample_position aom_chroma_sample_position_t
List of chroma sample positions.
enum aom_transfer_characteristics aom_transfer_characteristics_t
List of supported transfer functions.
enum aom_color_range aom_color_range_t
List of supported color range.
enum aom_color_primaries aom_color_primaries_t
List of supported color primaries.
enum aom_matrix_coefficients aom_matrix_coefficients_t
List of supported matrix coefficients.
Provides definitions for using AOM or AV1 encoder algorithm within the aom Codec Interface.
@ RESTORE_SWITCHABLE_TYPES
Definition: enums.h:602
aom_dist_metric
Distortion metric to use for RD optimization.
Definition: aomcx.h:1557
aom_tune_content
Definition: aomcx.h:1519
aom_tune_metric
Model tuning parameters.
Definition: aomcx.h:1538
enum aom_bit_depth aom_bit_depth_t
Bit depth for codec. This enumeration determines the bit depth of the codec.
enum aom_superblock_size aom_superblock_size_t
Superblock size selection.
aom_codec_err_t
Algorithm return codes.
Definition: aom_codec.h:155
aom_superres_mode
Frame super-resolution mode.
Definition: aom_encoder.h:206
aom_rc_mode
Rate control mode.
Definition: aom_encoder.h:184
aom_enc_pass
Multi-pass Encoding Pass.
Definition: aom_encoder.h:175
long aom_enc_frame_flags_t
Encoded Frame Flags.
Definition: aom_encoder.h:376
@ AOM_RC_ONE_PASS
Definition: aom_encoder.h:176
@ AOM_RC_SECOND_PASS
Definition: aom_encoder.h:178
@ AOM_RC_FIRST_PASS
Definition: aom_encoder.h:177
Describes look ahead buffer operations.
Top level common structure used by both encoder and decoder.
Definition: av1_common_int.h:750
int superres_upscaled_width
Definition: av1_common_int.h:799
int superres_upscaled_height
Definition: av1_common_int.h:800
SequenceHeader * seq_params
Definition: av1_common_int.h:976
int width
Definition: av1_common_int.h:775
CurrentFrame current_frame
Definition: av1_common_int.h:754
int show_existing_frame
Definition: av1_common_int.h:900
FeatureFlags features
Definition: av1_common_int.h:905
int show_frame
Definition: av1_common_int.h:885
CommonTileParams tiles
Definition: av1_common_int.h:992
int height
Definition: av1_common_int.h:776
int render_width
Definition: av1_common_int.h:786
int render_height
Definition: av1_common_int.h:787
Stores the transforms coefficients for the whole superblock.
Definition: block.h:176
The structure of CYCLIC_REFRESH.
Definition: aq_cyclicrefresh.h:36
Parameters related to CDEF.
Definition: av1_common_int.h:196
Params related to MB_MODE_INFO arrays and related info.
Definition: av1_common_int.h:501
BLOCK_SIZE mi_alloc_bsize
Definition: av1_common_int.h:550
int cols
Definition: av1_common_int.h:428
unsigned int large_scale
Definition: av1_common_int.h:488
Contains buffers used by av1_compound_type_rd()
Definition: block.h:336
Frame level features.
Definition: av1_common_int.h:358
bool error_resilient_mode
Definition: av1_common_int.h:400
bool all_lossless
Definition: av1_common_int.h:389
Data related to the current GF/ARF group and the individual frames within the group.
Definition: firstpass.h:344
Stores best extended mode information at frame level.
Definition: block.h:212
Stores the prediction/txfm mode of the current coding block.
Definition: blockd.h:222
Contains buffers used to speed up rdopt for obmc.
Definition: block.h:299
Contains color maps used in palette mode.
Definition: block.h:324
Primary Rate Control parameters and status.
Definition: ratectrl.h:261
Rate Control parameters and status.
Definition: ratectrl.h:134
Top level speed vs quality trade off data structure.
Definition: speed_features.h:1528
REAL_TIME_SPEED_FEATURES rt_sf
Definition: speed_features.h:1597
The structure of SVC.
Definition: svc_layercontext.h:87
Temporal filter info for a gop.
Definition: temporal_filter.h:156
Frame level Two pass status and control data.
Definition: firstpass.h:455
Two pass status and control data.
Definition: firstpass.h:412
Parameters related to temporal filtering.
Definition: temporal_filter.h:93
Params related to temporal dependency model.
Definition: tpl_model.h:142
Generic fixed size buffer structure.
Definition: aom_encoder.h:87
Encoder's parameters related to the current coding block.
Definition: block.h:813
MB_MODE_INFO_EXT_FRAME * mbmi_ext_frame
Finalized mbmi_ext for the whole frame.
Definition: block.h:845
Variables related to current coding block.
Definition: blockd.h:577
const struct scale_factors * block_ref_scale_factors[2]
Definition: blockd.h:694
YV12 frame buffer data structure.
Definition: yv12config.h:39