1 /*
2 * Copyright (c) 2020, Alliance for Open Media. All rights reserved.
3 *
4 * This source code is subject to the terms of the BSD 2 Clause License and
5 * the Alliance for Open Media Patent License 1.0. If the BSD 2 Clause License
6 * was not distributed with this source code in the LICENSE file, you can
7 * obtain it at www.aomedia.org/license/software. If the Alliance for Open
8 * Media Patent License 1.0 was not distributed with this source code in the
9 * PATENTS file, you can obtain it at www.aomedia.org/license/patent.
10 */
11
12 #include <string.h>
13
14 #include "aom/aomcx.h"
15
16 #include "av1/common/av1_common_int.h"
17 #include "av1/encoder/bitstream.h"
18 #include "av1/encoder/encodeframe.h"
19 #include "av1/encoder/encoder.h"
20 #include "av1/encoder/encoder_alloc.h"
21 #include "av1/encoder/encodetxb.h"
22 #include "av1/encoder/encoder_utils.h"
23 #include "av1/encoder/grain_test_vectors.h"
24 #include "av1/encoder/mv_prec.h"
25 #include "av1/encoder/rc_utils.h"
26 #include "av1/encoder/rdopt.h"
27 #include "av1/encoder/segmentation.h"
28 #include "av1/encoder/superres_scale.h"
29 #include "av1/encoder/tpl_model.h"
30 #include "av1/encoder/var_based_part.h"
31
32 #if CONFIG_TUNE_VMAF
33 #include "av1/encoder/tune_vmaf.h"
34 #endif
35
36 #define MIN_BOOST_COMBINE_FACTOR 4.0
37 #define MAX_BOOST_COMBINE_FACTOR 12.0
38
39 const int default_tx_type_probs[FRAME_UPDATE_TYPES][TX_SIZES_ALL][TX_TYPES] = {
40 { { 221, 189, 214, 292, 0, 0, 0, 0, 0, 2, 38, 68, 0, 0, 0, 0 },
41 { 262, 203, 216, 239, 0, 0, 0, 0, 0, 1, 37, 66, 0, 0, 0, 0 },
42 { 315, 231, 239, 226, 0, 0, 0, 0, 0, 13, 0, 0, 0, 0, 0, 0 },
43 { 1024, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0 },
44 { 1024, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0 },
45 { 222, 188, 214, 287, 0, 0, 0, 0, 0, 2, 50, 61, 0, 0, 0, 0 },
46 { 256, 182, 205, 282, 0, 0, 0, 0, 0, 2, 21, 76, 0, 0, 0, 0 },
47 { 281, 214, 217, 222, 0, 0, 0, 0, 0, 1, 48, 41, 0, 0, 0, 0 },
48 { 263, 194, 225, 225, 0, 0, 0, 0, 0, 2, 15, 100, 0, 0, 0, 0 },
49 { 1024, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0 },
50 { 1024, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0 },
51 { 1024, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0 },
52 { 1024, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0 },
53 { 170, 192, 242, 293, 0, 0, 0, 0, 0, 1, 68, 58, 0, 0, 0, 0 },
54 { 199, 210, 213, 291, 0, 0, 0, 0, 0, 1, 14, 96, 0, 0, 0, 0 },
55 { 1024, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0 },
56 { 1024, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0 },
57 { 1024, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0 },
58 { 1024, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0 } },
59 { { 106, 69, 107, 278, 9, 15, 20, 45, 49, 23, 23, 88, 36, 74, 25, 57 },
60 { 105, 72, 81, 98, 45, 49, 47, 50, 56, 72, 30, 81, 33, 95, 27, 83 },
61 { 211, 105, 109, 120, 57, 62, 43, 49, 52, 58, 42, 116, 0, 0, 0, 0 },
62 { 1008, 0, 0, 0, 0, 0, 0, 0, 0, 16, 0, 0, 0, 0, 0, 0 },
63 { 1024, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0 },
64 { 131, 57, 98, 172, 19, 40, 37, 64, 69, 22, 41, 52, 51, 77, 35, 59 },
65 { 176, 83, 93, 202, 22, 24, 28, 47, 50, 16, 12, 93, 26, 76, 17, 59 },
66 { 136, 72, 89, 95, 46, 59, 47, 56, 61, 68, 35, 51, 32, 82, 26, 69 },
67 { 122, 80, 87, 105, 49, 47, 46, 46, 57, 52, 13, 90, 19, 103, 15, 93 },
68 { 1009, 0, 0, 0, 0, 0, 0, 0, 0, 15, 0, 0, 0, 0, 0, 0 },
69 { 1011, 0, 0, 0, 0, 0, 0, 0, 0, 13, 0, 0, 0, 0, 0, 0 },
70 { 1024, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0 },
71 { 1024, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0 },
72 { 202, 20, 84, 114, 14, 60, 41, 79, 99, 21, 41, 15, 50, 84, 34, 66 },
73 { 196, 44, 23, 72, 30, 22, 28, 57, 67, 13, 4, 165, 15, 148, 9, 131 },
74 { 882, 0, 0, 0, 0, 0, 0, 0, 0, 142, 0, 0, 0, 0, 0, 0 },
75 { 840, 0, 0, 0, 0, 0, 0, 0, 0, 184, 0, 0, 0, 0, 0, 0 },
76 { 1024, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0 },
77 { 1024, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0 } },
78 { { 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64 },
79 { 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64 },
80 { 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64 },
81 { 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64 },
82 { 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64 },
83 { 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64 },
84 { 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64 },
85 { 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64 },
86 { 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64 },
87 { 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64 },
88 { 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64 },
89 { 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64 },
90 { 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64 },
91 { 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64 },
92 { 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64 },
93 { 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64 },
94 { 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64 },
95 { 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64 },
96 { 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64 } },
97 { { 213, 110, 141, 269, 12, 16, 15, 19, 21, 11, 38, 68, 22, 29, 16, 24 },
98 { 216, 119, 128, 143, 38, 41, 26, 30, 31, 30, 42, 70, 23, 36, 19, 32 },
99 { 367, 149, 154, 154, 38, 35, 17, 21, 21, 10, 22, 36, 0, 0, 0, 0 },
100 { 1022, 0, 0, 0, 0, 0, 0, 0, 0, 2, 0, 0, 0, 0, 0, 0 },
101 { 1024, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0 },
102 { 219, 96, 127, 191, 21, 40, 25, 32, 34, 18, 45, 45, 33, 39, 26, 33 },
103 { 296, 99, 122, 198, 23, 21, 19, 24, 25, 13, 20, 64, 23, 32, 18, 27 },
104 { 275, 128, 142, 143, 35, 48, 23, 30, 29, 18, 42, 36, 18, 23, 14, 20 },
105 { 239, 132, 166, 175, 36, 27, 19, 21, 24, 14, 13, 85, 9, 31, 8, 25 },
106 { 1022, 0, 0, 0, 0, 0, 0, 0, 0, 2, 0, 0, 0, 0, 0, 0 },
107 { 1022, 0, 0, 0, 0, 0, 0, 0, 0, 2, 0, 0, 0, 0, 0, 0 },
108 { 1024, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0 },
109 { 1024, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0 },
110 { 309, 25, 79, 59, 25, 80, 34, 53, 61, 25, 49, 23, 43, 64, 36, 59 },
111 { 270, 57, 40, 54, 50, 42, 41, 53, 56, 28, 17, 81, 45, 86, 34, 70 },
112 { 1005, 0, 0, 0, 0, 0, 0, 0, 0, 19, 0, 0, 0, 0, 0, 0 },
113 { 992, 0, 0, 0, 0, 0, 0, 0, 0, 32, 0, 0, 0, 0, 0, 0 },
114 { 1024, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0 },
115 { 1024, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0 } },
116 { { 133, 63, 55, 83, 57, 87, 58, 72, 68, 16, 24, 35, 29, 105, 25, 114 },
117 { 131, 75, 74, 60, 71, 77, 65, 66, 73, 33, 21, 79, 20, 83, 18, 78 },
118 { 276, 95, 82, 58, 86, 93, 63, 60, 64, 17, 38, 92, 0, 0, 0, 0 },
119 { 1006, 0, 0, 0, 0, 0, 0, 0, 0, 18, 0, 0, 0, 0, 0, 0 },
120 { 1024, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0 },
121 { 147, 49, 75, 78, 50, 97, 60, 67, 76, 17, 42, 35, 31, 93, 27, 80 },
122 { 157, 49, 58, 75, 61, 52, 56, 67, 69, 12, 15, 79, 24, 119, 11, 120 },
123 { 178, 69, 83, 77, 69, 85, 72, 77, 77, 20, 35, 40, 25, 48, 23, 46 },
124 { 174, 55, 64, 57, 73, 68, 62, 61, 75, 15, 12, 90, 17, 99, 16, 86 },
125 { 1008, 0, 0, 0, 0, 0, 0, 0, 0, 16, 0, 0, 0, 0, 0, 0 },
126 { 1018, 0, 0, 0, 0, 0, 0, 0, 0, 6, 0, 0, 0, 0, 0, 0 },
127 { 1024, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0 },
128 { 1024, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0 },
129 { 266, 31, 63, 64, 21, 52, 39, 54, 63, 30, 52, 31, 48, 89, 46, 75 },
130 { 272, 26, 32, 44, 29, 31, 32, 53, 51, 13, 13, 88, 22, 153, 16, 149 },
131 { 923, 0, 0, 0, 0, 0, 0, 0, 0, 101, 0, 0, 0, 0, 0, 0 },
132 { 969, 0, 0, 0, 0, 0, 0, 0, 0, 55, 0, 0, 0, 0, 0, 0 },
133 { 1024, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0 },
134 { 1024, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0 } },
135 { { 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64 },
136 { 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64 },
137 { 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64 },
138 { 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64 },
139 { 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64 },
140 { 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64 },
141 { 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64 },
142 { 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64 },
143 { 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64 },
144 { 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64 },
145 { 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64 },
146 { 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64 },
147 { 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64 },
148 { 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64 },
149 { 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64 },
150 { 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64 },
151 { 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64 },
152 { 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64 },
153 { 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64 } },
154 { { 158, 92, 125, 298, 12, 15, 20, 29, 31, 12, 29, 67, 34, 44, 23, 35 },
155 { 147, 94, 103, 123, 45, 48, 38, 41, 46, 48, 37, 78, 33, 63, 27, 53 },
156 { 268, 126, 125, 136, 54, 53, 31, 38, 38, 33, 35, 87, 0, 0, 0, 0 },
157 { 1018, 0, 0, 0, 0, 0, 0, 0, 0, 6, 0, 0, 0, 0, 0, 0 },
158 { 1024, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0 },
159 { 159, 72, 103, 194, 20, 35, 37, 50, 56, 21, 39, 40, 51, 61, 38, 48 },
160 { 259, 86, 95, 188, 32, 20, 25, 34, 37, 13, 12, 85, 25, 53, 17, 43 },
161 { 189, 99, 113, 123, 45, 59, 37, 46, 48, 44, 39, 41, 31, 47, 26, 37 },
162 { 175, 110, 113, 128, 58, 38, 33, 33, 43, 29, 13, 100, 14, 68, 12, 57 },
163 { 1017, 0, 0, 0, 0, 0, 0, 0, 0, 7, 0, 0, 0, 0, 0, 0 },
164 { 1019, 0, 0, 0, 0, 0, 0, 0, 0, 5, 0, 0, 0, 0, 0, 0 },
165 { 1024, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0 },
166 { 1024, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0 },
167 { 208, 22, 84, 101, 21, 59, 44, 70, 90, 25, 59, 13, 64, 67, 49, 48 },
168 { 277, 52, 32, 63, 43, 26, 33, 48, 54, 11, 6, 130, 18, 119, 11, 101 },
169 { 963, 0, 0, 0, 0, 0, 0, 0, 0, 61, 0, 0, 0, 0, 0, 0 },
170 { 979, 0, 0, 0, 0, 0, 0, 0, 0, 45, 0, 0, 0, 0, 0, 0 },
171 { 1024, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0 },
172 { 1024, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0 } }
173 };
174
175 const int default_obmc_probs[FRAME_UPDATE_TYPES][BLOCK_SIZES_ALL] = {
176 { 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0 },
177 { 0, 0, 0, 106, 90, 90, 97, 67, 59, 70, 28,
178 30, 38, 16, 16, 16, 0, 0, 44, 50, 26, 25 },
179 { 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0 },
180 { 0, 0, 0, 98, 93, 97, 68, 82, 85, 33, 30,
181 33, 16, 16, 16, 16, 0, 0, 43, 37, 26, 16 },
182 { 0, 0, 0, 91, 80, 76, 78, 55, 49, 24, 16,
183 16, 16, 16, 16, 16, 0, 0, 29, 45, 16, 38 },
184 { 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0 },
185 { 0, 0, 0, 103, 89, 89, 89, 62, 63, 76, 34,
186 35, 32, 19, 16, 16, 0, 0, 49, 55, 29, 19 }
187 };
188
189 const int default_warped_probs[FRAME_UPDATE_TYPES] = { 64, 64, 64, 64,
190 64, 64, 64 };
191
192 // TODO(yunqing): the default probs can be trained later from better
193 // performance.
194 const int default_switchable_interp_probs[FRAME_UPDATE_TYPES]
195 [SWITCHABLE_FILTER_CONTEXTS]
196 [SWITCHABLE_FILTERS] = {
197 { { 512, 512, 512 },
198 { 512, 512, 512 },
199 { 512, 512, 512 },
200 { 512, 512, 512 },
201 { 512, 512, 512 },
202 { 512, 512, 512 },
203 { 512, 512, 512 },
204 { 512, 512, 512 },
205 { 512, 512, 512 },
206 { 512, 512, 512 },
207 { 512, 512, 512 },
208 { 512, 512, 512 },
209 { 512, 512, 512 },
210 { 512, 512, 512 },
211 { 512, 512, 512 },
212 { 512, 512, 512 } },
213 { { 512, 512, 512 },
214 { 512, 512, 512 },
215 { 512, 512, 512 },
216 { 512, 512, 512 },
217 { 512, 512, 512 },
218 { 512, 512, 512 },
219 { 512, 512, 512 },
220 { 512, 512, 512 },
221 { 512, 512, 512 },
222 { 512, 512, 512 },
223 { 512, 512, 512 },
224 { 512, 512, 512 },
225 { 512, 512, 512 },
226 { 512, 512, 512 },
227 { 512, 512, 512 },
228 { 512, 512, 512 } },
229 { { 512, 512, 512 },
230 { 512, 512, 512 },
231 { 512, 512, 512 },
232 { 512, 512, 512 },
233 { 512, 512, 512 },
234 { 512, 512, 512 },
235 { 512, 512, 512 },
236 { 512, 512, 512 },
237 { 512, 512, 512 },
238 { 512, 512, 512 },
239 { 512, 512, 512 },
240 { 512, 512, 512 },
241 { 512, 512, 512 },
242 { 512, 512, 512 },
243 { 512, 512, 512 },
244 { 512, 512, 512 } },
245 { { 512, 512, 512 },
246 { 512, 512, 512 },
247 { 512, 512, 512 },
248 { 512, 512, 512 },
249 { 512, 512, 512 },
250 { 512, 512, 512 },
251 { 512, 512, 512 },
252 { 512, 512, 512 },
253 { 512, 512, 512 },
254 { 512, 512, 512 },
255 { 512, 512, 512 },
256 { 512, 512, 512 },
257 { 512, 512, 512 },
258 { 512, 512, 512 },
259 { 512, 512, 512 },
260 { 512, 512, 512 } },
261 { { 512, 512, 512 },
262 { 512, 512, 512 },
263 { 512, 512, 512 },
264 { 512, 512, 512 },
265 { 512, 512, 512 },
266 { 512, 512, 512 },
267 { 512, 512, 512 },
268 { 512, 512, 512 },
269 { 512, 512, 512 },
270 { 512, 512, 512 },
271 { 512, 512, 512 },
272 { 512, 512, 512 },
273 { 512, 512, 512 },
274 { 512, 512, 512 },
275 { 512, 512, 512 },
276 { 512, 512, 512 } },
277 { { 512, 512, 512 },
278 { 512, 512, 512 },
279 { 512, 512, 512 },
280 { 512, 512, 512 },
281 { 512, 512, 512 },
282 { 512, 512, 512 },
283 { 512, 512, 512 },
284 { 512, 512, 512 },
285 { 512, 512, 512 },
286 { 512, 512, 512 },
287 { 512, 512, 512 },
288 { 512, 512, 512 },
289 { 512, 512, 512 },
290 { 512, 512, 512 },
291 { 512, 512, 512 },
292 { 512, 512, 512 } },
293 { { 512, 512, 512 },
294 { 512, 512, 512 },
295 { 512, 512, 512 },
296 { 512, 512, 512 },
297 { 512, 512, 512 },
298 { 512, 512, 512 },
299 { 512, 512, 512 },
300 { 512, 512, 512 },
301 { 512, 512, 512 },
302 { 512, 512, 512 },
303 { 512, 512, 512 },
304 { 512, 512, 512 },
305 { 512, 512, 512 },
306 { 512, 512, 512 },
307 { 512, 512, 512 },
308 { 512, 512, 512 } }
309 };
310
configure_static_seg_features(AV1_COMP * cpi)311 static void configure_static_seg_features(AV1_COMP *cpi) {
312 AV1_COMMON *const cm = &cpi->common;
313 const RATE_CONTROL *const rc = &cpi->rc;
314 struct segmentation *const seg = &cm->seg;
315
316 double avg_q;
317 #if CONFIG_FPMT_TEST
318 avg_q = ((cpi->ppi->gf_group.frame_parallel_level[cpi->gf_frame_index] > 0) &&
319 (cpi->ppi->fpmt_unit_test_cfg == PARALLEL_SIMULATION_ENCODE))
320 ? cpi->ppi->p_rc.temp_avg_q
321 : cpi->ppi->p_rc.avg_q;
322 #else
323 avg_q = cpi->ppi->p_rc.avg_q;
324 #endif
325
326 int high_q = (int)(avg_q > 48.0);
327 int qi_delta;
328
329 // Disable and clear down for KF
330 if (cm->current_frame.frame_type == KEY_FRAME) {
331 // Clear down the global segmentation map
332 memset(cpi->enc_seg.map, 0, cm->mi_params.mi_rows * cm->mi_params.mi_cols);
333 seg->update_map = 0;
334 seg->update_data = 0;
335
336 // Disable segmentation
337 av1_disable_segmentation(seg);
338
339 // Clear down the segment features.
340 av1_clearall_segfeatures(seg);
341 } else if (cpi->refresh_frame.alt_ref_frame) {
342 // If this is an alt ref frame
343 // Clear down the global segmentation map
344 memset(cpi->enc_seg.map, 0, cm->mi_params.mi_rows * cm->mi_params.mi_cols);
345 seg->update_map = 0;
346 seg->update_data = 0;
347
348 // Disable segmentation and individual segment features by default
349 av1_disable_segmentation(seg);
350 av1_clearall_segfeatures(seg);
351
352 // If segmentation was enabled set those features needed for the
353 // arf itself.
354 if (seg->enabled) {
355 seg->update_map = 1;
356 seg->update_data = 1;
357
358 qi_delta = av1_compute_qdelta(rc, avg_q, avg_q * 0.875,
359 cm->seq_params->bit_depth);
360 av1_set_segdata(seg, 1, SEG_LVL_ALT_Q, qi_delta - 2);
361 av1_set_segdata(seg, 1, SEG_LVL_ALT_LF_Y_H, -2);
362 av1_set_segdata(seg, 1, SEG_LVL_ALT_LF_Y_V, -2);
363 av1_set_segdata(seg, 1, SEG_LVL_ALT_LF_U, -2);
364 av1_set_segdata(seg, 1, SEG_LVL_ALT_LF_V, -2);
365
366 av1_enable_segfeature(seg, 1, SEG_LVL_ALT_LF_Y_H);
367 av1_enable_segfeature(seg, 1, SEG_LVL_ALT_LF_Y_V);
368 av1_enable_segfeature(seg, 1, SEG_LVL_ALT_LF_U);
369 av1_enable_segfeature(seg, 1, SEG_LVL_ALT_LF_V);
370
371 av1_enable_segfeature(seg, 1, SEG_LVL_ALT_Q);
372 }
373 } else if (seg->enabled) {
374 // All other frames if segmentation has been enabled
375
376 // First normal frame in a valid gf or alt ref group
377 if (rc->frames_since_golden == 0) {
378 // Set up segment features for normal frames in an arf group
379 // Disable segmentation and clear down features if alt ref
380 // is not active for this group
381
382 av1_disable_segmentation(seg);
383
384 memset(cpi->enc_seg.map, 0,
385 cm->mi_params.mi_rows * cm->mi_params.mi_cols);
386
387 seg->update_map = 0;
388 seg->update_data = 0;
389
390 av1_clearall_segfeatures(seg);
391 } else if (rc->is_src_frame_alt_ref) {
392 // Special case where we are coding over the top of a previous
393 // alt ref frame.
394 // Segment coding disabled for compred testing
395
396 // Enable ref frame features for segment 0 as well
397 av1_enable_segfeature(seg, 0, SEG_LVL_REF_FRAME);
398 av1_enable_segfeature(seg, 1, SEG_LVL_REF_FRAME);
399
400 // All mbs should use ALTREF_FRAME
401 av1_clear_segdata(seg, 0, SEG_LVL_REF_FRAME);
402 av1_set_segdata(seg, 0, SEG_LVL_REF_FRAME, ALTREF_FRAME);
403 av1_clear_segdata(seg, 1, SEG_LVL_REF_FRAME);
404 av1_set_segdata(seg, 1, SEG_LVL_REF_FRAME, ALTREF_FRAME);
405
406 // Skip all MBs if high Q (0,0 mv and skip coeffs)
407 if (high_q) {
408 av1_enable_segfeature(seg, 0, SEG_LVL_SKIP);
409 av1_enable_segfeature(seg, 1, SEG_LVL_SKIP);
410 }
411 // Enable data update
412 seg->update_data = 1;
413 } else {
414 // All other frames.
415
416 // No updates.. leave things as they are.
417 seg->update_map = 0;
418 seg->update_data = 0;
419 }
420 }
421 }
422
av1_apply_active_map(AV1_COMP * cpi)423 void av1_apply_active_map(AV1_COMP *cpi) {
424 struct segmentation *const seg = &cpi->common.seg;
425 unsigned char *const seg_map = cpi->enc_seg.map;
426 const unsigned char *const active_map = cpi->active_map.map;
427
428 assert(AM_SEGMENT_ID_ACTIVE == CR_SEGMENT_ID_BASE);
429
430 // Disable the active_maps on intra_only frames or if the
431 // input map for the current frame has no inactive blocks.
432 if (frame_is_intra_only(&cpi->common) ||
433 cpi->rc.percent_blocks_inactive == 0) {
434 cpi->active_map.enabled = 0;
435 cpi->active_map.update = 1;
436 }
437
438 if (cpi->active_map.update) {
439 if (cpi->active_map.enabled) {
440 const int num_mis =
441 cpi->common.mi_params.mi_rows * cpi->common.mi_params.mi_cols;
442 memcpy(seg_map, active_map, sizeof(active_map[0]) * num_mis);
443 av1_enable_segmentation(seg);
444 av1_enable_segfeature(seg, AM_SEGMENT_ID_INACTIVE, SEG_LVL_SKIP);
445 av1_enable_segfeature(seg, AM_SEGMENT_ID_INACTIVE, SEG_LVL_ALT_LF_Y_H);
446 av1_enable_segfeature(seg, AM_SEGMENT_ID_INACTIVE, SEG_LVL_ALT_LF_Y_V);
447 av1_enable_segfeature(seg, AM_SEGMENT_ID_INACTIVE, SEG_LVL_ALT_LF_U);
448 av1_enable_segfeature(seg, AM_SEGMENT_ID_INACTIVE, SEG_LVL_ALT_LF_V);
449
450 av1_set_segdata(seg, AM_SEGMENT_ID_INACTIVE, SEG_LVL_ALT_LF_Y_H,
451 -MAX_LOOP_FILTER);
452 av1_set_segdata(seg, AM_SEGMENT_ID_INACTIVE, SEG_LVL_ALT_LF_Y_V,
453 -MAX_LOOP_FILTER);
454 av1_set_segdata(seg, AM_SEGMENT_ID_INACTIVE, SEG_LVL_ALT_LF_U,
455 -MAX_LOOP_FILTER);
456 av1_set_segdata(seg, AM_SEGMENT_ID_INACTIVE, SEG_LVL_ALT_LF_V,
457 -MAX_LOOP_FILTER);
458 } else {
459 av1_disable_segfeature(seg, AM_SEGMENT_ID_INACTIVE, SEG_LVL_SKIP);
460 av1_disable_segfeature(seg, AM_SEGMENT_ID_INACTIVE, SEG_LVL_ALT_LF_Y_H);
461 av1_disable_segfeature(seg, AM_SEGMENT_ID_INACTIVE, SEG_LVL_ALT_LF_Y_V);
462 av1_disable_segfeature(seg, AM_SEGMENT_ID_INACTIVE, SEG_LVL_ALT_LF_U);
463 av1_disable_segfeature(seg, AM_SEGMENT_ID_INACTIVE, SEG_LVL_ALT_LF_V);
464 if (seg->enabled) {
465 seg->update_data = 1;
466 seg->update_map = 1;
467 }
468 }
469 cpi->active_map.update = 0;
470 }
471 }
472
473 #if !CONFIG_REALTIME_ONLY
process_tpl_stats_frame(AV1_COMP * cpi)474 static void process_tpl_stats_frame(AV1_COMP *cpi) {
475 const GF_GROUP *const gf_group = &cpi->ppi->gf_group;
476 AV1_COMMON *const cm = &cpi->common;
477
478 assert(IMPLIES(gf_group->size > 0, cpi->gf_frame_index < gf_group->size));
479
480 const int tpl_idx = cpi->gf_frame_index;
481 TplParams *const tpl_data = &cpi->ppi->tpl_data;
482 TplDepFrame *tpl_frame = &tpl_data->tpl_frame[tpl_idx];
483 TplDepStats *tpl_stats = tpl_frame->tpl_stats_ptr;
484
485 if (tpl_frame->is_valid) {
486 int tpl_stride = tpl_frame->stride;
487 double intra_cost_base = 0;
488 double mc_dep_cost_base = 0;
489 double cbcmp_base = 1;
490 const int step = 1 << tpl_data->tpl_stats_block_mis_log2;
491 const int row_step = step;
492 const int col_step_sr =
493 coded_to_superres_mi(step, cm->superres_scale_denominator);
494 const int mi_cols_sr = av1_pixels_to_mi(cm->superres_upscaled_width);
495
496 for (int row = 0; row < cm->mi_params.mi_rows; row += row_step) {
497 for (int col = 0; col < mi_cols_sr; col += col_step_sr) {
498 TplDepStats *this_stats = &tpl_stats[av1_tpl_ptr_pos(
499 row, col, tpl_stride, tpl_data->tpl_stats_block_mis_log2)];
500 double cbcmp = (double)(this_stats->srcrf_dist);
501 int64_t mc_dep_delta =
502 RDCOST(tpl_frame->base_rdmult, this_stats->mc_dep_rate,
503 this_stats->mc_dep_dist);
504 double dist_scaled = (double)(this_stats->recrf_dist << RDDIV_BITS);
505 intra_cost_base += log(dist_scaled) * cbcmp;
506 mc_dep_cost_base += log(dist_scaled + mc_dep_delta) * cbcmp;
507 cbcmp_base += cbcmp;
508 }
509 }
510
511 if (mc_dep_cost_base == 0) {
512 tpl_frame->is_valid = 0;
513 } else {
514 cpi->rd.r0 = exp((intra_cost_base - mc_dep_cost_base) / cbcmp_base);
515 if (is_frame_tpl_eligible(gf_group, cpi->gf_frame_index)) {
516 if (cpi->ppi->lap_enabled) {
517 double min_boost_factor = sqrt(cpi->ppi->p_rc.baseline_gf_interval);
518 const int gfu_boost = get_gfu_boost_from_r0_lap(
519 min_boost_factor, MAX_GFUBOOST_FACTOR, cpi->rd.r0,
520 cpi->ppi->p_rc.num_stats_required_for_gfu_boost);
521 // printf("old boost %d new boost %d\n", cpi->rc.gfu_boost,
522 // gfu_boost);
523 cpi->ppi->p_rc.gfu_boost = combine_prior_with_tpl_boost(
524 min_boost_factor, MAX_BOOST_COMBINE_FACTOR,
525 cpi->ppi->p_rc.gfu_boost, gfu_boost,
526 cpi->ppi->p_rc.num_stats_used_for_gfu_boost);
527 } else {
528 // TPL may only look at a subset of frame in the gf group when the
529 // speed feature 'reduce_num_frames' is on, which affects the r0
530 // calcuation. Thus, to compensate for TPL not using all frames a
531 // factor to adjust r0 is used.
532 const int gfu_boost =
533 (int)(200.0 * cpi->ppi->tpl_data.r0_adjust_factor / cpi->rd.r0);
534 cpi->ppi->p_rc.gfu_boost = combine_prior_with_tpl_boost(
535 MIN_BOOST_COMBINE_FACTOR, MAX_BOOST_COMBINE_FACTOR,
536 cpi->ppi->p_rc.gfu_boost, gfu_boost, cpi->rc.frames_to_key);
537 }
538 }
539 }
540 }
541 }
542 #endif // !CONFIG_REALTIME_ONLY
543
av1_set_size_dependent_vars(AV1_COMP * cpi,int * q,int * bottom_index,int * top_index)544 void av1_set_size_dependent_vars(AV1_COMP *cpi, int *q, int *bottom_index,
545 int *top_index) {
546 AV1_COMMON *const cm = &cpi->common;
547
548 // Setup variables that depend on the dimensions of the frame.
549 av1_set_speed_features_framesize_dependent(cpi, cpi->speed);
550
551 #if !CONFIG_REALTIME_ONLY
552 GF_GROUP *gf_group = &cpi->ppi->gf_group;
553 if (cpi->oxcf.algo_cfg.enable_tpl_model &&
554 av1_tpl_stats_ready(&cpi->ppi->tpl_data, cpi->gf_frame_index)) {
555 process_tpl_stats_frame(cpi);
556 av1_tpl_rdmult_setup(cpi);
557 }
558 #endif
559
560 // Decide q and q bounds.
561 *q = av1_rc_pick_q_and_bounds(cpi, cm->width, cm->height, cpi->gf_frame_index,
562 bottom_index, top_index);
563
564 if (cpi->oxcf.rc_cfg.mode == AOM_CBR && cpi->rc.force_max_q) {
565 *q = cpi->rc.worst_quality;
566 cpi->rc.force_max_q = 0;
567 }
568
569 #if !CONFIG_REALTIME_ONLY
570 if (cpi->oxcf.rc_cfg.mode == AOM_Q &&
571 cpi->ppi->tpl_data.tpl_frame[cpi->gf_frame_index].is_valid &&
572 !is_lossless_requested(&cpi->oxcf.rc_cfg)) {
573 const RateControlCfg *const rc_cfg = &cpi->oxcf.rc_cfg;
574 const int tpl_q = av1_tpl_get_q_index(
575 &cpi->ppi->tpl_data, cpi->gf_frame_index, cpi->rc.active_worst_quality,
576 cm->seq_params->bit_depth);
577 *q = clamp(tpl_q, rc_cfg->best_allowed_q, rc_cfg->worst_allowed_q);
578 *top_index = *bottom_index = *q;
579 if (gf_group->update_type[cpi->gf_frame_index] == ARF_UPDATE)
580 cpi->ppi->p_rc.arf_q = *q;
581 }
582
583 if (cpi->oxcf.q_cfg.use_fixed_qp_offsets && cpi->oxcf.rc_cfg.mode == AOM_Q) {
584 if (is_frame_tpl_eligible(gf_group, cpi->gf_frame_index)) {
585 const double qratio_grad =
586 cpi->ppi->p_rc.baseline_gf_interval > 20 ? 0.2 : 0.3;
587 const double qstep_ratio =
588 0.2 +
589 (1.0 - (double)cpi->rc.active_worst_quality / MAXQ) * qratio_grad;
590 *q = av1_get_q_index_from_qstep_ratio(
591 cpi->rc.active_worst_quality, qstep_ratio, cm->seq_params->bit_depth);
592 *top_index = *bottom_index = *q;
593 if (gf_group->update_type[cpi->gf_frame_index] == ARF_UPDATE ||
594 gf_group->update_type[cpi->gf_frame_index] == KF_UPDATE ||
595 gf_group->update_type[cpi->gf_frame_index] == GF_UPDATE)
596 cpi->ppi->p_rc.arf_q = *q;
597 } else if (gf_group->layer_depth[cpi->gf_frame_index] <
598 gf_group->max_layer_depth) {
599 int this_height = gf_group->layer_depth[cpi->gf_frame_index];
600 int arf_q = cpi->ppi->p_rc.arf_q;
601 while (this_height > 1) {
602 arf_q = (arf_q + cpi->oxcf.rc_cfg.cq_level + 1) / 2;
603 --this_height;
604 }
605 *top_index = *bottom_index = *q = arf_q;
606 }
607 }
608 #endif
609
610 // Configure experimental use of segmentation for enhanced coding of
611 // static regions if indicated.
612 // Only allowed in the second pass of a two pass encode, as it requires
613 // lagged coding, and if the relevant speed feature flag is set.
614 if (is_stat_consumption_stage_twopass(cpi) &&
615 cpi->sf.hl_sf.static_segmentation)
616 configure_static_seg_features(cpi);
617 }
618
619 #if !CONFIG_REALTIME_ONLY
reset_film_grain_chroma_params(aom_film_grain_t * pars)620 static void reset_film_grain_chroma_params(aom_film_grain_t *pars) {
621 pars->num_cr_points = 0;
622 pars->cr_mult = 0;
623 pars->cr_luma_mult = 0;
624 memset(pars->scaling_points_cr, 0, sizeof(pars->scaling_points_cr));
625 memset(pars->ar_coeffs_cr, 0, sizeof(pars->ar_coeffs_cr));
626 pars->num_cb_points = 0;
627 pars->cb_mult = 0;
628 pars->cb_luma_mult = 0;
629 pars->chroma_scaling_from_luma = 0;
630 memset(pars->scaling_points_cb, 0, sizeof(pars->scaling_points_cb));
631 memset(pars->ar_coeffs_cb, 0, sizeof(pars->ar_coeffs_cb));
632 }
633
av1_update_film_grain_parameters_seq(struct AV1_PRIMARY * ppi,const AV1EncoderConfig * oxcf)634 void av1_update_film_grain_parameters_seq(struct AV1_PRIMARY *ppi,
635 const AV1EncoderConfig *oxcf) {
636 SequenceHeader *const seq_params = &ppi->seq_params;
637 const TuneCfg *const tune_cfg = &oxcf->tune_cfg;
638
639 if (tune_cfg->film_grain_test_vector || tune_cfg->film_grain_table_filename ||
640 tune_cfg->content == AOM_CONTENT_FILM) {
641 seq_params->film_grain_params_present = 1;
642 } else {
643 #if CONFIG_DENOISE
644 seq_params->film_grain_params_present = (oxcf->noise_level > 0);
645 #else
646 seq_params->film_grain_params_present = 0;
647 #endif
648 }
649 }
650
av1_update_film_grain_parameters(struct AV1_COMP * cpi,const AV1EncoderConfig * oxcf)651 void av1_update_film_grain_parameters(struct AV1_COMP *cpi,
652 const AV1EncoderConfig *oxcf) {
653 AV1_COMMON *const cm = &cpi->common;
654 const TuneCfg *const tune_cfg = &oxcf->tune_cfg;
655
656 if (cpi->film_grain_table) {
657 aom_film_grain_table_free(cpi->film_grain_table);
658 aom_free(cpi->film_grain_table);
659 cpi->film_grain_table = NULL;
660 }
661
662 if (tune_cfg->film_grain_test_vector) {
663 if (cm->current_frame.frame_type == KEY_FRAME) {
664 memcpy(&cm->film_grain_params,
665 film_grain_test_vectors + tune_cfg->film_grain_test_vector - 1,
666 sizeof(cm->film_grain_params));
667 if (oxcf->tool_cfg.enable_monochrome)
668 reset_film_grain_chroma_params(&cm->film_grain_params);
669 cm->film_grain_params.bit_depth = cm->seq_params->bit_depth;
670 if (cm->seq_params->color_range == AOM_CR_FULL_RANGE) {
671 cm->film_grain_params.clip_to_restricted_range = 0;
672 }
673 }
674 } else if (tune_cfg->film_grain_table_filename) {
675 CHECK_MEM_ERROR(cm, cpi->film_grain_table,
676 aom_calloc(1, sizeof(*cpi->film_grain_table)));
677
678 aom_film_grain_table_read(cpi->film_grain_table,
679 tune_cfg->film_grain_table_filename, cm->error);
680 } else if (tune_cfg->content == AOM_CONTENT_FILM) {
681 cm->film_grain_params.bit_depth = cm->seq_params->bit_depth;
682 if (oxcf->tool_cfg.enable_monochrome)
683 reset_film_grain_chroma_params(&cm->film_grain_params);
684 if (cm->seq_params->color_range == AOM_CR_FULL_RANGE)
685 cm->film_grain_params.clip_to_restricted_range = 0;
686 } else {
687 memset(&cm->film_grain_params, 0, sizeof(cm->film_grain_params));
688 }
689 }
690 #endif // !CONFIG_REALTIME_ONLY
691
av1_scale_references(AV1_COMP * cpi,const InterpFilter filter,const int phase,const int use_optimized_scaler)692 void av1_scale_references(AV1_COMP *cpi, const InterpFilter filter,
693 const int phase, const int use_optimized_scaler) {
694 AV1_COMMON *cm = &cpi->common;
695 const int num_planes = av1_num_planes(cm);
696 MV_REFERENCE_FRAME ref_frame;
697
698 for (ref_frame = LAST_FRAME; ref_frame <= ALTREF_FRAME; ++ref_frame) {
699 // Need to convert from AOM_REFFRAME to index into ref_mask (subtract 1).
700 if (cpi->ref_frame_flags & av1_ref_frame_flag_list[ref_frame]) {
701 BufferPool *const pool = cm->buffer_pool;
702 const YV12_BUFFER_CONFIG *const ref =
703 get_ref_frame_yv12_buf(cm, ref_frame);
704
705 if (ref == NULL) {
706 cpi->scaled_ref_buf[ref_frame - 1] = NULL;
707 continue;
708 }
709
710 // For RTC-SVC: if force_zero_mode_spatial_ref is enabled, check if the
711 // motion search can be skipped for the references: last, golden, altref.
712 // If so, we can skip scaling that reference.
713 if (cpi->ppi->use_svc && cpi->svc.force_zero_mode_spatial_ref &&
714 cpi->ppi->rtc_ref.set_ref_frame_config) {
715 if (ref_frame == LAST_FRAME && cpi->svc.skip_mvsearch_last) continue;
716 if (ref_frame == GOLDEN_FRAME && cpi->svc.skip_mvsearch_gf) continue;
717 if (ref_frame == ALTREF_FRAME && cpi->svc.skip_mvsearch_altref)
718 continue;
719 }
720 // For RTC with superres on: golden reference only needs to be scaled
721 // if it was refreshed in previous frame.
722 if (is_one_pass_rt_params(cpi) &&
723 cpi->oxcf.superres_cfg.enable_superres && ref_frame == GOLDEN_FRAME &&
724 cpi->rc.frame_num_last_gf_refresh <
725 (int)cm->current_frame.frame_number - 1) {
726 continue;
727 }
728
729 if (ref->y_crop_width != cm->width || ref->y_crop_height != cm->height) {
730 // Replace the reference buffer with a copy having a thicker border,
731 // if the reference buffer is higher resolution than the current
732 // frame, and the border is thin.
733 if ((ref->y_crop_width > cm->width ||
734 ref->y_crop_height > cm->height) &&
735 ref->border < AOM_BORDER_IN_PIXELS) {
736 RefCntBuffer *ref_fb = get_ref_frame_buf(cm, ref_frame);
737 if (aom_yv12_realloc_with_new_border(
738 &ref_fb->buf, AOM_BORDER_IN_PIXELS,
739 cm->features.byte_alignment, cpi->alloc_pyramid,
740 num_planes) != 0) {
741 aom_internal_error(cm->error, AOM_CODEC_MEM_ERROR,
742 "Failed to allocate frame buffer");
743 }
744 }
745 int force_scaling = 0;
746 RefCntBuffer *new_fb = cpi->scaled_ref_buf[ref_frame - 1];
747 if (new_fb == NULL) {
748 const int new_fb_idx = get_free_fb(cm);
749 if (new_fb_idx == INVALID_IDX) {
750 aom_internal_error(cm->error, AOM_CODEC_MEM_ERROR,
751 "Unable to find free frame buffer");
752 }
753 force_scaling = 1;
754 new_fb = &pool->frame_bufs[new_fb_idx];
755 }
756
757 if (force_scaling || new_fb->buf.y_crop_width != cm->width ||
758 new_fb->buf.y_crop_height != cm->height) {
759 if (aom_realloc_frame_buffer(
760 &new_fb->buf, cm->width, cm->height,
761 cm->seq_params->subsampling_x, cm->seq_params->subsampling_y,
762 cm->seq_params->use_highbitdepth, AOM_BORDER_IN_PIXELS,
763 cm->features.byte_alignment, NULL, NULL, NULL, false, 0)) {
764 if (force_scaling) {
765 // Release the reference acquired in the get_free_fb() call above.
766 --new_fb->ref_count;
767 }
768 aom_internal_error(cm->error, AOM_CODEC_MEM_ERROR,
769 "Failed to allocate frame buffer");
770 }
771 bool has_optimized_scaler = av1_has_optimized_scaler(
772 ref->y_crop_width, ref->y_crop_height, new_fb->buf.y_crop_width,
773 new_fb->buf.y_crop_height);
774 if (num_planes > 1) {
775 has_optimized_scaler =
776 has_optimized_scaler &&
777 av1_has_optimized_scaler(
778 ref->uv_crop_width, ref->uv_crop_height,
779 new_fb->buf.uv_crop_width, new_fb->buf.uv_crop_height);
780 }
781 #if CONFIG_AV1_HIGHBITDEPTH
782 if (use_optimized_scaler && has_optimized_scaler &&
783 cm->seq_params->bit_depth == AOM_BITS_8) {
784 av1_resize_and_extend_frame(ref, &new_fb->buf, filter, phase,
785 num_planes);
786 } else if (!av1_resize_and_extend_frame_nonnormative(
787 ref, &new_fb->buf, (int)cm->seq_params->bit_depth,
788 num_planes)) {
789 aom_internal_error(cm->error, AOM_CODEC_MEM_ERROR,
790 "Failed to allocate buffer during resize");
791 }
792 #else
793 if (use_optimized_scaler && has_optimized_scaler) {
794 av1_resize_and_extend_frame(ref, &new_fb->buf, filter, phase,
795 num_planes);
796 } else if (!av1_resize_and_extend_frame_nonnormative(
797 ref, &new_fb->buf, (int)cm->seq_params->bit_depth,
798 num_planes)) {
799 aom_internal_error(cm->error, AOM_CODEC_MEM_ERROR,
800 "Failed to allocate buffer during resize");
801 }
802 #endif
803 cpi->scaled_ref_buf[ref_frame - 1] = new_fb;
804 alloc_frame_mvs(cm, new_fb);
805 }
806 } else {
807 RefCntBuffer *buf = get_ref_frame_buf(cm, ref_frame);
808 buf->buf.y_crop_width = ref->y_crop_width;
809 buf->buf.y_crop_height = ref->y_crop_height;
810 cpi->scaled_ref_buf[ref_frame - 1] = buf;
811 ++buf->ref_count;
812 }
813 } else {
814 if (!has_no_stats_stage(cpi)) cpi->scaled_ref_buf[ref_frame - 1] = NULL;
815 }
816 }
817 }
818
av1_select_sb_size(const AV1EncoderConfig * const oxcf,int width,int height,int number_spatial_layers)819 BLOCK_SIZE av1_select_sb_size(const AV1EncoderConfig *const oxcf, int width,
820 int height, int number_spatial_layers) {
821 if (oxcf->tool_cfg.superblock_size == AOM_SUPERBLOCK_SIZE_64X64) {
822 return BLOCK_64X64;
823 }
824 if (oxcf->tool_cfg.superblock_size == AOM_SUPERBLOCK_SIZE_128X128) {
825 return BLOCK_128X128;
826 }
827 #if CONFIG_TFLITE
828 if (oxcf->q_cfg.deltaq_mode == DELTA_Q_USER_RATING_BASED) return BLOCK_64X64;
829 #endif
830 // Force 64x64 superblock size to increase resolution in perceptual
831 // AQ mode.
832 if (oxcf->mode == ALLINTRA &&
833 (oxcf->q_cfg.deltaq_mode == DELTA_Q_PERCEPTUAL_AI ||
834 oxcf->q_cfg.deltaq_mode == DELTA_Q_USER_RATING_BASED)) {
835 return BLOCK_64X64;
836 }
837 assert(oxcf->tool_cfg.superblock_size == AOM_SUPERBLOCK_SIZE_DYNAMIC);
838
839 if (number_spatial_layers > 1 ||
840 oxcf->resize_cfg.resize_mode != RESIZE_NONE) {
841 // Use the configured size (top resolution) for spatial layers or
842 // on resize.
843 return AOMMIN(oxcf->frm_dim_cfg.width, oxcf->frm_dim_cfg.height) > 720
844 ? BLOCK_128X128
845 : BLOCK_64X64;
846 } else if (oxcf->mode == REALTIME) {
847 if (oxcf->tune_cfg.content == AOM_CONTENT_SCREEN) {
848 const TileConfig *const tile_cfg = &oxcf->tile_cfg;
849 const int num_tiles =
850 (1 << tile_cfg->tile_columns) * (1 << tile_cfg->tile_rows);
851 // For multi-thread encode: if the number of (128x128) superblocks
852 // per tile is low use 64X64 superblock.
853 if (oxcf->row_mt == 1 && oxcf->max_threads >= 4 &&
854 oxcf->max_threads >= num_tiles && AOMMIN(width, height) >= 720 &&
855 (width * height) / (128 * 128 * num_tiles) < 40)
856 return BLOCK_64X64;
857 else
858 return AOMMIN(width, height) >= 720 ? BLOCK_128X128 : BLOCK_64X64;
859 } else {
860 return AOMMIN(width, height) > 720 ? BLOCK_128X128 : BLOCK_64X64;
861 }
862 }
863
864 // TODO(any): Possibly could improve this with a heuristic.
865 // When superres / resize is on, 'cm->width / height' can change between
866 // calls, so we don't apply this heuristic there.
867 // Things break if superblock size changes between the first pass and second
868 // pass encoding, which is why this heuristic is not configured as a
869 // speed-feature.
870 if (oxcf->superres_cfg.superres_mode == AOM_SUPERRES_NONE &&
871 oxcf->resize_cfg.resize_mode == RESIZE_NONE) {
872 int is_480p_or_lesser = AOMMIN(width, height) <= 480;
873 if (oxcf->speed >= 1 && is_480p_or_lesser) return BLOCK_64X64;
874
875 // For 1080p and lower resolutions, choose SB size adaptively based on
876 // resolution and speed level for multi-thread encode.
877 int is_1080p_or_lesser = AOMMIN(width, height) <= 1080;
878 if (!is_480p_or_lesser && is_1080p_or_lesser && oxcf->mode == GOOD &&
879 oxcf->row_mt == 1 && oxcf->max_threads > 1 && oxcf->speed >= 5)
880 return BLOCK_64X64;
881
882 // For allintra encode, since the maximum partition size is set to 32X32 for
883 // speed>=6, superblock size is set to 64X64 instead of 128X128. This
884 // improves the multithread performance due to reduction in top right delay
885 // and thread sync wastage. Currently, this setting is selectively enabled
886 // only for speed>=9 and resolutions less than 4k since cost update
887 // frequency is set to INTERNAL_COST_UPD_OFF in these cases.
888 const int is_4k_or_larger = AOMMIN(width, height) >= 2160;
889 if (oxcf->mode == ALLINTRA && oxcf->speed >= 9 && !is_4k_or_larger)
890 return BLOCK_64X64;
891 }
892 return BLOCK_128X128;
893 }
894
av1_setup_frame(AV1_COMP * cpi)895 void av1_setup_frame(AV1_COMP *cpi) {
896 AV1_COMMON *const cm = &cpi->common;
897 // Set up entropy context depending on frame type. The decoder mandates
898 // the use of the default context, index 0, for keyframes and inter
899 // frames where the error_resilient_mode or intra_only flag is set. For
900 // other inter-frames the encoder currently uses only two contexts;
901 // context 1 for ALTREF frames and context 0 for the others.
902
903 if (frame_is_intra_only(cm) || cm->features.error_resilient_mode ||
904 cpi->ext_flags.use_primary_ref_none) {
905 av1_setup_past_independence(cm);
906 }
907
908 if ((cm->current_frame.frame_type == KEY_FRAME && cm->show_frame) ||
909 frame_is_sframe(cm)) {
910 if (!cpi->ppi->seq_params_locked) {
911 set_sb_size(cm->seq_params,
912 av1_select_sb_size(&cpi->oxcf, cm->width, cm->height,
913 cpi->ppi->number_spatial_layers));
914 }
915 } else {
916 const RefCntBuffer *const primary_ref_buf = get_primary_ref_frame_buf(cm);
917 if (primary_ref_buf == NULL) {
918 av1_setup_past_independence(cm);
919 cm->seg.update_map = 1;
920 cm->seg.update_data = 1;
921 } else {
922 *cm->fc = primary_ref_buf->frame_context;
923 }
924 }
925
926 av1_zero(cm->cur_frame->interp_filter_selected);
927 cm->prev_frame = get_primary_ref_frame_buf(cm);
928 cpi->vaq_refresh = 0;
929 }
930
931 #if !CONFIG_REALTIME_ONLY
get_interp_filter_selected(const AV1_COMMON * const cm,MV_REFERENCE_FRAME ref,InterpFilter ifilter)932 static int get_interp_filter_selected(const AV1_COMMON *const cm,
933 MV_REFERENCE_FRAME ref,
934 InterpFilter ifilter) {
935 const RefCntBuffer *const buf = get_ref_frame_buf(cm, ref);
936 if (buf == NULL) return 0;
937 return buf->interp_filter_selected[ifilter];
938 }
939
av1_setup_interp_filter_search_mask(AV1_COMP * cpi)940 uint16_t av1_setup_interp_filter_search_mask(AV1_COMP *cpi) {
941 const AV1_COMMON *const cm = &cpi->common;
942 int ref_total[REF_FRAMES] = { 0 };
943 uint16_t mask = ALLOW_ALL_INTERP_FILT_MASK;
944
945 if (cpi->last_frame_type == KEY_FRAME || cpi->refresh_frame.alt_ref_frame)
946 return mask;
947
948 for (MV_REFERENCE_FRAME ref = LAST_FRAME; ref <= ALTREF_FRAME; ++ref) {
949 for (InterpFilter ifilter = EIGHTTAP_REGULAR; ifilter <= MULTITAP_SHARP;
950 ++ifilter) {
951 ref_total[ref] += get_interp_filter_selected(cm, ref, ifilter);
952 }
953 }
954 int ref_total_total = (ref_total[LAST2_FRAME] + ref_total[LAST3_FRAME] +
955 ref_total[GOLDEN_FRAME] + ref_total[BWDREF_FRAME] +
956 ref_total[ALTREF2_FRAME] + ref_total[ALTREF_FRAME]);
957
958 for (InterpFilter ifilter = EIGHTTAP_REGULAR; ifilter <= MULTITAP_SHARP;
959 ++ifilter) {
960 int last_score = get_interp_filter_selected(cm, LAST_FRAME, ifilter) * 30;
961 if (ref_total[LAST_FRAME] && last_score <= ref_total[LAST_FRAME]) {
962 int filter_score =
963 get_interp_filter_selected(cm, LAST2_FRAME, ifilter) * 20 +
964 get_interp_filter_selected(cm, LAST3_FRAME, ifilter) * 20 +
965 get_interp_filter_selected(cm, GOLDEN_FRAME, ifilter) * 20 +
966 get_interp_filter_selected(cm, BWDREF_FRAME, ifilter) * 10 +
967 get_interp_filter_selected(cm, ALTREF2_FRAME, ifilter) * 10 +
968 get_interp_filter_selected(cm, ALTREF_FRAME, ifilter) * 10;
969 if (filter_score < ref_total_total) {
970 DUAL_FILTER_TYPE filt_type = ifilter + SWITCHABLE_FILTERS * ifilter;
971 reset_interp_filter_allowed_mask(&mask, filt_type);
972 }
973 }
974 }
975 return mask;
976 }
977
978 #define STRICT_PSNR_DIFF_THRESH 0.9
979 // Encode key frame with/without screen content tools to determine whether
980 // screen content tools should be enabled for this key frame group or not.
981 // The first encoding is without screen content tools.
982 // The second encoding is with screen content tools.
983 // We compare the psnr and frame size to make the decision.
screen_content_tools_determination(AV1_COMP * cpi,const int allow_screen_content_tools_orig_decision,const int allow_intrabc_orig_decision,const int use_screen_content_tools_orig_decision,const int is_screen_content_type_orig_decision,const int pass,int * projected_size_pass,PSNR_STATS * psnr)984 static void screen_content_tools_determination(
985 AV1_COMP *cpi, const int allow_screen_content_tools_orig_decision,
986 const int allow_intrabc_orig_decision,
987 const int use_screen_content_tools_orig_decision,
988 const int is_screen_content_type_orig_decision, const int pass,
989 int *projected_size_pass, PSNR_STATS *psnr) {
990 AV1_COMMON *const cm = &cpi->common;
991 FeatureFlags *const features = &cm->features;
992
993 #if CONFIG_FPMT_TEST
994 projected_size_pass[pass] =
995 ((cpi->ppi->gf_group.frame_parallel_level[cpi->gf_frame_index] > 0) &&
996 (cpi->ppi->fpmt_unit_test_cfg == PARALLEL_SIMULATION_ENCODE))
997 ? cpi->ppi->p_rc.temp_projected_frame_size
998 : cpi->rc.projected_frame_size;
999 #else
1000 projected_size_pass[pass] = cpi->rc.projected_frame_size;
1001 #endif
1002
1003 #if CONFIG_AV1_HIGHBITDEPTH
1004 const uint32_t in_bit_depth = cpi->oxcf.input_cfg.input_bit_depth;
1005 const uint32_t bit_depth = cpi->td.mb.e_mbd.bd;
1006 aom_calc_highbd_psnr(cpi->source, &cpi->common.cur_frame->buf, &psnr[pass],
1007 bit_depth, in_bit_depth);
1008 #else
1009 aom_calc_psnr(cpi->source, &cpi->common.cur_frame->buf, &psnr[pass]);
1010 #endif
1011 if (pass != 1) return;
1012
1013 const double psnr_diff = psnr[1].psnr[0] - psnr[0].psnr[0];
1014 // Calculate % of palette mode to be chosen in a frame from mode decision.
1015 const double palette_ratio =
1016 (double)cpi->palette_pixel_num / (double)(cm->height * cm->width);
1017 const int psnr_diff_is_large = (psnr_diff > STRICT_PSNR_DIFF_THRESH);
1018 const int ratio_is_large =
1019 ((palette_ratio >= 0.0001) && ((psnr_diff / palette_ratio) > 4));
1020 const int is_sc_encoding_much_better = (psnr_diff_is_large || ratio_is_large);
1021 if (is_sc_encoding_much_better) {
1022 // Use screen content tools, if we get coding gain.
1023 features->allow_screen_content_tools = 1;
1024 features->allow_intrabc = cpi->intrabc_used;
1025 cpi->use_screen_content_tools = 1;
1026 cpi->is_screen_content_type = 1;
1027 } else {
1028 // Use original screen content decision.
1029 features->allow_screen_content_tools =
1030 allow_screen_content_tools_orig_decision;
1031 features->allow_intrabc = allow_intrabc_orig_decision;
1032 cpi->use_screen_content_tools = use_screen_content_tools_orig_decision;
1033 cpi->is_screen_content_type = is_screen_content_type_orig_decision;
1034 }
1035 }
1036
1037 // Set some encoding parameters to make the encoding process fast.
1038 // A fixed block partition size, and a large q is used.
set_encoding_params_for_screen_content(AV1_COMP * cpi,const int pass)1039 static void set_encoding_params_for_screen_content(AV1_COMP *cpi,
1040 const int pass) {
1041 AV1_COMMON *const cm = &cpi->common;
1042 if (pass == 0) {
1043 // In the first pass, encode without screen content tools.
1044 // Use a high q, and a fixed block size for fast encoding.
1045 cm->features.allow_screen_content_tools = 0;
1046 cm->features.allow_intrabc = 0;
1047 cpi->use_screen_content_tools = 0;
1048 cpi->sf.part_sf.partition_search_type = FIXED_PARTITION;
1049 cpi->sf.part_sf.fixed_partition_size = BLOCK_32X32;
1050 return;
1051 }
1052 assert(pass == 1);
1053 // In the second pass, encode with screen content tools.
1054 // Use a high q, and a fixed block size for fast encoding.
1055 cm->features.allow_screen_content_tools = 1;
1056 // TODO(chengchen): turn intrabc on could lead to data race issue.
1057 // cm->allow_intrabc = 1;
1058 cpi->use_screen_content_tools = 1;
1059 cpi->sf.part_sf.partition_search_type = FIXED_PARTITION;
1060 cpi->sf.part_sf.fixed_partition_size = BLOCK_32X32;
1061 }
1062
1063 // Determines whether to use screen content tools for the key frame group.
1064 // This function modifies "cm->features.allow_screen_content_tools",
1065 // "cm->features.allow_intrabc" and "cpi->use_screen_content_tools".
av1_determine_sc_tools_with_encoding(AV1_COMP * cpi,const int q_orig)1066 void av1_determine_sc_tools_with_encoding(AV1_COMP *cpi, const int q_orig) {
1067 AV1_COMMON *const cm = &cpi->common;
1068 const AV1EncoderConfig *const oxcf = &cpi->oxcf;
1069 const QuantizationCfg *const q_cfg = &oxcf->q_cfg;
1070 // Variables to help determine if we should allow screen content tools.
1071 int projected_size_pass[3] = { 0 };
1072 PSNR_STATS psnr[3];
1073 const int is_key_frame = cm->current_frame.frame_type == KEY_FRAME;
1074 const int allow_screen_content_tools_orig_decision =
1075 cm->features.allow_screen_content_tools;
1076 const int allow_intrabc_orig_decision = cm->features.allow_intrabc;
1077 const int use_screen_content_tools_orig_decision =
1078 cpi->use_screen_content_tools;
1079 const int is_screen_content_type_orig_decision = cpi->is_screen_content_type;
1080 // Turn off the encoding trial for forward key frame and superres.
1081 if (cpi->sf.rt_sf.use_nonrd_pick_mode || oxcf->kf_cfg.fwd_kf_enabled ||
1082 cpi->superres_mode != AOM_SUPERRES_NONE || oxcf->mode == REALTIME ||
1083 use_screen_content_tools_orig_decision || !is_key_frame) {
1084 return;
1085 }
1086
1087 // TODO(chengchen): multiple encoding for the lossless mode is time consuming.
1088 // Find a better way to determine whether screen content tools should be used
1089 // for lossless coding.
1090 // Use a high q and a fixed partition to do quick encoding.
1091 const int q_for_screen_content_quick_run =
1092 is_lossless_requested(&oxcf->rc_cfg) ? q_orig : AOMMAX(q_orig, 244);
1093 const int partition_search_type_orig = cpi->sf.part_sf.partition_search_type;
1094 const BLOCK_SIZE fixed_partition_block_size_orig =
1095 cpi->sf.part_sf.fixed_partition_size;
1096
1097 // Setup necessary params for encoding, including frame source, etc.
1098
1099 cpi->source = av1_realloc_and_scale_if_required(
1100 cm, cpi->unscaled_source, &cpi->scaled_source, cm->features.interp_filter,
1101 0, false, false, cpi->oxcf.border_in_pixels, cpi->alloc_pyramid);
1102 if (cpi->unscaled_last_source != NULL) {
1103 cpi->last_source = av1_realloc_and_scale_if_required(
1104 cm, cpi->unscaled_last_source, &cpi->scaled_last_source,
1105 cm->features.interp_filter, 0, false, false, cpi->oxcf.border_in_pixels,
1106 cpi->alloc_pyramid);
1107 }
1108
1109 av1_setup_frame(cpi);
1110
1111 if (cm->seg.enabled) {
1112 if (!cm->seg.update_data && cm->prev_frame) {
1113 segfeatures_copy(&cm->seg, &cm->prev_frame->seg);
1114 cm->seg.enabled = cm->prev_frame->seg.enabled;
1115 } else {
1116 av1_calculate_segdata(&cm->seg);
1117 }
1118 } else {
1119 memset(&cm->seg, 0, sizeof(cm->seg));
1120 }
1121 segfeatures_copy(&cm->cur_frame->seg, &cm->seg);
1122 cm->cur_frame->seg.enabled = cm->seg.enabled;
1123
1124 // The two encoding passes aim to help determine whether to use screen
1125 // content tools, with a high q and fixed partition.
1126 for (int pass = 0; pass < 2; ++pass) {
1127 set_encoding_params_for_screen_content(cpi, pass);
1128 av1_set_quantizer(cm, q_cfg->qm_minlevel, q_cfg->qm_maxlevel,
1129 q_for_screen_content_quick_run,
1130 q_cfg->enable_chroma_deltaq, q_cfg->enable_hdr_deltaq);
1131 av1_set_speed_features_qindex_dependent(cpi, oxcf->speed);
1132 av1_init_quantizer(&cpi->enc_quant_dequant_params, &cm->quant_params,
1133 cm->seq_params->bit_depth);
1134
1135 av1_set_variance_partition_thresholds(cpi, q_for_screen_content_quick_run,
1136 0);
1137 // transform / motion compensation build reconstruction frame
1138 av1_encode_frame(cpi);
1139 // Screen content decision
1140 screen_content_tools_determination(
1141 cpi, allow_screen_content_tools_orig_decision,
1142 allow_intrabc_orig_decision, use_screen_content_tools_orig_decision,
1143 is_screen_content_type_orig_decision, pass, projected_size_pass, psnr);
1144 }
1145
1146 // Set partition speed feature back.
1147 cpi->sf.part_sf.partition_search_type = partition_search_type_orig;
1148 cpi->sf.part_sf.fixed_partition_size = fixed_partition_block_size_orig;
1149
1150 // Free token related info if screen content coding tools are not enabled.
1151 if (!cm->features.allow_screen_content_tools)
1152 free_token_info(&cpi->token_info);
1153 }
1154 #endif // CONFIG_REALTIME_ONLY
1155
fix_interp_filter(InterpFilter * const interp_filter,const FRAME_COUNTS * const counts)1156 static void fix_interp_filter(InterpFilter *const interp_filter,
1157 const FRAME_COUNTS *const counts) {
1158 if (*interp_filter == SWITCHABLE) {
1159 // Check to see if only one of the filters is actually used
1160 int count[SWITCHABLE_FILTERS] = { 0 };
1161 int num_filters_used = 0;
1162 for (int i = 0; i < SWITCHABLE_FILTERS; ++i) {
1163 for (int j = 0; j < SWITCHABLE_FILTER_CONTEXTS; ++j)
1164 count[i] += counts->switchable_interp[j][i];
1165 num_filters_used += (count[i] > 0);
1166 }
1167 if (num_filters_used == 1) {
1168 // Only one filter is used. So set the filter at frame level
1169 for (int i = 0; i < SWITCHABLE_FILTERS; ++i) {
1170 if (count[i]) {
1171 *interp_filter = i;
1172 break;
1173 }
1174 }
1175 }
1176 }
1177 }
1178
av1_finalize_encoded_frame(AV1_COMP * const cpi)1179 void av1_finalize_encoded_frame(AV1_COMP *const cpi) {
1180 AV1_COMMON *const cm = &cpi->common;
1181 CurrentFrame *const current_frame = &cm->current_frame;
1182
1183 if (!cm->seq_params->reduced_still_picture_hdr &&
1184 encode_show_existing_frame(cm)) {
1185 RefCntBuffer *const frame_to_show =
1186 cm->ref_frame_map[cpi->existing_fb_idx_to_show];
1187
1188 if (frame_to_show == NULL) {
1189 aom_internal_error(cm->error, AOM_CODEC_UNSUP_BITSTREAM,
1190 "Buffer does not contain a reconstructed frame");
1191 }
1192 assert(frame_to_show->ref_count > 0);
1193 assign_frame_buffer_p(&cm->cur_frame, frame_to_show);
1194 }
1195
1196 if (!encode_show_existing_frame(cm) &&
1197 cm->seq_params->film_grain_params_present &&
1198 (cm->show_frame || cm->showable_frame)) {
1199 // Copy the current frame's film grain params to the its corresponding
1200 // RefCntBuffer slot.
1201 cm->cur_frame->film_grain_params = cm->film_grain_params;
1202
1203 // We must update the parameters if this is not an INTER_FRAME
1204 if (current_frame->frame_type != INTER_FRAME)
1205 cm->cur_frame->film_grain_params.update_parameters = 1;
1206
1207 // Iterate the random seed for the next frame.
1208 cm->film_grain_params.random_seed += 3381;
1209 if (cm->film_grain_params.random_seed == 0)
1210 cm->film_grain_params.random_seed = 7391;
1211 }
1212
1213 // Initialise all tiles' contexts from the global frame context
1214 for (int tile_col = 0; tile_col < cm->tiles.cols; tile_col++) {
1215 for (int tile_row = 0; tile_row < cm->tiles.rows; tile_row++) {
1216 const int tile_idx = tile_row * cm->tiles.cols + tile_col;
1217 cpi->tile_data[tile_idx].tctx = *cm->fc;
1218 }
1219 }
1220
1221 if (!frame_is_intra_only(cm))
1222 fix_interp_filter(&cm->features.interp_filter, cpi->td.counts);
1223 }
1224
av1_is_integer_mv(const YV12_BUFFER_CONFIG * cur_picture,const YV12_BUFFER_CONFIG * last_picture,ForceIntegerMVInfo * const force_intpel_info)1225 int av1_is_integer_mv(const YV12_BUFFER_CONFIG *cur_picture,
1226 const YV12_BUFFER_CONFIG *last_picture,
1227 ForceIntegerMVInfo *const force_intpel_info) {
1228 // check use hash ME
1229 int k;
1230
1231 const int block_size = FORCE_INT_MV_DECISION_BLOCK_SIZE;
1232 const double threshold_current = 0.8;
1233 const double threshold_average = 0.95;
1234 const int max_history_size = 32;
1235 int T = 0; // total block
1236 int C = 0; // match with collocated block
1237 int S = 0; // smooth region but not match with collocated block
1238
1239 const int pic_width = cur_picture->y_width;
1240 const int pic_height = cur_picture->y_height;
1241 for (int i = 0; i + block_size <= pic_height; i += block_size) {
1242 for (int j = 0; j + block_size <= pic_width; j += block_size) {
1243 const int x_pos = j;
1244 const int y_pos = i;
1245 int match = 1;
1246 T++;
1247
1248 // check whether collocated block match with current
1249 uint8_t *p_cur = cur_picture->y_buffer;
1250 uint8_t *p_ref = last_picture->y_buffer;
1251 int stride_cur = cur_picture->y_stride;
1252 int stride_ref = last_picture->y_stride;
1253 p_cur += (y_pos * stride_cur + x_pos);
1254 p_ref += (y_pos * stride_ref + x_pos);
1255
1256 if (cur_picture->flags & YV12_FLAG_HIGHBITDEPTH) {
1257 uint16_t *p16_cur = CONVERT_TO_SHORTPTR(p_cur);
1258 uint16_t *p16_ref = CONVERT_TO_SHORTPTR(p_ref);
1259 for (int tmpY = 0; tmpY < block_size && match; tmpY++) {
1260 for (int tmpX = 0; tmpX < block_size && match; tmpX++) {
1261 if (p16_cur[tmpX] != p16_ref[tmpX]) {
1262 match = 0;
1263 }
1264 }
1265 p16_cur += stride_cur;
1266 p16_ref += stride_ref;
1267 }
1268 } else {
1269 for (int tmpY = 0; tmpY < block_size && match; tmpY++) {
1270 for (int tmpX = 0; tmpX < block_size && match; tmpX++) {
1271 if (p_cur[tmpX] != p_ref[tmpX]) {
1272 match = 0;
1273 }
1274 }
1275 p_cur += stride_cur;
1276 p_ref += stride_ref;
1277 }
1278 }
1279
1280 if (match) {
1281 C++;
1282 continue;
1283 }
1284
1285 if (av1_hash_is_horizontal_perfect(cur_picture, block_size, x_pos,
1286 y_pos) ||
1287 av1_hash_is_vertical_perfect(cur_picture, block_size, x_pos, y_pos)) {
1288 S++;
1289 continue;
1290 }
1291 }
1292 }
1293
1294 assert(T > 0);
1295 double cs_rate = ((double)(C + S)) / ((double)(T));
1296
1297 force_intpel_info->cs_rate_array[force_intpel_info->rate_index] = cs_rate;
1298
1299 force_intpel_info->rate_index =
1300 (force_intpel_info->rate_index + 1) % max_history_size;
1301 force_intpel_info->rate_size++;
1302 force_intpel_info->rate_size =
1303 AOMMIN(force_intpel_info->rate_size, max_history_size);
1304
1305 if (cs_rate < threshold_current) {
1306 return 0;
1307 }
1308
1309 if (C == T) {
1310 return 1;
1311 }
1312
1313 double cs_average = 0.0;
1314
1315 for (k = 0; k < force_intpel_info->rate_size; k++) {
1316 cs_average += force_intpel_info->cs_rate_array[k];
1317 }
1318 cs_average /= force_intpel_info->rate_size;
1319
1320 if (cs_average < threshold_average) {
1321 return 0;
1322 }
1323
1324 if ((T - C - S) < 0) {
1325 return 1;
1326 }
1327
1328 if (cs_average > 1.01) {
1329 return 1;
1330 }
1331
1332 return 0;
1333 }
1334
av1_set_mb_ssim_rdmult_scaling(AV1_COMP * cpi)1335 void av1_set_mb_ssim_rdmult_scaling(AV1_COMP *cpi) {
1336 const CommonModeInfoParams *const mi_params = &cpi->common.mi_params;
1337 const MACROBLOCKD *const xd = &cpi->td.mb.e_mbd;
1338 uint8_t *y_buffer = cpi->source->y_buffer;
1339 const int y_stride = cpi->source->y_stride;
1340 const int block_size = BLOCK_16X16;
1341
1342 const int num_mi_w = mi_size_wide[block_size];
1343 const int num_mi_h = mi_size_high[block_size];
1344 const int num_cols = (mi_params->mi_cols + num_mi_w - 1) / num_mi_w;
1345 const int num_rows = (mi_params->mi_rows + num_mi_h - 1) / num_mi_h;
1346 double log_sum = 0.0;
1347
1348 // Loop through each 16x16 block.
1349 for (int row = 0; row < num_rows; ++row) {
1350 for (int col = 0; col < num_cols; ++col) {
1351 double var = 0.0, num_of_var = 0.0;
1352 const int index = row * num_cols + col;
1353
1354 // Loop through each 8x8 block.
1355 for (int mi_row = row * num_mi_h;
1356 mi_row < mi_params->mi_rows && mi_row < (row + 1) * num_mi_h;
1357 mi_row += 2) {
1358 for (int mi_col = col * num_mi_w;
1359 mi_col < mi_params->mi_cols && mi_col < (col + 1) * num_mi_w;
1360 mi_col += 2) {
1361 struct buf_2d buf;
1362 const int row_offset_y = mi_row << 2;
1363 const int col_offset_y = mi_col << 2;
1364
1365 buf.buf = y_buffer + row_offset_y * y_stride + col_offset_y;
1366 buf.stride = y_stride;
1367
1368 var += av1_get_perpixel_variance_facade(cpi, xd, &buf, BLOCK_8X8,
1369 AOM_PLANE_Y);
1370 num_of_var += 1.0;
1371 }
1372 }
1373 var = var / num_of_var;
1374
1375 // Curve fitting with an exponential model on all 16x16 blocks from the
1376 // midres dataset.
1377 var = 67.035434 * (1 - exp(-0.0021489 * var)) + 17.492222;
1378
1379 // As per the above computation, var will be in the range of
1380 // [17.492222, 84.527656], assuming the data type is of infinite
1381 // precision. The following assert conservatively checks if var is in the
1382 // range of [17.0, 85.0] to avoid any issues due to the precision of the
1383 // relevant data type.
1384 assert(var > 17.0 && var < 85.0);
1385 cpi->ssim_rdmult_scaling_factors[index] = var;
1386 log_sum += log(var);
1387 }
1388 }
1389
1390 // As log_sum holds the geometric mean, it will be in the range
1391 // [17.492222, 84.527656]. Hence, in the below loop, the value of
1392 // cpi->ssim_rdmult_scaling_factors[index] would be in the range
1393 // [0.2069, 4.8323].
1394 log_sum = exp(log_sum / (double)(num_rows * num_cols));
1395
1396 for (int row = 0; row < num_rows; ++row) {
1397 for (int col = 0; col < num_cols; ++col) {
1398 const int index = row * num_cols + col;
1399 cpi->ssim_rdmult_scaling_factors[index] /= log_sum;
1400 }
1401 }
1402 }
1403
1404 // Coding context that only needs to be saved when recode loop includes
1405 // filtering (deblocking, CDEF, superres post-encode upscale and/or loop
1406 // restoraton).
save_extra_coding_context(AV1_COMP * cpi)1407 static void save_extra_coding_context(AV1_COMP *cpi) {
1408 CODING_CONTEXT *const cc = &cpi->coding_context;
1409 AV1_COMMON *cm = &cpi->common;
1410
1411 cc->lf = cm->lf;
1412 cc->cdef_info = cm->cdef_info;
1413 cc->rc = cpi->rc;
1414 cc->mv_stats = cpi->ppi->mv_stats;
1415 }
1416
av1_save_all_coding_context(AV1_COMP * cpi)1417 void av1_save_all_coding_context(AV1_COMP *cpi) {
1418 save_extra_coding_context(cpi);
1419 if (!frame_is_intra_only(&cpi->common)) release_scaled_references(cpi);
1420 }
1421
1422 #if DUMP_RECON_FRAMES == 1
1423
1424 // NOTE(zoeliu): For debug - Output the filtered reconstructed video.
av1_dump_filtered_recon_frames(AV1_COMP * cpi)1425 void av1_dump_filtered_recon_frames(AV1_COMP *cpi) {
1426 AV1_COMMON *const cm = &cpi->common;
1427 const CurrentFrame *const current_frame = &cm->current_frame;
1428 const YV12_BUFFER_CONFIG *recon_buf = &cm->cur_frame->buf;
1429
1430 if (recon_buf == NULL) {
1431 printf("Frame %d is not ready.\n", current_frame->frame_number);
1432 return;
1433 }
1434
1435 static const int flag_list[REF_FRAMES] = { 0,
1436 AOM_LAST_FLAG,
1437 AOM_LAST2_FLAG,
1438 AOM_LAST3_FLAG,
1439 AOM_GOLD_FLAG,
1440 AOM_BWD_FLAG,
1441 AOM_ALT2_FLAG,
1442 AOM_ALT_FLAG };
1443 printf(
1444 "\n***Frame=%d (frame_offset=%d, show_frame=%d, "
1445 "show_existing_frame=%d) "
1446 "[LAST LAST2 LAST3 GOLDEN BWD ALT2 ALT]=[",
1447 current_frame->frame_number, current_frame->order_hint, cm->show_frame,
1448 cm->show_existing_frame);
1449 for (int ref_frame = LAST_FRAME; ref_frame <= ALTREF_FRAME; ++ref_frame) {
1450 const RefCntBuffer *const buf = get_ref_frame_buf(cm, ref_frame);
1451 const int ref_offset = buf != NULL ? (int)buf->order_hint : -1;
1452 printf(" %d(%c)", ref_offset,
1453 (cpi->ref_frame_flags & flag_list[ref_frame]) ? 'Y' : 'N');
1454 }
1455 printf(" ]\n");
1456
1457 if (!cm->show_frame) {
1458 printf("Frame %d is a no show frame, so no image dump.\n",
1459 current_frame->frame_number);
1460 return;
1461 }
1462
1463 int h;
1464 char file_name[256] = "/tmp/enc_filtered_recon.yuv";
1465 FILE *f_recon = NULL;
1466
1467 if (current_frame->frame_number == 0) {
1468 if ((f_recon = fopen(file_name, "wb")) == NULL) {
1469 printf("Unable to open file %s to write.\n", file_name);
1470 return;
1471 }
1472 } else {
1473 if ((f_recon = fopen(file_name, "ab")) == NULL) {
1474 printf("Unable to open file %s to append.\n", file_name);
1475 return;
1476 }
1477 }
1478 printf(
1479 "\nFrame=%5d, encode_update_type[%5d]=%1d, frame_offset=%d, "
1480 "show_frame=%d, show_existing_frame=%d, source_alt_ref_active=%d, "
1481 "refresh_alt_ref_frame=%d, "
1482 "y_stride=%4d, uv_stride=%4d, cm->width=%4d, cm->height=%4d\n\n",
1483 current_frame->frame_number, cpi->gf_frame_index,
1484 cpi->ppi->gf_group.update_type[cpi->gf_frame_index],
1485 current_frame->order_hint, cm->show_frame, cm->show_existing_frame,
1486 cpi->rc.source_alt_ref_active, cpi->refresh_frame.alt_ref_frame,
1487 recon_buf->y_stride, recon_buf->uv_stride, cm->width, cm->height);
1488 #if 0
1489 int ref_frame;
1490 printf("get_ref_frame_map_idx: [");
1491 for (ref_frame = LAST_FRAME; ref_frame <= ALTREF_FRAME; ++ref_frame)
1492 printf(" %d", get_ref_frame_map_idx(cm, ref_frame));
1493 printf(" ]\n");
1494 #endif // 0
1495
1496 // --- Y ---
1497 for (h = 0; h < cm->height; ++h) {
1498 fwrite(&recon_buf->y_buffer[h * recon_buf->y_stride], 1, cm->width,
1499 f_recon);
1500 }
1501 // --- U ---
1502 for (h = 0; h < (cm->height >> 1); ++h) {
1503 fwrite(&recon_buf->u_buffer[h * recon_buf->uv_stride], 1, (cm->width >> 1),
1504 f_recon);
1505 }
1506 // --- V ---
1507 for (h = 0; h < (cm->height >> 1); ++h) {
1508 fwrite(&recon_buf->v_buffer[h * recon_buf->uv_stride], 1, (cm->width >> 1),
1509 f_recon);
1510 }
1511
1512 fclose(f_recon);
1513 }
1514 #endif // DUMP_RECON_FRAMES
1515