1 /*
2 * Copyright © Microsoft Corporation
3 *
4 * Permission is hereby granted, free of charge, to any person obtaining a
5 * copy of this software and associated documentation files (the "Software"),
6 * to deal in the Software without restriction, including without limitation
7 * the rights to use, copy, modify, merge, publish, distribute, sublicense,
8 * and/or sell copies of the Software, and to permit persons to whom the
9 * Software is furnished to do so, subject to the following conditions:
10 *
11 * The above copyright notice and this permission notice (including the next
12 * paragraph) shall be included in all copies or substantial portions of the
13 * Software.
14 *
15 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
16 * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
17 * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL
18 * THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
19 * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING
20 * FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS
21 * IN THE SOFTWARE.
22 */
23
24 #include "d3d12_video_enc.h"
25 #include "d3d12_video_enc_av1.h"
26 #include "util/u_video.h"
27 #include "d3d12_resource.h"
28 #include "d3d12_screen.h"
29 #include "d3d12_format.h"
30 #include <cmath>
31 #include <numeric>
32
33 void
d3d12_video_encoder_update_current_rate_control_av1(struct d3d12_video_encoder * pD3D12Enc,pipe_av1_enc_picture_desc * picture)34 d3d12_video_encoder_update_current_rate_control_av1(struct d3d12_video_encoder *pD3D12Enc,
35 pipe_av1_enc_picture_desc *picture)
36 {
37 assert(picture->temporal_id < ARRAY_SIZE(pipe_av1_enc_picture_desc::rc));
38 assert(picture->temporal_id < ARRAY_SIZE(D3D12EncodeConfiguration::m_encoderRateControlDesc));
39
40 struct D3D12EncodeRateControlState m_prevRCState = pD3D12Enc->m_currentEncodeConfig.m_encoderRateControlDesc[picture->temporal_id];
41 pD3D12Enc->m_currentEncodeConfig.m_activeRateControlIndex = picture->temporal_id;
42 pD3D12Enc->m_currentEncodeConfig.m_encoderRateControlDesc[picture->temporal_id] = {};
43 pD3D12Enc->m_currentEncodeConfig.m_encoderRateControlDesc[picture->temporal_id].m_FrameRate.Numerator = picture->rc[picture->temporal_id].frame_rate_num;
44 pD3D12Enc->m_currentEncodeConfig.m_encoderRateControlDesc[picture->temporal_id].m_FrameRate.Denominator = picture->rc[picture->temporal_id].frame_rate_den;
45 pD3D12Enc->m_currentEncodeConfig.m_encoderRateControlDesc[picture->temporal_id].m_Flags = D3D12_VIDEO_ENCODER_RATE_CONTROL_FLAG_NONE;
46
47 if (picture->roi.num > 0)
48 pD3D12Enc->m_currentEncodeConfig.m_encoderRateControlDesc[picture->temporal_id].m_Flags |=
49 D3D12_VIDEO_ENCODER_RATE_CONTROL_FLAG_ENABLE_DELTA_QP;
50
51 switch (picture->rc[picture->temporal_id].rate_ctrl_method) {
52 case PIPE_H2645_ENC_RATE_CONTROL_METHOD_VARIABLE_SKIP:
53 case PIPE_H2645_ENC_RATE_CONTROL_METHOD_VARIABLE:
54 {
55 pD3D12Enc->m_currentEncodeConfig.m_encoderRateControlDesc[picture->temporal_id].m_Mode = D3D12_VIDEO_ENCODER_RATE_CONTROL_MODE_VBR;
56 pD3D12Enc->m_currentEncodeConfig.m_encoderRateControlDesc[picture->temporal_id].m_Config.m_Configuration_VBR.TargetAvgBitRate =
57 picture->rc[picture->temporal_id].target_bitrate;
58 pD3D12Enc->m_currentEncodeConfig.m_encoderRateControlDesc[picture->temporal_id].m_Config.m_Configuration_VBR.PeakBitRate =
59 picture->rc[picture->temporal_id].peak_bitrate;
60
61 if (D3D12_VIDEO_ENC_CBR_FORCE_VBV_EQUAL_BITRATE) {
62 debug_printf(
63 "[d3d12_video_encoder_av1] d3d12_video_encoder_update_current_rate_control_av1 "
64 "D3D12_VIDEO_ENC_CBR_FORCE_VBV_EQUAL_BITRATE environment variable is set, "
65 ", forcing VBV Size = VBV Initial Capacity = Target Bitrate = %" PRIu64 " (bits)\n",
66 pD3D12Enc->m_currentEncodeConfig.m_encoderRateControlDesc[picture->temporal_id].m_Config.m_Configuration_CBR.TargetBitRate);
67 pD3D12Enc->m_currentEncodeConfig.m_encoderRateControlDesc[picture->temporal_id].m_Flags |=
68 D3D12_VIDEO_ENCODER_RATE_CONTROL_FLAG_ENABLE_VBV_SIZES;
69 pD3D12Enc->m_currentEncodeConfig.m_encoderRateControlDesc[picture->temporal_id].m_Config.m_Configuration_CBR.VBVCapacity =
70 pD3D12Enc->m_currentEncodeConfig.m_encoderRateControlDesc[picture->temporal_id].m_Config.m_Configuration_CBR.TargetBitRate;
71 pD3D12Enc->m_currentEncodeConfig.m_encoderRateControlDesc[picture->temporal_id].m_Config.m_Configuration_CBR.InitialVBVFullness =
72 pD3D12Enc->m_currentEncodeConfig.m_encoderRateControlDesc[picture->temporal_id].m_Config.m_Configuration_CBR.TargetBitRate;
73 } else if (picture->rc[picture->temporal_id].app_requested_hrd_buffer) {
74 debug_printf(
75 "[d3d12_video_encoder_av1] d3d12_video_encoder_update_current_rate_control_av1 HRD required by app,"
76 " setting VBV Size = %d (bits) - VBV Initial Capacity %d (bits)\n",
77 picture->rc[picture->temporal_id].vbv_buffer_size,
78 picture->rc[picture->temporal_id].vbv_buf_initial_size);
79 pD3D12Enc->m_currentEncodeConfig.m_encoderRateControlDesc[picture->temporal_id].m_Flags |=
80 D3D12_VIDEO_ENCODER_RATE_CONTROL_FLAG_ENABLE_VBV_SIZES;
81 pD3D12Enc->m_currentEncodeConfig.m_encoderRateControlDesc[picture->temporal_id].m_Config.m_Configuration_VBR.VBVCapacity =
82 picture->rc[picture->temporal_id].vbv_buffer_size;
83 pD3D12Enc->m_currentEncodeConfig.m_encoderRateControlDesc[picture->temporal_id].m_Config.m_Configuration_VBR.InitialVBVFullness =
84 picture->rc[picture->temporal_id].vbv_buf_initial_size;
85 }
86
87 pD3D12Enc->m_currentEncodeConfig.m_encoderRateControlDesc[picture->temporal_id].max_frame_size = picture->rc[picture->temporal_id].max_au_size;
88 if (picture->rc[picture->temporal_id].max_au_size > 0) {
89 pD3D12Enc->m_currentEncodeConfig.m_encoderRateControlDesc[picture->temporal_id].m_Flags |=
90 D3D12_VIDEO_ENCODER_RATE_CONTROL_FLAG_ENABLE_MAX_FRAME_SIZE;
91 pD3D12Enc->m_currentEncodeConfig.m_encoderRateControlDesc[picture->temporal_id].m_Config.m_Configuration_VBR.MaxFrameBitSize =
92 picture->rc[picture->temporal_id].max_au_size;
93
94 debug_printf(
95 "[d3d12_video_encoder_av1] d3d12_video_encoder_update_current_rate_control_av1 "
96 "Upper layer requested explicit MaxFrameBitSize: %" PRIu64 "\n",
97 pD3D12Enc->m_currentEncodeConfig.m_encoderRateControlDesc[picture->temporal_id].m_Config.m_Configuration_VBR.MaxFrameBitSize);
98 }
99
100 if (picture->rc[picture->temporal_id].app_requested_qp_range) {
101 debug_printf("[d3d12_video_encoder_av1] d3d12_video_encoder_update_current_rate_control_av1 "
102 "Upper layer requested explicit MinQP: %d MaxQP: %d\n",
103 picture->rc[picture->temporal_id].min_qp,
104 picture->rc[picture->temporal_id].max_qp);
105 pD3D12Enc->m_currentEncodeConfig.m_encoderRateControlDesc[picture->temporal_id].m_Flags |=
106 D3D12_VIDEO_ENCODER_RATE_CONTROL_FLAG_ENABLE_QP_RANGE;
107 pD3D12Enc->m_currentEncodeConfig.m_encoderRateControlDesc[picture->temporal_id].m_Config.m_Configuration_VBR.MinQP =
108 picture->rc[picture->temporal_id].min_qp;
109 pD3D12Enc->m_currentEncodeConfig.m_encoderRateControlDesc[picture->temporal_id].m_Config.m_Configuration_VBR.MaxQP =
110 picture->rc[picture->temporal_id].max_qp;
111 }
112
113 if (picture->quality_modes.level > 0) {
114 pD3D12Enc->m_currentEncodeConfig.m_encoderRateControlDesc[picture->temporal_id].m_Flags |=
115 D3D12_VIDEO_ENCODER_RATE_CONTROL_FLAG_ENABLE_QUALITY_VS_SPEED;
116 pD3D12Enc->m_currentEncodeConfig.m_encoderRateControlDesc[picture->temporal_id].m_Flags |=
117 D3D12_VIDEO_ENCODER_RATE_CONTROL_FLAG_ENABLE_EXTENSION1_SUPPORT;
118
119 // Convert between D3D12 definition and PIPE definition
120 // D3D12: QualityVsSpeed must be in the range [0, D3D12_FEATURE_DATA_VIDEO_ENCODER_SUPPORT1.MaxQualityVsSpeed]
121 // The lower the value, the fastest the encode operation
122 // PIPE: The quality level range can be queried through the VAConfigAttribEncQualityRange attribute.
123 // A lower value means higher quality, and a value of 1 represents the highest quality.
124 // The quality level setting is used as a trade-off between quality and speed/power
125 // consumption, with higher quality corresponds to lower speed and higher power consumption.
126
127 pD3D12Enc->m_currentEncodeConfig.m_encoderRateControlDesc[picture->temporal_id].m_Config.m_Configuration_VBR1.QualityVsSpeed =
128 pD3D12Enc->max_quality_levels - picture->quality_modes.level;
129 }
130
131 } break;
132 case PIPE_H2645_ENC_RATE_CONTROL_METHOD_QUALITY_VARIABLE:
133 {
134 pD3D12Enc->m_currentEncodeConfig.m_encoderRateControlDesc[picture->temporal_id].m_Mode = D3D12_VIDEO_ENCODER_RATE_CONTROL_MODE_QVBR;
135 pD3D12Enc->m_currentEncodeConfig.m_encoderRateControlDesc[picture->temporal_id].m_Config.m_Configuration_QVBR.TargetAvgBitRate =
136 picture->rc[picture->temporal_id].target_bitrate;
137 pD3D12Enc->m_currentEncodeConfig.m_encoderRateControlDesc[picture->temporal_id].m_Config.m_Configuration_QVBR.PeakBitRate =
138 picture->rc[picture->temporal_id].peak_bitrate;
139 pD3D12Enc->m_currentEncodeConfig.m_encoderRateControlDesc[picture->temporal_id].m_Config.m_Configuration_QVBR.ConstantQualityTarget =
140 picture->rc[picture->temporal_id].vbr_quality_factor;
141
142 if (D3D12_VIDEO_ENC_CBR_FORCE_VBV_EQUAL_BITRATE) {
143 debug_printf("[d3d12_video_encoder_av1] d3d12_video_encoder_update_current_rate_control_av1 "
144 "D3D12_VIDEO_ENC_CBR_FORCE_VBV_EQUAL_BITRATE environment variable is set, "
145 ", forcing VBV Size = VBV Initial Capacity = Target Bitrate = %" PRIu64 " (bits)\n",
146 pD3D12Enc->m_currentEncodeConfig.m_encoderRateControlDesc[picture->temporal_id].m_Config.m_Configuration_QVBR1
147 .TargetAvgBitRate);
148 pD3D12Enc->m_currentEncodeConfig.m_encoderRateControlDesc[picture->temporal_id].m_Flags |=
149 D3D12_VIDEO_ENCODER_RATE_CONTROL_FLAG_ENABLE_VBV_SIZES;
150 pD3D12Enc->m_currentEncodeConfig.m_encoderRateControlDesc[picture->temporal_id].m_Flags |=
151 D3D12_VIDEO_ENCODER_RATE_CONTROL_FLAG_ENABLE_EXTENSION1_SUPPORT;
152 pD3D12Enc->m_currentEncodeConfig.m_encoderRateControlDesc[picture->temporal_id].m_Config.m_Configuration_QVBR1.VBVCapacity =
153 pD3D12Enc->m_currentEncodeConfig.m_encoderRateControlDesc[picture->temporal_id].m_Config.m_Configuration_QVBR1.TargetAvgBitRate;
154 pD3D12Enc->m_currentEncodeConfig.m_encoderRateControlDesc[picture->temporal_id].m_Config.m_Configuration_QVBR1.InitialVBVFullness =
155 pD3D12Enc->m_currentEncodeConfig.m_encoderRateControlDesc[picture->temporal_id].m_Config.m_Configuration_QVBR1.TargetAvgBitRate;
156 } else if (picture->rc[picture->temporal_id].app_requested_hrd_buffer) {
157 debug_printf(
158 "[d3d12_video_encoder_av1] d3d12_video_encoder_update_current_rate_control_av1 HRD required by app,"
159 " setting VBV Size = %d (bits) - VBV Initial Capacity %d (bits)\n",
160 picture->rc[picture->temporal_id].vbv_buffer_size,
161 picture->rc[picture->temporal_id].vbv_buf_initial_size);
162 pD3D12Enc->m_currentEncodeConfig.m_encoderRateControlDesc[picture->temporal_id].m_Flags |=
163 D3D12_VIDEO_ENCODER_RATE_CONTROL_FLAG_ENABLE_VBV_SIZES;
164 pD3D12Enc->m_currentEncodeConfig.m_encoderRateControlDesc[picture->temporal_id].m_Flags |=
165 D3D12_VIDEO_ENCODER_RATE_CONTROL_FLAG_ENABLE_EXTENSION1_SUPPORT;
166 pD3D12Enc->m_currentEncodeConfig.m_encoderRateControlDesc[picture->temporal_id].m_Config.m_Configuration_QVBR1.VBVCapacity =
167 picture->rc[picture->temporal_id].vbv_buffer_size;
168 pD3D12Enc->m_currentEncodeConfig.m_encoderRateControlDesc[picture->temporal_id].m_Config.m_Configuration_QVBR1.InitialVBVFullness =
169 picture->rc[picture->temporal_id].vbv_buf_initial_size;
170 }
171 pD3D12Enc->m_currentEncodeConfig.m_encoderRateControlDesc[picture->temporal_id].max_frame_size = picture->rc[picture->temporal_id].max_au_size;
172 if (picture->rc[picture->temporal_id].max_au_size > 0) {
173 pD3D12Enc->m_currentEncodeConfig.m_encoderRateControlDesc[picture->temporal_id].m_Flags |=
174 D3D12_VIDEO_ENCODER_RATE_CONTROL_FLAG_ENABLE_MAX_FRAME_SIZE;
175 pD3D12Enc->m_currentEncodeConfig.m_encoderRateControlDesc[picture->temporal_id].m_Config.m_Configuration_QVBR.MaxFrameBitSize =
176 picture->rc[picture->temporal_id].max_au_size;
177
178 debug_printf(
179 "[d3d12_video_encoder_av1] d3d12_video_encoder_update_current_rate_control_av1 "
180 "Upper layer requested explicit MaxFrameBitSize: %" PRIu64 "\n",
181 pD3D12Enc->m_currentEncodeConfig.m_encoderRateControlDesc[picture->temporal_id].m_Config.m_Configuration_QVBR.MaxFrameBitSize);
182 }
183
184 if (picture->rc[picture->temporal_id].app_requested_qp_range) {
185 debug_printf("[d3d12_video_encoder_av1] d3d12_video_encoder_update_current_rate_control_av1 "
186 "Upper layer requested explicit MinQP: %d MaxQP: %d\n",
187 picture->rc[picture->temporal_id].min_qp,
188 picture->rc[picture->temporal_id].max_qp);
189 pD3D12Enc->m_currentEncodeConfig.m_encoderRateControlDesc[picture->temporal_id].m_Flags |=
190 D3D12_VIDEO_ENCODER_RATE_CONTROL_FLAG_ENABLE_QP_RANGE;
191 pD3D12Enc->m_currentEncodeConfig.m_encoderRateControlDesc[picture->temporal_id].m_Config.m_Configuration_QVBR.MinQP =
192 picture->rc[picture->temporal_id].min_qp;
193 pD3D12Enc->m_currentEncodeConfig.m_encoderRateControlDesc[picture->temporal_id].m_Config.m_Configuration_QVBR.MaxQP =
194 picture->rc[picture->temporal_id].max_qp;
195 }
196
197 if (picture->quality_modes.level > 0) {
198 pD3D12Enc->m_currentEncodeConfig.m_encoderRateControlDesc[picture->temporal_id].m_Flags |=
199 D3D12_VIDEO_ENCODER_RATE_CONTROL_FLAG_ENABLE_QUALITY_VS_SPEED;
200 pD3D12Enc->m_currentEncodeConfig.m_encoderRateControlDesc[picture->temporal_id].m_Flags |=
201 D3D12_VIDEO_ENCODER_RATE_CONTROL_FLAG_ENABLE_EXTENSION1_SUPPORT;
202
203 // Convert between D3D12 definition and PIPE definition
204 // D3D12: QualityVsSpeed must be in the range [0, D3D12_FEATURE_DATA_VIDEO_ENCODER_SUPPORT1.MaxQualityVsSpeed]
205 // The lower the value, the fastest the encode operation
206 // PIPE: The quality level range can be queried through the VAConfigAttribEncQualityRange attribute.
207 // A lower value means higher quality, and a value of 1 represents the highest quality.
208 // The quality level setting is used as a trade-off between quality and speed/power
209 // consumption, with higher quality corresponds to lower speed and higher power consumption.
210
211 pD3D12Enc->m_currentEncodeConfig.m_encoderRateControlDesc[picture->temporal_id].m_Config.m_Configuration_QVBR1.QualityVsSpeed =
212 pD3D12Enc->max_quality_levels - picture->quality_modes.level;
213 }
214
215 } break;
216 case PIPE_H2645_ENC_RATE_CONTROL_METHOD_CONSTANT_SKIP:
217 case PIPE_H2645_ENC_RATE_CONTROL_METHOD_CONSTANT:
218 {
219 pD3D12Enc->m_currentEncodeConfig.m_encoderRateControlDesc[picture->temporal_id].m_Mode = D3D12_VIDEO_ENCODER_RATE_CONTROL_MODE_CBR;
220 pD3D12Enc->m_currentEncodeConfig.m_encoderRateControlDesc[picture->temporal_id].m_Config.m_Configuration_CBR.TargetBitRate =
221 picture->rc[picture->temporal_id].target_bitrate;
222
223 /* For CBR mode, to guarantee bitrate of generated stream complies with
224 * target bitrate (e.g. no over +/-10%), vbv_buffer_size and initial capacity should be same
225 * as target bitrate. Controlled by OS env var D3D12_VIDEO_ENC_CBR_FORCE_VBV_EQUAL_BITRATE
226 */
227 if (D3D12_VIDEO_ENC_CBR_FORCE_VBV_EQUAL_BITRATE) {
228 debug_printf(
229 "[d3d12_video_encoder_av1] d3d12_video_encoder_update_current_rate_control_av1 "
230 "D3D12_VIDEO_ENC_CBR_FORCE_VBV_EQUAL_BITRATE environment variable is set, "
231 ", forcing VBV Size = VBV Initial Capacity = Target Bitrate = %" PRIu64 " (bits)\n",
232 pD3D12Enc->m_currentEncodeConfig.m_encoderRateControlDesc[picture->temporal_id].m_Config.m_Configuration_CBR.TargetBitRate);
233 pD3D12Enc->m_currentEncodeConfig.m_encoderRateControlDesc[picture->temporal_id].m_Flags |=
234 D3D12_VIDEO_ENCODER_RATE_CONTROL_FLAG_ENABLE_VBV_SIZES;
235 pD3D12Enc->m_currentEncodeConfig.m_encoderRateControlDesc[picture->temporal_id].m_Config.m_Configuration_CBR.VBVCapacity =
236 pD3D12Enc->m_currentEncodeConfig.m_encoderRateControlDesc[picture->temporal_id].m_Config.m_Configuration_CBR.TargetBitRate;
237 pD3D12Enc->m_currentEncodeConfig.m_encoderRateControlDesc[picture->temporal_id].m_Config.m_Configuration_CBR.InitialVBVFullness =
238 pD3D12Enc->m_currentEncodeConfig.m_encoderRateControlDesc[picture->temporal_id].m_Config.m_Configuration_CBR.TargetBitRate;
239 } else if (picture->rc[picture->temporal_id].app_requested_hrd_buffer) {
240 debug_printf(
241 "[d3d12_video_encoder_av1] d3d12_video_encoder_update_current_rate_control_av1 HRD required by app,"
242 " setting VBV Size = %d (bits) - VBV Initial Capacity %d (bits)\n",
243 picture->rc[picture->temporal_id].vbv_buffer_size,
244 picture->rc[picture->temporal_id].vbv_buf_initial_size);
245 pD3D12Enc->m_currentEncodeConfig.m_encoderRateControlDesc[picture->temporal_id].m_Flags |=
246 D3D12_VIDEO_ENCODER_RATE_CONTROL_FLAG_ENABLE_VBV_SIZES;
247 pD3D12Enc->m_currentEncodeConfig.m_encoderRateControlDesc[picture->temporal_id].m_Config.m_Configuration_CBR.VBVCapacity =
248 picture->rc[picture->temporal_id].vbv_buffer_size;
249 pD3D12Enc->m_currentEncodeConfig.m_encoderRateControlDesc[picture->temporal_id].m_Config.m_Configuration_CBR.InitialVBVFullness =
250 picture->rc[picture->temporal_id].vbv_buf_initial_size;
251 }
252
253 pD3D12Enc->m_currentEncodeConfig.m_encoderRateControlDesc[picture->temporal_id].max_frame_size = picture->rc[picture->temporal_id].max_au_size;
254 if (picture->rc[picture->temporal_id].max_au_size > 0) {
255 pD3D12Enc->m_currentEncodeConfig.m_encoderRateControlDesc[picture->temporal_id].m_Flags |=
256 D3D12_VIDEO_ENCODER_RATE_CONTROL_FLAG_ENABLE_MAX_FRAME_SIZE;
257 pD3D12Enc->m_currentEncodeConfig.m_encoderRateControlDesc[picture->temporal_id].m_Config.m_Configuration_CBR.MaxFrameBitSize =
258 picture->rc[picture->temporal_id].max_au_size;
259
260 debug_printf(
261 "[d3d12_video_encoder_av1] d3d12_video_encoder_update_current_rate_control_av1 "
262 "Upper layer requested explicit MaxFrameBitSize: %" PRIu64 "\n",
263 pD3D12Enc->m_currentEncodeConfig.m_encoderRateControlDesc[picture->temporal_id].m_Config.m_Configuration_CBR.MaxFrameBitSize);
264 }
265
266 if (picture->rc[picture->temporal_id].app_requested_qp_range) {
267 debug_printf("[d3d12_video_encoder_av1] d3d12_video_encoder_update_current_rate_control_av1 "
268 "Upper layer requested explicit MinQP: %d MaxQP: %d\n",
269 picture->rc[picture->temporal_id].min_qp,
270 picture->rc[picture->temporal_id].max_qp);
271
272 pD3D12Enc->m_currentEncodeConfig.m_encoderRateControlDesc[picture->temporal_id].m_Flags |=
273 D3D12_VIDEO_ENCODER_RATE_CONTROL_FLAG_ENABLE_QP_RANGE;
274 pD3D12Enc->m_currentEncodeConfig.m_encoderRateControlDesc[picture->temporal_id].m_Config.m_Configuration_CBR.MinQP =
275 picture->rc[picture->temporal_id].min_qp;
276 pD3D12Enc->m_currentEncodeConfig.m_encoderRateControlDesc[picture->temporal_id].m_Config.m_Configuration_CBR.MaxQP =
277 picture->rc[picture->temporal_id].max_qp;
278 }
279
280 if (picture->quality_modes.level > 0) {
281 pD3D12Enc->m_currentEncodeConfig.m_encoderRateControlDesc[picture->temporal_id].m_Flags |=
282 D3D12_VIDEO_ENCODER_RATE_CONTROL_FLAG_ENABLE_QUALITY_VS_SPEED;
283 pD3D12Enc->m_currentEncodeConfig.m_encoderRateControlDesc[picture->temporal_id].m_Flags |=
284 D3D12_VIDEO_ENCODER_RATE_CONTROL_FLAG_ENABLE_EXTENSION1_SUPPORT;
285
286 // Convert between D3D12 definition and PIPE definition
287 // D3D12: QualityVsSpeed must be in the range [0, D3D12_FEATURE_DATA_VIDEO_ENCODER_SUPPORT1.MaxQualityVsSpeed]
288 // The lower the value, the fastest the encode operation
289 // PIPE: The quality level range can be queried through the VAConfigAttribEncQualityRange attribute.
290 // A lower value means higher quality, and a value of 1 represents the highest quality.
291 // The quality level setting is used as a trade-off between quality and speed/power
292 // consumption, with higher quality corresponds to lower speed and higher power consumption.
293
294 pD3D12Enc->m_currentEncodeConfig.m_encoderRateControlDesc[picture->temporal_id].m_Config.m_Configuration_CBR1.QualityVsSpeed =
295 pD3D12Enc->max_quality_levels - picture->quality_modes.level;
296 }
297
298 } break;
299 case PIPE_H2645_ENC_RATE_CONTROL_METHOD_DISABLE:
300 {
301 // We need to initialize the QP value for all frame types on the first frame
302 // otherwise some drivers crash.
303 // frontends currently only send the QP values for the specific frame type of
304 // the current frame, so give a default value for all types until all frame
305 // types are configured on subsequent encode frame calls
306 if (pD3D12Enc->m_fenceValue == 1)
307 {
308 m_prevRCState.m_Config.m_Configuration_CQP
309 .ConstantQP_FullIntracodedFrame = 30 /* initial_qp_default */;
310 m_prevRCState.m_Config.m_Configuration_CQP
311 .ConstantQP_InterPredictedFrame_PrevRefOnly = 30 /* initial_qp_default */;
312 m_prevRCState.m_Config.m_Configuration_CQP
313 .ConstantQP_InterPredictedFrame_BiDirectionalRef = 30 /* initial_qp_default */;
314 }
315
316 pD3D12Enc->m_currentEncodeConfig.m_encoderRateControlDesc[picture->temporal_id].m_Mode = D3D12_VIDEO_ENCODER_RATE_CONTROL_MODE_CQP;
317 if (picture->rc[picture->temporal_id].app_requested_initial_qp) {
318 // Load previous RC state for all frames and only update the current frame
319 pD3D12Enc->m_currentEncodeConfig.m_encoderRateControlDesc[picture->temporal_id].m_Config.m_Configuration_CQP =
320 m_prevRCState.m_Config.m_Configuration_CQP;
321
322 if ((picture->frame_type == PIPE_AV1_ENC_FRAME_TYPE_INTRA_ONLY) ||
323 (picture->frame_type == PIPE_AV1_ENC_FRAME_TYPE_KEY)) {
324 // Update intra frame qp
325 pD3D12Enc->m_currentEncodeConfig.m_encoderRateControlDesc[picture->temporal_id].m_Config.m_Configuration_CQP
326 .ConstantQP_FullIntracodedFrame = picture->rc[picture->temporal_id].qp;
327 } else {
328 // Update inter frame QP config
329 pD3D12Enc->m_currentEncodeConfig.m_encoderRateControlDesc[picture->temporal_id].m_Config.m_Configuration_CQP
330 .ConstantQP_InterPredictedFrame_PrevRefOnly = picture->rc[picture->temporal_id].qp_inter;
331 pD3D12Enc->m_currentEncodeConfig.m_encoderRateControlDesc[picture->temporal_id].m_Config.m_Configuration_CQP
332 .ConstantQP_InterPredictedFrame_BiDirectionalRef = picture->rc[picture->temporal_id].qp_inter;
333 }
334 }
335
336 if (picture->quality_modes.level > 0) {
337 pD3D12Enc->m_currentEncodeConfig.m_encoderRateControlDesc[picture->temporal_id].m_Flags |=
338 D3D12_VIDEO_ENCODER_RATE_CONTROL_FLAG_ENABLE_QUALITY_VS_SPEED;
339 pD3D12Enc->m_currentEncodeConfig.m_encoderRateControlDesc[picture->temporal_id].m_Flags |=
340 D3D12_VIDEO_ENCODER_RATE_CONTROL_FLAG_ENABLE_EXTENSION1_SUPPORT;
341 // Convert between D3D12 definition and PIPE definition
342 // D3D12: QualityVsSpeed must be in the range [0, D3D12_FEATURE_DATA_VIDEO_ENCODER_SUPPORT1.MaxQualityVsSpeed]
343 // The lower the value, the fastest the encode operation
344 // PIPE: The quality level range can be queried through the VAConfigAttribEncQualityRange attribute.
345 // A lower value means higher quality, and a value of 1 represents the highest quality.
346 // The quality level setting is used as a trade-off between quality and speed/power
347 // consumption, with higher quality corresponds to lower speed and higher power consumption.
348
349 pD3D12Enc->m_currentEncodeConfig.m_encoderRateControlDesc[picture->temporal_id].m_Config.m_Configuration_CQP1.QualityVsSpeed =
350 pD3D12Enc->max_quality_levels - picture->quality_modes.level;
351 }
352 } break;
353 default:
354 {
355 debug_printf("[d3d12_video_encoder_av1] d3d12_video_encoder_update_current_rate_control_av1 invalid RC "
356 "config, using default RC CQP mode\n");
357 pD3D12Enc->m_currentEncodeConfig.m_encoderRateControlDesc[picture->temporal_id].m_Mode = D3D12_VIDEO_ENCODER_RATE_CONTROL_MODE_CQP;
358 pD3D12Enc->m_currentEncodeConfig.m_encoderRateControlDesc[picture->temporal_id].m_Config.m_Configuration_CQP
359 .ConstantQP_FullIntracodedFrame = 30;
360 pD3D12Enc->m_currentEncodeConfig.m_encoderRateControlDesc[picture->temporal_id].m_Config.m_Configuration_CQP
361 .ConstantQP_InterPredictedFrame_PrevRefOnly = 30;
362 pD3D12Enc->m_currentEncodeConfig.m_encoderRateControlDesc[picture->temporal_id].m_Config.m_Configuration_CQP
363 .ConstantQP_InterPredictedFrame_BiDirectionalRef = 30;
364 } break;
365 }
366 }
367
368 //
369 // Returns AV1 extra size on top of the usual base metadata layout size
370 //
371 size_t
d3d12_video_encoder_calculate_metadata_resolved_buffer_size_av1(uint32_t maxSliceNumber)372 d3d12_video_encoder_calculate_metadata_resolved_buffer_size_av1(uint32_t maxSliceNumber)
373 {
374 return sizeof(D3D12_VIDEO_ENCODER_AV1_PICTURE_CONTROL_SUBREGIONS_LAYOUT_DATA_TILES) +
375 sizeof(D3D12_VIDEO_ENCODER_AV1_POST_ENCODE_VALUES);
376 }
377
378 void
d3d12_video_encoder_convert_d3d12_to_spec_level_av1(D3D12_VIDEO_ENCODER_AV1_LEVELS level12,uint32_t & specLevel)379 d3d12_video_encoder_convert_d3d12_to_spec_level_av1(D3D12_VIDEO_ENCODER_AV1_LEVELS level12, uint32_t &specLevel)
380 {
381 // Enum matches values as in seq_level_idx
382 specLevel = (uint32_t) level12;
383 }
384
385 void
d3d12_video_encoder_convert_d3d12_to_spec_tier_av1(D3D12_VIDEO_ENCODER_AV1_TIER tier12,uint32_t & specTier)386 d3d12_video_encoder_convert_d3d12_to_spec_tier_av1(D3D12_VIDEO_ENCODER_AV1_TIER tier12, uint32_t &specTier)
387 {
388 // Enum matches values as in seq_level_idx
389 specTier = (uint32_t) tier12;
390 }
391
392 void
d3d12_video_encoder_convert_spec_to_d3d12_level_av1(uint32_t specLevel,D3D12_VIDEO_ENCODER_AV1_LEVELS & level12)393 d3d12_video_encoder_convert_spec_to_d3d12_level_av1(uint32_t specLevel, D3D12_VIDEO_ENCODER_AV1_LEVELS &level12)
394 {
395 // Enum matches values as in seq_level_idx
396 level12 = (D3D12_VIDEO_ENCODER_AV1_LEVELS) specLevel;
397 }
398
399 void
d3d12_video_encoder_convert_spec_to_d3d12_tier_av1(uint32_t specTier,D3D12_VIDEO_ENCODER_AV1_TIER & tier12)400 d3d12_video_encoder_convert_spec_to_d3d12_tier_av1(uint32_t specTier, D3D12_VIDEO_ENCODER_AV1_TIER &tier12)
401 {
402 // Enum matches values as in seq_tier
403 tier12 = (D3D12_VIDEO_ENCODER_AV1_TIER) specTier;
404 }
405
406 uint32_t
d3d12_video_encoder_convert_d3d12_profile_to_spec_profile_av1(D3D12_VIDEO_ENCODER_AV1_PROFILE profile)407 d3d12_video_encoder_convert_d3d12_profile_to_spec_profile_av1(D3D12_VIDEO_ENCODER_AV1_PROFILE profile)
408 {
409 switch (profile) {
410 case D3D12_VIDEO_ENCODER_AV1_PROFILE_MAIN:
411 {
412 return 0;
413 } break;
414 default:
415 {
416 unreachable("Unsupported D3D12_VIDEO_ENCODER_AV1_PROFILE");
417 } break;
418 }
419 }
420
421 D3D12_VIDEO_ENCODER_AV1_PROFILE
d3d12_video_encoder_convert_profile_to_d3d12_enc_profile_av1(enum pipe_video_profile profile)422 d3d12_video_encoder_convert_profile_to_d3d12_enc_profile_av1(enum pipe_video_profile profile)
423 {
424 switch (profile) {
425 case PIPE_VIDEO_PROFILE_AV1_MAIN:
426 {
427 return D3D12_VIDEO_ENCODER_AV1_PROFILE_MAIN;
428 } break;
429 default:
430 {
431 unreachable("Unsupported pipe_video_profile");
432 } break;
433 }
434 }
435
436 bool
d3d12_video_encoder_update_av1_gop_configuration(struct d3d12_video_encoder * pD3D12Enc,pipe_av1_enc_picture_desc * picture)437 d3d12_video_encoder_update_av1_gop_configuration(struct d3d12_video_encoder *pD3D12Enc,
438 pipe_av1_enc_picture_desc *picture)
439 {
440 static_assert((unsigned) D3D12_VIDEO_ENCODER_AV1_FRAME_TYPE_KEY_FRAME == (unsigned) PIPE_AV1_ENC_FRAME_TYPE_KEY);
441 static_assert((unsigned) D3D12_VIDEO_ENCODER_AV1_FRAME_TYPE_INTER_FRAME == (unsigned) PIPE_AV1_ENC_FRAME_TYPE_INTER);
442 static_assert((unsigned) D3D12_VIDEO_ENCODER_AV1_FRAME_TYPE_INTRA_ONLY_FRAME ==
443 (unsigned) PIPE_AV1_ENC_FRAME_TYPE_INTRA_ONLY);
444 static_assert((unsigned) D3D12_VIDEO_ENCODER_AV1_FRAME_TYPE_SWITCH_FRAME ==
445 (unsigned) PIPE_AV1_ENC_FRAME_TYPE_SWITCH);
446
447 // Only update GOP when it begins
448 // This triggers DPB/encoder/heap re-creation, so only check on IDR when a GOP might change
449 if ((picture->frame_type == PIPE_AV1_ENC_FRAME_TYPE_INTRA_ONLY) ||
450 (picture->frame_type == PIPE_AV1_ENC_FRAME_TYPE_KEY)) {
451 uint32_t GOPLength = picture->seq.intra_period;
452 uint32_t PPicturePeriod = picture->seq.ip_period;
453
454 // Set dirty flag if m_AV1SequenceStructure changed
455 auto previousGOPConfig = pD3D12Enc->m_currentEncodeConfig.m_encoderGOPConfigDesc.m_AV1SequenceStructure;
456 pD3D12Enc->m_currentEncodeConfig.m_encoderGOPConfigDesc.m_AV1SequenceStructure = {
457 GOPLength,
458 PPicturePeriod,
459 };
460
461 if (memcmp(&previousGOPConfig,
462 &pD3D12Enc->m_currentEncodeConfig.m_encoderGOPConfigDesc.m_AV1SequenceStructure,
463 sizeof(D3D12_VIDEO_ENCODER_AV1_SEQUENCE_STRUCTURE)) != 0) {
464 pD3D12Enc->m_currentEncodeConfig.m_ConfigDirtyFlags |= d3d12_video_encoder_config_dirty_flag_gop;
465 }
466 }
467 return true;
468 }
469
470 D3D12_VIDEO_ENCODER_MOTION_ESTIMATION_PRECISION_MODE
d3d12_video_encoder_convert_av1_motion_configuration(struct d3d12_video_encoder * pD3D12Enc,pipe_av1_enc_picture_desc * picture)471 d3d12_video_encoder_convert_av1_motion_configuration(struct d3d12_video_encoder *pD3D12Enc,
472 pipe_av1_enc_picture_desc *picture)
473 {
474 return D3D12_VIDEO_ENCODER_MOTION_ESTIMATION_PRECISION_MODE_MAXIMUM;
475 }
476
477 bool
d3d12_video_encoder_compare_tile_config_av1(D3D12_VIDEO_ENCODER_FRAME_SUBREGION_LAYOUT_MODE currentTilesMode,D3D12_VIDEO_ENCODER_FRAME_SUBREGION_LAYOUT_MODE requestedTilesMode,D3D12_VIDEO_ENCODER_AV1_PICTURE_CONTROL_SUBREGIONS_LAYOUT_DATA_TILES currentTilePartition,D3D12_VIDEO_ENCODER_AV1_PICTURE_CONTROL_SUBREGIONS_LAYOUT_DATA_TILES requestedTilePartition)478 d3d12_video_encoder_compare_tile_config_av1(
479 D3D12_VIDEO_ENCODER_FRAME_SUBREGION_LAYOUT_MODE currentTilesMode,
480 D3D12_VIDEO_ENCODER_FRAME_SUBREGION_LAYOUT_MODE requestedTilesMode,
481 D3D12_VIDEO_ENCODER_AV1_PICTURE_CONTROL_SUBREGIONS_LAYOUT_DATA_TILES currentTilePartition,
482 D3D12_VIDEO_ENCODER_AV1_PICTURE_CONTROL_SUBREGIONS_LAYOUT_DATA_TILES requestedTilePartition)
483 {
484 if (currentTilesMode != requestedTilesMode)
485 return false;
486
487 if (memcmp(¤tTilePartition,
488 &requestedTilePartition,
489 sizeof(D3D12_VIDEO_ENCODER_AV1_PICTURE_CONTROL_SUBREGIONS_LAYOUT_DATA_TILES)))
490 return false;
491
492 return true;
493 }
494
495 ///
496 /// Tries to configurate the encoder using the requested tile configuration
497 ///
498 bool
d3d12_video_encoder_negotiate_current_av1_tiles_configuration(struct d3d12_video_encoder * pD3D12Enc,pipe_av1_enc_picture_desc * pAV1Pic)499 d3d12_video_encoder_negotiate_current_av1_tiles_configuration(struct d3d12_video_encoder *pD3D12Enc,
500 pipe_av1_enc_picture_desc *pAV1Pic)
501 {
502 D3D12_VIDEO_ENCODER_AV1_PICTURE_CONTROL_SUBREGIONS_LAYOUT_DATA_TILES tilePartition = {};
503 tilePartition.RowCount = pAV1Pic->tile_rows;
504 tilePartition.ColCount = pAV1Pic->tile_cols;
505 tilePartition.ContextUpdateTileId = pAV1Pic->context_update_tile_id;
506
507 // VA-API interface has 63 entries for tile cols/rows. When 64 requested,
508 // last one has to be calculated from the frame width/height in superblocks.
509
510 // Copy the tile col sizes (up to 63 defined in VA-API interface array sizes)
511 size_t accum_cols_sb = 0;
512 uint8_t src_cols_count = MIN2(63, pAV1Pic->tile_cols);
513 for (uint8_t i = 0; i < src_cols_count; i++) {
514 tilePartition.ColWidths[i] = pAV1Pic->width_in_sbs_minus_1[i] + 1;
515 accum_cols_sb += tilePartition.ColWidths[i];
516 }
517
518 // If there are 64 cols, calculate the last one manually as the difference
519 // between frame width in sb minus the accumulated tiles sb sizes
520 if (pAV1Pic->tile_cols == 64)
521 tilePartition.ColWidths[63] = pAV1Pic->frame_width_sb - accum_cols_sb;
522
523 // Copy the tile row sizes (up to 63 defined in VA-API interface array sizes)
524 size_t accum_rows_sb = 0;
525 uint8_t src_rows_count = MIN2(63, pAV1Pic->tile_rows);
526 for (uint8_t i = 0; i < src_rows_count; i++) {
527 tilePartition.RowHeights[i] = pAV1Pic->height_in_sbs_minus_1[i] + 1;
528 accum_rows_sb += tilePartition.RowHeights[i];
529 }
530
531 // If there are 64 rows, calculate the last one manually as the difference
532 // between frame height in sb minus the accumulated tiles sb sizes
533 if (pAV1Pic->tile_rows == 64)
534 tilePartition.RowHeights[63] = pAV1Pic->frame_height_sb - accum_rows_sb;
535
536 // Iterate the tiles and see if they're uniformly partitioned to decide
537 // which D3D12 tile mode to use
538 // Ignore the last row and last col width
539 bool tilesUniform = !D3D12_VIDEO_FORCE_TILE_MODE && util_is_power_of_two_or_zero(tilePartition.RowCount) &&
540 util_is_power_of_two_or_zero(tilePartition.ColCount);
541 // Iterate again now that the 63/64 edge case has been handled above.
542 for (uint8_t i = 1; tilesUniform && (i < tilePartition.RowCount - 1) /* Ignore last row */; i++)
543 tilesUniform = tilesUniform && (tilePartition.RowHeights[i - 1] == tilePartition.RowHeights[i]);
544
545 for (uint8_t i = 1; tilesUniform && (i < tilePartition.ColCount - 1) /* Ignore last col */; i++)
546 tilesUniform = tilesUniform && (tilePartition.ColWidths[i - 1] == tilePartition.ColWidths[i]);
547
548 D3D12_VIDEO_ENCODER_FRAME_SUBREGION_LAYOUT_MODE requestedTilesMode =
549 tilesUniform ? D3D12_VIDEO_ENCODER_FRAME_SUBREGION_LAYOUT_MODE_UNIFORM_GRID_PARTITION :
550 D3D12_VIDEO_ENCODER_FRAME_SUBREGION_LAYOUT_MODE_CONFIGURABLE_GRID_PARTITION;
551
552 assert(pAV1Pic->num_tile_groups <= 128); // ARRAY_SIZE(TilesGroups)
553 pD3D12Enc->m_currentEncodeConfig.m_encoderSliceConfigDesc.m_TilesConfig_AV1.TilesGroupsCount =
554 pAV1Pic->num_tile_groups;
555 for (uint8_t i = 0; i < pAV1Pic->num_tile_groups; i++) {
556 pD3D12Enc->m_currentEncodeConfig.m_encoderSliceConfigDesc.m_TilesConfig_AV1.TilesGroups[i].tg_start =
557 pAV1Pic->tile_groups[i].tile_group_start;
558 pD3D12Enc->m_currentEncodeConfig.m_encoderSliceConfigDesc.m_TilesConfig_AV1.TilesGroups[i].tg_end =
559 pAV1Pic->tile_groups[i].tile_group_end;
560 }
561
562 if (!d3d12_video_encoder_compare_tile_config_av1(
563 pD3D12Enc->m_currentEncodeConfig.m_encoderSliceConfigMode,
564 requestedTilesMode,
565 pD3D12Enc->m_currentEncodeConfig.m_encoderSliceConfigDesc.m_TilesConfig_AV1.TilesPartition,
566 tilePartition)) {
567 pD3D12Enc->m_currentEncodeConfig.m_ConfigDirtyFlags |= d3d12_video_encoder_config_dirty_flag_slices;
568 }
569
570 // Update the encoder state with the tile config
571 pD3D12Enc->m_currentEncodeConfig.m_encoderSliceConfigMode = requestedTilesMode;
572 pD3D12Enc->m_currentEncodeConfig.m_encoderSliceConfigDesc.m_TilesConfig_AV1.TilesPartition = tilePartition;
573
574 D3D12_FEATURE_DATA_VIDEO_ENCODER_FRAME_SUBREGION_LAYOUT_CONFIG capDataTilesSupport = {};
575 capDataTilesSupport.NodeIndex = pD3D12Enc->m_NodeIndex;
576 capDataTilesSupport.Codec = D3D12_VIDEO_ENCODER_CODEC_AV1;
577 capDataTilesSupport.Profile.DataSize = sizeof(pD3D12Enc->m_currentEncodeConfig.m_encoderProfileDesc.m_AV1Profile);
578 capDataTilesSupport.Profile.pAV1Profile = &pD3D12Enc->m_currentEncodeConfig.m_encoderProfileDesc.m_AV1Profile;
579 capDataTilesSupport.Level.DataSize = sizeof(pD3D12Enc->m_currentEncodeConfig.m_encoderLevelDesc.m_AV1LevelSetting);
580 capDataTilesSupport.Level.pAV1LevelSetting = &pD3D12Enc->m_currentEncodeConfig.m_encoderLevelDesc.m_AV1LevelSetting;
581 capDataTilesSupport.FrameResolution.Width = pAV1Pic->frame_width;
582 capDataTilesSupport.FrameResolution.Height = pAV1Pic->frame_height;
583 capDataTilesSupport.SubregionMode = requestedTilesMode;
584 capDataTilesSupport.CodecSupport.DataSize =
585 sizeof(pD3D12Enc->m_currentEncodeCapabilities.m_encoderCodecSpecificConfigCaps.m_AV1TileCaps);
586 capDataTilesSupport.CodecSupport.pAV1Support =
587 &pD3D12Enc->m_currentEncodeCapabilities.m_encoderCodecSpecificConfigCaps.m_AV1TileCaps;
588 pD3D12Enc->m_currentEncodeCapabilities.m_encoderCodecSpecificConfigCaps.m_AV1TileCaps.Use128SuperBlocks = false;
589 // return units in 64x64 default size
590 pD3D12Enc->m_currentEncodeCapabilities.m_encoderCodecSpecificConfigCaps.m_AV1TileCaps.TilesConfiguration =
591 pD3D12Enc->m_currentEncodeConfig.m_encoderSliceConfigDesc.m_TilesConfig_AV1.TilesPartition;
592 HRESULT hr =
593 pD3D12Enc->m_spD3D12VideoDevice->CheckFeatureSupport(D3D12_FEATURE_VIDEO_ENCODER_FRAME_SUBREGION_LAYOUT_CONFIG,
594 &capDataTilesSupport,
595 sizeof(capDataTilesSupport));
596 if (FAILED(hr) || !capDataTilesSupport.IsSupported) {
597 debug_printf("D3D12_FEATURE_VIDEO_ENCODER_SUBREGION_TILES_SUPPORT HR (0x%x) error or IsSupported: (%d).\n",
598 hr,
599 capDataTilesSupport.IsSupported);
600 return false;
601 }
602
603 return true;
604 }
605
606 D3D12_VIDEO_ENCODER_AV1_CODEC_CONFIGURATION
d3d12_video_encoder_convert_av1_codec_configuration(struct d3d12_video_encoder * pD3D12Enc,pipe_av1_enc_picture_desc * pAV1Pic,bool & is_supported)607 d3d12_video_encoder_convert_av1_codec_configuration(struct d3d12_video_encoder *pD3D12Enc,
608 pipe_av1_enc_picture_desc *pAV1Pic,
609 bool &is_supported)
610 {
611 is_supported = true;
612 D3D12_VIDEO_ENCODER_AV1_CODEC_CONFIGURATION config = {
613 // D3D12_VIDEO_ENCODER_AV1_FEATURE_FLAGS FeatureFlags;
614 D3D12_VIDEO_ENCODER_AV1_FEATURE_FLAG_NONE,
615 // UINT OrderHintBitsMinus1;
616 pAV1Pic->seq.order_hint_bits - 1,
617 };
618
619 //
620 // Query AV1 caps and store in m_currentEncodeCapabilities
621 //
622
623 D3D12_FEATURE_DATA_VIDEO_ENCODER_CODEC_CONFIGURATION_SUPPORT capCodecConfigData = {};
624 capCodecConfigData.NodeIndex = pD3D12Enc->m_NodeIndex;
625 capCodecConfigData.Codec = D3D12_VIDEO_ENCODER_CODEC_AV1;
626 D3D12_VIDEO_ENCODER_AV1_PROFILE prof =
627 d3d12_video_encoder_convert_profile_to_d3d12_enc_profile_av1(pD3D12Enc->base.profile);
628 capCodecConfigData.Profile.pAV1Profile = &prof;
629 capCodecConfigData.Profile.DataSize = sizeof(prof);
630 capCodecConfigData.CodecSupportLimits.pAV1Support =
631 &pD3D12Enc->m_currentEncodeCapabilities.m_encoderCodecSpecificConfigCaps.m_AV1CodecCaps;
632 capCodecConfigData.CodecSupportLimits.DataSize =
633 sizeof(pD3D12Enc->m_currentEncodeCapabilities.m_encoderCodecSpecificConfigCaps.m_AV1CodecCaps);
634
635 if (FAILED(
636 pD3D12Enc->m_spD3D12VideoDevice->CheckFeatureSupport(D3D12_FEATURE_VIDEO_ENCODER_CODEC_CONFIGURATION_SUPPORT,
637 &capCodecConfigData,
638 sizeof(capCodecConfigData))) ||
639 !capCodecConfigData.IsSupported) {
640 debug_printf("D3D12_FEATURE_VIDEO_ENCODER_CODEC_CONFIGURATION_SUPPORT arguments not supported.\n");
641 is_supported = false;
642 return config;
643 }
644
645 // Enable features requested by gallium
646
647 if (pAV1Pic->seq.seq_bits.use_128x128_superblock)
648 config.FeatureFlags |= D3D12_VIDEO_ENCODER_AV1_FEATURE_FLAG_128x128_SUPERBLOCK;
649 if (pAV1Pic->seq.seq_bits.enable_filter_intra)
650 config.FeatureFlags |= D3D12_VIDEO_ENCODER_AV1_FEATURE_FLAG_FILTER_INTRA;
651 if (pAV1Pic->seq.seq_bits.enable_intra_edge_filter)
652 config.FeatureFlags |= D3D12_VIDEO_ENCODER_AV1_FEATURE_FLAG_INTRA_EDGE_FILTER;
653 if (pAV1Pic->seq.seq_bits.enable_interintra_compound)
654 config.FeatureFlags |= D3D12_VIDEO_ENCODER_AV1_FEATURE_FLAG_INTERINTRA_COMPOUND;
655 if (pAV1Pic->seq.seq_bits.enable_masked_compound)
656 config.FeatureFlags |= D3D12_VIDEO_ENCODER_AV1_FEATURE_FLAG_MASKED_COMPOUND;
657 if (pAV1Pic->seq.seq_bits.enable_warped_motion)
658 config.FeatureFlags |= D3D12_VIDEO_ENCODER_AV1_FEATURE_FLAG_WARPED_MOTION;
659 if (pAV1Pic->seq.seq_bits.enable_dual_filter)
660 config.FeatureFlags |= D3D12_VIDEO_ENCODER_AV1_FEATURE_FLAG_DUAL_FILTER;
661 if (pAV1Pic->seq.seq_bits.enable_order_hint)
662 config.FeatureFlags |= D3D12_VIDEO_ENCODER_AV1_FEATURE_FLAG_ORDER_HINT_TOOLS;
663 if (pAV1Pic->seq.seq_bits.enable_jnt_comp)
664 config.FeatureFlags |= D3D12_VIDEO_ENCODER_AV1_FEATURE_FLAG_JNT_COMP;
665 if (pAV1Pic->seq.seq_bits.enable_ref_frame_mvs)
666 config.FeatureFlags |= D3D12_VIDEO_ENCODER_AV1_FEATURE_FLAG_FRAME_REFERENCE_MOTION_VECTORS;
667 if (pAV1Pic->seq.seq_bits.enable_superres)
668 config.FeatureFlags |= D3D12_VIDEO_ENCODER_AV1_FEATURE_FLAG_SUPER_RESOLUTION;
669 if (pAV1Pic->seq.seq_bits.enable_cdef)
670 config.FeatureFlags |= D3D12_VIDEO_ENCODER_AV1_FEATURE_FLAG_CDEF_FILTERING;
671 if (pAV1Pic->seq.seq_bits.enable_restoration)
672 config.FeatureFlags |= D3D12_VIDEO_ENCODER_AV1_FEATURE_FLAG_LOOP_RESTORATION_FILTER;
673
674 // No pipe flag for the following features, associated pic flags can be selected per frame. Enable if supported.
675
676 if ((pD3D12Enc->m_currentEncodeCapabilities.m_encoderCodecSpecificConfigCaps.m_AV1CodecCaps.SupportedFeatureFlags &
677 D3D12_VIDEO_ENCODER_AV1_FEATURE_FLAG_FORCED_INTEGER_MOTION_VECTORS) != 0) // seq_force_integer_mv
678 config.FeatureFlags |= D3D12_VIDEO_ENCODER_AV1_FEATURE_FLAG_FORCED_INTEGER_MOTION_VECTORS;
679
680 if ((pD3D12Enc->m_currentEncodeCapabilities.m_encoderCodecSpecificConfigCaps.m_AV1CodecCaps.SupportedFeatureFlags &
681 D3D12_VIDEO_ENCODER_AV1_FEATURE_FLAG_PALETTE_ENCODING) != 0)
682 config.FeatureFlags |= D3D12_VIDEO_ENCODER_AV1_FEATURE_FLAG_PALETTE_ENCODING;
683
684 if ((pD3D12Enc->m_currentEncodeCapabilities.m_encoderCodecSpecificConfigCaps.m_AV1CodecCaps.SupportedFeatureFlags &
685 D3D12_VIDEO_ENCODER_AV1_FEATURE_FLAG_INTRA_BLOCK_COPY) != 0)
686 config.FeatureFlags |= D3D12_VIDEO_ENCODER_AV1_FEATURE_FLAG_INTRA_BLOCK_COPY;
687
688 if ((pD3D12Enc->m_currentEncodeCapabilities.m_encoderCodecSpecificConfigCaps.m_AV1CodecCaps.SupportedFeatureFlags &
689 D3D12_VIDEO_ENCODER_AV1_FEATURE_FLAG_LOOP_FILTER_DELTAS) != 0)
690 config.FeatureFlags |= D3D12_VIDEO_ENCODER_AV1_FEATURE_FLAG_LOOP_FILTER_DELTAS;
691
692 if ((pD3D12Enc->m_currentEncodeCapabilities.m_encoderCodecSpecificConfigCaps.m_AV1CodecCaps.SupportedFeatureFlags &
693 D3D12_VIDEO_ENCODER_AV1_FEATURE_FLAG_QUANTIZATION_DELTAS) != 0)
694 config.FeatureFlags |= D3D12_VIDEO_ENCODER_AV1_FEATURE_FLAG_QUANTIZATION_DELTAS;
695
696 if ((pD3D12Enc->m_currentEncodeCapabilities.m_encoderCodecSpecificConfigCaps.m_AV1CodecCaps.SupportedFeatureFlags &
697 D3D12_VIDEO_ENCODER_AV1_FEATURE_FLAG_QUANTIZATION_MATRIX) != 0)
698 config.FeatureFlags |= D3D12_VIDEO_ENCODER_AV1_FEATURE_FLAG_QUANTIZATION_MATRIX;
699
700 if ((pD3D12Enc->m_currentEncodeCapabilities.m_encoderCodecSpecificConfigCaps.m_AV1CodecCaps.SupportedFeatureFlags &
701 D3D12_VIDEO_ENCODER_AV1_FEATURE_FLAG_REDUCED_TX_SET) != 0)
702 config.FeatureFlags |= D3D12_VIDEO_ENCODER_AV1_FEATURE_FLAG_REDUCED_TX_SET;
703
704 if ((pD3D12Enc->m_currentEncodeCapabilities.m_encoderCodecSpecificConfigCaps.m_AV1CodecCaps.SupportedFeatureFlags &
705 D3D12_VIDEO_ENCODER_AV1_FEATURE_FLAG_MOTION_MODE_SWITCHABLE) != 0)
706 config.FeatureFlags |= D3D12_VIDEO_ENCODER_AV1_FEATURE_FLAG_MOTION_MODE_SWITCHABLE;
707
708 if ((pD3D12Enc->m_currentEncodeCapabilities.m_encoderCodecSpecificConfigCaps.m_AV1CodecCaps.SupportedFeatureFlags &
709 D3D12_VIDEO_ENCODER_AV1_FEATURE_FLAG_ALLOW_HIGH_PRECISION_MV) != 0)
710 config.FeatureFlags |= D3D12_VIDEO_ENCODER_AV1_FEATURE_FLAG_ALLOW_HIGH_PRECISION_MV;
711
712 //
713 // Add any missing mandatory/required features we didn't enable before
714 //
715 if ((config.FeatureFlags &
716 pD3D12Enc->m_currentEncodeCapabilities.m_encoderCodecSpecificConfigCaps.m_AV1CodecCaps.RequiredFeatureFlags) !=
717 pD3D12Enc->m_currentEncodeCapabilities.m_encoderCodecSpecificConfigCaps.m_AV1CodecCaps.RequiredFeatureFlags) {
718 debug_printf(
719 "[d3d12_video_encoder_convert_av1_codec_configuration] Adding required by caps but not selected already in "
720 "config.FeatureFlags...\n");
721
722 if (((config.FeatureFlags & D3D12_VIDEO_ENCODER_AV1_FEATURE_FLAG_128x128_SUPERBLOCK) == 0) &&
723 ((pD3D12Enc->m_currentEncodeCapabilities.m_encoderCodecSpecificConfigCaps.m_AV1CodecCaps.RequiredFeatureFlags &
724 D3D12_VIDEO_ENCODER_AV1_FEATURE_FLAG_128x128_SUPERBLOCK) != 0)) {
725 pD3D12Enc->m_currentEncodeCapabilities.m_encoderCodecSpecificConfigCaps.RequiredNotRequestedFeatureFlags |=
726 D3D12_VIDEO_ENCODER_AV1_FEATURE_FLAG_128x128_SUPERBLOCK;
727 debug_printf(
728 "[d3d12_video_encoder_convert_av1_codec_configuration] Adding "
729 "D3D12_VIDEO_ENCODER_AV1_FEATURE_FLAG_128x128_SUPERBLOCK required by caps but not selected already in "
730 "config.FeatureFlags...\n");
731 }
732
733 if (((config.FeatureFlags & D3D12_VIDEO_ENCODER_AV1_FEATURE_FLAG_FILTER_INTRA) == 0) &&
734 ((pD3D12Enc->m_currentEncodeCapabilities.m_encoderCodecSpecificConfigCaps.m_AV1CodecCaps.RequiredFeatureFlags &
735 D3D12_VIDEO_ENCODER_AV1_FEATURE_FLAG_FILTER_INTRA) != 0)) {
736 pD3D12Enc->m_currentEncodeCapabilities.m_encoderCodecSpecificConfigCaps.RequiredNotRequestedFeatureFlags |=
737 D3D12_VIDEO_ENCODER_AV1_FEATURE_FLAG_FILTER_INTRA;
738 debug_printf(
739 "[d3d12_video_encoder_convert_av1_codec_configuration] "
740 "D3D12_VIDEO_ENCODER_AV1_FEATURE_FLAG_FILTER_INTRA Adding required by caps but not selected already in "
741 "config.FeatureFlags...\n");
742 }
743
744 if (((config.FeatureFlags & D3D12_VIDEO_ENCODER_AV1_FEATURE_FLAG_INTRA_EDGE_FILTER) == 0) &&
745 ((pD3D12Enc->m_currentEncodeCapabilities.m_encoderCodecSpecificConfigCaps.m_AV1CodecCaps.RequiredFeatureFlags &
746 D3D12_VIDEO_ENCODER_AV1_FEATURE_FLAG_INTRA_EDGE_FILTER) != 0)) {
747 pD3D12Enc->m_currentEncodeCapabilities.m_encoderCodecSpecificConfigCaps.RequiredNotRequestedFeatureFlags |=
748 D3D12_VIDEO_ENCODER_AV1_FEATURE_FLAG_INTRA_EDGE_FILTER;
749 debug_printf(
750 "[d3d12_video_encoder_convert_av1_codec_configuration] Adding "
751 "D3D12_VIDEO_ENCODER_AV1_FEATURE_FLAG_INTRA_EDGE_FILTER required by caps but not selected already in "
752 "config.FeatureFlags...\n");
753 }
754
755 if (((config.FeatureFlags & D3D12_VIDEO_ENCODER_AV1_FEATURE_FLAG_INTERINTRA_COMPOUND) == 0) &&
756 ((pD3D12Enc->m_currentEncodeCapabilities.m_encoderCodecSpecificConfigCaps.m_AV1CodecCaps.RequiredFeatureFlags &
757 D3D12_VIDEO_ENCODER_AV1_FEATURE_FLAG_INTERINTRA_COMPOUND) != 0)) {
758 pD3D12Enc->m_currentEncodeCapabilities.m_encoderCodecSpecificConfigCaps.RequiredNotRequestedFeatureFlags |=
759 D3D12_VIDEO_ENCODER_AV1_FEATURE_FLAG_INTERINTRA_COMPOUND;
760 debug_printf(
761 "[d3d12_video_encoder_convert_av1_codec_configuration] Adding "
762 "D3D12_VIDEO_ENCODER_AV1_FEATURE_FLAG_INTERINTRA_COMPOUND required by caps but not selected already in "
763 "config.FeatureFlags...\n");
764 }
765
766 if (((config.FeatureFlags & D3D12_VIDEO_ENCODER_AV1_FEATURE_FLAG_MASKED_COMPOUND) == 0) &&
767 ((pD3D12Enc->m_currentEncodeCapabilities.m_encoderCodecSpecificConfigCaps.m_AV1CodecCaps.RequiredFeatureFlags &
768 D3D12_VIDEO_ENCODER_AV1_FEATURE_FLAG_MASKED_COMPOUND) != 0)) {
769 pD3D12Enc->m_currentEncodeCapabilities.m_encoderCodecSpecificConfigCaps.RequiredNotRequestedFeatureFlags |=
770 D3D12_VIDEO_ENCODER_AV1_FEATURE_FLAG_MASKED_COMPOUND;
771 debug_printf(
772 "[d3d12_video_encoder_convert_av1_codec_configuration] Adding "
773 "D3D12_VIDEO_ENCODER_AV1_FEATURE_FLAG_MASKED_COMPOUND required by caps but not selected already in "
774 "config.FeatureFlags...\n");
775 }
776
777 if (((config.FeatureFlags & D3D12_VIDEO_ENCODER_AV1_FEATURE_FLAG_WARPED_MOTION) == 0) &&
778 ((pD3D12Enc->m_currentEncodeCapabilities.m_encoderCodecSpecificConfigCaps.m_AV1CodecCaps.RequiredFeatureFlags &
779 D3D12_VIDEO_ENCODER_AV1_FEATURE_FLAG_WARPED_MOTION) != 0)) {
780 pD3D12Enc->m_currentEncodeCapabilities.m_encoderCodecSpecificConfigCaps.RequiredNotRequestedFeatureFlags |=
781 D3D12_VIDEO_ENCODER_AV1_FEATURE_FLAG_WARPED_MOTION;
782 debug_printf(
783 "[d3d12_video_encoder_convert_av1_codec_configuration] "
784 "D3D12_VIDEO_ENCODER_AV1_FEATURE_FLAG_WARPED_MOTION Adding required by caps but not selected already in "
785 "config.FeatureFlags...\n");
786 }
787
788 if (((config.FeatureFlags & D3D12_VIDEO_ENCODER_AV1_FEATURE_FLAG_DUAL_FILTER) == 0) &&
789 ((pD3D12Enc->m_currentEncodeCapabilities.m_encoderCodecSpecificConfigCaps.m_AV1CodecCaps.RequiredFeatureFlags &
790 D3D12_VIDEO_ENCODER_AV1_FEATURE_FLAG_DUAL_FILTER) != 0)) {
791 pD3D12Enc->m_currentEncodeCapabilities.m_encoderCodecSpecificConfigCaps.RequiredNotRequestedFeatureFlags |=
792 D3D12_VIDEO_ENCODER_AV1_FEATURE_FLAG_DUAL_FILTER;
793 debug_printf("[d3d12_video_encoder_convert_av1_codec_configuration] == Adding required by caps but not "
794 "selected already in "
795 "config.FeatureFlags...\n");
796 }
797
798 if (((config.FeatureFlags & D3D12_VIDEO_ENCODER_AV1_FEATURE_FLAG_JNT_COMP) == 0) &&
799 ((pD3D12Enc->m_currentEncodeCapabilities.m_encoderCodecSpecificConfigCaps.m_AV1CodecCaps.RequiredFeatureFlags &
800 D3D12_VIDEO_ENCODER_AV1_FEATURE_FLAG_JNT_COMP) != 0)) {
801 pD3D12Enc->m_currentEncodeCapabilities.m_encoderCodecSpecificConfigCaps.RequiredNotRequestedFeatureFlags |=
802 D3D12_VIDEO_ENCODER_AV1_FEATURE_FLAG_JNT_COMP;
803 debug_printf("[d3d12_video_encoder_convert_av1_codec_configuration] 0 Adding required by caps but not "
804 "selected already in "
805 "config.FeatureFlags...\n");
806 }
807
808 if (((config.FeatureFlags & D3D12_VIDEO_ENCODER_AV1_FEATURE_FLAG_FORCED_INTEGER_MOTION_VECTORS) == 0) &&
809 ((pD3D12Enc->m_currentEncodeCapabilities.m_encoderCodecSpecificConfigCaps.m_AV1CodecCaps.RequiredFeatureFlags &
810 D3D12_VIDEO_ENCODER_AV1_FEATURE_FLAG_FORCED_INTEGER_MOTION_VECTORS) != 0)) {
811 pD3D12Enc->m_currentEncodeCapabilities.m_encoderCodecSpecificConfigCaps.RequiredNotRequestedFeatureFlags |=
812 D3D12_VIDEO_ENCODER_AV1_FEATURE_FLAG_FORCED_INTEGER_MOTION_VECTORS;
813 debug_printf(
814 "[d3d12_video_encoder_convert_av1_codec_configuration] Adding required by "
815 "D3D12_VIDEO_ENCODER_AV1_FEATURE_FLAG_FORCED_INTEGER_MOTION_VECTORS caps but not selected already in "
816 "config.FeatureFlags...\n");
817 }
818
819 if (((config.FeatureFlags & D3D12_VIDEO_ENCODER_AV1_FEATURE_FLAG_SUPER_RESOLUTION) == 0) &&
820 ((pD3D12Enc->m_currentEncodeCapabilities.m_encoderCodecSpecificConfigCaps.m_AV1CodecCaps.RequiredFeatureFlags &
821 D3D12_VIDEO_ENCODER_AV1_FEATURE_FLAG_SUPER_RESOLUTION) != 0)) {
822 pD3D12Enc->m_currentEncodeCapabilities.m_encoderCodecSpecificConfigCaps.RequiredNotRequestedFeatureFlags |=
823 D3D12_VIDEO_ENCODER_AV1_FEATURE_FLAG_SUPER_RESOLUTION;
824 debug_printf(
825 "[d3d12_video_encoder_convert_av1_codec_configuration] Adding "
826 "D3D12_VIDEO_ENCODER_AV1_FEATURE_FLAG_SUPER_RESOLUTION required by caps but not selected already in "
827 "config.FeatureFlags...\n");
828 }
829
830 if (((config.FeatureFlags & D3D12_VIDEO_ENCODER_AV1_FEATURE_FLAG_LOOP_RESTORATION_FILTER) == 0) &&
831 ((pD3D12Enc->m_currentEncodeCapabilities.m_encoderCodecSpecificConfigCaps.m_AV1CodecCaps.RequiredFeatureFlags &
832 D3D12_VIDEO_ENCODER_AV1_FEATURE_FLAG_LOOP_RESTORATION_FILTER) != 0)) {
833 pD3D12Enc->m_currentEncodeCapabilities.m_encoderCodecSpecificConfigCaps.RequiredNotRequestedFeatureFlags |=
834 D3D12_VIDEO_ENCODER_AV1_FEATURE_FLAG_LOOP_RESTORATION_FILTER;
835 debug_printf(
836 "[d3d12_video_encoder_convert_av1_codec_configuration] Adding "
837 "D3D12_VIDEO_ENCODER_AV1_FEATURE_FLAG_LOOP_RESTORATION_FILTER required by caps but not selected already in "
838 "config.FeatureFlags...\n");
839 }
840
841 if (((config.FeatureFlags & D3D12_VIDEO_ENCODER_AV1_FEATURE_FLAG_PALETTE_ENCODING) == 0) &&
842 ((pD3D12Enc->m_currentEncodeCapabilities.m_encoderCodecSpecificConfigCaps.m_AV1CodecCaps.RequiredFeatureFlags &
843 D3D12_VIDEO_ENCODER_AV1_FEATURE_FLAG_PALETTE_ENCODING) != 0)) {
844 pD3D12Enc->m_currentEncodeCapabilities.m_encoderCodecSpecificConfigCaps.RequiredNotRequestedFeatureFlags |=
845 D3D12_VIDEO_ENCODER_AV1_FEATURE_FLAG_PALETTE_ENCODING;
846 debug_printf(
847 "[d3d12_video_encoder_convert_av1_codec_configuration] Adding "
848 "D3D12_VIDEO_ENCODER_AV1_FEATURE_FLAG_PALETTE_ENCODING required by caps but not selected already in "
849 "config.FeatureFlags...\n");
850 }
851
852 if (((config.FeatureFlags & D3D12_VIDEO_ENCODER_AV1_FEATURE_FLAG_CDEF_FILTERING) == 0) &&
853 ((pD3D12Enc->m_currentEncodeCapabilities.m_encoderCodecSpecificConfigCaps.m_AV1CodecCaps.RequiredFeatureFlags &
854 D3D12_VIDEO_ENCODER_AV1_FEATURE_FLAG_CDEF_FILTERING) != 0)) {
855 pD3D12Enc->m_currentEncodeCapabilities.m_encoderCodecSpecificConfigCaps.RequiredNotRequestedFeatureFlags |=
856 D3D12_VIDEO_ENCODER_AV1_FEATURE_FLAG_CDEF_FILTERING;
857 debug_printf(
858 "[d3d12_video_encoder_convert_av1_codec_configuration] "
859 "D3D12_VIDEO_ENCODER_AV1_FEATURE_FLAG_CDEF_FILTERING Adding required by caps but not selected already in "
860 "config.FeatureFlags...\n");
861 }
862
863 if (((config.FeatureFlags & D3D12_VIDEO_ENCODER_AV1_FEATURE_FLAG_INTRA_BLOCK_COPY) == 0) &&
864 ((pD3D12Enc->m_currentEncodeCapabilities.m_encoderCodecSpecificConfigCaps.m_AV1CodecCaps.RequiredFeatureFlags &
865 D3D12_VIDEO_ENCODER_AV1_FEATURE_FLAG_INTRA_BLOCK_COPY) != 0)) {
866 pD3D12Enc->m_currentEncodeCapabilities.m_encoderCodecSpecificConfigCaps.RequiredNotRequestedFeatureFlags |=
867 D3D12_VIDEO_ENCODER_AV1_FEATURE_FLAG_INTRA_BLOCK_COPY;
868 debug_printf(
869 "[d3d12_video_encoder_convert_av1_codec_configuration] Adding "
870 "D3D12_VIDEO_ENCODER_AV1_FEATURE_FLAG_INTRA_BLOCK_COPY required by caps but not selected already in "
871 "config.FeatureFlags...\n");
872 }
873
874 if (((config.FeatureFlags & D3D12_VIDEO_ENCODER_AV1_FEATURE_FLAG_FRAME_REFERENCE_MOTION_VECTORS) == 0) &&
875 ((pD3D12Enc->m_currentEncodeCapabilities.m_encoderCodecSpecificConfigCaps.m_AV1CodecCaps.RequiredFeatureFlags &
876 D3D12_VIDEO_ENCODER_AV1_FEATURE_FLAG_FRAME_REFERENCE_MOTION_VECTORS) != 0)) {
877 pD3D12Enc->m_currentEncodeCapabilities.m_encoderCodecSpecificConfigCaps.RequiredNotRequestedFeatureFlags |=
878 D3D12_VIDEO_ENCODER_AV1_FEATURE_FLAG_FRAME_REFERENCE_MOTION_VECTORS;
879 debug_printf(
880 "[d3d12_video_encoder_convert_av1_codec_configuration] Adding required by "
881 "D3D12_VIDEO_ENCODER_AV1_FEATURE_FLAG_FRAME_REFERENCE_MOTION_VECTORS caps but not selected already in "
882 "config.FeatureFlags...\n");
883 }
884
885 if (((config.FeatureFlags & D3D12_VIDEO_ENCODER_AV1_FEATURE_FLAG_ORDER_HINT_TOOLS) == 0) &&
886 ((pD3D12Enc->m_currentEncodeCapabilities.m_encoderCodecSpecificConfigCaps.m_AV1CodecCaps.RequiredFeatureFlags &
887 D3D12_VIDEO_ENCODER_AV1_FEATURE_FLAG_ORDER_HINT_TOOLS) != 0)) {
888 pD3D12Enc->m_currentEncodeCapabilities.m_encoderCodecSpecificConfigCaps.RequiredNotRequestedFeatureFlags |=
889 D3D12_VIDEO_ENCODER_AV1_FEATURE_FLAG_ORDER_HINT_TOOLS;
890 debug_printf(
891 "[d3d12_video_encoder_convert_av1_codec_configuration] Adding "
892 "D3D12_VIDEO_ENCODER_AV1_FEATURE_FLAG_ORDER_HINT_TOOLS required by caps but not selected already in "
893 "config.FeatureFlags...\n");
894 }
895
896 if (((config.FeatureFlags & D3D12_VIDEO_ENCODER_AV1_FEATURE_FLAG_AUTO_SEGMENTATION) == 0) &&
897 ((pD3D12Enc->m_currentEncodeCapabilities.m_encoderCodecSpecificConfigCaps.m_AV1CodecCaps.RequiredFeatureFlags &
898 D3D12_VIDEO_ENCODER_AV1_FEATURE_FLAG_AUTO_SEGMENTATION) != 0)) {
899 pD3D12Enc->m_currentEncodeCapabilities.m_encoderCodecSpecificConfigCaps.RequiredNotRequestedFeatureFlags |=
900 D3D12_VIDEO_ENCODER_AV1_FEATURE_FLAG_AUTO_SEGMENTATION;
901 debug_printf(
902 "[d3d12_video_encoder_convert_av1_codec_configuration] Adding "
903 "D3D12_VIDEO_ENCODER_AV1_FEATURE_FLAG_AUTO_SEGMENTATION required by caps but not selected already in "
904 "config.FeatureFlags...\n");
905 }
906
907 if (((config.FeatureFlags & D3D12_VIDEO_ENCODER_AV1_FEATURE_FLAG_CUSTOM_SEGMENTATION) == 0) &&
908 ((pD3D12Enc->m_currentEncodeCapabilities.m_encoderCodecSpecificConfigCaps.m_AV1CodecCaps.RequiredFeatureFlags &
909 D3D12_VIDEO_ENCODER_AV1_FEATURE_FLAG_CUSTOM_SEGMENTATION) != 0)) {
910 pD3D12Enc->m_currentEncodeCapabilities.m_encoderCodecSpecificConfigCaps.RequiredNotRequestedFeatureFlags |=
911 D3D12_VIDEO_ENCODER_AV1_FEATURE_FLAG_CUSTOM_SEGMENTATION;
912 debug_printf(
913 "[d3d12_video_encoder_convert_av1_codec_configuration] Adding "
914 "D3D12_VIDEO_ENCODER_AV1_FEATURE_FLAG_CUSTOM_SEGMENTATION required by caps but not selected already in "
915 "config.FeatureFlags...\n");
916 }
917
918 if (((config.FeatureFlags & D3D12_VIDEO_ENCODER_AV1_FEATURE_FLAG_LOOP_FILTER_DELTAS) == 0) &&
919 ((pD3D12Enc->m_currentEncodeCapabilities.m_encoderCodecSpecificConfigCaps.m_AV1CodecCaps.RequiredFeatureFlags &
920 D3D12_VIDEO_ENCODER_AV1_FEATURE_FLAG_LOOP_FILTER_DELTAS) != 0)) {
921 pD3D12Enc->m_currentEncodeCapabilities.m_encoderCodecSpecificConfigCaps.RequiredNotRequestedFeatureFlags |=
922 D3D12_VIDEO_ENCODER_AV1_FEATURE_FLAG_LOOP_FILTER_DELTAS;
923 debug_printf(
924 "[d3d12_video_encoder_convert_av1_codec_configuration] Adding "
925 "D3D12_VIDEO_ENCODER_AV1_FEATURE_FLAG_LOOP_FILTER_DELTAS required by caps but not selected already in "
926 "config.FeatureFlags...\n");
927 }
928
929 if (((config.FeatureFlags & D3D12_VIDEO_ENCODER_AV1_FEATURE_FLAG_QUANTIZATION_DELTAS) == 0) &&
930 ((pD3D12Enc->m_currentEncodeCapabilities.m_encoderCodecSpecificConfigCaps.m_AV1CodecCaps.RequiredFeatureFlags &
931 D3D12_VIDEO_ENCODER_AV1_FEATURE_FLAG_QUANTIZATION_DELTAS) != 0)) {
932 pD3D12Enc->m_currentEncodeCapabilities.m_encoderCodecSpecificConfigCaps.RequiredNotRequestedFeatureFlags |=
933 D3D12_VIDEO_ENCODER_AV1_FEATURE_FLAG_QUANTIZATION_DELTAS;
934 debug_printf(
935 "[d3d12_video_encoder_convert_av1_codec_configuration] Adding "
936 "D3D12_VIDEO_ENCODER_AV1_FEATURE_FLAG_QUANTIZATION_DELTAS required by caps but not selected already in "
937 "config.FeatureFlags...\n");
938 }
939
940 if (((config.FeatureFlags & D3D12_VIDEO_ENCODER_AV1_FEATURE_FLAG_QUANTIZATION_MATRIX) == 0) &&
941 ((pD3D12Enc->m_currentEncodeCapabilities.m_encoderCodecSpecificConfigCaps.m_AV1CodecCaps.RequiredFeatureFlags &
942 D3D12_VIDEO_ENCODER_AV1_FEATURE_FLAG_QUANTIZATION_MATRIX) != 0)) {
943 pD3D12Enc->m_currentEncodeCapabilities.m_encoderCodecSpecificConfigCaps.RequiredNotRequestedFeatureFlags |=
944 D3D12_VIDEO_ENCODER_AV1_FEATURE_FLAG_QUANTIZATION_MATRIX;
945 debug_printf(
946 "[d3d12_video_encoder_convert_av1_codec_configuration] Adding "
947 "D3D12_VIDEO_ENCODER_AV1_FEATURE_FLAG_QUANTIZATION_MATRIX required by caps but not selected already in "
948 "config.FeatureFlags...\n");
949 }
950
951 if (((config.FeatureFlags & D3D12_VIDEO_ENCODER_AV1_FEATURE_FLAG_REDUCED_TX_SET) == 0) &&
952 ((pD3D12Enc->m_currentEncodeCapabilities.m_encoderCodecSpecificConfigCaps.m_AV1CodecCaps.RequiredFeatureFlags &
953 D3D12_VIDEO_ENCODER_AV1_FEATURE_FLAG_REDUCED_TX_SET) != 0)) {
954 pD3D12Enc->m_currentEncodeCapabilities.m_encoderCodecSpecificConfigCaps.RequiredNotRequestedFeatureFlags |=
955 D3D12_VIDEO_ENCODER_AV1_FEATURE_FLAG_REDUCED_TX_SET;
956 debug_printf(
957 "[d3d12_video_encoder_convert_av1_codec_configuration] "
958 "D3D12_VIDEO_ENCODER_AV1_FEATURE_FLAG_REDUCED_TX_SET Adding required by caps but not selected already in "
959 "config.FeatureFlags...\n");
960 }
961
962 if (((config.FeatureFlags & D3D12_VIDEO_ENCODER_AV1_FEATURE_FLAG_MOTION_MODE_SWITCHABLE) == 0) &&
963 ((pD3D12Enc->m_currentEncodeCapabilities.m_encoderCodecSpecificConfigCaps.m_AV1CodecCaps.RequiredFeatureFlags &
964 D3D12_VIDEO_ENCODER_AV1_FEATURE_FLAG_MOTION_MODE_SWITCHABLE) != 0)) {
965 pD3D12Enc->m_currentEncodeCapabilities.m_encoderCodecSpecificConfigCaps.RequiredNotRequestedFeatureFlags |=
966 D3D12_VIDEO_ENCODER_AV1_FEATURE_FLAG_MOTION_MODE_SWITCHABLE;
967 debug_printf(
968 "[d3d12_video_encoder_convert_av1_codec_configuration] Adding "
969 "D3D12_VIDEO_ENCODER_AV1_FEATURE_FLAG_MOTION_MODE_SWITCHABLE required by caps but not selected already in "
970 "config.FeatureFlags...\n");
971 }
972
973 if (((config.FeatureFlags & D3D12_VIDEO_ENCODER_AV1_FEATURE_FLAG_ALLOW_HIGH_PRECISION_MV) == 0) &&
974 ((pD3D12Enc->m_currentEncodeCapabilities.m_encoderCodecSpecificConfigCaps.m_AV1CodecCaps.RequiredFeatureFlags &
975 D3D12_VIDEO_ENCODER_AV1_FEATURE_FLAG_ALLOW_HIGH_PRECISION_MV) != 0)) {
976 pD3D12Enc->m_currentEncodeCapabilities.m_encoderCodecSpecificConfigCaps.RequiredNotRequestedFeatureFlags |=
977 D3D12_VIDEO_ENCODER_AV1_FEATURE_FLAG_ALLOW_HIGH_PRECISION_MV;
978 debug_printf(
979 "[d3d12_video_encoder_convert_av1_codec_configuration] Adding "
980 "D3D12_VIDEO_ENCODER_AV1_FEATURE_FLAG_ALLOW_HIGH_PRECISION_MV required by caps but not selected already in "
981 "config.FeatureFlags...\n");
982 }
983
984 // Enable all required flags previously not selected
985 config.FeatureFlags |=
986 pD3D12Enc->m_currentEncodeCapabilities.m_encoderCodecSpecificConfigCaps.m_AV1CodecCaps.RequiredFeatureFlags;
987 }
988
989 // Check config.FeatureFlags against SupportedFeatureFlags and assign is_supported
990 if ((config.FeatureFlags &
991 pD3D12Enc->m_currentEncodeCapabilities.m_encoderCodecSpecificConfigCaps.m_AV1CodecCaps.SupportedFeatureFlags) !=
992 config.FeatureFlags) {
993 debug_printf(
994 "[d3d12_video_encoder_convert_av1_codec_configuration] AV1 Configuration flags requested 0x%x not supported "
995 "by "
996 "m_AV1CodecCaps.SupportedFeatureFlags 0x%x\n",
997 config.FeatureFlags,
998 pD3D12Enc->m_currentEncodeCapabilities.m_encoderCodecSpecificConfigCaps.m_AV1CodecCaps.SupportedFeatureFlags);
999
1000 is_supported = false;
1001 }
1002
1003 return config;
1004 }
1005
1006 static bool
d3d12_video_encoder_update_intra_refresh_av1(struct d3d12_video_encoder * pD3D12Enc,D3D12_VIDEO_SAMPLE srcTextureDesc,struct pipe_av1_enc_picture_desc * picture)1007 d3d12_video_encoder_update_intra_refresh_av1(struct d3d12_video_encoder *pD3D12Enc,
1008 D3D12_VIDEO_SAMPLE srcTextureDesc,
1009 struct pipe_av1_enc_picture_desc * picture)
1010 {
1011 if (picture->intra_refresh.mode != INTRA_REFRESH_MODE_NONE)
1012 {
1013 // D3D12 only supports row intra-refresh
1014 if (picture->intra_refresh.mode != INTRA_REFRESH_MODE_UNIT_ROWS)
1015 {
1016 debug_printf("[d3d12_video_encoder_update_intra_refresh_av1] Unsupported INTRA_REFRESH_MODE %d\n", picture->intra_refresh.mode);
1017 return false;
1018 }
1019
1020 uint32_t sbSize = ((pD3D12Enc->m_currentEncodeConfig.m_encoderCodecSpecificConfigDesc.m_AV1Config.FeatureFlags &
1021 D3D12_VIDEO_ENCODER_AV1_FEATURE_FLAG_128x128_SUPERBLOCK) != 0) ? 128u : 64u;
1022 uint32_t total_frame_blocks = static_cast<uint32_t>(std::ceil(srcTextureDesc.Height / sbSize)) *
1023 static_cast<uint32_t>(std::ceil(srcTextureDesc.Width / sbSize));
1024 D3D12_VIDEO_ENCODER_INTRA_REFRESH targetIntraRefresh = {
1025 D3D12_VIDEO_ENCODER_INTRA_REFRESH_MODE_ROW_BASED,
1026 total_frame_blocks / picture->intra_refresh.region_size,
1027 };
1028 double ir_wave_progress = (picture->intra_refresh.offset == 0) ? 0 :
1029 picture->intra_refresh.offset / (double) total_frame_blocks;
1030 pD3D12Enc->m_currentEncodeConfig.m_IntraRefreshCurrentFrameIndex =
1031 static_cast<uint32_t>(std::ceil(ir_wave_progress * targetIntraRefresh.IntraRefreshDuration));
1032
1033 // Set intra refresh state
1034 pD3D12Enc->m_currentEncodeConfig.m_IntraRefresh = targetIntraRefresh;
1035 // Need to send the sequence flag during all the IR duration
1036 pD3D12Enc->m_currentEncodeConfig.m_ConfigDirtyFlags |= d3d12_video_encoder_config_dirty_flag_intra_refresh;
1037 } else {
1038 pD3D12Enc->m_currentEncodeConfig.m_IntraRefreshCurrentFrameIndex = 0;
1039 pD3D12Enc->m_currentEncodeConfig.m_IntraRefresh = {
1040 D3D12_VIDEO_ENCODER_INTRA_REFRESH_MODE_NONE,
1041 0,
1042 };
1043 }
1044
1045 return true;
1046 }
1047
1048 bool
d3d12_video_encoder_update_current_encoder_config_state_av1(struct d3d12_video_encoder * pD3D12Enc,D3D12_VIDEO_SAMPLE srcTextureDesc,struct pipe_picture_desc * picture)1049 d3d12_video_encoder_update_current_encoder_config_state_av1(struct d3d12_video_encoder *pD3D12Enc,
1050 D3D12_VIDEO_SAMPLE srcTextureDesc,
1051 struct pipe_picture_desc *picture)
1052 {
1053 struct pipe_av1_enc_picture_desc *av1Pic = (struct pipe_av1_enc_picture_desc *) picture;
1054
1055 // Reset reconfig dirty flags
1056 pD3D12Enc->m_currentEncodeConfig.m_ConfigDirtyFlags = d3d12_video_encoder_config_dirty_flag_none;
1057 // Reset sequence changes flags
1058 pD3D12Enc->m_currentEncodeConfig.m_seqFlags = D3D12_VIDEO_ENCODER_SEQUENCE_CONTROL_FLAG_NONE;
1059
1060 // Set codec
1061 if (pD3D12Enc->m_currentEncodeConfig.m_encoderCodecDesc != D3D12_VIDEO_ENCODER_CODEC_AV1) {
1062 pD3D12Enc->m_currentEncodeConfig.m_ConfigDirtyFlags |= d3d12_video_encoder_config_dirty_flag_codec;
1063 }
1064 pD3D12Enc->m_currentEncodeConfig.m_encoderCodecDesc = D3D12_VIDEO_ENCODER_CODEC_AV1;
1065
1066 // Set input format
1067 DXGI_FORMAT targetFmt = srcTextureDesc.Format.Format;
1068 if (pD3D12Enc->m_currentEncodeConfig.m_encodeFormatInfo.Format != targetFmt) {
1069 pD3D12Enc->m_currentEncodeConfig.m_ConfigDirtyFlags |= d3d12_video_encoder_config_dirty_flag_input_format;
1070 }
1071
1072 pD3D12Enc->m_currentEncodeConfig.m_encodeFormatInfo = {};
1073 pD3D12Enc->m_currentEncodeConfig.m_encodeFormatInfo.Format = targetFmt;
1074 HRESULT hr =
1075 pD3D12Enc->m_pD3D12Screen->dev->CheckFeatureSupport(D3D12_FEATURE_FORMAT_INFO,
1076 &pD3D12Enc->m_currentEncodeConfig.m_encodeFormatInfo,
1077 sizeof(pD3D12Enc->m_currentEncodeConfig.m_encodeFormatInfo));
1078 if (FAILED(hr)) {
1079 debug_printf("CheckFeatureSupport failed with HR 0x%x\n", hr);
1080 return false;
1081 }
1082
1083 // Set resolution (ie. frame_size)
1084 if ((pD3D12Enc->m_currentEncodeConfig.m_currentResolution.Width != srcTextureDesc.Width) ||
1085 (pD3D12Enc->m_currentEncodeConfig.m_currentResolution.Height != srcTextureDesc.Height)) {
1086 pD3D12Enc->m_currentEncodeConfig.m_ConfigDirtyFlags |= d3d12_video_encoder_config_dirty_flag_resolution;
1087 }
1088 pD3D12Enc->m_currentEncodeConfig.m_currentResolution.Width = srcTextureDesc.Width;
1089 pD3D12Enc->m_currentEncodeConfig.m_currentResolution.Height = srcTextureDesc.Height;
1090
1091 // render_size
1092 pD3D12Enc->m_currentEncodeConfig.m_FrameCroppingCodecConfig.right = av1Pic->frame_width;
1093 pD3D12Enc->m_currentEncodeConfig.m_FrameCroppingCodecConfig.bottom = av1Pic->frame_height;
1094
1095 // Set profile
1096 auto targetProfile = d3d12_video_encoder_convert_profile_to_d3d12_enc_profile_av1(pD3D12Enc->base.profile);
1097 if (pD3D12Enc->m_currentEncodeConfig.m_encoderProfileDesc.m_AV1Profile != targetProfile) {
1098 pD3D12Enc->m_currentEncodeConfig.m_ConfigDirtyFlags |= d3d12_video_encoder_config_dirty_flag_profile;
1099 }
1100 pD3D12Enc->m_currentEncodeConfig.m_encoderProfileDesc.m_AV1Profile = targetProfile;
1101
1102 // Set level and tier
1103 D3D12_VIDEO_ENCODER_AV1_LEVELS targetLevel = {};
1104 D3D12_VIDEO_ENCODER_AV1_TIER targetTier = {};
1105 d3d12_video_encoder_convert_spec_to_d3d12_level_av1(av1Pic->seq.level, targetLevel);
1106 d3d12_video_encoder_convert_spec_to_d3d12_tier_av1(av1Pic->seq.tier, targetTier);
1107
1108 if ((pD3D12Enc->m_currentEncodeConfig.m_encoderLevelDesc.m_AV1LevelSetting.Level != targetLevel) ||
1109 (pD3D12Enc->m_currentEncodeConfig.m_encoderLevelDesc.m_AV1LevelSetting.Tier != targetTier)) {
1110 pD3D12Enc->m_currentEncodeConfig.m_ConfigDirtyFlags |= d3d12_video_encoder_config_dirty_flag_level;
1111 }
1112 pD3D12Enc->m_currentEncodeConfig.m_encoderLevelDesc.m_AV1LevelSetting.Tier = targetTier;
1113 pD3D12Enc->m_currentEncodeConfig.m_encoderLevelDesc.m_AV1LevelSetting.Level = targetLevel;
1114
1115 //
1116 // Validate caps support returned values against current settings
1117 //
1118 if (pD3D12Enc->m_currentEncodeConfig.m_encoderProfileDesc.m_AV1Profile !=
1119 pD3D12Enc->m_currentEncodeCapabilities.m_encoderSuggestedProfileDesc.m_AV1Profile) {
1120 debug_printf("[d3d12_video_encoder_av1] Warning: Requested D3D12_VIDEO_ENCODER_PROFILE_AV1 by upper layer: %d "
1121 "mismatches UMD suggested D3D12_VIDEO_ENCODER_PROFILE_AV1: %d\n",
1122 pD3D12Enc->m_currentEncodeConfig.m_encoderProfileDesc.m_AV1Profile,
1123 pD3D12Enc->m_currentEncodeCapabilities.m_encoderSuggestedProfileDesc.m_AV1Profile);
1124 }
1125
1126 if ((pD3D12Enc->m_currentEncodeConfig.m_encoderLevelDesc.m_AV1LevelSetting.Level !=
1127 pD3D12Enc->m_currentEncodeCapabilities.m_encoderLevelSuggestedDesc.m_AV1LevelSetting.Level) ||
1128 (pD3D12Enc->m_currentEncodeConfig.m_encoderLevelDesc.m_AV1LevelSetting.Tier !=
1129 pD3D12Enc->m_currentEncodeCapabilities.m_encoderLevelSuggestedDesc.m_AV1LevelSetting.Tier)) {
1130 debug_printf(
1131 "[d3d12_video_encoder_av1] Warning: Requested D3D12_VIDEO_ENCODER_LEVELS_AV1 by upper layer: level %d tier %d "
1132 "mismatches UMD suggested D3D12_VIDEO_ENCODER_LEVELS_AV1: level %d tier %d\n",
1133 pD3D12Enc->m_currentEncodeConfig.m_encoderLevelDesc.m_AV1LevelSetting.Level,
1134 pD3D12Enc->m_currentEncodeConfig.m_encoderLevelDesc.m_AV1LevelSetting.Tier,
1135 pD3D12Enc->m_currentEncodeCapabilities.m_encoderLevelSuggestedDesc.m_AV1LevelSetting.Level,
1136 pD3D12Enc->m_currentEncodeCapabilities.m_encoderLevelSuggestedDesc.m_AV1LevelSetting.Tier);
1137 }
1138
1139 // Set codec config
1140 bool is_supported = false;
1141 auto targetCodecConfig = d3d12_video_encoder_convert_av1_codec_configuration(pD3D12Enc, av1Pic, is_supported);
1142 if (!is_supported) {
1143 return false;
1144 }
1145
1146 if (memcmp(&pD3D12Enc->m_currentEncodeConfig.m_encoderCodecSpecificConfigDesc.m_AV1Config,
1147 &targetCodecConfig,
1148 sizeof(D3D12_VIDEO_ENCODER_AV1_CODEC_CONFIGURATION)) != 0) {
1149 pD3D12Enc->m_currentEncodeConfig.m_ConfigDirtyFlags |= d3d12_video_encoder_config_dirty_flag_codec_config;
1150 }
1151 pD3D12Enc->m_currentEncodeConfig.m_encoderCodecSpecificConfigDesc.m_AV1Config = targetCodecConfig;
1152
1153 // Set rate control
1154 d3d12_video_encoder_update_current_rate_control_av1(pD3D12Enc, av1Pic);
1155
1156 // Set tiles config
1157 if (!d3d12_video_encoder_negotiate_current_av1_tiles_configuration(pD3D12Enc, av1Pic)) {
1158 debug_printf("d3d12_video_encoder_negotiate_current_av1_tiles_configuration failed!\n");
1159 return false;
1160 }
1161
1162 // Set GOP config
1163 if (!d3d12_video_encoder_update_av1_gop_configuration(pD3D12Enc, av1Pic)) {
1164 debug_printf("d3d12_video_encoder_update_av1_gop_configuration failed!\n");
1165 return false;
1166 }
1167
1168 // Set intra-refresh config
1169 if(!d3d12_video_encoder_update_intra_refresh_av1(pD3D12Enc, srcTextureDesc, av1Pic)) {
1170 debug_printf("d3d12_video_encoder_update_intra_refresh_av1 failed!\n");
1171 return false;
1172 }
1173
1174 // m_currentEncodeConfig.m_encoderPicParamsDesc pic params are set in d3d12_video_encoder_reconfigure_encoder_objects
1175 // after re-allocating objects if needed
1176
1177 // Set motion estimation config
1178 auto targetMotionLimit = d3d12_video_encoder_convert_av1_motion_configuration(pD3D12Enc, av1Pic);
1179 if (pD3D12Enc->m_currentEncodeConfig.m_encoderMotionPrecisionLimit != targetMotionLimit) {
1180 pD3D12Enc->m_currentEncodeConfig.m_ConfigDirtyFlags |=
1181 d3d12_video_encoder_config_dirty_flag_motion_precision_limit;
1182 }
1183 pD3D12Enc->m_currentEncodeConfig.m_encoderMotionPrecisionLimit = targetMotionLimit;
1184
1185 // Will call for d3d12 driver support based on the initial requested (non codec specific) features, then
1186 // try to fallback if any of them is not supported and return the negotiated d3d12 settings
1187 D3D12_FEATURE_DATA_VIDEO_ENCODER_SUPPORT1 capEncoderSupportData1 = {};
1188 if (!d3d12_video_encoder_negotiate_requested_features_and_d3d12_driver_caps(pD3D12Enc, capEncoderSupportData1)) {
1189 debug_printf("[d3d12_video_encoder_av1] After negotiating caps, D3D12_FEATURE_VIDEO_ENCODER_SUPPORT1 "
1190 "arguments are not supported - "
1191 "ValidationFlags: 0x%x - SupportFlags: 0x%x\n",
1192 capEncoderSupportData1.ValidationFlags,
1193 capEncoderSupportData1.SupportFlags);
1194 return false;
1195 }
1196
1197 pD3D12Enc->m_currentEncodeCapabilities.m_MaxSlicesInOutput = (av1Pic->tile_cols * av1Pic->tile_rows);
1198 if (pD3D12Enc->m_currentEncodeCapabilities.m_MaxSlicesInOutput >
1199 pD3D12Enc->m_currentEncodeCapabilities.m_currentResolutionSupportCaps.MaxSubregionsNumber) {
1200 debug_printf("[d3d12_video_encoder_av1] Desired number of subregions is not supported (higher than max "
1201 "reported slice number in query caps)\n.");
1202 return false;
1203 }
1204
1205 return true;
1206 }
1207
1208 /*
1209 * Called at begin_frame record time
1210 */
1211 void
d3d12_video_encoder_update_current_frame_pic_params_info_av1(struct d3d12_video_encoder * pD3D12Enc,struct pipe_video_buffer * srcTexture,struct pipe_picture_desc * picture,D3D12_VIDEO_ENCODER_PICTURE_CONTROL_CODEC_DATA & picParams,bool & bUsedAsReference)1212 d3d12_video_encoder_update_current_frame_pic_params_info_av1(struct d3d12_video_encoder *pD3D12Enc,
1213 struct pipe_video_buffer *srcTexture,
1214 struct pipe_picture_desc *picture,
1215 D3D12_VIDEO_ENCODER_PICTURE_CONTROL_CODEC_DATA &picParams,
1216 bool &bUsedAsReference)
1217 {
1218 struct pipe_av1_enc_picture_desc *pAV1Pic = (struct pipe_av1_enc_picture_desc *) picture;
1219
1220 // Output param bUsedAsReference
1221 bUsedAsReference = (pAV1Pic->refresh_frame_flags != 0);
1222
1223 // D3D12_VIDEO_ENCODER_AV1_PICTURE_CONTROL_FLAGS Flags;
1224 picParams.pAV1PicData->Flags = D3D12_VIDEO_ENCODER_AV1_PICTURE_CONTROL_FLAG_NONE;
1225
1226 if (pAV1Pic->error_resilient_mode)
1227 picParams.pAV1PicData->Flags |= D3D12_VIDEO_ENCODER_AV1_PICTURE_CONTROL_FLAG_ENABLE_ERROR_RESILIENT_MODE;
1228
1229 if (pAV1Pic->disable_cdf_update)
1230 picParams.pAV1PicData->Flags |= D3D12_VIDEO_ENCODER_AV1_PICTURE_CONTROL_FLAG_DISABLE_CDF_UPDATE;
1231
1232 if (pAV1Pic->palette_mode_enable)
1233 picParams.pAV1PicData->Flags |= D3D12_VIDEO_ENCODER_AV1_PICTURE_CONTROL_FLAG_ENABLE_PALETTE_ENCODING;
1234
1235 // Override if required feature
1236 if ((pD3D12Enc->m_currentEncodeCapabilities.m_encoderCodecSpecificConfigCaps.m_AV1CodecCaps.RequiredFeatureFlags &
1237 D3D12_VIDEO_ENCODER_AV1_FEATURE_FLAG_PALETTE_ENCODING) != 0) {
1238 debug_printf("[d3d12_video_encoder_update_current_frame_pic_params_info_av1] Overriding required feature "
1239 "D3D12_VIDEO_ENCODER_AV1_PICTURE_CONTROL_FLAG_ENABLE_PALETTE_ENCODING\n");
1240 picParams.pAV1PicData->Flags |= D3D12_VIDEO_ENCODER_AV1_PICTURE_CONTROL_FLAG_ENABLE_PALETTE_ENCODING;
1241 }
1242
1243 if (pAV1Pic->skip_mode_present)
1244 picParams.pAV1PicData->Flags |= D3D12_VIDEO_ENCODER_AV1_PICTURE_CONTROL_FLAG_ENABLE_SKIP_MODE;
1245
1246 if ((pD3D12Enc->m_currentEncodeCapabilities.m_encoderCodecSpecificConfigCaps.m_AV1CodecCaps.RequiredFeatureFlags &
1247 D3D12_VIDEO_ENCODER_AV1_FEATURE_FLAG_SKIP_MODE_PRESENT) != 0) {
1248 debug_printf("[d3d12_video_encoder_update_current_frame_pic_params_info_av1] Overriding required feature "
1249 "D3D12_VIDEO_ENCODER_AV1_PICTURE_CONTROL_FLAG_ENABLE_SKIP_MODE\n");
1250 picParams.pAV1PicData->Flags |= D3D12_VIDEO_ENCODER_AV1_PICTURE_CONTROL_FLAG_ENABLE_SKIP_MODE;
1251 }
1252
1253 if (pAV1Pic->use_ref_frame_mvs)
1254 picParams.pAV1PicData->Flags |= D3D12_VIDEO_ENCODER_AV1_PICTURE_CONTROL_FLAG_FRAME_REFERENCE_MOTION_VECTORS;
1255
1256 // Override if required feature
1257 if ((pD3D12Enc->m_currentEncodeCapabilities.m_encoderCodecSpecificConfigCaps.m_AV1CodecCaps.RequiredFeatureFlags &
1258 D3D12_VIDEO_ENCODER_AV1_FEATURE_FLAG_FRAME_REFERENCE_MOTION_VECTORS) != 0) {
1259 debug_printf("[d3d12_video_encoder_update_current_frame_pic_params_info_av1] Overriding required feature "
1260 "D3D12_VIDEO_ENCODER_AV1_PICTURE_CONTROL_FLAG_FRAME_REFERENCE_MOTION_VECTORS\n");
1261 picParams.pAV1PicData->Flags |= D3D12_VIDEO_ENCODER_AV1_PICTURE_CONTROL_FLAG_FRAME_REFERENCE_MOTION_VECTORS;
1262 }
1263
1264 // No pipe flag for force_integer_mv (D3D12_VIDEO_ENCODER_AV1_PICTURE_CONTROL_FLAG_FORCE_INTEGER_MOTION_VECTORS)
1265 // choose default based on required/supported underlying codec flags
1266 if ((pD3D12Enc->m_currentEncodeCapabilities.m_encoderCodecSpecificConfigCaps.m_AV1CodecCaps.RequiredFeatureFlags &
1267 D3D12_VIDEO_ENCODER_AV1_FEATURE_FLAG_FORCED_INTEGER_MOTION_VECTORS) != 0) {
1268 debug_printf("[d3d12_video_encoder_update_current_frame_pic_params_info_av1] Overriding required feature "
1269 "D3D12_VIDEO_ENCODER_AV1_PICTURE_CONTROL_FLAG_FORCE_INTEGER_MOTION_VECTORS\n");
1270 picParams.pAV1PicData->Flags |= D3D12_VIDEO_ENCODER_AV1_PICTURE_CONTROL_FLAG_FORCE_INTEGER_MOTION_VECTORS;
1271 }
1272
1273 if (pAV1Pic->allow_intrabc)
1274 picParams.pAV1PicData->Flags |= D3D12_VIDEO_ENCODER_AV1_PICTURE_CONTROL_FLAG_ALLOW_INTRA_BLOCK_COPY;
1275
1276 // Override if required feature
1277 if ((pD3D12Enc->m_currentEncodeCapabilities.m_encoderCodecSpecificConfigCaps.m_AV1CodecCaps.RequiredFeatureFlags &
1278 D3D12_VIDEO_ENCODER_AV1_FEATURE_FLAG_INTRA_BLOCK_COPY) != 0) {
1279 debug_printf("[d3d12_video_encoder_update_current_frame_pic_params_info_av1] Overriding required feature "
1280 "D3D12_VIDEO_ENCODER_AV1_PICTURE_CONTROL_FLAG_ALLOW_INTRA_BLOCK_COPY\n");
1281 picParams.pAV1PicData->Flags |= D3D12_VIDEO_ENCODER_AV1_PICTURE_CONTROL_FLAG_ALLOW_INTRA_BLOCK_COPY;
1282 }
1283
1284 if (pAV1Pic->use_superres)
1285 picParams.pAV1PicData->Flags |= D3D12_VIDEO_ENCODER_AV1_PICTURE_CONTROL_FLAG_USE_SUPER_RESOLUTION;
1286
1287 if (pAV1Pic->disable_frame_end_update_cdf)
1288 picParams.pAV1PicData->Flags |= D3D12_VIDEO_ENCODER_AV1_PICTURE_CONTROL_FLAG_DISABLE_FRAME_END_UPDATE_CDF;
1289
1290 // No pipe flag for D3D12_VIDEO_ENCODER_AV1_PICTURE_CONTROL_FLAG_ENABLE_FRAME_SEGMENTATION_AUTO
1291 // choose default based on required/supported underlying codec flags
1292 if ((pD3D12Enc->m_currentEncodeCapabilities.m_encoderCodecSpecificConfigCaps.m_AV1CodecCaps.RequiredFeatureFlags &
1293 D3D12_VIDEO_ENCODER_AV1_FEATURE_FLAG_AUTO_SEGMENTATION) != 0) {
1294 debug_printf("[d3d12_video_encoder_update_current_frame_pic_params_info_av1] Overriding required feature "
1295 "D3D12_VIDEO_ENCODER_AV1_PICTURE_CONTROL_FLAG_ENABLE_FRAME_SEGMENTATION_AUTO\n");
1296 picParams.pAV1PicData->Flags |= D3D12_VIDEO_ENCODER_AV1_PICTURE_CONTROL_FLAG_ENABLE_FRAME_SEGMENTATION_AUTO;
1297 }
1298
1299 // No pipe flag for D3D12_VIDEO_ENCODER_AV1_PICTURE_CONTROL_FLAG_ENABLE_FRAME_SEGMENTATION_CUSTOM
1300 // choose default based on required/supported underlying codec flags
1301 if ((pD3D12Enc->m_currentEncodeCapabilities.m_encoderCodecSpecificConfigCaps.m_AV1CodecCaps.RequiredFeatureFlags &
1302 D3D12_VIDEO_ENCODER_AV1_FEATURE_FLAG_CUSTOM_SEGMENTATION) != 0) {
1303 debug_printf("[d3d12_video_encoder_update_current_frame_pic_params_info_av1] Overriding required feature "
1304 "D3D12_VIDEO_ENCODER_AV1_PICTURE_CONTROL_FLAG_ENABLE_FRAME_SEGMENTATION_CUSTOM\n");
1305 picParams.pAV1PicData->Flags |= D3D12_VIDEO_ENCODER_AV1_PICTURE_CONTROL_FLAG_ENABLE_FRAME_SEGMENTATION_CUSTOM;
1306 assert(false); // Not implemented
1307 }
1308
1309 // No pipe flag for allow_warped_motion (D3D12_VIDEO_ENCODER_AV1_PICTURE_CONTROL_FLAG_ENABLE_WARPED_MOTION)
1310 // choose default based on required/supported underlying codec flags
1311 if ((pD3D12Enc->m_currentEncodeCapabilities.m_encoderCodecSpecificConfigCaps.m_AV1CodecCaps.RequiredFeatureFlags &
1312 D3D12_VIDEO_ENCODER_AV1_FEATURE_FLAG_WARPED_MOTION) != 0) {
1313 debug_printf("[d3d12_video_encoder_update_current_frame_pic_params_info_av1] Overriding required feature "
1314 "D3D12_VIDEO_ENCODER_AV1_PICTURE_CONTROL_FLAG_ENABLE_WARPED_MOTION\n");
1315 picParams.pAV1PicData->Flags |= D3D12_VIDEO_ENCODER_AV1_PICTURE_CONTROL_FLAG_ENABLE_WARPED_MOTION;
1316 }
1317
1318 // Only enable if supported (there is no PIPE/VA cap flag for reduced_tx_set)
1319 if ((pAV1Pic->reduced_tx_set) &&
1320 (pD3D12Enc->m_currentEncodeCapabilities.m_encoderCodecSpecificConfigCaps.m_AV1CodecCaps.SupportedFeatureFlags &
1321 D3D12_VIDEO_ENCODER_AV1_FEATURE_FLAG_REDUCED_TX_SET) != 0) {
1322 picParams.pAV1PicData->Flags |= D3D12_VIDEO_ENCODER_AV1_PICTURE_CONTROL_FLAG_REDUCED_TX_SET;
1323 }
1324
1325 // Override if required feature
1326 if ((pD3D12Enc->m_currentEncodeCapabilities.m_encoderCodecSpecificConfigCaps.m_AV1CodecCaps.RequiredFeatureFlags &
1327 D3D12_VIDEO_ENCODER_AV1_FEATURE_FLAG_REDUCED_TX_SET) != 0) {
1328 debug_printf("[d3d12_video_encoder_update_current_frame_pic_params_info_av1] Overriding required feature "
1329 "D3D12_VIDEO_ENCODER_AV1_PICTURE_CONTROL_FLAG_REDUCED_TX_SET\n");
1330 picParams.pAV1PicData->Flags |= D3D12_VIDEO_ENCODER_AV1_PICTURE_CONTROL_FLAG_REDUCED_TX_SET;
1331 }
1332
1333 // Only enable if supported
1334 if ((pAV1Pic->allow_high_precision_mv) &&
1335 (pD3D12Enc->m_currentEncodeCapabilities.m_encoderCodecSpecificConfigCaps.m_AV1CodecCaps.SupportedFeatureFlags &
1336 D3D12_VIDEO_ENCODER_AV1_FEATURE_FLAG_ALLOW_HIGH_PRECISION_MV) != 0) {
1337 picParams.pAV1PicData->Flags |= D3D12_VIDEO_ENCODER_AV1_PICTURE_CONTROL_FLAG_ALLOW_HIGH_PRECISION_MV;
1338 }
1339
1340 // Override if required feature
1341 if ((pD3D12Enc->m_currentEncodeCapabilities.m_encoderCodecSpecificConfigCaps.m_AV1CodecCaps.RequiredFeatureFlags &
1342 D3D12_VIDEO_ENCODER_AV1_FEATURE_FLAG_ALLOW_HIGH_PRECISION_MV) != 0) {
1343 debug_printf("[d3d12_video_encoder_update_current_frame_pic_params_info_av1] Overriding required feature "
1344 "D3D12_VIDEO_ENCODER_AV1_PICTURE_CONTROL_FLAG_ALLOW_HIGH_PRECISION_MV\n");
1345 picParams.pAV1PicData->Flags |= D3D12_VIDEO_ENCODER_AV1_PICTURE_CONTROL_FLAG_ALLOW_HIGH_PRECISION_MV;
1346 }
1347
1348 // No pipe flag for is_motion_mode_switchable (D3D12_VIDEO_ENCODER_AV1_PICTURE_CONTROL_FLAG_MOTION_MODE_SWITCHABLE)
1349 // choose default based on required/supported underlying codec flags
1350 if ((pD3D12Enc->m_currentEncodeCapabilities.m_encoderCodecSpecificConfigCaps.m_AV1CodecCaps.RequiredFeatureFlags &
1351 D3D12_VIDEO_ENCODER_AV1_FEATURE_FLAG_MOTION_MODE_SWITCHABLE) != 0) {
1352 debug_printf("[d3d12_video_encoder_update_current_frame_pic_params_info_av1] Overriding required feature "
1353 "D3D12_VIDEO_ENCODER_AV1_PICTURE_CONTROL_FLAG_MOTION_MODE_SWITCHABLE\n");
1354 picParams.pAV1PicData->Flags |= D3D12_VIDEO_ENCODER_AV1_PICTURE_CONTROL_FLAG_MOTION_MODE_SWITCHABLE;
1355 }
1356
1357 // D3D12_VIDEO_ENCODER_AV1_FRAME_TYPE FrameType;
1358 // AV1 spec matches w/D3D12 enum definition
1359 picParams.pAV1PicData->FrameType = static_cast<D3D12_VIDEO_ENCODER_AV1_FRAME_TYPE>(pAV1Pic->frame_type);
1360
1361 if (picParams.pAV1PicData->FrameType == D3D12_VIDEO_ENCODER_AV1_FRAME_TYPE_KEY_FRAME)
1362 debug_printf("Encoding FrameType: D3D12_VIDEO_ENCODER_AV1_FRAME_TYPE_KEY_FRAME\n");
1363 if (picParams.pAV1PicData->FrameType == D3D12_VIDEO_ENCODER_AV1_FRAME_TYPE_INTER_FRAME)
1364 debug_printf("Encoding FrameType: D3D12_VIDEO_ENCODER_AV1_FRAME_TYPE_INTER_FRAME\n");
1365 if (picParams.pAV1PicData->FrameType == D3D12_VIDEO_ENCODER_AV1_FRAME_TYPE_INTRA_ONLY_FRAME)
1366 debug_printf("Encoding FrameType: D3D12_VIDEO_ENCODER_AV1_FRAME_TYPE_INTRA_ONLY_FRAME\n");
1367 if (picParams.pAV1PicData->FrameType == D3D12_VIDEO_ENCODER_AV1_FRAME_TYPE_SWITCH_FRAME)
1368 debug_printf("Encoding FrameType: D3D12_VIDEO_ENCODER_AV1_FRAME_TYPE_SWITCH_FRAME\n");
1369
1370 // D3D12_VIDEO_ENCODER_AV1_COMP_PREDICTION_TYPE CompoundPredictionType;
1371 picParams.pAV1PicData->CompoundPredictionType = (pAV1Pic->compound_reference_mode == 0) ?
1372 D3D12_VIDEO_ENCODER_AV1_COMP_PREDICTION_TYPE_SINGLE_REFERENCE :
1373 D3D12_VIDEO_ENCODER_AV1_COMP_PREDICTION_TYPE_COMPOUND_REFERENCE;
1374
1375 // D3D12_VIDEO_ENCODER_AV1_INTERPOLATION_FILTERS InterpolationFilter;
1376 // AV1 spec matches w/D3D12 enum definition
1377 picParams.pAV1PicData->InterpolationFilter =
1378 static_cast<D3D12_VIDEO_ENCODER_AV1_INTERPOLATION_FILTERS>(pAV1Pic->interpolation_filter);
1379
1380 // Workaround for apps sending interpolation_filter values not supported even when reporting
1381 // them in pipe_av1_enc_cap_features_ext1.interpolation_filter. If D3D12 driver doesn't support
1382 // requested InterpolationFilter, fallback to the first supported by D3D12 driver
1383 if ( (pD3D12Enc->m_currentEncodeCapabilities.m_encoderCodecSpecificConfigCaps.m_AV1CodecCaps.SupportedInterpolationFilters &
1384 (1 << picParams.pAV1PicData->InterpolationFilter)) == 0 ) { /* See definition of D3D12_VIDEO_ENCODER_AV1_INTERPOLATION_FILTERS_FLAGS */
1385 debug_printf("[d3d12_video_encoder_update_current_frame_pic_params_info_av1] Requested interpolation_filter"
1386 " not supported in pipe_av1_enc_cap_features_ext1.interpolation_filter"
1387 ", auto selecting from D3D12 SupportedInterpolationFilters...");
1388 for(uint8_t i = D3D12_VIDEO_ENCODER_AV1_INTERPOLATION_FILTERS_EIGHTTAP; i <= D3D12_VIDEO_ENCODER_AV1_INTERPOLATION_FILTERS_SWITCHABLE; i++) {
1389 if ((pD3D12Enc->m_currentEncodeCapabilities.m_encoderCodecSpecificConfigCaps.m_AV1CodecCaps.SupportedInterpolationFilters &
1390 (1 << i)) /* See definition of D3D12_VIDEO_ENCODER_AV1_INTERPOLATION_FILTERS_FLAGS */ != 0) {
1391 picParams.pAV1PicData->InterpolationFilter = static_cast<D3D12_VIDEO_ENCODER_AV1_INTERPOLATION_FILTERS>(i);
1392 break;
1393 }
1394 }
1395 }
1396
1397 // D3D12_VIDEO_ENCODER_AV1_RESTORATION_CONFIG FrameRestorationConfig;
1398 // AV1 spec matches w/D3D12 FrameRestorationType enum definition
1399
1400 picParams.pAV1PicData->FrameRestorationConfig.FrameRestorationType[0] =
1401 static_cast<D3D12_VIDEO_ENCODER_AV1_RESTORATION_TYPE>(pAV1Pic->restoration.yframe_restoration_type);
1402 picParams.pAV1PicData->FrameRestorationConfig.FrameRestorationType[1] =
1403 static_cast<D3D12_VIDEO_ENCODER_AV1_RESTORATION_TYPE>(pAV1Pic->restoration.cbframe_restoration_type);
1404 picParams.pAV1PicData->FrameRestorationConfig.FrameRestorationType[2] =
1405 static_cast<D3D12_VIDEO_ENCODER_AV1_RESTORATION_TYPE>(pAV1Pic->restoration.crframe_restoration_type);
1406
1407 if (picParams.pAV1PicData->FrameRestorationConfig.FrameRestorationType[0] !=
1408 D3D12_VIDEO_ENCODER_AV1_RESTORATION_TYPE_DISABLED) {
1409 picParams.pAV1PicData->FrameRestorationConfig.LoopRestorationPixelSize[0] =
1410 d3d12_video_encoder_looprestorationsize_uint_to_d3d12_av1(1 << (6 + pAV1Pic->restoration.lr_unit_shift));
1411 }
1412
1413 if (picParams.pAV1PicData->FrameRestorationConfig.FrameRestorationType[1] !=
1414 D3D12_VIDEO_ENCODER_AV1_RESTORATION_TYPE_DISABLED) {
1415 picParams.pAV1PicData->FrameRestorationConfig.LoopRestorationPixelSize[1] =
1416 d3d12_video_encoder_looprestorationsize_uint_to_d3d12_av1(
1417 1 << (6 + pAV1Pic->restoration.lr_unit_shift - pAV1Pic->restoration.lr_uv_shift));
1418 }
1419
1420 if (picParams.pAV1PicData->FrameRestorationConfig.FrameRestorationType[2] !=
1421 D3D12_VIDEO_ENCODER_AV1_RESTORATION_TYPE_DISABLED) {
1422 picParams.pAV1PicData->FrameRestorationConfig.LoopRestorationPixelSize[2] =
1423 d3d12_video_encoder_looprestorationsize_uint_to_d3d12_av1(
1424 1 << (6 + pAV1Pic->restoration.lr_unit_shift - pAV1Pic->restoration.lr_uv_shift));
1425 }
1426
1427 // D3D12_VIDEO_ENCODER_AV1_TX_MODE TxMode;
1428 // AV1 spec matches w/D3D12 enum definition
1429 picParams.pAV1PicData->TxMode = static_cast<D3D12_VIDEO_ENCODER_AV1_TX_MODE>(pAV1Pic->tx_mode);
1430
1431 // Workaround for mismatch between VAAPI/D3D12 and TxMode support for all/some frame types
1432 // If D3D12 driver doesn't support requested TxMode, fallback to the first supported by D3D12
1433 // driver for the requested frame type
1434 if ((pD3D12Enc->m_currentEncodeCapabilities.m_encoderCodecSpecificConfigCaps.m_AV1CodecCaps.SupportedTxModes[picParams.pAV1PicData->FrameType] &
1435 (1 << picParams.pAV1PicData->TxMode)) == 0) /* See definition of D3D12_VIDEO_ENCODER_AV1_TX_MODE_FLAGS */ {
1436 debug_printf("[d3d12_video_encoder_update_current_frame_pic_params_info_av1] Requested tx_mode not supported"
1437 ", auto selecting from D3D12 SupportedTxModes for current frame type...");
1438 for(uint8_t i = D3D12_VIDEO_ENCODER_AV1_TX_MODE_ONLY4x4; i <= D3D12_VIDEO_ENCODER_AV1_TX_MODE_SELECT; i++) {
1439 if ((pD3D12Enc->m_currentEncodeCapabilities.m_encoderCodecSpecificConfigCaps.m_AV1CodecCaps.SupportedTxModes[picParams.pAV1PicData->FrameType] &
1440 (1 << i)) /* See definition of D3D12_VIDEO_ENCODER_AV1_TX_MODE_FLAGS */ != 0) {
1441 picParams.pAV1PicData->TxMode = static_cast<D3D12_VIDEO_ENCODER_AV1_TX_MODE>(i);
1442 break;
1443 }
1444 }
1445 }
1446
1447 // UINT SuperResDenominator;
1448 picParams.pAV1PicData->SuperResDenominator = pAV1Pic->superres_scale_denominator;
1449
1450 // UINT OrderHint;
1451 picParams.pAV1PicData->OrderHint = pAV1Pic->order_hint;
1452
1453 // UINT PictureIndex - Substract the last_key_frame_num to make it modulo KEY frame
1454 picParams.pAV1PicData->PictureIndex = pAV1Pic->frame_num - pAV1Pic->last_key_frame_num;
1455
1456 // UINT TemporalLayerIndexPlus1;
1457 assert(pAV1Pic->temporal_id == pAV1Pic->tg_obu_header.temporal_id);
1458 picParams.pAV1PicData->TemporalLayerIndexPlus1 = pAV1Pic->temporal_id + 1;
1459
1460 // UINT SpatialLayerIndexPlus1;
1461 picParams.pAV1PicData->SpatialLayerIndexPlus1 = pAV1Pic->tg_obu_header.spatial_id + 1;
1462
1463 //
1464 // Reference Pictures
1465 //
1466 {
1467 for (uint8_t i = 0; i < ARRAY_SIZE(picParams.pAV1PicData->ReferenceIndices); i++) {
1468 picParams.pAV1PicData->ReferenceIndices[i] = pAV1Pic->ref_frame_idx[i];
1469 }
1470
1471 bool FrameIsIntra = (picParams.pAV1PicData->FrameType == D3D12_VIDEO_ENCODER_AV1_FRAME_TYPE_INTRA_ONLY_FRAME ||
1472 picParams.pAV1PicData->FrameType == D3D12_VIDEO_ENCODER_AV1_FRAME_TYPE_KEY_FRAME);
1473 if (FrameIsIntra)
1474 picParams.pAV1PicData->PrimaryRefFrame = 7; /* PRIMARY_REF_NONE */
1475 else
1476 picParams.pAV1PicData->PrimaryRefFrame = pAV1Pic->primary_ref_frame;
1477 debug_printf("App requested primary_ref_frame: %" PRIu32 "\n", pAV1Pic->primary_ref_frame);
1478 picParams.pAV1PicData->RefreshFrameFlags = pAV1Pic->refresh_frame_flags;
1479 }
1480
1481 // D3D12_VIDEO_ENCODER_CODEC_AV1_LOOP_FILTER_CONFIG LoopFilter;
1482 picParams.pAV1PicData->LoopFilter.LoopFilterLevel[0] = pAV1Pic->loop_filter.filter_level[0];
1483 picParams.pAV1PicData->LoopFilter.LoopFilterLevel[1] = pAV1Pic->loop_filter.filter_level[1];
1484 picParams.pAV1PicData->LoopFilter.LoopFilterLevelU = pAV1Pic->loop_filter.filter_level_u;
1485 picParams.pAV1PicData->LoopFilter.LoopFilterLevelV = pAV1Pic->loop_filter.filter_level_v;
1486 picParams.pAV1PicData->LoopFilter.LoopFilterSharpnessLevel = pAV1Pic->loop_filter.sharpness_level;
1487 picParams.pAV1PicData->LoopFilter.LoopFilterDeltaEnabled = pAV1Pic->loop_filter.mode_ref_delta_enabled;
1488 picParams.pAV1PicData->LoopFilter.UpdateRefDelta = pAV1Pic->loop_filter.mode_ref_delta_update;
1489 if (picParams.pAV1PicData->LoopFilter.UpdateRefDelta) {
1490 for (uint8_t i = 0; i < ARRAY_SIZE(picParams.pAV1PicData->LoopFilter.RefDeltas); i++) {
1491 picParams.pAV1PicData->LoopFilter.RefDeltas[i] = pAV1Pic->loop_filter.ref_deltas[i];
1492 }
1493 }
1494 picParams.pAV1PicData->LoopFilter.UpdateModeDelta = pAV1Pic->loop_filter.mode_ref_delta_update;
1495 if (picParams.pAV1PicData->LoopFilter.UpdateModeDelta) {
1496 for (uint8_t i = 0; i < ARRAY_SIZE(picParams.pAV1PicData->LoopFilter.ModeDeltas); i++) {
1497 picParams.pAV1PicData->LoopFilter.ModeDeltas[i] = pAV1Pic->loop_filter.mode_deltas[i];
1498 }
1499 }
1500
1501 // D3D12_VIDEO_ENCODER_CODEC_AV1_LOOP_FILTER_DELTA_CONFIG LoopFilterDelta;
1502 picParams.pAV1PicData->LoopFilterDelta.DeltaLFMulti = pAV1Pic->loop_filter.delta_lf_multi;
1503 picParams.pAV1PicData->LoopFilterDelta.DeltaLFPresent = pAV1Pic->loop_filter.delta_lf_present;
1504 picParams.pAV1PicData->LoopFilterDelta.DeltaLFRes = pAV1Pic->loop_filter.delta_lf_res;
1505
1506 // D3D12_VIDEO_ENCODER_CODEC_AV1_QUANTIZATION_CONFIG Quantization;
1507 picParams.pAV1PicData->Quantization.BaseQIndex = pAV1Pic->quantization.base_qindex;
1508 picParams.pAV1PicData->Quantization.YDCDeltaQ = pAV1Pic->quantization.y_dc_delta_q;
1509 picParams.pAV1PicData->Quantization.UDCDeltaQ = pAV1Pic->quantization.u_dc_delta_q;
1510 picParams.pAV1PicData->Quantization.UACDeltaQ = pAV1Pic->quantization.u_ac_delta_q;
1511 picParams.pAV1PicData->Quantization.VDCDeltaQ = pAV1Pic->quantization.v_dc_delta_q;
1512 picParams.pAV1PicData->Quantization.VACDeltaQ = pAV1Pic->quantization.v_ac_delta_q;
1513 picParams.pAV1PicData->Quantization.UsingQMatrix = pAV1Pic->quantization.using_qmatrix;
1514 picParams.pAV1PicData->Quantization.QMY = pAV1Pic->quantization.qm_y;
1515 picParams.pAV1PicData->Quantization.QMU = pAV1Pic->quantization.qm_u;
1516 picParams.pAV1PicData->Quantization.QMV = pAV1Pic->quantization.qm_v;
1517
1518 // D3D12_VIDEO_ENCODER_CODEC_AV1_QUANTIZATION_DELTA_CONFIG QuantizationDelta;
1519 picParams.pAV1PicData->QuantizationDelta.DeltaQPresent = pAV1Pic->quantization.delta_q_present;
1520 picParams.pAV1PicData->QuantizationDelta.DeltaQRes = pAV1Pic->quantization.delta_q_res;
1521
1522 // D3D12_VIDEO_ENCODER_AV1_CDEF_CONFIG CDEF;
1523 picParams.pAV1PicData->CDEF.CdefBits = pAV1Pic->cdef.cdef_bits;
1524 picParams.pAV1PicData->CDEF.CdefDampingMinus3 = pAV1Pic->cdef.cdef_damping_minus_3;
1525 for (uint32_t i = 0; i < 8; i++) {
1526 picParams.pAV1PicData->CDEF.CdefYPriStrength[i] = (pAV1Pic->cdef.cdef_y_strengths[i] >> 2);
1527 picParams.pAV1PicData->CDEF.CdefYSecStrength[i] = (pAV1Pic->cdef.cdef_y_strengths[i] & 0x03);
1528 picParams.pAV1PicData->CDEF.CdefUVPriStrength[i] = (pAV1Pic->cdef.cdef_uv_strengths[i] >> 2);
1529 picParams.pAV1PicData->CDEF.CdefUVSecStrength[i] = (pAV1Pic->cdef.cdef_uv_strengths[i] & 0x03);
1530 }
1531
1532 //
1533 // Set values for mandatory but not requested features (ie. RequiredFeature flags reported by driver not requested
1534 // by pipe)
1535 //
1536
1537 // For the ones that are more trivial (ie. 128x128 SB) than enabling their flag, and have more parameters to be
1538 // set (ie Restoration Filter) Set defaults based on such feature driver d3d12 caps
1539
1540 // These are a trivial flag enabling
1541 // D3D12_VIDEO_ENCODER_AV1_FEATURE_FLAG_128x128_SUPERBLOCK
1542 // D3D12_VIDEO_ENCODER_AV1_FEATURE_FLAG_FILTER_INTRA
1543 // D3D12_VIDEO_ENCODER_AV1_FEATURE_FLAG_INTRA_EDGE_FILTER
1544 // D3D12_VIDEO_ENCODER_AV1_FEATURE_FLAG_INTERINTRA_COMPOUND
1545 // D3D12_VIDEO_ENCODER_AV1_FEATURE_FLAG_MASKED_COMPOUND
1546 // D3D12_VIDEO_ENCODER_AV1_FEATURE_FLAG_WARPED_MOTION
1547 // D3D12_VIDEO_ENCODER_AV1_FEATURE_FLAG_DUAL_FILTER
1548 // D3D12_VIDEO_ENCODER_AV1_FEATURE_FLAG_JNT_COMP
1549 // D3D12_VIDEO_ENCODER_AV1_FEATURE_FLAG_FORCED_INTEGER_MOTION_VECTORS
1550 // D3D12_VIDEO_ENCODER_AV1_FEATURE_FLAG_SUPER_RESOLUTION
1551 // D3D12_VIDEO_ENCODER_AV1_FEATURE_FLAG_PALETTE_ENCODING
1552 // D3D12_VIDEO_ENCODER_AV1_FEATURE_FLAG_INTRA_BLOCK_COPY
1553 // D3D12_VIDEO_ENCODER_AV1_FEATURE_FLAG_FRAME_REFERENCE_MOTION_VECTORS
1554 // D3D12_VIDEO_ENCODER_AV1_FEATURE_FLAG_ORDER_HINT_TOOLS
1555 // D3D12_VIDEO_ENCODER_AV1_FEATURE_FLAG_REDUCED_TX_SET
1556 // D3D12_VIDEO_ENCODER_AV1_FEATURE_FLAG_MOTION_MODE_SWITCHABLE
1557 // D3D12_VIDEO_ENCODER_AV1_FEATURE_FLAG_ALLOW_HIGH_PRECISION_MV
1558
1559 // If driver requires these, can use post encode values to enforce specific values
1560 // D3D12_VIDEO_ENCODER_AV1_FEATURE_FLAG_CDEF_FILTERING
1561 // D3D12_VIDEO_ENCODER_AV1_FEATURE_FLAG_AUTO_SEGMENTATION // Only useful with post encode values as driver
1562 // controls D3D12_VIDEO_ENCODER_AV1_FEATURE_FLAG_CUSTOM_SEGMENTATION // There are more Segmentation caps in
1563 // D3D12_VIDEO_ENCODER_AV1_CODEC_CONFIGURATION_SUPPORT for these one too
1564 // D3D12_VIDEO_ENCODER_AV1_FEATURE_FLAG_LOOP_FILTER_DELTAS
1565 // D3D12_VIDEO_ENCODER_AV1_FEATURE_FLAG_QUANTIZATION_DELTAS
1566 // D3D12_VIDEO_ENCODER_AV1_FEATURE_FLAG_QUANTIZATION_MATRIX
1567
1568 // If driver requires this one, use driver restoration caps to set default values
1569 // D3D12_VIDEO_ENCODER_AV1_FEATURE_FLAG_LOOP_RESTORATION_FILTER
1570 if (pD3D12Enc->m_currentEncodeCapabilities.m_encoderCodecSpecificConfigCaps.RequiredNotRequestedFeatureFlags &
1571 D3D12_VIDEO_ENCODER_AV1_FEATURE_FLAG_LOOP_RESTORATION_FILTER) {
1572 debug_printf(
1573 "[d3d12_video_encoder_update_current_frame_pic_params_info_av1] Adding default params for "
1574 "D3D12_VIDEO_ENCODER_AV1_FEATURE_FLAG_LOOP_RESTORATION_FILTER required by caps but not selected already in "
1575 "config.FeatureFlags...\n");
1576
1577 // Set Y, U, V luma plane restoration params
1578 for (uint32_t planeIdx = 0; planeIdx < 3; planeIdx++) {
1579 // Let's see which filters and with which sizes are supported for planeIdx
1580 bool foundSupportedFilter = false;
1581 for (uint32_t filterIdx = 0; ((filterIdx < 3) && !foundSupportedFilter); filterIdx++) {
1582 auto curFilterSupport = pD3D12Enc->m_currentEncodeCapabilities.m_encoderCodecSpecificConfigCaps
1583 .m_AV1CodecCaps.SupportedRestorationParams[filterIdx][planeIdx];
1584 for (uint32_t curFilterSize = D3D12_VIDEO_ENCODER_AV1_RESTORATION_TILESIZE_32x32;
1585 ((curFilterSize <= D3D12_VIDEO_ENCODER_AV1_RESTORATION_TILESIZE_256x256) && !foundSupportedFilter);
1586 curFilterSize++) {
1587
1588 // Check if there's support for curFilter on CurPlane and choose the first supported restoration size
1589 // If yes, set restoration params for planeIdx
1590 if (curFilterSupport &
1591 (1 << (curFilterSize - 1))) { /* Converts D3D12_VIDEO_ENCODER_AV1_RESTORATION_TILESIZE definition
1592 into D3D12_VIDEO_ENCODER_AV1_RESTORATION_SUPPORT_FLAGS definition */
1593 {
1594 foundSupportedFilter = true;
1595 // As per d3d12 spec filterIdx corresponds to D3D12_VIDEO_ENCODER_AV1_RESTORATION_TYPE - 1
1596 // (SupportedRestorationParams definition skips D3D12_VIDEO_ENCODER_AV1_RESTORATION_TYPE_DISABLED)
1597 D3D12_VIDEO_ENCODER_AV1_RESTORATION_TYPE curFilter =
1598 static_cast<D3D12_VIDEO_ENCODER_AV1_RESTORATION_TYPE>(filterIdx + 1);
1599
1600 picParams.pAV1PicData->FrameRestorationConfig.FrameRestorationType[planeIdx] = curFilter;
1601 picParams.pAV1PicData->FrameRestorationConfig.LoopRestorationPixelSize[planeIdx] =
1602 static_cast<D3D12_VIDEO_ENCODER_AV1_RESTORATION_TILESIZE>(
1603 curFilterSize); /* loop uses enum type */
1604 }
1605 }
1606 }
1607 }
1608 }
1609 }
1610
1611 // Save state snapshot from record time to resolve headers at get_feedback time
1612 uint64_t current_metadata_slot = (pD3D12Enc->m_fenceValue % D3D12_VIDEO_ENC_METADATA_BUFFERS_COUNT);
1613 pD3D12Enc->m_spEncodedFrameMetadata[current_metadata_slot].m_associatedEncodeCapabilities =
1614 pD3D12Enc->m_currentEncodeCapabilities;
1615 pD3D12Enc->m_spEncodedFrameMetadata[current_metadata_slot].m_associatedEncodeConfig =
1616 pD3D12Enc->m_currentEncodeConfig;
1617 pD3D12Enc->m_spEncodedFrameMetadata[current_metadata_slot].m_CodecSpecificData.AV1HeadersInfo.enable_frame_obu =
1618 pAV1Pic->enable_frame_obu;
1619 pD3D12Enc->m_spEncodedFrameMetadata[current_metadata_slot].m_CodecSpecificData.AV1HeadersInfo.obu_has_size_field =
1620 (pAV1Pic->tg_obu_header.obu_has_size_field == 1);
1621 // Disabling for now as the libva spec does not allow these but some apps send down anyway. It's possible in the future
1622 // the libva spec may be retro-fitted to allow this given existing apps in the wild doing it.
1623 // pD3D12Enc->m_spEncodedFrameMetadata[current_metadata_slot]
1624 // .m_CodecSpecificData.AV1HeadersInfo.temporal_delim_rendered = pAV1Pic->temporal_delim_rendered;
1625
1626 if ((pD3D12Enc->m_currentEncodeConfig.m_encoderRateControlDesc[pAV1Pic->temporal_id].m_Flags & D3D12_VIDEO_ENCODER_RATE_CONTROL_FLAG_ENABLE_DELTA_QP) != 0)
1627 {
1628 // Use 16 bit qpmap array for AV1 picparams (-255, 255 range and int16_t pRateControlQPMap type)
1629 const int32_t av1_min_delta_qp = -255;
1630 const int32_t av1_max_delta_qp = 255;
1631 d3d12_video_encoder_update_picparams_region_of_interest_qpmap(
1632 pD3D12Enc,
1633 &pAV1Pic->roi,
1634 av1_min_delta_qp,
1635 av1_max_delta_qp,
1636 pD3D12Enc->m_currentEncodeConfig.m_encoderRateControlDesc[pAV1Pic->temporal_id].m_pRateControlQPMap16Bit);
1637 picParams.pAV1PicData->pRateControlQPMap = pD3D12Enc->m_currentEncodeConfig.m_encoderRateControlDesc[pAV1Pic->temporal_id].m_pRateControlQPMap16Bit.data();
1638 picParams.pAV1PicData->QPMapValuesCount = pD3D12Enc->m_currentEncodeConfig.m_encoderRateControlDesc[pAV1Pic->temporal_id].m_pRateControlQPMap16Bit.size();
1639 }
1640 }
1641
1642 void
fill_av1_seq_header(EncodedBitstreamResolvedMetadata & associatedMetadata,av1_seq_header_t * seq_header)1643 fill_av1_seq_header(EncodedBitstreamResolvedMetadata &associatedMetadata, av1_seq_header_t *seq_header)
1644 {
1645 // Set all zero by default
1646 memset(seq_header, 0, sizeof(av1_seq_header_t));
1647
1648 seq_header->seq_profile = d3d12_video_encoder_convert_d3d12_profile_to_spec_profile_av1(
1649 associatedMetadata.m_associatedEncodeConfig.m_encoderProfileDesc.m_AV1Profile);
1650 // seq_header->still_picture; // coded in bitstream by default as 0
1651 // seq_header->reduced_still_picture_header; // coded in bitstream by default as 0
1652 // seq_header->timing_info_present_flag; // coded in bitstream by default as 0
1653 // seq_header->decoder_model_info_present_flag; // coded in bitstream by default as 0
1654 // seq_header->operating_points_cnt_minus_1; // memset default as 0
1655 // seq_header->operating_point_idc[32]; // memset default as 0
1656 d3d12_video_encoder_convert_d3d12_to_spec_level_av1(
1657 associatedMetadata.m_associatedEncodeConfig.m_encoderLevelDesc.m_AV1LevelSetting.Level,
1658 seq_header->seq_level_idx[0]);
1659 d3d12_video_encoder_convert_d3d12_to_spec_tier_av1(
1660 associatedMetadata.m_associatedEncodeConfig.m_encoderLevelDesc.m_AV1LevelSetting.Tier,
1661 seq_header->seq_tier[0]);
1662 // seq_header->decoder_model_present_for_this_op[32]; // memset default as 0
1663 // seq_header->initial_display_delay_present_flag; // coded in bitstream by default as 0
1664 // seq_header->initial_display_delay_minus_1[32];
1665 // seq_header->initial_display_delay_present_for_this_op[32]
1666 // seq_header->frame_width_bits; // coded in bitstream by default as 16
1667 // seq_header->frame_height_bits; // coded in bitstream by default as 16
1668
1669 // frame_size (comes from input texture size)
1670 seq_header->max_frame_width = associatedMetadata.m_associatedEncodeConfig.m_currentResolution.Width;
1671 seq_header->max_frame_height = associatedMetadata.m_associatedEncodeConfig.m_currentResolution.Height;
1672
1673 // seq_header->frame_id_numbers_present_flag; // coded in bitstream by default as 0
1674 seq_header->use_128x128_superblock =
1675 ((associatedMetadata.m_associatedEncodeConfig.m_encoderCodecSpecificConfigDesc.m_AV1Config.FeatureFlags &
1676 D3D12_VIDEO_ENCODER_AV1_FEATURE_FLAG_128x128_SUPERBLOCK) != 0) ?
1677 1 :
1678 0;
1679 seq_header->enable_filter_intra =
1680 ((associatedMetadata.m_associatedEncodeConfig.m_encoderCodecSpecificConfigDesc.m_AV1Config.FeatureFlags &
1681 D3D12_VIDEO_ENCODER_AV1_FEATURE_FLAG_FILTER_INTRA) != 0) ?
1682 1 :
1683 0;
1684 seq_header->enable_intra_edge_filter =
1685 ((associatedMetadata.m_associatedEncodeConfig.m_encoderCodecSpecificConfigDesc.m_AV1Config.FeatureFlags &
1686 D3D12_VIDEO_ENCODER_AV1_FEATURE_FLAG_INTRA_EDGE_FILTER) != 0) ?
1687 1 :
1688 0;
1689 seq_header->enable_interintra_compound =
1690 ((associatedMetadata.m_associatedEncodeConfig.m_encoderCodecSpecificConfigDesc.m_AV1Config.FeatureFlags &
1691 D3D12_VIDEO_ENCODER_AV1_FEATURE_FLAG_INTERINTRA_COMPOUND) != 0) ?
1692 1 :
1693 0;
1694 seq_header->enable_masked_compound =
1695 ((associatedMetadata.m_associatedEncodeConfig.m_encoderCodecSpecificConfigDesc.m_AV1Config.FeatureFlags &
1696 D3D12_VIDEO_ENCODER_AV1_FEATURE_FLAG_MASKED_COMPOUND) != 0) ?
1697 1 :
1698 0;
1699 seq_header->enable_warped_motion =
1700 ((associatedMetadata.m_associatedEncodeConfig.m_encoderCodecSpecificConfigDesc.m_AV1Config.FeatureFlags &
1701 D3D12_VIDEO_ENCODER_AV1_FEATURE_FLAG_WARPED_MOTION) != 0) ?
1702 1 :
1703 0;
1704 seq_header->enable_dual_filter =
1705 ((associatedMetadata.m_associatedEncodeConfig.m_encoderCodecSpecificConfigDesc.m_AV1Config.FeatureFlags &
1706 D3D12_VIDEO_ENCODER_AV1_FEATURE_FLAG_DUAL_FILTER) != 0) ?
1707 1 :
1708 0;
1709 seq_header->enable_order_hint =
1710 ((associatedMetadata.m_associatedEncodeConfig.m_encoderCodecSpecificConfigDesc.m_AV1Config.FeatureFlags &
1711 D3D12_VIDEO_ENCODER_AV1_FEATURE_FLAG_ORDER_HINT_TOOLS) != 0) ?
1712 1 :
1713 0;
1714 seq_header->enable_jnt_comp =
1715 ((associatedMetadata.m_associatedEncodeConfig.m_encoderCodecSpecificConfigDesc.m_AV1Config.FeatureFlags &
1716 D3D12_VIDEO_ENCODER_AV1_FEATURE_FLAG_JNT_COMP) != 0) ?
1717 1 :
1718 0;
1719 seq_header->enable_ref_frame_mvs =
1720 ((associatedMetadata.m_associatedEncodeConfig.m_encoderCodecSpecificConfigDesc.m_AV1Config.FeatureFlags &
1721 D3D12_VIDEO_ENCODER_AV1_FEATURE_FLAG_FRAME_REFERENCE_MOTION_VECTORS) != 0) ?
1722 1 :
1723 0;
1724 seq_header->seq_choose_screen_content_tools = 0; // coded in bitstream by default as 0
1725 seq_header->seq_force_screen_content_tools = 0; // coded in bitstream by default as 0
1726 seq_header->seq_choose_integer_mv = 0; // coded in bitstream by default as 0
1727 seq_header->seq_force_integer_mv = 0; // coded in bitstream by default as 0
1728 seq_header->order_hint_bits_minus1 =
1729 associatedMetadata.m_associatedEncodeConfig.m_encoderCodecSpecificConfigDesc.m_AV1Config.OrderHintBitsMinus1;
1730 seq_header->enable_superres =
1731 ((associatedMetadata.m_associatedEncodeConfig.m_encoderCodecSpecificConfigDesc.m_AV1Config.FeatureFlags &
1732 D3D12_VIDEO_ENCODER_AV1_FEATURE_FLAG_SUPER_RESOLUTION) != 0) ?
1733 1 :
1734 0;
1735 seq_header->enable_cdef =
1736 ((associatedMetadata.m_associatedEncodeConfig.m_encoderCodecSpecificConfigDesc.m_AV1Config.FeatureFlags &
1737 D3D12_VIDEO_ENCODER_AV1_FEATURE_FLAG_CDEF_FILTERING) != 0) ?
1738 1 :
1739 0;
1740 seq_header->enable_restoration =
1741 ((associatedMetadata.m_associatedEncodeConfig.m_encoderCodecSpecificConfigDesc.m_AV1Config.FeatureFlags &
1742 D3D12_VIDEO_ENCODER_AV1_FEATURE_FLAG_LOOP_RESTORATION_FILTER) != 0) ?
1743 1 :
1744 0;
1745
1746 seq_header->color_config.bit_depth = associatedMetadata.m_associatedEncodeConfig.m_encodeFormatInfo.Format;
1747 // seq_header->color_config.mono_chrome; // coded in bitstream by default as 0
1748 // seq_header->color_config.color_description_present_flag; // memset default as 0
1749 // seq_header->color_config.color_primaries; // memset default as 0
1750 // seq_header->color_config.transfer_characteristics; // memset default as 0
1751 // seq_header->color_config.matrix_coefficients; // memset default as 0
1752 // seq_header->color_config.color_range; // memset default as 0
1753 seq_header->color_config.chroma_sample_position = 0; // CSP_UNKNOWN
1754 seq_header->color_config.subsampling_x = 1; // DX12 4:2:0 only
1755 seq_header->color_config.subsampling_y = 1; // DX12 4:2:0 only
1756 seq_header->color_config.separate_uv_delta_q = 1;
1757
1758 // seq_header->film_grain_params_present; // coded in bitstream by default as 1
1759 }
1760
1761 void
fill_av1_pic_header(EncodedBitstreamResolvedMetadata & associatedMetadata,av1_pic_header_t * pic_header,const av1_seq_header_t * seqHdr,const D3D12_VIDEO_ENCODER_AV1_POST_ENCODE_VALUES * pParsedPostEncodeValues,const D3D12_VIDEO_ENCODER_AV1_PICTURE_CONTROL_SUBREGIONS_LAYOUT_DATA_TILES * pParsedTilePartitions)1762 fill_av1_pic_header(EncodedBitstreamResolvedMetadata &associatedMetadata,
1763 av1_pic_header_t *pic_header,
1764 const av1_seq_header_t *seqHdr,
1765 const D3D12_VIDEO_ENCODER_AV1_POST_ENCODE_VALUES *pParsedPostEncodeValues,
1766 const D3D12_VIDEO_ENCODER_AV1_PICTURE_CONTROL_SUBREGIONS_LAYOUT_DATA_TILES *pParsedTilePartitions)
1767 {
1768 // Set all zero by default
1769 memset(pic_header, 0, sizeof(av1_pic_header_t));
1770
1771 {
1772 pic_header->quantization_params = pParsedPostEncodeValues->Quantization;
1773
1774 debug_printf("[d3d12_video_enc_av1] Parsing driver post encode "
1775 "values...D3D12_VIDEO_ENCODER_AV1_POST_ENCODE_VALUES_FLAG_QUANTIZATION\n");
1776
1777 debug_printf("Post encode quantization_params.BaseQIndex: %" PRIu64 "\n",
1778 pic_header->quantization_params.BaseQIndex);
1779 debug_printf("Post encode quantization_params.YDCDeltaQ: %" PRId64 "\n",
1780 pic_header->quantization_params.YDCDeltaQ);
1781 debug_printf("Post encode quantization_params.UDCDeltaQ: %" PRId64 "\n",
1782 pic_header->quantization_params.UDCDeltaQ);
1783 debug_printf("Post encode quantization_params.UACDeltaQ: %" PRId64 "\n",
1784 pic_header->quantization_params.UACDeltaQ);
1785 debug_printf("Post encode quantization_params.VDCDeltaQ: %" PRId64 "\n",
1786 pic_header->quantization_params.VDCDeltaQ);
1787 debug_printf("Post encode quantization_params.VACDeltaQ: %" PRId64 "\n",
1788 pic_header->quantization_params.VACDeltaQ);
1789 debug_printf("Post encode quantization_params.UsingQMatrix: %" PRIu64 "\n",
1790 pic_header->quantization_params.UsingQMatrix);
1791 debug_printf("Post encode quantization_params.QMY: %" PRIu64 "\n", pic_header->quantization_params.QMY);
1792 debug_printf("Post encode quantization_params.QMU: %" PRIu64 "\n", pic_header->quantization_params.QMU);
1793 debug_printf("Post encode quantization_params.QMV: %" PRIu64 "\n", pic_header->quantization_params.QMV);
1794 }
1795
1796 pic_header->segmentation_enabled = 0;
1797 if ((associatedMetadata.m_associatedEncodeConfig.m_encoderPicParamsDesc.m_AV1PicData.Flags &
1798 D3D12_VIDEO_ENCODER_AV1_PICTURE_CONTROL_FLAG_ENABLE_FRAME_SEGMENTATION_AUTO) != 0) {
1799
1800 // The segmentation info comes from the driver
1801 pic_header->segmentation_config = pParsedPostEncodeValues->SegmentationConfig;
1802 pic_header->segmentation_enabled = (pic_header->segmentation_config.NumSegments != 0);
1803 }
1804
1805 {
1806 debug_printf("[d3d12_video_enc_av1] Parsing driver post encode "
1807 "values...D3D12_VIDEO_ENCODER_AV1_POST_ENCODE_VALUES_FLAG_QUANTIZATION_DELTA\n");
1808 pic_header->delta_q_params = pParsedPostEncodeValues->QuantizationDelta;
1809
1810 debug_printf("Post encode delta_q_params.DeltaQPresent: %" PRIu64 "\n", pic_header->delta_q_params.DeltaQPresent);
1811 debug_printf("Post encode delta_q_params.DeltaQRes: %" PRIu64 "\n", pic_header->delta_q_params.DeltaQRes);
1812 }
1813
1814 {
1815 debug_printf("[d3d12_video_enc_av1] Parsing driver post encode "
1816 "values...D3D12_VIDEO_ENCODER_AV1_POST_ENCODE_VALUES_FLAG_LOOP_FILTER_DELTA\n");
1817 pic_header->delta_lf_params = pParsedPostEncodeValues->LoopFilterDelta;
1818
1819 debug_printf("Post encode delta_lf_params.DeltaLFMulti: %" PRIu64 "\n", pic_header->delta_lf_params.DeltaLFMulti);
1820 debug_printf("Post encode delta_lf_params.DeltaLFPresent: %" PRIu64 "\n",
1821 pic_header->delta_lf_params.DeltaLFPresent);
1822 debug_printf("Post encode delta_lf_params.DeltaLFRes: %" PRIu64 "\n", pic_header->delta_lf_params.DeltaLFRes);
1823 }
1824
1825 {
1826 debug_printf("[d3d12_video_enc_av1] Parsing driver post encode "
1827 "values...D3D12_VIDEO_ENCODER_AV1_POST_ENCODE_VALUES_FLAG_LOOP_FILTER\n");
1828 pic_header->loop_filter_params = pParsedPostEncodeValues->LoopFilter;
1829
1830 debug_printf("Post encode loop_filter_params.LoopFilterDeltaEnabled: %" PRIu64 "\n",
1831 pic_header->loop_filter_params.LoopFilterDeltaEnabled);
1832 debug_printf("Post encode loop_filter_params.LoopFilterLevel[0]: %" PRIu64 "\n",
1833 pic_header->loop_filter_params.LoopFilterLevel[0]);
1834 debug_printf("Post encode loop_filter_params.LoopFilterLevel[1]: %" PRIu64 "\n",
1835 pic_header->loop_filter_params.LoopFilterLevel[1]);
1836 debug_printf("Post encode loop_filter_params.LoopFilterLevelU: %" PRIu64 "\n",
1837 pic_header->loop_filter_params.LoopFilterLevelU);
1838 debug_printf("Post encode loop_filter_params.LoopFilterLevelV: %" PRIu64 "\n",
1839 pic_header->loop_filter_params.LoopFilterLevelV);
1840 debug_printf("Post encode loop_filter_params.LoopFilterSharpnessLevel: %" PRIu64 "\n",
1841 pic_header->loop_filter_params.LoopFilterSharpnessLevel);
1842 debug_printf("Post encode loop_filter_params.ModeDeltas[0]: %" PRIu64 "\n",
1843 pic_header->loop_filter_params.ModeDeltas[0]);
1844 debug_printf("Post encode loop_filter_params.ModeDeltas[1]: %" PRIu64 "\n",
1845 pic_header->loop_filter_params.ModeDeltas[1]);
1846 for (uint8_t i = 0; i < 8; i++) {
1847 debug_printf("Post encode loop_filter_params.RefDeltas[%d]: %" PRIu64 "\n",
1848 i,
1849 pic_header->loop_filter_params.RefDeltas[i]);
1850 }
1851 debug_printf("Post encode loop_filter_params.UpdateModeDelta: %" PRIu64 "\n",
1852 pic_header->loop_filter_params.UpdateModeDelta);
1853 debug_printf("Post encode loop_filter_params.UpdateRefDelta: %" PRIu64 "\n",
1854 pic_header->loop_filter_params.UpdateRefDelta);
1855 }
1856
1857 {
1858 debug_printf("[d3d12_video_enc_av1] Parsing driver post encode "
1859 "values...D3D12_VIDEO_ENCODER_AV1_POST_ENCODE_VALUES_FLAG_CDEF_DATA\n");
1860 pic_header->cdef_params = pParsedPostEncodeValues->CDEF;
1861
1862 debug_printf("Post encode cdef_params.CdefBits: %" PRIu64 "\n", pic_header->cdef_params.CdefBits);
1863
1864 debug_printf("Post encode cdef_params.CdefDampingMinus3: %" PRIu64 "\n",
1865 pic_header->cdef_params.CdefDampingMinus3);
1866
1867 for (uint8_t i = 0; i < 8; i++) {
1868 debug_printf("Post encode cdef_params.CdefYPriStrength[%d]: %" PRIu64 "\n",
1869 i,
1870 pic_header->cdef_params.CdefYPriStrength[i]);
1871
1872 debug_printf("Post encode cdef_params.CdefUVPriStrength[%d]: %" PRIu64 "\n",
1873 i,
1874 pic_header->cdef_params.CdefUVPriStrength[i]);
1875
1876 debug_printf("Post encode cdef_params.CdefYSecStrength[%d]: %" PRIu64 "\n",
1877 i,
1878 pic_header->cdef_params.CdefYSecStrength[i]);
1879
1880 debug_printf("Post encode cdef_params.CdefUVSecStrength[%d]: %" PRIu64 "\n",
1881 i,
1882 pic_header->cdef_params.CdefUVSecStrength[i]);
1883 }
1884 }
1885
1886 {
1887 debug_printf("[d3d12_video_enc_av1] Parsing driver post encode "
1888 "values...D3D12_VIDEO_ENCODER_AV1_POST_ENCODE_VALUES_FLAG_COMPOUND_PREDICTION_MODE\n");
1889 pic_header->reference_select = (pParsedPostEncodeValues->CompoundPredictionType ==
1890 D3D12_VIDEO_ENCODER_AV1_COMP_PREDICTION_TYPE_SINGLE_REFERENCE) ?
1891 0 :
1892 1;
1893 debug_printf("Post encode reference_select: %" PRIu32 "\n", pic_header->reference_select);
1894 }
1895
1896 // if ((pevFlags & D3D12_VIDEO_ENCODER_AV1_POST_ENCODE_VALUES_FLAG_CONTEXT_UPDATE_TILE_ID) != 0)
1897 // We just copy the whole structure, the driver must copy it even if the pev flag is not set
1898 pic_header->tile_info.tile_partition = *pParsedTilePartitions;
1899
1900 {
1901 debug_printf("[d3d12_video_enc_av1] Parsing driver post encode "
1902 "values...D3D12_VIDEO_ENCODER_AV1_POST_ENCODE_VALUES_FLAG_PRIMARY_REF_FRAME\n");
1903 pic_header->primary_ref_frame = static_cast<uint32_t>(pParsedPostEncodeValues->PrimaryRefFrame);
1904 debug_printf("Post encode primary_ref_frame: %" PRIu32 "\n", pic_header->primary_ref_frame);
1905 }
1906
1907 debug_printf("Post encode tile_info.tile_partition.ContextUpdateTileId: %" PRIu64 "\n",
1908 pic_header->tile_info.tile_partition.ContextUpdateTileId);
1909 debug_printf("Post encode tile_info.tile_partition.ColCount: %" PRIu64 "\n",
1910 pic_header->tile_info.tile_partition.ColCount);
1911 debug_printf("Post encode tile_info.tile_partition.RowCount: %" PRIu64 "\n",
1912 pic_header->tile_info.tile_partition.RowCount);
1913
1914 assert(pic_header->tile_info.tile_partition.ColCount < 64);
1915 for (uint8_t i = 0; i < pic_header->tile_info.tile_partition.ColCount; i++) {
1916 debug_printf("Post encode tile_info.tile_partition.ColWidths[%d]: %" PRIu64 "\n",
1917 i,
1918 pic_header->tile_info.tile_partition.ColWidths[i]);
1919 }
1920
1921 assert(pic_header->tile_info.tile_partition.RowCount < 64);
1922 for (uint8_t i = 0; i < pic_header->tile_info.tile_partition.RowCount; i++) {
1923 debug_printf("Post encode tile_info.tile_partition.RowHeights[%d]: %" PRIu64 "\n",
1924 i,
1925 pic_header->tile_info.tile_partition.RowHeights[i]);
1926 }
1927
1928 pic_header->show_existing_frame = 0;
1929 pic_header->frame_to_show_map_idx = 0;
1930
1931 // pic_header->display_frame_id; // frame_id_numbers_present_flag coded in bitstream by default as 0
1932
1933 pic_header->frame_type = associatedMetadata.m_associatedEncodeConfig.m_encoderPicParamsDesc.m_AV1PicData.FrameType;
1934 {
1935 UINT EncodeOrderInGop =
1936 (associatedMetadata.m_associatedEncodeConfig.m_encoderPicParamsDesc.m_AV1PicData.PictureIndex %
1937 associatedMetadata.m_associatedEncodeConfig.m_encoderGOPConfigDesc.m_AV1SequenceStructure.IntraDistance);
1938
1939 UINT ShowOrderInGop =
1940 (associatedMetadata.m_associatedEncodeConfig.m_encoderPicParamsDesc.m_AV1PicData.OrderHint %
1941 associatedMetadata.m_associatedEncodeConfig.m_encoderGOPConfigDesc.m_AV1SequenceStructure.IntraDistance);
1942
1943 pic_header->show_frame = (ShowOrderInGop <= EncodeOrderInGop);
1944 }
1945
1946 pic_header->showable_frame = // this will always be showable for P/B frames, even when using show_frame for B
1947 // frame playback reordering
1948 associatedMetadata.m_associatedEncodeConfig.m_encoderPicParamsDesc.m_AV1PicData.FrameType !=
1949 D3D12_VIDEO_ENCODER_AV1_FRAME_TYPE_KEY_FRAME;
1950 pic_header->error_resilient_mode =
1951 ((associatedMetadata.m_associatedEncodeConfig.m_encoderPicParamsDesc.m_AV1PicData.Flags &
1952 D3D12_VIDEO_ENCODER_AV1_PICTURE_CONTROL_FLAG_ENABLE_ERROR_RESILIENT_MODE) != 0);
1953 pic_header->disable_cdf_update =
1954 ((associatedMetadata.m_associatedEncodeConfig.m_encoderPicParamsDesc.m_AV1PicData.Flags &
1955 D3D12_VIDEO_ENCODER_AV1_PICTURE_CONTROL_FLAG_DISABLE_CDF_UPDATE) != 0);
1956
1957 pic_header->allow_screen_content_tools =
1958 ((associatedMetadata.m_associatedEncodeConfig.m_encoderPicParamsDesc.m_AV1PicData.Flags &
1959 D3D12_VIDEO_ENCODER_AV1_PICTURE_CONTROL_FLAG_ENABLE_PALETTE_ENCODING) != 0);
1960 pic_header->force_integer_mv =
1961 ((associatedMetadata.m_associatedEncodeConfig.m_encoderPicParamsDesc.m_AV1PicData.Flags &
1962 D3D12_VIDEO_ENCODER_AV1_PICTURE_CONTROL_FLAG_FORCE_INTEGER_MOTION_VECTORS) != 0);
1963
1964 // frame_size_override_flag is not coded + default as 1 for SWITCH_FRAME and explicitly coded otherwise
1965 if (pic_header->frame_type == D3D12_VIDEO_ENCODER_AV1_FRAME_TYPE_SWITCH_FRAME)
1966 pic_header->frame_size_override_flag = 1; // As per AV1 codec spec
1967 else
1968 pic_header->frame_size_override_flag = 0; // Set as default as 0 when explicitly coded
1969
1970 pic_header->order_hint = associatedMetadata.m_associatedEncodeConfig.m_encoderPicParamsDesc.m_AV1PicData.OrderHint;
1971
1972 pic_header->refresh_frame_flags =
1973 associatedMetadata.m_associatedEncodeConfig.m_encoderPicParamsDesc.m_AV1PicData.RefreshFrameFlags;
1974
1975 // frame_size (comes from input texture size)
1976 pic_header->FrameWidth = associatedMetadata.m_associatedEncodeConfig.m_currentResolution.Width;
1977 pic_header->UpscaledWidth = associatedMetadata.m_associatedEncodeConfig.m_currentResolution.Width;
1978 pic_header->FrameHeight = associatedMetadata.m_associatedEncodeConfig.m_currentResolution.Height;
1979
1980 // render_size (comes from AV1 pipe picparams pic)
1981 pic_header->RenderWidth = associatedMetadata.m_associatedEncodeConfig.m_FrameCroppingCodecConfig.right;
1982 pic_header->RenderHeight = associatedMetadata.m_associatedEncodeConfig.m_FrameCroppingCodecConfig.bottom;
1983
1984 bool use_128x128_superblock =
1985 ((associatedMetadata.m_associatedEncodeConfig.m_encoderCodecSpecificConfigDesc.m_AV1Config.FeatureFlags &
1986 D3D12_VIDEO_ENCODER_AV1_FEATURE_FLAG_128x128_SUPERBLOCK) != 0) ?
1987 1 :
1988 0;
1989 unsigned MiCols = 2 * ((pic_header->FrameWidth + 7) >> 3);
1990 unsigned MiRows = 2 * ((pic_header->FrameHeight + 7) >> 3);
1991 pic_header->frame_width_sb = use_128x128_superblock ? ((MiCols + 31) >> 5) : ((MiCols + 15) >> 4);
1992 pic_header->frame_height_sb = use_128x128_superblock ? ((MiRows + 31) >> 5) : ((MiRows + 15) >> 4);
1993
1994 pic_header->use_superres = ((associatedMetadata.m_associatedEncodeConfig.m_encoderPicParamsDesc.m_AV1PicData.Flags &
1995 D3D12_VIDEO_ENCODER_AV1_PICTURE_CONTROL_FLAG_USE_SUPER_RESOLUTION) != 0);
1996 pic_header->SuperresDenom =
1997 associatedMetadata.m_associatedEncodeConfig.m_encoderPicParamsDesc.m_AV1PicData.SuperResDenominator;
1998
1999 pic_header->allow_intrabc = ((associatedMetadata.m_associatedEncodeConfig.m_encoderPicParamsDesc.m_AV1PicData.Flags &
2000 D3D12_VIDEO_ENCODER_AV1_PICTURE_CONTROL_FLAG_ALLOW_INTRA_BLOCK_COPY) != 0);
2001
2002 for (unsigned i = 0; i < ARRAY_SIZE(associatedMetadata.m_associatedEncodeConfig.m_encoderPicParamsDesc.m_AV1PicData
2003 .ReferenceFramesReconPictureDescriptors);
2004 i++) {
2005 pic_header->ref_order_hint[i] = associatedMetadata.m_associatedEncodeConfig.m_encoderPicParamsDesc.m_AV1PicData
2006 .ReferenceFramesReconPictureDescriptors[i]
2007 .OrderHint;
2008 }
2009
2010 for (uint8_t i = 0; i < ARRAY_SIZE(pParsedPostEncodeValues->ReferenceIndices); i++)
2011 pic_header->ref_frame_idx[i] = pParsedPostEncodeValues->ReferenceIndices[i];
2012
2013 pic_header->allow_high_precision_mv =
2014 ((associatedMetadata.m_associatedEncodeConfig.m_encoderPicParamsDesc.m_AV1PicData.Flags &
2015 D3D12_VIDEO_ENCODER_AV1_PICTURE_CONTROL_FLAG_ALLOW_HIGH_PRECISION_MV) != 0);
2016 pic_header->interpolation_filter =
2017 associatedMetadata.m_associatedEncodeConfig.m_encoderPicParamsDesc.m_AV1PicData.InterpolationFilter;
2018 pic_header->is_motion_mode_switchable =
2019 ((associatedMetadata.m_associatedEncodeConfig.m_encoderPicParamsDesc.m_AV1PicData.Flags &
2020 D3D12_VIDEO_ENCODER_AV1_PICTURE_CONTROL_FLAG_MOTION_MODE_SWITCHABLE) != 0);
2021 pic_header->use_ref_frame_mvs =
2022 ((associatedMetadata.m_associatedEncodeConfig.m_encoderPicParamsDesc.m_AV1PicData.Flags &
2023 D3D12_VIDEO_ENCODER_AV1_PICTURE_CONTROL_FLAG_FRAME_REFERENCE_MOTION_VECTORS) != 0);
2024 pic_header->disable_frame_end_update_cdf =
2025 ((associatedMetadata.m_associatedEncodeConfig.m_encoderPicParamsDesc.m_AV1PicData.Flags &
2026 D3D12_VIDEO_ENCODER_AV1_PICTURE_CONTROL_FLAG_DISABLE_FRAME_END_UPDATE_CDF) != 0);
2027
2028 pic_header->tile_info.tile_mode = associatedMetadata.m_associatedEncodeConfig.m_encoderSliceConfigMode;
2029 pic_header->tile_info.tile_support_caps =
2030 associatedMetadata.m_associatedEncodeCapabilities.m_encoderCodecSpecificConfigCaps.m_AV1TileCaps;
2031
2032 pic_header->tile_info.uniform_tile_spacing_flag = 0;
2033 if ((pic_header->tile_info.tile_mode == D3D12_VIDEO_ENCODER_FRAME_SUBREGION_LAYOUT_MODE_UNIFORM_GRID_PARTITION) ||
2034 (pic_header->tile_info.tile_mode == D3D12_VIDEO_ENCODER_FRAME_SUBREGION_LAYOUT_MODE_FULL_FRAME))
2035 pic_header->tile_info.uniform_tile_spacing_flag = 1;
2036 else if (pic_header->tile_info.tile_mode ==
2037 D3D12_VIDEO_ENCODER_FRAME_SUBREGION_LAYOUT_MODE_CONFIGURABLE_GRID_PARTITION)
2038 pic_header->tile_info.uniform_tile_spacing_flag = 0;
2039 else
2040 assert(false); // Unknown pic_header->tile_info.tile_mode for AV1
2041
2042 // lr_params
2043 for (uint32_t i = 0; i < 3; i++)
2044 pic_header->lr_params.lr_type[i] = associatedMetadata.m_associatedEncodeConfig.m_encoderPicParamsDesc.m_AV1PicData
2045 .FrameRestorationConfig.FrameRestorationType[i];
2046 bool lr_enabled =
2047 pic_header->lr_params.lr_type[0] || pic_header->lr_params.lr_type[1] || pic_header->lr_params.lr_type[2];
2048 if (lr_enabled) {
2049 uint8_t luma_shift_total = log2(d3d12_video_encoder_looprestorationsize_d3d12_to_uint_av1(
2050 associatedMetadata.m_associatedEncodeConfig.m_encoderPicParamsDesc.m_AV1PicData
2051 .FrameRestorationConfig.LoopRestorationPixelSize[0])) -
2052 6;
2053 pic_header->lr_params.lr_unit_shift = (luma_shift_total > 0) ? 1 : 0;
2054 pic_header->lr_params.lr_unit_extra_shift = (luma_shift_total > 1) ? 1 : 0;
2055 assert(associatedMetadata.m_associatedEncodeConfig.m_encoderPicParamsDesc.m_AV1PicData.FrameRestorationConfig
2056 .LoopRestorationPixelSize[1] == associatedMetadata.m_associatedEncodeConfig.m_encoderPicParamsDesc
2057 .m_AV1PicData.FrameRestorationConfig.LoopRestorationPixelSize[2]);
2058
2059 if (associatedMetadata.m_associatedEncodeConfig.m_encoderPicParamsDesc.m_AV1PicData.FrameRestorationConfig
2060 .LoopRestorationPixelSize[1]) {
2061 pic_header->lr_params.lr_uv_shift = log2(d3d12_video_encoder_looprestorationsize_d3d12_to_uint_av1(
2062 associatedMetadata.m_associatedEncodeConfig.m_encoderPicParamsDesc
2063 .m_AV1PicData.FrameRestorationConfig.LoopRestorationPixelSize[1])) +
2064 6 + luma_shift_total;
2065 } else {
2066 pic_header->lr_params.lr_uv_shift = 0;
2067 }
2068 }
2069
2070 pic_header->TxMode = associatedMetadata.m_associatedEncodeConfig.m_encoderPicParamsDesc.m_AV1PicData.TxMode;
2071 pic_header->skip_mode_present =
2072 ((associatedMetadata.m_associatedEncodeConfig.m_encoderPicParamsDesc.m_AV1PicData.Flags &
2073 D3D12_VIDEO_ENCODER_AV1_PICTURE_CONTROL_FLAG_ENABLE_SKIP_MODE) != 0);
2074 pic_header->allow_warped_motion =
2075 ((associatedMetadata.m_associatedEncodeConfig.m_encoderPicParamsDesc.m_AV1PicData.Flags &
2076 D3D12_VIDEO_ENCODER_AV1_PICTURE_CONTROL_FLAG_ENABLE_WARPED_MOTION) != 0);
2077 pic_header->reduced_tx_set =
2078 ((associatedMetadata.m_associatedEncodeConfig.m_encoderPicParamsDesc.m_AV1PicData.Flags &
2079 D3D12_VIDEO_ENCODER_AV1_PICTURE_CONTROL_FLAG_REDUCED_TX_SET) != 0);
2080 // pic_header->frame_refs_short_signaling; // coded in bitstream by default as 0
2081 }
2082
2083 D3D12_VIDEO_ENCODER_AV1_RESTORATION_TILESIZE
d3d12_video_encoder_looprestorationsize_uint_to_d3d12_av1(uint32_t pixel_size)2084 d3d12_video_encoder_looprestorationsize_uint_to_d3d12_av1(uint32_t pixel_size)
2085 {
2086 switch (pixel_size) {
2087 case 32:
2088 {
2089 return D3D12_VIDEO_ENCODER_AV1_RESTORATION_TILESIZE_32x32;
2090 } break;
2091 case 64:
2092 {
2093 return D3D12_VIDEO_ENCODER_AV1_RESTORATION_TILESIZE_64x64;
2094 } break;
2095 case 128:
2096 {
2097 return D3D12_VIDEO_ENCODER_AV1_RESTORATION_TILESIZE_128x128;
2098 } break;
2099 case 256:
2100 {
2101 return D3D12_VIDEO_ENCODER_AV1_RESTORATION_TILESIZE_256x256;
2102 } break;
2103 default:
2104 {
2105 unreachable("Unsupported D3D12_VIDEO_ENCODER_AV1_PROFILE");
2106 } break;
2107 }
2108 }
2109
2110 unsigned
d3d12_video_encoder_looprestorationsize_d3d12_to_uint_av1(D3D12_VIDEO_ENCODER_AV1_RESTORATION_TILESIZE d3d12_type)2111 d3d12_video_encoder_looprestorationsize_d3d12_to_uint_av1(D3D12_VIDEO_ENCODER_AV1_RESTORATION_TILESIZE d3d12_type)
2112 {
2113 switch (d3d12_type) {
2114 case D3D12_VIDEO_ENCODER_AV1_RESTORATION_TILESIZE_32x32:
2115 {
2116 return 32;
2117 } break;
2118 case D3D12_VIDEO_ENCODER_AV1_RESTORATION_TILESIZE_64x64:
2119 {
2120 return 64;
2121 } break;
2122 case D3D12_VIDEO_ENCODER_AV1_RESTORATION_TILESIZE_128x128:
2123 {
2124 return 128;
2125 } break;
2126 case D3D12_VIDEO_ENCODER_AV1_RESTORATION_TILESIZE_256x256:
2127 {
2128 return 256;
2129 } break;
2130 default:
2131 {
2132 unreachable("Unsupported D3D12_VIDEO_ENCODER_AV1_PROFILE");
2133 } break;
2134 }
2135 }
2136
2137 /*
2138 * Called at get_feedback time FOR A PREVIOUSLY RECORDED AND EXECUTED FRAME
2139 */
2140 unsigned
d3d12_video_encoder_build_post_encode_codec_bitstream_av1(struct d3d12_video_encoder * pD3D12Enc,uint64_t associated_fence_value,EncodedBitstreamResolvedMetadata & associatedMetadata)2141 d3d12_video_encoder_build_post_encode_codec_bitstream_av1(struct d3d12_video_encoder *pD3D12Enc,
2142 uint64_t associated_fence_value,
2143 EncodedBitstreamResolvedMetadata &associatedMetadata)
2144 {
2145 // Parse the AV1 resolved metadata
2146
2147 ID3D12Resource *pResolvedMetadataBuffer = associatedMetadata.spBuffer.Get();
2148 uint64_t resourceMetadataSize = associatedMetadata.bufferSize;
2149
2150 struct d3d12_screen *pD3D12Screen = (struct d3d12_screen *) pD3D12Enc->m_pD3D12Screen;
2151 pipe_resource *pPipeResolvedMetadataBuffer =
2152 d3d12_resource_from_resource(&pD3D12Screen->base, pResolvedMetadataBuffer);
2153 assert(resourceMetadataSize < INT_MAX);
2154 struct pipe_box box;
2155 u_box_3d(0, // x
2156 0, // y
2157 0, // z
2158 static_cast<int>(resourceMetadataSize), // width
2159 1, // height
2160 1, // depth
2161 &box);
2162 struct pipe_transfer *mapTransferMetadata;
2163 uint8_t *pMetadataBufferSrc =
2164 reinterpret_cast<uint8_t *>(pD3D12Enc->base.context->buffer_map(pD3D12Enc->base.context,
2165 pPipeResolvedMetadataBuffer,
2166 0,
2167 PIPE_MAP_READ,
2168 &box,
2169 &mapTransferMetadata));
2170
2171 debug_printf("[d3d12_video_enc_av1] Parsing driver resolved encode metadata...\n");
2172
2173 D3D12_VIDEO_ENCODER_OUTPUT_METADATA *pParsedMetadata =
2174 reinterpret_cast<D3D12_VIDEO_ENCODER_OUTPUT_METADATA *>(pMetadataBufferSrc);
2175 pMetadataBufferSrc += sizeof(D3D12_VIDEO_ENCODER_OUTPUT_METADATA);
2176
2177 D3D12_VIDEO_ENCODER_FRAME_SUBREGION_METADATA *pFrameSubregionMetadata =
2178 reinterpret_cast<D3D12_VIDEO_ENCODER_FRAME_SUBREGION_METADATA *>(pMetadataBufferSrc);
2179 pMetadataBufferSrc +=
2180 (sizeof(D3D12_VIDEO_ENCODER_FRAME_SUBREGION_METADATA) * pParsedMetadata->WrittenSubregionsCount);
2181
2182 D3D12_VIDEO_ENCODER_AV1_PICTURE_CONTROL_SUBREGIONS_LAYOUT_DATA_TILES *pParsedTilePartitions =
2183 reinterpret_cast<D3D12_VIDEO_ENCODER_AV1_PICTURE_CONTROL_SUBREGIONS_LAYOUT_DATA_TILES *>(pMetadataBufferSrc);
2184 pMetadataBufferSrc += sizeof(D3D12_VIDEO_ENCODER_AV1_PICTURE_CONTROL_SUBREGIONS_LAYOUT_DATA_TILES);
2185
2186 D3D12_VIDEO_ENCODER_AV1_POST_ENCODE_VALUES *pParsedPostEncodeValues =
2187 reinterpret_cast<D3D12_VIDEO_ENCODER_AV1_POST_ENCODE_VALUES *>(pMetadataBufferSrc);
2188 pMetadataBufferSrc += sizeof(D3D12_VIDEO_ENCODER_AV1_POST_ENCODE_VALUES);
2189
2190 debug_printf("[d3d12_video_enc_av1] D3D12_VIDEO_ENCODER_OUTPUT_METADATA.EncodeErrorFlags: %" PRIx64 " \n",
2191 pParsedMetadata->EncodeErrorFlags);
2192 debug_printf("[d3d12_video_enc_av1] D3D12_VIDEO_ENCODER_OUTPUT_METADATA.EncodeStats.AverageQP: %" PRIu64 " \n",
2193 pParsedMetadata->EncodeStats.AverageQP);
2194 debug_printf("[d3d12_video_enc_av1] D3D12_VIDEO_ENCODER_OUTPUT_METADATA.EncodeStats.IntraCodingUnitsCount: %" PRIu64
2195 " \n",
2196 pParsedMetadata->EncodeStats.IntraCodingUnitsCount);
2197 debug_printf("[d3d12_video_enc_av1] D3D12_VIDEO_ENCODER_OUTPUT_METADATA.EncodeStats.InterCodingUnitsCount: %" PRIu64
2198 " \n",
2199 pParsedMetadata->EncodeStats.InterCodingUnitsCount);
2200 debug_printf("[d3d12_video_enc_av1] D3D12_VIDEO_ENCODER_OUTPUT_METADATA.EncodeStats.SkipCodingUnitsCount: %" PRIu64
2201 " \n",
2202 pParsedMetadata->EncodeStats.SkipCodingUnitsCount);
2203 debug_printf("[d3d12_video_enc_av1] "
2204 "D3D12_VIDEO_ENCODER_OUTPUT_METADATA.EncodeStats.AverageMotionEstimationXDirection: %" PRIu64 " \n",
2205 pParsedMetadata->EncodeStats.AverageMotionEstimationXDirection);
2206 debug_printf("[d3d12_video_enc_av1] "
2207 "D3D12_VIDEO_ENCODER_OUTPUT_METADATA.EncodeStats.AverageMotionEstimationYDirection: %" PRIu64 " \n",
2208 pParsedMetadata->EncodeStats.AverageMotionEstimationYDirection);
2209 debug_printf("[d3d12_video_enc_av1] D3D12_VIDEO_ENCODER_OUTPUT_METADATA.EncodedBitstreamWrittenBytesCount: %" PRIu64
2210 " \n",
2211 pParsedMetadata->EncodedBitstreamWrittenBytesCount);
2212 debug_printf("[d3d12_video_enc_av1] D3D12_VIDEO_ENCODER_OUTPUT_METADATA.WrittenSubregionsCount: %" PRIu64 " \n",
2213 pParsedMetadata->WrittenSubregionsCount);
2214
2215 for (uint8_t i = 0; i < pParsedMetadata->WrittenSubregionsCount; i++) {
2216 debug_printf("[d3d12_video_enc_av1] D3D12_VIDEO_ENCODER_FRAME_SUBREGION_METADATA[%d].bHeaderSize: %" PRIu64 " \n",
2217 i,
2218 pFrameSubregionMetadata[i].bHeaderSize);
2219 debug_printf("[d3d12_video_enc_av1] D3D12_VIDEO_ENCODER_FRAME_SUBREGION_METADATA[%d].bStartOffset: %" PRIu64
2220 " \n",
2221 i,
2222 pFrameSubregionMetadata[i].bStartOffset);
2223 debug_printf("[d3d12_video_enc_av1] D3D12_VIDEO_ENCODER_FRAME_SUBREGION_METADATA[%d].bSize: %" PRIu64 " \n",
2224 i,
2225 pFrameSubregionMetadata[i].bSize);
2226 }
2227
2228 if (pParsedMetadata->EncodeErrorFlags != D3D12_VIDEO_ENCODER_ENCODE_ERROR_FLAG_NO_ERROR) {
2229 debug_printf("[d3d12_video_enc_av1] Encode GPU command for fence %" PRIu64 " failed - EncodeErrorFlags: %" PRIu64
2230 "\n",
2231 associated_fence_value,
2232 pParsedMetadata->EncodeErrorFlags);
2233 assert(false);
2234 return 0;
2235 }
2236
2237 if (pParsedMetadata->EncodedBitstreamWrittenBytesCount == 0u) {
2238 debug_printf("[d3d12_video_enc_av1] Encode GPU command for fence %" PRIu64
2239 " failed - EncodedBitstreamWrittenBytesCount: 0\n",
2240 associated_fence_value);
2241 assert(false);
2242 return 0;
2243 }
2244
2245 // Create headers
2246
2247 av1_seq_header_t seqHdr = {};
2248 fill_av1_seq_header(associatedMetadata, &seqHdr);
2249 av1_pic_header_t picHdr = {};
2250 fill_av1_pic_header(associatedMetadata, &picHdr, &seqHdr, pParsedPostEncodeValues, pParsedTilePartitions);
2251
2252 bool bNeedSeqUpdate = false;
2253 bool diff_uv_delta_from_pev = (picHdr.quantization_params.VDCDeltaQ != picHdr.quantization_params.UDCDeltaQ) ||
2254 (picHdr.quantization_params.VACDeltaQ != picHdr.quantization_params.UACDeltaQ);
2255 debug_printf("[Calculated] Post encode diff_uv_delta_from_pev: %d\n", diff_uv_delta_from_pev);
2256
2257 // Make sure the Seq header allows diff_uv_delta from pev
2258 if (diff_uv_delta_from_pev && !seqHdr.color_config.separate_uv_delta_q) {
2259 seqHdr.color_config.separate_uv_delta_q = 1;
2260 bNeedSeqUpdate = true;
2261 }
2262
2263 d3d12_video_bitstream_builder_av1 *pAV1BitstreamBuilder =
2264 static_cast<d3d12_video_bitstream_builder_av1 *>(pD3D12Enc->m_upBitstreamBuilder.get());
2265 assert(pAV1BitstreamBuilder);
2266
2267 associatedMetadata.pWrittenCodecUnitsSizes.clear();
2268
2269 size_t writtenTemporalDelimBytes = 0;
2270 if (picHdr.show_frame && associatedMetadata.m_CodecSpecificData.AV1HeadersInfo.temporal_delim_rendered) {
2271 pAV1BitstreamBuilder->write_temporal_delimiter_obu(
2272 pD3D12Enc->m_BitstreamHeadersBuffer,
2273 pD3D12Enc->m_BitstreamHeadersBuffer.begin(), // placingPositionStart
2274 writtenTemporalDelimBytes // Bytes Written AFTER placingPositionStart arg above
2275 );
2276 assert(pD3D12Enc->m_BitstreamHeadersBuffer.size() == writtenTemporalDelimBytes);
2277 debug_printf("Written OBU_TEMPORAL_DELIMITER bytes: %" PRIu64 "\n", static_cast<uint64_t>(writtenTemporalDelimBytes));
2278 associatedMetadata.pWrittenCodecUnitsSizes.push_back(writtenTemporalDelimBytes);
2279 }
2280
2281 size_t writtenSequenceBytes = 0;
2282 bool isFirstFrame = (associated_fence_value == 1);
2283
2284 // on first frame or on resolution change or if we changed seq hdr values with post encode values
2285 bool writeNewSeqHeader = isFirstFrame || bNeedSeqUpdate ||
2286 ((associatedMetadata.m_associatedEncodeConfig.m_seqFlags &
2287 D3D12_VIDEO_ENCODER_SEQUENCE_CONTROL_FLAG_RESOLUTION_CHANGE) != 0);
2288
2289 if (writeNewSeqHeader) {
2290 pAV1BitstreamBuilder->write_sequence_header(
2291 &seqHdr,
2292 pD3D12Enc->m_BitstreamHeadersBuffer,
2293 pD3D12Enc->m_BitstreamHeadersBuffer.begin() + writtenTemporalDelimBytes, // placingPositionStart
2294 writtenSequenceBytes // Bytes Written AFTER placingPositionStart arg above
2295 );
2296 associatedMetadata.pWrittenCodecUnitsSizes.push_back(writtenSequenceBytes);
2297 assert(pD3D12Enc->m_BitstreamHeadersBuffer.size() == (writtenSequenceBytes + writtenTemporalDelimBytes));
2298 debug_printf("Written OBU_SEQUENCE_HEADER bytes: %" PRIu64 "\n", static_cast<uint64_t>(writtenSequenceBytes));
2299 }
2300
2301 // Only supported bitstream format is with obu_size for now.
2302 assert(associatedMetadata.m_CodecSpecificData.AV1HeadersInfo.obu_has_size_field);
2303
2304 size_t writtenFrameBytes = 0;
2305 size_t writtenTileBytes = 0;
2306
2307 pipe_resource *src_driver_bitstream =
2308 d3d12_resource_from_resource(&pD3D12Enc->m_pD3D12Screen->base, associatedMetadata.spStagingBitstream.Get());
2309 assert(src_driver_bitstream);
2310
2311 size_t comp_bitstream_offset = 0;
2312 if (associatedMetadata.m_CodecSpecificData.AV1HeadersInfo.enable_frame_obu) {
2313 // FRAME_OBU combined frame and tile data case
2314
2315 assert(associatedMetadata.m_associatedEncodeConfig.m_encoderSliceConfigDesc.m_TilesConfig_AV1.TilesGroupsCount ==
2316 1);
2317
2318 // write_frame_header writes OBU_FRAME except tile_obu_group, but included obu_size for tile_group_obu as
2319 // calculated below
2320 size_t tile_group_obu_size = 0;
2321 size_t decode_tile_elements_size = 0;
2322 pAV1BitstreamBuilder->calculate_tile_group_obu_size(
2323 pParsedMetadata,
2324 pFrameSubregionMetadata,
2325 associatedMetadata.m_associatedEncodeCapabilities.m_encoderCodecSpecificConfigCaps.m_AV1TileCaps
2326 .TileSizeBytesMinus1 +
2327 1,
2328 associatedMetadata.m_associatedEncodeConfig.m_encoderSliceConfigDesc.m_TilesConfig_AV1.TilesPartition,
2329 associatedMetadata.m_associatedEncodeConfig.m_encoderSliceConfigDesc.m_TilesConfig_AV1.TilesGroups[0],
2330 tile_group_obu_size,
2331 decode_tile_elements_size);
2332
2333 pAV1BitstreamBuilder->write_frame_header(
2334 &seqHdr,
2335 &picHdr,
2336 OBU_FRAME,
2337 tile_group_obu_size, // We need it to code obu_size of OBU_FRAME open_bitstream_unit()
2338 pD3D12Enc->m_BitstreamHeadersBuffer,
2339 pD3D12Enc->m_BitstreamHeadersBuffer.begin() + writtenSequenceBytes +
2340 writtenTemporalDelimBytes, // placingPositionStart
2341 writtenFrameBytes // Bytes Written AFTER placingPositionStart arg above
2342 );
2343
2344 debug_printf("Written OBU_FRAME bytes: %" PRIu64 "\n", static_cast<uint64_t>(writtenFrameBytes));
2345 associatedMetadata.pWrittenCodecUnitsSizes.push_back(writtenFrameBytes);
2346
2347 assert(pD3D12Enc->m_BitstreamHeadersBuffer.size() ==
2348 (writtenSequenceBytes + writtenTemporalDelimBytes + writtenFrameBytes));
2349
2350 debug_printf("Uploading %" PRIu64
2351 " bytes from OBU sequence and/or picture headers to comp_bit_destination %p at offset 0\n",
2352 static_cast<uint64_t>(pD3D12Enc->m_BitstreamHeadersBuffer.size()),
2353 associatedMetadata.comp_bit_destination);
2354
2355 // Upload headers to the finalized compressed bitstream buffer
2356 // Note: The buffer_subdata is queued in pD3D12Enc->base.context but doesn't execute immediately
2357 pD3D12Enc->base.context->buffer_subdata(pD3D12Enc->base.context, // context
2358 associatedMetadata.comp_bit_destination, // comp. bitstream
2359 PIPE_MAP_WRITE, // usage PIPE_MAP_x
2360 0, // offset
2361 pD3D12Enc->m_BitstreamHeadersBuffer.size(),
2362 pD3D12Enc->m_BitstreamHeadersBuffer.data());
2363
2364 comp_bitstream_offset = pD3D12Enc->m_BitstreamHeadersBuffer.size();
2365 size_t written_bytes_to_staging_bitstream_buffer = 0;
2366
2367 upload_tile_group_obu(
2368 pD3D12Enc,
2369 tile_group_obu_size,
2370 decode_tile_elements_size,
2371 associatedMetadata.m_StagingBitstreamConstruction,
2372 0, // staging_bitstream_buffer_offset,
2373 src_driver_bitstream,
2374 associatedMetadata.comp_bit_destination,
2375 comp_bitstream_offset,
2376 pFrameSubregionMetadata,
2377 associatedMetadata.m_associatedEncodeCapabilities.m_encoderCodecSpecificConfigCaps.m_AV1TileCaps
2378 .TileSizeBytesMinus1 +
2379 1,
2380 associatedMetadata.m_associatedEncodeConfig.m_encoderSliceConfigDesc.m_TilesConfig_AV1.TilesPartition,
2381 associatedMetadata.m_associatedEncodeConfig.m_encoderSliceConfigDesc.m_TilesConfig_AV1.TilesGroups[0],
2382 written_bytes_to_staging_bitstream_buffer,
2383 associatedMetadata.pWrittenCodecUnitsSizes);
2384
2385 writtenTileBytes += tile_group_obu_size;
2386 comp_bitstream_offset += writtenTileBytes;
2387
2388 // Flush batch with upload work and wait on this CPU thread for GPU work completion
2389 {
2390 struct pipe_fence_handle *pUploadGPUCompletionFence = NULL;
2391 pD3D12Enc->base.context->flush(pD3D12Enc->base.context,
2392 &pUploadGPUCompletionFence,
2393 PIPE_FLUSH_ASYNC | PIPE_FLUSH_HINT_FINISH);
2394 assert(pUploadGPUCompletionFence);
2395 debug_printf(
2396 "[d3d12_video_encoder] d3d12_video_encoder_build_post_encode_codec_bitstream_av1 - Waiting on GPU "
2397 "completion fence for "
2398 " uploading finalized codec headers to compressed bitstream.\n");
2399
2400 pD3D12Enc->m_pD3D12Screen->base.fence_finish(&pD3D12Enc->m_pD3D12Screen->base,
2401 NULL,
2402 pUploadGPUCompletionFence,
2403 OS_TIMEOUT_INFINITE);
2404 pD3D12Enc->m_pD3D12Screen->base.fence_reference(&pD3D12Enc->m_pD3D12Screen->base,
2405 &pUploadGPUCompletionFence,
2406 NULL);
2407 }
2408 } else {
2409 // FRAME_HEADER_OBU + OBU_TILE_GROUP concatenated case
2410
2411 // Build open_bitstream_unit for OBU_FRAME_HEADER
2412 pAV1BitstreamBuilder->write_frame_header(&seqHdr,
2413 &picHdr,
2414 OBU_FRAME_HEADER,
2415 0, // no tile_obu_group in OBU_FRAME_HEADER
2416 pD3D12Enc->m_BitstreamHeadersBuffer,
2417 pD3D12Enc->m_BitstreamHeadersBuffer.begin() + writtenSequenceBytes +
2418 writtenTemporalDelimBytes, // placingPositionStart
2419 writtenFrameBytes // Bytes Written AFTER placingPositionStart arg above
2420 );
2421 associatedMetadata.pWrittenCodecUnitsSizes.push_back(writtenFrameBytes);
2422
2423 debug_printf("Written OBU_FRAME_HEADER bytes: %" PRIu64 "\n", static_cast<uint64_t>(writtenFrameBytes));
2424
2425 assert(pD3D12Enc->m_BitstreamHeadersBuffer.size() ==
2426 (writtenSequenceBytes + writtenTemporalDelimBytes + writtenFrameBytes));
2427
2428 debug_printf("Uploading %" PRIu64 " bytes from OBU headers to comp_bit_destination %p at offset 0\n",
2429 static_cast<uint64_t>(pD3D12Enc->m_BitstreamHeadersBuffer.size()),
2430 associatedMetadata.comp_bit_destination);
2431
2432 // Upload headers to the finalized compressed bitstream buffer
2433 // Note: The buffer_subdata is queued in pD3D12Enc->base.context but doesn't execute immediately
2434 pD3D12Enc->base.context->buffer_subdata(pD3D12Enc->base.context, // context
2435 associatedMetadata.comp_bit_destination, // comp. bitstream
2436 PIPE_MAP_WRITE, // usage PIPE_MAP_x
2437 0, // offset
2438 pD3D12Enc->m_BitstreamHeadersBuffer.size(),
2439 pD3D12Enc->m_BitstreamHeadersBuffer.data());
2440
2441 comp_bitstream_offset = pD3D12Enc->m_BitstreamHeadersBuffer.size();
2442 size_t staging_bitstream_buffer_offset = 0;
2443
2444 for (int tg_idx = 0;
2445 tg_idx <
2446 associatedMetadata.m_associatedEncodeConfig.m_encoderSliceConfigDesc.m_TilesConfig_AV1.TilesGroupsCount;
2447 tg_idx++) {
2448 auto ¤tTg =
2449 associatedMetadata.m_associatedEncodeConfig.m_encoderSliceConfigDesc.m_TilesConfig_AV1.TilesGroups[tg_idx];
2450
2451 debug_printf("Uploading tile group %d to comp_bit_destination %p at offset %" PRIu64 "\n",
2452 tg_idx,
2453 associatedMetadata.comp_bit_destination,
2454 static_cast<uint64_t>(comp_bitstream_offset));
2455
2456 size_t tile_group_obu_size = 0;
2457 size_t decode_tile_elements_size = 0;
2458 pAV1BitstreamBuilder->calculate_tile_group_obu_size(
2459 pParsedMetadata,
2460 pFrameSubregionMetadata,
2461 associatedMetadata.m_associatedEncodeCapabilities.m_encoderCodecSpecificConfigCaps.m_AV1TileCaps
2462 .TileSizeBytesMinus1 +
2463 1,
2464 associatedMetadata.m_associatedEncodeConfig.m_encoderSliceConfigDesc.m_TilesConfig_AV1.TilesPartition,
2465 currentTg,
2466 tile_group_obu_size,
2467 decode_tile_elements_size);
2468
2469 size_t writtenTileObuPrefixBytes = 0;
2470 pAV1BitstreamBuilder->write_obu_tile_group_header(
2471 tile_group_obu_size, // tile_group_obu() size to pack OBU_TILE_GROUP obu_size element
2472 associatedMetadata.m_StagingBitstreamConstruction, // Source CPU buffer cannot be overwritten until
2473 // GPU upload flush finishes.
2474 associatedMetadata.m_StagingBitstreamConstruction.begin() +
2475 staging_bitstream_buffer_offset, // placingPositionStart
2476 writtenTileObuPrefixBytes); // Bytes Written AFTER placingPositionStart arg above
2477
2478 debug_printf("Written %" PRIu64 " bytes for OBU_TILE_GROUP open_bitstream_unit() prefix with obu_header() and "
2479 "obu_size to staging_bitstream_buffer %p at offset %" PRIu64 "\n",
2480 static_cast<uint64_t>(writtenTileObuPrefixBytes),
2481 associatedMetadata.m_StagingBitstreamConstruction.data(),
2482 static_cast<uint64_t>(staging_bitstream_buffer_offset));
2483
2484 writtenTileBytes += writtenTileObuPrefixBytes;
2485 associatedMetadata.pWrittenCodecUnitsSizes.push_back(writtenTileObuPrefixBytes);
2486
2487 // Note: The buffer_subdata is queued in pD3D12Enc->base.context but doesn't execute immediately
2488 pD3D12Enc->base.context->buffer_subdata(
2489 pD3D12Enc->base.context, // context
2490 associatedMetadata.comp_bit_destination, // comp. bitstream
2491 PIPE_MAP_WRITE, // usage PIPE_MAP_x
2492 comp_bitstream_offset, // offset
2493 writtenTileObuPrefixBytes,
2494 associatedMetadata.m_StagingBitstreamConstruction.data() + staging_bitstream_buffer_offset);
2495
2496 debug_printf("Uploading %" PRIu64 " bytes for OBU_TILE_GROUP open_bitstream_unit() prefix with obu_header() "
2497 "and obu_size: %" PRIu64 " to comp_bit_destination %p at offset %" PRIu64 "\n",
2498 static_cast<uint64_t>(writtenTileObuPrefixBytes),
2499 static_cast<uint64_t>(tile_group_obu_size),
2500 associatedMetadata.comp_bit_destination,
2501 static_cast<uint64_t>(comp_bitstream_offset));
2502
2503 staging_bitstream_buffer_offset += writtenTileObuPrefixBytes;
2504
2505 comp_bitstream_offset += writtenTileObuPrefixBytes;
2506
2507 size_t written_bytes_to_staging_bitstream_buffer = 0;
2508 upload_tile_group_obu(
2509 pD3D12Enc,
2510 tile_group_obu_size,
2511 decode_tile_elements_size,
2512 associatedMetadata.m_StagingBitstreamConstruction,
2513 staging_bitstream_buffer_offset,
2514 src_driver_bitstream,
2515 associatedMetadata.comp_bit_destination,
2516 comp_bitstream_offset,
2517 pFrameSubregionMetadata,
2518 associatedMetadata.m_associatedEncodeCapabilities.m_encoderCodecSpecificConfigCaps.m_AV1TileCaps
2519 .TileSizeBytesMinus1 +
2520 1,
2521 associatedMetadata.m_associatedEncodeConfig.m_encoderSliceConfigDesc.m_TilesConfig_AV1.TilesPartition,
2522 currentTg,
2523 written_bytes_to_staging_bitstream_buffer,
2524 associatedMetadata.pWrittenCodecUnitsSizes);
2525
2526 staging_bitstream_buffer_offset += written_bytes_to_staging_bitstream_buffer;
2527 comp_bitstream_offset += tile_group_obu_size;
2528 writtenTileBytes += tile_group_obu_size;
2529
2530 // Flush batch with upload work and wait on this CPU thread for GPU work completion
2531 // for this case we have to do it within the loop, so the CUP arrays that are reused
2532 // on each loop are completely done being read by the GPU before we modify them.
2533 {
2534 struct pipe_fence_handle *pUploadGPUCompletionFence = NULL;
2535 pD3D12Enc->base.context->flush(pD3D12Enc->base.context,
2536 &pUploadGPUCompletionFence,
2537 PIPE_FLUSH_ASYNC | PIPE_FLUSH_HINT_FINISH);
2538 assert(pUploadGPUCompletionFence);
2539 debug_printf(
2540 "[d3d12_video_encoder] d3d12_video_encoder_build_post_encode_codec_bitstream_av1 - Waiting on GPU "
2541 "completion fence for "
2542 " uploading finalized codec headers to compressed bitstream.\n");
2543
2544 pD3D12Enc->m_pD3D12Screen->base.fence_finish(&pD3D12Enc->m_pD3D12Screen->base,
2545 NULL,
2546 pUploadGPUCompletionFence,
2547 OS_TIMEOUT_INFINITE);
2548 pD3D12Enc->m_pD3D12Screen->base.fence_reference(&pD3D12Enc->m_pD3D12Screen->base,
2549 &pUploadGPUCompletionFence,
2550 NULL);
2551 }
2552 }
2553 }
2554
2555 size_t extra_show_existing_frame_payload_bytes = 0;
2556 if (!picHdr.show_frame) {
2557
2558 // When writing in the bitstream a frame that will be accessed as reference by a frame we did not
2559 // write to the bitstream yet, let's store them for future show_existing_frame mechanism
2560 pD3D12Enc->m_currentEncodeConfig.m_encoderCodecSpecificStateDescAV1.pendingShowableFrames.push_back(
2561 associatedMetadata.m_associatedEncodeConfig.m_encoderPicParamsDesc.m_AV1PicData.PictureIndex);
2562
2563 } else { // picHdr.show_frame true
2564
2565 // Check if any of the pending "to be showed later" frames is present in the current frame references
2566 // and if so issue the show_existing_frame header and remove it from the pending list
2567
2568 for (auto pendingFrameIt =
2569 pD3D12Enc->m_currentEncodeConfig.m_encoderCodecSpecificStateDescAV1.pendingShowableFrames.begin();
2570 pendingFrameIt !=
2571 pD3D12Enc->m_currentEncodeConfig.m_encoderCodecSpecificStateDescAV1.pendingShowableFrames.end();) {
2572
2573 // Check if current frame references uses this pendingFrameIt
2574 int cur_ref_idx_matching_pending = -1;
2575 for (unsigned i = 0; i < ARRAY_SIZE(picHdr.ref_frame_idx) /*NUM_REF_FRAMES*/; i++) {
2576 if (
2577 // Is a valid reference
2578 (associatedMetadata.m_associatedEncodeConfig.m_encoderPicParamsDesc.m_AV1PicData
2579 .ReferenceFramesReconPictureDescriptors[picHdr.ref_frame_idx[i]]
2580 .ReconstructedPictureResourceIndex != UNUSED_VIRTUAL_DPB_SLOT_PHYSICAL_INDEX) &&
2581 // And matches the pending frame PictureIndex
2582 (associatedMetadata.m_associatedEncodeConfig.m_encoderPicParamsDesc.m_AV1PicData
2583 .ReferenceFramesReconPictureDescriptors[picHdr.ref_frame_idx[i]]
2584 .PictureIndex == *pendingFrameIt /*PictureIndex*/)) {
2585
2586 // Store the reference index
2587 cur_ref_idx_matching_pending = picHdr.ref_frame_idx[i];
2588 break;
2589 }
2590 }
2591
2592 // If we found a reference of the current frame using pendingFrameIt,
2593 // - Issue the show_existing_frame header
2594 // - Remove it from the pending list
2595 if (cur_ref_idx_matching_pending >= 0) {
2596 size_t staging_buf_offset = pD3D12Enc->m_BitstreamHeadersBuffer.size();
2597
2598
2599 size_t writtenTemporalDelimBytes = 0;
2600 if (D3D12_VIDEO_AV1_INSERT_SHOW_EXISTING_FRAME_HEADER) {
2601 pAV1BitstreamBuilder->write_temporal_delimiter_obu(
2602 pD3D12Enc->m_BitstreamHeadersBuffer,
2603 pD3D12Enc->m_BitstreamHeadersBuffer.begin() + staging_buf_offset, // placingPositionStart
2604 writtenTemporalDelimBytes // Bytes Written AFTER placingPositionStart arg above
2605 );
2606 }
2607 associatedMetadata.pWrittenCodecUnitsSizes.push_back(writtenTemporalDelimBytes);
2608 assert(writtenTemporalDelimBytes == (pD3D12Enc->m_BitstreamHeadersBuffer.size() - staging_buf_offset));
2609
2610 // Add current pending frame being processed in the loop
2611 extra_show_existing_frame_payload_bytes += writtenTemporalDelimBytes;
2612
2613 debug_printf("Written OBU_TEMPORAL_DELIMITER bytes: %" PRIu64 "\n", static_cast<uint64_t>(writtenTemporalDelimBytes));
2614
2615 size_t writtenShowExistingFrameBytes = 0;
2616 av1_pic_header_t showExistingPicHdr = {};
2617 showExistingPicHdr.show_existing_frame = 1;
2618 showExistingPicHdr.frame_to_show_map_idx = cur_ref_idx_matching_pending;
2619
2620 if (D3D12_VIDEO_AV1_INSERT_SHOW_EXISTING_FRAME_HEADER) {
2621 pAV1BitstreamBuilder->write_frame_header(
2622 NULL, // No seq header necessary for show_existing_frame
2623 &showExistingPicHdr,
2624 OBU_FRAME_HEADER,
2625 0, // No tile info for OBU_FRAME_HEADER
2626 pD3D12Enc->m_BitstreamHeadersBuffer,
2627 pD3D12Enc->m_BitstreamHeadersBuffer.begin() + staging_buf_offset +
2628 writtenTemporalDelimBytes, // placingPositionStart
2629 writtenShowExistingFrameBytes // Bytes Written AFTER placingPositionStart arg above
2630 );
2631 }
2632 associatedMetadata.pWrittenCodecUnitsSizes.push_back(writtenShowExistingFrameBytes);
2633
2634 assert(writtenShowExistingFrameBytes ==
2635 (pD3D12Enc->m_BitstreamHeadersBuffer.size() - staging_buf_offset - writtenTemporalDelimBytes));
2636
2637 // Add current pending frame being processed in the loop
2638 extra_show_existing_frame_payload_bytes += writtenShowExistingFrameBytes;
2639
2640 assert(pD3D12Enc->m_BitstreamHeadersBuffer.size() ==
2641 (staging_buf_offset + writtenShowExistingFrameBytes + writtenTemporalDelimBytes));
2642
2643 // Upload headers to the finalized compressed bitstream buffer
2644 // Note: The buffer_subdata is queued in pD3D12Enc->base.context but doesn't execute immediately
2645 pD3D12Enc->base.context->buffer_subdata(pD3D12Enc->base.context, // context
2646 associatedMetadata.comp_bit_destination, // comp. bitstream
2647 PIPE_MAP_WRITE, // usage PIPE_MAP_x
2648 comp_bitstream_offset, // offset
2649 writtenShowExistingFrameBytes + writtenTemporalDelimBytes,
2650 pD3D12Enc->m_BitstreamHeadersBuffer.data() + staging_buf_offset);
2651
2652 comp_bitstream_offset += writtenShowExistingFrameBytes;
2653 comp_bitstream_offset += writtenTemporalDelimBytes;
2654
2655 debug_printf("Written show_existing_frame OBU_FRAME header for previous frame with PictureIndex %d (Used "
2656 "in current frame ref_frame_idx[%" PRIu32 "]) bytes: %" PRIu64 "\n",
2657 *pendingFrameIt /*PictureIndex*/,
2658 showExistingPicHdr.frame_to_show_map_idx,
2659 static_cast<uint64_t>(writtenShowExistingFrameBytes));
2660
2661 // Remove it from the list of pending frames
2662 pendingFrameIt =
2663 pD3D12Enc->m_currentEncodeConfig.m_encoderCodecSpecificStateDescAV1.pendingShowableFrames.erase(
2664 pendingFrameIt);
2665 } else {
2666 pendingFrameIt++;
2667 }
2668 }
2669
2670 // Flush again if uploaded show_existing_frame header(s) to bitstream.
2671 if (extra_show_existing_frame_payload_bytes) {
2672 struct pipe_fence_handle *pUploadGPUCompletionFence = NULL;
2673 pD3D12Enc->base.context->flush(pD3D12Enc->base.context,
2674 &pUploadGPUCompletionFence,
2675 PIPE_FLUSH_ASYNC | PIPE_FLUSH_HINT_FINISH);
2676 assert(pUploadGPUCompletionFence);
2677 debug_printf("[d3d12_video_encoder] [show_existing_frame extra headers upload] "
2678 "d3d12_video_encoder_build_post_encode_codec_bitstream_av1 - Waiting on GPU "
2679 "completion fence for "
2680 " uploading finalized codec headers to compressed bitstream.\n");
2681
2682 pD3D12Enc->m_pD3D12Screen->base.fence_finish(&pD3D12Enc->m_pD3D12Screen->base,
2683 NULL,
2684 pUploadGPUCompletionFence,
2685 OS_TIMEOUT_INFINITE);
2686 pD3D12Enc->m_pD3D12Screen->base.fence_reference(&pD3D12Enc->m_pD3D12Screen->base,
2687 &pUploadGPUCompletionFence,
2688 NULL);
2689 }
2690 }
2691
2692 // d3d12_resource_from_resource calls AddRef to it so this should only be deleting
2693 // the pipe_resource wrapping object and not the underlying spStagingBitstream
2694 pipe_resource_reference(&src_driver_bitstream, NULL);
2695 assert(associatedMetadata.spStagingBitstream.Get());
2696
2697 // Unmap the metadata buffer tmp storage
2698 pipe_buffer_unmap(pD3D12Enc->base.context, mapTransferMetadata);
2699 pipe_resource_reference(&pPipeResolvedMetadataBuffer, NULL);
2700
2701 assert((writtenSequenceBytes + writtenTemporalDelimBytes + writtenFrameBytes +
2702 extra_show_existing_frame_payload_bytes) == pD3D12Enc->m_BitstreamHeadersBuffer.size());
2703
2704 uint32_t total_bytes_written = static_cast<uint32_t>(writtenSequenceBytes + writtenTemporalDelimBytes + writtenFrameBytes +
2705 writtenTileBytes + extra_show_existing_frame_payload_bytes);
2706 assert(std::accumulate(associatedMetadata.pWrittenCodecUnitsSizes.begin(), associatedMetadata.pWrittenCodecUnitsSizes.end(), 0u) ==
2707 static_cast<uint64_t>(total_bytes_written));
2708 return total_bytes_written;
2709 }
2710
2711 void
upload_tile_group_obu(struct d3d12_video_encoder * pD3D12Enc,size_t tile_group_obu_size,size_t decode_tile_elements_size,std::vector<uint8_t> & staging_bitstream_buffer,size_t staging_bitstream_buffer_offset,pipe_resource * src_driver_bitstream,pipe_resource * comp_bit_destination,size_t comp_bit_destination_offset,const D3D12_VIDEO_ENCODER_FRAME_SUBREGION_METADATA * pFrameSubregionMetadata,size_t TileSizeBytes,const D3D12_VIDEO_ENCODER_AV1_PICTURE_CONTROL_SUBREGIONS_LAYOUT_DATA_TILES & TilesPartition,const av1_tile_group_t & tileGroup,size_t & written_bytes_to_staging_bitstream_buffer,std::vector<uint64_t> & pWrittenCodecUnitsSizes)2712 upload_tile_group_obu(struct d3d12_video_encoder *pD3D12Enc,
2713 size_t tile_group_obu_size,
2714 size_t decode_tile_elements_size,
2715 std::vector<uint8_t> &staging_bitstream_buffer,
2716 size_t staging_bitstream_buffer_offset,
2717 pipe_resource *src_driver_bitstream,
2718 pipe_resource *comp_bit_destination,
2719 size_t comp_bit_destination_offset,
2720 const D3D12_VIDEO_ENCODER_FRAME_SUBREGION_METADATA *pFrameSubregionMetadata,
2721 size_t TileSizeBytes, // Pass already +1'd from TileSizeBytesMinus1
2722 const D3D12_VIDEO_ENCODER_AV1_PICTURE_CONTROL_SUBREGIONS_LAYOUT_DATA_TILES &TilesPartition,
2723 const av1_tile_group_t &tileGroup,
2724 size_t &written_bytes_to_staging_bitstream_buffer,
2725 std::vector<uint64_t> &pWrittenCodecUnitsSizes)
2726 {
2727 debug_printf("[Tile group start %d to end %d] Writing to comp_bit_destination %p starts at offset %" PRIu64 "\n",
2728 tileGroup.tg_start,
2729 tileGroup.tg_end,
2730 comp_bit_destination,
2731 static_cast<uint64_t>(comp_bit_destination_offset));
2732
2733 debug_printf("[Tile group start %d to end %d] Using staging_bitstream_buffer %p at offset %" PRIu64
2734 " to write the tile_obu_group() prefix syntax: tile_start_and_end_present_flag, tg_start, tg_end and "
2735 "the tile_size_minus1\n",
2736 tileGroup.tg_start,
2737 tileGroup.tg_end,
2738 staging_bitstream_buffer.data(),
2739 static_cast<uint64_t>(staging_bitstream_buffer_offset));
2740
2741 // Reserve space upfront in the scratch storage
2742 // Do not modify anything before staging_bitstream_buffer_offset
2743
2744 size_t tile_obu_prefix_size = tile_group_obu_size - decode_tile_elements_size;
2745 if (staging_bitstream_buffer.size() < (staging_bitstream_buffer_offset + tile_obu_prefix_size))
2746 staging_bitstream_buffer.resize(staging_bitstream_buffer_offset + tile_obu_prefix_size);
2747
2748 d3d12_video_encoder_bitstream bitstream_tile_group_obu;
2749 bitstream_tile_group_obu.setup_bitstream(staging_bitstream_buffer.size(),
2750 staging_bitstream_buffer.data(),
2751 staging_bitstream_buffer_offset);
2752
2753 uint8_t NumTiles = TilesPartition.ColCount * TilesPartition.RowCount;
2754 bool tile_start_and_end_present_flag = !(tileGroup.tg_start == 0 && (tileGroup.tg_end == (NumTiles - 1)));
2755 if (NumTiles > 1)
2756 bitstream_tile_group_obu.put_bits(1,
2757 tile_start_and_end_present_flag); // tile_start_and_end_present_flag f(1)
2758
2759 if (!(NumTiles == 1 || !tile_start_and_end_present_flag)) {
2760 uint8_t tileBits = log2(TilesPartition.ColCount) + log2(TilesPartition.RowCount);
2761 bitstream_tile_group_obu.put_bits(tileBits, tileGroup.tg_start); // tg_start f(tileBits)
2762 bitstream_tile_group_obu.put_bits(tileBits, tileGroup.tg_end); // tg_end f(tileBits)
2763 }
2764
2765 bitstream_tile_group_obu.put_aligning_bits(); // byte_alignment()
2766
2767 bitstream_tile_group_obu.flush();
2768
2769 size_t bitstream_tile_group_obu_bytes = bitstream_tile_group_obu.get_byte_count() - staging_bitstream_buffer_offset;
2770
2771 debug_printf("[Tile group start %d to end %d] Written %" PRIu64
2772 " bitstream_tile_group_obu_bytes at staging_bitstream_buffer %p at offset %" PRIu64
2773 " for tile_obu_group() prefix syntax: tile_start_and_end_present_flag, tg_start, tg_end\n",
2774 tileGroup.tg_start,
2775 tileGroup.tg_end,
2776 static_cast<uint64_t>(bitstream_tile_group_obu_bytes),
2777 staging_bitstream_buffer.data(),
2778 static_cast<uint64_t>(staging_bitstream_buffer_offset));
2779
2780
2781 // Save this to compare the final written destination byte size against the expected tile_group_obu_size
2782 // at the end of the function
2783 ASSERTED size_t comp_bit_destination_offset_before_upload = comp_bit_destination_offset;
2784
2785 // Upload first part of the header to compressed bitstream destination
2786 // Note: The buffer_subdata is queued in pD3D12Enc->base.context but doesn't execute immediately
2787 if (bitstream_tile_group_obu_bytes > 0) {
2788 pD3D12Enc->base.context->buffer_subdata(
2789 pD3D12Enc->base.context, // context
2790 comp_bit_destination, // comp. bitstream
2791 PIPE_MAP_WRITE, // usage PIPE_MAP_x
2792 comp_bit_destination_offset, // offset
2793 bitstream_tile_group_obu_bytes, // size
2794 staging_bitstream_buffer.data() + staging_bitstream_buffer_offset); // data
2795
2796 debug_printf("[Tile group start %d to end %d] Uploading %" PRIu64 " bytes"
2797 " for tile_obu_group() prefix syntax: tile_start_and_end_present_flag, tg_start, tg_end"
2798 " from staging_bitstream_buffer %p at offset %" PRIu64
2799 " to comp_bit_destination %p at offset %" PRIu64 "\n",
2800 tileGroup.tg_start,
2801 tileGroup.tg_end,
2802 static_cast<uint64_t>(bitstream_tile_group_obu_bytes),
2803 staging_bitstream_buffer.data(),
2804 static_cast<uint64_t>(staging_bitstream_buffer_offset),
2805 comp_bit_destination,
2806 static_cast<uint64_t>(comp_bit_destination_offset));
2807
2808 comp_bit_destination_offset += bitstream_tile_group_obu_bytes;
2809 written_bytes_to_staging_bitstream_buffer += bitstream_tile_group_obu_bytes;
2810 }
2811
2812 size_t src_offset = 0;
2813 for (UINT64 TileIdx = tileGroup.tg_start; TileIdx <= tileGroup.tg_end; TileIdx++) {
2814 size_t tile_size = pFrameSubregionMetadata[TileIdx].bSize - pFrameSubregionMetadata[TileIdx].bStartOffset;
2815 // The i-th tile is read from the src_buffer[offset] with offset = [sum j = (0, (i-1)){ tile[j].bSize }] +
2816 // tile[i].bStartOffset
2817 size_t src_buf_tile_position = src_offset + pFrameSubregionMetadata[TileIdx].bStartOffset;
2818 src_offset += pFrameSubregionMetadata[TileIdx].bSize;
2819
2820 // tile_size_minus_1 not coded for last tile
2821 if ((TileIdx != tileGroup.tg_end)) {
2822 bitstream_tile_group_obu.put_le_bytes(TileSizeBytes, // tile_size_minus_1 le(TileSizeBytes)
2823 tile_size - 1 /* convert to ..._minus_1 */);
2824 bitstream_tile_group_obu.flush();
2825
2826 debug_printf("[Tile group start %d to end %d] [TileIdx %" PRIu64 "] Written %" PRIu64
2827 " written_bytes_to_staging_bitstream_buffer at staging_bitstream_buffer %p at offset %" PRIu64
2828 " for the tile_size_minus1 syntax\n",
2829 tileGroup.tg_start,
2830 tileGroup.tg_end,
2831 TileIdx,
2832 static_cast<uint64_t>(TileSizeBytes),
2833 staging_bitstream_buffer.data(),
2834 static_cast<uint64_t>(written_bytes_to_staging_bitstream_buffer + staging_bitstream_buffer_offset));
2835
2836 // Upload current tile_size_minus_1
2837 // Note: The buffer_subdata is queued in pD3D12Enc->base.context but doesn't execute immediately
2838 pD3D12Enc->base.context->buffer_subdata(pD3D12Enc->base.context, // context
2839 comp_bit_destination, // comp. bitstream
2840 PIPE_MAP_WRITE, // usage PIPE_MAP_x
2841 comp_bit_destination_offset, // offset
2842 TileSizeBytes, // size
2843 staging_bitstream_buffer.data() +
2844 written_bytes_to_staging_bitstream_buffer +
2845 staging_bitstream_buffer_offset); // data
2846
2847 debug_printf("[Tile group start %d to end %d] [TileIdx %" PRIu64 "] Uploading %" PRIu64 " bytes"
2848 " for tile_obu_group() prefix syntax: tile_size_minus_1"
2849 " from staging_bitstream_buffer %p at offset %" PRIu64
2850 " to comp_bit_destination %p at offset %" PRIu64 "\n",
2851 tileGroup.tg_start,
2852 tileGroup.tg_end,
2853 TileIdx,
2854 static_cast<uint64_t>(TileSizeBytes),
2855 staging_bitstream_buffer.data(),
2856 static_cast<uint64_t>(written_bytes_to_staging_bitstream_buffer + staging_bitstream_buffer_offset),
2857 comp_bit_destination,
2858 static_cast<uint64_t>(comp_bit_destination_offset));
2859
2860 comp_bit_destination_offset += TileSizeBytes;
2861 written_bytes_to_staging_bitstream_buffer += TileSizeBytes;
2862 }
2863
2864 // Now copy the decode_tile() element from the driver staging GPU buffer onto the finalized GPU buffer
2865
2866 struct pipe_box src_box;
2867 u_box_3d(static_cast<int>(src_buf_tile_position), // x
2868 0, // y
2869 0, // z
2870 static_cast<int>(tile_size), // width
2871 1, // height
2872 1, // depth
2873 &src_box);
2874
2875 pD3D12Enc->base.context->resource_copy_region(pD3D12Enc->base.context, // ctx
2876 comp_bit_destination, // dst
2877 0, // dst_level
2878 comp_bit_destination_offset, // dstX
2879 0, // dstY
2880 0, // dstZ
2881 src_driver_bitstream, // src
2882 0, // src level
2883 &src_box);
2884
2885 debug_printf("[Tile group start %d to end %d] [TileIdx %" PRIu64 "] Written %" PRIu64
2886 " tile_size bytes data from src_driver_bitstream %p at offset %" PRIu64
2887 " into comp_bit_destination %p at offset %" PRIu64 "\n",
2888 tileGroup.tg_start,
2889 tileGroup.tg_end,
2890 TileIdx,
2891 static_cast<uint64_t>(tile_size),
2892 src_driver_bitstream,
2893 static_cast<uint64_t>(src_buf_tile_position),
2894 comp_bit_destination,
2895 static_cast<uint64_t>(comp_bit_destination_offset));
2896
2897 comp_bit_destination_offset += tile_size;
2898
2899 size_t cur_tile_reportable_size = tile_size;
2900 if (TileIdx != tileGroup.tg_end)
2901 cur_tile_reportable_size += TileSizeBytes; /* extra tile_size_bytes_minus1 in all tiles except last*/
2902 if (TileIdx == 0)
2903 cur_tile_reportable_size += bitstream_tile_group_obu_bytes; // part of the obu tile group header (make part of first tile)
2904 pWrittenCodecUnitsSizes.push_back(cur_tile_reportable_size);
2905 }
2906
2907 // Make sure we wrote the expected bytes that match the obu_size elements
2908 // in the OBUs wrapping this uploaded tile_group_obu
2909 assert((comp_bit_destination_offset - comp_bit_destination_offset_before_upload) == tile_group_obu_size);
2910 }
2911
2912 void
d3d12_video_encoder_store_current_picture_references_av1(d3d12_video_encoder * pD3D12Enc,uint64_t current_metadata_slot)2913 d3d12_video_encoder_store_current_picture_references_av1(d3d12_video_encoder *pD3D12Enc, uint64_t current_metadata_slot)
2914 {
2915 // Update DX12 picparams for post execution (get_feedback) after d3d12_video_encoder_references_manager_av1
2916 // changes
2917 pD3D12Enc->m_spEncodedFrameMetadata[current_metadata_slot].m_associatedEncodeConfig.m_encoderPicParamsDesc =
2918 pD3D12Enc->m_currentEncodeConfig.m_encoderPicParamsDesc;
2919 }
2920