xref: /aosp_15_r20/external/mesa3d/src/gallium/drivers/d3d12/d3d12_video_enc_av1.cpp (revision 6104692788411f58d303aa86923a9ff6ecaded22)
1 /*
2  * Copyright © Microsoft Corporation
3  *
4  * Permission is hereby granted, free of charge, to any person obtaining a
5  * copy of this software and associated documentation files (the "Software"),
6  * to deal in the Software without restriction, including without limitation
7  * the rights to use, copy, modify, merge, publish, distribute, sublicense,
8  * and/or sell copies of the Software, and to permit persons to whom the
9  * Software is furnished to do so, subject to the following conditions:
10  *
11  * The above copyright notice and this permission notice (including the next
12  * paragraph) shall be included in all copies or substantial portions of the
13  * Software.
14  *
15  * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
16  * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
17  * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT.  IN NO EVENT SHALL
18  * THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
19  * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING
20  * FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS
21  * IN THE SOFTWARE.
22  */
23 
24 #include "d3d12_video_enc.h"
25 #include "d3d12_video_enc_av1.h"
26 #include "util/u_video.h"
27 #include "d3d12_resource.h"
28 #include "d3d12_screen.h"
29 #include "d3d12_format.h"
30 #include <cmath>
31 #include <numeric>
32 
33 void
d3d12_video_encoder_update_current_rate_control_av1(struct d3d12_video_encoder * pD3D12Enc,pipe_av1_enc_picture_desc * picture)34 d3d12_video_encoder_update_current_rate_control_av1(struct d3d12_video_encoder *pD3D12Enc,
35                                                     pipe_av1_enc_picture_desc *picture)
36 {
37    assert(picture->temporal_id < ARRAY_SIZE(pipe_av1_enc_picture_desc::rc));
38    assert(picture->temporal_id < ARRAY_SIZE(D3D12EncodeConfiguration::m_encoderRateControlDesc));
39 
40    struct D3D12EncodeRateControlState m_prevRCState = pD3D12Enc->m_currentEncodeConfig.m_encoderRateControlDesc[picture->temporal_id];
41    pD3D12Enc->m_currentEncodeConfig.m_activeRateControlIndex = picture->temporal_id;
42    pD3D12Enc->m_currentEncodeConfig.m_encoderRateControlDesc[picture->temporal_id] = {};
43    pD3D12Enc->m_currentEncodeConfig.m_encoderRateControlDesc[picture->temporal_id].m_FrameRate.Numerator = picture->rc[picture->temporal_id].frame_rate_num;
44    pD3D12Enc->m_currentEncodeConfig.m_encoderRateControlDesc[picture->temporal_id].m_FrameRate.Denominator = picture->rc[picture->temporal_id].frame_rate_den;
45    pD3D12Enc->m_currentEncodeConfig.m_encoderRateControlDesc[picture->temporal_id].m_Flags = D3D12_VIDEO_ENCODER_RATE_CONTROL_FLAG_NONE;
46 
47    if (picture->roi.num > 0)
48       pD3D12Enc->m_currentEncodeConfig.m_encoderRateControlDesc[picture->temporal_id].m_Flags |=
49          D3D12_VIDEO_ENCODER_RATE_CONTROL_FLAG_ENABLE_DELTA_QP;
50 
51    switch (picture->rc[picture->temporal_id].rate_ctrl_method) {
52       case PIPE_H2645_ENC_RATE_CONTROL_METHOD_VARIABLE_SKIP:
53       case PIPE_H2645_ENC_RATE_CONTROL_METHOD_VARIABLE:
54       {
55          pD3D12Enc->m_currentEncodeConfig.m_encoderRateControlDesc[picture->temporal_id].m_Mode = D3D12_VIDEO_ENCODER_RATE_CONTROL_MODE_VBR;
56          pD3D12Enc->m_currentEncodeConfig.m_encoderRateControlDesc[picture->temporal_id].m_Config.m_Configuration_VBR.TargetAvgBitRate =
57             picture->rc[picture->temporal_id].target_bitrate;
58          pD3D12Enc->m_currentEncodeConfig.m_encoderRateControlDesc[picture->temporal_id].m_Config.m_Configuration_VBR.PeakBitRate =
59             picture->rc[picture->temporal_id].peak_bitrate;
60 
61          if (D3D12_VIDEO_ENC_CBR_FORCE_VBV_EQUAL_BITRATE) {
62             debug_printf(
63                "[d3d12_video_encoder_av1] d3d12_video_encoder_update_current_rate_control_av1 "
64                "D3D12_VIDEO_ENC_CBR_FORCE_VBV_EQUAL_BITRATE environment variable is set, "
65                ", forcing VBV Size = VBV Initial Capacity = Target Bitrate = %" PRIu64 " (bits)\n",
66                pD3D12Enc->m_currentEncodeConfig.m_encoderRateControlDesc[picture->temporal_id].m_Config.m_Configuration_CBR.TargetBitRate);
67             pD3D12Enc->m_currentEncodeConfig.m_encoderRateControlDesc[picture->temporal_id].m_Flags |=
68                D3D12_VIDEO_ENCODER_RATE_CONTROL_FLAG_ENABLE_VBV_SIZES;
69             pD3D12Enc->m_currentEncodeConfig.m_encoderRateControlDesc[picture->temporal_id].m_Config.m_Configuration_CBR.VBVCapacity =
70                pD3D12Enc->m_currentEncodeConfig.m_encoderRateControlDesc[picture->temporal_id].m_Config.m_Configuration_CBR.TargetBitRate;
71             pD3D12Enc->m_currentEncodeConfig.m_encoderRateControlDesc[picture->temporal_id].m_Config.m_Configuration_CBR.InitialVBVFullness =
72                pD3D12Enc->m_currentEncodeConfig.m_encoderRateControlDesc[picture->temporal_id].m_Config.m_Configuration_CBR.TargetBitRate;
73          } else if (picture->rc[picture->temporal_id].app_requested_hrd_buffer) {
74             debug_printf(
75                "[d3d12_video_encoder_av1] d3d12_video_encoder_update_current_rate_control_av1 HRD required by app,"
76                " setting VBV Size = %d (bits) - VBV Initial Capacity %d (bits)\n",
77                picture->rc[picture->temporal_id].vbv_buffer_size,
78                picture->rc[picture->temporal_id].vbv_buf_initial_size);
79             pD3D12Enc->m_currentEncodeConfig.m_encoderRateControlDesc[picture->temporal_id].m_Flags |=
80                D3D12_VIDEO_ENCODER_RATE_CONTROL_FLAG_ENABLE_VBV_SIZES;
81             pD3D12Enc->m_currentEncodeConfig.m_encoderRateControlDesc[picture->temporal_id].m_Config.m_Configuration_VBR.VBVCapacity =
82                picture->rc[picture->temporal_id].vbv_buffer_size;
83             pD3D12Enc->m_currentEncodeConfig.m_encoderRateControlDesc[picture->temporal_id].m_Config.m_Configuration_VBR.InitialVBVFullness =
84                picture->rc[picture->temporal_id].vbv_buf_initial_size;
85          }
86 
87          pD3D12Enc->m_currentEncodeConfig.m_encoderRateControlDesc[picture->temporal_id].max_frame_size = picture->rc[picture->temporal_id].max_au_size;
88          if (picture->rc[picture->temporal_id].max_au_size > 0) {
89             pD3D12Enc->m_currentEncodeConfig.m_encoderRateControlDesc[picture->temporal_id].m_Flags |=
90                D3D12_VIDEO_ENCODER_RATE_CONTROL_FLAG_ENABLE_MAX_FRAME_SIZE;
91             pD3D12Enc->m_currentEncodeConfig.m_encoderRateControlDesc[picture->temporal_id].m_Config.m_Configuration_VBR.MaxFrameBitSize =
92                picture->rc[picture->temporal_id].max_au_size;
93 
94             debug_printf(
95                "[d3d12_video_encoder_av1] d3d12_video_encoder_update_current_rate_control_av1 "
96                "Upper layer requested explicit MaxFrameBitSize: %" PRIu64 "\n",
97                pD3D12Enc->m_currentEncodeConfig.m_encoderRateControlDesc[picture->temporal_id].m_Config.m_Configuration_VBR.MaxFrameBitSize);
98          }
99 
100          if (picture->rc[picture->temporal_id].app_requested_qp_range) {
101             debug_printf("[d3d12_video_encoder_av1] d3d12_video_encoder_update_current_rate_control_av1 "
102                          "Upper layer requested explicit MinQP: %d MaxQP: %d\n",
103                          picture->rc[picture->temporal_id].min_qp,
104                          picture->rc[picture->temporal_id].max_qp);
105             pD3D12Enc->m_currentEncodeConfig.m_encoderRateControlDesc[picture->temporal_id].m_Flags |=
106                D3D12_VIDEO_ENCODER_RATE_CONTROL_FLAG_ENABLE_QP_RANGE;
107             pD3D12Enc->m_currentEncodeConfig.m_encoderRateControlDesc[picture->temporal_id].m_Config.m_Configuration_VBR.MinQP =
108                picture->rc[picture->temporal_id].min_qp;
109             pD3D12Enc->m_currentEncodeConfig.m_encoderRateControlDesc[picture->temporal_id].m_Config.m_Configuration_VBR.MaxQP =
110                picture->rc[picture->temporal_id].max_qp;
111          }
112 
113          if (picture->quality_modes.level > 0) {
114             pD3D12Enc->m_currentEncodeConfig.m_encoderRateControlDesc[picture->temporal_id].m_Flags |=
115                D3D12_VIDEO_ENCODER_RATE_CONTROL_FLAG_ENABLE_QUALITY_VS_SPEED;
116             pD3D12Enc->m_currentEncodeConfig.m_encoderRateControlDesc[picture->temporal_id].m_Flags |=
117                D3D12_VIDEO_ENCODER_RATE_CONTROL_FLAG_ENABLE_EXTENSION1_SUPPORT;
118 
119             // Convert between D3D12 definition and PIPE definition
120             // D3D12: QualityVsSpeed must be in the range [0, D3D12_FEATURE_DATA_VIDEO_ENCODER_SUPPORT1.MaxQualityVsSpeed]
121             // The lower the value, the fastest the encode operation
122             // PIPE: The quality level range can be queried through the VAConfigAttribEncQualityRange attribute.
123             // A lower value means higher quality, and a value of 1 represents the highest quality.
124             // The quality level setting is used as a trade-off between quality and speed/power
125             // consumption, with higher quality corresponds to lower speed and higher power consumption.
126 
127             pD3D12Enc->m_currentEncodeConfig.m_encoderRateControlDesc[picture->temporal_id].m_Config.m_Configuration_VBR1.QualityVsSpeed =
128                pD3D12Enc->max_quality_levels - picture->quality_modes.level;
129          }
130 
131       } break;
132       case PIPE_H2645_ENC_RATE_CONTROL_METHOD_QUALITY_VARIABLE:
133       {
134          pD3D12Enc->m_currentEncodeConfig.m_encoderRateControlDesc[picture->temporal_id].m_Mode = D3D12_VIDEO_ENCODER_RATE_CONTROL_MODE_QVBR;
135          pD3D12Enc->m_currentEncodeConfig.m_encoderRateControlDesc[picture->temporal_id].m_Config.m_Configuration_QVBR.TargetAvgBitRate =
136             picture->rc[picture->temporal_id].target_bitrate;
137          pD3D12Enc->m_currentEncodeConfig.m_encoderRateControlDesc[picture->temporal_id].m_Config.m_Configuration_QVBR.PeakBitRate =
138             picture->rc[picture->temporal_id].peak_bitrate;
139          pD3D12Enc->m_currentEncodeConfig.m_encoderRateControlDesc[picture->temporal_id].m_Config.m_Configuration_QVBR.ConstantQualityTarget =
140             picture->rc[picture->temporal_id].vbr_quality_factor;
141 
142          if (D3D12_VIDEO_ENC_CBR_FORCE_VBV_EQUAL_BITRATE) {
143             debug_printf("[d3d12_video_encoder_av1] d3d12_video_encoder_update_current_rate_control_av1 "
144                          "D3D12_VIDEO_ENC_CBR_FORCE_VBV_EQUAL_BITRATE environment variable is set, "
145                          ", forcing VBV Size = VBV Initial Capacity = Target Bitrate = %" PRIu64 " (bits)\n",
146                          pD3D12Enc->m_currentEncodeConfig.m_encoderRateControlDesc[picture->temporal_id].m_Config.m_Configuration_QVBR1
147                             .TargetAvgBitRate);
148             pD3D12Enc->m_currentEncodeConfig.m_encoderRateControlDesc[picture->temporal_id].m_Flags |=
149                D3D12_VIDEO_ENCODER_RATE_CONTROL_FLAG_ENABLE_VBV_SIZES;
150             pD3D12Enc->m_currentEncodeConfig.m_encoderRateControlDesc[picture->temporal_id].m_Flags |=
151                D3D12_VIDEO_ENCODER_RATE_CONTROL_FLAG_ENABLE_EXTENSION1_SUPPORT;
152             pD3D12Enc->m_currentEncodeConfig.m_encoderRateControlDesc[picture->temporal_id].m_Config.m_Configuration_QVBR1.VBVCapacity =
153                pD3D12Enc->m_currentEncodeConfig.m_encoderRateControlDesc[picture->temporal_id].m_Config.m_Configuration_QVBR1.TargetAvgBitRate;
154             pD3D12Enc->m_currentEncodeConfig.m_encoderRateControlDesc[picture->temporal_id].m_Config.m_Configuration_QVBR1.InitialVBVFullness =
155                pD3D12Enc->m_currentEncodeConfig.m_encoderRateControlDesc[picture->temporal_id].m_Config.m_Configuration_QVBR1.TargetAvgBitRate;
156          } else if (picture->rc[picture->temporal_id].app_requested_hrd_buffer) {
157             debug_printf(
158                "[d3d12_video_encoder_av1] d3d12_video_encoder_update_current_rate_control_av1 HRD required by app,"
159                " setting VBV Size = %d (bits) - VBV Initial Capacity %d (bits)\n",
160                picture->rc[picture->temporal_id].vbv_buffer_size,
161                picture->rc[picture->temporal_id].vbv_buf_initial_size);
162             pD3D12Enc->m_currentEncodeConfig.m_encoderRateControlDesc[picture->temporal_id].m_Flags |=
163                D3D12_VIDEO_ENCODER_RATE_CONTROL_FLAG_ENABLE_VBV_SIZES;
164             pD3D12Enc->m_currentEncodeConfig.m_encoderRateControlDesc[picture->temporal_id].m_Flags |=
165                D3D12_VIDEO_ENCODER_RATE_CONTROL_FLAG_ENABLE_EXTENSION1_SUPPORT;
166             pD3D12Enc->m_currentEncodeConfig.m_encoderRateControlDesc[picture->temporal_id].m_Config.m_Configuration_QVBR1.VBVCapacity =
167                picture->rc[picture->temporal_id].vbv_buffer_size;
168             pD3D12Enc->m_currentEncodeConfig.m_encoderRateControlDesc[picture->temporal_id].m_Config.m_Configuration_QVBR1.InitialVBVFullness =
169                picture->rc[picture->temporal_id].vbv_buf_initial_size;
170          }
171          pD3D12Enc->m_currentEncodeConfig.m_encoderRateControlDesc[picture->temporal_id].max_frame_size = picture->rc[picture->temporal_id].max_au_size;
172          if (picture->rc[picture->temporal_id].max_au_size > 0) {
173             pD3D12Enc->m_currentEncodeConfig.m_encoderRateControlDesc[picture->temporal_id].m_Flags |=
174                D3D12_VIDEO_ENCODER_RATE_CONTROL_FLAG_ENABLE_MAX_FRAME_SIZE;
175             pD3D12Enc->m_currentEncodeConfig.m_encoderRateControlDesc[picture->temporal_id].m_Config.m_Configuration_QVBR.MaxFrameBitSize =
176                picture->rc[picture->temporal_id].max_au_size;
177 
178             debug_printf(
179                "[d3d12_video_encoder_av1] d3d12_video_encoder_update_current_rate_control_av1 "
180                "Upper layer requested explicit MaxFrameBitSize: %" PRIu64 "\n",
181                pD3D12Enc->m_currentEncodeConfig.m_encoderRateControlDesc[picture->temporal_id].m_Config.m_Configuration_QVBR.MaxFrameBitSize);
182          }
183 
184          if (picture->rc[picture->temporal_id].app_requested_qp_range) {
185             debug_printf("[d3d12_video_encoder_av1] d3d12_video_encoder_update_current_rate_control_av1 "
186                          "Upper layer requested explicit MinQP: %d MaxQP: %d\n",
187                          picture->rc[picture->temporal_id].min_qp,
188                          picture->rc[picture->temporal_id].max_qp);
189             pD3D12Enc->m_currentEncodeConfig.m_encoderRateControlDesc[picture->temporal_id].m_Flags |=
190                D3D12_VIDEO_ENCODER_RATE_CONTROL_FLAG_ENABLE_QP_RANGE;
191             pD3D12Enc->m_currentEncodeConfig.m_encoderRateControlDesc[picture->temporal_id].m_Config.m_Configuration_QVBR.MinQP =
192                picture->rc[picture->temporal_id].min_qp;
193             pD3D12Enc->m_currentEncodeConfig.m_encoderRateControlDesc[picture->temporal_id].m_Config.m_Configuration_QVBR.MaxQP =
194                picture->rc[picture->temporal_id].max_qp;
195          }
196 
197          if (picture->quality_modes.level > 0) {
198             pD3D12Enc->m_currentEncodeConfig.m_encoderRateControlDesc[picture->temporal_id].m_Flags |=
199                D3D12_VIDEO_ENCODER_RATE_CONTROL_FLAG_ENABLE_QUALITY_VS_SPEED;
200             pD3D12Enc->m_currentEncodeConfig.m_encoderRateControlDesc[picture->temporal_id].m_Flags |=
201                D3D12_VIDEO_ENCODER_RATE_CONTROL_FLAG_ENABLE_EXTENSION1_SUPPORT;
202 
203             // Convert between D3D12 definition and PIPE definition
204             // D3D12: QualityVsSpeed must be in the range [0, D3D12_FEATURE_DATA_VIDEO_ENCODER_SUPPORT1.MaxQualityVsSpeed]
205             // The lower the value, the fastest the encode operation
206             // PIPE: The quality level range can be queried through the VAConfigAttribEncQualityRange attribute.
207             // A lower value means higher quality, and a value of 1 represents the highest quality.
208             // The quality level setting is used as a trade-off between quality and speed/power
209             // consumption, with higher quality corresponds to lower speed and higher power consumption.
210 
211             pD3D12Enc->m_currentEncodeConfig.m_encoderRateControlDesc[picture->temporal_id].m_Config.m_Configuration_QVBR1.QualityVsSpeed =
212                pD3D12Enc->max_quality_levels - picture->quality_modes.level;
213          }
214 
215       } break;
216       case PIPE_H2645_ENC_RATE_CONTROL_METHOD_CONSTANT_SKIP:
217       case PIPE_H2645_ENC_RATE_CONTROL_METHOD_CONSTANT:
218       {
219          pD3D12Enc->m_currentEncodeConfig.m_encoderRateControlDesc[picture->temporal_id].m_Mode = D3D12_VIDEO_ENCODER_RATE_CONTROL_MODE_CBR;
220          pD3D12Enc->m_currentEncodeConfig.m_encoderRateControlDesc[picture->temporal_id].m_Config.m_Configuration_CBR.TargetBitRate =
221             picture->rc[picture->temporal_id].target_bitrate;
222 
223          /* For CBR mode, to guarantee bitrate of generated stream complies with
224           * target bitrate (e.g. no over +/-10%), vbv_buffer_size and initial capacity should be same
225           * as target bitrate. Controlled by OS env var D3D12_VIDEO_ENC_CBR_FORCE_VBV_EQUAL_BITRATE
226           */
227          if (D3D12_VIDEO_ENC_CBR_FORCE_VBV_EQUAL_BITRATE) {
228             debug_printf(
229                "[d3d12_video_encoder_av1] d3d12_video_encoder_update_current_rate_control_av1 "
230                "D3D12_VIDEO_ENC_CBR_FORCE_VBV_EQUAL_BITRATE environment variable is set, "
231                ", forcing VBV Size = VBV Initial Capacity = Target Bitrate = %" PRIu64 " (bits)\n",
232                pD3D12Enc->m_currentEncodeConfig.m_encoderRateControlDesc[picture->temporal_id].m_Config.m_Configuration_CBR.TargetBitRate);
233             pD3D12Enc->m_currentEncodeConfig.m_encoderRateControlDesc[picture->temporal_id].m_Flags |=
234                D3D12_VIDEO_ENCODER_RATE_CONTROL_FLAG_ENABLE_VBV_SIZES;
235             pD3D12Enc->m_currentEncodeConfig.m_encoderRateControlDesc[picture->temporal_id].m_Config.m_Configuration_CBR.VBVCapacity =
236                pD3D12Enc->m_currentEncodeConfig.m_encoderRateControlDesc[picture->temporal_id].m_Config.m_Configuration_CBR.TargetBitRate;
237             pD3D12Enc->m_currentEncodeConfig.m_encoderRateControlDesc[picture->temporal_id].m_Config.m_Configuration_CBR.InitialVBVFullness =
238                pD3D12Enc->m_currentEncodeConfig.m_encoderRateControlDesc[picture->temporal_id].m_Config.m_Configuration_CBR.TargetBitRate;
239          } else if (picture->rc[picture->temporal_id].app_requested_hrd_buffer) {
240             debug_printf(
241                "[d3d12_video_encoder_av1] d3d12_video_encoder_update_current_rate_control_av1 HRD required by app,"
242                " setting VBV Size = %d (bits) - VBV Initial Capacity %d (bits)\n",
243                picture->rc[picture->temporal_id].vbv_buffer_size,
244                picture->rc[picture->temporal_id].vbv_buf_initial_size);
245             pD3D12Enc->m_currentEncodeConfig.m_encoderRateControlDesc[picture->temporal_id].m_Flags |=
246                D3D12_VIDEO_ENCODER_RATE_CONTROL_FLAG_ENABLE_VBV_SIZES;
247             pD3D12Enc->m_currentEncodeConfig.m_encoderRateControlDesc[picture->temporal_id].m_Config.m_Configuration_CBR.VBVCapacity =
248                picture->rc[picture->temporal_id].vbv_buffer_size;
249             pD3D12Enc->m_currentEncodeConfig.m_encoderRateControlDesc[picture->temporal_id].m_Config.m_Configuration_CBR.InitialVBVFullness =
250                picture->rc[picture->temporal_id].vbv_buf_initial_size;
251          }
252 
253          pD3D12Enc->m_currentEncodeConfig.m_encoderRateControlDesc[picture->temporal_id].max_frame_size = picture->rc[picture->temporal_id].max_au_size;
254          if (picture->rc[picture->temporal_id].max_au_size > 0) {
255             pD3D12Enc->m_currentEncodeConfig.m_encoderRateControlDesc[picture->temporal_id].m_Flags |=
256                D3D12_VIDEO_ENCODER_RATE_CONTROL_FLAG_ENABLE_MAX_FRAME_SIZE;
257             pD3D12Enc->m_currentEncodeConfig.m_encoderRateControlDesc[picture->temporal_id].m_Config.m_Configuration_CBR.MaxFrameBitSize =
258                picture->rc[picture->temporal_id].max_au_size;
259 
260             debug_printf(
261                "[d3d12_video_encoder_av1] d3d12_video_encoder_update_current_rate_control_av1 "
262                "Upper layer requested explicit MaxFrameBitSize: %" PRIu64 "\n",
263                pD3D12Enc->m_currentEncodeConfig.m_encoderRateControlDesc[picture->temporal_id].m_Config.m_Configuration_CBR.MaxFrameBitSize);
264          }
265 
266          if (picture->rc[picture->temporal_id].app_requested_qp_range) {
267             debug_printf("[d3d12_video_encoder_av1] d3d12_video_encoder_update_current_rate_control_av1 "
268                          "Upper layer requested explicit MinQP: %d MaxQP: %d\n",
269                          picture->rc[picture->temporal_id].min_qp,
270                          picture->rc[picture->temporal_id].max_qp);
271 
272             pD3D12Enc->m_currentEncodeConfig.m_encoderRateControlDesc[picture->temporal_id].m_Flags |=
273                D3D12_VIDEO_ENCODER_RATE_CONTROL_FLAG_ENABLE_QP_RANGE;
274             pD3D12Enc->m_currentEncodeConfig.m_encoderRateControlDesc[picture->temporal_id].m_Config.m_Configuration_CBR.MinQP =
275                picture->rc[picture->temporal_id].min_qp;
276             pD3D12Enc->m_currentEncodeConfig.m_encoderRateControlDesc[picture->temporal_id].m_Config.m_Configuration_CBR.MaxQP =
277                picture->rc[picture->temporal_id].max_qp;
278          }
279 
280          if (picture->quality_modes.level > 0) {
281             pD3D12Enc->m_currentEncodeConfig.m_encoderRateControlDesc[picture->temporal_id].m_Flags |=
282                D3D12_VIDEO_ENCODER_RATE_CONTROL_FLAG_ENABLE_QUALITY_VS_SPEED;
283             pD3D12Enc->m_currentEncodeConfig.m_encoderRateControlDesc[picture->temporal_id].m_Flags |=
284                D3D12_VIDEO_ENCODER_RATE_CONTROL_FLAG_ENABLE_EXTENSION1_SUPPORT;
285 
286             // Convert between D3D12 definition and PIPE definition
287             // D3D12: QualityVsSpeed must be in the range [0, D3D12_FEATURE_DATA_VIDEO_ENCODER_SUPPORT1.MaxQualityVsSpeed]
288             // The lower the value, the fastest the encode operation
289             // PIPE: The quality level range can be queried through the VAConfigAttribEncQualityRange attribute.
290             // A lower value means higher quality, and a value of 1 represents the highest quality.
291             // The quality level setting is used as a trade-off between quality and speed/power
292             // consumption, with higher quality corresponds to lower speed and higher power consumption.
293 
294             pD3D12Enc->m_currentEncodeConfig.m_encoderRateControlDesc[picture->temporal_id].m_Config.m_Configuration_CBR1.QualityVsSpeed =
295                pD3D12Enc->max_quality_levels - picture->quality_modes.level;
296          }
297 
298       } break;
299       case PIPE_H2645_ENC_RATE_CONTROL_METHOD_DISABLE:
300       {
301          // We need to initialize the QP value for all frame types on the first frame
302          // otherwise some drivers crash.
303          // frontends currently only send the QP values for the specific frame type of
304          // the current frame, so give a default value for all types until all frame
305          // types are configured on subsequent encode frame calls
306          if (pD3D12Enc->m_fenceValue == 1)
307          {
308             m_prevRCState.m_Config.m_Configuration_CQP
309                   .ConstantQP_FullIntracodedFrame = 30 /* initial_qp_default */;
310             m_prevRCState.m_Config.m_Configuration_CQP
311                   .ConstantQP_InterPredictedFrame_PrevRefOnly = 30 /* initial_qp_default */;
312             m_prevRCState.m_Config.m_Configuration_CQP
313                   .ConstantQP_InterPredictedFrame_BiDirectionalRef = 30 /* initial_qp_default */;
314          }
315 
316          pD3D12Enc->m_currentEncodeConfig.m_encoderRateControlDesc[picture->temporal_id].m_Mode = D3D12_VIDEO_ENCODER_RATE_CONTROL_MODE_CQP;
317          if (picture->rc[picture->temporal_id].app_requested_initial_qp) {
318             // Load previous RC state for all frames and only update the current frame
319             pD3D12Enc->m_currentEncodeConfig.m_encoderRateControlDesc[picture->temporal_id].m_Config.m_Configuration_CQP =
320                m_prevRCState.m_Config.m_Configuration_CQP;
321 
322             if ((picture->frame_type == PIPE_AV1_ENC_FRAME_TYPE_INTRA_ONLY) ||
323                           (picture->frame_type == PIPE_AV1_ENC_FRAME_TYPE_KEY)) {
324                // Update intra frame qp
325                pD3D12Enc->m_currentEncodeConfig.m_encoderRateControlDesc[picture->temporal_id].m_Config.m_Configuration_CQP
326                   .ConstantQP_FullIntracodedFrame = picture->rc[picture->temporal_id].qp;
327             } else {
328                // Update inter frame QP config
329                pD3D12Enc->m_currentEncodeConfig.m_encoderRateControlDesc[picture->temporal_id].m_Config.m_Configuration_CQP
330                   .ConstantQP_InterPredictedFrame_PrevRefOnly = picture->rc[picture->temporal_id].qp_inter;
331                pD3D12Enc->m_currentEncodeConfig.m_encoderRateControlDesc[picture->temporal_id].m_Config.m_Configuration_CQP
332                   .ConstantQP_InterPredictedFrame_BiDirectionalRef = picture->rc[picture->temporal_id].qp_inter;
333             }
334          }
335 
336          if (picture->quality_modes.level > 0) {
337             pD3D12Enc->m_currentEncodeConfig.m_encoderRateControlDesc[picture->temporal_id].m_Flags |=
338                D3D12_VIDEO_ENCODER_RATE_CONTROL_FLAG_ENABLE_QUALITY_VS_SPEED;
339             pD3D12Enc->m_currentEncodeConfig.m_encoderRateControlDesc[picture->temporal_id].m_Flags |=
340                D3D12_VIDEO_ENCODER_RATE_CONTROL_FLAG_ENABLE_EXTENSION1_SUPPORT;
341             // Convert between D3D12 definition and PIPE definition
342             // D3D12: QualityVsSpeed must be in the range [0, D3D12_FEATURE_DATA_VIDEO_ENCODER_SUPPORT1.MaxQualityVsSpeed]
343             // The lower the value, the fastest the encode operation
344             // PIPE: The quality level range can be queried through the VAConfigAttribEncQualityRange attribute.
345             // A lower value means higher quality, and a value of 1 represents the highest quality.
346             // The quality level setting is used as a trade-off between quality and speed/power
347             // consumption, with higher quality corresponds to lower speed and higher power consumption.
348 
349             pD3D12Enc->m_currentEncodeConfig.m_encoderRateControlDesc[picture->temporal_id].m_Config.m_Configuration_CQP1.QualityVsSpeed =
350                pD3D12Enc->max_quality_levels - picture->quality_modes.level;
351          }
352       } break;
353       default:
354       {
355          debug_printf("[d3d12_video_encoder_av1] d3d12_video_encoder_update_current_rate_control_av1 invalid RC "
356                       "config, using default RC CQP mode\n");
357          pD3D12Enc->m_currentEncodeConfig.m_encoderRateControlDesc[picture->temporal_id].m_Mode = D3D12_VIDEO_ENCODER_RATE_CONTROL_MODE_CQP;
358          pD3D12Enc->m_currentEncodeConfig.m_encoderRateControlDesc[picture->temporal_id].m_Config.m_Configuration_CQP
359             .ConstantQP_FullIntracodedFrame = 30;
360          pD3D12Enc->m_currentEncodeConfig.m_encoderRateControlDesc[picture->temporal_id].m_Config.m_Configuration_CQP
361             .ConstantQP_InterPredictedFrame_PrevRefOnly = 30;
362          pD3D12Enc->m_currentEncodeConfig.m_encoderRateControlDesc[picture->temporal_id].m_Config.m_Configuration_CQP
363             .ConstantQP_InterPredictedFrame_BiDirectionalRef = 30;
364       } break;
365    }
366 }
367 
368 //
369 // Returns AV1 extra size on top of the usual base metadata layout size
370 //
371 size_t
d3d12_video_encoder_calculate_metadata_resolved_buffer_size_av1(uint32_t maxSliceNumber)372 d3d12_video_encoder_calculate_metadata_resolved_buffer_size_av1(uint32_t maxSliceNumber)
373 {
374    return sizeof(D3D12_VIDEO_ENCODER_AV1_PICTURE_CONTROL_SUBREGIONS_LAYOUT_DATA_TILES) +
375           sizeof(D3D12_VIDEO_ENCODER_AV1_POST_ENCODE_VALUES);
376 }
377 
378 void
d3d12_video_encoder_convert_d3d12_to_spec_level_av1(D3D12_VIDEO_ENCODER_AV1_LEVELS level12,uint32_t & specLevel)379 d3d12_video_encoder_convert_d3d12_to_spec_level_av1(D3D12_VIDEO_ENCODER_AV1_LEVELS level12, uint32_t &specLevel)
380 {
381    // Enum matches values as in seq_level_idx
382    specLevel = (uint32_t) level12;
383 }
384 
385 void
d3d12_video_encoder_convert_d3d12_to_spec_tier_av1(D3D12_VIDEO_ENCODER_AV1_TIER tier12,uint32_t & specTier)386 d3d12_video_encoder_convert_d3d12_to_spec_tier_av1(D3D12_VIDEO_ENCODER_AV1_TIER tier12, uint32_t &specTier)
387 {
388    // Enum matches values as in seq_level_idx
389    specTier = (uint32_t) tier12;
390 }
391 
392 void
d3d12_video_encoder_convert_spec_to_d3d12_level_av1(uint32_t specLevel,D3D12_VIDEO_ENCODER_AV1_LEVELS & level12)393 d3d12_video_encoder_convert_spec_to_d3d12_level_av1(uint32_t specLevel, D3D12_VIDEO_ENCODER_AV1_LEVELS &level12)
394 {
395    // Enum matches values as in seq_level_idx
396    level12 = (D3D12_VIDEO_ENCODER_AV1_LEVELS) specLevel;
397 }
398 
399 void
d3d12_video_encoder_convert_spec_to_d3d12_tier_av1(uint32_t specTier,D3D12_VIDEO_ENCODER_AV1_TIER & tier12)400 d3d12_video_encoder_convert_spec_to_d3d12_tier_av1(uint32_t specTier, D3D12_VIDEO_ENCODER_AV1_TIER &tier12)
401 {
402    // Enum matches values as in seq_tier
403    tier12 = (D3D12_VIDEO_ENCODER_AV1_TIER) specTier;
404 }
405 
406 uint32_t
d3d12_video_encoder_convert_d3d12_profile_to_spec_profile_av1(D3D12_VIDEO_ENCODER_AV1_PROFILE profile)407 d3d12_video_encoder_convert_d3d12_profile_to_spec_profile_av1(D3D12_VIDEO_ENCODER_AV1_PROFILE profile)
408 {
409    switch (profile) {
410       case D3D12_VIDEO_ENCODER_AV1_PROFILE_MAIN:
411       {
412          return 0;
413       } break;
414       default:
415       {
416          unreachable("Unsupported D3D12_VIDEO_ENCODER_AV1_PROFILE");
417       } break;
418    }
419 }
420 
421 D3D12_VIDEO_ENCODER_AV1_PROFILE
d3d12_video_encoder_convert_profile_to_d3d12_enc_profile_av1(enum pipe_video_profile profile)422 d3d12_video_encoder_convert_profile_to_d3d12_enc_profile_av1(enum pipe_video_profile profile)
423 {
424    switch (profile) {
425       case PIPE_VIDEO_PROFILE_AV1_MAIN:
426       {
427          return D3D12_VIDEO_ENCODER_AV1_PROFILE_MAIN;
428       } break;
429       default:
430       {
431          unreachable("Unsupported pipe_video_profile");
432       } break;
433    }
434 }
435 
436 bool
d3d12_video_encoder_update_av1_gop_configuration(struct d3d12_video_encoder * pD3D12Enc,pipe_av1_enc_picture_desc * picture)437 d3d12_video_encoder_update_av1_gop_configuration(struct d3d12_video_encoder *pD3D12Enc,
438                                                  pipe_av1_enc_picture_desc *picture)
439 {
440    static_assert((unsigned) D3D12_VIDEO_ENCODER_AV1_FRAME_TYPE_KEY_FRAME == (unsigned) PIPE_AV1_ENC_FRAME_TYPE_KEY);
441    static_assert((unsigned) D3D12_VIDEO_ENCODER_AV1_FRAME_TYPE_INTER_FRAME == (unsigned) PIPE_AV1_ENC_FRAME_TYPE_INTER);
442    static_assert((unsigned) D3D12_VIDEO_ENCODER_AV1_FRAME_TYPE_INTRA_ONLY_FRAME ==
443                  (unsigned) PIPE_AV1_ENC_FRAME_TYPE_INTRA_ONLY);
444    static_assert((unsigned) D3D12_VIDEO_ENCODER_AV1_FRAME_TYPE_SWITCH_FRAME ==
445                  (unsigned) PIPE_AV1_ENC_FRAME_TYPE_SWITCH);
446 
447    // Only update GOP when it begins
448    // This triggers DPB/encoder/heap re-creation, so only check on IDR when a GOP might change
449    if ((picture->frame_type == PIPE_AV1_ENC_FRAME_TYPE_INTRA_ONLY) ||
450        (picture->frame_type == PIPE_AV1_ENC_FRAME_TYPE_KEY)) {
451       uint32_t GOPLength = picture->seq.intra_period;
452       uint32_t PPicturePeriod = picture->seq.ip_period;
453 
454       // Set dirty flag if m_AV1SequenceStructure changed
455       auto previousGOPConfig = pD3D12Enc->m_currentEncodeConfig.m_encoderGOPConfigDesc.m_AV1SequenceStructure;
456       pD3D12Enc->m_currentEncodeConfig.m_encoderGOPConfigDesc.m_AV1SequenceStructure = {
457          GOPLength,
458          PPicturePeriod,
459       };
460 
461       if (memcmp(&previousGOPConfig,
462                  &pD3D12Enc->m_currentEncodeConfig.m_encoderGOPConfigDesc.m_AV1SequenceStructure,
463                  sizeof(D3D12_VIDEO_ENCODER_AV1_SEQUENCE_STRUCTURE)) != 0) {
464          pD3D12Enc->m_currentEncodeConfig.m_ConfigDirtyFlags |= d3d12_video_encoder_config_dirty_flag_gop;
465       }
466    }
467    return true;
468 }
469 
470 D3D12_VIDEO_ENCODER_MOTION_ESTIMATION_PRECISION_MODE
d3d12_video_encoder_convert_av1_motion_configuration(struct d3d12_video_encoder * pD3D12Enc,pipe_av1_enc_picture_desc * picture)471 d3d12_video_encoder_convert_av1_motion_configuration(struct d3d12_video_encoder *pD3D12Enc,
472                                                      pipe_av1_enc_picture_desc *picture)
473 {
474    return D3D12_VIDEO_ENCODER_MOTION_ESTIMATION_PRECISION_MODE_MAXIMUM;
475 }
476 
477 bool
d3d12_video_encoder_compare_tile_config_av1(D3D12_VIDEO_ENCODER_FRAME_SUBREGION_LAYOUT_MODE currentTilesMode,D3D12_VIDEO_ENCODER_FRAME_SUBREGION_LAYOUT_MODE requestedTilesMode,D3D12_VIDEO_ENCODER_AV1_PICTURE_CONTROL_SUBREGIONS_LAYOUT_DATA_TILES currentTilePartition,D3D12_VIDEO_ENCODER_AV1_PICTURE_CONTROL_SUBREGIONS_LAYOUT_DATA_TILES requestedTilePartition)478 d3d12_video_encoder_compare_tile_config_av1(
479    D3D12_VIDEO_ENCODER_FRAME_SUBREGION_LAYOUT_MODE currentTilesMode,
480    D3D12_VIDEO_ENCODER_FRAME_SUBREGION_LAYOUT_MODE requestedTilesMode,
481    D3D12_VIDEO_ENCODER_AV1_PICTURE_CONTROL_SUBREGIONS_LAYOUT_DATA_TILES currentTilePartition,
482    D3D12_VIDEO_ENCODER_AV1_PICTURE_CONTROL_SUBREGIONS_LAYOUT_DATA_TILES requestedTilePartition)
483 {
484    if (currentTilesMode != requestedTilesMode)
485       return false;
486 
487    if (memcmp(&currentTilePartition,
488               &requestedTilePartition,
489               sizeof(D3D12_VIDEO_ENCODER_AV1_PICTURE_CONTROL_SUBREGIONS_LAYOUT_DATA_TILES)))
490       return false;
491 
492    return true;
493 }
494 
495 ///
496 /// Tries to configurate the encoder using the requested tile configuration
497 ///
498 bool
d3d12_video_encoder_negotiate_current_av1_tiles_configuration(struct d3d12_video_encoder * pD3D12Enc,pipe_av1_enc_picture_desc * pAV1Pic)499 d3d12_video_encoder_negotiate_current_av1_tiles_configuration(struct d3d12_video_encoder *pD3D12Enc,
500                                                               pipe_av1_enc_picture_desc *pAV1Pic)
501 {
502    D3D12_VIDEO_ENCODER_AV1_PICTURE_CONTROL_SUBREGIONS_LAYOUT_DATA_TILES tilePartition = {};
503    tilePartition.RowCount = pAV1Pic->tile_rows;
504    tilePartition.ColCount = pAV1Pic->tile_cols;
505    tilePartition.ContextUpdateTileId = pAV1Pic->context_update_tile_id;
506 
507    // VA-API interface has 63 entries for tile cols/rows. When 64 requested,
508    // last one has to be calculated from the frame width/height in superblocks.
509 
510    // Copy the tile col sizes (up to 63 defined in VA-API interface array sizes)
511    size_t accum_cols_sb = 0;
512    uint8_t src_cols_count = MIN2(63, pAV1Pic->tile_cols);
513    for (uint8_t i = 0; i < src_cols_count; i++) {
514       tilePartition.ColWidths[i] = pAV1Pic->width_in_sbs_minus_1[i] + 1;
515       accum_cols_sb += tilePartition.ColWidths[i];
516    }
517 
518    // If there are 64 cols, calculate the last one manually as the difference
519    // between frame width in sb minus the accumulated tiles sb sizes
520    if (pAV1Pic->tile_cols == 64)
521       tilePartition.ColWidths[63] = pAV1Pic->frame_width_sb - accum_cols_sb;
522 
523    // Copy the tile row sizes (up to 63 defined in VA-API interface array sizes)
524    size_t accum_rows_sb = 0;
525    uint8_t src_rows_count = MIN2(63, pAV1Pic->tile_rows);
526    for (uint8_t i = 0; i < src_rows_count; i++) {
527       tilePartition.RowHeights[i] = pAV1Pic->height_in_sbs_minus_1[i] + 1;
528       accum_rows_sb += tilePartition.RowHeights[i];
529    }
530 
531    // If there are 64 rows, calculate the last one manually as the difference
532    // between frame height in sb minus the accumulated tiles sb sizes
533    if (pAV1Pic->tile_rows == 64)
534       tilePartition.RowHeights[63] = pAV1Pic->frame_height_sb - accum_rows_sb;
535 
536    // Iterate the tiles and see if they're uniformly partitioned to decide
537    // which D3D12 tile mode to use
538    // Ignore the last row and last col width
539    bool tilesUniform = !D3D12_VIDEO_FORCE_TILE_MODE && util_is_power_of_two_or_zero(tilePartition.RowCount) &&
540                        util_is_power_of_two_or_zero(tilePartition.ColCount);
541    // Iterate again now that the 63/64 edge case has been handled above.
542    for (uint8_t i = 1; tilesUniform && (i < tilePartition.RowCount - 1) /* Ignore last row */; i++)
543       tilesUniform = tilesUniform && (tilePartition.RowHeights[i - 1] == tilePartition.RowHeights[i]);
544 
545    for (uint8_t i = 1; tilesUniform && (i < tilePartition.ColCount - 1) /* Ignore last col */; i++)
546       tilesUniform = tilesUniform && (tilePartition.ColWidths[i - 1] == tilePartition.ColWidths[i]);
547 
548    D3D12_VIDEO_ENCODER_FRAME_SUBREGION_LAYOUT_MODE requestedTilesMode =
549       tilesUniform ? D3D12_VIDEO_ENCODER_FRAME_SUBREGION_LAYOUT_MODE_UNIFORM_GRID_PARTITION :
550                      D3D12_VIDEO_ENCODER_FRAME_SUBREGION_LAYOUT_MODE_CONFIGURABLE_GRID_PARTITION;
551 
552    assert(pAV1Pic->num_tile_groups <= 128);   // ARRAY_SIZE(TilesGroups)
553    pD3D12Enc->m_currentEncodeConfig.m_encoderSliceConfigDesc.m_TilesConfig_AV1.TilesGroupsCount =
554       pAV1Pic->num_tile_groups;
555    for (uint8_t i = 0; i < pAV1Pic->num_tile_groups; i++) {
556       pD3D12Enc->m_currentEncodeConfig.m_encoderSliceConfigDesc.m_TilesConfig_AV1.TilesGroups[i].tg_start =
557          pAV1Pic->tile_groups[i].tile_group_start;
558       pD3D12Enc->m_currentEncodeConfig.m_encoderSliceConfigDesc.m_TilesConfig_AV1.TilesGroups[i].tg_end =
559          pAV1Pic->tile_groups[i].tile_group_end;
560    }
561 
562    if (!d3d12_video_encoder_compare_tile_config_av1(
563           pD3D12Enc->m_currentEncodeConfig.m_encoderSliceConfigMode,
564           requestedTilesMode,
565           pD3D12Enc->m_currentEncodeConfig.m_encoderSliceConfigDesc.m_TilesConfig_AV1.TilesPartition,
566           tilePartition)) {
567       pD3D12Enc->m_currentEncodeConfig.m_ConfigDirtyFlags |= d3d12_video_encoder_config_dirty_flag_slices;
568    }
569 
570    // Update the encoder state with the tile config
571    pD3D12Enc->m_currentEncodeConfig.m_encoderSliceConfigMode = requestedTilesMode;
572    pD3D12Enc->m_currentEncodeConfig.m_encoderSliceConfigDesc.m_TilesConfig_AV1.TilesPartition = tilePartition;
573 
574    D3D12_FEATURE_DATA_VIDEO_ENCODER_FRAME_SUBREGION_LAYOUT_CONFIG capDataTilesSupport = {};
575    capDataTilesSupport.NodeIndex = pD3D12Enc->m_NodeIndex;
576    capDataTilesSupport.Codec = D3D12_VIDEO_ENCODER_CODEC_AV1;
577    capDataTilesSupport.Profile.DataSize = sizeof(pD3D12Enc->m_currentEncodeConfig.m_encoderProfileDesc.m_AV1Profile);
578    capDataTilesSupport.Profile.pAV1Profile = &pD3D12Enc->m_currentEncodeConfig.m_encoderProfileDesc.m_AV1Profile;
579    capDataTilesSupport.Level.DataSize = sizeof(pD3D12Enc->m_currentEncodeConfig.m_encoderLevelDesc.m_AV1LevelSetting);
580    capDataTilesSupport.Level.pAV1LevelSetting = &pD3D12Enc->m_currentEncodeConfig.m_encoderLevelDesc.m_AV1LevelSetting;
581    capDataTilesSupport.FrameResolution.Width = pAV1Pic->frame_width;
582    capDataTilesSupport.FrameResolution.Height = pAV1Pic->frame_height;
583    capDataTilesSupport.SubregionMode = requestedTilesMode;
584    capDataTilesSupport.CodecSupport.DataSize =
585       sizeof(pD3D12Enc->m_currentEncodeCapabilities.m_encoderCodecSpecificConfigCaps.m_AV1TileCaps);
586    capDataTilesSupport.CodecSupport.pAV1Support =
587       &pD3D12Enc->m_currentEncodeCapabilities.m_encoderCodecSpecificConfigCaps.m_AV1TileCaps;
588    pD3D12Enc->m_currentEncodeCapabilities.m_encoderCodecSpecificConfigCaps.m_AV1TileCaps.Use128SuperBlocks = false;
589    // return units in 64x64 default size
590    pD3D12Enc->m_currentEncodeCapabilities.m_encoderCodecSpecificConfigCaps.m_AV1TileCaps.TilesConfiguration =
591       pD3D12Enc->m_currentEncodeConfig.m_encoderSliceConfigDesc.m_TilesConfig_AV1.TilesPartition;
592    HRESULT hr =
593       pD3D12Enc->m_spD3D12VideoDevice->CheckFeatureSupport(D3D12_FEATURE_VIDEO_ENCODER_FRAME_SUBREGION_LAYOUT_CONFIG,
594                                                            &capDataTilesSupport,
595                                                            sizeof(capDataTilesSupport));
596    if (FAILED(hr) || !capDataTilesSupport.IsSupported) {
597       debug_printf("D3D12_FEATURE_VIDEO_ENCODER_SUBREGION_TILES_SUPPORT HR (0x%x) error or IsSupported: (%d).\n",
598                    hr,
599                    capDataTilesSupport.IsSupported);
600       return false;
601    }
602 
603    return true;
604 }
605 
606 D3D12_VIDEO_ENCODER_AV1_CODEC_CONFIGURATION
d3d12_video_encoder_convert_av1_codec_configuration(struct d3d12_video_encoder * pD3D12Enc,pipe_av1_enc_picture_desc * pAV1Pic,bool & is_supported)607 d3d12_video_encoder_convert_av1_codec_configuration(struct d3d12_video_encoder *pD3D12Enc,
608                                                     pipe_av1_enc_picture_desc *pAV1Pic,
609                                                     bool &is_supported)
610 {
611    is_supported = true;
612    D3D12_VIDEO_ENCODER_AV1_CODEC_CONFIGURATION config = {
613       // D3D12_VIDEO_ENCODER_AV1_FEATURE_FLAGS FeatureFlags;
614       D3D12_VIDEO_ENCODER_AV1_FEATURE_FLAG_NONE,
615       // UINT OrderHintBitsMinus1;
616       pAV1Pic->seq.order_hint_bits - 1,
617    };
618 
619    //
620    // Query AV1 caps and store in m_currentEncodeCapabilities
621    //
622 
623    D3D12_FEATURE_DATA_VIDEO_ENCODER_CODEC_CONFIGURATION_SUPPORT capCodecConfigData = {};
624    capCodecConfigData.NodeIndex = pD3D12Enc->m_NodeIndex;
625    capCodecConfigData.Codec = D3D12_VIDEO_ENCODER_CODEC_AV1;
626    D3D12_VIDEO_ENCODER_AV1_PROFILE prof =
627       d3d12_video_encoder_convert_profile_to_d3d12_enc_profile_av1(pD3D12Enc->base.profile);
628    capCodecConfigData.Profile.pAV1Profile = &prof;
629    capCodecConfigData.Profile.DataSize = sizeof(prof);
630    capCodecConfigData.CodecSupportLimits.pAV1Support =
631       &pD3D12Enc->m_currentEncodeCapabilities.m_encoderCodecSpecificConfigCaps.m_AV1CodecCaps;
632    capCodecConfigData.CodecSupportLimits.DataSize =
633       sizeof(pD3D12Enc->m_currentEncodeCapabilities.m_encoderCodecSpecificConfigCaps.m_AV1CodecCaps);
634 
635    if (FAILED(
636           pD3D12Enc->m_spD3D12VideoDevice->CheckFeatureSupport(D3D12_FEATURE_VIDEO_ENCODER_CODEC_CONFIGURATION_SUPPORT,
637                                                                &capCodecConfigData,
638                                                                sizeof(capCodecConfigData))) ||
639        !capCodecConfigData.IsSupported) {
640       debug_printf("D3D12_FEATURE_VIDEO_ENCODER_CODEC_CONFIGURATION_SUPPORT arguments not supported.\n");
641       is_supported = false;
642       return config;
643    }
644 
645    // Enable features requested by gallium
646 
647    if (pAV1Pic->seq.seq_bits.use_128x128_superblock)
648       config.FeatureFlags |= D3D12_VIDEO_ENCODER_AV1_FEATURE_FLAG_128x128_SUPERBLOCK;
649    if (pAV1Pic->seq.seq_bits.enable_filter_intra)
650       config.FeatureFlags |= D3D12_VIDEO_ENCODER_AV1_FEATURE_FLAG_FILTER_INTRA;
651    if (pAV1Pic->seq.seq_bits.enable_intra_edge_filter)
652       config.FeatureFlags |= D3D12_VIDEO_ENCODER_AV1_FEATURE_FLAG_INTRA_EDGE_FILTER;
653    if (pAV1Pic->seq.seq_bits.enable_interintra_compound)
654       config.FeatureFlags |= D3D12_VIDEO_ENCODER_AV1_FEATURE_FLAG_INTERINTRA_COMPOUND;
655    if (pAV1Pic->seq.seq_bits.enable_masked_compound)
656       config.FeatureFlags |= D3D12_VIDEO_ENCODER_AV1_FEATURE_FLAG_MASKED_COMPOUND;
657    if (pAV1Pic->seq.seq_bits.enable_warped_motion)
658       config.FeatureFlags |= D3D12_VIDEO_ENCODER_AV1_FEATURE_FLAG_WARPED_MOTION;
659    if (pAV1Pic->seq.seq_bits.enable_dual_filter)
660       config.FeatureFlags |= D3D12_VIDEO_ENCODER_AV1_FEATURE_FLAG_DUAL_FILTER;
661    if (pAV1Pic->seq.seq_bits.enable_order_hint)
662       config.FeatureFlags |= D3D12_VIDEO_ENCODER_AV1_FEATURE_FLAG_ORDER_HINT_TOOLS;
663    if (pAV1Pic->seq.seq_bits.enable_jnt_comp)
664       config.FeatureFlags |= D3D12_VIDEO_ENCODER_AV1_FEATURE_FLAG_JNT_COMP;
665    if (pAV1Pic->seq.seq_bits.enable_ref_frame_mvs)
666       config.FeatureFlags |= D3D12_VIDEO_ENCODER_AV1_FEATURE_FLAG_FRAME_REFERENCE_MOTION_VECTORS;
667    if (pAV1Pic->seq.seq_bits.enable_superres)
668       config.FeatureFlags |= D3D12_VIDEO_ENCODER_AV1_FEATURE_FLAG_SUPER_RESOLUTION;
669    if (pAV1Pic->seq.seq_bits.enable_cdef)
670       config.FeatureFlags |= D3D12_VIDEO_ENCODER_AV1_FEATURE_FLAG_CDEF_FILTERING;
671    if (pAV1Pic->seq.seq_bits.enable_restoration)
672       config.FeatureFlags |= D3D12_VIDEO_ENCODER_AV1_FEATURE_FLAG_LOOP_RESTORATION_FILTER;
673 
674    // No pipe flag for the following features, associated pic flags can be selected per frame. Enable if supported.
675 
676    if ((pD3D12Enc->m_currentEncodeCapabilities.m_encoderCodecSpecificConfigCaps.m_AV1CodecCaps.SupportedFeatureFlags &
677         D3D12_VIDEO_ENCODER_AV1_FEATURE_FLAG_FORCED_INTEGER_MOTION_VECTORS) != 0)   // seq_force_integer_mv
678       config.FeatureFlags |= D3D12_VIDEO_ENCODER_AV1_FEATURE_FLAG_FORCED_INTEGER_MOTION_VECTORS;
679 
680    if ((pD3D12Enc->m_currentEncodeCapabilities.m_encoderCodecSpecificConfigCaps.m_AV1CodecCaps.SupportedFeatureFlags &
681         D3D12_VIDEO_ENCODER_AV1_FEATURE_FLAG_PALETTE_ENCODING) != 0)
682       config.FeatureFlags |= D3D12_VIDEO_ENCODER_AV1_FEATURE_FLAG_PALETTE_ENCODING;
683 
684    if ((pD3D12Enc->m_currentEncodeCapabilities.m_encoderCodecSpecificConfigCaps.m_AV1CodecCaps.SupportedFeatureFlags &
685         D3D12_VIDEO_ENCODER_AV1_FEATURE_FLAG_INTRA_BLOCK_COPY) != 0)
686       config.FeatureFlags |= D3D12_VIDEO_ENCODER_AV1_FEATURE_FLAG_INTRA_BLOCK_COPY;
687 
688    if ((pD3D12Enc->m_currentEncodeCapabilities.m_encoderCodecSpecificConfigCaps.m_AV1CodecCaps.SupportedFeatureFlags &
689         D3D12_VIDEO_ENCODER_AV1_FEATURE_FLAG_LOOP_FILTER_DELTAS) != 0)
690       config.FeatureFlags |= D3D12_VIDEO_ENCODER_AV1_FEATURE_FLAG_LOOP_FILTER_DELTAS;
691 
692    if ((pD3D12Enc->m_currentEncodeCapabilities.m_encoderCodecSpecificConfigCaps.m_AV1CodecCaps.SupportedFeatureFlags &
693         D3D12_VIDEO_ENCODER_AV1_FEATURE_FLAG_QUANTIZATION_DELTAS) != 0)
694       config.FeatureFlags |= D3D12_VIDEO_ENCODER_AV1_FEATURE_FLAG_QUANTIZATION_DELTAS;
695 
696    if ((pD3D12Enc->m_currentEncodeCapabilities.m_encoderCodecSpecificConfigCaps.m_AV1CodecCaps.SupportedFeatureFlags &
697         D3D12_VIDEO_ENCODER_AV1_FEATURE_FLAG_QUANTIZATION_MATRIX) != 0)
698       config.FeatureFlags |= D3D12_VIDEO_ENCODER_AV1_FEATURE_FLAG_QUANTIZATION_MATRIX;
699 
700    if ((pD3D12Enc->m_currentEncodeCapabilities.m_encoderCodecSpecificConfigCaps.m_AV1CodecCaps.SupportedFeatureFlags &
701         D3D12_VIDEO_ENCODER_AV1_FEATURE_FLAG_REDUCED_TX_SET) != 0)
702       config.FeatureFlags |= D3D12_VIDEO_ENCODER_AV1_FEATURE_FLAG_REDUCED_TX_SET;
703 
704    if ((pD3D12Enc->m_currentEncodeCapabilities.m_encoderCodecSpecificConfigCaps.m_AV1CodecCaps.SupportedFeatureFlags &
705         D3D12_VIDEO_ENCODER_AV1_FEATURE_FLAG_MOTION_MODE_SWITCHABLE) != 0)
706       config.FeatureFlags |= D3D12_VIDEO_ENCODER_AV1_FEATURE_FLAG_MOTION_MODE_SWITCHABLE;
707 
708    if ((pD3D12Enc->m_currentEncodeCapabilities.m_encoderCodecSpecificConfigCaps.m_AV1CodecCaps.SupportedFeatureFlags &
709         D3D12_VIDEO_ENCODER_AV1_FEATURE_FLAG_ALLOW_HIGH_PRECISION_MV) != 0)
710       config.FeatureFlags |= D3D12_VIDEO_ENCODER_AV1_FEATURE_FLAG_ALLOW_HIGH_PRECISION_MV;
711 
712    //
713    // Add any missing mandatory/required features we didn't enable before
714    //
715    if ((config.FeatureFlags &
716         pD3D12Enc->m_currentEncodeCapabilities.m_encoderCodecSpecificConfigCaps.m_AV1CodecCaps.RequiredFeatureFlags) !=
717        pD3D12Enc->m_currentEncodeCapabilities.m_encoderCodecSpecificConfigCaps.m_AV1CodecCaps.RequiredFeatureFlags) {
718       debug_printf(
719          "[d3d12_video_encoder_convert_av1_codec_configuration] Adding required by caps but not selected already in "
720          "config.FeatureFlags...\n");
721 
722       if (((config.FeatureFlags & D3D12_VIDEO_ENCODER_AV1_FEATURE_FLAG_128x128_SUPERBLOCK) == 0) &&
723           ((pD3D12Enc->m_currentEncodeCapabilities.m_encoderCodecSpecificConfigCaps.m_AV1CodecCaps.RequiredFeatureFlags &
724             D3D12_VIDEO_ENCODER_AV1_FEATURE_FLAG_128x128_SUPERBLOCK) != 0)) {
725          pD3D12Enc->m_currentEncodeCapabilities.m_encoderCodecSpecificConfigCaps.RequiredNotRequestedFeatureFlags |=
726             D3D12_VIDEO_ENCODER_AV1_FEATURE_FLAG_128x128_SUPERBLOCK;
727          debug_printf(
728             "[d3d12_video_encoder_convert_av1_codec_configuration] Adding "
729             "D3D12_VIDEO_ENCODER_AV1_FEATURE_FLAG_128x128_SUPERBLOCK required by caps but not selected already in "
730             "config.FeatureFlags...\n");
731       }
732 
733       if (((config.FeatureFlags & D3D12_VIDEO_ENCODER_AV1_FEATURE_FLAG_FILTER_INTRA) == 0) &&
734           ((pD3D12Enc->m_currentEncodeCapabilities.m_encoderCodecSpecificConfigCaps.m_AV1CodecCaps.RequiredFeatureFlags &
735             D3D12_VIDEO_ENCODER_AV1_FEATURE_FLAG_FILTER_INTRA) != 0)) {
736          pD3D12Enc->m_currentEncodeCapabilities.m_encoderCodecSpecificConfigCaps.RequiredNotRequestedFeatureFlags |=
737             D3D12_VIDEO_ENCODER_AV1_FEATURE_FLAG_FILTER_INTRA;
738          debug_printf(
739             "[d3d12_video_encoder_convert_av1_codec_configuration] "
740             "D3D12_VIDEO_ENCODER_AV1_FEATURE_FLAG_FILTER_INTRA Adding required by caps but not selected already in "
741             "config.FeatureFlags...\n");
742       }
743 
744       if (((config.FeatureFlags & D3D12_VIDEO_ENCODER_AV1_FEATURE_FLAG_INTRA_EDGE_FILTER) == 0) &&
745           ((pD3D12Enc->m_currentEncodeCapabilities.m_encoderCodecSpecificConfigCaps.m_AV1CodecCaps.RequiredFeatureFlags &
746             D3D12_VIDEO_ENCODER_AV1_FEATURE_FLAG_INTRA_EDGE_FILTER) != 0)) {
747          pD3D12Enc->m_currentEncodeCapabilities.m_encoderCodecSpecificConfigCaps.RequiredNotRequestedFeatureFlags |=
748             D3D12_VIDEO_ENCODER_AV1_FEATURE_FLAG_INTRA_EDGE_FILTER;
749          debug_printf(
750             "[d3d12_video_encoder_convert_av1_codec_configuration] Adding "
751             "D3D12_VIDEO_ENCODER_AV1_FEATURE_FLAG_INTRA_EDGE_FILTER required by caps but not selected already in "
752             "config.FeatureFlags...\n");
753       }
754 
755       if (((config.FeatureFlags & D3D12_VIDEO_ENCODER_AV1_FEATURE_FLAG_INTERINTRA_COMPOUND) == 0) &&
756           ((pD3D12Enc->m_currentEncodeCapabilities.m_encoderCodecSpecificConfigCaps.m_AV1CodecCaps.RequiredFeatureFlags &
757             D3D12_VIDEO_ENCODER_AV1_FEATURE_FLAG_INTERINTRA_COMPOUND) != 0)) {
758          pD3D12Enc->m_currentEncodeCapabilities.m_encoderCodecSpecificConfigCaps.RequiredNotRequestedFeatureFlags |=
759             D3D12_VIDEO_ENCODER_AV1_FEATURE_FLAG_INTERINTRA_COMPOUND;
760          debug_printf(
761             "[d3d12_video_encoder_convert_av1_codec_configuration] Adding "
762             "D3D12_VIDEO_ENCODER_AV1_FEATURE_FLAG_INTERINTRA_COMPOUND required by caps but not selected already in "
763             "config.FeatureFlags...\n");
764       }
765 
766       if (((config.FeatureFlags & D3D12_VIDEO_ENCODER_AV1_FEATURE_FLAG_MASKED_COMPOUND) == 0) &&
767           ((pD3D12Enc->m_currentEncodeCapabilities.m_encoderCodecSpecificConfigCaps.m_AV1CodecCaps.RequiredFeatureFlags &
768             D3D12_VIDEO_ENCODER_AV1_FEATURE_FLAG_MASKED_COMPOUND) != 0)) {
769          pD3D12Enc->m_currentEncodeCapabilities.m_encoderCodecSpecificConfigCaps.RequiredNotRequestedFeatureFlags |=
770             D3D12_VIDEO_ENCODER_AV1_FEATURE_FLAG_MASKED_COMPOUND;
771          debug_printf(
772             "[d3d12_video_encoder_convert_av1_codec_configuration] Adding "
773             "D3D12_VIDEO_ENCODER_AV1_FEATURE_FLAG_MASKED_COMPOUND required by caps but not selected already in "
774             "config.FeatureFlags...\n");
775       }
776 
777       if (((config.FeatureFlags & D3D12_VIDEO_ENCODER_AV1_FEATURE_FLAG_WARPED_MOTION) == 0) &&
778           ((pD3D12Enc->m_currentEncodeCapabilities.m_encoderCodecSpecificConfigCaps.m_AV1CodecCaps.RequiredFeatureFlags &
779             D3D12_VIDEO_ENCODER_AV1_FEATURE_FLAG_WARPED_MOTION) != 0)) {
780          pD3D12Enc->m_currentEncodeCapabilities.m_encoderCodecSpecificConfigCaps.RequiredNotRequestedFeatureFlags |=
781             D3D12_VIDEO_ENCODER_AV1_FEATURE_FLAG_WARPED_MOTION;
782          debug_printf(
783             "[d3d12_video_encoder_convert_av1_codec_configuration] "
784             "D3D12_VIDEO_ENCODER_AV1_FEATURE_FLAG_WARPED_MOTION Adding required by caps but not selected already in "
785             "config.FeatureFlags...\n");
786       }
787 
788       if (((config.FeatureFlags & D3D12_VIDEO_ENCODER_AV1_FEATURE_FLAG_DUAL_FILTER) == 0) &&
789           ((pD3D12Enc->m_currentEncodeCapabilities.m_encoderCodecSpecificConfigCaps.m_AV1CodecCaps.RequiredFeatureFlags &
790             D3D12_VIDEO_ENCODER_AV1_FEATURE_FLAG_DUAL_FILTER) != 0)) {
791          pD3D12Enc->m_currentEncodeCapabilities.m_encoderCodecSpecificConfigCaps.RequiredNotRequestedFeatureFlags |=
792             D3D12_VIDEO_ENCODER_AV1_FEATURE_FLAG_DUAL_FILTER;
793          debug_printf("[d3d12_video_encoder_convert_av1_codec_configuration] == Adding required by caps but not "
794                       "selected already in "
795                       "config.FeatureFlags...\n");
796       }
797 
798       if (((config.FeatureFlags & D3D12_VIDEO_ENCODER_AV1_FEATURE_FLAG_JNT_COMP) == 0) &&
799           ((pD3D12Enc->m_currentEncodeCapabilities.m_encoderCodecSpecificConfigCaps.m_AV1CodecCaps.RequiredFeatureFlags &
800             D3D12_VIDEO_ENCODER_AV1_FEATURE_FLAG_JNT_COMP) != 0)) {
801          pD3D12Enc->m_currentEncodeCapabilities.m_encoderCodecSpecificConfigCaps.RequiredNotRequestedFeatureFlags |=
802             D3D12_VIDEO_ENCODER_AV1_FEATURE_FLAG_JNT_COMP;
803          debug_printf("[d3d12_video_encoder_convert_av1_codec_configuration] 0 Adding required by caps but not "
804                       "selected already in "
805                       "config.FeatureFlags...\n");
806       }
807 
808       if (((config.FeatureFlags & D3D12_VIDEO_ENCODER_AV1_FEATURE_FLAG_FORCED_INTEGER_MOTION_VECTORS) == 0) &&
809           ((pD3D12Enc->m_currentEncodeCapabilities.m_encoderCodecSpecificConfigCaps.m_AV1CodecCaps.RequiredFeatureFlags &
810             D3D12_VIDEO_ENCODER_AV1_FEATURE_FLAG_FORCED_INTEGER_MOTION_VECTORS) != 0)) {
811          pD3D12Enc->m_currentEncodeCapabilities.m_encoderCodecSpecificConfigCaps.RequiredNotRequestedFeatureFlags |=
812             D3D12_VIDEO_ENCODER_AV1_FEATURE_FLAG_FORCED_INTEGER_MOTION_VECTORS;
813          debug_printf(
814             "[d3d12_video_encoder_convert_av1_codec_configuration] Adding required by "
815             "D3D12_VIDEO_ENCODER_AV1_FEATURE_FLAG_FORCED_INTEGER_MOTION_VECTORS caps but not selected already in "
816             "config.FeatureFlags...\n");
817       }
818 
819       if (((config.FeatureFlags & D3D12_VIDEO_ENCODER_AV1_FEATURE_FLAG_SUPER_RESOLUTION) == 0) &&
820           ((pD3D12Enc->m_currentEncodeCapabilities.m_encoderCodecSpecificConfigCaps.m_AV1CodecCaps.RequiredFeatureFlags &
821             D3D12_VIDEO_ENCODER_AV1_FEATURE_FLAG_SUPER_RESOLUTION) != 0)) {
822          pD3D12Enc->m_currentEncodeCapabilities.m_encoderCodecSpecificConfigCaps.RequiredNotRequestedFeatureFlags |=
823             D3D12_VIDEO_ENCODER_AV1_FEATURE_FLAG_SUPER_RESOLUTION;
824          debug_printf(
825             "[d3d12_video_encoder_convert_av1_codec_configuration] Adding "
826             "D3D12_VIDEO_ENCODER_AV1_FEATURE_FLAG_SUPER_RESOLUTION required by caps but not selected already in "
827             "config.FeatureFlags...\n");
828       }
829 
830       if (((config.FeatureFlags & D3D12_VIDEO_ENCODER_AV1_FEATURE_FLAG_LOOP_RESTORATION_FILTER) == 0) &&
831           ((pD3D12Enc->m_currentEncodeCapabilities.m_encoderCodecSpecificConfigCaps.m_AV1CodecCaps.RequiredFeatureFlags &
832             D3D12_VIDEO_ENCODER_AV1_FEATURE_FLAG_LOOP_RESTORATION_FILTER) != 0)) {
833          pD3D12Enc->m_currentEncodeCapabilities.m_encoderCodecSpecificConfigCaps.RequiredNotRequestedFeatureFlags |=
834             D3D12_VIDEO_ENCODER_AV1_FEATURE_FLAG_LOOP_RESTORATION_FILTER;
835          debug_printf(
836             "[d3d12_video_encoder_convert_av1_codec_configuration] Adding "
837             "D3D12_VIDEO_ENCODER_AV1_FEATURE_FLAG_LOOP_RESTORATION_FILTER required by caps but not selected already in "
838             "config.FeatureFlags...\n");
839       }
840 
841       if (((config.FeatureFlags & D3D12_VIDEO_ENCODER_AV1_FEATURE_FLAG_PALETTE_ENCODING) == 0) &&
842           ((pD3D12Enc->m_currentEncodeCapabilities.m_encoderCodecSpecificConfigCaps.m_AV1CodecCaps.RequiredFeatureFlags &
843             D3D12_VIDEO_ENCODER_AV1_FEATURE_FLAG_PALETTE_ENCODING) != 0)) {
844          pD3D12Enc->m_currentEncodeCapabilities.m_encoderCodecSpecificConfigCaps.RequiredNotRequestedFeatureFlags |=
845             D3D12_VIDEO_ENCODER_AV1_FEATURE_FLAG_PALETTE_ENCODING;
846          debug_printf(
847             "[d3d12_video_encoder_convert_av1_codec_configuration] Adding "
848             "D3D12_VIDEO_ENCODER_AV1_FEATURE_FLAG_PALETTE_ENCODING required by caps but not selected already in "
849             "config.FeatureFlags...\n");
850       }
851 
852       if (((config.FeatureFlags & D3D12_VIDEO_ENCODER_AV1_FEATURE_FLAG_CDEF_FILTERING) == 0) &&
853           ((pD3D12Enc->m_currentEncodeCapabilities.m_encoderCodecSpecificConfigCaps.m_AV1CodecCaps.RequiredFeatureFlags &
854             D3D12_VIDEO_ENCODER_AV1_FEATURE_FLAG_CDEF_FILTERING) != 0)) {
855          pD3D12Enc->m_currentEncodeCapabilities.m_encoderCodecSpecificConfigCaps.RequiredNotRequestedFeatureFlags |=
856             D3D12_VIDEO_ENCODER_AV1_FEATURE_FLAG_CDEF_FILTERING;
857          debug_printf(
858             "[d3d12_video_encoder_convert_av1_codec_configuration] "
859             "D3D12_VIDEO_ENCODER_AV1_FEATURE_FLAG_CDEF_FILTERING Adding required by caps but not selected already in "
860             "config.FeatureFlags...\n");
861       }
862 
863       if (((config.FeatureFlags & D3D12_VIDEO_ENCODER_AV1_FEATURE_FLAG_INTRA_BLOCK_COPY) == 0) &&
864           ((pD3D12Enc->m_currentEncodeCapabilities.m_encoderCodecSpecificConfigCaps.m_AV1CodecCaps.RequiredFeatureFlags &
865             D3D12_VIDEO_ENCODER_AV1_FEATURE_FLAG_INTRA_BLOCK_COPY) != 0)) {
866          pD3D12Enc->m_currentEncodeCapabilities.m_encoderCodecSpecificConfigCaps.RequiredNotRequestedFeatureFlags |=
867             D3D12_VIDEO_ENCODER_AV1_FEATURE_FLAG_INTRA_BLOCK_COPY;
868          debug_printf(
869             "[d3d12_video_encoder_convert_av1_codec_configuration] Adding "
870             "D3D12_VIDEO_ENCODER_AV1_FEATURE_FLAG_INTRA_BLOCK_COPY required by caps but not selected already in "
871             "config.FeatureFlags...\n");
872       }
873 
874       if (((config.FeatureFlags & D3D12_VIDEO_ENCODER_AV1_FEATURE_FLAG_FRAME_REFERENCE_MOTION_VECTORS) == 0) &&
875           ((pD3D12Enc->m_currentEncodeCapabilities.m_encoderCodecSpecificConfigCaps.m_AV1CodecCaps.RequiredFeatureFlags &
876             D3D12_VIDEO_ENCODER_AV1_FEATURE_FLAG_FRAME_REFERENCE_MOTION_VECTORS) != 0)) {
877          pD3D12Enc->m_currentEncodeCapabilities.m_encoderCodecSpecificConfigCaps.RequiredNotRequestedFeatureFlags |=
878             D3D12_VIDEO_ENCODER_AV1_FEATURE_FLAG_FRAME_REFERENCE_MOTION_VECTORS;
879          debug_printf(
880             "[d3d12_video_encoder_convert_av1_codec_configuration] Adding required by "
881             "D3D12_VIDEO_ENCODER_AV1_FEATURE_FLAG_FRAME_REFERENCE_MOTION_VECTORS caps but not selected already in "
882             "config.FeatureFlags...\n");
883       }
884 
885       if (((config.FeatureFlags & D3D12_VIDEO_ENCODER_AV1_FEATURE_FLAG_ORDER_HINT_TOOLS) == 0) &&
886           ((pD3D12Enc->m_currentEncodeCapabilities.m_encoderCodecSpecificConfigCaps.m_AV1CodecCaps.RequiredFeatureFlags &
887             D3D12_VIDEO_ENCODER_AV1_FEATURE_FLAG_ORDER_HINT_TOOLS) != 0)) {
888          pD3D12Enc->m_currentEncodeCapabilities.m_encoderCodecSpecificConfigCaps.RequiredNotRequestedFeatureFlags |=
889             D3D12_VIDEO_ENCODER_AV1_FEATURE_FLAG_ORDER_HINT_TOOLS;
890          debug_printf(
891             "[d3d12_video_encoder_convert_av1_codec_configuration] Adding "
892             "D3D12_VIDEO_ENCODER_AV1_FEATURE_FLAG_ORDER_HINT_TOOLS required by caps but not selected already in "
893             "config.FeatureFlags...\n");
894       }
895 
896       if (((config.FeatureFlags & D3D12_VIDEO_ENCODER_AV1_FEATURE_FLAG_AUTO_SEGMENTATION) == 0) &&
897           ((pD3D12Enc->m_currentEncodeCapabilities.m_encoderCodecSpecificConfigCaps.m_AV1CodecCaps.RequiredFeatureFlags &
898             D3D12_VIDEO_ENCODER_AV1_FEATURE_FLAG_AUTO_SEGMENTATION) != 0)) {
899          pD3D12Enc->m_currentEncodeCapabilities.m_encoderCodecSpecificConfigCaps.RequiredNotRequestedFeatureFlags |=
900             D3D12_VIDEO_ENCODER_AV1_FEATURE_FLAG_AUTO_SEGMENTATION;
901          debug_printf(
902             "[d3d12_video_encoder_convert_av1_codec_configuration] Adding "
903             "D3D12_VIDEO_ENCODER_AV1_FEATURE_FLAG_AUTO_SEGMENTATION required by caps but not selected already in "
904             "config.FeatureFlags...\n");
905       }
906 
907       if (((config.FeatureFlags & D3D12_VIDEO_ENCODER_AV1_FEATURE_FLAG_CUSTOM_SEGMENTATION) == 0) &&
908           ((pD3D12Enc->m_currentEncodeCapabilities.m_encoderCodecSpecificConfigCaps.m_AV1CodecCaps.RequiredFeatureFlags &
909             D3D12_VIDEO_ENCODER_AV1_FEATURE_FLAG_CUSTOM_SEGMENTATION) != 0)) {
910          pD3D12Enc->m_currentEncodeCapabilities.m_encoderCodecSpecificConfigCaps.RequiredNotRequestedFeatureFlags |=
911             D3D12_VIDEO_ENCODER_AV1_FEATURE_FLAG_CUSTOM_SEGMENTATION;
912          debug_printf(
913             "[d3d12_video_encoder_convert_av1_codec_configuration] Adding "
914             "D3D12_VIDEO_ENCODER_AV1_FEATURE_FLAG_CUSTOM_SEGMENTATION required by caps but not selected already in "
915             "config.FeatureFlags...\n");
916       }
917 
918       if (((config.FeatureFlags & D3D12_VIDEO_ENCODER_AV1_FEATURE_FLAG_LOOP_FILTER_DELTAS) == 0) &&
919           ((pD3D12Enc->m_currentEncodeCapabilities.m_encoderCodecSpecificConfigCaps.m_AV1CodecCaps.RequiredFeatureFlags &
920             D3D12_VIDEO_ENCODER_AV1_FEATURE_FLAG_LOOP_FILTER_DELTAS) != 0)) {
921          pD3D12Enc->m_currentEncodeCapabilities.m_encoderCodecSpecificConfigCaps.RequiredNotRequestedFeatureFlags |=
922             D3D12_VIDEO_ENCODER_AV1_FEATURE_FLAG_LOOP_FILTER_DELTAS;
923          debug_printf(
924             "[d3d12_video_encoder_convert_av1_codec_configuration] Adding "
925             "D3D12_VIDEO_ENCODER_AV1_FEATURE_FLAG_LOOP_FILTER_DELTAS required by caps but not selected already in "
926             "config.FeatureFlags...\n");
927       }
928 
929       if (((config.FeatureFlags & D3D12_VIDEO_ENCODER_AV1_FEATURE_FLAG_QUANTIZATION_DELTAS) == 0) &&
930           ((pD3D12Enc->m_currentEncodeCapabilities.m_encoderCodecSpecificConfigCaps.m_AV1CodecCaps.RequiredFeatureFlags &
931             D3D12_VIDEO_ENCODER_AV1_FEATURE_FLAG_QUANTIZATION_DELTAS) != 0)) {
932          pD3D12Enc->m_currentEncodeCapabilities.m_encoderCodecSpecificConfigCaps.RequiredNotRequestedFeatureFlags |=
933             D3D12_VIDEO_ENCODER_AV1_FEATURE_FLAG_QUANTIZATION_DELTAS;
934          debug_printf(
935             "[d3d12_video_encoder_convert_av1_codec_configuration] Adding "
936             "D3D12_VIDEO_ENCODER_AV1_FEATURE_FLAG_QUANTIZATION_DELTAS required by caps but not selected already in "
937             "config.FeatureFlags...\n");
938       }
939 
940       if (((config.FeatureFlags & D3D12_VIDEO_ENCODER_AV1_FEATURE_FLAG_QUANTIZATION_MATRIX) == 0) &&
941           ((pD3D12Enc->m_currentEncodeCapabilities.m_encoderCodecSpecificConfigCaps.m_AV1CodecCaps.RequiredFeatureFlags &
942             D3D12_VIDEO_ENCODER_AV1_FEATURE_FLAG_QUANTIZATION_MATRIX) != 0)) {
943          pD3D12Enc->m_currentEncodeCapabilities.m_encoderCodecSpecificConfigCaps.RequiredNotRequestedFeatureFlags |=
944             D3D12_VIDEO_ENCODER_AV1_FEATURE_FLAG_QUANTIZATION_MATRIX;
945          debug_printf(
946             "[d3d12_video_encoder_convert_av1_codec_configuration] Adding "
947             "D3D12_VIDEO_ENCODER_AV1_FEATURE_FLAG_QUANTIZATION_MATRIX required by caps but not selected already in "
948             "config.FeatureFlags...\n");
949       }
950 
951       if (((config.FeatureFlags & D3D12_VIDEO_ENCODER_AV1_FEATURE_FLAG_REDUCED_TX_SET) == 0) &&
952           ((pD3D12Enc->m_currentEncodeCapabilities.m_encoderCodecSpecificConfigCaps.m_AV1CodecCaps.RequiredFeatureFlags &
953             D3D12_VIDEO_ENCODER_AV1_FEATURE_FLAG_REDUCED_TX_SET) != 0)) {
954          pD3D12Enc->m_currentEncodeCapabilities.m_encoderCodecSpecificConfigCaps.RequiredNotRequestedFeatureFlags |=
955             D3D12_VIDEO_ENCODER_AV1_FEATURE_FLAG_REDUCED_TX_SET;
956          debug_printf(
957             "[d3d12_video_encoder_convert_av1_codec_configuration] "
958             "D3D12_VIDEO_ENCODER_AV1_FEATURE_FLAG_REDUCED_TX_SET Adding required by caps but not selected already in "
959             "config.FeatureFlags...\n");
960       }
961 
962       if (((config.FeatureFlags & D3D12_VIDEO_ENCODER_AV1_FEATURE_FLAG_MOTION_MODE_SWITCHABLE) == 0) &&
963           ((pD3D12Enc->m_currentEncodeCapabilities.m_encoderCodecSpecificConfigCaps.m_AV1CodecCaps.RequiredFeatureFlags &
964             D3D12_VIDEO_ENCODER_AV1_FEATURE_FLAG_MOTION_MODE_SWITCHABLE) != 0)) {
965          pD3D12Enc->m_currentEncodeCapabilities.m_encoderCodecSpecificConfigCaps.RequiredNotRequestedFeatureFlags |=
966             D3D12_VIDEO_ENCODER_AV1_FEATURE_FLAG_MOTION_MODE_SWITCHABLE;
967          debug_printf(
968             "[d3d12_video_encoder_convert_av1_codec_configuration] Adding "
969             "D3D12_VIDEO_ENCODER_AV1_FEATURE_FLAG_MOTION_MODE_SWITCHABLE required by caps but not selected already in "
970             "config.FeatureFlags...\n");
971       }
972 
973       if (((config.FeatureFlags & D3D12_VIDEO_ENCODER_AV1_FEATURE_FLAG_ALLOW_HIGH_PRECISION_MV) == 0) &&
974           ((pD3D12Enc->m_currentEncodeCapabilities.m_encoderCodecSpecificConfigCaps.m_AV1CodecCaps.RequiredFeatureFlags &
975             D3D12_VIDEO_ENCODER_AV1_FEATURE_FLAG_ALLOW_HIGH_PRECISION_MV) != 0)) {
976          pD3D12Enc->m_currentEncodeCapabilities.m_encoderCodecSpecificConfigCaps.RequiredNotRequestedFeatureFlags |=
977             D3D12_VIDEO_ENCODER_AV1_FEATURE_FLAG_ALLOW_HIGH_PRECISION_MV;
978          debug_printf(
979             "[d3d12_video_encoder_convert_av1_codec_configuration] Adding "
980             "D3D12_VIDEO_ENCODER_AV1_FEATURE_FLAG_ALLOW_HIGH_PRECISION_MV required by caps but not selected already in "
981             "config.FeatureFlags...\n");
982       }
983 
984       // Enable all required flags previously not selected
985       config.FeatureFlags |=
986          pD3D12Enc->m_currentEncodeCapabilities.m_encoderCodecSpecificConfigCaps.m_AV1CodecCaps.RequiredFeatureFlags;
987    }
988 
989    // Check config.FeatureFlags against SupportedFeatureFlags and assign is_supported
990    if ((config.FeatureFlags &
991         pD3D12Enc->m_currentEncodeCapabilities.m_encoderCodecSpecificConfigCaps.m_AV1CodecCaps.SupportedFeatureFlags) !=
992        config.FeatureFlags) {
993       debug_printf(
994          "[d3d12_video_encoder_convert_av1_codec_configuration] AV1 Configuration flags requested 0x%x not supported "
995          "by "
996          "m_AV1CodecCaps.SupportedFeatureFlags 0x%x\n",
997          config.FeatureFlags,
998          pD3D12Enc->m_currentEncodeCapabilities.m_encoderCodecSpecificConfigCaps.m_AV1CodecCaps.SupportedFeatureFlags);
999 
1000       is_supported = false;
1001    }
1002 
1003    return config;
1004 }
1005 
1006 static bool
d3d12_video_encoder_update_intra_refresh_av1(struct d3d12_video_encoder * pD3D12Enc,D3D12_VIDEO_SAMPLE srcTextureDesc,struct pipe_av1_enc_picture_desc * picture)1007 d3d12_video_encoder_update_intra_refresh_av1(struct d3d12_video_encoder *pD3D12Enc,
1008                                                         D3D12_VIDEO_SAMPLE srcTextureDesc,
1009                                                         struct pipe_av1_enc_picture_desc *  picture)
1010 {
1011    if (picture->intra_refresh.mode != INTRA_REFRESH_MODE_NONE)
1012    {
1013       // D3D12 only supports row intra-refresh
1014       if (picture->intra_refresh.mode != INTRA_REFRESH_MODE_UNIT_ROWS)
1015       {
1016          debug_printf("[d3d12_video_encoder_update_intra_refresh_av1] Unsupported INTRA_REFRESH_MODE %d\n", picture->intra_refresh.mode);
1017          return false;
1018       }
1019 
1020       uint32_t sbSize = ((pD3D12Enc->m_currentEncodeConfig.m_encoderCodecSpecificConfigDesc.m_AV1Config.FeatureFlags &
1021         D3D12_VIDEO_ENCODER_AV1_FEATURE_FLAG_128x128_SUPERBLOCK) != 0) ? 128u : 64u;
1022       uint32_t total_frame_blocks = static_cast<uint32_t>(std::ceil(srcTextureDesc.Height / sbSize)) *
1023                               static_cast<uint32_t>(std::ceil(srcTextureDesc.Width / sbSize));
1024       D3D12_VIDEO_ENCODER_INTRA_REFRESH targetIntraRefresh = {
1025          D3D12_VIDEO_ENCODER_INTRA_REFRESH_MODE_ROW_BASED,
1026          total_frame_blocks / picture->intra_refresh.region_size,
1027       };
1028       double ir_wave_progress = (picture->intra_refresh.offset == 0) ? 0 :
1029          picture->intra_refresh.offset / (double) total_frame_blocks;
1030       pD3D12Enc->m_currentEncodeConfig.m_IntraRefreshCurrentFrameIndex =
1031          static_cast<uint32_t>(std::ceil(ir_wave_progress * targetIntraRefresh.IntraRefreshDuration));
1032 
1033       // Set intra refresh state
1034       pD3D12Enc->m_currentEncodeConfig.m_IntraRefresh = targetIntraRefresh;
1035       // Need to send the sequence flag during all the IR duration
1036       pD3D12Enc->m_currentEncodeConfig.m_ConfigDirtyFlags |= d3d12_video_encoder_config_dirty_flag_intra_refresh;
1037    } else {
1038       pD3D12Enc->m_currentEncodeConfig.m_IntraRefreshCurrentFrameIndex = 0;
1039       pD3D12Enc->m_currentEncodeConfig.m_IntraRefresh = {
1040          D3D12_VIDEO_ENCODER_INTRA_REFRESH_MODE_NONE,
1041          0,
1042       };
1043    }
1044 
1045    return true;
1046 }
1047 
1048 bool
d3d12_video_encoder_update_current_encoder_config_state_av1(struct d3d12_video_encoder * pD3D12Enc,D3D12_VIDEO_SAMPLE srcTextureDesc,struct pipe_picture_desc * picture)1049 d3d12_video_encoder_update_current_encoder_config_state_av1(struct d3d12_video_encoder *pD3D12Enc,
1050                                                             D3D12_VIDEO_SAMPLE srcTextureDesc,
1051                                                             struct pipe_picture_desc *picture)
1052 {
1053    struct pipe_av1_enc_picture_desc *av1Pic = (struct pipe_av1_enc_picture_desc *) picture;
1054 
1055    // Reset reconfig dirty flags
1056    pD3D12Enc->m_currentEncodeConfig.m_ConfigDirtyFlags = d3d12_video_encoder_config_dirty_flag_none;
1057    // Reset sequence changes flags
1058    pD3D12Enc->m_currentEncodeConfig.m_seqFlags = D3D12_VIDEO_ENCODER_SEQUENCE_CONTROL_FLAG_NONE;
1059 
1060    // Set codec
1061    if (pD3D12Enc->m_currentEncodeConfig.m_encoderCodecDesc != D3D12_VIDEO_ENCODER_CODEC_AV1) {
1062       pD3D12Enc->m_currentEncodeConfig.m_ConfigDirtyFlags |= d3d12_video_encoder_config_dirty_flag_codec;
1063    }
1064    pD3D12Enc->m_currentEncodeConfig.m_encoderCodecDesc = D3D12_VIDEO_ENCODER_CODEC_AV1;
1065 
1066    // Set input format
1067    DXGI_FORMAT targetFmt = srcTextureDesc.Format.Format;
1068    if (pD3D12Enc->m_currentEncodeConfig.m_encodeFormatInfo.Format != targetFmt) {
1069       pD3D12Enc->m_currentEncodeConfig.m_ConfigDirtyFlags |= d3d12_video_encoder_config_dirty_flag_input_format;
1070    }
1071 
1072    pD3D12Enc->m_currentEncodeConfig.m_encodeFormatInfo = {};
1073    pD3D12Enc->m_currentEncodeConfig.m_encodeFormatInfo.Format = targetFmt;
1074    HRESULT hr =
1075       pD3D12Enc->m_pD3D12Screen->dev->CheckFeatureSupport(D3D12_FEATURE_FORMAT_INFO,
1076                                                           &pD3D12Enc->m_currentEncodeConfig.m_encodeFormatInfo,
1077                                                           sizeof(pD3D12Enc->m_currentEncodeConfig.m_encodeFormatInfo));
1078    if (FAILED(hr)) {
1079       debug_printf("CheckFeatureSupport failed with HR 0x%x\n", hr);
1080       return false;
1081    }
1082 
1083    // Set resolution (ie. frame_size)
1084    if ((pD3D12Enc->m_currentEncodeConfig.m_currentResolution.Width != srcTextureDesc.Width) ||
1085        (pD3D12Enc->m_currentEncodeConfig.m_currentResolution.Height != srcTextureDesc.Height)) {
1086       pD3D12Enc->m_currentEncodeConfig.m_ConfigDirtyFlags |= d3d12_video_encoder_config_dirty_flag_resolution;
1087    }
1088    pD3D12Enc->m_currentEncodeConfig.m_currentResolution.Width = srcTextureDesc.Width;
1089    pD3D12Enc->m_currentEncodeConfig.m_currentResolution.Height = srcTextureDesc.Height;
1090 
1091    // render_size
1092    pD3D12Enc->m_currentEncodeConfig.m_FrameCroppingCodecConfig.right = av1Pic->frame_width;
1093    pD3D12Enc->m_currentEncodeConfig.m_FrameCroppingCodecConfig.bottom = av1Pic->frame_height;
1094 
1095    // Set profile
1096    auto targetProfile = d3d12_video_encoder_convert_profile_to_d3d12_enc_profile_av1(pD3D12Enc->base.profile);
1097    if (pD3D12Enc->m_currentEncodeConfig.m_encoderProfileDesc.m_AV1Profile != targetProfile) {
1098       pD3D12Enc->m_currentEncodeConfig.m_ConfigDirtyFlags |= d3d12_video_encoder_config_dirty_flag_profile;
1099    }
1100    pD3D12Enc->m_currentEncodeConfig.m_encoderProfileDesc.m_AV1Profile = targetProfile;
1101 
1102    // Set level and tier
1103    D3D12_VIDEO_ENCODER_AV1_LEVELS targetLevel = {};
1104    D3D12_VIDEO_ENCODER_AV1_TIER targetTier = {};
1105    d3d12_video_encoder_convert_spec_to_d3d12_level_av1(av1Pic->seq.level, targetLevel);
1106    d3d12_video_encoder_convert_spec_to_d3d12_tier_av1(av1Pic->seq.tier, targetTier);
1107 
1108    if ((pD3D12Enc->m_currentEncodeConfig.m_encoderLevelDesc.m_AV1LevelSetting.Level != targetLevel) ||
1109        (pD3D12Enc->m_currentEncodeConfig.m_encoderLevelDesc.m_AV1LevelSetting.Tier != targetTier)) {
1110       pD3D12Enc->m_currentEncodeConfig.m_ConfigDirtyFlags |= d3d12_video_encoder_config_dirty_flag_level;
1111    }
1112    pD3D12Enc->m_currentEncodeConfig.m_encoderLevelDesc.m_AV1LevelSetting.Tier = targetTier;
1113    pD3D12Enc->m_currentEncodeConfig.m_encoderLevelDesc.m_AV1LevelSetting.Level = targetLevel;
1114 
1115    //
1116    // Validate caps support returned values against current settings
1117    //
1118    if (pD3D12Enc->m_currentEncodeConfig.m_encoderProfileDesc.m_AV1Profile !=
1119        pD3D12Enc->m_currentEncodeCapabilities.m_encoderSuggestedProfileDesc.m_AV1Profile) {
1120       debug_printf("[d3d12_video_encoder_av1] Warning: Requested D3D12_VIDEO_ENCODER_PROFILE_AV1 by upper layer: %d "
1121                    "mismatches UMD suggested D3D12_VIDEO_ENCODER_PROFILE_AV1: %d\n",
1122                    pD3D12Enc->m_currentEncodeConfig.m_encoderProfileDesc.m_AV1Profile,
1123                    pD3D12Enc->m_currentEncodeCapabilities.m_encoderSuggestedProfileDesc.m_AV1Profile);
1124    }
1125 
1126    if ((pD3D12Enc->m_currentEncodeConfig.m_encoderLevelDesc.m_AV1LevelSetting.Level !=
1127         pD3D12Enc->m_currentEncodeCapabilities.m_encoderLevelSuggestedDesc.m_AV1LevelSetting.Level) ||
1128        (pD3D12Enc->m_currentEncodeConfig.m_encoderLevelDesc.m_AV1LevelSetting.Tier !=
1129         pD3D12Enc->m_currentEncodeCapabilities.m_encoderLevelSuggestedDesc.m_AV1LevelSetting.Tier)) {
1130       debug_printf(
1131          "[d3d12_video_encoder_av1] Warning: Requested D3D12_VIDEO_ENCODER_LEVELS_AV1 by upper layer: level %d tier %d "
1132          "mismatches UMD suggested D3D12_VIDEO_ENCODER_LEVELS_AV1: level %d tier %d\n",
1133          pD3D12Enc->m_currentEncodeConfig.m_encoderLevelDesc.m_AV1LevelSetting.Level,
1134          pD3D12Enc->m_currentEncodeConfig.m_encoderLevelDesc.m_AV1LevelSetting.Tier,
1135          pD3D12Enc->m_currentEncodeCapabilities.m_encoderLevelSuggestedDesc.m_AV1LevelSetting.Level,
1136          pD3D12Enc->m_currentEncodeCapabilities.m_encoderLevelSuggestedDesc.m_AV1LevelSetting.Tier);
1137    }
1138 
1139    // Set codec config
1140    bool is_supported = false;
1141    auto targetCodecConfig = d3d12_video_encoder_convert_av1_codec_configuration(pD3D12Enc, av1Pic, is_supported);
1142    if (!is_supported) {
1143       return false;
1144    }
1145 
1146    if (memcmp(&pD3D12Enc->m_currentEncodeConfig.m_encoderCodecSpecificConfigDesc.m_AV1Config,
1147               &targetCodecConfig,
1148               sizeof(D3D12_VIDEO_ENCODER_AV1_CODEC_CONFIGURATION)) != 0) {
1149       pD3D12Enc->m_currentEncodeConfig.m_ConfigDirtyFlags |= d3d12_video_encoder_config_dirty_flag_codec_config;
1150    }
1151    pD3D12Enc->m_currentEncodeConfig.m_encoderCodecSpecificConfigDesc.m_AV1Config = targetCodecConfig;
1152 
1153    // Set rate control
1154    d3d12_video_encoder_update_current_rate_control_av1(pD3D12Enc, av1Pic);
1155 
1156    // Set tiles config
1157    if (!d3d12_video_encoder_negotiate_current_av1_tiles_configuration(pD3D12Enc, av1Pic)) {
1158       debug_printf("d3d12_video_encoder_negotiate_current_av1_tiles_configuration failed!\n");
1159       return false;
1160    }
1161 
1162    // Set GOP config
1163    if (!d3d12_video_encoder_update_av1_gop_configuration(pD3D12Enc, av1Pic)) {
1164       debug_printf("d3d12_video_encoder_update_av1_gop_configuration failed!\n");
1165       return false;
1166    }
1167 
1168    // Set intra-refresh config
1169    if(!d3d12_video_encoder_update_intra_refresh_av1(pD3D12Enc, srcTextureDesc, av1Pic)) {
1170       debug_printf("d3d12_video_encoder_update_intra_refresh_av1 failed!\n");
1171       return false;
1172    }
1173 
1174    // m_currentEncodeConfig.m_encoderPicParamsDesc pic params are set in d3d12_video_encoder_reconfigure_encoder_objects
1175    // after re-allocating objects if needed
1176 
1177    // Set motion estimation config
1178    auto targetMotionLimit = d3d12_video_encoder_convert_av1_motion_configuration(pD3D12Enc, av1Pic);
1179    if (pD3D12Enc->m_currentEncodeConfig.m_encoderMotionPrecisionLimit != targetMotionLimit) {
1180       pD3D12Enc->m_currentEncodeConfig.m_ConfigDirtyFlags |=
1181          d3d12_video_encoder_config_dirty_flag_motion_precision_limit;
1182    }
1183    pD3D12Enc->m_currentEncodeConfig.m_encoderMotionPrecisionLimit = targetMotionLimit;
1184 
1185    // Will call for d3d12 driver support based on the initial requested (non codec specific) features, then
1186    // try to fallback if any of them is not supported and return the negotiated d3d12 settings
1187    D3D12_FEATURE_DATA_VIDEO_ENCODER_SUPPORT1 capEncoderSupportData1 = {};
1188    if (!d3d12_video_encoder_negotiate_requested_features_and_d3d12_driver_caps(pD3D12Enc, capEncoderSupportData1)) {
1189       debug_printf("[d3d12_video_encoder_av1] After negotiating caps, D3D12_FEATURE_VIDEO_ENCODER_SUPPORT1 "
1190                    "arguments are not supported - "
1191                    "ValidationFlags: 0x%x - SupportFlags: 0x%x\n",
1192                    capEncoderSupportData1.ValidationFlags,
1193                    capEncoderSupportData1.SupportFlags);
1194       return false;
1195    }
1196 
1197    pD3D12Enc->m_currentEncodeCapabilities.m_MaxSlicesInOutput = (av1Pic->tile_cols * av1Pic->tile_rows);
1198    if (pD3D12Enc->m_currentEncodeCapabilities.m_MaxSlicesInOutput >
1199        pD3D12Enc->m_currentEncodeCapabilities.m_currentResolutionSupportCaps.MaxSubregionsNumber) {
1200       debug_printf("[d3d12_video_encoder_av1] Desired number of subregions is not supported (higher than max "
1201                    "reported slice number in query caps)\n.");
1202       return false;
1203    }
1204 
1205    return true;
1206 }
1207 
1208 /*
1209  * Called at begin_frame record time
1210  */
1211 void
d3d12_video_encoder_update_current_frame_pic_params_info_av1(struct d3d12_video_encoder * pD3D12Enc,struct pipe_video_buffer * srcTexture,struct pipe_picture_desc * picture,D3D12_VIDEO_ENCODER_PICTURE_CONTROL_CODEC_DATA & picParams,bool & bUsedAsReference)1212 d3d12_video_encoder_update_current_frame_pic_params_info_av1(struct d3d12_video_encoder *pD3D12Enc,
1213                                                              struct pipe_video_buffer *srcTexture,
1214                                                              struct pipe_picture_desc *picture,
1215                                                              D3D12_VIDEO_ENCODER_PICTURE_CONTROL_CODEC_DATA &picParams,
1216                                                              bool &bUsedAsReference)
1217 {
1218    struct pipe_av1_enc_picture_desc *pAV1Pic = (struct pipe_av1_enc_picture_desc *) picture;
1219 
1220    // Output param bUsedAsReference
1221    bUsedAsReference = (pAV1Pic->refresh_frame_flags != 0);
1222 
1223    // D3D12_VIDEO_ENCODER_AV1_PICTURE_CONTROL_FLAGS Flags;
1224    picParams.pAV1PicData->Flags = D3D12_VIDEO_ENCODER_AV1_PICTURE_CONTROL_FLAG_NONE;
1225 
1226    if (pAV1Pic->error_resilient_mode)
1227       picParams.pAV1PicData->Flags |= D3D12_VIDEO_ENCODER_AV1_PICTURE_CONTROL_FLAG_ENABLE_ERROR_RESILIENT_MODE;
1228 
1229    if (pAV1Pic->disable_cdf_update)
1230       picParams.pAV1PicData->Flags |= D3D12_VIDEO_ENCODER_AV1_PICTURE_CONTROL_FLAG_DISABLE_CDF_UPDATE;
1231 
1232    if (pAV1Pic->palette_mode_enable)
1233       picParams.pAV1PicData->Flags |= D3D12_VIDEO_ENCODER_AV1_PICTURE_CONTROL_FLAG_ENABLE_PALETTE_ENCODING;
1234 
1235    // Override if required feature
1236    if ((pD3D12Enc->m_currentEncodeCapabilities.m_encoderCodecSpecificConfigCaps.m_AV1CodecCaps.RequiredFeatureFlags &
1237         D3D12_VIDEO_ENCODER_AV1_FEATURE_FLAG_PALETTE_ENCODING) != 0) {
1238       debug_printf("[d3d12_video_encoder_update_current_frame_pic_params_info_av1] Overriding required feature "
1239                    "D3D12_VIDEO_ENCODER_AV1_PICTURE_CONTROL_FLAG_ENABLE_PALETTE_ENCODING\n");
1240       picParams.pAV1PicData->Flags |= D3D12_VIDEO_ENCODER_AV1_PICTURE_CONTROL_FLAG_ENABLE_PALETTE_ENCODING;
1241    }
1242 
1243    if (pAV1Pic->skip_mode_present)
1244       picParams.pAV1PicData->Flags |= D3D12_VIDEO_ENCODER_AV1_PICTURE_CONTROL_FLAG_ENABLE_SKIP_MODE;
1245 
1246    if ((pD3D12Enc->m_currentEncodeCapabilities.m_encoderCodecSpecificConfigCaps.m_AV1CodecCaps.RequiredFeatureFlags &
1247         D3D12_VIDEO_ENCODER_AV1_FEATURE_FLAG_SKIP_MODE_PRESENT) != 0) {
1248       debug_printf("[d3d12_video_encoder_update_current_frame_pic_params_info_av1] Overriding required feature "
1249                    "D3D12_VIDEO_ENCODER_AV1_PICTURE_CONTROL_FLAG_ENABLE_SKIP_MODE\n");
1250       picParams.pAV1PicData->Flags |= D3D12_VIDEO_ENCODER_AV1_PICTURE_CONTROL_FLAG_ENABLE_SKIP_MODE;
1251    }
1252 
1253    if (pAV1Pic->use_ref_frame_mvs)
1254       picParams.pAV1PicData->Flags |= D3D12_VIDEO_ENCODER_AV1_PICTURE_CONTROL_FLAG_FRAME_REFERENCE_MOTION_VECTORS;
1255 
1256    // Override if required feature
1257    if ((pD3D12Enc->m_currentEncodeCapabilities.m_encoderCodecSpecificConfigCaps.m_AV1CodecCaps.RequiredFeatureFlags &
1258         D3D12_VIDEO_ENCODER_AV1_FEATURE_FLAG_FRAME_REFERENCE_MOTION_VECTORS) != 0) {
1259       debug_printf("[d3d12_video_encoder_update_current_frame_pic_params_info_av1] Overriding required feature "
1260                    "D3D12_VIDEO_ENCODER_AV1_PICTURE_CONTROL_FLAG_FRAME_REFERENCE_MOTION_VECTORS\n");
1261       picParams.pAV1PicData->Flags |= D3D12_VIDEO_ENCODER_AV1_PICTURE_CONTROL_FLAG_FRAME_REFERENCE_MOTION_VECTORS;
1262    }
1263 
1264    // No pipe flag for force_integer_mv (D3D12_VIDEO_ENCODER_AV1_PICTURE_CONTROL_FLAG_FORCE_INTEGER_MOTION_VECTORS)
1265    // choose default based on required/supported underlying codec flags
1266    if ((pD3D12Enc->m_currentEncodeCapabilities.m_encoderCodecSpecificConfigCaps.m_AV1CodecCaps.RequiredFeatureFlags &
1267         D3D12_VIDEO_ENCODER_AV1_FEATURE_FLAG_FORCED_INTEGER_MOTION_VECTORS) != 0) {
1268       debug_printf("[d3d12_video_encoder_update_current_frame_pic_params_info_av1] Overriding required feature "
1269                    "D3D12_VIDEO_ENCODER_AV1_PICTURE_CONTROL_FLAG_FORCE_INTEGER_MOTION_VECTORS\n");
1270       picParams.pAV1PicData->Flags |= D3D12_VIDEO_ENCODER_AV1_PICTURE_CONTROL_FLAG_FORCE_INTEGER_MOTION_VECTORS;
1271    }
1272 
1273    if (pAV1Pic->allow_intrabc)
1274       picParams.pAV1PicData->Flags |= D3D12_VIDEO_ENCODER_AV1_PICTURE_CONTROL_FLAG_ALLOW_INTRA_BLOCK_COPY;
1275 
1276    // Override if required feature
1277    if ((pD3D12Enc->m_currentEncodeCapabilities.m_encoderCodecSpecificConfigCaps.m_AV1CodecCaps.RequiredFeatureFlags &
1278         D3D12_VIDEO_ENCODER_AV1_FEATURE_FLAG_INTRA_BLOCK_COPY) != 0) {
1279       debug_printf("[d3d12_video_encoder_update_current_frame_pic_params_info_av1] Overriding required feature "
1280                    "D3D12_VIDEO_ENCODER_AV1_PICTURE_CONTROL_FLAG_ALLOW_INTRA_BLOCK_COPY\n");
1281       picParams.pAV1PicData->Flags |= D3D12_VIDEO_ENCODER_AV1_PICTURE_CONTROL_FLAG_ALLOW_INTRA_BLOCK_COPY;
1282    }
1283 
1284    if (pAV1Pic->use_superres)
1285       picParams.pAV1PicData->Flags |= D3D12_VIDEO_ENCODER_AV1_PICTURE_CONTROL_FLAG_USE_SUPER_RESOLUTION;
1286 
1287    if (pAV1Pic->disable_frame_end_update_cdf)
1288       picParams.pAV1PicData->Flags |= D3D12_VIDEO_ENCODER_AV1_PICTURE_CONTROL_FLAG_DISABLE_FRAME_END_UPDATE_CDF;
1289 
1290    // No pipe flag for D3D12_VIDEO_ENCODER_AV1_PICTURE_CONTROL_FLAG_ENABLE_FRAME_SEGMENTATION_AUTO
1291    // choose default based on required/supported underlying codec flags
1292    if ((pD3D12Enc->m_currentEncodeCapabilities.m_encoderCodecSpecificConfigCaps.m_AV1CodecCaps.RequiredFeatureFlags &
1293         D3D12_VIDEO_ENCODER_AV1_FEATURE_FLAG_AUTO_SEGMENTATION) != 0) {
1294       debug_printf("[d3d12_video_encoder_update_current_frame_pic_params_info_av1] Overriding required feature "
1295                    "D3D12_VIDEO_ENCODER_AV1_PICTURE_CONTROL_FLAG_ENABLE_FRAME_SEGMENTATION_AUTO\n");
1296       picParams.pAV1PicData->Flags |= D3D12_VIDEO_ENCODER_AV1_PICTURE_CONTROL_FLAG_ENABLE_FRAME_SEGMENTATION_AUTO;
1297    }
1298 
1299    // No pipe flag for D3D12_VIDEO_ENCODER_AV1_PICTURE_CONTROL_FLAG_ENABLE_FRAME_SEGMENTATION_CUSTOM
1300    // choose default based on required/supported underlying codec flags
1301    if ((pD3D12Enc->m_currentEncodeCapabilities.m_encoderCodecSpecificConfigCaps.m_AV1CodecCaps.RequiredFeatureFlags &
1302         D3D12_VIDEO_ENCODER_AV1_FEATURE_FLAG_CUSTOM_SEGMENTATION) != 0) {
1303       debug_printf("[d3d12_video_encoder_update_current_frame_pic_params_info_av1] Overriding required feature "
1304                    "D3D12_VIDEO_ENCODER_AV1_PICTURE_CONTROL_FLAG_ENABLE_FRAME_SEGMENTATION_CUSTOM\n");
1305       picParams.pAV1PicData->Flags |= D3D12_VIDEO_ENCODER_AV1_PICTURE_CONTROL_FLAG_ENABLE_FRAME_SEGMENTATION_CUSTOM;
1306       assert(false);   // Not implemented
1307    }
1308 
1309    // No pipe flag for allow_warped_motion (D3D12_VIDEO_ENCODER_AV1_PICTURE_CONTROL_FLAG_ENABLE_WARPED_MOTION)
1310    // choose default based on required/supported underlying codec flags
1311    if ((pD3D12Enc->m_currentEncodeCapabilities.m_encoderCodecSpecificConfigCaps.m_AV1CodecCaps.RequiredFeatureFlags &
1312         D3D12_VIDEO_ENCODER_AV1_FEATURE_FLAG_WARPED_MOTION) != 0) {
1313       debug_printf("[d3d12_video_encoder_update_current_frame_pic_params_info_av1] Overriding required feature "
1314                    "D3D12_VIDEO_ENCODER_AV1_PICTURE_CONTROL_FLAG_ENABLE_WARPED_MOTION\n");
1315       picParams.pAV1PicData->Flags |= D3D12_VIDEO_ENCODER_AV1_PICTURE_CONTROL_FLAG_ENABLE_WARPED_MOTION;
1316    }
1317 
1318    // Only enable if supported (there is no PIPE/VA cap flag for reduced_tx_set)
1319    if ((pAV1Pic->reduced_tx_set) &&
1320        (pD3D12Enc->m_currentEncodeCapabilities.m_encoderCodecSpecificConfigCaps.m_AV1CodecCaps.SupportedFeatureFlags &
1321         D3D12_VIDEO_ENCODER_AV1_FEATURE_FLAG_REDUCED_TX_SET) != 0) {
1322       picParams.pAV1PicData->Flags |= D3D12_VIDEO_ENCODER_AV1_PICTURE_CONTROL_FLAG_REDUCED_TX_SET;
1323    }
1324 
1325    // Override if required feature
1326    if ((pD3D12Enc->m_currentEncodeCapabilities.m_encoderCodecSpecificConfigCaps.m_AV1CodecCaps.RequiredFeatureFlags &
1327         D3D12_VIDEO_ENCODER_AV1_FEATURE_FLAG_REDUCED_TX_SET) != 0) {
1328       debug_printf("[d3d12_video_encoder_update_current_frame_pic_params_info_av1] Overriding required feature "
1329                    "D3D12_VIDEO_ENCODER_AV1_PICTURE_CONTROL_FLAG_REDUCED_TX_SET\n");
1330       picParams.pAV1PicData->Flags |= D3D12_VIDEO_ENCODER_AV1_PICTURE_CONTROL_FLAG_REDUCED_TX_SET;
1331    }
1332 
1333    // Only enable if supported
1334    if ((pAV1Pic->allow_high_precision_mv) &&
1335        (pD3D12Enc->m_currentEncodeCapabilities.m_encoderCodecSpecificConfigCaps.m_AV1CodecCaps.SupportedFeatureFlags &
1336         D3D12_VIDEO_ENCODER_AV1_FEATURE_FLAG_ALLOW_HIGH_PRECISION_MV) != 0) {
1337       picParams.pAV1PicData->Flags |= D3D12_VIDEO_ENCODER_AV1_PICTURE_CONTROL_FLAG_ALLOW_HIGH_PRECISION_MV;
1338    }
1339 
1340    // Override if required feature
1341    if ((pD3D12Enc->m_currentEncodeCapabilities.m_encoderCodecSpecificConfigCaps.m_AV1CodecCaps.RequiredFeatureFlags &
1342         D3D12_VIDEO_ENCODER_AV1_FEATURE_FLAG_ALLOW_HIGH_PRECISION_MV) != 0) {
1343       debug_printf("[d3d12_video_encoder_update_current_frame_pic_params_info_av1] Overriding required feature "
1344                    "D3D12_VIDEO_ENCODER_AV1_PICTURE_CONTROL_FLAG_ALLOW_HIGH_PRECISION_MV\n");
1345       picParams.pAV1PicData->Flags |= D3D12_VIDEO_ENCODER_AV1_PICTURE_CONTROL_FLAG_ALLOW_HIGH_PRECISION_MV;
1346    }
1347 
1348    // No pipe flag for is_motion_mode_switchable (D3D12_VIDEO_ENCODER_AV1_PICTURE_CONTROL_FLAG_MOTION_MODE_SWITCHABLE)
1349    // choose default based on required/supported underlying codec flags
1350    if ((pD3D12Enc->m_currentEncodeCapabilities.m_encoderCodecSpecificConfigCaps.m_AV1CodecCaps.RequiredFeatureFlags &
1351         D3D12_VIDEO_ENCODER_AV1_FEATURE_FLAG_MOTION_MODE_SWITCHABLE) != 0) {
1352       debug_printf("[d3d12_video_encoder_update_current_frame_pic_params_info_av1] Overriding required feature "
1353                    "D3D12_VIDEO_ENCODER_AV1_PICTURE_CONTROL_FLAG_MOTION_MODE_SWITCHABLE\n");
1354       picParams.pAV1PicData->Flags |= D3D12_VIDEO_ENCODER_AV1_PICTURE_CONTROL_FLAG_MOTION_MODE_SWITCHABLE;
1355    }
1356 
1357    // D3D12_VIDEO_ENCODER_AV1_FRAME_TYPE FrameType;
1358    // AV1 spec matches w/D3D12 enum definition
1359    picParams.pAV1PicData->FrameType = static_cast<D3D12_VIDEO_ENCODER_AV1_FRAME_TYPE>(pAV1Pic->frame_type);
1360 
1361    if (picParams.pAV1PicData->FrameType == D3D12_VIDEO_ENCODER_AV1_FRAME_TYPE_KEY_FRAME)
1362       debug_printf("Encoding FrameType: D3D12_VIDEO_ENCODER_AV1_FRAME_TYPE_KEY_FRAME\n");
1363    if (picParams.pAV1PicData->FrameType == D3D12_VIDEO_ENCODER_AV1_FRAME_TYPE_INTER_FRAME)
1364       debug_printf("Encoding FrameType: D3D12_VIDEO_ENCODER_AV1_FRAME_TYPE_INTER_FRAME\n");
1365    if (picParams.pAV1PicData->FrameType == D3D12_VIDEO_ENCODER_AV1_FRAME_TYPE_INTRA_ONLY_FRAME)
1366       debug_printf("Encoding FrameType: D3D12_VIDEO_ENCODER_AV1_FRAME_TYPE_INTRA_ONLY_FRAME\n");
1367    if (picParams.pAV1PicData->FrameType == D3D12_VIDEO_ENCODER_AV1_FRAME_TYPE_SWITCH_FRAME)
1368       debug_printf("Encoding FrameType: D3D12_VIDEO_ENCODER_AV1_FRAME_TYPE_SWITCH_FRAME\n");
1369 
1370    // D3D12_VIDEO_ENCODER_AV1_COMP_PREDICTION_TYPE CompoundPredictionType;
1371    picParams.pAV1PicData->CompoundPredictionType = (pAV1Pic->compound_reference_mode == 0) ?
1372                                                       D3D12_VIDEO_ENCODER_AV1_COMP_PREDICTION_TYPE_SINGLE_REFERENCE :
1373                                                       D3D12_VIDEO_ENCODER_AV1_COMP_PREDICTION_TYPE_COMPOUND_REFERENCE;
1374 
1375    // D3D12_VIDEO_ENCODER_AV1_INTERPOLATION_FILTERS InterpolationFilter;
1376    // AV1 spec matches w/D3D12 enum definition
1377    picParams.pAV1PicData->InterpolationFilter =
1378       static_cast<D3D12_VIDEO_ENCODER_AV1_INTERPOLATION_FILTERS>(pAV1Pic->interpolation_filter);
1379 
1380    // Workaround for apps sending interpolation_filter values not supported even when reporting
1381    // them in pipe_av1_enc_cap_features_ext1.interpolation_filter. If D3D12 driver doesn't support
1382    // requested InterpolationFilter, fallback to the first supported by D3D12 driver
1383    if ( (pD3D12Enc->m_currentEncodeCapabilities.m_encoderCodecSpecificConfigCaps.m_AV1CodecCaps.SupportedInterpolationFilters &
1384       (1 << picParams.pAV1PicData->InterpolationFilter)) == 0 ) { /* See definition of D3D12_VIDEO_ENCODER_AV1_INTERPOLATION_FILTERS_FLAGS */
1385       debug_printf("[d3d12_video_encoder_update_current_frame_pic_params_info_av1] Requested interpolation_filter"
1386                    " not supported in pipe_av1_enc_cap_features_ext1.interpolation_filter"
1387                    ", auto selecting from D3D12 SupportedInterpolationFilters...");
1388       for(uint8_t i = D3D12_VIDEO_ENCODER_AV1_INTERPOLATION_FILTERS_EIGHTTAP; i <= D3D12_VIDEO_ENCODER_AV1_INTERPOLATION_FILTERS_SWITCHABLE; i++) {
1389          if ((pD3D12Enc->m_currentEncodeCapabilities.m_encoderCodecSpecificConfigCaps.m_AV1CodecCaps.SupportedInterpolationFilters &
1390              (1 << i)) /* See definition of D3D12_VIDEO_ENCODER_AV1_INTERPOLATION_FILTERS_FLAGS */ != 0) {
1391             picParams.pAV1PicData->InterpolationFilter = static_cast<D3D12_VIDEO_ENCODER_AV1_INTERPOLATION_FILTERS>(i);
1392             break;
1393          }
1394       }
1395    }
1396 
1397    // D3D12_VIDEO_ENCODER_AV1_RESTORATION_CONFIG FrameRestorationConfig;
1398    // AV1 spec matches w/D3D12 FrameRestorationType enum definition
1399 
1400    picParams.pAV1PicData->FrameRestorationConfig.FrameRestorationType[0] =
1401       static_cast<D3D12_VIDEO_ENCODER_AV1_RESTORATION_TYPE>(pAV1Pic->restoration.yframe_restoration_type);
1402    picParams.pAV1PicData->FrameRestorationConfig.FrameRestorationType[1] =
1403       static_cast<D3D12_VIDEO_ENCODER_AV1_RESTORATION_TYPE>(pAV1Pic->restoration.cbframe_restoration_type);
1404    picParams.pAV1PicData->FrameRestorationConfig.FrameRestorationType[2] =
1405       static_cast<D3D12_VIDEO_ENCODER_AV1_RESTORATION_TYPE>(pAV1Pic->restoration.crframe_restoration_type);
1406 
1407    if (picParams.pAV1PicData->FrameRestorationConfig.FrameRestorationType[0] !=
1408        D3D12_VIDEO_ENCODER_AV1_RESTORATION_TYPE_DISABLED) {
1409       picParams.pAV1PicData->FrameRestorationConfig.LoopRestorationPixelSize[0] =
1410          d3d12_video_encoder_looprestorationsize_uint_to_d3d12_av1(1 << (6 + pAV1Pic->restoration.lr_unit_shift));
1411    }
1412 
1413    if (picParams.pAV1PicData->FrameRestorationConfig.FrameRestorationType[1] !=
1414        D3D12_VIDEO_ENCODER_AV1_RESTORATION_TYPE_DISABLED) {
1415       picParams.pAV1PicData->FrameRestorationConfig.LoopRestorationPixelSize[1] =
1416          d3d12_video_encoder_looprestorationsize_uint_to_d3d12_av1(
1417             1 << (6 + pAV1Pic->restoration.lr_unit_shift - pAV1Pic->restoration.lr_uv_shift));
1418    }
1419 
1420    if (picParams.pAV1PicData->FrameRestorationConfig.FrameRestorationType[2] !=
1421        D3D12_VIDEO_ENCODER_AV1_RESTORATION_TYPE_DISABLED) {
1422       picParams.pAV1PicData->FrameRestorationConfig.LoopRestorationPixelSize[2] =
1423          d3d12_video_encoder_looprestorationsize_uint_to_d3d12_av1(
1424             1 << (6 + pAV1Pic->restoration.lr_unit_shift - pAV1Pic->restoration.lr_uv_shift));
1425    }
1426 
1427    // D3D12_VIDEO_ENCODER_AV1_TX_MODE TxMode;
1428    // AV1 spec matches w/D3D12 enum definition
1429    picParams.pAV1PicData->TxMode = static_cast<D3D12_VIDEO_ENCODER_AV1_TX_MODE>(pAV1Pic->tx_mode);
1430 
1431    // Workaround for mismatch between VAAPI/D3D12 and TxMode support for all/some frame types
1432    // If D3D12 driver doesn't support requested TxMode, fallback to the first supported by D3D12
1433    // driver for the requested frame type
1434    if ((pD3D12Enc->m_currentEncodeCapabilities.m_encoderCodecSpecificConfigCaps.m_AV1CodecCaps.SupportedTxModes[picParams.pAV1PicData->FrameType] &
1435       (1 << picParams.pAV1PicData->TxMode)) == 0) /* See definition of D3D12_VIDEO_ENCODER_AV1_TX_MODE_FLAGS */ {
1436       debug_printf("[d3d12_video_encoder_update_current_frame_pic_params_info_av1] Requested tx_mode not supported"
1437                      ", auto selecting from D3D12 SupportedTxModes for current frame type...");
1438       for(uint8_t i = D3D12_VIDEO_ENCODER_AV1_TX_MODE_ONLY4x4; i <= D3D12_VIDEO_ENCODER_AV1_TX_MODE_SELECT; i++) {
1439          if ((pD3D12Enc->m_currentEncodeCapabilities.m_encoderCodecSpecificConfigCaps.m_AV1CodecCaps.SupportedTxModes[picParams.pAV1PicData->FrameType] &
1440              (1 << i)) /* See definition of D3D12_VIDEO_ENCODER_AV1_TX_MODE_FLAGS */ != 0) {
1441             picParams.pAV1PicData->TxMode = static_cast<D3D12_VIDEO_ENCODER_AV1_TX_MODE>(i);
1442             break;
1443          }
1444       }
1445    }
1446 
1447    // UINT SuperResDenominator;
1448    picParams.pAV1PicData->SuperResDenominator = pAV1Pic->superres_scale_denominator;
1449 
1450    // UINT OrderHint;
1451    picParams.pAV1PicData->OrderHint = pAV1Pic->order_hint;
1452 
1453    // UINT PictureIndex - Substract the last_key_frame_num to make it modulo KEY frame
1454    picParams.pAV1PicData->PictureIndex = pAV1Pic->frame_num - pAV1Pic->last_key_frame_num;
1455 
1456    // UINT TemporalLayerIndexPlus1;
1457    assert(pAV1Pic->temporal_id == pAV1Pic->tg_obu_header.temporal_id);
1458    picParams.pAV1PicData->TemporalLayerIndexPlus1 = pAV1Pic->temporal_id + 1;
1459 
1460    // UINT SpatialLayerIndexPlus1;
1461    picParams.pAV1PicData->SpatialLayerIndexPlus1 = pAV1Pic->tg_obu_header.spatial_id + 1;
1462 
1463    //
1464    // Reference Pictures
1465    //
1466    {
1467       for (uint8_t i = 0; i < ARRAY_SIZE(picParams.pAV1PicData->ReferenceIndices); i++) {
1468          picParams.pAV1PicData->ReferenceIndices[i] = pAV1Pic->ref_frame_idx[i];
1469       }
1470 
1471       bool FrameIsIntra = (picParams.pAV1PicData->FrameType == D3D12_VIDEO_ENCODER_AV1_FRAME_TYPE_INTRA_ONLY_FRAME ||
1472                            picParams.pAV1PicData->FrameType == D3D12_VIDEO_ENCODER_AV1_FRAME_TYPE_KEY_FRAME);
1473       if (FrameIsIntra)
1474          picParams.pAV1PicData->PrimaryRefFrame = 7; /* PRIMARY_REF_NONE */
1475       else
1476          picParams.pAV1PicData->PrimaryRefFrame = pAV1Pic->primary_ref_frame;
1477       debug_printf("App requested primary_ref_frame: %" PRIu32 "\n", pAV1Pic->primary_ref_frame);
1478       picParams.pAV1PicData->RefreshFrameFlags = pAV1Pic->refresh_frame_flags;
1479    }
1480 
1481    // D3D12_VIDEO_ENCODER_CODEC_AV1_LOOP_FILTER_CONFIG LoopFilter;
1482    picParams.pAV1PicData->LoopFilter.LoopFilterLevel[0] = pAV1Pic->loop_filter.filter_level[0];
1483    picParams.pAV1PicData->LoopFilter.LoopFilterLevel[1] = pAV1Pic->loop_filter.filter_level[1];
1484    picParams.pAV1PicData->LoopFilter.LoopFilterLevelU = pAV1Pic->loop_filter.filter_level_u;
1485    picParams.pAV1PicData->LoopFilter.LoopFilterLevelV = pAV1Pic->loop_filter.filter_level_v;
1486    picParams.pAV1PicData->LoopFilter.LoopFilterSharpnessLevel = pAV1Pic->loop_filter.sharpness_level;
1487    picParams.pAV1PicData->LoopFilter.LoopFilterDeltaEnabled = pAV1Pic->loop_filter.mode_ref_delta_enabled;
1488    picParams.pAV1PicData->LoopFilter.UpdateRefDelta = pAV1Pic->loop_filter.mode_ref_delta_update;
1489    if (picParams.pAV1PicData->LoopFilter.UpdateRefDelta) {
1490       for (uint8_t i = 0; i < ARRAY_SIZE(picParams.pAV1PicData->LoopFilter.RefDeltas); i++) {
1491          picParams.pAV1PicData->LoopFilter.RefDeltas[i] = pAV1Pic->loop_filter.ref_deltas[i];
1492       }
1493    }
1494    picParams.pAV1PicData->LoopFilter.UpdateModeDelta = pAV1Pic->loop_filter.mode_ref_delta_update;
1495    if (picParams.pAV1PicData->LoopFilter.UpdateModeDelta) {
1496       for (uint8_t i = 0; i < ARRAY_SIZE(picParams.pAV1PicData->LoopFilter.ModeDeltas); i++) {
1497          picParams.pAV1PicData->LoopFilter.ModeDeltas[i] = pAV1Pic->loop_filter.mode_deltas[i];
1498       }
1499    }
1500 
1501    // D3D12_VIDEO_ENCODER_CODEC_AV1_LOOP_FILTER_DELTA_CONFIG LoopFilterDelta;
1502    picParams.pAV1PicData->LoopFilterDelta.DeltaLFMulti = pAV1Pic->loop_filter.delta_lf_multi;
1503    picParams.pAV1PicData->LoopFilterDelta.DeltaLFPresent = pAV1Pic->loop_filter.delta_lf_present;
1504    picParams.pAV1PicData->LoopFilterDelta.DeltaLFRes = pAV1Pic->loop_filter.delta_lf_res;
1505 
1506    // D3D12_VIDEO_ENCODER_CODEC_AV1_QUANTIZATION_CONFIG Quantization;
1507    picParams.pAV1PicData->Quantization.BaseQIndex = pAV1Pic->quantization.base_qindex;
1508    picParams.pAV1PicData->Quantization.YDCDeltaQ = pAV1Pic->quantization.y_dc_delta_q;
1509    picParams.pAV1PicData->Quantization.UDCDeltaQ = pAV1Pic->quantization.u_dc_delta_q;
1510    picParams.pAV1PicData->Quantization.UACDeltaQ = pAV1Pic->quantization.u_ac_delta_q;
1511    picParams.pAV1PicData->Quantization.VDCDeltaQ = pAV1Pic->quantization.v_dc_delta_q;
1512    picParams.pAV1PicData->Quantization.VACDeltaQ = pAV1Pic->quantization.v_ac_delta_q;
1513    picParams.pAV1PicData->Quantization.UsingQMatrix = pAV1Pic->quantization.using_qmatrix;
1514    picParams.pAV1PicData->Quantization.QMY = pAV1Pic->quantization.qm_y;
1515    picParams.pAV1PicData->Quantization.QMU = pAV1Pic->quantization.qm_u;
1516    picParams.pAV1PicData->Quantization.QMV = pAV1Pic->quantization.qm_v;
1517 
1518    // D3D12_VIDEO_ENCODER_CODEC_AV1_QUANTIZATION_DELTA_CONFIG QuantizationDelta;
1519    picParams.pAV1PicData->QuantizationDelta.DeltaQPresent = pAV1Pic->quantization.delta_q_present;
1520    picParams.pAV1PicData->QuantizationDelta.DeltaQRes = pAV1Pic->quantization.delta_q_res;
1521 
1522    // D3D12_VIDEO_ENCODER_AV1_CDEF_CONFIG CDEF;
1523    picParams.pAV1PicData->CDEF.CdefBits = pAV1Pic->cdef.cdef_bits;
1524    picParams.pAV1PicData->CDEF.CdefDampingMinus3 = pAV1Pic->cdef.cdef_damping_minus_3;
1525    for (uint32_t i = 0; i < 8; i++) {
1526       picParams.pAV1PicData->CDEF.CdefYPriStrength[i] = (pAV1Pic->cdef.cdef_y_strengths[i] >> 2);
1527       picParams.pAV1PicData->CDEF.CdefYSecStrength[i] = (pAV1Pic->cdef.cdef_y_strengths[i] & 0x03);
1528       picParams.pAV1PicData->CDEF.CdefUVPriStrength[i] = (pAV1Pic->cdef.cdef_uv_strengths[i] >> 2);
1529       picParams.pAV1PicData->CDEF.CdefUVSecStrength[i] = (pAV1Pic->cdef.cdef_uv_strengths[i] & 0x03);
1530    }
1531 
1532    //
1533    // Set values for mandatory but not requested features (ie. RequiredFeature flags reported by driver not requested
1534    // by pipe)
1535    //
1536 
1537    // For the ones that are more trivial (ie. 128x128 SB) than enabling their flag, and have more parameters to be
1538    // set (ie Restoration Filter) Set defaults based on such feature driver d3d12 caps
1539 
1540    // These are a trivial flag enabling
1541    //  D3D12_VIDEO_ENCODER_AV1_FEATURE_FLAG_128x128_SUPERBLOCK
1542    //  D3D12_VIDEO_ENCODER_AV1_FEATURE_FLAG_FILTER_INTRA
1543    //  D3D12_VIDEO_ENCODER_AV1_FEATURE_FLAG_INTRA_EDGE_FILTER
1544    //  D3D12_VIDEO_ENCODER_AV1_FEATURE_FLAG_INTERINTRA_COMPOUND
1545    //  D3D12_VIDEO_ENCODER_AV1_FEATURE_FLAG_MASKED_COMPOUND
1546    //  D3D12_VIDEO_ENCODER_AV1_FEATURE_FLAG_WARPED_MOTION
1547    //  D3D12_VIDEO_ENCODER_AV1_FEATURE_FLAG_DUAL_FILTER
1548    //  D3D12_VIDEO_ENCODER_AV1_FEATURE_FLAG_JNT_COMP
1549    //  D3D12_VIDEO_ENCODER_AV1_FEATURE_FLAG_FORCED_INTEGER_MOTION_VECTORS
1550    //  D3D12_VIDEO_ENCODER_AV1_FEATURE_FLAG_SUPER_RESOLUTION
1551    //  D3D12_VIDEO_ENCODER_AV1_FEATURE_FLAG_PALETTE_ENCODING
1552    //  D3D12_VIDEO_ENCODER_AV1_FEATURE_FLAG_INTRA_BLOCK_COPY
1553    //  D3D12_VIDEO_ENCODER_AV1_FEATURE_FLAG_FRAME_REFERENCE_MOTION_VECTORS
1554    //  D3D12_VIDEO_ENCODER_AV1_FEATURE_FLAG_ORDER_HINT_TOOLS
1555    //  D3D12_VIDEO_ENCODER_AV1_FEATURE_FLAG_REDUCED_TX_SET
1556    //  D3D12_VIDEO_ENCODER_AV1_FEATURE_FLAG_MOTION_MODE_SWITCHABLE
1557    //  D3D12_VIDEO_ENCODER_AV1_FEATURE_FLAG_ALLOW_HIGH_PRECISION_MV
1558 
1559    // If driver requires these, can use post encode values to enforce specific values
1560    // D3D12_VIDEO_ENCODER_AV1_FEATURE_FLAG_CDEF_FILTERING
1561    // D3D12_VIDEO_ENCODER_AV1_FEATURE_FLAG_AUTO_SEGMENTATION // Only useful with post encode values as driver
1562    // controls D3D12_VIDEO_ENCODER_AV1_FEATURE_FLAG_CUSTOM_SEGMENTATION // There are more Segmentation caps in
1563    // D3D12_VIDEO_ENCODER_AV1_CODEC_CONFIGURATION_SUPPORT for these one too
1564    // D3D12_VIDEO_ENCODER_AV1_FEATURE_FLAG_LOOP_FILTER_DELTAS
1565    // D3D12_VIDEO_ENCODER_AV1_FEATURE_FLAG_QUANTIZATION_DELTAS
1566    // D3D12_VIDEO_ENCODER_AV1_FEATURE_FLAG_QUANTIZATION_MATRIX
1567 
1568    // If driver requires this one, use driver restoration caps to set default values
1569    // D3D12_VIDEO_ENCODER_AV1_FEATURE_FLAG_LOOP_RESTORATION_FILTER
1570    if (pD3D12Enc->m_currentEncodeCapabilities.m_encoderCodecSpecificConfigCaps.RequiredNotRequestedFeatureFlags &
1571        D3D12_VIDEO_ENCODER_AV1_FEATURE_FLAG_LOOP_RESTORATION_FILTER) {
1572       debug_printf(
1573          "[d3d12_video_encoder_update_current_frame_pic_params_info_av1] Adding default params for "
1574          "D3D12_VIDEO_ENCODER_AV1_FEATURE_FLAG_LOOP_RESTORATION_FILTER required by caps but not selected already in "
1575          "config.FeatureFlags...\n");
1576 
1577       // Set Y, U, V luma plane restoration params
1578       for (uint32_t planeIdx = 0; planeIdx < 3; planeIdx++) {
1579          // Let's see which filters and with which sizes are supported for planeIdx
1580          bool foundSupportedFilter = false;
1581          for (uint32_t filterIdx = 0; ((filterIdx < 3) && !foundSupportedFilter); filterIdx++) {
1582             auto curFilterSupport = pD3D12Enc->m_currentEncodeCapabilities.m_encoderCodecSpecificConfigCaps
1583                                        .m_AV1CodecCaps.SupportedRestorationParams[filterIdx][planeIdx];
1584             for (uint32_t curFilterSize = D3D12_VIDEO_ENCODER_AV1_RESTORATION_TILESIZE_32x32;
1585                  ((curFilterSize <= D3D12_VIDEO_ENCODER_AV1_RESTORATION_TILESIZE_256x256) && !foundSupportedFilter);
1586                  curFilterSize++) {
1587 
1588                // Check if there's support for curFilter on CurPlane and choose the first supported restoration size
1589                //  If yes, set restoration params for planeIdx
1590                if (curFilterSupport &
1591                    (1 << (curFilterSize - 1))) { /* Converts D3D12_VIDEO_ENCODER_AV1_RESTORATION_TILESIZE definition
1592                                         into D3D12_VIDEO_ENCODER_AV1_RESTORATION_SUPPORT_FLAGS definition */
1593                   {
1594                      foundSupportedFilter = true;
1595                      // As per d3d12 spec filterIdx corresponds to D3D12_VIDEO_ENCODER_AV1_RESTORATION_TYPE - 1
1596                      // (SupportedRestorationParams definition skips D3D12_VIDEO_ENCODER_AV1_RESTORATION_TYPE_DISABLED)
1597                      D3D12_VIDEO_ENCODER_AV1_RESTORATION_TYPE curFilter =
1598                         static_cast<D3D12_VIDEO_ENCODER_AV1_RESTORATION_TYPE>(filterIdx + 1);
1599 
1600                      picParams.pAV1PicData->FrameRestorationConfig.FrameRestorationType[planeIdx] = curFilter;
1601                      picParams.pAV1PicData->FrameRestorationConfig.LoopRestorationPixelSize[planeIdx] =
1602                         static_cast<D3D12_VIDEO_ENCODER_AV1_RESTORATION_TILESIZE>(
1603                            curFilterSize); /* loop uses enum type */
1604                   }
1605                }
1606             }
1607          }
1608       }
1609    }
1610 
1611    // Save state snapshot from record time to resolve headers at get_feedback time
1612    uint64_t current_metadata_slot = (pD3D12Enc->m_fenceValue % D3D12_VIDEO_ENC_METADATA_BUFFERS_COUNT);
1613    pD3D12Enc->m_spEncodedFrameMetadata[current_metadata_slot].m_associatedEncodeCapabilities =
1614       pD3D12Enc->m_currentEncodeCapabilities;
1615    pD3D12Enc->m_spEncodedFrameMetadata[current_metadata_slot].m_associatedEncodeConfig =
1616       pD3D12Enc->m_currentEncodeConfig;
1617    pD3D12Enc->m_spEncodedFrameMetadata[current_metadata_slot].m_CodecSpecificData.AV1HeadersInfo.enable_frame_obu =
1618       pAV1Pic->enable_frame_obu;
1619    pD3D12Enc->m_spEncodedFrameMetadata[current_metadata_slot].m_CodecSpecificData.AV1HeadersInfo.obu_has_size_field =
1620       (pAV1Pic->tg_obu_header.obu_has_size_field == 1);
1621    // Disabling for now as the libva spec does not allow these but some apps send down anyway. It's possible in the future
1622    // the libva spec may be retro-fitted to allow this given existing apps in the wild doing it.
1623    // pD3D12Enc->m_spEncodedFrameMetadata[current_metadata_slot]
1624    //   .m_CodecSpecificData.AV1HeadersInfo.temporal_delim_rendered = pAV1Pic->temporal_delim_rendered;
1625 
1626    if ((pD3D12Enc->m_currentEncodeConfig.m_encoderRateControlDesc[pAV1Pic->temporal_id].m_Flags & D3D12_VIDEO_ENCODER_RATE_CONTROL_FLAG_ENABLE_DELTA_QP) != 0)
1627    {
1628       // Use 16 bit qpmap array for AV1 picparams (-255, 255 range and int16_t pRateControlQPMap type)
1629       const int32_t av1_min_delta_qp = -255;
1630       const int32_t av1_max_delta_qp = 255;
1631       d3d12_video_encoder_update_picparams_region_of_interest_qpmap(
1632          pD3D12Enc,
1633          &pAV1Pic->roi,
1634          av1_min_delta_qp,
1635          av1_max_delta_qp,
1636          pD3D12Enc->m_currentEncodeConfig.m_encoderRateControlDesc[pAV1Pic->temporal_id].m_pRateControlQPMap16Bit);
1637       picParams.pAV1PicData->pRateControlQPMap = pD3D12Enc->m_currentEncodeConfig.m_encoderRateControlDesc[pAV1Pic->temporal_id].m_pRateControlQPMap16Bit.data();
1638       picParams.pAV1PicData->QPMapValuesCount = pD3D12Enc->m_currentEncodeConfig.m_encoderRateControlDesc[pAV1Pic->temporal_id].m_pRateControlQPMap16Bit.size();
1639    }
1640 }
1641 
1642 void
fill_av1_seq_header(EncodedBitstreamResolvedMetadata & associatedMetadata,av1_seq_header_t * seq_header)1643 fill_av1_seq_header(EncodedBitstreamResolvedMetadata &associatedMetadata, av1_seq_header_t *seq_header)
1644 {
1645    // Set all zero by default
1646    memset(seq_header, 0, sizeof(av1_seq_header_t));
1647 
1648    seq_header->seq_profile = d3d12_video_encoder_convert_d3d12_profile_to_spec_profile_av1(
1649       associatedMetadata.m_associatedEncodeConfig.m_encoderProfileDesc.m_AV1Profile);
1650    // seq_header->still_picture; // coded in bitstream by default as 0
1651    // seq_header->reduced_still_picture_header; // coded in bitstream by default as 0
1652    // seq_header->timing_info_present_flag; // coded in bitstream by default as 0
1653    // seq_header->decoder_model_info_present_flag; // coded in bitstream by default as 0
1654    // seq_header->operating_points_cnt_minus_1; // memset default as 0
1655    // seq_header->operating_point_idc[32]; // memset default as 0
1656    d3d12_video_encoder_convert_d3d12_to_spec_level_av1(
1657       associatedMetadata.m_associatedEncodeConfig.m_encoderLevelDesc.m_AV1LevelSetting.Level,
1658       seq_header->seq_level_idx[0]);
1659    d3d12_video_encoder_convert_d3d12_to_spec_tier_av1(
1660       associatedMetadata.m_associatedEncodeConfig.m_encoderLevelDesc.m_AV1LevelSetting.Tier,
1661       seq_header->seq_tier[0]);
1662    // seq_header->decoder_model_present_for_this_op[32]; // memset default as 0
1663    // seq_header->initial_display_delay_present_flag; // coded in bitstream by default as 0
1664    // seq_header->initial_display_delay_minus_1[32];
1665    // seq_header->initial_display_delay_present_for_this_op[32]
1666    // seq_header->frame_width_bits; // coded in bitstream by default as 16
1667    // seq_header->frame_height_bits; // coded in bitstream by default as 16
1668 
1669    // frame_size (comes from input texture size)
1670    seq_header->max_frame_width = associatedMetadata.m_associatedEncodeConfig.m_currentResolution.Width;
1671    seq_header->max_frame_height = associatedMetadata.m_associatedEncodeConfig.m_currentResolution.Height;
1672 
1673    // seq_header->frame_id_numbers_present_flag; // coded in bitstream by default as 0
1674    seq_header->use_128x128_superblock =
1675       ((associatedMetadata.m_associatedEncodeConfig.m_encoderCodecSpecificConfigDesc.m_AV1Config.FeatureFlags &
1676         D3D12_VIDEO_ENCODER_AV1_FEATURE_FLAG_128x128_SUPERBLOCK) != 0) ?
1677          1 :
1678          0;
1679    seq_header->enable_filter_intra =
1680       ((associatedMetadata.m_associatedEncodeConfig.m_encoderCodecSpecificConfigDesc.m_AV1Config.FeatureFlags &
1681         D3D12_VIDEO_ENCODER_AV1_FEATURE_FLAG_FILTER_INTRA) != 0) ?
1682          1 :
1683          0;
1684    seq_header->enable_intra_edge_filter =
1685       ((associatedMetadata.m_associatedEncodeConfig.m_encoderCodecSpecificConfigDesc.m_AV1Config.FeatureFlags &
1686         D3D12_VIDEO_ENCODER_AV1_FEATURE_FLAG_INTRA_EDGE_FILTER) != 0) ?
1687          1 :
1688          0;
1689    seq_header->enable_interintra_compound =
1690       ((associatedMetadata.m_associatedEncodeConfig.m_encoderCodecSpecificConfigDesc.m_AV1Config.FeatureFlags &
1691         D3D12_VIDEO_ENCODER_AV1_FEATURE_FLAG_INTERINTRA_COMPOUND) != 0) ?
1692          1 :
1693          0;
1694    seq_header->enable_masked_compound =
1695       ((associatedMetadata.m_associatedEncodeConfig.m_encoderCodecSpecificConfigDesc.m_AV1Config.FeatureFlags &
1696         D3D12_VIDEO_ENCODER_AV1_FEATURE_FLAG_MASKED_COMPOUND) != 0) ?
1697          1 :
1698          0;
1699    seq_header->enable_warped_motion =
1700       ((associatedMetadata.m_associatedEncodeConfig.m_encoderCodecSpecificConfigDesc.m_AV1Config.FeatureFlags &
1701         D3D12_VIDEO_ENCODER_AV1_FEATURE_FLAG_WARPED_MOTION) != 0) ?
1702          1 :
1703          0;
1704    seq_header->enable_dual_filter =
1705       ((associatedMetadata.m_associatedEncodeConfig.m_encoderCodecSpecificConfigDesc.m_AV1Config.FeatureFlags &
1706         D3D12_VIDEO_ENCODER_AV1_FEATURE_FLAG_DUAL_FILTER) != 0) ?
1707          1 :
1708          0;
1709    seq_header->enable_order_hint =
1710       ((associatedMetadata.m_associatedEncodeConfig.m_encoderCodecSpecificConfigDesc.m_AV1Config.FeatureFlags &
1711         D3D12_VIDEO_ENCODER_AV1_FEATURE_FLAG_ORDER_HINT_TOOLS) != 0) ?
1712          1 :
1713          0;
1714    seq_header->enable_jnt_comp =
1715       ((associatedMetadata.m_associatedEncodeConfig.m_encoderCodecSpecificConfigDesc.m_AV1Config.FeatureFlags &
1716         D3D12_VIDEO_ENCODER_AV1_FEATURE_FLAG_JNT_COMP) != 0) ?
1717          1 :
1718          0;
1719    seq_header->enable_ref_frame_mvs =
1720       ((associatedMetadata.m_associatedEncodeConfig.m_encoderCodecSpecificConfigDesc.m_AV1Config.FeatureFlags &
1721         D3D12_VIDEO_ENCODER_AV1_FEATURE_FLAG_FRAME_REFERENCE_MOTION_VECTORS) != 0) ?
1722          1 :
1723          0;
1724    seq_header->seq_choose_screen_content_tools = 0;   // coded in bitstream by default as 0
1725    seq_header->seq_force_screen_content_tools = 0;    // coded in bitstream by default as 0
1726    seq_header->seq_choose_integer_mv = 0;             // coded in bitstream by default as 0
1727    seq_header->seq_force_integer_mv = 0;              // coded in bitstream by default as 0
1728    seq_header->order_hint_bits_minus1 =
1729       associatedMetadata.m_associatedEncodeConfig.m_encoderCodecSpecificConfigDesc.m_AV1Config.OrderHintBitsMinus1;
1730    seq_header->enable_superres =
1731       ((associatedMetadata.m_associatedEncodeConfig.m_encoderCodecSpecificConfigDesc.m_AV1Config.FeatureFlags &
1732         D3D12_VIDEO_ENCODER_AV1_FEATURE_FLAG_SUPER_RESOLUTION) != 0) ?
1733          1 :
1734          0;
1735    seq_header->enable_cdef =
1736       ((associatedMetadata.m_associatedEncodeConfig.m_encoderCodecSpecificConfigDesc.m_AV1Config.FeatureFlags &
1737         D3D12_VIDEO_ENCODER_AV1_FEATURE_FLAG_CDEF_FILTERING) != 0) ?
1738          1 :
1739          0;
1740    seq_header->enable_restoration =
1741       ((associatedMetadata.m_associatedEncodeConfig.m_encoderCodecSpecificConfigDesc.m_AV1Config.FeatureFlags &
1742         D3D12_VIDEO_ENCODER_AV1_FEATURE_FLAG_LOOP_RESTORATION_FILTER) != 0) ?
1743          1 :
1744          0;
1745 
1746    seq_header->color_config.bit_depth = associatedMetadata.m_associatedEncodeConfig.m_encodeFormatInfo.Format;
1747    // seq_header->color_config.mono_chrome; // coded in bitstream by default as 0
1748    // seq_header->color_config.color_description_present_flag; // memset default as 0
1749    // seq_header->color_config.color_primaries; // memset default as 0
1750    // seq_header->color_config.transfer_characteristics; // memset default as 0
1751    // seq_header->color_config.matrix_coefficients; // memset default as 0
1752    // seq_header->color_config.color_range; // memset default as 0
1753    seq_header->color_config.chroma_sample_position = 0;   // CSP_UNKNOWN
1754    seq_header->color_config.subsampling_x = 1;            // DX12 4:2:0 only
1755    seq_header->color_config.subsampling_y = 1;            // DX12 4:2:0 only
1756    seq_header->color_config.separate_uv_delta_q = 1;
1757 
1758    // seq_header->film_grain_params_present; // coded in bitstream by default as 1
1759 }
1760 
1761 void
fill_av1_pic_header(EncodedBitstreamResolvedMetadata & associatedMetadata,av1_pic_header_t * pic_header,const av1_seq_header_t * seqHdr,const D3D12_VIDEO_ENCODER_AV1_POST_ENCODE_VALUES * pParsedPostEncodeValues,const D3D12_VIDEO_ENCODER_AV1_PICTURE_CONTROL_SUBREGIONS_LAYOUT_DATA_TILES * pParsedTilePartitions)1762 fill_av1_pic_header(EncodedBitstreamResolvedMetadata &associatedMetadata,
1763                     av1_pic_header_t *pic_header,
1764                     const av1_seq_header_t *seqHdr,
1765                     const D3D12_VIDEO_ENCODER_AV1_POST_ENCODE_VALUES *pParsedPostEncodeValues,
1766                     const D3D12_VIDEO_ENCODER_AV1_PICTURE_CONTROL_SUBREGIONS_LAYOUT_DATA_TILES *pParsedTilePartitions)
1767 {
1768    // Set all zero by default
1769    memset(pic_header, 0, sizeof(av1_pic_header_t));
1770 
1771    {
1772       pic_header->quantization_params = pParsedPostEncodeValues->Quantization;
1773 
1774       debug_printf("[d3d12_video_enc_av1] Parsing driver post encode "
1775                    "values...D3D12_VIDEO_ENCODER_AV1_POST_ENCODE_VALUES_FLAG_QUANTIZATION\n");
1776 
1777       debug_printf("Post encode quantization_params.BaseQIndex: %" PRIu64 "\n",
1778                    pic_header->quantization_params.BaseQIndex);
1779       debug_printf("Post encode quantization_params.YDCDeltaQ: %" PRId64 "\n",
1780                    pic_header->quantization_params.YDCDeltaQ);
1781       debug_printf("Post encode quantization_params.UDCDeltaQ: %" PRId64 "\n",
1782                    pic_header->quantization_params.UDCDeltaQ);
1783       debug_printf("Post encode quantization_params.UACDeltaQ: %" PRId64 "\n",
1784                    pic_header->quantization_params.UACDeltaQ);
1785       debug_printf("Post encode quantization_params.VDCDeltaQ: %" PRId64 "\n",
1786                    pic_header->quantization_params.VDCDeltaQ);
1787       debug_printf("Post encode quantization_params.VACDeltaQ: %" PRId64 "\n",
1788                    pic_header->quantization_params.VACDeltaQ);
1789       debug_printf("Post encode quantization_params.UsingQMatrix: %" PRIu64 "\n",
1790                    pic_header->quantization_params.UsingQMatrix);
1791       debug_printf("Post encode quantization_params.QMY: %" PRIu64 "\n", pic_header->quantization_params.QMY);
1792       debug_printf("Post encode quantization_params.QMU: %" PRIu64 "\n", pic_header->quantization_params.QMU);
1793       debug_printf("Post encode quantization_params.QMV: %" PRIu64 "\n", pic_header->quantization_params.QMV);
1794    }
1795 
1796    pic_header->segmentation_enabled = 0;
1797    if ((associatedMetadata.m_associatedEncodeConfig.m_encoderPicParamsDesc.m_AV1PicData.Flags &
1798         D3D12_VIDEO_ENCODER_AV1_PICTURE_CONTROL_FLAG_ENABLE_FRAME_SEGMENTATION_AUTO) != 0) {
1799 
1800       // The segmentation info comes from the driver
1801       pic_header->segmentation_config = pParsedPostEncodeValues->SegmentationConfig;
1802       pic_header->segmentation_enabled = (pic_header->segmentation_config.NumSegments != 0);
1803    }
1804 
1805    {
1806       debug_printf("[d3d12_video_enc_av1] Parsing driver post encode "
1807                    "values...D3D12_VIDEO_ENCODER_AV1_POST_ENCODE_VALUES_FLAG_QUANTIZATION_DELTA\n");
1808       pic_header->delta_q_params = pParsedPostEncodeValues->QuantizationDelta;
1809 
1810       debug_printf("Post encode delta_q_params.DeltaQPresent: %" PRIu64 "\n", pic_header->delta_q_params.DeltaQPresent);
1811       debug_printf("Post encode delta_q_params.DeltaQRes: %" PRIu64 "\n", pic_header->delta_q_params.DeltaQRes);
1812    }
1813 
1814    {
1815       debug_printf("[d3d12_video_enc_av1] Parsing driver post encode "
1816                    "values...D3D12_VIDEO_ENCODER_AV1_POST_ENCODE_VALUES_FLAG_LOOP_FILTER_DELTA\n");
1817       pic_header->delta_lf_params = pParsedPostEncodeValues->LoopFilterDelta;
1818 
1819       debug_printf("Post encode delta_lf_params.DeltaLFMulti: %" PRIu64 "\n", pic_header->delta_lf_params.DeltaLFMulti);
1820       debug_printf("Post encode delta_lf_params.DeltaLFPresent: %" PRIu64 "\n",
1821                    pic_header->delta_lf_params.DeltaLFPresent);
1822       debug_printf("Post encode delta_lf_params.DeltaLFRes: %" PRIu64 "\n", pic_header->delta_lf_params.DeltaLFRes);
1823    }
1824 
1825    {
1826       debug_printf("[d3d12_video_enc_av1] Parsing driver post encode "
1827                    "values...D3D12_VIDEO_ENCODER_AV1_POST_ENCODE_VALUES_FLAG_LOOP_FILTER\n");
1828       pic_header->loop_filter_params = pParsedPostEncodeValues->LoopFilter;
1829 
1830       debug_printf("Post encode loop_filter_params.LoopFilterDeltaEnabled: %" PRIu64 "\n",
1831                    pic_header->loop_filter_params.LoopFilterDeltaEnabled);
1832       debug_printf("Post encode loop_filter_params.LoopFilterLevel[0]: %" PRIu64 "\n",
1833                    pic_header->loop_filter_params.LoopFilterLevel[0]);
1834       debug_printf("Post encode loop_filter_params.LoopFilterLevel[1]: %" PRIu64 "\n",
1835                    pic_header->loop_filter_params.LoopFilterLevel[1]);
1836       debug_printf("Post encode loop_filter_params.LoopFilterLevelU: %" PRIu64 "\n",
1837                    pic_header->loop_filter_params.LoopFilterLevelU);
1838       debug_printf("Post encode loop_filter_params.LoopFilterLevelV: %" PRIu64 "\n",
1839                    pic_header->loop_filter_params.LoopFilterLevelV);
1840       debug_printf("Post encode loop_filter_params.LoopFilterSharpnessLevel: %" PRIu64 "\n",
1841                    pic_header->loop_filter_params.LoopFilterSharpnessLevel);
1842       debug_printf("Post encode loop_filter_params.ModeDeltas[0]: %" PRIu64 "\n",
1843                    pic_header->loop_filter_params.ModeDeltas[0]);
1844       debug_printf("Post encode loop_filter_params.ModeDeltas[1]: %" PRIu64 "\n",
1845                    pic_header->loop_filter_params.ModeDeltas[1]);
1846       for (uint8_t i = 0; i < 8; i++) {
1847          debug_printf("Post encode loop_filter_params.RefDeltas[%d]: %" PRIu64 "\n",
1848                       i,
1849                       pic_header->loop_filter_params.RefDeltas[i]);
1850       }
1851       debug_printf("Post encode loop_filter_params.UpdateModeDelta: %" PRIu64 "\n",
1852                    pic_header->loop_filter_params.UpdateModeDelta);
1853       debug_printf("Post encode loop_filter_params.UpdateRefDelta: %" PRIu64 "\n",
1854                    pic_header->loop_filter_params.UpdateRefDelta);
1855    }
1856 
1857    {
1858       debug_printf("[d3d12_video_enc_av1] Parsing driver post encode "
1859                    "values...D3D12_VIDEO_ENCODER_AV1_POST_ENCODE_VALUES_FLAG_CDEF_DATA\n");
1860       pic_header->cdef_params = pParsedPostEncodeValues->CDEF;
1861 
1862       debug_printf("Post encode cdef_params.CdefBits: %" PRIu64 "\n", pic_header->cdef_params.CdefBits);
1863 
1864       debug_printf("Post encode cdef_params.CdefDampingMinus3: %" PRIu64 "\n",
1865                    pic_header->cdef_params.CdefDampingMinus3);
1866 
1867       for (uint8_t i = 0; i < 8; i++) {
1868          debug_printf("Post encode cdef_params.CdefYPriStrength[%d]: %" PRIu64 "\n",
1869                       i,
1870                       pic_header->cdef_params.CdefYPriStrength[i]);
1871 
1872          debug_printf("Post encode cdef_params.CdefUVPriStrength[%d]: %" PRIu64 "\n",
1873                       i,
1874                       pic_header->cdef_params.CdefUVPriStrength[i]);
1875 
1876          debug_printf("Post encode cdef_params.CdefYSecStrength[%d]: %" PRIu64 "\n",
1877                       i,
1878                       pic_header->cdef_params.CdefYSecStrength[i]);
1879 
1880          debug_printf("Post encode cdef_params.CdefUVSecStrength[%d]: %" PRIu64 "\n",
1881                       i,
1882                       pic_header->cdef_params.CdefUVSecStrength[i]);
1883       }
1884    }
1885 
1886    {
1887       debug_printf("[d3d12_video_enc_av1] Parsing driver post encode "
1888                    "values...D3D12_VIDEO_ENCODER_AV1_POST_ENCODE_VALUES_FLAG_COMPOUND_PREDICTION_MODE\n");
1889       pic_header->reference_select = (pParsedPostEncodeValues->CompoundPredictionType ==
1890                                       D3D12_VIDEO_ENCODER_AV1_COMP_PREDICTION_TYPE_SINGLE_REFERENCE) ?
1891                                         0 :
1892                                         1;
1893       debug_printf("Post encode reference_select: %" PRIu32 "\n", pic_header->reference_select);
1894    }
1895 
1896    // if ((pevFlags & D3D12_VIDEO_ENCODER_AV1_POST_ENCODE_VALUES_FLAG_CONTEXT_UPDATE_TILE_ID) != 0)
1897    // We just copy the whole structure, the driver must copy it even if the pev flag is not set
1898    pic_header->tile_info.tile_partition = *pParsedTilePartitions;
1899 
1900    {
1901       debug_printf("[d3d12_video_enc_av1] Parsing driver post encode "
1902                    "values...D3D12_VIDEO_ENCODER_AV1_POST_ENCODE_VALUES_FLAG_PRIMARY_REF_FRAME\n");
1903       pic_header->primary_ref_frame = static_cast<uint32_t>(pParsedPostEncodeValues->PrimaryRefFrame);
1904       debug_printf("Post encode primary_ref_frame: %" PRIu32 "\n", pic_header->primary_ref_frame);
1905    }
1906 
1907    debug_printf("Post encode tile_info.tile_partition.ContextUpdateTileId: %" PRIu64 "\n",
1908                 pic_header->tile_info.tile_partition.ContextUpdateTileId);
1909    debug_printf("Post encode tile_info.tile_partition.ColCount: %" PRIu64 "\n",
1910                 pic_header->tile_info.tile_partition.ColCount);
1911    debug_printf("Post encode tile_info.tile_partition.RowCount: %" PRIu64 "\n",
1912                 pic_header->tile_info.tile_partition.RowCount);
1913 
1914    assert(pic_header->tile_info.tile_partition.ColCount < 64);
1915    for (uint8_t i = 0; i < pic_header->tile_info.tile_partition.ColCount; i++) {
1916       debug_printf("Post encode tile_info.tile_partition.ColWidths[%d]: %" PRIu64 "\n",
1917                    i,
1918                    pic_header->tile_info.tile_partition.ColWidths[i]);
1919    }
1920 
1921    assert(pic_header->tile_info.tile_partition.RowCount < 64);
1922    for (uint8_t i = 0; i < pic_header->tile_info.tile_partition.RowCount; i++) {
1923       debug_printf("Post encode tile_info.tile_partition.RowHeights[%d]: %" PRIu64 "\n",
1924                    i,
1925                    pic_header->tile_info.tile_partition.RowHeights[i]);
1926    }
1927 
1928    pic_header->show_existing_frame = 0;
1929    pic_header->frame_to_show_map_idx = 0;
1930 
1931    // pic_header->display_frame_id; // frame_id_numbers_present_flag coded in bitstream by default as 0
1932 
1933    pic_header->frame_type = associatedMetadata.m_associatedEncodeConfig.m_encoderPicParamsDesc.m_AV1PicData.FrameType;
1934    {
1935       UINT EncodeOrderInGop =
1936          (associatedMetadata.m_associatedEncodeConfig.m_encoderPicParamsDesc.m_AV1PicData.PictureIndex %
1937           associatedMetadata.m_associatedEncodeConfig.m_encoderGOPConfigDesc.m_AV1SequenceStructure.IntraDistance);
1938 
1939       UINT ShowOrderInGop =
1940          (associatedMetadata.m_associatedEncodeConfig.m_encoderPicParamsDesc.m_AV1PicData.OrderHint %
1941           associatedMetadata.m_associatedEncodeConfig.m_encoderGOPConfigDesc.m_AV1SequenceStructure.IntraDistance);
1942 
1943       pic_header->show_frame = (ShowOrderInGop <= EncodeOrderInGop);
1944    }
1945 
1946    pic_header->showable_frame =   // this will always be showable for P/B frames, even when using show_frame for B
1947                                   // frame playback reordering
1948       associatedMetadata.m_associatedEncodeConfig.m_encoderPicParamsDesc.m_AV1PicData.FrameType !=
1949       D3D12_VIDEO_ENCODER_AV1_FRAME_TYPE_KEY_FRAME;
1950    pic_header->error_resilient_mode =
1951       ((associatedMetadata.m_associatedEncodeConfig.m_encoderPicParamsDesc.m_AV1PicData.Flags &
1952         D3D12_VIDEO_ENCODER_AV1_PICTURE_CONTROL_FLAG_ENABLE_ERROR_RESILIENT_MODE) != 0);
1953    pic_header->disable_cdf_update =
1954       ((associatedMetadata.m_associatedEncodeConfig.m_encoderPicParamsDesc.m_AV1PicData.Flags &
1955         D3D12_VIDEO_ENCODER_AV1_PICTURE_CONTROL_FLAG_DISABLE_CDF_UPDATE) != 0);
1956 
1957    pic_header->allow_screen_content_tools =
1958       ((associatedMetadata.m_associatedEncodeConfig.m_encoderPicParamsDesc.m_AV1PicData.Flags &
1959         D3D12_VIDEO_ENCODER_AV1_PICTURE_CONTROL_FLAG_ENABLE_PALETTE_ENCODING) != 0);
1960    pic_header->force_integer_mv =
1961       ((associatedMetadata.m_associatedEncodeConfig.m_encoderPicParamsDesc.m_AV1PicData.Flags &
1962         D3D12_VIDEO_ENCODER_AV1_PICTURE_CONTROL_FLAG_FORCE_INTEGER_MOTION_VECTORS) != 0);
1963 
1964    // frame_size_override_flag is not coded + default as 1 for SWITCH_FRAME and explicitly coded otherwise
1965    if (pic_header->frame_type == D3D12_VIDEO_ENCODER_AV1_FRAME_TYPE_SWITCH_FRAME)
1966       pic_header->frame_size_override_flag = 1;   // As per AV1 codec spec
1967    else
1968       pic_header->frame_size_override_flag = 0;   // Set as default as 0 when explicitly coded
1969 
1970    pic_header->order_hint = associatedMetadata.m_associatedEncodeConfig.m_encoderPicParamsDesc.m_AV1PicData.OrderHint;
1971 
1972    pic_header->refresh_frame_flags =
1973       associatedMetadata.m_associatedEncodeConfig.m_encoderPicParamsDesc.m_AV1PicData.RefreshFrameFlags;
1974 
1975    // frame_size (comes from input texture size)
1976    pic_header->FrameWidth = associatedMetadata.m_associatedEncodeConfig.m_currentResolution.Width;
1977    pic_header->UpscaledWidth = associatedMetadata.m_associatedEncodeConfig.m_currentResolution.Width;
1978    pic_header->FrameHeight = associatedMetadata.m_associatedEncodeConfig.m_currentResolution.Height;
1979 
1980    // render_size (comes from AV1 pipe picparams pic)
1981    pic_header->RenderWidth = associatedMetadata.m_associatedEncodeConfig.m_FrameCroppingCodecConfig.right;
1982    pic_header->RenderHeight = associatedMetadata.m_associatedEncodeConfig.m_FrameCroppingCodecConfig.bottom;
1983 
1984    bool use_128x128_superblock =
1985       ((associatedMetadata.m_associatedEncodeConfig.m_encoderCodecSpecificConfigDesc.m_AV1Config.FeatureFlags &
1986         D3D12_VIDEO_ENCODER_AV1_FEATURE_FLAG_128x128_SUPERBLOCK) != 0) ?
1987          1 :
1988          0;
1989    unsigned MiCols = 2 * ((pic_header->FrameWidth + 7) >> 3);
1990    unsigned MiRows = 2 * ((pic_header->FrameHeight + 7) >> 3);
1991    pic_header->frame_width_sb = use_128x128_superblock ? ((MiCols + 31) >> 5) : ((MiCols + 15) >> 4);
1992    pic_header->frame_height_sb = use_128x128_superblock ? ((MiRows + 31) >> 5) : ((MiRows + 15) >> 4);
1993 
1994    pic_header->use_superres = ((associatedMetadata.m_associatedEncodeConfig.m_encoderPicParamsDesc.m_AV1PicData.Flags &
1995                                 D3D12_VIDEO_ENCODER_AV1_PICTURE_CONTROL_FLAG_USE_SUPER_RESOLUTION) != 0);
1996    pic_header->SuperresDenom =
1997       associatedMetadata.m_associatedEncodeConfig.m_encoderPicParamsDesc.m_AV1PicData.SuperResDenominator;
1998 
1999    pic_header->allow_intrabc = ((associatedMetadata.m_associatedEncodeConfig.m_encoderPicParamsDesc.m_AV1PicData.Flags &
2000                                  D3D12_VIDEO_ENCODER_AV1_PICTURE_CONTROL_FLAG_ALLOW_INTRA_BLOCK_COPY) != 0);
2001 
2002    for (unsigned i = 0; i < ARRAY_SIZE(associatedMetadata.m_associatedEncodeConfig.m_encoderPicParamsDesc.m_AV1PicData
2003                                           .ReferenceFramesReconPictureDescriptors);
2004         i++) {
2005       pic_header->ref_order_hint[i] = associatedMetadata.m_associatedEncodeConfig.m_encoderPicParamsDesc.m_AV1PicData
2006                                          .ReferenceFramesReconPictureDescriptors[i]
2007                                          .OrderHint;
2008    }
2009 
2010    for (uint8_t i = 0; i < ARRAY_SIZE(pParsedPostEncodeValues->ReferenceIndices); i++)
2011       pic_header->ref_frame_idx[i] = pParsedPostEncodeValues->ReferenceIndices[i];
2012 
2013    pic_header->allow_high_precision_mv =
2014       ((associatedMetadata.m_associatedEncodeConfig.m_encoderPicParamsDesc.m_AV1PicData.Flags &
2015         D3D12_VIDEO_ENCODER_AV1_PICTURE_CONTROL_FLAG_ALLOW_HIGH_PRECISION_MV) != 0);
2016    pic_header->interpolation_filter =
2017       associatedMetadata.m_associatedEncodeConfig.m_encoderPicParamsDesc.m_AV1PicData.InterpolationFilter;
2018    pic_header->is_motion_mode_switchable =
2019       ((associatedMetadata.m_associatedEncodeConfig.m_encoderPicParamsDesc.m_AV1PicData.Flags &
2020         D3D12_VIDEO_ENCODER_AV1_PICTURE_CONTROL_FLAG_MOTION_MODE_SWITCHABLE) != 0);
2021    pic_header->use_ref_frame_mvs =
2022       ((associatedMetadata.m_associatedEncodeConfig.m_encoderPicParamsDesc.m_AV1PicData.Flags &
2023         D3D12_VIDEO_ENCODER_AV1_PICTURE_CONTROL_FLAG_FRAME_REFERENCE_MOTION_VECTORS) != 0);
2024    pic_header->disable_frame_end_update_cdf =
2025       ((associatedMetadata.m_associatedEncodeConfig.m_encoderPicParamsDesc.m_AV1PicData.Flags &
2026         D3D12_VIDEO_ENCODER_AV1_PICTURE_CONTROL_FLAG_DISABLE_FRAME_END_UPDATE_CDF) != 0);
2027 
2028    pic_header->tile_info.tile_mode = associatedMetadata.m_associatedEncodeConfig.m_encoderSliceConfigMode;
2029    pic_header->tile_info.tile_support_caps =
2030       associatedMetadata.m_associatedEncodeCapabilities.m_encoderCodecSpecificConfigCaps.m_AV1TileCaps;
2031 
2032    pic_header->tile_info.uniform_tile_spacing_flag = 0;
2033    if ((pic_header->tile_info.tile_mode == D3D12_VIDEO_ENCODER_FRAME_SUBREGION_LAYOUT_MODE_UNIFORM_GRID_PARTITION) ||
2034        (pic_header->tile_info.tile_mode == D3D12_VIDEO_ENCODER_FRAME_SUBREGION_LAYOUT_MODE_FULL_FRAME))
2035       pic_header->tile_info.uniform_tile_spacing_flag = 1;
2036    else if (pic_header->tile_info.tile_mode ==
2037             D3D12_VIDEO_ENCODER_FRAME_SUBREGION_LAYOUT_MODE_CONFIGURABLE_GRID_PARTITION)
2038       pic_header->tile_info.uniform_tile_spacing_flag = 0;
2039    else
2040       assert(false);   // Unknown pic_header->tile_info.tile_mode for AV1
2041 
2042    // lr_params
2043    for (uint32_t i = 0; i < 3; i++)
2044       pic_header->lr_params.lr_type[i] = associatedMetadata.m_associatedEncodeConfig.m_encoderPicParamsDesc.m_AV1PicData
2045                                             .FrameRestorationConfig.FrameRestorationType[i];
2046    bool lr_enabled =
2047       pic_header->lr_params.lr_type[0] || pic_header->lr_params.lr_type[1] || pic_header->lr_params.lr_type[2];
2048    if (lr_enabled) {
2049       uint8_t luma_shift_total = log2(d3d12_video_encoder_looprestorationsize_d3d12_to_uint_av1(
2050                                     associatedMetadata.m_associatedEncodeConfig.m_encoderPicParamsDesc.m_AV1PicData
2051                                        .FrameRestorationConfig.LoopRestorationPixelSize[0])) -
2052                                  6;
2053       pic_header->lr_params.lr_unit_shift = (luma_shift_total > 0) ? 1 : 0;
2054       pic_header->lr_params.lr_unit_extra_shift = (luma_shift_total > 1) ? 1 : 0;
2055       assert(associatedMetadata.m_associatedEncodeConfig.m_encoderPicParamsDesc.m_AV1PicData.FrameRestorationConfig
2056                 .LoopRestorationPixelSize[1] == associatedMetadata.m_associatedEncodeConfig.m_encoderPicParamsDesc
2057                                                    .m_AV1PicData.FrameRestorationConfig.LoopRestorationPixelSize[2]);
2058 
2059       if (associatedMetadata.m_associatedEncodeConfig.m_encoderPicParamsDesc.m_AV1PicData.FrameRestorationConfig
2060              .LoopRestorationPixelSize[1]) {
2061          pic_header->lr_params.lr_uv_shift = log2(d3d12_video_encoder_looprestorationsize_d3d12_to_uint_av1(
2062                                                 associatedMetadata.m_associatedEncodeConfig.m_encoderPicParamsDesc
2063                                                    .m_AV1PicData.FrameRestorationConfig.LoopRestorationPixelSize[1])) +
2064                                              6 + luma_shift_total;
2065       } else {
2066          pic_header->lr_params.lr_uv_shift = 0;
2067       }
2068    }
2069 
2070    pic_header->TxMode = associatedMetadata.m_associatedEncodeConfig.m_encoderPicParamsDesc.m_AV1PicData.TxMode;
2071    pic_header->skip_mode_present =
2072       ((associatedMetadata.m_associatedEncodeConfig.m_encoderPicParamsDesc.m_AV1PicData.Flags &
2073         D3D12_VIDEO_ENCODER_AV1_PICTURE_CONTROL_FLAG_ENABLE_SKIP_MODE) != 0);
2074    pic_header->allow_warped_motion =
2075       ((associatedMetadata.m_associatedEncodeConfig.m_encoderPicParamsDesc.m_AV1PicData.Flags &
2076         D3D12_VIDEO_ENCODER_AV1_PICTURE_CONTROL_FLAG_ENABLE_WARPED_MOTION) != 0);
2077    pic_header->reduced_tx_set =
2078       ((associatedMetadata.m_associatedEncodeConfig.m_encoderPicParamsDesc.m_AV1PicData.Flags &
2079         D3D12_VIDEO_ENCODER_AV1_PICTURE_CONTROL_FLAG_REDUCED_TX_SET) != 0);
2080    // pic_header->frame_refs_short_signaling; // coded in bitstream by default as 0
2081 }
2082 
2083 D3D12_VIDEO_ENCODER_AV1_RESTORATION_TILESIZE
d3d12_video_encoder_looprestorationsize_uint_to_d3d12_av1(uint32_t pixel_size)2084 d3d12_video_encoder_looprestorationsize_uint_to_d3d12_av1(uint32_t pixel_size)
2085 {
2086    switch (pixel_size) {
2087       case 32:
2088       {
2089          return D3D12_VIDEO_ENCODER_AV1_RESTORATION_TILESIZE_32x32;
2090       } break;
2091       case 64:
2092       {
2093          return D3D12_VIDEO_ENCODER_AV1_RESTORATION_TILESIZE_64x64;
2094       } break;
2095       case 128:
2096       {
2097          return D3D12_VIDEO_ENCODER_AV1_RESTORATION_TILESIZE_128x128;
2098       } break;
2099       case 256:
2100       {
2101          return D3D12_VIDEO_ENCODER_AV1_RESTORATION_TILESIZE_256x256;
2102       } break;
2103       default:
2104       {
2105          unreachable("Unsupported D3D12_VIDEO_ENCODER_AV1_PROFILE");
2106       } break;
2107    }
2108 }
2109 
2110 unsigned
d3d12_video_encoder_looprestorationsize_d3d12_to_uint_av1(D3D12_VIDEO_ENCODER_AV1_RESTORATION_TILESIZE d3d12_type)2111 d3d12_video_encoder_looprestorationsize_d3d12_to_uint_av1(D3D12_VIDEO_ENCODER_AV1_RESTORATION_TILESIZE d3d12_type)
2112 {
2113    switch (d3d12_type) {
2114       case D3D12_VIDEO_ENCODER_AV1_RESTORATION_TILESIZE_32x32:
2115       {
2116          return 32;
2117       } break;
2118       case D3D12_VIDEO_ENCODER_AV1_RESTORATION_TILESIZE_64x64:
2119       {
2120          return 64;
2121       } break;
2122       case D3D12_VIDEO_ENCODER_AV1_RESTORATION_TILESIZE_128x128:
2123       {
2124          return 128;
2125       } break;
2126       case D3D12_VIDEO_ENCODER_AV1_RESTORATION_TILESIZE_256x256:
2127       {
2128          return 256;
2129       } break;
2130       default:
2131       {
2132          unreachable("Unsupported D3D12_VIDEO_ENCODER_AV1_PROFILE");
2133       } break;
2134    }
2135 }
2136 
2137 /*
2138  * Called at get_feedback time FOR A PREVIOUSLY RECORDED AND EXECUTED FRAME
2139  */
2140 unsigned
d3d12_video_encoder_build_post_encode_codec_bitstream_av1(struct d3d12_video_encoder * pD3D12Enc,uint64_t associated_fence_value,EncodedBitstreamResolvedMetadata & associatedMetadata)2141 d3d12_video_encoder_build_post_encode_codec_bitstream_av1(struct d3d12_video_encoder *pD3D12Enc,
2142                                                           uint64_t associated_fence_value,
2143                                                           EncodedBitstreamResolvedMetadata &associatedMetadata)
2144 {
2145    // Parse the AV1 resolved metadata
2146 
2147    ID3D12Resource *pResolvedMetadataBuffer = associatedMetadata.spBuffer.Get();
2148    uint64_t resourceMetadataSize = associatedMetadata.bufferSize;
2149 
2150    struct d3d12_screen *pD3D12Screen = (struct d3d12_screen *) pD3D12Enc->m_pD3D12Screen;
2151    pipe_resource *pPipeResolvedMetadataBuffer =
2152       d3d12_resource_from_resource(&pD3D12Screen->base, pResolvedMetadataBuffer);
2153    assert(resourceMetadataSize < INT_MAX);
2154    struct pipe_box box;
2155    u_box_3d(0,                                        // x
2156             0,                                        // y
2157             0,                                        // z
2158             static_cast<int>(resourceMetadataSize),   // width
2159             1,                                        // height
2160             1,                                        // depth
2161             &box);
2162    struct pipe_transfer *mapTransferMetadata;
2163    uint8_t *pMetadataBufferSrc =
2164       reinterpret_cast<uint8_t *>(pD3D12Enc->base.context->buffer_map(pD3D12Enc->base.context,
2165                                                                       pPipeResolvedMetadataBuffer,
2166                                                                       0,
2167                                                                       PIPE_MAP_READ,
2168                                                                       &box,
2169                                                                       &mapTransferMetadata));
2170 
2171    debug_printf("[d3d12_video_enc_av1] Parsing driver resolved encode metadata...\n");
2172 
2173    D3D12_VIDEO_ENCODER_OUTPUT_METADATA *pParsedMetadata =
2174       reinterpret_cast<D3D12_VIDEO_ENCODER_OUTPUT_METADATA *>(pMetadataBufferSrc);
2175    pMetadataBufferSrc += sizeof(D3D12_VIDEO_ENCODER_OUTPUT_METADATA);
2176 
2177    D3D12_VIDEO_ENCODER_FRAME_SUBREGION_METADATA *pFrameSubregionMetadata =
2178       reinterpret_cast<D3D12_VIDEO_ENCODER_FRAME_SUBREGION_METADATA *>(pMetadataBufferSrc);
2179    pMetadataBufferSrc +=
2180       (sizeof(D3D12_VIDEO_ENCODER_FRAME_SUBREGION_METADATA) * pParsedMetadata->WrittenSubregionsCount);
2181 
2182    D3D12_VIDEO_ENCODER_AV1_PICTURE_CONTROL_SUBREGIONS_LAYOUT_DATA_TILES *pParsedTilePartitions =
2183       reinterpret_cast<D3D12_VIDEO_ENCODER_AV1_PICTURE_CONTROL_SUBREGIONS_LAYOUT_DATA_TILES *>(pMetadataBufferSrc);
2184    pMetadataBufferSrc += sizeof(D3D12_VIDEO_ENCODER_AV1_PICTURE_CONTROL_SUBREGIONS_LAYOUT_DATA_TILES);
2185 
2186    D3D12_VIDEO_ENCODER_AV1_POST_ENCODE_VALUES *pParsedPostEncodeValues =
2187       reinterpret_cast<D3D12_VIDEO_ENCODER_AV1_POST_ENCODE_VALUES *>(pMetadataBufferSrc);
2188    pMetadataBufferSrc += sizeof(D3D12_VIDEO_ENCODER_AV1_POST_ENCODE_VALUES);
2189 
2190    debug_printf("[d3d12_video_enc_av1] D3D12_VIDEO_ENCODER_OUTPUT_METADATA.EncodeErrorFlags: %" PRIx64 " \n",
2191                 pParsedMetadata->EncodeErrorFlags);
2192    debug_printf("[d3d12_video_enc_av1] D3D12_VIDEO_ENCODER_OUTPUT_METADATA.EncodeStats.AverageQP: %" PRIu64 " \n",
2193                 pParsedMetadata->EncodeStats.AverageQP);
2194    debug_printf("[d3d12_video_enc_av1] D3D12_VIDEO_ENCODER_OUTPUT_METADATA.EncodeStats.IntraCodingUnitsCount: %" PRIu64
2195                 " \n",
2196                 pParsedMetadata->EncodeStats.IntraCodingUnitsCount);
2197    debug_printf("[d3d12_video_enc_av1] D3D12_VIDEO_ENCODER_OUTPUT_METADATA.EncodeStats.InterCodingUnitsCount: %" PRIu64
2198                 " \n",
2199                 pParsedMetadata->EncodeStats.InterCodingUnitsCount);
2200    debug_printf("[d3d12_video_enc_av1] D3D12_VIDEO_ENCODER_OUTPUT_METADATA.EncodeStats.SkipCodingUnitsCount: %" PRIu64
2201                 " \n",
2202                 pParsedMetadata->EncodeStats.SkipCodingUnitsCount);
2203    debug_printf("[d3d12_video_enc_av1] "
2204                 "D3D12_VIDEO_ENCODER_OUTPUT_METADATA.EncodeStats.AverageMotionEstimationXDirection: %" PRIu64 " \n",
2205                 pParsedMetadata->EncodeStats.AverageMotionEstimationXDirection);
2206    debug_printf("[d3d12_video_enc_av1] "
2207                 "D3D12_VIDEO_ENCODER_OUTPUT_METADATA.EncodeStats.AverageMotionEstimationYDirection: %" PRIu64 " \n",
2208                 pParsedMetadata->EncodeStats.AverageMotionEstimationYDirection);
2209    debug_printf("[d3d12_video_enc_av1] D3D12_VIDEO_ENCODER_OUTPUT_METADATA.EncodedBitstreamWrittenBytesCount: %" PRIu64
2210                 " \n",
2211                 pParsedMetadata->EncodedBitstreamWrittenBytesCount);
2212    debug_printf("[d3d12_video_enc_av1] D3D12_VIDEO_ENCODER_OUTPUT_METADATA.WrittenSubregionsCount: %" PRIu64 " \n",
2213                 pParsedMetadata->WrittenSubregionsCount);
2214 
2215    for (uint8_t i = 0; i < pParsedMetadata->WrittenSubregionsCount; i++) {
2216       debug_printf("[d3d12_video_enc_av1] D3D12_VIDEO_ENCODER_FRAME_SUBREGION_METADATA[%d].bHeaderSize: %" PRIu64 " \n",
2217                    i,
2218                    pFrameSubregionMetadata[i].bHeaderSize);
2219       debug_printf("[d3d12_video_enc_av1] D3D12_VIDEO_ENCODER_FRAME_SUBREGION_METADATA[%d].bStartOffset: %" PRIu64
2220                    " \n",
2221                    i,
2222                    pFrameSubregionMetadata[i].bStartOffset);
2223       debug_printf("[d3d12_video_enc_av1] D3D12_VIDEO_ENCODER_FRAME_SUBREGION_METADATA[%d].bSize: %" PRIu64 " \n",
2224                    i,
2225                    pFrameSubregionMetadata[i].bSize);
2226    }
2227 
2228    if (pParsedMetadata->EncodeErrorFlags != D3D12_VIDEO_ENCODER_ENCODE_ERROR_FLAG_NO_ERROR) {
2229       debug_printf("[d3d12_video_enc_av1] Encode GPU command for fence %" PRIu64 " failed - EncodeErrorFlags: %" PRIu64
2230                    "\n",
2231                    associated_fence_value,
2232                    pParsedMetadata->EncodeErrorFlags);
2233       assert(false);
2234       return 0;
2235    }
2236 
2237    if (pParsedMetadata->EncodedBitstreamWrittenBytesCount == 0u) {
2238       debug_printf("[d3d12_video_enc_av1] Encode GPU command for fence %" PRIu64
2239                    " failed - EncodedBitstreamWrittenBytesCount: 0\n",
2240                    associated_fence_value);
2241       assert(false);
2242       return 0;
2243    }
2244 
2245    // Create headers
2246 
2247    av1_seq_header_t seqHdr = {};
2248    fill_av1_seq_header(associatedMetadata, &seqHdr);
2249    av1_pic_header_t picHdr = {};
2250    fill_av1_pic_header(associatedMetadata, &picHdr, &seqHdr, pParsedPostEncodeValues, pParsedTilePartitions);
2251 
2252    bool bNeedSeqUpdate = false;
2253    bool diff_uv_delta_from_pev = (picHdr.quantization_params.VDCDeltaQ != picHdr.quantization_params.UDCDeltaQ) ||
2254                                  (picHdr.quantization_params.VACDeltaQ != picHdr.quantization_params.UACDeltaQ);
2255    debug_printf("[Calculated] Post encode diff_uv_delta_from_pev: %d\n", diff_uv_delta_from_pev);
2256 
2257    // Make sure the Seq header allows diff_uv_delta from pev
2258    if (diff_uv_delta_from_pev && !seqHdr.color_config.separate_uv_delta_q) {
2259       seqHdr.color_config.separate_uv_delta_q = 1;
2260       bNeedSeqUpdate = true;
2261    }
2262 
2263    d3d12_video_bitstream_builder_av1 *pAV1BitstreamBuilder =
2264       static_cast<d3d12_video_bitstream_builder_av1 *>(pD3D12Enc->m_upBitstreamBuilder.get());
2265    assert(pAV1BitstreamBuilder);
2266 
2267    associatedMetadata.pWrittenCodecUnitsSizes.clear();
2268 
2269    size_t writtenTemporalDelimBytes = 0;
2270    if (picHdr.show_frame && associatedMetadata.m_CodecSpecificData.AV1HeadersInfo.temporal_delim_rendered) {
2271       pAV1BitstreamBuilder->write_temporal_delimiter_obu(
2272          pD3D12Enc->m_BitstreamHeadersBuffer,
2273          pD3D12Enc->m_BitstreamHeadersBuffer.begin(),   // placingPositionStart
2274          writtenTemporalDelimBytes                      // Bytes Written AFTER placingPositionStart arg above
2275       );
2276       assert(pD3D12Enc->m_BitstreamHeadersBuffer.size() == writtenTemporalDelimBytes);
2277       debug_printf("Written OBU_TEMPORAL_DELIMITER bytes: %" PRIu64 "\n", static_cast<uint64_t>(writtenTemporalDelimBytes));
2278       associatedMetadata.pWrittenCodecUnitsSizes.push_back(writtenTemporalDelimBytes);
2279    }
2280 
2281    size_t writtenSequenceBytes = 0;
2282    bool isFirstFrame = (associated_fence_value == 1);
2283 
2284    // on first frame or on resolution change or if we changed seq hdr values with post encode values
2285    bool writeNewSeqHeader = isFirstFrame || bNeedSeqUpdate ||
2286                             ((associatedMetadata.m_associatedEncodeConfig.m_seqFlags &
2287                               D3D12_VIDEO_ENCODER_SEQUENCE_CONTROL_FLAG_RESOLUTION_CHANGE) != 0);
2288 
2289    if (writeNewSeqHeader) {
2290       pAV1BitstreamBuilder->write_sequence_header(
2291          &seqHdr,
2292          pD3D12Enc->m_BitstreamHeadersBuffer,
2293          pD3D12Enc->m_BitstreamHeadersBuffer.begin() + writtenTemporalDelimBytes,   // placingPositionStart
2294          writtenSequenceBytes   // Bytes Written AFTER placingPositionStart arg above
2295       );
2296       associatedMetadata.pWrittenCodecUnitsSizes.push_back(writtenSequenceBytes);
2297       assert(pD3D12Enc->m_BitstreamHeadersBuffer.size() == (writtenSequenceBytes + writtenTemporalDelimBytes));
2298       debug_printf("Written OBU_SEQUENCE_HEADER bytes: %" PRIu64 "\n", static_cast<uint64_t>(writtenSequenceBytes));
2299    }
2300 
2301    // Only supported bitstream format is with obu_size for now.
2302    assert(associatedMetadata.m_CodecSpecificData.AV1HeadersInfo.obu_has_size_field);
2303 
2304    size_t writtenFrameBytes = 0;
2305    size_t writtenTileBytes = 0;
2306 
2307    pipe_resource *src_driver_bitstream =
2308       d3d12_resource_from_resource(&pD3D12Enc->m_pD3D12Screen->base, associatedMetadata.spStagingBitstream.Get());
2309    assert(src_driver_bitstream);
2310 
2311    size_t comp_bitstream_offset = 0;
2312    if (associatedMetadata.m_CodecSpecificData.AV1HeadersInfo.enable_frame_obu) {
2313       // FRAME_OBU combined frame and tile data case
2314 
2315       assert(associatedMetadata.m_associatedEncodeConfig.m_encoderSliceConfigDesc.m_TilesConfig_AV1.TilesGroupsCount ==
2316              1);
2317 
2318       // write_frame_header writes OBU_FRAME except tile_obu_group, but included obu_size for tile_group_obu as
2319       // calculated below
2320       size_t tile_group_obu_size = 0;
2321       size_t decode_tile_elements_size = 0;
2322       pAV1BitstreamBuilder->calculate_tile_group_obu_size(
2323          pParsedMetadata,
2324          pFrameSubregionMetadata,
2325          associatedMetadata.m_associatedEncodeCapabilities.m_encoderCodecSpecificConfigCaps.m_AV1TileCaps
2326                .TileSizeBytesMinus1 +
2327             1,
2328          associatedMetadata.m_associatedEncodeConfig.m_encoderSliceConfigDesc.m_TilesConfig_AV1.TilesPartition,
2329          associatedMetadata.m_associatedEncodeConfig.m_encoderSliceConfigDesc.m_TilesConfig_AV1.TilesGroups[0],
2330          tile_group_obu_size,
2331          decode_tile_elements_size);
2332 
2333       pAV1BitstreamBuilder->write_frame_header(
2334          &seqHdr,
2335          &picHdr,
2336          OBU_FRAME,
2337          tile_group_obu_size,   // We need it to code obu_size of OBU_FRAME open_bitstream_unit()
2338          pD3D12Enc->m_BitstreamHeadersBuffer,
2339          pD3D12Enc->m_BitstreamHeadersBuffer.begin() + writtenSequenceBytes +
2340             writtenTemporalDelimBytes,   // placingPositionStart
2341          writtenFrameBytes               // Bytes Written AFTER placingPositionStart arg above
2342       );
2343 
2344       debug_printf("Written OBU_FRAME bytes: %" PRIu64 "\n", static_cast<uint64_t>(writtenFrameBytes));
2345       associatedMetadata.pWrittenCodecUnitsSizes.push_back(writtenFrameBytes);
2346 
2347       assert(pD3D12Enc->m_BitstreamHeadersBuffer.size() ==
2348              (writtenSequenceBytes + writtenTemporalDelimBytes + writtenFrameBytes));
2349 
2350       debug_printf("Uploading %" PRIu64
2351                    " bytes from OBU sequence and/or picture headers to comp_bit_destination %p at offset 0\n",
2352                    static_cast<uint64_t>(pD3D12Enc->m_BitstreamHeadersBuffer.size()),
2353                    associatedMetadata.comp_bit_destination);
2354 
2355       // Upload headers to the finalized compressed bitstream buffer
2356       // Note: The buffer_subdata is queued in pD3D12Enc->base.context but doesn't execute immediately
2357       pD3D12Enc->base.context->buffer_subdata(pD3D12Enc->base.context,                   // context
2358                                               associatedMetadata.comp_bit_destination,   // comp. bitstream
2359                                               PIPE_MAP_WRITE,                            // usage PIPE_MAP_x
2360                                               0,                                         // offset
2361                                               pD3D12Enc->m_BitstreamHeadersBuffer.size(),
2362                                               pD3D12Enc->m_BitstreamHeadersBuffer.data());
2363 
2364       comp_bitstream_offset = pD3D12Enc->m_BitstreamHeadersBuffer.size();
2365       size_t written_bytes_to_staging_bitstream_buffer = 0;
2366 
2367       upload_tile_group_obu(
2368          pD3D12Enc,
2369          tile_group_obu_size,
2370          decode_tile_elements_size,
2371          associatedMetadata.m_StagingBitstreamConstruction,
2372          0,   // staging_bitstream_buffer_offset,
2373          src_driver_bitstream,
2374          associatedMetadata.comp_bit_destination,
2375          comp_bitstream_offset,
2376          pFrameSubregionMetadata,
2377          associatedMetadata.m_associatedEncodeCapabilities.m_encoderCodecSpecificConfigCaps.m_AV1TileCaps
2378                .TileSizeBytesMinus1 +
2379             1,
2380          associatedMetadata.m_associatedEncodeConfig.m_encoderSliceConfigDesc.m_TilesConfig_AV1.TilesPartition,
2381          associatedMetadata.m_associatedEncodeConfig.m_encoderSliceConfigDesc.m_TilesConfig_AV1.TilesGroups[0],
2382          written_bytes_to_staging_bitstream_buffer,
2383          associatedMetadata.pWrittenCodecUnitsSizes);
2384 
2385       writtenTileBytes += tile_group_obu_size;
2386       comp_bitstream_offset += writtenTileBytes;
2387 
2388       // Flush batch with upload work and wait on this CPU thread for GPU work completion
2389       {
2390          struct pipe_fence_handle *pUploadGPUCompletionFence = NULL;
2391          pD3D12Enc->base.context->flush(pD3D12Enc->base.context,
2392                                         &pUploadGPUCompletionFence,
2393                                         PIPE_FLUSH_ASYNC | PIPE_FLUSH_HINT_FINISH);
2394          assert(pUploadGPUCompletionFence);
2395          debug_printf(
2396             "[d3d12_video_encoder] d3d12_video_encoder_build_post_encode_codec_bitstream_av1 - Waiting on GPU "
2397             "completion fence for "
2398             " uploading finalized codec headers to compressed bitstream.\n");
2399 
2400          pD3D12Enc->m_pD3D12Screen->base.fence_finish(&pD3D12Enc->m_pD3D12Screen->base,
2401                                                       NULL,
2402                                                       pUploadGPUCompletionFence,
2403                                                       OS_TIMEOUT_INFINITE);
2404          pD3D12Enc->m_pD3D12Screen->base.fence_reference(&pD3D12Enc->m_pD3D12Screen->base,
2405                                                          &pUploadGPUCompletionFence,
2406                                                          NULL);
2407       }
2408    } else {
2409       // FRAME_HEADER_OBU + OBU_TILE_GROUP concatenated case
2410 
2411       // Build open_bitstream_unit for OBU_FRAME_HEADER
2412       pAV1BitstreamBuilder->write_frame_header(&seqHdr,
2413                                                &picHdr,
2414                                                OBU_FRAME_HEADER,
2415                                                0,   // no tile_obu_group in OBU_FRAME_HEADER
2416                                                pD3D12Enc->m_BitstreamHeadersBuffer,
2417                                                pD3D12Enc->m_BitstreamHeadersBuffer.begin() + writtenSequenceBytes +
2418                                                   writtenTemporalDelimBytes,   // placingPositionStart
2419                                                writtenFrameBytes   // Bytes Written AFTER placingPositionStart arg above
2420       );
2421       associatedMetadata.pWrittenCodecUnitsSizes.push_back(writtenFrameBytes);
2422 
2423       debug_printf("Written OBU_FRAME_HEADER bytes: %" PRIu64 "\n", static_cast<uint64_t>(writtenFrameBytes));
2424 
2425       assert(pD3D12Enc->m_BitstreamHeadersBuffer.size() ==
2426              (writtenSequenceBytes + writtenTemporalDelimBytes + writtenFrameBytes));
2427 
2428       debug_printf("Uploading %" PRIu64 " bytes from OBU headers to comp_bit_destination %p at offset 0\n",
2429                    static_cast<uint64_t>(pD3D12Enc->m_BitstreamHeadersBuffer.size()),
2430                    associatedMetadata.comp_bit_destination);
2431 
2432       // Upload headers to the finalized compressed bitstream buffer
2433       // Note: The buffer_subdata is queued in pD3D12Enc->base.context but doesn't execute immediately
2434       pD3D12Enc->base.context->buffer_subdata(pD3D12Enc->base.context,                   // context
2435                                               associatedMetadata.comp_bit_destination,   // comp. bitstream
2436                                               PIPE_MAP_WRITE,                            // usage PIPE_MAP_x
2437                                               0,                                         // offset
2438                                               pD3D12Enc->m_BitstreamHeadersBuffer.size(),
2439                                               pD3D12Enc->m_BitstreamHeadersBuffer.data());
2440 
2441       comp_bitstream_offset = pD3D12Enc->m_BitstreamHeadersBuffer.size();
2442       size_t staging_bitstream_buffer_offset = 0;
2443 
2444       for (int tg_idx = 0;
2445            tg_idx <
2446            associatedMetadata.m_associatedEncodeConfig.m_encoderSliceConfigDesc.m_TilesConfig_AV1.TilesGroupsCount;
2447            tg_idx++) {
2448          auto &currentTg =
2449             associatedMetadata.m_associatedEncodeConfig.m_encoderSliceConfigDesc.m_TilesConfig_AV1.TilesGroups[tg_idx];
2450 
2451          debug_printf("Uploading tile group %d to comp_bit_destination %p at offset %" PRIu64 "\n",
2452                       tg_idx,
2453                       associatedMetadata.comp_bit_destination,
2454                       static_cast<uint64_t>(comp_bitstream_offset));
2455 
2456          size_t tile_group_obu_size = 0;
2457          size_t decode_tile_elements_size = 0;
2458          pAV1BitstreamBuilder->calculate_tile_group_obu_size(
2459             pParsedMetadata,
2460             pFrameSubregionMetadata,
2461             associatedMetadata.m_associatedEncodeCapabilities.m_encoderCodecSpecificConfigCaps.m_AV1TileCaps
2462                   .TileSizeBytesMinus1 +
2463                1,
2464             associatedMetadata.m_associatedEncodeConfig.m_encoderSliceConfigDesc.m_TilesConfig_AV1.TilesPartition,
2465             currentTg,
2466             tile_group_obu_size,
2467             decode_tile_elements_size);
2468 
2469          size_t writtenTileObuPrefixBytes = 0;
2470          pAV1BitstreamBuilder->write_obu_tile_group_header(
2471             tile_group_obu_size,   // tile_group_obu() size to pack OBU_TILE_GROUP obu_size element
2472             associatedMetadata.m_StagingBitstreamConstruction,   // Source CPU buffer cannot be overwritten until
2473                                                                  // GPU upload flush finishes.
2474             associatedMetadata.m_StagingBitstreamConstruction.begin() +
2475                staging_bitstream_buffer_offset,                  // placingPositionStart
2476             writtenTileObuPrefixBytes);                          // Bytes Written AFTER placingPositionStart arg above
2477 
2478          debug_printf("Written %" PRIu64 " bytes for OBU_TILE_GROUP open_bitstream_unit() prefix with obu_header() and "
2479                       "obu_size to staging_bitstream_buffer %p at offset %" PRIu64 "\n",
2480                       static_cast<uint64_t>(writtenTileObuPrefixBytes),
2481                       associatedMetadata.m_StagingBitstreamConstruction.data(),
2482                       static_cast<uint64_t>(staging_bitstream_buffer_offset));
2483 
2484          writtenTileBytes += writtenTileObuPrefixBytes;
2485          associatedMetadata.pWrittenCodecUnitsSizes.push_back(writtenTileObuPrefixBytes);
2486 
2487          // Note: The buffer_subdata is queued in pD3D12Enc->base.context but doesn't execute immediately
2488          pD3D12Enc->base.context->buffer_subdata(
2489             pD3D12Enc->base.context,                   // context
2490             associatedMetadata.comp_bit_destination,   // comp. bitstream
2491             PIPE_MAP_WRITE,                            // usage PIPE_MAP_x
2492             comp_bitstream_offset,                     // offset
2493             writtenTileObuPrefixBytes,
2494             associatedMetadata.m_StagingBitstreamConstruction.data() + staging_bitstream_buffer_offset);
2495 
2496          debug_printf("Uploading %" PRIu64 " bytes for OBU_TILE_GROUP open_bitstream_unit() prefix with obu_header() "
2497                       "and obu_size: %" PRIu64 " to comp_bit_destination %p at offset %" PRIu64 "\n",
2498                       static_cast<uint64_t>(writtenTileObuPrefixBytes),
2499                       static_cast<uint64_t>(tile_group_obu_size),
2500                       associatedMetadata.comp_bit_destination,
2501                       static_cast<uint64_t>(comp_bitstream_offset));
2502 
2503          staging_bitstream_buffer_offset += writtenTileObuPrefixBytes;
2504 
2505          comp_bitstream_offset += writtenTileObuPrefixBytes;
2506 
2507          size_t written_bytes_to_staging_bitstream_buffer = 0;
2508          upload_tile_group_obu(
2509             pD3D12Enc,
2510             tile_group_obu_size,
2511             decode_tile_elements_size,
2512             associatedMetadata.m_StagingBitstreamConstruction,
2513             staging_bitstream_buffer_offset,
2514             src_driver_bitstream,
2515             associatedMetadata.comp_bit_destination,
2516             comp_bitstream_offset,
2517             pFrameSubregionMetadata,
2518             associatedMetadata.m_associatedEncodeCapabilities.m_encoderCodecSpecificConfigCaps.m_AV1TileCaps
2519                   .TileSizeBytesMinus1 +
2520                1,
2521             associatedMetadata.m_associatedEncodeConfig.m_encoderSliceConfigDesc.m_TilesConfig_AV1.TilesPartition,
2522             currentTg,
2523             written_bytes_to_staging_bitstream_buffer,
2524             associatedMetadata.pWrittenCodecUnitsSizes);
2525 
2526          staging_bitstream_buffer_offset += written_bytes_to_staging_bitstream_buffer;
2527          comp_bitstream_offset += tile_group_obu_size;
2528          writtenTileBytes += tile_group_obu_size;
2529 
2530          // Flush batch with upload work and wait on this CPU thread for GPU work completion
2531          // for this case we have to do it within the loop, so the CUP arrays that are reused
2532          // on each loop are completely done being read by the GPU before we modify them.
2533          {
2534             struct pipe_fence_handle *pUploadGPUCompletionFence = NULL;
2535             pD3D12Enc->base.context->flush(pD3D12Enc->base.context,
2536                                            &pUploadGPUCompletionFence,
2537                                            PIPE_FLUSH_ASYNC | PIPE_FLUSH_HINT_FINISH);
2538             assert(pUploadGPUCompletionFence);
2539             debug_printf(
2540                "[d3d12_video_encoder] d3d12_video_encoder_build_post_encode_codec_bitstream_av1 - Waiting on GPU "
2541                "completion fence for "
2542                " uploading finalized codec headers to compressed bitstream.\n");
2543 
2544             pD3D12Enc->m_pD3D12Screen->base.fence_finish(&pD3D12Enc->m_pD3D12Screen->base,
2545                                                          NULL,
2546                                                          pUploadGPUCompletionFence,
2547                                                          OS_TIMEOUT_INFINITE);
2548             pD3D12Enc->m_pD3D12Screen->base.fence_reference(&pD3D12Enc->m_pD3D12Screen->base,
2549                                                             &pUploadGPUCompletionFence,
2550                                                             NULL);
2551          }
2552       }
2553    }
2554 
2555    size_t extra_show_existing_frame_payload_bytes = 0;
2556    if (!picHdr.show_frame) {
2557 
2558       // When writing in the bitstream a frame that will be accessed as reference by a frame we did not
2559       // write to the bitstream yet, let's store them for future show_existing_frame mechanism
2560       pD3D12Enc->m_currentEncodeConfig.m_encoderCodecSpecificStateDescAV1.pendingShowableFrames.push_back(
2561          associatedMetadata.m_associatedEncodeConfig.m_encoderPicParamsDesc.m_AV1PicData.PictureIndex);
2562 
2563    } else {   // picHdr.show_frame true
2564 
2565       // Check if any of the pending "to be showed later" frames is present in the current frame references
2566       // and if so issue the show_existing_frame header and remove it from the pending list
2567 
2568       for (auto pendingFrameIt =
2569               pD3D12Enc->m_currentEncodeConfig.m_encoderCodecSpecificStateDescAV1.pendingShowableFrames.begin();
2570            pendingFrameIt !=
2571            pD3D12Enc->m_currentEncodeConfig.m_encoderCodecSpecificStateDescAV1.pendingShowableFrames.end();) {
2572 
2573          // Check if current frame references uses this pendingFrameIt
2574          int cur_ref_idx_matching_pending = -1;
2575          for (unsigned i = 0; i < ARRAY_SIZE(picHdr.ref_frame_idx) /*NUM_REF_FRAMES*/; i++) {
2576             if (
2577                // Is a valid reference
2578                (associatedMetadata.m_associatedEncodeConfig.m_encoderPicParamsDesc.m_AV1PicData
2579                    .ReferenceFramesReconPictureDescriptors[picHdr.ref_frame_idx[i]]
2580                    .ReconstructedPictureResourceIndex != UNUSED_VIRTUAL_DPB_SLOT_PHYSICAL_INDEX) &&
2581                // And matches the pending frame PictureIndex
2582                (associatedMetadata.m_associatedEncodeConfig.m_encoderPicParamsDesc.m_AV1PicData
2583                    .ReferenceFramesReconPictureDescriptors[picHdr.ref_frame_idx[i]]
2584                    .PictureIndex == *pendingFrameIt /*PictureIndex*/)) {
2585 
2586                // Store the reference index
2587                cur_ref_idx_matching_pending = picHdr.ref_frame_idx[i];
2588                break;
2589             }
2590          }
2591 
2592          // If we found a reference of the current frame using pendingFrameIt,
2593          // - Issue the show_existing_frame header
2594          // - Remove it from the pending list
2595          if (cur_ref_idx_matching_pending >= 0) {
2596             size_t staging_buf_offset = pD3D12Enc->m_BitstreamHeadersBuffer.size();
2597 
2598 
2599             size_t writtenTemporalDelimBytes = 0;
2600             if (D3D12_VIDEO_AV1_INSERT_SHOW_EXISTING_FRAME_HEADER) {
2601                pAV1BitstreamBuilder->write_temporal_delimiter_obu(
2602                   pD3D12Enc->m_BitstreamHeadersBuffer,
2603                   pD3D12Enc->m_BitstreamHeadersBuffer.begin() + staging_buf_offset,   // placingPositionStart
2604                   writtenTemporalDelimBytes   // Bytes Written AFTER placingPositionStart arg above
2605                );
2606             }
2607             associatedMetadata.pWrittenCodecUnitsSizes.push_back(writtenTemporalDelimBytes);
2608             assert(writtenTemporalDelimBytes == (pD3D12Enc->m_BitstreamHeadersBuffer.size() - staging_buf_offset));
2609 
2610             // Add current pending frame being processed in the loop
2611             extra_show_existing_frame_payload_bytes += writtenTemporalDelimBytes;
2612 
2613             debug_printf("Written OBU_TEMPORAL_DELIMITER bytes: %" PRIu64 "\n", static_cast<uint64_t>(writtenTemporalDelimBytes));
2614 
2615             size_t writtenShowExistingFrameBytes = 0;
2616             av1_pic_header_t showExistingPicHdr = {};
2617             showExistingPicHdr.show_existing_frame = 1;
2618             showExistingPicHdr.frame_to_show_map_idx = cur_ref_idx_matching_pending;
2619 
2620             if (D3D12_VIDEO_AV1_INSERT_SHOW_EXISTING_FRAME_HEADER) {
2621                pAV1BitstreamBuilder->write_frame_header(
2622                   NULL,   // No seq header necessary for show_existing_frame
2623                   &showExistingPicHdr,
2624                   OBU_FRAME_HEADER,
2625                   0,   // No tile info for OBU_FRAME_HEADER
2626                   pD3D12Enc->m_BitstreamHeadersBuffer,
2627                   pD3D12Enc->m_BitstreamHeadersBuffer.begin() + staging_buf_offset +
2628                      writtenTemporalDelimBytes,   // placingPositionStart
2629                   writtenShowExistingFrameBytes   // Bytes Written AFTER placingPositionStart arg above
2630                );
2631             }
2632             associatedMetadata.pWrittenCodecUnitsSizes.push_back(writtenShowExistingFrameBytes);
2633 
2634             assert(writtenShowExistingFrameBytes ==
2635                    (pD3D12Enc->m_BitstreamHeadersBuffer.size() - staging_buf_offset - writtenTemporalDelimBytes));
2636 
2637             // Add current pending frame being processed in the loop
2638             extra_show_existing_frame_payload_bytes += writtenShowExistingFrameBytes;
2639 
2640             assert(pD3D12Enc->m_BitstreamHeadersBuffer.size() ==
2641                    (staging_buf_offset + writtenShowExistingFrameBytes + writtenTemporalDelimBytes));
2642 
2643             // Upload headers to the finalized compressed bitstream buffer
2644             // Note: The buffer_subdata is queued in pD3D12Enc->base.context but doesn't execute immediately
2645             pD3D12Enc->base.context->buffer_subdata(pD3D12Enc->base.context,                   // context
2646                                                     associatedMetadata.comp_bit_destination,   // comp. bitstream
2647                                                     PIPE_MAP_WRITE,                            // usage PIPE_MAP_x
2648                                                     comp_bitstream_offset,                     // offset
2649                                                     writtenShowExistingFrameBytes + writtenTemporalDelimBytes,
2650                                                     pD3D12Enc->m_BitstreamHeadersBuffer.data() + staging_buf_offset);
2651 
2652             comp_bitstream_offset += writtenShowExistingFrameBytes;
2653             comp_bitstream_offset += writtenTemporalDelimBytes;
2654 
2655             debug_printf("Written show_existing_frame OBU_FRAME header for previous frame with PictureIndex %d (Used "
2656                          "in current frame ref_frame_idx[%" PRIu32 "]) bytes: %" PRIu64 "\n",
2657                          *pendingFrameIt /*PictureIndex*/,
2658                          showExistingPicHdr.frame_to_show_map_idx,
2659                          static_cast<uint64_t>(writtenShowExistingFrameBytes));
2660 
2661             // Remove it from the list of pending frames
2662             pendingFrameIt =
2663                pD3D12Enc->m_currentEncodeConfig.m_encoderCodecSpecificStateDescAV1.pendingShowableFrames.erase(
2664                   pendingFrameIt);
2665          } else {
2666             pendingFrameIt++;
2667          }
2668       }
2669 
2670       // Flush again if uploaded show_existing_frame header(s) to bitstream.
2671       if (extra_show_existing_frame_payload_bytes) {
2672          struct pipe_fence_handle *pUploadGPUCompletionFence = NULL;
2673          pD3D12Enc->base.context->flush(pD3D12Enc->base.context,
2674                                         &pUploadGPUCompletionFence,
2675                                         PIPE_FLUSH_ASYNC | PIPE_FLUSH_HINT_FINISH);
2676          assert(pUploadGPUCompletionFence);
2677          debug_printf("[d3d12_video_encoder] [show_existing_frame extra headers upload] "
2678                       "d3d12_video_encoder_build_post_encode_codec_bitstream_av1 - Waiting on GPU "
2679                       "completion fence for "
2680                       " uploading finalized codec headers to compressed bitstream.\n");
2681 
2682          pD3D12Enc->m_pD3D12Screen->base.fence_finish(&pD3D12Enc->m_pD3D12Screen->base,
2683                                                       NULL,
2684                                                       pUploadGPUCompletionFence,
2685                                                       OS_TIMEOUT_INFINITE);
2686          pD3D12Enc->m_pD3D12Screen->base.fence_reference(&pD3D12Enc->m_pD3D12Screen->base,
2687                                                          &pUploadGPUCompletionFence,
2688                                                          NULL);
2689       }
2690    }
2691 
2692    // d3d12_resource_from_resource calls AddRef to it so this should only be deleting
2693    // the pipe_resource wrapping object and not the underlying spStagingBitstream
2694    pipe_resource_reference(&src_driver_bitstream, NULL);
2695    assert(associatedMetadata.spStagingBitstream.Get());
2696 
2697    // Unmap the metadata buffer tmp storage
2698    pipe_buffer_unmap(pD3D12Enc->base.context, mapTransferMetadata);
2699    pipe_resource_reference(&pPipeResolvedMetadataBuffer, NULL);
2700 
2701    assert((writtenSequenceBytes + writtenTemporalDelimBytes + writtenFrameBytes +
2702            extra_show_existing_frame_payload_bytes) == pD3D12Enc->m_BitstreamHeadersBuffer.size());
2703 
2704    uint32_t total_bytes_written = static_cast<uint32_t>(writtenSequenceBytes + writtenTemporalDelimBytes + writtenFrameBytes +
2705                                     writtenTileBytes + extra_show_existing_frame_payload_bytes);
2706    assert(std::accumulate(associatedMetadata.pWrittenCodecUnitsSizes.begin(), associatedMetadata.pWrittenCodecUnitsSizes.end(), 0u) ==
2707       static_cast<uint64_t>(total_bytes_written));
2708    return total_bytes_written;
2709 }
2710 
2711 void
upload_tile_group_obu(struct d3d12_video_encoder * pD3D12Enc,size_t tile_group_obu_size,size_t decode_tile_elements_size,std::vector<uint8_t> & staging_bitstream_buffer,size_t staging_bitstream_buffer_offset,pipe_resource * src_driver_bitstream,pipe_resource * comp_bit_destination,size_t comp_bit_destination_offset,const D3D12_VIDEO_ENCODER_FRAME_SUBREGION_METADATA * pFrameSubregionMetadata,size_t TileSizeBytes,const D3D12_VIDEO_ENCODER_AV1_PICTURE_CONTROL_SUBREGIONS_LAYOUT_DATA_TILES & TilesPartition,const av1_tile_group_t & tileGroup,size_t & written_bytes_to_staging_bitstream_buffer,std::vector<uint64_t> & pWrittenCodecUnitsSizes)2712 upload_tile_group_obu(struct d3d12_video_encoder *pD3D12Enc,
2713                       size_t tile_group_obu_size,
2714                       size_t decode_tile_elements_size,
2715                       std::vector<uint8_t> &staging_bitstream_buffer,
2716                       size_t staging_bitstream_buffer_offset,
2717                       pipe_resource *src_driver_bitstream,
2718                       pipe_resource *comp_bit_destination,
2719                       size_t comp_bit_destination_offset,
2720                       const D3D12_VIDEO_ENCODER_FRAME_SUBREGION_METADATA *pFrameSubregionMetadata,
2721                       size_t TileSizeBytes,   // Pass already +1'd from TileSizeBytesMinus1
2722                       const D3D12_VIDEO_ENCODER_AV1_PICTURE_CONTROL_SUBREGIONS_LAYOUT_DATA_TILES &TilesPartition,
2723                       const av1_tile_group_t &tileGroup,
2724                       size_t &written_bytes_to_staging_bitstream_buffer,
2725                       std::vector<uint64_t> &pWrittenCodecUnitsSizes)
2726 {
2727    debug_printf("[Tile group start %d to end %d] Writing to comp_bit_destination %p starts at offset %" PRIu64 "\n",
2728                 tileGroup.tg_start,
2729                 tileGroup.tg_end,
2730                 comp_bit_destination,
2731                 static_cast<uint64_t>(comp_bit_destination_offset));
2732 
2733    debug_printf("[Tile group start %d to end %d] Using staging_bitstream_buffer %p at offset %" PRIu64
2734                 " to write the tile_obu_group() prefix syntax: tile_start_and_end_present_flag, tg_start, tg_end and "
2735                 "the tile_size_minus1\n",
2736                 tileGroup.tg_start,
2737                 tileGroup.tg_end,
2738                 staging_bitstream_buffer.data(),
2739                 static_cast<uint64_t>(staging_bitstream_buffer_offset));
2740 
2741    // Reserve space upfront in the scratch storage
2742    // Do not modify anything before staging_bitstream_buffer_offset
2743 
2744    size_t tile_obu_prefix_size = tile_group_obu_size - decode_tile_elements_size;
2745    if (staging_bitstream_buffer.size() < (staging_bitstream_buffer_offset + tile_obu_prefix_size))
2746       staging_bitstream_buffer.resize(staging_bitstream_buffer_offset + tile_obu_prefix_size);
2747 
2748    d3d12_video_encoder_bitstream bitstream_tile_group_obu;
2749    bitstream_tile_group_obu.setup_bitstream(staging_bitstream_buffer.size(),
2750                                             staging_bitstream_buffer.data(),
2751                                             staging_bitstream_buffer_offset);
2752 
2753    uint8_t NumTiles = TilesPartition.ColCount * TilesPartition.RowCount;
2754    bool tile_start_and_end_present_flag = !(tileGroup.tg_start == 0 && (tileGroup.tg_end == (NumTiles - 1)));
2755    if (NumTiles > 1)
2756       bitstream_tile_group_obu.put_bits(1,
2757                                         tile_start_and_end_present_flag);   // tile_start_and_end_present_flag f(1)
2758 
2759    if (!(NumTiles == 1 || !tile_start_and_end_present_flag)) {
2760       uint8_t tileBits = log2(TilesPartition.ColCount) + log2(TilesPartition.RowCount);
2761       bitstream_tile_group_obu.put_bits(tileBits, tileGroup.tg_start);   // tg_start	   f(tileBits)
2762       bitstream_tile_group_obu.put_bits(tileBits, tileGroup.tg_end);     // tg_end	      f(tileBits)
2763    }
2764 
2765    bitstream_tile_group_obu.put_aligning_bits();   // byte_alignment()
2766 
2767    bitstream_tile_group_obu.flush();
2768 
2769    size_t bitstream_tile_group_obu_bytes = bitstream_tile_group_obu.get_byte_count() - staging_bitstream_buffer_offset;
2770 
2771    debug_printf("[Tile group start %d to end %d] Written %" PRIu64
2772                 " bitstream_tile_group_obu_bytes at staging_bitstream_buffer %p at offset %" PRIu64
2773                 " for tile_obu_group() prefix syntax: tile_start_and_end_present_flag, tg_start, tg_end\n",
2774                 tileGroup.tg_start,
2775                 tileGroup.tg_end,
2776                 static_cast<uint64_t>(bitstream_tile_group_obu_bytes),
2777                 staging_bitstream_buffer.data(),
2778                 static_cast<uint64_t>(staging_bitstream_buffer_offset));
2779 
2780 
2781    // Save this to compare the final written destination byte size against the expected tile_group_obu_size
2782    // at the end of the function
2783    ASSERTED size_t comp_bit_destination_offset_before_upload = comp_bit_destination_offset;
2784 
2785    // Upload first part of the header to compressed bitstream destination
2786    // Note: The buffer_subdata is queued in pD3D12Enc->base.context but doesn't execute immediately
2787    if (bitstream_tile_group_obu_bytes > 0) {
2788       pD3D12Enc->base.context->buffer_subdata(
2789          pD3D12Enc->base.context,                                              // context
2790          comp_bit_destination,                                                 // comp. bitstream
2791          PIPE_MAP_WRITE,                                                       // usage PIPE_MAP_x
2792          comp_bit_destination_offset,                                          // offset
2793          bitstream_tile_group_obu_bytes,                                       // size
2794          staging_bitstream_buffer.data() + staging_bitstream_buffer_offset);   // data
2795 
2796       debug_printf("[Tile group start %d to end %d]  Uploading %" PRIu64 " bytes"
2797                    " for tile_obu_group() prefix syntax: tile_start_and_end_present_flag, tg_start, tg_end"
2798                    " from staging_bitstream_buffer %p at offset %" PRIu64
2799                    " to comp_bit_destination %p at offset %" PRIu64 "\n",
2800                    tileGroup.tg_start,
2801                    tileGroup.tg_end,
2802                    static_cast<uint64_t>(bitstream_tile_group_obu_bytes),
2803                    staging_bitstream_buffer.data(),
2804                    static_cast<uint64_t>(staging_bitstream_buffer_offset),
2805                    comp_bit_destination,
2806                    static_cast<uint64_t>(comp_bit_destination_offset));
2807 
2808       comp_bit_destination_offset += bitstream_tile_group_obu_bytes;
2809       written_bytes_to_staging_bitstream_buffer += bitstream_tile_group_obu_bytes;
2810    }
2811 
2812    size_t src_offset = 0;
2813    for (UINT64 TileIdx = tileGroup.tg_start; TileIdx <= tileGroup.tg_end; TileIdx++) {
2814       size_t tile_size = pFrameSubregionMetadata[TileIdx].bSize - pFrameSubregionMetadata[TileIdx].bStartOffset;
2815       // The i-th tile is read from the src_buffer[offset] with offset = [sum j = (0, (i-1)){ tile[j].bSize }] +
2816       // tile[i].bStartOffset
2817       size_t src_buf_tile_position = src_offset + pFrameSubregionMetadata[TileIdx].bStartOffset;
2818       src_offset += pFrameSubregionMetadata[TileIdx].bSize;
2819 
2820       // tile_size_minus_1	not coded for last tile
2821       if ((TileIdx != tileGroup.tg_end)) {
2822          bitstream_tile_group_obu.put_le_bytes(TileSizeBytes,   // tile_size_minus_1	le(TileSizeBytes)
2823                                                tile_size - 1 /* convert to ..._minus_1 */);
2824          bitstream_tile_group_obu.flush();
2825 
2826          debug_printf("[Tile group start %d to end %d] [TileIdx %" PRIu64 "] Written %" PRIu64
2827                       " written_bytes_to_staging_bitstream_buffer at staging_bitstream_buffer %p at offset %" PRIu64
2828                       " for the tile_size_minus1 syntax\n",
2829                       tileGroup.tg_start,
2830                       tileGroup.tg_end,
2831                       TileIdx,
2832                       static_cast<uint64_t>(TileSizeBytes),
2833                       staging_bitstream_buffer.data(),
2834                       static_cast<uint64_t>(written_bytes_to_staging_bitstream_buffer + staging_bitstream_buffer_offset));
2835 
2836          // Upload current tile_size_minus_1
2837          // Note: The buffer_subdata is queued in pD3D12Enc->base.context but doesn't execute immediately
2838          pD3D12Enc->base.context->buffer_subdata(pD3D12Enc->base.context,       // context
2839                                                  comp_bit_destination,          // comp. bitstream
2840                                                  PIPE_MAP_WRITE,                // usage PIPE_MAP_x
2841                                                  comp_bit_destination_offset,   // offset
2842                                                  TileSizeBytes,                 // size
2843                                                  staging_bitstream_buffer.data() +
2844                                                     written_bytes_to_staging_bitstream_buffer +
2845                                                     staging_bitstream_buffer_offset);   // data
2846 
2847          debug_printf("[Tile group start %d to end %d] [TileIdx %" PRIu64 "] Uploading %" PRIu64 " bytes"
2848                       " for tile_obu_group() prefix syntax: tile_size_minus_1"
2849                       " from staging_bitstream_buffer %p at offset %" PRIu64
2850                       " to comp_bit_destination %p at offset %" PRIu64 "\n",
2851                       tileGroup.tg_start,
2852                       tileGroup.tg_end,
2853                       TileIdx,
2854                       static_cast<uint64_t>(TileSizeBytes),
2855                       staging_bitstream_buffer.data(),
2856                       static_cast<uint64_t>(written_bytes_to_staging_bitstream_buffer + staging_bitstream_buffer_offset),
2857                       comp_bit_destination,
2858                       static_cast<uint64_t>(comp_bit_destination_offset));
2859 
2860          comp_bit_destination_offset += TileSizeBytes;
2861          written_bytes_to_staging_bitstream_buffer += TileSizeBytes;
2862       }
2863 
2864       // Now copy the decode_tile() element from the driver staging GPU buffer onto the finalized GPU buffer
2865 
2866       struct pipe_box src_box;
2867       u_box_3d(static_cast<int>(src_buf_tile_position),   // x
2868                0,                                         // y
2869                0,                                         // z
2870                static_cast<int>(tile_size),               // width
2871                1,                                         // height
2872                1,                                         // depth
2873                &src_box);
2874 
2875       pD3D12Enc->base.context->resource_copy_region(pD3D12Enc->base.context,       // ctx
2876                                                     comp_bit_destination,          // dst
2877                                                     0,                             // dst_level
2878                                                     comp_bit_destination_offset,   // dstX
2879                                                     0,                             // dstY
2880                                                     0,                             // dstZ
2881                                                     src_driver_bitstream,          // src
2882                                                     0,                             // src level
2883                                                     &src_box);
2884 
2885       debug_printf("[Tile group start %d to end %d] [TileIdx %" PRIu64 "] Written %" PRIu64
2886                    " tile_size bytes data from src_driver_bitstream %p at offset %" PRIu64
2887                    " into comp_bit_destination %p at offset %" PRIu64 "\n",
2888                    tileGroup.tg_start,
2889                    tileGroup.tg_end,
2890                    TileIdx,
2891                    static_cast<uint64_t>(tile_size),
2892                    src_driver_bitstream,
2893                    static_cast<uint64_t>(src_buf_tile_position),
2894                    comp_bit_destination,
2895                    static_cast<uint64_t>(comp_bit_destination_offset));
2896 
2897       comp_bit_destination_offset += tile_size;
2898 
2899       size_t cur_tile_reportable_size = tile_size;
2900       if (TileIdx != tileGroup.tg_end)
2901          cur_tile_reportable_size += TileSizeBytes; /* extra tile_size_bytes_minus1 in all tiles except last*/
2902       if (TileIdx == 0)
2903          cur_tile_reportable_size += bitstream_tile_group_obu_bytes; // part of the obu tile group header (make part of first tile)
2904       pWrittenCodecUnitsSizes.push_back(cur_tile_reportable_size);
2905    }
2906 
2907    // Make sure we wrote the expected bytes that match the obu_size elements
2908    // in the OBUs wrapping this uploaded tile_group_obu
2909    assert((comp_bit_destination_offset - comp_bit_destination_offset_before_upload) == tile_group_obu_size);
2910 }
2911 
2912 void
d3d12_video_encoder_store_current_picture_references_av1(d3d12_video_encoder * pD3D12Enc,uint64_t current_metadata_slot)2913 d3d12_video_encoder_store_current_picture_references_av1(d3d12_video_encoder *pD3D12Enc, uint64_t current_metadata_slot)
2914 {
2915    // Update DX12 picparams for post execution (get_feedback) after d3d12_video_encoder_references_manager_av1
2916    // changes
2917    pD3D12Enc->m_spEncodedFrameMetadata[current_metadata_slot].m_associatedEncodeConfig.m_encoderPicParamsDesc =
2918       pD3D12Enc->m_currentEncodeConfig.m_encoderPicParamsDesc;
2919 }
2920