1 /**************************************************************************
2 *
3 * Copyright 2013 Advanced Micro Devices, Inc.
4 *
5 * SPDX-License-Identifier: MIT
6 *
7 **************************************************************************/
8
9 #include "pipe/p_video_codec.h"
10 #include "radeon_vce.h"
11 #include "radeon_video.h"
12 #include "si_pipe.h"
13 #include "util/u_memory.h"
14 #include "util/u_video.h"
15 #include "vl/vl_video_buffer.h"
16
17 #include <stdio.h>
18
rate_control(struct rvce_encoder * enc)19 static void rate_control(struct rvce_encoder *enc)
20 {
21 uint32_t target_bits_picture =
22 enc->pic.rate_ctrl[0].target_bitrate *
23 ((float)enc->pic.rate_ctrl[0].frame_rate_den /
24 enc->pic.rate_ctrl[0].frame_rate_num);
25 uint32_t peak_bits_picture_integer =
26 enc->pic.rate_ctrl[0].peak_bitrate *
27 ((float)enc->pic.rate_ctrl[0].frame_rate_den /
28 enc->pic.rate_ctrl[0].frame_rate_num);
29 uint32_t peak_bits_picture_fraction =
30 (((enc->pic.rate_ctrl[0].peak_bitrate *
31 (uint64_t)enc->pic.rate_ctrl[0].frame_rate_den) %
32 enc->pic.rate_ctrl[0].frame_rate_num) << 32) /
33 enc->pic.rate_ctrl[0].frame_rate_num;
34
35 RVCE_BEGIN(0x04000005); // rate control
36 RVCE_CS(enc->pic.rate_ctrl[0].rate_ctrl_method); // encRateControlMethod
37 RVCE_CS(enc->pic.rate_ctrl[0].target_bitrate); // encRateControlTargetBitRate
38 RVCE_CS(enc->pic.rate_ctrl[0].peak_bitrate); // encRateControlPeakBitRate
39 RVCE_CS(enc->pic.rate_ctrl[0].frame_rate_num); // encRateControlFrameRateNum
40 RVCE_CS(0x00000000); // encGOPSize
41 RVCE_CS(enc->pic.quant_i_frames); // encQP_I
42 RVCE_CS(enc->pic.quant_p_frames); // encQP_P
43 RVCE_CS(enc->pic.quant_b_frames); // encQP_B
44 RVCE_CS(enc->pic.rate_ctrl[0].vbv_buffer_size); // encVBVBufferSize
45 RVCE_CS(enc->pic.rate_ctrl[0].frame_rate_den); // encRateControlFrameRateDen
46 RVCE_CS(0x00000000); // encVBVBufferLevel
47 RVCE_CS(0x00000000); // encMaxAUSize
48 RVCE_CS(0x00000000); // encQPInitialMode
49 RVCE_CS(target_bits_picture); // encTargetBitsPerPicture
50 RVCE_CS(peak_bits_picture_integer); // encPeakBitsPerPictureInteger
51 RVCE_CS(peak_bits_picture_fraction); // encPeakBitsPerPictureFractional
52 RVCE_CS(0x00000000); // encMinQP
53 RVCE_CS(0x00000033); // encMaxQP
54 RVCE_CS(0x00000000); // encSkipFrameEnable
55 RVCE_CS(0x00000000); // encFillerDataEnable
56 RVCE_CS(0x00000000); // encEnforceHRD
57 RVCE_CS(0x00000000); // encBPicsDeltaQP
58 RVCE_CS(0x00000000); // encReferenceBPicsDeltaQP
59 RVCE_CS(0x00000000); // encRateControlReInitDisable
60 RVCE_CS(0x00000000); // encLCVBRInitQPFlag
61 RVCE_CS(0x00000000); // encLCVBRSATDBasedNonlinearBitBudgetFlag
62 RVCE_END();
63 }
64
encode(struct rvce_encoder * enc)65 static void encode(struct rvce_encoder *enc)
66 {
67 signed luma_offset, chroma_offset, bs_offset;
68 unsigned dep, bs_idx = enc->bs_idx++;
69 int i;
70
71 if (enc->dual_inst) {
72 if (bs_idx == 0)
73 dep = 1;
74 else if (enc->pic.picture_type == PIPE_H2645_ENC_PICTURE_TYPE_IDR)
75 dep = 0;
76 else
77 dep = 2;
78 } else
79 dep = 0;
80
81 enc->task_info(enc, 0x00000003, dep, 0, bs_idx);
82
83 RVCE_BEGIN(0x05000001); // context buffer
84 RVCE_READWRITE(enc->cpb.res->buf, enc->cpb.res->domains, 0); // encodeContextAddressHi/Lo
85 RVCE_END();
86
87 bs_offset = -(signed)(bs_idx * enc->bs_size);
88
89 RVCE_BEGIN(0x05000004); // video bitstream buffer
90 RVCE_WRITE(enc->bs_handle, RADEON_DOMAIN_GTT, bs_offset); // videoBitstreamRingAddressHi/Lo
91 RVCE_CS(enc->bs_size); // videoBitstreamRingSize
92 RVCE_END();
93
94 if (enc->dual_pipe) {
95 unsigned aux_offset =
96 enc->cpb.res->buf->size - RVCE_MAX_AUX_BUFFER_NUM * RVCE_MAX_BITSTREAM_OUTPUT_ROW_SIZE * 2;
97 RVCE_BEGIN(0x05000002); // auxiliary buffer
98 for (i = 0; i < 8; ++i) {
99 RVCE_CS(aux_offset);
100 aux_offset += RVCE_MAX_BITSTREAM_OUTPUT_ROW_SIZE;
101 }
102 for (i = 0; i < 8; ++i)
103 RVCE_CS(RVCE_MAX_BITSTREAM_OUTPUT_ROW_SIZE);
104 RVCE_END();
105 }
106
107 RVCE_BEGIN(0x03000001); // encode
108 RVCE_CS(enc->pic.frame_num ? 0x0 : 0x11); // insertHeaders
109 RVCE_CS(0x00000000); // pictureStructure
110 RVCE_CS(enc->bs_size); // allowedMaxBitstreamSize
111 RVCE_CS(0x00000000); // forceRefreshMap
112 RVCE_CS(0x00000000); // insertAUD
113 RVCE_CS(0x00000000); // endOfSequence
114 RVCE_CS(0x00000000); // endOfStream
115 RVCE_READ(enc->handle, RADEON_DOMAIN_VRAM,
116 (uint64_t)enc->luma->u.legacy.level[0].offset_256B * 256); // inputPictureLumaAddressHi/Lo
117 RVCE_READ(enc->handle, RADEON_DOMAIN_VRAM,
118 (uint64_t)enc->chroma->u.legacy.level[0].offset_256B * 256); // inputPictureChromaAddressHi/Lo
119 RVCE_CS(align(enc->luma->u.legacy.level[0].nblk_y, 16)); // encInputFrameYPitch
120 RVCE_CS(enc->luma->u.legacy.level[0].nblk_x * enc->luma->bpe); // encInputPicLumaPitch
121 RVCE_CS(enc->chroma->u.legacy.level[0].nblk_x * enc->chroma->bpe); // encInputPicChromaPitch
122 if (enc->dual_pipe)
123 RVCE_CS(0x00000000); // encInputPic(Addr|Array)Mode,encDisable(TwoPipeMode|MBOffloading)
124 else
125 RVCE_CS(0x00010000); // encInputPic(Addr|Array)Mode,encDisable(TwoPipeMode|MBOffloading)
126 RVCE_CS(0x00000000); // encInputPicTileConfig
127 RVCE_CS(enc->pic.picture_type); // encPicType
128 RVCE_CS(enc->pic.picture_type == PIPE_H2645_ENC_PICTURE_TYPE_IDR);// encIdrFlag
129 RVCE_CS(0x00000000); // encIdrPicId
130 RVCE_CS(0x00000000); // encMGSKeyPic
131 RVCE_CS(!enc->pic.not_referenced); // encReferenceFlag
132 RVCE_CS(0x00000000); // encTemporalLayerIndex
133 RVCE_CS(0x00000000); // num_ref_idx_active_override_flag
134 RVCE_CS(0x00000000); // num_ref_idx_l0_active_minus1
135 RVCE_CS(0x00000000); // num_ref_idx_l1_active_minus1
136
137 i = enc->pic.frame_num - enc->pic.ref_idx_l0_list[0];
138 if (i > 1 && enc->pic.picture_type == PIPE_H2645_ENC_PICTURE_TYPE_P) {
139 RVCE_CS(0x00000001); // encRefListModificationOp
140 RVCE_CS(i - 1); // encRefListModificationNum
141 } else {
142 RVCE_CS(0x00000000); // encRefListModificationOp
143 RVCE_CS(0x00000000); // encRefListModificationNum
144 }
145
146 for (i = 0; i < 3; ++i) {
147 RVCE_CS(0x00000000); // encRefListModificationOp
148 RVCE_CS(0x00000000); // encRefListModificationNum
149 }
150 for (i = 0; i < 4; ++i) {
151 RVCE_CS(0x00000000); // encDecodedPictureMarkingOp
152 RVCE_CS(0x00000000); // encDecodedPictureMarkingNum
153 RVCE_CS(0x00000000); // encDecodedPictureMarkingIdx
154 RVCE_CS(0x00000000); // encDecodedRefBasePictureMarkingOp
155 RVCE_CS(0x00000000); // encDecodedRefBasePictureMarkingNum
156 }
157
158 // encReferencePictureL0[0]
159 RVCE_CS(0x00000000); // pictureStructure
160 if (enc->pic.picture_type == PIPE_H2645_ENC_PICTURE_TYPE_P ||
161 enc->pic.picture_type == PIPE_H2645_ENC_PICTURE_TYPE_B) {
162 struct rvce_cpb_slot *l0 = si_l0_slot(enc);
163 si_vce_frame_offset(enc, l0, &luma_offset, &chroma_offset);
164 RVCE_CS(l0->picture_type); // encPicType
165 RVCE_CS(l0->frame_num); // frameNumber
166 RVCE_CS(l0->pic_order_cnt); // pictureOrderCount
167 RVCE_CS(luma_offset); // lumaOffset
168 RVCE_CS(chroma_offset); // chromaOffset
169 } else {
170 RVCE_CS(0x00000000); // encPicType
171 RVCE_CS(0x00000000); // frameNumber
172 RVCE_CS(0x00000000); // pictureOrderCount
173 RVCE_CS(0xffffffff); // lumaOffset
174 RVCE_CS(0xffffffff); // chromaOffset
175 }
176
177 // encReferencePictureL0[1]
178 RVCE_CS(0x00000000); // pictureStructure
179 RVCE_CS(0x00000000); // encPicType
180 RVCE_CS(0x00000000); // frameNumber
181 RVCE_CS(0x00000000); // pictureOrderCount
182 RVCE_CS(0xffffffff); // lumaOffset
183 RVCE_CS(0xffffffff); // chromaOffset
184
185 // encReferencePictureL1[0]
186 RVCE_CS(0x00000000); // pictureStructure
187 if (enc->pic.picture_type == PIPE_H2645_ENC_PICTURE_TYPE_B) {
188 struct rvce_cpb_slot *l1 = si_l1_slot(enc);
189 si_vce_frame_offset(enc, l1, &luma_offset, &chroma_offset);
190 RVCE_CS(l1->picture_type); // encPicType
191 RVCE_CS(l1->frame_num); // frameNumber
192 RVCE_CS(l1->pic_order_cnt); // pictureOrderCount
193 RVCE_CS(luma_offset); // lumaOffset
194 RVCE_CS(chroma_offset); // chromaOffset
195 } else {
196 RVCE_CS(0x00000000); // encPicType
197 RVCE_CS(0x00000000); // frameNumber
198 RVCE_CS(0x00000000); // pictureOrderCount
199 RVCE_CS(0xffffffff); // lumaOffset
200 RVCE_CS(0xffffffff); // chromaOffset
201 }
202
203 si_vce_frame_offset(enc, si_current_slot(enc), &luma_offset, &chroma_offset);
204 RVCE_CS(luma_offset); // encReconstructedLumaOffset
205 RVCE_CS(chroma_offset); // encReconstructedChromaOffset
206 RVCE_CS(0x00000000); // encColocBufferOffset
207 RVCE_CS(0x00000000); // encReconstructedRefBasePictureLumaOffset
208 RVCE_CS(0x00000000); // encReconstructedRefBasePictureChromaOffset
209 RVCE_CS(0x00000000); // encReferenceRefBasePictureLumaOffset
210 RVCE_CS(0x00000000); // encReferenceRefBasePictureChromaOffset
211 RVCE_CS(0x00000000); // pictureCount
212 RVCE_CS(enc->pic.frame_num); // frameNumber
213 RVCE_CS(enc->pic.pic_order_cnt); // pictureOrderCount
214 RVCE_CS(0x00000000); // numIPicRemainInRCGOP
215 RVCE_CS(0x00000000); // numPPicRemainInRCGOP
216 RVCE_CS(0x00000000); // numBPicRemainInRCGOP
217 RVCE_CS(0x00000000); // numIRPicRemainInRCGOP
218 RVCE_CS(0x00000000); // enableIntraRefresh
219 RVCE_END();
220 }
221
/**
 * Picture-parameter hook for VCE 5.0.
 *
 * Intentionally does nothing: neither \p enc nor \p pic is read or modified.
 *
 * \param enc  encoder instance (unused)
 * \param pic  H.264 picture description (unused)
 */
void si_vce_50_get_param(struct rvce_encoder *enc, struct pipe_h264_enc_picture_desc *pic)
{
   (void)enc;
   (void)pic;
}
225
si_vce_50_init(struct rvce_encoder * enc)226 void si_vce_50_init(struct rvce_encoder *enc)
227 {
228 si_vce_40_2_2_init(enc);
229
230 /* only the two below are different */
231 enc->rate_control = rate_control;
232 enc->encode = encode;
233 enc->si_get_pic_param = si_vce_50_get_param;
234 }
235