radeonsi: use conformant line rasterization
[mesa.git] / src / gallium / drivers / radeon / radeon_vce_52.c
1 /**************************************************************************
2 *
3 * Copyright 2015 Advanced Micro Devices, Inc.
4 * All Rights Reserved.
5 *
6 * Permission is hereby granted, free of charge, to any person obtaining a
7 * copy of this software and associated documentation files (the
8 * "Software"), to deal in the Software without restriction, including
9 * without limitation the rights to use, copy, modify, merge, publish,
10 * distribute, sub license, and/or sell copies of the Software, and to
11 * permit persons to whom the Software is furnished to do so, subject to
12 * the following conditions:
13 *
14 * The above copyright notice and this permission notice (including the
15 * next paragraph) shall be included in all copies or substantial portions
16 * of the Software.
17 *
18 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS
19 * OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF
20 * MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND NON-INFRINGEMENT.
21 * IN NO EVENT SHALL THE COPYRIGHT HOLDER(S) OR AUTHOR(S) BE LIABLE FOR
22 * ANY CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT,
23 * TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN CONNECTION WITH THE
24 * SOFTWARE OR THE USE OR OTHER DEALINGS IN THE SOFTWARE.
25 *
26 **************************************************************************/
27
28 #include <stdio.h>
29
30 #include "pipe/p_video_codec.h"
31
32 #include "util/u_video.h"
33 #include "util/u_memory.h"
34
35 #include "vl/vl_video_buffer.h"
36
37 #include "r600_pipe_common.h"
38 #include "radeon_video.h"
39 #include "radeon_vce.h"
40
/*
 * Values emitted as encProfile by create(), indexed by
 * (enc->base.profile - PIPE_VIDEO_PROFILE_MPEG4_AVC_BASELINE).
 * NOTE(review): the numbers look like H.264 profile_idc codes - confirm
 * that the table order matches the pipe video profile enum.
 */
static const unsigned profiles[7] = {
	66,
	77,
	88,
	100,
	110,
	122,
	244
};
42
43 static void get_rate_control_param(struct rvce_encoder *enc, struct pipe_h264_enc_picture_desc *pic)
44 {
45 enc->enc_pic.rc.rc_method = pic->rate_ctrl.rate_ctrl_method;
46 enc->enc_pic.rc.target_bitrate = pic->rate_ctrl.target_bitrate;
47 enc->enc_pic.rc.peak_bitrate = pic->rate_ctrl.peak_bitrate;
48 enc->enc_pic.rc.quant_i_frames = pic->quant_i_frames;
49 enc->enc_pic.rc.quant_p_frames = pic->quant_p_frames;
50 enc->enc_pic.rc.quant_b_frames = pic->quant_b_frames;
51 enc->enc_pic.rc.frame_rate_num = pic->rate_ctrl.frame_rate_num;
52 enc->enc_pic.rc.frame_rate_den = pic->rate_ctrl.frame_rate_den;
53 enc->enc_pic.rc.max_qp = 51;
54 enc->enc_pic.rc.vbv_buffer_size = pic->rate_ctrl.vbv_buffer_size;
55 enc->enc_pic.rc.vbv_buf_lv = 0;
56 enc->enc_pic.rc.fill_data_enable = 0;
57 enc->enc_pic.rc.enforce_hrd = 0;
58 enc->enc_pic.rc.target_bits_picture = pic->rate_ctrl.target_bits_picture;
59 enc->enc_pic.rc.peak_bits_picture_integer = pic->rate_ctrl.peak_bits_picture_integer;
60 enc->enc_pic.rc.peak_bits_picture_fraction = pic->rate_ctrl.peak_bits_picture_fraction;
61 }
62
63 static void get_motion_estimation_param(struct rvce_encoder *enc, struct pipe_h264_enc_picture_desc *pic)
64 {
65 enc->enc_pic.me.motion_est_quarter_pixel = 0x00000000;
66 enc->enc_pic.me.enc_disable_sub_mode = 0x000000fe;
67 enc->enc_pic.me.lsmvert = 0x00000000;
68 enc->enc_pic.me.enc_en_ime_overw_dis_subm = 0x00000000;
69 enc->enc_pic.me.enc_ime_overw_dis_subm_no = 0x00000000;
70 enc->enc_pic.me.enc_ime2_search_range_x = 0x00000001;
71 enc->enc_pic.me.enc_ime2_search_range_y = 0x00000001;
72 enc->enc_pic.me.enc_ime_decimation_search = 0x00000001;
73 enc->enc_pic.me.motion_est_half_pixel = 0x00000001;
74 enc->enc_pic.me.enc_search_range_x = 0x00000010;
75 enc->enc_pic.me.enc_search_range_y = 0x00000010;
76 enc->enc_pic.me.enc_search1_range_x = 0x00000010;
77 enc->enc_pic.me.enc_search1_range_y = 0x00000010;
78 }
79
80 static void get_pic_control_param(struct rvce_encoder *enc, struct pipe_h264_enc_picture_desc *pic)
81 {
82 unsigned encNumMBsPerSlice;
83 encNumMBsPerSlice = align(enc->base.width, 16) / 16;
84 encNumMBsPerSlice *= align(enc->base.height, 16) / 16;
85 enc->enc_pic.pc.enc_crop_right_offset = (align(enc->base.width, 16) - enc->base.width) >> 1;
86 enc->enc_pic.pc.enc_crop_bottom_offset = (align(enc->base.height, 16) - enc->base.height) >> 1;
87 enc->enc_pic.pc.enc_num_mbs_per_slice = encNumMBsPerSlice;
88 enc->enc_pic.pc.enc_b_pic_pattern = MAX2(enc->base.max_references, 1) - 1;
89 enc->enc_pic.pc.enc_number_of_reference_frames = MIN2(enc->base.max_references, 2);
90 enc->enc_pic.pc.enc_max_num_ref_frames = enc->base.max_references + 1;
91 enc->enc_pic.pc.enc_num_default_active_ref_l0 = 0x00000001;
92 enc->enc_pic.pc.enc_num_default_active_ref_l1 = 0x00000001;
93 enc->enc_pic.pc.enc_cabac_enable = 0x00000000;
94 enc->enc_pic.pc.enc_constraint_set_flags = 0x00000040;
95 enc->enc_pic.pc.enc_num_default_active_ref_l0 = 0x00000001;
96 enc->enc_pic.pc.enc_num_default_active_ref_l1 = 0x00000001;
97 }
98
99 static void get_task_info_param(struct rvce_encoder *enc)
100 {
101 enc->enc_pic.ti.offset_of_next_task_info = 0xffffffff;
102 }
103
104 static void get_feedback_buffer_param(struct rvce_encoder *enc)
105 {
106 enc->enc_pic.fb.feedback_ring_size = 0x00000001;
107 }
108
109 static void get_config_ext_param(struct rvce_encoder *enc)
110 {
111 enc->enc_pic.ce.enc_enable_perf_logging = 0x00000003;
112 }
113
114 static void get_vui_param(struct rvce_encoder *enc, struct pipe_h264_enc_picture_desc *pic)
115 {
116 enc->enc_pic.enable_vui = (pic->rate_ctrl.frame_rate_num != 0);
117 enc->enc_pic.vui.video_format = 0x00000005;
118 enc->enc_pic.vui.color_prim = 0x00000002;
119 enc->enc_pic.vui.transfer_char = 0x00000002;
120 enc->enc_pic.vui.matrix_coef = 0x00000002;
121 enc->enc_pic.vui.timing_info_present_flag = 0x00000001;
122 enc->enc_pic.vui.num_units_in_tick = pic->rate_ctrl.frame_rate_den;
123 enc->enc_pic.vui.time_scale = pic->rate_ctrl.frame_rate_num * 2;
124 enc->enc_pic.vui.fixed_frame_rate_flag = 0x00000001;
125 enc->enc_pic.vui.bit_rate_scale = 0x00000004;
126 enc->enc_pic.vui.cpb_size_scale = 0x00000006;
127 enc->enc_pic.vui.initial_cpb_removal_delay_length_minus1 = 0x00000017;
128 enc->enc_pic.vui.cpb_removal_delay_length_minus1 = 0x00000017;
129 enc->enc_pic.vui.dpb_output_delay_length_minus1 = 0x00000017;
130 enc->enc_pic.vui.time_offset_length = 0x00000018;
131 enc->enc_pic.vui.motion_vectors_over_pic_boundaries_flag = 0x00000001;
132 enc->enc_pic.vui.max_bytes_per_pic_denom = 0x00000002;
133 enc->enc_pic.vui.max_bits_per_mb_denom = 0x00000001;
134 enc->enc_pic.vui.log2_max_mv_length_hori = 0x00000010;
135 enc->enc_pic.vui.log2_max_mv_length_vert = 0x00000010;
136 enc->enc_pic.vui.num_reorder_frames = 0x00000003;
137 enc->enc_pic.vui.max_dec_frame_buffering = 0x00000003;
138 }
139
140 void radeon_vce_52_get_param(struct rvce_encoder *enc, struct pipe_h264_enc_picture_desc *pic)
141 {
142 get_rate_control_param(enc, pic);
143 get_motion_estimation_param(enc, pic);
144 get_pic_control_param(enc, pic);
145 get_task_info_param(enc);
146 get_feedback_buffer_param(enc);
147 get_vui_param(enc, pic);
148 get_config_ext_param(enc);
149
150 enc->enc_pic.picture_type = pic->picture_type;
151 enc->enc_pic.frame_num = pic->frame_num;
152 enc->enc_pic.pic_order_cnt = pic->pic_order_cnt;
153 enc->enc_pic.ref_idx_l0 = pic->ref_idx_l0;
154 enc->enc_pic.ref_idx_l1 = pic->ref_idx_l1;
155 enc->enc_pic.not_referenced = pic->not_referenced;
156 }
157
158 static void create(struct rvce_encoder *enc)
159 {
160 enc->task_info(enc, 0x00000000, 0, 0, 0);
161
162 RVCE_BEGIN(0x01000001); // create cmd
163 RVCE_CS(enc->enc_pic.ec.enc_use_circular_buffer);
164 RVCE_CS(profiles[enc->base.profile -
165 PIPE_VIDEO_PROFILE_MPEG4_AVC_BASELINE]); // encProfile
166 RVCE_CS(enc->base.level); // encLevel
167 RVCE_CS(enc->enc_pic.ec.enc_pic_struct_restriction);
168 RVCE_CS(enc->base.width); // encImageWidth
169 RVCE_CS(enc->base.height); // encImageHeight
170 RVCE_CS(enc->luma->level[0].pitch_bytes); // encRefPicLumaPitch
171 RVCE_CS(enc->chroma->level[0].pitch_bytes); // encRefPicChromaPitch
172 RVCE_CS(align(enc->luma->npix_y, 16) / 8); // encRefYHeightInQw
173 RVCE_CS(enc->enc_pic.addrmode_arraymode_disrdo_distwoinstants);
174
175 RVCE_CS(enc->enc_pic.ec.enc_pre_encode_context_buffer_offset);
176 RVCE_CS(enc->enc_pic.ec.enc_pre_encode_input_luma_buffer_offset);
177 RVCE_CS(enc->enc_pic.ec.enc_pre_encode_input_chroma_buffer_offset);
178 RVCE_CS(enc->enc_pic.ec.enc_pre_encode_mode_chromaflag_vbaqmode_scenechangesensitivity);
179 RVCE_END();
180 }
181
182 static void encode(struct rvce_encoder *enc)
183 {
184 signed luma_offset, chroma_offset, bs_offset;
185 unsigned dep, bs_idx = enc->bs_idx++;
186 int i;
187
188 if (enc->dual_inst) {
189 if (bs_idx == 0)
190 dep = 1;
191 else if (enc->enc_pic.picture_type == PIPE_H264_ENC_PICTURE_TYPE_IDR)
192 dep = 0;
193 else
194 dep = 2;
195 } else
196 dep = 0;
197
198 enc->task_info(enc, 0x00000003, dep, 0, bs_idx);
199
200 RVCE_BEGIN(0x05000001); // context buffer
201 RVCE_READWRITE(enc->cpb.res->buf, enc->cpb.res->domains, 0); // encodeContextAddressHi/Lo
202 RVCE_END();
203
204 bs_offset = -(signed)(bs_idx * enc->bs_size);
205
206 RVCE_BEGIN(0x05000004); // video bitstream buffer
207 RVCE_WRITE(enc->bs_handle, RADEON_DOMAIN_GTT, bs_offset); // videoBitstreamRingAddressHi/Lo
208 RVCE_CS(enc->bs_size); // videoBitstreamRingSize
209 RVCE_END();
210
211 if (enc->dual_pipe) {
212 unsigned aux_offset = enc->cpb.res->buf->size -
213 RVCE_MAX_AUX_BUFFER_NUM * RVCE_MAX_BITSTREAM_OUTPUT_ROW_SIZE * 2;
214 RVCE_BEGIN(0x05000002); // auxiliary buffer
215 for (i = 0; i < 8; ++i) {
216 RVCE_CS(aux_offset);
217 aux_offset += RVCE_MAX_BITSTREAM_OUTPUT_ROW_SIZE;
218 }
219 for (i = 0; i < 8; ++i)
220 RVCE_CS(RVCE_MAX_BITSTREAM_OUTPUT_ROW_SIZE);
221 RVCE_END();
222 }
223
224 RVCE_BEGIN(0x03000001); // encode
225 RVCE_CS(enc->enc_pic.frame_num ? 0x0 : 0x11); // insertHeaders
226 RVCE_CS(enc->enc_pic.eo.picture_structure);
227 RVCE_CS(enc->bs_size); // allowedMaxBitstreamSize
228 RVCE_CS(enc->enc_pic.eo.force_refresh_map);
229 RVCE_CS(enc->enc_pic.eo.insert_aud);
230 RVCE_CS(enc->enc_pic.eo.end_of_sequence);
231 RVCE_CS(enc->enc_pic.eo.end_of_stream);
232 RVCE_READ(enc->handle, RADEON_DOMAIN_VRAM,
233 enc->luma->level[0].offset); // inputPictureLumaAddressHi/Lo
234 RVCE_READ(enc->handle, RADEON_DOMAIN_VRAM,
235 enc->chroma->level[0].offset); // inputPictureChromaAddressHi/Lo
236 RVCE_CS(align(enc->luma->npix_y, 16)); // encInputFrameYPitch
237 RVCE_CS(enc->luma->level[0].pitch_bytes); // encInputPicLumaPitch
238 RVCE_CS(enc->chroma->level[0].pitch_bytes); // encInputPicChromaPitch
239 if (enc->dual_pipe)
240 enc->enc_pic.eo.enc_input_pic_addr_array_disable2pipe_disablemboffload = 0x00000000;
241 else
242 enc->enc_pic.eo.enc_input_pic_addr_array_disable2pipe_disablemboffload = 0x00010000;
243 RVCE_CS(enc->enc_pic.eo.enc_input_pic_addr_array_disable2pipe_disablemboffload);
244 RVCE_CS(enc->enc_pic.eo.enc_input_pic_tile_config);
245 RVCE_CS(enc->enc_pic.picture_type); // encPicType
246 RVCE_CS(enc->enc_pic.picture_type == PIPE_H264_ENC_PICTURE_TYPE_IDR); // encIdrFlag
247 if ((enc->enc_pic.picture_type == PIPE_H264_ENC_PICTURE_TYPE_IDR) && (enc->enc_pic.eo.enc_idr_pic_id !=0))
248 enc->enc_pic.eo.enc_idr_pic_id = enc->enc_pic.idr_pic_id - 1;
249 else
250 enc->enc_pic.eo.enc_idr_pic_id = 0x00000000;
251 RVCE_CS(enc->enc_pic.eo.enc_idr_pic_id);
252 RVCE_CS(enc->enc_pic.eo.enc_mgs_key_pic);
253 RVCE_CS(!enc->enc_pic.not_referenced);
254 RVCE_CS(enc->enc_pic.eo.enc_temporal_layer_index);
255 RVCE_CS(enc->enc_pic.eo.num_ref_idx_active_override_flag);
256 RVCE_CS(enc->enc_pic.eo.num_ref_idx_l0_active_minus1);
257 RVCE_CS(enc->enc_pic.eo.num_ref_idx_l1_active_minus1);
258
259 i = enc->enc_pic.frame_num - enc->enc_pic.ref_idx_l0;
260 if (i > 1 && enc->enc_pic.picture_type == PIPE_H264_ENC_PICTURE_TYPE_P) {
261 enc->enc_pic.eo.enc_ref_list_modification_op = 0x00000001;
262 enc->enc_pic.eo.enc_ref_list_modification_num = i - 1;
263 RVCE_CS(enc->enc_pic.eo.enc_ref_list_modification_op);
264 RVCE_CS(enc->enc_pic.eo.enc_ref_list_modification_num);
265 } else {
266 enc->enc_pic.eo.enc_ref_list_modification_op = 0x00000000;
267 enc->enc_pic.eo.enc_ref_list_modification_num = 0x00000000;
268 RVCE_CS(enc->enc_pic.eo.enc_ref_list_modification_op);
269 RVCE_CS(enc->enc_pic.eo.enc_ref_list_modification_num);
270 }
271
272 for (i = 0; i < 3; ++i) {
273 enc->enc_pic.eo.enc_ref_list_modification_op = 0x00000000;
274 enc->enc_pic.eo.enc_ref_list_modification_num = 0x00000000;
275 RVCE_CS(enc->enc_pic.eo.enc_ref_list_modification_op);
276 RVCE_CS(enc->enc_pic.eo.enc_ref_list_modification_num);
277 }
278 for (i = 0; i < 4; ++i) {
279 RVCE_CS(enc->enc_pic.eo.enc_decoded_picture_marking_op);
280 RVCE_CS(enc->enc_pic.eo.enc_decoded_picture_marking_num);
281 RVCE_CS(enc->enc_pic.eo.enc_decoded_picture_marking_idx);
282 RVCE_CS(enc->enc_pic.eo.enc_decoded_ref_base_picture_marking_op);
283 RVCE_CS(enc->enc_pic.eo.enc_decoded_ref_base_picture_marking_num);
284 }
285
286 // encReferencePictureL0[0]
287 RVCE_CS(0x00000000); // pictureStructure
288 if(enc->enc_pic.picture_type == PIPE_H264_ENC_PICTURE_TYPE_P ||
289 enc->enc_pic.picture_type == PIPE_H264_ENC_PICTURE_TYPE_B) {
290 struct rvce_cpb_slot *l0 = l0_slot(enc);
291 rvce_frame_offset(enc, l0, &luma_offset, &chroma_offset);
292 RVCE_CS(l0->picture_type);
293 RVCE_CS(l0->frame_num);
294 RVCE_CS(l0->pic_order_cnt);
295 RVCE_CS(luma_offset);
296 RVCE_CS(chroma_offset);
297 } else {
298 enc->enc_pic.eo.l0_enc_pic_type = 0x00000000;
299 enc->enc_pic.eo.l0_frame_number = 0x00000000;
300 enc->enc_pic.eo.l0_picture_order_count = 0x00000000;
301 enc->enc_pic.eo.l0_luma_offset = 0xffffffff;
302 enc->enc_pic.eo.l0_chroma_offset = 0xffffffff;
303 RVCE_CS(enc->enc_pic.eo.l0_enc_pic_type);
304 RVCE_CS(enc->enc_pic.eo.l0_frame_number);
305 RVCE_CS(enc->enc_pic.eo.l0_picture_order_count);
306 RVCE_CS(enc->enc_pic.eo.l0_luma_offset);
307 RVCE_CS(enc->enc_pic.eo.l0_chroma_offset);
308 }
309
310 // encReferencePictureL0[1]
311 enc->enc_pic.eo.l0_picture_structure = 0x00000000;
312 enc->enc_pic.eo.l0_enc_pic_type = 0x00000000;
313 enc->enc_pic.eo.l0_frame_number = 0x00000000;
314 enc->enc_pic.eo.l0_picture_order_count = 0x00000000;
315 enc->enc_pic.eo.l0_luma_offset = 0xffffffff;
316 enc->enc_pic.eo.l0_chroma_offset = 0xffffffff;
317 RVCE_CS(enc->enc_pic.eo.l0_picture_structure);
318 RVCE_CS(enc->enc_pic.eo.l0_enc_pic_type);
319 RVCE_CS(enc->enc_pic.eo.l0_frame_number);
320 RVCE_CS(enc->enc_pic.eo.l0_picture_order_count);
321 RVCE_CS(enc->enc_pic.eo.l0_luma_offset);
322 RVCE_CS(enc->enc_pic.eo.l0_chroma_offset);
323
324 // encReferencePictureL1[0]
325 RVCE_CS(0x00000000); // pictureStructure
326 if(enc->enc_pic.picture_type == PIPE_H264_ENC_PICTURE_TYPE_B) {
327 struct rvce_cpb_slot *l1 = l1_slot(enc);
328 rvce_frame_offset(enc, l1, &luma_offset, &chroma_offset);
329 RVCE_CS(l1->picture_type);
330 RVCE_CS(l1->frame_num);
331 RVCE_CS(l1->pic_order_cnt);
332 RVCE_CS(luma_offset);
333 RVCE_CS(chroma_offset);
334 } else {
335 enc->enc_pic.eo.l1_enc_pic_type = 0x00000000;
336 enc->enc_pic.eo.l1_frame_number = 0x00000000;
337 enc->enc_pic.eo.l1_picture_order_count = 0x00000000;
338 enc->enc_pic.eo.l1_luma_offset = 0xffffffff;
339 enc->enc_pic.eo.l1_chroma_offset = 0xffffffff;
340 RVCE_CS(enc->enc_pic.eo.l1_enc_pic_type);
341 RVCE_CS(enc->enc_pic.eo.l1_frame_number);
342 RVCE_CS(enc->enc_pic.eo.l1_picture_order_count);
343 RVCE_CS(enc->enc_pic.eo.l1_luma_offset);
344 RVCE_CS(enc->enc_pic.eo.l1_chroma_offset);
345 }
346
347 rvce_frame_offset(enc, current_slot(enc), &luma_offset, &chroma_offset);
348 RVCE_CS(luma_offset);
349 RVCE_CS(chroma_offset);
350 RVCE_CS(enc->enc_pic.eo.enc_coloc_buffer_offset);
351 RVCE_CS(enc->enc_pic.eo.enc_reconstructed_ref_base_picture_luma_offset);
352 RVCE_CS(enc->enc_pic.eo.enc_reconstructed_ref_base_picture_chroma_offset);
353 RVCE_CS(enc->enc_pic.eo.enc_reference_ref_base_picture_luma_offset);
354 RVCE_CS(enc->enc_pic.eo.enc_reference_ref_base_picture_chroma_offset);
355 RVCE_CS(enc->enc_pic.frame_num_cnt-1);
356 RVCE_CS(enc->enc_pic.frame_num);
357 RVCE_CS(enc->enc_pic.pic_order_cnt);
358 RVCE_CS(enc->enc_pic.i_remain);
359 RVCE_CS(enc->enc_pic.p_remain);
360 RVCE_CS(enc->enc_pic.eo.num_b_pic_remain_in_rcgop);
361 RVCE_CS(enc->enc_pic.eo.num_ir_pic_remain_in_rcgop);
362 RVCE_CS(enc->enc_pic.eo.enable_intra_refresh);
363
364 RVCE_CS(enc->enc_pic.eo.aq_variance_en);
365 RVCE_CS(enc->enc_pic.eo.aq_block_size);
366 RVCE_CS(enc->enc_pic.eo.aq_mb_variance_sel);
367 RVCE_CS(enc->enc_pic.eo.aq_frame_variance_sel);
368 RVCE_CS(enc->enc_pic.eo.aq_param_a);
369 RVCE_CS(enc->enc_pic.eo.aq_param_b);
370 RVCE_CS(enc->enc_pic.eo.aq_param_c);
371 RVCE_CS(enc->enc_pic.eo.aq_param_d);
372 RVCE_CS(enc->enc_pic.eo.aq_param_e);
373
374 RVCE_CS(enc->enc_pic.eo.context_in_sfb);
375 RVCE_END();
376 }
377
378 static void rate_control(struct rvce_encoder *enc)
379 {
380 RVCE_BEGIN(0x04000005); // rate control
381 RVCE_CS(enc->enc_pic.rc.rc_method);
382 RVCE_CS(enc->enc_pic.rc.target_bitrate);
383 RVCE_CS(enc->enc_pic.rc.peak_bitrate);
384 RVCE_CS(enc->enc_pic.rc.frame_rate_num);
385 RVCE_CS(enc->enc_pic.rc.gop_size);
386 RVCE_CS(enc->enc_pic.rc.quant_i_frames);
387 RVCE_CS(enc->enc_pic.rc.quant_p_frames);
388 RVCE_CS(enc->enc_pic.rc.quant_b_frames);
389 RVCE_CS(enc->enc_pic.rc.vbv_buffer_size);
390 RVCE_CS(enc->enc_pic.rc.frame_rate_den);
391 RVCE_CS(enc->enc_pic.rc.vbv_buf_lv);
392 RVCE_CS(enc->enc_pic.rc.max_au_size);
393 RVCE_CS(enc->enc_pic.rc.qp_initial_mode);
394 RVCE_CS(enc->enc_pic.rc.target_bits_picture);
395 RVCE_CS(enc->enc_pic.rc.peak_bits_picture_integer);
396 RVCE_CS(enc->enc_pic.rc.peak_bits_picture_fraction);
397 RVCE_CS(enc->enc_pic.rc.min_qp);
398 RVCE_CS(enc->enc_pic.rc.max_qp);
399 RVCE_CS(enc->enc_pic.rc.skip_frame_enable);
400 RVCE_CS(enc->enc_pic.rc.fill_data_enable);
401 RVCE_CS(enc->enc_pic.rc.enforce_hrd);
402 RVCE_CS(enc->enc_pic.rc.b_pics_delta_qp);
403 RVCE_CS(enc->enc_pic.rc.ref_b_pics_delta_qp);
404 RVCE_CS(enc->enc_pic.rc.rc_reinit_disable);
405 RVCE_CS(enc->enc_pic.rc.enc_lcvbr_init_qp_flag);
406 RVCE_CS(enc->enc_pic.rc.lcvbrsatd_based_nonlinear_bit_budget_flag);
407 RVCE_END();
408 }
409
410 static void config(struct rvce_encoder *enc)
411 {
412 enc->task_info(enc, 0x00000002, 0, 0xffffffff, 0);
413 enc->rate_control(enc);
414 enc->config_extension(enc);
415 enc->motion_estimation(enc);
416 enc->rdo(enc);
417 if (enc->use_vui)
418 enc->vui(enc);
419 enc->pic_control(enc);
420 }
421
422 static void config_extension(struct rvce_encoder *enc)
423 {
424 RVCE_BEGIN(0x04000001); // config extension
425 RVCE_CS(enc->enc_pic.ce.enc_enable_perf_logging);
426 RVCE_END();
427 }
428
429 static void destroy(struct rvce_encoder *enc)
430 {
431 enc->task_info(enc, 0x00000001, 0, 0, 0);
432
433 RVCE_BEGIN(0x02000001); // destroy
434 RVCE_END();
435 }
436
437 static void feedback(struct rvce_encoder *enc)
438 {
439 RVCE_BEGIN(0x05000005); // feedback buffer
440 RVCE_WRITE(enc->fb->res->buf, enc->fb->res->domains, 0x0); // feedbackRingAddressHi/Lo
441 RVCE_CS(enc->enc_pic.fb.feedback_ring_size);
442 RVCE_END();
443 }
444
445 static void motion_estimation(struct rvce_encoder *enc)
446 {
447 RVCE_BEGIN(0x04000007); // motion estimation
448 RVCE_CS(enc->enc_pic.me.enc_ime_decimation_search);
449 RVCE_CS(enc->enc_pic.me.motion_est_half_pixel);
450 RVCE_CS(enc->enc_pic.me.motion_est_quarter_pixel);
451 RVCE_CS(enc->enc_pic.me.disable_favor_pmv_point);
452 RVCE_CS(enc->enc_pic.me.force_zero_point_center);
453 RVCE_CS(enc->enc_pic.me.lsmvert);
454 RVCE_CS(enc->enc_pic.me.enc_search_range_x);
455 RVCE_CS(enc->enc_pic.me.enc_search_range_y);
456 RVCE_CS(enc->enc_pic.me.enc_search1_range_x);
457 RVCE_CS(enc->enc_pic.me.enc_search1_range_y);
458 RVCE_CS(enc->enc_pic.me.disable_16x16_frame1);
459 RVCE_CS(enc->enc_pic.me.disable_satd);
460 RVCE_CS(enc->enc_pic.me.enable_amd);
461 RVCE_CS(enc->enc_pic.me.enc_disable_sub_mode);
462 RVCE_CS(enc->enc_pic.me.enc_ime_skip_x);
463 RVCE_CS(enc->enc_pic.me.enc_ime_skip_y);
464 RVCE_CS(enc->enc_pic.me.enc_en_ime_overw_dis_subm);
465 RVCE_CS(enc->enc_pic.me.enc_ime_overw_dis_subm_no);
466 RVCE_CS(enc->enc_pic.me.enc_ime2_search_range_x);
467 RVCE_CS(enc->enc_pic.me.enc_ime2_search_range_y);
468 RVCE_CS(enc->enc_pic.me.parallel_mode_speedup_enable);
469 RVCE_CS(enc->enc_pic.me.fme0_enc_disable_sub_mode);
470 RVCE_CS(enc->enc_pic.me.fme1_enc_disable_sub_mode);
471 RVCE_CS(enc->enc_pic.me.ime_sw_speedup_enable);
472 RVCE_END();
473 }
474
475 static void pic_control(struct rvce_encoder *enc)
476 {
477 RVCE_BEGIN(0x04000002); // pic control
478 RVCE_CS(enc->enc_pic.pc.enc_use_constrained_intra_pred);
479 RVCE_CS(enc->enc_pic.pc.enc_cabac_enable);
480 RVCE_CS(enc->enc_pic.pc.enc_cabac_idc);
481 RVCE_CS(enc->enc_pic.pc.enc_loop_filter_disable);
482 RVCE_CS(enc->enc_pic.pc.enc_lf_beta_offset);
483 RVCE_CS(enc->enc_pic.pc.enc_lf_alpha_c0_offset);
484 RVCE_CS(enc->enc_pic.pc.enc_crop_left_offset);
485 RVCE_CS(enc->enc_pic.pc.enc_crop_right_offset);
486 RVCE_CS(enc->enc_pic.pc.enc_crop_top_offset);
487 RVCE_CS(enc->enc_pic.pc.enc_crop_bottom_offset);
488 RVCE_CS(enc->enc_pic.pc.enc_num_mbs_per_slice);
489 RVCE_CS(enc->enc_pic.pc.enc_intra_refresh_num_mbs_per_slot);
490 RVCE_CS(enc->enc_pic.pc.enc_force_intra_refresh);
491 RVCE_CS(enc->enc_pic.pc.enc_force_imb_period);
492 RVCE_CS(enc->enc_pic.pc.enc_pic_order_cnt_type);
493 RVCE_CS(enc->enc_pic.pc.log2_max_pic_order_cnt_lsb_minus4);
494 RVCE_CS(enc->enc_pic.pc.enc_sps_id);
495 RVCE_CS(enc->enc_pic.pc.enc_pps_id);
496 RVCE_CS(enc->enc_pic.pc.enc_constraint_set_flags);
497 RVCE_CS(enc->enc_pic.pc.enc_b_pic_pattern);
498 RVCE_CS(enc->enc_pic.pc.weight_pred_mode_b_picture);
499 RVCE_CS(enc->enc_pic.pc.enc_number_of_reference_frames);
500 RVCE_CS(enc->enc_pic.pc.enc_max_num_ref_frames);
501 RVCE_CS(enc->enc_pic.pc.enc_num_default_active_ref_l0);
502 RVCE_CS(enc->enc_pic.pc.enc_num_default_active_ref_l1);
503 RVCE_CS(enc->enc_pic.pc.enc_slice_mode);
504 RVCE_CS(enc->enc_pic.pc.enc_max_slice_size);
505 RVCE_END();
506 }
507
508 static void rdo(struct rvce_encoder *enc)
509 {
510 RVCE_BEGIN(0x04000008); // rdo
511 RVCE_CS(enc->enc_pic.rdo.enc_disable_tbe_pred_i_frame);
512 RVCE_CS(enc->enc_pic.rdo.enc_disable_tbe_pred_p_frame);
513 RVCE_CS(enc->enc_pic.rdo.use_fme_interpol_y);
514 RVCE_CS(enc->enc_pic.rdo.use_fme_interpol_uv);
515 RVCE_CS(enc->enc_pic.rdo.use_fme_intrapol_y);
516 RVCE_CS(enc->enc_pic.rdo.use_fme_intrapol_uv);
517 RVCE_CS(enc->enc_pic.rdo.use_fme_interpol_y_1);
518 RVCE_CS(enc->enc_pic.rdo.use_fme_interpol_uv_1);
519 RVCE_CS(enc->enc_pic.rdo.use_fme_intrapol_y_1);
520 RVCE_CS(enc->enc_pic.rdo.use_fme_intrapol_uv_1);
521 RVCE_CS(enc->enc_pic.rdo.enc_16x16_cost_adj);
522 RVCE_CS(enc->enc_pic.rdo.enc_skip_cost_adj);
523 RVCE_CS(enc->enc_pic.rdo.enc_force_16x16_skip);
524 RVCE_CS(enc->enc_pic.rdo.enc_disable_threshold_calc_a);
525 RVCE_CS(enc->enc_pic.rdo.enc_luma_coeff_cost);
526 RVCE_CS(enc->enc_pic.rdo.enc_luma_mb_coeff_cost);
527 RVCE_CS(enc->enc_pic.rdo.enc_chroma_coeff_cost);
528 RVCE_END();
529 }
530
531 static void session(struct rvce_encoder *enc)
532 {
533 RVCE_BEGIN(0x00000001); // session cmd
534 RVCE_CS(enc->stream_handle);
535 RVCE_END();
536 }
537
538 static void task_info(struct rvce_encoder *enc, uint32_t op,
539 uint32_t dep, uint32_t fb_idx, uint32_t ring_idx)
540 {
541 RVCE_BEGIN(0x00000002); // task info
542 if (op == 0x3) {
543 if (enc->task_info_idx) {
544 uint32_t offs = enc->cs->current.cdw - enc->task_info_idx + 3;
545 // Update offsetOfNextTaskInfo
546 enc->cs->current.buf[enc->task_info_idx] = offs;
547 }
548 enc->task_info_idx = enc->cs->current.cdw;
549 }
550 enc->enc_pic.ti.task_operation = op;
551 enc->enc_pic.ti.reference_picture_dependency = dep;
552 enc->enc_pic.ti.feedback_index = fb_idx;
553 enc->enc_pic.ti.video_bitstream_ring_index = ring_idx;
554 RVCE_CS(enc->enc_pic.ti.offset_of_next_task_info);
555 RVCE_CS(enc->enc_pic.ti.task_operation);
556 RVCE_CS(enc->enc_pic.ti.reference_picture_dependency);
557 RVCE_CS(enc->enc_pic.ti.collocate_flag_dependency);
558 RVCE_CS(enc->enc_pic.ti.feedback_index);
559 RVCE_CS(enc->enc_pic.ti.video_bitstream_ring_index);
560 RVCE_END();
561 }
562
563 static void vui(struct rvce_encoder *enc)
564 {
565 int i;
566
567 if (!enc->enc_pic.enable_vui)
568 return;
569
570 RVCE_BEGIN(0x04000009); // vui
571 RVCE_CS(enc->enc_pic.vui.aspect_ratio_info_present_flag);
572 RVCE_CS(enc->enc_pic.vui.aspect_ratio_idc);
573 RVCE_CS(enc->enc_pic.vui.sar_width);
574 RVCE_CS(enc->enc_pic.vui.sar_height);
575 RVCE_CS(enc->enc_pic.vui.overscan_info_present_flag);
576 RVCE_CS(enc->enc_pic.vui.overscan_Approp_flag);
577 RVCE_CS(enc->enc_pic.vui.video_signal_type_present_flag);
578 RVCE_CS(enc->enc_pic.vui.video_format);
579 RVCE_CS(enc->enc_pic.vui.video_full_range_flag);
580 RVCE_CS(enc->enc_pic.vui.color_description_present_flag);
581 RVCE_CS(enc->enc_pic.vui.color_prim);
582 RVCE_CS(enc->enc_pic.vui.transfer_char);
583 RVCE_CS(enc->enc_pic.vui.matrix_coef);
584 RVCE_CS(enc->enc_pic.vui.chroma_loc_info_present_flag);
585 RVCE_CS(enc->enc_pic.vui.chroma_loc_top);
586 RVCE_CS(enc->enc_pic.vui.chroma_loc_bottom);
587 RVCE_CS(enc->enc_pic.vui.timing_info_present_flag);
588 RVCE_CS(enc->enc_pic.vui.num_units_in_tick);
589 RVCE_CS(enc->enc_pic.vui.time_scale);
590 RVCE_CS(enc->enc_pic.vui.fixed_frame_rate_flag);
591 RVCE_CS(enc->enc_pic.vui.nal_hrd_parameters_present_flag);
592 RVCE_CS(enc->enc_pic.vui.cpb_cnt_minus1);
593 RVCE_CS(enc->enc_pic.vui.bit_rate_scale);
594 RVCE_CS(enc->enc_pic.vui.cpb_size_scale);
595 for (i = 0; i < 32; i++) {
596 RVCE_CS(enc->enc_pic.vui.bit_rate_value_minus);
597 RVCE_CS(enc->enc_pic.vui.cpb_size_value_minus);
598 RVCE_CS(enc->enc_pic.vui.cbr_flag);
599 }
600 RVCE_CS(enc->enc_pic.vui.initial_cpb_removal_delay_length_minus1);
601 RVCE_CS(enc->enc_pic.vui.cpb_removal_delay_length_minus1);
602 RVCE_CS(enc->enc_pic.vui.dpb_output_delay_length_minus1);
603 RVCE_CS(enc->enc_pic.vui.time_offset_length);
604 RVCE_CS(enc->enc_pic.vui.low_delay_hrd_flag);
605 RVCE_CS(enc->enc_pic.vui.pic_struct_present_flag);
606 RVCE_CS(enc->enc_pic.vui.bitstream_restriction_present_flag);
607 RVCE_CS(enc->enc_pic.vui.motion_vectors_over_pic_boundaries_flag);
608 RVCE_CS(enc->enc_pic.vui.max_bytes_per_pic_denom);
609 RVCE_CS(enc->enc_pic.vui.max_bits_per_mb_denom);
610 RVCE_CS(enc->enc_pic.vui.log2_max_mv_length_hori);
611 RVCE_CS(enc->enc_pic.vui.log2_max_mv_length_vert);
612 RVCE_CS(enc->enc_pic.vui.num_reorder_frames);
613 RVCE_CS(enc->enc_pic.vui.max_dec_frame_buffering);
614 RVCE_END();
615 }
616
617 void radeon_vce_52_init(struct rvce_encoder *enc)
618 {
619 enc->session = session;
620 enc->task_info = task_info;
621 enc->create = create;
622 enc->feedback = feedback;
623 enc->rate_control = rate_control;
624 enc->config_extension = config_extension;
625 enc->pic_control = pic_control;
626 enc->motion_estimation = motion_estimation;
627 enc->rdo = rdo;
628 enc->vui = vui;
629 enc->config = config;
630 enc->encode = encode;
631 enc->destroy = destroy;
632 }