• Home
  • Line#
  • Scopes#
  • Navigate#
  • Raw
  • Download
1 /**************************************************************************
2  *
3  * Copyright 2015 Advanced Micro Devices, Inc.
4  *
5  * SPDX-License-Identifier: MIT
6  *
7  **************************************************************************/
8 
9 #include "pipe/p_video_codec.h"
10 #include "radeon_vce.h"
11 #include "radeon_video.h"
12 #include "radeon_bitstream.h"
13 #include "radeonsi/si_pipe.h"
14 #include "util/u_memory.h"
15 #include "util/u_video.h"
16 #include "vl/vl_video_buffer.h"
17 
18 #include <stdio.h>
19 
20 #define REF_LIST_MODIFICATION_OP_END                  0
21 #define REF_LIST_MODIFICATION_OP_SHORT_TERM_SUBTRACT  1
22 #define REF_LIST_MODIFICATION_OP_LONG_TERM            2
23 #define REF_LIST_MODIFICATION_OP_VIEW_ADD             3
24 
25 #define INTRAREFRESH_METHOD_BAR_BASED                 6
26 
get_rate_control_param(struct rvce_encoder * enc,struct pipe_h264_enc_picture_desc * pic)27 static void get_rate_control_param(struct rvce_encoder *enc, struct pipe_h264_enc_picture_desc *pic)
28 {
29    enc->enc_pic.rc.rc_method = pic->rate_ctrl[0].rate_ctrl_method;
30    enc->enc_pic.rc.target_bitrate = pic->rate_ctrl[0].target_bitrate;
31    enc->enc_pic.rc.peak_bitrate = pic->rate_ctrl[0].peak_bitrate;
32    enc->enc_pic.rc.quant_i_frames = pic->quant_i_frames;
33    enc->enc_pic.rc.quant_p_frames = pic->quant_p_frames;
34    enc->enc_pic.rc.quant_b_frames = pic->quant_b_frames;
35    enc->enc_pic.rc.gop_size = pic->gop_size;
36    enc->enc_pic.rc.frame_rate_num = pic->rate_ctrl[0].frame_rate_num;
37    enc->enc_pic.rc.frame_rate_den = pic->rate_ctrl[0].frame_rate_den;
38    enc->enc_pic.rc.min_qp = pic->rate_ctrl[0].min_qp;
39    enc->enc_pic.rc.max_qp = pic->rate_ctrl[0].max_qp ? pic->rate_ctrl[0].max_qp : 51;
40    enc->enc_pic.rc.max_au_size = pic->rate_ctrl[0].max_au_size;
41    enc->enc_pic.rc.vbv_buffer_size = pic->rate_ctrl[0].vbv_buffer_size;
42    enc->enc_pic.rc.vbv_buf_lv = pic->rate_ctrl[0].vbv_buf_lv;
43    enc->enc_pic.rc.fill_data_enable = pic->rate_ctrl[0].fill_data_enable;
44    enc->enc_pic.rc.enforce_hrd = pic->rate_ctrl[0].enforce_hrd;
45    enc->enc_pic.rc.target_bits_picture =
46       enc->pic.rate_ctrl[0].target_bitrate *
47       ((float)enc->pic.rate_ctrl[0].frame_rate_den /
48       enc->pic.rate_ctrl[0].frame_rate_num);
49    enc->enc_pic.rc.peak_bits_picture_integer =
50       enc->pic.rate_ctrl[0].peak_bitrate *
51       ((float)enc->pic.rate_ctrl[0].frame_rate_den /
52       enc->pic.rate_ctrl[0].frame_rate_num);
53    enc->enc_pic.rc.peak_bits_picture_fraction =
54       (((enc->pic.rate_ctrl[0].peak_bitrate *
55       (uint64_t)enc->pic.rate_ctrl[0].frame_rate_den) %
56       enc->pic.rate_ctrl[0].frame_rate_num) << 32) /
57       enc->pic.rate_ctrl[0].frame_rate_num;
58 }
59 
get_motion_estimation_param(struct rvce_encoder * enc,struct pipe_h264_enc_picture_desc * pic)60 static void get_motion_estimation_param(struct rvce_encoder *enc,
61                                         struct pipe_h264_enc_picture_desc *pic)
62 {
63    enc->enc_pic.me.enc_ime_decimation_search = 1;
64    enc->enc_pic.me.motion_est_half_pixel = 1;
65    enc->enc_pic.me.motion_est_quarter_pixel = 1;
66    enc->enc_pic.me.disable_favor_pmv_point = 0;
67    enc->enc_pic.me.lsmvert = 2;
68    enc->enc_pic.me.disable_16x16_frame1 = 0;
69    enc->enc_pic.me.disable_satd = 0;
70    enc->enc_pic.me.enc_ime_skip_x = 0;
71    enc->enc_pic.me.enc_ime_skip_y = 0;
72    enc->enc_pic.me.enc_ime2_search_range_x = 4;
73    enc->enc_pic.me.enc_ime2_search_range_y = 4;
74    enc->enc_pic.me.parallel_mode_speedup_enable = 0;
75    enc->enc_pic.me.fme0_enc_disable_sub_mode = 0;
76    enc->enc_pic.me.fme1_enc_disable_sub_mode = 0;
77    enc->enc_pic.me.ime_sw_speedup_enable = 0;
78 
79    switch (pic->quality_modes.preset_mode) {
80    case 0: /* SPEED */
81       enc->enc_pic.me.force_zero_point_center = 0;
82       enc->enc_pic.me.enc_search_range_x = 16;
83       enc->enc_pic.me.enc_search_range_y = 16;
84       enc->enc_pic.me.enc_search1_range_x = 16;
85       enc->enc_pic.me.enc_search1_range_y = 16;
86       enc->enc_pic.me.enable_amd = 0;
87       enc->enc_pic.me.enc_disable_sub_mode = 126;
88       enc->enc_pic.me.enc_en_ime_overw_dis_subm = 0;
89       enc->enc_pic.me.enc_ime_overw_dis_subm_no = 0;
90       break;
91    case 1: /* BALANCED */
92       enc->enc_pic.me.force_zero_point_center = 0;
93       enc->enc_pic.me.enc_search_range_x = 16;
94       enc->enc_pic.me.enc_search_range_y = 16;
95       enc->enc_pic.me.enc_search1_range_x = 16;
96       enc->enc_pic.me.enc_search1_range_y = 16;
97       enc->enc_pic.me.enable_amd = 0;
98       enc->enc_pic.me.enc_disable_sub_mode = 120;
99       enc->enc_pic.me.enc_en_ime_overw_dis_subm = 1;
100       enc->enc_pic.me.enc_ime_overw_dis_subm_no = 1;
101       break;
102    case 2: /* QUALITY */
103    default:
104       enc->enc_pic.me.force_zero_point_center = 1;
105       enc->enc_pic.me.enc_search_range_x = 36;
106       enc->enc_pic.me.enc_search_range_y = 36;
107       enc->enc_pic.me.enc_search1_range_x = 36;
108       enc->enc_pic.me.enc_search1_range_y = 36;
109       enc->enc_pic.me.enable_amd = 1;
110       enc->enc_pic.me.enc_disable_sub_mode = 0;
111       enc->enc_pic.me.enc_en_ime_overw_dis_subm = 0;
112       enc->enc_pic.me.enc_ime_overw_dis_subm_no = 0;
113       break;
114    }
115 }
116 
get_pic_control_param(struct rvce_encoder * enc,struct pipe_h264_enc_picture_desc * pic)117 static void get_pic_control_param(struct rvce_encoder *enc, struct pipe_h264_enc_picture_desc *pic)
118 {
119    uint32_t num_mbs_total, num_mbs_in_slice;
120 
121    num_mbs_total = DIV_ROUND_UP(enc->base.width, 16) * DIV_ROUND_UP(enc->base.height, 16);
122 
123    if (pic->num_slice_descriptors <= 1) {
124       num_mbs_in_slice = num_mbs_total;
125    } else {
126       bool use_app_config = true;
127       num_mbs_in_slice = pic->slices_descriptors[0].num_macroblocks;
128 
129       /* All slices must have equal size */
130       for (unsigned i = 1; i < pic->num_slice_descriptors - 1; i++) {
131          if (num_mbs_in_slice != pic->slices_descriptors[i].num_macroblocks)
132             use_app_config = false;
133       }
134       /* Except last one can be smaller */
135       if (pic->slices_descriptors[pic->num_slice_descriptors - 1].num_macroblocks > num_mbs_in_slice)
136          use_app_config = false;
137 
138       if (!use_app_config) {
139          assert(num_mbs_total >= pic->num_slice_descriptors);
140          num_mbs_in_slice =
141             (num_mbs_total + pic->num_slice_descriptors - 1) / pic->num_slice_descriptors;
142       }
143    }
144 
145    if (pic->seq.enc_frame_cropping_flag) {
146       enc->enc_pic.pc.enc_crop_left_offset = pic->seq.enc_frame_crop_left_offset;
147       enc->enc_pic.pc.enc_crop_right_offset = pic->seq.enc_frame_crop_right_offset;
148       enc->enc_pic.pc.enc_crop_top_offset = pic->seq.enc_frame_crop_top_offset;
149       enc->enc_pic.pc.enc_crop_bottom_offset = pic->seq.enc_frame_crop_bottom_offset;
150    }
151    enc->enc_pic.pc.enc_num_mbs_per_slice = num_mbs_in_slice;
152    enc->enc_pic.pc.enc_number_of_reference_frames = 1;
153    enc->enc_pic.pc.enc_max_num_ref_frames = pic->seq.max_num_ref_frames;
154    enc->enc_pic.pc.enc_num_default_active_ref_l0 = pic->pic_ctrl.num_ref_idx_l0_default_active_minus1 + 1;
155    enc->enc_pic.pc.enc_num_default_active_ref_l1 = pic->pic_ctrl.num_ref_idx_l1_default_active_minus1 + 1;
156    enc->enc_pic.pc.enc_slice_mode = 1;
157    enc->enc_pic.pc.enc_use_constrained_intra_pred = pic->pic_ctrl.constrained_intra_pred_flag;
158    enc->enc_pic.pc.enc_cabac_enable = pic->pic_ctrl.enc_cabac_enable;
159    enc->enc_pic.pc.enc_cabac_idc = pic->pic_ctrl.enc_cabac_init_idc;
160    enc->enc_pic.pc.enc_constraint_set_flags = pic->seq.enc_constraint_set_flags << 2;
161    enc->enc_pic.pc.enc_loop_filter_disable = !!pic->dbk.disable_deblocking_filter_idc;
162    enc->enc_pic.pc.enc_lf_beta_offset = pic->dbk.beta_offset_div2;
163    enc->enc_pic.pc.enc_lf_alpha_c0_offset = pic->dbk.alpha_c0_offset_div2;
164    enc->enc_pic.pc.enc_pic_order_cnt_type = pic->seq.pic_order_cnt_type;
165    enc->enc_pic.pc.log2_max_pic_order_cnt_lsb_minus4 = pic->seq.log2_max_pic_order_cnt_lsb_minus4;
166 }
167 
get_task_info_param(struct rvce_encoder * enc)168 static void get_task_info_param(struct rvce_encoder *enc)
169 {
170    enc->enc_pic.ti.offset_of_next_task_info = 0xffffffff;
171 }
172 
get_feedback_buffer_param(struct rvce_encoder * enc,struct pipe_enc_feedback_metadata * metadata)173 static void get_feedback_buffer_param(struct rvce_encoder *enc, struct pipe_enc_feedback_metadata* metadata)
174 {
175    enc->enc_pic.fb.feedback_ring_size = 0x00000001;
176 }
177 
get_config_ext_param(struct rvce_encoder * enc)178 static void get_config_ext_param(struct rvce_encoder *enc)
179 {
180    enc->enc_pic.ce.enc_enable_perf_logging = 0x00000003;
181 }
182 
get_param(struct rvce_encoder * enc,struct pipe_h264_enc_picture_desc * pic)183 static void get_param(struct rvce_encoder *enc, struct pipe_h264_enc_picture_desc *pic)
184 {
185    int i;
186 
187    get_rate_control_param(enc, pic);
188    get_motion_estimation_param(enc, pic);
189    get_pic_control_param(enc, pic);
190    get_task_info_param(enc);
191    get_feedback_buffer_param(enc, NULL);
192    get_config_ext_param(enc);
193 
194    enc->enc_pic.picture_type = pic->picture_type;
195    enc->enc_pic.frame_num = pic->frame_num;
196    enc->enc_pic.frame_num_cnt = pic->frame_num_cnt - 1;
197    enc->enc_pic.p_remain = pic->p_remain;
198    enc->enc_pic.i_remain = pic->i_remain;
199    enc->enc_pic.pic_order_cnt = pic->pic_order_cnt;
200    enc->enc_pic.not_referenced = pic->not_referenced;
201    enc->enc_pic.addrmode_arraymode_disrdo_distwoinstants = 0x01000201;
202    enc->enc_pic.is_idr = (pic->picture_type == PIPE_H2645_ENC_PICTURE_TYPE_IDR);
203    enc->enc_pic.eo.enc_idr_pic_id = pic->idr_pic_id;
204    enc->enc_pic.ec.enc_vbaq_mode =
205       pic->rate_ctrl[0].rate_ctrl_method != PIPE_H2645_ENC_RATE_CONTROL_METHOD_DISABLE &&
206       pic->quality_modes.vbaq_mode;
207    if (pic->intra_refresh.mode != PIPE_VIDEO_ENC_INTRA_REFRESH_NONE) {
208       enc->enc_pic.eo.enable_intra_refresh = 1;
209       enc->enc_pic.pc.enc_force_intra_refresh = INTRAREFRESH_METHOD_BAR_BASED;
210       enc->enc_pic.pc.enc_intra_refresh_num_mbs_per_slot = pic->intra_refresh.region_size;
211    } else {
212       enc->enc_pic.eo.enable_intra_refresh = 0;
213    }
214 
215    enc->enc_pic.eo.num_ref_idx_active_override_flag = pic->slice.num_ref_idx_active_override_flag;
216    enc->enc_pic.eo.num_ref_idx_l0_active_minus1 = pic->slice.num_ref_idx_l0_active_minus1;
217    enc->enc_pic.eo.num_ref_idx_l1_active_minus1 = pic->slice.num_ref_idx_l1_active_minus1;
218 
219    i = 0;
220    if (pic->slice.ref_pic_list_modification_flag_l0) {
221       for (; i < MIN2(4, pic->slice.num_ref_list0_mod_operations); i++) {
222          struct pipe_h264_ref_list_mod_entry *entry = &pic->slice.ref_list0_mod_operations[i];
223          switch (entry->modification_of_pic_nums_idc) {
224          case 0:
225             enc->enc_pic.eo.enc_ref_list_modification_op[i] = REF_LIST_MODIFICATION_OP_SHORT_TERM_SUBTRACT;
226             enc->enc_pic.eo.enc_ref_list_modification_num[i] = entry->abs_diff_pic_num_minus1;
227             break;
228          case 2:
229             enc->enc_pic.eo.enc_ref_list_modification_op[i] = REF_LIST_MODIFICATION_OP_LONG_TERM;
230             enc->enc_pic.eo.enc_ref_list_modification_num[i] = entry->long_term_pic_num;
231             break;
232          case 5:
233             enc->enc_pic.eo.enc_ref_list_modification_op[i] = REF_LIST_MODIFICATION_OP_VIEW_ADD;
234             enc->enc_pic.eo.enc_ref_list_modification_num[i] = entry->abs_diff_pic_num_minus1;
235             break;
236          default:
237          case 3:
238             enc->enc_pic.eo.enc_ref_list_modification_op[i] = REF_LIST_MODIFICATION_OP_END;
239             break;
240          }
241       }
242    }
243    if (i < 4)
244       enc->enc_pic.eo.enc_ref_list_modification_op[i] = REF_LIST_MODIFICATION_OP_END;
245 
246    i = 0;
247    if (pic->pic_ctrl.nal_unit_type == PIPE_H264_NAL_IDR_SLICE) {
248       enc->enc_pic.eo.enc_decoded_picture_marking_op[i++] = pic->slice.long_term_reference_flag ? 6 : 0;
249    } else if (pic->slice.adaptive_ref_pic_marking_mode_flag) {
250       for (; i < MIN2(4, pic->slice.num_ref_pic_marking_operations); i++) {
251          struct pipe_h264_ref_pic_marking_entry *entry = &pic->slice.ref_pic_marking_operations[i];
252          enc->enc_pic.eo.enc_decoded_picture_marking_op[i] = entry->memory_management_control_operation;
253          switch (entry->memory_management_control_operation) {
254          case 1:
255             enc->enc_pic.eo.enc_decoded_picture_marking_num[i] = entry->difference_of_pic_nums_minus1;
256             break;
257          case 2:
258             enc->enc_pic.eo.enc_decoded_picture_marking_num[i] = entry->long_term_pic_num;
259             break;
260          case 3:
261             enc->enc_pic.eo.enc_decoded_picture_marking_num[i] = entry->difference_of_pic_nums_minus1;
262             enc->enc_pic.eo.enc_decoded_picture_marking_idx[i] = entry->long_term_frame_idx;
263             break;
264          case 4:
265             enc->enc_pic.eo.enc_decoded_picture_marking_idx[i] = entry->max_long_term_frame_idx_plus1;
266             break;
267          case 6:
268             enc->enc_pic.eo.enc_decoded_picture_marking_idx[i] = entry->long_term_frame_idx;
269             break;
270          default:
271             break;
272          }
273       }
274    }
275    if (i < 4)
276       enc->enc_pic.eo.enc_decoded_picture_marking_op[i] = 0;
277 
278    enc->enc_pic.eo.cur_dpb_idx = pic->dpb_curr_pic;
279 
280    enc->enc_pic.eo.l0_dpb_idx = pic->ref_list0[0];
281 
282    enc->enc_pic.eo.l1_dpb_idx = PIPE_H2645_LIST_REF_INVALID_ENTRY;
283    enc->enc_pic.eo.l1_luma_offset = 0xffffffff;
284    enc->enc_pic.eo.l1_chroma_offset = 0xffffffff;
285 }
286 
create(struct rvce_encoder * enc)287 static void create(struct rvce_encoder *enc)
288 {
289    struct si_screen *sscreen = (struct si_screen *)enc->screen;
290    enc->task_info(enc, 0x00000000, 0);
291 
292    RVCE_BEGIN(0x01000001); // create cmd
293    RVCE_CS(enc->enc_pic.ec.enc_use_circular_buffer);
294    RVCE_CS(enc->pic.seq.profile_idc); // encProfile
295    RVCE_CS(enc->pic.seq.level_idc);                    // encLevel
296    RVCE_CS(enc->enc_pic.ec.enc_pic_struct_restriction);
297    RVCE_CS(align(enc->base.width, 16));  // encImageWidth
298    RVCE_CS(align(enc->base.height, 16)); // encImageHeight
299 
300    if (sscreen->info.gfx_level < GFX9) {
301       RVCE_CS(enc->luma->u.legacy.level[0].nblk_x * enc->luma->bpe);     // encRefPicLumaPitch
302       RVCE_CS(enc->chroma->u.legacy.level[0].nblk_x * enc->chroma->bpe); // encRefPicChromaPitch
303       RVCE_CS(align(enc->luma->u.legacy.level[0].nblk_y, 16) / 8);       // encRefYHeightInQw
304    } else {
305       RVCE_CS(enc->luma->u.gfx9.surf_pitch * enc->luma->bpe);     // encRefPicLumaPitch
306       RVCE_CS(enc->chroma->u.gfx9.surf_pitch * enc->chroma->bpe); // encRefPicChromaPitch
307       RVCE_CS(align(enc->luma->u.gfx9.surf_height, 16) / 8);      // encRefYHeightInQw
308    }
309 
310    RVCE_CS(enc->enc_pic.addrmode_arraymode_disrdo_distwoinstants);
311 
312    RVCE_CS(enc->enc_pic.ec.enc_pre_encode_context_buffer_offset);
313    RVCE_CS(enc->enc_pic.ec.enc_pre_encode_input_luma_buffer_offset);
314    RVCE_CS(enc->enc_pic.ec.enc_pre_encode_input_chroma_buffer_offset);
315    RVCE_CS(enc->enc_pic.ec.enc_pre_encode_mode_chromaflag_vbaqmode_scenechangesensitivity);
316    RVCE_END();
317 }
318 
encode(struct rvce_encoder * enc)319 static void encode(struct rvce_encoder *enc)
320 {
321    struct si_screen *sscreen = (struct si_screen *)enc->screen;
322    signed luma_offset, chroma_offset;
323    int i;
324 
325    enc->task_info(enc, 0x00000003, 0);
326 
327    RVCE_BEGIN(0x05000001);                                      // context buffer
328    RVCE_READWRITE(enc->dpb.res->buf, enc->dpb.res->domains, 0); // encodeContextAddressHi/Lo
329    RVCE_END();
330 
331    RVCE_BEGIN(0x05000004);                                   // video bitstream buffer
332    RVCE_WRITE(enc->bs_handle, RADEON_DOMAIN_GTT, enc->bs_offset); // videoBitstreamRingAddressHi/Lo
333    RVCE_CS(enc->bs_size);                                    // videoBitstreamRingSize
334    RVCE_END();
335 
336    if (enc->dual_pipe) {
337       unsigned aux_offset = 0;
338       RVCE_BEGIN(0x05000002); // auxiliary buffer
339       for (i = 0; i < 8; ++i) {
340          RVCE_CS(aux_offset);
341          aux_offset += RVCE_MAX_BITSTREAM_OUTPUT_ROW_SIZE;
342       }
343       for (i = 0; i < 8; ++i)
344          RVCE_CS(RVCE_MAX_BITSTREAM_OUTPUT_ROW_SIZE);
345       RVCE_END();
346    }
347 
348    RVCE_BEGIN(0x03000001);                       // encode
349    RVCE_CS(enc->enc_pic.eo.insert_headers);
350    RVCE_CS(enc->enc_pic.eo.picture_structure);
351    RVCE_CS(enc->bs_size - enc->bs_offset); // allowedMaxBitstreamSize
352    RVCE_CS(enc->enc_pic.eo.force_refresh_map);
353    RVCE_CS(enc->enc_pic.eo.insert_aud);
354    RVCE_CS(enc->enc_pic.eo.end_of_sequence);
355    RVCE_CS(enc->enc_pic.eo.end_of_stream);
356 
357    if (sscreen->info.gfx_level < GFX9) {
358       RVCE_READ(enc->handle, RADEON_DOMAIN_VRAM,
359                 (uint64_t)enc->luma->u.legacy.level[0].offset_256B * 256); // inputPictureLumaAddressHi/Lo
360       RVCE_READ(enc->handle, RADEON_DOMAIN_VRAM,
361                 (uint64_t)enc->chroma->u.legacy.level[0].offset_256B * 256);        // inputPictureChromaAddressHi/Lo
362       RVCE_CS(align(enc->luma->u.legacy.level[0].nblk_y, 16)); // encInputFrameYPitch
363       RVCE_CS(enc->luma->u.legacy.level[0].nblk_x * enc->luma->bpe);     // encInputPicLumaPitch
364       RVCE_CS(enc->chroma->u.legacy.level[0].nblk_x * enc->chroma->bpe); // encInputPicChromaPitch
365    } else {
366       RVCE_READ(enc->handle, RADEON_DOMAIN_VRAM,
367                 enc->luma->u.gfx9.surf_offset); // inputPictureLumaAddressHi/Lo
368       RVCE_READ(enc->handle, RADEON_DOMAIN_VRAM,
369                 enc->chroma->u.gfx9.surf_offset);                 // inputPictureChromaAddressHi/Lo
370       RVCE_CS(align(enc->luma->u.gfx9.surf_height, 16));          // encInputFrameYPitch
371       RVCE_CS(enc->luma->u.gfx9.surf_pitch * enc->luma->bpe);     // encInputPicLumaPitch
372       RVCE_CS(enc->chroma->u.gfx9.surf_pitch * enc->chroma->bpe); // encInputPicChromaPitch
373       enc->enc_pic.eo.enc_input_pic_swizzle_mode = enc->luma->u.gfx9.swizzle_mode;
374    }
375 
376    enc->enc_pic.eo.enc_disable_two_pipe_mode = !enc->dual_pipe;
377    RVCE_CS(enc->enc_pic.eo.enc_input_pic_addr_array_disable2pipe_disablemboffload);
378    RVCE_CS(enc->enc_pic.eo.enc_input_pic_tile_config);
379    RVCE_CS(enc->enc_pic.picture_type);                                    // encPicType
380    RVCE_CS(enc->enc_pic.picture_type == PIPE_H2645_ENC_PICTURE_TYPE_IDR); // encIdrFlag
381    RVCE_CS(enc->enc_pic.eo.enc_idr_pic_id);
382    RVCE_CS(enc->enc_pic.eo.enc_mgs_key_pic);
383    RVCE_CS(!enc->enc_pic.not_referenced);
384    RVCE_CS(enc->enc_pic.eo.enc_temporal_layer_index);
385    RVCE_CS(enc->enc_pic.eo.num_ref_idx_active_override_flag);
386    RVCE_CS(enc->enc_pic.eo.num_ref_idx_l0_active_minus1);
387    RVCE_CS(enc->enc_pic.eo.num_ref_idx_l1_active_minus1);
388 
389    for (i = 0; i < 4; ++i) {
390       RVCE_CS(enc->enc_pic.eo.enc_ref_list_modification_op[i]);
391       RVCE_CS(enc->enc_pic.eo.enc_ref_list_modification_num[i]);
392    }
393 
394    for (i = 0; i < 4; ++i) {
395       RVCE_CS(enc->enc_pic.eo.enc_decoded_picture_marking_op[i]);
396       RVCE_CS(enc->enc_pic.eo.enc_decoded_picture_marking_num[i]);
397       RVCE_CS(enc->enc_pic.eo.enc_decoded_picture_marking_idx[i]);
398    }
399 
400    for (i = 0; i < 4; ++i) {
401       RVCE_CS(enc->enc_pic.eo.enc_decoded_ref_base_picture_marking_op[i]);
402       RVCE_CS(enc->enc_pic.eo.enc_decoded_ref_base_picture_marking_num[i]);
403    }
404 
405    // encReferencePictureL0[0]
406    if (enc->enc_pic.eo.l0_dpb_idx != PIPE_H2645_LIST_REF_INVALID_ENTRY) {
407       si_vce_frame_offset(enc, enc->enc_pic.eo.l0_dpb_idx, &luma_offset, &chroma_offset);
408       enc->enc_pic.eo.l0_luma_offset = luma_offset;
409       enc->enc_pic.eo.l0_chroma_offset = chroma_offset;
410    } else {
411       enc->enc_pic.eo.l0_luma_offset = 0xffffffff;
412       enc->enc_pic.eo.l0_chroma_offset = 0xffffffff;
413    }
414    RVCE_CS(0x00000000); // pictureStructure
415    RVCE_CS(enc->enc_pic.eo.l0_enc_pic_type);
416    RVCE_CS(enc->enc_pic.eo.l0_frame_number);
417    RVCE_CS(enc->enc_pic.eo.l0_picture_order_count);
418    RVCE_CS(enc->enc_pic.eo.l0_luma_offset);
419    RVCE_CS(enc->enc_pic.eo.l0_chroma_offset);
420 
421    // encReferencePictureL0[1]
422    enc->enc_pic.eo.l0_picture_structure = 0x00000000;
423    enc->enc_pic.eo.l0_enc_pic_type = 0x00000000;
424    enc->enc_pic.eo.l0_frame_number = 0x00000000;
425    enc->enc_pic.eo.l0_picture_order_count = 0x00000000;
426    enc->enc_pic.eo.l0_luma_offset = 0xffffffff;
427    enc->enc_pic.eo.l0_chroma_offset = 0xffffffff;
428    RVCE_CS(enc->enc_pic.eo.l0_picture_structure);
429    RVCE_CS(enc->enc_pic.eo.l0_enc_pic_type);
430    RVCE_CS(enc->enc_pic.eo.l0_frame_number);
431    RVCE_CS(enc->enc_pic.eo.l0_picture_order_count);
432    RVCE_CS(enc->enc_pic.eo.l0_luma_offset);
433    RVCE_CS(enc->enc_pic.eo.l0_chroma_offset);
434 
435    // encReferencePictureL1[0]
436    RVCE_CS(0x00000000); // pictureStructure
437    RVCE_CS(enc->enc_pic.eo.l1_enc_pic_type);
438    RVCE_CS(enc->enc_pic.eo.l1_frame_number);
439    RVCE_CS(enc->enc_pic.eo.l1_picture_order_count);
440    RVCE_CS(enc->enc_pic.eo.l1_luma_offset);
441    RVCE_CS(enc->enc_pic.eo.l1_chroma_offset);
442 
443    si_vce_frame_offset(enc, enc->enc_pic.eo.cur_dpb_idx, &luma_offset, &chroma_offset);
444    RVCE_CS(luma_offset);
445    RVCE_CS(chroma_offset);
446    RVCE_CS(enc->enc_pic.eo.enc_coloc_buffer_offset);
447    RVCE_CS(enc->enc_pic.eo.enc_reconstructed_ref_base_picture_luma_offset);
448    RVCE_CS(enc->enc_pic.eo.enc_reconstructed_ref_base_picture_chroma_offset);
449    RVCE_CS(enc->enc_pic.eo.enc_reference_ref_base_picture_luma_offset);
450    RVCE_CS(enc->enc_pic.eo.enc_reference_ref_base_picture_chroma_offset);
451    RVCE_CS(enc->enc_pic.frame_num_cnt);
452    RVCE_CS(enc->enc_pic.frame_num);
453    RVCE_CS(enc->enc_pic.pic_order_cnt);
454    RVCE_CS(enc->enc_pic.i_remain);
455    RVCE_CS(enc->enc_pic.p_remain);
456    RVCE_CS(enc->enc_pic.eo.num_b_pic_remain_in_rcgop);
457    RVCE_CS(enc->enc_pic.eo.num_ir_pic_remain_in_rcgop);
458    RVCE_CS(enc->enc_pic.eo.enable_intra_refresh);
459 
460    RVCE_CS(enc->enc_pic.eo.aq_variance_en);
461    RVCE_CS(enc->enc_pic.eo.aq_block_size);
462    RVCE_CS(enc->enc_pic.eo.aq_mb_variance_sel);
463    RVCE_CS(enc->enc_pic.eo.aq_frame_variance_sel);
464    RVCE_CS(enc->enc_pic.eo.aq_param_a);
465    RVCE_CS(enc->enc_pic.eo.aq_param_b);
466    RVCE_CS(enc->enc_pic.eo.aq_param_c);
467    RVCE_CS(enc->enc_pic.eo.aq_param_d);
468    RVCE_CS(enc->enc_pic.eo.aq_param_e);
469 
470    RVCE_CS(enc->enc_pic.eo.context_in_sfb);
471    RVCE_END();
472 }
473 
rate_control(struct rvce_encoder * enc)474 static void rate_control(struct rvce_encoder *enc)
475 {
476    RVCE_BEGIN(0x04000005); // rate control
477    RVCE_CS(enc->enc_pic.rc.rc_method);
478    RVCE_CS(enc->enc_pic.rc.target_bitrate);
479    RVCE_CS(enc->enc_pic.rc.peak_bitrate);
480    RVCE_CS(enc->enc_pic.rc.frame_rate_num);
481    RVCE_CS(enc->enc_pic.rc.gop_size);
482    RVCE_CS(enc->enc_pic.rc.quant_i_frames);
483    RVCE_CS(enc->enc_pic.rc.quant_p_frames);
484    RVCE_CS(enc->enc_pic.rc.quant_b_frames);
485    RVCE_CS(enc->enc_pic.rc.vbv_buffer_size);
486    RVCE_CS(enc->enc_pic.rc.frame_rate_den);
487    RVCE_CS(enc->enc_pic.rc.vbv_buf_lv);
488    RVCE_CS(enc->enc_pic.rc.max_au_size);
489    RVCE_CS(enc->enc_pic.rc.qp_initial_mode);
490    RVCE_CS(enc->enc_pic.rc.target_bits_picture);
491    RVCE_CS(enc->enc_pic.rc.peak_bits_picture_integer);
492    RVCE_CS(enc->enc_pic.rc.peak_bits_picture_fraction);
493    RVCE_CS(enc->enc_pic.rc.min_qp);
494    RVCE_CS(enc->enc_pic.rc.max_qp);
495    RVCE_CS(enc->enc_pic.rc.skip_frame_enable);
496    RVCE_CS(enc->enc_pic.rc.fill_data_enable);
497    RVCE_CS(enc->enc_pic.rc.enforce_hrd);
498    RVCE_CS(enc->enc_pic.rc.b_pics_delta_qp);
499    RVCE_CS(enc->enc_pic.rc.ref_b_pics_delta_qp);
500    RVCE_CS(enc->enc_pic.rc.rc_reinit_disable);
501    RVCE_CS(enc->enc_pic.rc.enc_lcvbr_init_qp_flag);
502    RVCE_CS(enc->enc_pic.rc.lcvbrsatd_based_nonlinear_bit_budget_flag);
503    RVCE_END();
504 }
505 
config(struct rvce_encoder * enc)506 static void config(struct rvce_encoder *enc)
507 {
508    enc->task_info(enc, 0x00000002, 0xffffffff);
509    enc->rate_control(enc);
510    enc->config_extension(enc);
511    enc->motion_estimation(enc);
512    enc->rdo(enc);
513    enc->pic_control(enc);
514 }
515 
config_extension(struct rvce_encoder * enc)516 static void config_extension(struct rvce_encoder *enc)
517 {
518    RVCE_BEGIN(0x04000001); // config extension
519    RVCE_CS(enc->enc_pic.ce.enc_enable_perf_logging);
520    RVCE_END();
521 }
522 
feedback(struct rvce_encoder * enc)523 static void feedback(struct rvce_encoder *enc)
524 {
525    RVCE_BEGIN(0x05000005);                                    // feedback buffer
526    RVCE_WRITE(enc->fb->res->buf, enc->fb->res->domains, 0x0); // feedbackRingAddressHi/Lo
527    RVCE_CS(enc->enc_pic.fb.feedback_ring_size);
528    RVCE_END();
529 }
530 
destroy(struct rvce_encoder * enc)531 static void destroy(struct rvce_encoder *enc)
532 {
533    enc->task_info(enc, 0x00000001, 0);
534 
535    feedback(enc);
536 
537    RVCE_BEGIN(0x02000001); // destroy
538    RVCE_END();
539 }
540 
motion_estimation(struct rvce_encoder * enc)541 static void motion_estimation(struct rvce_encoder *enc)
542 {
543    RVCE_BEGIN(0x04000007); // motion estimation
544    RVCE_CS(enc->enc_pic.me.enc_ime_decimation_search);
545    RVCE_CS(enc->enc_pic.me.motion_est_half_pixel);
546    RVCE_CS(enc->enc_pic.me.motion_est_quarter_pixel);
547    RVCE_CS(enc->enc_pic.me.disable_favor_pmv_point);
548    RVCE_CS(enc->enc_pic.me.force_zero_point_center);
549    RVCE_CS(enc->enc_pic.me.lsmvert);
550    RVCE_CS(enc->enc_pic.me.enc_search_range_x);
551    RVCE_CS(enc->enc_pic.me.enc_search_range_y);
552    RVCE_CS(enc->enc_pic.me.enc_search1_range_x);
553    RVCE_CS(enc->enc_pic.me.enc_search1_range_y);
554    RVCE_CS(enc->enc_pic.me.disable_16x16_frame1);
555    RVCE_CS(enc->enc_pic.me.disable_satd);
556    RVCE_CS(enc->enc_pic.me.enable_amd);
557    RVCE_CS(enc->enc_pic.me.enc_disable_sub_mode);
558    RVCE_CS(enc->enc_pic.me.enc_ime_skip_x);
559    RVCE_CS(enc->enc_pic.me.enc_ime_skip_y);
560    RVCE_CS(enc->enc_pic.me.enc_en_ime_overw_dis_subm);
561    RVCE_CS(enc->enc_pic.me.enc_ime_overw_dis_subm_no);
562    RVCE_CS(enc->enc_pic.me.enc_ime2_search_range_x);
563    RVCE_CS(enc->enc_pic.me.enc_ime2_search_range_y);
564    RVCE_CS(enc->enc_pic.me.parallel_mode_speedup_enable);
565    RVCE_CS(enc->enc_pic.me.fme0_enc_disable_sub_mode);
566    RVCE_CS(enc->enc_pic.me.fme1_enc_disable_sub_mode);
567    RVCE_CS(enc->enc_pic.me.ime_sw_speedup_enable);
568    RVCE_END();
569 }
570 
pic_control(struct rvce_encoder * enc)571 static void pic_control(struct rvce_encoder *enc)
572 {
573    RVCE_BEGIN(0x04000002); // pic control
574    RVCE_CS(enc->enc_pic.pc.enc_use_constrained_intra_pred);
575    RVCE_CS(enc->enc_pic.pc.enc_cabac_enable);
576    RVCE_CS(enc->enc_pic.pc.enc_cabac_idc);
577    RVCE_CS(enc->enc_pic.pc.enc_loop_filter_disable);
578    RVCE_CS(enc->enc_pic.pc.enc_lf_beta_offset);
579    RVCE_CS(enc->enc_pic.pc.enc_lf_alpha_c0_offset);
580    RVCE_CS(enc->enc_pic.pc.enc_crop_left_offset);
581    RVCE_CS(enc->enc_pic.pc.enc_crop_right_offset);
582    RVCE_CS(enc->enc_pic.pc.enc_crop_top_offset);
583    RVCE_CS(enc->enc_pic.pc.enc_crop_bottom_offset);
584    RVCE_CS(enc->enc_pic.pc.enc_num_mbs_per_slice);
585    RVCE_CS(enc->enc_pic.pc.enc_intra_refresh_num_mbs_per_slot);
586    RVCE_CS(enc->enc_pic.pc.enc_force_intra_refresh);
587    RVCE_CS(enc->enc_pic.pc.enc_force_imb_period);
588    RVCE_CS(enc->enc_pic.pc.enc_pic_order_cnt_type);
589    RVCE_CS(enc->enc_pic.pc.log2_max_pic_order_cnt_lsb_minus4);
590    RVCE_CS(enc->enc_pic.pc.enc_sps_id);
591    RVCE_CS(enc->enc_pic.pc.enc_pps_id);
592    RVCE_CS(enc->enc_pic.pc.enc_constraint_set_flags);
593    RVCE_CS(enc->enc_pic.pc.enc_b_pic_pattern);
594    RVCE_CS(enc->enc_pic.pc.weight_pred_mode_b_picture);
595    RVCE_CS(enc->enc_pic.pc.enc_number_of_reference_frames);
596    RVCE_CS(enc->enc_pic.pc.enc_max_num_ref_frames);
597    RVCE_CS(enc->enc_pic.pc.enc_num_default_active_ref_l0);
598    RVCE_CS(enc->enc_pic.pc.enc_num_default_active_ref_l1);
599    RVCE_CS(enc->enc_pic.pc.enc_slice_mode);
600    RVCE_CS(enc->enc_pic.pc.enc_max_slice_size);
601    RVCE_END();
602 }
603 
rdo(struct rvce_encoder * enc)604 static void rdo(struct rvce_encoder *enc)
605 {
606    RVCE_BEGIN(0x04000008); // rdo
607    RVCE_CS(enc->enc_pic.rdo.enc_disable_tbe_pred_i_frame);
608    RVCE_CS(enc->enc_pic.rdo.enc_disable_tbe_pred_p_frame);
609    RVCE_CS(enc->enc_pic.rdo.use_fme_interpol_y);
610    RVCE_CS(enc->enc_pic.rdo.use_fme_interpol_uv);
611    RVCE_CS(enc->enc_pic.rdo.use_fme_intrapol_y);
612    RVCE_CS(enc->enc_pic.rdo.use_fme_intrapol_uv);
613    RVCE_CS(enc->enc_pic.rdo.use_fme_interpol_y_1);
614    RVCE_CS(enc->enc_pic.rdo.use_fme_interpol_uv_1);
615    RVCE_CS(enc->enc_pic.rdo.use_fme_intrapol_y_1);
616    RVCE_CS(enc->enc_pic.rdo.use_fme_intrapol_uv_1);
617    RVCE_CS(enc->enc_pic.rdo.enc_16x16_cost_adj);
618    RVCE_CS(enc->enc_pic.rdo.enc_skip_cost_adj);
619    RVCE_CS(enc->enc_pic.rdo.enc_force_16x16_skip);
620    RVCE_CS(enc->enc_pic.rdo.enc_disable_threshold_calc_a);
621    RVCE_CS(enc->enc_pic.rdo.enc_luma_coeff_cost);
622    RVCE_CS(enc->enc_pic.rdo.enc_luma_mb_coeff_cost);
623    RVCE_CS(enc->enc_pic.rdo.enc_chroma_coeff_cost);
624    RVCE_END();
625 }
626 
session(struct rvce_encoder * enc)627 static void session(struct rvce_encoder *enc)
628 {
629    RVCE_BEGIN(0x00000001); // session cmd
630    RVCE_CS(enc->stream_handle);
631    RVCE_END();
632 }
633 
task_info(struct rvce_encoder * enc,uint32_t op,uint32_t fb_idx)634 static void task_info(struct rvce_encoder *enc, uint32_t op, uint32_t fb_idx)
635 {
636    RVCE_BEGIN(0x00000002); // task info
637    enc->enc_pic.ti.task_operation = op;
638    enc->enc_pic.ti.reference_picture_dependency = 0;
639    enc->enc_pic.ti.feedback_index = fb_idx;
640    enc->enc_pic.ti.video_bitstream_ring_index = 0;
641    RVCE_CS(enc->enc_pic.ti.offset_of_next_task_info);
642    RVCE_CS(enc->enc_pic.ti.task_operation);
643    RVCE_CS(enc->enc_pic.ti.reference_picture_dependency);
644    RVCE_CS(enc->enc_pic.ti.collocate_flag_dependency);
645    RVCE_CS(enc->enc_pic.ti.feedback_index);
646    RVCE_CS(enc->enc_pic.ti.video_bitstream_ring_index);
647    RVCE_END();
648 }
649 
si_vce_write_sps(struct rvce_encoder * enc,uint8_t nal_byte,uint8_t * out)650 unsigned int si_vce_write_sps(struct rvce_encoder *enc, uint8_t nal_byte, uint8_t *out)
651 {
652    struct pipe_h264_enc_seq_param *sps = &enc->pic.seq;
653    struct radeon_bitstream bs;
654 
655    radeon_bs_reset(&bs, out, NULL);
656    radeon_bs_set_emulation_prevention(&bs, false);
657    radeon_bs_code_fixed_bits(&bs, 0x00000001, 32);
658    radeon_bs_code_fixed_bits(&bs, nal_byte, 8);
659    radeon_bs_set_emulation_prevention(&bs, true);
660    radeon_bs_code_fixed_bits(&bs, sps->profile_idc, 8);
661    radeon_bs_code_fixed_bits(&bs, sps->enc_constraint_set_flags, 6);
662    radeon_bs_code_fixed_bits(&bs, 0x0, 2); /* reserved_zero_2bits */
663    radeon_bs_code_fixed_bits(&bs, sps->level_idc, 8);
664    radeon_bs_code_ue(&bs, 0x0); /* seq_parameter_set_id */
665 
666    if (sps->profile_idc == 100 || sps->profile_idc == 110 ||
667        sps->profile_idc == 122 || sps->profile_idc == 244 ||
668        sps->profile_idc == 44  || sps->profile_idc == 83 ||
669        sps->profile_idc == 86  || sps->profile_idc == 118 ||
670        sps->profile_idc == 128 || sps->profile_idc == 138) {
671       radeon_bs_code_ue(&bs, 0x1); /* chroma_format_idc */
672       radeon_bs_code_ue(&bs, 0x0); /* bit_depth_luma_minus8 */
673       radeon_bs_code_ue(&bs, 0x0); /* bit_depth_chroma_minus8 */
674       radeon_bs_code_fixed_bits(&bs, 0x0, 2); /* qpprime_y_zero_transform_bypass_flag + seq_scaling_matrix_present_flag */
675    }
676 
677    radeon_bs_code_ue(&bs, 3); /* log2_max_frame_num_minus4 */
678    radeon_bs_code_ue(&bs, sps->pic_order_cnt_type);
679 
680    if (sps->pic_order_cnt_type == 0)
681       radeon_bs_code_ue(&bs, sps->log2_max_pic_order_cnt_lsb_minus4);
682 
683    radeon_bs_code_ue(&bs, sps->max_num_ref_frames);
684    radeon_bs_code_fixed_bits(&bs, sps->gaps_in_frame_num_value_allowed_flag, 1);
685    radeon_bs_code_ue(&bs, DIV_ROUND_UP(enc->base.width, 16) - 1);
686    radeon_bs_code_ue(&bs, DIV_ROUND_UP(enc->base.height, 16) - 1);
687    radeon_bs_code_fixed_bits(&bs, 0x1, 1); /* frame_mbs_only_flag */
688    radeon_bs_code_fixed_bits(&bs, 0x1, 1); /* direct_8x8_inference_flag */
689 
690    radeon_bs_code_fixed_bits(&bs, sps->enc_frame_cropping_flag, 1);
691    if (sps->enc_frame_cropping_flag) {
692       radeon_bs_code_ue(&bs, sps->enc_frame_crop_left_offset);
693       radeon_bs_code_ue(&bs, sps->enc_frame_crop_right_offset);
694       radeon_bs_code_ue(&bs, sps->enc_frame_crop_top_offset);
695       radeon_bs_code_ue(&bs, sps->enc_frame_crop_bottom_offset);
696    }
697 
698    radeon_bs_code_fixed_bits(&bs, sps->vui_parameters_present_flag, 1);
699    if (sps->vui_parameters_present_flag) {
700       radeon_bs_code_fixed_bits(&bs, (sps->vui_flags.aspect_ratio_info_present_flag), 1);
701       if (sps->vui_flags.aspect_ratio_info_present_flag) {
702          radeon_bs_code_fixed_bits(&bs, (sps->aspect_ratio_idc), 8);
703          if (sps->aspect_ratio_idc == PIPE_H2645_EXTENDED_SAR) {
704             radeon_bs_code_fixed_bits(&bs, (sps->sar_width), 16);
705             radeon_bs_code_fixed_bits(&bs, (sps->sar_height), 16);
706          }
707       }
708       radeon_bs_code_fixed_bits(&bs, sps->vui_flags.overscan_info_present_flag, 1);
709       if (sps->vui_flags.overscan_info_present_flag)
710          radeon_bs_code_fixed_bits(&bs, sps->vui_flags.overscan_appropriate_flag, 1);
711       radeon_bs_code_fixed_bits(&bs, sps->vui_flags.video_signal_type_present_flag, 1);
712       if (sps->vui_flags.video_signal_type_present_flag) {
713          radeon_bs_code_fixed_bits(&bs, sps->video_format, 3);
714          radeon_bs_code_fixed_bits(&bs, sps->video_full_range_flag, 1);
715          radeon_bs_code_fixed_bits(&bs, sps->vui_flags.colour_description_present_flag, 1);
716          if (sps->vui_flags.colour_description_present_flag) {
717             radeon_bs_code_fixed_bits(&bs, sps->colour_primaries, 8);
718             radeon_bs_code_fixed_bits(&bs, sps->transfer_characteristics, 8);
719             radeon_bs_code_fixed_bits(&bs, sps->matrix_coefficients, 8);
720          }
721       }
722       radeon_bs_code_fixed_bits(&bs, sps->vui_flags.chroma_loc_info_present_flag, 1);
723       if (sps->vui_flags.chroma_loc_info_present_flag) {
724          radeon_bs_code_ue(&bs, sps->chroma_sample_loc_type_top_field);
725          radeon_bs_code_ue(&bs, sps->chroma_sample_loc_type_bottom_field);
726       }
727       radeon_bs_code_fixed_bits(&bs, (sps->vui_flags.timing_info_present_flag), 1);
728       if (sps->vui_flags.timing_info_present_flag) {
729          radeon_bs_code_fixed_bits(&bs, (sps->num_units_in_tick), 32);
730          radeon_bs_code_fixed_bits(&bs, (sps->time_scale), 32);
731          radeon_bs_code_fixed_bits(&bs, (sps->vui_flags.fixed_frame_rate_flag), 1);
732       }
733       radeon_bs_code_fixed_bits(&bs, sps->vui_flags.nal_hrd_parameters_present_flag, 1);
734       if (sps->vui_flags.nal_hrd_parameters_present_flag)
735          radeon_bs_h264_hrd_parameters(&bs, &sps->nal_hrd_parameters);
736       radeon_bs_code_fixed_bits(&bs, sps->vui_flags.vcl_hrd_parameters_present_flag, 1);
737       if (sps->vui_flags.vcl_hrd_parameters_present_flag)
738          radeon_bs_h264_hrd_parameters(&bs, &sps->vcl_hrd_parameters);
739       if (sps->vui_flags.nal_hrd_parameters_present_flag || sps->vui_flags.vcl_hrd_parameters_present_flag)
740          radeon_bs_code_fixed_bits(&bs, sps->vui_flags.low_delay_hrd_flag, 1);
741       radeon_bs_code_fixed_bits(&bs, sps->vui_flags.pic_struct_present_flag, 1);
742       radeon_bs_code_fixed_bits(&bs, sps->vui_flags.bitstream_restriction_flag, 1);
743       if (sps->vui_flags.bitstream_restriction_flag) {
744          radeon_bs_code_fixed_bits(&bs, 0x1, 1); /* motion_vectors_over_pic_boundaries_flag */
745          radeon_bs_code_ue(&bs, 0x2); /* max_bytes_per_pic_denom */
746          radeon_bs_code_ue(&bs, 0x1); /* max_bits_per_mb_denom */
747          radeon_bs_code_ue(&bs, 0x10); /* log2_max_mv_length_horizontal */
748          radeon_bs_code_ue(&bs, 0x10); /* log2_max_mv_length_vertical */
749          radeon_bs_code_ue(&bs, sps->max_num_reorder_frames);
750          radeon_bs_code_ue(&bs, sps->max_dec_frame_buffering);
751       }
752    }
753 
754    radeon_bs_code_fixed_bits(&bs, 0x1, 1);
755    radeon_bs_byte_align(&bs);
756 
757    return bs.bits_output / 8;
758 }
759 
si_vce_write_pps(struct rvce_encoder * enc,uint8_t nal_byte,uint8_t * out)760 unsigned int si_vce_write_pps(struct rvce_encoder *enc, uint8_t nal_byte, uint8_t *out)
761 {
762    struct radeon_bitstream bs;
763 
764    radeon_bs_reset(&bs, out, NULL);
765    radeon_bs_set_emulation_prevention(&bs, false);
766    radeon_bs_code_fixed_bits(&bs, 0x00000001, 32);
767    radeon_bs_code_fixed_bits(&bs, nal_byte, 8);
768    radeon_bs_set_emulation_prevention(&bs, true);
769    radeon_bs_code_ue(&bs, 0x0); /* pic_parameter_set_id */
770    radeon_bs_code_ue(&bs, 0x0); /* seq_parameter_set_id */
771    radeon_bs_code_fixed_bits(&bs, enc->enc_pic.pc.enc_cabac_enable, 1);
772    radeon_bs_code_fixed_bits(&bs, 0x0, 1); /* bottom_field_pic_order_in_frame_present_flag */
773    radeon_bs_code_ue(&bs, 0x0); /* num_slice_groups_minus_1 */
774    radeon_bs_code_ue(&bs, enc->enc_pic.pc.enc_num_default_active_ref_l0 - 1);
775    radeon_bs_code_ue(&bs, enc->enc_pic.pc.enc_num_default_active_ref_l1 - 1);
776    radeon_bs_code_fixed_bits(&bs, 0x0, 1); /* weighted_pred_flag */
777    radeon_bs_code_fixed_bits(&bs, 0x0, 2); /* weighted_bipred_idc */
778    radeon_bs_code_se(&bs, 0x0); /* pic_init_qp_minus26 */
779    radeon_bs_code_se(&bs, 0x0); /* pic_init_qs_minus26 */
780    radeon_bs_code_se(&bs, 0x0); /* chroma_qp_index_offset */
781    bool deblocking_filter_present_flag =
782       enc->enc_pic.pc.enc_loop_filter_disable ||
783       enc->enc_pic.pc.enc_lf_beta_offset ||
784       enc->enc_pic.pc.enc_lf_alpha_c0_offset;
785    radeon_bs_code_fixed_bits(&bs, deblocking_filter_present_flag, 1);
786    radeon_bs_code_fixed_bits(&bs, enc->enc_pic.pc.enc_use_constrained_intra_pred, 1);
787    radeon_bs_code_fixed_bits(&bs, 0x0, 1); /* redundant_pic_cnt_present_flag */
788 
789    radeon_bs_code_fixed_bits(&bs, 0x1, 1);
790    radeon_bs_byte_align(&bs);
791 
792    return bs.bits_output / 8;
793 }
794 
si_vce_52_init(struct rvce_encoder * enc)795 void si_vce_52_init(struct rvce_encoder *enc)
796 {
797    enc->session = session;
798    enc->task_info = task_info;
799    enc->create = create;
800    enc->feedback = feedback;
801    enc->rate_control = rate_control;
802    enc->config_extension = config_extension;
803    enc->pic_control = pic_control;
804    enc->motion_estimation = motion_estimation;
805    enc->rdo = rdo;
806    enc->config = config;
807    enc->encode = encode;
808    enc->destroy = destroy;
809    enc->si_get_pic_param = get_param;
810 }
811