summaryrefslogtreecommitdiff
path: root/src/gallium/drivers/radeon/radeon_vce.h
blob: cf625e6fed7b3fa4269886aceb2248efe0142a50 (plain)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231
232
233
234
235
236
237
238
239
240
241
242
243
244
245
246
247
248
249
250
251
252
253
254
255
256
257
258
259
260
261
262
263
264
265
266
267
268
269
270
271
272
273
274
275
276
277
278
279
280
281
282
283
284
285
286
287
288
289
290
291
292
293
294
295
296
297
298
299
300
301
302
303
304
305
306
307
308
309
310
311
312
313
314
315
316
317
318
319
320
321
322
323
324
325
326
327
328
329
330
331
332
333
334
335
336
337
338
339
340
341
342
343
344
345
346
347
348
349
350
351
352
353
354
355
356
357
358
359
360
361
362
363
364
365
366
367
368
369
370
371
372
373
374
375
376
377
378
379
380
381
382
383
384
385
386
387
388
389
390
391
392
393
394
395
396
397
398
399
400
401
402
403
404
405
406
407
408
409
410
411
412
413
414
415
416
417
418
419
420
421
422
423
424
425
426
427
428
429
430
431
432
433
434
435
436
437
438
439
440
441
442
443
444
445
446
447
448
449
450
451
452
453
454
455
456
/**************************************************************************
 *
 * Copyright 2013 Advanced Micro Devices, Inc.
 * All Rights Reserved.
 *
 * Permission is hereby granted, free of charge, to any person obtaining a
 * copy of this software and associated documentation files (the
 * "Software"), to deal in the Software without restriction, including
 * without limitation the rights to use, copy, modify, merge, publish,
 * distribute, sub license, and/or sell copies of the Software, and to
 * permit persons to whom the Software is furnished to do so, subject to
 * the following conditions:
 *
 * The above copyright notice and this permission notice (including the
 * next paragraph) shall be included in all copies or substantial portions
 * of the Software.
 *
 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS
 * OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF
 * MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND NON-INFRINGEMENT.
 * IN NO EVENT SHALL THE COPYRIGHT HOLDER(S) OR AUTHOR(S) BE LIABLE FOR
 * ANY CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT,
 * TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN CONNECTION WITH THE
 * SOFTWARE OR THE USE OR OTHER DEALINGS IN THE SOFTWARE.
 *
 **************************************************************************/

#ifndef RADEON_VCE_H
#define RADEON_VCE_H

#include "util/list.h"

/*
 * Command-stream helper macros.
 *
 * Every macro below expands to code that references a variable named `enc`,
 * which must be in scope at the point of use and must provide `enc->cs`.
 */

/* Store one value at the current write index of the command buffer and
 * advance that index by one. */
#define RVCE_CS(value) (enc->cs->current.buf[enc->cs->current.cdw++] = (value))
/* Start a packet: opens a brace scope, reserves one slot in the command
 * buffer (its address is kept in the local `begin`) and then emits `cmd`.
 * The opened scope is only closed by RVCE_END(), so the two must be paired. */
#define RVCE_BEGIN(cmd) { \
	uint32_t *begin = &enc->cs->current.buf[enc->cs->current.cdw++]; \
	RVCE_CS(cmd)
/* Thin wrappers around si_vce_add_buffer() that differ only in the usage
 * flag passed (READ, WRITE or READWRITE). */
#define RVCE_READ(buf, domain, off) si_vce_add_buffer(enc, (buf), RADEON_USAGE_READ, (domain), (off))
#define RVCE_WRITE(buf, domain, off) si_vce_add_buffer(enc, (buf), RADEON_USAGE_WRITE, (domain), (off))
#define RVCE_READWRITE(buf, domain, off) si_vce_add_buffer(enc, (buf), RADEON_USAGE_READWRITE, (domain), (off))
/* Finish a packet: writes into the slot reserved by RVCE_BEGIN() the number
 * of uint32_t elements between `begin` and the current write position,
 * multiplied by 4 (i.e. the span in bytes, counting the reserved slot
 * itself), then closes the scope opened by RVCE_BEGIN(). */
#define RVCE_END() *begin = (&enc->cs->current.buf[enc->cs->current.cdw] - begin) * 4; }

/* Evaluates to 163840. Because of the 2.5 factor the expression has type
 * double, so arithmetic using this macro is carried out in floating point
 * unless the result is converted explicitly. */
#define RVCE_MAX_BITSTREAM_OUTPUT_ROW_SIZE (4096 * 16 * 2.5)
/* NOTE(review): presumably the upper bound on auxiliary buffers per encode
 * operation; no user of this constant is visible in this header. */
#define RVCE_MAX_AUX_BUFFER_NUM 4

/* Forward declaration; only used through a pointer in this header. */
struct si_screen;

/* driver dependent callback */
/* Takes a pipe_resource and has two output parameters: a pb_buffer handle
 * and a radeon_surf pointer. NOTE(review): presumably both outputs are
 * filled in from `resource`; the implementations live outside this header. */
typedef void (*rvce_get_buffer)(struct pipe_resource *resource,
				struct pb_buffer **handle,
				struct radeon_surf **surface);

/* Coded picture buffer slot */
/* Each slot carries a list link (see rvce_encoder::cpb_slots) together with
 * the picture type, frame number and picture order count recorded for it. */
struct rvce_cpb_slot {
	struct list_head		list;

	unsigned			index;
	enum pipe_h264_enc_picture_type	picture_type;
	unsigned			frame_num;
	unsigned			pic_order_cnt;
};

/*
 * Rate-control parameter block; every member is a 32-bit unsigned value.
 *
 * NOTE(review): the member order presumably mirrors a firmware packet
 * layout; confirm against the rate_control callbacks before reordering.
 */
struct rvce_rate_control {
	uint32_t		rc_method;
	uint32_t		target_bitrate;
	uint32_t		peak_bitrate;
	uint32_t		frame_rate_num;
	uint32_t		gop_size;
	uint32_t		quant_i_frames;
	uint32_t		quant_p_frames;
	uint32_t		quant_b_frames;
	uint32_t		vbv_buffer_size;
	uint32_t		frame_rate_den;
	uint32_t		vbv_buf_lv;
	uint32_t		max_au_size;
	uint32_t		qp_initial_mode;
	uint32_t		target_bits_picture;
	uint32_t		peak_bits_picture_integer;
	uint32_t		peak_bits_picture_fraction;
	uint32_t		min_qp;
	uint32_t		max_qp;
	uint32_t		skip_frame_enable;
	uint32_t		fill_data_enable;
	uint32_t		enforce_hrd;
	uint32_t		b_pics_delta_qp;
	uint32_t		ref_b_pics_delta_qp;
	uint32_t		rc_reinit_disable;
	uint32_t		enc_lcvbr_init_qp_flag;
	uint32_t		lcvbrsatd_based_nonlinear_bit_budget_flag;
};

/*
 * Motion-estimation parameter block; every member is a 32-bit unsigned
 * value.
 *
 * NOTE(review): the member order presumably mirrors a firmware packet
 * layout; confirm against the motion_estimation callbacks before reordering.
 */
struct rvce_motion_estimation {
	uint32_t		enc_ime_decimation_search;
	uint32_t		motion_est_half_pixel;
	uint32_t		motion_est_quarter_pixel;
	uint32_t		disable_favor_pmv_point;
	uint32_t		force_zero_point_center;
	uint32_t		lsmvert;
	uint32_t		enc_search_range_x;
	uint32_t		enc_search_range_y;
	uint32_t		enc_search1_range_x;
	uint32_t		enc_search1_range_y;
	uint32_t		disable_16x16_frame1;
	uint32_t		disable_satd;
	uint32_t		enable_amd;
	uint32_t		enc_disable_sub_mode;
	uint32_t		enc_ime_skip_x;
	uint32_t		enc_ime_skip_y;
	uint32_t		enc_en_ime_overw_dis_subm;
	uint32_t		enc_ime_overw_dis_subm_no;
	uint32_t		enc_ime2_search_range_x;
	uint32_t		enc_ime2_search_range_y;
	uint32_t		parallel_mode_speedup_enable;
	uint32_t		fme0_enc_disable_sub_mode;
	uint32_t		fme1_enc_disable_sub_mode;
	uint32_t		ime_sw_speedup_enable;
};

/*
 * Picture-control parameter block. All members are 32 bits wide; the two
 * loop-filter offsets are signed, everything else is unsigned.
 *
 * NOTE(review): the member order presumably mirrors a firmware packet
 * layout; confirm against the pic_control callbacks before reordering.
 */
struct rvce_pic_control {
	uint32_t		enc_use_constrained_intra_pred;
	uint32_t		enc_cabac_enable;
	uint32_t		enc_cabac_idc;
	uint32_t		enc_loop_filter_disable;
	/* The only signed members of this block. */
	int32_t			enc_lf_beta_offset;
	int32_t			enc_lf_alpha_c0_offset;
	uint32_t		enc_crop_left_offset;
	uint32_t		enc_crop_right_offset;
	uint32_t		enc_crop_top_offset;
	uint32_t		enc_crop_bottom_offset;
	uint32_t		enc_num_mbs_per_slice;
	uint32_t		enc_intra_refresh_num_mbs_per_slot;
	uint32_t		enc_force_intra_refresh;
	uint32_t		enc_force_imb_period;
	uint32_t		enc_pic_order_cnt_type;
	uint32_t		log2_max_pic_order_cnt_lsb_minus4;
	uint32_t		enc_sps_id;
	uint32_t		enc_pps_id;
	uint32_t		enc_constraint_set_flags;
	uint32_t		enc_b_pic_pattern;
	uint32_t		weight_pred_mode_b_picture;
	uint32_t		enc_number_of_reference_frames;
	uint32_t		enc_max_num_ref_frames;
	uint32_t		enc_num_default_active_ref_l0;
	uint32_t		enc_num_default_active_ref_l1;
	uint32_t		enc_slice_mode;
	uint32_t		enc_max_slice_size;
};

/*
 * Task-info parameter block; six 32-bit unsigned members.
 *
 * NOTE(review): presumably filled in by the rvce_encoder::task_info
 * callback, whose op/dep/fb_idx/ring_idx arguments resemble these members;
 * confirm in the version-specific sources.
 */
struct rvce_task_info {
	uint32_t		offset_of_next_task_info;
	uint32_t		task_operation;
	uint32_t		reference_picture_dependency;
	uint32_t		collocate_flag_dependency;
	uint32_t		feedback_index;
	uint32_t		video_bitstream_ring_index;
};

/*
 * Feedback-buffer parameter block: an address split into separate high and
 * low 32-bit members, followed by a size.
 */
struct rvce_feedback_buf_pkg {
	uint32_t		feedback_ring_address_hi;
	uint32_t		feedback_ring_address_lo;
	uint32_t		feedback_ring_size;
};

/*
 * RDO parameter block; every member is a 32-bit unsigned value.
 *
 * NOTE(review): "rdo" presumably stands for rate-distortion optimisation,
 * and the member order presumably mirrors a firmware packet layout; confirm
 * against the rdo callbacks before reordering.
 */
struct rvce_rdo {
	uint32_t		enc_disable_tbe_pred_i_frame;
	uint32_t		enc_disable_tbe_pred_p_frame;
	uint32_t		use_fme_interpol_y;
	uint32_t		use_fme_interpol_uv;
	uint32_t		use_fme_intrapol_y;
	uint32_t		use_fme_intrapol_uv;
	uint32_t		use_fme_interpol_y_1;
	uint32_t		use_fme_interpol_uv_1;
	uint32_t		use_fme_intrapol_y_1;
	uint32_t		use_fme_intrapol_uv_1;
	uint32_t		enc_16x16_cost_adj;
	uint32_t		enc_skip_cost_adj;
	uint32_t		enc_force_16x16_skip;
	uint32_t		enc_disable_threshold_calc_a;
	uint32_t		enc_luma_coeff_cost;
	uint32_t		enc_luma_mb_coeff_cost;
	uint32_t		enc_chroma_coeff_cost;
};

/*
 * VUI parameter block; every member is a 32-bit unsigned value.
 *
 * NOTE(review): the member names closely follow the H.264 VUI / HRD syntax
 * element names, and the member order presumably mirrors a firmware packet
 * layout; confirm against the vui callbacks before reordering.
 */
struct rvce_vui {
	uint32_t		aspect_ratio_info_present_flag;
	uint32_t		aspect_ratio_idc;
	uint32_t		sar_width;
	uint32_t		sar_height;
	uint32_t		overscan_info_present_flag;
	/* NOTE(review): unusual capitalisation; presumably corresponds to
	 * overscan_appropriate_flag. Left unchanged because renaming a
	 * member would break existing users. */
	uint32_t		overscan_Approp_flag;
	uint32_t		video_signal_type_present_flag;
	uint32_t		video_format;
	uint32_t		video_full_range_flag;
	uint32_t		color_description_present_flag;
	uint32_t		color_prim;
	uint32_t		transfer_char;
	uint32_t		matrix_coef;
	uint32_t		chroma_loc_info_present_flag;
	uint32_t		chroma_loc_top;
	uint32_t		chroma_loc_bottom;
	uint32_t		timing_info_present_flag;
	uint32_t		num_units_in_tick;
	uint32_t		time_scale;
	uint32_t		fixed_frame_rate_flag;
	uint32_t		nal_hrd_parameters_present_flag;
	uint32_t		cpb_cnt_minus1;
	uint32_t		bit_rate_scale;
	uint32_t		cpb_size_scale;
	uint32_t		bit_rate_value_minus;
	uint32_t		cpb_size_value_minus;
	uint32_t		cbr_flag;
	uint32_t		initial_cpb_removal_delay_length_minus1;
	uint32_t		cpb_removal_delay_length_minus1;
	uint32_t		dpb_output_delay_length_minus1;
	uint32_t		time_offset_length;
	uint32_t		low_delay_hrd_flag;
	uint32_t		pic_struct_present_flag;
	uint32_t		bitstream_restriction_present_flag;
	uint32_t		motion_vectors_over_pic_boundaries_flag;
	uint32_t		max_bytes_per_pic_denom;
	uint32_t		max_bits_per_mb_denom;
	uint32_t		log2_max_mv_length_hori;
	uint32_t		log2_max_mv_length_vert;
	uint32_t		num_reorder_frames;
	uint32_t		max_dec_frame_buffering;
};

/*
 * Encode-operation parameter block; 70 members, each a 32-bit unsigned
 * value.
 *
 * The members fall into these runs, in declaration order: general
 * per-picture flags, input picture addresses and pitches, picture
 * type / reference-list control, the l0_* and l1_* reference descriptions,
 * reconstructed / reference picture offsets, picture counters, and the
 * aq_* parameters.
 *
 * NOTE(review): the member order presumably mirrors a firmware packet
 * layout; confirm against the encode callbacks before reordering.
 */
struct rvce_enc_operation {
	uint32_t		insert_headers;
	uint32_t		picture_structure;
	uint32_t		allowed_max_bitstream_size;
	uint32_t		force_refresh_map;
	uint32_t		insert_aud;
	uint32_t		end_of_sequence;
	uint32_t		end_of_stream;
	/* Input picture addresses, each split into high and low words. */
	uint32_t		input_picture_luma_address_hi;
	uint32_t		input_picture_luma_address_lo;
	uint32_t		input_picture_chroma_address_hi;
	uint32_t		input_picture_chroma_address_lo;
	uint32_t		enc_input_frame_y_pitch;
	uint32_t		enc_input_pic_luma_pitch;
	uint32_t		enc_input_pic_chroma_pitch;
	uint32_t		enc_input_pic_addr_array;
	uint32_t		enc_input_pic_addr_array_disable2pipe_disablemboffload;
	uint32_t		enc_input_pic_tile_config;
	uint32_t		enc_pic_type;
	uint32_t		enc_idr_flag;
	uint32_t		enc_idr_pic_id;
	uint32_t		enc_mgs_key_pic;
	uint32_t		enc_reference_flag;
	uint32_t		enc_temporal_layer_index;
	uint32_t		num_ref_idx_active_override_flag;
	uint32_t		num_ref_idx_l0_active_minus1;
	uint32_t		num_ref_idx_l1_active_minus1;
	uint32_t		enc_ref_list_modification_op;
	uint32_t		enc_ref_list_modification_num;
	uint32_t		enc_decoded_picture_marking_op;
	uint32_t		enc_decoded_picture_marking_num;
	uint32_t		enc_decoded_picture_marking_idx;
	uint32_t		enc_decoded_ref_base_picture_marking_op;
	uint32_t		enc_decoded_ref_base_picture_marking_num;
	/* Description of the l0 reference. */
	uint32_t		l0_picture_structure;
	uint32_t		l0_enc_pic_type;
	uint32_t		l0_frame_number;
	uint32_t		l0_picture_order_count;
	uint32_t		l0_luma_offset;
	uint32_t		l0_chroma_offset;
	/* Description of the l1 reference; same six members as for l0. */
	uint32_t		l1_picture_structure;
	uint32_t		l1_enc_pic_type;
	uint32_t		l1_frame_number;
	uint32_t		l1_picture_order_count;
	uint32_t		l1_luma_offset;
	uint32_t		l1_chroma_offset;
	uint32_t		enc_reconstructed_luma_offset;
	uint32_t		enc_reconstructed_chroma_offset;
	uint32_t		enc_coloc_buffer_offset;
	uint32_t		enc_reconstructed_ref_base_picture_luma_offset;
	uint32_t		enc_reconstructed_ref_base_picture_chroma_offset;
	uint32_t		enc_reference_ref_base_picture_luma_offset;
	uint32_t		enc_reference_ref_base_picture_chroma_offset;
	uint32_t		picture_count;
	uint32_t		frame_number;
	uint32_t		picture_order_count;
	uint32_t		num_i_pic_remain_in_rcgop;
	uint32_t		num_p_pic_remain_in_rcgop;
	uint32_t		num_b_pic_remain_in_rcgop;
	uint32_t		num_ir_pic_remain_in_rcgop;
	uint32_t		enable_intra_refresh;
	uint32_t		aq_variance_en;
	uint32_t		aq_block_size;
	uint32_t		aq_mb_variance_sel;
	uint32_t		aq_frame_variance_sel;
	uint32_t		aq_param_a;
	uint32_t		aq_param_b;
	uint32_t		aq_param_c;
	uint32_t		aq_param_d;
	uint32_t		aq_param_e;
	uint32_t		context_in_sfb;
};

/*
 * Encoder-creation parameter block; every member is a 32-bit unsigned
 * value.
 *
 * NOTE(review): the two long member names that concatenate several terms
 * presumably denote several values packed into one 32-bit word; confirm the
 * bit layout in the version-specific sources.
 */
struct rvce_enc_create {
	uint32_t		enc_use_circular_buffer;
	uint32_t		enc_profile;
	uint32_t		enc_level;
	uint32_t		enc_pic_struct_restriction;
	uint32_t		enc_image_width;
	uint32_t		enc_image_height;
	uint32_t		enc_ref_pic_luma_pitch;
	uint32_t		enc_ref_pic_chroma_pitch;
	uint32_t		enc_ref_y_height_in_qw;
	uint32_t		enc_ref_pic_addr_array_enc_pic_struct_restriction_disable_rdo;
	uint32_t		enc_pre_encode_context_buffer_offset;
	uint32_t		enc_pre_encode_input_luma_buffer_offset;
	uint32_t		enc_pre_encode_input_chroma_buffer_offset;
	uint32_t		enc_pre_encode_mode_chromaflag_vbaqmode_scenechangesensitivity;
};

/* Config-extension parameter block; currently a single 32-bit member. */
struct rvce_config_ext {
	uint32_t		enc_enable_perf_logging;
};

/*
 * Aggregate H.264 encode state: one instance of each parameter block
 * declared above, followed by additional per-picture bookkeeping members.
 * Embedded in struct rvce_encoder as `enc_pic`.
 */
struct rvce_h264_enc_pic {
	struct rvce_rate_control rc;
	struct rvce_motion_estimation me;
	struct rvce_pic_control pc;
	struct rvce_task_info ti;
	struct rvce_feedback_buf_pkg fb;
	struct rvce_rdo rdo;
	struct rvce_vui vui;
	struct rvce_enc_operation eo;
	struct rvce_enc_create ec;
	struct rvce_config_ext ce;

	/* Distinct from the identically named members of `rc`. */
	unsigned quant_i_frames;
	unsigned quant_p_frames;
	unsigned quant_b_frames;

	enum pipe_h264_enc_picture_type picture_type;
	unsigned frame_num;
	unsigned frame_num_cnt;
	unsigned p_remain;
	unsigned i_remain;
	unsigned idr_pic_id;
	unsigned gop_cnt;
	/* Distinct from rc.gop_size. */
	unsigned gop_size;
	unsigned pic_order_cnt;
	unsigned ref_idx_l0;
	unsigned ref_idx_l1;
	unsigned addrmode_arraymode_disrdo_distwoinstants;

	bool not_referenced;
	bool is_idr;
	bool has_ref_pic_list;
	bool enable_vui;
	/* Fixed-size tables of 32 entries each. */
	unsigned int ref_pic_list_0[32];
	unsigned int ref_pic_list_1[32];
	unsigned int frame_idx[32];
};

/* VCE encoder representation */
/*
 * `base` is the first member, so a pointer to this struct and a pointer to
 * its pipe_video_codec refer to the same address.
 */
struct rvce_encoder {
	struct pipe_video_codec		base;

	/* version specific packets */
	/* NOTE(review): presumably installed by the si_vce_*_init()
	 * functions declared further down in this header. */
	void (*session)(struct rvce_encoder *enc);
	void (*create)(struct rvce_encoder *enc);
	void (*feedback)(struct rvce_encoder *enc);
	void (*rate_control)(struct rvce_encoder *enc);
	void (*config_extension)(struct rvce_encoder *enc);
	void (*pic_control)(struct rvce_encoder *enc);
	void (*motion_estimation)(struct rvce_encoder *enc);
	void (*rdo)(struct rvce_encoder *enc);
	void (*vui)(struct rvce_encoder *enc);
	void (*config)(struct rvce_encoder *enc);
	void (*encode)(struct rvce_encoder *enc);
	void (*destroy)(struct rvce_encoder *enc);
	/* The only callback that takes arguments besides the encoder. */
	void (*task_info)(struct rvce_encoder *enc, uint32_t op,
			  uint32_t dep, uint32_t fb_idx,
			  uint32_t ring_idx);

	unsigned			stream_handle;

	struct pipe_screen		*screen;
	struct radeon_winsys*		ws;
	/* Command stream written to by the RVCE_* macros. */
	struct radeon_cmdbuf*	cs;

	/* Driver-dependent callback; see the rvce_get_buffer typedef. */
	rvce_get_buffer			get_buffer;

	struct pb_buffer*	handle;
	struct radeon_surf*		luma;
	struct radeon_surf*		chroma;

	/* NOTE(review): "bs" presumably stands for bitstream. */
	struct pb_buffer*	bs_handle;
	unsigned			bs_size;

	/* Coded picture buffer slots: an array pointer, a list head and a
	 * count. struct rvce_cpb_slot carries the matching list link. */
	struct rvce_cpb_slot		*cpb_array;
	struct list_head		cpb_slots;
	unsigned			cpb_num;

	/* Note: `fb` is a pointer while `cpb` is embedded by value. */
	struct rvid_buffer		*fb;
	struct rvid_buffer		cpb;
	struct pipe_h264_enc_picture_desc pic;
	struct rvce_h264_enc_pic	enc_pic;

	unsigned			task_info_idx;
	unsigned			bs_idx;

	bool				use_vm;
	bool				use_vui;
	bool				dual_pipe;
	bool				dual_inst;
};

/* CPB handling functions */
/* Each of the three lookups below takes the encoder and returns a pointer
 * to a CPB slot. NOTE(review): which slot each one selects is defined in
 * the implementation file, not visible here. */
struct rvce_cpb_slot *si_current_slot(struct rvce_encoder *enc);
struct rvce_cpb_slot *si_l0_slot(struct rvce_encoder *enc);
struct rvce_cpb_slot *si_l1_slot(struct rvce_encoder *enc);
/* Takes a slot and reports two signed offsets through the output pointers
 * `luma_offset` and `chroma_offset`. */
void si_vce_frame_offset(struct rvce_encoder *enc, struct rvce_cpb_slot *slot,
			 signed *luma_offset, signed *chroma_offset);

/*
 * Create a VCE encoder.
 *
 * Takes the pipe context, a read-only codec template, the winsys and the
 * driver-dependent get_buffer callback; returns a pipe_video_codec pointer.
 * NOTE(review): failure behaviour (e.g. a NULL return) is not visible from
 * this header; check the implementation.
 */
struct pipe_video_codec *si_vce_create_encoder(struct pipe_context *context,
					       const struct pipe_video_codec *templat,
					       struct radeon_winsys* ws,
					       rvce_get_buffer get_buffer);

/* Returns a boolean for the given screen. NOTE(review): presumably true
 * when the VCE firmware version is one this driver can drive; the list of
 * accepted versions lives in the implementation. */
bool si_vce_is_fw_version_supported(struct si_screen *sscreen);

/* Backend of the RVCE_READ / RVCE_WRITE / RVCE_READWRITE macros, which
 * forward their arguments here together with the matching usage flag.
 * `offset` is signed. */
void si_vce_add_buffer(struct rvce_encoder *enc, struct pb_buffer *buf,
		       enum radeon_bo_usage usage, enum radeon_bo_domain domain,
		       signed offset);

/* One initialiser per supported firmware generation; each takes the encoder
 * whose callbacks it sets up. */

/* init vce fw 40.2.2 specific callbacks */
void si_vce_40_2_2_init(struct rvce_encoder *enc);

/* init vce fw 50 specific callbacks */
void si_vce_50_init(struct rvce_encoder *enc);

/* init vce fw 52 specific callbacks */
void si_vce_52_init(struct rvce_encoder *enc);

/* version specific function for getting parameters */
/* NOTE(review): this declares a function-pointer object without `extern`,
 * so every translation unit including this header gets its own tentative
 * definition. Toolchains that default to -fno-common (e.g. GCC 10 and
 * later) report that as a multiple-definition link error. Consider making
 * this `extern` with a single definition in one .c file, or moving the
 * pointer out of the header altogether. */
void (*si_get_pic_param)(struct rvce_encoder *enc,
                      struct pipe_h264_enc_picture_desc *pic);

/* The three functions below share the signature of the si_get_pic_param
 * function pointer, so any of them can be assigned to it. */

/* get parameters for vce 40.2.2 */
void si_vce_40_2_2_get_param(struct rvce_encoder *enc,
			     struct pipe_h264_enc_picture_desc *pic);

/* get parameters for vce 50 */
void si_vce_50_get_param(struct rvce_encoder *enc,
			 struct pipe_h264_enc_picture_desc *pic);

/* get parameters for vce 52 */
void si_vce_52_get_param(struct rvce_encoder *enc,
			 struct pipe_h264_enc_picture_desc *pic);

#endif