radeon/vce: implement non-referenced frames
[mesa.git] / src / gallium / drivers / radeon / radeon_vce.c
1 /**************************************************************************
2 *
3 * Copyright 2013 Advanced Micro Devices, Inc.
4 * All Rights Reserved.
5 *
6 * Permission is hereby granted, free of charge, to any person obtaining a
7 * copy of this software and associated documentation files (the
8 * "Software"), to deal in the Software without restriction, including
9 * without limitation the rights to use, copy, modify, merge, publish,
10 * distribute, sub license, and/or sell copies of the Software, and to
11 * permit persons to whom the Software is furnished to do so, subject to
12 * the following conditions:
13 *
14 * The above copyright notice and this permission notice (including the
15 * next paragraph) shall be included in all copies or substantial portions
16 * of the Software.
17 *
18 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS
19 * OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF
20 * MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND NON-INFRINGEMENT.
21 * IN NO EVENT SHALL THE COPYRIGHT HOLDER(S) OR AUTHOR(S) BE LIABLE FOR
22 * ANY CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT,
23 * TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN CONNECTION WITH THE
24 * SOFTWARE OR THE USE OR OTHER DEALINGS IN THE SOFTWARE.
25 *
26 **************************************************************************/
27
28 /*
29 * Authors:
30 * Christian König <christian.koenig@amd.com>
31 *
32 */
33
34 #include <stdio.h>
35
36 #include "pipe/p_video_codec.h"
37
38 #include "util/u_video.h"
39 #include "util/u_memory.h"
40
41 #include "vl/vl_video_buffer.h"
42
43 #include "../../winsys/radeon/drm/radeon_winsys.h"
44 #include "r600_pipe_common.h"
45 #include "radeon_video.h"
46 #include "radeon_vce.h"
47
48 /**
49 * flush commands to the hardware
50 */
51 static void flush(struct rvce_encoder *enc)
52 {
53 enc->ws->cs_flush(enc->cs, RADEON_FLUSH_ASYNC, NULL, 0);
54 }
55
56 #if 0
57 static void dump_feedback(struct rvce_encoder *enc, struct rvid_buffer *fb)
58 {
59 uint32_t *ptr = enc->ws->buffer_map(fb->cs_handle, enc->cs, PIPE_TRANSFER_READ_WRITE);
60 unsigned i = 0;
61 fprintf(stderr, "\n");
62 fprintf(stderr, "encStatus:\t\t\t%08x\n", ptr[i++]);
63 fprintf(stderr, "encHasBitstream:\t\t%08x\n", ptr[i++]);
64 fprintf(stderr, "encHasAudioBitstream:\t\t%08x\n", ptr[i++]);
65 fprintf(stderr, "encBitstreamOffset:\t\t%08x\n", ptr[i++]);
66 fprintf(stderr, "encBitstreamSize:\t\t%08x\n", ptr[i++]);
67 fprintf(stderr, "encAudioBitstreamOffset:\t%08x\n", ptr[i++]);
68 fprintf(stderr, "encAudioBitstreamSize:\t\t%08x\n", ptr[i++]);
69 fprintf(stderr, "encExtrabytes:\t\t\t%08x\n", ptr[i++]);
70 fprintf(stderr, "encAudioExtrabytes:\t\t%08x\n", ptr[i++]);
71 fprintf(stderr, "videoTimeStamp:\t\t\t%08x\n", ptr[i++]);
72 fprintf(stderr, "audioTimeStamp:\t\t\t%08x\n", ptr[i++]);
73 fprintf(stderr, "videoOutputType:\t\t%08x\n", ptr[i++]);
74 fprintf(stderr, "attributeFlags:\t\t\t%08x\n", ptr[i++]);
75 fprintf(stderr, "seiPrivatePackageOffset:\t%08x\n", ptr[i++]);
76 fprintf(stderr, "seiPrivatePackageSize:\t\t%08x\n", ptr[i++]);
77 fprintf(stderr, "\n");
78 enc->ws->buffer_unmap(fb->cs_handle);
79 }
80 #endif
81
82 /**
83 * reset the CPB handling
84 */
85 static void reset_cpb(struct rvce_encoder *enc)
86 {
87 unsigned i;
88
89 LIST_INITHEAD(&enc->cpb_slots);
90 for (i = 0; i < RVCE_NUM_CPB_FRAMES; ++i) {
91 struct rvce_cpb_slot *slot = &enc->cpb_array[i];
92 slot->index = i;
93 slot->picture_type = PIPE_H264_ENC_PICTURE_TYPE_SKIP;
94 slot->frame_num = 0;
95 slot->pic_order_cnt = 0;
96 LIST_ADDTAIL(&slot->list, &enc->cpb_slots);
97 }
98 }
99
100 /**
101 * sort l0 and l1 to the top of the list
102 */
103 static void sort_cpb(struct rvce_encoder *enc)
104 {
105 struct rvce_cpb_slot *i, *l0 = NULL, *l1 = NULL;
106
107 LIST_FOR_EACH_ENTRY(i, &enc->cpb_slots, list) {
108 if (i->frame_num == enc->pic.ref_idx_l0)
109 l0 = i;
110
111 if (i->frame_num == enc->pic.ref_idx_l1)
112 l1 = i;
113
114 if (enc->pic.picture_type == PIPE_H264_ENC_PICTURE_TYPE_P && l0)
115 break;
116
117 if (enc->pic.picture_type == PIPE_H264_ENC_PICTURE_TYPE_B &&
118 l0 && l1)
119 break;
120 }
121
122 if (l1) {
123 LIST_DEL(&l1->list);
124 LIST_ADD(&l1->list, &enc->cpb_slots);
125 }
126
127 if (l0) {
128 LIST_DEL(&l0->list);
129 LIST_ADD(&l0->list, &enc->cpb_slots);
130 }
131 }
132
133 /**
134 * destroy this video encoder
135 */
136 static void rvce_destroy(struct pipe_video_codec *encoder)
137 {
138 struct rvce_encoder *enc = (struct rvce_encoder*)encoder;
139 if (enc->stream_handle) {
140 struct rvid_buffer fb;
141 rvid_create_buffer(enc->ws, &fb, 512, RADEON_DOMAIN_GTT);
142 enc->fb = &fb;
143 enc->session(enc);
144 enc->feedback(enc);
145 enc->destroy(enc);
146 flush(enc);
147 rvid_destroy_buffer(&fb);
148 }
149 rvid_destroy_buffer(&enc->cpb);
150 enc->ws->cs_destroy(enc->cs);
151 FREE(enc->cpb_array);
152 FREE(enc);
153 }
154
155 static void rvce_begin_frame(struct pipe_video_codec *encoder,
156 struct pipe_video_buffer *source,
157 struct pipe_picture_desc *picture)
158 {
159 struct rvce_encoder *enc = (struct rvce_encoder*)encoder;
160 struct vl_video_buffer *vid_buf = (struct vl_video_buffer *)source;
161 struct pipe_h264_enc_picture_desc *pic = (struct pipe_h264_enc_picture_desc *)picture;
162
163 bool need_rate_control =
164 enc->pic.rate_ctrl.rate_ctrl_method != pic->rate_ctrl.rate_ctrl_method ||
165 enc->pic.quant_i_frames != pic->quant_i_frames ||
166 enc->pic.quant_p_frames != pic->quant_p_frames ||
167 enc->pic.quant_b_frames != pic->quant_b_frames;
168
169 enc->pic = *pic;
170
171 enc->get_buffer(vid_buf->resources[0], &enc->handle, &enc->luma);
172 enc->get_buffer(vid_buf->resources[1], NULL, &enc->chroma);
173
174 if (pic->picture_type == PIPE_H264_ENC_PICTURE_TYPE_IDR)
175 reset_cpb(enc);
176 else if (pic->picture_type == PIPE_H264_ENC_PICTURE_TYPE_P ||
177 pic->picture_type == PIPE_H264_ENC_PICTURE_TYPE_B)
178 sort_cpb(enc);
179
180 if (!enc->stream_handle) {
181 struct rvid_buffer fb;
182 enc->stream_handle = rvid_alloc_stream_handle();
183 rvid_create_buffer(enc->ws, &fb, 512, RADEON_DOMAIN_GTT);
184 enc->fb = &fb;
185 enc->session(enc);
186 enc->create(enc);
187 enc->rate_control(enc);
188 need_rate_control = false;
189 enc->config_extension(enc);
190 enc->motion_estimation(enc);
191 enc->rdo(enc);
192 enc->pic_control(enc);
193 enc->feedback(enc);
194 flush(enc);
195 //dump_feedback(enc, &fb);
196 rvid_destroy_buffer(&fb);
197 }
198
199 enc->session(enc);
200
201 if (need_rate_control)
202 enc->rate_control(enc);
203 }
204
205 static void rvce_encode_bitstream(struct pipe_video_codec *encoder,
206 struct pipe_video_buffer *source,
207 struct pipe_resource *destination,
208 void **fb)
209 {
210 struct rvce_encoder *enc = (struct rvce_encoder*)encoder;
211 enc->get_buffer(destination, &enc->bs_handle, NULL);
212 enc->bs_size = destination->width0;
213
214 *fb = enc->fb = CALLOC_STRUCT(rvid_buffer);
215 if (!rvid_create_buffer(enc->ws, enc->fb, 512, RADEON_DOMAIN_GTT)) {
216 RVID_ERR("Can't create feedback buffer.\n");
217 return;
218 }
219 enc->encode(enc);
220 enc->feedback(enc);
221 }
222
223 static void rvce_end_frame(struct pipe_video_codec *encoder,
224 struct pipe_video_buffer *source,
225 struct pipe_picture_desc *picture)
226 {
227 struct rvce_encoder *enc = (struct rvce_encoder*)encoder;
228 struct rvce_cpb_slot *slot = LIST_ENTRY(
229 struct rvce_cpb_slot, enc->cpb_slots.prev, list);
230
231 flush(enc);
232
233 /* update the CPB backtrack with the just encoded frame */
234 slot->picture_type = enc->pic.picture_type;
235 slot->frame_num = enc->pic.frame_num;
236 slot->pic_order_cnt = enc->pic.pic_order_cnt;
237 if (!enc->pic.not_referenced) {
238 LIST_DEL(&slot->list);
239 LIST_ADD(&slot->list, &enc->cpb_slots);
240 }
241 }
242
243 static void rvce_get_feedback(struct pipe_video_codec *encoder,
244 void *feedback, unsigned *size)
245 {
246 struct rvce_encoder *enc = (struct rvce_encoder*)encoder;
247 struct rvid_buffer *fb = feedback;
248
249 if (size) {
250 uint32_t *ptr = enc->ws->buffer_map(fb->cs_handle, enc->cs, PIPE_TRANSFER_READ_WRITE);
251
252 if (ptr[1]) {
253 *size = ptr[4] - ptr[9];
254 } else {
255 *size = 0;
256 }
257
258 enc->ws->buffer_unmap(fb->cs_handle);
259 }
260 //dump_feedback(enc, fb);
261 rvid_destroy_buffer(fb);
262 FREE(fb);
263 }
264
265 /**
266 * flush any outstanding command buffers to the hardware
267 */
268 static void rvce_flush(struct pipe_video_codec *encoder)
269 {
270 }
271
272 static void rvce_cs_flush(void *ctx, unsigned flags,
273 struct pipe_fence_handle **fence)
274 {
275 // just ignored
276 }
277
278 struct pipe_video_codec *rvce_create_encoder(struct pipe_context *context,
279 const struct pipe_video_codec *templ,
280 struct radeon_winsys* ws,
281 rvce_get_buffer get_buffer)
282 {
283 struct r600_common_screen *rscreen = (struct r600_common_screen *)context->screen;
284 struct rvce_encoder *enc;
285 struct pipe_video_buffer *tmp_buf, templat = {};
286 struct radeon_surface *tmp_surf;
287 unsigned cpb_size;
288
289 if (!rscreen->info.vce_fw_version) {
290 RVID_ERR("Kernel doesn't supports VCE!\n");
291 return NULL;
292
293 } else if (!rvce_is_fw_version_supported(rscreen)) {
294 RVID_ERR("Unsupported VCE fw version loaded!\n");
295 return NULL;
296 }
297
298 enc = CALLOC_STRUCT(rvce_encoder);
299 if (!enc)
300 return NULL;
301
302 enc->base = *templ;
303 enc->base.context = context;
304
305 enc->base.destroy = rvce_destroy;
306 enc->base.begin_frame = rvce_begin_frame;
307 enc->base.encode_bitstream = rvce_encode_bitstream;
308 enc->base.end_frame = rvce_end_frame;
309 enc->base.flush = rvce_flush;
310 enc->base.get_feedback = rvce_get_feedback;
311 enc->get_buffer = get_buffer;
312
313 enc->ws = ws;
314 enc->cs = ws->cs_create(ws, RING_VCE, rvce_cs_flush, enc, NULL);
315 if (!enc->cs) {
316 RVID_ERR("Can't get command submission context.\n");
317 goto error;
318 }
319
320 templat.buffer_format = PIPE_FORMAT_NV12;
321 templat.chroma_format = PIPE_VIDEO_CHROMA_FORMAT_420;
322 templat.width = enc->base.width;
323 templat.height = enc->base.height;
324 templat.interlaced = false;
325 if (!(tmp_buf = context->create_video_buffer(context, &templat))) {
326 RVID_ERR("Can't create video buffer.\n");
327 goto error;
328 }
329
330 get_buffer(((struct vl_video_buffer *)tmp_buf)->resources[0], NULL, &tmp_surf);
331 cpb_size = align(tmp_surf->level[0].pitch_bytes, 128);
332 cpb_size = cpb_size * align(tmp_surf->npix_y, 16);
333 cpb_size = cpb_size * 3 / 2;
334 cpb_size = cpb_size * RVCE_NUM_CPB_FRAMES;
335 tmp_buf->destroy(tmp_buf);
336 if (!rvid_create_buffer(enc->ws, &enc->cpb, cpb_size, RADEON_DOMAIN_VRAM)) {
337 RVID_ERR("Can't create CPB buffer.\n");
338 goto error;
339 }
340
341 enc->cpb_array = CALLOC(RVCE_NUM_CPB_FRAMES, sizeof(struct rvce_cpb_slot));
342 if (!enc->cpb_array)
343 goto error;
344
345 reset_cpb(enc);
346
347 radeon_vce_40_2_2_init(enc);
348
349 return &enc->base;
350
351 error:
352 if (enc->cs)
353 enc->ws->cs_destroy(enc->cs);
354
355 rvid_destroy_buffer(&enc->cpb);
356
357 FREE(enc->cpb_array);
358 FREE(enc);
359 return NULL;
360 }
361
362 /**
363 * check if kernel has the right fw version loaded
364 */
365 bool rvce_is_fw_version_supported(struct r600_common_screen *rscreen)
366 {
367 return rscreen->info.vce_fw_version == ((40 << 24) | (2 << 16) | (2 << 8));
368 }