radeon/vcn: implement vcn 2.0 jpeg decode
[mesa.git] / src / gallium / drivers / radeon / radeon_video.c
1 /**************************************************************************
2 *
3 * Copyright 2013 Advanced Micro Devices, Inc.
4 * All Rights Reserved.
5 *
6 * Permission is hereby granted, free of charge, to any person obtaining a
7 * copy of this software and associated documentation files (the
8 * "Software"), to deal in the Software without restriction, including
9 * without limitation the rights to use, copy, modify, merge, publish,
10 * distribute, sub license, and/or sell copies of the Software, and to
11 * permit persons to whom the Software is furnished to do so, subject to
12 * the following conditions:
13 *
14 * The above copyright notice and this permission notice (including the
15 * next paragraph) shall be included in all copies or substantial portions
16 * of the Software.
17 *
18 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS
19 * OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF
20 * MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND NON-INFRINGEMENT.
21 * IN NO EVENT SHALL THE COPYRIGHT HOLDER(S) OR AUTHOR(S) BE LIABLE FOR
22 * ANY CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT,
23 * TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN CONNECTION WITH THE
24 * SOFTWARE OR THE USE OR OTHER DEALINGS IN THE SOFTWARE.
25 *
26 **************************************************************************/
27
28 #include <unistd.h>
29
30 #include "util/u_memory.h"
31 #include "util/u_video.h"
32
33 #include "vl/vl_defines.h"
34 #include "vl/vl_video_buffer.h"
35
36 #include "radeonsi/si_pipe.h"
37 #include "radeon_video.h"
38 #include "radeon_vce.h"
39
40 /* generate an stream handle */
41 unsigned si_vid_alloc_stream_handle()
42 {
43 static unsigned counter = 0;
44 unsigned stream_handle = 0;
45 unsigned pid = getpid();
46 int i;
47
48 for (i = 0; i < 32; ++i)
49 stream_handle |= ((pid >> i) & 1) << (31 - i);
50
51 stream_handle ^= ++counter;
52 return stream_handle;
53 }
54
55 /* create a buffer in the winsys */
56 bool si_vid_create_buffer(struct pipe_screen *screen, struct rvid_buffer *buffer,
57 unsigned size, unsigned usage)
58 {
59 memset(buffer, 0, sizeof(*buffer));
60 buffer->usage = usage;
61
62 /* Hardware buffer placement restrictions require the kernel to be
63 * able to move buffers around individually, so request a
64 * non-sub-allocated buffer.
65 */
66 buffer->res = si_resource(pipe_buffer_create(screen, PIPE_BIND_SHARED,
67 usage, size));
68
69 return buffer->res != NULL;
70 }
71
72 /* destroy a buffer */
73 void si_vid_destroy_buffer(struct rvid_buffer *buffer)
74 {
75 si_resource_reference(&buffer->res, NULL);
76 }
77
78 /* reallocate a buffer, preserving its content */
79 bool si_vid_resize_buffer(struct pipe_screen *screen, struct radeon_cmdbuf *cs,
80 struct rvid_buffer *new_buf, unsigned new_size)
81 {
82 struct si_screen *sscreen = (struct si_screen *)screen;
83 struct radeon_winsys* ws = sscreen->ws;
84 unsigned bytes = MIN2(new_buf->res->buf->size, new_size);
85 struct rvid_buffer old_buf = *new_buf;
86 void *src = NULL, *dst = NULL;
87
88 if (!si_vid_create_buffer(screen, new_buf, new_size, new_buf->usage))
89 goto error;
90
91 src = ws->buffer_map(old_buf.res->buf, cs,
92 PIPE_TRANSFER_READ | RADEON_TRANSFER_TEMPORARY);
93 if (!src)
94 goto error;
95
96 dst = ws->buffer_map(new_buf->res->buf, cs,
97 PIPE_TRANSFER_WRITE | RADEON_TRANSFER_TEMPORARY);
98 if (!dst)
99 goto error;
100
101 memcpy(dst, src, bytes);
102 if (new_size > bytes) {
103 new_size -= bytes;
104 dst += bytes;
105 memset(dst, 0, new_size);
106 }
107 ws->buffer_unmap(new_buf->res->buf);
108 ws->buffer_unmap(old_buf.res->buf);
109 si_vid_destroy_buffer(&old_buf);
110 return true;
111
112 error:
113 if (src)
114 ws->buffer_unmap(old_buf.res->buf);
115 si_vid_destroy_buffer(new_buf);
116 *new_buf = old_buf;
117 return false;
118 }
119
120 /* clear the buffer with zeros */
121 void si_vid_clear_buffer(struct pipe_context *context, struct rvid_buffer* buffer)
122 {
123 struct si_context *sctx = (struct si_context*)context;
124
125 si_sdma_clear_buffer(sctx, &buffer->res->b.b, 0, buffer->res->buf->size, 0);
126 context->flush(context, NULL, 0);
127 }
128
129 /**
130 * join surfaces into the same buffer with identical tiling params
131 * sumup their sizes and replace the backend buffers with a single bo
132 */
133 void si_vid_join_surfaces(struct si_context *sctx,
134 struct pb_buffer** buffers[VL_NUM_COMPONENTS],
135 struct radeon_surf *surfaces[VL_NUM_COMPONENTS])
136 {
137 struct radeon_winsys *ws = sctx->ws;;
138 unsigned best_tiling, best_wh, off;
139 unsigned size, alignment;
140 struct pb_buffer *pb;
141 unsigned i, j;
142
143 for (i = 0, best_tiling = 0, best_wh = ~0; i < VL_NUM_COMPONENTS; ++i) {
144 unsigned wh;
145
146 if (!surfaces[i])
147 continue;
148
149 if (sctx->chip_class < GFX9) {
150 /* choose the smallest bank w/h for now */
151 wh = surfaces[i]->u.legacy.bankw * surfaces[i]->u.legacy.bankh;
152 if (wh < best_wh) {
153 best_wh = wh;
154 best_tiling = i;
155 }
156 }
157 }
158
159 for (i = 0, off = 0; i < VL_NUM_COMPONENTS; ++i) {
160 if (!surfaces[i])
161 continue;
162
163 /* adjust the texture layer offsets */
164 off = align(off, surfaces[i]->surf_alignment);
165
166 if (sctx->chip_class < GFX9) {
167 /* copy the tiling parameters */
168 surfaces[i]->u.legacy.bankw = surfaces[best_tiling]->u.legacy.bankw;
169 surfaces[i]->u.legacy.bankh = surfaces[best_tiling]->u.legacy.bankh;
170 surfaces[i]->u.legacy.mtilea = surfaces[best_tiling]->u.legacy.mtilea;
171 surfaces[i]->u.legacy.tile_split = surfaces[best_tiling]->u.legacy.tile_split;
172
173 for (j = 0; j < ARRAY_SIZE(surfaces[i]->u.legacy.level); ++j)
174 surfaces[i]->u.legacy.level[j].offset += off;
175 } else {
176 surfaces[i]->u.gfx9.surf_offset += off;
177 for (j = 0; j < ARRAY_SIZE(surfaces[i]->u.gfx9.offset); ++j)
178 surfaces[i]->u.gfx9.offset[j] += off;
179 }
180
181 off += surfaces[i]->surf_size;
182 }
183
184 for (i = 0, size = 0, alignment = 0; i < VL_NUM_COMPONENTS; ++i) {
185 if (!buffers[i] || !*buffers[i])
186 continue;
187
188 size = align(size, (*buffers[i])->alignment);
189 size += (*buffers[i])->size;
190 alignment = MAX2(alignment, (*buffers[i])->alignment * 1);
191 }
192
193 if (!size)
194 return;
195
196 /* TODO: 2D tiling workaround */
197 alignment *= 2;
198
199 pb = ws->buffer_create(ws, size, alignment, RADEON_DOMAIN_VRAM,
200 RADEON_FLAG_GTT_WC);
201 if (!pb)
202 return;
203
204 for (i = 0; i < VL_NUM_COMPONENTS; ++i) {
205 if (!buffers[i] || !*buffers[i])
206 continue;
207
208 pb_reference(buffers[i], pb);
209 }
210
211 pb_reference(&pb, NULL);
212 }