winsys/amdgpu: implement sync_file import/export
[mesa.git] / src / gallium / winsys / amdgpu / drm / amdgpu_cs.h
1 /*
2 * Copyright © 2011 Marek Olšák <maraeo@gmail.com>
3 * Copyright © 2015 Advanced Micro Devices, Inc.
4 * All Rights Reserved.
5 *
6 * Permission is hereby granted, free of charge, to any person obtaining
7 * a copy of this software and associated documentation files (the
8 * "Software"), to deal in the Software without restriction, including
9 * without limitation the rights to use, copy, modify, merge, publish,
10 * distribute, sub license, and/or sell copies of the Software, and to
11 * permit persons to whom the Software is furnished to do so, subject to
12 * the following conditions:
13 *
14 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND,
15 * EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES
16 * OF MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND
17 * NON-INFRINGEMENT. IN NO EVENT SHALL THE COPYRIGHT HOLDERS, AUTHORS
18 * AND/OR ITS SUPPLIERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
19 * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE,
20 * ARISING FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE
21 * USE OR OTHER DEALINGS IN THE SOFTWARE.
22 *
23 * The above copyright notice and this permission notice (including the
24 * next paragraph) shall be included in all copies or substantial portions
25 * of the Software.
26 */
27 /*
28 * Authors:
29 * Marek Olšák <maraeo@gmail.com>
30 */
31
32 #ifndef AMDGPU_CS_H
33 #define AMDGPU_CS_H
34
35 #include "amdgpu_bo.h"
36 #include "util/u_memory.h"
37 #include <amdgpu_drm.h>
38
39 struct amdgpu_ctx {
40 struct amdgpu_winsys *ws;
41 amdgpu_context_handle ctx;
42 amdgpu_bo_handle user_fence_bo;
43 uint64_t *user_fence_cpu_address_base;
44 int refcount;
45 unsigned initial_num_total_rejected_cs;
46 unsigned num_rejected_cs;
47 };
48
49 struct amdgpu_cs_buffer {
50 struct amdgpu_winsys_bo *bo;
51 union {
52 struct {
53 uint64_t priority_usage;
54 } real;
55 struct {
56 uint32_t real_idx; /* index of underlying real BO */
57 } slab;
58 } u;
59 enum radeon_bo_usage usage;
60 };
61
/* Kinds of IB owned by a CS.
 *
 * IB_NUM is not a kind: it is the count of kinds and sizes the per-type
 * "ib" array in struct amdgpu_cs_context, so it must remain last.
 */
enum ib_type {
   IB_MAIN,
   IB_NUM,
};
66
67 struct amdgpu_ib {
68 struct radeon_winsys_cs base;
69
70 /* A buffer out of which new IBs are allocated. */
71 struct pb_buffer *big_ib_buffer;
72 uint8_t *ib_mapped;
73 unsigned used_ib_space;
74 unsigned max_ib_size;
75 uint32_t *ptr_ib_size;
76 enum ib_type ib_type;
77 };
78
79 struct amdgpu_cs_context {
80 struct drm_amdgpu_cs_chunk_ib ib[IB_NUM];
81
82 /* Buffers. */
83 unsigned max_real_buffers;
84 unsigned num_real_buffers;
85 struct amdgpu_cs_buffer *real_buffers;
86
87 unsigned max_real_submit;
88 amdgpu_bo_handle *handles;
89 uint8_t *flags;
90
91 unsigned num_slab_buffers;
92 unsigned max_slab_buffers;
93 struct amdgpu_cs_buffer *slab_buffers;
94
95 unsigned num_sparse_buffers;
96 unsigned max_sparse_buffers;
97 struct amdgpu_cs_buffer *sparse_buffers;
98
99 int buffer_indices_hashlist[4096];
100
101 struct amdgpu_winsys_bo *last_added_bo;
102 unsigned last_added_bo_index;
103 unsigned last_added_bo_usage;
104 uint64_t last_added_bo_priority_usage;
105
106 struct pipe_fence_handle **fence_dependencies;
107 unsigned num_fence_dependencies;
108 unsigned max_fence_dependencies;
109
110 struct pipe_fence_handle *fence;
111
112 /* the error returned from cs_flush for non-async submissions */
113 int error_code;
114 };
115
116 struct amdgpu_cs {
117 struct amdgpu_ib main; /* must be first because this is inherited */
118 struct amdgpu_ctx *ctx;
119 enum ring_type ring_type;
120 struct drm_amdgpu_cs_chunk_fence fence_chunk;
121
122 /* We flip between these two CS. While one is being consumed
123 * by the kernel in another thread, the other one is being filled
124 * by the pipe driver. */
125 struct amdgpu_cs_context csc1;
126 struct amdgpu_cs_context csc2;
127 /* The currently-used CS. */
128 struct amdgpu_cs_context *csc;
129 /* The CS being currently-owned by the other thread. */
130 struct amdgpu_cs_context *cst;
131
132 /* Flush CS. */
133 void (*flush_cs)(void *ctx, unsigned flags, struct pipe_fence_handle **fence);
134 void *flush_data;
135
136 struct util_queue_fence flush_completed;
137 struct pipe_fence_handle *next_fence;
138 };
139
140 struct amdgpu_fence {
141 struct pipe_reference reference;
142 /* If ctx == NULL, this fence is syncobj-based. */
143 uint32_t syncobj;
144
145 struct amdgpu_winsys *ws;
146 struct amdgpu_ctx *ctx; /* submission context */
147 struct amdgpu_cs_fence fence;
148 uint64_t *user_fence_cpu_address;
149
150 /* If the fence is unknown due to an IB still being submitted
151 * in the other thread. */
152 volatile int submission_in_progress; /* bool (int for atomicity) */
153 volatile int signalled; /* bool (int for atomicity) */
154 };
155
156 static inline bool amdgpu_fence_is_syncobj(struct amdgpu_fence *fence)
157 {
158 return fence->ctx == NULL;
159 }
160
161 static inline void amdgpu_ctx_unref(struct amdgpu_ctx *ctx)
162 {
163 if (p_atomic_dec_zero(&ctx->refcount)) {
164 amdgpu_cs_ctx_free(ctx->ctx);
165 amdgpu_bo_free(ctx->user_fence_bo);
166 FREE(ctx);
167 }
168 }
169
170 static inline void amdgpu_fence_reference(struct pipe_fence_handle **dst,
171 struct pipe_fence_handle *src)
172 {
173 struct amdgpu_fence **rdst = (struct amdgpu_fence **)dst;
174 struct amdgpu_fence *rsrc = (struct amdgpu_fence *)src;
175
176 if (pipe_reference(&(*rdst)->reference, &rsrc->reference)) {
177 struct amdgpu_fence *fence = *rdst;
178
179 if (amdgpu_fence_is_syncobj(fence))
180 amdgpu_cs_destroy_syncobj(fence->ws->dev, fence->syncobj);
181 else
182 amdgpu_ctx_unref(fence->ctx);
183
184 FREE(fence);
185 }
186 *rdst = rsrc;
187 }
188
/* Looks up "bo" in the buffer lists of "cs".
 *
 * Callers in this header treat -1 as "not found" and any other value as an
 * index into the list matching the BO kind (real_buffers, sparse_buffers or
 * slab_buffers).
 */
int amdgpu_lookup_buffer(struct amdgpu_cs_context *cs,
                         struct amdgpu_winsys_bo *bo);
190
/* Downcasts the generic CS to the winsys IB. Valid because "base" is the
 * first member of struct amdgpu_ib. */
static inline struct amdgpu_ib *
amdgpu_ib(struct radeon_winsys_cs *base)
{
   struct amdgpu_ib *ib = (struct amdgpu_ib *)base;

   return ib;
}
196
197 static inline struct amdgpu_cs *
198 amdgpu_cs(struct radeon_winsys_cs *base)
199 {
200 assert(amdgpu_ib(base)->ib_type == IB_MAIN);
201 return (struct amdgpu_cs*)base;
202 }
203
/* Given a pointer to a member, returns a pointer to the structure that
 * contains it.
 *
 *   member_ptr        pointer to the embedded member
 *   container_type    type of the enclosing structure
 *   container_member  name of the member inside container_type
 *
 * The whole expansion is parenthesized so that the result can be used
 * directly in a larger expression, e.g. get_container(p, T, m)->field.
 * Without the outer parentheses "->" would bind to the char-pointer
 * arithmetic instead of to the cast result.
 */
#define get_container(member_ptr, container_type, container_member) \
   ((container_type *)((char *)(member_ptr) - \
                       offsetof(container_type, container_member)))
206
207 static inline struct amdgpu_cs *
208 amdgpu_cs_from_ib(struct amdgpu_ib *ib)
209 {
210 switch (ib->ib_type) {
211 case IB_MAIN:
212 return get_container(ib, struct amdgpu_cs, main);
213 default:
214 unreachable("bad ib_type");
215 }
216 }
217
218 static inline bool
219 amdgpu_bo_is_referenced_by_cs(struct amdgpu_cs *cs,
220 struct amdgpu_winsys_bo *bo)
221 {
222 int num_refs = bo->num_cs_references;
223 return num_refs == bo->ws->num_cs ||
224 (num_refs && amdgpu_lookup_buffer(cs->csc, bo) != -1);
225 }
226
227 static inline bool
228 amdgpu_bo_is_referenced_by_cs_with_usage(struct amdgpu_cs *cs,
229 struct amdgpu_winsys_bo *bo,
230 enum radeon_bo_usage usage)
231 {
232 int index;
233 struct amdgpu_cs_buffer *buffer;
234
235 if (!bo->num_cs_references)
236 return false;
237
238 index = amdgpu_lookup_buffer(cs->csc, bo);
239 if (index == -1)
240 return false;
241
242 buffer = bo->bo ? &cs->csc->real_buffers[index] :
243 bo->sparse ? &cs->csc->sparse_buffers[index] :
244 &cs->csc->slab_buffers[index];
245
246 return (buffer->usage & usage) != 0;
247 }
248
249 static inline bool
250 amdgpu_bo_is_referenced_by_any_cs(struct amdgpu_winsys_bo *bo)
251 {
252 return bo->num_cs_references != 0;
253 }
254
/* Functions declared here and defined outside this header.
 * NOTE(review): the descriptions below are inferred from names and
 * signatures only -- confirm against the definitions. */

/* Waits on a fence; "absolute" presumably selects whether "timeout" is an
 * absolute time rather than a relative one. */
bool amdgpu_fence_wait(struct pipe_fence_handle *fence,
                       uint64_t timeout,
                       bool absolute);

/* Attaches "num_fences" fences from the "fences" array to "bo". */
void amdgpu_add_fences(struct amdgpu_winsys_bo *bo,
                       unsigned num_fences,
                       struct pipe_fence_handle **fences);

void amdgpu_cs_sync_flush(struct radeon_winsys_cs *rcs);

void amdgpu_cs_init_functions(struct amdgpu_winsys *ws);

/* The (job, thread_index) signature suggests a worker-queue job callback. */
void amdgpu_cs_submit_ib(void *job, int thread_index);
261 void amdgpu_cs_init_functions(struct amdgpu_winsys *ws);
262 void amdgpu_cs_submit_ib(void *job, int thread_index);
263
264 #endif