radv/amdgpu: Let addrlib calculate the HTILE parameters.
[mesa.git] / src / amd / vulkan / radv_radeon_winsys.h
1 /*
2 * Copyright © 2016 Red Hat.
3 * Copyright © 2016 Bas Nieuwenhuizen
4 *
5 * Based on radeon_winsys.h which is:
6 * Copyright 2008 Corbin Simpson <MostAwesomeDude@gmail.com>
7 * Copyright 2010 Marek Olšák <maraeo@gmail.com>
8 *
9 * Permission is hereby granted, free of charge, to any person obtaining a
10 * copy of this software and associated documentation files (the "Software"),
11 * to deal in the Software without restriction, including without limitation
12 * the rights to use, copy, modify, merge, publish, distribute, sublicense,
13 * and/or sell copies of the Software, and to permit persons to whom the
14 * Software is furnished to do so, subject to the following conditions:
15 *
16 * The above copyright notice and this permission notice (including the next
17 * paragraph) shall be included in all copies or substantial portions of the
18 * Software.
19 *
20 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
21 * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
22 * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL
23 * THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
24 * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING
25 * FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS
26 * IN THE SOFTWARE.
27 */
28
29 #ifndef RADV_RADEON_WINSYS_H
30 #define RADV_RADEON_WINSYS_H
31
32 #include <stdint.h>
33 #include <stdbool.h>
34 #include <stdlib.h>
35 #include "main/macros.h"
36 #include "amd_family.h"
37
38 #define FREE(x) free(x)
39
40 enum radeon_bo_domain { /* bitfield */
41 RADEON_DOMAIN_GTT = 2,
42 RADEON_DOMAIN_VRAM = 4,
43 RADEON_DOMAIN_VRAM_GTT = RADEON_DOMAIN_VRAM | RADEON_DOMAIN_GTT
44 };
45
46 enum radeon_bo_flag { /* bitfield */
47 RADEON_FLAG_GTT_WC = (1 << 0),
48 RADEON_FLAG_CPU_ACCESS = (1 << 1),
49 RADEON_FLAG_NO_CPU_ACCESS = (1 << 2),
50 };
51
52 enum radeon_bo_usage { /* bitfield */
53 RADEON_USAGE_READ = 2,
54 RADEON_USAGE_WRITE = 4,
55 RADEON_USAGE_READWRITE = RADEON_USAGE_READ | RADEON_USAGE_WRITE
56 };
57
58 enum ring_type {
59 RING_GFX = 0,
60 RING_COMPUTE,
61 RING_DMA,
62 RING_UVD,
63 RING_VCE,
64 RING_LAST,
65 };
66
67 struct radeon_winsys_cs {
68 unsigned cdw; /* Number of used dwords. */
69 unsigned max_dw; /* Maximum number of dwords. */
70 uint32_t *buf; /* The base pointer of the chunk. */
71 };
72
73 struct radeon_info {
74 /* PCI info: domain:bus:dev:func */
75 uint32_t pci_domain;
76 uint32_t pci_bus;
77 uint32_t pci_dev;
78 uint32_t pci_func;
79
80 /* Device info. */
81 uint32_t pci_id;
82 enum radeon_family family;
83 const char *name;
84 enum chip_class chip_class;
85 uint32_t gart_page_size;
86 uint64_t gart_size;
87 uint64_t vram_size;
88 uint64_t visible_vram_size;
89 bool has_dedicated_vram;
90 bool has_virtual_memory;
91 bool gfx_ib_pad_with_type2;
92 bool has_uvd;
93 uint32_t sdma_rings;
94 uint32_t compute_rings;
95 uint32_t vce_fw_version;
96 uint32_t vce_harvest_config;
97 uint32_t clock_crystal_freq;
98
99 /* Kernel info. */
100 uint32_t drm_major; /* version */
101 uint32_t drm_minor;
102 uint32_t drm_patchlevel;
103 bool has_userptr;
104
105 /* Shader cores. */
106 uint32_t r600_max_quad_pipes; /* wave size / 16 */
107 uint32_t max_shader_clock;
108 uint32_t num_good_compute_units;
109 uint32_t max_se; /* shader engines */
110 uint32_t max_sh_per_se; /* shader arrays per shader engine */
111
112 /* Render backends (color + depth blocks). */
113 uint32_t r300_num_gb_pipes;
114 uint32_t r300_num_z_pipes;
115 uint32_t r600_gb_backend_map; /* R600 harvest config */
116 bool r600_gb_backend_map_valid;
117 uint32_t r600_num_banks;
118 uint32_t num_render_backends;
119 uint32_t num_tile_pipes; /* pipe count from PIPE_CONFIG */
120 uint32_t pipe_interleave_bytes;
121 uint32_t enabled_rb_mask; /* GCN harvest config */
122
123 /* Tile modes. */
124 uint32_t si_tile_mode_array[32];
125 uint32_t cik_macrotile_mode_array[16];
126 };
127
128 #define RADEON_SURF_MAX_LEVEL 32
129
130 #define RADEON_SURF_TYPE_MASK 0xFF
131 #define RADEON_SURF_TYPE_SHIFT 0
132 #define RADEON_SURF_TYPE_1D 0
133 #define RADEON_SURF_TYPE_2D 1
134 #define RADEON_SURF_TYPE_3D 2
135 #define RADEON_SURF_TYPE_CUBEMAP 3
136 #define RADEON_SURF_TYPE_1D_ARRAY 4
137 #define RADEON_SURF_TYPE_2D_ARRAY 5
138 #define RADEON_SURF_MODE_MASK 0xFF
139 #define RADEON_SURF_MODE_SHIFT 8
140 #define RADEON_SURF_MODE_LINEAR_ALIGNED 1
141 #define RADEON_SURF_MODE_1D 2
142 #define RADEON_SURF_MODE_2D 3
143 #define RADEON_SURF_SCANOUT (1 << 16)
144 #define RADEON_SURF_ZBUFFER (1 << 17)
145 #define RADEON_SURF_SBUFFER (1 << 18)
146 #define RADEON_SURF_Z_OR_SBUFFER (RADEON_SURF_ZBUFFER | RADEON_SURF_SBUFFER)
147 #define RADEON_SURF_HAS_SBUFFER_MIPTREE (1 << 19)
148 #define RADEON_SURF_HAS_TILE_MODE_INDEX (1 << 20)
149 #define RADEON_SURF_FMASK (1 << 21)
150 #define RADEON_SURF_DISABLE_DCC (1 << 22)
151 #define RADEON_SURF_TC_COMPATIBLE_HTILE (1 << 23)
152
153 #define RADEON_SURF_GET(v, field) (((v) >> RADEON_SURF_ ## field ## _SHIFT) & RADEON_SURF_ ## field ## _MASK)
154 #define RADEON_SURF_SET(v, field) (((v) & RADEON_SURF_ ## field ## _MASK) << RADEON_SURF_ ## field ## _SHIFT)
155 #define RADEON_SURF_CLR(v, field) ((v) & ~(RADEON_SURF_ ## field ## _MASK << RADEON_SURF_ ## field ## _SHIFT))
156
157 struct radeon_surf_level {
158 uint64_t offset;
159 uint64_t slice_size;
160 uint32_t npix_x;
161 uint32_t npix_y;
162 uint32_t npix_z;
163 uint32_t nblk_x;
164 uint32_t nblk_y;
165 uint32_t nblk_z;
166 uint32_t pitch_bytes;
167 uint32_t mode;
168 uint64_t dcc_offset;
169 uint64_t dcc_fast_clear_size;
170 bool dcc_enabled;
171 };
172
173
174 /* surface defintions from the winsys */
175 struct radeon_surf {
176 /* These are inputs to the calculator. */
177 uint32_t npix_x;
178 uint32_t npix_y;
179 uint32_t npix_z;
180 uint32_t blk_w;
181 uint32_t blk_h;
182 uint32_t blk_d;
183 uint32_t array_size;
184 uint32_t last_level;
185 uint32_t bpe;
186 uint32_t nsamples;
187 uint32_t flags;
188
189 /* These are return values. Some of them can be set by the caller, but
190 * they will be treated as hints (e.g. bankw, bankh) and might be
191 * changed by the calculator.
192 */
193 uint64_t bo_size;
194 uint64_t bo_alignment;
195 /* This applies to EG and later. */
196 uint32_t bankw;
197 uint32_t bankh;
198 uint32_t mtilea;
199 uint32_t tile_split;
200 uint32_t stencil_tile_split;
201 uint64_t stencil_offset;
202 struct radeon_surf_level level[RADEON_SURF_MAX_LEVEL];
203 struct radeon_surf_level stencil_level[RADEON_SURF_MAX_LEVEL];
204 uint32_t tiling_index[RADEON_SURF_MAX_LEVEL];
205 uint32_t stencil_tiling_index[RADEON_SURF_MAX_LEVEL];
206 uint32_t pipe_config;
207 uint32_t num_banks;
208 uint32_t macro_tile_index;
209 uint32_t micro_tile_mode; /* displayable, thin, depth, rotated */
210
211 /* Whether the depth miptree or stencil miptree as used by the DB are
212 * adjusted from their TC compatible form to ensure depth/stencil
213 * compatibility. If either is true, the corresponding plane cannot be
214 * sampled from.
215 */
216 bool depth_adjusted;
217 bool stencil_adjusted;
218
219 uint64_t dcc_size;
220 uint64_t dcc_alignment;
221
222 uint64_t htile_size;
223 uint64_t htile_slice_size;
224 uint64_t htile_alignment;
225 };
226
227 enum radeon_bo_layout {
228 RADEON_LAYOUT_LINEAR = 0,
229 RADEON_LAYOUT_TILED,
230 RADEON_LAYOUT_SQUARETILED,
231
232 RADEON_LAYOUT_UNKNOWN
233 };
234
235 /* Tiling info for display code, DRI sharing, and other data. */
236 struct radeon_bo_metadata {
237 /* Tiling flags describing the texture layout for display code
238 * and DRI sharing.
239 */
240 enum radeon_bo_layout microtile;
241 enum radeon_bo_layout macrotile;
242 unsigned pipe_config;
243 unsigned bankw;
244 unsigned bankh;
245 unsigned tile_split;
246 unsigned mtilea;
247 unsigned num_banks;
248 unsigned stride;
249 bool scanout;
250
251 /* Additional metadata associated with the buffer, in bytes.
252 * The maximum size is 64 * 4. This is opaque for the winsys & kernel.
253 * Supported by amdgpu only.
254 */
255 uint32_t size_metadata;
256 uint32_t metadata[64];
257 };
258
259 struct radeon_winsys_bo;
260 struct radeon_winsys_fence;
261 struct radeon_winsys_sem;
262
263 struct radeon_winsys {
264 void (*destroy)(struct radeon_winsys *ws);
265
266 void (*query_info)(struct radeon_winsys *ws,
267 struct radeon_info *info);
268
269 struct radeon_winsys_bo *(*buffer_create)(struct radeon_winsys *ws,
270 uint64_t size,
271 unsigned alignment,
272 enum radeon_bo_domain domain,
273 enum radeon_bo_flag flags);
274
275 void (*buffer_destroy)(struct radeon_winsys_bo *bo);
276 void *(*buffer_map)(struct radeon_winsys_bo *bo);
277
278 struct radeon_winsys_bo *(*buffer_from_fd)(struct radeon_winsys *ws,
279 int fd,
280 unsigned *stride, unsigned *offset);
281
282 bool (*buffer_get_fd)(struct radeon_winsys *ws,
283 struct radeon_winsys_bo *bo,
284 int *fd);
285
286 void (*buffer_unmap)(struct radeon_winsys_bo *bo);
287
288 uint64_t (*buffer_get_va)(struct radeon_winsys_bo *bo);
289
290 void (*buffer_set_metadata)(struct radeon_winsys_bo *bo,
291 struct radeon_bo_metadata *md);
292 struct radeon_winsys_ctx *(*ctx_create)(struct radeon_winsys *ws);
293 void (*ctx_destroy)(struct radeon_winsys_ctx *ctx);
294
295 bool (*ctx_wait_idle)(struct radeon_winsys_ctx *ctx,
296 enum ring_type ring_type, int ring_index);
297
298 struct radeon_winsys_cs *(*cs_create)(struct radeon_winsys *ws,
299 enum ring_type ring_type);
300
301 void (*cs_destroy)(struct radeon_winsys_cs *cs);
302
303 void (*cs_reset)(struct radeon_winsys_cs *cs);
304
305 bool (*cs_finalize)(struct radeon_winsys_cs *cs);
306
307 void (*cs_grow)(struct radeon_winsys_cs * cs, size_t min_size);
308
309 int (*cs_submit)(struct radeon_winsys_ctx *ctx,
310 int queue_index,
311 struct radeon_winsys_cs **cs_array,
312 unsigned cs_count,
313 struct radeon_winsys_cs *initial_preamble_cs,
314 struct radeon_winsys_cs *continue_preamble_cs,
315 struct radeon_winsys_sem **wait_sem,
316 unsigned wait_sem_count,
317 struct radeon_winsys_sem **signal_sem,
318 unsigned signal_sem_count,
319 bool can_patch,
320 struct radeon_winsys_fence *fence);
321
322 void (*cs_add_buffer)(struct radeon_winsys_cs *cs,
323 struct radeon_winsys_bo *bo,
324 uint8_t priority);
325
326 void (*cs_execute_secondary)(struct radeon_winsys_cs *parent,
327 struct radeon_winsys_cs *child);
328
329 void (*cs_dump)(struct radeon_winsys_cs *cs, FILE* file, uint32_t trace_id);
330
331 int (*surface_init)(struct radeon_winsys *ws,
332 struct radeon_surf *surf);
333
334 int (*surface_best)(struct radeon_winsys *ws,
335 struct radeon_surf *surf);
336
337 struct radeon_winsys_fence *(*create_fence)();
338 void (*destroy_fence)(struct radeon_winsys_fence *fence);
339 bool (*fence_wait)(struct radeon_winsys *ws,
340 struct radeon_winsys_fence *fence,
341 bool absolute,
342 uint64_t timeout);
343
344 struct radeon_winsys_sem *(*create_sem)(struct radeon_winsys *ws);
345 void (*destroy_sem)(struct radeon_winsys_sem *sem);
346
347 };
348
349 static inline void radeon_emit(struct radeon_winsys_cs *cs, uint32_t value)
350 {
351 cs->buf[cs->cdw++] = value;
352 }
353
354 static inline void radeon_emit_array(struct radeon_winsys_cs *cs,
355 const uint32_t *values, unsigned count)
356 {
357 memcpy(cs->buf + cs->cdw, values, count * 4);
358 cs->cdw += count;
359 }
360
361 #endif /* RADV_RADEON_WINSYS_H */