ac/surface/gfx10: allow "rotated" micro mode
[mesa.git] / src / amd / common / ac_surface.h
1 /*
2 * Copyright © 2017 Advanced Micro Devices, Inc.
3 *
4 * Permission is hereby granted, free of charge, to any person obtaining
5 * a copy of this software and associated documentation files (the
6 * "Software"), to deal in the Software without restriction, including
7 * without limitation the rights to use, copy, modify, merge, publish,
8 * distribute, sub license, and/or sell copies of the Software, and to
9 * permit persons to whom the Software is furnished to do so, subject to
10 * the following conditions:
11 *
12 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND,
13 * EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES
14 * OF MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND
15 * NON-INFRINGEMENT. IN NO EVENT SHALL THE COPYRIGHT HOLDERS, AUTHORS
16 * AND/OR ITS SUPPLIERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
17 * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE,
18 * ARISING FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE
19 * USE OR OTHER DEALINGS IN THE SOFTWARE.
20 *
21 * The above copyright notice and this permission notice (including the
22 * next paragraph) shall be included in all copies or substantial portions
23 * of the Software.
24 */
25
26 #ifndef AC_SURFACE_H
27 #define AC_SURFACE_H
28
29 #include <stdint.h>
30 #include <stdbool.h>
31
32 #include "amd_family.h"
33
34 #ifdef __cplusplus
35 extern "C" {
36 #endif
37
38 /* Forward declarations. */
39 typedef void* ADDR_HANDLE;
40
41 struct amdgpu_gpu_info;
42 struct radeon_info;
43
44 #define RADEON_SURF_MAX_LEVELS 15
45
46 enum radeon_surf_mode {
47 RADEON_SURF_MODE_LINEAR_ALIGNED = 1,
48 RADEON_SURF_MODE_1D = 2,
49 RADEON_SURF_MODE_2D = 3,
50 };
51
52 /* These are defined exactly like GB_TILE_MODEn.MICRO_TILE_MODE_NEW. */
53 enum radeon_micro_mode {
54 RADEON_MICRO_MODE_DISPLAY = 0,
55 RADEON_MICRO_MODE_THIN = 1,
56 RADEON_MICRO_MODE_DEPTH = 2,
57 RADEON_MICRO_MODE_ROTATED = 3, /* gfx10+: render target */
58 };
59
60 /* the first 16 bits are reserved for libdrm_radeon, don't use them */
61 #define RADEON_SURF_SCANOUT (1 << 16)
62 #define RADEON_SURF_ZBUFFER (1 << 17)
63 #define RADEON_SURF_SBUFFER (1 << 18)
64 #define RADEON_SURF_Z_OR_SBUFFER (RADEON_SURF_ZBUFFER | RADEON_SURF_SBUFFER)
65 /* bits 19 and 20 are reserved for libdrm_radeon, don't use them */
66 #define RADEON_SURF_FMASK (1 << 21)
67 #define RADEON_SURF_DISABLE_DCC (1 << 22)
68 #define RADEON_SURF_TC_COMPATIBLE_HTILE (1 << 23)
69 #define RADEON_SURF_IMPORTED (1 << 24)
70 #define RADEON_SURF_OPTIMIZE_FOR_SPACE (1 << 25)
71 #define RADEON_SURF_SHAREABLE (1 << 26)
72 #define RADEON_SURF_NO_RENDER_TARGET (1 << 27)
73
74 struct legacy_surf_level {
75 uint64_t offset;
76 uint32_t slice_size_dw; /* in dwords; max = 4GB / 4. */
77 uint32_t dcc_offset; /* relative offset within DCC mip tree */
78 uint32_t dcc_fast_clear_size;
79 uint32_t dcc_slice_fast_clear_size;
80 unsigned nblk_x:15;
81 unsigned nblk_y:15;
82 enum radeon_surf_mode mode:2;
83 };
84
85 struct legacy_surf_fmask {
86 unsigned slice_tile_max; /* max 4M */
87 uint8_t tiling_index; /* max 31 */
88 uint8_t bankh; /* max 8 */
89 uint16_t pitch_in_pixels;
90 uint64_t slice_size;
91 };
92
93 struct legacy_surf_layout {
94 unsigned bankw:4; /* max 8 */
95 unsigned bankh:4; /* max 8 */
96 unsigned mtilea:4; /* max 8 */
97 unsigned tile_split:13; /* max 4K */
98 unsigned stencil_tile_split:13; /* max 4K */
99 unsigned pipe_config:5; /* max 17 */
100 unsigned num_banks:5; /* max 16 */
101 unsigned macro_tile_index:4; /* max 15 */
102
103 /* Whether the depth miptree or stencil miptree as used by the DB are
104 * adjusted from their TC compatible form to ensure depth/stencil
105 * compatibility. If either is true, the corresponding plane cannot be
106 * sampled from.
107 */
108 unsigned depth_adjusted:1;
109 unsigned stencil_adjusted:1;
110
111 struct legacy_surf_level level[RADEON_SURF_MAX_LEVELS];
112 struct legacy_surf_level stencil_level[RADEON_SURF_MAX_LEVELS];
113 uint8_t tiling_index[RADEON_SURF_MAX_LEVELS];
114 uint8_t stencil_tiling_index[RADEON_SURF_MAX_LEVELS];
115 struct legacy_surf_fmask fmask;
116 unsigned cmask_slice_tile_max;
117 };
118
119 /* Same as addrlib - AddrResourceType. */
120 enum gfx9_resource_type {
121 RADEON_RESOURCE_1D = 0,
122 RADEON_RESOURCE_2D,
123 RADEON_RESOURCE_3D,
124 };
125
126 struct gfx9_surf_flags {
127 uint16_t swizzle_mode; /* tile mode */
128 uint16_t epitch; /* (pitch - 1) or (height - 1) */
129 };
130
131 struct gfx9_surf_meta_flags {
132 unsigned rb_aligned:1; /* optimal for RBs */
133 unsigned pipe_aligned:1; /* optimal for TC */
134 };
135
136 struct gfx9_surf_layout {
137 struct gfx9_surf_flags surf; /* color or depth surface */
138 struct gfx9_surf_flags fmask; /* not added to surf_size */
139 struct gfx9_surf_flags stencil; /* added to surf_size, use stencil_offset */
140
141 struct gfx9_surf_meta_flags dcc; /* metadata of color */
142 struct gfx9_surf_meta_flags htile; /* metadata of depth and stencil */
143 struct gfx9_surf_meta_flags cmask; /* metadata of fmask */
144
145 enum gfx9_resource_type resource_type; /* 1D, 2D or 3D */
146 uint16_t surf_pitch; /* in blocks */
147 uint16_t surf_height;
148
149 uint64_t surf_offset; /* 0 unless imported with an offset */
150 /* The size of the 2D plane containing all mipmap levels. */
151 uint64_t surf_slice_size;
152 /* Mipmap level offset within the slice in bytes. Only valid for LINEAR. */
153 uint32_t offset[RADEON_SURF_MAX_LEVELS];
154
155 uint64_t stencil_offset; /* separate stencil */
156
157 /* Displayable DCC. This is always rb_aligned=0 and pipe_aligned=0.
158 * The 3D engine doesn't support that layout except for chips with 1 RB.
159 * All other chips must set rb_aligned=1.
160 * A compute shader needs to convert from aligned DCC to unaligned.
161 */
162 uint32_t display_dcc_size;
163 uint32_t display_dcc_alignment;
164 uint16_t display_dcc_pitch_max; /* (mip chain pitch - 1) */
165 bool dcc_retile_use_uint16; /* if all values fit into uint16_t */
166 uint32_t dcc_retile_num_elements;
167 uint32_t *dcc_retile_map;
168 };
169
170 struct radeon_surf {
171 /* Format properties. */
172 unsigned blk_w:4;
173 unsigned blk_h:4;
174 unsigned bpe:5;
175 /* Number of mipmap levels where DCC is enabled starting from level 0.
176 * Non-zero levels may be disabled due to alignment constraints, but not
177 * the first level.
178 */
179 unsigned num_dcc_levels:4;
180 unsigned is_linear:1;
181 unsigned has_stencil:1;
182 /* This might be true even if micro_tile_mode isn't displayable or rotated. */
183 unsigned is_displayable:1;
184 /* Displayable, thin, depth, rotated. AKA D,S,Z,R swizzle modes. */
185 unsigned micro_tile_mode:3;
186 uint32_t flags;
187
188 /* These are return values. Some of them can be set by the caller, but
189 * they will be treated as hints (e.g. bankw, bankh) and might be
190 * changed by the calculator.
191 */
192
193 /* Tile swizzle can be OR'd with low bits of the BASE_256B address.
194 * The value is the same for all mipmap levels. Supported tile modes:
195 * - GFX6: Only macro tiling.
196 * - GFX9: Only *_X and *_T swizzle modes. Level 0 must not be in the mip
197 * tail.
198 *
199 * Only these surfaces are allowed to set it:
200 * - color (if it doesn't have to be displayable)
201 * - DCC (same tile swizzle as color)
202 * - FMASK
203 * - CMASK if it's TC-compatible or if the gen is GFX9
204 * - depth/stencil if HTILE is not TC-compatible and if the gen is not GFX9
205 */
206 uint8_t tile_swizzle;
207 uint8_t fmask_tile_swizzle;
208
209 uint64_t surf_size;
210 uint64_t fmask_size;
211 uint32_t surf_alignment;
212 uint32_t fmask_alignment;
213
214 /* DCC and HTILE are very small. */
215 uint32_t dcc_size;
216 uint32_t dcc_slice_size;
217 uint32_t dcc_alignment;
218
219 uint32_t htile_size;
220 uint32_t htile_slice_size;
221 uint32_t htile_alignment;
222
223 uint32_t cmask_size;
224 uint32_t cmask_slice_size;
225 uint32_t cmask_alignment;
226
227 union {
228 /* Return values for GFX8 and older.
229 *
230 * Some of them can be set by the caller if certain parameters are
231 * desirable. The allocator will try to obey them.
232 */
233 struct legacy_surf_layout legacy;
234
235 /* GFX9+ return values. */
236 struct gfx9_surf_layout gfx9;
237 } u;
238 };
239
240 struct ac_surf_info {
241 uint32_t width;
242 uint32_t height;
243 uint32_t depth;
244 uint8_t samples; /* For Z/S: samples; For color: FMASK coverage samples */
245 uint8_t storage_samples; /* For color: allocated samples */
246 uint8_t levels;
247 uint8_t num_channels; /* heuristic for displayability */
248 uint16_t array_size;
249 uint32_t *surf_index; /* Set a monotonic counter for tile swizzling. */
250 uint32_t *fmask_surf_index;
251 };
252
253 struct ac_surf_config {
254 struct ac_surf_info info;
255 unsigned is_3d : 1;
256 unsigned is_cube : 1;
257 };
258
259 ADDR_HANDLE amdgpu_addr_create(const struct radeon_info *info,
260 const struct amdgpu_gpu_info *amdinfo,
261 uint64_t *max_alignment);
262
263 int ac_compute_surface(ADDR_HANDLE addrlib, const struct radeon_info *info,
264 const struct ac_surf_config * config,
265 enum radeon_surf_mode mode,
266 struct radeon_surf *surf);
267
268 #ifdef __cplusplus
269 }
270 #endif
271
272 #endif /* AC_SURFACE_H */