a3c24115a13ffd17fa4213dae1c297ee1f5a41bd
[mesa.git] / src / amd / vulkan / winsys / amdgpu / radv_amdgpu_surface.c
1 /*
2 * Copyright © 2016 Red Hat.
3 * Copyright © 2016 Bas Nieuwenhuizen
4 *
5 * based on amdgpu winsys.
6 * Copyright © 2011 Marek Olšák <maraeo@gmail.com>
7 * Copyright © 2015 Advanced Micro Devices, Inc.
8 *
9 * Permission is hereby granted, free of charge, to any person obtaining a
10 * copy of this software and associated documentation files (the "Software"),
11 * to deal in the Software without restriction, including without limitation
12 * the rights to use, copy, modify, merge, publish, distribute, sublicense,
13 * and/or sell copies of the Software, and to permit persons to whom the
14 * Software is furnished to do so, subject to the following conditions:
15 *
16 * The above copyright notice and this permission notice (including the next
17 * paragraph) shall be included in all copies or substantial portions of the
18 * Software.
19 *
20 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
21 * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
22 * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL
23 * THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
24 * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING
25 * FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS
26 * IN THE SOFTWARE.
27 */
28
29 #include <errno.h>
30 #include "radv_private.h"
31 #include "addrlib/addrinterface.h"
32 #include "util/bitset.h"
33 #include "radv_amdgpu_winsys.h"
34 #include "radv_amdgpu_surface.h"
35 #include "sid.h"
36 #ifndef NO_ENTRIES
37 #define NO_ENTRIES 32
38 #endif
39
40 #ifndef NO_MACRO_ENTRIES
41 #define NO_MACRO_ENTRIES 16
42 #endif
43
44 #ifndef CIASICIDGFXENGINE_SOUTHERNISLAND
45 #define CIASICIDGFXENGINE_SOUTHERNISLAND 0x0000000A
46 #endif
47
48 static int radv_amdgpu_surface_sanity(const struct radeon_surf *surf)
49 {
50 unsigned type = RADEON_SURF_GET(surf->flags, TYPE);
51
52 if (!(surf->flags & RADEON_SURF_HAS_TILE_MODE_INDEX))
53 return -EINVAL;
54
55 /* all dimension must be at least 1 ! */
56 if (!surf->npix_x || !surf->npix_y || !surf->npix_z ||
57 !surf->array_size)
58 return -EINVAL;
59
60 if (!surf->blk_w || !surf->blk_h || !surf->blk_d)
61 return -EINVAL;
62
63 switch (surf->nsamples) {
64 case 1:
65 case 2:
66 case 4:
67 case 8:
68 break;
69 default:
70 return -EINVAL;
71 }
72
73 switch (type) {
74 case RADEON_SURF_TYPE_1D:
75 if (surf->npix_y > 1)
76 return -EINVAL;
77 /* fall through */
78 case RADEON_SURF_TYPE_2D:
79 case RADEON_SURF_TYPE_CUBEMAP:
80 if (surf->npix_z > 1 || surf->array_size > 1)
81 return -EINVAL;
82 break;
83 case RADEON_SURF_TYPE_3D:
84 if (surf->array_size > 1)
85 return -EINVAL;
86 break;
87 case RADEON_SURF_TYPE_1D_ARRAY:
88 if (surf->npix_y > 1)
89 return -EINVAL;
90 /* fall through */
91 case RADEON_SURF_TYPE_2D_ARRAY:
92 if (surf->npix_z > 1)
93 return -EINVAL;
94 break;
95 default:
96 return -EINVAL;
97 }
98 return 0;
99 }
100
101 static void *ADDR_API radv_allocSysMem(const ADDR_ALLOCSYSMEM_INPUT * pInput)
102 {
103 return malloc(pInput->sizeInBytes);
104 }
105
106 static ADDR_E_RETURNCODE ADDR_API radv_freeSysMem(const ADDR_FREESYSMEM_INPUT * pInput)
107 {
108 free(pInput->pVirtAddr);
109 return ADDR_OK;
110 }
111
112 ADDR_HANDLE radv_amdgpu_addr_create(struct amdgpu_gpu_info *amdinfo, int family, int rev_id,
113 enum chip_class chip_class)
114 {
115 ADDR_CREATE_INPUT addrCreateInput = {0};
116 ADDR_CREATE_OUTPUT addrCreateOutput = {0};
117 ADDR_REGISTER_VALUE regValue = {0};
118 ADDR_CREATE_FLAGS createFlags = {{0}};
119 ADDR_E_RETURNCODE addrRet;
120
121 addrCreateInput.size = sizeof(ADDR_CREATE_INPUT);
122 addrCreateOutput.size = sizeof(ADDR_CREATE_OUTPUT);
123
124 regValue.noOfBanks = amdinfo->mc_arb_ramcfg & 0x3;
125 regValue.gbAddrConfig = amdinfo->gb_addr_cfg;
126 regValue.noOfRanks = (amdinfo->mc_arb_ramcfg & 0x4) >> 2;
127
128 regValue.backendDisables = amdinfo->backend_disable[0];
129 regValue.pTileConfig = amdinfo->gb_tile_mode;
130 regValue.noOfEntries = ARRAY_SIZE(amdinfo->gb_tile_mode);
131 if (chip_class == SI) {
132 regValue.pMacroTileConfig = NULL;
133 regValue.noOfMacroEntries = 0;
134 } else {
135 regValue.pMacroTileConfig = amdinfo->gb_macro_tile_mode;
136 regValue.noOfMacroEntries = ARRAY_SIZE(amdinfo->gb_macro_tile_mode);
137 }
138
139 createFlags.value = 0;
140 createFlags.useTileIndex = 1;
141 createFlags.degradeBaseLevel = 1;
142
143 addrCreateInput.chipEngine = CIASICIDGFXENGINE_SOUTHERNISLAND;
144 addrCreateInput.chipFamily = family;
145 addrCreateInput.chipRevision = rev_id;
146 addrCreateInput.createFlags = createFlags;
147 addrCreateInput.callbacks.allocSysMem = radv_allocSysMem;
148 addrCreateInput.callbacks.freeSysMem = radv_freeSysMem;
149 addrCreateInput.callbacks.debugPrint = 0;
150 addrCreateInput.regValue = regValue;
151
152 addrRet = AddrCreate(&addrCreateInput, &addrCreateOutput);
153 if (addrRet != ADDR_OK)
154 return NULL;
155
156 return addrCreateOutput.hLib;
157 }
158
159 static int radv_compute_level(ADDR_HANDLE addrlib,
160 struct radeon_surf *surf, bool is_stencil,
161 unsigned level, unsigned type, bool compressed,
162 ADDR_COMPUTE_SURFACE_INFO_INPUT *AddrSurfInfoIn,
163 ADDR_COMPUTE_SURFACE_INFO_OUTPUT *AddrSurfInfoOut,
164 ADDR_COMPUTE_DCCINFO_INPUT *AddrDccIn,
165 ADDR_COMPUTE_DCCINFO_OUTPUT *AddrDccOut)
166 {
167 struct radeon_surf_level *surf_level;
168 ADDR_E_RETURNCODE ret;
169
170 AddrSurfInfoIn->mipLevel = level;
171 AddrSurfInfoIn->width = u_minify(surf->npix_x, level);
172 AddrSurfInfoIn->height = u_minify(surf->npix_y, level);
173
174 if (type == RADEON_SURF_TYPE_3D)
175 AddrSurfInfoIn->numSlices = u_minify(surf->npix_z, level);
176 else if (type == RADEON_SURF_TYPE_CUBEMAP)
177 AddrSurfInfoIn->numSlices = 6;
178 else
179 AddrSurfInfoIn->numSlices = surf->array_size;
180
181 if (level > 0) {
182 /* Set the base level pitch. This is needed for calculation
183 * of non-zero levels. */
184 if (is_stencil)
185 AddrSurfInfoIn->basePitch = surf->stencil_level[0].nblk_x;
186 else
187 AddrSurfInfoIn->basePitch = surf->level[0].nblk_x;
188
189 /* Convert blocks to pixels for compressed formats. */
190 if (compressed)
191 AddrSurfInfoIn->basePitch *= surf->blk_w;
192 }
193
194 ret = AddrComputeSurfaceInfo(addrlib,
195 AddrSurfInfoIn,
196 AddrSurfInfoOut);
197 if (ret != ADDR_OK) {
198 return ret;
199 }
200
201 surf_level = is_stencil ? &surf->stencil_level[level] : &surf->level[level];
202 surf_level->offset = align64(surf->bo_size, AddrSurfInfoOut->baseAlign);
203 surf_level->slice_size = AddrSurfInfoOut->sliceSize;
204 surf_level->pitch_bytes = AddrSurfInfoOut->pitch * (is_stencil ? 1 : surf->bpe);
205 surf_level->npix_x = u_minify(surf->npix_x, level);
206 surf_level->npix_y = u_minify(surf->npix_y, level);
207 surf_level->npix_z = u_minify(surf->npix_z, level);
208 surf_level->nblk_x = AddrSurfInfoOut->pitch;
209 surf_level->nblk_y = AddrSurfInfoOut->height;
210 if (type == RADEON_SURF_TYPE_3D)
211 surf_level->nblk_z = AddrSurfInfoOut->depth;
212 else
213 surf_level->nblk_z = 1;
214
215 switch (AddrSurfInfoOut->tileMode) {
216 case ADDR_TM_LINEAR_ALIGNED:
217 surf_level->mode = RADEON_SURF_MODE_LINEAR_ALIGNED;
218 break;
219 case ADDR_TM_1D_TILED_THIN1:
220 surf_level->mode = RADEON_SURF_MODE_1D;
221 break;
222 case ADDR_TM_2D_TILED_THIN1:
223 surf_level->mode = RADEON_SURF_MODE_2D;
224 break;
225 default:
226 assert(0);
227 }
228
229 if (is_stencil)
230 surf->stencil_tiling_index[level] = AddrSurfInfoOut->tileIndex;
231 else
232 surf->tiling_index[level] = AddrSurfInfoOut->tileIndex;
233
234 surf->bo_size = surf_level->offset + AddrSurfInfoOut->surfSize;
235
236 /* Clear DCC fields at the beginning. */
237 surf_level->dcc_offset = 0;
238 surf_level->dcc_enabled = false;
239
240 /* The previous level's flag tells us if we can use DCC for this level. */
241 if (AddrSurfInfoIn->flags.dccCompatible &&
242 (level == 0 || AddrDccOut->subLvlCompressible)) {
243 AddrDccIn->colorSurfSize = AddrSurfInfoOut->surfSize;
244 AddrDccIn->tileMode = AddrSurfInfoOut->tileMode;
245 AddrDccIn->tileInfo = *AddrSurfInfoOut->pTileInfo;
246 AddrDccIn->tileIndex = AddrSurfInfoOut->tileIndex;
247 AddrDccIn->macroModeIndex = AddrSurfInfoOut->macroModeIndex;
248
249 ret = AddrComputeDccInfo(addrlib,
250 AddrDccIn,
251 AddrDccOut);
252
253 if (ret == ADDR_OK) {
254 surf_level->dcc_offset = surf->dcc_size;
255 surf_level->dcc_fast_clear_size = AddrDccOut->dccFastClearSize;
256 surf_level->dcc_enabled = true;
257 surf->dcc_size = surf_level->dcc_offset + AddrDccOut->dccRamSize;
258 surf->dcc_alignment = MAX(surf->dcc_alignment, AddrDccOut->dccRamBaseAlign);
259 }
260 }
261
262 return 0;
263 }
264
265 static void radv_set_micro_tile_mode(struct radeon_surf *surf,
266 struct radeon_info *info)
267 {
268 uint32_t tile_mode = info->si_tile_mode_array[surf->tiling_index[0]];
269
270 if (info->chip_class >= CIK)
271 surf->micro_tile_mode = G_009910_MICRO_TILE_MODE_NEW(tile_mode);
272 else
273 surf->micro_tile_mode = G_009910_MICRO_TILE_MODE(tile_mode);
274 }
275
276
277 static int radv_amdgpu_winsys_surface_init(struct radeon_winsys *_ws,
278 struct radeon_surf *surf)
279 {
280 struct radv_amdgpu_winsys *ws = radv_amdgpu_winsys(_ws);
281 unsigned level, mode, type;
282 bool compressed;
283 ADDR_COMPUTE_SURFACE_INFO_INPUT AddrSurfInfoIn = {0};
284 ADDR_COMPUTE_SURFACE_INFO_OUTPUT AddrSurfInfoOut = {0};
285 ADDR_COMPUTE_DCCINFO_INPUT AddrDccIn = {0};
286 ADDR_COMPUTE_DCCINFO_OUTPUT AddrDccOut = {0};
287 ADDR_TILEINFO AddrTileInfoIn = {0};
288 ADDR_TILEINFO AddrTileInfoOut = {0};
289 int r;
290
291 r = radv_amdgpu_surface_sanity(surf);
292 if (r)
293 return r;
294
295 AddrSurfInfoIn.size = sizeof(ADDR_COMPUTE_SURFACE_INFO_INPUT);
296 AddrSurfInfoOut.size = sizeof(ADDR_COMPUTE_SURFACE_INFO_OUTPUT);
297 AddrDccIn.size = sizeof(ADDR_COMPUTE_DCCINFO_INPUT);
298 AddrDccOut.size = sizeof(ADDR_COMPUTE_DCCINFO_OUTPUT);
299 AddrSurfInfoOut.pTileInfo = &AddrTileInfoOut;
300
301 type = RADEON_SURF_GET(surf->flags, TYPE);
302 mode = RADEON_SURF_GET(surf->flags, MODE);
303 compressed = surf->blk_w == 4 && surf->blk_h == 4;
304
305 /* MSAA and FMASK require 2D tiling. */
306 if (surf->nsamples > 1 ||
307 (surf->flags & RADEON_SURF_FMASK))
308 mode = RADEON_SURF_MODE_2D;
309
310 /* DB doesn't support linear layouts. */
311 if (surf->flags & (RADEON_SURF_Z_OR_SBUFFER) &&
312 mode < RADEON_SURF_MODE_1D)
313 mode = RADEON_SURF_MODE_1D;
314
315 /* Set the requested tiling mode. */
316 switch (mode) {
317 case RADEON_SURF_MODE_LINEAR_ALIGNED:
318 AddrSurfInfoIn.tileMode = ADDR_TM_LINEAR_ALIGNED;
319 break;
320 case RADEON_SURF_MODE_1D:
321 AddrSurfInfoIn.tileMode = ADDR_TM_1D_TILED_THIN1;
322 break;
323 case RADEON_SURF_MODE_2D:
324 AddrSurfInfoIn.tileMode = ADDR_TM_2D_TILED_THIN1;
325 break;
326 default:
327 assert(0);
328 }
329
330 /* The format must be set correctly for the allocation of compressed
331 * textures to work. In other cases, setting the bpp is sufficient. */
332 if (compressed) {
333 switch (surf->bpe) {
334 case 8:
335 AddrSurfInfoIn.format = ADDR_FMT_BC1;
336 break;
337 case 16:
338 AddrSurfInfoIn.format = ADDR_FMT_BC3;
339 break;
340 default:
341 assert(0);
342 }
343 }
344 else {
345 AddrDccIn.bpp = AddrSurfInfoIn.bpp = surf->bpe * 8;
346 }
347
348 AddrDccIn.numSamples = AddrSurfInfoIn.numSamples = surf->nsamples;
349 AddrSurfInfoIn.tileIndex = -1;
350
351 /* Set the micro tile type. */
352 if (surf->flags & RADEON_SURF_SCANOUT)
353 AddrSurfInfoIn.tileType = ADDR_DISPLAYABLE;
354 else if (surf->flags & RADEON_SURF_Z_OR_SBUFFER)
355 AddrSurfInfoIn.tileType = ADDR_DEPTH_SAMPLE_ORDER;
356 else
357 AddrSurfInfoIn.tileType = ADDR_NON_DISPLAYABLE;
358
359 AddrSurfInfoIn.flags.color = !(surf->flags & RADEON_SURF_Z_OR_SBUFFER);
360 AddrSurfInfoIn.flags.depth = (surf->flags & RADEON_SURF_ZBUFFER) != 0;
361 AddrSurfInfoIn.flags.cube = type == RADEON_SURF_TYPE_CUBEMAP;
362 AddrSurfInfoIn.flags.display = (surf->flags & RADEON_SURF_SCANOUT) != 0;
363 AddrSurfInfoIn.flags.pow2Pad = surf->last_level > 0;
364 AddrSurfInfoIn.flags.degrade4Space = 1;
365
366 /* DCC notes:
367 * - If we add MSAA support, keep in mind that CB can't decompress 8bpp
368 * with samples >= 4.
369 * - Mipmapped array textures have low performance (discovered by a closed
370 * driver team).
371 */
372 AddrSurfInfoIn.flags.dccCompatible = !(surf->flags & RADEON_SURF_Z_OR_SBUFFER) &&
373 !(surf->flags & RADEON_SURF_DISABLE_DCC) &&
374 !compressed && AddrDccIn.numSamples <= 1 &&
375 ((surf->array_size == 1 && surf->npix_z == 1) ||
376 surf->last_level == 0);
377
378 AddrSurfInfoIn.flags.noStencil = (surf->flags & RADEON_SURF_SBUFFER) == 0;
379 AddrSurfInfoIn.flags.compressZ = AddrSurfInfoIn.flags.depth;
380
381 /* noStencil = 0 can result in a depth part that is incompatible with
382 * mipmapped texturing. So set noStencil = 1 when mipmaps are requested (in
383 * this case, we may end up setting stencil_adjusted).
384 *
385 * TODO: update addrlib to a newer version, remove this, and
386 * use flags.matchStencilTileCfg = 1 as an alternative fix.
387 */
388 if (surf->last_level > 0)
389 AddrSurfInfoIn.flags.noStencil = 1;
390
391 /* Set preferred macrotile parameters. This is usually required
392 * for shared resources. This is for 2D tiling only. */
393 if (AddrSurfInfoIn.tileMode >= ADDR_TM_2D_TILED_THIN1 &&
394 surf->bankw && surf->bankh && surf->mtilea && surf->tile_split) {
395 /* If any of these parameters are incorrect, the calculation
396 * will fail. */
397 AddrTileInfoIn.banks = surf->num_banks;
398 AddrTileInfoIn.bankWidth = surf->bankw;
399 AddrTileInfoIn.bankHeight = surf->bankh;
400 AddrTileInfoIn.macroAspectRatio = surf->mtilea;
401 AddrTileInfoIn.tileSplitBytes = surf->tile_split;
402 AddrTileInfoIn.pipeConfig = surf->pipe_config + 1; /* +1 compared to GB_TILE_MODE */
403 AddrSurfInfoIn.flags.degrade4Space = 0;
404 AddrSurfInfoIn.pTileInfo = &AddrTileInfoIn;
405
406 /* If AddrSurfInfoIn.pTileInfo is set, Addrlib doesn't set
407 * the tile index, because we are expected to know it if
408 * we know the other parameters.
409 *
410 * This is something that can easily be fixed in Addrlib.
411 * For now, just figure it out here.
412 * Note that only 2D_TILE_THIN1 is handled here.
413 */
414 assert(!(surf->flags & RADEON_SURF_Z_OR_SBUFFER));
415 assert(AddrSurfInfoIn.tileMode == ADDR_TM_2D_TILED_THIN1);
416
417 if (ws->info.chip_class == SI) {
418 if (AddrSurfInfoIn.tileType == ADDR_DISPLAYABLE) {
419 if (surf->bpe == 2)
420 AddrSurfInfoIn.tileIndex = 11; /* 16bpp */
421 else
422 AddrSurfInfoIn.tileIndex = 12; /* 32bpp */
423 } else {
424 if (surf->bpe == 1)
425 AddrSurfInfoIn.tileIndex = 14; /* 8bpp */
426 else if (surf->bpe == 2)
427 AddrSurfInfoIn.tileIndex = 15; /* 16bpp */
428 else if (surf->bpe == 4)
429 AddrSurfInfoIn.tileIndex = 16; /* 32bpp */
430 else
431 AddrSurfInfoIn.tileIndex = 17; /* 64bpp (and 128bpp) */
432 }
433 } else {
434 if (AddrSurfInfoIn.tileType == ADDR_DISPLAYABLE)
435 AddrSurfInfoIn.tileIndex = 10; /* 2D displayable */
436 else
437 AddrSurfInfoIn.tileIndex = 14; /* 2D non-displayable */
438 }
439 }
440
441 surf->bo_size = 0;
442 surf->dcc_size = 0;
443 surf->dcc_alignment = 1;
444
445 /* Calculate texture layout information. */
446 for (level = 0; level <= surf->last_level; level++) {
447 r = radv_compute_level(ws->addrlib, surf, false, level, type, compressed,
448 &AddrSurfInfoIn, &AddrSurfInfoOut, &AddrDccIn, &AddrDccOut);
449 if (r)
450 return r;
451
452 if (level == 0) {
453 surf->bo_alignment = AddrSurfInfoOut.baseAlign;
454 surf->pipe_config = AddrSurfInfoOut.pTileInfo->pipeConfig - 1;
455 radv_set_micro_tile_mode(surf, &ws->info);
456
457 /* For 2D modes only. */
458 if (AddrSurfInfoOut.tileMode >= ADDR_TM_2D_TILED_THIN1) {
459 surf->bankw = AddrSurfInfoOut.pTileInfo->bankWidth;
460 surf->bankh = AddrSurfInfoOut.pTileInfo->bankHeight;
461 surf->mtilea = AddrSurfInfoOut.pTileInfo->macroAspectRatio;
462 surf->tile_split = AddrSurfInfoOut.pTileInfo->tileSplitBytes;
463 surf->num_banks = AddrSurfInfoOut.pTileInfo->banks;
464 surf->macro_tile_index = AddrSurfInfoOut.macroModeIndex;
465 } else {
466 surf->macro_tile_index = 0;
467 }
468 }
469 }
470
471 /* Calculate texture layout information for stencil. */
472 if (surf->flags & RADEON_SURF_SBUFFER) {
473 AddrSurfInfoIn.bpp = 8;
474 AddrSurfInfoIn.flags.depth = 0;
475 AddrSurfInfoIn.flags.stencil = 1;
476 /* This will be ignored if AddrSurfInfoIn.pTileInfo is NULL. */
477 AddrTileInfoIn.tileSplitBytes = surf->stencil_tile_split;
478
479 for (level = 0; level <= surf->last_level; level++) {
480 r = radv_compute_level(ws->addrlib, surf, true, level, type, compressed,
481 &AddrSurfInfoIn, &AddrSurfInfoOut, &AddrDccIn, &AddrDccOut);
482 if (r)
483 return r;
484
485 /* DB uses the depth pitch for both stencil and depth. */
486 if (surf->stencil_level[level].nblk_x != surf->level[level].nblk_x)
487 surf->stencil_adjusted = true;
488
489 if (level == 0) {
490 /* For 2D modes only. */
491 if (AddrSurfInfoOut.tileMode >= ADDR_TM_2D_TILED_THIN1) {
492 surf->stencil_tile_split =
493 AddrSurfInfoOut.pTileInfo->tileSplitBytes;
494 }
495 }
496 }
497 }
498
499 /* Recalculate the whole DCC miptree size including disabled levels.
500 * This is what addrlib does, but calling addrlib would be a lot more
501 * complicated.
502 */
503 #if 0
504 if (surf->dcc_size && surf->last_level > 0) {
505 surf->dcc_size = align64(surf->bo_size >> 8,
506 ws->info.pipe_interleave_bytes *
507 ws->info.num_tile_pipes);
508 }
509 #endif
510 return 0;
511 }
512
513 static int radv_amdgpu_winsys_surface_best(struct radeon_winsys *rws,
514 struct radeon_surf *surf)
515 {
516 return 0;
517 }
518
519 void radv_amdgpu_surface_init_functions(struct radv_amdgpu_winsys *ws)
520 {
521 ws->base.surface_init = radv_amdgpu_winsys_surface_init;
522 ws->base.surface_best = radv_amdgpu_winsys_surface_best;
523 }