2 * Copyright © 2011 Red Hat All Rights Reserved.
3 * Copyright © 2014 Advanced Micro Devices, Inc.
6 * Permission is hereby granted, free of charge, to any person obtaining
7 * a copy of this software and associated documentation files (the
8 * "Software"), to deal in the Software without restriction, including
9 * without limitation the rights to use, copy, modify, merge, publish,
10 * distribute, sub license, and/or sell copies of the Software, and to
11 * permit persons to whom the Software is furnished to do so, subject to
12 * the following conditions:
14 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND,
15 * EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES
16 * OF MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND
17 * NON-INFRINGEMENT. IN NO EVENT SHALL THE COPYRIGHT HOLDERS, AUTHORS
18 * AND/OR ITS SUPPLIERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
19 * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE,
20 * ARISING FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE
21 * USE OR OTHER DEALINGS IN THE SOFTWARE.
23 * The above copyright notice and this permission notice (including the
24 * next paragraph) shall be included in all copies or substantial portions
29 * Marek Olšák <maraeo@gmail.com>
32 #include "amdgpu_winsys.h"
38 #ifndef NO_MACRO_ENTRIES
39 #define NO_MACRO_ENTRIES 16
42 #ifndef CIASICIDGFXENGINE_SOUTHERNISLAND
43 #define CIASICIDGFXENGINE_SOUTHERNISLAND 0x0000000A
47 static int amdgpu_surface_sanity(const struct radeon_surf
*surf
)
49 unsigned type
= RADEON_SURF_GET(surf
->flags
, TYPE
);
51 if (!(surf
->flags
& RADEON_SURF_HAS_TILE_MODE_INDEX
))
54 /* all dimension must be at least 1 ! */
55 if (!surf
->npix_x
|| !surf
->npix_y
|| !surf
->npix_z
||
59 if (!surf
->blk_w
|| !surf
->blk_h
|| !surf
->blk_d
)
62 switch (surf
->nsamples
) {
73 case RADEON_SURF_TYPE_1D
:
77 case RADEON_SURF_TYPE_2D
:
78 case RADEON_SURF_TYPE_CUBEMAP
:
79 if (surf
->npix_z
> 1 || surf
->array_size
> 1)
82 case RADEON_SURF_TYPE_3D
:
83 if (surf
->array_size
> 1)
86 case RADEON_SURF_TYPE_1D_ARRAY
:
90 case RADEON_SURF_TYPE_2D_ARRAY
:
100 static void *ADDR_API
allocSysMem(const ADDR_ALLOCSYSMEM_INPUT
* pInput
)
102 return malloc(pInput
->sizeInBytes
);
105 static ADDR_E_RETURNCODE ADDR_API
freeSysMem(const ADDR_FREESYSMEM_INPUT
* pInput
)
107 free(pInput
->pVirtAddr
);
112 * This returns the number of banks for the surface.
113 * Possible values: 2, 4, 8, 16.
115 static uint32_t cik_num_banks(struct amdgpu_winsys
*ws
,
116 struct radeon_surf
*surf
)
118 unsigned index
, tileb
;
120 tileb
= 8 * 8 * surf
->bpe
;
121 tileb
= MIN2(surf
->tile_split
, tileb
);
123 for (index
= 0; tileb
> 64; index
++) {
128 return 2 << ((ws
->amdinfo
.gb_macro_tile_mode
[index
] >> 6) & 0x3);
131 ADDR_HANDLE
amdgpu_addr_create(struct amdgpu_winsys
*ws
)
133 ADDR_CREATE_INPUT addrCreateInput
= {0};
134 ADDR_CREATE_OUTPUT addrCreateOutput
= {0};
135 ADDR_REGISTER_VALUE regValue
= {0};
136 ADDR_CREATE_FLAGS createFlags
= {{0}};
137 ADDR_E_RETURNCODE addrRet
;
139 addrCreateInput
.size
= sizeof(ADDR_CREATE_INPUT
);
140 addrCreateOutput
.size
= sizeof(ADDR_CREATE_OUTPUT
);
142 regValue
.noOfBanks
= ws
->amdinfo
.mc_arb_ramcfg
& 0x3;
143 regValue
.gbAddrConfig
= ws
->amdinfo
.gb_addr_cfg
;
144 regValue
.noOfRanks
= (ws
->amdinfo
.mc_arb_ramcfg
& 0x4) >> 2;
146 regValue
.backendDisables
= ws
->amdinfo
.backend_disable
[0];
147 regValue
.pTileConfig
= ws
->amdinfo
.gb_tile_mode
;
148 regValue
.noOfEntries
= ARRAY_SIZE(ws
->amdinfo
.gb_tile_mode
);
149 regValue
.pMacroTileConfig
= ws
->amdinfo
.gb_macro_tile_mode
;
150 regValue
.noOfMacroEntries
= ARRAY_SIZE(ws
->amdinfo
.gb_macro_tile_mode
);
152 createFlags
.value
= 0;
153 createFlags
.useTileIndex
= 1;
154 createFlags
.degradeBaseLevel
= 1;
156 addrCreateInput
.chipEngine
= CIASICIDGFXENGINE_SOUTHERNISLAND
;
157 addrCreateInput
.chipFamily
= ws
->family
;
158 addrCreateInput
.chipRevision
= ws
->rev_id
;
159 addrCreateInput
.createFlags
= createFlags
;
160 addrCreateInput
.callbacks
.allocSysMem
= allocSysMem
;
161 addrCreateInput
.callbacks
.freeSysMem
= freeSysMem
;
162 addrCreateInput
.callbacks
.debugPrint
= 0;
163 addrCreateInput
.regValue
= regValue
;
165 addrRet
= AddrCreate(&addrCreateInput
, &addrCreateOutput
);
166 if (addrRet
!= ADDR_OK
)
169 return addrCreateOutput
.hLib
;
172 static int compute_level(struct amdgpu_winsys
*ws
,
173 struct radeon_surf
*surf
, bool is_stencil
,
174 unsigned level
, unsigned type
, bool compressed
,
175 ADDR_COMPUTE_SURFACE_INFO_INPUT
*AddrSurfInfoIn
,
176 ADDR_COMPUTE_SURFACE_INFO_OUTPUT
*AddrSurfInfoOut
,
177 ADDR_COMPUTE_DCCINFO_INPUT
*AddrDccIn
,
178 ADDR_COMPUTE_DCCINFO_OUTPUT
*AddrDccOut
)
180 struct radeon_surf_level
*surf_level
;
181 ADDR_E_RETURNCODE ret
;
183 AddrSurfInfoIn
->mipLevel
= level
;
184 AddrSurfInfoIn
->width
= u_minify(surf
->npix_x
, level
);
185 AddrSurfInfoIn
->height
= u_minify(surf
->npix_y
, level
);
187 if (type
== RADEON_SURF_TYPE_3D
)
188 AddrSurfInfoIn
->numSlices
= u_minify(surf
->npix_z
, level
);
189 else if (type
== RADEON_SURF_TYPE_CUBEMAP
)
190 AddrSurfInfoIn
->numSlices
= 6;
192 AddrSurfInfoIn
->numSlices
= surf
->array_size
;
195 /* Set the base level pitch. This is needed for calculation
196 * of non-zero levels. */
198 AddrSurfInfoIn
->basePitch
= surf
->stencil_level
[0].nblk_x
;
200 AddrSurfInfoIn
->basePitch
= surf
->level
[0].nblk_x
;
202 /* Convert blocks to pixels for compressed formats. */
204 AddrSurfInfoIn
->basePitch
*= surf
->blk_w
;
207 ret
= AddrComputeSurfaceInfo(ws
->addrlib
,
210 if (ret
!= ADDR_OK
) {
214 surf_level
= is_stencil
? &surf
->stencil_level
[level
] : &surf
->level
[level
];
215 surf_level
->offset
= align64(surf
->bo_size
, AddrSurfInfoOut
->baseAlign
);
216 surf_level
->slice_size
= AddrSurfInfoOut
->sliceSize
;
217 surf_level
->pitch_bytes
= AddrSurfInfoOut
->pitch
* (is_stencil
? 1 : surf
->bpe
);
218 surf_level
->npix_x
= u_minify(surf
->npix_x
, level
);
219 surf_level
->npix_y
= u_minify(surf
->npix_y
, level
);
220 surf_level
->npix_z
= u_minify(surf
->npix_z
, level
);
221 surf_level
->nblk_x
= AddrSurfInfoOut
->pitch
;
222 surf_level
->nblk_y
= AddrSurfInfoOut
->height
;
223 if (type
== RADEON_SURF_TYPE_3D
)
224 surf_level
->nblk_z
= AddrSurfInfoOut
->depth
;
226 surf_level
->nblk_z
= 1;
228 switch (AddrSurfInfoOut
->tileMode
) {
229 case ADDR_TM_LINEAR_GENERAL
:
230 surf_level
->mode
= RADEON_SURF_MODE_LINEAR
;
232 case ADDR_TM_LINEAR_ALIGNED
:
233 surf_level
->mode
= RADEON_SURF_MODE_LINEAR_ALIGNED
;
235 case ADDR_TM_1D_TILED_THIN1
:
236 surf_level
->mode
= RADEON_SURF_MODE_1D
;
238 case ADDR_TM_2D_TILED_THIN1
:
239 surf_level
->mode
= RADEON_SURF_MODE_2D
;
246 surf
->stencil_tiling_index
[level
] = AddrSurfInfoOut
->tileIndex
;
248 surf
->tiling_index
[level
] = AddrSurfInfoOut
->tileIndex
;
250 surf
->bo_size
= surf_level
->offset
+ AddrSurfInfoOut
->surfSize
;
252 if (AddrSurfInfoIn
->flags
.dccCompatible
) {
253 AddrDccIn
->colorSurfSize
= AddrSurfInfoOut
->surfSize
;
254 AddrDccIn
->tileMode
= AddrSurfInfoOut
->tileMode
;
255 AddrDccIn
->tileInfo
= *AddrSurfInfoOut
->pTileInfo
;
256 AddrDccIn
->tileIndex
= AddrSurfInfoOut
->tileIndex
;
257 AddrDccIn
->macroModeIndex
= AddrSurfInfoOut
->macroModeIndex
;
259 ret
= AddrComputeDccInfo(ws
->addrlib
,
263 if (ret
== ADDR_OK
) {
264 surf_level
->dcc_offset
= surf
->dcc_size
;
265 surf
->dcc_size
= surf_level
->dcc_offset
+ AddrDccOut
->dccRamSize
;
266 surf
->dcc_alignment
= MAX2(surf
->dcc_alignment
, AddrDccOut
->dccRamBaseAlign
);
269 surf_level
->dcc_offset
= 0;
273 surf_level
->dcc_offset
= 0;
279 static int amdgpu_surface_init(struct radeon_winsys
*rws
,
280 struct radeon_surf
*surf
)
282 struct amdgpu_winsys
*ws
= (struct amdgpu_winsys
*)rws
;
283 unsigned level
, mode
, type
;
285 ADDR_COMPUTE_SURFACE_INFO_INPUT AddrSurfInfoIn
= {0};
286 ADDR_COMPUTE_SURFACE_INFO_OUTPUT AddrSurfInfoOut
= {0};
287 ADDR_COMPUTE_DCCINFO_INPUT AddrDccIn
= {0};
288 ADDR_COMPUTE_DCCINFO_OUTPUT AddrDccOut
= {0};
289 ADDR_TILEINFO AddrTileInfoIn
= {0};
290 ADDR_TILEINFO AddrTileInfoOut
= {0};
293 r
= amdgpu_surface_sanity(surf
);
297 AddrSurfInfoIn
.size
= sizeof(ADDR_COMPUTE_SURFACE_INFO_INPUT
);
298 AddrSurfInfoOut
.size
= sizeof(ADDR_COMPUTE_SURFACE_INFO_OUTPUT
);
299 AddrDccIn
.size
= sizeof(ADDR_COMPUTE_DCCINFO_INPUT
);
300 AddrDccOut
.size
= sizeof(ADDR_COMPUTE_DCCINFO_OUTPUT
);
301 AddrSurfInfoOut
.pTileInfo
= &AddrTileInfoOut
;
303 type
= RADEON_SURF_GET(surf
->flags
, TYPE
);
304 mode
= RADEON_SURF_GET(surf
->flags
, MODE
);
305 compressed
= surf
->blk_w
== 4 && surf
->blk_h
== 4;
307 /* MSAA and FMASK require 2D tiling. */
308 if (surf
->nsamples
> 1 ||
309 (surf
->flags
& RADEON_SURF_FMASK
))
310 mode
= RADEON_SURF_MODE_2D
;
312 /* DB doesn't support linear layouts. */
313 if (surf
->flags
& (RADEON_SURF_Z_OR_SBUFFER
) &&
314 mode
< RADEON_SURF_MODE_1D
)
315 mode
= RADEON_SURF_MODE_1D
;
317 /* Set the requested tiling mode. */
319 case RADEON_SURF_MODE_LINEAR
:
320 AddrSurfInfoIn
.tileMode
= ADDR_TM_LINEAR_GENERAL
;
322 case RADEON_SURF_MODE_LINEAR_ALIGNED
:
323 AddrSurfInfoIn
.tileMode
= ADDR_TM_LINEAR_ALIGNED
;
325 case RADEON_SURF_MODE_1D
:
326 AddrSurfInfoIn
.tileMode
= ADDR_TM_1D_TILED_THIN1
;
328 case RADEON_SURF_MODE_2D
:
329 AddrSurfInfoIn
.tileMode
= ADDR_TM_2D_TILED_THIN1
;
335 /* The format must be set correctly for the allocation of compressed
336 * textures to work. In other cases, setting the bpp is sufficient. */
340 AddrSurfInfoIn
.format
= ADDR_FMT_BC1
;
343 AddrSurfInfoIn
.format
= ADDR_FMT_BC3
;
350 AddrDccIn
.bpp
= AddrSurfInfoIn
.bpp
= surf
->bpe
* 8;
353 AddrDccIn
.numSamples
= AddrSurfInfoIn
.numSamples
= surf
->nsamples
;
354 AddrSurfInfoIn
.tileIndex
= -1;
356 /* Set the micro tile type. */
357 if (surf
->flags
& RADEON_SURF_SCANOUT
)
358 AddrSurfInfoIn
.tileType
= ADDR_DISPLAYABLE
;
359 else if (surf
->flags
& RADEON_SURF_Z_OR_SBUFFER
)
360 AddrSurfInfoIn
.tileType
= ADDR_DEPTH_SAMPLE_ORDER
;
362 AddrSurfInfoIn
.tileType
= ADDR_NON_DISPLAYABLE
;
364 AddrSurfInfoIn
.flags
.color
= !(surf
->flags
& RADEON_SURF_Z_OR_SBUFFER
);
365 AddrSurfInfoIn
.flags
.depth
= (surf
->flags
& RADEON_SURF_ZBUFFER
) != 0;
366 AddrSurfInfoIn
.flags
.stencil
= (surf
->flags
& RADEON_SURF_SBUFFER
) != 0;
367 AddrSurfInfoIn
.flags
.cube
= type
== RADEON_SURF_TYPE_CUBEMAP
;
368 AddrSurfInfoIn
.flags
.display
= (surf
->flags
& RADEON_SURF_SCANOUT
) != 0;
369 AddrSurfInfoIn
.flags
.pow2Pad
= surf
->last_level
> 0;
370 AddrSurfInfoIn
.flags
.degrade4Space
= 1;
371 AddrSurfInfoIn
.flags
.dccCompatible
= !(surf
->flags
& RADEON_SURF_Z_OR_SBUFFER
) &&
372 !(surf
->flags
& RADEON_SURF_SCANOUT
) &&
373 !compressed
&& AddrDccIn
.numSamples
<= 1;
375 /* This disables incorrect calculations (hacks) in addrlib. */
376 AddrSurfInfoIn
.flags
.noStencil
= 1;
378 /* Set preferred macrotile parameters. This is usually required
379 * for shared resources. This is for 2D tiling only. */
380 if (AddrSurfInfoIn
.tileMode
>= ADDR_TM_2D_TILED_THIN1
&&
381 surf
->bankw
&& surf
->bankh
&& surf
->mtilea
&& surf
->tile_split
) {
382 /* If any of these parameters are incorrect, the calculation
384 AddrTileInfoIn
.banks
= cik_num_banks(ws
, surf
);
385 AddrTileInfoIn
.bankWidth
= surf
->bankw
;
386 AddrTileInfoIn
.bankHeight
= surf
->bankh
;
387 AddrTileInfoIn
.macroAspectRatio
= surf
->mtilea
;
388 AddrTileInfoIn
.tileSplitBytes
= surf
->tile_split
;
389 AddrSurfInfoIn
.flags
.degrade4Space
= 0;
390 AddrSurfInfoIn
.pTileInfo
= &AddrTileInfoIn
;
392 /* If AddrSurfInfoIn.pTileInfo is set, Addrlib doesn't set
393 * the tile index, because we are expected to know it if
394 * we know the other parameters.
396 * This is something that can easily be fixed in Addrlib.
397 * For now, just figure it out here.
398 * Note that only 2D_TILE_THIN1 is handled here.
400 assert(!(surf
->flags
& RADEON_SURF_Z_OR_SBUFFER
));
401 assert(AddrSurfInfoIn
.tileMode
== ADDR_TM_2D_TILED_THIN1
);
403 if (AddrSurfInfoIn
.tileType
== ADDR_DISPLAYABLE
)
404 AddrSurfInfoIn
.tileIndex
= 10; /* 2D displayable */
406 AddrSurfInfoIn
.tileIndex
= 14; /* 2D non-displayable */
411 surf
->dcc_alignment
= 1;
413 /* Calculate texture layout information. */
414 for (level
= 0; level
<= surf
->last_level
; level
++) {
415 r
= compute_level(ws
, surf
, false, level
, type
, compressed
,
416 &AddrSurfInfoIn
, &AddrSurfInfoOut
, &AddrDccIn
, &AddrDccOut
);
421 surf
->bo_alignment
= AddrSurfInfoOut
.baseAlign
;
422 surf
->pipe_config
= AddrSurfInfoOut
.pTileInfo
->pipeConfig
- 1;
424 /* For 2D modes only. */
425 if (AddrSurfInfoOut
.tileMode
>= ADDR_TM_2D_TILED_THIN1
) {
426 surf
->bankw
= AddrSurfInfoOut
.pTileInfo
->bankWidth
;
427 surf
->bankh
= AddrSurfInfoOut
.pTileInfo
->bankHeight
;
428 surf
->mtilea
= AddrSurfInfoOut
.pTileInfo
->macroAspectRatio
;
429 surf
->tile_split
= AddrSurfInfoOut
.pTileInfo
->tileSplitBytes
;
430 surf
->num_banks
= AddrSurfInfoOut
.pTileInfo
->banks
;
435 /* Calculate texture layout information for stencil. */
436 if (surf
->flags
& RADEON_SURF_SBUFFER
) {
437 AddrSurfInfoIn
.bpp
= 8;
438 /* This will be ignored if AddrSurfInfoIn.pTileInfo is NULL. */
439 AddrTileInfoIn
.tileSplitBytes
= surf
->stencil_tile_split
;
441 for (level
= 0; level
<= surf
->last_level
; level
++) {
442 r
= compute_level(ws
, surf
, true, level
, type
, compressed
,
443 &AddrSurfInfoIn
, &AddrSurfInfoOut
, &AddrDccIn
, &AddrDccOut
);
448 surf
->stencil_offset
= surf
->stencil_level
[0].offset
;
450 /* For 2D modes only. */
451 if (AddrSurfInfoOut
.tileMode
>= ADDR_TM_2D_TILED_THIN1
) {
452 surf
->stencil_tile_split
=
453 AddrSurfInfoOut
.pTileInfo
->tileSplitBytes
;
462 static int amdgpu_surface_best(struct radeon_winsys
*rws
,
463 struct radeon_surf
*surf
)
468 void amdgpu_surface_init_functions(struct amdgpu_winsys
*ws
)
470 ws
->base
.surface_init
= amdgpu_surface_init
;
471 ws
->base
.surface_best
= amdgpu_surface_best
;