/*
 * Copyright © 2011 Red Hat All Rights Reserved.
 * Copyright © 2014 Advanced Micro Devices, Inc.
 *
 * Permission is hereby granted, free of charge, to any person obtaining
 * a copy of this software and associated documentation files (the
 * "Software"), to deal in the Software without restriction, including
 * without limitation the rights to use, copy, modify, merge, publish,
 * distribute, sub license, and/or sell copies of the Software, and to
 * permit persons to whom the Software is furnished to do so, subject to
 * the following conditions:
 *
 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND,
 * EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES
 * OF MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND
 * NON-INFRINGEMENT. IN NO EVENT SHALL THE COPYRIGHT HOLDERS, AUTHORS
 * AND/OR ITS SUPPLIERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
 * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE,
 * ARISING FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE
 * USE OR OTHER DEALINGS IN THE SOFTWARE.
 *
 * The above copyright notice and this permission notice (including the
 * next paragraph) shall be included in all copies or substantial portions
 * of the Software.
 */
/*
 *      Marek Olšák <maraeo@gmail.com>
 */
#include "amdgpu_winsys.h"

#include <errno.h>
#include <stddef.h>
/* Fallback definitions, used only when the included headers do not
 * already provide these names. */
#ifndef NO_MACRO_ENTRIES
#define NO_MACRO_ENTRIES 16
#endif

#ifndef CIASICIDGFXENGINE_SOUTHERNISLAND
#define CIASICIDGFXENGINE_SOUTHERNISLAND 0x0000000A
#endif
47 static int amdgpu_surface_sanity(const struct radeon_surf
*surf
)
49 unsigned type
= RADEON_SURF_GET(surf
->flags
, TYPE
);
51 if (!(surf
->flags
& RADEON_SURF_HAS_TILE_MODE_INDEX
))
54 /* all dimension must be at least 1 ! */
55 if (!surf
->npix_x
|| !surf
->npix_y
|| !surf
->npix_z
||
59 if (!surf
->blk_w
|| !surf
->blk_h
|| !surf
->blk_d
)
62 switch (surf
->nsamples
) {
73 case RADEON_SURF_TYPE_1D
:
77 case RADEON_SURF_TYPE_2D
:
78 case RADEON_SURF_TYPE_CUBEMAP
:
79 if (surf
->npix_z
> 1 || surf
->array_size
> 1)
82 case RADEON_SURF_TYPE_3D
:
83 if (surf
->array_size
> 1)
86 case RADEON_SURF_TYPE_1D_ARRAY
:
90 case RADEON_SURF_TYPE_2D_ARRAY
:
100 static void *ADDR_API
allocSysMem(const ADDR_ALLOCSYSMEM_INPUT
* pInput
)
102 return malloc(pInput
->sizeInBytes
);
105 static ADDR_E_RETURNCODE ADDR_API
freeSysMem(const ADDR_FREESYSMEM_INPUT
* pInput
)
107 free(pInput
->pVirtAddr
);
112 * This returns the number of banks for the surface.
113 * Possible values: 2, 4, 8, 16.
115 static uint32_t cik_num_banks(struct amdgpu_winsys
*ws
,
116 struct radeon_surf
*surf
)
118 unsigned index
, tileb
;
120 tileb
= 8 * 8 * surf
->bpe
;
121 tileb
= MIN2(surf
->tile_split
, tileb
);
123 for (index
= 0; tileb
> 64; index
++) {
128 return 2 << ((ws
->amdinfo
.gb_macro_tile_mode
[index
] >> 6) & 0x3);
131 ADDR_HANDLE
amdgpu_addr_create(struct amdgpu_winsys
*ws
)
133 ADDR_CREATE_INPUT addrCreateInput
= {0};
134 ADDR_CREATE_OUTPUT addrCreateOutput
= {0};
135 ADDR_REGISTER_VALUE regValue
= {0};
136 ADDR_CREATE_FLAGS createFlags
= {{0}};
137 ADDR_E_RETURNCODE addrRet
;
139 addrCreateInput
.size
= sizeof(ADDR_CREATE_INPUT
);
140 addrCreateOutput
.size
= sizeof(ADDR_CREATE_OUTPUT
);
142 regValue
.noOfBanks
= ws
->amdinfo
.mc_arb_ramcfg
& 0x3;
143 regValue
.gbAddrConfig
= ws
->amdinfo
.gb_addr_cfg
;
144 regValue
.noOfRanks
= (ws
->amdinfo
.mc_arb_ramcfg
& 0x4) >> 2;
146 regValue
.backendDisables
= ws
->amdinfo
.backend_disable
[0];
147 regValue
.pTileConfig
= ws
->amdinfo
.gb_tile_mode
;
148 regValue
.noOfEntries
= sizeof(ws
->amdinfo
.gb_tile_mode
) /
149 sizeof(ws
->amdinfo
.gb_tile_mode
[0]);
150 regValue
.pMacroTileConfig
= ws
->amdinfo
.gb_macro_tile_mode
;
151 regValue
.noOfMacroEntries
= sizeof(ws
->amdinfo
.gb_macro_tile_mode
) /
152 sizeof(ws
->amdinfo
.gb_macro_tile_mode
[0]);
154 createFlags
.value
= 0;
155 createFlags
.useTileIndex
= 1;
156 createFlags
.degradeBaseLevel
= 1;
158 addrCreateInput
.chipEngine
= CIASICIDGFXENGINE_SOUTHERNISLAND
;
159 addrCreateInput
.chipFamily
= ws
->family
;
160 addrCreateInput
.chipRevision
= ws
->rev_id
;
161 addrCreateInput
.createFlags
= createFlags
;
162 addrCreateInput
.callbacks
.allocSysMem
= allocSysMem
;
163 addrCreateInput
.callbacks
.freeSysMem
= freeSysMem
;
164 addrCreateInput
.callbacks
.debugPrint
= 0;
165 addrCreateInput
.regValue
= regValue
;
167 addrRet
= AddrCreate(&addrCreateInput
, &addrCreateOutput
);
168 if (addrRet
!= ADDR_OK
)
171 return addrCreateOutput
.hLib
;
174 static int compute_level(struct amdgpu_winsys
*ws
,
175 struct radeon_surf
*surf
, bool is_stencil
,
176 unsigned level
, unsigned type
, bool compressed
,
177 ADDR_COMPUTE_SURFACE_INFO_INPUT
*AddrSurfInfoIn
,
178 ADDR_COMPUTE_SURFACE_INFO_OUTPUT
*AddrSurfInfoOut
)
180 struct radeon_surf_level
*surf_level
;
181 ADDR_E_RETURNCODE ret
;
183 AddrSurfInfoIn
->mipLevel
= level
;
184 AddrSurfInfoIn
->width
= u_minify(surf
->npix_x
, level
);
185 AddrSurfInfoIn
->height
= u_minify(surf
->npix_y
, level
);
187 if (type
== RADEON_SURF_TYPE_3D
)
188 AddrSurfInfoIn
->numSlices
= u_minify(surf
->npix_z
, level
);
189 else if (type
== RADEON_SURF_TYPE_CUBEMAP
)
190 AddrSurfInfoIn
->numSlices
= 6;
192 AddrSurfInfoIn
->numSlices
= surf
->array_size
;
195 /* Set the base level pitch. This is needed for calculation
196 * of non-zero levels. */
198 AddrSurfInfoIn
->basePitch
= surf
->stencil_level
[0].nblk_x
;
200 AddrSurfInfoIn
->basePitch
= surf
->level
[0].nblk_x
;
202 /* Convert blocks to pixels for compressed formats. */
204 AddrSurfInfoIn
->basePitch
*= surf
->blk_w
;
207 ret
= AddrComputeSurfaceInfo(ws
->addrlib
,
210 if (ret
!= ADDR_OK
) {
214 surf_level
= is_stencil
? &surf
->stencil_level
[level
] : &surf
->level
[level
];
215 surf_level
->offset
= align(surf
->bo_size
, AddrSurfInfoOut
->baseAlign
);
216 surf_level
->slice_size
= AddrSurfInfoOut
->sliceSize
;
217 surf_level
->pitch_bytes
= AddrSurfInfoOut
->pitch
* (is_stencil
? 1 : surf
->bpe
);
218 surf_level
->npix_x
= u_minify(surf
->npix_x
, level
);
219 surf_level
->npix_y
= u_minify(surf
->npix_y
, level
);
220 surf_level
->npix_z
= u_minify(surf
->npix_z
, level
);
221 surf_level
->nblk_x
= AddrSurfInfoOut
->pitch
;
222 surf_level
->nblk_y
= AddrSurfInfoOut
->height
;
223 if (type
== RADEON_SURF_TYPE_3D
)
224 surf_level
->nblk_z
= AddrSurfInfoOut
->depth
;
226 surf_level
->nblk_z
= 1;
228 switch (AddrSurfInfoOut
->tileMode
) {
229 case ADDR_TM_LINEAR_GENERAL
:
230 surf_level
->mode
= RADEON_SURF_MODE_LINEAR
;
232 case ADDR_TM_LINEAR_ALIGNED
:
233 surf_level
->mode
= RADEON_SURF_MODE_LINEAR_ALIGNED
;
235 case ADDR_TM_1D_TILED_THIN1
:
236 surf_level
->mode
= RADEON_SURF_MODE_1D
;
238 case ADDR_TM_2D_TILED_THIN1
:
239 surf_level
->mode
= RADEON_SURF_MODE_2D
;
246 surf
->stencil_tiling_index
[level
] = AddrSurfInfoOut
->tileIndex
;
248 surf
->tiling_index
[level
] = AddrSurfInfoOut
->tileIndex
;
250 surf
->bo_size
= surf_level
->offset
+ AddrSurfInfoOut
->surfSize
;
254 static int amdgpu_surface_init(struct radeon_winsys
*rws
,
255 struct radeon_surf
*surf
)
257 struct amdgpu_winsys
*ws
= (struct amdgpu_winsys
*)rws
;
258 unsigned level
, mode
, type
;
260 ADDR_COMPUTE_SURFACE_INFO_INPUT AddrSurfInfoIn
= {0};
261 ADDR_COMPUTE_SURFACE_INFO_OUTPUT AddrSurfInfoOut
= {0};
262 ADDR_TILEINFO AddrTileInfoIn
= {0};
263 ADDR_TILEINFO AddrTileInfoOut
= {0};
266 r
= amdgpu_surface_sanity(surf
);
270 AddrSurfInfoIn
.size
= sizeof(ADDR_COMPUTE_SURFACE_INFO_INPUT
);
271 AddrSurfInfoOut
.size
= sizeof(ADDR_COMPUTE_SURFACE_INFO_OUTPUT
);
272 AddrSurfInfoOut
.pTileInfo
= &AddrTileInfoOut
;
274 type
= RADEON_SURF_GET(surf
->flags
, TYPE
);
275 mode
= RADEON_SURF_GET(surf
->flags
, MODE
);
276 compressed
= surf
->blk_w
== 4 && surf
->blk_h
== 4;
278 /* MSAA and FMASK require 2D tiling. */
279 if (surf
->nsamples
> 1 ||
280 (surf
->flags
& RADEON_SURF_FMASK
))
281 mode
= RADEON_SURF_MODE_2D
;
283 /* DB doesn't support linear layouts. */
284 if (surf
->flags
& (RADEON_SURF_Z_OR_SBUFFER
) &&
285 mode
< RADEON_SURF_MODE_1D
)
286 mode
= RADEON_SURF_MODE_1D
;
288 /* Set the requested tiling mode. */
290 case RADEON_SURF_MODE_LINEAR
:
291 AddrSurfInfoIn
.tileMode
= ADDR_TM_LINEAR_GENERAL
;
293 case RADEON_SURF_MODE_LINEAR_ALIGNED
:
294 AddrSurfInfoIn
.tileMode
= ADDR_TM_LINEAR_ALIGNED
;
296 case RADEON_SURF_MODE_1D
:
297 AddrSurfInfoIn
.tileMode
= ADDR_TM_1D_TILED_THIN1
;
299 case RADEON_SURF_MODE_2D
:
300 AddrSurfInfoIn
.tileMode
= ADDR_TM_2D_TILED_THIN1
;
306 /* The format must be set correctly for the allocation of compressed
307 * textures to work. In other cases, setting the bpp is sufficient. */
311 AddrSurfInfoIn
.format
= ADDR_FMT_BC1
;
314 AddrSurfInfoIn
.format
= ADDR_FMT_BC3
;
321 AddrSurfInfoIn
.bpp
= surf
->bpe
* 8;
324 AddrSurfInfoIn
.numSamples
= surf
->nsamples
;
325 AddrSurfInfoIn
.tileIndex
= -1;
327 /* Set the micro tile type. */
328 if (surf
->flags
& RADEON_SURF_SCANOUT
)
329 AddrSurfInfoIn
.tileType
= ADDR_DISPLAYABLE
;
330 else if (surf
->flags
& RADEON_SURF_Z_OR_SBUFFER
)
331 AddrSurfInfoIn
.tileType
= ADDR_DEPTH_SAMPLE_ORDER
;
333 AddrSurfInfoIn
.tileType
= ADDR_NON_DISPLAYABLE
;
335 AddrSurfInfoIn
.flags
.color
= !(surf
->flags
& RADEON_SURF_Z_OR_SBUFFER
);
336 AddrSurfInfoIn
.flags
.depth
= (surf
->flags
& RADEON_SURF_ZBUFFER
) != 0;
337 AddrSurfInfoIn
.flags
.stencil
= (surf
->flags
& RADEON_SURF_SBUFFER
) != 0;
338 AddrSurfInfoIn
.flags
.cube
= type
== RADEON_SURF_TYPE_CUBEMAP
;
339 AddrSurfInfoIn
.flags
.display
= (surf
->flags
& RADEON_SURF_SCANOUT
) != 0;
340 AddrSurfInfoIn
.flags
.pow2Pad
= surf
->last_level
> 0;
341 AddrSurfInfoIn
.flags
.degrade4Space
= 1;
343 /* This disables incorrect calculations (hacks) in addrlib. */
344 AddrSurfInfoIn
.flags
.noStencil
= 1;
346 /* Set preferred macrotile parameters. This is usually required
347 * for shared resources. This is for 2D tiling only. */
348 if (AddrSurfInfoIn
.tileMode
>= ADDR_TM_2D_TILED_THIN1
&&
349 surf
->bankw
&& surf
->bankh
&& surf
->mtilea
&& surf
->tile_split
) {
350 /* If any of these parameters are incorrect, the calculation
352 AddrTileInfoIn
.banks
= cik_num_banks(ws
, surf
);
353 AddrTileInfoIn
.bankWidth
= surf
->bankw
;
354 AddrTileInfoIn
.bankHeight
= surf
->bankh
;
355 AddrTileInfoIn
.macroAspectRatio
= surf
->mtilea
;
356 AddrTileInfoIn
.tileSplitBytes
= surf
->tile_split
;
357 AddrSurfInfoIn
.flags
.degrade4Space
= 0;
358 AddrSurfInfoIn
.pTileInfo
= &AddrTileInfoIn
;
360 /* If AddrSurfInfoIn.pTileInfo is set, Addrlib doesn't set
361 * the tile index, because we are expected to know it if
362 * we know the other parameters.
364 * This is something that can easily be fixed in Addrlib.
365 * For now, just figure it out here.
366 * Note that only 2D_TILE_THIN1 is handled here.
368 assert(!(surf
->flags
& RADEON_SURF_Z_OR_SBUFFER
));
369 assert(AddrSurfInfoIn
.tileMode
== ADDR_TM_2D_TILED_THIN1
);
371 if (AddrSurfInfoIn
.tileType
== ADDR_DISPLAYABLE
)
372 AddrSurfInfoIn
.tileIndex
= 10; /* 2D displayable */
374 AddrSurfInfoIn
.tileIndex
= 14; /* 2D non-displayable */
379 /* Calculate texture layout information. */
380 for (level
= 0; level
<= surf
->last_level
; level
++) {
381 r
= compute_level(ws
, surf
, false, level
, type
, compressed
,
382 &AddrSurfInfoIn
, &AddrSurfInfoOut
);
387 surf
->bo_alignment
= AddrSurfInfoOut
.baseAlign
;
388 surf
->pipe_config
= AddrSurfInfoOut
.pTileInfo
->pipeConfig
- 1;
390 /* For 2D modes only. */
391 if (AddrSurfInfoOut
.tileMode
>= ADDR_TM_2D_TILED_THIN1
) {
392 surf
->bankw
= AddrSurfInfoOut
.pTileInfo
->bankWidth
;
393 surf
->bankh
= AddrSurfInfoOut
.pTileInfo
->bankHeight
;
394 surf
->mtilea
= AddrSurfInfoOut
.pTileInfo
->macroAspectRatio
;
395 surf
->tile_split
= AddrSurfInfoOut
.pTileInfo
->tileSplitBytes
;
396 surf
->num_banks
= AddrSurfInfoOut
.pTileInfo
->banks
;
401 /* Calculate texture layout information for stencil. */
402 if (surf
->flags
& RADEON_SURF_SBUFFER
) {
403 AddrSurfInfoIn
.bpp
= 8;
404 /* This will be ignored if AddrSurfInfoIn.pTileInfo is NULL. */
405 AddrTileInfoIn
.tileSplitBytes
= surf
->stencil_tile_split
;
407 for (level
= 0; level
<= surf
->last_level
; level
++) {
408 r
= compute_level(ws
, surf
, true, level
, type
, compressed
,
409 &AddrSurfInfoIn
, &AddrSurfInfoOut
);
414 surf
->stencil_offset
= surf
->stencil_level
[0].offset
;
416 /* For 2D modes only. */
417 if (AddrSurfInfoOut
.tileMode
>= ADDR_TM_2D_TILED_THIN1
) {
418 surf
->stencil_tile_split
=
419 AddrSurfInfoOut
.pTileInfo
->tileSplitBytes
;
/**
 * surface_best hook installed by amdgpu_surface_init_functions.
 *
 * \param rws   winsys (unused)
 * \param surf  surface description (unused)
 * \return 0
 *
 * NOTE(review): only the signature survived in the damaged listing this was
 * restored from. Three lines are missing between it and the next
 * definition, which is consistent with a body that just returns 0 --
 * confirm against the reference file.
 */
static int amdgpu_surface_best(struct radeon_winsys *rws,
                               struct radeon_surf *surf)
{
   return 0;
}
434 void amdgpu_surface_init_functions(struct amdgpu_winsys
*ws
)
436 ws
->base
.surface_init
= amdgpu_surface_init
;
437 ws
->base
.surface_best
= amdgpu_surface_best
;