2 * Copyright © 2011 Red Hat All Rights Reserved.
3 * Copyright © 2014 Advanced Micro Devices, Inc.
6 * Permission is hereby granted, free of charge, to any person obtaining
7 * a copy of this software and associated documentation files (the
8 * "Software"), to deal in the Software without restriction, including
9 * without limitation the rights to use, copy, modify, merge, publish,
10 * distribute, sub license, and/or sell copies of the Software, and to
11 * permit persons to whom the Software is furnished to do so, subject to
12 * the following conditions:
14 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND,
15 * EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES
16 * OF MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND
17 * NON-INFRINGEMENT. IN NO EVENT SHALL THE COPYRIGHT HOLDERS, AUTHORS
18 * AND/OR ITS SUPPLIERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
19 * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE,
20 * ARISING FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE
21 * USE OR OTHER DEALINGS IN THE SOFTWARE.
23 * The above copyright notice and this permission notice (including the
24 * next paragraph) shall be included in all copies or substantial portions
29 * Marek Olšák <maraeo@gmail.com>
32 #include "amdgpu_winsys.h"
38 #ifndef NO_MACRO_ENTRIES
39 #define NO_MACRO_ENTRIES 16
42 #ifndef CIASICIDGFXENGINE_SOUTHERNISLAND
43 #define CIASICIDGFXENGINE_SOUTHERNISLAND 0x0000000A
47 static int amdgpu_surface_sanity(const struct radeon_surf
*surf
)
49 unsigned type
= RADEON_SURF_GET(surf
->flags
, TYPE
);
51 if (!(surf
->flags
& RADEON_SURF_HAS_TILE_MODE_INDEX
))
54 /* all dimension must be at least 1 ! */
55 if (!surf
->npix_x
|| !surf
->npix_y
|| !surf
->npix_z
||
59 if (!surf
->blk_w
|| !surf
->blk_h
|| !surf
->blk_d
)
62 switch (surf
->nsamples
) {
73 case RADEON_SURF_TYPE_1D
:
77 case RADEON_SURF_TYPE_2D
:
78 case RADEON_SURF_TYPE_CUBEMAP
:
79 if (surf
->npix_z
> 1 || surf
->array_size
> 1)
82 case RADEON_SURF_TYPE_3D
:
83 if (surf
->array_size
> 1)
86 case RADEON_SURF_TYPE_1D_ARRAY
:
90 case RADEON_SURF_TYPE_2D_ARRAY
:
100 static void *ADDR_API
allocSysMem(const ADDR_ALLOCSYSMEM_INPUT
* pInput
)
102 return malloc(pInput
->sizeInBytes
);
105 static ADDR_E_RETURNCODE ADDR_API
freeSysMem(const ADDR_FREESYSMEM_INPUT
* pInput
)
107 free(pInput
->pVirtAddr
);
112 * This returns the number of banks for the surface.
113 * Possible values: 2, 4, 8, 16.
115 static uint32_t cik_num_banks(struct amdgpu_winsys
*ws
,
116 struct radeon_surf
*surf
)
118 unsigned index
, tileb
;
120 tileb
= 8 * 8 * surf
->bpe
;
121 tileb
= MIN2(surf
->tile_split
, tileb
);
123 for (index
= 0; tileb
> 64; index
++) {
128 return 2 << ((ws
->amdinfo
.gb_macro_tile_mode
[index
] >> 6) & 0x3);
131 ADDR_HANDLE
amdgpu_addr_create(struct amdgpu_winsys
*ws
)
133 ADDR_CREATE_INPUT addrCreateInput
= {0};
134 ADDR_CREATE_OUTPUT addrCreateOutput
= {0};
135 ADDR_REGISTER_VALUE regValue
= {0};
136 ADDR_CREATE_FLAGS createFlags
= {{0}};
137 ADDR_E_RETURNCODE addrRet
;
139 addrCreateInput
.size
= sizeof(ADDR_CREATE_INPUT
);
140 addrCreateOutput
.size
= sizeof(ADDR_CREATE_OUTPUT
);
142 regValue
.noOfBanks
= ws
->amdinfo
.mc_arb_ramcfg
& 0x3;
143 regValue
.gbAddrConfig
= ws
->amdinfo
.gb_addr_cfg
;
144 regValue
.noOfRanks
= (ws
->amdinfo
.mc_arb_ramcfg
& 0x4) >> 2;
146 regValue
.backendDisables
= ws
->amdinfo
.backend_disable
[0];
147 regValue
.pTileConfig
= ws
->amdinfo
.gb_tile_mode
;
148 regValue
.noOfEntries
= sizeof(ws
->amdinfo
.gb_tile_mode
) /
149 sizeof(ws
->amdinfo
.gb_tile_mode
[0]);
150 regValue
.pMacroTileConfig
= ws
->amdinfo
.gb_macro_tile_mode
;
151 regValue
.noOfMacroEntries
= sizeof(ws
->amdinfo
.gb_macro_tile_mode
) /
152 sizeof(ws
->amdinfo
.gb_macro_tile_mode
[0]);
154 createFlags
.value
= 0;
155 createFlags
.useTileIndex
= 1;
156 createFlags
.degradeBaseLevel
= 1;
158 addrCreateInput
.chipEngine
= CIASICIDGFXENGINE_SOUTHERNISLAND
;
159 addrCreateInput
.chipFamily
= ws
->family
;
160 addrCreateInput
.chipRevision
= ws
->rev_id
;
161 addrCreateInput
.createFlags
= createFlags
;
162 addrCreateInput
.callbacks
.allocSysMem
= allocSysMem
;
163 addrCreateInput
.callbacks
.freeSysMem
= freeSysMem
;
164 addrCreateInput
.callbacks
.debugPrint
= 0;
165 addrCreateInput
.regValue
= regValue
;
167 addrRet
= AddrCreate(&addrCreateInput
, &addrCreateOutput
);
168 if (addrRet
!= ADDR_OK
)
171 return addrCreateOutput
.hLib
;
174 static int compute_level(struct amdgpu_winsys
*ws
,
175 struct radeon_surf
*surf
, bool is_stencil
,
176 unsigned level
, unsigned type
, bool compressed
,
177 ADDR_COMPUTE_SURFACE_INFO_INPUT
*AddrSurfInfoIn
,
178 ADDR_COMPUTE_SURFACE_INFO_OUTPUT
*AddrSurfInfoOut
,
179 ADDR_COMPUTE_DCCINFO_INPUT
*AddrDccIn
,
180 ADDR_COMPUTE_DCCINFO_OUTPUT
*AddrDccOut
)
182 struct radeon_surf_level
*surf_level
;
183 ADDR_E_RETURNCODE ret
;
185 AddrSurfInfoIn
->mipLevel
= level
;
186 AddrSurfInfoIn
->width
= u_minify(surf
->npix_x
, level
);
187 AddrSurfInfoIn
->height
= u_minify(surf
->npix_y
, level
);
189 if (type
== RADEON_SURF_TYPE_3D
)
190 AddrSurfInfoIn
->numSlices
= u_minify(surf
->npix_z
, level
);
191 else if (type
== RADEON_SURF_TYPE_CUBEMAP
)
192 AddrSurfInfoIn
->numSlices
= 6;
194 AddrSurfInfoIn
->numSlices
= surf
->array_size
;
197 /* Set the base level pitch. This is needed for calculation
198 * of non-zero levels. */
200 AddrSurfInfoIn
->basePitch
= surf
->stencil_level
[0].nblk_x
;
202 AddrSurfInfoIn
->basePitch
= surf
->level
[0].nblk_x
;
204 /* Convert blocks to pixels for compressed formats. */
206 AddrSurfInfoIn
->basePitch
*= surf
->blk_w
;
209 ret
= AddrComputeSurfaceInfo(ws
->addrlib
,
212 if (ret
!= ADDR_OK
) {
216 surf_level
= is_stencil
? &surf
->stencil_level
[level
] : &surf
->level
[level
];
217 surf_level
->offset
= align(surf
->bo_size
, AddrSurfInfoOut
->baseAlign
);
218 surf_level
->slice_size
= AddrSurfInfoOut
->sliceSize
;
219 surf_level
->pitch_bytes
= AddrSurfInfoOut
->pitch
* (is_stencil
? 1 : surf
->bpe
);
220 surf_level
->npix_x
= u_minify(surf
->npix_x
, level
);
221 surf_level
->npix_y
= u_minify(surf
->npix_y
, level
);
222 surf_level
->npix_z
= u_minify(surf
->npix_z
, level
);
223 surf_level
->nblk_x
= AddrSurfInfoOut
->pitch
;
224 surf_level
->nblk_y
= AddrSurfInfoOut
->height
;
225 if (type
== RADEON_SURF_TYPE_3D
)
226 surf_level
->nblk_z
= AddrSurfInfoOut
->depth
;
228 surf_level
->nblk_z
= 1;
230 switch (AddrSurfInfoOut
->tileMode
) {
231 case ADDR_TM_LINEAR_GENERAL
:
232 surf_level
->mode
= RADEON_SURF_MODE_LINEAR
;
234 case ADDR_TM_LINEAR_ALIGNED
:
235 surf_level
->mode
= RADEON_SURF_MODE_LINEAR_ALIGNED
;
237 case ADDR_TM_1D_TILED_THIN1
:
238 surf_level
->mode
= RADEON_SURF_MODE_1D
;
240 case ADDR_TM_2D_TILED_THIN1
:
241 surf_level
->mode
= RADEON_SURF_MODE_2D
;
248 surf
->stencil_tiling_index
[level
] = AddrSurfInfoOut
->tileIndex
;
250 surf
->tiling_index
[level
] = AddrSurfInfoOut
->tileIndex
;
252 surf
->bo_size
= surf_level
->offset
+ AddrSurfInfoOut
->surfSize
;
254 if (AddrSurfInfoIn
->flags
.dccCompatible
) {
255 AddrDccIn
->colorSurfSize
= AddrSurfInfoOut
->surfSize
;
256 AddrDccIn
->tileMode
= AddrSurfInfoOut
->tileMode
;
257 AddrDccIn
->tileInfo
= *AddrSurfInfoOut
->pTileInfo
;
258 AddrDccIn
->tileIndex
= AddrSurfInfoOut
->tileIndex
;
259 AddrDccIn
->macroModeIndex
= AddrSurfInfoOut
->macroModeIndex
;
261 ret
= AddrComputeDccInfo(ws
->addrlib
,
265 if (ret
== ADDR_OK
) {
266 surf_level
->dcc_offset
= surf
->dcc_size
;
267 surf
->dcc_size
= surf_level
->dcc_offset
+ AddrDccOut
->dccRamSize
;
268 surf
->dcc_alignment
= MAX2(surf
->dcc_alignment
, AddrDccOut
->dccRamBaseAlign
);
271 surf_level
->dcc_offset
= 0;
275 surf_level
->dcc_offset
= 0;
281 static int amdgpu_surface_init(struct radeon_winsys
*rws
,
282 struct radeon_surf
*surf
)
284 struct amdgpu_winsys
*ws
= (struct amdgpu_winsys
*)rws
;
285 unsigned level
, mode
, type
;
287 ADDR_COMPUTE_SURFACE_INFO_INPUT AddrSurfInfoIn
= {0};
288 ADDR_COMPUTE_SURFACE_INFO_OUTPUT AddrSurfInfoOut
= {0};
289 ADDR_COMPUTE_DCCINFO_INPUT AddrDccIn
= {0};
290 ADDR_COMPUTE_DCCINFO_OUTPUT AddrDccOut
= {0};
291 ADDR_TILEINFO AddrTileInfoIn
= {0};
292 ADDR_TILEINFO AddrTileInfoOut
= {0};
295 r
= amdgpu_surface_sanity(surf
);
299 AddrSurfInfoIn
.size
= sizeof(ADDR_COMPUTE_SURFACE_INFO_INPUT
);
300 AddrSurfInfoOut
.size
= sizeof(ADDR_COMPUTE_SURFACE_INFO_OUTPUT
);
301 AddrDccIn
.size
= sizeof(ADDR_COMPUTE_DCCINFO_INPUT
);
302 AddrDccOut
.size
= sizeof(ADDR_COMPUTE_DCCINFO_OUTPUT
);
303 AddrSurfInfoOut
.pTileInfo
= &AddrTileInfoOut
;
305 type
= RADEON_SURF_GET(surf
->flags
, TYPE
);
306 mode
= RADEON_SURF_GET(surf
->flags
, MODE
);
307 compressed
= surf
->blk_w
== 4 && surf
->blk_h
== 4;
309 /* MSAA and FMASK require 2D tiling. */
310 if (surf
->nsamples
> 1 ||
311 (surf
->flags
& RADEON_SURF_FMASK
))
312 mode
= RADEON_SURF_MODE_2D
;
314 /* DB doesn't support linear layouts. */
315 if (surf
->flags
& (RADEON_SURF_Z_OR_SBUFFER
) &&
316 mode
< RADEON_SURF_MODE_1D
)
317 mode
= RADEON_SURF_MODE_1D
;
319 /* Set the requested tiling mode. */
321 case RADEON_SURF_MODE_LINEAR
:
322 AddrSurfInfoIn
.tileMode
= ADDR_TM_LINEAR_GENERAL
;
324 case RADEON_SURF_MODE_LINEAR_ALIGNED
:
325 AddrSurfInfoIn
.tileMode
= ADDR_TM_LINEAR_ALIGNED
;
327 case RADEON_SURF_MODE_1D
:
328 AddrSurfInfoIn
.tileMode
= ADDR_TM_1D_TILED_THIN1
;
330 case RADEON_SURF_MODE_2D
:
331 AddrSurfInfoIn
.tileMode
= ADDR_TM_2D_TILED_THIN1
;
337 /* The format must be set correctly for the allocation of compressed
338 * textures to work. In other cases, setting the bpp is sufficient. */
342 AddrSurfInfoIn
.format
= ADDR_FMT_BC1
;
345 AddrSurfInfoIn
.format
= ADDR_FMT_BC3
;
352 AddrDccIn
.bpp
= AddrSurfInfoIn
.bpp
= surf
->bpe
* 8;
355 AddrDccIn
.numSamples
= AddrSurfInfoIn
.numSamples
= surf
->nsamples
;
356 AddrSurfInfoIn
.tileIndex
= -1;
358 /* Set the micro tile type. */
359 if (surf
->flags
& RADEON_SURF_SCANOUT
)
360 AddrSurfInfoIn
.tileType
= ADDR_DISPLAYABLE
;
361 else if (surf
->flags
& RADEON_SURF_Z_OR_SBUFFER
)
362 AddrSurfInfoIn
.tileType
= ADDR_DEPTH_SAMPLE_ORDER
;
364 AddrSurfInfoIn
.tileType
= ADDR_NON_DISPLAYABLE
;
366 AddrSurfInfoIn
.flags
.color
= !(surf
->flags
& RADEON_SURF_Z_OR_SBUFFER
);
367 AddrSurfInfoIn
.flags
.depth
= (surf
->flags
& RADEON_SURF_ZBUFFER
) != 0;
368 AddrSurfInfoIn
.flags
.stencil
= (surf
->flags
& RADEON_SURF_SBUFFER
) != 0;
369 AddrSurfInfoIn
.flags
.cube
= type
== RADEON_SURF_TYPE_CUBEMAP
;
370 AddrSurfInfoIn
.flags
.display
= (surf
->flags
& RADEON_SURF_SCANOUT
) != 0;
371 AddrSurfInfoIn
.flags
.pow2Pad
= surf
->last_level
> 0;
372 AddrSurfInfoIn
.flags
.degrade4Space
= 1;
373 AddrSurfInfoIn
.flags
.dccCompatible
= !(surf
->flags
& RADEON_SURF_Z_OR_SBUFFER
) &&
374 !(surf
->flags
& RADEON_SURF_SCANOUT
) &&
375 !compressed
&& AddrDccIn
.numSamples
<= 1;
377 /* This disables incorrect calculations (hacks) in addrlib. */
378 AddrSurfInfoIn
.flags
.noStencil
= 1;
380 /* Set preferred macrotile parameters. This is usually required
381 * for shared resources. This is for 2D tiling only. */
382 if (AddrSurfInfoIn
.tileMode
>= ADDR_TM_2D_TILED_THIN1
&&
383 surf
->bankw
&& surf
->bankh
&& surf
->mtilea
&& surf
->tile_split
) {
384 /* If any of these parameters are incorrect, the calculation
386 AddrTileInfoIn
.banks
= cik_num_banks(ws
, surf
);
387 AddrTileInfoIn
.bankWidth
= surf
->bankw
;
388 AddrTileInfoIn
.bankHeight
= surf
->bankh
;
389 AddrTileInfoIn
.macroAspectRatio
= surf
->mtilea
;
390 AddrTileInfoIn
.tileSplitBytes
= surf
->tile_split
;
391 AddrSurfInfoIn
.flags
.degrade4Space
= 0;
392 AddrSurfInfoIn
.pTileInfo
= &AddrTileInfoIn
;
394 /* If AddrSurfInfoIn.pTileInfo is set, Addrlib doesn't set
395 * the tile index, because we are expected to know it if
396 * we know the other parameters.
398 * This is something that can easily be fixed in Addrlib.
399 * For now, just figure it out here.
400 * Note that only 2D_TILE_THIN1 is handled here.
402 assert(!(surf
->flags
& RADEON_SURF_Z_OR_SBUFFER
));
403 assert(AddrSurfInfoIn
.tileMode
== ADDR_TM_2D_TILED_THIN1
);
405 if (AddrSurfInfoIn
.tileType
== ADDR_DISPLAYABLE
)
406 AddrSurfInfoIn
.tileIndex
= 10; /* 2D displayable */
408 AddrSurfInfoIn
.tileIndex
= 14; /* 2D non-displayable */
413 surf
->dcc_alignment
= 1;
415 /* Calculate texture layout information. */
416 for (level
= 0; level
<= surf
->last_level
; level
++) {
417 r
= compute_level(ws
, surf
, false, level
, type
, compressed
,
418 &AddrSurfInfoIn
, &AddrSurfInfoOut
, &AddrDccIn
, &AddrDccOut
);
423 surf
->bo_alignment
= AddrSurfInfoOut
.baseAlign
;
424 surf
->pipe_config
= AddrSurfInfoOut
.pTileInfo
->pipeConfig
- 1;
426 /* For 2D modes only. */
427 if (AddrSurfInfoOut
.tileMode
>= ADDR_TM_2D_TILED_THIN1
) {
428 surf
->bankw
= AddrSurfInfoOut
.pTileInfo
->bankWidth
;
429 surf
->bankh
= AddrSurfInfoOut
.pTileInfo
->bankHeight
;
430 surf
->mtilea
= AddrSurfInfoOut
.pTileInfo
->macroAspectRatio
;
431 surf
->tile_split
= AddrSurfInfoOut
.pTileInfo
->tileSplitBytes
;
432 surf
->num_banks
= AddrSurfInfoOut
.pTileInfo
->banks
;
437 /* Calculate texture layout information for stencil. */
438 if (surf
->flags
& RADEON_SURF_SBUFFER
) {
439 AddrSurfInfoIn
.bpp
= 8;
440 /* This will be ignored if AddrSurfInfoIn.pTileInfo is NULL. */
441 AddrTileInfoIn
.tileSplitBytes
= surf
->stencil_tile_split
;
443 for (level
= 0; level
<= surf
->last_level
; level
++) {
444 r
= compute_level(ws
, surf
, true, level
, type
, compressed
,
445 &AddrSurfInfoIn
, &AddrSurfInfoOut
, &AddrDccIn
, &AddrDccOut
);
450 surf
->stencil_offset
= surf
->stencil_level
[0].offset
;
452 /* For 2D modes only. */
453 if (AddrSurfInfoOut
.tileMode
>= ADDR_TM_2D_TILED_THIN1
) {
454 surf
->stencil_tile_split
=
455 AddrSurfInfoOut
.pTileInfo
->tileSplitBytes
;
464 static int amdgpu_surface_best(struct radeon_winsys
*rws
,
465 struct radeon_surf
*surf
)
470 void amdgpu_surface_init_functions(struct amdgpu_winsys
*ws
)
472 ws
->base
.surface_init
= amdgpu_surface_init
;
473 ws
->base
.surface_best
= amdgpu_surface_best
;