2 * Copyright 2008 Ben Skeggs
4 * Permission is hereby granted, free of charge, to any person obtaining a
5 * copy of this software and associated documentation files (the "Software"),
6 * to deal in the Software without restriction, including without limitation
7 * the rights to use, copy, modify, merge, publish, distribute, sublicense,
8 * and/or sell copies of the Software, and to permit persons to whom the
9 * Software is furnished to do so, subject to the following conditions:
11 * The above copyright notice and this permission notice shall be included in
12 * all copies or substantial portions of the Software.
14 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
15 * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
16 * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL
17 * THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR
18 * OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE,
19 * ARISING FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR
20 * OTHER DEALINGS IN THE SOFTWARE.
23 #include "pipe/p_state.h"
24 #include "pipe/p_defines.h"
25 #include "util/u_inlines.h"
26 #include "util/u_format.h"
28 #include "nv50/nv50_context.h"
29 #include "nv50/nv50_resource.h"
/*
 * Pick a tile mode value for a level from its height (ny) and depth (nz).
 *
 * The value starts at 0x000; the ny thresholds select a height field in
 * bits 4..7 (0x010 .. 0x040) and the nz thresholds OR in a depth field in
 * bits 8..11 (0x100 .. 0x500), as annotated on the individual tests.
 * nx is accepted but is not referenced by any visible line.
 *
 * NOTE(review): the embedded listing numbers skip values (e.g. 36 -> 38,
 * 42 -> 47 -> 50), so some original lines are not visible in this chunk:
 * whatever joins the height tests, anything between listing lines 42 and 47,
 * and the statement guarded by `tile_mode > 0x020`. Confirm against the
 * full file before relying on this description.
 */
32 nv50_tex_choose_tile_dims_helper(unsigned nx
, unsigned ny
, unsigned nz
)
34 uint32_t tile_mode
= 0x000;
/* Height selection: larger ny picks a taller tile. */
36 if (ny
> 64) tile_mode
= 0x040; /* height 128 tiles */
38 if (ny
> 32) tile_mode
= 0x030; /* height 64 tiles */
40 if (ny
> 16) tile_mode
= 0x020; /* height 32 tiles */
42 if (ny
> 8) tile_mode
= 0x010; /* height 16 tiles */
47 if (tile_mode
> 0x020)
/* Depth selection: the deepest tile is only used with a height field below 0x020. */
50 if (nz
> 16 && tile_mode
< 0x020)
51 return tile_mode
| 0x500; /* depth 32 tiles */
52 if (nz
> 8) return tile_mode
| 0x400; /* depth 16 tiles */
53 if (nz
> 4) return tile_mode
| 0x300; /* depth 8 tiles */
54 if (nz
> 2) return tile_mode
| 0x200; /* depth 4 tiles */
/* Fallback when nz is at most 2: depth field 0x100. */
56 return tile_mode
| 0x100;
/*
 * Wrapper around nv50_tex_choose_tile_dims_helper(): forwards nx and nz
 * unchanged and passes ny multiplied by 2.
 *
 * NOTE(review): the reason for doubling ny is not stated in the visible
 * code — confirm against the hardware tile-mode encoding.
 */
60 nv50_tex_choose_tile_dims(unsigned nx
, unsigned ny
, unsigned nz
)
62 return nv50_tex_choose_tile_dims_helper(nx
, ny
* 2, nz
);
/*
 * Compute a tile_flags value for a miptree from its resource format, bind
 * flags and multisample shifts. nv50_miptree_create() stores this function's
 * result in bo_config.nv50.memtype.
 *
 * Visible behaviour:
 *  - ms is the sum of mt->ms_x and mt->ms_y and is added to the base value
 *    of each depth/stencil format case.
 *  - Other formats are dispatched on util_format_get_blocksizebits(); only
 *    `case 2` and `case 3` of each inner switch are visible, yielding
 *    0xfc/0xfd in one switch and 0xf8/0xf9 in the one that follows the
 *    PIPE_BIND_SCANOUT test.
 *  - The linear-flag and cursor-bind tests exist, but their outcomes are
 *    not visible.
 *  - `tile_flags &= ~0x180` clears bits 7 and 8; the condition guarding it
 *    is not visible.
 *
 * NOTE(review): the declaration of tile_flags, the `break`/`return`
 * statements, the remaining switch cases and every use of `compressed` are
 * missing from this chunk (the embedded listing numbers skip). Confirm
 * against the full file.
 */
66 nv50_mt_choose_storage_type(struct nv50_miptree
*mt
, boolean compressed
)
68 const unsigned ms
= mt
->ms_x
+ mt
->ms_y
;
72 if (unlikely(mt
->base
.base
.flags
& NOUVEAU_RESOURCE_FLAG_LINEAR
))
74 if (unlikely(mt
->base
.base
.bind
& PIPE_BIND_CURSOR
))
/* Depth/stencil formats: fixed base value plus the multisample term. */
77 switch (mt
->base
.base
.format
) {
78 case PIPE_FORMAT_Z16_UNORM
:
79 tile_flags
= 0x6c + ms
;
81 case PIPE_FORMAT_S8_UINT_Z24_UNORM
:
82 tile_flags
= 0x18 + ms
;
84 case PIPE_FORMAT_Z24X8_UNORM
:
85 case PIPE_FORMAT_Z24_UNORM_S8_UINT
:
86 tile_flags
= 0x128 + ms
;
88 case PIPE_FORMAT_Z32_FLOAT
:
89 tile_flags
= 0x40 + ms
;
91 case PIPE_FORMAT_Z32_FLOAT_S8X24_UINT
:
92 tile_flags
= 0x60 + ms
;
/* Remaining formats: choose by block size in bits (only cases 2 and 3 visible). */
95 switch (util_format_get_blocksizebits(mt
->base
.base
.format
)) {
102 case 2: tile_flags
= 0xfc; break;
103 case 3: tile_flags
= 0xfd; break;
110 if (mt
->base
.base
.bind
& PIPE_BIND_SCANOUT
) {
115 case 2: tile_flags
= 0xf8; break;
116 case 3: tile_flags
= 0xf9; break;
130 if (mt
->base
.base
.bind
& PIPE_BIND_CURSOR
)
135 tile_flags
&= ~0x180;
/*
 * Resource destroy hook for nv50 miptrees (installed as the
 * resource_destroy entry of nv50_miptree_vtbl).
 *
 * Visible steps: drop the miptree's buffer-object reference, drop both fence
 * references (fence and fence_wr), then update the driver statistics by
 * subtracting one texture object and mt->total_size bytes.
 *
 * NOTE(review): the embedded listing numbers skip after 152, so any final
 * release of the miptree structure itself is not visible here.
 */
141 nv50_miptree_destroy(struct pipe_screen
*pscreen
, struct pipe_resource
*pt
)
143 struct nv50_miptree
*mt
= nv50_miptree(pt
);
/* Passing NULL as the new reference releases the currently held one. */
145 nouveau_bo_ref(NULL
, &mt
->base
.bo
);
147 nouveau_fence_ref(NULL
, &mt
->base
.fence
);
148 nouveau_fence_ref(NULL
, &mt
->base
.fence_wr
);
/* Statistics: one object fewer, total_size bytes fewer. */
150 NOUVEAU_DRV_STAT(nouveau_screen(pscreen
), tex_obj_current_count
, -1);
151 NOUVEAU_DRV_STAT(nouveau_screen(pscreen
), tex_obj_current_bytes
,
152 -(uint64_t)mt
->total_size
);
/*
 * get_handle hook for nv50 miptrees (installed as the get_handle entry of
 * nv50_miptree_vtbl).
 *
 * Checks that the miptree and its buffer object exist, takes the pitch of
 * level 0 as the stride, and returns the result of
 * nouveau_screen_bo_get_handle().
 *
 * NOTE(review): the statement executed when the NULL check fails, the
 * declaration of `stride`, and the remaining arguments of the final call are
 * not visible in this chunk.
 */
158 nv50_miptree_get_handle(struct pipe_screen
*pscreen
,
159 struct pipe_resource
*pt
,
160 struct winsys_handle
*whandle
)
162 struct nv50_miptree
*mt
= nv50_miptree(pt
);
/* Guard: no miptree or no backing buffer object. */
165 if (!mt
|| !mt
->base
.bo
)
168 stride
= mt
->level
[0].pitch
;
170 return nouveau_screen_bo_get_handle(pscreen
,
/*
 * Resource vtable for nv50 miptrees. nv50_miptree_create() and
 * nv50_miptree_from_handle() both store its address in mt->base.vtbl.
 * Entries are positional; the trailing comment on each line names the slot
 * it fills. The flush-region and inline-write slots use the u_default_*
 * helpers.
 */
176 const struct u_resource_vtbl nv50_miptree_vtbl
=
178 nv50_miptree_get_handle
, /* get_handle */
179 nv50_miptree_destroy
, /* resource_destroy */
180 nv50_miptree_transfer_map
, /* transfer_map */
181 u_default_transfer_flush_region
, /* transfer_flush_region */
182 nv50_miptree_transfer_unmap
, /* transfer_unmap */
183 u_default_transfer_inline_write
/* transfer_inline_write */
/*
 * Set mt->ms_mode from the resource's nr_samples.
 *
 * The switch assigns one of the NV50_3D_MULTISAMPLE_MODE_MS8/MS4/MS2/MS1
 * constants and logs "invalid nr_samples" through NOUVEAU_ERR for a value it
 * does not handle. It returns a boolean, which nv50_miptree_create() tests
 * with `!`.
 *
 * NOTE(review): the `case` labels, any other assignments made per case and
 * the return statements are not visible in this chunk (the embedded listing
 * numbers skip between the assignments).
 */
186 static INLINE boolean
187 nv50_miptree_init_ms_mode(struct nv50_miptree
*mt
)
189 switch (mt
->base
.base
.nr_samples
) {
191 mt
->ms_mode
= NV50_3D_MULTISAMPLE_MODE_MS8
;
196 mt
->ms_mode
= NV50_3D_MULTISAMPLE_MODE_MS4
;
201 mt
->ms_mode
= NV50_3D_MULTISAMPLE_MODE_MS2
;
206 mt
->ms_mode
= NV50_3D_MULTISAMPLE_MODE_MS1
;
/* Unhandled sample count: report it. */
209 NOUVEAU_ERR("invalid nr_samples: %u\n", mt
->base
.base
.nr_samples
);
/*
 * Compute the layout of a linear (untiled) miptree.
 *
 * Visible steps:
 *  - Three tests look at the resource: depth/stencil format; more than one
 *    mip level, depth slice or array layer; and non-zero multisample shifts.
 *    Their outcomes are not visible in this chunk.
 *  - The level-0 pitch is width0 * blocksize rounded up to pitch_align.
 *  - The height is rounded up to the next power of two before computing
 *    total_size = pitch * height (see the prefetch comment below).
 *
 * The return value is tested with `!` by nv50_miptree_create().
 *
 * NOTE(review): the statements guarded by the three tests, any condition on
 * the power-of-two rounding, and the return statements are not visible here.
 */
216 nv50_miptree_init_layout_linear(struct nv50_miptree
*mt
, unsigned pitch_align
)
218 struct pipe_resource
*pt
= &mt
->base
.base
;
219 const unsigned blocksize
= util_format_get_blocksize(pt
->format
);
220 unsigned h
= pt
->height0
;
222 if (util_format_is_depth_or_stencil(pt
->format
))
225 if ((pt
->last_level
> 0) || (pt
->depth0
> 1) || (pt
->array_size
> 1))
227 if (mt
->ms_x
| mt
->ms_y
)
/* Row pitch in bytes, aligned as requested by the caller. */
230 mt
->level
[0].pitch
= align(pt
->width0
* blocksize
, pitch_align
);
232 /* Account for very generous prefetch (allocate size as if tiled). */
234 h
= util_next_power_of_two(h
);
236 mt
->total_size
= mt
->level
[0].pitch
* h
;
/*
 * Compute the layout of a video miptree (called by nv50_miptree_create()
 * when NV50_RESOURCE_FLAG_VIDEO is set).
 *
 * Preconditions, enforced with assert(): a single mip level, no
 * multisampling (ms_x and ms_y both 0), and a non-compressed format.
 *
 * Layout:
 *  - level 0 uses the fixed tile mode 0x20;
 *  - pitch is width0 * blocksize rounded up to 64;
 *  - total_size is height0 rounded up to 16, times the pitch, times depth0
 *    for 3D textures (otherwise times 1);
 *  - for arrays, layer_stride is total_size rounded up to
 *    NV50_TILE_SIZE(0x20) and total_size becomes layer_stride * array_size.
 */
242 nv50_miptree_init_layout_video(struct nv50_miptree
*mt
)
244 const struct pipe_resource
*pt
= &mt
->base
.base
;
245 const unsigned blocksize
= util_format_get_blocksize(pt
->format
);
247 assert(pt
->last_level
== 0);
248 assert(mt
->ms_x
== 0 && mt
->ms_y
== 0);
249 assert(!util_format_is_compressed(pt
->format
));
251 mt
->layout_3d
= pt
->target
== PIPE_TEXTURE_3D
;
253 mt
->level
[0].tile_mode
= 0x20;
254 mt
->level
[0].pitch
= align(pt
->width0
* blocksize
, 64);
255 mt
->total_size
= align(pt
->height0
, 16) * mt
->level
[0].pitch
* (mt
->layout_3d
? pt
->depth0
: 1);
/* Array textures: replicate the single layer at a tile-aligned stride. */
257 if (pt
->array_size
> 1) {
258 mt
->layer_stride
= align(mt
->total_size
, NV50_TILE_SIZE(0x20));
259 mt
->total_size
= mt
->layer_stride
* pt
->array_size
;
/*
 * Compute the layout of a tiled miptree: per-level offset, tile mode and
 * pitch, plus the total size and (for arrays) the layer stride.
 *
 * Visible steps:
 *  - w and h start as width0 / height0 shifted left by the multisample
 *    shifts ms_x / ms_y; d is depth0 for 3D textures and 1 otherwise.
 *  - For each level 0..last_level: the level offset is the running
 *    total_size; the tile mode comes from nv50_tex_choose_tile_dims() on the
 *    block counts (nbx, nby) and d; pitch is nbx * blocksize aligned to the
 *    tile's x size; total_size grows by
 *    pitch * align(nby, tile y size) * align(d, tile z size).
 *  - For arrays, layer_stride is total_size aligned to
 *    NV50_TILE_SIZE(level[0].tile_mode) and total_size becomes
 *    layer_stride * array_size.
 *
 * NOTE(review): the declarations of w, h, d and l, and whatever updates
 * w, h and d between levels, are not visible in this chunk (the embedded
 * listing numbers skip 297-302). The block comment about 3D textures is also
 * missing its closing line here.
 */
264 nv50_miptree_init_layout_tiled(struct nv50_miptree
*mt
)
266 struct pipe_resource
*pt
= &mt
->base
.base
;
268 const unsigned blocksize
= util_format_get_blocksize(pt
->format
);
270 mt
->layout_3d
= pt
->target
== PIPE_TEXTURE_3D
;
272 w
= pt
->width0
<< mt
->ms_x
;
273 h
= pt
->height0
<< mt
->ms_y
;
275 /* For 3D textures, a mipmap is spanned by all the layers, for array
276 * textures and cube maps, each layer contains its own mipmaps.
278 d
= mt
->layout_3d
? pt
->depth0
: 1;
280 for (l
= 0; l
<= pt
->last_level
; ++l
) {
281 struct nv50_miptree_level
*lvl
= &mt
->level
[l
];
282 unsigned tsx
, tsy
, tsz
;
283 unsigned nbx
= util_format_get_nblocksx(pt
->format
, w
);
284 unsigned nby
= util_format_get_nblocksy(pt
->format
, h
);
286 lvl
->offset
= mt
->total_size
;
288 lvl
->tile_mode
= nv50_tex_choose_tile_dims(nbx
, nby
, d
);
290 tsx
= NV50_TILE_SIZE_X(lvl
->tile_mode
); /* x is tile row pitch in bytes */
291 tsy
= NV50_TILE_SIZE_Y(lvl
->tile_mode
);
292 tsz
= NV50_TILE_SIZE_Z(lvl
->tile_mode
);
294 lvl
->pitch
= align(nbx
* blocksize
, tsx
);
296 mt
->total_size
+= lvl
->pitch
* align(nby
, tsy
) * align(d
, tsz
);
303 if (pt
->array_size
> 1) {
304 mt
->layer_stride
= align(mt
->total_size
,
305 NV50_TILE_SIZE(mt
->level
[0].tile_mode
));
306 mt
->total_size
= mt
->layer_stride
* pt
->array_size
;
/*
 * Create a new nv50 miptree resource from a template.
 *
 * Visible steps:
 *  1. Allocate a zeroed nv50_miptree and install nv50_miptree_vtbl, a
 *     reference count of 1 and the owning screen.
 *  2. Translate PIPE_BIND_LINEAR into NOUVEAU_RESOURCE_FLAG_LINEAR.
 *  3. Choose the memory type with nv50_mt_choose_storage_type() and set up
 *     the multisample mode.
 *  4. Compute the layout: video layout when NV50_RESOURCE_FLAG_VIDEO is
 *     set, tiled layout when the memory type is non-zero, otherwise linear
 *     layout with 64-byte pitch alignment.
 *  5. Allocate the buffer object in VRAM with nouveau_bo_new(), adding
 *     NOUVEAU_BO_CONTIG for cursor or display-target resources, and record
 *     the domain and address on the miptree.
 *
 * NOTE(review): several original lines are not visible in this chunk (the
 * embedded listing numbers skip): the copy of *templ into the resource, the
 * NULL check after CALLOC_STRUCT, every failure path, the declarations of
 * ret and bo_flags, the tail of the nouveau_bo_new() call and the final
 * return. Confirm against the full file.
 */
310 struct pipe_resource
*
311 nv50_miptree_create(struct pipe_screen
*pscreen
,
312 const struct pipe_resource
*templ
)
314 struct nouveau_device
*dev
= nouveau_screen(pscreen
)->device
;
315 struct nv50_miptree
*mt
= CALLOC_STRUCT(nv50_miptree
);
316 struct pipe_resource
*pt
= &mt
->base
.base
;
318 union nouveau_bo_config bo_config
;
324 mt
->base
.vtbl
= &nv50_miptree_vtbl
;
326 pipe_reference_init(&pt
->reference
, 1);
327 pt
->screen
= pscreen
;
329 if (pt
->bind
& PIPE_BIND_LINEAR
)
330 pt
->flags
|= NOUVEAU_RESOURCE_FLAG_LINEAR
;
332 bo_config
.nv50
.memtype
= nv50_mt_choose_storage_type(mt
, TRUE
);
334 if (!nv50_miptree_init_ms_mode(mt
)) {
/* Layout selection: video, tiled (non-zero memtype) or linear. */
339 if (unlikely(pt
->flags
& NV50_RESOURCE_FLAG_VIDEO
)) {
340 nv50_miptree_init_layout_video(mt
);
341 if (pt
->flags
& NV50_RESOURCE_FLAG_NOALLOC
) {
342 /* BO allocation done by client */
346 if (bo_config
.nv50
.memtype
!= 0) {
347 nv50_miptree_init_layout_tiled(mt
);
349 if (!nv50_miptree_init_layout_linear(mt
, 64)) {
353 bo_config
.nv50
.tile_mode
= mt
->level
[0].tile_mode
;
/* Buffer object placement flags. */
355 bo_flags
= NOUVEAU_BO_VRAM
| NOUVEAU_BO_NOSNOOP
;
356 if (mt
->base
.base
.bind
& (PIPE_BIND_CURSOR
| PIPE_BIND_DISPLAY_TARGET
))
357 bo_flags
|= NOUVEAU_BO_CONTIG
;
359 ret
= nouveau_bo_new(dev
, bo_flags
, 4096, mt
->total_size
, &bo_config
,
365 mt
->base
.domain
= NOUVEAU_BO_VRAM
;
366 mt
->base
.address
= mt
->base
.bo
->offset
;
/*
 * Wrap an existing buffer object, identified by a winsys handle, in a new
 * nv50 miptree.
 *
 * Only PIPE_TEXTURE_2D / PIPE_TEXTURE_RECT templates with a single mip
 * level, depth0 == 1 and at most one array layer pass the initial test.
 * The buffer object and stride come from nouveau_screen_bo_from_handle().
 * The miptree then copies *templ, installs nv50_miptree_vtbl, a reference
 * count of 1 and the screen, and describes level 0 with the imported stride,
 * offset 0 and the buffer object's own nv50 tile mode. Returns the embedded
 * pipe_resource.
 *
 * NOTE(review): the declaration of `stride`, the statements executed when
 * the template test or the allocation/import fails, and any NULL check on
 * CALLOC_STRUCT are not visible in this chunk.
 */
371 struct pipe_resource
*
372 nv50_miptree_from_handle(struct pipe_screen
*pscreen
,
373 const struct pipe_resource
*templ
,
374 struct winsys_handle
*whandle
)
376 struct nv50_miptree
*mt
;
379 /* only supports 2D, non-mipmapped textures for the moment */
380 if ((templ
->target
!= PIPE_TEXTURE_2D
&&
381 templ
->target
!= PIPE_TEXTURE_RECT
) ||
382 templ
->last_level
!= 0 ||
383 templ
->depth0
!= 1 ||
384 templ
->array_size
> 1)
387 mt
= CALLOC_STRUCT(nv50_miptree
);
391 mt
->base
.bo
= nouveau_screen_bo_from_handle(pscreen
, whandle
, &stride
);
392 if (mt
->base
.bo
== NULL
) {
396 mt
->base
.domain
= NOUVEAU_BO_VRAM
;
397 mt
->base
.address
= mt
->base
.bo
->offset
;
/* Copy the template first, then overwrite the per-object fields. */
399 mt
->base
.base
= *templ
;
400 mt
->base
.vtbl
= &nv50_miptree_vtbl
;
401 pipe_reference_init(&mt
->base
.base
.reference
, 1);
402 mt
->base
.base
.screen
= pscreen
;
403 mt
->level
[0].pitch
= stride
;
404 mt
->level
[0].offset
= 0;
405 mt
->level
[0].tile_mode
= mt
->base
.bo
->config
.nv50
.tile_mode
;
407 /* no need to adjust bo reference count */
408 return &mt
->base
.base
;
/*
 * Byte offset of depth slice z, relative to the start of mip level l.
 *
 * tds and ths are the z and y tile shifts of the level's tile mode. A 3D
 * tile holds (1 << tds) slices: the low tds bits of z index a slice inside
 * its tile (stride_2d each) and the remaining high bits index whole 3D
 * tiles (stride_3d each).
 */
412 /* Offset of zslice @z from start of level @l. */
414 nv50_mt_zslice_offset(const struct nv50_miptree
*mt
, unsigned l
, unsigned z
)
416 const struct pipe_resource
*pt
= &mt
->base
.base
;
418 unsigned tds
= NV50_TILE_SHIFT_Z(mt
->level
[l
].tile_mode
);
419 unsigned ths
= NV50_TILE_SHIFT_Y(mt
->level
[l
].tile_mode
);
/* Height of level l in format blocks. */
421 unsigned nby
= util_format_get_nblocksy(pt
->format
,
422 u_minify(pt
->height0
, l
));
424 /* to next 2D tile slice within a 3D tile */
425 unsigned stride_2d
= NV50_TILE_SIZE_2D(mt
->level
[l
].tile_mode
);
427 /* to slice in the next (in z direction) 3D tile */
428 unsigned stride_3d
= (align(nby
, (1 << ths
)) * mt
->level
[l
].pitch
) << tds
;
430 return (z
& ((1 << tds
) - 1)) * stride_2d
+ (z
>> tds
) * stride_3d
;
433 /* Surface functions.
/*
 * Allocate an nv50_surface describing one mip level (and layer range) of a
 * miptree, as requested by the surface template.
 *
 * The new surface takes a reference on the miptree's resource and copies
 * format, writable flag, level and first/last layer from templ. Width and
 * height are the miptree's level-0 dimensions minified to the requested
 * level; depth is the number of layers in the range; offset is the start of
 * the requested level. The pipe_surface width/height keep the unshifted
 * values, while the nv50_surface width/height are afterwards shifted left by
 * the miptree's multisample shifts ms_x / ms_y.
 *
 * NOTE(review): the NULL check after CALLOC_STRUCT, the assignment of `ps`
 * and the return statement are not visible in this chunk.
 */
436 struct nv50_surface
*
437 nv50_surface_from_miptree(struct nv50_miptree
*mt
,
438 const struct pipe_surface
*templ
)
440 struct pipe_surface
*ps
;
441 struct nv50_surface
*ns
= CALLOC_STRUCT(nv50_surface
);
446 pipe_reference_init(&ps
->reference
, 1);
447 pipe_resource_reference(&ps
->texture
, &mt
->base
.base
);
449 ps
->format
= templ
->format
;
450 ps
->writable
= templ
->writable
;
451 ps
->u
.tex
.level
= templ
->u
.tex
.level
;
452 ps
->u
.tex
.first_layer
= templ
->u
.tex
.first_layer
;
453 ps
->u
.tex
.last_layer
= templ
->u
.tex
.last_layer
;
455 ns
->width
= u_minify(mt
->base
.base
.width0
, ps
->u
.tex
.level
);
456 ns
->height
= u_minify(mt
->base
.base
.height0
, ps
->u
.tex
.level
);
457 ns
->depth
= ps
->u
.tex
.last_layer
- ps
->u
.tex
.first_layer
+ 1;
458 ns
->offset
= mt
->level
[templ
->u
.tex
.level
].offset
;
460 /* comment says these are going to be removed, but they're used by the st */
461 ps
->width
= ns
->width
;
462 ps
->height
= ns
->height
;
/* The nv50 surface dimensions include the multisample scaling. */
464 ns
->width
<<= mt
->ms_x
;
465 ns
->height
<<= mt
->ms_y
;
470 struct pipe_surface
*
471 nv50_miptree_surface_new(struct pipe_context
*pipe
,
472 struct pipe_resource
*pt
,
473 const struct pipe_surface
*templ
)
475 struct nv50_miptree
*mt
= nv50_miptree(pt
);
476 struct nv50_surface
*ns
= nv50_surface_from_miptree(mt
, templ
);
479 ns
->base
.context
= pipe
;
481 if (ns
->base
.u
.tex
.first_layer
) {
482 const unsigned l
= ns
->base
.u
.tex
.level
;
483 const unsigned z
= ns
->base
.u
.tex
.first_layer
;
486 ns
->offset
+= nv50_mt_zslice_offset(mt
, l
, z
);
488 /* TODO: switch to depth 1 tiles; but actually this shouldn't happen */
490 (z
& (NV50_TILE_SIZE_Z(mt
->level
[l
].tile_mode
) - 1)))
491 NOUVEAU_ERR("Creating unsupported 3D surface !\n");
493 ns
->offset
+= mt
->layer_stride
* z
;