/*
 * Copyright 2008 Corbin Simpson <MostAwesomeDude@gmail.com>
 * Copyright 2010 Marek Olšák <maraeo@gmail.com>
 *
 * Permission is hereby granted, free of charge, to any person obtaining a
 * copy of this software and associated documentation files (the "Software"),
 * to deal in the Software without restriction, including without limitation
 * on the rights to use, copy, modify, merge, publish, distribute, sub
 * license, and/or sell copies of the Software, and to permit persons to whom
 * the Software is furnished to do so, subject to the following conditions:
 *
 * The above copyright notice and this permission notice (including the next
 * paragraph) shall be included in all copies or substantial portions of the
 * Software.
 *
 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
 * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
 * FITNESS FOR A PARTICULAR PURPOSE AND NON-INFRINGEMENT. IN NO EVENT SHALL
 * THE AUTHOR(S) AND/OR THEIR SUPPLIERS BE LIABLE FOR ANY CLAIM,
 * DAMAGES OR OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR
 * OTHERWISE, ARISING FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE
 * USE OR OTHER DEALINGS IN THE SOFTWARE. */
24 #include "r300_texture_desc.h"
26 #include "r300_context.h"
27 #include "r300_winsys.h"
29 #include "util/u_format.h"
31 /* Returns the number of pixels that the texture should be aligned to
32 * in the given dimension. */
33 unsigned r300_get_pixel_alignment(enum pipe_format format
,
35 enum r300_buffer_tiling microtile
,
36 enum r300_buffer_tiling macrotile
,
37 enum r300_dim dim
, boolean is_rs690
)
39 static const unsigned table
[2][5][3][2] =
42 /* Macro: linear linear linear
43 Micro: linear tiled square-tiled */
44 {{ 32, 1}, { 8, 4}, { 0, 0}}, /* 8 bits per pixel */
45 {{ 16, 1}, { 8, 2}, { 4, 4}}, /* 16 bits per pixel */
46 {{ 8, 1}, { 4, 2}, { 0, 0}}, /* 32 bits per pixel */
47 {{ 4, 1}, { 2, 2}, { 0, 0}}, /* 64 bits per pixel */
48 {{ 2, 1}, { 0, 0}, { 0, 0}} /* 128 bits per pixel */
51 /* Macro: tiled tiled tiled
52 Micro: linear tiled square-tiled */
53 {{256, 8}, {64, 32}, { 0, 0}}, /* 8 bits per pixel */
54 {{128, 8}, {64, 16}, {32, 32}}, /* 16 bits per pixel */
55 {{ 64, 8}, {32, 16}, { 0, 0}}, /* 32 bits per pixel */
56 {{ 32, 8}, {16, 16}, { 0, 0}}, /* 64 bits per pixel */
57 {{ 16, 8}, { 0, 0}, { 0, 0}} /* 128 bits per pixel */
61 static const unsigned aa_block
[2] = {4, 8};
63 unsigned pixsize
= util_format_get_blocksize(format
);
65 assert(macrotile
<= R300_BUFFER_TILED
);
66 assert(microtile
<= R300_BUFFER_SQUARETILED
);
67 assert(pixsize
<= 16);
68 assert(dim
<= DIM_HEIGHT
);
70 if (num_samples
> 1) {
71 /* Multisampled textures have their own alignment scheme. */
76 /* Standard alignment. */
77 tile
= table
[macrotile
][util_logbase2(pixsize
)][microtile
][dim
];
78 if (macrotile
== 0 && is_rs690
&& dim
== DIM_WIDTH
) {
81 h_tile
= table
[macrotile
][util_logbase2(pixsize
)][microtile
][DIM_HEIGHT
];
82 align
= 64 / (pixsize
* h_tile
);
92 /* Return true if macrotiling should be enabled on the miplevel. */
93 static boolean
r300_texture_macro_switch(struct r300_resource
*tex
,
98 unsigned tile
, texdim
;
100 tile
= r300_get_pixel_alignment(tex
->b
.b
.b
.format
, tex
->b
.b
.b
.nr_samples
,
101 tex
->tex
.microtile
, R300_BUFFER_TILED
, dim
, 0);
102 if (dim
== DIM_WIDTH
) {
103 texdim
= u_minify(tex
->tex
.width0
, level
);
105 texdim
= u_minify(tex
->tex
.height0
, level
);
108 /* See TX_FILTER1_n.MACRO_SWITCH. */
110 return texdim
>= tile
;
112 return texdim
> tile
;
117 * Return the stride, in bytes, of the texture image of the given texture
118 * at the given level.
120 static unsigned r300_texture_get_stride(struct r300_screen
*screen
,
121 struct r300_resource
*tex
,
124 unsigned tile_width
, width
, stride
;
125 boolean is_rs690
= (screen
->caps
.family
== CHIP_FAMILY_RS600
||
126 screen
->caps
.family
== CHIP_FAMILY_RS690
||
127 screen
->caps
.family
== CHIP_FAMILY_RS740
);
129 if (tex
->tex
.stride_in_bytes_override
)
130 return tex
->tex
.stride_in_bytes_override
;
132 /* Check the level. */
133 if (level
> tex
->b
.b
.b
.last_level
) {
134 SCREEN_DBG(screen
, DBG_TEX
, "%s: level (%u) > last_level (%u)\n",
135 __FUNCTION__
, level
, tex
->b
.b
.b
.last_level
);
139 width
= u_minify(tex
->tex
.width0
, level
);
141 if (util_format_is_plain(tex
->b
.b
.b
.format
)) {
142 tile_width
= r300_get_pixel_alignment(tex
->b
.b
.b
.format
,
143 tex
->b
.b
.b
.nr_samples
,
145 tex
->tex
.macrotile
[level
],
146 DIM_WIDTH
, is_rs690
);
147 width
= align(width
, tile_width
);
149 stride
= util_format_get_stride(tex
->b
.b
.b
.format
, width
);
150 /* The alignment to 32 bytes is sort of implied by the layout... */
153 return align(util_format_get_stride(tex
->b
.b
.b
.format
, width
), is_rs690
? 64 : 32);
157 static unsigned r300_texture_get_nblocksy(struct r300_resource
*tex
,
159 boolean
*out_aligned_for_cbzb
)
161 unsigned height
, tile_height
;
163 height
= u_minify(tex
->tex
.height0
, level
);
165 if (util_format_is_plain(tex
->b
.b
.b
.format
)) {
166 tile_height
= r300_get_pixel_alignment(tex
->b
.b
.b
.format
,
167 tex
->b
.b
.b
.nr_samples
,
169 tex
->tex
.macrotile
[level
],
171 height
= align(height
, tile_height
);
173 /* This is needed for the kernel checker, unfortunately. */
174 if ((tex
->b
.b
.b
.target
!= PIPE_TEXTURE_1D
&&
175 tex
->b
.b
.b
.target
!= PIPE_TEXTURE_2D
&&
176 tex
->b
.b
.b
.target
!= PIPE_TEXTURE_RECT
) ||
177 tex
->b
.b
.b
.last_level
!= 0) {
178 height
= util_next_power_of_two(height
);
181 /* See if the CBZB clear can be used on the buffer,
182 * taking the texture size into account. */
183 if (out_aligned_for_cbzb
) {
184 if (tex
->tex
.macrotile
[level
]) {
185 /* When clearing, the layer (width*height) is horizontally split
186 * into two, and the upper and lower halves are cleared by the CB
187 * and ZB units, respectively. Therefore, the number of macrotiles
188 * in the Y direction must be even. */
190 /* Align the height so that there is an even number of macrotiles.
191 * Do so for 3 or more macrotiles in the Y direction. */
192 if (level
== 0 && tex
->b
.b
.b
.last_level
== 0 &&
193 (tex
->b
.b
.b
.target
== PIPE_TEXTURE_1D
||
194 tex
->b
.b
.b
.target
== PIPE_TEXTURE_2D
||
195 tex
->b
.b
.b
.target
== PIPE_TEXTURE_RECT
) &&
196 height
>= tile_height
* 3) {
197 height
= align(height
, tile_height
* 2);
200 *out_aligned_for_cbzb
= height
% (tile_height
* 2) == 0;
202 *out_aligned_for_cbzb
= FALSE
;
207 return util_format_get_nblocksy(tex
->b
.b
.b
.format
, height
);
210 static void r300_texture_3d_fix_mipmapping(struct r300_screen
*screen
,
211 struct r300_resource
*tex
)
213 /* The kernels <= 2.6.34-rc4 compute the size of mipmapped 3D textures
214 * incorrectly. This is a workaround to prevent CS from being rejected. */
218 if (!screen
->rws
->get_value(screen
->rws
, R300_VID_DRM_2_3_0
) &&
219 tex
->b
.b
.b
.target
== PIPE_TEXTURE_3D
&&
220 tex
->b
.b
.b
.last_level
> 0) {
223 for (i
= 0; i
<= tex
->b
.b
.b
.last_level
; i
++) {
224 size
+= tex
->tex
.stride_in_bytes
[i
] *
225 r300_texture_get_nblocksy(tex
, i
, FALSE
);
228 size
*= tex
->tex
.depth0
;
229 tex
->tex
.size_in_bytes
= size
;
233 /* Get a width in pixels from a stride in bytes. */
234 static unsigned stride_to_width(enum pipe_format format
,
235 unsigned stride_in_bytes
)
237 return (stride_in_bytes
/ util_format_get_blocksize(format
)) *
238 util_format_get_blockwidth(format
);
241 static void r300_setup_miptree(struct r300_screen
*screen
,
242 struct r300_resource
*tex
,
243 boolean align_for_cbzb
)
245 struct pipe_resource
*base
= &tex
->b
.b
.b
;
246 unsigned stride
, size
, layer_size
, nblocksy
, i
;
247 boolean rv350_mode
= screen
->caps
.family
>= CHIP_FAMILY_R350
;
248 boolean aligned_for_cbzb
;
250 tex
->tex
.size_in_bytes
= 0;
252 SCREEN_DBG(screen
, DBG_TEXALLOC
,
253 "r300: Making miptree for texture, format %s\n",
254 util_format_short_name(base
->format
));
256 for (i
= 0; i
<= base
->last_level
; i
++) {
257 /* Let's see if this miplevel can be macrotiled. */
258 tex
->tex
.macrotile
[i
] =
259 (tex
->tex
.macrotile
[0] == R300_BUFFER_TILED
&&
260 r300_texture_macro_switch(tex
, i
, rv350_mode
, DIM_WIDTH
) &&
261 r300_texture_macro_switch(tex
, i
, rv350_mode
, DIM_HEIGHT
)) ?
262 R300_BUFFER_TILED
: R300_BUFFER_LINEAR
;
264 stride
= r300_texture_get_stride(screen
, tex
, i
);
266 /* Compute the number of blocks in Y, see if the CBZB clear can be
267 * used on the texture. */
268 aligned_for_cbzb
= FALSE
;
269 if (align_for_cbzb
&& tex
->tex
.cbzb_allowed
[i
])
270 nblocksy
= r300_texture_get_nblocksy(tex
, i
, &aligned_for_cbzb
);
272 nblocksy
= r300_texture_get_nblocksy(tex
, i
, NULL
);
274 layer_size
= stride
* nblocksy
;
276 if (base
->nr_samples
) {
277 layer_size
*= base
->nr_samples
;
280 if (base
->target
== PIPE_TEXTURE_CUBE
)
281 size
= layer_size
* 6;
283 size
= layer_size
* u_minify(tex
->tex
.depth0
, i
);
285 tex
->tex
.offset_in_bytes
[i
] = tex
->tex
.size_in_bytes
;
286 tex
->tex
.size_in_bytes
= tex
->tex
.offset_in_bytes
[i
] + size
;
287 tex
->tex
.layer_size_in_bytes
[i
] = layer_size
;
288 tex
->tex
.stride_in_bytes
[i
] = stride
;
289 tex
->tex
.stride_in_pixels
[i
] = stride_to_width(tex
->b
.b
.b
.format
, stride
);
290 tex
->tex
.cbzb_allowed
[i
] = tex
->tex
.cbzb_allowed
[i
] && aligned_for_cbzb
;
292 SCREEN_DBG(screen
, DBG_TEXALLOC
, "r300: Texture miptree: Level %d "
293 "(%dx%dx%d px, pitch %d bytes) %d bytes total, macrotiled %s\n",
294 i
, u_minify(tex
->tex
.width0
, i
), u_minify(tex
->tex
.height0
, i
),
295 u_minify(tex
->tex
.depth0
, i
), stride
, tex
->tex
.size_in_bytes
,
296 tex
->tex
.macrotile
[i
] ? "TRUE" : "FALSE");
300 static void r300_setup_flags(struct r300_resource
*tex
)
302 tex
->tex
.uses_stride_addressing
=
303 !util_is_power_of_two(tex
->b
.b
.b
.width0
) ||
304 (tex
->tex
.stride_in_bytes_override
&&
305 stride_to_width(tex
->b
.b
.b
.format
,
306 tex
->tex
.stride_in_bytes_override
) != tex
->b
.b
.b
.width0
);
309 tex
->tex
.uses_stride_addressing
||
310 !util_is_power_of_two(tex
->b
.b
.b
.height0
) ||
311 !util_is_power_of_two(tex
->b
.b
.b
.depth0
);
314 static void r300_setup_cbzb_flags(struct r300_screen
*rscreen
,
315 struct r300_resource
*tex
)
318 boolean first_level_valid
;
320 bpp
= util_format_get_blocksizebits(tex
->b
.b
.b
.format
);
322 /* 1) The texture must be point-sampled,
323 * 2) The depth must be 16 or 32 bits.
324 * 3) If the midpoint ZB offset is not aligned to 2048, it returns garbage
325 * with certain texture sizes. Macrotiling ensures the alignment. */
326 first_level_valid
= tex
->b
.b
.b
.nr_samples
<= 1 &&
327 (bpp
== 16 || bpp
== 32) &&
328 tex
->tex
.macrotile
[0];
330 if (SCREEN_DBG_ON(rscreen
, DBG_NO_CBZB
))
331 first_level_valid
= FALSE
;
333 for (i
= 0; i
<= tex
->b
.b
.b
.last_level
; i
++)
334 tex
->tex
.cbzb_allowed
[i
] = first_level_valid
&& tex
->tex
.macrotile
[i
];
/* Integer division of x by y, rounded up. y is evaluated twice, so it must
 * not have side effects; y must be non-zero. */
#define ALIGN_DIVUP(x, y) (((x) + (y) - 1) / (y))
339 static void r300_setup_zmask_flags(struct r300_screen
*screen
,
340 struct r300_resource
*tex
)
342 /* The tile size of 1 DWORD is:
344 * GPU Pipes 4x4 mode 8x8 mode
345 * ------------------------------------------
346 * R580 4P/1Z 32x32 64x64
347 * RV570 3P/1Z 48x16 96x32
348 * RV530 1P/2Z 32x16 64x32
351 static unsigned num_blocks_x_per_dw
[4] = {4, 8, 12, 8};
352 static unsigned num_blocks_y_per_dw
[4] = {4, 4, 4, 8};
354 if (util_format_is_depth_or_stencil(tex
->b
.b
.b
.format
) &&
355 util_format_get_blocksizebits(tex
->b
.b
.b
.format
) == 32 &&
356 tex
->tex
.microtile
) {
359 if (screen
->caps
.family
== CHIP_FAMILY_RV530
) {
360 pipes
= screen
->caps
.num_z_pipes
;
362 pipes
= screen
->caps
.num_frag_pipes
;
365 for (i
= 0; i
<= tex
->b
.b
.b
.last_level
; i
++) {
366 unsigned numdw
, compsize
;
368 /* The 8x8 compression mode needs macrotiling. */
369 compsize
= screen
->caps
.z_compress
== R300_ZCOMP_8X8
&&
370 tex
->tex
.macrotile
[i
] &&
371 tex
->b
.b
.b
.nr_samples
<= 1 ? 8 : 4;
373 /* Get the zbuffer size (with the aligned width and height). */
374 numdw
= align(tex
->tex
.stride_in_pixels
[i
],
375 num_blocks_x_per_dw
[pipes
-1] * compsize
) *
376 align(u_minify(tex
->b
.b
.b
.height0
, i
),
377 num_blocks_y_per_dw
[pipes
-1] * compsize
);
379 /* Convert pixels -> dwords. */
380 numdw
= ALIGN_DIVUP(numdw
, num_blocks_x_per_dw
[pipes
-1] * compsize
*
381 num_blocks_y_per_dw
[pipes
-1] * compsize
);
383 /* Check that we have enough ZMASK memory. */
384 if (numdw
<= screen
->caps
.zmask_ram
* pipes
) {
385 tex
->tex
.zmask_dwords
[i
] = numdw
;
386 tex
->tex
.zcomp8x8
[i
] = compsize
== 8;
388 tex
->tex
.zmask_dwords
[i
] = 0;
389 tex
->tex
.zcomp8x8
[i
] = FALSE
;
395 static void r300_setup_tiling(struct r300_screen
*screen
,
396 struct r300_resource
*tex
)
398 struct r300_winsys_screen
*rws
= screen
->rws
;
399 enum pipe_format format
= tex
->b
.b
.b
.format
;
400 boolean rv350_mode
= screen
->caps
.family
>= CHIP_FAMILY_R350
;
401 boolean is_zb
= util_format_is_depth_or_stencil(format
);
402 boolean dbg_no_tiling
= SCREEN_DBG_ON(screen
, DBG_NO_TILING
);
404 tex
->tex
.microtile
= R300_BUFFER_LINEAR
;
405 tex
->tex
.macrotile
[0] = R300_BUFFER_LINEAR
;
407 if (!util_format_is_plain(format
)) {
411 /* If height == 1, disable microtiling except for zbuffer. */
412 if (!is_zb
&& (tex
->b
.b
.b
.height0
== 1 || dbg_no_tiling
)) {
416 /* Set microtiling. */
417 switch (util_format_get_blocksize(format
)) {
421 tex
->tex
.microtile
= R300_BUFFER_TILED
;
425 if (rws
->get_value(rws
, R300_VID_DRM_2_1_0
)) {
426 tex
->tex
.microtile
= R300_BUFFER_SQUARETILED
;
435 /* Set macrotiling. */
436 if (r300_texture_macro_switch(tex
, 0, rv350_mode
, DIM_WIDTH
) &&
437 r300_texture_macro_switch(tex
, 0, rv350_mode
, DIM_HEIGHT
)) {
438 tex
->tex
.macrotile
[0] = R300_BUFFER_TILED
;
442 static void r300_tex_print_info(struct r300_resource
*tex
,
446 "r300: %s: Macro: %s, Micro: %s, Pitch: %i, Dim: %ix%ix%i, "
447 "LastLevel: %i, Size: %i, Format: %s\n",
449 tex
->tex
.macrotile
[0] ? "YES" : " NO",
450 tex
->tex
.microtile
? "YES" : " NO",
451 tex
->tex
.stride_in_pixels
[0],
452 tex
->b
.b
.b
.width0
, tex
->b
.b
.b
.height0
, tex
->b
.b
.b
.depth0
,
453 tex
->b
.b
.b
.last_level
, tex
->tex
.size_in_bytes
,
454 util_format_short_name(tex
->b
.b
.b
.format
));
457 boolean
r300_texture_desc_init(struct r300_screen
*rscreen
,
458 struct r300_resource
*tex
,
459 const struct pipe_resource
*base
)
461 tex
->b
.b
.b
.target
= base
->target
;
462 tex
->b
.b
.b
.format
= base
->format
;
463 tex
->b
.b
.b
.width0
= base
->width0
;
464 tex
->b
.b
.b
.height0
= base
->height0
;
465 tex
->b
.b
.b
.depth0
= base
->depth0
;
466 tex
->b
.b
.b
.array_size
= base
->array_size
;
467 tex
->b
.b
.b
.last_level
= base
->last_level
;
468 tex
->b
.b
.b
.nr_samples
= base
->nr_samples
;
469 tex
->tex
.width0
= base
->width0
;
470 tex
->tex
.height0
= base
->height0
;
471 tex
->tex
.depth0
= base
->depth0
;
473 r300_setup_flags(tex
);
475 /* Align a 3D NPOT texture to POT. */
476 if (base
->target
== PIPE_TEXTURE_3D
&& tex
->tex
.is_npot
) {
477 tex
->tex
.width0
= util_next_power_of_two(tex
->tex
.width0
);
478 tex
->tex
.height0
= util_next_power_of_two(tex
->tex
.height0
);
479 tex
->tex
.depth0
= util_next_power_of_two(tex
->tex
.depth0
);
483 if (tex
->tex
.microtile
== R300_BUFFER_SELECT_LAYOUT
) {
484 r300_setup_tiling(rscreen
, tex
);
487 r300_setup_cbzb_flags(rscreen
, tex
);
489 /* Setup the miptree description. */
490 r300_setup_miptree(rscreen
, tex
, TRUE
);
491 /* If the required buffer size is larger the given max size,
492 * try again without the alignment for the CBZB clear. */
493 if (tex
->buf_size
&& tex
->tex
.size_in_bytes
> tex
->buf_size
) {
494 r300_setup_miptree(rscreen
, tex
, FALSE
);
497 r300_texture_3d_fix_mipmapping(rscreen
, tex
);
498 r300_setup_zmask_flags(rscreen
, tex
);
501 /* Make sure the buffer we got is large enough. */
502 if (tex
->tex
.size_in_bytes
> tex
->buf_size
) {
503 fprintf(stderr
, "r300: texture_desc_init: The buffer is not "
504 "large enough. Got: %i, Need: %i, Info:\n",
505 tex
->buf_size
, tex
->tex
.size_in_bytes
);
506 r300_tex_print_info(tex
, "texture_desc_init");
510 tex
->tex
.buffer_size_in_bytes
= tex
->buf_size
;
512 tex
->tex
.buffer_size_in_bytes
= tex
->tex
.size_in_bytes
;
515 if (SCREEN_DBG_ON(rscreen
, DBG_TEX
))
516 r300_tex_print_info(tex
, "texture_desc_init");
521 unsigned r300_texture_get_offset(struct r300_resource
*tex
,
522 unsigned level
, unsigned layer
)
524 unsigned offset
= tex
->tex
.offset_in_bytes
[level
];
526 switch (tex
->b
.b
.b
.target
) {
527 case PIPE_TEXTURE_3D
:
528 case PIPE_TEXTURE_CUBE
:
529 return offset
+ layer
* tex
->tex
.layer_size_in_bytes
[level
];