2 * Copyright 2006 Tungsten Graphics, Inc., Cedar Park, Texas.
3 * Copyright © 2006 Intel Corporation
5 * Permission is hereby granted, free of charge, to any person obtaining
6 * a copy of this software and associated documentation files (the
7 * "Software"), to deal in the Software without restriction, including
8 * without limitation the rights to use, copy, modify, merge, publish,
9 * distribute, sublicense, and/or sell copies of the Software, and to
10 * permit persons to whom the Software is furnished to do so, subject to
11 * the following conditions:
13 * The above copyright notice and this permission notice (including the
14 * next paragraph) shall be included in all copies or substantial
15 * portions of the Software.
17 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND,
18 * EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF
19 * MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT.
20 * IN NO EVENT SHALL THE COPYRIGHT OWNER(S) AND/OR ITS SUPPLIERS BE
21 * LIABLE FOR ANY CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN AN ACTION
22 * OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN CONNECTION
23 * WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE SOFTWARE.
27 * \file brw_tex_layout.cpp
29 * Code to lay out images in a mipmap tree.
31 * \author Keith Whitwell <keith@tungstengraphics.com>
32 * \author Michel Dänzer <michel@tungstengraphics.com>
35 #include "intel_mipmap_tree.h"
36 #include "brw_context.h"
37 #include "main/macros.h"
39 #define FILE_DEBUG_FLAG DEBUG_MIPTREE
42 intel_horizontal_texture_alignment_unit(struct intel_context
*intel
,
46 * From the "Alignment Unit Size" section of various specs, namely:
47 * - Gen3 Spec: "Memory Data Formats" Volume, Section 1.20.1.4
48 * - i965 and G45 PRMs: Volume 1, Section 6.17.3.4.
49 * - Ironlake and Sandybridge PRMs: Volume 1, Part 1, Section 7.18.3.4
50 * - BSpec (for Ivybridge and slight variations in separate stencil)
52 * +----------------------------------------------------------------------+
53 * | | alignment unit width ("i") |
54 * | Surface Property |-----------------------------|
55 * | | 915 | 965 | ILK | SNB | IVB |
56 * +----------------------------------------------------------------------+
57 * | YUV 4:2:2 format | 8 | 4 | 4 | 4 | 4 |
58 * | BC1-5 compressed format (DXTn/S3TC) | 4 | 4 | 4 | 4 | 4 |
59 * | FXT1 compressed format | 8 | 8 | 8 | 8 | 8 |
60 * | Depth Buffer (16-bit) | 4 | 4 | 4 | 4 | 8 |
61 * | Depth Buffer (other) | 4 | 4 | 4 | 4 | 4 |
62 * | Separate Stencil Buffer | N/A | N/A | 8 | 8 | 8 |
63 * | All Others | 4 | 4 | 4 | 4 | 4 |
64 * +----------------------------------------------------------------------+
66 * On IVB+, non-special cases can be overridden by setting the SURFACE_STATE
67 * "Surface Horizontal Alignment" field to HALIGN_4 or HALIGN_8.
69 if (_mesa_is_format_compressed(format
)) {
70 /* The hardware alignment requirements for compressed textures
71 * happen to match the block boundaries.
74 _mesa_get_format_block_size(format
, &i
, &j
);
78 if (format
== MESA_FORMAT_S8
)
81 /* The depth alignment requirements in the table above are for rendering to
82 * depth miplevels using the LOD control fields. We don't use LOD control
83 * fields, and instead use page offsets plus intra-tile x/y offsets, which
84 * require that the low 3 bits are zero. To reduce the number of x/y
85 * offset workaround blits we do, align the X to 8, which depth texturing
86 * can handle (sadly, it can't handle 8 in the Y direction).
88 if (intel
->gen
>= 7 &&
89 _mesa_get_format_base_format(format
) == GL_DEPTH_COMPONENT
)
96 intel_vertical_texture_alignment_unit(struct intel_context
*intel
,
100 * From the "Alignment Unit Size" section of various specs, namely:
101 * - Gen3 Spec: "Memory Data Formats" Volume, Section 1.20.1.4
102 * - i965 and G45 PRMs: Volume 1, Section 6.17.3.4.
103 * - Ironlake and Sandybridge PRMs: Volume 1, Part 1, Section 7.18.3.4
104 * - BSpec (for Ivybridge and slight variations in separate stencil)
106 * +----------------------------------------------------------------------+
107 * | | alignment unit height ("j") |
108 * | Surface Property |-----------------------------|
109 * | | 915 | 965 | ILK | SNB | IVB |
110 * +----------------------------------------------------------------------+
111 * | BC1-5 compressed format (DXTn/S3TC) | 4 | 4 | 4 | 4 | 4 |
112 * | FXT1 compressed format | 4 | 4 | 4 | 4 | 4 |
113 * | Depth Buffer | 2 | 2 | 2 | 4 | 4 |
114 * | Separate Stencil Buffer | N/A | N/A | N/A | 4 | 8 |
115 * | Multisampled (4x or 8x) render target | N/A | N/A | N/A | 4 | 4 |
116 * | All Others | 2 | 2 | 2 | 2 | 2 |
117 * +----------------------------------------------------------------------+
119 * On SNB+, non-special cases can be overridden by setting the SURFACE_STATE
120 * "Surface Vertical Alignment" field to VALIGN_2 or VALIGN_4.
122 * We currently don't support multisampling.
124 if (_mesa_is_format_compressed(format
))
127 if (format
== MESA_FORMAT_S8
)
128 return intel
->gen
>= 7 ? 8 : 4;
130 GLenum base_format
= _mesa_get_format_base_format(format
);
132 if (intel
->gen
>= 6 &&
133 (base_format
== GL_DEPTH_COMPONENT
||
134 base_format
== GL_DEPTH_STENCIL
)) {
142 brw_miptree_layout_2d(struct intel_mipmap_tree
*mt
)
146 unsigned width
= mt
->physical_width0
;
147 unsigned height
= mt
->physical_height0
;
148 unsigned depth
= mt
->physical_depth0
; /* number of array layers. */
150 mt
->total_width
= mt
->physical_width0
;
152 if (mt
->compressed
) {
153 mt
->total_width
= ALIGN(mt
->physical_width0
, mt
->align_w
);
156 /* May need to adjust width to accomodate the placement of
157 * the 2nd mipmap. This occurs when the alignment
158 * constraints of mipmap placement push the right edge of the
159 * 2nd mipmap out past the width of its parent.
161 if (mt
->first_level
!= mt
->last_level
) {
164 if (mt
->compressed
) {
165 mip1_width
= ALIGN(minify(mt
->physical_width0
, 1), mt
->align_w
) +
166 ALIGN(minify(mt
->physical_width0
, 2), mt
->align_w
);
168 mip1_width
= ALIGN(minify(mt
->physical_width0
, 1), mt
->align_w
) +
169 minify(mt
->physical_width0
, 2);
172 if (mip1_width
> mt
->total_width
) {
173 mt
->total_width
= mip1_width
;
177 mt
->total_height
= 0;
179 for (unsigned level
= mt
->first_level
; level
<= mt
->last_level
; level
++) {
182 intel_miptree_set_level_info(mt
, level
, x
, y
, width
,
185 img_height
= ALIGN(height
, mt
->align_h
);
187 img_height
/= mt
->align_h
;
189 /* Because the images are packed better, the final offset
190 * might not be the maximal one:
192 mt
->total_height
= MAX2(mt
->total_height
, y
+ img_height
);
194 /* Layout_below: step right after second mipmap.
196 if (level
== mt
->first_level
+ 1) {
197 x
+= ALIGN(width
, mt
->align_w
);
202 width
= minify(width
, 1);
203 height
= minify(height
, 1);
208 brw_miptree_layout_texture_array(struct intel_context
*intel
,
209 struct intel_mipmap_tree
*mt
)
214 h0
= ALIGN(mt
->physical_height0
, mt
->align_h
);
215 h1
= ALIGN(minify(mt
->physical_height0
, 1), mt
->align_h
);
216 if (mt
->array_spacing_lod0
)
219 qpitch
= (h0
+ h1
+ (intel
->gen
>= 7 ? 12 : 11) * mt
->align_h
);
223 brw_miptree_layout_2d(mt
);
225 for (unsigned level
= mt
->first_level
; level
<= mt
->last_level
; level
++) {
226 for (int q
= 0; q
< mt
->physical_depth0
; q
++) {
227 intel_miptree_set_image_offset(mt
, level
, q
, 0, q
* qpitch
);
230 mt
->total_height
= qpitch
* mt
->physical_depth0
;
234 brw_miptree_layout_texture_3d(struct intel_context
*intel
,
235 struct intel_mipmap_tree
*mt
)
237 unsigned width
= mt
->physical_width0
;
238 unsigned height
= mt
->physical_height0
;
239 unsigned depth
= mt
->physical_depth0
;
240 unsigned pack_x_pitch
, pack_x_nr
;
241 unsigned pack_y_pitch
;
243 mt
->total_height
= 0;
245 if (mt
->compressed
) {
246 mt
->total_width
= ALIGN(width
, mt
->align_w
);
247 pack_y_pitch
= (height
+ 3) / 4;
249 mt
->total_width
= mt
->physical_width0
;
250 pack_y_pitch
= ALIGN(mt
->physical_height0
, mt
->align_h
);
253 pack_x_pitch
= width
;
256 for (unsigned level
= mt
->first_level
; level
<= mt
->last_level
; level
++) {
260 intel_miptree_set_level_info(mt
, level
,
262 width
, height
, depth
);
264 for (int q
= 0; q
< depth
; /* empty */) {
265 for (int j
= 0; j
< pack_x_nr
&& q
< depth
; j
++, q
++) {
266 intel_miptree_set_image_offset(mt
, level
, q
, x
, y
);
269 if (x
> mt
->total_width
)
276 mt
->total_height
+= y
;
277 width
= minify(width
, 1);
278 height
= minify(height
, 1);
279 if (mt
->target
== GL_TEXTURE_3D
)
280 depth
= minify(depth
, 1);
282 if (mt
->compressed
) {
283 pack_y_pitch
= (height
+ 3) / 4;
285 if (pack_x_pitch
> ALIGN(width
, mt
->align_w
)) {
286 pack_x_pitch
= ALIGN(width
, mt
->align_w
);
291 if (pack_x_pitch
> 4) {
295 if (pack_y_pitch
> 2) {
297 pack_y_pitch
= ALIGN(pack_y_pitch
, mt
->align_h
);
302 /* The 965's sampler lays cachelines out according to how accesses
303 * in the texture surfaces run, so they may be "vertical" through
304 * memory. As a result, the docs say in Surface Padding Requirements:
305 * Sampling Engine Surfaces that two extra rows of padding are required.
307 if (mt
->target
== GL_TEXTURE_CUBE_MAP
)
308 mt
->total_height
+= 2;
312 brw_miptree_layout(struct intel_context
*intel
, struct intel_mipmap_tree
*mt
)
314 mt
->align_w
= intel_horizontal_texture_alignment_unit(intel
, mt
->format
);
315 mt
->align_h
= intel_vertical_texture_alignment_unit(intel
, mt
->format
);
317 switch (mt
->target
) {
318 case GL_TEXTURE_CUBE_MAP
:
319 if (intel
->gen
== 4) {
320 /* Gen4 stores cube maps as 3D textures. */
321 assert(mt
->physical_depth0
== 6);
322 brw_miptree_layout_texture_3d(intel
, mt
);
324 /* All other hardware stores cube maps as 2D arrays. */
325 brw_miptree_layout_texture_array(intel
, mt
);
330 brw_miptree_layout_texture_3d(intel
, mt
);
333 case GL_TEXTURE_1D_ARRAY
:
334 case GL_TEXTURE_2D_ARRAY
:
335 case GL_TEXTURE_2D_MULTISAMPLE_ARRAY
:
336 case GL_TEXTURE_CUBE_MAP_ARRAY
:
337 brw_miptree_layout_texture_array(intel
, mt
);
341 switch (mt
->msaa_layout
) {
342 case INTEL_MSAA_LAYOUT_UMS
:
343 case INTEL_MSAA_LAYOUT_CMS
:
344 brw_miptree_layout_texture_array(intel
, mt
);
346 case INTEL_MSAA_LAYOUT_NONE
:
347 case INTEL_MSAA_LAYOUT_IMS
:
348 brw_miptree_layout_2d(mt
);
353 DBG("%s: %dx%dx%d\n", __FUNCTION__
,
354 mt
->total_width
, mt
->total_height
, mt
->cpp
);