b180fc8db37351a0660c6fce96963f044036e0bb
[mesa.git] / src / gallium / drivers / nvc0 / nvc0_miptree.c
1 /*
2 * Copyright 2008 Ben Skeggs
3 *
4 * Permission is hereby granted, free of charge, to any person obtaining a
5 * copy of this software and associated documentation files (the "Software"),
6 * to deal in the Software without restriction, including without limitation
7 * the rights to use, copy, modify, merge, publish, distribute, sublicense,
8 * and/or sell copies of the Software, and to permit persons to whom the
9 * Software is furnished to do so, subject to the following conditions:
10 *
11 * The above copyright notice and this permission notice shall be included in
12 * all copies or substantial portions of the Software.
13 *
14 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
15 * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
16 * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL
17 * THE AUTHORS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER LIABILITY,
18 * WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, OUT OF
19 * OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
20 * SOFTWARE.
21 */
22
23 #include "pipe/p_state.h"
24 #include "pipe/p_defines.h"
25 #include "util/u_inlines.h"
26 #include "util/u_format.h"
27
28 #include "nvc0_context.h"
29 #include "nvc0_resource.h"
30
/**
 * Choose a tile mode for a surface measuring nx * ny * nz blocks.
 *
 * The result combines a tile height selector (0x000 .. 0x040, derived from
 * ny) with a tile depth selector (0x100 .. 0x500, derived from nz).
 * Surfaces with nz == 1 get the height selector only. @nx does not
 * influence the result.
 */
uint32_t
nvc0_tex_choose_tile_dims(unsigned nx, unsigned ny, unsigned nz)
{
   uint32_t height_sel;
   uint32_t depth_sel;

   (void)nx;

   if (ny > 64)
      height_sel = 0x040; /* height 128 tiles */
   else if (ny > 32)
      height_sel = 0x030; /* height 64 tiles */
   else if (ny > 16)
      height_sel = 0x020; /* height 32 tiles */
   else if (ny > 8)
      height_sel = 0x010; /* height 16 tiles */
   else
      height_sel = 0x000;

   /* Single-slice surfaces keep the full tile height and no depth bits. */
   if (nz == 1)
      return height_sel;

   /* Anything with depth is limited to the "height 32" selector. */
   if (height_sel > 0x020)
      height_sel = 0x020;

   if (nz > 16 && height_sel < 0x020)
      depth_sel = 0x500; /* depth 32 tiles */
   else if (nz > 8)
      depth_sel = 0x400; /* depth 16 tiles */
   else if (nz > 4)
      depth_sel = 0x300; /* depth 8 tiles */
   else if (nz > 2)
      depth_sel = 0x200; /* depth 4 tiles */
   else
      depth_sel = 0x100;

   return height_sel | depth_sel;
}
58
59 static uint32_t
60 nvc0_mt_choose_storage_type(struct nv50_miptree *mt, boolean compressed)
61 {
62 const unsigned ms = util_logbase2(mt->base.base.nr_samples);
63
64 uint32_t tile_flags;
65
66 compressed = FALSE; /* not yet supported */
67
68 if (mt->base.base.bind & PIPE_BIND_CURSOR)
69 return NOUVEAU_BO_TILE_SCANOUT;
70
71 switch (mt->base.base.format) {
72 case PIPE_FORMAT_Z16_UNORM:
73 if (compressed)
74 tile_flags = 0x0200 + (ms << 8);
75 else
76 tile_flags = 0x0100;
77 break;
78 case PIPE_FORMAT_S8_UINT_Z24_UNORM:
79 if (compressed)
80 tile_flags = 0x5100 + (ms << 8);
81 else
82 tile_flags = 0x4600;
83 break;
84 case PIPE_FORMAT_Z24X8_UNORM:
85 case PIPE_FORMAT_Z24_UNORM_S8_UINT:
86 if (compressed)
87 tile_flags = 0x1700 + (ms << 8);
88 else
89 tile_flags = 0x1100;
90 break;
91 case PIPE_FORMAT_Z32_FLOAT:
92 if (compressed)
93 tile_flags = 0x8600 + (ms << 8);
94 else
95 tile_flags = 0x7b00;
96 break;
97 case PIPE_FORMAT_Z32_FLOAT_S8X24_UINT:
98 if (compressed)
99 tile_flags = 0xce00 + (ms << 8);
100 else
101 tile_flags = 0xc300;
102 break;
103 default:
104 switch (util_format_get_blocksizebits(mt->base.base.format)) {
105 case 128:
106 if (compressed)
107 tile_flags = 0xf400 + (ms << 9);
108 else
109 tile_flags = 0xfe00;
110 break;
111 case 64:
112 if (compressed) {
113 switch (ms) {
114 case 0: tile_flags = 0xe600; break;
115 case 1: tile_flags = 0xeb00; break;
116 case 2: tile_flags = 0xed00; break;
117 case 3: tile_flags = 0xf200; break;
118 default:
119 return 0;
120 }
121 } else {
122 tile_flags = 0xfe00;
123 }
124 break;
125 case 32:
126 if (compressed) {
127 switch (ms) {
128 case 0: tile_flags = 0xdb00; break;
129 case 1: tile_flags = 0xdd00; break;
130 case 2: tile_flags = 0xdf00; break;
131 case 3: tile_flags = 0xe400; break;
132 default:
133 return 0;
134 }
135 } else {
136 tile_flags = 0xfe00;
137 }
138 break;
139 case 16:
140 case 8:
141 tile_flags = 0xfe00;
142 break;
143 default:
144 return 0;
145 }
146 break;
147 }
148
149 if (mt->base.base.bind & PIPE_BIND_SCANOUT)
150 tile_flags |= NOUVEAU_BO_TILE_SCANOUT;
151
152 if (unlikely(mt->base.base.flags & NOUVEAU_RESOURCE_FLAG_LINEAR))
153 tile_flags &= ~0xff00;
154
155 return tile_flags;
156 }
157
158 static INLINE boolean
159 nvc0_miptree_init_ms_mode(struct nv50_miptree *mt)
160 {
161 switch (mt->base.base.nr_samples) {
162 case 8:
163 mt->ms_mode = NVC0_3D_MULTISAMPLE_MODE_MS8;
164 mt->ms_x = 2;
165 mt->ms_y = 1;
166 break;
167 case 4:
168 mt->ms_mode = NVC0_3D_MULTISAMPLE_MODE_MS4;
169 mt->ms_x = 1;
170 mt->ms_y = 1;
171 break;
172 case 2:
173 mt->ms_mode = NVC0_3D_MULTISAMPLE_MODE_MS2;
174 mt->ms_x = 1;
175 break;
176 case 1:
177 case 0:
178 mt->ms_mode = NVC0_3D_MULTISAMPLE_MODE_MS1;
179 break;
180 default:
181 NOUVEAU_ERR("invalid nr_samples: %u\n", mt->base.base.nr_samples);
182 return FALSE;
183 }
184 return TRUE;
185 }
186
187 boolean
188 nv50_miptree_init_layout_linear(struct nv50_miptree *);
189
190 static void
191 nvc0_miptree_init_layout_video(struct nv50_miptree *mt)
192 {
193 const struct pipe_resource *pt = &mt->base.base;
194 const unsigned blocksize = util_format_get_blocksize(pt->format);
195
196 unsigned nbx = util_format_get_nblocksx(pt->format, pt->width0);
197 unsigned nby = util_format_get_nblocksy(pt->format, pt->height0);
198
199 assert(pt->last_level == 0);
200 assert(mt->ms_x == 0 &&
201 mt->ms_y == 0);
202 assert(!util_format_is_compressed(pt->format));
203
204 assert(nby > 8);
205 mt->level[0].tile_mode = 0x10;
206 mt->level[0].pitch = align(nbx * blocksize, 64);
207 mt->total_size = align(nby, 16) * mt->level[0].pitch;
208
209 if (pt->array_size > 1) {
210 mt->layer_stride = align(mt->total_size, NVC0_TILE_SIZE(0x10));
211 mt->total_size = mt->layer_stride * pt->array_size;
212 }
213 }
214
215 static void
216 nvc0_miptree_init_layout_tiled(struct nv50_miptree *mt)
217 {
218 struct pipe_resource *pt = &mt->base.base;
219 unsigned w, h, d, l;
220 const unsigned blocksize = util_format_get_blocksize(pt->format);
221
222 mt->layout_3d = pt->target == PIPE_TEXTURE_3D;
223
224 w = pt->width0 << mt->ms_x;
225 h = pt->height0 << mt->ms_y;
226
227 /* For 3D textures, a mipmap is spanned by all the layers, for array
228 * textures and cube maps, each layer contains its own mipmaps.
229 */
230 d = mt->layout_3d ? pt->depth0 : 1;
231
232 for (l = 0; l <= pt->last_level; ++l) {
233 struct nv50_miptree_level *lvl = &mt->level[l];
234 unsigned tsx, tsy, tsz;
235 unsigned nbx = util_format_get_nblocksx(pt->format, w);
236 unsigned nby = util_format_get_nblocksy(pt->format, h);
237
238 lvl->offset = mt->total_size;
239
240 lvl->tile_mode = nvc0_tex_choose_tile_dims(nbx, nby, d);
241
242 tsx = NVC0_TILE_SIZE_X(lvl->tile_mode); /* x is tile row pitch in bytes */
243 tsy = NVC0_TILE_SIZE_Y(lvl->tile_mode);
244 tsz = NVC0_TILE_SIZE_Z(lvl->tile_mode);
245
246 lvl->pitch = align(nbx * blocksize, tsx);
247
248 mt->total_size += lvl->pitch * align(nby, tsy) * align(d, tsz);
249
250 w = u_minify(w, 1);
251 h = u_minify(h, 1);
252 d = u_minify(d, 1);
253 }
254
255 if (pt->array_size > 1) {
256 mt->layer_stride = align(mt->total_size,
257 NVC0_TILE_SIZE(mt->level[0].tile_mode));
258 mt->total_size = mt->layer_stride * pt->array_size;
259 }
260 }
261
262 const struct u_resource_vtbl nvc0_miptree_vtbl =
263 {
264 nv50_miptree_get_handle, /* get_handle */
265 nv50_miptree_destroy, /* resource_destroy */
266 nvc0_miptree_transfer_new, /* get_transfer */
267 nvc0_miptree_transfer_del, /* transfer_destroy */
268 nvc0_miptree_transfer_map, /* transfer_map */
269 u_default_transfer_flush_region, /* transfer_flush_region */
270 nvc0_miptree_transfer_unmap, /* transfer_unmap */
271 u_default_transfer_inline_write /* transfer_inline_write */
272 };
273
274 struct pipe_resource *
275 nvc0_miptree_create(struct pipe_screen *pscreen,
276 const struct pipe_resource *templ)
277 {
278 struct nouveau_device *dev = nouveau_screen(pscreen)->device;
279 struct nv50_miptree *mt = CALLOC_STRUCT(nv50_miptree);
280 struct pipe_resource *pt = &mt->base.base;
281 int ret;
282 uint32_t tile_flags;
283
284 if (!mt)
285 return NULL;
286
287 mt->base.vtbl = &nvc0_miptree_vtbl;
288 *pt = *templ;
289 pipe_reference_init(&pt->reference, 1);
290 pt->screen = pscreen;
291
292 tile_flags = nvc0_mt_choose_storage_type(mt, TRUE);
293
294 if (!nvc0_miptree_init_ms_mode(mt)) {
295 FREE(mt);
296 return NULL;
297 }
298
299 if (unlikely(pt->flags & NVC0_RESOURCE_FLAG_VIDEO)) {
300 nvc0_miptree_init_layout_video(mt);
301 } else
302 if (tile_flags & NOUVEAU_BO_TILE_LAYOUT_MASK) {
303 nvc0_miptree_init_layout_tiled(mt);
304 } else
305 if (!nv50_miptree_init_layout_linear(mt)) {
306 FREE(mt);
307 return NULL;
308 }
309
310 ret = nouveau_bo_new_tile(dev, NOUVEAU_BO_VRAM, 4096,
311 mt->total_size,
312 mt->level[0].tile_mode, tile_flags,
313 &mt->base.bo);
314 if (ret) {
315 FREE(mt);
316 return NULL;
317 }
318 mt->base.domain = NOUVEAU_BO_VRAM;
319
320 return pt;
321 }
322
323 /* Offset of zslice @z from start of level @l. */
324 INLINE unsigned
325 nvc0_mt_zslice_offset(const struct nv50_miptree *mt, unsigned l, unsigned z)
326 {
327 const struct pipe_resource *pt = &mt->base.base;
328
329 unsigned tds = NVC0_TILE_SHIFT_Z(mt->level[l].tile_mode);
330 unsigned ths = NVC0_TILE_SHIFT_Y(mt->level[l].tile_mode);
331
332 unsigned nby = util_format_get_nblocksy(pt->format,
333 u_minify(pt->height0, l));
334
335 /* to next 2D tile slice within a 3D tile */
336 unsigned stride_2d = NVC0_TILE_SIZE_2D(mt->level[l].tile_mode);
337
338 /* to slice in the next (in z direction) 3D tile */
339 unsigned stride_3d = (align(nby, (1 << ths)) * mt->level[l].pitch) << tds;
340
341 return (z & (1 << (tds - 1))) * stride_2d + (z >> tds) * stride_3d;
342 }
343
344 /* Surface functions.
345 */
346
347 struct pipe_surface *
348 nvc0_miptree_surface_new(struct pipe_context *pipe,
349 struct pipe_resource *pt,
350 const struct pipe_surface *templ)
351 {
352 struct nv50_surface *ns = nv50_surface_from_miptree(nv50_miptree(pt), templ);
353 if (!ns)
354 return NULL;
355 ns->base.context = pipe;
356 return &ns->base;
357 }