i965/gen8: Use constant pointers for reading miptree details
[mesa.git] / src / mesa / drivers / dri / i965 / gen8_surface_state.c
1 /*
2 * Copyright © 2012 Intel Corporation
3 *
4 * Permission is hereby granted, free of charge, to any person obtaining a
5 * copy of this software and associated documentation files (the "Software"),
6 * to deal in the Software without restriction, including without limitation
7 * the rights to use, copy, modify, merge, publish, distribute, sublicense,
8 * and/or sell copies of the Software, and to permit persons to whom the
9 * Software is furnished to do so, subject to the following conditions:
10 *
11 * The above copyright notice and this permission notice (including the next
12 * paragraph) shall be included in all copies or substantial portions of the
13 * Software.
14 *
15 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
16 * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
17 * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL
18 * THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
19 * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING
20 * FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS
21 * IN THE SOFTWARE.
22 */
23
24 #include "main/blend.h"
25 #include "main/mtypes.h"
26 #include "main/samplerobj.h"
27 #include "main/texformat.h"
28 #include "main/teximage.h"
29 #include "program/prog_parameter.h"
30
31 #include "intel_mipmap_tree.h"
32 #include "intel_batchbuffer.h"
33 #include "intel_tex.h"
34 #include "intel_fbo.h"
35 #include "intel_buffer_objects.h"
36
37 #include "brw_context.h"
38 #include "brw_state.h"
39 #include "brw_defines.h"
40 #include "brw_wm.h"
41
42 /**
43 * Convert an swizzle enumeration (i.e. SWIZZLE_X) to one of the Gen7.5+
44 * "Shader Channel Select" enumerations (i.e. HSW_SCS_RED). The mappings are
45 *
46 * SWIZZLE_X, SWIZZLE_Y, SWIZZLE_Z, SWIZZLE_W, SWIZZLE_ZERO, SWIZZLE_ONE
47 * 0 1 2 3 4 5
48 * 4 5 6 7 0 1
49 * SCS_RED, SCS_GREEN, SCS_BLUE, SCS_ALPHA, SCS_ZERO, SCS_ONE
50 *
51 * which is simply adding 4 then modding by 8 (or anding with 7).
52 */
53 static unsigned
54 swizzle_to_scs(unsigned swizzle)
55 {
56 return (swizzle + 4) & 7;
57 }
58
59 static uint32_t
60 surface_tiling_mode(uint32_t tiling)
61 {
62 switch (tiling) {
63 case I915_TILING_X:
64 return GEN8_SURFACE_TILING_X;
65 case I915_TILING_Y:
66 return GEN8_SURFACE_TILING_Y;
67 default:
68 return GEN8_SURFACE_TILING_NONE;
69 }
70 }
71
72 static unsigned
73 vertical_alignment(const struct intel_mipmap_tree *mt)
74 {
75 switch (mt->align_h) {
76 case 4:
77 return GEN8_SURFACE_VALIGN_4;
78 case 8:
79 return GEN8_SURFACE_VALIGN_8;
80 case 16:
81 return GEN8_SURFACE_VALIGN_16;
82 default:
83 unreachable("Unsupported vertical surface alignment.");
84 }
85 }
86
87 static unsigned
88 horizontal_alignment(const struct intel_mipmap_tree *mt)
89 {
90 switch (mt->align_w) {
91 case 4:
92 return GEN8_SURFACE_HALIGN_4;
93 case 8:
94 return GEN8_SURFACE_HALIGN_8;
95 case 16:
96 return GEN8_SURFACE_HALIGN_16;
97 default:
98 unreachable("Unsupported horizontal surface alignment.");
99 }
100 }
101
102 static uint32_t *
103 allocate_surface_state(struct brw_context *brw, uint32_t *out_offset)
104 {
105 int dwords = brw->gen >= 9 ? 16 : 13;
106 uint32_t *surf = brw_state_batch(brw, AUB_TRACE_SURFACE_STATE,
107 dwords * 4, 64, out_offset);
108 memset(surf, 0, dwords * 4);
109 return surf;
110 }
111
112 static void
113 gen8_emit_buffer_surface_state(struct brw_context *brw,
114 uint32_t *out_offset,
115 drm_intel_bo *bo,
116 unsigned buffer_offset,
117 unsigned surface_format,
118 unsigned buffer_size,
119 unsigned pitch,
120 bool rw)
121 {
122 const unsigned mocs = brw->gen >= 9 ? SKL_MOCS_WB : BDW_MOCS_WB;
123 uint32_t *surf = allocate_surface_state(brw, out_offset);
124
125 surf[0] = BRW_SURFACE_BUFFER << BRW_SURFACE_TYPE_SHIFT |
126 surface_format << BRW_SURFACE_FORMAT_SHIFT |
127 BRW_SURFACE_RC_READ_WRITE;
128 surf[1] = SET_FIELD(mocs, GEN8_SURFACE_MOCS);
129
130 surf[2] = SET_FIELD((buffer_size - 1) & 0x7f, GEN7_SURFACE_WIDTH) |
131 SET_FIELD(((buffer_size - 1) >> 7) & 0x3fff, GEN7_SURFACE_HEIGHT);
132 if (surface_format == BRW_SURFACEFORMAT_RAW)
133 surf[3] = SET_FIELD(((buffer_size - 1) >> 21) & 0x3ff, BRW_SURFACE_DEPTH);
134 else
135 surf[3] = SET_FIELD(((buffer_size - 1) >> 21) & 0x3f, BRW_SURFACE_DEPTH);
136 surf[3] |= (pitch - 1);
137 surf[7] = SET_FIELD(HSW_SCS_RED, GEN7_SURFACE_SCS_R) |
138 SET_FIELD(HSW_SCS_GREEN, GEN7_SURFACE_SCS_G) |
139 SET_FIELD(HSW_SCS_BLUE, GEN7_SURFACE_SCS_B) |
140 SET_FIELD(HSW_SCS_ALPHA, GEN7_SURFACE_SCS_A);
141 /* reloc */
142 *((uint64_t *) &surf[8]) = (bo ? bo->offset64 : 0) + buffer_offset;
143
144 /* Emit relocation to surface contents. */
145 if (bo) {
146 drm_intel_bo_emit_reloc(brw->batch.bo, *out_offset + 8 * 4,
147 bo, buffer_offset, I915_GEM_DOMAIN_SAMPLER,
148 rw ? I915_GEM_DOMAIN_SAMPLER : 0);
149 }
150 }
151
152 static void
153 gen8_emit_texture_surface_state(struct brw_context *brw,
154 struct intel_mipmap_tree *mt,
155 GLenum target,
156 unsigned min_layer, unsigned max_layer,
157 unsigned min_level, unsigned max_level,
158 unsigned format,
159 unsigned swizzle,
160 uint32_t *surf_offset,
161 bool rw, bool for_gather)
162 {
163 const unsigned depth = max_layer - min_layer;
164 struct intel_mipmap_tree *aux_mt = NULL;
165 uint32_t aux_mode = 0;
166 uint32_t mocs_wb = brw->gen >= 9 ? SKL_MOCS_WB : BDW_MOCS_WB;
167 unsigned tiling_mode, pitch;
168
169 if (mt->format == MESA_FORMAT_S_UINT8) {
170 tiling_mode = GEN8_SURFACE_TILING_W;
171 pitch = 2 * mt->pitch;
172 } else {
173 tiling_mode = surface_tiling_mode(mt->tiling);
174 pitch = mt->pitch;
175 }
176
177 if (mt->mcs_mt) {
178 aux_mt = mt->mcs_mt;
179 aux_mode = GEN8_SURFACE_AUX_MODE_MCS;
180 }
181
182 uint32_t *surf = allocate_surface_state(brw, surf_offset);
183
184 surf[0] = translate_tex_target(target) << BRW_SURFACE_TYPE_SHIFT |
185 format << BRW_SURFACE_FORMAT_SHIFT |
186 vertical_alignment(mt) |
187 horizontal_alignment(mt) |
188 tiling_mode;
189
190 if (target == GL_TEXTURE_CUBE_MAP ||
191 target == GL_TEXTURE_CUBE_MAP_ARRAY) {
192 surf[0] |= BRW_SURFACE_CUBEFACE_ENABLES;
193 }
194
195 if (_mesa_is_array_texture(target) || target == GL_TEXTURE_CUBE_MAP)
196 surf[0] |= GEN8_SURFACE_IS_ARRAY;
197
198 surf[1] = SET_FIELD(mocs_wb, GEN8_SURFACE_MOCS) | mt->qpitch >> 2;
199
200 surf[2] = SET_FIELD(mt->logical_width0 - 1, GEN7_SURFACE_WIDTH) |
201 SET_FIELD(mt->logical_height0 - 1, GEN7_SURFACE_HEIGHT);
202
203 surf[3] = SET_FIELD(depth - 1, BRW_SURFACE_DEPTH) | (pitch - 1);
204
205 surf[4] = gen7_surface_msaa_bits(mt->num_samples, mt->msaa_layout) |
206 SET_FIELD(min_layer, GEN7_SURFACE_MIN_ARRAY_ELEMENT) |
207 SET_FIELD(depth - 1, GEN7_SURFACE_RENDER_TARGET_VIEW_EXTENT);
208
209 surf[5] = SET_FIELD(min_level - mt->first_level, GEN7_SURFACE_MIN_LOD) |
210 (max_level - min_level - 1); /* mip count */
211
212 if (aux_mt) {
213 surf[6] = SET_FIELD(mt->qpitch / 4, GEN8_SURFACE_AUX_QPITCH) |
214 SET_FIELD((aux_mt->pitch / 128) - 1, GEN8_SURFACE_AUX_PITCH) |
215 aux_mode;
216 } else {
217 surf[6] = 0;
218 }
219
220 surf[7] = mt->fast_clear_color_value |
221 SET_FIELD(swizzle_to_scs(GET_SWZ(swizzle, 0)), GEN7_SURFACE_SCS_R) |
222 SET_FIELD(swizzle_to_scs(GET_SWZ(swizzle, 1)), GEN7_SURFACE_SCS_G) |
223 SET_FIELD(swizzle_to_scs(GET_SWZ(swizzle, 2)), GEN7_SURFACE_SCS_B) |
224 SET_FIELD(swizzle_to_scs(GET_SWZ(swizzle, 3)), GEN7_SURFACE_SCS_A);
225
226 *((uint64_t *) &surf[8]) = mt->bo->offset64 + mt->offset; /* reloc */
227
228 if (aux_mt) {
229 *((uint64_t *) &surf[10]) = aux_mt->bo->offset64;
230 drm_intel_bo_emit_reloc(brw->batch.bo, *surf_offset + 10 * 4,
231 aux_mt->bo, 0,
232 I915_GEM_DOMAIN_SAMPLER,
233 (rw ? I915_GEM_DOMAIN_SAMPLER : 0));
234 } else {
235 surf[10] = 0;
236 surf[11] = 0;
237 }
238 surf[12] = 0;
239
240 /* Emit relocation to surface contents */
241 drm_intel_bo_emit_reloc(brw->batch.bo,
242 *surf_offset + 8 * 4,
243 mt->bo,
244 mt->offset,
245 I915_GEM_DOMAIN_SAMPLER,
246 (rw ? I915_GEM_DOMAIN_SAMPLER : 0));
247 }
248
249 static void
250 gen8_update_texture_surface(struct gl_context *ctx,
251 unsigned unit,
252 uint32_t *surf_offset,
253 bool for_gather)
254 {
255 struct brw_context *brw = brw_context(ctx);
256 struct gl_texture_object *obj = ctx->Texture.Unit[unit]._Current;
257
258 if (obj->Target == GL_TEXTURE_BUFFER) {
259 brw_update_buffer_texture_surface(ctx, unit, surf_offset);
260
261 } else {
262 struct gl_texture_image *firstImage = obj->Image[0][obj->BaseLevel];
263 struct intel_texture_object *intel_obj = intel_texture_object(obj);
264 struct intel_mipmap_tree *mt = intel_obj->mt;
265 struct gl_sampler_object *sampler = _mesa_get_samplerobj(ctx, unit);
266 /* If this is a view with restricted NumLayers, then our effective depth
267 * is not just the miptree depth.
268 */
269 const unsigned depth = (obj->Immutable && obj->Target != GL_TEXTURE_3D ?
270 obj->NumLayers : mt->logical_depth0);
271
272 /* Handling GL_ALPHA as a surface format override breaks 1.30+ style
273 * texturing functions that return a float, as our code generation always
274 * selects the .x channel (which would always be 0).
275 */
276 const bool alpha_depth = obj->DepthMode == GL_ALPHA &&
277 (firstImage->_BaseFormat == GL_DEPTH_COMPONENT ||
278 firstImage->_BaseFormat == GL_DEPTH_STENCIL);
279 const unsigned swizzle = (unlikely(alpha_depth) ? SWIZZLE_XYZW :
280 brw_get_texture_swizzle(&brw->ctx, obj));
281
282 unsigned format = translate_tex_format(brw, intel_obj->_Format,
283 sampler->sRGBDecode);
284 if (obj->StencilSampling && firstImage->_BaseFormat == GL_DEPTH_STENCIL) {
285 mt = mt->stencil_mt;
286 format = BRW_SURFACEFORMAT_R8_UINT;
287 }
288
289 gen8_emit_texture_surface_state(brw, mt, obj->Target,
290 obj->MinLayer, obj->MinLayer + depth,
291 obj->MinLevel + obj->BaseLevel,
292 obj->MinLevel + intel_obj->_MaxLevel + 1,
293 format, swizzle, surf_offset,
294 false, for_gather);
295 }
296 }
297
298 /**
299 * Creates a null surface.
300 *
301 * This is used when the shader doesn't write to any color output. An FB
302 * write to target 0 will still be emitted, because that's how the thread is
303 * terminated (and computed depth is returned), so we need to have the
304 * hardware discard the target 0 color output..
305 */
306 static void
307 gen8_emit_null_surface_state(struct brw_context *brw,
308 unsigned width,
309 unsigned height,
310 unsigned samples,
311 uint32_t *out_offset)
312 {
313 uint32_t *surf = allocate_surface_state(brw, out_offset);
314
315 surf[0] = BRW_SURFACE_NULL << BRW_SURFACE_TYPE_SHIFT |
316 BRW_SURFACEFORMAT_B8G8R8A8_UNORM << BRW_SURFACE_FORMAT_SHIFT |
317 GEN8_SURFACE_TILING_Y;
318 surf[2] = SET_FIELD(width - 1, GEN7_SURFACE_WIDTH) |
319 SET_FIELD(height - 1, GEN7_SURFACE_HEIGHT);
320 }
321
322 /**
323 * Sets up a surface state structure to point at the given region.
324 * While it is only used for the front/back buffer currently, it should be
325 * usable for further buffers when doing ARB_draw_buffer support.
326 */
327 static void
328 gen8_update_renderbuffer_surface(struct brw_context *brw,
329 struct gl_renderbuffer *rb,
330 bool layered,
331 unsigned unit)
332 {
333 struct gl_context *ctx = &brw->ctx;
334 struct intel_renderbuffer *irb = intel_renderbuffer(rb);
335 struct intel_mipmap_tree *mt = irb->mt;
336 struct intel_mipmap_tree *aux_mt = NULL;
337 uint32_t aux_mode = 0;
338 unsigned width = mt->logical_width0;
339 unsigned height = mt->logical_height0;
340 unsigned pitch = mt->pitch;
341 uint32_t tiling = mt->tiling;
342 uint32_t format = 0;
343 uint32_t surf_type;
344 bool is_array = false;
345 int depth = MAX2(irb->layer_count, 1);
346 const int min_array_element = (mt->format == MESA_FORMAT_S_UINT8) ?
347 irb->mt_layer : (irb->mt_layer / MAX2(mt->num_samples, 1));
348 GLenum gl_target =
349 rb->TexImage ? rb->TexImage->TexObject->Target : GL_TEXTURE_2D;
350 uint32_t surf_index =
351 brw->wm.prog_data->binding_table.render_target_start + unit;
352 /* FINISHME: Use PTE MOCS on Skylake. */
353 uint32_t mocs = brw->gen >= 9 ? SKL_MOCS_WT : BDW_MOCS_PTE;
354
355 intel_miptree_used_for_rendering(mt);
356
357 switch (gl_target) {
358 case GL_TEXTURE_CUBE_MAP_ARRAY:
359 case GL_TEXTURE_CUBE_MAP:
360 surf_type = BRW_SURFACE_2D;
361 is_array = true;
362 depth *= 6;
363 break;
364 case GL_TEXTURE_3D:
365 depth = MAX2(irb->mt->logical_depth0, 1);
366 /* fallthrough */
367 default:
368 surf_type = translate_tex_target(gl_target);
369 is_array = _mesa_tex_target_is_array(gl_target);
370 break;
371 }
372
373 /* _NEW_BUFFERS */
374 /* Render targets can't use IMS layout. Stencil in turn gets configured as
375 * single sampled and indexed manually by the program.
376 */
377 if (mt->format == MESA_FORMAT_S_UINT8) {
378 brw_configure_w_tiled(mt, true, &width, &height, &pitch,
379 &tiling, &format);
380 } else {
381 assert(mt->msaa_layout != INTEL_MSAA_LAYOUT_IMS);
382 assert(brw_render_target_supported(brw, rb));
383 mesa_format rb_format = _mesa_get_render_format(ctx,
384 intel_rb_format(irb));
385 format = brw->render_target_format[rb_format];
386 if (unlikely(!brw->format_supported_as_render_target[rb_format]))
387 _mesa_problem(ctx, "%s: renderbuffer format %s unsupported\n",
388 __func__, _mesa_get_format_name(rb_format));
389 }
390
391 if (mt->mcs_mt) {
392 aux_mt = mt->mcs_mt;
393 aux_mode = GEN8_SURFACE_AUX_MODE_MCS;
394 }
395
396 uint32_t *surf =
397 allocate_surface_state(brw, &brw->wm.base.surf_offset[surf_index]);
398
399 surf[0] = (surf_type << BRW_SURFACE_TYPE_SHIFT) |
400 (is_array ? GEN7_SURFACE_IS_ARRAY : 0) |
401 (format << BRW_SURFACE_FORMAT_SHIFT) |
402 vertical_alignment(mt) |
403 horizontal_alignment(mt) |
404 surface_tiling_mode(tiling);
405
406 surf[1] = SET_FIELD(mocs, GEN8_SURFACE_MOCS) | mt->qpitch >> 2;
407
408 surf[2] = SET_FIELD(width - 1, GEN7_SURFACE_WIDTH) |
409 SET_FIELD(height - 1, GEN7_SURFACE_HEIGHT);
410
411 surf[3] = (depth - 1) << BRW_SURFACE_DEPTH_SHIFT |
412 (pitch - 1); /* Surface Pitch */
413
414 surf[4] = min_array_element << GEN7_SURFACE_MIN_ARRAY_ELEMENT_SHIFT |
415 (depth - 1) << GEN7_SURFACE_RENDER_TARGET_VIEW_EXTENT_SHIFT;
416
417 if (mt->format != MESA_FORMAT_S_UINT8)
418 surf[4] |= gen7_surface_msaa_bits(mt->num_samples, mt->msaa_layout);
419
420 surf[5] = irb->mt_level - irb->mt->first_level;
421
422 if (aux_mt) {
423 surf[6] = SET_FIELD(mt->qpitch / 4, GEN8_SURFACE_AUX_QPITCH) |
424 SET_FIELD((aux_mt->pitch / 128) - 1, GEN8_SURFACE_AUX_PITCH) |
425 aux_mode;
426 } else {
427 surf[6] = 0;
428 }
429
430 surf[7] = mt->fast_clear_color_value |
431 SET_FIELD(HSW_SCS_RED, GEN7_SURFACE_SCS_R) |
432 SET_FIELD(HSW_SCS_GREEN, GEN7_SURFACE_SCS_G) |
433 SET_FIELD(HSW_SCS_BLUE, GEN7_SURFACE_SCS_B) |
434 SET_FIELD(HSW_SCS_ALPHA, GEN7_SURFACE_SCS_A);
435
436 assert(mt->offset % mt->cpp == 0);
437 *((uint64_t *) &surf[8]) = mt->bo->offset64 + mt->offset; /* reloc */
438
439 if (aux_mt) {
440 *((uint64_t *) &surf[10]) = aux_mt->bo->offset64;
441 drm_intel_bo_emit_reloc(brw->batch.bo,
442 brw->wm.base.surf_offset[surf_index] + 10 * 4,
443 aux_mt->bo, 0,
444 I915_GEM_DOMAIN_RENDER, I915_GEM_DOMAIN_RENDER);
445 } else {
446 surf[10] = 0;
447 surf[11] = 0;
448 }
449 surf[12] = 0;
450
451 drm_intel_bo_emit_reloc(brw->batch.bo,
452 brw->wm.base.surf_offset[surf_index] + 8 * 4,
453 mt->bo,
454 mt->offset,
455 I915_GEM_DOMAIN_RENDER,
456 I915_GEM_DOMAIN_RENDER);
457 }
458
459 void
460 gen8_init_vtable_surface_functions(struct brw_context *brw)
461 {
462 brw->vtbl.update_texture_surface = gen8_update_texture_surface;
463 brw->vtbl.update_renderbuffer_surface = gen8_update_renderbuffer_surface;
464 brw->vtbl.emit_null_surface_state = gen8_emit_null_surface_state;
465 brw->vtbl.emit_texture_surface_state = gen8_emit_texture_surface_state;
466 brw->vtbl.emit_buffer_surface_state = gen8_emit_buffer_surface_state;
467 }