ilo: use an accessor for dev->gen
[mesa.git] / src / gallium / drivers / ilo / ilo_blitter_rectlist.c
1 /*
2 * Mesa 3-D graphics library
3 *
4 * Copyright (C) 2014 LunarG, Inc.
5 *
6 * Permission is hereby granted, free of charge, to any person obtaining a
7 * copy of this software and associated documentation files (the "Software"),
8 * to deal in the Software without restriction, including without limitation
9 * the rights to use, copy, modify, merge, publish, distribute, sublicense,
10 * and/or sell copies of the Software, and to permit persons to whom the
11 * Software is furnished to do so, subject to the following conditions:
12 *
13 * The above copyright notice and this permission notice shall be included
14 * in all copies or substantial portions of the Software.
15 *
16 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
17 * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
18 * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL
19 * THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
20 * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING
21 * FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER
22 * DEALINGS IN THE SOFTWARE.
23 *
24 * Authors:
25 * Chia-I Wu <olv@lunarg.com>
26 */
27
28 #include "util/u_draw.h"
29 #include "util/u_pack_color.h"
30
31 #include "ilo_blitter.h"
32 #include "ilo_3d.h"
33 #include "ilo_3d_pipeline.h"
34 #include "ilo_blit.h"
35 #include "ilo_gpe.h"
36 #include "ilo_gpe_gen6.h" /* for ve_init_cso_with_components and
37 zs_align_surface */
38
39 /**
40 * Set the states that are invariant between all ops.
41 */
42 static bool
43 ilo_blitter_set_invariants(struct ilo_blitter *blitter)
44 {
45 struct pipe_screen *screen = blitter->ilo->base.screen;
46 struct pipe_resource templ;
47 struct pipe_vertex_element velems[2];
48 struct pipe_viewport_state vp;
49
50 if (blitter->initialized)
51 return true;
52
53 blitter->buffer.size = 4096;
54
55 /* allocate the vertex buffer */
56 memset(&templ, 0, sizeof(templ));
57 templ.target = PIPE_BUFFER;
58 templ.width0 = blitter->buffer.size;
59 templ.usage = PIPE_USAGE_STREAM;
60 templ.bind = PIPE_BIND_VERTEX_BUFFER;
61 blitter->buffer.res = screen->resource_create(screen, &templ);
62 if (!blitter->buffer.res)
63 return false;
64
65 /* do not increase reference count */
66 blitter->vb.states[0].buffer = blitter->buffer.res;
67
68 /* only vertex X and Y */
69 blitter->vb.states[0].stride = 2 * sizeof(float);
70 blitter->vb.enabled_mask = 0x1;
71 memset(&velems, 0, sizeof(velems));
72 velems[1].src_format = PIPE_FORMAT_R32G32_FLOAT;
73 ilo_gpe_init_ve(blitter->ilo->dev, 2, velems, &blitter->ve);
74
75 /* override first VE to be VUE header */
76 ve_init_cso_with_components(blitter->ilo->dev,
77 GEN6_VFCOMP_STORE_0, /* Reserved */
78 GEN6_VFCOMP_STORE_0, /* Render Target Array Index */
79 GEN6_VFCOMP_STORE_0, /* Viewport Index */
80 GEN6_VFCOMP_STORE_0, /* Point Width */
81 &blitter->ve.cso[0]);
82
83 /* a rectangle has 3 vertices in a RECTLIST */
84 util_draw_init_info(&blitter->draw);
85 blitter->draw.count = 3;
86
87 /**
88 * From the Haswell PRM, volume 7, page 615:
89 *
90 * "The clear value must be between the min and max depth values
91 * (inclusive) defined in the CC_VIEWPORT."
92 *
93 * Even though clipping and viewport transformation will be disabled, we
94 * still need to set up the viewport states.
95 */
96 memset(&vp, 0, sizeof(vp));
97 vp.scale[0] = 1.0f;
98 vp.scale[1] = 1.0f;
99 vp.scale[2] = 1.0f;
100 vp.scale[3] = 1.0f;
101 ilo_gpe_set_viewport_cso(blitter->ilo->dev, &vp, &blitter->viewport);
102
103 blitter->initialized = true;
104
105 return true;
106 }
107
108 static void
109 ilo_blitter_set_op(struct ilo_blitter *blitter,
110 enum ilo_blitter_rectlist_op op)
111 {
112 blitter->op = op;
113 }
114
115 /**
116 * Set the rectangle primitive.
117 */
118 static void
119 ilo_blitter_set_rectlist(struct ilo_blitter *blitter,
120 unsigned x, unsigned y,
121 unsigned width, unsigned height)
122 {
123 unsigned usage = PIPE_TRANSFER_WRITE | PIPE_TRANSFER_UNSYNCHRONIZED;
124 float vertices[3][2];
125 struct pipe_box box;
126
127 /*
128 * From the Sandy Bridge PRM, volume 2 part 1, page 11:
129 *
130 * "(RECTLIST) A list of independent rectangles, where only 3 vertices
131 * are provided per rectangle object, with the fourth vertex implied
132 * by the definition of a rectangle. V0=LowerRight, V1=LowerLeft,
133 * V2=UpperLeft. Implied V3 = V0- V1+V2."
134 */
135 vertices[0][0] = (float) (x + width);
136 vertices[0][1] = (float) (y + height);
137 vertices[1][0] = (float) x;
138 vertices[1][1] = (float) (y + height);
139 vertices[2][0] = (float) x;
140 vertices[2][1] = (float) y;
141
142 /* buffer is full */
143 if (blitter->buffer.offset + sizeof(vertices) > blitter->buffer.size) {
144 if (!ilo_buffer_rename_bo(ilo_buffer(blitter->buffer.res)))
145 usage &= ~PIPE_TRANSFER_UNSYNCHRONIZED;
146
147 blitter->buffer.offset = 0;
148 }
149
150 u_box_1d(blitter->buffer.offset, sizeof(vertices), &box);
151
152 blitter->ilo->base.transfer_inline_write(&blitter->ilo->base,
153 blitter->buffer.res, 0, usage, &box, vertices, 0, 0);
154
155 blitter->vb.states[0].buffer_offset = blitter->buffer.offset;
156 blitter->buffer.offset += sizeof(vertices);
157 }
158
159 static void
160 ilo_blitter_set_clear_values(struct ilo_blitter *blitter,
161 uint32_t depth, ubyte stencil)
162 {
163 blitter->depth_clear_value = depth;
164 blitter->cc.stencil_ref.ref_value[0] = stencil;
165 }
166
167 static void
168 ilo_blitter_set_dsa(struct ilo_blitter *blitter,
169 const struct pipe_depth_stencil_alpha_state *state)
170 {
171 ilo_gpe_init_dsa(blitter->ilo->dev, state, &blitter->dsa);
172 }
173
174 static void
175 ilo_blitter_set_fb(struct ilo_blitter *blitter,
176 struct pipe_resource *res, unsigned level,
177 const struct ilo_surface_cso *cso)
178 {
179 struct ilo_texture *tex = ilo_texture(res);
180
181 blitter->fb.width = u_minify(tex->layout.width0, level);
182 blitter->fb.height = u_minify(tex->layout.height0, level);
183
184 blitter->fb.num_samples = res->nr_samples;
185 if (!blitter->fb.num_samples)
186 blitter->fb.num_samples = 1;
187
188 memcpy(&blitter->fb.dst, cso, sizeof(*cso));
189 }
190
191 static void
192 ilo_blitter_set_fb_from_surface(struct ilo_blitter *blitter,
193 struct pipe_surface *surf)
194 {
195 ilo_blitter_set_fb(blitter, surf->texture, surf->u.tex.level,
196 (const struct ilo_surface_cso *) surf);
197 }
198
199 static void
200 ilo_blitter_set_fb_from_resource(struct ilo_blitter *blitter,
201 struct pipe_resource *res,
202 enum pipe_format format,
203 unsigned level, unsigned slice)
204 {
205 struct pipe_surface templ, *surf;
206
207 memset(&templ, 0, sizeof(templ));
208 templ.format = format;
209 templ.u.tex.level = level;
210 templ.u.tex.first_layer = slice;
211 templ.u.tex.last_layer = slice;
212
213 /* if we did not call create_surface(), it would never fail */
214 surf = blitter->ilo->base.create_surface(&blitter->ilo->base, res, &templ);
215 assert(surf);
216
217 ilo_blitter_set_fb(blitter, res, level,
218 (const struct ilo_surface_cso *) surf);
219
220 pipe_surface_reference(&surf, NULL);
221 }
222
223 static void
224 ilo_blitter_set_uses(struct ilo_blitter *blitter, uint32_t uses)
225 {
226 blitter->uses = uses;
227 }
228
229 static void
230 hiz_align_fb(struct ilo_blitter *blitter)
231 {
232 unsigned align_w, align_h;
233
234 switch (blitter->op) {
235 case ILO_BLITTER_RECTLIST_CLEAR_ZS:
236 case ILO_BLITTER_RECTLIST_RESOLVE_Z:
237 break;
238 default:
239 return;
240 break;
241 }
242
243 /*
244 * From the Sandy Bridge PRM, volume 2 part 1, page 313-314:
245 *
246 * "A rectangle primitive representing the clear area is delivered. The
247 * primitive must adhere to the following restrictions on size:
248 *
249 * - If Number of Multisamples is NUMSAMPLES_1, the rectangle must be
250 * aligned to an 8x4 pixel block relative to the upper left corner
251 * of the depth buffer, and contain an integer number of these pixel
252 * blocks, and all 8x4 pixels must be lit.
253 *
254 * - If Number of Multisamples is NUMSAMPLES_4, the rectangle must be
255 * aligned to a 4x2 pixel block (8x4 sample block) relative to the
256 * upper left corner of the depth buffer, and contain an integer
257 * number of these pixel blocks, and all samples of the 4x2 pixels
258 * must be lit
259 *
260 * - If Number of Multisamples is NUMSAMPLES_8, the rectangle must be
261 * aligned to a 2x2 pixel block (8x4 sample block) relative to the
262 * upper left corner of the depth buffer, and contain an integer
263 * number of these pixel blocks, and all samples of the 2x2 pixels
264 * must be list."
265 *
266 * "The following is required when performing a depth buffer resolve:
267 *
268 * - A rectangle primitive of the same size as the previous depth
269 * buffer clear operation must be delivered, and depth buffer state
270 * cannot have changed since the previous depth buffer clear
271 * operation."
272 */
273 switch (blitter->fb.num_samples) {
274 case 1:
275 align_w = 8;
276 align_h = 4;
277 break;
278 case 2:
279 align_w = 4;
280 align_h = 4;
281 break;
282 case 4:
283 align_w = 4;
284 align_h = 2;
285 break;
286 case 8:
287 default:
288 align_w = 2;
289 align_h = 2;
290 break;
291 }
292
293 if (blitter->fb.width % align_w || blitter->fb.height % align_h) {
294 blitter->fb.width = align(blitter->fb.width, align_w);
295 blitter->fb.height = align(blitter->fb.height, align_h);
296
297 assert(!blitter->fb.dst.is_rt);
298 zs_align_surface(blitter->ilo->dev, align_w, align_h,
299 &blitter->fb.dst.u.zs);
300 }
301 }
302
303 static void
304 hiz_emit_rectlist(struct ilo_blitter *blitter)
305 {
306 struct ilo_3d *hw3d = blitter->ilo->hw3d;
307 struct ilo_3d_pipeline *p = hw3d->pipeline;
308
309 hiz_align_fb(blitter);
310
311 ilo_blitter_set_rectlist(blitter, 0, 0,
312 blitter->fb.width, blitter->fb.height);
313
314 ilo_3d_own_render_ring(hw3d);
315
316 /*
317 * From the Sandy Bridge PRM, volume 2 part 1, page 313:
318 *
319 * "If other rendering operations have preceded this clear, a
320 * PIPE_CONTROL with write cache flush enabled and Z-inhibit
321 * disabled must be issued before the rectangle primitive used for
322 * the depth buffer clear operation."
323 *
324 * From the Sandy Bridge PRM, volume 2 part 1, page 314:
325 *
326 * "Depth buffer clear pass must be followed by a PIPE_CONTROL
327 * command with DEPTH_STALL bit set and Then followed by Depth
328 * FLUSH"
329 *
330 * But the pipeline has to be flushed both before and after not only
331 * because of these workarounds. We need them for reasons such as
332 *
333 * - we may sample from a texture that was rendered to
334 * - we may sample from the fb shortly after
335 */
336 if (!ilo_cp_empty(p->cp))
337 ilo_3d_pipeline_emit_flush(p);
338
339 ilo_3d_pipeline_emit_rectlist(p, blitter);
340
341 ilo_3d_pipeline_emit_flush(p);
342 }
343
344 static bool
345 hiz_can_clear_zs(const struct ilo_blitter *blitter,
346 const struct ilo_texture *tex)
347 {
348 /*
349 * From the Sandy Bridge PRM, volume 2 part 1, page 314:
350 *
351 * "Several cases exist where Depth Buffer Clear cannot be enabled (the
352 * legacy method of clearing must be performed):
353 *
354 * - If the depth buffer format is D32_FLOAT_S8X24_UINT or
355 * D24_UNORM_S8_UINT.
356 *
357 * - If stencil test is enabled but the separate stencil buffer is
358 * disabled.
359 *
360 * - [DevSNB-A{W/A}]: ...
361 *
362 * - [DevSNB{W/A}]: When depth buffer format is D16_UNORM and the
363 * width of the map (LOD0) is not multiple of 16, fast clear
364 * optimization must be disabled."
365 *
366 * From the Ivy Bridge PRM, volume 2 part 1, page 313:
367 *
368 * "Several cases exist where Depth Buffer Clear cannot be enabled (the
369 * legacy method of clearing must be performed):
370 *
371 * - If the depth buffer format is D32_FLOAT_S8X24_UINT or
372 * D24_UNORM_S8_UINT.
373 *
374 * - If stencil test is enabled but the separate stencil buffer is
375 * disabled."
376 *
377 * The truth is when HiZ is enabled, separate stencil is also enabled on
378 * all GENs. The depth buffer format cannot be combined depth/stencil.
379 */
380 switch (tex->layout.format) {
381 case PIPE_FORMAT_Z16_UNORM:
382 if (ilo_dev_gen(blitter->ilo->dev) == ILO_GEN(6) &&
383 tex->base.width0 % 16)
384 return false;
385 break;
386 case PIPE_FORMAT_Z24_UNORM_S8_UINT:
387 case PIPE_FORMAT_Z32_FLOAT_S8X24_UINT:
388 assert(!"HiZ with combined depth/stencil");
389 return false;
390 break;
391 default:
392 break;
393 }
394
395 return true;
396 }
397
398 bool
399 ilo_blitter_rectlist_clear_zs(struct ilo_blitter *blitter,
400 struct pipe_surface *zs,
401 unsigned clear_flags,
402 double depth, unsigned stencil)
403 {
404 struct ilo_texture *tex = ilo_texture(zs->texture);
405 struct pipe_depth_stencil_alpha_state dsa_state;
406 uint32_t uses, clear_value;
407
408 if (!ilo_texture_can_enable_hiz(tex,
409 zs->u.tex.level, zs->u.tex.first_layer,
410 zs->u.tex.last_layer - zs->u.tex.first_layer + 1))
411 return false;
412
413 if (!hiz_can_clear_zs(blitter, tex))
414 return false;
415
416 clear_value = util_pack_z(tex->layout.format, depth);
417
418 ilo_blit_resolve_surface(blitter->ilo, zs,
419 ILO_TEXTURE_RENDER_WRITE | ILO_TEXTURE_CLEAR);
420 ilo_texture_set_slice_clear_value(tex, zs->u.tex.level,
421 zs->u.tex.first_layer,
422 zs->u.tex.last_layer - zs->u.tex.first_layer + 1,
423 clear_value);
424
425 /*
426 * From the Sandy Bridge PRM, volume 2 part 1, page 313-314:
427 *
428 * "- Depth Test Enable must be disabled and Depth Buffer Write Enable
429 * must be enabled (if depth is being cleared).
430 *
431 * - Stencil buffer clear can be performed at the same time by
432 * enabling Stencil Buffer Write Enable. Stencil Test Enable must
433 * be enabled and Stencil Pass Depth Pass Op set to REPLACE, and the
434 * clear value that is placed in the stencil buffer is the Stencil
435 * Reference Value from COLOR_CALC_STATE.
436 *
437 * - Note also that stencil buffer clear can be performed without
438 * depth buffer clear. For stencil only clear, Depth Test Enable and
439 * Depth Buffer Write Enable must be disabled.
440 *
441 * - [DevSNB] errata: For stencil buffer only clear, the previous
442 * depth clear value must be delivered during the clear."
443 */
444 memset(&dsa_state, 0, sizeof(dsa_state));
445
446 if (clear_flags & PIPE_CLEAR_DEPTH)
447 dsa_state.depth.writemask = true;
448
449 if (clear_flags & PIPE_CLEAR_STENCIL) {
450 dsa_state.stencil[0].enabled = true;
451 dsa_state.stencil[0].func = PIPE_FUNC_ALWAYS;
452 dsa_state.stencil[0].fail_op = PIPE_STENCIL_OP_KEEP;
453 dsa_state.stencil[0].zpass_op = PIPE_STENCIL_OP_REPLACE;
454 dsa_state.stencil[0].zfail_op = PIPE_STENCIL_OP_KEEP;
455
456 /*
457 * From the Ivy Bridge PRM, volume 2 part 1, page 277:
458 *
459 * "Additionally the following must be set to the correct values.
460 *
461 * - DEPTH_STENCIL_STATE::Stencil Write Mask must be 0xFF
462 * - DEPTH_STENCIL_STATE::Stencil Test Mask must be 0xFF
463 * - DEPTH_STENCIL_STATE::Back Face Stencil Write Mask must be 0xFF
464 * - DEPTH_STENCIL_STATE::Back Face Stencil Test Mask must be 0xFF"
465 */
466 dsa_state.stencil[0].valuemask = 0xff;
467 dsa_state.stencil[0].writemask = 0xff;
468 dsa_state.stencil[1].valuemask = 0xff;
469 dsa_state.stencil[1].writemask = 0xff;
470 }
471
472 ilo_blitter_set_invariants(blitter);
473 ilo_blitter_set_op(blitter, ILO_BLITTER_RECTLIST_CLEAR_ZS);
474
475 ilo_blitter_set_dsa(blitter, &dsa_state);
476 ilo_blitter_set_clear_values(blitter, clear_value, (ubyte) stencil);
477 ilo_blitter_set_fb_from_surface(blitter, zs);
478
479 uses = ILO_BLITTER_USE_DSA;
480 if (clear_flags & PIPE_CLEAR_DEPTH)
481 uses |= ILO_BLITTER_USE_VIEWPORT | ILO_BLITTER_USE_FB_DEPTH;
482 if (clear_flags & PIPE_CLEAR_STENCIL)
483 uses |= ILO_BLITTER_USE_CC | ILO_BLITTER_USE_FB_STENCIL;
484 ilo_blitter_set_uses(blitter, uses);
485
486 hiz_emit_rectlist(blitter);
487
488 return true;
489 }
490
491 void
492 ilo_blitter_rectlist_resolve_z(struct ilo_blitter *blitter,
493 struct pipe_resource *res,
494 unsigned level, unsigned slice)
495 {
496 struct ilo_texture *tex = ilo_texture(res);
497 struct pipe_depth_stencil_alpha_state dsa_state;
498 const struct ilo_texture_slice *s =
499 ilo_texture_get_slice(tex, level, slice);
500
501 if (!ilo_texture_can_enable_hiz(tex, level, slice, 1))
502 return;
503
504 /*
505 * From the Sandy Bridge PRM, volume 2 part 1, page 314:
506 *
507 * "Depth Test Enable must be enabled with the Depth Test Function set
508 * to NEVER. Depth Buffer Write Enable must be enabled. Stencil Test
509 * Enable and Stencil Buffer Write Enable must be disabled."
510 */
511 memset(&dsa_state, 0, sizeof(dsa_state));
512 dsa_state.depth.writemask = true;
513 dsa_state.depth.enabled = true;
514 dsa_state.depth.func = PIPE_FUNC_NEVER;
515
516 ilo_blitter_set_invariants(blitter);
517 ilo_blitter_set_op(blitter, ILO_BLITTER_RECTLIST_RESOLVE_Z);
518
519 ilo_blitter_set_dsa(blitter, &dsa_state);
520 ilo_blitter_set_clear_values(blitter, s->clear_value, 0);
521 ilo_blitter_set_fb_from_resource(blitter, res, res->format, level, slice);
522 ilo_blitter_set_uses(blitter,
523 ILO_BLITTER_USE_DSA | ILO_BLITTER_USE_FB_DEPTH);
524
525 hiz_emit_rectlist(blitter);
526 }
527
528 void
529 ilo_blitter_rectlist_resolve_hiz(struct ilo_blitter *blitter,
530 struct pipe_resource *res,
531 unsigned level, unsigned slice)
532 {
533 struct ilo_texture *tex = ilo_texture(res);
534 struct pipe_depth_stencil_alpha_state dsa_state;
535
536 if (!ilo_texture_can_enable_hiz(tex, level, slice, 1))
537 return;
538
539 /*
540 * From the Sandy Bridge PRM, volume 2 part 1, page 315:
541 *
542 * "(Hierarchical Depth Buffer Resolve) Depth Test Enable must be
543 * disabled. Depth Buffer Write Enable must be enabled. Stencil Test
544 * Enable and Stencil Buffer Write Enable must be disabled."
545 */
546 memset(&dsa_state, 0, sizeof(dsa_state));
547 dsa_state.depth.writemask = true;
548
549 ilo_blitter_set_invariants(blitter);
550 ilo_blitter_set_op(blitter, ILO_BLITTER_RECTLIST_RESOLVE_HIZ);
551
552 ilo_blitter_set_dsa(blitter, &dsa_state);
553 ilo_blitter_set_fb_from_resource(blitter, res, res->format, level, slice);
554 ilo_blitter_set_uses(blitter,
555 ILO_BLITTER_USE_DSA | ILO_BLITTER_USE_FB_DEPTH);
556
557 hiz_emit_rectlist(blitter);
558 }