vc4: Disable early Z with computed depth.
[mesa.git] / src / gallium / drivers / vc4 / vc4_emit.c
1 /*
2 * Copyright © 2014 Broadcom
3 *
4 * Permission is hereby granted, free of charge, to any person obtaining a
5 * copy of this software and associated documentation files (the "Software"),
6 * to deal in the Software without restriction, including without limitation
7 * the rights to use, copy, modify, merge, publish, distribute, sublicense,
8 * and/or sell copies of the Software, and to permit persons to whom the
9 * Software is furnished to do so, subject to the following conditions:
10 *
11 * The above copyright notice and this permission notice (including the next
12 * paragraph) shall be included in all copies or substantial portions of the
13 * Software.
14 *
15 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
16 * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
17 * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL
18 * THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
19 * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING
20 * FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS
21 * IN THE SOFTWARE.
22 */
23
24 #include "vc4_context.h"
25
26 void
27 vc4_emit_state(struct pipe_context *pctx)
28 {
29 struct vc4_context *vc4 = vc4_context(pctx);
30
31 struct vc4_cl_out *bcl = cl_start(&vc4->bcl);
32 if (vc4->dirty & (VC4_DIRTY_SCISSOR | VC4_DIRTY_VIEWPORT |
33 VC4_DIRTY_RASTERIZER)) {
34 float *vpscale = vc4->viewport.scale;
35 float *vptranslate = vc4->viewport.translate;
36 float vp_minx = -fabsf(vpscale[0]) + vptranslate[0];
37 float vp_maxx = fabsf(vpscale[0]) + vptranslate[0];
38 float vp_miny = -fabsf(vpscale[1]) + vptranslate[1];
39 float vp_maxy = fabsf(vpscale[1]) + vptranslate[1];
40
41 /* Clip to the scissor if it's enabled, but still clip to the
42 * drawable regardless since that controls where the binner
43 * tries to put things.
44 *
45 * Additionally, always clip the rendering to the viewport,
46 * since the hardware does guardband clipping, meaning
47 * primitives would rasterize outside of the view volume.
48 */
49 uint32_t minx, miny, maxx, maxy;
50 if (!vc4->rasterizer->base.scissor) {
51 minx = MAX2(vp_minx, 0);
52 miny = MAX2(vp_miny, 0);
53 maxx = MIN2(vp_maxx, vc4->draw_width);
54 maxy = MIN2(vp_maxy, vc4->draw_height);
55 } else {
56 minx = MAX2(vp_minx, vc4->scissor.minx);
57 miny = MAX2(vp_miny, vc4->scissor.miny);
58 maxx = MIN2(vp_maxx, vc4->scissor.maxx);
59 maxy = MIN2(vp_maxy, vc4->scissor.maxy);
60 }
61
62 cl_u8(&bcl, VC4_PACKET_CLIP_WINDOW);
63 cl_u16(&bcl, minx);
64 cl_u16(&bcl, miny);
65 cl_u16(&bcl, maxx - minx);
66 cl_u16(&bcl, maxy - miny);
67
68 vc4->draw_min_x = MIN2(vc4->draw_min_x, minx);
69 vc4->draw_min_y = MIN2(vc4->draw_min_y, miny);
70 vc4->draw_max_x = MAX2(vc4->draw_max_x, maxx);
71 vc4->draw_max_y = MAX2(vc4->draw_max_y, maxy);
72 }
73
74 if (vc4->dirty & (VC4_DIRTY_RASTERIZER |
75 VC4_DIRTY_ZSA |
76 VC4_DIRTY_COMPILED_FS)) {
77 uint8_t ez_enable_mask_out = ~0;
78
79 /* HW-2905: If the RCL ends up doing a full-res load when
80 * multisampling, then early Z tracking may end up with values
81 * from the previous tile due to a HW bug. Disable it to
82 * avoid that.
83 *
84 * We should be able to skip this when the Z is cleared, but I
85 * was seeing bad rendering on glxgears -samples 4 even in
86 * that case.
87 */
88 if (vc4->msaa || vc4->prog.fs->disable_early_z)
89 ez_enable_mask_out &= ~VC4_CONFIG_BITS_EARLY_Z;
90
91 cl_u8(&bcl, VC4_PACKET_CONFIGURATION_BITS);
92 cl_u8(&bcl,
93 vc4->rasterizer->config_bits[0] |
94 vc4->zsa->config_bits[0]);
95 cl_u8(&bcl,
96 vc4->rasterizer->config_bits[1] |
97 vc4->zsa->config_bits[1]);
98 cl_u8(&bcl,
99 (vc4->rasterizer->config_bits[2] |
100 vc4->zsa->config_bits[2]) & ez_enable_mask_out);
101 }
102
103 if (vc4->dirty & VC4_DIRTY_RASTERIZER) {
104 cl_u8(&bcl, VC4_PACKET_DEPTH_OFFSET);
105 cl_u16(&bcl, vc4->rasterizer->offset_factor);
106 cl_u16(&bcl, vc4->rasterizer->offset_units);
107
108 cl_u8(&bcl, VC4_PACKET_POINT_SIZE);
109 cl_f(&bcl, vc4->rasterizer->point_size);
110
111 cl_u8(&bcl, VC4_PACKET_LINE_WIDTH);
112 cl_f(&bcl, vc4->rasterizer->base.line_width);
113 }
114
115 if (vc4->dirty & VC4_DIRTY_VIEWPORT) {
116 cl_u8(&bcl, VC4_PACKET_CLIPPER_XY_SCALING);
117 cl_f(&bcl, vc4->viewport.scale[0] * 16.0f);
118 cl_f(&bcl, vc4->viewport.scale[1] * 16.0f);
119
120 cl_u8(&bcl, VC4_PACKET_CLIPPER_Z_SCALING);
121 cl_f(&bcl, vc4->viewport.translate[2]);
122 cl_f(&bcl, vc4->viewport.scale[2]);
123
124 cl_u8(&bcl, VC4_PACKET_VIEWPORT_OFFSET);
125 cl_u16(&bcl, 16 * vc4->viewport.translate[0]);
126 cl_u16(&bcl, 16 * vc4->viewport.translate[1]);
127 }
128
129 if (vc4->dirty & VC4_DIRTY_FLAT_SHADE_FLAGS) {
130 cl_u8(&bcl, VC4_PACKET_FLAT_SHADE_FLAGS);
131 cl_u32(&bcl, vc4->rasterizer->base.flatshade ?
132 vc4->prog.fs->color_inputs : 0);
133 }
134
135 cl_end(&vc4->bcl, bcl);
136 }