i965/fs: Rename demote_pull_constants to lower_constant_loads
[mesa.git] / src / mesa / drivers / dri / i965 / brw_sf.c
1 /*
2 Copyright (C) Intel Corp. 2006. All Rights Reserved.
3 Intel funded Tungsten Graphics to
4 develop this 3D driver.
5
6 Permission is hereby granted, free of charge, to any person obtaining
7 a copy of this software and associated documentation files (the
8 "Software"), to deal in the Software without restriction, including
9 without limitation the rights to use, copy, modify, merge, publish,
10 distribute, sublicense, and/or sell copies of the Software, and to
11 permit persons to whom the Software is furnished to do so, subject to
12 the following conditions:
13
14 The above copyright notice and this permission notice (including the
15 next paragraph) shall be included in all copies or substantial
16 portions of the Software.
17
18 THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND,
19 EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF
20 MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT.
21 IN NO EVENT SHALL THE COPYRIGHT OWNER(S) AND/OR ITS SUPPLIERS BE
22 LIABLE FOR ANY CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN AN ACTION
23 OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN CONNECTION
24 WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE SOFTWARE.
25
26 **********************************************************************/
27 /*
28 * Authors:
29 * Keith Whitwell <keithw@vmware.com>
30 */
31
32
33 #include "main/macros.h"
34 #include "main/mtypes.h"
35 #include "main/enums.h"
36 #include "main/fbobject.h"
37
38 #include "intel_batchbuffer.h"
39
40 #include "brw_defines.h"
41 #include "brw_context.h"
42 #include "brw_eu.h"
43 #include "brw_util.h"
44 #include "brw_sf.h"
45 #include "brw_state.h"
46
47 #include "util/ralloc.h"
48
49 static void compile_sf_prog( struct brw_context *brw,
50 struct brw_sf_prog_key *key )
51 {
52 struct brw_sf_compile c;
53 const GLuint *program;
54 void *mem_ctx;
55 GLuint program_size;
56
57 memset(&c, 0, sizeof(c));
58
59 mem_ctx = ralloc_context(NULL);
60 /* Begin the compilation:
61 */
62 brw_init_codegen(brw->intelScreen->devinfo, &c.func, mem_ctx);
63
64 c.key = *key;
65 c.vue_map = brw->vue_map_geom_out;
66 if (c.key.do_point_coord) {
67 /*
68 * gl_PointCoord is a FS instead of VS builtin variable, thus it's
69 * not included in c.vue_map generated in VS stage. Here we add
70 * it manually to let SF shader generate the needed interpolation
71 * coefficient for FS shader.
72 */
73 c.vue_map.varying_to_slot[BRW_VARYING_SLOT_PNTC] = c.vue_map.num_slots;
74 c.vue_map.slot_to_varying[c.vue_map.num_slots++] = BRW_VARYING_SLOT_PNTC;
75 }
76 c.urb_entry_read_offset = BRW_SF_URB_ENTRY_READ_OFFSET;
77 c.nr_attr_regs = (c.vue_map.num_slots + 1)/2 - c.urb_entry_read_offset;
78 c.nr_setup_regs = c.nr_attr_regs;
79
80 c.prog_data.urb_read_length = c.nr_attr_regs;
81 c.prog_data.urb_entry_size = c.nr_setup_regs * 2;
82 c.has_flat_shading = brw_any_flat_varyings(&key->interpolation_mode);
83
84 /* Which primitive? Or all three?
85 */
86 switch (key->primitive) {
87 case SF_TRIANGLES:
88 c.nr_verts = 3;
89 brw_emit_tri_setup( &c, true );
90 break;
91 case SF_LINES:
92 c.nr_verts = 2;
93 brw_emit_line_setup( &c, true );
94 break;
95 case SF_POINTS:
96 c.nr_verts = 1;
97 if (key->do_point_sprite)
98 brw_emit_point_sprite_setup( &c, true );
99 else
100 brw_emit_point_setup( &c, true );
101 break;
102 case SF_UNFILLED_TRIS:
103 c.nr_verts = 3;
104 brw_emit_anyprim_setup( &c );
105 break;
106 default:
107 unreachable("not reached");
108 }
109
110 /* FINISHME: SF programs use calculated jumps (i.e., JMPI with a register
111 * source). Compacting would be difficult.
112 */
113 /* brw_compact_instructions(&c.func, 0, 0, NULL); */
114
115 /* get the program
116 */
117 program = brw_get_program(&c.func, &program_size);
118
119 if (unlikely(INTEL_DEBUG & DEBUG_SF)) {
120 fprintf(stderr, "sf:\n");
121 brw_disassemble(brw->intelScreen->devinfo,
122 c.func.store, 0, program_size, stderr);
123 fprintf(stderr, "\n");
124 }
125
126 brw_upload_cache(&brw->cache, BRW_CACHE_SF_PROG,
127 &c.key, sizeof(c.key),
128 program, program_size,
129 &c.prog_data, sizeof(c.prog_data),
130 &brw->sf.prog_offset, &brw->sf.prog_data);
131 ralloc_free(mem_ctx);
132 }
133
134 /* Calculate interpolants for triangle and line rasterization.
135 */
136 static void
137 brw_upload_sf_prog(struct brw_context *brw)
138 {
139 struct gl_context *ctx = &brw->ctx;
140 struct brw_sf_prog_key key;
141 /* _NEW_BUFFERS */
142 bool render_to_fbo = _mesa_is_user_fbo(ctx->DrawBuffer);
143
144 memset(&key, 0, sizeof(key));
145
146 /* Populate the key, noting state dependencies:
147 */
148 /* BRW_NEW_VUE_MAP_GEOM_OUT */
149 key.attrs = brw->vue_map_geom_out.slots_valid;
150
151 /* BRW_NEW_REDUCED_PRIMITIVE */
152 switch (brw->reduced_primitive) {
153 case GL_TRIANGLES:
154 /* NOTE: We just use the edgeflag attribute as an indicator that
155 * unfilled triangles are active. We don't actually do the
156 * edgeflag testing here, it is already done in the clip
157 * program.
158 */
159 if (key.attrs & BITFIELD64_BIT(VARYING_SLOT_EDGE))
160 key.primitive = SF_UNFILLED_TRIS;
161 else
162 key.primitive = SF_TRIANGLES;
163 break;
164 case GL_LINES:
165 key.primitive = SF_LINES;
166 break;
167 case GL_POINTS:
168 key.primitive = SF_POINTS;
169 break;
170 }
171
172 /* _NEW_TRANSFORM */
173 key.userclip_active = (ctx->Transform.ClipPlanesEnabled != 0);
174
175 /* _NEW_POINT */
176 key.do_point_sprite = ctx->Point.PointSprite;
177 if (key.do_point_sprite) {
178 int i;
179
180 for (i = 0; i < 8; i++) {
181 if (ctx->Point.CoordReplace[i])
182 key.point_sprite_coord_replace |= (1 << i);
183 }
184 }
185 if (brw->fragment_program->Base.InputsRead & BITFIELD64_BIT(VARYING_SLOT_PNTC))
186 key.do_point_coord = 1;
187 /*
188 * Window coordinates in a FBO are inverted, which means point
189 * sprite origin must be inverted, too.
190 */
191 if ((ctx->Point.SpriteOrigin == GL_LOWER_LEFT) != render_to_fbo)
192 key.sprite_origin_lower_left = true;
193
194 /* BRW_NEW_INTERPOLATION_MAP */
195 key.interpolation_mode = brw->interpolation_mode;
196
197 /* _NEW_LIGHT | _NEW_PROGRAM */
198 key.do_twoside_color = ((ctx->Light.Enabled && ctx->Light.Model.TwoSide) ||
199 ctx->VertexProgram._TwoSideEnabled);
200
201 /* _NEW_POLYGON */
202 if (key.do_twoside_color) {
203 /* If we're rendering to a FBO, we have to invert the polygon
204 * face orientation, just as we invert the viewport in
205 * sf_unit_create_from_key().
206 */
207 key.frontface_ccw = ctx->Polygon._FrontBit == render_to_fbo;
208 }
209
210 if (!brw_search_cache(&brw->cache, BRW_CACHE_SF_PROG,
211 &key, sizeof(key),
212 &brw->sf.prog_offset, &brw->sf.prog_data)) {
213 compile_sf_prog( brw, &key );
214 }
215 }
216
217
218 const struct brw_tracked_state brw_sf_prog = {
219 .dirty = {
220 .mesa = _NEW_BUFFERS |
221 _NEW_HINT |
222 _NEW_LIGHT |
223 _NEW_POINT |
224 _NEW_POLYGON |
225 _NEW_PROGRAM |
226 _NEW_TRANSFORM,
227 .brw = BRW_NEW_INTERPOLATION_MAP |
228 BRW_NEW_REDUCED_PRIMITIVE |
229 BRW_NEW_VUE_MAP_GEOM_OUT,
230 },
231 .emit = brw_upload_sf_prog
232 };
233