i965: clip: rename header_position_offset to the more correct ndc_offset.
[mesa.git] / src / mesa / drivers / dri / i965 / brw_clip.c
1 /*
2 Copyright (C) Intel Corp. 2006. All Rights Reserved.
3 Intel funded Tungsten Graphics (http://www.tungstengraphics.com) to
4 develop this 3D driver.
5
6 Permission is hereby granted, free of charge, to any person obtaining
7 a copy of this software and associated documentation files (the
8 "Software"), to deal in the Software without restriction, including
9 without limitation the rights to use, copy, modify, merge, publish,
10 distribute, sublicense, and/or sell copies of the Software, and to
11 permit persons to whom the Software is furnished to do so, subject to
12 the following conditions:
13
14 The above copyright notice and this permission notice (including the
15 next paragraph) shall be included in all copies or substantial
16 portions of the Software.
17
18 THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND,
19 EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF
20 MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT.
21 IN NO EVENT SHALL THE COPYRIGHT OWNER(S) AND/OR ITS SUPPLIERS BE
22 LIABLE FOR ANY CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN AN ACTION
23 OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN CONNECTION
24 WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE SOFTWARE.
25
26 **********************************************************************/
27 /*
28 * Authors:
29 * Keith Whitwell <keith@tungstengraphics.com>
30 */
31
32 #include "main/glheader.h"
33 #include "main/macros.h"
34 #include "main/enums.h"
35
36 #include "intel_batchbuffer.h"
37
38 #include "brw_defines.h"
39 #include "brw_context.h"
40 #include "brw_eu.h"
41 #include "brw_util.h"
42 #include "brw_state.h"
43 #include "brw_clip.h"
44
45 #include "glsl/ralloc.h"
46
47 #define FRONT_UNFILLED_BIT 0x1
48 #define BACK_UNFILLED_BIT 0x2
49
50
51 static void compile_clip_prog( struct brw_context *brw,
52 struct brw_clip_prog_key *key )
53 {
54 struct intel_context *intel = &brw->intel;
55 struct brw_clip_compile c;
56 const GLuint *program;
57 void *mem_ctx;
58 GLuint program_size;
59 GLuint delta;
60 GLuint i;
61 GLuint header_regs;
62
63 memset(&c, 0, sizeof(c));
64
65 mem_ctx = ralloc_context(NULL);
66
67 /* Begin the compilation:
68 */
69 brw_init_compile(brw, &c.func, mem_ctx);
70
71 c.func.single_program_flow = 1;
72
73 c.key = *key;
74 brw_compute_vue_map(&c.vue_map, intel, c.key.nr_userclip,
75 c.key.do_twoside_color, c.key.attrs);
76
77 /* Need to locate the two positions present in vertex + header.
78 * These are currently hardcoded:
79 */
80 c.ndc_offset = ATTR_SIZE;
81
82 if (intel->gen == 5)
83 header_regs = 3;
84 else
85 header_regs = 1;
86
87 delta = header_regs * REG_SIZE;
88
89 for (i = 0; i < VERT_RESULT_MAX; i++) {
90 if (c.key.attrs & BITFIELD64_BIT(i)) {
91 c.offset[i] = delta;
92 delta += ATTR_SIZE;
93
94 c.idx_to_attr[c.nr_attrs] = i;
95 c.nr_attrs++;
96 }
97 }
98
99 /* The vertex attributes start at a URB row-aligned offset after
100 * the 8-20 dword vertex header, and continue for a URB row-aligned
101 * length. nr_regs determines the urb_read_length from the start
102 * of the header to the end of the vertex data.
103 */
104 c.nr_regs = header_regs + (c.nr_attrs + 1) / 2;
105
106 c.nr_bytes = c.nr_regs * REG_SIZE;
107
108 c.prog_data.clip_mode = c.key.clip_mode; /* XXX */
109
110 /* For some reason the thread is spawned with only 4 channels
111 * unmasked.
112 */
113 brw_set_mask_control(&c.func, BRW_MASK_DISABLE);
114
115
116 /* Would ideally have the option of producing a program which could
117 * do all three:
118 */
119 switch (key->primitive) {
120 case GL_TRIANGLES:
121 if (key->do_unfilled)
122 brw_emit_unfilled_clip( &c );
123 else
124 brw_emit_tri_clip( &c );
125 break;
126 case GL_LINES:
127 brw_emit_line_clip( &c );
128 break;
129 case GL_POINTS:
130 brw_emit_point_clip( &c );
131 break;
132 default:
133 assert(0);
134 return;
135 }
136
137
138
139 /* get the program
140 */
141 program = brw_get_program(&c.func, &program_size);
142
143 if (unlikely(INTEL_DEBUG & DEBUG_CLIP)) {
144 printf("clip:\n");
145 for (i = 0; i < program_size / sizeof(struct brw_instruction); i++)
146 brw_disasm(stdout, &((struct brw_instruction *)program)[i],
147 intel->gen);
148 printf("\n");
149 }
150
151 brw_upload_cache(&brw->cache,
152 BRW_CLIP_PROG,
153 &c.key, sizeof(c.key),
154 program, program_size,
155 &c.prog_data, sizeof(c.prog_data),
156 &brw->clip.prog_offset, &brw->clip.prog_data);
157 ralloc_free(mem_ctx);
158 }
159
160 /* Calculate interpolants for triangle and line rasterization.
161 */
162 static void upload_clip_prog(struct brw_context *brw)
163 {
164 struct intel_context *intel = &brw->intel;
165 struct gl_context *ctx = &intel->ctx;
166 struct brw_clip_prog_key key;
167
168 memset(&key, 0, sizeof(key));
169
170 /* Populate the key:
171 */
172 /* BRW_NEW_REDUCED_PRIMITIVE */
173 key.primitive = brw->intel.reduced_primitive;
174 /* CACHE_NEW_VS_PROG */
175 key.attrs = brw->vs.prog_data->outputs_written;
176 /* _NEW_LIGHT */
177 key.do_flat_shading = (ctx->Light.ShadeModel == GL_FLAT);
178 key.pv_first = (ctx->Light.ProvokingVertex == GL_FIRST_VERTEX_CONVENTION);
179 key.do_twoside_color = (ctx->Light.Enabled && ctx->Light.Model.TwoSide);
180 /* _NEW_TRANSFORM */
181 key.nr_userclip = brw_count_bits(ctx->Transform.ClipPlanesEnabled);
182
183 if (intel->gen == 5)
184 key.clip_mode = BRW_CLIPMODE_KERNEL_CLIP;
185 else
186 key.clip_mode = BRW_CLIPMODE_NORMAL;
187
188 /* _NEW_POLYGON */
189 if (key.primitive == GL_TRIANGLES) {
190 if (ctx->Polygon.CullFlag &&
191 ctx->Polygon.CullFaceMode == GL_FRONT_AND_BACK)
192 key.clip_mode = BRW_CLIPMODE_REJECT_ALL;
193 else {
194 GLuint fill_front = CLIP_CULL;
195 GLuint fill_back = CLIP_CULL;
196 GLuint offset_front = 0;
197 GLuint offset_back = 0;
198
199 if (!ctx->Polygon.CullFlag ||
200 ctx->Polygon.CullFaceMode != GL_FRONT) {
201 switch (ctx->Polygon.FrontMode) {
202 case GL_FILL:
203 fill_front = CLIP_FILL;
204 offset_front = 0;
205 break;
206 case GL_LINE:
207 fill_front = CLIP_LINE;
208 offset_front = ctx->Polygon.OffsetLine;
209 break;
210 case GL_POINT:
211 fill_front = CLIP_POINT;
212 offset_front = ctx->Polygon.OffsetPoint;
213 break;
214 }
215 }
216
217 if (!ctx->Polygon.CullFlag ||
218 ctx->Polygon.CullFaceMode != GL_BACK) {
219 switch (ctx->Polygon.BackMode) {
220 case GL_FILL:
221 fill_back = CLIP_FILL;
222 offset_back = 0;
223 break;
224 case GL_LINE:
225 fill_back = CLIP_LINE;
226 offset_back = ctx->Polygon.OffsetLine;
227 break;
228 case GL_POINT:
229 fill_back = CLIP_POINT;
230 offset_back = ctx->Polygon.OffsetPoint;
231 break;
232 }
233 }
234
235 if (ctx->Polygon.BackMode != GL_FILL ||
236 ctx->Polygon.FrontMode != GL_FILL) {
237 key.do_unfilled = 1;
238
239 /* Most cases the fixed function units will handle. Cases where
240 * one or more polygon faces are unfilled will require help:
241 */
242 key.clip_mode = BRW_CLIPMODE_CLIP_NON_REJECTED;
243
244 if (offset_back || offset_front) {
245 /* _NEW_POLYGON, _NEW_BUFFERS */
246 key.offset_units = ctx->Polygon.OffsetUnits * brw->intel.polygon_offset_scale;
247 key.offset_factor = ctx->Polygon.OffsetFactor * ctx->DrawBuffer->_MRD;
248 }
249
250 switch (ctx->Polygon.FrontFace) {
251 case GL_CCW:
252 key.fill_ccw = fill_front;
253 key.fill_cw = fill_back;
254 key.offset_ccw = offset_front;
255 key.offset_cw = offset_back;
256 if (ctx->Light.Model.TwoSide &&
257 key.fill_cw != CLIP_CULL)
258 key.copy_bfc_cw = 1;
259 break;
260 case GL_CW:
261 key.fill_cw = fill_front;
262 key.fill_ccw = fill_back;
263 key.offset_cw = offset_front;
264 key.offset_ccw = offset_back;
265 if (ctx->Light.Model.TwoSide &&
266 key.fill_ccw != CLIP_CULL)
267 key.copy_bfc_ccw = 1;
268 break;
269 }
270 }
271 }
272 }
273
274 if (!brw_search_cache(&brw->cache, BRW_CLIP_PROG,
275 &key, sizeof(key),
276 &brw->clip.prog_offset, &brw->clip.prog_data)) {
277 compile_clip_prog( brw, &key );
278 }
279 }
280
281
282 const struct brw_tracked_state brw_clip_prog = {
283 .dirty = {
284 .mesa = (_NEW_LIGHT |
285 _NEW_TRANSFORM |
286 _NEW_POLYGON |
287 _NEW_BUFFERS),
288 .brw = (BRW_NEW_REDUCED_PRIMITIVE),
289 .cache = CACHE_NEW_VS_PROG
290 },
291 .prepare = upload_clip_prog
292 };