Merge branch 'mesa_7_5_branch'
[mesa.git] / src / mesa / drivers / dri / i965 / brw_clip_line.c
1 /*
2 Copyright (C) Intel Corp. 2006. All Rights Reserved.
3 Intel funded Tungsten Graphics (http://www.tungstengraphics.com) to
4 develop this 3D driver.
5
6 Permission is hereby granted, free of charge, to any person obtaining
7 a copy of this software and associated documentation files (the
8 "Software"), to deal in the Software without restriction, including
9 without limitation the rights to use, copy, modify, merge, publish,
10 distribute, sublicense, and/or sell copies of the Software, and to
11 permit persons to whom the Software is furnished to do so, subject to
12 the following conditions:
13
14 The above copyright notice and this permission notice (including the
15 next paragraph) shall be included in all copies or substantial
16 portions of the Software.
17
18 THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND,
19 EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF
20 MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT.
21 IN NO EVENT SHALL THE COPYRIGHT OWNER(S) AND/OR ITS SUPPLIERS BE
22 LIABLE FOR ANY CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN AN ACTION
23 OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN CONNECTION
24 WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE SOFTWARE.
25
26 **********************************************************************/
27 /*
28 * Authors:
29 * Keith Whitwell <keith@tungstengraphics.com>
30 */
31
32 #include "main/glheader.h"
33 #include "main/macros.h"
34 #include "main/enums.h"
35 #include "shader/program.h"
36
37 #include "intel_batchbuffer.h"
38
39 #include "brw_defines.h"
40 #include "brw_context.h"
41 #include "brw_eu.h"
42 #include "brw_util.h"
43 #include "brw_clip.h"
44
45
46
47 static void brw_clip_line_alloc_regs( struct brw_clip_compile *c )
48 {
49 GLuint i = 0,j;
50
51 /* Register usage is static, precompute here:
52 */
53 c->reg.R0 = retype(brw_vec8_grf(i, 0), BRW_REGISTER_TYPE_UD); i++;
54
55 if (c->key.nr_userclip) {
56 c->reg.fixed_planes = brw_vec4_grf(i, 0);
57 i += (6 + c->key.nr_userclip + 1) / 2;
58
59 c->prog_data.curb_read_length = (6 + c->key.nr_userclip + 1) / 2;
60 }
61 else
62 c->prog_data.curb_read_length = 0;
63
64
65 /* Payload vertices plus space for more generated vertices:
66 */
67 for (j = 0; j < 4; j++) {
68 c->reg.vertex[j] = brw_vec4_grf(i, 0);
69 i += c->nr_regs;
70 }
71
72 c->reg.t = brw_vec1_grf(i, 0);
73 c->reg.t0 = brw_vec1_grf(i, 1);
74 c->reg.t1 = brw_vec1_grf(i, 2);
75 c->reg.planemask = retype(brw_vec1_grf(i, 3), BRW_REGISTER_TYPE_UD);
76 c->reg.plane_equation = brw_vec4_grf(i, 4);
77 i++;
78
79 c->reg.dp0 = brw_vec1_grf(i, 0); /* fixme - dp4 will clobber r.1,2,3 */
80 c->reg.dp1 = brw_vec1_grf(i, 4);
81 i++;
82
83 if (!c->key.nr_userclip) {
84 c->reg.fixed_planes = brw_vec8_grf(i, 0);
85 i++;
86 }
87
88 if (c->need_ff_sync) {
89 c->reg.ff_sync = retype(brw_vec1_grf(i, 0), BRW_REGISTER_TYPE_UD);
90 i++;
91 }
92
93 c->first_tmp = i;
94 c->last_tmp = i;
95
96 c->prog_data.urb_read_length = c->nr_regs; /* ? */
97 c->prog_data.total_grf = i;
98 }
99
100
101
102 /* Line clipping, more or less following the following algorithm:
103 *
104 * for (p=0;p<MAX_PLANES;p++) {
105 * if (clipmask & (1 << p)) {
106 * GLfloat dp0 = DOTPROD( vtx0, plane[p] );
107 * GLfloat dp1 = DOTPROD( vtx1, plane[p] );
108 *
109 * if (IS_NEGATIVE(dp1)) {
110 * GLfloat t = dp1 / (dp1 - dp0);
111 * if (t > t1) t1 = t;
112 * } else {
113 * GLfloat t = dp0 / (dp0 - dp1);
114 * if (t > t0) t0 = t;
115 * }
116 *
117 * if (t0 + t1 >= 1.0)
118 * return;
119 * }
120 * }
121 *
122 * interp( ctx, newvtx0, vtx0, vtx1, t0 );
123 * interp( ctx, newvtx1, vtx1, vtx0, t1 );
124 *
125 */
126 static void clip_and_emit_line( struct brw_clip_compile *c )
127 {
128 struct brw_compile *p = &c->func;
129 struct brw_indirect vtx0 = brw_indirect(0, 0);
130 struct brw_indirect vtx1 = brw_indirect(1, 0);
131 struct brw_indirect newvtx0 = brw_indirect(2, 0);
132 struct brw_indirect newvtx1 = brw_indirect(3, 0);
133 struct brw_indirect plane_ptr = brw_indirect(4, 0);
134 struct brw_instruction *plane_loop;
135 struct brw_instruction *plane_active;
136 struct brw_instruction *is_negative;
137 struct brw_instruction *is_neg2 = NULL;
138 struct brw_instruction *not_culled;
139 struct brw_reg v1_null_ud = retype(vec1(brw_null_reg()), BRW_REGISTER_TYPE_UD);
140
141 brw_MOV(p, get_addr_reg(vtx0), brw_address(c->reg.vertex[0]));
142 brw_MOV(p, get_addr_reg(vtx1), brw_address(c->reg.vertex[1]));
143 brw_MOV(p, get_addr_reg(newvtx0), brw_address(c->reg.vertex[2]));
144 brw_MOV(p, get_addr_reg(newvtx1), brw_address(c->reg.vertex[3]));
145 brw_MOV(p, get_addr_reg(plane_ptr), brw_clip_plane0_address(c));
146
147 /* Note: init t0, t1 together:
148 */
149 brw_MOV(p, vec2(c->reg.t0), brw_imm_f(0));
150
151 brw_clip_init_planes(c);
152 brw_clip_init_clipmask(c);
153
154 /* -ve rhw workaround */
155 if (BRW_IS_965(p->brw)) {
156 brw_set_conditionalmod(p, BRW_CONDITIONAL_NZ);
157 brw_AND(p, brw_null_reg(), get_element_ud(c->reg.R0, 2),
158 brw_imm_ud(1<<20));
159 brw_OR(p, c->reg.planemask, c->reg.planemask, brw_imm_ud(0x3f));
160 }
161
162 brw_set_predicate_control(p, BRW_PREDICATE_NONE);
163
164 plane_loop = brw_DO(p, BRW_EXECUTE_1);
165 {
166 /* if (planemask & 1)
167 */
168 brw_set_conditionalmod(p, BRW_CONDITIONAL_NZ);
169 brw_AND(p, v1_null_ud, c->reg.planemask, brw_imm_ud(1));
170
171 plane_active = brw_IF(p, BRW_EXECUTE_1);
172 {
173 if (c->key.nr_userclip)
174 brw_MOV(p, c->reg.plane_equation, deref_4f(plane_ptr, 0));
175 else
176 brw_MOV(p, c->reg.plane_equation, deref_4b(plane_ptr, 0));
177
178 /* dp = DP4(vtx->position, plane)
179 */
180 brw_DP4(p, vec4(c->reg.dp0), deref_4f(vtx0, c->offset[VERT_RESULT_HPOS]), c->reg.plane_equation);
181
182 /* if (IS_NEGATIVE(dp1))
183 */
184 brw_set_conditionalmod(p, BRW_CONDITIONAL_L);
185 brw_DP4(p, vec4(c->reg.dp1), deref_4f(vtx1, c->offset[VERT_RESULT_HPOS]), c->reg.plane_equation);
186 is_negative = brw_IF(p, BRW_EXECUTE_1);
187 {
188 /*
189 * Both can be negative on GM965/G965 due to RHW workaround
190 * if so, this object should be rejected.
191 */
192 if (BRW_IS_965(p->brw)) {
193 brw_CMP(p, vec1(brw_null_reg()), BRW_CONDITIONAL_LE, c->reg.dp0, brw_imm_f(0.0));
194 is_neg2 = brw_IF(p, BRW_EXECUTE_1);
195 {
196 brw_clip_kill_thread(c);
197 }
198 brw_ENDIF(p, is_neg2);
199 }
200
201 brw_ADD(p, c->reg.t, c->reg.dp1, negate(c->reg.dp0));
202 brw_math_invert(p, c->reg.t, c->reg.t);
203 brw_MUL(p, c->reg.t, c->reg.t, c->reg.dp1);
204
205 brw_CMP(p, vec1(brw_null_reg()), BRW_CONDITIONAL_G, c->reg.t, c->reg.t1 );
206 brw_MOV(p, c->reg.t1, c->reg.t);
207 brw_set_predicate_control(p, BRW_PREDICATE_NONE);
208 }
209 is_negative = brw_ELSE(p, is_negative);
210 {
211 /* Coming back in. We know that both cannot be negative
212 * because the line would have been culled in that case.
213 */
214
215 /* If both are positive, do nothing */
216 /* Only on GM965/G965 */
217 if (BRW_IS_965(p->brw)) {
218 brw_CMP(p, vec1(brw_null_reg()), BRW_CONDITIONAL_L, c->reg.dp0, brw_imm_f(0.0));
219 is_neg2 = brw_IF(p, BRW_EXECUTE_1);
220 }
221
222 {
223 brw_ADD(p, c->reg.t, c->reg.dp0, negate(c->reg.dp1));
224 brw_math_invert(p, c->reg.t, c->reg.t);
225 brw_MUL(p, c->reg.t, c->reg.t, c->reg.dp0);
226
227 brw_CMP(p, vec1(brw_null_reg()), BRW_CONDITIONAL_G, c->reg.t, c->reg.t0 );
228 brw_MOV(p, c->reg.t0, c->reg.t);
229 brw_set_predicate_control(p, BRW_PREDICATE_NONE);
230 }
231
232 if (BRW_IS_965(p->brw)) {
233 brw_ENDIF(p, is_neg2);
234 }
235 }
236 brw_ENDIF(p, is_negative);
237 }
238 brw_ENDIF(p, plane_active);
239
240 /* plane_ptr++;
241 */
242 brw_ADD(p, get_addr_reg(plane_ptr), get_addr_reg(plane_ptr), brw_clip_plane_stride(c));
243
244 /* while (planemask>>=1) != 0
245 */
246 brw_set_conditionalmod(p, BRW_CONDITIONAL_NZ);
247 brw_SHR(p, c->reg.planemask, c->reg.planemask, brw_imm_ud(1));
248 }
249 brw_WHILE(p, plane_loop);
250
251 brw_ADD(p, c->reg.t, c->reg.t0, c->reg.t1);
252 brw_CMP(p, vec1(brw_null_reg()), BRW_CONDITIONAL_L, c->reg.t, brw_imm_f(1.0));
253 not_culled = brw_IF(p, BRW_EXECUTE_1);
254 {
255 brw_clip_interp_vertex(c, newvtx0, vtx0, vtx1, c->reg.t0, GL_FALSE);
256 brw_clip_interp_vertex(c, newvtx1, vtx1, vtx0, c->reg.t1, GL_FALSE);
257
258 brw_clip_emit_vue(c, newvtx0, 1, 0, (_3DPRIM_LINESTRIP << 2) | R02_PRIM_START);
259 brw_clip_emit_vue(c, newvtx1, 0, 1, (_3DPRIM_LINESTRIP << 2) | R02_PRIM_END);
260 }
261 brw_ENDIF(p, not_culled);
262 brw_clip_kill_thread(c);
263 }
264
265
266
267 void brw_emit_line_clip( struct brw_clip_compile *c )
268 {
269 brw_clip_line_alloc_regs(c);
270 brw_clip_init_ff_sync(c);
271
272 if (c->key.do_flat_shading)
273 brw_clip_copy_colors(c, 0, 1);
274
275 clip_and_emit_line(c);
276 }