Merge branch 'sprite-coord'
[mesa.git] / src / gallium / drivers / llvmpipe / lp_setup_point.c
1 /**************************************************************************
2 *
3 * Copyright 2010, VMware Inc.
4 * All Rights Reserved.
5 *
6 * Permission is hereby granted, free of charge, to any person obtaining a
7 * copy of this software and associated documentation files (the
8 * "Software"), to deal in the Software without restriction, including
9 * without limitation the rights to use, copy, modify, merge, publish,
10 * distribute, sub license, and/or sell copies of the Software, and to
11 * permit persons to whom the Software is furnished to do so, subject to
12 * the following conditions:
13 *
14 * The above copyright notice and this permission notice (including the
15 * next paragraph) shall be included in all copies or substantial portions
16 * of the Software.
17 *
18 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS
19 * OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF
20 * MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND NON-INFRINGEMENT.
21 * IN NO EVENT SHALL VMWARE AND/OR ITS SUPPLIERS BE LIABLE FOR
22 * ANY CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT,
23 * TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN CONNECTION WITH THE
24 * SOFTWARE OR THE USE OR OTHER DEALINGS IN THE SOFTWARE.
25 *
26 **************************************************************************/
27
28 /*
29 * Binning code for points
30 */
31
32 #include "lp_setup_context.h"
33 #include "util/u_math.h"
34 #include "util/u_memory.h"
35 #include "lp_perf.h"
36 #include "lp_setup_context.h"
37 #include "lp_rast.h"
38 #include "lp_state_fs.h"
39 #include "tgsi/tgsi_scan.h"
40
/* Number of channels per attribute; upper bound of the per-channel loops
 * in setup_point_coefficients(), which test bit i of the usage mask for
 * each channel i.
 */
#define NUM_CHANNELS 4
42
/**
 * Per-point values handed to the coefficient setup helpers.
 *
 * try_setup_point() stores the snapped point width in dx12 and dy01 and
 * zero in dx01 and dy12.
 */
struct point_info {
   /* y deltas */
   int dy01;
   int dy12;

   /* x deltas */
   int dx01;
   int dx12;

   /* Vertex attribute array; v0[0] is read as the position. */
   const float (*v0)[4];
};
50
51
52 /**
53 * Compute a0 for a constant-valued coefficient (GL_FLAT shading).
54 */
55 static void
56 constant_coef(struct lp_setup_context *setup,
57 struct lp_rast_triangle *point,
58 unsigned slot,
59 const float value,
60 unsigned i)
61 {
62 point->inputs.a0[slot][i] = value;
63 point->inputs.dadx[slot][i] = 0.0f;
64 point->inputs.dady[slot][i] = 0.0f;
65 }
66
67
68 static void
69 perspective_coef(struct lp_setup_context *setup,
70 struct lp_rast_triangle *point,
71 const struct point_info *info,
72 unsigned slot,
73 unsigned vert_attr,
74 unsigned i,
75 unsigned sprite_coord_origin)
76 {
77 if (i == 0) {
78 float dadx = FIXED_ONE / (float)info->dx12;
79 float dady = 0.0f;
80 point->inputs.dadx[slot][i] = dadx;
81 point->inputs.dady[slot][i] = dady;
82 point->inputs.a0[slot][i] = (0.5 -
83 (dadx * ((float)info->v0[0][0] - setup->pixel_offset) +
84 dady * ((float)info->v0[0][1] - setup->pixel_offset)));
85 }
86 else if (i == 1) {
87 float dadx = 0.0f;
88 float dady = FIXED_ONE / (float)info->dx12;
89
90 if (sprite_coord_origin == PIPE_SPRITE_COORD_LOWER_LEFT) {
91 dady = -dady;
92 }
93
94 point->inputs.dadx[slot][i] = dadx;
95 point->inputs.dady[slot][i] = dady;
96 point->inputs.a0[slot][i] = (0.5 -
97 (dadx * ((float)info->v0[0][0] - setup->pixel_offset) +
98 dady * ((float)info->v0[0][1] - setup->pixel_offset)));
99 }
100 else if (i == 2) {
101 point->inputs.a0[slot][i] = 0.0f;
102 point->inputs.dadx[slot][i] = 0.0f;
103 point->inputs.dady[slot][i] = 0.0f;
104 }
105 else if (i == 3) {
106 point->inputs.a0[slot][i] = 1.0f;
107 point->inputs.dadx[slot][i] = 0.0f;
108 point->inputs.dady[slot][i] = 0.0f;
109 }
110 }
111
112
113 /**
114 * Special coefficient setup for gl_FragCoord.
115 * X and Y are trivial
116 * Z and W are copied from position_coef which should have already been computed.
117 * We could do a bit less work if we'd examine gl_FragCoord's swizzle mask.
118 */
119 static void
120 setup_point_fragcoord_coef(struct lp_setup_context *setup,
121 struct lp_rast_triangle *point,
122 const struct point_info *info,
123 unsigned slot,
124 unsigned usage_mask)
125 {
126 /*X*/
127 if (usage_mask & TGSI_WRITEMASK_X) {
128 point->inputs.a0[slot][0] = 0.0;
129 point->inputs.dadx[slot][0] = 1.0;
130 point->inputs.dady[slot][0] = 0.0;
131 }
132
133 /*Y*/
134 if (usage_mask & TGSI_WRITEMASK_Y) {
135 point->inputs.a0[slot][1] = 0.0;
136 point->inputs.dadx[slot][1] = 0.0;
137 point->inputs.dady[slot][1] = 1.0;
138 }
139
140 /*Z*/
141 if (usage_mask & TGSI_WRITEMASK_Z) {
142 constant_coef(setup, point, slot, info->v0[0][2], 2);
143 }
144
145 /*W*/
146 if (usage_mask & TGSI_WRITEMASK_W) {
147 constant_coef(setup, point, slot, info->v0[0][3], 3);
148 }
149 }
150
151
152 /**
153 * Compute the point->coef[] array dadx, dady, a0 values.
154 */
155 static void
156 setup_point_coefficients( struct lp_setup_context *setup,
157 struct lp_rast_triangle *point,
158 const struct point_info *info)
159 {
160 const struct lp_fragment_shader *shader = setup->fs.current.variant->shader;
161 unsigned fragcoord_usage_mask = TGSI_WRITEMASK_XYZ;
162 unsigned slot;
163
164 /* setup interpolation for all the remaining attributes:
165 */
166 for (slot = 0; slot < setup->fs.nr_inputs; slot++) {
167 unsigned vert_attr = setup->fs.input[slot].src_index;
168 unsigned usage_mask = setup->fs.input[slot].usage_mask;
169 unsigned i;
170
171 switch (setup->fs.input[slot].interp) {
172 case LP_INTERP_POSITION:
173 /*
174 * The generated pixel interpolators will pick up the coeffs from
175 * slot 0, so all need to ensure that the usage mask is covers all
176 * usages.
177 */
178 fragcoord_usage_mask |= usage_mask;
179 break;
180
181 case LP_INTERP_LINEAR:
182 /* Sprite tex coords may use linear interpolation someday */
183 /* fall-through */
184
185 case LP_INTERP_PERSPECTIVE:
186 /* check if the sprite coord flag is set for this attribute.
187 * If so, set it up so it up so x any y vary from 0 to 1.
188 */
189 if (shader->info.input_semantic_name[slot] == TGSI_SEMANTIC_GENERIC) {
190 const int index = shader->info.input_semantic_index[slot];
191 /* Note that sprite_coord enable is a bitfield of
192 * PIPE_MAX_SHADER_OUTPUTS bits.
193 */
194 if (index < PIPE_MAX_SHADER_OUTPUTS &&
195 (setup->sprite_coord_enable & (1 << index))) {
196 for (i = 0; i < NUM_CHANNELS; i++)
197 if (usage_mask & (1 << i))
198 perspective_coef(setup, point, info, slot+1, vert_attr, i,
199 setup->sprite_coord_origin);
200 fragcoord_usage_mask |= TGSI_WRITEMASK_W;
201 break;
202 }
203 }
204
205 /* Otherwise fallthrough */
206 default:
207 for (i = 0; i < NUM_CHANNELS; i++) {
208 if (usage_mask & (1 << i))
209 constant_coef(setup, point, slot+1, info->v0[vert_attr][i], i);
210 }
211 }
212 }
213
214 /* The internal position input is in slot zero:
215 */
216 setup_point_fragcoord_coef(setup, point, info, 0,
217 fragcoord_usage_mask);
218 }
219
220
221 static INLINE int
222 subpixel_snap(float a)
223 {
224 return util_iround(FIXED_ONE * a);
225 }
226
227
228 static boolean
229 try_setup_point( struct lp_setup_context *setup,
230 const float (*v0)[4] )
231 {
232 /* x/y positions in fixed point */
233 const int sizeAttr = setup->psize;
234 const float size
235 = (setup->point_size_per_vertex && sizeAttr > 0) ? v0[sizeAttr][0]
236 : setup->point_size;
237
238 /* Point size as fixed point integer, remove rounding errors
239 * and gives minimum width for very small points
240 */
241 int fixed_width = MAX2(FIXED_ONE,
242 (subpixel_snap(size) + FIXED_ONE/2 - 1) & ~(FIXED_ONE-1));
243
244 const int x0 = subpixel_snap(v0[0][0] - setup->pixel_offset) - fixed_width/2;
245 const int y0 = subpixel_snap(v0[0][1] - setup->pixel_offset) - fixed_width/2;
246
247 struct lp_scene *scene = setup->scene;
248 struct lp_rast_triangle *point;
249 unsigned bytes;
250 struct u_rect bbox;
251 unsigned nr_planes = 4;
252 struct point_info info;
253
254
255 /* Bounding rectangle (in pixels) */
256 {
257 /* Yes this is necessary to accurately calculate bounding boxes
258 * with the two fill-conventions we support. GL (normally) ends
259 * up needing a bottom-left fill convention, which requires
260 * slightly different rounding.
261 */
262 int adj = (setup->pixel_offset != 0) ? 1 : 0;
263
264 bbox.x0 = (x0 + (FIXED_ONE-1) + adj) >> FIXED_ORDER;
265 bbox.x1 = (x0 + fixed_width + (FIXED_ONE-1) + adj) >> FIXED_ORDER;
266 bbox.y0 = (y0 + (FIXED_ONE-1)) >> FIXED_ORDER;
267 bbox.y1 = (y0 + fixed_width + (FIXED_ONE-1)) >> FIXED_ORDER;
268
269 /* Inclusive coordinates:
270 */
271 bbox.x1--;
272 bbox.y1--;
273 }
274
275 if (!u_rect_test_intersection(&setup->draw_region, &bbox)) {
276 if (0) debug_printf("offscreen\n");
277 LP_COUNT(nr_culled_tris);
278 return TRUE;
279 }
280
281 u_rect_find_intersection(&setup->draw_region, &bbox);
282
283 point = lp_setup_alloc_triangle(scene,
284 setup->fs.nr_inputs,
285 nr_planes,
286 &bytes);
287 if (!point)
288 return FALSE;
289
290 #ifdef DEBUG
291 point->v[0][0] = v0[0][0];
292 point->v[0][1] = v0[0][1];
293 #endif
294
295 info.v0 = v0;
296 info.dx01 = 0;
297 info.dx12 = fixed_width;
298 info.dy01 = fixed_width;
299 info.dy12 = 0;
300
301 /* Setup parameter interpolants:
302 */
303 setup_point_coefficients(setup, point, &info);
304
305 point->inputs.facing = 1.0F;
306 point->inputs.state = setup->fs.stored;
307 point->inputs.disable = FALSE;
308 point->inputs.opaque = FALSE;
309
310 {
311 point->plane[0].dcdx = -1;
312 point->plane[0].dcdy = 0;
313 point->plane[0].c = 1-bbox.x0;
314 point->plane[0].ei = 0;
315 point->plane[0].eo = 1;
316
317 point->plane[1].dcdx = 1;
318 point->plane[1].dcdy = 0;
319 point->plane[1].c = bbox.x1+1;
320 point->plane[1].ei = -1;
321 point->plane[1].eo = 0;
322
323 point->plane[2].dcdx = 0;
324 point->plane[2].dcdy = 1;
325 point->plane[2].c = 1-bbox.y0;
326 point->plane[2].ei = 0;
327 point->plane[2].eo = 1;
328
329 point->plane[3].dcdx = 0;
330 point->plane[3].dcdy = -1;
331 point->plane[3].c = bbox.y1+1;
332 point->plane[3].ei = -1;
333 point->plane[3].eo = 0;
334 }
335
336 return lp_setup_bin_triangle(setup, point, &bbox, nr_planes);
337 }
338
339
/**
 * Set up a point, retrying once after lp_setup_flush_and_restart() if
 * the first attempt fails.  A second failure trips an assertion.
 */
static void
lp_setup_point(struct lp_setup_context *setup,
               const float (*v0)[4])
{
   if (try_setup_point(setup, v0)) {
      return;
   }

   /* First attempt failed: flush, restart and try once more. */
   lp_setup_flush_and_restart(setup);

   if (!try_setup_point(setup, v0)) {
      assert(0);
   }
}
352
353
354 void
355 lp_setup_choose_point( struct lp_setup_context *setup )
356 {
357 setup->point = lp_setup_point;
358 }
359
360