1 /**************************************************************************
3 * Copyright 2010, VMware Inc.
6 * Permission is hereby granted, free of charge, to any person obtaining a
7 * copy of this software and associated documentation files (the
8 * "Software"), to deal in the Software without restriction, including
9 * without limitation the rights to use, copy, modify, merge, publish,
10 * distribute, sub license, and/or sell copies of the Software, and to
11 * permit persons to whom the Software is furnished to do so, subject to
12 * the following conditions:
14 * The above copyright notice and this permission notice (including the
15 * next paragraph) shall be included in all copies or substantial portions
18 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS
19 * OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF
20 * MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND NON-INFRINGEMENT.
21 * IN NO EVENT SHALL VMWARE AND/OR ITS SUPPLIERS BE LIABLE FOR
22 * ANY CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT,
23 * TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN CONNECTION WITH THE
24 * SOFTWARE OR THE USE OR OTHER DEALINGS IN THE SOFTWARE.
26 **************************************************************************/
29 * Binning code for points
32 #include "lp_setup_context.h"
33 #include "util/u_math.h"
34 #include "util/u_memory.h"
36 #include "lp_setup_context.h"
38 #include "lp_state_fs.h"
39 #include "tgsi/tgsi_scan.h"
41 #define NUM_CHANNELS 4
53 * Compute a0 for a constant-valued coefficient (GL_FLAT shading).
/*
 * constant_coef: write one constant-valued attribute channel into the
 * point's interpolation inputs.
 *
 * For channel `i` of input `slot`, a0 receives `value` and both
 * gradients (dadx, dady) are set to zero.
 *
 * `setup` is not referenced by the statements visible here.
 *
 * NOTE(review): this listing jumps from embedded line 56 to 61, so the
 * declarations of `slot`, `value` and `i`, the opening brace and the
 * closing brace are not visible; their types should be confirmed against
 * the complete file.
 */
55 static void constant_coef( struct lp_setup_context
*setup
,
56 struct lp_rast_triangle
*point
,
61 point
->inputs
.a0
[slot
][i
] = value
;
62 point
->inputs
.dadx
[slot
][i
] = 0.0f
;
63 point
->inputs
.dady
[slot
][i
] = 0.0f
;
/*
 * perspective_coef: fill a0/dadx/dady for one channel `i` of input `slot`
 * with coefficients that vary across the point instead of being constant.
 * The only visible caller uses it for inputs flagged in setup->sprite
 * ("For point sprite textures").
 *
 * Four coefficient variants are visible below:
 *   - gradient FIXED_ONE / info->dx12 along x,
 *   - gradient FIXED_ONE / info->dx12 along y,
 *   - a0 = 0 with zero gradients,
 *   - a0 = 1 with zero gradients.
 * For the two sloped variants a0 is
 *   0.5 - (dadx * (x - pixel_offset) + dady * (y - pixel_offset))
 * where x, y are info->v0[0][0] and info->v0[0][1].
 *
 * NOTE(review): the conditions selecting each variant, the remaining
 * parameters (the caller passes slot, vert_attr and i after `info`) and
 * all braces are missing from this listing. Presumably the variants map
 * to i == 0, 1, 2, 3 in order - confirm against the complete file.
 */
66 static void perspective_coef( struct lp_setup_context
*setup
,
67 struct lp_rast_triangle
*point
,
68 const struct point_info
*info
,
/*
 * First variant: slope along x. The declaration of `dady` (embedded
 * line 75) is not visible; presumably it is zero here - TODO confirm.
 */
74 float dadx
= FIXED_ONE
/ (float)info
->dx12
;
76 point
->inputs
.dadx
[slot
][i
] = dadx
;
77 point
->inputs
.dady
[slot
][i
] = dady
;
78 point
->inputs
.a0
[slot
][i
] = (0.5 -
79 (dadx
* ((float)info
->v0
[0][0] - setup
->pixel_offset
) +
80 dady
* ((float)info
->v0
[0][1] - setup
->pixel_offset
)));
/*
 * Second variant: slope along y. This divides by info->dx12 rather than
 * info->dy01; the visible caller (lp_setup_point) sets both fields to the
 * same fixed_width, so the result is the same there. The declaration of
 * `dadx` (embedded line 84) is not visible; presumably zero - TODO confirm.
 */
85 float dady
= FIXED_ONE
/ (float)info
->dx12
;
87 point
->inputs
.dadx
[slot
][i
] = dadx
;
88 point
->inputs
.dady
[slot
][i
] = dady
;
89 point
->inputs
.a0
[slot
][i
] = (0.5 -
90 (dadx
* ((float)info
->v0
[0][0] - setup
->pixel_offset
) +
91 dady
* ((float)info
->v0
[0][1] - setup
->pixel_offset
)));
/* Third variant: the channel is the constant 0. */
95 point
->inputs
.a0
[slot
][i
] = 0.0f
;
96 point
->inputs
.dadx
[slot
][i
] = 0.0f
;
97 point
->inputs
.dady
[slot
][i
] = 0.0f
;
/* Fourth variant: the channel is the constant 1. */
101 point
->inputs
.a0
[slot
][i
] = 1.0f
;
102 point
->inputs
.dadx
[slot
][i
] = 0.0f
;
103 point
->inputs
.dady
[slot
][i
] = 0.0f
;
110 * Special coefficient setup for gl_FragCoord.
111 * X and Y are trivial
112 * Z and W are constant across the point, taken from the vertex position (info->v0[0][2] and info->v0[0][3]).
113 * We could do a bit less work if we'd examine gl_FragCoord's swizzle mask.
/*
 * setup_point_fragcoord_coef: fill the position (gl_FragCoord)
 * coefficients of input `slot`, one channel per bit set in `usage_mask`.
 *
 *   TGSI_WRITEMASK_X: a0 = 0, dadx = 1, dady = 0
 *   TGSI_WRITEMASK_Y: a0 = 0, dadx = 0, dady = 1
 *   TGSI_WRITEMASK_Z: constant, info->v0[0][2] (via constant_coef)
 *   TGSI_WRITEMASK_W: constant, info->v0[0][3] (via constant_coef)
 *
 * Channels whose mask bit is clear are left untouched.
 *
 * NOTE(review): the return type, the `slot` and `usage_mask` parameter
 * declarations and the closing braces of each `if` are missing from this
 * listing (embedded lines 115, 119-122, 127-129, ...).
 */
116 setup_point_fragcoord_coef(struct lp_setup_context
*setup
,
117 struct lp_rast_triangle
*point
,
118 const struct point_info
*info
,
/* X: value equals the x coordinate (unit slope in x, none in y). */
123 if (usage_mask
& TGSI_WRITEMASK_X
) {
124 point
->inputs
.a0
[slot
][0] = 0.0;
125 point
->inputs
.dadx
[slot
][0] = 1.0;
126 point
->inputs
.dady
[slot
][0] = 0.0;
/* Y: value equals the y coordinate (unit slope in y, none in x). */
130 if (usage_mask
& TGSI_WRITEMASK_Y
) {
131 point
->inputs
.a0
[slot
][1] = 0.0;
132 point
->inputs
.dadx
[slot
][1] = 0.0;
133 point
->inputs
.dady
[slot
][1] = 1.0;
/* Z: constant, taken from component 2 of the vertex's attribute 0. */
137 if (usage_mask
& TGSI_WRITEMASK_Z
) {
138 constant_coef(setup
, point
, slot
, info
->v0
[0][2], 2);
/* W: constant, taken from component 3 of the vertex's attribute 0. */
142 if (usage_mask
& TGSI_WRITEMASK_W
) {
143 constant_coef(setup
, point
, slot
, info
->v0
[0][3], 3);
148 * Compute the point->inputs a0, dadx and dady coefficient arrays.
/*
 * setup_point_coefficients: fill point->inputs for every fragment shader
 * input of the current point.
 *
 * For each slot in [0, setup->fs.nr_inputs) it reads the input's source
 * vertex attribute (src_index) and channel usage_mask, then dispatches on
 * the input's interp mode:
 *
 *   LP_INTERP_POSITION    - only ORs usage_mask into fragcoord_usage_mask;
 *                           the position coefficients are written at the end.
 *   LP_INTERP_PERSPECTIVE - if the input's semantic name is
 *                           TGSI_SEMANTIC_GENERIC and the bit for its
 *                           semantic index is set in setup->sprite, each
 *                           used channel is set up with perspective_coef()
 *                           and W is added to fragcoord_usage_mask.
 *   otherwise             - each used channel is set up with
 *                           constant_coef() from info->v0[vert_attr][i].
 *
 * Attribute coefficients are written to slot+1, and the position is
 * written last to slot 0 with setup_point_fragcoord_coef().
 * fragcoord_usage_mask starts as TGSI_WRITEMASK_XYZ.
 *
 * NOTE(review): the return type, the declarations of `slot` and `i`, any
 * break statements or further case labels and all closing braces are
 * missing from this listing, so the exact fall-through structure of the
 * switch cannot be confirmed from here.
 * NOTE(review): `1 << index` uses an int `index` read from
 * input_semantic_index; this presumably relies on index being below the
 * width of int - confirm against the shader limits.
 */
151 setup_point_coefficients( struct lp_setup_context
*setup
,
152 struct lp_rast_triangle
*point
,
153 const struct point_info
*info
)
155 unsigned fragcoord_usage_mask
= TGSI_WRITEMASK_XYZ
;
158 /* setup interpolation for all the remaining attributes:
160 for (slot
= 0; slot
< setup
->fs
.nr_inputs
; slot
++) {
161 unsigned vert_attr
= setup
->fs
.input
[slot
].src_index
;
162 unsigned usage_mask
= setup
->fs
.input
[slot
].usage_mask
;
165 switch (setup
->fs
.input
[slot
].interp
) {
166 case LP_INTERP_POSITION
:
168 * The generated pixel interpolators will pick up the coeffs from
169 * slot 0, so all need to ensure that the usage mask is covers all
172 fragcoord_usage_mask
|= usage_mask
;
175 case LP_INTERP_PERSPECTIVE
:
176 /* For point sprite textures */
177 if (setup
->fs
.current
.variant
->shader
->info
.input_semantic_name
[slot
]
178 == TGSI_SEMANTIC_GENERIC
)
180 int index
= setup
->fs
.current
.variant
->shader
->info
.input_semantic_index
[slot
];
182 if (setup
->sprite
& (1 << index
)) {
183 for (i
= 0; i
< NUM_CHANNELS
; i
++)
184 if (usage_mask
& (1 << i
))
185 perspective_coef(setup
, point
, info
, slot
+1, vert_attr
, i
);
186 fragcoord_usage_mask
|= TGSI_WRITEMASK_W
;
191 /* Otherwise fallthrough */
193 for (i
= 0; i
< NUM_CHANNELS
; i
++) {
194 if (usage_mask
& (1 << i
))
195 constant_coef(setup
, point
, slot
+1, info
->v0
[vert_attr
][i
], i
);
200 /* The internal position input is in slot zero:
202 setup_point_fragcoord_coef(setup
, point
, info
, 0,
203 fragcoord_usage_mask
);
/*
 * subpixel_snap: convert the float `a` to the file's fixed-point
 * representation by scaling it by FIXED_ONE and passing the product
 * through util_iround().
 *
 * NOTE(review): the return type line and the braces are missing from this
 * listing; callers store the result in int variables.
 */
207 subpixel_snap(float a
)
209 return util_iround(FIXED_ONE
* a
);
/*
 * lp_setup_point: set up one point from vertex `v0` and hand it to the
 * binner as a four-plane lp_rast_triangle.
 *
 * Visible steps, in order:
 *  1. Point size: when setup->point_size_per_vertex is set and
 *     setup->psize (sizeAttr) is > 0, the size is read from
 *     v0[sizeAttr][0]. The alternative of that conditional is not visible.
 *  2. fixed_width: the snapped size is rounded to a whole multiple of
 *     FIXED_ONE via (s + FIXED_ONE/2 - 1) & ~(FIXED_ONE-1), and is never
 *     less than FIXED_ONE.
 *  3. x0, y0: the snapped position (v0[0][0], v0[0][1], each minus
 *     setup->pixel_offset) minus half of fixed_width.
 *  4. bbox: x0, y0 and x0, y0 plus fixed_width are rounded up with
 *     + (FIXED_ONE-1) and shifted right by FIXED_ORDER. `adj` is 1 when
 *     pixel_offset is non-zero and is added to the x bounds only.
 *  5. Culling: if bbox does not intersect setup->draw_region the
 *     nr_culled_tris counter is bumped; otherwise
 *     u_rect_find_intersection() is called with draw_region and bbox.
 *  6. The point is allocated with lp_setup_alloc_triangle(), its v[0][0..1]
 *     receive the vertex x and y, and info.dx12 and info.dy01 are both set
 *     to fixed_width before setup_point_coefficients() runs.
 *  7. inputs.facing is set to 1.0 and inputs.state to setup->fs.stored.
 *  8. Four axis-aligned planes are written:
 *       plane 0: dcdx = -1, dcdy =  0, c = 1 - bbox.x0, ei =  0, eo = 1
 *       plane 1: dcdx =  1, dcdy =  0, c = bbox.x1 + 1, ei = -1, eo = 0
 *       plane 2: dcdx =  0, dcdy =  1, c = 1 - bbox.y0, ei =  0, eo = 1
 *       plane 3: dcdx =  0, dcdy = -1, c = bbox.y1 + 1, ei = -1, eo = 0
 *  9. lp_setup_bin_triangle() is called with the point, bbox and
 *     nr_planes (4).
 *
 * NOTE(review): many original lines are missing from this listing: the
 * declarations of `size` and `bbox`, the remaining arguments of
 * lp_setup_alloc_triangle(), the adjustment announced by the "Inclusive
 * coordinates" comment, any early returns (after culling or a failed
 * allocation), the assignment of info.v0, and all braces. Confirm those
 * against the complete file before relying on the summary above.
 */
213 static void lp_setup_point( struct lp_setup_context
*setup
,
214 const float (*v0
)[4] )
216 /* x/y positions in fixed point */
217 const int sizeAttr
= setup
->psize
;
219 = (setup
->point_size_per_vertex
&& sizeAttr
> 0) ? v0
[sizeAttr
][0]
222 /* Point size as fixed point integer, remove rounding errors
223 * and gives minimum width for very small points
225 int fixed_width
= MAX2(FIXED_ONE
,
226 (subpixel_snap(size
) + FIXED_ONE
/2 - 1) & ~(FIXED_ONE
-1));
228 const int x0
= subpixel_snap(v0
[0][0] - setup
->pixel_offset
) - fixed_width
/2;
229 const int y0
= subpixel_snap(v0
[0][1] - setup
->pixel_offset
) - fixed_width
/2;
231 struct lp_scene
*scene
= lp_setup_get_current_scene(setup
);
232 struct lp_rast_triangle
*point
;
235 unsigned nr_planes
= 4;
236 struct point_info info
;
239 /* Bounding rectangle (in pixels) */
241 /* Yes this is necessary to accurately calculate bounding boxes
242 * with the two fill-conventions we support. GL (normally) ends
243 * up needing a bottom-left fill convention, which requires
244 * slightly different rounding.
246 int adj
= (setup
->pixel_offset
!= 0) ? 1 : 0;
248 bbox
.x0
= (x0
+ (FIXED_ONE
-1) + adj
) >> FIXED_ORDER
;
249 bbox
.x1
= (x0
+ fixed_width
+ (FIXED_ONE
-1) + adj
) >> FIXED_ORDER
;
250 bbox
.y0
= (y0
+ (FIXED_ONE
-1)) >> FIXED_ORDER
;
251 bbox
.y1
= (y0
+ fixed_width
+ (FIXED_ONE
-1)) >> FIXED_ORDER
;
253 /* Inclusive coordinates:
259 if (!u_rect_test_intersection(&setup
->draw_region
, &bbox
)) {
260 if (0) debug_printf("offscreen\n");
261 LP_COUNT(nr_culled_tris
);
265 u_rect_find_intersection(&setup
->draw_region
, &bbox
);
267 point
= lp_setup_alloc_triangle(scene
,
275 point
->v
[0][0] = v0
[0][0];
276 point
->v
[0][1] = v0
[0][1];
281 info
.dx12
= fixed_width
;
282 info
.dy01
= fixed_width
;
285 /* Setup parameter interpolants:
287 setup_point_coefficients(setup
, point
, &info
);
289 point
->inputs
.facing
= 1.0F
;
290 point
->inputs
.state
= setup
->fs
.stored
;
293 point
->plane
[0].dcdx
= -1;
294 point
->plane
[0].dcdy
= 0;
295 point
->plane
[0].c
= 1-bbox
.x0
;
296 point
->plane
[0].ei
= 0;
297 point
->plane
[0].eo
= 1;
299 point
->plane
[1].dcdx
= 1;
300 point
->plane
[1].dcdy
= 0;
301 point
->plane
[1].c
= bbox
.x1
+1;
302 point
->plane
[1].ei
= -1;
303 point
->plane
[1].eo
= 0;
305 point
->plane
[2].dcdx
= 0;
306 point
->plane
[2].dcdy
= 1;
307 point
->plane
[2].c
= 1-bbox
.y0
;
308 point
->plane
[2].ei
= 0;
309 point
->plane
[2].eo
= 1;
311 point
->plane
[3].dcdx
= 0;
312 point
->plane
[3].dcdy
= -1;
313 point
->plane
[3].c
= bbox
.y1
+1;
314 point
->plane
[3].ei
= -1;
315 point
->plane
[3].eo
= 0;
318 lp_setup_bin_triangle(setup
, point
, &bbox
, nr_planes
);
/*
 * lp_setup_choose_point: install the point setup routine by storing
 * lp_setup_point in setup->point. No other selection logic is visible.
 *
 * NOTE(review): the return type line and the braces are missing from this
 * listing.
 */
323 lp_setup_choose_point( struct lp_setup_context
*setup
)
325 setup
->point
= lp_setup_point
;