1 /**************************************************************************
3 * Copyright 2007 VMware, Inc.
6 * Permission is hereby granted, free of charge, to any person obtaining a
7 * copy of this software and associated documentation files (the
8 * "Software"), to deal in the Software without restriction, including
9 * without limitation the rights to use, copy, modify, merge, publish,
10 * distribute, sub license, and/or sell copies of the Software, and to
11 * permit persons to whom the Software is furnished to do so, subject to
12 * the following conditions:
14 * The above copyright notice and this permission notice (including the
15 * next paragraph) shall be included in all copies or substantial portions
18 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS
19 * OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF
20 * MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND NON-INFRINGEMENT.
21 * IN NO EVENT SHALL VMWARE AND/OR ITS SUPPLIERS BE LIABLE FOR
22 * ANY CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT,
23 * TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN CONNECTION WITH THE
24 * SOFTWARE OR THE USE OR OTHER DEALINGS IN THE SOFTWARE.
26 **************************************************************************/
30 * Keith Whitwell <keithw@vmware.com>
33 #include "util/u_memory.h"
34 #include "util/u_math.h"
35 #include "draw/draw_context.h"
36 #include "draw/draw_private.h"
37 #include "draw/draw_vbuf.h"
38 #include "draw/draw_vertex.h"
39 #include "draw/draw_vs.h"
40 #include "translate/translate.h"
42 /* A first pass at incorporating vertex fetch/emit functionality into
44 struct draw_vs_variant_generic
{
45 struct draw_vs_variant base
;
47 struct draw_vertex_shader
*shader
;
48 struct draw_context
*draw
;
50 /* Basic plan is to run these two translate functions before/after
51 * the vertex shader's existing run_linear() routine to simulate
52 * the inclusion of this functionality into the shader...
54 * Next will look at actually including it.
56 struct translate
*fetch
;
57 struct translate
*emit
;
59 unsigned temp_vertex_stride
;
66 static void vsvg_set_buffer( struct draw_vs_variant
*variant
,
72 struct draw_vs_variant_generic
*vsvg
= (struct draw_vs_variant_generic
*)variant
;
74 vsvg
->fetch
->set_buffer(vsvg
->fetch
,
81 static const struct pipe_viewport_state
*
82 find_viewport(struct draw_context
*draw
,
87 int viewport_index_output
=
88 draw_current_shader_viewport_index_output(draw
);
89 char *ptr
= buffer
+ vertex_idx
* stride
;
90 unsigned *data
= (unsigned *)ptr
;
92 draw_current_shader_uses_viewport_index(draw
) ?
93 data
[viewport_index_output
* 4] : 0;
95 viewport_index
= draw_clamp_viewport_idx(viewport_index
);
97 return &draw
->viewports
[viewport_index
];
101 /* Mainly for debug at this stage:
103 static void do_rhw_viewport( struct draw_vs_variant_generic
*vsvg
,
105 void *output_buffer
)
107 char *ptr
= (char *)output_buffer
;
108 unsigned stride
= vsvg
->temp_vertex_stride
;
111 ptr
+= vsvg
->base
.vs
->position_output
* 4 * sizeof(float);
113 for (j
= 0; j
< count
; j
++, ptr
+= stride
) {
114 const struct pipe_viewport_state
*viewport
=
115 find_viewport(vsvg
->base
.vs
->draw
, (char*)output_buffer
,
117 const float *scale
= viewport
->scale
;
118 const float *trans
= viewport
->translate
;
119 float *data
= (float *)ptr
;
120 float w
= 1.0f
/ data
[3];
122 data
[0] = data
[0] * w
* scale
[0] + trans
[0];
123 data
[1] = data
[1] * w
* scale
[1] + trans
[1];
124 data
[2] = data
[2] * w
* scale
[2] + trans
[2];
129 static void do_viewport( struct draw_vs_variant_generic
*vsvg
,
131 void *output_buffer
)
133 char *ptr
= (char *)output_buffer
;
134 unsigned stride
= vsvg
->temp_vertex_stride
;
137 ptr
+= vsvg
->base
.vs
->position_output
* 4 * sizeof(float);
139 for (j
= 0; j
< count
; j
++, ptr
+= stride
) {
140 const struct pipe_viewport_state
*viewport
=
141 find_viewport(vsvg
->base
.vs
->draw
, (char*)output_buffer
,
143 const float *scale
= viewport
->scale
;
144 const float *trans
= viewport
->translate
;
145 float *data
= (float *)ptr
;
147 data
[0] = data
[0] * scale
[0] + trans
[0];
148 data
[1] = data
[1] * scale
[1] + trans
[1];
149 data
[2] = data
[2] * scale
[2] + trans
[2];
154 static void PIPE_CDECL
vsvg_run_elts( struct draw_vs_variant
*variant
,
155 const unsigned *elts
,
159 struct draw_vs_variant_generic
*vsvg
= (struct draw_vs_variant_generic
*)variant
;
160 unsigned temp_vertex_stride
= vsvg
->temp_vertex_stride
;
161 void *temp_buffer
= MALLOC( align(count
,4) * temp_vertex_stride
);
163 if (0) debug_printf("%s %d \n", __FUNCTION__
, count
);
165 /* Want to do this in small batches for cache locality?
168 vsvg
->fetch
->run_elts( vsvg
->fetch
,
171 vsvg
->draw
->start_instance
,
172 vsvg
->draw
->instance_id
,
175 vsvg
->base
.vs
->run_linear( vsvg
->base
.vs
,
178 vsvg
->base
.vs
->draw
->pt
.user
.vs_constants
,
179 vsvg
->base
.vs
->draw
->pt
.user
.vs_constants_size
,
184 /* FIXME: geometry shading? */
186 if (vsvg
->base
.key
.clip
) {
187 /* not really handling clipping, just do the rhw so we can
190 do_rhw_viewport( vsvg
,
194 else if (vsvg
->base
.key
.viewport
) {
201 vsvg
->emit
->set_buffer( vsvg
->emit
,
207 vsvg
->emit
->set_buffer( vsvg
->emit
,
209 &vsvg
->draw
->rasterizer
->point_size
,
213 vsvg
->emit
->run( vsvg
->emit
,
215 vsvg
->draw
->start_instance
,
216 vsvg
->draw
->instance_id
,
223 static void PIPE_CDECL
vsvg_run_linear( struct draw_vs_variant
*variant
,
226 void *output_buffer
)
228 struct draw_vs_variant_generic
*vsvg
= (struct draw_vs_variant_generic
*)variant
;
229 unsigned temp_vertex_stride
= vsvg
->temp_vertex_stride
;
230 void *temp_buffer
= MALLOC( align(count
,4) * temp_vertex_stride
);
232 if (0) debug_printf("%s %d %d (sz %d, %d)\n", __FUNCTION__
, start
, count
,
233 vsvg
->base
.key
.output_stride
,
236 vsvg
->fetch
->run( vsvg
->fetch
,
239 vsvg
->draw
->start_instance
,
240 vsvg
->draw
->instance_id
,
243 vsvg
->base
.vs
->run_linear( vsvg
->base
.vs
,
246 vsvg
->base
.vs
->draw
->pt
.user
.vs_constants
,
247 vsvg
->base
.vs
->draw
->pt
.user
.vs_constants_size
,
252 if (vsvg
->base
.key
.clip
) {
253 /* not really handling clipping, just do the rhw so we can
256 do_rhw_viewport( vsvg
,
260 else if (vsvg
->base
.key
.viewport
) {
266 vsvg
->emit
->set_buffer( vsvg
->emit
,
272 vsvg
->emit
->set_buffer( vsvg
->emit
,
274 &vsvg
->draw
->rasterizer
->point_size
,
278 vsvg
->emit
->run( vsvg
->emit
,
280 vsvg
->draw
->start_instance
,
281 vsvg
->draw
->instance_id
,
291 static void vsvg_destroy( struct draw_vs_variant
*variant
)
297 struct draw_vs_variant
*
298 draw_vs_create_variant_generic( struct draw_vertex_shader
*vs
,
299 const struct draw_vs_variant_key
*key
)
302 struct translate_key fetch
, emit
;
304 struct draw_vs_variant_generic
*vsvg
= CALLOC_STRUCT( draw_vs_variant_generic
);
308 vsvg
->base
.key
= *key
;
310 vsvg
->base
.set_buffer
= vsvg_set_buffer
;
311 vsvg
->base
.run_elts
= vsvg_run_elts
;
312 vsvg
->base
.run_linear
= vsvg_run_linear
;
313 vsvg
->base
.destroy
= vsvg_destroy
;
315 vsvg
->draw
= vs
->draw
;
317 vsvg
->temp_vertex_stride
= MAX2(key
->nr_inputs
,
318 draw_total_vs_outputs(vs
->draw
)) * 4 * sizeof(float);
320 /* Build free-standing fetch and emit functions:
322 fetch
.nr_elements
= key
->nr_inputs
;
323 fetch
.output_stride
= vsvg
->temp_vertex_stride
;
324 for (i
= 0; i
< key
->nr_inputs
; i
++) {
325 fetch
.element
[i
].type
= TRANSLATE_ELEMENT_NORMAL
;
326 fetch
.element
[i
].input_format
= key
->element
[i
].in
.format
;
327 fetch
.element
[i
].input_buffer
= key
->element
[i
].in
.buffer
;
328 fetch
.element
[i
].input_offset
= key
->element
[i
].in
.offset
;
329 fetch
.element
[i
].instance_divisor
= 0;
330 fetch
.element
[i
].output_format
= PIPE_FORMAT_R32G32B32A32_FLOAT
;
331 fetch
.element
[i
].output_offset
= i
* 4 * sizeof(float);
332 assert(fetch
.element
[i
].output_offset
< fetch
.output_stride
);
336 emit
.nr_elements
= key
->nr_outputs
;
337 emit
.output_stride
= key
->output_stride
;
338 for (i
= 0; i
< key
->nr_outputs
; i
++) {
339 if (key
->element
[i
].out
.format
!= EMIT_1F_PSIZE
)
341 emit
.element
[i
].type
= TRANSLATE_ELEMENT_NORMAL
;
342 emit
.element
[i
].input_format
= PIPE_FORMAT_R32G32B32A32_FLOAT
;
343 emit
.element
[i
].input_buffer
= 0;
344 emit
.element
[i
].input_offset
= key
->element
[i
].out
.vs_output
* 4 * sizeof(float);
345 emit
.element
[i
].instance_divisor
= 0;
346 emit
.element
[i
].output_format
= draw_translate_vinfo_format(key
->element
[i
].out
.format
);
347 emit
.element
[i
].output_offset
= key
->element
[i
].out
.offset
;
348 assert(emit
.element
[i
].input_offset
<= fetch
.output_stride
);
351 emit
.element
[i
].type
= TRANSLATE_ELEMENT_NORMAL
;
352 emit
.element
[i
].input_format
= PIPE_FORMAT_R32_FLOAT
;
353 emit
.element
[i
].input_buffer
= 1;
354 emit
.element
[i
].input_offset
= 0;
355 emit
.element
[i
].instance_divisor
= 0;
356 emit
.element
[i
].output_format
= PIPE_FORMAT_R32_FLOAT
;
357 emit
.element
[i
].output_offset
= key
->element
[i
].out
.offset
;
361 vsvg
->fetch
= draw_vs_get_fetch( vs
->draw
, &fetch
);
362 vsvg
->emit
= draw_vs_get_emit( vs
->draw
, &emit
);