svga: add new GALLIUM_HUD queries
[mesa.git] / src / gallium / drivers / svga / svga_pipe_vertex.c
1 /**********************************************************
2 * Copyright 2008-2009 VMware, Inc. All rights reserved.
3 *
4 * Permission is hereby granted, free of charge, to any person
5 * obtaining a copy of this software and associated documentation
6 * files (the "Software"), to deal in the Software without
7 * restriction, including without limitation the rights to use, copy,
8 * modify, merge, publish, distribute, sublicense, and/or sell copies
9 * of the Software, and to permit persons to whom the Software is
10 * furnished to do so, subject to the following conditions:
11 *
12 * The above copyright notice and this permission notice shall be
13 * included in all copies or substantial portions of the Software.
14 *
15 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND,
16 * EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF
17 * MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND
18 * NONINFRINGEMENT. IN NO EVENT SHALL THE AUTHORS OR COPYRIGHT HOLDERS
19 * BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN AN
20 * ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN
21 * CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
22 * SOFTWARE.
23 *
24 **********************************************************/
25
26 #include "pipe/p_defines.h"
27 #include "util/u_bitmask.h"
28 #include "util/u_format.h"
29 #include "util/u_helpers.h"
30 #include "util/u_inlines.h"
31 #include "util/u_math.h"
32 #include "util/u_memory.h"
33 #include "util/u_transfer.h"
34 #include "tgsi/tgsi_parse.h"
35
36 #include "svga_context.h"
37 #include "svga_cmd.h"
38 #include "svga_format.h"
39 #include "svga_resource_buffer.h"
40 #include "svga_screen.h"
41
42
43 static void svga_set_vertex_buffers(struct pipe_context *pipe,
44 unsigned start_slot, unsigned count,
45 const struct pipe_vertex_buffer *buffers)
46 {
47 struct svga_context *svga = svga_context(pipe);
48
49 util_set_vertex_buffers_count(svga->curr.vb,
50 &svga->curr.num_vertex_buffers,
51 buffers, start_slot, count);
52
53 svga->dirty |= SVGA_NEW_VBUFFER;
54 }
55
56
57 static void svga_set_index_buffer(struct pipe_context *pipe,
58 const struct pipe_index_buffer *ib)
59 {
60 struct svga_context *svga = svga_context(pipe);
61
62 util_set_index_buffer(&svga->curr.ib, ib);
63 }
64
65
66 /**
67 * Does the given vertex attrib format need range adjustment in the VS?
68 * Range adjustment scales and biases values from [0,1] to [-1,1].
69 * This lets us avoid the swtnl path.
70 */
71 static boolean
72 attrib_needs_range_adjustment(enum pipe_format format)
73 {
74 switch (format) {
75 case PIPE_FORMAT_R8G8B8_SNORM:
76 return TRUE;
77 default:
78 return FALSE;
79 }
80 }
81
82
83 /**
84 * Given a gallium vertex element format, return the corresponding
85 * SVGA3dDeclType.
86 */
87 static SVGA3dDeclType
88 translate_vertex_format_to_decltype(enum pipe_format format)
89 {
90 switch (format) {
91 case PIPE_FORMAT_R32_FLOAT: return SVGA3D_DECLTYPE_FLOAT1;
92 case PIPE_FORMAT_R32G32_FLOAT: return SVGA3D_DECLTYPE_FLOAT2;
93 case PIPE_FORMAT_R32G32B32_FLOAT: return SVGA3D_DECLTYPE_FLOAT3;
94 case PIPE_FORMAT_R32G32B32A32_FLOAT: return SVGA3D_DECLTYPE_FLOAT4;
95 case PIPE_FORMAT_B8G8R8A8_UNORM: return SVGA3D_DECLTYPE_D3DCOLOR;
96 case PIPE_FORMAT_R8G8B8A8_USCALED: return SVGA3D_DECLTYPE_UBYTE4;
97 case PIPE_FORMAT_R16G16_SSCALED: return SVGA3D_DECLTYPE_SHORT2;
98 case PIPE_FORMAT_R16G16B16A16_SSCALED: return SVGA3D_DECLTYPE_SHORT4;
99 case PIPE_FORMAT_R8G8B8A8_UNORM: return SVGA3D_DECLTYPE_UBYTE4N;
100 case PIPE_FORMAT_R16G16_SNORM: return SVGA3D_DECLTYPE_SHORT2N;
101 case PIPE_FORMAT_R16G16B16A16_SNORM: return SVGA3D_DECLTYPE_SHORT4N;
102 case PIPE_FORMAT_R16G16_UNORM: return SVGA3D_DECLTYPE_USHORT2N;
103 case PIPE_FORMAT_R16G16B16A16_UNORM: return SVGA3D_DECLTYPE_USHORT4N;
104 case PIPE_FORMAT_R10G10B10X2_USCALED: return SVGA3D_DECLTYPE_UDEC3;
105 case PIPE_FORMAT_R10G10B10X2_SNORM: return SVGA3D_DECLTYPE_DEC3N;
106 case PIPE_FORMAT_R16G16_FLOAT: return SVGA3D_DECLTYPE_FLOAT16_2;
107 case PIPE_FORMAT_R16G16B16A16_FLOAT: return SVGA3D_DECLTYPE_FLOAT16_4;
108
109 /* See attrib_needs_adjustment() and attrib_needs_w_to_1() above */
110 case PIPE_FORMAT_R8G8B8_SNORM: return SVGA3D_DECLTYPE_UBYTE4N;
111
112 /* See attrib_needs_w_to_1() above */
113 case PIPE_FORMAT_R16G16B16_SNORM: return SVGA3D_DECLTYPE_SHORT4N;
114 case PIPE_FORMAT_R16G16B16_UNORM: return SVGA3D_DECLTYPE_USHORT4N;
115 case PIPE_FORMAT_R8G8B8_UNORM: return SVGA3D_DECLTYPE_UBYTE4N;
116
117 default:
118 /* There are many formats without hardware support. This case
119 * will be hit regularly, meaning we'll need swvfetch.
120 */
121 return SVGA3D_DECLTYPE_MAX;
122 }
123 }
124
125
126 static void
127 define_input_element_object(struct svga_context *svga,
128 struct svga_velems_state *velems)
129 {
130 SVGA3dInputElementDesc elements[PIPE_MAX_ATTRIBS];
131 enum pipe_error ret;
132 unsigned i;
133
134 assert(velems->count <= PIPE_MAX_ATTRIBS);
135 assert(svga_have_vgpu10(svga));
136
137 for (i = 0; i < velems->count; i++) {
138 const struct pipe_vertex_element *elem = velems->velem + i;
139 SVGA3dSurfaceFormat svga_format;
140 unsigned vf_flags;
141
142 svga_translate_vertex_format_vgpu10(elem->src_format,
143 &svga_format, &vf_flags);
144
145 velems->decl_type[i] =
146 translate_vertex_format_to_decltype(elem->src_format);
147 elements[i].inputSlot = elem->vertex_buffer_index;
148 elements[i].alignedByteOffset = elem->src_offset;
149 elements[i].format = svga_format;
150
151 if (elem->instance_divisor) {
152 elements[i].inputSlotClass = SVGA3D_INPUT_PER_INSTANCE_DATA;
153 elements[i].instanceDataStepRate = elem->instance_divisor;
154 }
155 else {
156 elements[i].inputSlotClass = SVGA3D_INPUT_PER_VERTEX_DATA;
157 elements[i].instanceDataStepRate = 0;
158 }
159 elements[i].inputRegister = i;
160
161 if (elements[i].format == SVGA3D_FORMAT_INVALID) {
162 velems->need_swvfetch = TRUE;
163 }
164
165 if (util_format_is_pure_integer(elem->src_format)) {
166 velems->attrib_is_pure_int |= (1 << i);
167 }
168
169 if (vf_flags & VF_W_TO_1) {
170 velems->adjust_attrib_w_1 |= (1 << i);
171 }
172
173 if (vf_flags & VF_U_TO_F_CAST) {
174 velems->adjust_attrib_utof |= (1 << i);
175 }
176 else if (vf_flags & VF_I_TO_F_CAST) {
177 velems->adjust_attrib_itof |= (1 << i);
178 }
179
180 if (vf_flags & VF_BGRA) {
181 velems->attrib_is_bgra |= (1 << i);
182 }
183
184 if (vf_flags & VF_PUINT_TO_SNORM) {
185 velems->attrib_puint_to_snorm |= (1 << i);
186 }
187 else if (vf_flags & VF_PUINT_TO_USCALED) {
188 velems->attrib_puint_to_uscaled |= (1 << i);
189 }
190 else if (vf_flags & VF_PUINT_TO_SSCALED) {
191 velems->attrib_puint_to_sscaled |= (1 << i);
192 }
193 }
194
195 velems->id = util_bitmask_add(svga->input_element_object_id_bm);
196
197 ret = SVGA3D_vgpu10_DefineElementLayout(svga->swc, velems->count,
198 velems->id, elements);
199 if (ret != PIPE_OK) {
200 svga_context_flush(svga, NULL);
201 ret = SVGA3D_vgpu10_DefineElementLayout(svga->swc, velems->count,
202 velems->id, elements);
203 assert(ret == PIPE_OK);
204 }
205 }
206
207
208 /**
209 * Translate the vertex element types to SVGA3dDeclType and check
210 * for VS-based vertex attribute adjustments.
211 */
212 static void
213 translate_vertex_decls(struct svga_context *svga,
214 struct svga_velems_state *velems)
215 {
216 unsigned i;
217
218 assert(!svga_have_vgpu10(svga));
219
220 for (i = 0; i < velems->count; i++) {
221 const enum pipe_format f = velems->velem[i].src_format;
222 SVGA3dSurfaceFormat svga_format;
223 unsigned vf_flags;
224
225 svga_translate_vertex_format_vgpu10(f, &svga_format, &vf_flags);
226
227 velems->decl_type[i] = translate_vertex_format_to_decltype(f);
228 if (velems->decl_type[i] == SVGA3D_DECLTYPE_MAX) {
229 /* Unsupported format - use software fetch */
230 velems->need_swvfetch = TRUE;
231 }
232
233 /* Check for VS-based adjustments */
234 if (attrib_needs_range_adjustment(f)) {
235 velems->adjust_attrib_range |= (1 << i);
236 }
237
238 if (vf_flags & VF_W_TO_1) {
239 velems->adjust_attrib_w_1 |= (1 << i);
240 }
241 }
242 }
243
244
245 static void *
246 svga_create_vertex_elements_state(struct pipe_context *pipe,
247 unsigned count,
248 const struct pipe_vertex_element *attribs)
249 {
250 struct svga_context *svga = svga_context(pipe);
251 struct svga_velems_state *velems;
252
253 assert(count <= PIPE_MAX_ATTRIBS);
254 velems = (struct svga_velems_state *) MALLOC(sizeof(struct svga_velems_state));
255 if (velems) {
256 velems->count = count;
257 memcpy(velems->velem, attribs, sizeof(*attribs) * count);
258
259 velems->need_swvfetch = FALSE;
260 velems->adjust_attrib_range = 0x0;
261 velems->attrib_is_pure_int = 0x0;
262 velems->adjust_attrib_w_1 = 0x0;
263 velems->adjust_attrib_itof = 0x0;
264 velems->adjust_attrib_utof = 0x0;
265 velems->attrib_is_bgra = 0x0;
266 velems->attrib_puint_to_snorm = 0x0;
267 velems->attrib_puint_to_uscaled = 0x0;
268 velems->attrib_puint_to_sscaled = 0x0;
269
270 if (svga_have_vgpu10(svga)) {
271 define_input_element_object(svga, velems);
272 }
273 else {
274 translate_vertex_decls(svga, velems);
275 }
276 }
277
278 svga->hud.num_state_objects++;
279
280 return velems;
281 }
282
283
284 static void
285 svga_bind_vertex_elements_state(struct pipe_context *pipe, void *state)
286 {
287 struct svga_context *svga = svga_context(pipe);
288 struct svga_velems_state *velems = (struct svga_velems_state *) state;
289
290 svga->curr.velems = velems;
291 svga->dirty |= SVGA_NEW_VELEMENT;
292 }
293
294
295 static void
296 svga_delete_vertex_elements_state(struct pipe_context *pipe, void *state)
297 {
298 struct svga_context *svga = svga_context(pipe);
299 struct svga_velems_state *velems = (struct svga_velems_state *) state;
300
301 if (svga_have_vgpu10(svga)) {
302 enum pipe_error ret;
303
304 svga_hwtnl_flush_retry(svga);
305
306 ret = SVGA3D_vgpu10_DestroyElementLayout(svga->swc, velems->id);
307 if (ret != PIPE_OK) {
308 svga_context_flush(svga, NULL);
309 ret = SVGA3D_vgpu10_DestroyElementLayout(svga->swc, velems->id);
310 assert(ret == PIPE_OK);
311 }
312
313 if (velems->id == svga->state.hw_draw.layout_id)
314 svga->state.hw_draw.layout_id = SVGA3D_INVALID_ID;
315
316 util_bitmask_clear(svga->input_element_object_id_bm, velems->id);
317 velems->id = SVGA3D_INVALID_ID;
318 }
319
320 FREE(velems);
321 svga->hud.num_state_objects--;
322 }
323
324 void svga_cleanup_vertex_state( struct svga_context *svga )
325 {
326 unsigned i;
327
328 for (i = 0 ; i < svga->curr.num_vertex_buffers; i++)
329 pipe_resource_reference(&svga->curr.vb[i].buffer, NULL);
330 }
331
332
333 void svga_init_vertex_functions( struct svga_context *svga )
334 {
335 svga->pipe.set_vertex_buffers = svga_set_vertex_buffers;
336 svga->pipe.set_index_buffer = svga_set_index_buffer;
337 svga->pipe.create_vertex_elements_state = svga_create_vertex_elements_state;
338 svga->pipe.bind_vertex_elements_state = svga_bind_vertex_elements_state;
339 svga->pipe.delete_vertex_elements_state = svga_delete_vertex_elements_state;
340 }