r300/compiler: implement DP2 opcode
[mesa.git] / src / gallium / drivers / svga / svga_screen.c
1 /**********************************************************
2 * Copyright 2008-2009 VMware, Inc. All rights reserved.
3 *
4 * Permission is hereby granted, free of charge, to any person
5 * obtaining a copy of this software and associated documentation
6 * files (the "Software"), to deal in the Software without
7 * restriction, including without limitation the rights to use, copy,
8 * modify, merge, publish, distribute, sublicense, and/or sell copies
9 * of the Software, and to permit persons to whom the Software is
10 * furnished to do so, subject to the following conditions:
11 *
12 * The above copyright notice and this permission notice shall be
13 * included in all copies or substantial portions of the Software.
14 *
15 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND,
16 * EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF
17 * MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND
18 * NONINFRINGEMENT. IN NO EVENT SHALL THE AUTHORS OR COPYRIGHT HOLDERS
19 * BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN AN
20 * ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN
21 * CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
22 * SOFTWARE.
23 *
24 **********************************************************/
25
26 #include "util/u_memory.h"
27 #include "util/u_inlines.h"
28 #include "util/u_string.h"
29 #include "util/u_math.h"
30
31 #include "svga_winsys.h"
32 #include "svga_public.h"
33 #include "svga_context.h"
34 #include "svga_screen.h"
35 #include "svga_resource_texture.h"
36 #include "svga_resource.h"
37 #include "svga_debug.h"
38 #include "svga_surface.h"
39
40 #include "svga3d_shaderdefs.h"
41
42
#ifdef DEBUG
/* Bitmask of enabled DEBUG_* categories; filled in by svga_screen_create()
 * from the SVGA_DEBUG option.
 */
int SVGA_DEBUG = 0;

/* Option names accepted in SVGA_DEBUG and the DEBUG_* bit each one selects. */
static const struct debug_named_value svga_debug_flags[] = {
   { "dma",      DEBUG_DMA,      NULL },
   { "tgsi",     DEBUG_TGSI,     NULL },
   { "pipe",     DEBUG_PIPE,     NULL },
   { "state",    DEBUG_STATE,    NULL },
   { "screen",   DEBUG_SCREEN,   NULL },
   { "tex",      DEBUG_TEX,      NULL },
   { "swtnl",    DEBUG_SWTNL,    NULL },
   { "const",    DEBUG_CONSTS,   NULL },
   { "viewport", DEBUG_VIEWPORT, NULL },
   { "views",    DEBUG_VIEWS,    NULL },
   { "perf",     DEBUG_PERF,     NULL },
   { "flush",    DEBUG_FLUSH,    NULL },
   { "sync",     DEBUG_SYNC,     NULL },
   { "cache",    DEBUG_CACHE,    NULL },
   DEBUG_NAMED_VALUE_END
};
#endif
64
/**
 * Return the vendor string reported for this screen.
 *
 * The screen argument is not consulted; the string is a constant.
 */
static const char *
svga_get_vendor( struct pipe_screen *pscreen )
{
   static const char vendor[] = "VMware, Inc.";

   (void) pscreen;
   return vendor;
}
70
71
/**
 * Return the renderer name reported for this screen.
 *
 * DEBUG builds append internal details (the PIPE_ATOMIC string); other
 * builds return a fixed release string.  The screen argument is not
 * consulted.
 */
static const char *
svga_get_name( struct pipe_screen *pscreen )
{
   const char *name;

   (void) pscreen;

#ifdef DEBUG
   /* Internal details are only exposed in the DEBUG version. */
   name = "SVGA3D; build: DEBUG; mutex: " PIPE_ATOMIC;
#else
   name = "SVGA3D; build: RELEASE; ";
#endif

   return name;
}
83
84
85
86
87 static float
88 svga_get_paramf(struct pipe_screen *screen, enum pipe_cap param)
89 {
90 struct svga_screen *svgascreen = svga_screen(screen);
91 struct svga_winsys_screen *sws = svgascreen->sws;
92 SVGA3dDevCapResult result;
93
94 switch (param) {
95 case PIPE_CAP_MAX_LINE_WIDTH:
96 /* fall-through */
97 case PIPE_CAP_MAX_LINE_WIDTH_AA:
98 return 7.0;
99
100 case PIPE_CAP_MAX_POINT_WIDTH:
101 /* fall-through */
102 case PIPE_CAP_MAX_POINT_WIDTH_AA:
103 /* Keep this to a reasonable size to avoid failures in
104 * conform/pntaa.c:
105 */
106 return SVGA_MAX_POINTSIZE;
107
108 case PIPE_CAP_MAX_TEXTURE_ANISOTROPY:
109 if(!sws->get_cap(sws, SVGA3D_DEVCAP_MAX_TEXTURE_ANISOTROPY, &result))
110 return 4.0;
111 return result.u;
112
113 case PIPE_CAP_MAX_TEXTURE_LOD_BIAS:
114 return 16.0;
115
116 case PIPE_CAP_MAX_TEXTURE_IMAGE_UNITS:
117 return 16;
118 case PIPE_CAP_MAX_COMBINED_SAMPLERS:
119 return 16;
120 case PIPE_CAP_NPOT_TEXTURES:
121 return 1;
122 case PIPE_CAP_TWO_SIDED_STENCIL:
123 return 1;
124 case PIPE_CAP_GLSL:
125 return svgascreen->use_ps30 && svgascreen->use_vs30;
126 case PIPE_CAP_ANISOTROPIC_FILTER:
127 return 1;
128 case PIPE_CAP_POINT_SPRITE:
129 return 1;
130 case PIPE_CAP_MAX_RENDER_TARGETS:
131 if(!sws->get_cap(sws, SVGA3D_DEVCAP_MAX_RENDER_TARGETS, &result))
132 return 1;
133 if(!result.u)
134 return 1;
135 return MIN2(result.u, PIPE_MAX_COLOR_BUFS);
136 case PIPE_CAP_OCCLUSION_QUERY:
137 return 1;
138 case PIPE_CAP_TIMER_QUERY:
139 return 0;
140 case PIPE_CAP_TEXTURE_SHADOW_MAP:
141 return 1;
142
143 case PIPE_CAP_MAX_TEXTURE_2D_LEVELS:
144 {
145 unsigned levels = SVGA_MAX_TEXTURE_LEVELS;
146 if (sws->get_cap(sws, SVGA3D_DEVCAP_MAX_TEXTURE_WIDTH, &result))
147 levels = MIN2(util_logbase2(result.u) + 1, levels);
148 else
149 levels = 12 /* 2048x2048 */;
150 if (sws->get_cap(sws, SVGA3D_DEVCAP_MAX_TEXTURE_HEIGHT, &result))
151 levels = MIN2(util_logbase2(result.u) + 1, levels);
152 else
153 levels = 12 /* 2048x2048 */;
154 return levels;
155 }
156
157 case PIPE_CAP_MAX_TEXTURE_3D_LEVELS:
158 if (!sws->get_cap(sws, SVGA3D_DEVCAP_MAX_VOLUME_EXTENT, &result))
159 return 8; /* max 128x128x128 */
160 return MIN2(util_logbase2(result.u) + 1, SVGA_MAX_TEXTURE_LEVELS);
161
162 case PIPE_CAP_MAX_TEXTURE_CUBE_LEVELS:
163 /*
164 * No mechanism to query the host, and at least limited to 2048x2048 on
165 * certain hardware.
166 */
167 return MIN2(screen->get_paramf(screen, PIPE_CAP_MAX_TEXTURE_2D_LEVELS),
168 12.0 /* 2048x2048 */);
169
170 case PIPE_CAP_TEXTURE_MIRROR_REPEAT: /* req. for GL 1.4 */
171 return 1;
172
173 case PIPE_CAP_BLEND_EQUATION_SEPARATE: /* req. for GL 1.5 */
174 return 1;
175
176 case PIPE_CAP_TGSI_FS_COORD_ORIGIN_UPPER_LEFT:
177 case PIPE_CAP_TGSI_FS_COORD_PIXEL_CENTER_HALF_INTEGER:
178 return 1;
179 case PIPE_CAP_TGSI_FS_COORD_ORIGIN_LOWER_LEFT:
180 case PIPE_CAP_TGSI_FS_COORD_PIXEL_CENTER_INTEGER:
181 return 0;
182
183 /*
184 * Fragment shader limits
185 */
186
187 case PIPE_CAP_MAX_FS_INSTRUCTIONS:
188 case PIPE_CAP_MAX_FS_ALU_INSTRUCTIONS:
189 case PIPE_CAP_MAX_FS_TEX_INSTRUCTIONS:
190 case PIPE_CAP_MAX_FS_TEX_INDIRECTIONS:
191 return svgascreen->use_ps30 ? 512 : 96;
192 case PIPE_CAP_MAX_FS_CONTROL_FLOW_DEPTH:
193 return SVGA3D_MAX_NESTING_LEVEL;
194 case PIPE_CAP_MAX_FS_INPUTS:
195 return 10;
196 case PIPE_CAP_MAX_FS_CONSTS:
197 return svgascreen->use_vs30 ? 224 : 16;
198 case PIPE_CAP_MAX_FS_TEMPS:
199 if (!sws->get_cap(sws, SVGA3D_DEVCAP_MAX_FRAGMENT_SHADER_TEMPS, &result))
200 return svgascreen->use_ps30 ? 32 : 12;
201 return result.u;
202 case PIPE_CAP_MAX_FS_ADDRS:
203 return svgascreen->use_ps30 ? 1 : 0;
204 case PIPE_CAP_MAX_FS_PREDS:
205 return svgascreen->use_ps30 ? 1 : 0;
206
207 /*
208 * Vertex shader limits
209 */
210 case PIPE_CAP_MAX_VS_INSTRUCTIONS:
211 case PIPE_CAP_MAX_VS_ALU_INSTRUCTIONS:
212 if (!sws->get_cap(sws, SVGA3D_DEVCAP_MAX_VERTEX_SHADER_INSTRUCTIONS, &result))
213 return svgascreen->use_vs30 ? 512 : 256;
214 return result.u;
215 case PIPE_CAP_MAX_VS_TEX_INSTRUCTIONS:
216 case PIPE_CAP_MAX_VS_TEX_INDIRECTIONS:
217 /* XXX: until we have vertex texture support */
218 return 0;
219 case PIPE_CAP_MAX_VS_CONTROL_FLOW_DEPTH:
220 return SVGA3D_MAX_NESTING_LEVEL;
221 case PIPE_CAP_MAX_VS_INPUTS:
222 return 16;
223 case PIPE_CAP_MAX_VS_CONSTS:
224 return 256;
225 case PIPE_CAP_MAX_VS_TEMPS:
226 if (!sws->get_cap(sws, SVGA3D_DEVCAP_MAX_VERTEX_SHADER_TEMPS, &result))
227 return svgascreen->use_vs30 ? 32 : 12;
228 return result.u;
229 case PIPE_CAP_MAX_VS_ADDRS:
230 return svgascreen->use_vs30 ? 1 : 0;
231 case PIPE_CAP_MAX_VS_PREDS:
232 return svgascreen->use_vs30 ? 1 : 0;
233
234 case PIPE_CAP_DEPTHSTENCIL_CLEAR_SEPARATE:
235 return 1;
236
237 default:
238 return 0;
239 }
240 }
241
242
243 /* This is a fairly pointless interface
244 */
245 static int
246 svga_get_param(struct pipe_screen *screen, enum pipe_cap param)
247 {
248 return (int) svga_get_paramf( screen, param );
249 }
250
251
252 static INLINE SVGA3dDevCapIndex
253 svga_translate_format_cap(enum pipe_format format)
254 {
255 switch(format) {
256
257 case PIPE_FORMAT_B8G8R8A8_UNORM:
258 return SVGA3D_DEVCAP_SURFACEFMT_A8R8G8B8;
259 case PIPE_FORMAT_B8G8R8X8_UNORM:
260 return SVGA3D_DEVCAP_SURFACEFMT_X8R8G8B8;
261
262 case PIPE_FORMAT_B5G6R5_UNORM:
263 return SVGA3D_DEVCAP_SURFACEFMT_R5G6B5;
264 case PIPE_FORMAT_B5G5R5A1_UNORM:
265 return SVGA3D_DEVCAP_SURFACEFMT_A1R5G5B5;
266 case PIPE_FORMAT_B4G4R4A4_UNORM:
267 return SVGA3D_DEVCAP_SURFACEFMT_A4R4G4B4;
268
269 case PIPE_FORMAT_Z16_UNORM:
270 return SVGA3D_DEVCAP_SURFACEFMT_Z_D16;
271 case PIPE_FORMAT_S8_USCALED_Z24_UNORM:
272 return SVGA3D_DEVCAP_SURFACEFMT_Z_D24S8;
273 case PIPE_FORMAT_X8Z24_UNORM:
274 return SVGA3D_DEVCAP_SURFACEFMT_Z_D24X8;
275
276 case PIPE_FORMAT_A8_UNORM:
277 return SVGA3D_DEVCAP_SURFACEFMT_ALPHA8;
278 case PIPE_FORMAT_L8_UNORM:
279 return SVGA3D_DEVCAP_SURFACEFMT_LUMINANCE8;
280
281 case PIPE_FORMAT_DXT1_RGB:
282 case PIPE_FORMAT_DXT1_RGBA:
283 return SVGA3D_DEVCAP_SURFACEFMT_DXT1;
284 case PIPE_FORMAT_DXT3_RGBA:
285 return SVGA3D_DEVCAP_SURFACEFMT_DXT3;
286 case PIPE_FORMAT_DXT5_RGBA:
287 return SVGA3D_DEVCAP_SURFACEFMT_DXT5;
288
289 default:
290 return SVGA3D_DEVCAP_MAX;
291 }
292 }
293
294
295 static boolean
296 svga_is_format_supported( struct pipe_screen *screen,
297 enum pipe_format format,
298 enum pipe_texture_target target,
299 unsigned sample_count,
300 unsigned tex_usage,
301 unsigned geom_flags )
302 {
303 struct svga_winsys_screen *sws = svga_screen(screen)->sws;
304 SVGA3dDevCapIndex index;
305 SVGA3dDevCapResult result;
306
307 assert(tex_usage);
308
309 if (sample_count > 1)
310 return FALSE;
311
312 /* Override host capabilities */
313 if (tex_usage & PIPE_BIND_RENDER_TARGET) {
314 switch(format) {
315
316 /* Often unsupported/problematic. This means we end up with the same
317 * visuals for all virtual hardware implementations.
318 */
319 case PIPE_FORMAT_B4G4R4A4_UNORM:
320 case PIPE_FORMAT_B5G5R5A1_UNORM:
321 return FALSE;
322
323 /* Simulate ability to render into compressed textures */
324 case PIPE_FORMAT_DXT1_RGB:
325 case PIPE_FORMAT_DXT1_RGBA:
326 case PIPE_FORMAT_DXT3_RGBA:
327 case PIPE_FORMAT_DXT5_RGBA:
328 return TRUE;
329
330 default:
331 break;
332 }
333 }
334
335 /* Try to query the host */
336 index = svga_translate_format_cap(format);
337 if( index < SVGA3D_DEVCAP_MAX &&
338 sws->get_cap(sws, index, &result) )
339 {
340 SVGA3dSurfaceFormatCaps mask;
341
342 mask.value = 0;
343 if (tex_usage & PIPE_BIND_RENDER_TARGET)
344 mask.offscreenRenderTarget = 1;
345 if (tex_usage & PIPE_BIND_DEPTH_STENCIL)
346 mask.zStencil = 1;
347 if (tex_usage & PIPE_BIND_SAMPLER_VIEW)
348 mask.texture = 1;
349
350 if ((result.u & mask.value) == mask.value)
351 return TRUE;
352 else
353 return FALSE;
354 }
355
356 /* Use our translate functions directly rather than relying on a
357 * duplicated list of supported formats which is prone to getting
358 * out of sync:
359 */
360 if(tex_usage & (PIPE_BIND_RENDER_TARGET | PIPE_BIND_DEPTH_STENCIL))
361 return svga_translate_format_render(format) != SVGA3D_FORMAT_INVALID;
362 else
363 return svga_translate_format(format) != SVGA3D_FORMAT_INVALID;
364 }
365
366
367 static void
368 svga_fence_reference(struct pipe_screen *screen,
369 struct pipe_fence_handle **ptr,
370 struct pipe_fence_handle *fence)
371 {
372 struct svga_winsys_screen *sws = svga_screen(screen)->sws;
373 sws->fence_reference(sws, ptr, fence);
374 }
375
376
377 static int
378 svga_fence_signalled(struct pipe_screen *screen,
379 struct pipe_fence_handle *fence,
380 unsigned flag)
381 {
382 struct svga_winsys_screen *sws = svga_screen(screen)->sws;
383 return sws->fence_signalled(sws, fence, flag);
384 }
385
386
387 static int
388 svga_fence_finish(struct pipe_screen *screen,
389 struct pipe_fence_handle *fence,
390 unsigned flag)
391 {
392 struct svga_winsys_screen *sws = svga_screen(screen)->sws;
393
394 SVGA_DBG(DEBUG_DMA|DEBUG_PERF, "%s fence_ptr %p\n",
395 __FUNCTION__, fence);
396
397 return sws->fence_finish(sws, fence, flag);
398 }
399
400
401 static void
402 svga_destroy_screen( struct pipe_screen *screen )
403 {
404 struct svga_screen *svgascreen = svga_screen(screen);
405
406 svga_screen_cache_cleanup(svgascreen);
407
408 pipe_mutex_destroy(svgascreen->swc_mutex);
409 pipe_mutex_destroy(svgascreen->tex_mutex);
410
411 svgascreen->sws->destroy(svgascreen->sws);
412
413 FREE(svgascreen);
414 }
415
416
417 /**
418 * Create a new svga_screen object
419 */
420 struct pipe_screen *
421 svga_screen_create(struct svga_winsys_screen *sws)
422 {
423 struct svga_screen *svgascreen;
424 struct pipe_screen *screen;
425 SVGA3dDevCapResult result;
426
427 #ifdef DEBUG
428 SVGA_DEBUG = debug_get_flags_option("SVGA_DEBUG", svga_debug_flags, 0 );
429 #endif
430
431 svgascreen = CALLOC_STRUCT(svga_screen);
432 if (!svgascreen)
433 goto error1;
434
435 svgascreen->debug.force_level_surface_view =
436 debug_get_bool_option("SVGA_FORCE_LEVEL_SURFACE_VIEW", FALSE);
437 svgascreen->debug.force_surface_view =
438 debug_get_bool_option("SVGA_FORCE_SURFACE_VIEW", FALSE);
439 svgascreen->debug.force_sampler_view =
440 debug_get_bool_option("SVGA_FORCE_SAMPLER_VIEW", FALSE);
441 svgascreen->debug.no_surface_view =
442 debug_get_bool_option("SVGA_NO_SURFACE_VIEW", FALSE);
443 svgascreen->debug.no_sampler_view =
444 debug_get_bool_option("SVGA_NO_SAMPLER_VIEW", FALSE);
445
446 screen = &svgascreen->screen;
447
448 screen->destroy = svga_destroy_screen;
449 screen->get_name = svga_get_name;
450 screen->get_vendor = svga_get_vendor;
451 screen->get_param = svga_get_param;
452 screen->get_paramf = svga_get_paramf;
453 screen->is_format_supported = svga_is_format_supported;
454 screen->context_create = svga_context_create;
455 screen->fence_reference = svga_fence_reference;
456 screen->fence_signalled = svga_fence_signalled;
457 screen->fence_finish = svga_fence_finish;
458 svgascreen->sws = sws;
459
460 svga_screen_init_surface_functions(screen);
461 svga_init_screen_resource_functions(svgascreen);
462
463 svgascreen->use_ps30 =
464 sws->get_cap(sws, SVGA3D_DEVCAP_FRAGMENT_SHADER_VERSION, &result) &&
465 result.u >= SVGA3DPSVERSION_30 ? TRUE : FALSE;
466
467 svgascreen->use_vs30 =
468 sws->get_cap(sws, SVGA3D_DEVCAP_VERTEX_SHADER_VERSION, &result) &&
469 result.u >= SVGA3DVSVERSION_30 ? TRUE : FALSE;
470
471 #if 1
472 /* Shader model 2.0 is unsupported at the moment. */
473 if(!svgascreen->use_ps30 || !svgascreen->use_vs30)
474 goto error2;
475 #else
476 if(debug_get_bool_option("SVGA_NO_SM30", FALSE))
477 svgascreen->use_vs30 = svgascreen->use_ps30 = FALSE;
478 #endif
479
480 pipe_mutex_init(svgascreen->tex_mutex);
481 pipe_mutex_init(svgascreen->swc_mutex);
482
483 svga_screen_cache_init(svgascreen);
484
485 return screen;
486 error2:
487 FREE(svgascreen);
488 error1:
489 return NULL;
490 }
491
492 struct svga_winsys_screen *
493 svga_winsys_screen(struct pipe_screen *screen)
494 {
495 return svga_screen(screen)->sws;
496 }
497
#ifdef DEBUG
/**
 * Checked cast from pipe_screen to svga_screen (DEBUG builds only).
 *
 * Asserts that the pointer is non-NULL and that its destroy callback is
 * svga_destroy_screen before casting.
 */
struct svga_screen *
svga_screen(struct pipe_screen *screen)
{
   struct svga_screen *svgascreen;

   assert(screen);
   assert(screen->destroy == svga_destroy_screen);

   svgascreen = (struct svga_screen *)screen;
   return svgascreen;
}
#endif