softpipe: add support for compute shaders. (v2)
[mesa.git] / src / gallium / drivers / softpipe / sp_screen.c
1 /**************************************************************************
2 *
3 * Copyright 2008 VMware, Inc.
4 * All Rights Reserved.
5 *
6 * Permission is hereby granted, free of charge, to any person obtaining a
7 * copy of this software and associated documentation files (the
8 * "Software"), to deal in the Software without restriction, including
9 * without limitation the rights to use, copy, modify, merge, publish,
10 * distribute, sub license, and/or sell copies of the Software, and to
11 * permit persons to whom the Software is furnished to do so, subject to
12 * the following conditions:
13 *
14 * The above copyright notice and this permission notice (including the
15 * next paragraph) shall be included in all copies or substantial portions
16 * of the Software.
17 *
18 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS
19 * OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF
20 * MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND NON-INFRINGEMENT.
21 * IN NO EVENT SHALL VMWARE AND/OR ITS SUPPLIERS BE LIABLE FOR
22 * ANY CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT,
23 * TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN CONNECTION WITH THE
24 * SOFTWARE OR THE USE OR OTHER DEALINGS IN THE SOFTWARE.
25 *
26 **************************************************************************/
27
28
29 #include "util/u_memory.h"
30 #include "util/u_format.h"
31 #include "util/u_format_s3tc.h"
32 #include "util/u_video.h"
33 #include "os/os_misc.h"
34 #include "os/os_time.h"
35 #include "pipe/p_defines.h"
36 #include "pipe/p_screen.h"
37 #include "draw/draw_context.h"
38
39 #include "state_tracker/sw_winsys.h"
40 #include "tgsi/tgsi_exec.h"
41
42 #include "sp_texture.h"
43 #include "sp_screen.h"
44 #include "sp_context.h"
45 #include "sp_fence.h"
46 #include "sp_public.h"
47
/* NOTE(review): presumably expands to the debug_get_option_use_llvm()
 * accessor that softpipe_create_screen() calls, reading the
 * SOFTPIPE_USE_LLVM option with FALSE as its default -- confirm against the
 * DEBUG_GET_ONCE_BOOL_OPTION macro definition.
 */
48 DEBUG_GET_ONCE_BOOL_OPTION(use_llvm, "SOFTPIPE_USE_LLVM", FALSE)
49
/**
 * Return the vendor string reported for this driver.
 *
 * \param screen  unused
 * \return pointer to a static, NUL-terminated string
 */
static const char *
softpipe_get_vendor(struct pipe_screen *screen)
{
   static const char vendor_name[] = "VMware, Inc.";

   (void) screen;
   return vendor_name;
}
55
56
/**
 * Return the driver name.
 *
 * \param screen  unused
 * \return pointer to a static, NUL-terminated string
 */
static const char *
softpipe_get_name(struct pipe_screen *screen)
{
   static const char driver_name[] = "softpipe";

   (void) screen;
   return driver_name;
}
62
63
64 static int
65 softpipe_get_param(struct pipe_screen *screen, enum pipe_cap param)
66 {
67 switch (param) {
68 case PIPE_CAP_NPOT_TEXTURES:
69 case PIPE_CAP_MIXED_FRAMEBUFFER_SIZES:
70 return 1;
71 case PIPE_CAP_TWO_SIDED_STENCIL:
72 return 1;
73 case PIPE_CAP_SM3:
74 return 1;
75 case PIPE_CAP_ANISOTROPIC_FILTER:
76 return 1;
77 case PIPE_CAP_POINT_SPRITE:
78 return 1;
79 case PIPE_CAP_MAX_RENDER_TARGETS:
80 return PIPE_MAX_COLOR_BUFS;
81 case PIPE_CAP_MAX_DUAL_SOURCE_RENDER_TARGETS:
82 return 1;
83 case PIPE_CAP_OCCLUSION_QUERY:
84 return 1;
85 case PIPE_CAP_QUERY_TIME_ELAPSED:
86 return 1;
87 case PIPE_CAP_QUERY_PIPELINE_STATISTICS:
88 return 1;
89 case PIPE_CAP_TEXTURE_MIRROR_CLAMP:
90 return 1;
91 case PIPE_CAP_TEXTURE_SHADOW_MAP:
92 return 1;
93 case PIPE_CAP_TEXTURE_SWIZZLE:
94 return 1;
95 case PIPE_CAP_TEXTURE_BORDER_COLOR_QUIRK:
96 return 0;
97 case PIPE_CAP_MAX_TEXTURE_2D_LEVELS:
98 return SP_MAX_TEXTURE_2D_LEVELS;
99 case PIPE_CAP_MAX_TEXTURE_3D_LEVELS:
100 return SP_MAX_TEXTURE_3D_LEVELS;
101 case PIPE_CAP_MAX_TEXTURE_CUBE_LEVELS:
102 return SP_MAX_TEXTURE_CUBE_LEVELS;
103 case PIPE_CAP_BLEND_EQUATION_SEPARATE:
104 return 1;
105 case PIPE_CAP_INDEP_BLEND_ENABLE:
106 return 1;
107 case PIPE_CAP_INDEP_BLEND_FUNC:
108 return 1;
109 case PIPE_CAP_TGSI_FS_COORD_ORIGIN_UPPER_LEFT:
110 case PIPE_CAP_TGSI_FS_COORD_ORIGIN_LOWER_LEFT:
111 case PIPE_CAP_TGSI_FS_COORD_PIXEL_CENTER_HALF_INTEGER:
112 case PIPE_CAP_TGSI_FS_COORD_PIXEL_CENTER_INTEGER:
113 return 1;
114 case PIPE_CAP_DEPTH_CLIP_DISABLE:
115 return 1;
116 case PIPE_CAP_MAX_STREAM_OUTPUT_BUFFERS:
117 return PIPE_MAX_SO_BUFFERS;
118 case PIPE_CAP_MAX_STREAM_OUTPUT_SEPARATE_COMPONENTS:
119 case PIPE_CAP_MAX_STREAM_OUTPUT_INTERLEAVED_COMPONENTS:
120 return 16*4;
121 case PIPE_CAP_MAX_GEOMETRY_OUTPUT_VERTICES:
122 case PIPE_CAP_MAX_GEOMETRY_TOTAL_OUTPUT_COMPONENTS:
123 return 1024;
124 case PIPE_CAP_MAX_VERTEX_STREAMS:
125 return 1;
126 case PIPE_CAP_MAX_VERTEX_ATTRIB_STRIDE:
127 return 2048;
128 case PIPE_CAP_PRIMITIVE_RESTART:
129 return 1;
130 case PIPE_CAP_SHADER_STENCIL_EXPORT:
131 return 1;
132 case PIPE_CAP_TGSI_INSTANCEID:
133 case PIPE_CAP_VERTEX_ELEMENT_INSTANCE_DIVISOR:
134 case PIPE_CAP_START_INSTANCE:
135 return 1;
136 case PIPE_CAP_SEAMLESS_CUBE_MAP:
137 case PIPE_CAP_SEAMLESS_CUBE_MAP_PER_TEXTURE:
138 return 1;
139 case PIPE_CAP_MAX_TEXTURE_ARRAY_LAYERS:
140 return 256; /* for GL3 */
141 case PIPE_CAP_MIN_TEXEL_OFFSET:
142 return -8;
143 case PIPE_CAP_MAX_TEXEL_OFFSET:
144 return 7;
145 case PIPE_CAP_CONDITIONAL_RENDER:
146 return 1;
147 case PIPE_CAP_TEXTURE_BARRIER:
148 return 0;
149 case PIPE_CAP_FRAGMENT_COLOR_CLAMPED:
150 case PIPE_CAP_VERTEX_COLOR_UNCLAMPED: /* draw module */
151 case PIPE_CAP_VERTEX_COLOR_CLAMPED: /* draw module */
152 return 1;
153 case PIPE_CAP_MIXED_COLORBUFFER_FORMATS:
154 return 0;
155 case PIPE_CAP_GLSL_FEATURE_LEVEL:
156 return 330;
157 case PIPE_CAP_QUADS_FOLLOW_PROVOKING_VERTEX_CONVENTION:
158 return 0;
159 case PIPE_CAP_COMPUTE:
160 return 1;
161 case PIPE_CAP_USER_VERTEX_BUFFERS:
162 case PIPE_CAP_USER_INDEX_BUFFERS:
163 case PIPE_CAP_USER_CONSTANT_BUFFERS:
164 case PIPE_CAP_STREAM_OUTPUT_PAUSE_RESUME:
165 case PIPE_CAP_TGSI_VS_LAYER_VIEWPORT:
166 return 1;
167 case PIPE_CAP_CONSTANT_BUFFER_OFFSET_ALIGNMENT:
168 return 16;
169 case PIPE_CAP_TGSI_CAN_COMPACT_CONSTANTS:
170 case PIPE_CAP_VERTEX_BUFFER_OFFSET_4BYTE_ALIGNED_ONLY:
171 case PIPE_CAP_VERTEX_BUFFER_STRIDE_4BYTE_ALIGNED_ONLY:
172 case PIPE_CAP_VERTEX_ELEMENT_SRC_OFFSET_4BYTE_ALIGNED_ONLY:
173 case PIPE_CAP_TEXTURE_MULTISAMPLE:
174 return 0;
175 case PIPE_CAP_MIN_MAP_BUFFER_ALIGNMENT:
176 return 64;
177 case PIPE_CAP_QUERY_TIMESTAMP:
178 case PIPE_CAP_CUBE_MAP_ARRAY:
179 return 1;
180 case PIPE_CAP_TEXTURE_BUFFER_OBJECTS:
181 return 1;
182 case PIPE_CAP_BUFFER_SAMPLER_VIEW_RGBA_ONLY:
183 return 0;
184 case PIPE_CAP_MAX_TEXTURE_BUFFER_SIZE:
185 return 65536;
186 case PIPE_CAP_TEXTURE_BUFFER_OFFSET_ALIGNMENT:
187 return 0;
188 case PIPE_CAP_TGSI_TEXCOORD:
189 case PIPE_CAP_PREFER_BLIT_BASED_TEXTURE_TRANSFER:
190 return 0;
191 case PIPE_CAP_MAX_VIEWPORTS:
192 return PIPE_MAX_VIEWPORTS;
193 case PIPE_CAP_ENDIANNESS:
194 return PIPE_ENDIAN_NATIVE;
195 case PIPE_CAP_MAX_TEXTURE_GATHER_COMPONENTS:
196 return 4;
197 case PIPE_CAP_TEXTURE_GATHER_SM5:
198 case PIPE_CAP_TEXTURE_QUERY_LOD:
199 return 1;
200 case PIPE_CAP_BUFFER_MAP_PERSISTENT_COHERENT:
201 case PIPE_CAP_SAMPLE_SHADING:
202 case PIPE_CAP_TEXTURE_GATHER_OFFSETS:
203 return 0;
204 case PIPE_CAP_TGSI_VS_WINDOW_SPACE_POSITION:
205 return 1;
206 case PIPE_CAP_TGSI_FS_FINE_DERIVATIVE:
207 return 0;
208 case PIPE_CAP_SAMPLER_VIEW_TARGET:
209 return 1;
210 case PIPE_CAP_FAKE_SW_MSAA:
211 return 1;
212 case PIPE_CAP_MIN_TEXTURE_GATHER_OFFSET:
213 return -32;
214 case PIPE_CAP_MAX_TEXTURE_GATHER_OFFSET:
215 return 31;
216 case PIPE_CAP_DRAW_INDIRECT:
217 return 1;
218
219 case PIPE_CAP_VENDOR_ID:
220 return 0xFFFFFFFF;
221 case PIPE_CAP_DEVICE_ID:
222 return 0xFFFFFFFF;
223 case PIPE_CAP_ACCELERATED:
224 return 0;
225 case PIPE_CAP_VIDEO_MEMORY: {
226 /* XXX: Do we want to return the full amount fo system memory ? */
227 uint64_t system_memory;
228
229 if (!os_get_total_physical_memory(&system_memory))
230 return 0;
231
232 return (int)(system_memory >> 20);
233 }
234 case PIPE_CAP_UMA:
235 return 0;
236 case PIPE_CAP_CONDITIONAL_RENDER_INVERTED:
237 return 1;
238 case PIPE_CAP_CLIP_HALFZ:
239 case PIPE_CAP_TEXTURE_FLOAT_LINEAR:
240 case PIPE_CAP_TEXTURE_HALF_FLOAT_LINEAR:
241 return 1;
242 case PIPE_CAP_FRAMEBUFFER_NO_ATTACHMENT:
243 return 1;
244 case PIPE_CAP_VERTEXID_NOBASE:
245 return 0;
246 case PIPE_CAP_POLYGON_OFFSET_CLAMP:
247 return 0;
248 case PIPE_CAP_MULTISAMPLE_Z_RESOLVE:
249 case PIPE_CAP_RESOURCE_FROM_USER_MEMORY:
250 case PIPE_CAP_DEVICE_RESET_STATUS_QUERY:
251 case PIPE_CAP_MAX_SHADER_PATCH_VARYINGS:
252 case PIPE_CAP_DEPTH_BOUNDS_TEST:
253 case PIPE_CAP_TGSI_TXQS:
254 case PIPE_CAP_FORCE_PERSAMPLE_INTERP:
255 case PIPE_CAP_SHAREABLE_SHADERS:
256 case PIPE_CAP_COPY_BETWEEN_COMPRESSED_AND_PLAIN_FORMATS:
257 case PIPE_CAP_CLEAR_TEXTURE:
258 case PIPE_CAP_DRAW_PARAMETERS:
259 case PIPE_CAP_TGSI_PACK_HALF_FLOAT:
260 case PIPE_CAP_MULTI_DRAW_INDIRECT:
261 case PIPE_CAP_MULTI_DRAW_INDIRECT_PARAMS:
262 case PIPE_CAP_TGSI_FS_POSITION_IS_SYSVAL:
263 case PIPE_CAP_TGSI_FS_FACE_IS_INTEGER_SYSVAL:
264 case PIPE_CAP_INVALIDATE_BUFFER:
265 case PIPE_CAP_GENERATE_MIPMAP:
266 case PIPE_CAP_STRING_MARKER:
267 case PIPE_CAP_SURFACE_REINTERPRET_BLOCKS:
268 case PIPE_CAP_QUERY_BUFFER_OBJECT:
269 case PIPE_CAP_QUERY_MEMORY_INFO:
270 case PIPE_CAP_PCI_GROUP:
271 case PIPE_CAP_PCI_BUS:
272 case PIPE_CAP_PCI_DEVICE:
273 case PIPE_CAP_PCI_FUNCTION:
274 case PIPE_CAP_ROBUST_BUFFER_ACCESS_BEHAVIOR:
275 return 0;
276 case PIPE_CAP_SHADER_BUFFER_OFFSET_ALIGNMENT:
277 return 4;
278 }
279 /* should only get here on unhandled cases */
280 debug_printf("Unexpected PIPE_CAP %d query\n", param);
281 return 0;
282 }
283
284 static int
285 softpipe_get_shader_param(struct pipe_screen *screen, unsigned shader, enum pipe_shader_cap param)
286 {
287 struct softpipe_screen *sp_screen = softpipe_screen(screen);
288 switch(shader)
289 {
290 case PIPE_SHADER_FRAGMENT:
291 return tgsi_exec_get_shader_param(param);
292 case PIPE_SHADER_COMPUTE:
293 return tgsi_exec_get_shader_param(param);
294 case PIPE_SHADER_VERTEX:
295 case PIPE_SHADER_GEOMETRY:
296 if (sp_screen->use_llvm)
297 return draw_get_shader_param(shader, param);
298 else
299 return draw_get_shader_param_no_llvm(shader, param);
300 default:
301 return 0;
302 }
303 }
304
305 static float
306 softpipe_get_paramf(struct pipe_screen *screen, enum pipe_capf param)
307 {
308 switch (param) {
309 case PIPE_CAPF_MAX_LINE_WIDTH:
310 /* fall-through */
311 case PIPE_CAPF_MAX_LINE_WIDTH_AA:
312 return 255.0; /* arbitrary */
313 case PIPE_CAPF_MAX_POINT_WIDTH:
314 /* fall-through */
315 case PIPE_CAPF_MAX_POINT_WIDTH_AA:
316 return 255.0; /* arbitrary */
317 case PIPE_CAPF_MAX_TEXTURE_ANISOTROPY:
318 return 16.0;
319 case PIPE_CAPF_MAX_TEXTURE_LOD_BIAS:
320 return 16.0; /* arbitrary */
321 case PIPE_CAPF_GUARD_BAND_LEFT:
322 case PIPE_CAPF_GUARD_BAND_TOP:
323 case PIPE_CAPF_GUARD_BAND_RIGHT:
324 case PIPE_CAPF_GUARD_BAND_BOTTOM:
325 return 0.0;
326 }
327 /* should only get here on unhandled cases */
328 debug_printf("Unexpected PIPE_CAPF %d query\n", param);
329 return 0.0;
330 }
331
332 /**
333 * Query format support for creating a texture, drawing surface, etc.
334 * \param format the format to test
335 * \param type one of PIPE_TEXTURE, PIPE_SURFACE
336 */
337 static boolean
338 softpipe_is_format_supported( struct pipe_screen *screen,
339 enum pipe_format format,
340 enum pipe_texture_target target,
341 unsigned sample_count,
342 unsigned bind)
343 {
344 struct sw_winsys *winsys = softpipe_screen(screen)->winsys;
345 const struct util_format_description *format_desc;
346
347 assert(target == PIPE_BUFFER ||
348 target == PIPE_TEXTURE_1D ||
349 target == PIPE_TEXTURE_1D_ARRAY ||
350 target == PIPE_TEXTURE_2D ||
351 target == PIPE_TEXTURE_2D_ARRAY ||
352 target == PIPE_TEXTURE_RECT ||
353 target == PIPE_TEXTURE_3D ||
354 target == PIPE_TEXTURE_CUBE ||
355 target == PIPE_TEXTURE_CUBE_ARRAY);
356
357 format_desc = util_format_description(format);
358 if (!format_desc)
359 return FALSE;
360
361 if (sample_count > 1)
362 return FALSE;
363
364 if (bind & (PIPE_BIND_DISPLAY_TARGET |
365 PIPE_BIND_SCANOUT |
366 PIPE_BIND_SHARED)) {
367 if(!winsys->is_displaytarget_format_supported(winsys, bind, format))
368 return FALSE;
369 }
370
371 if (bind & PIPE_BIND_RENDER_TARGET) {
372 if (format_desc->colorspace == UTIL_FORMAT_COLORSPACE_ZS)
373 return FALSE;
374
375 /*
376 * Although possible, it is unnatural to render into compressed or YUV
377 * surfaces. So disable these here to avoid going into weird paths
378 * inside the state trackers.
379 */
380 if (format_desc->block.width != 1 ||
381 format_desc->block.height != 1)
382 return FALSE;
383 }
384
385 if (bind & PIPE_BIND_DEPTH_STENCIL) {
386 if (format_desc->colorspace != UTIL_FORMAT_COLORSPACE_ZS)
387 return FALSE;
388 }
389
390 if (format_desc->layout == UTIL_FORMAT_LAYOUT_BPTC ||
391 format_desc->layout == UTIL_FORMAT_LAYOUT_ASTC) {
392 /* Software decoding is not hooked up. */
393 return FALSE;
394 }
395
396 if (format_desc->layout == UTIL_FORMAT_LAYOUT_ETC &&
397 format != PIPE_FORMAT_ETC1_RGB8)
398 return FALSE;
399
400 /*
401 * All other operations (sampling, transfer, etc).
402 */
403
404 if (format_desc->layout == UTIL_FORMAT_LAYOUT_S3TC) {
405 return util_format_s3tc_enabled;
406 }
407
408 /*
409 * Everything else should be supported by u_format.
410 */
411 return TRUE;
412 }
413
414
415 static void
416 softpipe_destroy_screen( struct pipe_screen *screen )
417 {
418 struct softpipe_screen *sp_screen = softpipe_screen(screen);
419 struct sw_winsys *winsys = sp_screen->winsys;
420
421 if(winsys->destroy)
422 winsys->destroy(winsys);
423
424 FREE(screen);
425 }
426
427
428 /* This is often overriden by the co-state tracker.
429 */
430 static void
431 softpipe_flush_frontbuffer(struct pipe_screen *_screen,
432 struct pipe_resource *resource,
433 unsigned level, unsigned layer,
434 void *context_private,
435 struct pipe_box *sub_box)
436 {
437 struct softpipe_screen *screen = softpipe_screen(_screen);
438 struct sw_winsys *winsys = screen->winsys;
439 struct softpipe_resource *texture = softpipe_resource(resource);
440
441 assert(texture->dt);
442 if (texture->dt)
443 winsys->displaytarget_display(winsys, texture->dt, context_private, sub_box);
444 }
445
/**
 * Return the current timestamp as reported by os_time_get_nano().
 *
 * \param _screen  unused
 */
static uint64_t
softpipe_get_timestamp(struct pipe_screen *_screen)
{
   (void) _screen;

   return os_time_get_nano();
}
451
452 static int
453 softpipe_get_compute_param(struct pipe_screen *_screen,
454 enum pipe_shader_ir ir_type,
455 enum pipe_compute_cap param,
456 void *ret)
457 {
458 switch (param) {
459 case PIPE_COMPUTE_CAP_IR_TARGET:
460 return 0;
461 case PIPE_COMPUTE_CAP_MAX_GRID_SIZE:
462 if (ret) {
463 uint64_t *grid_size = ret;
464 grid_size[0] = 65535;
465 grid_size[1] = 65535;
466 grid_size[2] = 65535;
467 }
468 return 3 * sizeof(uint64_t) ;
469 case PIPE_COMPUTE_CAP_MAX_BLOCK_SIZE:
470 if (ret) {
471 uint64_t *block_size = ret;
472 block_size[0] = 1024;
473 block_size[1] = 1024;
474 block_size[2] = 1024;
475 }
476 return 3 * sizeof(uint64_t);
477 case PIPE_COMPUTE_CAP_MAX_THREADS_PER_BLOCK:
478 if (ret) {
479 uint64_t *max_threads_per_block = ret;
480 *max_threads_per_block = 1024;
481 }
482 return sizeof(uint64_t);
483 case PIPE_COMPUTE_CAP_MAX_LOCAL_SIZE:
484 if (ret) {
485 uint64_t *max_local_size = ret;
486 *max_local_size = 32768;
487 }
488 return sizeof(uint64_t);
489 case PIPE_COMPUTE_CAP_GRID_DIMENSION:
490 case PIPE_COMPUTE_CAP_MAX_GLOBAL_SIZE:
491 case PIPE_COMPUTE_CAP_MAX_PRIVATE_SIZE:
492 case PIPE_COMPUTE_CAP_MAX_INPUT_SIZE:
493 case PIPE_COMPUTE_CAP_MAX_MEM_ALLOC_SIZE:
494 case PIPE_COMPUTE_CAP_MAX_CLOCK_FREQUENCY:
495 case PIPE_COMPUTE_CAP_MAX_COMPUTE_UNITS:
496 case PIPE_COMPUTE_CAP_IMAGES_SUPPORTED:
497 case PIPE_COMPUTE_CAP_SUBGROUP_SIZE:
498 break;
499 }
500 return 0;
501 }
502
503 /**
504 * Create a new pipe_screen object
505 * Note: we're not presently subclassing pipe_screen (no softpipe_screen).
506 */
507 struct pipe_screen *
508 softpipe_create_screen(struct sw_winsys *winsys)
509 {
510 struct softpipe_screen *screen = CALLOC_STRUCT(softpipe_screen);
511
512 if (!screen)
513 return NULL;
514
515 screen->winsys = winsys;
516
517 screen->base.destroy = softpipe_destroy_screen;
518
519 screen->base.get_name = softpipe_get_name;
520 screen->base.get_vendor = softpipe_get_vendor;
521 screen->base.get_device_vendor = softpipe_get_vendor; // TODO should be the CPU vendor
522 screen->base.get_param = softpipe_get_param;
523 screen->base.get_shader_param = softpipe_get_shader_param;
524 screen->base.get_paramf = softpipe_get_paramf;
525 screen->base.get_timestamp = softpipe_get_timestamp;
526 screen->base.is_format_supported = softpipe_is_format_supported;
527 screen->base.context_create = softpipe_create_context;
528 screen->base.flush_frontbuffer = softpipe_flush_frontbuffer;
529 screen->base.get_compute_param = softpipe_get_compute_param;
530 screen->use_llvm = debug_get_option_use_llvm();
531
532 util_format_s3tc_init();
533
534 softpipe_init_screen_texture_funcs(&screen->base);
535 softpipe_init_screen_fence_funcs(&screen->base);
536
537 return &screen->base;
538 }