gallium: add PIPE_CAP_TEXTURE_BARRIER
[mesa.git] / src / gallium / drivers / r300 / r300_screen.c
1 /*
2 * Copyright 2008 Corbin Simpson <MostAwesomeDude@gmail.com>
3 * Copyright 2010 Marek Olšák <maraeo@gmail.com>
4 *
5 * Permission is hereby granted, free of charge, to any person obtaining a
6 * copy of this software and associated documentation files (the "Software"),
7 * to deal in the Software without restriction, including without limitation
8 * on the rights to use, copy, modify, merge, publish, distribute, sub
9 * license, and/or sell copies of the Software, and to permit persons to whom
10 * the Software is furnished to do so, subject to the following conditions:
11 *
12 * The above copyright notice and this permission notice (including the next
13 * paragraph) shall be included in all copies or substantial portions of the
14 * Software.
15 *
16 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
17 * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
18 * FITNESS FOR A PARTICULAR PURPOSE AND NON-INFRINGEMENT. IN NO EVENT SHALL
19 * THE AUTHOR(S) AND/OR THEIR SUPPLIERS BE LIABLE FOR ANY CLAIM,
20 * DAMAGES OR OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR
21 * OTHERWISE, ARISING FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE
22 * USE OR OTHER DEALINGS IN THE SOFTWARE. */
23
24 #include "util/u_format.h"
25 #include "util/u_format_s3tc.h"
26 #include "util/u_memory.h"
27 #include "os/os_time.h"
28 #include "vl/vl_decoder.h"
29 #include "vl/vl_video_buffer.h"
30
31 #include "r300_context.h"
32 #include "r300_texture.h"
33 #include "r300_screen_buffer.h"
34 #include "r300_state_inlines.h"
35 #include "r300_public.h"
36
37 #include "draw/draw_context.h"
38
/* Report the vendor string of this driver.
 *
 * Every r300 screen answers with the same project name (rather than the
 * name of any individual author), so the screen argument is not looked at.
 * The returned string has static storage and must not be freed. */
static const char* r300_get_vendor(struct pipe_screen* pscreen)
{
    static const char vendor[] = "X.Org R300 Project";

    (void)pscreen;
    return vendor;
}
49
/* Human-readable chip names. r300_get_name indexes this table with the
 * family stored in the screen caps, so the order of the entries matters.
 *
 * Both the strings and the pointers are const: the table is pure read-only
 * data and nothing should ever retarget an entry. */
static const char* const chip_families[] = {
    "ATI R300",
    "ATI R350",
    "ATI RV350",
    "ATI RV370",
    "ATI RV380",
    "ATI RS400",
    "ATI RC410",
    "ATI RS480",
    "ATI R420",
    "ATI R423",
    "ATI R430",
    "ATI R480",
    "ATI R481",
    "ATI RV410",
    "ATI RS600",
    "ATI RS690",
    "ATI RS740",
    "ATI RV515",
    "ATI R520",
    "ATI RV530",
    "ATI R580",
    "ATI RV560",
    "ATI RV570"
};
75
76 static const char* r300_get_name(struct pipe_screen* pscreen)
77 {
78 struct r300_screen* r300screen = r300_screen(pscreen);
79
80 return chip_families[r300screen->caps.family];
81 }
82
83 static int r300_get_param(struct pipe_screen* pscreen, enum pipe_cap param)
84 {
85 struct r300_screen* r300screen = r300_screen(pscreen);
86 boolean is_r500 = r300screen->caps.is_r500;
87
88 switch (param) {
89 /* Supported features (boolean caps). */
90 case PIPE_CAP_NPOT_TEXTURES:
91 case PIPE_CAP_TWO_SIDED_STENCIL:
92 case PIPE_CAP_GLSL:
93 /* I'll be frank. This is a lie.
94 *
95 * We don't truly support GLSL on any of this driver's chipsets.
96 * To be fair, no chipset supports the full GLSL specification
97 * to the best of our knowledge, but some of the less esoteric
98 * features are still missing here.
99 *
100 * Rather than cripple ourselves intentionally, I'm going to set
101 * this flag, and as Gallium's interface continues to change, I
102 * hope that this single monolithic GLSL enable can slowly get
103 * split down into many different pieces and the state tracker
104 * will handle fallbacks transparently, like it should.
105 *
106 * ~ C.
107 */
108 case PIPE_CAP_ANISOTROPIC_FILTER:
109 case PIPE_CAP_POINT_SPRITE:
110 case PIPE_CAP_OCCLUSION_QUERY:
111 case PIPE_CAP_TEXTURE_SHADOW_MAP:
112 case PIPE_CAP_TEXTURE_MIRROR_CLAMP:
113 case PIPE_CAP_BLEND_EQUATION_SEPARATE:
114 case PIPE_CAP_VERTEX_ELEMENT_INSTANCE_DIVISOR:
115 case PIPE_CAP_TGSI_FS_COORD_ORIGIN_UPPER_LEFT:
116 case PIPE_CAP_TGSI_FS_COORD_PIXEL_CENTER_HALF_INTEGER:
117 case PIPE_CAP_CONDITIONAL_RENDER:
118 case PIPE_CAP_TEXTURE_BARRIER:
119 return 1;
120
121 /* r300 cannot do swizzling of compressed textures. Supported otherwise. */
122 case PIPE_CAP_TEXTURE_SWIZZLE:
123 return util_format_s3tc_enabled ? r300screen->caps.dxtc_swizzle : 1;
124
125 /* Supported on r500 only. */
126 case PIPE_CAP_FRAGMENT_COLOR_CLAMP_CONTROL:
127 case PIPE_CAP_MIXED_COLORBUFFER_FORMATS:
128 case PIPE_CAP_SM3:
129 return is_r500 ? 1 : 0;
130
131 /* Unsupported features. */
132 case PIPE_CAP_TIMER_QUERY:
133 case PIPE_CAP_DUAL_SOURCE_BLEND:
134 case PIPE_CAP_INDEP_BLEND_ENABLE:
135 case PIPE_CAP_INDEP_BLEND_FUNC:
136 case PIPE_CAP_DEPTH_CLAMP:
137 case PIPE_CAP_DEPTHSTENCIL_CLEAR_SEPARATE:
138 case PIPE_CAP_SHADER_STENCIL_EXPORT:
139 case PIPE_CAP_MAX_TEXTURE_ARRAY_LAYERS:
140 case PIPE_CAP_TGSI_INSTANCEID:
141 case PIPE_CAP_TGSI_FS_COORD_ORIGIN_LOWER_LEFT:
142 case PIPE_CAP_TGSI_FS_COORD_PIXEL_CENTER_INTEGER:
143 case PIPE_CAP_SEAMLESS_CUBE_MAP:
144 case PIPE_CAP_SEAMLESS_CUBE_MAP_PER_TEXTURE:
145 case PIPE_CAP_SCALED_RESOLVE:
146 case PIPE_CAP_MIN_TEXEL_OFFSET:
147 case PIPE_CAP_MAX_TEXEL_OFFSET:
148 return 0;
149
150 /* SWTCL-only features. */
151 case PIPE_CAP_STREAM_OUTPUT:
152 case PIPE_CAP_PRIMITIVE_RESTART:
153 return !r300screen->caps.has_tcl;
154
155 /* Texturing. */
156 case PIPE_CAP_MAX_COMBINED_SAMPLERS:
157 return r300screen->caps.num_tex_units;
158 case PIPE_CAP_MAX_TEXTURE_2D_LEVELS:
159 case PIPE_CAP_MAX_TEXTURE_3D_LEVELS:
160 case PIPE_CAP_MAX_TEXTURE_CUBE_LEVELS:
161 /* 13 == 4096, 12 == 2048 */
162 return is_r500 ? 13 : 12;
163
164 /* Render targets. */
165 case PIPE_CAP_MAX_RENDER_TARGETS:
166 return 4;
167
168 default:
169 debug_printf("r300: Warning: Unknown CAP %d in get_param.\n",
170 param);
171 return 0;
172 }
173 }
174
175 static int r300_get_shader_param(struct pipe_screen *pscreen, unsigned shader, enum pipe_shader_cap param)
176 {
177 struct r300_screen* r300screen = r300_screen(pscreen);
178 boolean is_r400 = r300screen->caps.is_r400;
179 boolean is_r500 = r300screen->caps.is_r500;
180
181 switch (shader)
182 {
183 case PIPE_SHADER_FRAGMENT:
184 switch (param)
185 {
186 case PIPE_SHADER_CAP_MAX_INSTRUCTIONS:
187 return is_r500 || is_r400 ? 512 : 96;
188 case PIPE_SHADER_CAP_MAX_ALU_INSTRUCTIONS:
189 return is_r500 || is_r400 ? 512 : 64;
190 case PIPE_SHADER_CAP_MAX_TEX_INSTRUCTIONS:
191 return is_r500 || is_r400 ? 512 : 32;
192 case PIPE_SHADER_CAP_MAX_TEX_INDIRECTIONS:
193 return is_r500 ? 511 : 4;
194 case PIPE_SHADER_CAP_MAX_CONTROL_FLOW_DEPTH:
195 return is_r500 ? 64 : 0; /* Actually unlimited on r500. */
196 /* Fragment shader limits. */
197 case PIPE_SHADER_CAP_MAX_INPUTS:
198 /* 2 colors + 8 texcoords are always supported
199 * (minus fog and wpos).
200 *
201 * R500 has the ability to turn 3rd and 4th color into
202 * additional texcoords but there is no two-sided color
203 * selection then. However the facing bit can be used instead. */
204 return 10;
205 case PIPE_SHADER_CAP_MAX_CONSTS:
206 return is_r500 ? 256 : 32;
207 case PIPE_SHADER_CAP_MAX_CONST_BUFFERS:
208 return 1;
209 case PIPE_SHADER_CAP_MAX_TEMPS:
210 return is_r500 ? 128 : is_r400 ? 64 : 32;
211 case PIPE_SHADER_CAP_MAX_ADDRS:
212 return 0;
213 case PIPE_SHADER_CAP_MAX_PREDS:
214 return is_r500 ? 1 : 0;
215 case PIPE_SHADER_CAP_TGSI_CONT_SUPPORTED:
216 case PIPE_SHADER_CAP_INDIRECT_INPUT_ADDR:
217 case PIPE_SHADER_CAP_INDIRECT_OUTPUT_ADDR:
218 case PIPE_SHADER_CAP_INDIRECT_TEMP_ADDR:
219 case PIPE_SHADER_CAP_INDIRECT_CONST_ADDR:
220 case PIPE_SHADER_CAP_SUBROUTINES:
221 case PIPE_SHADER_CAP_INTEGERS:
222 return 0;
223 case PIPE_SHADER_CAP_MAX_TEXTURE_SAMPLERS:
224 return r300screen->caps.num_tex_units;
225 }
226 break;
227 case PIPE_SHADER_VERTEX:
228 if (!r300screen->caps.has_tcl) {
229 return draw_get_shader_param(shader, param);
230 }
231
232 switch (param)
233 {
234 case PIPE_SHADER_CAP_MAX_INSTRUCTIONS:
235 case PIPE_SHADER_CAP_MAX_ALU_INSTRUCTIONS:
236 return is_r500 ? 1024 : 256;
237 case PIPE_SHADER_CAP_MAX_TEX_INSTRUCTIONS:
238 case PIPE_SHADER_CAP_MAX_TEX_INDIRECTIONS:
239 return 0;
240 case PIPE_SHADER_CAP_MAX_CONTROL_FLOW_DEPTH:
241 return is_r500 ? 4 : 0; /* For loops; not sure about conditionals. */
242 case PIPE_SHADER_CAP_MAX_INPUTS:
243 return 16;
244 case PIPE_SHADER_CAP_MAX_CONSTS:
245 return 256;
246 case PIPE_SHADER_CAP_MAX_CONST_BUFFERS:
247 return 1;
248 case PIPE_SHADER_CAP_MAX_TEMPS:
249 return 32;
250 case PIPE_SHADER_CAP_MAX_ADDRS:
251 return 1; /* XXX guessed */
252 case PIPE_SHADER_CAP_MAX_PREDS:
253 return is_r500 ? 4 : 0; /* XXX guessed. */
254 case PIPE_SHADER_CAP_INDIRECT_CONST_ADDR:
255 return 1;
256 case PIPE_SHADER_CAP_TGSI_CONT_SUPPORTED:
257 case PIPE_SHADER_CAP_INDIRECT_INPUT_ADDR:
258 case PIPE_SHADER_CAP_INDIRECT_OUTPUT_ADDR:
259 case PIPE_SHADER_CAP_INDIRECT_TEMP_ADDR:
260 case PIPE_SHADER_CAP_SUBROUTINES:
261 case PIPE_SHADER_CAP_INTEGERS:
262 case PIPE_SHADER_CAP_MAX_TEXTURE_SAMPLERS:
263 return 0;
264 }
265 break;
266 default:
267 break;
268 }
269 return 0;
270 }
271
272 static float r300_get_paramf(struct pipe_screen* pscreen, enum pipe_cap param)
273 {
274 struct r300_screen* r300screen = r300_screen(pscreen);
275
276 switch (param) {
277 case PIPE_CAP_MAX_LINE_WIDTH:
278 case PIPE_CAP_MAX_LINE_WIDTH_AA:
279 case PIPE_CAP_MAX_POINT_WIDTH:
280 case PIPE_CAP_MAX_POINT_WIDTH_AA:
281 /* The maximum dimensions of the colorbuffer are our practical
282 * rendering limits. 2048 pixels should be enough for anybody. */
283 if (r300screen->caps.is_r500) {
284 return 4096.0f;
285 } else if (r300screen->caps.is_r400) {
286 return 4021.0f;
287 } else {
288 return 2560.0f;
289 }
290 case PIPE_CAP_MAX_TEXTURE_ANISOTROPY:
291 return 16.0f;
292 case PIPE_CAP_MAX_TEXTURE_LOD_BIAS:
293 return 16.0f;
294 case PIPE_CAP_GUARD_BAND_LEFT:
295 case PIPE_CAP_GUARD_BAND_TOP:
296 case PIPE_CAP_GUARD_BAND_RIGHT:
297 case PIPE_CAP_GUARD_BAND_BOTTOM:
298 /* XXX I don't know what these should be but the least we can do is
299 * silence the potential error message */
300 return 0.0f;
301 default:
302 debug_printf("r300: Warning: Unknown CAP %d in get_paramf.\n",
303 param);
304 return 0.0f;
305 }
306 }
307
308 static int r300_get_video_param(struct pipe_screen *screen,
309 enum pipe_video_profile profile,
310 enum pipe_video_cap param)
311 {
312 switch (param) {
313 case PIPE_VIDEO_CAP_SUPPORTED:
314 return vl_profile_supported(screen, profile);
315 case PIPE_VIDEO_CAP_NPOT_TEXTURES:
316 return 0;
317 case PIPE_VIDEO_CAP_MAX_WIDTH:
318 case PIPE_VIDEO_CAP_MAX_HEIGHT:
319 return vl_video_buffer_max_size(screen);
320 case PIPE_VIDEO_CAP_NUM_BUFFERS_DESIRED:
321 return vl_num_buffers_desired(screen, profile);
322 default:
323 return 0;
324 }
325 }
326
327 static boolean r300_is_format_supported(struct pipe_screen* screen,
328 enum pipe_format format,
329 enum pipe_texture_target target,
330 unsigned sample_count,
331 unsigned usage)
332 {
333 uint32_t retval = 0;
334 boolean drm_2_8_0 = r300_screen(screen)->info.drm_minor >= 8;
335 boolean is_r500 = r300_screen(screen)->caps.is_r500;
336 boolean is_r400 = r300_screen(screen)->caps.is_r400;
337 boolean is_color2101010 = format == PIPE_FORMAT_R10G10B10A2_UNORM ||
338 format == PIPE_FORMAT_R10G10B10X2_SNORM ||
339 format == PIPE_FORMAT_B10G10R10A2_UNORM ||
340 format == PIPE_FORMAT_R10SG10SB10SA2U_NORM;
341 boolean is_ati1n = format == PIPE_FORMAT_RGTC1_UNORM ||
342 format == PIPE_FORMAT_RGTC1_SNORM ||
343 format == PIPE_FORMAT_LATC1_UNORM ||
344 format == PIPE_FORMAT_LATC1_SNORM;
345 boolean is_ati2n = format == PIPE_FORMAT_RGTC2_UNORM ||
346 format == PIPE_FORMAT_RGTC2_SNORM ||
347 format == PIPE_FORMAT_LATC2_UNORM ||
348 format == PIPE_FORMAT_LATC2_SNORM;
349 boolean is_x16f_xy16f = format == PIPE_FORMAT_R16_FLOAT ||
350 format == PIPE_FORMAT_R16G16_FLOAT ||
351 format == PIPE_FORMAT_A16_FLOAT ||
352 format == PIPE_FORMAT_L16_FLOAT ||
353 format == PIPE_FORMAT_L16A16_FLOAT ||
354 format == PIPE_FORMAT_I16_FLOAT;
355 boolean is_half_float = format == PIPE_FORMAT_R16_FLOAT ||
356 format == PIPE_FORMAT_R16G16_FLOAT ||
357 format == PIPE_FORMAT_R16G16B16_FLOAT ||
358 format == PIPE_FORMAT_R16G16B16A16_FLOAT;
359
360 if (!util_format_is_supported(format, usage))
361 return FALSE;
362
363 /* Check multisampling support. */
364 switch (sample_count) {
365 case 0:
366 case 1:
367 break;
368 case 2:
369 case 3:
370 case 4:
371 case 6:
372 return FALSE;
373 #if 0
374 if (usage != PIPE_BIND_RENDER_TARGET ||
375 !util_format_is_rgba8_variant(
376 util_format_description(format))) {
377 return FALSE;
378 }
379 #endif
380 break;
381 default:
382 return FALSE;
383 }
384
385 /* Check sampler format support. */
386 if ((usage & PIPE_BIND_SAMPLER_VIEW) &&
387 /* ATI1N is r5xx-only. */
388 (is_r500 || !is_ati1n) &&
389 /* ATI2N is supported on r4xx-r5xx. */
390 (is_r400 || is_r500 || !is_ati2n) &&
391 /* R16F and RG16F texture support was added in as late as DRM 2.8.0 */
392 (drm_2_8_0 || !is_x16f_xy16f) &&
393 r300_is_sampler_format_supported(format)) {
394 retval |= PIPE_BIND_SAMPLER_VIEW;
395 }
396
397 /* Check colorbuffer format support. */
398 if ((usage & (PIPE_BIND_RENDER_TARGET |
399 PIPE_BIND_DISPLAY_TARGET |
400 PIPE_BIND_SCANOUT |
401 PIPE_BIND_SHARED)) &&
402 /* 2101010 cannot be rendered to on non-r5xx. */
403 (!is_color2101010 || (is_r500 && drm_2_8_0)) &&
404 r300_is_colorbuffer_format_supported(format)) {
405 retval |= usage &
406 (PIPE_BIND_RENDER_TARGET |
407 PIPE_BIND_DISPLAY_TARGET |
408 PIPE_BIND_SCANOUT |
409 PIPE_BIND_SHARED);
410 }
411
412 /* Check depth-stencil format support. */
413 if (usage & PIPE_BIND_DEPTH_STENCIL &&
414 r300_is_zs_format_supported(format)) {
415 retval |= PIPE_BIND_DEPTH_STENCIL;
416 }
417
418 /* Check vertex buffer format support. */
419 if (usage & PIPE_BIND_VERTEX_BUFFER &&
420 /* Half float is supported on >= RV350. */
421 (is_r400 || is_r500 || !is_half_float) &&
422 r300_translate_vertex_data_type(format) != R300_INVALID_FORMAT) {
423 retval |= PIPE_BIND_VERTEX_BUFFER;
424 }
425
426 /* Transfers are always supported. */
427 if (usage & PIPE_BIND_TRANSFER_READ)
428 retval |= PIPE_BIND_TRANSFER_READ;
429 if (usage & PIPE_BIND_TRANSFER_WRITE)
430 retval |= PIPE_BIND_TRANSFER_WRITE;
431
432 return retval == usage;
433 }
434
435 static void r300_destroy_screen(struct pipe_screen* pscreen)
436 {
437 struct r300_screen* r300screen = r300_screen(pscreen);
438 struct radeon_winsys *rws = radeon_winsys(pscreen);
439
440 util_slab_destroy(&r300screen->pool_buffers);
441 pipe_mutex_destroy(r300screen->num_contexts_mutex);
442
443 if (rws)
444 rws->destroy(rws);
445
446 FREE(r300screen);
447 }
448
/* Point *ptr at fence.
 *
 * Fence handles are pb_buffers in disguise, so this is a plain
 * pb_reference on the casted pointers; the reference bookkeeping is left
 * entirely to that helper. The screen argument is not used. */
static void r300_fence_reference(struct pipe_screen *screen,
                                 struct pipe_fence_handle **ptr,
                                 struct pipe_fence_handle *fence)
{
    struct pb_buffer **dst = (struct pb_buffer**)ptr;
    struct pb_buffer *src = (struct pb_buffer*)fence;

    pb_reference(dst, src);
}
456
457 static boolean r300_fence_signalled(struct pipe_screen *screen,
458 struct pipe_fence_handle *fence)
459 {
460 struct radeon_winsys *rws = r300_screen(screen)->rws;
461 struct pb_buffer *rfence = (struct pb_buffer*)fence;
462
463 return !rws->buffer_is_busy(rfence, RADEON_USAGE_READWRITE);
464 }
465
466 static boolean r300_fence_finish(struct pipe_screen *screen,
467 struct pipe_fence_handle *fence,
468 uint64_t timeout)
469 {
470 struct radeon_winsys *rws = r300_screen(screen)->rws;
471 struct pb_buffer *rfence = (struct pb_buffer*)fence;
472
473 if (timeout != PIPE_TIMEOUT_INFINITE) {
474 int64_t start_time = os_time_get();
475
476 /* Convert to microseconds. */
477 timeout /= 1000;
478
479 /* Wait in a loop. */
480 while (rws->buffer_is_busy(rfence, RADEON_USAGE_READWRITE)) {
481 if (os_time_get() - start_time >= timeout) {
482 return FALSE;
483 }
484 os_time_sleep(10);
485 }
486 return TRUE;
487 }
488
489 rws->buffer_wait(rfence, RADEON_USAGE_READWRITE);
490 return TRUE;
491 }
492
493 struct pipe_screen* r300_screen_create(struct radeon_winsys *rws)
494 {
495 struct r300_screen *r300screen = CALLOC_STRUCT(r300_screen);
496
497 if (!r300screen) {
498 FREE(r300screen);
499 return NULL;
500 }
501
502 rws->query_info(rws, &r300screen->info);
503
504 r300_init_debug(r300screen);
505 r300_parse_chipset(r300screen->info.pci_id, &r300screen->caps);
506
507 if (SCREEN_DBG_ON(r300screen, DBG_NO_ZMASK))
508 r300screen->caps.zmask_ram = 0;
509 if (SCREEN_DBG_ON(r300screen, DBG_NO_HIZ))
510 r300screen->caps.hiz_ram = 0;
511
512 if (r300screen->info.drm_minor < 8)
513 r300screen->caps.has_us_format = FALSE;
514
515 pipe_mutex_init(r300screen->num_contexts_mutex);
516
517 util_slab_create(&r300screen->pool_buffers,
518 sizeof(struct r300_resource), 64,
519 UTIL_SLAB_SINGLETHREADED);
520
521 r300screen->rws = rws;
522 r300screen->screen.winsys = (struct pipe_winsys*)rws;
523 r300screen->screen.destroy = r300_destroy_screen;
524 r300screen->screen.get_name = r300_get_name;
525 r300screen->screen.get_vendor = r300_get_vendor;
526 r300screen->screen.get_param = r300_get_param;
527 r300screen->screen.get_shader_param = r300_get_shader_param;
528 r300screen->screen.get_paramf = r300_get_paramf;
529 r300screen->screen.get_video_param = r300_get_video_param;
530 r300screen->screen.is_format_supported = r300_is_format_supported;
531 r300screen->screen.is_video_format_supported = vl_video_buffer_is_format_supported;
532 r300screen->screen.context_create = r300_create_context;
533 r300screen->screen.fence_reference = r300_fence_reference;
534 r300screen->screen.fence_signalled = r300_fence_signalled;
535 r300screen->screen.fence_finish = r300_fence_finish;
536
537 r300_init_screen_resource_functions(r300screen);
538
539 util_format_s3tc_init();
540
541 return &r300screen->screen;
542 }