Squash-merge branch 'gallium-clip-state'
[mesa.git] / src / gallium / drivers / r300 / r300_screen.c
1 /*
2 * Copyright 2008 Corbin Simpson <MostAwesomeDude@gmail.com>
3 * Copyright 2010 Marek Olšák <maraeo@gmail.com>
4 *
5 * Permission is hereby granted, free of charge, to any person obtaining a
6 * copy of this software and associated documentation files (the "Software"),
7 * to deal in the Software without restriction, including without limitation
8 * on the rights to use, copy, modify, merge, publish, distribute, sub
9 * license, and/or sell copies of the Software, and to permit persons to whom
10 * the Software is furnished to do so, subject to the following conditions:
11 *
12 * The above copyright notice and this permission notice (including the next
13 * paragraph) shall be included in all copies or substantial portions of the
14 * Software.
15 *
16 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
17 * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
18 * FITNESS FOR A PARTICULAR PURPOSE AND NON-INFRINGEMENT. IN NO EVENT SHALL
19 * THE AUTHOR(S) AND/OR THEIR SUPPLIERS BE LIABLE FOR ANY CLAIM,
20 * DAMAGES OR OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR
21 * OTHERWISE, ARISING FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE
22 * USE OR OTHER DEALINGS IN THE SOFTWARE. */
23
24 #include "util/u_format.h"
25 #include "util/u_format_s3tc.h"
26 #include "util/u_memory.h"
27 #include "os/os_time.h"
28 #include "vl/vl_decoder.h"
29 #include "vl/vl_video_buffer.h"
30
31 #include "r300_context.h"
32 #include "r300_texture.h"
33 #include "r300_screen_buffer.h"
34 #include "r300_state_inlines.h"
35 #include "r300_public.h"
36
37 #include "draw/draw_context.h"
38
39 /* Return the identifier behind whom the brave coders responsible for this
40 * amalgamation of code, sweat, and duct tape, routinely obscure their names.
41 *
42 * ...I should have just put "Corbin Simpson", but I'm not that cool.
43 *
44 * (Or egotistical. Yet.) */
static const char* r300_get_vendor(struct pipe_screen* pscreen)
{
    /* The vendor string is a fixed constant; the screen argument is not
     * consulted. */
    static const char vendor[] = "X.Org R300 Project";

    return vendor;
}
49
50 static const char* chip_families[] = {
51 "ATI R300",
52 "ATI R350",
53 "ATI RV350",
54 "ATI RV370",
55 "ATI RV380",
56 "ATI RS400",
57 "ATI RC410",
58 "ATI RS480",
59 "ATI R420",
60 "ATI R423",
61 "ATI R430",
62 "ATI R480",
63 "ATI R481",
64 "ATI RV410",
65 "ATI RS600",
66 "ATI RS690",
67 "ATI RS740",
68 "ATI RV515",
69 "ATI R520",
70 "ATI RV530",
71 "ATI R580",
72 "ATI RV560",
73 "ATI RV570"
74 };
75
76 static const char* r300_get_name(struct pipe_screen* pscreen)
77 {
78 struct r300_screen* r300screen = r300_screen(pscreen);
79
80 return chip_families[r300screen->caps.family];
81 }
82
83 static int r300_get_param(struct pipe_screen* pscreen, enum pipe_cap param)
84 {
85 struct r300_screen* r300screen = r300_screen(pscreen);
86 boolean is_r500 = r300screen->caps.is_r500;
87
88 switch (param) {
89 /* Supported features (boolean caps). */
90 case PIPE_CAP_NPOT_TEXTURES:
91 case PIPE_CAP_TWO_SIDED_STENCIL:
92 case PIPE_CAP_ANISOTROPIC_FILTER:
93 case PIPE_CAP_POINT_SPRITE:
94 case PIPE_CAP_OCCLUSION_QUERY:
95 case PIPE_CAP_TEXTURE_SHADOW_MAP:
96 case PIPE_CAP_TEXTURE_MIRROR_CLAMP:
97 case PIPE_CAP_BLEND_EQUATION_SEPARATE:
98 case PIPE_CAP_VERTEX_ELEMENT_INSTANCE_DIVISOR:
99 case PIPE_CAP_TGSI_FS_COORD_ORIGIN_UPPER_LEFT:
100 case PIPE_CAP_TGSI_FS_COORD_PIXEL_CENTER_HALF_INTEGER:
101 case PIPE_CAP_CONDITIONAL_RENDER:
102 case PIPE_CAP_TEXTURE_BARRIER:
103 case PIPE_CAP_TGSI_CAN_COMPACT_VARYINGS:
104 case PIPE_CAP_TGSI_CAN_COMPACT_CONSTANTS:
105 return 1;
106
107 /* r300 cannot do swizzling of compressed textures. Supported otherwise. */
108 case PIPE_CAP_TEXTURE_SWIZZLE:
109 return util_format_s3tc_enabled ? r300screen->caps.dxtc_swizzle : 1;
110
111 /* Supported on r500 only. */
112 case PIPE_CAP_FRAGMENT_COLOR_CLAMP_CONTROL:
113 case PIPE_CAP_MIXED_COLORBUFFER_FORMATS:
114 case PIPE_CAP_SM3:
115 return is_r500 ? 1 : 0;
116
117 /* Unsupported features. */
118 case PIPE_CAP_TIMER_QUERY:
119 case PIPE_CAP_DUAL_SOURCE_BLEND:
120 case PIPE_CAP_INDEP_BLEND_ENABLE:
121 case PIPE_CAP_INDEP_BLEND_FUNC:
122 case PIPE_CAP_DEPTH_CLIP_DISABLE:
123 case PIPE_CAP_DEPTHSTENCIL_CLEAR_SEPARATE:
124 case PIPE_CAP_SHADER_STENCIL_EXPORT:
125 case PIPE_CAP_MAX_TEXTURE_ARRAY_LAYERS:
126 case PIPE_CAP_TGSI_INSTANCEID:
127 case PIPE_CAP_TGSI_FS_COORD_ORIGIN_LOWER_LEFT:
128 case PIPE_CAP_TGSI_FS_COORD_PIXEL_CENTER_INTEGER:
129 case PIPE_CAP_SEAMLESS_CUBE_MAP:
130 case PIPE_CAP_SEAMLESS_CUBE_MAP_PER_TEXTURE:
131 case PIPE_CAP_SCALED_RESOLVE:
132 case PIPE_CAP_MIN_TEXEL_OFFSET:
133 case PIPE_CAP_MAX_TEXEL_OFFSET:
134 case PIPE_CAP_MAX_STREAM_OUTPUT_BUFFERS:
135 case PIPE_CAP_MAX_STREAM_OUTPUT_SEPARATE_COMPONENTS:
136 case PIPE_CAP_MAX_STREAM_OUTPUT_INTERLEAVED_COMPONENTS:
137 case PIPE_CAP_STREAM_OUTPUT_PAUSE_RESUME:
138 return 0;
139
140 /* SWTCL-only features. */
141 case PIPE_CAP_PRIMITIVE_RESTART:
142 return !r300screen->caps.has_tcl;
143
144 /* Texturing. */
145 case PIPE_CAP_MAX_COMBINED_SAMPLERS:
146 return r300screen->caps.num_tex_units;
147 case PIPE_CAP_MAX_TEXTURE_2D_LEVELS:
148 case PIPE_CAP_MAX_TEXTURE_3D_LEVELS:
149 case PIPE_CAP_MAX_TEXTURE_CUBE_LEVELS:
150 /* 13 == 4096, 12 == 2048 */
151 return is_r500 ? 13 : 12;
152
153 /* Render targets. */
154 case PIPE_CAP_MAX_RENDER_TARGETS:
155 return 4;
156 }
157 return 0;
158 }
159
160 static int r300_get_shader_param(struct pipe_screen *pscreen, unsigned shader, enum pipe_shader_cap param)
161 {
162 struct r300_screen* r300screen = r300_screen(pscreen);
163 boolean is_r400 = r300screen->caps.is_r400;
164 boolean is_r500 = r300screen->caps.is_r500;
165
166 switch (shader) {
167 case PIPE_SHADER_FRAGMENT:
168 switch (param)
169 {
170 case PIPE_SHADER_CAP_MAX_INSTRUCTIONS:
171 return is_r500 || is_r400 ? 512 : 96;
172 case PIPE_SHADER_CAP_MAX_ALU_INSTRUCTIONS:
173 return is_r500 || is_r400 ? 512 : 64;
174 case PIPE_SHADER_CAP_MAX_TEX_INSTRUCTIONS:
175 return is_r500 || is_r400 ? 512 : 32;
176 case PIPE_SHADER_CAP_MAX_TEX_INDIRECTIONS:
177 return is_r500 ? 511 : 4;
178 case PIPE_SHADER_CAP_MAX_CONTROL_FLOW_DEPTH:
179 return is_r500 ? 64 : 0; /* Actually unlimited on r500. */
180 /* Fragment shader limits. */
181 case PIPE_SHADER_CAP_MAX_INPUTS:
182 /* 2 colors + 8 texcoords are always supported
183 * (minus fog and wpos).
184 *
185 * R500 has the ability to turn 3rd and 4th color into
186 * additional texcoords but there is no two-sided color
187 * selection then. However the facing bit can be used instead. */
188 return 10;
189 case PIPE_SHADER_CAP_MAX_CONSTS:
190 return is_r500 ? 256 : 32;
191 case PIPE_SHADER_CAP_MAX_CONST_BUFFERS:
192 return 1;
193 case PIPE_SHADER_CAP_MAX_TEMPS:
194 return is_r500 ? 128 : is_r400 ? 64 : 32;
195 case PIPE_SHADER_CAP_MAX_PREDS:
196 return is_r500 ? 1 : 0;
197 case PIPE_SHADER_CAP_MAX_TEXTURE_SAMPLERS:
198 return r300screen->caps.num_tex_units;
199 case PIPE_SHADER_CAP_MAX_ADDRS:
200 case PIPE_SHADER_CAP_TGSI_CONT_SUPPORTED:
201 case PIPE_SHADER_CAP_INDIRECT_INPUT_ADDR:
202 case PIPE_SHADER_CAP_INDIRECT_OUTPUT_ADDR:
203 case PIPE_SHADER_CAP_INDIRECT_TEMP_ADDR:
204 case PIPE_SHADER_CAP_INDIRECT_CONST_ADDR:
205 case PIPE_SHADER_CAP_SUBROUTINES:
206 case PIPE_SHADER_CAP_INTEGERS:
207 case PIPE_SHADER_CAP_OUTPUT_READ:
208 return 0;
209 }
210 break;
211 case PIPE_SHADER_VERTEX:
212 switch (param)
213 {
214 case PIPE_SHADER_CAP_MAX_TEXTURE_SAMPLERS:
215 return 0;
216 default:;
217 }
218
219 if (!r300screen->caps.has_tcl) {
220 return draw_get_shader_param(shader, param);
221 }
222
223 switch (param)
224 {
225 case PIPE_SHADER_CAP_MAX_INSTRUCTIONS:
226 case PIPE_SHADER_CAP_MAX_ALU_INSTRUCTIONS:
227 return is_r500 ? 1024 : 256;
228 case PIPE_SHADER_CAP_MAX_CONTROL_FLOW_DEPTH:
229 return is_r500 ? 4 : 0; /* For loops; not sure about conditionals. */
230 case PIPE_SHADER_CAP_MAX_INPUTS:
231 return 16;
232 case PIPE_SHADER_CAP_MAX_CONSTS:
233 return 256;
234 case PIPE_SHADER_CAP_MAX_CONST_BUFFERS:
235 return 1;
236 case PIPE_SHADER_CAP_MAX_TEMPS:
237 return 32;
238 case PIPE_SHADER_CAP_MAX_ADDRS:
239 return 1; /* XXX guessed */
240 case PIPE_SHADER_CAP_MAX_PREDS:
241 return is_r500 ? 4 : 0; /* XXX guessed. */
242 case PIPE_SHADER_CAP_INDIRECT_CONST_ADDR:
243 return 1;
244 case PIPE_SHADER_CAP_MAX_TEX_INSTRUCTIONS:
245 case PIPE_SHADER_CAP_MAX_TEX_INDIRECTIONS:
246 case PIPE_SHADER_CAP_TGSI_CONT_SUPPORTED:
247 case PIPE_SHADER_CAP_INDIRECT_INPUT_ADDR:
248 case PIPE_SHADER_CAP_INDIRECT_OUTPUT_ADDR:
249 case PIPE_SHADER_CAP_INDIRECT_TEMP_ADDR:
250 case PIPE_SHADER_CAP_SUBROUTINES:
251 case PIPE_SHADER_CAP_INTEGERS:
252 case PIPE_SHADER_CAP_MAX_TEXTURE_SAMPLERS:
253 case PIPE_SHADER_CAP_OUTPUT_READ:
254 return 0;
255 }
256 break;
257 }
258 return 0;
259 }
260
261 static float r300_get_paramf(struct pipe_screen* pscreen,
262 enum pipe_capf param)
263 {
264 struct r300_screen* r300screen = r300_screen(pscreen);
265
266 switch (param) {
267 case PIPE_CAPF_MAX_LINE_WIDTH:
268 case PIPE_CAPF_MAX_LINE_WIDTH_AA:
269 case PIPE_CAPF_MAX_POINT_WIDTH:
270 case PIPE_CAPF_MAX_POINT_WIDTH_AA:
271 /* The maximum dimensions of the colorbuffer are our practical
272 * rendering limits. 2048 pixels should be enough for anybody. */
273 if (r300screen->caps.is_r500) {
274 return 4096.0f;
275 } else if (r300screen->caps.is_r400) {
276 return 4021.0f;
277 } else {
278 return 2560.0f;
279 }
280 case PIPE_CAPF_MAX_TEXTURE_ANISOTROPY:
281 return 16.0f;
282 case PIPE_CAPF_MAX_TEXTURE_LOD_BIAS:
283 return 16.0f;
284 case PIPE_CAPF_GUARD_BAND_LEFT:
285 case PIPE_CAPF_GUARD_BAND_TOP:
286 case PIPE_CAPF_GUARD_BAND_RIGHT:
287 case PIPE_CAPF_GUARD_BAND_BOTTOM:
288 /* XXX I don't know what these should be but the least we can do is
289 * silence the potential error message */
290 return 0.0f;
291 default:
292 debug_printf("r300: Warning: Unknown CAP %d in get_paramf.\n",
293 param);
294 return 0.0f;
295 }
296 }
297
298 static int r300_get_video_param(struct pipe_screen *screen,
299 enum pipe_video_profile profile,
300 enum pipe_video_cap param)
301 {
302 switch (param) {
303 case PIPE_VIDEO_CAP_SUPPORTED:
304 return vl_profile_supported(screen, profile);
305 case PIPE_VIDEO_CAP_NPOT_TEXTURES:
306 return 0;
307 case PIPE_VIDEO_CAP_MAX_WIDTH:
308 case PIPE_VIDEO_CAP_MAX_HEIGHT:
309 return vl_video_buffer_max_size(screen);
310 default:
311 return 0;
312 }
313 }
314
315 static boolean r300_is_format_supported(struct pipe_screen* screen,
316 enum pipe_format format,
317 enum pipe_texture_target target,
318 unsigned sample_count,
319 unsigned usage)
320 {
321 uint32_t retval = 0;
322 boolean drm_2_8_0 = r300_screen(screen)->info.drm_minor >= 8;
323 boolean is_r500 = r300_screen(screen)->caps.is_r500;
324 boolean is_r400 = r300_screen(screen)->caps.is_r400;
325 boolean is_color2101010 = format == PIPE_FORMAT_R10G10B10A2_UNORM ||
326 format == PIPE_FORMAT_R10G10B10X2_SNORM ||
327 format == PIPE_FORMAT_B10G10R10A2_UNORM ||
328 format == PIPE_FORMAT_R10SG10SB10SA2U_NORM;
329 boolean is_ati1n = format == PIPE_FORMAT_RGTC1_UNORM ||
330 format == PIPE_FORMAT_RGTC1_SNORM ||
331 format == PIPE_FORMAT_LATC1_UNORM ||
332 format == PIPE_FORMAT_LATC1_SNORM;
333 boolean is_ati2n = format == PIPE_FORMAT_RGTC2_UNORM ||
334 format == PIPE_FORMAT_RGTC2_SNORM ||
335 format == PIPE_FORMAT_LATC2_UNORM ||
336 format == PIPE_FORMAT_LATC2_SNORM;
337 boolean is_x16f_xy16f = format == PIPE_FORMAT_R16_FLOAT ||
338 format == PIPE_FORMAT_R16G16_FLOAT ||
339 format == PIPE_FORMAT_A16_FLOAT ||
340 format == PIPE_FORMAT_L16_FLOAT ||
341 format == PIPE_FORMAT_L16A16_FLOAT ||
342 format == PIPE_FORMAT_I16_FLOAT;
343 boolean is_half_float = format == PIPE_FORMAT_R16_FLOAT ||
344 format == PIPE_FORMAT_R16G16_FLOAT ||
345 format == PIPE_FORMAT_R16G16B16_FLOAT ||
346 format == PIPE_FORMAT_R16G16B16A16_FLOAT;
347 boolean is_fixed = format == PIPE_FORMAT_R32_FIXED ||
348 format == PIPE_FORMAT_R32G32_FIXED ||
349 format == PIPE_FORMAT_R32G32B32_FIXED ||
350 format == PIPE_FORMAT_R32G32B32A32_FIXED;
351
352 if (!util_format_is_supported(format, usage))
353 return FALSE;
354
355 /* Check multisampling support. */
356 switch (sample_count) {
357 case 0:
358 case 1:
359 break;
360 case 2:
361 case 3:
362 case 4:
363 case 6:
364 return FALSE;
365 #if 0
366 if (usage != PIPE_BIND_RENDER_TARGET ||
367 !util_format_is_rgba8_variant(
368 util_format_description(format))) {
369 return FALSE;
370 }
371 #endif
372 break;
373 default:
374 return FALSE;
375 }
376
377 /* Check sampler format support. */
378 if ((usage & PIPE_BIND_SAMPLER_VIEW) &&
379 /* ATI1N is r5xx-only. */
380 (is_r500 || !is_ati1n) &&
381 /* ATI2N is supported on r4xx-r5xx. */
382 (is_r400 || is_r500 || !is_ati2n) &&
383 /* R16F and RG16F texture support was added in as late as DRM 2.8.0 */
384 (drm_2_8_0 || !is_x16f_xy16f) &&
385 r300_is_sampler_format_supported(format)) {
386 retval |= PIPE_BIND_SAMPLER_VIEW;
387 }
388
389 /* Check colorbuffer format support. */
390 if ((usage & (PIPE_BIND_RENDER_TARGET |
391 PIPE_BIND_DISPLAY_TARGET |
392 PIPE_BIND_SCANOUT |
393 PIPE_BIND_SHARED)) &&
394 /* 2101010 cannot be rendered to on non-r5xx. */
395 (!is_color2101010 || (is_r500 && drm_2_8_0)) &&
396 r300_is_colorbuffer_format_supported(format)) {
397 retval |= usage &
398 (PIPE_BIND_RENDER_TARGET |
399 PIPE_BIND_DISPLAY_TARGET |
400 PIPE_BIND_SCANOUT |
401 PIPE_BIND_SHARED);
402 }
403
404 /* Check depth-stencil format support. */
405 if (usage & PIPE_BIND_DEPTH_STENCIL &&
406 r300_is_zs_format_supported(format)) {
407 retval |= PIPE_BIND_DEPTH_STENCIL;
408 }
409
410 /* Check vertex buffer format support. */
411 if (usage & PIPE_BIND_VERTEX_BUFFER &&
412 /* Half float is supported on >= R400. */
413 (is_r400 || is_r500 || !is_half_float) &&
414 /* We have a fallback for FIXED. */
415 (is_fixed || r300_translate_vertex_data_type(format) != R300_INVALID_FORMAT)) {
416 retval |= PIPE_BIND_VERTEX_BUFFER;
417 }
418
419 /* Transfers are always supported. */
420 if (usage & PIPE_BIND_TRANSFER_READ)
421 retval |= PIPE_BIND_TRANSFER_READ;
422 if (usage & PIPE_BIND_TRANSFER_WRITE)
423 retval |= PIPE_BIND_TRANSFER_WRITE;
424
425 return retval == usage;
426 }
427
428 static void r300_destroy_screen(struct pipe_screen* pscreen)
429 {
430 struct r300_screen* r300screen = r300_screen(pscreen);
431 struct radeon_winsys *rws = radeon_winsys(pscreen);
432
433 util_slab_destroy(&r300screen->pool_buffers);
434 pipe_mutex_destroy(r300screen->num_contexts_mutex);
435
436 if (rws)
437 rws->destroy(rws);
438
439 FREE(r300screen);
440 }
441
/**
 * Point *ptr at a fence.
 *
 * Fence handles are treated as pb_buffer objects here, so the work is
 * delegated to pb_reference().
 *
 * \param screen  the screen (not consulted)
 * \param ptr     location of the fence reference to update
 * \param fence   the fence to reference
 */
static void r300_fence_reference(struct pipe_screen *screen,
                                 struct pipe_fence_handle **ptr,
                                 struct pipe_fence_handle *fence)
{
    struct pb_buffer **dst = (struct pb_buffer**)ptr;
    struct pb_buffer *src = (struct pb_buffer*)fence;

    pb_reference(dst, src);
}
449
450 static boolean r300_fence_signalled(struct pipe_screen *screen,
451 struct pipe_fence_handle *fence)
452 {
453 struct radeon_winsys *rws = r300_screen(screen)->rws;
454 struct pb_buffer *rfence = (struct pb_buffer*)fence;
455
456 return !rws->buffer_is_busy(rfence, RADEON_USAGE_READWRITE);
457 }
458
459 static boolean r300_fence_finish(struct pipe_screen *screen,
460 struct pipe_fence_handle *fence,
461 uint64_t timeout)
462 {
463 struct radeon_winsys *rws = r300_screen(screen)->rws;
464 struct pb_buffer *rfence = (struct pb_buffer*)fence;
465
466 if (timeout != PIPE_TIMEOUT_INFINITE) {
467 int64_t start_time = os_time_get();
468
469 /* Convert to microseconds. */
470 timeout /= 1000;
471
472 /* Wait in a loop. */
473 while (rws->buffer_is_busy(rfence, RADEON_USAGE_READWRITE)) {
474 if (os_time_get() - start_time >= timeout) {
475 return FALSE;
476 }
477 os_time_sleep(10);
478 }
479 return TRUE;
480 }
481
482 rws->buffer_wait(rfence, RADEON_USAGE_READWRITE);
483 return TRUE;
484 }
485
486 struct pipe_screen* r300_screen_create(struct radeon_winsys *rws)
487 {
488 struct r300_screen *r300screen = CALLOC_STRUCT(r300_screen);
489
490 if (!r300screen) {
491 FREE(r300screen);
492 return NULL;
493 }
494
495 rws->query_info(rws, &r300screen->info);
496
497 r300_init_debug(r300screen);
498 r300_parse_chipset(r300screen->info.pci_id, &r300screen->caps);
499
500 if (SCREEN_DBG_ON(r300screen, DBG_NO_ZMASK))
501 r300screen->caps.zmask_ram = 0;
502 if (SCREEN_DBG_ON(r300screen, DBG_NO_HIZ))
503 r300screen->caps.hiz_ram = 0;
504
505 if (r300screen->info.drm_minor < 8)
506 r300screen->caps.has_us_format = FALSE;
507
508 pipe_mutex_init(r300screen->num_contexts_mutex);
509
510 util_slab_create(&r300screen->pool_buffers,
511 sizeof(struct r300_resource), 64,
512 UTIL_SLAB_SINGLETHREADED);
513
514 r300screen->rws = rws;
515 r300screen->screen.winsys = (struct pipe_winsys*)rws;
516 r300screen->screen.destroy = r300_destroy_screen;
517 r300screen->screen.get_name = r300_get_name;
518 r300screen->screen.get_vendor = r300_get_vendor;
519 r300screen->screen.get_param = r300_get_param;
520 r300screen->screen.get_shader_param = r300_get_shader_param;
521 r300screen->screen.get_paramf = r300_get_paramf;
522 r300screen->screen.get_video_param = r300_get_video_param;
523 r300screen->screen.is_format_supported = r300_is_format_supported;
524 r300screen->screen.is_video_format_supported = vl_video_buffer_is_format_supported;
525 r300screen->screen.context_create = r300_create_context;
526 r300screen->screen.fence_reference = r300_fence_reference;
527 r300screen->screen.fence_signalled = r300_fence_signalled;
528 r300screen->screen.fence_finish = r300_fence_finish;
529
530 r300_init_screen_resource_functions(r300screen);
531
532 util_format_s3tc_init();
533
534 return &r300screen->screen;
535 }