r300g: set max vertex samplers to 0 on swtcl chipsets
[mesa.git] / src / gallium / drivers / r300 / r300_screen.c
1 /*
2 * Copyright 2008 Corbin Simpson <MostAwesomeDude@gmail.com>
3 * Copyright 2010 Marek Olšák <maraeo@gmail.com>
4 *
5 * Permission is hereby granted, free of charge, to any person obtaining a
6 * copy of this software and associated documentation files (the "Software"),
7 * to deal in the Software without restriction, including without limitation
8 * on the rights to use, copy, modify, merge, publish, distribute, sub
9 * license, and/or sell copies of the Software, and to permit persons to whom
10 * the Software is furnished to do so, subject to the following conditions:
11 *
12 * The above copyright notice and this permission notice (including the next
13 * paragraph) shall be included in all copies or substantial portions of the
14 * Software.
15 *
16 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
17 * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
18 * FITNESS FOR A PARTICULAR PURPOSE AND NON-INFRINGEMENT. IN NO EVENT SHALL
19 * THE AUTHOR(S) AND/OR THEIR SUPPLIERS BE LIABLE FOR ANY CLAIM,
20 * DAMAGES OR OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR
21 * OTHERWISE, ARISING FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE
22 * USE OR OTHER DEALINGS IN THE SOFTWARE. */
23
24 #include "util/u_format.h"
25 #include "util/u_format_s3tc.h"
26 #include "util/u_memory.h"
27 #include "os/os_time.h"
28 #include "vl/vl_decoder.h"
29 #include "vl/vl_video_buffer.h"
30
31 #include "r300_context.h"
32 #include "r300_texture.h"
33 #include "r300_screen_buffer.h"
34 #include "r300_state_inlines.h"
35 #include "r300_public.h"
36
37 #include "draw/draw_context.h"
38
39 /* Return the identifier behind whom the brave coders responsible for this
40 * amalgamation of code, sweat, and duct tape, routinely obscure their names.
41 *
42 * ...I should have just put "Corbin Simpson", but I'm not that cool.
43 *
44 * (Or egotistical. Yet.) */
static const char* r300_get_vendor(struct pipe_screen* pscreen)
{
    /* The vendor string is a fixed constant; pscreen is never consulted. */
    static const char vendor_name[] = "X.Org R300 Project";

    return vendor_name;
}
49
/* Printable chipset names.
 *
 * r300_get_name() uses caps.family directly as an index into this table,
 * so the order of the entries must not be changed. */
static const char* chip_families[] = {
    "ATI R300",  "ATI R350",  "ATI RV350", "ATI RV370",
    "ATI RV380", "ATI RS400", "ATI RC410", "ATI RS480",
    "ATI R420",  "ATI R423",  "ATI R430",  "ATI R480",
    "ATI R481",  "ATI RV410", "ATI RS600", "ATI RS690",
    "ATI RS740", "ATI RV515", "ATI R520",  "ATI RV530",
    "ATI R580",  "ATI RV560", "ATI RV570"
};
75
76 static const char* r300_get_name(struct pipe_screen* pscreen)
77 {
78 struct r300_screen* r300screen = r300_screen(pscreen);
79
80 return chip_families[r300screen->caps.family];
81 }
82
83 static int r300_get_param(struct pipe_screen* pscreen, enum pipe_cap param)
84 {
85 struct r300_screen* r300screen = r300_screen(pscreen);
86 boolean is_r500 = r300screen->caps.is_r500;
87
88 switch (param) {
89 /* Supported features (boolean caps). */
90 case PIPE_CAP_NPOT_TEXTURES:
91 case PIPE_CAP_TWO_SIDED_STENCIL:
92 case PIPE_CAP_GLSL:
93 /* I'll be frank. This is a lie.
94 *
95 * We don't truly support GLSL on any of this driver's chipsets.
96 * To be fair, no chipset supports the full GLSL specification
97 * to the best of our knowledge, but some of the less esoteric
98 * features are still missing here.
99 *
100 * Rather than cripple ourselves intentionally, I'm going to set
101 * this flag, and as Gallium's interface continues to change, I
102 * hope that this single monolithic GLSL enable can slowly get
103 * split down into many different pieces and the state tracker
104 * will handle fallbacks transparently, like it should.
105 *
106 * ~ C.
107 */
108 case PIPE_CAP_ANISOTROPIC_FILTER:
109 case PIPE_CAP_POINT_SPRITE:
110 case PIPE_CAP_OCCLUSION_QUERY:
111 case PIPE_CAP_TEXTURE_SHADOW_MAP:
112 case PIPE_CAP_TEXTURE_MIRROR_CLAMP:
113 case PIPE_CAP_BLEND_EQUATION_SEPARATE:
114 case PIPE_CAP_VERTEX_ELEMENT_INSTANCE_DIVISOR:
115 case PIPE_CAP_TGSI_FS_COORD_ORIGIN_UPPER_LEFT:
116 case PIPE_CAP_TGSI_FS_COORD_PIXEL_CENTER_HALF_INTEGER:
117 case PIPE_CAP_CONDITIONAL_RENDER:
118 case PIPE_CAP_TEXTURE_BARRIER:
119 return 1;
120
121 /* r300 cannot do swizzling of compressed textures. Supported otherwise. */
122 case PIPE_CAP_TEXTURE_SWIZZLE:
123 return util_format_s3tc_enabled ? r300screen->caps.dxtc_swizzle : 1;
124
125 /* Supported on r500 only. */
126 case PIPE_CAP_FRAGMENT_COLOR_CLAMP_CONTROL:
127 case PIPE_CAP_MIXED_COLORBUFFER_FORMATS:
128 case PIPE_CAP_SM3:
129 return is_r500 ? 1 : 0;
130
131 /* Unsupported features. */
132 case PIPE_CAP_TIMER_QUERY:
133 case PIPE_CAP_DUAL_SOURCE_BLEND:
134 case PIPE_CAP_INDEP_BLEND_ENABLE:
135 case PIPE_CAP_INDEP_BLEND_FUNC:
136 case PIPE_CAP_DEPTH_CLAMP:
137 case PIPE_CAP_DEPTHSTENCIL_CLEAR_SEPARATE:
138 case PIPE_CAP_SHADER_STENCIL_EXPORT:
139 case PIPE_CAP_MAX_TEXTURE_ARRAY_LAYERS:
140 case PIPE_CAP_TGSI_INSTANCEID:
141 case PIPE_CAP_TGSI_FS_COORD_ORIGIN_LOWER_LEFT:
142 case PIPE_CAP_TGSI_FS_COORD_PIXEL_CENTER_INTEGER:
143 case PIPE_CAP_SEAMLESS_CUBE_MAP:
144 case PIPE_CAP_SEAMLESS_CUBE_MAP_PER_TEXTURE:
145 case PIPE_CAP_SCALED_RESOLVE:
146 case PIPE_CAP_MIN_TEXEL_OFFSET:
147 case PIPE_CAP_MAX_TEXEL_OFFSET:
148 case PIPE_CAP_STREAM_OUTPUT:
149 return 0;
150
151 /* SWTCL-only features. */
152 case PIPE_CAP_PRIMITIVE_RESTART:
153 return !r300screen->caps.has_tcl;
154
155 /* Texturing. */
156 case PIPE_CAP_MAX_COMBINED_SAMPLERS:
157 return r300screen->caps.num_tex_units;
158 case PIPE_CAP_MAX_TEXTURE_2D_LEVELS:
159 case PIPE_CAP_MAX_TEXTURE_3D_LEVELS:
160 case PIPE_CAP_MAX_TEXTURE_CUBE_LEVELS:
161 /* 13 == 4096, 12 == 2048 */
162 return is_r500 ? 13 : 12;
163
164 /* Render targets. */
165 case PIPE_CAP_MAX_RENDER_TARGETS:
166 return 4;
167
168 default:
169 debug_printf("r300: Warning: Unknown CAP %d in get_param.\n",
170 param);
171 return 0;
172 }
173 }
174
175 static int r300_get_shader_param(struct pipe_screen *pscreen, unsigned shader, enum pipe_shader_cap param)
176 {
177 struct r300_screen* r300screen = r300_screen(pscreen);
178 boolean is_r400 = r300screen->caps.is_r400;
179 boolean is_r500 = r300screen->caps.is_r500;
180
181 switch (shader)
182 {
183 case PIPE_SHADER_FRAGMENT:
184 switch (param)
185 {
186 case PIPE_SHADER_CAP_MAX_INSTRUCTIONS:
187 return is_r500 || is_r400 ? 512 : 96;
188 case PIPE_SHADER_CAP_MAX_ALU_INSTRUCTIONS:
189 return is_r500 || is_r400 ? 512 : 64;
190 case PIPE_SHADER_CAP_MAX_TEX_INSTRUCTIONS:
191 return is_r500 || is_r400 ? 512 : 32;
192 case PIPE_SHADER_CAP_MAX_TEX_INDIRECTIONS:
193 return is_r500 ? 511 : 4;
194 case PIPE_SHADER_CAP_MAX_CONTROL_FLOW_DEPTH:
195 return is_r500 ? 64 : 0; /* Actually unlimited on r500. */
196 /* Fragment shader limits. */
197 case PIPE_SHADER_CAP_MAX_INPUTS:
198 /* 2 colors + 8 texcoords are always supported
199 * (minus fog and wpos).
200 *
201 * R500 has the ability to turn 3rd and 4th color into
202 * additional texcoords but there is no two-sided color
203 * selection then. However the facing bit can be used instead. */
204 return 10;
205 case PIPE_SHADER_CAP_MAX_CONSTS:
206 return is_r500 ? 256 : 32;
207 case PIPE_SHADER_CAP_MAX_CONST_BUFFERS:
208 return 1;
209 case PIPE_SHADER_CAP_MAX_TEMPS:
210 return is_r500 ? 128 : is_r400 ? 64 : 32;
211 case PIPE_SHADER_CAP_MAX_ADDRS:
212 return 0;
213 case PIPE_SHADER_CAP_MAX_PREDS:
214 return is_r500 ? 1 : 0;
215 case PIPE_SHADER_CAP_TGSI_CONT_SUPPORTED:
216 case PIPE_SHADER_CAP_INDIRECT_INPUT_ADDR:
217 case PIPE_SHADER_CAP_INDIRECT_OUTPUT_ADDR:
218 case PIPE_SHADER_CAP_INDIRECT_TEMP_ADDR:
219 case PIPE_SHADER_CAP_INDIRECT_CONST_ADDR:
220 case PIPE_SHADER_CAP_SUBROUTINES:
221 case PIPE_SHADER_CAP_INTEGERS:
222 return 0;
223 case PIPE_SHADER_CAP_MAX_TEXTURE_SAMPLERS:
224 return r300screen->caps.num_tex_units;
225 }
226 break;
227 case PIPE_SHADER_VERTEX:
228 switch (param)
229 {
230 case PIPE_SHADER_CAP_MAX_TEXTURE_SAMPLERS:
231 return 0;
232 default:;
233 }
234
235 if (!r300screen->caps.has_tcl) {
236 return draw_get_shader_param(shader, param);
237 }
238
239 switch (param)
240 {
241 case PIPE_SHADER_CAP_MAX_INSTRUCTIONS:
242 case PIPE_SHADER_CAP_MAX_ALU_INSTRUCTIONS:
243 return is_r500 ? 1024 : 256;
244 case PIPE_SHADER_CAP_MAX_TEX_INSTRUCTIONS:
245 case PIPE_SHADER_CAP_MAX_TEX_INDIRECTIONS:
246 return 0;
247 case PIPE_SHADER_CAP_MAX_CONTROL_FLOW_DEPTH:
248 return is_r500 ? 4 : 0; /* For loops; not sure about conditionals. */
249 case PIPE_SHADER_CAP_MAX_INPUTS:
250 return 16;
251 case PIPE_SHADER_CAP_MAX_CONSTS:
252 return 256;
253 case PIPE_SHADER_CAP_MAX_CONST_BUFFERS:
254 return 1;
255 case PIPE_SHADER_CAP_MAX_TEMPS:
256 return 32;
257 case PIPE_SHADER_CAP_MAX_ADDRS:
258 return 1; /* XXX guessed */
259 case PIPE_SHADER_CAP_MAX_PREDS:
260 return is_r500 ? 4 : 0; /* XXX guessed. */
261 case PIPE_SHADER_CAP_INDIRECT_CONST_ADDR:
262 return 1;
263 case PIPE_SHADER_CAP_TGSI_CONT_SUPPORTED:
264 case PIPE_SHADER_CAP_INDIRECT_INPUT_ADDR:
265 case PIPE_SHADER_CAP_INDIRECT_OUTPUT_ADDR:
266 case PIPE_SHADER_CAP_INDIRECT_TEMP_ADDR:
267 case PIPE_SHADER_CAP_SUBROUTINES:
268 case PIPE_SHADER_CAP_INTEGERS:
269 return 0;
270 default:;
271 }
272 break;
273 }
274 return 0;
275 }
276
277 static float r300_get_paramf(struct pipe_screen* pscreen, enum pipe_cap param)
278 {
279 struct r300_screen* r300screen = r300_screen(pscreen);
280
281 switch (param) {
282 case PIPE_CAP_MAX_LINE_WIDTH:
283 case PIPE_CAP_MAX_LINE_WIDTH_AA:
284 case PIPE_CAP_MAX_POINT_WIDTH:
285 case PIPE_CAP_MAX_POINT_WIDTH_AA:
286 /* The maximum dimensions of the colorbuffer are our practical
287 * rendering limits. 2048 pixels should be enough for anybody. */
288 if (r300screen->caps.is_r500) {
289 return 4096.0f;
290 } else if (r300screen->caps.is_r400) {
291 return 4021.0f;
292 } else {
293 return 2560.0f;
294 }
295 case PIPE_CAP_MAX_TEXTURE_ANISOTROPY:
296 return 16.0f;
297 case PIPE_CAP_MAX_TEXTURE_LOD_BIAS:
298 return 16.0f;
299 case PIPE_CAP_GUARD_BAND_LEFT:
300 case PIPE_CAP_GUARD_BAND_TOP:
301 case PIPE_CAP_GUARD_BAND_RIGHT:
302 case PIPE_CAP_GUARD_BAND_BOTTOM:
303 /* XXX I don't know what these should be but the least we can do is
304 * silence the potential error message */
305 return 0.0f;
306 default:
307 debug_printf("r300: Warning: Unknown CAP %d in get_paramf.\n",
308 param);
309 return 0.0f;
310 }
311 }
312
313 static int r300_get_video_param(struct pipe_screen *screen,
314 enum pipe_video_profile profile,
315 enum pipe_video_cap param)
316 {
317 switch (param) {
318 case PIPE_VIDEO_CAP_SUPPORTED:
319 return vl_profile_supported(screen, profile);
320 case PIPE_VIDEO_CAP_NPOT_TEXTURES:
321 return 0;
322 case PIPE_VIDEO_CAP_MAX_WIDTH:
323 case PIPE_VIDEO_CAP_MAX_HEIGHT:
324 return vl_video_buffer_max_size(screen);
325 case PIPE_VIDEO_CAP_NUM_BUFFERS_DESIRED:
326 return vl_num_buffers_desired(screen, profile);
327 default:
328 return 0;
329 }
330 }
331
332 static boolean r300_is_format_supported(struct pipe_screen* screen,
333 enum pipe_format format,
334 enum pipe_texture_target target,
335 unsigned sample_count,
336 unsigned usage)
337 {
338 uint32_t retval = 0;
339 boolean drm_2_8_0 = r300_screen(screen)->info.drm_minor >= 8;
340 boolean is_r500 = r300_screen(screen)->caps.is_r500;
341 boolean is_r400 = r300_screen(screen)->caps.is_r400;
342 boolean is_color2101010 = format == PIPE_FORMAT_R10G10B10A2_UNORM ||
343 format == PIPE_FORMAT_R10G10B10X2_SNORM ||
344 format == PIPE_FORMAT_B10G10R10A2_UNORM ||
345 format == PIPE_FORMAT_R10SG10SB10SA2U_NORM;
346 boolean is_ati1n = format == PIPE_FORMAT_RGTC1_UNORM ||
347 format == PIPE_FORMAT_RGTC1_SNORM ||
348 format == PIPE_FORMAT_LATC1_UNORM ||
349 format == PIPE_FORMAT_LATC1_SNORM;
350 boolean is_ati2n = format == PIPE_FORMAT_RGTC2_UNORM ||
351 format == PIPE_FORMAT_RGTC2_SNORM ||
352 format == PIPE_FORMAT_LATC2_UNORM ||
353 format == PIPE_FORMAT_LATC2_SNORM;
354 boolean is_x16f_xy16f = format == PIPE_FORMAT_R16_FLOAT ||
355 format == PIPE_FORMAT_R16G16_FLOAT ||
356 format == PIPE_FORMAT_A16_FLOAT ||
357 format == PIPE_FORMAT_L16_FLOAT ||
358 format == PIPE_FORMAT_L16A16_FLOAT ||
359 format == PIPE_FORMAT_I16_FLOAT;
360 boolean is_half_float = format == PIPE_FORMAT_R16_FLOAT ||
361 format == PIPE_FORMAT_R16G16_FLOAT ||
362 format == PIPE_FORMAT_R16G16B16_FLOAT ||
363 format == PIPE_FORMAT_R16G16B16A16_FLOAT;
364
365 if (!util_format_is_supported(format, usage))
366 return FALSE;
367
368 /* Check multisampling support. */
369 switch (sample_count) {
370 case 0:
371 case 1:
372 break;
373 case 2:
374 case 3:
375 case 4:
376 case 6:
377 return FALSE;
378 #if 0
379 if (usage != PIPE_BIND_RENDER_TARGET ||
380 !util_format_is_rgba8_variant(
381 util_format_description(format))) {
382 return FALSE;
383 }
384 #endif
385 break;
386 default:
387 return FALSE;
388 }
389
390 /* Check sampler format support. */
391 if ((usage & PIPE_BIND_SAMPLER_VIEW) &&
392 /* ATI1N is r5xx-only. */
393 (is_r500 || !is_ati1n) &&
394 /* ATI2N is supported on r4xx-r5xx. */
395 (is_r400 || is_r500 || !is_ati2n) &&
396 /* R16F and RG16F texture support was added in as late as DRM 2.8.0 */
397 (drm_2_8_0 || !is_x16f_xy16f) &&
398 r300_is_sampler_format_supported(format)) {
399 retval |= PIPE_BIND_SAMPLER_VIEW;
400 }
401
402 /* Check colorbuffer format support. */
403 if ((usage & (PIPE_BIND_RENDER_TARGET |
404 PIPE_BIND_DISPLAY_TARGET |
405 PIPE_BIND_SCANOUT |
406 PIPE_BIND_SHARED)) &&
407 /* 2101010 cannot be rendered to on non-r5xx. */
408 (!is_color2101010 || (is_r500 && drm_2_8_0)) &&
409 r300_is_colorbuffer_format_supported(format)) {
410 retval |= usage &
411 (PIPE_BIND_RENDER_TARGET |
412 PIPE_BIND_DISPLAY_TARGET |
413 PIPE_BIND_SCANOUT |
414 PIPE_BIND_SHARED);
415 }
416
417 /* Check depth-stencil format support. */
418 if (usage & PIPE_BIND_DEPTH_STENCIL &&
419 r300_is_zs_format_supported(format)) {
420 retval |= PIPE_BIND_DEPTH_STENCIL;
421 }
422
423 /* Check vertex buffer format support. */
424 if (usage & PIPE_BIND_VERTEX_BUFFER &&
425 /* Half float is supported on >= RV350. */
426 (is_r400 || is_r500 || !is_half_float) &&
427 r300_translate_vertex_data_type(format) != R300_INVALID_FORMAT) {
428 retval |= PIPE_BIND_VERTEX_BUFFER;
429 }
430
431 /* Transfers are always supported. */
432 if (usage & PIPE_BIND_TRANSFER_READ)
433 retval |= PIPE_BIND_TRANSFER_READ;
434 if (usage & PIPE_BIND_TRANSFER_WRITE)
435 retval |= PIPE_BIND_TRANSFER_WRITE;
436
437 return retval == usage;
438 }
439
440 static void r300_destroy_screen(struct pipe_screen* pscreen)
441 {
442 struct r300_screen* r300screen = r300_screen(pscreen);
443 struct radeon_winsys *rws = radeon_winsys(pscreen);
444
445 util_slab_destroy(&r300screen->pool_buffers);
446 pipe_mutex_destroy(r300screen->num_contexts_mutex);
447
448 if (rws)
449 rws->destroy(rws);
450
451 FREE(r300screen);
452 }
453
/* Make *ptr refer to `fence`.
 *
 * Fence handles are treated as pb_buffers here, so the reference update is
 * handed to pb_reference(). */
static void r300_fence_reference(struct pipe_screen *screen,
                                 struct pipe_fence_handle **ptr,
                                 struct pipe_fence_handle *fence)
{
    struct pb_buffer **dst = (struct pb_buffer**)ptr;
    struct pb_buffer *src = (struct pb_buffer*)fence;

    pb_reference(dst, src);
}
461
462 static boolean r300_fence_signalled(struct pipe_screen *screen,
463 struct pipe_fence_handle *fence)
464 {
465 struct radeon_winsys *rws = r300_screen(screen)->rws;
466 struct pb_buffer *rfence = (struct pb_buffer*)fence;
467
468 return !rws->buffer_is_busy(rfence, RADEON_USAGE_READWRITE);
469 }
470
471 static boolean r300_fence_finish(struct pipe_screen *screen,
472 struct pipe_fence_handle *fence,
473 uint64_t timeout)
474 {
475 struct radeon_winsys *rws = r300_screen(screen)->rws;
476 struct pb_buffer *rfence = (struct pb_buffer*)fence;
477
478 if (timeout != PIPE_TIMEOUT_INFINITE) {
479 int64_t start_time = os_time_get();
480
481 /* Convert to microseconds. */
482 timeout /= 1000;
483
484 /* Wait in a loop. */
485 while (rws->buffer_is_busy(rfence, RADEON_USAGE_READWRITE)) {
486 if (os_time_get() - start_time >= timeout) {
487 return FALSE;
488 }
489 os_time_sleep(10);
490 }
491 return TRUE;
492 }
493
494 rws->buffer_wait(rfence, RADEON_USAGE_READWRITE);
495 return TRUE;
496 }
497
498 struct pipe_screen* r300_screen_create(struct radeon_winsys *rws)
499 {
500 struct r300_screen *r300screen = CALLOC_STRUCT(r300_screen);
501
502 if (!r300screen) {
503 FREE(r300screen);
504 return NULL;
505 }
506
507 rws->query_info(rws, &r300screen->info);
508
509 r300_init_debug(r300screen);
510 r300_parse_chipset(r300screen->info.pci_id, &r300screen->caps);
511
512 if (SCREEN_DBG_ON(r300screen, DBG_NO_ZMASK))
513 r300screen->caps.zmask_ram = 0;
514 if (SCREEN_DBG_ON(r300screen, DBG_NO_HIZ))
515 r300screen->caps.hiz_ram = 0;
516
517 if (r300screen->info.drm_minor < 8)
518 r300screen->caps.has_us_format = FALSE;
519
520 pipe_mutex_init(r300screen->num_contexts_mutex);
521
522 util_slab_create(&r300screen->pool_buffers,
523 sizeof(struct r300_resource), 64,
524 UTIL_SLAB_SINGLETHREADED);
525
526 r300screen->rws = rws;
527 r300screen->screen.winsys = (struct pipe_winsys*)rws;
528 r300screen->screen.destroy = r300_destroy_screen;
529 r300screen->screen.get_name = r300_get_name;
530 r300screen->screen.get_vendor = r300_get_vendor;
531 r300screen->screen.get_param = r300_get_param;
532 r300screen->screen.get_shader_param = r300_get_shader_param;
533 r300screen->screen.get_paramf = r300_get_paramf;
534 r300screen->screen.get_video_param = r300_get_video_param;
535 r300screen->screen.is_format_supported = r300_is_format_supported;
536 r300screen->screen.is_video_format_supported = vl_video_buffer_is_format_supported;
537 r300screen->screen.context_create = r300_create_context;
538 r300screen->screen.fence_reference = r300_fence_reference;
539 r300screen->screen.fence_signalled = r300_fence_signalled;
540 r300screen->screen.fence_finish = r300_fence_finish;
541
542 r300_init_screen_resource_functions(r300screen);
543
544 util_format_s3tc_init();
545
546 return &r300screen->screen;
547 }