r300g: fix texturing with sizes > 2048 on r500
[mesa.git] / src / gallium / drivers / r300 / r300_screen.c
1 /*
2 * Copyright 2008 Corbin Simpson <MostAwesomeDude@gmail.com>
3 * Copyright 2010 Marek Olšák <maraeo@gmail.com>
4 *
5 * Permission is hereby granted, free of charge, to any person obtaining a
6 * copy of this software and associated documentation files (the "Software"),
7 * to deal in the Software without restriction, including without limitation
8 * on the rights to use, copy, modify, merge, publish, distribute, sub
9 * license, and/or sell copies of the Software, and to permit persons to whom
10 * the Software is furnished to do so, subject to the following conditions:
11 *
12 * The above copyright notice and this permission notice (including the next
13 * paragraph) shall be included in all copies or substantial portions of the
14 * Software.
15 *
16 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
17 * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
18 * FITNESS FOR A PARTICULAR PURPOSE AND NON-INFRINGEMENT. IN NO EVENT SHALL
19 * THE AUTHOR(S) AND/OR THEIR SUPPLIERS BE LIABLE FOR ANY CLAIM,
20 * DAMAGES OR OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR
21 * OTHERWISE, ARISING FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE
22 * USE OR OTHER DEALINGS IN THE SOFTWARE. */
23
24 #include "util/u_format.h"
25 #include "util/u_format_s3tc.h"
26 #include "util/u_memory.h"
27 #include "os/os_time.h"
28
29 #include "r300_context.h"
30 #include "r300_texture.h"
31 #include "r300_screen_buffer.h"
32 #include "r300_state_inlines.h"
33 #include "r300_winsys.h"
34 #include "r300_public.h"
35
36 #include "draw/draw_context.h"
37
/* Return the identifier behind whom the brave coders responsible for this
 * amalgamation of code, sweat, and duct tape, routinely obscure their names.
 *
 * ...I should have just put "Corbin Simpson", but I'm not that cool.
 *
 * (Or egotistical. Yet.)
 *
 * In plainer terms: this is installed as the screen's get_vendor hook. It
 * hands back a constant string and never looks at the screen it is given. */
static const char* r300_get_vendor(struct pipe_screen* pscreen)
{
    static const char vendor_name[] = "X.Org R300 Project";

    (void)pscreen;
    return vendor_name;
}
48
/* Printable names of the chip families, one string per family.
 *
 * r300_get_name() indexes this table directly with caps.family, so the
 * position of each entry matters: do not reorder or remove entries.
 * NOTE(review): the order presumably mirrors the chip family enumeration
 * declared elsewhere in the driver -- confirm before appending new chips. */
static const char* chip_families[] = {
    "ATI R300",  "ATI R350",  "ATI R360",
    "ATI RV350", "ATI RV370", "ATI RV380",
    "ATI R420",  "ATI R423",  "ATI R430",
    "ATI R480",  "ATI R481",  "ATI RV410",
    "ATI RS400", "ATI RC410", "ATI RS480", "ATI RS482",
    "ATI RS600", "ATI RS690", "ATI RS740",
    "ATI RV515", "ATI R520",  "ATI RV530",
    "ATI R580",  "ATI RV560", "ATI RV570"
};
76
77 static const char* r300_get_name(struct pipe_screen* pscreen)
78 {
79 struct r300_screen* r300screen = r300_screen(pscreen);
80
81 return chip_families[r300screen->caps.family];
82 }
83
84 static int r300_get_param(struct pipe_screen* pscreen, enum pipe_cap param)
85 {
86 struct r300_screen* r300screen = r300_screen(pscreen);
87 boolean is_r500 = r300screen->caps.is_r500;
88
89 switch (param) {
90 /* Supported features (boolean caps). */
91 case PIPE_CAP_NPOT_TEXTURES:
92 case PIPE_CAP_TWO_SIDED_STENCIL:
93 case PIPE_CAP_GLSL:
94 /* I'll be frank. This is a lie.
95 *
96 * We don't truly support GLSL on any of this driver's chipsets.
97 * To be fair, no chipset supports the full GLSL specification
98 * to the best of our knowledge, but some of the less esoteric
99 * features are still missing here.
100 *
101 * Rather than cripple ourselves intentionally, I'm going to set
102 * this flag, and as Gallium's interface continues to change, I
103 * hope that this single monolithic GLSL enable can slowly get
104 * split down into many different pieces and the state tracker
105 * will handle fallbacks transparently, like it should.
106 *
107 * ~ C.
108 */
109 case PIPE_CAP_ANISOTROPIC_FILTER:
110 case PIPE_CAP_POINT_SPRITE:
111 case PIPE_CAP_OCCLUSION_QUERY:
112 case PIPE_CAP_TEXTURE_SHADOW_MAP:
113 case PIPE_CAP_TEXTURE_MIRROR_CLAMP:
114 case PIPE_CAP_TEXTURE_MIRROR_REPEAT:
115 case PIPE_CAP_BLEND_EQUATION_SEPARATE:
116 case PIPE_CAP_VERTEX_ELEMENT_INSTANCE_DIVISOR:
117 case PIPE_CAP_FRAGMENT_COLOR_CLAMP_CONTROL:
118 return 1;
119 case PIPE_CAP_TEXTURE_SWIZZLE:
120 return util_format_s3tc_enabled ? r300screen->caps.dxtc_swizzle : 1;
121 case PIPE_CAP_MIXED_COLORBUFFER_FORMATS:
122 return is_r500 ? 1 : 0;
123
124 /* Unsupported features (boolean caps). */
125 case PIPE_CAP_TIMER_QUERY:
126 case PIPE_CAP_DUAL_SOURCE_BLEND:
127 case PIPE_CAP_INDEP_BLEND_ENABLE:
128 case PIPE_CAP_INDEP_BLEND_FUNC:
129 case PIPE_CAP_DEPTH_CLAMP:
130 case PIPE_CAP_DEPTHSTENCIL_CLEAR_SEPARATE:
131 case PIPE_CAP_SHADER_STENCIL_EXPORT:
132 case PIPE_CAP_ARRAY_TEXTURES:
133 return 0;
134
135 /* SWTCL-only features. */
136 case PIPE_CAP_STREAM_OUTPUT:
137 case PIPE_CAP_PRIMITIVE_RESTART:
138 case PIPE_CAP_TGSI_INSTANCEID:
139 return !r300screen->caps.has_tcl;
140
141 /* Texturing. */
142 case PIPE_CAP_MAX_TEXTURE_IMAGE_UNITS:
143 case PIPE_CAP_MAX_COMBINED_SAMPLERS:
144 return r300screen->caps.num_tex_units;
145 case PIPE_CAP_MAX_VERTEX_TEXTURE_UNITS:
146 return 0;
147 case PIPE_CAP_MAX_TEXTURE_2D_LEVELS:
148 case PIPE_CAP_MAX_TEXTURE_3D_LEVELS:
149 case PIPE_CAP_MAX_TEXTURE_CUBE_LEVELS:
150 /* 13 == 4096, 12 == 2048 */
151 return is_r500 ? 13 : 12;
152
153 /* Render targets. */
154 case PIPE_CAP_MAX_RENDER_TARGETS:
155 return 4;
156
157 /* General shader limits and features. */
158 case PIPE_CAP_SM3:
159 return is_r500 ? 1 : 0;
160 /* Fragment coordinate conventions. */
161 case PIPE_CAP_TGSI_FS_COORD_ORIGIN_UPPER_LEFT:
162 case PIPE_CAP_TGSI_FS_COORD_PIXEL_CENTER_HALF_INTEGER:
163 return 1;
164 case PIPE_CAP_TGSI_FS_COORD_ORIGIN_LOWER_LEFT:
165 case PIPE_CAP_TGSI_FS_COORD_PIXEL_CENTER_INTEGER:
166 return 0;
167 default:
168 debug_printf("r300: Warning: Unknown CAP %d in get_param.\n",
169 param);
170 return 0;
171 }
172 }
173
174 static int r300_get_shader_param(struct pipe_screen *pscreen, unsigned shader, enum pipe_shader_cap param)
175 {
176 struct r300_screen* r300screen = r300_screen(pscreen);
177 boolean is_r400 = r300screen->caps.is_r400;
178 boolean is_r500 = r300screen->caps.is_r500;
179
180 switch (shader)
181 {
182 case PIPE_SHADER_FRAGMENT:
183 switch (param)
184 {
185 case PIPE_SHADER_CAP_MAX_INSTRUCTIONS:
186 return is_r500 || is_r400 ? 512 : 96;
187 case PIPE_SHADER_CAP_MAX_ALU_INSTRUCTIONS:
188 return is_r500 || is_r400 ? 512 : 64;
189 case PIPE_SHADER_CAP_MAX_TEX_INSTRUCTIONS:
190 return is_r500 || is_r400 ? 512 : 32;
191 case PIPE_SHADER_CAP_MAX_TEX_INDIRECTIONS:
192 return is_r500 ? 511 : 4;
193 case PIPE_SHADER_CAP_MAX_CONTROL_FLOW_DEPTH:
194 return is_r500 ? 64 : 0; /* Actually unlimited on r500. */
195 /* Fragment shader limits. */
196 case PIPE_SHADER_CAP_MAX_INPUTS:
197 /* 2 colors + 8 texcoords are always supported
198 * (minus fog and wpos).
199 *
200 * R500 has the ability to turn 3rd and 4th color into
201 * additional texcoords but there is no two-sided color
202 * selection then. However the facing bit can be used instead. */
203 return 10;
204 case PIPE_SHADER_CAP_MAX_CONSTS:
205 return is_r500 ? 256 : 32;
206 case PIPE_SHADER_CAP_MAX_CONST_BUFFERS:
207 return 1;
208 case PIPE_SHADER_CAP_MAX_TEMPS:
209 return is_r500 ? 128 : is_r400 ? 64 : 32;
210 case PIPE_SHADER_CAP_MAX_ADDRS:
211 return 0;
212 case PIPE_SHADER_CAP_MAX_PREDS:
213 return is_r500 ? 1 : 0;
214 case PIPE_SHADER_CAP_TGSI_CONT_SUPPORTED:
215 return 0;
216 case PIPE_SHADER_CAP_INDIRECT_INPUT_ADDR:
217 case PIPE_SHADER_CAP_INDIRECT_OUTPUT_ADDR:
218 case PIPE_SHADER_CAP_INDIRECT_TEMP_ADDR:
219 case PIPE_SHADER_CAP_INDIRECT_CONST_ADDR:
220 return 0;
221 case PIPE_SHADER_CAP_SUBROUTINES:
222 return 0;
223 }
224 break;
225 case PIPE_SHADER_VERTEX:
226 if (!r300screen->caps.has_tcl) {
227 return draw_get_shader_param(shader, param);
228 }
229
230 switch (param)
231 {
232 case PIPE_SHADER_CAP_MAX_INSTRUCTIONS:
233 case PIPE_SHADER_CAP_MAX_ALU_INSTRUCTIONS:
234 return is_r500 ? 1024 : 256;
235 case PIPE_SHADER_CAP_MAX_TEX_INSTRUCTIONS:
236 case PIPE_SHADER_CAP_MAX_TEX_INDIRECTIONS:
237 return 0;
238 case PIPE_SHADER_CAP_MAX_CONTROL_FLOW_DEPTH:
239 return is_r500 ? 4 : 0; /* For loops; not sure about conditionals. */
240 case PIPE_SHADER_CAP_MAX_INPUTS:
241 return 16;
242 case PIPE_SHADER_CAP_MAX_CONSTS:
243 return 256;
244 case PIPE_SHADER_CAP_MAX_CONST_BUFFERS:
245 return 1;
246 case PIPE_SHADER_CAP_MAX_TEMPS:
247 return 32;
248 case PIPE_SHADER_CAP_MAX_ADDRS:
249 return 1; /* XXX guessed */
250 case PIPE_SHADER_CAP_MAX_PREDS:
251 return is_r500 ? 4 : 0; /* XXX guessed. */
252 case PIPE_SHADER_CAP_TGSI_CONT_SUPPORTED:
253 return 0;
254 case PIPE_SHADER_CAP_INDIRECT_INPUT_ADDR:
255 case PIPE_SHADER_CAP_INDIRECT_OUTPUT_ADDR:
256 case PIPE_SHADER_CAP_INDIRECT_TEMP_ADDR:
257 return 0;
258 case PIPE_SHADER_CAP_INDIRECT_CONST_ADDR:
259 return 1;
260 case PIPE_SHADER_CAP_SUBROUTINES:
261 return 0;
262 default:
263 break;
264 }
265 break;
266 default:
267 break;
268 }
269 return 0;
270 }
271
272 static float r300_get_paramf(struct pipe_screen* pscreen, enum pipe_cap param)
273 {
274 struct r300_screen* r300screen = r300_screen(pscreen);
275
276 switch (param) {
277 case PIPE_CAP_MAX_LINE_WIDTH:
278 case PIPE_CAP_MAX_LINE_WIDTH_AA:
279 case PIPE_CAP_MAX_POINT_WIDTH:
280 case PIPE_CAP_MAX_POINT_WIDTH_AA:
281 /* The maximum dimensions of the colorbuffer are our practical
282 * rendering limits. 2048 pixels should be enough for anybody. */
283 if (r300screen->caps.is_r500) {
284 return 4096.0f;
285 } else if (r300screen->caps.is_r400) {
286 return 4021.0f;
287 } else {
288 return 2560.0f;
289 }
290 case PIPE_CAP_MAX_TEXTURE_ANISOTROPY:
291 return 16.0f;
292 case PIPE_CAP_MAX_TEXTURE_LOD_BIAS:
293 return 16.0f;
294 case PIPE_CAP_GUARD_BAND_LEFT:
295 case PIPE_CAP_GUARD_BAND_TOP:
296 case PIPE_CAP_GUARD_BAND_RIGHT:
297 case PIPE_CAP_GUARD_BAND_BOTTOM:
298 /* XXX I don't know what these should be but the least we can do is
299 * silence the potential error message */
300 return 0.0f;
301 default:
302 debug_printf("r300: Warning: Unknown CAP %d in get_paramf.\n",
303 param);
304 return 0.0f;
305 }
306 }
307
308 static boolean r300_is_format_supported(struct pipe_screen* screen,
309 enum pipe_format format,
310 enum pipe_texture_target target,
311 unsigned sample_count,
312 unsigned usage)
313 {
314 struct r300_winsys_screen *rws = r300_screen(screen)->rws;
315 uint32_t retval = 0;
316 boolean drm_2_8_0 = rws->get_value(rws, R300_VID_DRM_2_8_0);
317 boolean is_r500 = r300_screen(screen)->caps.is_r500;
318 boolean is_r400 = r300_screen(screen)->caps.is_r400;
319 boolean is_color2101010 = format == PIPE_FORMAT_R10G10B10A2_UNORM ||
320 format == PIPE_FORMAT_R10G10B10X2_SNORM ||
321 format == PIPE_FORMAT_B10G10R10A2_UNORM ||
322 format == PIPE_FORMAT_R10SG10SB10SA2U_NORM;
323 boolean is_ati1n = format == PIPE_FORMAT_RGTC1_UNORM ||
324 format == PIPE_FORMAT_RGTC1_SNORM ||
325 format == PIPE_FORMAT_LATC1_UNORM ||
326 format == PIPE_FORMAT_LATC1_SNORM;
327 boolean is_ati2n = format == PIPE_FORMAT_RGTC2_UNORM ||
328 format == PIPE_FORMAT_RGTC2_SNORM ||
329 format == PIPE_FORMAT_LATC2_UNORM ||
330 format == PIPE_FORMAT_LATC2_SNORM;
331 boolean is_half_float = format == PIPE_FORMAT_R16_FLOAT ||
332 format == PIPE_FORMAT_R16G16_FLOAT ||
333 format == PIPE_FORMAT_R16G16B16_FLOAT ||
334 format == PIPE_FORMAT_R16G16B16A16_FLOAT;
335
336 /* Check multisampling support. */
337 switch (sample_count) {
338 case 0:
339 case 1:
340 break;
341 case 2:
342 case 3:
343 case 4:
344 case 6:
345 return FALSE;
346 #if 0
347 if (usage != PIPE_BIND_RENDER_TARGET ||
348 !util_format_is_rgba8_variant(
349 util_format_description(format))) {
350 return FALSE;
351 }
352 #endif
353 break;
354 default:
355 return FALSE;
356 }
357
358 /* Check sampler format support. */
359 if ((usage & PIPE_BIND_SAMPLER_VIEW) &&
360 /* ATI1N is r5xx-only. */
361 (is_r500 || !is_ati1n) &&
362 /* ATI2N is supported on r4xx-r5xx. */
363 (is_r400 || is_r500 || !is_ati2n) &&
364 r300_is_sampler_format_supported(format)) {
365 retval |= PIPE_BIND_SAMPLER_VIEW;
366 }
367
368 /* Check colorbuffer format support. */
369 if ((usage & (PIPE_BIND_RENDER_TARGET |
370 PIPE_BIND_DISPLAY_TARGET |
371 PIPE_BIND_SCANOUT |
372 PIPE_BIND_SHARED)) &&
373 /* 2101010 cannot be rendered to on non-r5xx. */
374 (!is_color2101010 || (is_r500 && drm_2_8_0)) &&
375 r300_is_colorbuffer_format_supported(format)) {
376 retval |= usage &
377 (PIPE_BIND_RENDER_TARGET |
378 PIPE_BIND_DISPLAY_TARGET |
379 PIPE_BIND_SCANOUT |
380 PIPE_BIND_SHARED);
381 }
382
383 /* Check depth-stencil format support. */
384 if (usage & PIPE_BIND_DEPTH_STENCIL &&
385 r300_is_zs_format_supported(format)) {
386 retval |= PIPE_BIND_DEPTH_STENCIL;
387 }
388
389 /* Check vertex buffer format support. */
390 if (usage & PIPE_BIND_VERTEX_BUFFER &&
391 /* Half float is supported on >= RV350. */
392 (is_r400 || is_r500 || !is_half_float) &&
393 r300_translate_vertex_data_type(format) != R300_INVALID_FORMAT) {
394 retval |= PIPE_BIND_VERTEX_BUFFER;
395 }
396
397 /* Transfers are always supported. */
398 if (usage & PIPE_BIND_TRANSFER_READ)
399 retval |= PIPE_BIND_TRANSFER_READ;
400 if (usage & PIPE_BIND_TRANSFER_WRITE)
401 retval |= PIPE_BIND_TRANSFER_WRITE;
402
403 return retval == usage;
404 }
405
406 static void r300_destroy_screen(struct pipe_screen* pscreen)
407 {
408 struct r300_screen* r300screen = r300_screen(pscreen);
409 struct r300_winsys_screen *rws = r300_winsys_screen(pscreen);
410
411 util_slab_destroy(&r300screen->pool_buffers);
412 pipe_mutex_destroy(r300screen->num_contexts_mutex);
413
414 if (rws)
415 rws->destroy(rws);
416
417 FREE(r300screen);
418 }
419
/* fence_reference hook.
 *
 * Fence handles are winsys buffer objects in disguise, so both arguments
 * are cast to r300_winsys_bo pointers and the work is delegated to
 * r300_winsys_bo_reference(). `screen` is unused. */
static void r300_fence_reference(struct pipe_screen *screen,
                                 struct pipe_fence_handle **ptr,
                                 struct pipe_fence_handle *fence)
{
    struct r300_winsys_bo **dst = (struct r300_winsys_bo**)ptr;
    struct r300_winsys_bo *src = (struct r300_winsys_bo*)fence;

    r300_winsys_bo_reference(dst, src);
}
427
428 static boolean r300_fence_signalled(struct pipe_screen *screen,
429 struct pipe_fence_handle *fence)
430 {
431 struct r300_winsys_screen *rws = r300_screen(screen)->rws;
432 struct r300_winsys_bo *rfence = (struct r300_winsys_bo*)fence;
433
434 return !rws->buffer_is_busy(rfence);
435 }
436
437 static boolean r300_fence_finish(struct pipe_screen *screen,
438 struct pipe_fence_handle *fence,
439 uint64_t timeout)
440 {
441 struct r300_winsys_screen *rws = r300_screen(screen)->rws;
442 struct r300_winsys_bo *rfence = (struct r300_winsys_bo*)fence;
443
444 if (timeout != PIPE_TIMEOUT_INFINITE) {
445 int64_t start_time = os_time_get();
446
447 /* Convert to microseconds. */
448 timeout /= 1000;
449
450 /* Wait in a loop. */
451 while (rws->buffer_is_busy(rfence)) {
452 if (os_time_get() - start_time >= timeout) {
453 return FALSE;
454 }
455 os_time_sleep(10);
456 }
457 return TRUE;
458 }
459
460 rws->buffer_wait(rfence);
461 return TRUE;
462 }
463
464 struct pipe_screen* r300_screen_create(struct r300_winsys_screen *rws)
465 {
466 struct r300_screen *r300screen = CALLOC_STRUCT(r300_screen);
467
468 if (!r300screen) {
469 FREE(r300screen);
470 return NULL;
471 }
472
473 r300screen->caps.pci_id = rws->get_value(rws, R300_VID_PCI_ID);
474 r300screen->caps.num_frag_pipes = rws->get_value(rws, R300_VID_GB_PIPES);
475 r300screen->caps.num_z_pipes = rws->get_value(rws, R300_VID_Z_PIPES);
476
477 r300_init_debug(r300screen);
478 r300_parse_chipset(&r300screen->caps);
479
480 if (SCREEN_DBG_ON(r300screen, DBG_NO_ZMASK))
481 r300screen->caps.zmask_ram = 0;
482 if (SCREEN_DBG_ON(r300screen, DBG_NO_HIZ))
483 r300screen->caps.hiz_ram = 0;
484
485 if (!rws->get_value(rws, R300_VID_DRM_2_8_0))
486 r300screen->caps.has_us_format = FALSE;
487
488 pipe_mutex_init(r300screen->num_contexts_mutex);
489
490 util_slab_create(&r300screen->pool_buffers,
491 sizeof(struct r300_resource), 64,
492 UTIL_SLAB_SINGLETHREADED);
493
494 r300screen->rws = rws;
495 r300screen->screen.winsys = (struct pipe_winsys*)rws;
496 r300screen->screen.destroy = r300_destroy_screen;
497 r300screen->screen.get_name = r300_get_name;
498 r300screen->screen.get_vendor = r300_get_vendor;
499 r300screen->screen.get_param = r300_get_param;
500 r300screen->screen.get_shader_param = r300_get_shader_param;
501 r300screen->screen.get_paramf = r300_get_paramf;
502 r300screen->screen.is_format_supported = r300_is_format_supported;
503 r300screen->screen.context_create = r300_create_context;
504
505 r300screen->screen.fence_reference = r300_fence_reference;
506 r300screen->screen.fence_signalled = r300_fence_signalled;
507 r300screen->screen.fence_finish = r300_fence_finish;
508
509 r300_init_screen_resource_functions(r300screen);
510
511 util_format_s3tc_init();
512
513 return &r300screen->screen;
514 }