r300g: add LATC support
[mesa.git] / src / gallium / drivers / r300 / r300_screen.c
1 /*
2 * Copyright 2008 Corbin Simpson <MostAwesomeDude@gmail.com>
3 * Copyright 2010 Marek Olšák <maraeo@gmail.com>
4 *
5 * Permission is hereby granted, free of charge, to any person obtaining a
6 * copy of this software and associated documentation files (the "Software"),
7 * to deal in the Software without restriction, including without limitation
8 * on the rights to use, copy, modify, merge, publish, distribute, sub
9 * license, and/or sell copies of the Software, and to permit persons to whom
10 * the Software is furnished to do so, subject to the following conditions:
11 *
12 * The above copyright notice and this permission notice (including the next
13 * paragraph) shall be included in all copies or substantial portions of the
14 * Software.
15 *
16 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
17 * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
18 * FITNESS FOR A PARTICULAR PURPOSE AND NON-INFRINGEMENT. IN NO EVENT SHALL
19 * THE AUTHOR(S) AND/OR THEIR SUPPLIERS BE LIABLE FOR ANY CLAIM,
20 * DAMAGES OR OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR
21 * OTHERWISE, ARISING FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE
22 * USE OR OTHER DEALINGS IN THE SOFTWARE. */
23
24 #include "util/u_format.h"
25 #include "util/u_format_s3tc.h"
26 #include "util/u_memory.h"
27
28 #include "r300_context.h"
29 #include "r300_texture.h"
30 #include "r300_screen_buffer.h"
31 #include "r300_state_inlines.h"
32 #include "r300_winsys.h"
33 #include "r300_public.h"
34
35 #include "draw/draw_context.h"
36
37 /* Return the identifier behind whom the brave coders responsible for this
38 * amalgamation of code, sweat, and duct tape, routinely obscure their names.
39 *
40 * ...I should have just put "Corbin Simpson", but I'm not that cool.
41 *
42 * (Or egotistical. Yet.) */
/* pipe_screen::get_vendor hook.
 *
 * Always returns the same constant vendor string; the screen argument is
 * not consulted. */
static const char* r300_get_vendor(struct pipe_screen* pscreen)
{
    static const char vendor[] = "X.Org R300 Project";

    (void)pscreen;
    return vendor;
}
47
/* Human-readable chip names.
 *
 * r300_get_name() indexes this table directly with caps.family, so the
 * order of the entries must not be changed. */
static const char* chip_families[] = {
    "ATI R300",  "ATI R350",  "ATI R360",
    "ATI RV350", "ATI RV370", "ATI RV380",
    "ATI R420",  "ATI R423",  "ATI R430",
    "ATI R480",  "ATI R481",  "ATI RV410",
    "ATI RS400", "ATI RC410", "ATI RS480", "ATI RS482",
    "ATI RS600", "ATI RS690", "ATI RS740",
    "ATI RV515", "ATI R520",  "ATI RV530",
    "ATI R580",  "ATI RV560", "ATI RV570"
};
75
76 static const char* r300_get_name(struct pipe_screen* pscreen)
77 {
78 struct r300_screen* r300screen = r300_screen(pscreen);
79
80 return chip_families[r300screen->caps.family];
81 }
82
83 static int r300_get_param(struct pipe_screen* pscreen, enum pipe_cap param)
84 {
85 struct r300_screen* r300screen = r300_screen(pscreen);
86 boolean is_r500 = r300screen->caps.is_r500;
87
88 switch (param) {
89 /* Supported features (boolean caps). */
90 case PIPE_CAP_NPOT_TEXTURES:
91 case PIPE_CAP_TWO_SIDED_STENCIL:
92 case PIPE_CAP_GLSL:
93 /* I'll be frank. This is a lie.
94 *
95 * We don't truly support GLSL on any of this driver's chipsets.
96 * To be fair, no chipset supports the full GLSL specification
97 * to the best of our knowledge, but some of the less esoteric
98 * features are still missing here.
99 *
100 * Rather than cripple ourselves intentionally, I'm going to set
101 * this flag, and as Gallium's interface continues to change, I
102 * hope that this single monolithic GLSL enable can slowly get
103 * split down into many different pieces and the state tracker
104 * will handle fallbacks transparently, like it should.
105 *
106 * ~ C.
107 */
108 case PIPE_CAP_ANISOTROPIC_FILTER:
109 case PIPE_CAP_POINT_SPRITE:
110 case PIPE_CAP_OCCLUSION_QUERY:
111 case PIPE_CAP_TEXTURE_SHADOW_MAP:
112 case PIPE_CAP_TEXTURE_MIRROR_CLAMP:
113 case PIPE_CAP_TEXTURE_MIRROR_REPEAT:
114 case PIPE_CAP_BLEND_EQUATION_SEPARATE:
115 case PIPE_CAP_VERTEX_ELEMENT_INSTANCE_DIVISOR:
116 return 1;
117 case PIPE_CAP_TEXTURE_SWIZZLE:
118 return util_format_s3tc_enabled ? r300screen->caps.dxtc_swizzle : 1;
119
120 /* Unsupported features (boolean caps). */
121 case PIPE_CAP_TIMER_QUERY:
122 case PIPE_CAP_DUAL_SOURCE_BLEND:
123 case PIPE_CAP_INDEP_BLEND_ENABLE:
124 case PIPE_CAP_INDEP_BLEND_FUNC:
125 case PIPE_CAP_DEPTH_CLAMP:
126 case PIPE_CAP_DEPTHSTENCIL_CLEAR_SEPARATE:
127 case PIPE_CAP_SHADER_STENCIL_EXPORT:
128 case PIPE_CAP_ARRAY_TEXTURES:
129 return 0;
130
131 /* SWTCL-only features. */
132 case PIPE_CAP_STREAM_OUTPUT:
133 case PIPE_CAP_PRIMITIVE_RESTART:
134 case PIPE_CAP_TGSI_INSTANCEID:
135 return !r300screen->caps.has_tcl;
136
137 /* Texturing. */
138 case PIPE_CAP_MAX_TEXTURE_IMAGE_UNITS:
139 case PIPE_CAP_MAX_COMBINED_SAMPLERS:
140 return r300screen->caps.num_tex_units;
141 case PIPE_CAP_MAX_VERTEX_TEXTURE_UNITS:
142 return 0;
143 case PIPE_CAP_MAX_TEXTURE_2D_LEVELS:
144 case PIPE_CAP_MAX_TEXTURE_3D_LEVELS:
145 case PIPE_CAP_MAX_TEXTURE_CUBE_LEVELS:
146 /* 13 == 4096, 12 == 2048 */
147 return is_r500 ? 13 : 12;
148
149 /* Render targets. */
150 case PIPE_CAP_MAX_RENDER_TARGETS:
151 return 4;
152
153 /* General shader limits and features. */
154 case PIPE_CAP_SM3:
155 return is_r500 ? 1 : 0;
156 /* Fragment coordinate conventions. */
157 case PIPE_CAP_TGSI_FS_COORD_ORIGIN_UPPER_LEFT:
158 case PIPE_CAP_TGSI_FS_COORD_PIXEL_CENTER_HALF_INTEGER:
159 return 1;
160 case PIPE_CAP_TGSI_FS_COORD_ORIGIN_LOWER_LEFT:
161 case PIPE_CAP_TGSI_FS_COORD_PIXEL_CENTER_INTEGER:
162 return 0;
163 default:
164 debug_printf("r300: Warning: Unknown CAP %d in get_param.\n",
165 param);
166 return 0;
167 }
168 }
169
170 static int r300_get_shader_param(struct pipe_screen *pscreen, unsigned shader, enum pipe_shader_cap param)
171 {
172 struct r300_screen* r300screen = r300_screen(pscreen);
173 boolean is_r400 = r300screen->caps.is_r400;
174 boolean is_r500 = r300screen->caps.is_r500;
175
176 switch (shader)
177 {
178 case PIPE_SHADER_FRAGMENT:
179 switch (param)
180 {
181 case PIPE_SHADER_CAP_MAX_INSTRUCTIONS:
182 return is_r500 || is_r400 ? 512 : 96;
183 case PIPE_SHADER_CAP_MAX_ALU_INSTRUCTIONS:
184 return is_r500 || is_r400 ? 512 : 64;
185 case PIPE_SHADER_CAP_MAX_TEX_INSTRUCTIONS:
186 return is_r500 || is_r400 ? 512 : 32;
187 case PIPE_SHADER_CAP_MAX_TEX_INDIRECTIONS:
188 return is_r500 ? 511 : 4;
189 case PIPE_SHADER_CAP_MAX_CONTROL_FLOW_DEPTH:
190 return is_r500 ? 64 : 0; /* Actually unlimited on r500. */
191 /* Fragment shader limits. */
192 case PIPE_SHADER_CAP_MAX_INPUTS:
193 /* 2 colors + 8 texcoords are always supported
194 * (minus fog and wpos).
195 *
196 * R500 has the ability to turn 3rd and 4th color into
197 * additional texcoords but there is no two-sided color
198 * selection then. However the facing bit can be used instead. */
199 return 10;
200 case PIPE_SHADER_CAP_MAX_CONSTS:
201 return is_r500 ? 256 : 32;
202 case PIPE_SHADER_CAP_MAX_CONST_BUFFERS:
203 return 1;
204 case PIPE_SHADER_CAP_MAX_TEMPS:
205 return is_r500 ? 128 : is_r400 ? 64 : 32;
206 case PIPE_SHADER_CAP_MAX_ADDRS:
207 return 0;
208 case PIPE_SHADER_CAP_MAX_PREDS:
209 return is_r500 ? 1 : 0;
210 case PIPE_SHADER_CAP_TGSI_CONT_SUPPORTED:
211 return 1;
212 case PIPE_SHADER_CAP_INDIRECT_INPUT_ADDR:
213 case PIPE_SHADER_CAP_INDIRECT_OUTPUT_ADDR:
214 case PIPE_SHADER_CAP_INDIRECT_TEMP_ADDR:
215 case PIPE_SHADER_CAP_INDIRECT_CONST_ADDR:
216 return 0;
217 case PIPE_SHADER_CAP_SUBROUTINES:
218 return 0;
219 }
220 break;
221 case PIPE_SHADER_VERTEX:
222 if (!r300screen->caps.has_tcl) {
223 return draw_get_shader_param(shader, param);
224 }
225
226 switch (param)
227 {
228 case PIPE_SHADER_CAP_MAX_INSTRUCTIONS:
229 case PIPE_SHADER_CAP_MAX_ALU_INSTRUCTIONS:
230 return is_r500 ? 1024 : 256;
231 case PIPE_SHADER_CAP_MAX_TEX_INSTRUCTIONS:
232 case PIPE_SHADER_CAP_MAX_TEX_INDIRECTIONS:
233 return 0;
234 case PIPE_SHADER_CAP_MAX_CONTROL_FLOW_DEPTH:
235 return is_r500 ? 4 : 0; /* For loops; not sure about conditionals. */
236 case PIPE_SHADER_CAP_MAX_INPUTS:
237 return 16;
238 case PIPE_SHADER_CAP_MAX_CONSTS:
239 return 256;
240 case PIPE_SHADER_CAP_MAX_CONST_BUFFERS:
241 return 1;
242 case PIPE_SHADER_CAP_MAX_TEMPS:
243 return 32;
244 case PIPE_SHADER_CAP_MAX_ADDRS:
245 return 1; /* XXX guessed */
246 case PIPE_SHADER_CAP_MAX_PREDS:
247 return is_r500 ? 4 : 0; /* XXX guessed. */
248 case PIPE_SHADER_CAP_TGSI_CONT_SUPPORTED:
249 return 1;
250 case PIPE_SHADER_CAP_INDIRECT_INPUT_ADDR:
251 case PIPE_SHADER_CAP_INDIRECT_OUTPUT_ADDR:
252 case PIPE_SHADER_CAP_INDIRECT_TEMP_ADDR:
253 return 0;
254 case PIPE_SHADER_CAP_INDIRECT_CONST_ADDR:
255 return 1;
256 case PIPE_SHADER_CAP_SUBROUTINES:
257 return 0;
258 default:
259 break;
260 }
261 break;
262 default:
263 break;
264 }
265 return 0;
266 }
267
268 static float r300_get_paramf(struct pipe_screen* pscreen, enum pipe_cap param)
269 {
270 struct r300_screen* r300screen = r300_screen(pscreen);
271
272 switch (param) {
273 case PIPE_CAP_MAX_LINE_WIDTH:
274 case PIPE_CAP_MAX_LINE_WIDTH_AA:
275 case PIPE_CAP_MAX_POINT_WIDTH:
276 case PIPE_CAP_MAX_POINT_WIDTH_AA:
277 /* The maximum dimensions of the colorbuffer are our practical
278 * rendering limits. 2048 pixels should be enough for anybody. */
279 if (r300screen->caps.is_r500) {
280 return 4096.0f;
281 } else if (r300screen->caps.is_r400) {
282 return 4021.0f;
283 } else {
284 return 2560.0f;
285 }
286 case PIPE_CAP_MAX_TEXTURE_ANISOTROPY:
287 return 16.0f;
288 case PIPE_CAP_MAX_TEXTURE_LOD_BIAS:
289 return 16.0f;
290 case PIPE_CAP_GUARD_BAND_LEFT:
291 case PIPE_CAP_GUARD_BAND_TOP:
292 case PIPE_CAP_GUARD_BAND_RIGHT:
293 case PIPE_CAP_GUARD_BAND_BOTTOM:
294 /* XXX I don't know what these should be but the least we can do is
295 * silence the potential error message */
296 return 0.0f;
297 default:
298 debug_printf("r300: Warning: Unknown CAP %d in get_paramf.\n",
299 param);
300 return 0.0f;
301 }
302 }
303
304 static boolean r300_is_format_supported(struct pipe_screen* screen,
305 enum pipe_format format,
306 enum pipe_texture_target target,
307 unsigned sample_count,
308 unsigned usage,
309 unsigned geom_flags)
310 {
311 struct r300_winsys_screen *rws = r300_screen(screen)->rws;
312 uint32_t retval = 0;
313 boolean drm_2_8_0 = rws->get_value(rws, R300_VID_DRM_2_8_0);
314 boolean is_r500 = r300_screen(screen)->caps.is_r500;
315 boolean is_r400 = r300_screen(screen)->caps.is_r400;
316 boolean is_color2101010 = format == PIPE_FORMAT_R10G10B10A2_UNORM ||
317 format == PIPE_FORMAT_R10G10B10X2_SNORM ||
318 format == PIPE_FORMAT_B10G10R10A2_UNORM ||
319 format == PIPE_FORMAT_R10SG10SB10SA2U_NORM;
320 boolean is_ati1n = format == PIPE_FORMAT_RGTC1_UNORM ||
321 format == PIPE_FORMAT_RGTC1_SNORM ||
322 format == PIPE_FORMAT_LATC1_UNORM ||
323 format == PIPE_FORMAT_LATC1_SNORM;
324 boolean is_ati2n = format == PIPE_FORMAT_RGTC2_UNORM ||
325 format == PIPE_FORMAT_RGTC2_SNORM ||
326 format == PIPE_FORMAT_LATC2_UNORM ||
327 format == PIPE_FORMAT_LATC2_SNORM;
328 boolean is_half_float = format == PIPE_FORMAT_R16_FLOAT ||
329 format == PIPE_FORMAT_R16G16_FLOAT ||
330 format == PIPE_FORMAT_R16G16B16_FLOAT ||
331 format == PIPE_FORMAT_R16G16B16A16_FLOAT;
332
333 /* Check multisampling support. */
334 switch (sample_count) {
335 case 0:
336 case 1:
337 break;
338 case 2:
339 case 3:
340 case 4:
341 case 6:
342 return FALSE;
343 #if 0
344 if (usage != PIPE_BIND_RENDER_TARGET ||
345 !util_format_is_rgba8_variant(
346 util_format_description(format))) {
347 return FALSE;
348 }
349 #endif
350 break;
351 default:
352 return FALSE;
353 }
354
355 /* Check sampler format support. */
356 if ((usage & PIPE_BIND_SAMPLER_VIEW) &&
357 /* ATI1N is r5xx-only. */
358 (is_r500 || !is_ati1n) &&
359 /* ATI2N is supported on r4xx-r5xx. */
360 (is_r400 || is_r500 || !is_ati2n) &&
361 r300_is_sampler_format_supported(format)) {
362 retval |= PIPE_BIND_SAMPLER_VIEW;
363 }
364
365 /* Check colorbuffer format support. */
366 if ((usage & (PIPE_BIND_RENDER_TARGET |
367 PIPE_BIND_DISPLAY_TARGET |
368 PIPE_BIND_SCANOUT |
369 PIPE_BIND_SHARED)) &&
370 /* 2101010 cannot be rendered to on non-r5xx. */
371 (!is_color2101010 || (is_r500 && drm_2_8_0)) &&
372 r300_is_colorbuffer_format_supported(format)) {
373 retval |= usage &
374 (PIPE_BIND_RENDER_TARGET |
375 PIPE_BIND_DISPLAY_TARGET |
376 PIPE_BIND_SCANOUT |
377 PIPE_BIND_SHARED);
378 }
379
380 /* Check depth-stencil format support. */
381 if (usage & PIPE_BIND_DEPTH_STENCIL &&
382 r300_is_zs_format_supported(format)) {
383 retval |= PIPE_BIND_DEPTH_STENCIL;
384 }
385
386 /* Check vertex buffer format support. */
387 if (usage & PIPE_BIND_VERTEX_BUFFER &&
388 /* Half float is supported on >= RV350. */
389 (is_r400 || is_r500 || !is_half_float) &&
390 r300_translate_vertex_data_type(format) != R300_INVALID_FORMAT) {
391 retval |= PIPE_BIND_VERTEX_BUFFER;
392 }
393
394 /* Transfers are always supported. */
395 if (usage & PIPE_BIND_TRANSFER_READ)
396 retval |= PIPE_BIND_TRANSFER_READ;
397 if (usage & PIPE_BIND_TRANSFER_WRITE)
398 retval |= PIPE_BIND_TRANSFER_WRITE;
399
400 return retval == usage;
401 }
402
403 static void r300_destroy_screen(struct pipe_screen* pscreen)
404 {
405 struct r300_screen* r300screen = r300_screen(pscreen);
406 struct r300_winsys_screen *rws = r300_winsys_screen(pscreen);
407
408 util_slab_destroy(&r300screen->pool_buffers);
409 pipe_mutex_destroy(r300screen->num_contexts_mutex);
410
411 if (rws)
412 rws->destroy(rws);
413
414 FREE(r300screen);
415 }
416
/* pipe_screen::fence_reference hook.
 *
 * Fence handles are treated as winsys buffer objects here, so this simply
 * casts both arguments and forwards them to r300_winsys_bo_reference(). */
static void r300_fence_reference(struct pipe_screen *screen,
                                 struct pipe_fence_handle **ptr,
                                 struct pipe_fence_handle *fence)
{
    struct r300_winsys_bo **dst = (struct r300_winsys_bo**)ptr;
    struct r300_winsys_bo *src = (struct r300_winsys_bo*)fence;

    r300_winsys_bo_reference(dst, src);
}
424
425 static int r300_fence_signalled(struct pipe_screen *screen,
426 struct pipe_fence_handle *fence,
427 unsigned flags)
428 {
429 struct r300_winsys_screen *rws = r300_screen(screen)->rws;
430 struct r300_winsys_bo *rfence = (struct r300_winsys_bo*)fence;
431
432 return !rws->buffer_is_busy(rfence) ? 0 : 1; /* 0 == success */
433 }
434
435 static int r300_fence_finish(struct pipe_screen *screen,
436 struct pipe_fence_handle *fence,
437 unsigned flags)
438 {
439 struct r300_winsys_screen *rws = r300_screen(screen)->rws;
440 struct r300_winsys_bo *rfence = (struct r300_winsys_bo*)fence;
441
442 rws->buffer_wait(rfence);
443 return 0; /* 0 == success */
444 }
445
446 struct pipe_screen* r300_screen_create(struct r300_winsys_screen *rws)
447 {
448 struct r300_screen *r300screen = CALLOC_STRUCT(r300_screen);
449
450 if (!r300screen) {
451 FREE(r300screen);
452 return NULL;
453 }
454
455 r300screen->caps.pci_id = rws->get_value(rws, R300_VID_PCI_ID);
456 r300screen->caps.num_frag_pipes = rws->get_value(rws, R300_VID_GB_PIPES);
457 r300screen->caps.num_z_pipes = rws->get_value(rws, R300_VID_Z_PIPES);
458
459 r300_init_debug(r300screen);
460 r300_parse_chipset(&r300screen->caps);
461
462 if (SCREEN_DBG_ON(r300screen, DBG_NO_ZMASK))
463 r300screen->caps.zmask_ram = 0;
464 if (SCREEN_DBG_ON(r300screen, DBG_NO_HIZ))
465 r300screen->caps.hiz_ram = 0;
466
467 pipe_mutex_init(r300screen->num_contexts_mutex);
468
469 util_slab_create(&r300screen->pool_buffers,
470 sizeof(struct r300_resource), 64,
471 UTIL_SLAB_SINGLETHREADED);
472
473 r300screen->rws = rws;
474 r300screen->screen.winsys = (struct pipe_winsys*)rws;
475 r300screen->screen.destroy = r300_destroy_screen;
476 r300screen->screen.get_name = r300_get_name;
477 r300screen->screen.get_vendor = r300_get_vendor;
478 r300screen->screen.get_param = r300_get_param;
479 r300screen->screen.get_shader_param = r300_get_shader_param;
480 r300screen->screen.get_paramf = r300_get_paramf;
481 r300screen->screen.is_format_supported = r300_is_format_supported;
482 r300screen->screen.context_create = r300_create_context;
483
484 r300screen->screen.fence_reference = r300_fence_reference;
485 r300screen->screen.fence_signalled = r300_fence_signalled;
486 r300screen->screen.fence_finish = r300_fence_finish;
487
488 r300_init_screen_resource_functions(r300screen);
489
490 util_format_s3tc_init();
491
492 return &r300screen->screen;
493 }