r300g: fix microtiling on RS6xx
[mesa.git] / src / gallium / drivers / r300 / r300_screen.c
1 /*
2 * Copyright 2008 Corbin Simpson <MostAwesomeDude@gmail.com>
3 * Copyright 2010 Marek Olšák <maraeo@gmail.com>
4 *
5 * Permission is hereby granted, free of charge, to any person obtaining a
6 * copy of this software and associated documentation files (the "Software"),
7 * to deal in the Software without restriction, including without limitation
8 * on the rights to use, copy, modify, merge, publish, distribute, sub
9 * license, and/or sell copies of the Software, and to permit persons to whom
10 * the Software is furnished to do so, subject to the following conditions:
11 *
12 * The above copyright notice and this permission notice (including the next
13 * paragraph) shall be included in all copies or substantial portions of the
14 * Software.
15 *
16 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
17 * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
18 * FITNESS FOR A PARTICULAR PURPOSE AND NON-INFRINGEMENT. IN NO EVENT SHALL
19 * THE AUTHOR(S) AND/OR THEIR SUPPLIERS BE LIABLE FOR ANY CLAIM,
20 * DAMAGES OR OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR
21 * OTHERWISE, ARISING FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE
22 * USE OR OTHER DEALINGS IN THE SOFTWARE. */
23
24 #include "util/u_format.h"
25 #include "util/u_format_s3tc.h"
26 #include "util/u_memory.h"
27
28 #include "r300_context.h"
29 #include "r300_texture.h"
30 #include "r300_screen_buffer.h"
31 #include "r300_state_inlines.h"
32 #include "r300_winsys.h"
33 #include "r300_public.h"
34
35 /* Return the identifier behind whom the brave coders responsible for this
36 * amalgamation of code, sweat, and duct tape, routinely obscure their names.
37 *
38 * ...I should have just put "Corbin Simpson", but I'm not that cool.
39 *
40 * (Or egotistical. Yet.) */
static const char* r300_get_vendor(struct pipe_screen* pscreen)
{
    /* The vendor string is a constant; pscreen is not consulted. */
    static const char vendor[] = "X.Org R300 Project";

    return vendor;
}
45
/* Printable chip family names.  r300_get_name() indexes this table with
 * caps.family, so the order of the entries must not change. */
static const char* chip_families[] = {
    /* R3xx */
    "R300", "R350", "R360", "RV350", "RV370", "RV380",
    /* R4xx */
    "R420", "R423", "R430", "R480", "R481", "RV410",
    /* Integrated parts */
    "RS400", "RC410", "RS480", "RS482",
    "RS600", "RS690", "RS740",
    /* R5xx */
    "RV515", "R520", "RV530", "R580", "RV560", "RV570"
};
73
74 static const char* r300_get_name(struct pipe_screen* pscreen)
75 {
76 struct r300_screen* r300screen = r300_screen(pscreen);
77
78 return chip_families[r300screen->caps.family];
79 }
80
81 static int r300_get_param(struct pipe_screen* pscreen, enum pipe_cap param)
82 {
83 struct r300_screen* r300screen = r300_screen(pscreen);
84 boolean is_r400 = r300screen->caps.is_r400;
85 boolean is_r500 = r300screen->caps.is_r500;
86
87 /* XXX extended shader capabilities of r400 unimplemented */
88 is_r400 = FALSE;
89
90 switch (param) {
91 /* Supported features (boolean caps). */
92 case PIPE_CAP_NPOT_TEXTURES:
93 case PIPE_CAP_TWO_SIDED_STENCIL:
94 case PIPE_CAP_GLSL:
95 /* I'll be frank. This is a lie.
96 *
97 * We don't truly support GLSL on any of this driver's chipsets.
98 * To be fair, no chipset supports the full GLSL specification
99 * to the best of our knowledge, but some of the less esoteric
100 * features are still missing here.
101 *
102 * Rather than cripple ourselves intentionally, I'm going to set
103 * this flag, and as Gallium's interface continues to change, I
104 * hope that this single monolithic GLSL enable can slowly get
105 * split down into many different pieces and the state tracker
106 * will handle fallbacks transparently, like it should.
107 *
108 * ~ C.
109 */
110 case PIPE_CAP_ANISOTROPIC_FILTER:
111 case PIPE_CAP_POINT_SPRITE:
112 case PIPE_CAP_OCCLUSION_QUERY:
113 case PIPE_CAP_TEXTURE_SHADOW_MAP:
114 case PIPE_CAP_TEXTURE_MIRROR_CLAMP:
115 case PIPE_CAP_TEXTURE_MIRROR_REPEAT:
116 case PIPE_CAP_BLEND_EQUATION_SEPARATE:
117 case PIPE_CAP_TEXTURE_SWIZZLE:
118 case PIPE_CAP_DEPTH_CLAMP:
119 return 1;
120
121 /* Unsupported features (boolean caps). */
122 case PIPE_CAP_TIMER_QUERY:
123 case PIPE_CAP_DUAL_SOURCE_BLEND:
124 case PIPE_CAP_TGSI_CONT_SUPPORTED:
125 case PIPE_CAP_INDEP_BLEND_ENABLE:
126 case PIPE_CAP_INDEP_BLEND_FUNC:
127 return 0;
128
129 /* Texturing. */
130 case PIPE_CAP_MAX_TEXTURE_IMAGE_UNITS:
131 case PIPE_CAP_MAX_COMBINED_SAMPLERS:
132 return r300screen->caps.num_tex_units;
133 case PIPE_CAP_MAX_VERTEX_TEXTURE_UNITS:
134 return 0;
135 case PIPE_CAP_MAX_TEXTURE_2D_LEVELS:
136 case PIPE_CAP_MAX_TEXTURE_3D_LEVELS:
137 case PIPE_CAP_MAX_TEXTURE_CUBE_LEVELS:
138 /* 13 == 4096, 12 == 2048 */
139 return is_r500 ? 13 : 12;
140
141 /* Render targets. */
142 case PIPE_CAP_MAX_RENDER_TARGETS:
143 return 4;
144
145 /* General shader limits and features. */
146 case PIPE_CAP_SM3:
147 return is_r500 ? 1 : 0;
148 case PIPE_CAP_MAX_CONST_BUFFERS:
149 return 1;
150 case PIPE_CAP_MAX_CONST_BUFFER_SIZE:
151 return 256;
152
153 case PIPE_CAP_DEPTHSTENCIL_CLEAR_SEPARATE:
154 return 1;
155
156 /* Fragment coordinate conventions. */
157 case PIPE_CAP_TGSI_FS_COORD_ORIGIN_UPPER_LEFT:
158 case PIPE_CAP_TGSI_FS_COORD_PIXEL_CENTER_HALF_INTEGER:
159 return 1;
160 case PIPE_CAP_TGSI_FS_COORD_ORIGIN_LOWER_LEFT:
161 case PIPE_CAP_TGSI_FS_COORD_PIXEL_CENTER_INTEGER:
162 return 0;
163
164 /* Fragment shader limits. */
165 case PIPE_CAP_MAX_FS_INSTRUCTIONS:
166 return is_r500 || is_r400 ? 512 : 96;
167 case PIPE_CAP_MAX_FS_ALU_INSTRUCTIONS:
168 return is_r500 || is_r400 ? 512 : 64;
169 case PIPE_CAP_MAX_FS_TEX_INSTRUCTIONS:
170 return is_r500 || is_r400 ? 512 : 32;
171 case PIPE_CAP_MAX_FS_TEX_INDIRECTIONS:
172 return is_r500 ? 511 : 4;
173 case PIPE_CAP_MAX_FS_CONTROL_FLOW_DEPTH:
174 return is_r500 ? 64 : 0; /* Actually unlimited on r500. */
175 case PIPE_CAP_MAX_FS_INPUTS:
176 /* 2 colors + 8 texcoords are always supported
177 * (minus fog and wpos).
178 *
179 * R500 has the ability to turn 3rd and 4th color into
180 * additional texcoords but there is no two-sided color
181 * selection then. However the facing bit can be used instead. */
182 return 10;
183 case PIPE_CAP_MAX_FS_CONSTS:
184 return is_r500 ? 256 : 32;
185 case PIPE_CAP_MAX_FS_TEMPS:
186 return is_r500 ? 128 : is_r400 ? 64 : 32;
187 case PIPE_CAP_MAX_FS_ADDRS:
188 return 0;
189 case PIPE_CAP_MAX_FS_PREDS:
190 return is_r500 ? 1 : 0;
191
192 /* Vertex shader limits. */
193 case PIPE_CAP_MAX_VS_INSTRUCTIONS:
194 case PIPE_CAP_MAX_VS_ALU_INSTRUCTIONS:
195 return is_r500 ? 1024 : 256;
196 case PIPE_CAP_MAX_VS_TEX_INSTRUCTIONS:
197 case PIPE_CAP_MAX_VS_TEX_INDIRECTIONS:
198 return 0;
199 case PIPE_CAP_MAX_VS_CONTROL_FLOW_DEPTH:
200 return is_r500 ? 4 : 0; /* For loops; not sure about conditionals. */
201 case PIPE_CAP_MAX_VS_INPUTS:
202 return 16;
203 case PIPE_CAP_MAX_VS_CONSTS:
204 return 256;
205 case PIPE_CAP_MAX_VS_TEMPS:
206 return 32;
207 case PIPE_CAP_MAX_VS_ADDRS:
208 return 1; /* XXX guessed */
209 case PIPE_CAP_MAX_VS_PREDS:
210 return is_r500 ? 4 : 0; /* XXX guessed. */
211 case PIPE_CAP_GEOMETRY_SHADER4:
212 return 0;
213
214 default:
215 fprintf(stderr, "r300: Implementation error: Bad param %d\n",
216 param);
217 return 0;
218 }
219 }
220
221 static float r300_get_paramf(struct pipe_screen* pscreen, enum pipe_cap param)
222 {
223 struct r300_screen* r300screen = r300_screen(pscreen);
224
225 switch (param) {
226 case PIPE_CAP_MAX_LINE_WIDTH:
227 case PIPE_CAP_MAX_LINE_WIDTH_AA:
228 case PIPE_CAP_MAX_POINT_WIDTH:
229 case PIPE_CAP_MAX_POINT_WIDTH_AA:
230 /* The maximum dimensions of the colorbuffer are our practical
231 * rendering limits. 2048 pixels should be enough for anybody. */
232 if (r300screen->caps.is_r500) {
233 return 4096.0f;
234 } else if (r300screen->caps.is_r400) {
235 return 4021.0f;
236 } else {
237 return 2560.0f;
238 }
239 case PIPE_CAP_MAX_TEXTURE_ANISOTROPY:
240 return 16.0f;
241 case PIPE_CAP_MAX_TEXTURE_LOD_BIAS:
242 return 16.0f;
243 default:
244 fprintf(stderr, "r300: Implementation error: Bad paramf %d\n",
245 param);
246 return 0.0f;
247 }
248 }
249
250 static boolean r300_is_format_supported(struct pipe_screen* screen,
251 enum pipe_format format,
252 enum pipe_texture_target target,
253 unsigned sample_count,
254 unsigned usage,
255 unsigned geom_flags)
256 {
257 uint32_t retval = 0;
258 boolean is_r500 = r300_screen(screen)->caps.is_r500;
259 boolean is_r400 = r300_screen(screen)->caps.is_r400;
260 boolean is_color2101010 = format == PIPE_FORMAT_R10G10B10A2_UNORM ||
261 format == PIPE_FORMAT_R10G10B10X2_SNORM ||
262 format == PIPE_FORMAT_B10G10R10A2_UNORM ||
263 format == PIPE_FORMAT_R10SG10SB10SA2U_NORM;
264 boolean is_ati1n = format == PIPE_FORMAT_RGTC1_UNORM ||
265 format == PIPE_FORMAT_RGTC1_SNORM;
266 boolean is_ati2n = format == PIPE_FORMAT_RGTC2_UNORM ||
267 format == PIPE_FORMAT_RGTC2_SNORM;
268 boolean is_half_float = format == PIPE_FORMAT_R16_FLOAT ||
269 format == PIPE_FORMAT_R16G16_FLOAT ||
270 format == PIPE_FORMAT_R16G16B16_FLOAT ||
271 format == PIPE_FORMAT_R16G16B16A16_FLOAT;
272
273 /* Check multisampling support. */
274 switch (sample_count) {
275 case 0:
276 case 1:
277 break;
278 case 2:
279 case 3:
280 case 4:
281 case 6:
282 if (usage != PIPE_BIND_RENDER_TARGET ||
283 !util_format_is_rgba8_variant(
284 util_format_description(format))) {
285 return FALSE;
286 }
287 break;
288 default:
289 return FALSE;
290 }
291
292 /* Check sampler format support. */
293 if ((usage & PIPE_BIND_SAMPLER_VIEW) &&
294 /* ATI1N is r5xx-only. */
295 (is_r500 || !is_ati1n) &&
296 /* ATI2N is supported on r4xx-r5xx. */
297 (is_r400 || is_r500 || !is_ati2n) &&
298 r300_is_sampler_format_supported(format)) {
299 retval |= PIPE_BIND_SAMPLER_VIEW;
300 }
301
302 /* Check colorbuffer format support. */
303 if ((usage & (PIPE_BIND_RENDER_TARGET |
304 PIPE_BIND_DISPLAY_TARGET |
305 PIPE_BIND_SCANOUT |
306 PIPE_BIND_SHARED)) &&
307 /* 2101010 cannot be rendered to on non-r5xx. */
308 (is_r500 || !is_color2101010) &&
309 r300_is_colorbuffer_format_supported(format)) {
310 retval |= usage &
311 (PIPE_BIND_RENDER_TARGET |
312 PIPE_BIND_DISPLAY_TARGET |
313 PIPE_BIND_SCANOUT |
314 PIPE_BIND_SHARED);
315 }
316
317 /* Check depth-stencil format support. */
318 if (usage & PIPE_BIND_DEPTH_STENCIL &&
319 r300_is_zs_format_supported(format)) {
320 retval |= PIPE_BIND_DEPTH_STENCIL;
321 }
322
323 /* Check vertex buffer format support. */
324 if (usage & PIPE_BIND_VERTEX_BUFFER &&
325 /* Half float is supported on >= RV350. */
326 (is_r400 || is_r500 || !is_half_float) &&
327 r300_translate_vertex_data_type(format) != R300_INVALID_FORMAT) {
328 retval |= PIPE_BIND_VERTEX_BUFFER;
329 }
330
331 /* Transfers are always supported. */
332 if (usage & PIPE_BIND_TRANSFER_READ)
333 retval |= PIPE_BIND_TRANSFER_READ;
334 if (usage & PIPE_BIND_TRANSFER_WRITE)
335 retval |= PIPE_BIND_TRANSFER_WRITE;
336
337 return retval == usage;
338 }
339
340 static void r300_destroy_screen(struct pipe_screen* pscreen)
341 {
342 struct r300_screen* r300screen = r300_screen(pscreen);
343 struct r300_winsys_screen *rws = r300_winsys_screen(pscreen);
344
345 util_mempool_destroy(&r300screen->pool_buffers);
346
347 if (rws)
348 rws->destroy(rws);
349
350 FREE(r300screen);
351 }
352
353 static void r300_fence_reference(struct pipe_screen *screen,
354 struct pipe_fence_handle **ptr,
355 struct pipe_fence_handle *fence)
356 {
357 struct r300_fence **oldf = (struct r300_fence**)ptr;
358 struct r300_fence *newf = (struct r300_fence*)fence;
359
360 if (pipe_reference(&(*oldf)->reference, &newf->reference))
361 FREE(*oldf);
362
363 *ptr = fence;
364 }
365
366 static int r300_fence_signalled(struct pipe_screen *screen,
367 struct pipe_fence_handle *fence,
368 unsigned flags)
369 {
370 struct r300_fence *rfence = (struct r300_fence*)fence;
371
372 return rfence->signalled ? 0 : 1; /* 0 == success */
373 }
374
375 static int r300_fence_finish(struct pipe_screen *screen,
376 struct pipe_fence_handle *fence,
377 unsigned flags)
378 {
379 struct r300_fence *rfence = (struct r300_fence*)fence;
380
381 r300_finish(rfence->ctx);
382 rfence->signalled = TRUE;
383 return 0; /* 0 == success */
384 }
385
386 struct pipe_screen* r300_screen_create(struct r300_winsys_screen *rws)
387 {
388 struct r300_screen *r300screen = CALLOC_STRUCT(r300_screen);
389
390 if (!r300screen) {
391 FREE(r300screen);
392 return NULL;
393 }
394
395 r300screen->caps.pci_id = rws->get_value(rws, R300_VID_PCI_ID);
396 r300screen->caps.num_frag_pipes = rws->get_value(rws, R300_VID_GB_PIPES);
397 r300screen->caps.num_z_pipes = rws->get_value(rws, R300_VID_Z_PIPES);
398
399 r300_init_debug(r300screen);
400 r300_parse_chipset(&r300screen->caps);
401
402 util_mempool_create(&r300screen->pool_buffers,
403 sizeof(struct r300_buffer), 64,
404 UTIL_MEMPOOL_SINGLETHREADED);
405
406 r300screen->rws = rws;
407 r300screen->screen.winsys = (struct pipe_winsys*)rws;
408 r300screen->screen.destroy = r300_destroy_screen;
409 r300screen->screen.get_name = r300_get_name;
410 r300screen->screen.get_vendor = r300_get_vendor;
411 r300screen->screen.get_param = r300_get_param;
412 r300screen->screen.get_paramf = r300_get_paramf;
413 r300screen->screen.is_format_supported = r300_is_format_supported;
414 r300screen->screen.context_create = r300_create_context;
415
416 r300screen->screen.fence_reference = r300_fence_reference;
417 r300screen->screen.fence_signalled = r300_fence_signalled;
418 r300screen->screen.fence_finish = r300_fence_finish;
419
420 r300_init_screen_resource_functions(r300screen);
421
422 util_format_s3tc_init();
423
424 return &r300screen->screen;
425 }