r300g: final fix for r3xx constant buffer emission
[mesa.git] / src / gallium / drivers / r300 / r300_screen.c
1 /*
2 * Copyright 2008 Corbin Simpson <MostAwesomeDude@gmail.com>
3 * Copyright 2010 Marek Olšák <maraeo@gmail.com>
4 *
5 * Permission is hereby granted, free of charge, to any person obtaining a
6 * copy of this software and associated documentation files (the "Software"),
7 * to deal in the Software without restriction, including without limitation
8 * on the rights to use, copy, modify, merge, publish, distribute, sub
9 * license, and/or sell copies of the Software, and to permit persons to whom
10 * the Software is furnished to do so, subject to the following conditions:
11 *
12 * The above copyright notice and this permission notice (including the next
13 * paragraph) shall be included in all copies or substantial portions of the
14 * Software.
15 *
16 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
17 * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
18 * FITNESS FOR A PARTICULAR PURPOSE AND NON-INFRINGEMENT. IN NO EVENT SHALL
19 * THE AUTHOR(S) AND/OR THEIR SUPPLIERS BE LIABLE FOR ANY CLAIM,
20 * DAMAGES OR OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR
21 * OTHERWISE, ARISING FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE
22 * USE OR OTHER DEALINGS IN THE SOFTWARE. */
23
24 #include "util/u_format.h"
25 #include "util/u_format_s3tc.h"
26 #include "util/u_memory.h"
27
28 #include "r300_context.h"
29 #include "r300_texture.h"
30 #include "r300_screen_buffer.h"
31 #include "r300_state_inlines.h"
32 #include "r300_winsys.h"
33 #include "r300_public.h"
34
/* Report the vendor string under which this driver identifies itself.
 *
 * The screen argument is not consulted: the same project name is returned
 * regardless of which chip is driving the screen. */
static const char* r300_get_vendor(struct pipe_screen* pscreen)
{
    static const char vendor[] = "X.Org R300 Project";

    return vendor;
}
45
/* Printable chip names.
 *
 * r300_get_name() indexes this table directly with caps.family, so the
 * order of the entries must not be changed. */
static const char* chip_families[] = {
    "R300",  "R350",  "R360",  "RV350", "RV370",
    "RV380", "R420",  "R423",  "R430",  "R480",
    "R481",  "RV410", "RS400", "RC410", "RS480",
    "RS482", "RS600", "RS690", "RS740", "RV515",
    "R520",  "RV530", "R580",  "RV560", "RV570"
};
73
74 static const char* r300_get_name(struct pipe_screen* pscreen)
75 {
76 struct r300_screen* r300screen = r300_screen(pscreen);
77
78 return chip_families[r300screen->caps.family];
79 }
80
81 static int r300_get_param(struct pipe_screen* pscreen, enum pipe_cap param)
82 {
83 struct r300_screen* r300screen = r300_screen(pscreen);
84 boolean is_r400 = r300screen->caps.is_r400;
85 boolean is_r500 = r300screen->caps.is_r500;
86
87 /* XXX extended shader capabilities of r400 unimplemented */
88 is_r400 = FALSE;
89
90 switch (param) {
91 /* Supported features (boolean caps). */
92 case PIPE_CAP_NPOT_TEXTURES:
93 case PIPE_CAP_TWO_SIDED_STENCIL:
94 case PIPE_CAP_GLSL:
95 /* I'll be frank. This is a lie.
96 *
97 * We don't truly support GLSL on any of this driver's chipsets.
98 * To be fair, no chipset supports the full GLSL specification
99 * to the best of our knowledge, but some of the less esoteric
100 * features are still missing here.
101 *
102 * Rather than cripple ourselves intentionally, I'm going to set
103 * this flag, and as Gallium's interface continues to change, I
104 * hope that this single monolithic GLSL enable can slowly get
105 * split down into many different pieces and the state tracker
106 * will handle fallbacks transparently, like it should.
107 *
108 * ~ C.
109 */
110 case PIPE_CAP_ANISOTROPIC_FILTER:
111 case PIPE_CAP_POINT_SPRITE:
112 case PIPE_CAP_OCCLUSION_QUERY:
113 case PIPE_CAP_TEXTURE_SHADOW_MAP:
114 case PIPE_CAP_TEXTURE_MIRROR_CLAMP:
115 case PIPE_CAP_TEXTURE_MIRROR_REPEAT:
116 case PIPE_CAP_BLEND_EQUATION_SEPARATE:
117 case PIPE_CAP_TEXTURE_SWIZZLE:
118 return 1;
119
120 /* Unsupported features (boolean caps). */
121 case PIPE_CAP_TIMER_QUERY:
122 case PIPE_CAP_DUAL_SOURCE_BLEND:
123 case PIPE_CAP_TGSI_CONT_SUPPORTED:
124 case PIPE_CAP_INDEP_BLEND_ENABLE:
125 case PIPE_CAP_INDEP_BLEND_FUNC:
126 return 0;
127
128 /* Texturing. */
129 case PIPE_CAP_MAX_TEXTURE_IMAGE_UNITS:
130 case PIPE_CAP_MAX_COMBINED_SAMPLERS:
131 return r300screen->caps.num_tex_units;
132 case PIPE_CAP_MAX_VERTEX_TEXTURE_UNITS:
133 return 0;
134 case PIPE_CAP_MAX_TEXTURE_2D_LEVELS:
135 case PIPE_CAP_MAX_TEXTURE_3D_LEVELS:
136 case PIPE_CAP_MAX_TEXTURE_CUBE_LEVELS:
137 /* 13 == 4096, 12 == 2048 */
138 return is_r500 ? 13 : 12;
139
140 /* Render targets. */
141 case PIPE_CAP_MAX_RENDER_TARGETS:
142 return 4;
143
144 /* General shader limits and features. */
145 case PIPE_CAP_SM3:
146 return is_r500 ? 1 : 0;
147 case PIPE_CAP_MAX_CONST_BUFFERS:
148 return 1;
149 case PIPE_CAP_MAX_CONST_BUFFER_SIZE:
150 return 256;
151
152 case PIPE_CAP_DEPTHSTENCIL_CLEAR_SEPARATE:
153 return 1;
154
155 /* Fragment coordinate conventions. */
156 case PIPE_CAP_TGSI_FS_COORD_ORIGIN_UPPER_LEFT:
157 case PIPE_CAP_TGSI_FS_COORD_PIXEL_CENTER_HALF_INTEGER:
158 return 1;
159 case PIPE_CAP_TGSI_FS_COORD_ORIGIN_LOWER_LEFT:
160 case PIPE_CAP_TGSI_FS_COORD_PIXEL_CENTER_INTEGER:
161 return 0;
162
163 /* Fragment shader limits. */
164 case PIPE_CAP_MAX_FS_INSTRUCTIONS:
165 return is_r500 || is_r400 ? 512 : 96;
166 case PIPE_CAP_MAX_FS_ALU_INSTRUCTIONS:
167 return is_r500 || is_r400 ? 512 : 64;
168 case PIPE_CAP_MAX_FS_TEX_INSTRUCTIONS:
169 return is_r500 || is_r400 ? 512 : 32;
170 case PIPE_CAP_MAX_FS_TEX_INDIRECTIONS:
171 return is_r500 ? 511 : 4;
172 case PIPE_CAP_MAX_FS_CONTROL_FLOW_DEPTH:
173 return is_r500 ? 64 : 0; /* Actually unlimited on r500. */
174 case PIPE_CAP_MAX_FS_INPUTS:
175 /* 2 colors + 8 texcoords are always supported
176 * (minus fog and wpos).
177 *
178 * R500 has the ability to turn 3rd and 4th color into
179 * additional texcoords but there is no two-sided color
180 * selection then. However the facing bit can be used instead. */
181 return 10;
182 case PIPE_CAP_MAX_FS_CONSTS:
183 return is_r500 ? 256 : 32;
184 case PIPE_CAP_MAX_FS_TEMPS:
185 return is_r500 ? 128 : is_r400 ? 64 : 32;
186 case PIPE_CAP_MAX_FS_ADDRS:
187 return 0;
188 case PIPE_CAP_MAX_FS_PREDS:
189 return is_r500 ? 1 : 0;
190
191 /* Vertex shader limits. */
192 case PIPE_CAP_MAX_VS_INSTRUCTIONS:
193 case PIPE_CAP_MAX_VS_ALU_INSTRUCTIONS:
194 return is_r500 ? 1024 : 256;
195 case PIPE_CAP_MAX_VS_TEX_INSTRUCTIONS:
196 case PIPE_CAP_MAX_VS_TEX_INDIRECTIONS:
197 return 0;
198 case PIPE_CAP_MAX_VS_CONTROL_FLOW_DEPTH:
199 return is_r500 ? 4 : 0; /* For loops; not sure about conditionals. */
200 case PIPE_CAP_MAX_VS_INPUTS:
201 return 16;
202 case PIPE_CAP_MAX_VS_CONSTS:
203 return 256;
204 case PIPE_CAP_MAX_VS_TEMPS:
205 return 32;
206 case PIPE_CAP_MAX_VS_ADDRS:
207 return 1; /* XXX guessed */
208 case PIPE_CAP_MAX_VS_PREDS:
209 return is_r500 ? 4 : 0; /* XXX guessed. */
210 case PIPE_CAP_GEOMETRY_SHADER4:
211 return 0;
212
213 default:
214 fprintf(stderr, "r300: Implementation error: Bad param %d\n",
215 param);
216 return 0;
217 }
218 }
219
220 static float r300_get_paramf(struct pipe_screen* pscreen, enum pipe_cap param)
221 {
222 struct r300_screen* r300screen = r300_screen(pscreen);
223
224 switch (param) {
225 case PIPE_CAP_MAX_LINE_WIDTH:
226 case PIPE_CAP_MAX_LINE_WIDTH_AA:
227 case PIPE_CAP_MAX_POINT_WIDTH:
228 case PIPE_CAP_MAX_POINT_WIDTH_AA:
229 /* The maximum dimensions of the colorbuffer are our practical
230 * rendering limits. 2048 pixels should be enough for anybody. */
231 if (r300screen->caps.is_r500) {
232 return 4096.0f;
233 } else if (r300screen->caps.is_r400) {
234 return 4021.0f;
235 } else {
236 return 2560.0f;
237 }
238 case PIPE_CAP_MAX_TEXTURE_ANISOTROPY:
239 return 16.0f;
240 case PIPE_CAP_MAX_TEXTURE_LOD_BIAS:
241 return 16.0f;
242 default:
243 fprintf(stderr, "r300: Implementation error: Bad paramf %d\n",
244 param);
245 return 0.0f;
246 }
247 }
248
249 static boolean r300_is_format_supported(struct pipe_screen* screen,
250 enum pipe_format format,
251 enum pipe_texture_target target,
252 unsigned sample_count,
253 unsigned usage,
254 unsigned geom_flags)
255 {
256 uint32_t retval = 0;
257 boolean is_r500 = r300_screen(screen)->caps.is_r500;
258 boolean is_r400 = r300_screen(screen)->caps.is_r400;
259 boolean is_z24 = format == PIPE_FORMAT_X8Z24_UNORM ||
260 format == PIPE_FORMAT_S8_USCALED_Z24_UNORM;
261 boolean is_color2101010 = format == PIPE_FORMAT_R10G10B10A2_UNORM ||
262 format == PIPE_FORMAT_R10G10B10X2_SNORM ||
263 format == PIPE_FORMAT_B10G10R10A2_UNORM ||
264 format == PIPE_FORMAT_R10SG10SB10SA2U_NORM;
265 boolean is_ati1n = format == PIPE_FORMAT_RGTC1_UNORM ||
266 format == PIPE_FORMAT_RGTC1_SNORM;
267 boolean is_ati2n = format == PIPE_FORMAT_RGTC2_UNORM ||
268 format == PIPE_FORMAT_RGTC2_SNORM;
269 boolean is_half_float = format == PIPE_FORMAT_R16_FLOAT ||
270 format == PIPE_FORMAT_R16G16_FLOAT ||
271 format == PIPE_FORMAT_R16G16B16_FLOAT ||
272 format == PIPE_FORMAT_R16G16B16A16_FLOAT;
273
274 /* Check multisampling support. */
275 switch (sample_count) {
276 case 0:
277 case 1:
278 break;
279 case 2:
280 case 3:
281 case 4:
282 case 6:
283 if (usage != PIPE_BIND_RENDER_TARGET ||
284 !util_format_is_rgba8_variant(
285 util_format_description(format))) {
286 return FALSE;
287 }
288 break;
289 default:
290 return FALSE;
291 }
292
293 /* Check sampler format support. */
294 if ((usage & PIPE_BIND_SAMPLER_VIEW) &&
295 /* Z24 cannot be sampled from on non-r5xx. */
296 (is_r500 || !is_z24) &&
297 /* ATI1N is r5xx-only. */
298 (is_r500 || !is_ati1n) &&
299 /* ATI2N is supported on r4xx-r5xx. */
300 (is_r400 || is_r500 || !is_ati2n) &&
301 r300_is_sampler_format_supported(format)) {
302 retval |= PIPE_BIND_SAMPLER_VIEW;
303 }
304
305 /* Check colorbuffer format support. */
306 if ((usage & (PIPE_BIND_RENDER_TARGET |
307 PIPE_BIND_DISPLAY_TARGET |
308 PIPE_BIND_SCANOUT |
309 PIPE_BIND_SHARED)) &&
310 /* 2101010 cannot be rendered to on non-r5xx. */
311 (is_r500 || !is_color2101010) &&
312 r300_is_colorbuffer_format_supported(format)) {
313 retval |= usage &
314 (PIPE_BIND_RENDER_TARGET |
315 PIPE_BIND_DISPLAY_TARGET |
316 PIPE_BIND_SCANOUT |
317 PIPE_BIND_SHARED);
318 }
319
320 /* Check depth-stencil format support. */
321 if (usage & PIPE_BIND_DEPTH_STENCIL &&
322 r300_is_zs_format_supported(format)) {
323 retval |= PIPE_BIND_DEPTH_STENCIL;
324 }
325
326 /* Check vertex buffer format support. */
327 if (usage & PIPE_BIND_VERTEX_BUFFER &&
328 /* Half float is supported on >= RV350. */
329 (is_r400 || is_r500 || !is_half_float) &&
330 r300_translate_vertex_data_type(format) != R300_INVALID_FORMAT) {
331 retval |= PIPE_BIND_VERTEX_BUFFER;
332 }
333
334 /* Transfers are always supported. */
335 if (usage & PIPE_BIND_TRANSFER_READ)
336 retval |= PIPE_BIND_TRANSFER_READ;
337 if (usage & PIPE_BIND_TRANSFER_WRITE)
338 retval |= PIPE_BIND_TRANSFER_WRITE;
339
340 return retval == usage;
341 }
342
343 static void r300_destroy_screen(struct pipe_screen* pscreen)
344 {
345 struct r300_screen* r300screen = r300_screen(pscreen);
346 struct r300_winsys_screen *rws = r300_winsys_screen(pscreen);
347
348 if (rws)
349 rws->destroy(rws);
350
351 FREE(r300screen);
352 }
353
354 static void r300_fence_reference(struct pipe_screen *screen,
355 struct pipe_fence_handle **ptr,
356 struct pipe_fence_handle *fence)
357 {
358 struct r300_fence **oldf = (struct r300_fence**)ptr;
359 struct r300_fence *newf = (struct r300_fence*)fence;
360
361 if (pipe_reference(&(*oldf)->reference, &newf->reference))
362 FREE(*oldf);
363
364 *ptr = fence;
365 }
366
367 static int r300_fence_signalled(struct pipe_screen *screen,
368 struct pipe_fence_handle *fence,
369 unsigned flags)
370 {
371 struct r300_fence *rfence = (struct r300_fence*)fence;
372
373 return rfence->signalled ? 0 : 1; /* 0 == success */
374 }
375
376 static int r300_fence_finish(struct pipe_screen *screen,
377 struct pipe_fence_handle *fence,
378 unsigned flags)
379 {
380 struct r300_fence *rfence = (struct r300_fence*)fence;
381
382 r300_finish(rfence->ctx);
383 rfence->signalled = TRUE;
384 return 0; /* 0 == success */
385 }
386
387 struct pipe_screen* r300_screen_create(struct r300_winsys_screen *rws)
388 {
389 struct r300_screen *r300screen = CALLOC_STRUCT(r300_screen);
390
391 if (!r300screen) {
392 FREE(r300screen);
393 return NULL;
394 }
395
396 r300screen->caps.pci_id = rws->get_value(rws, R300_VID_PCI_ID);
397 r300screen->caps.num_frag_pipes = rws->get_value(rws, R300_VID_GB_PIPES);
398 r300screen->caps.num_z_pipes = rws->get_value(rws, R300_VID_Z_PIPES);
399
400 r300_init_debug(r300screen);
401 r300_parse_chipset(&r300screen->caps);
402
403 r300screen->rws = rws;
404 r300screen->screen.winsys = (struct pipe_winsys*)rws;
405 r300screen->screen.destroy = r300_destroy_screen;
406 r300screen->screen.get_name = r300_get_name;
407 r300screen->screen.get_vendor = r300_get_vendor;
408 r300screen->screen.get_param = r300_get_param;
409 r300screen->screen.get_paramf = r300_get_paramf;
410 r300screen->screen.is_format_supported = r300_is_format_supported;
411 r300screen->screen.context_create = r300_create_context;
412
413 r300screen->screen.fence_reference = r300_fence_reference;
414 r300screen->screen.fence_signalled = r300_fence_signalled;
415 r300screen->screen.fence_finish = r300_fence_finish;
416
417 r300_init_screen_resource_functions(r300screen);
418
419 util_format_s3tc_init();
420
421 return &r300screen->screen;
422 }