2 * Copyright 2008 Ben Skeggs
4 * Permission is hereby granted, free of charge, to any person obtaining a
5 * copy of this software and associated documentation files (the "Software"),
6 * to deal in the Software without restriction, including without limitation
7 * the rights to use, copy, modify, merge, publish, distribute, sublicense,
8 * and/or sell copies of the Software, and to permit persons to whom the
9 * Software is furnished to do so, subject to the following conditions:
11 * The above copyright notice and this permission notice shall be included in
12 * all copies or substantial portions of the Software.
14 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
15 * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
16 * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL
17 * THE AUTHORS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER LIABILITY,
18 * WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, OUT OF
19 * OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
23 #include "util/u_format_s3tc.h"
24 #include "pipe/p_screen.h"
26 #include "nv50_context.h"
27 #include "nv50_screen.h"
28 #include "nv50_resource.h"
30 #include "nouveau/nouveau_stateobj.h"
/*
 * Report whether `format` can be used for every binding requested in `usage`.
 *
 * Visible logic: the DXT1/DXT3/DXT5 formats are examined when
 * util_format_s3tc_enabled is false, PIPE_FORMAT_Z16_UNORM is examined
 * together with a test of (chipset & 0xf0) against 0xa0, the transfer bind
 * bits are masked out of `usage`, and the final answer is whether
 * nv50_format_table[format].usage contains all of the remaining bits.
 *
 * NOTE(review): this listing appears to have lost lines (braces, the switch
 * header and the early returns are not visible), so the outcome of the S3TC
 * and Z16 checks cannot be confirmed from here.
 */
33 nv50_screen_is_format_supported(struct pipe_screen
*pscreen
,
34 enum pipe_format format
,
35 enum pipe_texture_target target
,
36 unsigned sample_count
,
37 unsigned usage
, unsigned geom_flags
)
/* compressed DXT formats are only looked at when S3TC support is not enabled */
42 if (!util_format_s3tc_enabled
) {
44 case PIPE_FORMAT_DXT1_RGB
:
45 case PIPE_FORMAT_DXT1_RGBA
:
46 case PIPE_FORMAT_DXT3_RGBA
:
47 case PIPE_FORMAT_DXT5_RGBA
:
/* Z16 depends on the chipset family (high nibble compared with 0xa0) */
55 case PIPE_FORMAT_Z16_UNORM
:
56 if ((nouveau_screen(pscreen
)->device
->chipset
& 0xf0) != 0xa0)
63 /* transfers & shared are always supported */
64 usage
&= ~(PIPE_BIND_TRANSFER_READ
|
65 PIPE_BIND_TRANSFER_WRITE
|
/* every remaining requested bind flag must be set in the format table entry */
68 return (nv50_format_table
[format
].usage
& usage
) == usage
;
/*
 * Answer a capability query (`param`, an enum pipe_cap) for this screen.
 *
 * The cases below list the capabilities this function recognises; a message
 * "Unknown PIPE_CAP" is logged through NOUVEAU_ERR, presumably for any value
 * that matches none of them.
 *
 * NOTE(review): the value returned for each case is not visible in this
 * listing (the lines between the case labels appear to be missing), so no
 * limits are documented here.
 */
72 nv50_screen_get_param(struct pipe_screen
*pscreen
, enum pipe_cap param
)
/* texture / sampler unit counts */
75 case PIPE_CAP_MAX_TEXTURE_IMAGE_UNITS
:
77 case PIPE_CAP_MAX_VERTEX_TEXTURE_UNITS
:
79 case PIPE_CAP_MAX_COMBINED_SAMPLERS
:
81 case PIPE_CAP_NPOT_TEXTURES
:
83 case PIPE_CAP_TWO_SIDED_STENCIL
:
87 case PIPE_CAP_GEOMETRY_SHADER4
:
89 case PIPE_CAP_ANISOTROPIC_FILTER
:
91 case PIPE_CAP_POINT_SPRITE
:
93 case PIPE_CAP_MAX_RENDER_TARGETS
:
95 case PIPE_CAP_OCCLUSION_QUERY
:
97 case PIPE_CAP_TIMER_QUERY
:
99 case PIPE_CAP_TEXTURE_SHADOW_MAP
:
/* mipmap level limits per texture target */
101 case PIPE_CAP_MAX_TEXTURE_2D_LEVELS
:
103 case PIPE_CAP_MAX_TEXTURE_3D_LEVELS
:
105 case PIPE_CAP_MAX_TEXTURE_CUBE_LEVELS
:
107 case PIPE_CAP_TEXTURE_MIRROR_CLAMP
:
108 case PIPE_CAP_TEXTURE_MIRROR_REPEAT
:
110 case PIPE_CAP_TEXTURE_SWIZZLE
:
112 case PIPE_CAP_TGSI_CONT_SUPPORTED
:
114 case PIPE_CAP_BLEND_EQUATION_SEPARATE
:
116 case PIPE_CAP_INDEP_BLEND_ENABLE
:
118 case PIPE_CAP_INDEP_BLEND_FUNC
:
120 case PIPE_CAP_DEPTHSTENCIL_CLEAR_SEPARATE
:
/* fragment coordinate conventions; the two pairs are grouped separately */
122 case PIPE_CAP_TGSI_FS_COORD_ORIGIN_UPPER_LEFT
:
123 case PIPE_CAP_TGSI_FS_COORD_PIXEL_CENTER_HALF_INTEGER
:
125 case PIPE_CAP_TGSI_FS_COORD_ORIGIN_LOWER_LEFT
:
126 case PIPE_CAP_TGSI_FS_COORD_PIXEL_CENTER_INTEGER
:
/* shader limits; the VS and FS variants share a label group throughout */
128 case PIPE_CAP_MAX_VS_INSTRUCTIONS
:
129 case PIPE_CAP_MAX_FS_INSTRUCTIONS
:
130 case PIPE_CAP_MAX_VS_ALU_INSTRUCTIONS
:
131 case PIPE_CAP_MAX_FS_ALU_INSTRUCTIONS
:
132 case PIPE_CAP_MAX_VS_TEX_INSTRUCTIONS
:
133 case PIPE_CAP_MAX_FS_TEX_INSTRUCTIONS
:
134 case PIPE_CAP_MAX_VS_TEX_INDIRECTIONS
:
135 case PIPE_CAP_MAX_FS_TEX_INDIRECTIONS
: /* arbitrary limit */
137 case PIPE_CAP_MAX_VS_CONTROL_FLOW_DEPTH
:
138 case PIPE_CAP_MAX_FS_CONTROL_FLOW_DEPTH
: /* need stack bo */
140 case PIPE_CAP_MAX_VS_INPUTS
:
142 case PIPE_CAP_MAX_FS_INPUTS
: /* 128 / 4 with GP */
144 case PIPE_CAP_MAX_VS_CONSTS
:
145 case PIPE_CAP_MAX_FS_CONSTS
:
147 case PIPE_CAP_MAX_VS_ADDRS
:
148 case PIPE_CAP_MAX_FS_ADDRS
: /* no spilling atm */
150 case PIPE_CAP_MAX_VS_PREDS
:
151 case PIPE_CAP_MAX_FS_PREDS
: /* not yet handled */
153 case PIPE_CAP_MAX_VS_TEMPS
:
154 case PIPE_CAP_MAX_FS_TEMPS
: /* no spilling atm */
156 case PIPE_CAP_DEPTH_CLAMP
:
/* unrecognised capability: log it (presumably the default branch) */
159 NOUVEAU_ERR("Unknown PIPE_CAP %d\n", param
);
/*
 * Answer the line width, point width, texture anisotropy and LOD bias
 * capability queries for this screen; installed as pscreen->get_paramf by
 * nv50_screen_create.
 *
 * A message "Unknown PIPE_CAP" is logged through NOUVEAU_ERR, presumably for
 * any value that matches none of the cases.
 *
 * NOTE(review): neither the return type nor the value returned for each case
 * is visible in this listing, so no limits are documented here.
 */
165 nv50_screen_get_paramf(struct pipe_screen
*pscreen
, enum pipe_cap param
)
/* aliased and anti-aliased line widths share one label group */
168 case PIPE_CAP_MAX_LINE_WIDTH
:
169 case PIPE_CAP_MAX_LINE_WIDTH_AA
:
/* aliased and anti-aliased point widths share one label group */
171 case PIPE_CAP_MAX_POINT_WIDTH
:
172 case PIPE_CAP_MAX_POINT_WIDTH_AA
:
174 case PIPE_CAP_MAX_TEXTURE_ANISOTROPY
:
176 case PIPE_CAP_MAX_TEXTURE_LOD_BIAS
:
/* unrecognised capability: log it (presumably the default branch) */
179 NOUVEAU_ERR("Unknown PIPE_CAP %d\n", param
);
/*
 * Release the resources held by an nv50 screen.
 *
 * In order: drops the references on the three constbuf_parm buffers and on
 * constbuf_misc[0] (each only when non-NULL), drops the references on the
 * tic and tsc buffers, frees the sync notifier, frees the tesla, eng2d and
 * m2mf objects, destroys the immd_heap, and finally calls
 * nouveau_screen_fini() on the base screen.
 *
 * nv50_screen_create calls this on its failure paths as well, so it can run
 * on a partially initialised screen.
 *
 * NOTE(review): nv50_screen_create also allocates screen->stack_bo; no
 * matching nouveau_bo_ref(NULL, ...) for it is visible here - confirm
 * whether it is released elsewhere.
 * NOTE(review): this listing appears to have lost lines (braces, local
 * declarations and anything after nouveau_screen_fini are not visible).
 */
185 nv50_screen_destroy(struct pipe_screen
*pscreen
)
187 struct nv50_screen
*screen
= nv50_screen(pscreen
);
/* parameter constant buffers, one per index 0..2 */
190 for (i
= 0; i
< 3; i
++) {
191 if (screen
->constbuf_parm
[i
])
192 nouveau_bo_ref(NULL
, &screen
->constbuf_parm
[i
]);
/* buffer shared by the PMISC and AUX constant buffer definitions */
195 if (screen
->constbuf_misc
[0])
196 nouveau_bo_ref(NULL
, &screen
->constbuf_misc
[0]);
198 nouveau_bo_ref(NULL
, &screen
->tic
);
200 nouveau_bo_ref(NULL
, &screen
->tsc
);
/* notifier and engine objects allocated in nv50_screen_create */
202 nouveau_notifier_free(&screen
->sync
);
203 nouveau_grobj_free(&screen
->tesla
);
204 nouveau_grobj_free(&screen
->eng2d
);
205 nouveau_grobj_free(&screen
->m2mf
);
206 nouveau_resource_destroy(&screen
->immd_heap
);
207 nouveau_screen_fini(&screen
->base
);
/*
 * Emit one word through OUT_RELOC against buffer `bo` on channel `ch`.  The
 * word is (n << 18) | (gr->subc << 13) | m and `fl` is forwarded as the
 * relocation flags; the last two OUT_RELOC arguments are always 0.
 *
 * `n`, `gr` and `m` are parenthesized in the expansion so that compound
 * argument expressions (for example `a | b` or `&obj`) keep their intended
 * grouping.
 */
#define BGN_RELOC(ch, bo, gr, m, n, fl) \
   OUT_RELOC(ch, bo, ((n) << 18) | ((gr)->subc << 13) | (m), fl, 0, 0)
/*
 * Re-emit the buffer addresses that the screen programs into the tesla
 * object: the TIC and TSC tables, the two constant buffer definitions backed
 * by constbuf_misc[0] (NV50_CB_PMISC at offset 0, NV50_CB_AUX at offset
 * 0x200) and the three constbuf_parm buffers (NV50_CB_PVP + i).
 *
 * Everything is emitted with the flags VRAM | RD | DUMMY, and each method
 * word itself goes through BGN_RELOC rather than BEGIN_RING.
 *
 * NOTE(review): this listing appears to have lost lines (braces, the
 * declaration of `i`, and the data word after the autobind BEGIN_RING are
 * not visible).
 */
215 nv50_screen_relocs(struct nv50_screen
*screen
)
217 struct nouveau_channel
*chan
= screen
->base
.channel
;
218 struct nouveau_grobj
*tesla
= screen
->tesla
;
220 const unsigned rl
= NOUVEAU_BO_VRAM
| NOUVEAU_BO_RD
| NOUVEAU_BO_DUMMY
;
/* presumably reserves room for 28 words and 26 relocations - TODO confirm */
222 MARK_RING (chan
, 28, 26);
224 /* cause grobj autobind */
225 BEGIN_RING(chan
, tesla
, 0x0100, 1);
/* texture image control table address */
228 BGN_RELOC (chan
, screen
->tic
, tesla
, NV50TCL_TIC_ADDRESS_HIGH
, 2, rl
);
229 OUT_RELOCh(chan
, screen
->tic
, 0, rl
);
230 OUT_RELOCl(chan
, screen
->tic
, 0, rl
);
/* texture sampler control table address */
232 BGN_RELOC (chan
, screen
->tsc
, tesla
, NV50TCL_TSC_ADDRESS_HIGH
, 2, rl
);
233 OUT_RELOCh(chan
, screen
->tsc
, 0, rl
);
234 OUT_RELOCl(chan
, screen
->tsc
, 0, rl
);
/* NV50_CB_PMISC: first 0x200 bytes of constbuf_misc[0] */
236 BGN_RELOC (chan
, screen
->constbuf_misc
[0],
237 tesla
, NV50TCL_CB_DEF_ADDRESS_HIGH
, 3, rl
);
238 OUT_RELOCh(chan
, screen
->constbuf_misc
[0], 0, rl
);
239 OUT_RELOCl(chan
, screen
->constbuf_misc
[0], 0, rl
);
240 OUT_RELOC (chan
, screen
->constbuf_misc
[0],
241 (NV50_CB_PMISC
<< 16) | 0x0200, rl
, 0, 0);
/* NV50_CB_AUX: same buffer, starting at byte offset 0x200 */
243 BGN_RELOC (chan
, screen
->constbuf_misc
[0],
244 tesla
, NV50TCL_CB_DEF_ADDRESS_HIGH
, 3, rl
);
245 OUT_RELOCh(chan
, screen
->constbuf_misc
[0], 0x200, rl
);
246 OUT_RELOCl(chan
, screen
->constbuf_misc
[0], 0x200, rl
);
247 OUT_RELOC (chan
, screen
->constbuf_misc
[0],
248 (NV50_CB_AUX
<< 16) | 0x0200, rl
, 0, 0);
/* one parameter buffer per index, bound to NV50_CB_PVP + i */
250 for (i
= 0; i
< 3; ++i
) {
251 BGN_RELOC (chan
, screen
->constbuf_parm
[i
],
252 tesla
, NV50TCL_CB_DEF_ADDRESS_HIGH
, 3, rl
);
253 OUT_RELOCh(chan
, screen
->constbuf_parm
[i
], 0, rl
);
254 OUT_RELOCl(chan
, screen
->constbuf_parm
[i
], 0, rl
);
255 OUT_RELOC (chan
, screen
->constbuf_parm
[i
],
256 ((NV50_CB_PVP
+ i
) << 16) | 0x0000, rl
, 0, 0);
/*
 * Define NOUVEAU_GETPARAM_GRAPH_UNITS as 13 when it is not already defined.
 * NOTE(review): the matching #endif is not visible in this listing.
 */
260 #ifndef NOUVEAU_GETPARAM_GRAPH_UNITS
261 # define NOUVEAU_GETPARAM_GRAPH_UNITS 13
/*
 * Local prototype for nouveau_device_get_param(), which nv50_screen_create
 * calls with NOUVEAU_GETPARAM_GRAPH_UNITS; the result is written to *value.
 */
264 extern int nouveau_device_get_param(struct nouveau_device
*dev
,
265 uint64_t param
, uint64_t *value
);
/*
 * Build an nv50_screen for `dev`: initialise the nouveau_screen base, install
 * the pipe_screen callbacks, allocate the M2MF, 2D and tesla (3D) objects
 * plus a notifier, emit their static initial state into the channel, and
 * allocate the constant, TIC, TSC and stack buffers.
 *
 * nv50_screen_destroy(pscreen) is called at each visible failure site.
 *
 * NOTE(review): this listing appears to have lost lines (braces, `if (ret)`
 * tests, return statements, some local declarations and several data words
 * following BEGIN_RING are not visible), so the exact control flow and the
 * return value cannot be confirmed from here.
 */
268 nv50_screen_create(struct pipe_winsys
*ws
, struct nouveau_device
*dev
)
270 struct nv50_screen
*screen
= CALLOC_STRUCT(nv50_screen
);
271 struct nouveau_channel
*chan
;
272 struct pipe_screen
*pscreen
;
274 unsigned chipset
= dev
->chipset
;
275 unsigned tesla_class
= 0;
278 const unsigned rl
= NOUVEAU_BO_VRAM
| NOUVEAU_BO_RD
;
282 pscreen
= &screen
->base
.base
;
284 ret
= nouveau_screen_init(&screen
->base
, dev
);
286 nv50_screen_destroy(pscreen
);
289 chan
= screen
->base
.channel
;
/* install the pipe_screen entry points implemented in this file */
291 pscreen
->winsys
= ws
;
292 pscreen
->destroy
= nv50_screen_destroy
;
293 pscreen
->get_param
= nv50_screen_get_param
;
294 pscreen
->get_paramf
= nv50_screen_get_paramf
;
295 pscreen
->is_format_supported
= nv50_screen_is_format_supported
;
296 pscreen
->context_create
= nv50_create
;
298 nv50_screen_init_resource_functions(pscreen
);
300 /* DMA engine object */
301 ret
= nouveau_grobj_alloc(chan
, 0xbeef5039,
302 NV50_MEMORY_TO_MEMORY_FORMAT
, &screen
->m2mf
);
304 NOUVEAU_ERR("Error creating M2MF object: %d\n", ret
);
305 nv50_screen_destroy(pscreen
);
/* 2D engine object */
310 ret
= nouveau_grobj_alloc(chan
, 0xbeef502d, NV50_2D
, &screen
->eng2d
);
312 NOUVEAU_ERR("Error creating 2D object: %d\n", ret
);
313 nv50_screen_destroy(pscreen
);
/* choose the 3D object class from the high nibble of the chipset id */
318 switch (chipset
& 0xf0) {
320 tesla_class
= NV50TCL
;
324 tesla_class
= NV84TCL
;
331 tesla_class
= NVA0TCL
;
334 tesla_class
= NVA8TCL
;
339 NOUVEAU_ERR("Not a known NV50 chipset: NV%02x\n", chipset
);
340 nv50_screen_destroy(pscreen
);
344 ret
= nouveau_grobj_alloc(chan
, 0xbeef5097, tesla_class
,
347 NOUVEAU_ERR("Error creating 3D object: %d\n", ret
);
348 nv50_screen_destroy(pscreen
);
352 /* this is necessary for the new RING_3D / statebuffer code */
353 BIND_RING(chan
, screen
->tesla
, 7);
/* notifier object shared by the M2MF, 2D and tesla DMA_NOTIFY slots below */
356 ret
= nouveau_notifier_alloc(chan
, 0xbeef0301, 1, &screen
->sync
);
358 NOUVEAU_ERR("Error creating notifier object: %d\n", ret
);
359 nv50_screen_destroy(pscreen
);
363 /* Static M2MF init */
364 BEGIN_RING(chan
, screen
->m2mf
,
365 NV04_MEMORY_TO_MEMORY_FORMAT_DMA_NOTIFY
, 3);
366 OUT_RING (chan
, screen
->sync
->handle
);
367 OUT_RING (chan
, chan
->vram
->handle
);
368 OUT_RING (chan
, chan
->vram
->handle
);
/* static 2D engine init */
371 BEGIN_RING(chan
, screen
->eng2d
, NV50_2D_DMA_NOTIFY
, 4);
372 OUT_RING (chan
, screen
->sync
->handle
);
373 OUT_RING (chan
, chan
->vram
->handle
);
374 OUT_RING (chan
, chan
->vram
->handle
);
375 OUT_RING (chan
, chan
->vram
->handle
);
376 BEGIN_RING(chan
, screen
->eng2d
, NV50_2D_OPERATION
, 1);
377 OUT_RING (chan
, NV50_2D_OPERATION_SRCCOPY
);
378 BEGIN_RING(chan
, screen
->eng2d
, NV50_2D_CLIP_ENABLE
, 1);
380 BEGIN_RING(chan
, screen
->eng2d
, 0x0888, 1);
383 /* Static tesla init */
384 BEGIN_RING(chan
, screen
->tesla
, NV50TCL_COND_MODE
, 1);
385 OUT_RING (chan
, NV50TCL_COND_MODE_ALWAYS
);
386 BEGIN_RING(chan
, screen
->tesla
, NV50TCL_DMA_NOTIFY
, 1);
387 OUT_RING (chan
, screen
->sync
->handle
);
/* point the 11 DMA slots starting at DMA_ZETA, and every DMA_COLOR slot, at VRAM */
388 BEGIN_RING(chan
, screen
->tesla
, NV50TCL_DMA_ZETA
, 11);
389 for (i
= 0; i
< 11; i
++)
390 OUT_RING (chan
, chan
->vram
->handle
);
391 BEGIN_RING(chan
, screen
->tesla
,
392 NV50TCL_DMA_COLOR(0), NV50TCL_DMA_COLOR__SIZE
);
393 for (i
= 0; i
< NV50TCL_DMA_COLOR__SIZE
; i
++)
394 OUT_RING (chan
, chan
->vram
->handle
);
396 BEGIN_RING(chan
, screen
->tesla
, NV50TCL_RT_CONTROL
, 1);
399 /* activate all 32 lanes (threads) in a warp */
400 BEGIN_RING(chan
, screen
->tesla
, NV50TCL_REG_MODE
, 1);
401 OUT_RING (chan
, NV50TCL_REG_MODE_STRIPED
);
402 BEGIN_RING(chan
, screen
->tesla
, 0x1400, 1);
403 OUT_RING (chan
, 0xf);
405 /* max TIC (bits 4:8) & TSC (ignored) bindings, per program type */
406 for (i
= 0; i
< 3; ++i
) {
407 BEGIN_RING(chan
, screen
->tesla
, NV50TCL_TEX_LIMITS(i
), 1);
408 OUT_RING (chan
, 0x54);
411 /* origin is top left (set to 1 for bottom left) */
412 BEGIN_RING(chan
, screen
->tesla
, NV50TCL_Y_ORIGIN_BOTTOM
, 1);
414 BEGIN_RING(chan
, screen
->tesla
, NV50TCL_VP_REG_ALLOC_RESULT
, 1);
417 /* constant buffers for immediates and VP/FP parameters */
418 ret
= nouveau_bo_new(dev
, NOUVEAU_BO_VRAM
, 0, (32 * 4) * 4,
419 &screen
->constbuf_misc
[0]);
421 nv50_screen_destroy(pscreen
);
/* NV50_CB_PMISC covers offset 0 of constbuf_misc[0], NV50_CB_AUX offset 0x200 */
424 BEGIN_RING(chan
, screen
->tesla
, NV50TCL_CB_DEF_ADDRESS_HIGH
, 3);
425 OUT_RELOCh(chan
, screen
->constbuf_misc
[0], 0, rl
);
426 OUT_RELOCl(chan
, screen
->constbuf_misc
[0], 0, rl
);
427 OUT_RING (chan
, (NV50_CB_PMISC
<< 16) | 0x0200);
428 BEGIN_RING(chan
, screen
->tesla
, NV50TCL_CB_DEF_ADDRESS_HIGH
, 3);
429 OUT_RELOCh(chan
, screen
->constbuf_misc
[0], 0x200, rl
);
430 OUT_RELOCl(chan
, screen
->constbuf_misc
[0], 0x200, rl
);
431 OUT_RING (chan
, (NV50_CB_AUX
<< 16) | 0x0200);
/* one (4096 * 4) * 4 byte parameter buffer per index, bound to NV50_CB_PVP + i */
433 for (i
= 0; i
< 3; i
++) {
434 ret
= nouveau_bo_new(dev
, NOUVEAU_BO_VRAM
, 0, (4096 * 4) * 4,
435 &screen
->constbuf_parm
[i
]);
437 nv50_screen_destroy(pscreen
);
440 BEGIN_RING(chan
, screen
->tesla
, NV50TCL_CB_DEF_ADDRESS_HIGH
, 3);
441 OUT_RELOCh(chan
, screen
->constbuf_parm
[i
], 0, rl
);
442 OUT_RELOCl(chan
, screen
->constbuf_parm
[i
], 0, rl
);
443 /* CB_DEF_SET_SIZE value of 0x0000 means 65536 */
444 OUT_RING (chan
, ((NV50_CB_PVP
+ i
) << 16) | 0x0000);
447 if (nouveau_resource_init(&screen
->immd_heap
, 0, 128)) {
448 NOUVEAU_ERR("Error initialising shader immediates heap.\n");
449 nv50_screen_destroy(pscreen
);
/* TIC table buffer: 3 * 32 entries of 8 * 4 bytes; limit programmed as 3 * 32 - 1 */
453 ret
= nouveau_bo_new(dev
, NOUVEAU_BO_VRAM
, 0, 3 * 32 * (8 * 4),
456 nv50_screen_destroy(pscreen
);
459 BEGIN_RING(chan
, screen
->tesla
, NV50TCL_TIC_ADDRESS_HIGH
, 3);
460 OUT_RELOCh(chan
, screen
->tic
, 0, NOUVEAU_BO_VRAM
| NOUVEAU_BO_RD
);
461 OUT_RELOCl(chan
, screen
->tic
, 0, NOUVEAU_BO_VRAM
| NOUVEAU_BO_RD
);
462 OUT_RING (chan
, 3 * 32 - 1);
/* TSC table buffer, same size as the TIC table */
464 ret
= nouveau_bo_new(dev
, NOUVEAU_BO_VRAM
, 0, 3 * 32 * (8 * 4),
467 nv50_screen_destroy(pscreen
);
470 BEGIN_RING(chan
, screen
->tesla
, NV50TCL_TSC_ADDRESS_HIGH
, 3);
471 OUT_RELOCh(chan
, screen
->tsc
, 0, NOUVEAU_BO_VRAM
| NOUVEAU_BO_RD
);
472 OUT_RELOCl(chan
, screen
->tsc
, 0, NOUVEAU_BO_VRAM
| NOUVEAU_BO_RD
);
473 OUT_RING (chan
, 0); /* ignored if TSC_LINKED (0x1234) == 1 */
475 /* map constant buffers:
476 * B = buffer ID (maybe more than 1 byte)
477 * N = CB index used in shader instruction
478 * P = program type (0 = VP, 2 = GP, 3 = FP)
479 * SET_PROGRAM_CB = 0x000BBNP1
481 BEGIN_RING_NI(chan
, screen
->tesla
, NV50TCL_SET_PROGRAM_CB
, 8);
482 /* bind immediate buffer */
483 OUT_RING (chan
, 0x001 | (NV50_CB_PMISC
<< 12));
484 OUT_RING (chan
, 0x021 | (NV50_CB_PMISC
<< 12));
485 OUT_RING (chan
, 0x031 | (NV50_CB_PMISC
<< 12));
486 /* bind auxiliary constbuf to immediate data bo */
487 OUT_RING (chan
, 0x201 | (NV50_CB_AUX
<< 12));
488 OUT_RING (chan
, 0x221 | (NV50_CB_AUX
<< 12));
489 /* bind parameter buffers */
490 OUT_RING (chan
, 0x101 | (NV50_CB_PVP
<< 12));
491 OUT_RING (chan
, 0x121 | (NV50_CB_PGP
<< 12));
492 OUT_RING (chan
, 0x131 | (NV50_CB_PFP
<< 12));
/*
 * Size the stack buffer from the GRAPH_UNITS parameter: the number of set
 * bits in its low 16 bits, times the number of set bits in bits 24..27,
 * times 32 * 64 * 8.
 * NOTE(review): the return value of nouveau_device_get_param is not checked
 * here - confirm that `value` is well defined when the query fails.
 */
495 nouveau_device_get_param(dev
, NOUVEAU_GETPARAM_GRAPH_UNITS
, &value
);
497 stack_size
= util_bitcount(value
& 0xffff);
498 stack_size
*= util_bitcount((value
>> 24) & 0xf);
499 stack_size
*= 32 * 64 * 8;
501 ret
= nouveau_bo_new(dev
, NOUVEAU_BO_VRAM
, 1 << 16,
502 stack_size
, &screen
->stack_bo
);
504 nv50_screen_destroy(pscreen
);
/* unlike the read-only buffers above, the stack buffer is emitted with NOUVEAU_BO_WR */
507 BEGIN_RING(chan
, screen
->tesla
, NV50TCL_STACK_ADDRESS_HIGH
, 3);
508 OUT_RELOCh(chan
, screen
->stack_bo
, 0, NOUVEAU_BO_VRAM
| NOUVEAU_BO_WR
);
509 OUT_RELOCl(chan
, screen
->stack_bo
, 0, NOUVEAU_BO_VRAM
| NOUVEAU_BO_WR
);
512 /* Vertex array limits - max them out */
513 for (i
= 0; i
< 16; i
++) {
514 BEGIN_RING(chan
, screen
->tesla
,
515 NV50TCL_VERTEX_ARRAY_LIMIT_HIGH(i
), 2);
516 OUT_RING (chan
, 0x000000ff);
517 OUT_RING (chan
, 0xffffffff);
/* depth range of viewport 0: near 0.0, far 1.0 */
520 BEGIN_RING(chan
, screen
->tesla
, NV50TCL_DEPTH_RANGE_NEAR(0), 2);
521 OUT_RINGf (chan
, 0.0f
);
522 OUT_RINGf (chan
, 1.0f
);
524 BEGIN_RING(chan
, screen
->tesla
, NV50TCL_VIEWPORT_TRANSFORM_EN
, 1);
527 /* no dynamic combination of TIC & TSC entries => only BIND_TIC used */
528 BEGIN_RING(chan
, screen
->tesla
, NV50TCL_LINKED_TSC
, 1);
531 BEGIN_RING(chan
, screen
->tesla
, NV50TCL_EDGEFLAG_ENABLE
, 1);
532 OUT_RING (chan
, 1); /* default edgeflag to TRUE */
/* unless NV50_ALWAYS_PUSH is set, vertex and index buffer flags become NOUVEAU_BO_GART */
536 screen
->force_push
= debug_get_bool_option("NV50_ALWAYS_PUSH", FALSE
);
537 if(!screen
->force_push
)
538 screen
->base
.vertex_buffer_flags
= screen
->base
.index_buffer_flags
= NOUVEAU_BO_GART
;