1 #include "pipe/p_screen.h"
2 #include "pipe/p_state.h"
3 #include "util/u_simple_screen.h"
5 #include "nouveau/nouveau_screen.h"
7 #include "nvfx_context.h"
8 #include "nvfx_screen.h"
9 #include "nvfx_resource.h"
/* Bitmasks tested in nvfx_screen_create() as mask & (1 << (chipset & 0x0f))
 * to choose eng3d_class: the NV30TCL mask selects 0x0397, the NV34TCL mask
 * selects 0x0697 and the NV35TCL mask selects 0x0497. */
11 #define NV30TCL_CHIPSET_3X_MASK 0x00000003
12 #define NV34TCL_CHIPSET_3X_MASK 0x00000010
13 #define NV35TCL_CHIPSET_3X_MASK 0x000001e0
15 /* FIXME: It seems this file should not include ../../winsys/drm/nouveau/drm/nouveau_drm_api.h directly
16 * to get the pointer to the context's front buffer, so struct nouveau_winsys is duplicated here.
17 * nvfx_screen_surface_format_supported() can then use it to force FBOs to be created
18 * with the same number of bits everywhere.
/* Layout used to reinterpret pscreen->winsys in
 * nvfx_screen_surface_format_supported(); within this file only the
 * `front` member is read. */
20 struct nouveau_winsys
{
21 struct pipe_winsys base
;
23 struct pipe_screen
*pscreen
;
/* Surface whose format is compared against PIPE_FORMAT_B5G6R5_UNORM when
 * deciding whether PIPE_FORMAT_Z16_UNORM is usable on non-nv4x screens. */
25 struct pipe_surface
*front
;
/* Bitmasks tested in nvfx_screen_create() as mask & (1 << (chipset & 0x0f)):
 * the GRCLASS4097 mask selects NV40TCL as eng3d_class, and both GRCLASS4497
 * masks select NV44TCL. */
27 #define NV4X_GRCLASS4097_CHIPSETS 0x00000baf
28 #define NV4X_GRCLASS4497_CHIPSETS 0x00005450
29 #define NV6X_GRCLASS4497_CHIPSETS 0x00000088
/* Answers an integer PIPE_CAP_* capability query for this screen.
 *
 * pscreen: screen being queried; converted with nvfx_screen().
 * param:   the PIPE_CAP_* value to look up.
 *
 * The answers that depend on the chip family are keyed on screen->is_nv4x:
 * texture image units (16 vs 8), NPOT textures, render targets (4 vs 2),
 * mirror clamp and separate blend equations. An "Unknown PIPE_CAP" message
 * is emitted through NOUVEAU_ERR after the list of known caps.
 */
32 nvfx_screen_get_param(struct pipe_screen
*pscreen
, int param
)
34 struct nvfx_screen
*screen
= nvfx_screen(pscreen
);
37 case PIPE_CAP_MAX_TEXTURE_IMAGE_UNITS
:
38 /* TODO: check these unit counts */
39 return screen
->is_nv4x
? 16 : 8;
40 case PIPE_CAP_NPOT_TEXTURES
:
/* !! collapses the is_nv4x flag word to exactly 0 or 1 */
41 return !!screen
->is_nv4x
;
42 case PIPE_CAP_TWO_SIDED_STENCIL
:
46 case PIPE_CAP_ANISOTROPIC_FILTER
:
48 case PIPE_CAP_POINT_SPRITE
:
50 case PIPE_CAP_MAX_RENDER_TARGETS
:
51 return screen
->is_nv4x
? 4 : 2;
52 case PIPE_CAP_OCCLUSION_QUERY
:
54 case PIPE_CAP_TEXTURE_SHADOW_MAP
:
56 case PIPE_CAP_MAX_TEXTURE_2D_LEVELS
:
58 case PIPE_CAP_MAX_TEXTURE_3D_LEVELS
:
60 case PIPE_CAP_MAX_TEXTURE_CUBE_LEVELS
:
62 case PIPE_CAP_TEXTURE_MIRROR_CLAMP
:
63 return !!screen
->is_nv4x
;
64 case PIPE_CAP_TEXTURE_MIRROR_REPEAT
:
66 case PIPE_CAP_MAX_VERTEX_TEXTURE_UNITS
:
67 return 0; /* nv40 has 4 vertex texture units, but they are not supported yet */
68 case PIPE_CAP_TGSI_CONT_SUPPORTED
:
70 case PIPE_CAP_BLEND_EQUATION_SEPARATE
:
71 return !!screen
->is_nv4x
;
72 case PIPE_CAP_MAX_COMBINED_SAMPLERS
:
74 case PIPE_CAP_INDEP_BLEND_ENABLE
:
75 /* TODO: on nv40 we have separate color masks */
76 /* TODO: nv40 MRT blending is probably broken */
78 case PIPE_CAP_INDEP_BLEND_FUNC
:
80 case PIPE_CAP_TGSI_FS_COORD_ORIGIN_LOWER_LEFT
:
81 case PIPE_CAP_TGSI_FS_COORD_PIXEL_CENTER_HALF_INTEGER
:
83 case PIPE_CAP_TGSI_FS_COORD_ORIGIN_UPPER_LEFT
:
84 case PIPE_CAP_TGSI_FS_COORD_PIXEL_CENTER_INTEGER
:
/* Reports a cap value this function has no answer for */
87 NOUVEAU_ERR("Unknown PIPE_CAP %d\n", param
);
/* Answers a floating-point PIPE_CAP_* capability query for this screen.
 *
 * pscreen: screen being queried; converted with nvfx_screen().
 * param:   the PIPE_CAP_* value to look up.
 *
 * Handles the line width, point width, texture anisotropy and texture LOD
 * bias limits. Anisotropy and LOD bias depend on screen->is_nv4x. An
 * "Unknown PIPE_CAP" message is emitted through NOUVEAU_ERR after the list
 * of known caps.
 */
93 nvfx_screen_get_paramf(struct pipe_screen
*pscreen
, int param
)
95 struct nvfx_screen
*screen
= nvfx_screen(pscreen
);
98 case PIPE_CAP_MAX_LINE_WIDTH
:
99 case PIPE_CAP_MAX_LINE_WIDTH_AA
:
101 case PIPE_CAP_MAX_POINT_WIDTH
:
102 case PIPE_CAP_MAX_POINT_WIDTH_AA
:
104 case PIPE_CAP_MAX_TEXTURE_ANISOTROPY
:
/* 16.0 on nv4x, 8.0 otherwise */
105 return screen
->is_nv4x
? 16.0 : 8.0;
106 case PIPE_CAP_MAX_TEXTURE_LOD_BIAS
:
/* 16.0 on nv4x, 4.0 otherwise */
107 return screen
->is_nv4x
? 16.0 : 4.0;
/* Reports a cap value this function has no answer for */
109 NOUVEAU_ERR("Unknown PIPE_CAP %d\n", param
);
/* Format-support query installed as pscreen->is_format_supported.
 *
 * pscreen:    screen being queried; converted with nvfx_screen().
 * format:     pipe format being asked about.
 * target:     texture target of the request.
 * tex_usage:  PIPE_BIND_* bits; PIPE_BIND_RENDER_TARGET and
 *             PIPE_BIND_DEPTH_STENCIL each select their own format list.
 * geom_flags: geometry flags of the request.
 *
 * The front surface is read from pscreen->winsys, reinterpreted as
 * struct nouveau_winsys, and is consulted for the Z16 check below.
 */
115 nvfx_screen_surface_format_supported(struct pipe_screen
*pscreen
,
116 enum pipe_format format
,
117 enum pipe_texture_target target
,
118 unsigned tex_usage
, unsigned geom_flags
)
120 struct nvfx_screen
*screen
= nvfx_screen(pscreen
);
121 struct pipe_surface
*front
= ((struct nouveau_winsys
*) pscreen
->winsys
)->front
;
/* Formats listed for render-target usage */
123 if (tex_usage
& PIPE_BIND_RENDER_TARGET
) {
125 case PIPE_FORMAT_B8G8R8A8_UNORM
:
126 case PIPE_FORMAT_B8G8R8X8_UNORM
:
127 case PIPE_FORMAT_B5G6R5_UNORM
:
/* Formats listed for depth/stencil usage */
133 if (tex_usage
& PIPE_BIND_DEPTH_STENCIL
) {
135 case PIPE_FORMAT_S8_USCALED_Z24_UNORM
:
136 case PIPE_FORMAT_X8Z24_UNORM
:
138 case PIPE_FORMAT_Z16_UNORM
:
139 /* TODO: this nv30 limitation probably does not exist */
/* On non-nv4x screens with a front surface, Z16 is accepted only when
 * the front surface format is B5G6R5. */
140 if (!screen
->is_nv4x
&& front
)
141 return (front
->format
== PIPE_FORMAT_B5G6R5_UNORM
);
/* NOTE(review): this third list appears to cover usages other than
 * render target and depth/stencil - confirm. */
148 case PIPE_FORMAT_B8G8R8A8_UNORM
:
149 case PIPE_FORMAT_B8G8R8X8_UNORM
:
150 case PIPE_FORMAT_B5G5R5A1_UNORM
:
151 case PIPE_FORMAT_B4G4R4A4_UNORM
:
152 case PIPE_FORMAT_B5G6R5_UNORM
:
153 case PIPE_FORMAT_L8_UNORM
:
154 case PIPE_FORMAT_A8_UNORM
:
155 case PIPE_FORMAT_I8_UNORM
:
156 case PIPE_FORMAT_L8A8_UNORM
:
157 case PIPE_FORMAT_Z16_UNORM
:
158 case PIPE_FORMAT_S8_USCALED_Z24_UNORM
:
159 case PIPE_FORMAT_DXT1_RGB
:
160 case PIPE_FORMAT_DXT1_RGBA
:
161 case PIPE_FORMAT_DXT3_RGBA
:
162 case PIPE_FORMAT_DXT5_RGBA
:
164 /* TODO: does nv30 support this? */
165 case PIPE_FORMAT_R16_SNORM
:
/* R16_SNORM is reported as supported only on nv4x */
166 return !!screen
->is_nv4x
;
/* Screen teardown, installed as pscreen->destroy and also called from the
 * error paths of nvfx_screen_create().
 *
 * pscreen: screen to tear down; converted with nvfx_screen().
 *
 * Releases, in this order: the vertex-program exec and data heaps, the
 * query heap, the query and sync notifiers, the 3D object, the 2D engine
 * state, and finally the base nouveau screen via nouveau_screen_fini().
 */
177 nvfx_screen_destroy(struct pipe_screen
*pscreen
)
179 struct nvfx_screen
*screen
= nvfx_screen(pscreen
);
/* Resource heaps */
181 nouveau_resource_destroy(&screen
->vp_exec_heap
);
182 nouveau_resource_destroy(&screen
->vp_data_heap
);
183 nouveau_resource_destroy(&screen
->query_heap
);
/* Notifiers and engine objects */
184 nouveau_notifier_free(&screen
->query
);
185 nouveau_notifier_free(&screen
->sync
);
186 nouveau_grobj_free(&screen
->eng3d
);
187 nv04_surface_2d_takedown(&screen
->eng2d
);
/* Base screen goes last */
189 nouveau_screen_fini(&screen
->base
);
/* Emits the nv30-specific static 3D state onto the screen's channel.
 *
 * screen: screen whose base.channel receives the OUT_RING words.
 *
 * Each RING_3D(method, count) header is followed by its data words. Many
 * methods are raw offsets (0x220, 0x03b0, 0x1454, ...) with no symbolic
 * name, so the statement order must be preserved exactly.
 */
194 static void nv30_screen_init(struct nvfx_screen
*screen
)
196 struct nouveau_channel
*chan
= screen
->base
.channel
;
199 /* TODO: perhaps we should do some of this on nv40 too? */
/* Viewport clip slots 1..7, horizontal then vertical for each slot */
200 for (i
=1; i
<8; i
++) {
201 OUT_RING(chan
, RING_3D(NV34TCL_VIEWPORT_CLIP_HORIZ(i
), 1));
203 OUT_RING(chan
, RING_3D(NV34TCL_VIEWPORT_CLIP_VERT(i
), 1));
207 OUT_RING(chan
, RING_3D(0x220, 1));
210 OUT_RING(chan
, RING_3D(0x03b0, 1));
211 OUT_RING(chan
, 0x00100000);
212 OUT_RING(chan
, RING_3D(0x1454, 1));
214 OUT_RING(chan
, RING_3D(0x1d80, 1));
216 OUT_RING(chan
, RING_3D(0x1450, 1));
217 OUT_RING(chan
, 0x00030004);
220 OUT_RING(chan
, RING_3D(0x1e98, 1));
/* Three float words (0.0, 0.0, 1.0) for method 0x17e0 */
222 OUT_RING(chan
, RING_3D(0x17e0, 3));
223 OUT_RING(chan
, fui(0.0));
224 OUT_RING(chan
, fui(0.0));
225 OUT_RING(chan
, fui(1.0));
/* Sixteen words for method 0x1f80: only word 8 is non-zero (0x0000ffff) */
226 OUT_RING(chan
, RING_3D(0x1f80, 16));
227 for (i
=0; i
<16; i
++) {
228 OUT_RING(chan
, (i
==8) ? 0x0000ffff : 0);
231 OUT_RING(chan
, RING_3D(0x120, 3));
236 OUT_RING(chan
, RING_3D(0x1d88, 1));
237 OUT_RING(chan
, 0x00001200);
239 OUT_RING(chan
, RING_3D(NV34TCL_RC_ENABLE
, 1));
/* Two words starting at DEPTH_RANGE_NEAR: 0.0 then 1.0 */
242 OUT_RING(chan
, RING_3D(NV34TCL_DEPTH_RANGE_NEAR
, 2));
243 OUT_RING(chan
, fui(0.0));
244 OUT_RING(chan
, fui(1.0));
246 OUT_RING(chan
, RING_3D(NV34TCL_MULTISAMPLE_CONTROL
, 1));
247 OUT_RING(chan
, 0xffff0000);
249 /* enables use of the vertex program rather than fixed-function, somehow */
250 OUT_RING(chan
, RING_3D(0x1e94, 1));
251 OUT_RING(chan
, 0x13);
/* Emits the nv40-specific static 3D state onto the screen's channel.
 *
 * screen: screen whose base.channel receives the OUT_RING words.
 *
 * Each RING_3D(method, count) header is followed by exactly `count` data
 * words. Most methods are raw offsets with no symbolic name, so the
 * statement order must be preserved exactly.
 */
254 static void nv40_screen_init(struct nvfx_screen
*screen
)
256 struct nouveau_channel
*chan
= screen
->base
.channel
;
/* Two words starting at DMA_COLOR2, both set to the channel's vram handle */
258 OUT_RING(chan
, RING_3D(NV40TCL_DMA_COLOR2
, 2));
259 OUT_RING(chan
, screen
->base
.channel
->vram
->handle
);
260 OUT_RING(chan
, screen
->base
.channel
->vram
->handle
);
262 OUT_RING(chan
, RING_3D(0x1ea4, 3));
263 OUT_RING(chan
, 0x00000010);
264 OUT_RING(chan
, 0x01000100);
265 OUT_RING(chan
, 0xff800006);
267 /* vertex program output routing */
268 OUT_RING(chan
, RING_3D(0x1fc4, 1));
269 OUT_RING(chan
, 0x06144321);
270 OUT_RING(chan
, RING_3D(0x1fc8, 2));
271 OUT_RING(chan
, 0xedcba987);
272 OUT_RING(chan
, 0x00000021);
273 OUT_RING(chan
, RING_3D(0x1fd0, 1));
274 OUT_RING(chan
, 0x00171615);
275 OUT_RING(chan
, RING_3D(0x1fd4, 1));
276 OUT_RING(chan
, 0x001b1a19);
278 OUT_RING(chan
, RING_3D(0x1ef8, 1));
279 OUT_RING(chan
, 0x0020ffff);
280 OUT_RING(chan
, RING_3D(0x1d64, 1));
281 OUT_RING(chan
, 0x00d30000);
/* Same method (0x1e94) that nv30_screen_init() writes 0x13 to */
282 OUT_RING(chan
, RING_3D(0x1e94, 1));
283 OUT_RING(chan
, 0x00000001);
/* Chooses the buffer-object placement flag stored by nvfx_screen_create()
 * in screen->vertex_buffer_reloc_flags.
 *
 * screen: screen whose base.device->chipset is inspected.
 *
 * Returns NOUVEAU_BO_VRAM when the "vram hack" is enabled and
 * NOUVEAU_BO_GART otherwise. The hack defaults to enabled on chipsets 0x47,
 * 0x49 and 0x46, and the NOUVEAU_VTXIDX_IN_VRAM debug option overrides that
 * default. Messages on stderr tell the user how to toggle the option.
 */
287 nvfx_screen_get_vertex_buffer_flags(struct nvfx_screen
* screen
)
289 int vram_hack_default
= 0;
291 // TODO: this is a bit of a guess; also add other cards that may need this hack.
292 // It may also depend on the specific card or the AGP/PCIe chipset.
293 if(screen
->base
.device
->chipset
== 0x47 /* G70 */
294 || screen
->base
.device
->chipset
== 0x49 /* G71 */
295 || screen
->base
.device
->chipset
== 0x46 /* G72 */
297 vram_hack_default
= 1;
/* The debug option takes precedence over the per-chipset default */
298 vram_hack
= debug_get_bool_option("NOUVEAU_VTXIDX_IN_VRAM", vram_hack_default
);
/* Hint for users seeing corruption: how to turn the hack on */
303 fprintf(stderr
, "Some systems may experience graphics corruption due to randomly misplaced vertices.\n"
304 "If this is happening, export NOUVEAU_VTXIDX_IN_VRAM=1 may reduce or eliminate the problem\n");
/* Notice that the hack is active: how to turn it off */
308 fprintf(stderr
, "A performance reducing hack is being used to help avoid graphics corruption.\n"
309 "You can try export NOUVEAU_VTXIDX_IN_VRAM=0 to disable it.\n");
313 return vram_hack
? NOUVEAU_BO_VRAM
: NOUVEAU_BO_GART
;
/* Builds an nvfx_screen for the given device.
 *
 * ws:  winsys pointer, stored in pscreen->winsys.
 * dev: nouveau device; dev->chipset selects the 3D object class.
 *
 * Steps, in order: allocate the screen, initialise the base nouveau screen,
 * install the pipe_screen callbacks, choose eng3d_class from the chipset,
 * read the debug options, create the 3D object, the 2D engine state, the
 * sync and query notifiers and the resource heaps, bind the 3D object and
 * emit the static state, then run the chip-family init routine.
 * The visible failure paths log with NOUVEAU_ERR and/or call
 * nvfx_screen_destroy(pscreen).
 */
317 nvfx_screen_create(struct pipe_winsys
*ws
, struct nouveau_device
*dev
)
/* Candidate sizes handed to nouveau_notifier_alloc() for the query
 * notifier; the loop below walks them in array order. */
319 static const unsigned query_sizes
[] = {(4096 - 4 * 32) / 32, 3 * 1024 / 32, 2 * 1024 / 32, 1024 / 32};
320 struct nvfx_screen
*screen
= CALLOC_STRUCT(nvfx_screen
);
321 struct nouveau_channel
*chan
;
322 struct pipe_screen
*pscreen
;
323 unsigned eng3d_class
= 0;
329 pscreen
= &screen
->base
.base
;
331 ret
= nouveau_screen_init(&screen
->base
, dev
);
333 nvfx_screen_destroy(pscreen
);
336 chan
= screen
->base
.channel
;
/* Install the pipe_screen entry points implemented in this file */
338 pscreen
->winsys
= ws
;
339 pscreen
->destroy
= nvfx_screen_destroy
;
340 pscreen
->get_param
= nvfx_screen_get_param
;
341 pscreen
->get_paramf
= nvfx_screen_get_paramf
;
342 pscreen
->is_format_supported
= nvfx_screen_surface_format_supported
;
343 pscreen
->context_create
= nvfx_create
;
/* The high nibble of the chipset id selects the family; the low nibble is
 * tested against the per-class bitmasks to choose eng3d_class. */
345 switch (dev
->chipset
& 0xf0) {
347 if (NV30TCL_CHIPSET_3X_MASK
& (1 << (dev
->chipset
& 0x0f)))
348 eng3d_class
= 0x0397;
349 else if (NV34TCL_CHIPSET_3X_MASK
& (1 << (dev
->chipset
& 0x0f)))
350 eng3d_class
= 0x0697;
351 else if (NV35TCL_CHIPSET_3X_MASK
& (1 << (dev
->chipset
& 0x0f)))
352 eng3d_class
= 0x0497;
355 if (NV4X_GRCLASS4097_CHIPSETS
& (1 << (dev
->chipset
& 0x0f)))
356 eng3d_class
= NV40TCL
;
357 else if (NV4X_GRCLASS4497_CHIPSETS
& (1 << (dev
->chipset
& 0x0f)))
358 eng3d_class
= NV44TCL
;
/* is_nv4x is set to all-ones; readers test it for truth or apply !! */
359 screen
->is_nv4x
= ~0;
362 if (NV6X_GRCLASS4497_CHIPSETS
& (1 << (dev
->chipset
& 0x0f)))
363 eng3d_class
= NV44TCL
;
364 screen
->is_nv4x
= ~0;
369 NOUVEAU_ERR("Unknown nv3x/nv4x chipset: nv%02x\n", dev
->chipset
);
/* NOUVEAU_SWTNL debug option, FALSE by default */
373 screen
->force_swtnl
= debug_get_bool_option("NOUVEAU_SWTNL", FALSE
);
375 screen
->vertex_buffer_reloc_flags
= nvfx_screen_get_vertex_buffer_flags(screen
);
377 /* surely both nv3x and nv44 support index buffers too: find out how and test that */
378 if(eng3d_class
== NV40TCL
)
379 screen
->index_buffer_reloc_flags
= screen
->vertex_buffer_reloc_flags
;
/* Publish the placement flags on the base screen only when swtnl is not
 * forced and the vertex and index reloc flags are equal. */
381 if(!screen
->force_swtnl
&& screen
->vertex_buffer_reloc_flags
== screen
->index_buffer_reloc_flags
)
382 screen
->base
.vertex_buffer_flags
= screen
->base
.index_buffer_flags
= screen
->vertex_buffer_reloc_flags
;
384 nvfx_screen_init_resource_functions(pscreen
);
/* 3D object of the class chosen above */
386 ret
= nouveau_grobj_alloc(chan
, 0xbeef3097, eng3d_class
, &screen
->eng3d
);
388 NOUVEAU_ERR("Error creating 3D object: %d\n", ret
);
392 /* 2D engine setup */
393 screen
->eng2d
= nv04_surface_2d_init(&screen
->base
);
394 screen
->eng2d
->buf
= nvfx_surface_buffer
;
396 /* Notifier for sync purposes */
397 ret
= nouveau_notifier_alloc(chan
, 0xbeef0301, 1, &screen
->sync
);
399 NOUVEAU_ERR("Error creating notifier object: %d\n", ret
);
400 nvfx_screen_destroy(pscreen
);
/* Query notifier: walk query_sizes in array order.
 * NOTE(review): presumably stops at the first size that allocates - confirm. */
405 for(i
= 0; i
< sizeof(query_sizes
) / sizeof(query_sizes
[0]); ++i
)
407 ret
= nouveau_notifier_alloc(chan
, 0xbeef0302, query_sizes
[i
], &screen
->query
);
413 NOUVEAU_ERR("Error initialising query objects: %d\n", ret
);
414 nvfx_screen_destroy(pscreen
);
/* The query heap is sized with the same query_sizes[i] entry */
418 ret
= nouveau_resource_init(&screen
->query_heap
, 0, query_sizes
[i
]);
420 NOUVEAU_ERR("Error initialising query object heap: %d\n", ret
);
421 nvfx_screen_destroy(pscreen
);
425 LIST_INITHEAD(&screen
->query_list
);
427 /* Vertex program resources: exec heap of 512 (nv4x) or 256, data heap of 256 */
428 if (nouveau_resource_init(&screen
->vp_exec_heap
, 0, screen
->is_nv4x
? 512 : 256) ||
429 nouveau_resource_init(&screen
->vp_data_heap
, 0, 256)) {
430 nvfx_screen_destroy(pscreen
);
/* NOTE(review): the literal 7 is presumably the subchannel index - confirm */
434 BIND_RING(chan
, screen
->eng3d
, 7);
436 /* Static eng3d initialisation */
437 /* note that we just started using the channel, so we must have space in the pushbuffer */
438 OUT_RING(chan
, RING_3D(NV34TCL_DMA_NOTIFY
, 1));
439 OUT_RING(chan
, screen
->sync
->handle
);
/* Two words: vram handle, then gart handle */
440 OUT_RING(chan
, RING_3D(NV34TCL_DMA_TEXTURE0
, 2));
441 OUT_RING(chan
, chan
->vram
->handle
);
442 OUT_RING(chan
, chan
->gart
->handle
);
443 OUT_RING(chan
, RING_3D(NV34TCL_DMA_COLOR1
, 1));
444 OUT_RING(chan
, chan
->vram
->handle
);
445 OUT_RING(chan
, RING_3D(NV34TCL_DMA_COLOR0
, 2));
446 OUT_RING(chan
, chan
->vram
->handle
);
447 OUT_RING(chan
, chan
->vram
->handle
);
/* Two words: vram handle, then gart handle */
448 OUT_RING(chan
, RING_3D(NV34TCL_DMA_VTXBUF0
, 2));
449 OUT_RING(chan
, chan
->vram
->handle
);
450 OUT_RING(chan
, chan
->gart
->handle
);
452 OUT_RING(chan
, RING_3D(NV34TCL_DMA_FENCE
, 2));
454 OUT_RING(chan
, screen
->query
->handle
);
456 OUT_RING(chan
, RING_3D(NV34TCL_DMA_IN_MEMORY7
, 2));
457 OUT_RING(chan
, chan
->vram
->handle
);
458 OUT_RING(chan
, chan
->vram
->handle
);
/* Chip-family-specific static state.
 * NOTE(review): presumably selected by screen->is_nv4x - confirm. */
461 nv30_screen_init(screen
);
463 nv40_screen_init(screen
);