2 #include "nv50/nv50_context.h"
3 #include "nv50/nv50_defs.xml.h"
6 nv50_fb_set_null_rt(struct nouveau_pushbuf
*push
, unsigned i
)
8 BEGIN_NV04(push
, NV50_3D(RT_ADDRESS_HIGH(i
)), 4);
11 PUSH_DATA (push
, NV50_SURFACE_FORMAT_NONE
);
13 BEGIN_NV04(push
, NV50_3D(RT_HORIZ(i
)), 2);
19 nv50_validate_fb(struct nv50_context
*nv50
)
21 struct nouveau_pushbuf
*push
= nv50
->base
.pushbuf
;
22 struct pipe_framebuffer_state
*fb
= &nv50
->framebuffer
;
24 unsigned ms_mode
= NV50_3D_MULTISAMPLE_MODE_MS1
;
25 uint32_t array_size
= 0xffff, array_mode
= 0;
27 nouveau_bufctx_reset(nv50
->bufctx_3d
, NV50_BIND_FB
);
29 BEGIN_NV04(push
, NV50_3D(RT_CONTROL
), 1);
30 PUSH_DATA (push
, (076543210 << 4) | fb
->nr_cbufs
);
31 BEGIN_NV04(push
, NV50_3D(SCREEN_SCISSOR_HORIZ
), 2);
32 PUSH_DATA (push
, fb
->width
<< 16);
33 PUSH_DATA (push
, fb
->height
<< 16);
35 for (i
= 0; i
< fb
->nr_cbufs
; ++i
) {
36 struct nv50_miptree
*mt
;
37 struct nv50_surface
*sf
;
38 struct nouveau_bo
*bo
;
41 nv50_fb_set_null_rt(push
, i
);
45 mt
= nv50_miptree(fb
->cbufs
[i
]->texture
);
46 sf
= nv50_surface(fb
->cbufs
[i
]);
49 array_size
= MIN2(array_size
, sf
->depth
);
51 array_mode
= NV50_3D_RT_ARRAY_MODE_MODE_3D
; /* 1 << 16 */
53 /* can't mix 3D with ARRAY or have RTs of different depth/array_size */
54 assert(mt
->layout_3d
|| !array_mode
|| array_size
== 1);
56 BEGIN_NV04(push
, NV50_3D(RT_ADDRESS_HIGH(i
)), 5);
57 PUSH_DATAh(push
, bo
->offset
+ sf
->offset
);
58 PUSH_DATA (push
, bo
->offset
+ sf
->offset
);
59 PUSH_DATA (push
, nv50_format_table
[sf
->base
.format
].rt
);
60 if (likely(nouveau_bo_memtype(bo
))) {
61 PUSH_DATA (push
, mt
->level
[sf
->base
.u
.tex
.level
].tile_mode
);
62 PUSH_DATA (push
, mt
->layer_stride
>> 2);
63 BEGIN_NV04(push
, NV50_3D(RT_HORIZ(i
)), 2);
64 PUSH_DATA (push
, sf
->width
);
65 PUSH_DATA (push
, sf
->height
);
66 BEGIN_NV04(push
, NV50_3D(RT_ARRAY_MODE
), 1);
67 PUSH_DATA (push
, array_mode
| array_size
);
68 nv50
->rt_array_mode
= array_mode
| array_size
;
72 BEGIN_NV04(push
, NV50_3D(RT_HORIZ(i
)), 2);
73 PUSH_DATA (push
, NV50_3D_RT_HORIZ_LINEAR
| mt
->level
[0].pitch
);
74 PUSH_DATA (push
, sf
->height
);
75 BEGIN_NV04(push
, NV50_3D(RT_ARRAY_MODE
), 1);
82 ms_mode
= mt
->ms_mode
;
84 if (mt
->base
.status
& NOUVEAU_BUFFER_STATUS_GPU_READING
)
85 nv50
->state
.rt_serialize
= TRUE
;
86 mt
->base
.status
|= NOUVEAU_BUFFER_STATUS_GPU_WRITING
;
87 mt
->base
.status
&= ~NOUVEAU_BUFFER_STATUS_GPU_READING
;
89 /* only register for writing, otherwise we'd always serialize here */
90 BCTX_REFN(nv50
->bufctx_3d
, FB
, &mt
->base
, WR
);
94 struct nv50_miptree
*mt
= nv50_miptree(fb
->zsbuf
->texture
);
95 struct nv50_surface
*sf
= nv50_surface(fb
->zsbuf
);
96 struct nouveau_bo
*bo
= mt
->base
.bo
;
97 int unk
= mt
->base
.base
.target
== PIPE_TEXTURE_3D
|| sf
->depth
== 1;
99 BEGIN_NV04(push
, NV50_3D(ZETA_ADDRESS_HIGH
), 5);
100 PUSH_DATAh(push
, bo
->offset
+ sf
->offset
);
101 PUSH_DATA (push
, bo
->offset
+ sf
->offset
);
102 PUSH_DATA (push
, nv50_format_table
[fb
->zsbuf
->format
].rt
);
103 PUSH_DATA (push
, mt
->level
[sf
->base
.u
.tex
.level
].tile_mode
);
104 PUSH_DATA (push
, mt
->layer_stride
>> 2);
105 BEGIN_NV04(push
, NV50_3D(ZETA_ENABLE
), 1);
107 BEGIN_NV04(push
, NV50_3D(ZETA_HORIZ
), 3);
108 PUSH_DATA (push
, sf
->width
);
109 PUSH_DATA (push
, sf
->height
);
110 PUSH_DATA (push
, (unk
<< 16) | sf
->depth
);
112 ms_mode
= mt
->ms_mode
;
114 if (mt
->base
.status
& NOUVEAU_BUFFER_STATUS_GPU_READING
)
115 nv50
->state
.rt_serialize
= TRUE
;
116 mt
->base
.status
|= NOUVEAU_BUFFER_STATUS_GPU_WRITING
;
117 mt
->base
.status
&= ~NOUVEAU_BUFFER_STATUS_GPU_READING
;
119 BCTX_REFN(nv50
->bufctx_3d
, FB
, &mt
->base
, WR
);
121 BEGIN_NV04(push
, NV50_3D(ZETA_ENABLE
), 1);
125 BEGIN_NV04(push
, NV50_3D(MULTISAMPLE_MODE
), 1);
126 PUSH_DATA (push
, ms_mode
);
128 /* Only need to initialize the first viewport, which is used for clears */
129 BEGIN_NV04(push
, NV50_3D(VIEWPORT_HORIZ(0)), 2);
130 PUSH_DATA (push
, fb
->width
<< 16);
131 PUSH_DATA (push
, fb
->height
<< 16);
133 if (nv50
->screen
->tesla
->oclass
>= NVA3_3D_CLASS
) {
134 unsigned ms
= 1 << ms_mode
;
135 BEGIN_NV04(push
, NV50_3D(CB_ADDR
), 1);
136 PUSH_DATA (push
, (NV50_CB_AUX_SAMPLE_OFFSET
<< (8 - 2)) | NV50_CB_AUX
);
137 BEGIN_NI04(push
, NV50_3D(CB_DATA(0)), 2 * ms
);
138 for (i
= 0; i
< ms
; i
++) {
140 nv50
->base
.pipe
.get_sample_position(&nv50
->base
.pipe
, ms
, i
, xy
);
141 PUSH_DATAf(push
, xy
[0]);
142 PUSH_DATAf(push
, xy
[1]);
148 nv50_validate_blend_colour(struct nv50_context
*nv50
)
150 struct nouveau_pushbuf
*push
= nv50
->base
.pushbuf
;
152 BEGIN_NV04(push
, NV50_3D(BLEND_COLOR(0)), 4);
153 PUSH_DATAf(push
, nv50
->blend_colour
.color
[0]);
154 PUSH_DATAf(push
, nv50
->blend_colour
.color
[1]);
155 PUSH_DATAf(push
, nv50
->blend_colour
.color
[2]);
156 PUSH_DATAf(push
, nv50
->blend_colour
.color
[3]);
160 nv50_validate_stencil_ref(struct nv50_context
*nv50
)
162 struct nouveau_pushbuf
*push
= nv50
->base
.pushbuf
;
164 BEGIN_NV04(push
, NV50_3D(STENCIL_FRONT_FUNC_REF
), 1);
165 PUSH_DATA (push
, nv50
->stencil_ref
.ref_value
[0]);
166 BEGIN_NV04(push
, NV50_3D(STENCIL_BACK_FUNC_REF
), 1);
167 PUSH_DATA (push
, nv50
->stencil_ref
.ref_value
[1]);
171 nv50_validate_stipple(struct nv50_context
*nv50
)
173 struct nouveau_pushbuf
*push
= nv50
->base
.pushbuf
;
176 BEGIN_NV04(push
, NV50_3D(POLYGON_STIPPLE_PATTERN(0)), 32);
177 for (i
= 0; i
< 32; ++i
)
178 PUSH_DATA(push
, util_bswap32(nv50
->stipple
.stipple
[i
]));
182 nv50_validate_scissor(struct nv50_context
*nv50
)
184 struct nouveau_pushbuf
*push
= nv50
->base
.pushbuf
;
185 #ifdef NV50_SCISSORS_CLIPPING
186 int minx
, maxx
, miny
, maxy
, i
;
189 (NV50_NEW_SCISSOR
| NV50_NEW_VIEWPORT
| NV50_NEW_FRAMEBUFFER
)) &&
190 nv50
->state
.scissor
== nv50
->rast
->pipe
.scissor
)
193 if (nv50
->state
.scissor
!= nv50
->rast
->pipe
.scissor
)
194 nv50
->scissors_dirty
= (1 << NV50_MAX_VIEWPORTS
) - 1;
196 nv50
->state
.scissor
= nv50
->rast
->pipe
.scissor
;
198 if ((nv50
->dirty
& NV50_NEW_FRAMEBUFFER
) && !nv50
->state
.scissor
)
199 nv50
->scissors_dirty
= (1 << NV50_MAX_VIEWPORTS
) - 1;
201 for (i
= 0; i
< NV50_MAX_VIEWPORTS
; i
++) {
202 struct pipe_scissor_state
*s
= &nv50
->scissors
[i
];
203 struct pipe_viewport_state
*vp
= &nv50
->viewports
[i
];
205 if (!(nv50
->scissors_dirty
& (1 << i
)) &&
206 !(nv50
->viewports_dirty
& (1 << i
)))
209 if (nv50
->state
.scissor
) {
216 maxx
= nv50
->framebuffer
.width
;
218 maxy
= nv50
->framebuffer
.height
;
221 minx
= MAX2(minx
, (int)(vp
->translate
[0] - fabsf(vp
->scale
[0])));
222 maxx
= MIN2(maxx
, (int)(vp
->translate
[0] + fabsf(vp
->scale
[0])));
223 miny
= MAX2(miny
, (int)(vp
->translate
[1] - fabsf(vp
->scale
[1])));
224 maxy
= MIN2(maxy
, (int)(vp
->translate
[1] + fabsf(vp
->scale
[1])));
226 minx
= MIN2(minx
, 8192);
227 maxx
= MAX2(maxx
, 0);
228 miny
= MIN2(miny
, 8192);
229 maxy
= MAX2(maxy
, 0);
231 BEGIN_NV04(push
, NV50_3D(SCISSOR_HORIZ(i
)), 2);
232 PUSH_DATA (push
, (maxx
<< 16) | minx
);
233 PUSH_DATA (push
, (maxy
<< 16) | miny
);
235 BEGIN_NV04(push
, NV50_3D(SCISSOR_HORIZ(i
)), 2);
236 PUSH_DATA (push
, (s
->maxx
<< 16) | s
->minx
);
237 PUSH_DATA (push
, (s
->maxy
<< 16) | s
->miny
);
241 nv50
->scissors_dirty
= 0;
245 nv50_validate_viewport(struct nv50_context
*nv50
)
247 struct nouveau_pushbuf
*push
= nv50
->base
.pushbuf
;
251 for (i
= 0; i
< NV50_MAX_VIEWPORTS
; i
++) {
252 struct pipe_viewport_state
*vpt
= &nv50
->viewports
[i
];
254 if (!(nv50
->viewports_dirty
& (1 << i
)))
257 BEGIN_NV04(push
, NV50_3D(VIEWPORT_TRANSLATE_X(i
)), 3);
258 PUSH_DATAf(push
, vpt
->translate
[0]);
259 PUSH_DATAf(push
, vpt
->translate
[1]);
260 PUSH_DATAf(push
, vpt
->translate
[2]);
261 BEGIN_NV04(push
, NV50_3D(VIEWPORT_SCALE_X(i
)), 3);
262 PUSH_DATAf(push
, vpt
->scale
[0]);
263 PUSH_DATAf(push
, vpt
->scale
[1]);
264 PUSH_DATAf(push
, vpt
->scale
[2]);
266 zmin
= vpt
->translate
[2] - fabsf(vpt
->scale
[2]);
267 zmax
= vpt
->translate
[2] + fabsf(vpt
->scale
[2]);
269 #ifdef NV50_SCISSORS_CLIPPING
270 BEGIN_NV04(push
, NV50_3D(DEPTH_RANGE_NEAR(i
)), 2);
271 PUSH_DATAf(push
, zmin
);
272 PUSH_DATAf(push
, zmax
);
276 nv50
->viewports_dirty
= 0;
280 nv50_check_program_ucps(struct nv50_context
*nv50
,
281 struct nv50_program
*vp
, uint8_t mask
)
283 const unsigned n
= util_logbase2(mask
) + 1;
285 if (vp
->vp
.clpd_nr
>= n
)
287 nv50_program_destroy(nv50
, vp
);
290 if (likely(vp
== nv50
->vertprog
)) {
291 nv50
->dirty
|= NV50_NEW_VERTPROG
;
292 nv50_vertprog_validate(nv50
);
294 nv50
->dirty
|= NV50_NEW_GMTYPROG
;
295 nv50_gmtyprog_validate(nv50
);
297 nv50_fp_linkage_validate(nv50
);
301 nv50_validate_clip(struct nv50_context
*nv50
)
303 struct nouveau_pushbuf
*push
= nv50
->base
.pushbuf
;
304 struct nv50_program
*vp
;
307 if (nv50
->dirty
& NV50_NEW_CLIP
) {
308 BEGIN_NV04(push
, NV50_3D(CB_ADDR
), 1);
309 PUSH_DATA (push
, (NV50_CB_AUX_UCP_OFFSET
<< 8) | NV50_CB_AUX
);
310 BEGIN_NI04(push
, NV50_3D(CB_DATA(0)), PIPE_MAX_CLIP_PLANES
* 4);
311 PUSH_DATAp(push
, &nv50
->clip
.ucp
[0][0], PIPE_MAX_CLIP_PLANES
* 4);
318 clip_enable
= nv50
->rast
->pipe
.clip_plane_enable
;
320 BEGIN_NV04(push
, NV50_3D(CLIP_DISTANCE_ENABLE
), 1);
321 PUSH_DATA (push
, clip_enable
);
324 nv50_check_program_ucps(nv50
, vp
, clip_enable
);
328 nv50_validate_blend(struct nv50_context
*nv50
)
330 struct nouveau_pushbuf
*push
= nv50
->base
.pushbuf
;
332 PUSH_SPACE(push
, nv50
->blend
->size
);
333 PUSH_DATAp(push
, nv50
->blend
->state
, nv50
->blend
->size
);
337 nv50_validate_zsa(struct nv50_context
*nv50
)
339 struct nouveau_pushbuf
*push
= nv50
->base
.pushbuf
;
341 PUSH_SPACE(push
, nv50
->zsa
->size
);
342 PUSH_DATAp(push
, nv50
->zsa
->state
, nv50
->zsa
->size
);
346 nv50_validate_rasterizer(struct nv50_context
*nv50
)
348 struct nouveau_pushbuf
*push
= nv50
->base
.pushbuf
;
350 PUSH_SPACE(push
, nv50
->rast
->size
);
351 PUSH_DATAp(push
, nv50
->rast
->state
, nv50
->rast
->size
);
355 nv50_validate_sample_mask(struct nv50_context
*nv50
)
357 struct nouveau_pushbuf
*push
= nv50
->base
.pushbuf
;
361 nv50
->sample_mask
& 0xffff,
362 nv50
->sample_mask
& 0xffff,
363 nv50
->sample_mask
& 0xffff,
364 nv50
->sample_mask
& 0xffff
367 BEGIN_NV04(push
, NV50_3D(MSAA_MASK(0)), 4);
368 PUSH_DATA (push
, mask
[0]);
369 PUSH_DATA (push
, mask
[1]);
370 PUSH_DATA (push
, mask
[2]);
371 PUSH_DATA (push
, mask
[3]);
375 nv50_validate_min_samples(struct nv50_context
*nv50
)
377 struct nouveau_pushbuf
*push
= nv50
->base
.pushbuf
;
380 if (nv50
->screen
->tesla
->oclass
< NVA3_3D_CLASS
)
383 samples
= util_next_power_of_two(nv50
->min_samples
);
385 samples
|= NVA3_3D_SAMPLE_SHADING_ENABLE
;
387 BEGIN_NV04(push
, SUBC_3D(NVA3_3D_SAMPLE_SHADING
), 1);
388 PUSH_DATA (push
, samples
);
392 nv50_switch_pipe_context(struct nv50_context
*ctx_to
)
394 struct nv50_context
*ctx_from
= ctx_to
->screen
->cur_ctx
;
397 ctx_to
->state
= ctx_from
->state
;
400 ctx_to
->viewports_dirty
= ~0;
401 ctx_to
->scissors_dirty
= ~0;
403 ctx_to
->constbuf_dirty
[0] =
404 ctx_to
->constbuf_dirty
[1] =
405 ctx_to
->constbuf_dirty
[2] = (1 << NV50_MAX_PIPE_CONSTBUFS
) - 1;
408 ctx_to
->dirty
&= ~(NV50_NEW_VERTEX
| NV50_NEW_ARRAYS
);
410 if (!ctx_to
->vertprog
)
411 ctx_to
->dirty
&= ~NV50_NEW_VERTPROG
;
412 if (!ctx_to
->fragprog
)
413 ctx_to
->dirty
&= ~NV50_NEW_FRAGPROG
;
416 ctx_to
->dirty
&= ~NV50_NEW_BLEND
;
418 #ifdef NV50_SCISSORS_CLIPPING
419 ctx_to
->dirty
&= ~(NV50_NEW_RASTERIZER
| NV50_NEW_SCISSOR
);
421 ctx_to
->dirty
&= ~NV50_NEW_RASTERIZER
;
424 ctx_to
->dirty
&= ~NV50_NEW_ZSA
;
426 ctx_to
->screen
->cur_ctx
= ctx_to
;
429 static struct state_validate
{
430 void (*func
)(struct nv50_context
*);
432 } validate_list
[] = {
433 { nv50_validate_fb
, NV50_NEW_FRAMEBUFFER
},
434 { nv50_validate_blend
, NV50_NEW_BLEND
},
435 { nv50_validate_zsa
, NV50_NEW_ZSA
},
436 { nv50_validate_sample_mask
, NV50_NEW_SAMPLE_MASK
},
437 { nv50_validate_rasterizer
, NV50_NEW_RASTERIZER
},
438 { nv50_validate_blend_colour
, NV50_NEW_BLEND_COLOUR
},
439 { nv50_validate_stencil_ref
, NV50_NEW_STENCIL_REF
},
440 { nv50_validate_stipple
, NV50_NEW_STIPPLE
},
441 #ifdef NV50_SCISSORS_CLIPPING
442 { nv50_validate_scissor
, NV50_NEW_SCISSOR
| NV50_NEW_VIEWPORT
|
443 NV50_NEW_RASTERIZER
|
444 NV50_NEW_FRAMEBUFFER
},
446 { nv50_validate_scissor
, NV50_NEW_SCISSOR
},
448 { nv50_validate_viewport
, NV50_NEW_VIEWPORT
},
449 { nv50_vertprog_validate
, NV50_NEW_VERTPROG
},
450 { nv50_gmtyprog_validate
, NV50_NEW_GMTYPROG
},
451 { nv50_fragprog_validate
, NV50_NEW_FRAGPROG
|
452 NV50_NEW_MIN_SAMPLES
},
453 { nv50_fp_linkage_validate
, NV50_NEW_FRAGPROG
| NV50_NEW_VERTPROG
|
454 NV50_NEW_GMTYPROG
| NV50_NEW_RASTERIZER
},
455 { nv50_gp_linkage_validate
, NV50_NEW_GMTYPROG
| NV50_NEW_VERTPROG
},
456 { nv50_validate_derived_rs
, NV50_NEW_FRAGPROG
| NV50_NEW_RASTERIZER
|
457 NV50_NEW_VERTPROG
| NV50_NEW_GMTYPROG
},
458 { nv50_validate_clip
, NV50_NEW_CLIP
| NV50_NEW_RASTERIZER
|
459 NV50_NEW_VERTPROG
| NV50_NEW_GMTYPROG
},
460 { nv50_constbufs_validate
, NV50_NEW_CONSTBUF
},
461 { nv50_validate_textures
, NV50_NEW_TEXTURES
},
462 { nv50_validate_samplers
, NV50_NEW_SAMPLERS
},
463 { nv50_stream_output_validate
, NV50_NEW_STRMOUT
|
464 NV50_NEW_VERTPROG
| NV50_NEW_GMTYPROG
},
465 { nv50_vertex_arrays_validate
, NV50_NEW_VERTEX
| NV50_NEW_ARRAYS
},
466 { nv50_validate_min_samples
, NV50_NEW_MIN_SAMPLES
},
468 #define validate_list_len (sizeof(validate_list) / sizeof(validate_list[0]))
471 nv50_state_validate(struct nv50_context
*nv50
, uint32_t mask
, unsigned words
)
477 if (nv50
->screen
->cur_ctx
!= nv50
)
478 nv50_switch_pipe_context(nv50
);
480 state_mask
= nv50
->dirty
& mask
;
483 for (i
= 0; i
< validate_list_len
; ++i
) {
484 struct state_validate
*validate
= &validate_list
[i
];
486 if (state_mask
& validate
->states
)
487 validate
->func(nv50
);
489 nv50
->dirty
&= ~state_mask
;
491 if (nv50
->state
.rt_serialize
) {
492 nv50
->state
.rt_serialize
= FALSE
;
493 BEGIN_NV04(nv50
->base
.pushbuf
, SUBC_3D(NV50_GRAPH_SERIALIZE
), 1);
494 PUSH_DATA (nv50
->base
.pushbuf
, 0);
497 nv50_bufctx_fence(nv50
->bufctx_3d
, FALSE
);
499 nouveau_pushbuf_bufctx(nv50
->base
.pushbuf
, nv50
->bufctx_3d
);
500 ret
= nouveau_pushbuf_validate(nv50
->base
.pushbuf
);
502 if (unlikely(nv50
->state
.flushed
)) {
503 nv50
->state
.flushed
= FALSE
;
504 nv50_bufctx_fence(nv50
->bufctx_3d
, TRUE
);