2 #include "nv50/nv50_context.h"
3 #include "nv50/nv50_defs.xml.h"
6 nv50_fb_set_null_rt(struct nouveau_pushbuf
*push
, unsigned i
)
8 BEGIN_NV04(push
, NV50_3D(RT_ADDRESS_HIGH(i
)), 4);
11 PUSH_DATA (push
, NV50_SURFACE_FORMAT_NONE
);
13 BEGIN_NV04(push
, NV50_3D(RT_HORIZ(i
)), 2);
19 nv50_validate_fb(struct nv50_context
*nv50
)
21 struct nouveau_pushbuf
*push
= nv50
->base
.pushbuf
;
22 struct pipe_framebuffer_state
*fb
= &nv50
->framebuffer
;
24 unsigned ms_mode
= NV50_3D_MULTISAMPLE_MODE_MS1
;
25 uint32_t array_size
= 0xffff, array_mode
= 0;
27 nouveau_bufctx_reset(nv50
->bufctx_3d
, NV50_BIND_FB
);
29 BEGIN_NV04(push
, NV50_3D(RT_CONTROL
), 1);
30 PUSH_DATA (push
, (076543210 << 4) | fb
->nr_cbufs
);
31 BEGIN_NV04(push
, NV50_3D(SCREEN_SCISSOR_HORIZ
), 2);
32 PUSH_DATA (push
, fb
->width
<< 16);
33 PUSH_DATA (push
, fb
->height
<< 16);
35 for (i
= 0; i
< fb
->nr_cbufs
; ++i
) {
36 struct nv50_miptree
*mt
;
37 struct nv50_surface
*sf
;
38 struct nouveau_bo
*bo
;
41 nv50_fb_set_null_rt(push
, i
);
45 mt
= nv50_miptree(fb
->cbufs
[i
]->texture
);
46 sf
= nv50_surface(fb
->cbufs
[i
]);
49 array_size
= MIN2(array_size
, sf
->depth
);
51 array_mode
= NV50_3D_RT_ARRAY_MODE_MODE_3D
; /* 1 << 16 */
53 /* can't mix 3D with ARRAY or have RTs of different depth/array_size */
54 assert(mt
->layout_3d
|| !array_mode
|| array_size
== 1);
56 BEGIN_NV04(push
, NV50_3D(RT_ADDRESS_HIGH(i
)), 5);
57 PUSH_DATAh(push
, bo
->offset
+ sf
->offset
);
58 PUSH_DATA (push
, bo
->offset
+ sf
->offset
);
59 PUSH_DATA (push
, nv50_format_table
[sf
->base
.format
].rt
);
60 if (likely(nouveau_bo_memtype(bo
))) {
61 PUSH_DATA (push
, mt
->level
[sf
->base
.u
.tex
.level
].tile_mode
);
62 PUSH_DATA (push
, mt
->layer_stride
>> 2);
63 BEGIN_NV04(push
, NV50_3D(RT_HORIZ(i
)), 2);
64 PUSH_DATA (push
, sf
->width
);
65 PUSH_DATA (push
, sf
->height
);
66 BEGIN_NV04(push
, NV50_3D(RT_ARRAY_MODE
), 1);
67 PUSH_DATA (push
, array_mode
| array_size
);
71 BEGIN_NV04(push
, NV50_3D(RT_HORIZ(i
)), 2);
72 PUSH_DATA (push
, NV50_3D_RT_HORIZ_LINEAR
| mt
->level
[0].pitch
);
73 PUSH_DATA (push
, sf
->height
);
74 BEGIN_NV04(push
, NV50_3D(RT_ARRAY_MODE
), 1);
81 ms_mode
= mt
->ms_mode
;
83 if (mt
->base
.status
& NOUVEAU_BUFFER_STATUS_GPU_READING
)
84 nv50
->state
.rt_serialize
= TRUE
;
85 mt
->base
.status
|= NOUVEAU_BUFFER_STATUS_GPU_WRITING
;
86 mt
->base
.status
&= ~NOUVEAU_BUFFER_STATUS_GPU_READING
;
88 /* only register for writing, otherwise we'd always serialize here */
89 BCTX_REFN(nv50
->bufctx_3d
, FB
, &mt
->base
, WR
);
93 struct nv50_miptree
*mt
= nv50_miptree(fb
->zsbuf
->texture
);
94 struct nv50_surface
*sf
= nv50_surface(fb
->zsbuf
);
95 struct nouveau_bo
*bo
= mt
->base
.bo
;
96 int unk
= mt
->base
.base
.target
== PIPE_TEXTURE_3D
|| sf
->depth
== 1;
98 BEGIN_NV04(push
, NV50_3D(ZETA_ADDRESS_HIGH
), 5);
99 PUSH_DATAh(push
, bo
->offset
+ sf
->offset
);
100 PUSH_DATA (push
, bo
->offset
+ sf
->offset
);
101 PUSH_DATA (push
, nv50_format_table
[fb
->zsbuf
->format
].rt
);
102 PUSH_DATA (push
, mt
->level
[sf
->base
.u
.tex
.level
].tile_mode
);
103 PUSH_DATA (push
, mt
->layer_stride
>> 2);
104 BEGIN_NV04(push
, NV50_3D(ZETA_ENABLE
), 1);
106 BEGIN_NV04(push
, NV50_3D(ZETA_HORIZ
), 3);
107 PUSH_DATA (push
, sf
->width
);
108 PUSH_DATA (push
, sf
->height
);
109 PUSH_DATA (push
, (unk
<< 16) | sf
->depth
);
111 ms_mode
= mt
->ms_mode
;
113 if (mt
->base
.status
& NOUVEAU_BUFFER_STATUS_GPU_READING
)
114 nv50
->state
.rt_serialize
= TRUE
;
115 mt
->base
.status
|= NOUVEAU_BUFFER_STATUS_GPU_WRITING
;
116 mt
->base
.status
&= ~NOUVEAU_BUFFER_STATUS_GPU_READING
;
118 BCTX_REFN(nv50
->bufctx_3d
, FB
, &mt
->base
, WR
);
120 BEGIN_NV04(push
, NV50_3D(ZETA_ENABLE
), 1);
124 BEGIN_NV04(push
, NV50_3D(MULTISAMPLE_MODE
), 1);
125 PUSH_DATA (push
, ms_mode
);
127 BEGIN_NV04(push
, NV50_3D(VIEWPORT_HORIZ(0)), 2);
128 PUSH_DATA (push
, fb
->width
<< 16);
129 PUSH_DATA (push
, fb
->height
<< 16);
133 nv50_validate_blend_colour(struct nv50_context
*nv50
)
135 struct nouveau_pushbuf
*push
= nv50
->base
.pushbuf
;
137 BEGIN_NV04(push
, NV50_3D(BLEND_COLOR(0)), 4);
138 PUSH_DATAf(push
, nv50
->blend_colour
.color
[0]);
139 PUSH_DATAf(push
, nv50
->blend_colour
.color
[1]);
140 PUSH_DATAf(push
, nv50
->blend_colour
.color
[2]);
141 PUSH_DATAf(push
, nv50
->blend_colour
.color
[3]);
145 nv50_validate_stencil_ref(struct nv50_context
*nv50
)
147 struct nouveau_pushbuf
*push
= nv50
->base
.pushbuf
;
149 BEGIN_NV04(push
, NV50_3D(STENCIL_FRONT_FUNC_REF
), 1);
150 PUSH_DATA (push
, nv50
->stencil_ref
.ref_value
[0]);
151 BEGIN_NV04(push
, NV50_3D(STENCIL_BACK_FUNC_REF
), 1);
152 PUSH_DATA (push
, nv50
->stencil_ref
.ref_value
[1]);
156 nv50_validate_stipple(struct nv50_context
*nv50
)
158 struct nouveau_pushbuf
*push
= nv50
->base
.pushbuf
;
161 BEGIN_NV04(push
, NV50_3D(POLYGON_STIPPLE_PATTERN(0)), 32);
162 for (i
= 0; i
< 32; ++i
)
163 PUSH_DATA(push
, util_bswap32(nv50
->stipple
.stipple
[i
]));
167 nv50_validate_scissor(struct nv50_context
*nv50
)
169 struct nouveau_pushbuf
*push
= nv50
->base
.pushbuf
;
170 struct pipe_scissor_state
*s
= &nv50
->scissor
;
171 #ifdef NV50_SCISSORS_CLIPPING
172 struct pipe_viewport_state
*vp
= &nv50
->viewport
;
173 int minx
, maxx
, miny
, maxy
;
176 (NV50_NEW_SCISSOR
| NV50_NEW_VIEWPORT
| NV50_NEW_FRAMEBUFFER
)) &&
177 nv50
->state
.scissor
== nv50
->rast
->pipe
.scissor
)
179 nv50
->state
.scissor
= nv50
->rast
->pipe
.scissor
;
181 if (nv50
->state
.scissor
) {
188 maxx
= nv50
->framebuffer
.width
;
190 maxy
= nv50
->framebuffer
.height
;
193 minx
= MAX2(minx
, (int)(vp
->translate
[0] - fabsf(vp
->scale
[0])));
194 maxx
= MIN2(maxx
, (int)(vp
->translate
[0] + fabsf(vp
->scale
[0])));
195 miny
= MAX2(miny
, (int)(vp
->translate
[1] - fabsf(vp
->scale
[1])));
196 maxy
= MIN2(maxy
, (int)(vp
->translate
[1] + fabsf(vp
->scale
[1])));
198 BEGIN_NV04(push
, NV50_3D(SCISSOR_HORIZ(0)), 2);
199 PUSH_DATA (push
, (maxx
<< 16) | minx
);
200 PUSH_DATA (push
, (maxy
<< 16) | miny
);
202 BEGIN_NV04(push
, NV50_3D(SCISSOR_HORIZ(0)), 2);
203 PUSH_DATA (push
, (s
->maxx
<< 16) | s
->minx
);
204 PUSH_DATA (push
, (s
->maxy
<< 16) | s
->miny
);
209 nv50_validate_viewport(struct nv50_context
*nv50
)
211 struct nouveau_pushbuf
*push
= nv50
->base
.pushbuf
;
214 BEGIN_NV04(push
, NV50_3D(VIEWPORT_TRANSLATE_X(0)), 3);
215 PUSH_DATAf(push
, nv50
->viewport
.translate
[0]);
216 PUSH_DATAf(push
, nv50
->viewport
.translate
[1]);
217 PUSH_DATAf(push
, nv50
->viewport
.translate
[2]);
218 BEGIN_NV04(push
, NV50_3D(VIEWPORT_SCALE_X(0)), 3);
219 PUSH_DATAf(push
, nv50
->viewport
.scale
[0]);
220 PUSH_DATAf(push
, nv50
->viewport
.scale
[1]);
221 PUSH_DATAf(push
, nv50
->viewport
.scale
[2]);
223 zmin
= nv50
->viewport
.translate
[2] - fabsf(nv50
->viewport
.scale
[2]);
224 zmax
= nv50
->viewport
.translate
[2] + fabsf(nv50
->viewport
.scale
[2]);
226 #ifdef NV50_SCISSORS_CLIPPING
227 BEGIN_NV04(push
, NV50_3D(DEPTH_RANGE_NEAR(0)), 2);
228 PUSH_DATAf(push
, zmin
);
229 PUSH_DATAf(push
, zmax
);
234 nv50_check_program_ucps(struct nv50_context
*nv50
,
235 struct nv50_program
*vp
, uint8_t mask
)
237 const unsigned n
= util_logbase2(mask
) + 1;
239 if (vp
->vp
.clpd_nr
>= n
)
241 nv50_program_destroy(nv50
, vp
);
244 if (likely(vp
== nv50
->vertprog
)) {
245 nv50
->dirty
|= NV50_NEW_VERTPROG
;
246 nv50_vertprog_validate(nv50
);
248 nv50
->dirty
|= NV50_NEW_GMTYPROG
;
249 nv50_gmtyprog_validate(nv50
);
251 nv50_fp_linkage_validate(nv50
);
255 nv50_validate_clip(struct nv50_context
*nv50
)
257 struct nouveau_pushbuf
*push
= nv50
->base
.pushbuf
;
258 struct nv50_program
*vp
;
261 if (nv50
->dirty
& NV50_NEW_CLIP
) {
262 BEGIN_NV04(push
, NV50_3D(CB_ADDR
), 1);
263 PUSH_DATA (push
, (NV50_CB_AUX_UCP_OFFSET
<< 8) | NV50_CB_AUX
);
264 BEGIN_NI04(push
, NV50_3D(CB_DATA(0)), PIPE_MAX_CLIP_PLANES
* 4);
265 PUSH_DATAp(push
, &nv50
->clip
.ucp
[0][0], PIPE_MAX_CLIP_PLANES
* 4);
272 clip_enable
= nv50
->rast
->pipe
.clip_plane_enable
;
274 BEGIN_NV04(push
, NV50_3D(CLIP_DISTANCE_ENABLE
), 1);
275 PUSH_DATA (push
, clip_enable
);
278 nv50_check_program_ucps(nv50
, vp
, clip_enable
);
282 nv50_validate_blend(struct nv50_context
*nv50
)
284 struct nouveau_pushbuf
*push
= nv50
->base
.pushbuf
;
286 PUSH_SPACE(push
, nv50
->blend
->size
);
287 PUSH_DATAp(push
, nv50
->blend
->state
, nv50
->blend
->size
);
291 nv50_validate_zsa(struct nv50_context
*nv50
)
293 struct nouveau_pushbuf
*push
= nv50
->base
.pushbuf
;
295 PUSH_SPACE(push
, nv50
->zsa
->size
);
296 PUSH_DATAp(push
, nv50
->zsa
->state
, nv50
->zsa
->size
);
300 nv50_validate_rasterizer(struct nv50_context
*nv50
)
302 struct nouveau_pushbuf
*push
= nv50
->base
.pushbuf
;
304 PUSH_SPACE(push
, nv50
->rast
->size
);
305 PUSH_DATAp(push
, nv50
->rast
->state
, nv50
->rast
->size
);
309 nv50_validate_sample_mask(struct nv50_context
*nv50
)
311 struct nouveau_pushbuf
*push
= nv50
->base
.pushbuf
;
315 nv50
->sample_mask
& 0xffff,
316 nv50
->sample_mask
& 0xffff,
317 nv50
->sample_mask
& 0xffff,
318 nv50
->sample_mask
& 0xffff
321 BEGIN_NV04(push
, NV50_3D(MSAA_MASK(0)), 4);
322 PUSH_DATA (push
, mask
[0]);
323 PUSH_DATA (push
, mask
[1]);
324 PUSH_DATA (push
, mask
[2]);
325 PUSH_DATA (push
, mask
[3]);
329 nv50_switch_pipe_context(struct nv50_context
*ctx_to
)
331 struct nv50_context
*ctx_from
= ctx_to
->screen
->cur_ctx
;
334 ctx_to
->state
= ctx_from
->state
;
339 ctx_to
->dirty
&= ~(NV50_NEW_VERTEX
| NV50_NEW_ARRAYS
);
341 if (!ctx_to
->vertprog
)
342 ctx_to
->dirty
&= ~NV50_NEW_VERTPROG
;
343 if (!ctx_to
->fragprog
)
344 ctx_to
->dirty
&= ~NV50_NEW_FRAGPROG
;
347 ctx_to
->dirty
&= ~NV50_NEW_BLEND
;
349 #ifdef NV50_SCISSORS_CLIPPING
350 ctx_to
->dirty
&= ~(NV50_NEW_RASTERIZER
| NV50_NEW_SCISSOR
);
352 ctx_to
->dirty
&= ~NV50_NEW_RASTERIZER
;
355 ctx_to
->dirty
&= ~NV50_NEW_ZSA
;
357 ctx_to
->screen
->cur_ctx
= ctx_to
;
360 static struct state_validate
{
361 void (*func
)(struct nv50_context
*);
363 } validate_list
[] = {
364 { nv50_validate_fb
, NV50_NEW_FRAMEBUFFER
},
365 { nv50_validate_blend
, NV50_NEW_BLEND
},
366 { nv50_validate_zsa
, NV50_NEW_ZSA
},
367 { nv50_validate_sample_mask
, NV50_NEW_SAMPLE_MASK
},
368 { nv50_validate_rasterizer
, NV50_NEW_RASTERIZER
},
369 { nv50_validate_blend_colour
, NV50_NEW_BLEND_COLOUR
},
370 { nv50_validate_stencil_ref
, NV50_NEW_STENCIL_REF
},
371 { nv50_validate_stipple
, NV50_NEW_STIPPLE
},
372 #ifdef NV50_SCISSORS_CLIPPING
373 { nv50_validate_scissor
, NV50_NEW_SCISSOR
| NV50_NEW_VIEWPORT
|
374 NV50_NEW_RASTERIZER
|
375 NV50_NEW_FRAMEBUFFER
},
377 { nv50_validate_scissor
, NV50_NEW_SCISSOR
},
379 { nv50_validate_viewport
, NV50_NEW_VIEWPORT
},
380 { nv50_vertprog_validate
, NV50_NEW_VERTPROG
},
381 { nv50_gmtyprog_validate
, NV50_NEW_GMTYPROG
},
382 { nv50_fragprog_validate
, NV50_NEW_FRAGPROG
},
383 { nv50_fp_linkage_validate
, NV50_NEW_FRAGPROG
| NV50_NEW_VERTPROG
|
384 NV50_NEW_GMTYPROG
| NV50_NEW_RASTERIZER
},
385 { nv50_gp_linkage_validate
, NV50_NEW_GMTYPROG
| NV50_NEW_VERTPROG
},
386 { nv50_validate_derived_rs
, NV50_NEW_FRAGPROG
| NV50_NEW_RASTERIZER
|
387 NV50_NEW_VERTPROG
| NV50_NEW_GMTYPROG
},
388 { nv50_validate_clip
, NV50_NEW_CLIP
| NV50_NEW_RASTERIZER
|
389 NV50_NEW_VERTPROG
| NV50_NEW_GMTYPROG
},
390 { nv50_constbufs_validate
, NV50_NEW_CONSTBUF
},
391 { nv50_validate_textures
, NV50_NEW_TEXTURES
},
392 { nv50_validate_samplers
, NV50_NEW_SAMPLERS
},
393 { nv50_stream_output_validate
, NV50_NEW_STRMOUT
|
394 NV50_NEW_VERTPROG
| NV50_NEW_GMTYPROG
},
395 { nv50_vertex_arrays_validate
, NV50_NEW_VERTEX
| NV50_NEW_ARRAYS
}
397 #define validate_list_len (sizeof(validate_list) / sizeof(validate_list[0]))
400 nv50_state_validate(struct nv50_context
*nv50
, uint32_t mask
, unsigned words
)
406 if (nv50
->screen
->cur_ctx
!= nv50
)
407 nv50_switch_pipe_context(nv50
);
409 state_mask
= nv50
->dirty
& mask
;
412 for (i
= 0; i
< validate_list_len
; ++i
) {
413 struct state_validate
*validate
= &validate_list
[i
];
415 if (state_mask
& validate
->states
)
416 validate
->func(nv50
);
418 nv50
->dirty
&= ~state_mask
;
420 if (nv50
->state
.rt_serialize
) {
421 nv50
->state
.rt_serialize
= FALSE
;
422 BEGIN_NV04(nv50
->base
.pushbuf
, SUBC_3D(NV50_GRAPH_SERIALIZE
), 1);
423 PUSH_DATA (nv50
->base
.pushbuf
, 0);
426 nv50_bufctx_fence(nv50
->bufctx_3d
, FALSE
);
428 nouveau_pushbuf_bufctx(nv50
->base
.pushbuf
, nv50
->bufctx_3d
);
429 ret
= nouveau_pushbuf_validate(nv50
->base
.pushbuf
);
431 if (unlikely(nv50
->state
.flushed
)) {
432 nv50
->state
.flushed
= FALSE
;
433 nv50_bufctx_fence(nv50
->bufctx_3d
, TRUE
);