nvc0: support PIPE_CAP_RESOURCE_FROM_USER_MEMORY_COMPUTE_ONLY
[mesa.git] / src / gallium / drivers / nouveau / nv50 / nv50_context.c
1 /*
2 * Copyright 2010 Christoph Bumiller
3 *
4 * Permission is hereby granted, free of charge, to any person obtaining a
5 * copy of this software and associated documentation files (the "Software"),
6 * to deal in the Software without restriction, including without limitation
7 * the rights to use, copy, modify, merge, publish, distribute, sublicense,
8 * and/or sell copies of the Software, and to permit persons to whom the
9 * Software is furnished to do so, subject to the following conditions:
10 *
11 * The above copyright notice and this permission notice shall be included in
12 * all copies or substantial portions of the Software.
13 *
14 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
15 * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
16 * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL
17 * THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR
18 * OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE,
19 * ARISING FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR
20 * OTHER DEALINGS IN THE SOFTWARE.
21 */
22
23 #include "pipe/p_defines.h"
24 #include "util/u_framebuffer.h"
25 #include "util/u_upload_mgr.h"
26
27 #include "nv50/nv50_context.h"
28 #include "nv50/nv50_screen.h"
29 #include "nv50/nv50_resource.h"
30
31 static void
32 nv50_flush(struct pipe_context *pipe,
33 struct pipe_fence_handle **fence,
34 unsigned flags)
35 {
36 struct nouveau_screen *screen = nouveau_screen(pipe->screen);
37
38 if (fence)
39 nouveau_fence_ref(screen->fence.current, (struct nouveau_fence **)fence);
40
41 PUSH_KICK(screen->pushbuf);
42
43 nouveau_context_update_frame_stats(nouveau_context(pipe));
44 }
45
46 static void
47 nv50_texture_barrier(struct pipe_context *pipe, unsigned flags)
48 {
49 struct nouveau_pushbuf *push = nv50_context(pipe)->base.pushbuf;
50
51 BEGIN_NV04(push, SUBC_3D(NV50_GRAPH_SERIALIZE), 1);
52 PUSH_DATA (push, 0);
53 BEGIN_NV04(push, NV50_3D(TEX_CACHE_CTL), 1);
54 PUSH_DATA (push, 0x20);
55 }
56
57 static void
58 nv50_memory_barrier(struct pipe_context *pipe, unsigned flags)
59 {
60 struct nv50_context *nv50 = nv50_context(pipe);
61 int i, s;
62
63 if (flags & PIPE_BARRIER_MAPPED_BUFFER) {
64 for (i = 0; i < nv50->num_vtxbufs; ++i) {
65 if (!nv50->vtxbuf[i].buffer.resource && !nv50->vtxbuf[i].is_user_buffer)
66 continue;
67 if (nv50->vtxbuf[i].buffer.resource->flags & PIPE_RESOURCE_FLAG_MAP_PERSISTENT)
68 nv50->base.vbo_dirty = true;
69 }
70
71 for (s = 0; s < 3 && !nv50->cb_dirty; ++s) {
72 uint32_t valid = nv50->constbuf_valid[s];
73
74 while (valid && !nv50->cb_dirty) {
75 const unsigned i = ffs(valid) - 1;
76 struct pipe_resource *res;
77
78 valid &= ~(1 << i);
79 if (nv50->constbuf[s][i].user)
80 continue;
81
82 res = nv50->constbuf[s][i].u.buf;
83 if (!res)
84 continue;
85
86 if (res->flags & PIPE_RESOURCE_FLAG_MAP_PERSISTENT)
87 nv50->cb_dirty = true;
88 }
89 }
90 }
91 }
92
93 static void
94 nv50_emit_string_marker(struct pipe_context *pipe, const char *str, int len)
95 {
96 struct nouveau_pushbuf *push = nv50_context(pipe)->base.pushbuf;
97 int string_words = len / 4;
98 int data_words;
99
100 if (len <= 0)
101 return;
102 string_words = MIN2(string_words, NV04_PFIFO_MAX_PACKET_LEN);
103 if (string_words == NV04_PFIFO_MAX_PACKET_LEN)
104 data_words = string_words;
105 else
106 data_words = string_words + !!(len & 3);
107 BEGIN_NI04(push, SUBC_3D(NV04_GRAPH_NOP), data_words);
108 if (string_words)
109 PUSH_DATAp(push, str, string_words);
110 if (string_words != data_words) {
111 int data = 0;
112 memcpy(&data, &str[string_words * 4], len & 3);
113 PUSH_DATA (push, data);
114 }
115 }
116
117 void
118 nv50_default_kick_notify(struct nouveau_pushbuf *push)
119 {
120 struct nv50_screen *screen = push->user_priv;
121
122 if (screen) {
123 nouveau_fence_next(&screen->base);
124 nouveau_fence_update(&screen->base, true);
125 if (screen->cur_ctx)
126 screen->cur_ctx->state.flushed = true;
127 }
128 }
129
130 static void
131 nv50_context_unreference_resources(struct nv50_context *nv50)
132 {
133 unsigned s, i;
134
135 nouveau_bufctx_del(&nv50->bufctx_3d);
136 nouveau_bufctx_del(&nv50->bufctx);
137 nouveau_bufctx_del(&nv50->bufctx_cp);
138
139 util_unreference_framebuffer_state(&nv50->framebuffer);
140
141 assert(nv50->num_vtxbufs <= PIPE_MAX_ATTRIBS);
142 for (i = 0; i < nv50->num_vtxbufs; ++i)
143 pipe_vertex_buffer_unreference(&nv50->vtxbuf[i]);
144
145 for (s = 0; s < 3; ++s) {
146 assert(nv50->num_textures[s] <= PIPE_MAX_SAMPLERS);
147 for (i = 0; i < nv50->num_textures[s]; ++i)
148 pipe_sampler_view_reference(&nv50->textures[s][i], NULL);
149
150 for (i = 0; i < NV50_MAX_PIPE_CONSTBUFS; ++i)
151 if (!nv50->constbuf[s][i].user)
152 pipe_resource_reference(&nv50->constbuf[s][i].u.buf, NULL);
153 }
154
155 for (i = 0; i < nv50->global_residents.size / sizeof(struct pipe_resource *);
156 ++i) {
157 struct pipe_resource **res = util_dynarray_element(
158 &nv50->global_residents, struct pipe_resource *, i);
159 pipe_resource_reference(res, NULL);
160 }
161 util_dynarray_fini(&nv50->global_residents);
162 }
163
164 static void
165 nv50_destroy(struct pipe_context *pipe)
166 {
167 struct nv50_context *nv50 = nv50_context(pipe);
168
169 if (nv50->screen->cur_ctx == nv50) {
170 nv50->screen->cur_ctx = NULL;
171 /* Save off the state in case another context gets created */
172 nv50->screen->save_state = nv50->state;
173 }
174
175 if (nv50->base.pipe.stream_uploader)
176 u_upload_destroy(nv50->base.pipe.stream_uploader);
177
178 nouveau_pushbuf_bufctx(nv50->base.pushbuf, NULL);
179 nouveau_pushbuf_kick(nv50->base.pushbuf, nv50->base.pushbuf->channel);
180
181 nv50_context_unreference_resources(nv50);
182
183 FREE(nv50->blit);
184
185 nouveau_context_destroy(&nv50->base);
186 }
187
188 static int
189 nv50_invalidate_resource_storage(struct nouveau_context *ctx,
190 struct pipe_resource *res,
191 int ref)
192 {
193 struct nv50_context *nv50 = nv50_context(&ctx->pipe);
194 unsigned bind = res->bind ? res->bind : PIPE_BIND_VERTEX_BUFFER;
195 unsigned s, i;
196
197 if (bind & PIPE_BIND_RENDER_TARGET) {
198 assert(nv50->framebuffer.nr_cbufs <= PIPE_MAX_COLOR_BUFS);
199 for (i = 0; i < nv50->framebuffer.nr_cbufs; ++i) {
200 if (nv50->framebuffer.cbufs[i] &&
201 nv50->framebuffer.cbufs[i]->texture == res) {
202 nv50->dirty_3d |= NV50_NEW_3D_FRAMEBUFFER;
203 nouveau_bufctx_reset(nv50->bufctx_3d, NV50_BIND_3D_FB);
204 if (!--ref)
205 return ref;
206 }
207 }
208 }
209 if (bind & PIPE_BIND_DEPTH_STENCIL) {
210 if (nv50->framebuffer.zsbuf &&
211 nv50->framebuffer.zsbuf->texture == res) {
212 nv50->dirty_3d |= NV50_NEW_3D_FRAMEBUFFER;
213 nouveau_bufctx_reset(nv50->bufctx_3d, NV50_BIND_3D_FB);
214 if (!--ref)
215 return ref;
216 }
217 }
218
219 if (bind & (PIPE_BIND_VERTEX_BUFFER |
220 PIPE_BIND_INDEX_BUFFER |
221 PIPE_BIND_CONSTANT_BUFFER |
222 PIPE_BIND_STREAM_OUTPUT |
223 PIPE_BIND_SAMPLER_VIEW)) {
224
225 assert(nv50->num_vtxbufs <= PIPE_MAX_ATTRIBS);
226 for (i = 0; i < nv50->num_vtxbufs; ++i) {
227 if (nv50->vtxbuf[i].buffer.resource == res) {
228 nv50->dirty_3d |= NV50_NEW_3D_ARRAYS;
229 nouveau_bufctx_reset(nv50->bufctx_3d, NV50_BIND_3D_VERTEX);
230 if (!--ref)
231 return ref;
232 }
233 }
234
235 for (s = 0; s < 3; ++s) {
236 assert(nv50->num_textures[s] <= PIPE_MAX_SAMPLERS);
237 for (i = 0; i < nv50->num_textures[s]; ++i) {
238 if (nv50->textures[s][i] &&
239 nv50->textures[s][i]->texture == res) {
240 nv50->dirty_3d |= NV50_NEW_3D_TEXTURES;
241 nouveau_bufctx_reset(nv50->bufctx_3d, NV50_BIND_3D_TEXTURES);
242 if (!--ref)
243 return ref;
244 }
245 }
246 }
247
248 for (s = 0; s < 3; ++s) {
249 for (i = 0; i < NV50_MAX_PIPE_CONSTBUFS; ++i) {
250 if (!(nv50->constbuf_valid[s] & (1 << i)))
251 continue;
252 if (!nv50->constbuf[s][i].user &&
253 nv50->constbuf[s][i].u.buf == res) {
254 nv50->dirty_3d |= NV50_NEW_3D_CONSTBUF;
255 nv50->constbuf_dirty[s] |= 1 << i;
256 nouveau_bufctx_reset(nv50->bufctx_3d, NV50_BIND_3D_CB(s, i));
257 if (!--ref)
258 return ref;
259 }
260 }
261 }
262 }
263
264 return ref;
265 }
266
/* Forward declaration: the definition follows nv50_create(), which installs
 * this function as pipe_context::get_sample_position.
 */
static void
nv50_context_get_sample_position(struct pipe_context *pipe,
                                 unsigned sample_count,
                                 unsigned sample_index,
                                 float *xy);
270
271 struct pipe_context *
272 nv50_create(struct pipe_screen *pscreen, void *priv, unsigned ctxflags)
273 {
274 struct nv50_screen *screen = nv50_screen(pscreen);
275 struct nv50_context *nv50;
276 struct pipe_context *pipe;
277 int ret;
278 uint32_t flags;
279
280 nv50 = CALLOC_STRUCT(nv50_context);
281 if (!nv50)
282 return NULL;
283 pipe = &nv50->base.pipe;
284
285 if (!nv50_blitctx_create(nv50))
286 goto out_err;
287
288 nv50->base.pushbuf = screen->base.pushbuf;
289 nv50->base.client = screen->base.client;
290
291 ret = nouveau_bufctx_new(screen->base.client, 2, &nv50->bufctx);
292 if (!ret)
293 ret = nouveau_bufctx_new(screen->base.client, NV50_BIND_3D_COUNT,
294 &nv50->bufctx_3d);
295 if (!ret)
296 ret = nouveau_bufctx_new(screen->base.client, NV50_BIND_CP_COUNT,
297 &nv50->bufctx_cp);
298 if (ret)
299 goto out_err;
300
301 nv50->base.screen = &screen->base;
302 nv50->base.copy_data = nv50_m2mf_copy_linear;
303 nv50->base.push_data = nv50_sifc_linear_u8;
304 nv50->base.push_cb = nv50_cb_push;
305
306 nv50->screen = screen;
307 pipe->screen = pscreen;
308 pipe->priv = priv;
309 pipe->stream_uploader = u_upload_create_default(pipe);
310 if (!pipe->stream_uploader)
311 goto out_err;
312 pipe->const_uploader = pipe->stream_uploader;
313
314 pipe->destroy = nv50_destroy;
315
316 pipe->draw_vbo = nv50_draw_vbo;
317 pipe->clear = nv50_clear;
318 pipe->launch_grid = nv50_launch_grid;
319
320 pipe->flush = nv50_flush;
321 pipe->texture_barrier = nv50_texture_barrier;
322 pipe->memory_barrier = nv50_memory_barrier;
323 pipe->get_sample_position = nv50_context_get_sample_position;
324 pipe->emit_string_marker = nv50_emit_string_marker;
325
326 if (!screen->cur_ctx) {
327 /* Restore the last context's state here, normally handled during
328 * context switch
329 */
330 nv50->state = screen->save_state;
331 screen->cur_ctx = nv50;
332 nouveau_pushbuf_bufctx(screen->base.pushbuf, nv50->bufctx);
333 }
334 nv50->base.pushbuf->kick_notify = nv50_default_kick_notify;
335
336 nouveau_context_init(&nv50->base);
337 nv50_init_query_functions(nv50);
338 nv50_init_surface_functions(nv50);
339 nv50_init_state_functions(nv50);
340 nv50_init_resource_functions(pipe);
341
342 nv50->base.invalidate_resource_storage = nv50_invalidate_resource_storage;
343
344 if (screen->base.device->chipset < 0x84 ||
345 debug_get_bool_option("NOUVEAU_PMPEG", false)) {
346 /* PMPEG */
347 nouveau_context_init_vdec(&nv50->base);
348 } else if (screen->base.device->chipset < 0x98 ||
349 screen->base.device->chipset == 0xa0) {
350 /* VP2 */
351 pipe->create_video_codec = nv84_create_decoder;
352 pipe->create_video_buffer = nv84_video_buffer_create;
353 } else {
354 /* VP3/4 */
355 pipe->create_video_codec = nv98_create_decoder;
356 pipe->create_video_buffer = nv98_video_buffer_create;
357 }
358
359 flags = NOUVEAU_BO_VRAM | NOUVEAU_BO_RD;
360
361 BCTX_REFN_bo(nv50->bufctx_3d, 3D_SCREEN, flags, screen->code);
362 BCTX_REFN_bo(nv50->bufctx_3d, 3D_SCREEN, flags, screen->uniforms);
363 BCTX_REFN_bo(nv50->bufctx_3d, 3D_SCREEN, flags, screen->txc);
364 BCTX_REFN_bo(nv50->bufctx_3d, 3D_SCREEN, flags, screen->stack_bo);
365 if (screen->compute) {
366 BCTX_REFN_bo(nv50->bufctx_cp, CP_SCREEN, flags, screen->code);
367 BCTX_REFN_bo(nv50->bufctx_cp, CP_SCREEN, flags, screen->txc);
368 BCTX_REFN_bo(nv50->bufctx_cp, CP_SCREEN, flags, screen->stack_bo);
369 }
370
371 flags = NOUVEAU_BO_GART | NOUVEAU_BO_WR;
372
373 BCTX_REFN_bo(nv50->bufctx_3d, 3D_SCREEN, flags, screen->fence.bo);
374 BCTX_REFN_bo(nv50->bufctx, FENCE, flags, screen->fence.bo);
375 if (screen->compute)
376 BCTX_REFN_bo(nv50->bufctx_cp, CP_SCREEN, flags, screen->fence.bo);
377
378 nv50->base.scratch.bo_size = 2 << 20;
379
380 util_dynarray_init(&nv50->global_residents, NULL);
381
382 // Make sure that the first TSC entry has SRGB conversion bit set, since we
383 // use it as a fallback.
384 if (!screen->tsc.entries[0])
385 nv50_upload_tsc0(nv50);
386
387 // And mark samplers as dirty so that the first slot would get bound to the
388 // zero entry if it's not otherwise set.
389 nv50->dirty_3d |= NV50_NEW_3D_SAMPLERS;
390
391 return pipe;
392
393 out_err:
394 if (pipe->stream_uploader)
395 u_upload_destroy(pipe->stream_uploader);
396 if (nv50->bufctx_3d)
397 nouveau_bufctx_del(&nv50->bufctx_3d);
398 if (nv50->bufctx_cp)
399 nouveau_bufctx_del(&nv50->bufctx_cp);
400 if (nv50->bufctx)
401 nouveau_bufctx_del(&nv50->bufctx);
402 FREE(nv50->blit);
403 FREE(nv50);
404 return NULL;
405 }
406
407 void
408 nv50_bufctx_fence(struct nouveau_bufctx *bufctx, bool on_flush)
409 {
410 struct nouveau_list *list = on_flush ? &bufctx->current : &bufctx->pending;
411 struct nouveau_list *it;
412
413 for (it = list->next; it != list; it = it->next) {
414 struct nouveau_bufref *ref = (struct nouveau_bufref *)it;
415 struct nv04_resource *res = ref->priv;
416 if (res)
417 nv50_resource_validate(res, (unsigned)ref->priv_data);
418 }
419 }
420
/* Report the position of one sample within a pixel.
 *
 * pipe:         not consulted.
 * sample_count: 0, 1, 2, 4 or 8; 0 is treated like 1.
 * sample_index: index of the sample, must be below the table size for
 *               sample_count.
 * xy:           receives the x and y position; the table entries are scaled
 *               by 1/16 (0.0625).
 *
 * An unsupported sample_count or an out-of-range sample_index trips an
 * assertion; in builds without assertions xy is left untouched.
 */
static void
nv50_context_get_sample_position(struct pipe_context *pipe,
                                 unsigned sample_count, unsigned sample_index,
                                 float *xy)
{
   static const uint8_t ms1[1][2] = { { 0x8, 0x8 } };
   static const uint8_t ms2[2][2] = {
      { 0x4, 0x4 }, { 0xc, 0xc } }; /* surface coords (0,0), (1,0) */
   static const uint8_t ms4[4][2] = {
      { 0x6, 0x2 }, { 0xe, 0x6 },   /* (0,0), (1,0) */
      { 0x2, 0xa }, { 0xa, 0xe } }; /* (0,1), (1,1) */
   static const uint8_t ms8[8][2] = {
      { 0x1, 0x7 }, { 0x5, 0x3 },   /* (0,0), (1,0) */
      { 0x3, 0xd }, { 0x7, 0xb },   /* (0,1), (1,1) */
      { 0x9, 0x5 }, { 0xf, 0x1 },   /* (2,0), (3,0) */
      { 0xb, 0xf }, { 0xd, 0x9 } }; /* (2,1), (3,1) */
#if 0
   /* NOTE: there are alternative modes for MS2 and MS8, currently not used */
   static const uint8_t ms8_alt[8][2] = {
      { 0x9, 0x5 }, { 0x7, 0xb },   /* (2,0), (1,1) */
      { 0xd, 0x9 }, { 0x5, 0x3 },   /* (3,1), (1,0) */
      { 0x3, 0xd }, { 0x1, 0x7 },   /* (0,1), (0,0) */
      { 0xb, 0xf }, { 0xf, 0x1 } }; /* (2,1), (3,0) */
#endif

   const uint8_t (*ptr)[2];
   unsigned num_entries;

   switch (sample_count) {
   case 0:
   case 1: ptr = ms1; num_entries = 1; break;
   case 2: ptr = ms2; num_entries = 2; break;
   case 4: ptr = ms4; num_entries = 4; break;
   case 8: ptr = ms8; num_entries = 8; break;
   default:
      assert(0);
      return; /* bad sample count -> undefined locations */
   }

   /* Never read past the end of the selected table. */
   assert(sample_index < num_entries);
   if (sample_index >= num_entries)
      return; /* bad sample index -> undefined locations */

   xy[0] = ptr[sample_index][0] * 0.0625f;
   xy[1] = ptr[sample_index][1] * 0.0625f;
}