freedreno: re-order support for hw queries
[mesa.git] / src / gallium / drivers / freedreno / freedreno_context.c
1 /* -*- mode: C; c-file-style: "k&r"; tab-width: 4; indent-tabs-mode: t; -*- */
2
3 /*
4 * Copyright (C) 2012 Rob Clark <robclark@freedesktop.org>
5 *
6 * Permission is hereby granted, free of charge, to any person obtaining a
7 * copy of this software and associated documentation files (the "Software"),
8 * to deal in the Software without restriction, including without limitation
9 * the rights to use, copy, modify, merge, publish, distribute, sublicense,
10 * and/or sell copies of the Software, and to permit persons to whom the
11 * Software is furnished to do so, subject to the following conditions:
12 *
13 * The above copyright notice and this permission notice (including the next
14 * paragraph) shall be included in all copies or substantial portions of the
15 * Software.
16 *
17 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
18 * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
19 * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL
20 * THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
21 * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
22 * OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
23 * SOFTWARE.
24 *
25 * Authors:
26 * Rob Clark <robclark@freedesktop.org>
27 */
28
29 #include "freedreno_context.h"
30 #include "freedreno_draw.h"
31 #include "freedreno_fence.h"
32 #include "freedreno_program.h"
33 #include "freedreno_resource.h"
34 #include "freedreno_texture.h"
35 #include "freedreno_state.h"
36 #include "freedreno_gmem.h"
37 #include "freedreno_query.h"
38 #include "freedreno_query_hw.h"
39 #include "freedreno_util.h"
40
41 static void
42 fd_context_flush(struct pipe_context *pctx, struct pipe_fence_handle **fence,
43 unsigned flags)
44 {
45 struct fd_context *ctx = fd_context(pctx);
46 uint32_t timestamp;
47
48 if (!ctx->screen->reorder) {
49 struct fd_batch *batch = NULL;
50 fd_batch_reference(&batch, ctx->batch);
51 fd_batch_flush(batch);
52 timestamp = fd_ringbuffer_timestamp(batch->gmem);
53 fd_batch_reference(&batch, NULL);
54 } else {
55 timestamp = fd_bc_flush(&ctx->screen->batch_cache, ctx);
56 }
57
58 if (fence) {
59 fd_screen_fence_ref(pctx->screen, fence, NULL);
60 *fence = fd_fence_create(pctx, timestamp);
61 }
62 }
63
64 /**
65 * emit marker string as payload of a no-op packet, which can be
66 * decoded by cffdump.
67 */
68 static void
69 fd_emit_string_marker(struct pipe_context *pctx, const char *string, int len)
70 {
71 struct fd_context *ctx = fd_context(pctx);
72 struct fd_ringbuffer *ring;
73 const uint32_t *buf = (const void *)string;
74
75 if (!ctx->batch)
76 return;
77
78 ring = ctx->batch->draw;
79
80 /* max packet size is 0x3fff dwords: */
81 len = MIN2(len, 0x3fff * 4);
82
83 OUT_PKT3(ring, CP_NOP, align(len, 4) / 4);
84 while (len >= 4) {
85 OUT_RING(ring, *buf);
86 buf++;
87 len -= 4;
88 }
89
90 /* copy remainder bytes without reading past end of input string: */
91 if (len > 0) {
92 uint32_t w = 0;
93 memcpy(&w, buf, len);
94 OUT_RING(ring, w);
95 }
96 }
97
98 void
99 fd_context_destroy(struct pipe_context *pctx)
100 {
101 struct fd_context *ctx = fd_context(pctx);
102 unsigned i;
103
104 DBG("");
105
106 fd_batch_reference(&ctx->batch, NULL); /* unref current batch */
107 fd_bc_invalidate_context(ctx);
108
109 fd_prog_fini(pctx);
110 fd_hw_query_fini(pctx);
111
112 if (ctx->blitter)
113 util_blitter_destroy(ctx->blitter);
114
115 if (ctx->primconvert)
116 util_primconvert_destroy(ctx->primconvert);
117
118 util_slab_destroy(&ctx->transfer_pool);
119
120 for (i = 0; i < ARRAY_SIZE(ctx->pipe); i++) {
121 struct fd_vsc_pipe *pipe = &ctx->pipe[i];
122 if (!pipe->bo)
123 break;
124 fd_bo_del(pipe->bo);
125 }
126
127 fd_device_del(ctx->dev);
128
129 if (fd_mesa_debug & (FD_DBG_BSTAT | FD_DBG_MSGS)) {
130 printf("batch_total=%u, batch_sysmem=%u, batch_gmem=%u, batch_restore=%u\n",
131 (uint32_t)ctx->stats.batch_total, (uint32_t)ctx->stats.batch_sysmem,
132 (uint32_t)ctx->stats.batch_gmem, (uint32_t)ctx->stats.batch_restore);
133 }
134
135 FREE(ctx);
136 }
137
138 static void
139 fd_set_debug_callback(struct pipe_context *pctx,
140 const struct pipe_debug_callback *cb)
141 {
142 struct fd_context *ctx = fd_context(pctx);
143
144 if (cb)
145 ctx->debug = *cb;
146 else
147 memset(&ctx->debug, 0, sizeof(ctx->debug));
148 }
149
150 struct pipe_context *
151 fd_context_init(struct fd_context *ctx, struct pipe_screen *pscreen,
152 const uint8_t *primtypes, void *priv)
153 {
154 struct fd_screen *screen = fd_screen(pscreen);
155 struct pipe_context *pctx;
156 int i;
157
158 ctx->screen = screen;
159
160 ctx->primtypes = primtypes;
161 ctx->primtype_mask = 0;
162 for (i = 0; i < PIPE_PRIM_MAX; i++)
163 if (primtypes[i])
164 ctx->primtype_mask |= (1 << i);
165
166 /* need some sane default in case state tracker doesn't
167 * set some state:
168 */
169 ctx->sample_mask = 0xffff;
170
171 pctx = &ctx->base;
172 pctx->screen = pscreen;
173 pctx->priv = priv;
174 pctx->flush = fd_context_flush;
175 pctx->emit_string_marker = fd_emit_string_marker;
176 pctx->set_debug_callback = fd_set_debug_callback;
177
178 /* TODO what about compute? Ideally it creates it's own independent
179 * batches per compute job (since it isn't using tiling, so no point
180 * in getting involved with the re-ordering madness)..
181 */
182 if (!screen->reorder)
183 ctx->batch = fd_bc_alloc_batch(&screen->batch_cache, ctx);
184
185 fd_reset_wfi(ctx);
186
187 util_slab_create(&ctx->transfer_pool, sizeof(struct fd_transfer),
188 16, UTIL_SLAB_SINGLETHREADED);
189
190 fd_draw_init(pctx);
191 fd_resource_context_init(pctx);
192 fd_query_context_init(pctx);
193 fd_texture_init(pctx);
194 fd_state_init(pctx);
195 fd_hw_query_init(pctx);
196
197 ctx->blitter = util_blitter_create(pctx);
198 if (!ctx->blitter)
199 goto fail;
200
201 ctx->primconvert = util_primconvert_create(pctx, ctx->primtype_mask);
202 if (!ctx->primconvert)
203 goto fail;
204
205 return pctx;
206
207 fail:
208 pctx->destroy(pctx);
209 return NULL;
210 }