r600g: add occlusion query support
[mesa.git] / src / gallium / drivers / r600 / r600_context.c
1 /*
2 * Copyright 2010 Jerome Glisse <glisse@freedesktop.org>
3 *
4 * Permission is hereby granted, free of charge, to any person obtaining a
5 * copy of this software and associated documentation files (the "Software"),
6 * to deal in the Software without restriction, including without limitation
7 * on the rights to use, copy, modify, merge, publish, distribute, sub
8 * license, and/or sell copies of the Software, and to permit persons to whom
9 * the Software is furnished to do so, subject to the following conditions:
10 *
11 * The above copyright notice and this permission notice (including the next
12 * paragraph) shall be included in all copies or substantial portions of the
13 * Software.
14 *
15 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
16 * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
17 * FITNESS FOR A PARTICULAR PURPOSE AND NON-INFRINGEMENT. IN NO EVENT SHALL
18 * THE AUTHOR(S) AND/OR THEIR SUPPLIERS BE LIABLE FOR ANY CLAIM,
19 * DAMAGES OR OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR
20 * OTHERWISE, ARISING FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE
21 * USE OR OTHER DEALINGS IN THE SOFTWARE.
22 *
23 * Authors:
24 * Jerome Glisse
25 * Corbin Simpson
26 */
27 #include <stdio.h>
28 #include <util/u_inlines.h>
29 #include <util/u_format.h>
30 #include <util/u_memory.h>
31 #include <util/u_blitter.h>
32 #include "r600_screen.h"
33 #include "r600_context.h"
34 #include "r600_resource.h"
35 #include "r600d.h"
36
37
38 static void r600_destroy_context(struct pipe_context *context)
39 {
40 struct r600_context *rctx = r600_context(context);
41
42 FREE(rctx);
43 }
44
45 void r600_flush(struct pipe_context *ctx, unsigned flags,
46 struct pipe_fence_handle **fence)
47 {
48 struct r600_context *rctx = r600_context(ctx);
49 struct r600_screen *rscreen = rctx->screen;
50 struct r600_query *rquery;
51 static int dc = 0;
52 char dname[256];
53
54 /* suspend queries */
55 r600_queries_suspend(rctx);
56 if (radeon_ctx_pm4(rctx->ctx))
57 goto out;
58 /* FIXME dumping should be removed once shader support instructions
59 * without throwing bad code
60 */
61 if (!rctx->ctx->cpm4)
62 goto out;
63 sprintf(dname, "gallium-%08d.bof", dc);
64 if (dc < 10)
65 radeon_ctx_dump_bof(rctx->ctx, dname);
66 #if 1
67 radeon_ctx_submit(rctx->ctx);
68 #endif
69 LIST_FOR_EACH_ENTRY(rquery, &rctx->query_list, list) {
70 rquery->flushed = true;
71 }
72 dc++;
73 out:
74 rctx->ctx = radeon_ctx_decref(rctx->ctx);
75 rctx->ctx = radeon_ctx(rscreen->rw);
76 /* resume queries */
77 r600_queries_resume(rctx);
78 }
79
80 static void r600_init_config(struct r600_context *rctx)
81 {
82 int ps_prio;
83 int vs_prio;
84 int gs_prio;
85 int es_prio;
86 int num_ps_gprs;
87 int num_vs_gprs;
88 int num_gs_gprs;
89 int num_es_gprs;
90 int num_temp_gprs;
91 int num_ps_threads;
92 int num_vs_threads;
93 int num_gs_threads;
94 int num_es_threads;
95 int num_ps_stack_entries;
96 int num_vs_stack_entries;
97 int num_gs_stack_entries;
98 int num_es_stack_entries;
99 enum radeon_family family;
100
101 family = radeon_get_family(rctx->rw);
102 ps_prio = 0;
103 vs_prio = 1;
104 gs_prio = 2;
105 es_prio = 3;
106 switch (family) {
107 case CHIP_R600:
108 num_ps_gprs = 192;
109 num_vs_gprs = 56;
110 num_temp_gprs = 4;
111 num_gs_gprs = 0;
112 num_es_gprs = 0;
113 num_ps_threads = 136;
114 num_vs_threads = 48;
115 num_gs_threads = 4;
116 num_es_threads = 4;
117 num_ps_stack_entries = 128;
118 num_vs_stack_entries = 128;
119 num_gs_stack_entries = 0;
120 num_es_stack_entries = 0;
121 break;
122 case CHIP_RV630:
123 case CHIP_RV635:
124 num_ps_gprs = 84;
125 num_vs_gprs = 36;
126 num_temp_gprs = 4;
127 num_gs_gprs = 0;
128 num_es_gprs = 0;
129 num_ps_threads = 144;
130 num_vs_threads = 40;
131 num_gs_threads = 4;
132 num_es_threads = 4;
133 num_ps_stack_entries = 40;
134 num_vs_stack_entries = 40;
135 num_gs_stack_entries = 32;
136 num_es_stack_entries = 16;
137 break;
138 case CHIP_RV610:
139 case CHIP_RV620:
140 case CHIP_RS780:
141 case CHIP_RS880:
142 default:
143 num_ps_gprs = 84;
144 num_vs_gprs = 36;
145 num_temp_gprs = 4;
146 num_gs_gprs = 0;
147 num_es_gprs = 0;
148 num_ps_threads = 136;
149 num_vs_threads = 48;
150 num_gs_threads = 4;
151 num_es_threads = 4;
152 num_ps_stack_entries = 40;
153 num_vs_stack_entries = 40;
154 num_gs_stack_entries = 32;
155 num_es_stack_entries = 16;
156 break;
157 case CHIP_RV670:
158 num_ps_gprs = 144;
159 num_vs_gprs = 40;
160 num_temp_gprs = 4;
161 num_gs_gprs = 0;
162 num_es_gprs = 0;
163 num_ps_threads = 136;
164 num_vs_threads = 48;
165 num_gs_threads = 4;
166 num_es_threads = 4;
167 num_ps_stack_entries = 40;
168 num_vs_stack_entries = 40;
169 num_gs_stack_entries = 32;
170 num_es_stack_entries = 16;
171 break;
172 case CHIP_RV770:
173 num_ps_gprs = 192;
174 num_vs_gprs = 56;
175 num_temp_gprs = 4;
176 num_gs_gprs = 0;
177 num_es_gprs = 0;
178 num_ps_threads = 188;
179 num_vs_threads = 60;
180 num_gs_threads = 0;
181 num_es_threads = 0;
182 num_ps_stack_entries = 256;
183 num_vs_stack_entries = 256;
184 num_gs_stack_entries = 0;
185 num_es_stack_entries = 0;
186 break;
187 case CHIP_RV730:
188 case CHIP_RV740:
189 num_ps_gprs = 84;
190 num_vs_gprs = 36;
191 num_temp_gprs = 4;
192 num_gs_gprs = 0;
193 num_es_gprs = 0;
194 num_ps_threads = 188;
195 num_vs_threads = 60;
196 num_gs_threads = 0;
197 num_es_threads = 0;
198 num_ps_stack_entries = 128;
199 num_vs_stack_entries = 128;
200 num_gs_stack_entries = 0;
201 num_es_stack_entries = 0;
202 break;
203 case CHIP_RV710:
204 num_ps_gprs = 192;
205 num_vs_gprs = 56;
206 num_temp_gprs = 4;
207 num_gs_gprs = 0;
208 num_es_gprs = 0;
209 num_ps_threads = 144;
210 num_vs_threads = 48;
211 num_gs_threads = 0;
212 num_es_threads = 0;
213 num_ps_stack_entries = 128;
214 num_vs_stack_entries = 128;
215 num_gs_stack_entries = 0;
216 num_es_stack_entries = 0;
217 break;
218 }
219 rctx->hw_states.config = radeon_state(rctx->rw, R600_CONFIG_TYPE, R600_CONFIG);
220
221 rctx->hw_states.config->states[R600_CONFIG__SQ_CONFIG] = 0x00000000;
222 switch (family) {
223 case CHIP_RV610:
224 case CHIP_RV620:
225 case CHIP_RS780:
226 case CHIP_RS880:
227 case CHIP_RV710:
228 break;
229 default:
230 rctx->hw_states.config->states[R600_CONFIG__SQ_CONFIG] |= S_008C00_VC_ENABLE(1);
231 break;
232 }
233 rctx->hw_states.config->states[R600_CONFIG__SQ_CONFIG] |= S_008C00_DX9_CONSTS(1);
234 rctx->hw_states.config->states[R600_CONFIG__SQ_CONFIG] |= S_008C00_ALU_INST_PREFER_VECTOR(1);
235 rctx->hw_states.config->states[R600_CONFIG__SQ_CONFIG] |= S_008C00_PS_PRIO(ps_prio);
236 rctx->hw_states.config->states[R600_CONFIG__SQ_CONFIG] |= S_008C00_VS_PRIO(vs_prio);
237 rctx->hw_states.config->states[R600_CONFIG__SQ_CONFIG] |= S_008C00_GS_PRIO(gs_prio);
238 rctx->hw_states.config->states[R600_CONFIG__SQ_CONFIG] |= S_008C00_ES_PRIO(es_prio);
239
240 rctx->hw_states.config->states[R600_CONFIG__SQ_GPR_RESOURCE_MGMT_1] = 0;
241 rctx->hw_states.config->states[R600_CONFIG__SQ_GPR_RESOURCE_MGMT_1] |= S_008C04_NUM_PS_GPRS(num_ps_gprs);
242 rctx->hw_states.config->states[R600_CONFIG__SQ_GPR_RESOURCE_MGMT_1] |= S_008C04_NUM_VS_GPRS(num_vs_gprs);
243 rctx->hw_states.config->states[R600_CONFIG__SQ_GPR_RESOURCE_MGMT_1] |= S_008C04_NUM_CLAUSE_TEMP_GPRS(num_temp_gprs);
244
245 rctx->hw_states.config->states[R600_CONFIG__SQ_GPR_RESOURCE_MGMT_2] = 0;
246 rctx->hw_states.config->states[R600_CONFIG__SQ_GPR_RESOURCE_MGMT_2] |= S_008C08_NUM_GS_GPRS(num_gs_gprs);
247 rctx->hw_states.config->states[R600_CONFIG__SQ_GPR_RESOURCE_MGMT_2] |= S_008C08_NUM_GS_GPRS(num_es_gprs);
248
249 rctx->hw_states.config->states[R600_CONFIG__SQ_THREAD_RESOURCE_MGMT] = 0;
250 rctx->hw_states.config->states[R600_CONFIG__SQ_THREAD_RESOURCE_MGMT] |= S_008C0C_NUM_PS_THREADS(num_ps_threads);
251 rctx->hw_states.config->states[R600_CONFIG__SQ_THREAD_RESOURCE_MGMT] |= S_008C0C_NUM_VS_THREADS(num_vs_threads);
252 rctx->hw_states.config->states[R600_CONFIG__SQ_THREAD_RESOURCE_MGMT] |= S_008C0C_NUM_GS_THREADS(num_gs_threads);
253 rctx->hw_states.config->states[R600_CONFIG__SQ_THREAD_RESOURCE_MGMT] |= S_008C0C_NUM_ES_THREADS(num_es_threads);
254
255 rctx->hw_states.config->states[R600_CONFIG__SQ_STACK_RESOURCE_MGMT_1] = 0;
256 rctx->hw_states.config->states[R600_CONFIG__SQ_STACK_RESOURCE_MGMT_1] |= S_008C10_NUM_PS_STACK_ENTRIES(num_ps_stack_entries);
257 rctx->hw_states.config->states[R600_CONFIG__SQ_STACK_RESOURCE_MGMT_1] |= S_008C10_NUM_VS_STACK_ENTRIES(num_vs_stack_entries);
258
259 rctx->hw_states.config->states[R600_CONFIG__SQ_STACK_RESOURCE_MGMT_2] = 0;
260 rctx->hw_states.config->states[R600_CONFIG__SQ_STACK_RESOURCE_MGMT_2] |= S_008C14_NUM_GS_STACK_ENTRIES(num_gs_stack_entries);
261 rctx->hw_states.config->states[R600_CONFIG__SQ_STACK_RESOURCE_MGMT_2] |= S_008C14_NUM_ES_STACK_ENTRIES(num_es_stack_entries);
262
263 rctx->hw_states.config->states[R600_CONFIG__SQ_DYN_GPR_CNTL_PS_FLUSH_REQ] = 0x00004000;
264 rctx->hw_states.config->states[R600_CONFIG__TA_CNTL_AUX] = 0x07000002;
265 rctx->hw_states.config->states[R600_CONFIG__VC_ENHANCE] = 0x00000000;
266 rctx->hw_states.config->states[R600_CONFIG__DB_DEBUG] = 0x00000000;
267 rctx->hw_states.config->states[R600_CONFIG__DB_WATERMARKS] = 0x00420204;
268 rctx->hw_states.config->states[R600_CONFIG__SX_MISC] = 0x00000000;
269 rctx->hw_states.config->states[R600_CONFIG__SPI_THREAD_GROUPING] = 0x00000001;
270 rctx->hw_states.config->states[R600_CONFIG__CB_SHADER_CONTROL] = 0x00000003;
271 rctx->hw_states.config->states[R600_CONFIG__SQ_ESGS_RING_ITEMSIZE] = 0x00000000;
272 rctx->hw_states.config->states[R600_CONFIG__SQ_GSVS_RING_ITEMSIZE] = 0x00000000;
273 rctx->hw_states.config->states[R600_CONFIG__SQ_ESTMP_RING_ITEMSIZE] = 0x00000000;
274 rctx->hw_states.config->states[R600_CONFIG__SQ_GSTMP_RING_ITEMSIZE] = 0x00000000;
275 rctx->hw_states.config->states[R600_CONFIG__SQ_VSTMP_RING_ITEMSIZE] = 0x00000000;
276 rctx->hw_states.config->states[R600_CONFIG__SQ_PSTMP_RING_ITEMSIZE] = 0x00000000;
277 rctx->hw_states.config->states[R600_CONFIG__SQ_FBUF_RING_ITEMSIZE] = 0x00000000;
278 rctx->hw_states.config->states[R600_CONFIG__SQ_REDUC_RING_ITEMSIZE] = 0x00000000;
279 rctx->hw_states.config->states[R600_CONFIG__SQ_GS_VERT_ITEMSIZE] = 0x00000000;
280 rctx->hw_states.config->states[R600_CONFIG__VGT_OUTPUT_PATH_CNTL] = 0x00000000;
281 rctx->hw_states.config->states[R600_CONFIG__VGT_HOS_CNTL] = 0x00000000;
282 rctx->hw_states.config->states[R600_CONFIG__VGT_HOS_MAX_TESS_LEVEL] = 0x00000000;
283 rctx->hw_states.config->states[R600_CONFIG__VGT_HOS_MIN_TESS_LEVEL] = 0x00000000;
284 rctx->hw_states.config->states[R600_CONFIG__VGT_HOS_REUSE_DEPTH] = 0x00000000;
285 rctx->hw_states.config->states[R600_CONFIG__VGT_GROUP_PRIM_TYPE] = 0x00000000;
286 rctx->hw_states.config->states[R600_CONFIG__VGT_GROUP_FIRST_DECR] = 0x00000000;
287 rctx->hw_states.config->states[R600_CONFIG__VGT_GROUP_DECR] = 0x00000000;
288 rctx->hw_states.config->states[R600_CONFIG__VGT_GROUP_VECT_0_CNTL] = 0x00000000;
289 rctx->hw_states.config->states[R600_CONFIG__VGT_GROUP_VECT_1_CNTL] = 0x00000000;
290 rctx->hw_states.config->states[R600_CONFIG__VGT_GROUP_VECT_0_FMT_CNTL] = 0x00000000;
291 rctx->hw_states.config->states[R600_CONFIG__VGT_GROUP_VECT_1_FMT_CNTL] = 0x00000000;
292 rctx->hw_states.config->states[R600_CONFIG__VGT_GS_MODE] = 0x00000000;
293 rctx->hw_states.config->states[R600_CONFIG__PA_SC_MODE_CNTL] = 0x00514000;
294 rctx->hw_states.config->states[R600_CONFIG__VGT_STRMOUT_EN] = 0x00000000;
295 rctx->hw_states.config->states[R600_CONFIG__VGT_REUSE_OFF] = 0x00000001;
296 rctx->hw_states.config->states[R600_CONFIG__VGT_VTX_CNT_EN] = 0x00000000;
297 rctx->hw_states.config->states[R600_CONFIG__VGT_STRMOUT_BUFFER_EN] = 0x00000000;
298 radeon_state_pm4(rctx->hw_states.config);
299 }
300
301 struct pipe_context *r600_create_context(struct pipe_screen *screen, void *priv)
302 {
303 struct r600_context *rctx = CALLOC_STRUCT(r600_context);
304 struct r600_screen* rscreen = r600_screen(screen);
305
306 if (rctx == NULL)
307 return NULL;
308 rctx->context.winsys = rscreen->screen.winsys;
309 rctx->context.screen = screen;
310 rctx->context.priv = priv;
311 rctx->context.destroy = r600_destroy_context;
312 rctx->context.draw_vbo = r600_draw_vbo;
313 rctx->context.flush = r600_flush;
314
315 /* Easy accessing of screen/winsys. */
316 rctx->screen = rscreen;
317 rctx->rw = rscreen->rw;
318
319 r600_init_blit_functions(rctx);
320 r600_init_query_functions(rctx);
321 r600_init_state_functions(rctx);
322 r600_init_context_resource_functions(rctx);
323
324 rctx->blitter = util_blitter_create(&rctx->context);
325 if (rctx->blitter == NULL) {
326 FREE(rctx);
327 return NULL;
328 }
329
330 r600_init_config(rctx);
331
332 rctx->ctx = radeon_ctx(rscreen->rw);
333 rctx->draw = radeon_draw(rscreen->rw);
334 return &rctx->context;
335 }