Merge remote branch 'origin/master' into nv50-compiler
[mesa.git] / src / gallium / drivers / r600 / r600_context.c
1 /*
2 * Copyright 2010 Jerome Glisse <glisse@freedesktop.org>
3 *
4 * Permission is hereby granted, free of charge, to any person obtaining a
5 * copy of this software and associated documentation files (the "Software"),
6 * to deal in the Software without restriction, including without limitation
7 * on the rights to use, copy, modify, merge, publish, distribute, sub
8 * license, and/or sell copies of the Software, and to permit persons to whom
9 * the Software is furnished to do so, subject to the following conditions:
10 *
11 * The above copyright notice and this permission notice (including the next
12 * paragraph) shall be included in all copies or substantial portions of the
13 * Software.
14 *
15 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
16 * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
17 * FITNESS FOR A PARTICULAR PURPOSE AND NON-INFRINGEMENT. IN NO EVENT SHALL
18 * THE AUTHOR(S) AND/OR THEIR SUPPLIERS BE LIABLE FOR ANY CLAIM,
19 * DAMAGES OR OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR
20 * OTHERWISE, ARISING FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE
21 * USE OR OTHER DEALINGS IN THE SOFTWARE.
22 *
23 * Authors:
24 * Jerome Glisse
25 * Corbin Simpson
26 */
27 #include <stdio.h>
28 #include <util/u_inlines.h>
29 #include <util/u_format.h>
30 #include <util/u_memory.h>
31 #include <util/u_blitter.h>
32 #include "r600_screen.h"
33 #include "r600_context.h"
34 #include "r600_resource.h"
35 #include "r600d.h"
36
37 static void r600_destroy_context(struct pipe_context *context)
38 {
39 struct r600_context *rctx = r600_context(context);
40
41 FREE(rctx);
42 }
43
44 void r600_flush(struct pipe_context *ctx, unsigned flags,
45 struct pipe_fence_handle **fence)
46 {
47 struct r600_context *rctx = r600_context(ctx);
48 struct r600_screen *rscreen = rctx->screen;
49 static int dc = 0;
50 char dname[256];
51
52 if (radeon_ctx_pm4(rctx->ctx))
53 return;
54 /* FIXME dumping should be removed once shader support instructions
55 * without throwing bad code
56 */
57 if (!rctx->ctx->cpm4)
58 goto out;
59 sprintf(dname, "gallium-%08d.bof", dc);
60 if (dc < 1)
61 radeon_ctx_dump_bof(rctx->ctx, dname);
62 #if 1
63 radeon_ctx_submit(rctx->ctx);
64 #endif
65 dc++;
66 out:
67 rctx->ctx = radeon_ctx_decref(rctx->ctx);
68 rctx->ctx = radeon_ctx(rscreen->rw);
69 }
70
71 static void r600_init_config(struct r600_context *rctx)
72 {
73 int ps_prio;
74 int vs_prio;
75 int gs_prio;
76 int es_prio;
77 int num_ps_gprs;
78 int num_vs_gprs;
79 int num_gs_gprs;
80 int num_es_gprs;
81 int num_temp_gprs;
82 int num_ps_threads;
83 int num_vs_threads;
84 int num_gs_threads;
85 int num_es_threads;
86 int num_ps_stack_entries;
87 int num_vs_stack_entries;
88 int num_gs_stack_entries;
89 int num_es_stack_entries;
90 enum radeon_family family;
91
92 family = radeon_get_family(rctx->rw);
93 ps_prio = 0;
94 vs_prio = 1;
95 gs_prio = 2;
96 es_prio = 3;
97 switch (family) {
98 case CHIP_R600:
99 num_ps_gprs = 192;
100 num_vs_gprs = 56;
101 num_temp_gprs = 4;
102 num_gs_gprs = 0;
103 num_es_gprs = 0;
104 num_ps_threads = 136;
105 num_vs_threads = 48;
106 num_gs_threads = 4;
107 num_es_threads = 4;
108 num_ps_stack_entries = 128;
109 num_vs_stack_entries = 128;
110 num_gs_stack_entries = 0;
111 num_es_stack_entries = 0;
112 break;
113 case CHIP_RV630:
114 case CHIP_RV635:
115 num_ps_gprs = 84;
116 num_vs_gprs = 36;
117 num_temp_gprs = 4;
118 num_gs_gprs = 0;
119 num_es_gprs = 0;
120 num_ps_threads = 144;
121 num_vs_threads = 40;
122 num_gs_threads = 4;
123 num_es_threads = 4;
124 num_ps_stack_entries = 40;
125 num_vs_stack_entries = 40;
126 num_gs_stack_entries = 32;
127 num_es_stack_entries = 16;
128 break;
129 case CHIP_RV610:
130 case CHIP_RV620:
131 case CHIP_RS780:
132 case CHIP_RS880:
133 default:
134 num_ps_gprs = 84;
135 num_vs_gprs = 36;
136 num_temp_gprs = 4;
137 num_gs_gprs = 0;
138 num_es_gprs = 0;
139 num_ps_threads = 136;
140 num_vs_threads = 48;
141 num_gs_threads = 4;
142 num_es_threads = 4;
143 num_ps_stack_entries = 40;
144 num_vs_stack_entries = 40;
145 num_gs_stack_entries = 32;
146 num_es_stack_entries = 16;
147 break;
148 case CHIP_RV670:
149 num_ps_gprs = 144;
150 num_vs_gprs = 40;
151 num_temp_gprs = 4;
152 num_gs_gprs = 0;
153 num_es_gprs = 0;
154 num_ps_threads = 136;
155 num_vs_threads = 48;
156 num_gs_threads = 4;
157 num_es_threads = 4;
158 num_ps_stack_entries = 40;
159 num_vs_stack_entries = 40;
160 num_gs_stack_entries = 32;
161 num_es_stack_entries = 16;
162 break;
163 case CHIP_RV770:
164 num_ps_gprs = 192;
165 num_vs_gprs = 56;
166 num_temp_gprs = 4;
167 num_gs_gprs = 0;
168 num_es_gprs = 0;
169 num_ps_threads = 188;
170 num_vs_threads = 60;
171 num_gs_threads = 0;
172 num_es_threads = 0;
173 num_ps_stack_entries = 256;
174 num_vs_stack_entries = 256;
175 num_gs_stack_entries = 0;
176 num_es_stack_entries = 0;
177 break;
178 case CHIP_RV730:
179 case CHIP_RV740:
180 num_ps_gprs = 84;
181 num_vs_gprs = 36;
182 num_temp_gprs = 4;
183 num_gs_gprs = 0;
184 num_es_gprs = 0;
185 num_ps_threads = 188;
186 num_vs_threads = 60;
187 num_gs_threads = 0;
188 num_es_threads = 0;
189 num_ps_stack_entries = 128;
190 num_vs_stack_entries = 128;
191 num_gs_stack_entries = 0;
192 num_es_stack_entries = 0;
193 break;
194 case CHIP_RV710:
195 num_ps_gprs = 192;
196 num_vs_gprs = 56;
197 num_temp_gprs = 4;
198 num_gs_gprs = 0;
199 num_es_gprs = 0;
200 num_ps_threads = 144;
201 num_vs_threads = 48;
202 num_gs_threads = 0;
203 num_es_threads = 0;
204 num_ps_stack_entries = 128;
205 num_vs_stack_entries = 128;
206 num_gs_stack_entries = 0;
207 num_es_stack_entries = 0;
208 break;
209 }
210 rctx->hw_states.config = radeon_state(rctx->rw, R600_CONFIG_TYPE, R600_CONFIG);
211
212 rctx->hw_states.config->states[R600_CONFIG__SQ_CONFIG] = 0x00000000;
213 switch (family) {
214 case CHIP_RV610:
215 case CHIP_RV620:
216 case CHIP_RS780:
217 case CHIP_RS880:
218 case CHIP_RV710:
219 break;
220 default:
221 rctx->hw_states.config->states[R600_CONFIG__SQ_CONFIG] |= S_008C00_VC_ENABLE(1);
222 break;
223 }
224 rctx->hw_states.config->states[R600_CONFIG__SQ_CONFIG] |= S_008C00_DX9_CONSTS(1);
225 rctx->hw_states.config->states[R600_CONFIG__SQ_CONFIG] |= S_008C00_ALU_INST_PREFER_VECTOR(1);
226 rctx->hw_states.config->states[R600_CONFIG__SQ_CONFIG] |= S_008C00_PS_PRIO(ps_prio);
227 rctx->hw_states.config->states[R600_CONFIG__SQ_CONFIG] |= S_008C00_VS_PRIO(vs_prio);
228 rctx->hw_states.config->states[R600_CONFIG__SQ_CONFIG] |= S_008C00_GS_PRIO(gs_prio);
229 rctx->hw_states.config->states[R600_CONFIG__SQ_CONFIG] |= S_008C00_ES_PRIO(es_prio);
230
231 rctx->hw_states.config->states[R600_CONFIG__SQ_GPR_RESOURCE_MGMT_1] = 0;
232 rctx->hw_states.config->states[R600_CONFIG__SQ_GPR_RESOURCE_MGMT_1] |= S_008C04_NUM_PS_GPRS(num_ps_gprs);
233 rctx->hw_states.config->states[R600_CONFIG__SQ_GPR_RESOURCE_MGMT_1] |= S_008C04_NUM_VS_GPRS(num_vs_gprs);
234 rctx->hw_states.config->states[R600_CONFIG__SQ_GPR_RESOURCE_MGMT_1] |= S_008C04_NUM_CLAUSE_TEMP_GPRS(num_temp_gprs);
235
236 rctx->hw_states.config->states[R600_CONFIG__SQ_GPR_RESOURCE_MGMT_2] = 0;
237 rctx->hw_states.config->states[R600_CONFIG__SQ_GPR_RESOURCE_MGMT_2] |= S_008C08_NUM_GS_GPRS(num_gs_gprs);
238 rctx->hw_states.config->states[R600_CONFIG__SQ_GPR_RESOURCE_MGMT_2] |= S_008C08_NUM_GS_GPRS(num_es_gprs);
239
240 rctx->hw_states.config->states[R600_CONFIG__SQ_THREAD_RESOURCE_MGMT] = 0;
241 rctx->hw_states.config->states[R600_CONFIG__SQ_THREAD_RESOURCE_MGMT] |= S_008C0C_NUM_PS_THREADS(num_ps_threads);
242 rctx->hw_states.config->states[R600_CONFIG__SQ_THREAD_RESOURCE_MGMT] |= S_008C0C_NUM_VS_THREADS(num_vs_threads);
243 rctx->hw_states.config->states[R600_CONFIG__SQ_THREAD_RESOURCE_MGMT] |= S_008C0C_NUM_GS_THREADS(num_gs_threads);
244 rctx->hw_states.config->states[R600_CONFIG__SQ_THREAD_RESOURCE_MGMT] |= S_008C0C_NUM_ES_THREADS(num_es_threads);
245
246 rctx->hw_states.config->states[R600_CONFIG__SQ_STACK_RESOURCE_MGMT_1] = 0;
247 rctx->hw_states.config->states[R600_CONFIG__SQ_STACK_RESOURCE_MGMT_1] |= S_008C10_NUM_PS_STACK_ENTRIES(num_ps_stack_entries);
248 rctx->hw_states.config->states[R600_CONFIG__SQ_STACK_RESOURCE_MGMT_1] |= S_008C10_NUM_VS_STACK_ENTRIES(num_vs_stack_entries);
249
250 rctx->hw_states.config->states[R600_CONFIG__SQ_STACK_RESOURCE_MGMT_2] = 0;
251 rctx->hw_states.config->states[R600_CONFIG__SQ_STACK_RESOURCE_MGMT_2] |= S_008C14_NUM_GS_STACK_ENTRIES(num_gs_stack_entries);
252 rctx->hw_states.config->states[R600_CONFIG__SQ_STACK_RESOURCE_MGMT_2] |= S_008C14_NUM_ES_STACK_ENTRIES(num_es_stack_entries);
253
254 rctx->hw_states.config->states[R600_CONFIG__SQ_DYN_GPR_CNTL_PS_FLUSH_REQ] = 0x00004000;
255 rctx->hw_states.config->states[R600_CONFIG__TA_CNTL_AUX] = 0x07000002;
256 rctx->hw_states.config->states[R600_CONFIG__VC_ENHANCE] = 0x00000000;
257 rctx->hw_states.config->states[R600_CONFIG__DB_DEBUG] = 0x00000000;
258 rctx->hw_states.config->states[R600_CONFIG__DB_WATERMARKS] = 0x00420204;
259 rctx->hw_states.config->states[R600_CONFIG__SX_MISC] = 0x00000000;
260 rctx->hw_states.config->states[R600_CONFIG__SPI_THREAD_GROUPING] = 0x00000001;
261 rctx->hw_states.config->states[R600_CONFIG__CB_SHADER_CONTROL] = 0x00000003;
262 rctx->hw_states.config->states[R600_CONFIG__SQ_ESGS_RING_ITEMSIZE] = 0x00000000;
263 rctx->hw_states.config->states[R600_CONFIG__SQ_GSVS_RING_ITEMSIZE] = 0x00000000;
264 rctx->hw_states.config->states[R600_CONFIG__SQ_ESTMP_RING_ITEMSIZE] = 0x00000000;
265 rctx->hw_states.config->states[R600_CONFIG__SQ_GSTMP_RING_ITEMSIZE] = 0x00000000;
266 rctx->hw_states.config->states[R600_CONFIG__SQ_VSTMP_RING_ITEMSIZE] = 0x00000000;
267 rctx->hw_states.config->states[R600_CONFIG__SQ_PSTMP_RING_ITEMSIZE] = 0x00000000;
268 rctx->hw_states.config->states[R600_CONFIG__SQ_FBUF_RING_ITEMSIZE] = 0x00000000;
269 rctx->hw_states.config->states[R600_CONFIG__SQ_REDUC_RING_ITEMSIZE] = 0x00000000;
270 rctx->hw_states.config->states[R600_CONFIG__SQ_GS_VERT_ITEMSIZE] = 0x00000000;
271 rctx->hw_states.config->states[R600_CONFIG__VGT_OUTPUT_PATH_CNTL] = 0x00000000;
272 rctx->hw_states.config->states[R600_CONFIG__VGT_HOS_CNTL] = 0x00000000;
273 rctx->hw_states.config->states[R600_CONFIG__VGT_HOS_MAX_TESS_LEVEL] = 0x00000000;
274 rctx->hw_states.config->states[R600_CONFIG__VGT_HOS_MIN_TESS_LEVEL] = 0x00000000;
275 rctx->hw_states.config->states[R600_CONFIG__VGT_HOS_REUSE_DEPTH] = 0x00000000;
276 rctx->hw_states.config->states[R600_CONFIG__VGT_GROUP_PRIM_TYPE] = 0x00000000;
277 rctx->hw_states.config->states[R600_CONFIG__VGT_GROUP_FIRST_DECR] = 0x00000000;
278 rctx->hw_states.config->states[R600_CONFIG__VGT_GROUP_DECR] = 0x00000000;
279 rctx->hw_states.config->states[R600_CONFIG__VGT_GROUP_VECT_0_CNTL] = 0x00000000;
280 rctx->hw_states.config->states[R600_CONFIG__VGT_GROUP_VECT_1_CNTL] = 0x00000000;
281 rctx->hw_states.config->states[R600_CONFIG__VGT_GROUP_VECT_0_FMT_CNTL] = 0x00000000;
282 rctx->hw_states.config->states[R600_CONFIG__VGT_GROUP_VECT_1_FMT_CNTL] = 0x00000000;
283 rctx->hw_states.config->states[R600_CONFIG__VGT_GS_MODE] = 0x00000000;
284 rctx->hw_states.config->states[R600_CONFIG__PA_SC_MODE_CNTL] = 0x00514000;
285 rctx->hw_states.config->states[R600_CONFIG__VGT_STRMOUT_EN] = 0x00000000;
286 rctx->hw_states.config->states[R600_CONFIG__VGT_REUSE_OFF] = 0x00000001;
287 rctx->hw_states.config->states[R600_CONFIG__VGT_VTX_CNT_EN] = 0x00000000;
288 rctx->hw_states.config->states[R600_CONFIG__VGT_STRMOUT_BUFFER_EN] = 0x00000000;
289 radeon_state_pm4(rctx->hw_states.config);
290 }
291
292 struct pipe_context *r600_create_context(struct pipe_screen *screen, void *priv)
293 {
294 struct r600_context *rctx = CALLOC_STRUCT(r600_context);
295 struct r600_screen* rscreen = r600_screen(screen);
296
297 if (rctx == NULL)
298 return NULL;
299 rctx->context.winsys = rscreen->screen.winsys;
300 rctx->context.screen = screen;
301 rctx->context.priv = priv;
302 rctx->context.destroy = r600_destroy_context;
303 rctx->context.draw_vbo = r600_draw_vbo;
304 rctx->context.flush = r600_flush;
305
306 /* Easy accessing of screen/winsys. */
307 rctx->screen = rscreen;
308 rctx->rw = rscreen->rw;
309
310 r600_init_blit_functions(rctx);
311 r600_init_query_functions(rctx);
312 r600_init_state_functions(rctx);
313 r600_init_context_resource_functions(rctx);
314
315 rctx->blitter = util_blitter_create(&rctx->context);
316 if (rctx->blitter == NULL) {
317 FREE(rctx);
318 return NULL;
319 }
320
321 r600_init_config(rctx);
322
323 rctx->ctx = radeon_ctx(rscreen->rw);
324 rctx->draw = radeon_draw(rscreen->rw);
325 return &rctx->context;
326 }