r200: Convert r200 to use new style debug code.
[mesa.git] / src / mesa / drivers / dri / r200 / r200_cmdbuf.c
1 /*
2 Copyright (C) The Weather Channel, Inc. 2002. All Rights Reserved.
3
4 The Weather Channel (TM) funded Tungsten Graphics to develop the
5 initial release of the Radeon 8500 driver under the XFree86 license.
6 This notice must be preserved.
7
8 Permission is hereby granted, free of charge, to any person obtaining
9 a copy of this software and associated documentation files (the
10 "Software"), to deal in the Software without restriction, including
11 without limitation the rights to use, copy, modify, merge, publish,
12 distribute, sublicense, and/or sell copies of the Software, and to
13 permit persons to whom the Software is furnished to do so, subject to
14 the following conditions:
15
16 The above copyright notice and this permission notice (including the
17 next paragraph) shall be included in all copies or substantial
18 portions of the Software.
19
20 THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND,
21 EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF
22 MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT.
23 IN NO EVENT SHALL THE COPYRIGHT OWNER(S) AND/OR ITS SUPPLIERS BE
24 LIABLE FOR ANY CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN AN ACTION
25 OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN CONNECTION
26 WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE SOFTWARE.
27 */
28
29 /*
30 * Authors:
31 * Keith Whitwell <keith@tungstengraphics.com>
32 */
33
34 #include "main/glheader.h"
35 #include "main/imports.h"
36 #include "main/macros.h"
37 #include "main/context.h"
38 #include "swrast/swrast.h"
39 #include "main/simple_list.h"
40
41 #include "radeon_common.h"
42 #include "r200_context.h"
43 #include "r200_state.h"
44 #include "r200_ioctl.h"
45 #include "r200_tcl.h"
46 #include "r200_sanity.h"
47 #include "radeon_reg.h"
48
49 /* The state atoms will be emitted in the order they appear in the atom list,
50 * so this step is important.
51 */
52 #define insert_at_tail_if(atom_list, atom) \
53 do { \
54 struct radeon_state_atom* __atom = (atom); \
55 if (__atom->check) \
56 insert_at_tail((atom_list), __atom); \
57 } while(0)
58
59 void r200SetUpAtomList( r200ContextPtr rmesa )
60 {
61 int i, mtu;
62
63 mtu = rmesa->radeon.glCtx->Const.MaxTextureUnits;
64
65 make_empty_list(&rmesa->radeon.hw.atomlist);
66 rmesa->radeon.hw.atomlist.name = "atom-list";
67
68 insert_at_tail_if( &rmesa->radeon.hw.atomlist, &rmesa->hw.ctx );
69 insert_at_tail_if( &rmesa->radeon.hw.atomlist, &rmesa->hw.set );
70 insert_at_tail_if( &rmesa->radeon.hw.atomlist, &rmesa->hw.lin );
71 insert_at_tail_if( &rmesa->radeon.hw.atomlist, &rmesa->hw.msk );
72 insert_at_tail_if( &rmesa->radeon.hw.atomlist, &rmesa->hw.vpt );
73 insert_at_tail_if( &rmesa->radeon.hw.atomlist, &rmesa->hw.vtx );
74 insert_at_tail_if( &rmesa->radeon.hw.atomlist, &rmesa->hw.vap );
75 insert_at_tail_if( &rmesa->radeon.hw.atomlist, &rmesa->hw.vte );
76 insert_at_tail_if( &rmesa->radeon.hw.atomlist, &rmesa->hw.msc );
77 insert_at_tail_if( &rmesa->radeon.hw.atomlist, &rmesa->hw.cst );
78 insert_at_tail_if( &rmesa->radeon.hw.atomlist, &rmesa->hw.zbs );
79 insert_at_tail_if( &rmesa->radeon.hw.atomlist, &rmesa->hw.tcl );
80 insert_at_tail_if( &rmesa->radeon.hw.atomlist, &rmesa->hw.msl );
81 insert_at_tail_if( &rmesa->radeon.hw.atomlist, &rmesa->hw.tcg );
82 insert_at_tail_if( &rmesa->radeon.hw.atomlist, &rmesa->hw.grd );
83 insert_at_tail_if( &rmesa->radeon.hw.atomlist, &rmesa->hw.fog );
84 insert_at_tail_if( &rmesa->radeon.hw.atomlist, &rmesa->hw.tam );
85 insert_at_tail_if( &rmesa->radeon.hw.atomlist, &rmesa->hw.tf );
86 insert_at_tail_if( &rmesa->radeon.hw.atomlist, &rmesa->hw.atf );
87 for (i = 0; i < mtu; ++i)
88 insert_at_tail_if( &rmesa->radeon.hw.atomlist, &rmesa->hw.tex[i] );
89 for (i = 0; i < mtu; ++i)
90 insert_at_tail_if( &rmesa->radeon.hw.atomlist, &rmesa->hw.cube[i] );
91 for (i = 0; i < 6; ++i)
92 insert_at_tail_if( &rmesa->radeon.hw.atomlist, &rmesa->hw.pix[i] );
93 insert_at_tail_if( &rmesa->radeon.hw.atomlist, &rmesa->hw.afs[0] );
94 insert_at_tail_if( &rmesa->radeon.hw.atomlist, &rmesa->hw.afs[1] );
95 for (i = 0; i < 8; ++i)
96 insert_at_tail_if( &rmesa->radeon.hw.atomlist, &rmesa->hw.lit[i] );
97 for (i = 0; i < 3 + mtu; ++i)
98 insert_at_tail_if( &rmesa->radeon.hw.atomlist, &rmesa->hw.mat[i] );
99 insert_at_tail_if( &rmesa->radeon.hw.atomlist, &rmesa->hw.eye );
100 insert_at_tail_if( &rmesa->radeon.hw.atomlist, &rmesa->hw.glt );
101 for (i = 0; i < 2; ++i)
102 insert_at_tail_if( &rmesa->radeon.hw.atomlist, &rmesa->hw.mtl[i] );
103 for (i = 0; i < 6; ++i)
104 insert_at_tail_if( &rmesa->radeon.hw.atomlist, &rmesa->hw.ucp[i] );
105 insert_at_tail_if( &rmesa->radeon.hw.atomlist, &rmesa->hw.spr );
106 insert_at_tail_if( &rmesa->radeon.hw.atomlist, &rmesa->hw.ptp );
107 insert_at_tail_if( &rmesa->radeon.hw.atomlist, &rmesa->hw.prf );
108 insert_at_tail_if( &rmesa->radeon.hw.atomlist, &rmesa->hw.pvs );
109 insert_at_tail_if( &rmesa->radeon.hw.atomlist, &rmesa->hw.vpp[0] );
110 insert_at_tail_if( &rmesa->radeon.hw.atomlist, &rmesa->hw.vpp[1] );
111 insert_at_tail_if( &rmesa->radeon.hw.atomlist, &rmesa->hw.vpi[0] );
112 insert_at_tail_if( &rmesa->radeon.hw.atomlist, &rmesa->hw.vpi[1] );
113 insert_at_tail_if( &rmesa->radeon.hw.atomlist, &rmesa->hw.sci );
114 }
115
116 /* Fire a section of the retained (indexed_verts) buffer as a regular
117 * primtive.
118 */
119 void r200EmitVbufPrim( r200ContextPtr rmesa,
120 GLuint primitive,
121 GLuint vertex_nr )
122 {
123 BATCH_LOCALS(&rmesa->radeon);
124
125 assert(!(primitive & R200_VF_PRIM_WALK_IND));
126
127 radeonEmitState(&rmesa->radeon);
128
129 radeon_print(RADEON_RENDER|RADEON_SWRENDER,RADEON_VERBOSE,
130 "%s cmd_used/4: %d prim %x nr %d\n", __FUNCTION__,
131 rmesa->store.cmd_used/4, primitive, vertex_nr);
132
133 BEGIN_BATCH(3);
134 OUT_BATCH_PACKET3_CLIP(R200_CP_CMD_3D_DRAW_VBUF_2, 0);
135 OUT_BATCH(primitive | R200_VF_PRIM_WALK_LIST | R200_VF_COLOR_ORDER_RGBA |
136 (vertex_nr << R200_VF_VERTEX_NUMBER_SHIFT));
137 END_BATCH();
138 }
139
140 static void r200FireEB(r200ContextPtr rmesa, int vertex_count, int type)
141 {
142 BATCH_LOCALS(&rmesa->radeon);
143
144 if (vertex_count > 0) {
145 BEGIN_BATCH(8+2);
146 OUT_BATCH_PACKET3_CLIP(R200_CP_CMD_3D_DRAW_INDX_2, 0);
147 OUT_BATCH(R200_VF_PRIM_WALK_IND |
148 R200_VF_COLOR_ORDER_RGBA |
149 ((vertex_count + 0) << 16) |
150 type);
151
152 if (!rmesa->radeon.radeonScreen->kernel_mm) {
153 OUT_BATCH_PACKET3(R200_CP_CMD_INDX_BUFFER, 2);
154 OUT_BATCH((0x80 << 24) | (0 << 16) | 0x810);
155 OUT_BATCH_RELOC(rmesa->radeon.tcl.elt_dma_offset,
156 rmesa->radeon.tcl.elt_dma_bo,
157 rmesa->radeon.tcl.elt_dma_offset,
158 RADEON_GEM_DOMAIN_GTT, 0, 0);
159 OUT_BATCH((vertex_count + 1)/2);
160 } else {
161 OUT_BATCH_PACKET3(R200_CP_CMD_INDX_BUFFER, 2);
162 OUT_BATCH((0x80 << 24) | (0 << 16) | 0x810);
163 OUT_BATCH(rmesa->radeon.tcl.elt_dma_offset);
164 OUT_BATCH((vertex_count + 1)/2);
165 radeon_cs_write_reloc(rmesa->radeon.cmdbuf.cs,
166 rmesa->radeon.tcl.elt_dma_bo,
167 RADEON_GEM_DOMAIN_GTT, 0, 0);
168 }
169 END_BATCH();
170 }
171 }
172
173 void r200FlushElts(GLcontext *ctx)
174 {
175 r200ContextPtr rmesa = R200_CONTEXT(ctx);
176 int nr, elt_used = rmesa->tcl.elt_used;
177
178 radeon_print(RADEON_RENDER, RADEON_VERBOSE, "%s %x %d\n", __FUNCTION__, rmesa->tcl.hw_primitive, elt_used);
179
180 assert( rmesa->radeon.dma.flush == r200FlushElts );
181 rmesa->radeon.dma.flush = NULL;
182
183 nr = elt_used / 2;
184
185 radeon_bo_unmap(rmesa->radeon.tcl.elt_dma_bo);
186
187 r200FireEB(rmesa, nr, rmesa->tcl.hw_primitive);
188
189 radeon_bo_unref(rmesa->radeon.tcl.elt_dma_bo);
190 rmesa->radeon.tcl.elt_dma_bo = NULL;
191
192 if (R200_ELT_BUF_SZ > elt_used)
193 radeonReturnDmaRegion(&rmesa->radeon, R200_ELT_BUF_SZ - elt_used);
194
195 if (radeon_is_debug_enabled(RADEON_SYNC, RADEON_CRITICAL)) {
196 radeon_print(RADEON_SYNC, RADEON_NORMAL, "%s: Syncing\n", __FUNCTION__);
197 radeonFinish( rmesa->radeon.glCtx );
198 }
199 }
200
201
202 GLushort *r200AllocEltsOpenEnded( r200ContextPtr rmesa,
203 GLuint primitive,
204 GLuint min_nr )
205 {
206 GLushort *retval;
207
208 radeon_print(RADEON_RENDER, RADEON_VERBOSE, "%s %d prim %x\n", __FUNCTION__, min_nr, primitive);
209
210 assert((primitive & R200_VF_PRIM_WALK_IND));
211
212 radeonEmitState(&rmesa->radeon);
213
214 radeonAllocDmaRegion(&rmesa->radeon, &rmesa->radeon.tcl.elt_dma_bo,
215 &rmesa->radeon.tcl.elt_dma_offset, R200_ELT_BUF_SZ, 4);
216 rmesa->tcl.elt_used = min_nr * 2;
217
218 radeon_bo_map(rmesa->radeon.tcl.elt_dma_bo, 1);
219 retval = rmesa->radeon.tcl.elt_dma_bo->ptr + rmesa->radeon.tcl.elt_dma_offset;
220
221 assert(!rmesa->radeon.dma.flush);
222 rmesa->radeon.glCtx->Driver.NeedFlush |= FLUSH_STORED_VERTICES;
223 rmesa->radeon.dma.flush = r200FlushElts;
224
225 return retval;
226 }
227
228
229
230 void r200EmitVertexAOS( r200ContextPtr rmesa,
231 GLuint vertex_size,
232 struct radeon_bo *bo,
233 GLuint offset )
234 {
235 BATCH_LOCALS(&rmesa->radeon);
236
237 radeon_print(RADEON_SWRENDER, RADEON_VERBOSE, "%s: vertex_size 0x%x offset 0x%x \n",
238 __FUNCTION__, vertex_size, offset);
239
240
241 BEGIN_BATCH(7);
242 OUT_BATCH_PACKET3(R200_CP_CMD_3D_LOAD_VBPNTR, 2);
243 OUT_BATCH(1);
244 OUT_BATCH(vertex_size | (vertex_size << 8));
245 OUT_BATCH_RELOC(offset, bo, offset, RADEON_GEM_DOMAIN_GTT, 0, 0);
246 END_BATCH();
247 }
248
249 void r200EmitAOS(r200ContextPtr rmesa, GLuint nr, GLuint offset)
250 {
251 BATCH_LOCALS(&rmesa->radeon);
252 uint32_t voffset;
253 int sz = 1 + (nr >> 1) * 3 + (nr & 1) * 2;
254 int i;
255
256 radeon_print(RADEON_RENDER, RADEON_VERBOSE,
257 "%s: nr=%d, ofs=0x%08x\n",
258 __FUNCTION__, nr, offset);
259
260 BEGIN_BATCH(sz+2+ (nr*2));
261 OUT_BATCH_PACKET3(R200_CP_CMD_3D_LOAD_VBPNTR, sz - 1);
262 OUT_BATCH(nr);
263
264
265 if (!rmesa->radeon.radeonScreen->kernel_mm) {
266 for (i = 0; i + 1 < nr; i += 2) {
267 OUT_BATCH((rmesa->radeon.tcl.aos[i].components << 0) |
268 (rmesa->radeon.tcl.aos[i].stride << 8) |
269 (rmesa->radeon.tcl.aos[i + 1].components << 16) |
270 (rmesa->radeon.tcl.aos[i + 1].stride << 24));
271
272 voffset = rmesa->radeon.tcl.aos[i + 0].offset +
273 offset * 4 * rmesa->radeon.tcl.aos[i + 0].stride;
274 OUT_BATCH_RELOC(voffset,
275 rmesa->radeon.tcl.aos[i].bo,
276 voffset,
277 RADEON_GEM_DOMAIN_GTT,
278 0, 0);
279 voffset = rmesa->radeon.tcl.aos[i + 1].offset +
280 offset * 4 * rmesa->radeon.tcl.aos[i + 1].stride;
281 OUT_BATCH_RELOC(voffset,
282 rmesa->radeon.tcl.aos[i+1].bo,
283 voffset,
284 RADEON_GEM_DOMAIN_GTT,
285 0, 0);
286 }
287
288 if (nr & 1) {
289 OUT_BATCH((rmesa->radeon.tcl.aos[nr - 1].components << 0) |
290 (rmesa->radeon.tcl.aos[nr - 1].stride << 8));
291 voffset = rmesa->radeon.tcl.aos[nr - 1].offset +
292 offset * 4 * rmesa->radeon.tcl.aos[nr - 1].stride;
293 OUT_BATCH_RELOC(voffset,
294 rmesa->radeon.tcl.aos[nr - 1].bo,
295 voffset,
296 RADEON_GEM_DOMAIN_GTT,
297 0, 0);
298 }
299 } else {
300 for (i = 0; i + 1 < nr; i += 2) {
301 OUT_BATCH((rmesa->radeon.tcl.aos[i].components << 0) |
302 (rmesa->radeon.tcl.aos[i].stride << 8) |
303 (rmesa->radeon.tcl.aos[i + 1].components << 16) |
304 (rmesa->radeon.tcl.aos[i + 1].stride << 24));
305
306 voffset = rmesa->radeon.tcl.aos[i + 0].offset +
307 offset * 4 * rmesa->radeon.tcl.aos[i + 0].stride;
308 OUT_BATCH(voffset);
309 voffset = rmesa->radeon.tcl.aos[i + 1].offset +
310 offset * 4 * rmesa->radeon.tcl.aos[i + 1].stride;
311 OUT_BATCH(voffset);
312 }
313
314 if (nr & 1) {
315 OUT_BATCH((rmesa->radeon.tcl.aos[nr - 1].components << 0) |
316 (rmesa->radeon.tcl.aos[nr - 1].stride << 8));
317 voffset = rmesa->radeon.tcl.aos[nr - 1].offset +
318 offset * 4 * rmesa->radeon.tcl.aos[nr - 1].stride;
319 OUT_BATCH(voffset);
320 }
321 for (i = 0; i + 1 < nr; i += 2) {
322 voffset = rmesa->radeon.tcl.aos[i + 0].offset +
323 offset * 4 * rmesa->radeon.tcl.aos[i + 0].stride;
324 radeon_cs_write_reloc(rmesa->radeon.cmdbuf.cs,
325 rmesa->radeon.tcl.aos[i+0].bo,
326 RADEON_GEM_DOMAIN_GTT,
327 0, 0);
328 voffset = rmesa->radeon.tcl.aos[i + 1].offset +
329 offset * 4 * rmesa->radeon.tcl.aos[i + 1].stride;
330 radeon_cs_write_reloc(rmesa->radeon.cmdbuf.cs,
331 rmesa->radeon.tcl.aos[i+1].bo,
332 RADEON_GEM_DOMAIN_GTT,
333 0, 0);
334 }
335 if (nr & 1) {
336 voffset = rmesa->radeon.tcl.aos[nr - 1].offset +
337 offset * 4 * rmesa->radeon.tcl.aos[nr - 1].stride;
338 radeon_cs_write_reloc(rmesa->radeon.cmdbuf.cs,
339 rmesa->radeon.tcl.aos[nr-1].bo,
340 RADEON_GEM_DOMAIN_GTT,
341 0, 0);
342 }
343 }
344 END_BATCH();
345 }