Turns out I left flat primitives in vertex buffer mode. Switch them back to immediate...
[mesa.git] / src / mesa / drivers / dri / r300 / r300_ioctl.c
1 /*
2 Copyright (C) The Weather Channel, Inc. 2002.
3 Copyright (C) 2004 Nicolai Haehnle.
4 All Rights Reserved.
5
6 The Weather Channel (TM) funded Tungsten Graphics to develop the
7 initial release of the Radeon 8500 driver under the XFree86 license.
8 This notice must be preserved.
9
10 Permission is hereby granted, free of charge, to any person obtaining
11 a copy of this software and associated documentation files (the
12 "Software"), to deal in the Software without restriction, including
13 without limitation the rights to use, copy, modify, merge, publish,
14 distribute, sublicense, and/or sell copies of the Software, and to
15 permit persons to whom the Software is furnished to do so, subject to
16 the following conditions:
17
18 The above copyright notice and this permission notice (including the
19 next paragraph) shall be included in all copies or substantial
20 portions of the Software.
21
22 THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND,
23 EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF
24 MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT.
25 IN NO EVENT SHALL THE COPYRIGHT OWNER(S) AND/OR ITS SUPPLIERS BE
26 LIABLE FOR ANY CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN AN ACTION
27 OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN CONNECTION
28 WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE SOFTWARE.
29
30 **************************************************************************/
31
32 /*
33 * Authors:
34 * Keith Whitwell <keith@tungstengraphics.com>
35 * Nicolai Haehnle <prefect_@gmx.net>
36 */
37
38 #include <sched.h>
39 #include <errno.h>
40
41 #include "glheader.h"
42 #include "imports.h"
43 #include "macros.h"
44 #include "context.h"
45 #include "swrast/swrast.h"
46
47 #include "r300_context.h"
48 #include "radeon_ioctl.h"
49 #include "r300_ioctl.h"
50 #include "r300_cmdbuf.h"
51 #include "r300_state.h"
52 #include "r300_program.h"
53 #include "radeon_reg.h"
54
55 #include "vblank.h"
56
57
58 #define CLEARBUFFER_COLOR 0x1
59 #define CLEARBUFFER_DEPTH 0x2
60
61 static void r300ClearBuffer(r300ContextPtr r300, int flags, int buffer)
62 {
63 GLcontext* ctx = r300->radeon.glCtx;
64 __DRIdrawablePrivate *dPriv = r300->radeon.dri.drawable;
65 int i;
66 GLuint cboffset, cbpitch;
67 drm_r300_cmd_header_t* cmd;
68
69 if (RADEON_DEBUG & DEBUG_IOCTL)
70 fprintf(stderr, "%s: %s buffer (%i,%i %ix%i)\n",
71 __FUNCTION__, buffer ? "back" : "front",
72 dPriv->x, dPriv->y, dPriv->w, dPriv->h);
73
74 if (buffer) {
75 cboffset = r300->radeon.radeonScreen->backOffset;
76 cbpitch = r300->radeon.radeonScreen->backPitch;
77 } else {
78 cboffset = r300->radeon.radeonScreen->frontOffset;
79 cbpitch = r300->radeon.radeonScreen->frontPitch;
80 }
81
82 cboffset += r300->radeon.radeonScreen->fbLocation;
83
84 R300_STATECHANGE(r300, vpt);
85 r300->hw.vpt.cmd[R300_VPT_XSCALE] = r300PackFloat32(1.0);
86 r300->hw.vpt.cmd[R300_VPT_XOFFSET] = r300PackFloat32(dPriv->x);
87 r300->hw.vpt.cmd[R300_VPT_YSCALE] = r300PackFloat32(1.0);
88 r300->hw.vpt.cmd[R300_VPT_YOFFSET] = r300PackFloat32(dPriv->y);
89 r300->hw.vpt.cmd[R300_VPT_ZSCALE] = r300PackFloat32(1.0);
90 r300->hw.vpt.cmd[R300_VPT_ZOFFSET] = r300PackFloat32(0.0);
91
92 R300_STATECHANGE(r300, cb);
93 r300->hw.cb.cmd[R300_CB_OFFSET] = cboffset;
94 r300->hw.cb.cmd[R300_CB_PITCH] = cbpitch | R300_COLOR_UNKNOWN_22_23;
95
96 R300_STATECHANGE(r300, unk221C);
97 r300->hw.unk221C.cmd[1] = R300_221C_CLEAR;
98
99 R300_STATECHANGE(r300, ps);
100 r300->hw.ps.cmd[R300_PS_POINTSIZE] =
101 ((dPriv->w * 6) << R300_POINTSIZE_X_SHIFT) |
102 ((dPriv->h * 6) << R300_POINTSIZE_Y_SHIFT);
103
104 R300_STATECHANGE(r300, ri);
105 for(i = 1; i <= 8; ++i)
106 r300->hw.ri.cmd[i] = R300_RS_INTERP_USED;
107
108 R300_STATECHANGE(r300, rr);
109 ((drm_r300_cmd_header_t*)r300->hw.rr.cmd)->unchecked_state.count = 1;
110 r300->hw.rr.cmd[1] = 0x00004000;
111
112 R300_STATECHANGE(r300, cmk);
113 if (flags & CLEARBUFFER_COLOR) {
114 r300->hw.cmk.cmd[R300_CMK_COLORMASK] =
115 (ctx->Color.ColorMask[BCOMP] ? R300_COLORMASK0_B : 0) |
116 (ctx->Color.ColorMask[GCOMP] ? R300_COLORMASK0_G : 0) |
117 (ctx->Color.ColorMask[RCOMP] ? R300_COLORMASK0_R : 0) |
118 (ctx->Color.ColorMask[ACOMP] ? R300_COLORMASK0_A : 0);
119 } else {
120 r300->hw.cmk.cmd[R300_CMK_COLORMASK] = 0;
121 }
122
123 R300_STATECHANGE(r300, fp);
124 r300->hw.fp.cmd[R300_FP_CNTL0] = 0; /* 1 pass, no textures */
125 r300->hw.fp.cmd[R300_FP_CNTL1] = 0; /* no temporaries */
126 r300->hw.fp.cmd[R300_FP_CNTL2] = 0; /* no offset, one ALU instr */
127 r300->hw.fp.cmd[R300_FP_NODE0] = 0;
128 r300->hw.fp.cmd[R300_FP_NODE1] = 0;
129 r300->hw.fp.cmd[R300_FP_NODE2] = 0;
130 r300->hw.fp.cmd[R300_FP_NODE3] = R300_PFS_NODE_LAST_NODE;
131
132 R300_STATECHANGE(r300, fpi[0]);
133 R300_STATECHANGE(r300, fpi[1]);
134 R300_STATECHANGE(r300, fpi[2]);
135 R300_STATECHANGE(r300, fpi[3]);
136 ((drm_r300_cmd_header_t*)r300->hw.fpi[0].cmd)->unchecked_state.count = 1;
137 ((drm_r300_cmd_header_t*)r300->hw.fpi[1].cmd)->unchecked_state.count = 1;
138 ((drm_r300_cmd_header_t*)r300->hw.fpi[2].cmd)->unchecked_state.count = 1;
139 ((drm_r300_cmd_header_t*)r300->hw.fpi[3].cmd)->unchecked_state.count = 1;
140
141 /* MOV o0, t0 */
142 r300->hw.fpi[0].cmd[1] = FP_INSTRC(MAD, FP_ARGC(SRC0C_XYZ), FP_ARGC(ONE), FP_ARGC(ZERO));
143 r300->hw.fpi[1].cmd[1] = FP_SELC(0,NO,XYZ,FP_TMP(0),0,0);
144 r300->hw.fpi[2].cmd[1] = FP_INSTRA(MAD, FP_ARGA(SRC0A), FP_ARGA(ONE), FP_ARGA(ZERO));
145 r300->hw.fpi[3].cmd[1] = FP_SELA(0,NO,W,FP_TMP(0),0,0);
146
147 R300_STATECHANGE(r300, pvs);
148 r300->hw.pvs.cmd[R300_PVS_CNTL_1] =
149 (0 << R300_PVS_CNTL_1_PROGRAM_START_SHIFT) |
150 (0 << R300_PVS_CNTL_1_UNKNOWN_SHIFT) |
151 (1 << R300_PVS_CNTL_1_PROGRAM_END_SHIFT);
152 r300->hw.pvs.cmd[R300_PVS_CNTL_2] = 0; /* no parameters */
153 r300->hw.pvs.cmd[R300_PVS_CNTL_3] =
154 (1 << R300_PVS_CNTL_3_PROGRAM_UNKNOWN_SHIFT);
155
156 R300_STATECHANGE(r300, vpi);
157 ((drm_r300_cmd_header_t*)r300->hw.vpi.cmd)->unchecked_state.count = 8;
158
159 /* MOV o0, i0; */
160 r300->hw.vpi.cmd[1] = VP_OUT(ADD,OUT,0,XYZW);
161 r300->hw.vpi.cmd[2] = VP_IN(IN,0);
162 r300->hw.vpi.cmd[3] = VP_ZERO();
163 r300->hw.vpi.cmd[4] = 0;
164
165 /* MOV o1, i1; */
166 r300->hw.vpi.cmd[5] = VP_OUT(ADD,OUT,1,XYZW);
167 r300->hw.vpi.cmd[6] = VP_IN(IN,1);
168 r300->hw.vpi.cmd[7] = VP_ZERO();
169 r300->hw.vpi.cmd[8] = 0;
170
171 R300_STATECHANGE(r300, zc);
172 if (flags & CLEARBUFFER_DEPTH) {
173 r300->hw.zc.cmd[R300_ZC_CNTL_0] = 0x6; // test and write
174 r300->hw.zc.cmd[R300_ZC_CNTL_1] = R300_Z_TEST_ALWAYS;
175 /*
176 R300_STATECHANGE(r300, zb);
177 r300->hw.zb.cmd[R300_ZB_OFFSET] =
178 1024*4*300 +
179 r300->radeon.radeonScreen->frontOffset +
180 r300->radeon.radeonScreen->fbLocation;
181 r300->hw.zb.cmd[R300_ZB_PITCH] =
182 r300->radeon.radeonScreen->depthPitch;
183 */
184 } else {
185 r300->hw.zc.cmd[R300_ZC_CNTL_0] = 0; // disable
186 r300->hw.zc.cmd[R300_ZC_CNTL_1] = 0;
187 }
188
189 /* Make sure we have enough space */
190 r300EnsureCmdBufSpace(r300, r300->hw.max_state_size + 9, __FUNCTION__);
191
192 r300EmitState(r300);
193
194 cmd = (drm_r300_cmd_header_t*)r300AllocCmdBuf(r300, 9, __FUNCTION__);
195 cmd[0].packet3.cmd_type = R300_CMD_PACKET3;
196 cmd[0].packet3.packet = R300_CMD_PACKET3_CLEAR;
197 cmd[1].u = r300PackFloat32(dPriv->w / 2.0);
198 cmd[2].u = r300PackFloat32(dPriv->h / 2.0);
199 cmd[3].u = r300PackFloat32(ctx->Depth.Clear);
200 cmd[4].u = r300PackFloat32(1.0);
201 cmd[5].u = r300PackFloat32(ctx->Color.ClearColor[0]);
202 cmd[6].u = r300PackFloat32(ctx->Color.ClearColor[1]);
203 cmd[7].u = r300PackFloat32(ctx->Color.ClearColor[2]);
204 cmd[8].u = r300PackFloat32(ctx->Color.ClearColor[3]);
205 }
206
207
208 /**
209 * Buffer clear
210 */
211 static void r300Clear(GLcontext * ctx, GLbitfield mask, GLboolean all,
212 GLint cx, GLint cy, GLint cw, GLint ch)
213 {
214 r300ContextPtr r300 = R300_CONTEXT(ctx);
215 __DRIdrawablePrivate *dPriv = r300->radeon.dri.drawable;
216 int flags = 0;
217 int bits = 0;
218 int swapped;
219
220 if (RADEON_DEBUG & DEBUG_IOCTL)
221 fprintf(stderr, "%s: all=%d cx=%d cy=%d cw=%d ch=%d\n",
222 __FUNCTION__, all, cx, cy, cw, ch);
223
224 {
225 LOCK_HARDWARE(&r300->radeon);
226 UNLOCK_HARDWARE(&r300->radeon);
227 if (dPriv->numClipRects == 0)
228 return;
229 }
230
231 if (mask & DD_FRONT_LEFT_BIT) {
232 flags |= DD_FRONT_LEFT_BIT;
233 mask &= ~DD_FRONT_LEFT_BIT;
234 }
235
236 if (mask & DD_BACK_LEFT_BIT) {
237 flags |= DD_BACK_LEFT_BIT;
238 mask &= ~DD_BACK_LEFT_BIT;
239 }
240
241 if (mask & DD_DEPTH_BIT) {
242 bits |= CLEARBUFFER_DEPTH;
243 mask &= ~DD_DEPTH_BIT;
244 }
245
246 if (mask) {
247 if (RADEON_DEBUG & DEBUG_FALLBACKS)
248 fprintf(stderr, "%s: swrast clear, mask: %x\n",
249 __FUNCTION__, mask);
250 _swrast_Clear(ctx, mask, all, cx, cy, cw, ch);
251 }
252
253 swapped = r300->radeon.doPageFlip && (r300->radeon.sarea->pfCurrentPage == 1);
254
255 if (flags & DD_FRONT_LEFT_BIT) {
256 r300ClearBuffer(r300, bits | CLEARBUFFER_COLOR, swapped);
257 bits = 0;
258 }
259
260 if (flags & DD_BACK_LEFT_BIT) {
261 r300ClearBuffer(r300, bits | CLEARBUFFER_COLOR, swapped ^ 1);
262 bits = 0;
263 }
264
265 if (bits)
266 r300ClearBuffer(r300, bits, 0);
267
268 /* Recalculate the hardware state. This could be done more efficiently,
269 * but do keep it like this for now.
270 */
271 r300ResetHwState(r300);
272 }
273
274 void r300Flush(GLcontext * ctx)
275 {
276 r300ContextPtr r300 = R300_CONTEXT(ctx);
277
278 if (RADEON_DEBUG & DEBUG_IOCTL)
279 fprintf(stderr, "%s\n", __FUNCTION__);
280
281 if (r300->cmdbuf.count_used > r300->cmdbuf.count_reemit)
282 r300FlushCmdBuf(r300, __FUNCTION__);
283 }
284
285 void r300RefillCurrentDmaRegion(r300ContextPtr rmesa)
286 {
287 struct r200_dma_buffer *dmabuf;
288 int fd = rmesa->radeon.dri.fd;
289 int index = 0;
290 int size = 0;
291 drmDMAReq dma;
292 int ret;
293
294 if (RADEON_DEBUG & (DEBUG_IOCTL | DEBUG_DMA))
295 fprintf(stderr, "%s\n", __FUNCTION__);
296
297 if (rmesa->dma.flush) {
298 rmesa->dma.flush(rmesa);
299 }
300
301 if (rmesa->dma.current.buf)
302 r300ReleaseDmaRegion(rmesa, &rmesa->dma.current, __FUNCTION__);
303
304 if (rmesa->dma.nr_released_bufs > 4)
305 r300FlushCmdBuf(rmesa, __FUNCTION__);
306
307 dma.context = rmesa->radeon.dri.hwContext;
308 dma.send_count = 0;
309 dma.send_list = NULL;
310 dma.send_sizes = NULL;
311 dma.flags = 0;
312 dma.request_count = 1;
313 dma.request_size = RADEON_BUFFER_SIZE;
314 dma.request_list = &index;
315 dma.request_sizes = &size;
316 dma.granted_count = 0;
317
318 LOCK_HARDWARE(&rmesa->radeon); /* no need to validate */
319
320 while (1) {
321 ret = drmDMA(fd, &dma);
322 if (ret == 0)
323 break;
324
325 if (rmesa->dma.nr_released_bufs) {
326 r200FlushCmdBufLocked(rmesa, __FUNCTION__);
327 }
328
329 if (rmesa->radeon.do_usleeps) {
330 UNLOCK_HARDWARE(&rmesa->radeon);
331 DO_USLEEP(1);
332 LOCK_HARDWARE(&rmesa->radeon);
333 }
334 }
335
336 UNLOCK_HARDWARE(&rmesa->radeon);
337
338 if (RADEON_DEBUG & DEBUG_DMA)
339 fprintf(stderr, "Allocated buffer %d\n", index);
340
341 dmabuf = CALLOC_STRUCT(r300_dma_buffer);
342 dmabuf->buf = &rmesa->radeon.radeonScreen->buffers->list[index];
343 dmabuf->refcount = 1;
344
345 rmesa->dma.current.buf = dmabuf;
346 rmesa->dma.current.address = dmabuf->buf->address;
347 rmesa->dma.current.end = dmabuf->buf->total;
348 rmesa->dma.current.start = 0;
349 rmesa->dma.current.ptr = 0;
350 }
351
352 void r300ReleaseDmaRegion(r300ContextPtr rmesa,
353 struct r300_dma_region *region, const char *caller)
354 {
355 if (RADEON_DEBUG & DEBUG_IOCTL)
356 fprintf(stderr, "%s from %s\n", __FUNCTION__, caller);
357
358 if (!region->buf)
359 return;
360
361 if (rmesa->dma.flush)
362 rmesa->dma.flush(rmesa);
363
364 if (--region->buf->refcount == 0) {
365 drm_radeon_cmd_header_t *cmd;
366
367 if (RADEON_DEBUG & (DEBUG_IOCTL | DEBUG_DMA))
368 fprintf(stderr, "%s -- DISCARD BUF %d\n", __FUNCTION__,
369 region->buf->buf->idx);
370
371 cmd =
372 (drm_radeon_cmd_header_t *) r300AllocCmdBuf(rmesa,
373 sizeof(*cmd),
374 __FUNCTION__);
375 cmd->dma.cmd_type = RADEON_CMD_DMA_DISCARD;
376 cmd->dma.buf_idx = region->buf->buf->idx;
377 FREE(region->buf);
378 rmesa->dma.nr_released_bufs++;
379 }
380
381 region->buf = 0;
382 region->start = 0;
383 }
384
385 /* Allocates a region from rmesa->dma.current. If there isn't enough
386 * space in current, grab a new buffer (and discard what was left of current)
387 */
388 void r300AllocDmaRegion(r300ContextPtr rmesa,
389 struct r300_dma_region *region,
390 int bytes, int alignment)
391 {
392 if (RADEON_DEBUG & DEBUG_IOCTL)
393 fprintf(stderr, "%s %d\n", __FUNCTION__, bytes);
394
395 if (rmesa->dma.flush)
396 rmesa->dma.flush(rmesa);
397
398 if (region->buf)
399 r300ReleaseDmaRegion(rmesa, region, __FUNCTION__);
400
401 alignment--;
402 rmesa->dma.current.start = rmesa->dma.current.ptr =
403 (rmesa->dma.current.ptr + alignment) & ~alignment;
404
405 if (rmesa->dma.current.ptr + bytes > rmesa->dma.current.end)
406 r300RefillCurrentDmaRegion(rmesa);
407
408 region->start = rmesa->dma.current.start;
409 region->ptr = rmesa->dma.current.start;
410 region->end = rmesa->dma.current.start + bytes;
411 region->address = rmesa->dma.current.address;
412 region->buf = rmesa->dma.current.buf;
413 region->buf->refcount++;
414
415 rmesa->dma.current.ptr += bytes; /* bug - if alignment > 7 */
416 rmesa->dma.current.start =
417 rmesa->dma.current.ptr = (rmesa->dma.current.ptr + 0x7) & ~0x7;
418
419 assert(rmesa->dma.current.ptr <= rmesa->dma.current.end);
420 }
421
422 /* Called via glXGetMemoryOffsetMESA() */
423 GLuint r300GetMemoryOffsetMESA(__DRInativeDisplay * dpy, int scrn,
424 const GLvoid * pointer)
425 {
426 GET_CURRENT_CONTEXT(ctx);
427 r300ContextPtr rmesa;
428 GLuint card_offset;
429
430 if (!ctx || !(rmesa = R300_CONTEXT(ctx))) {
431 fprintf(stderr, "%s: no context\n", __FUNCTION__);
432 return ~0;
433 }
434
435 if (!r300IsGartMemory(rmesa, pointer, 0))
436 return ~0;
437
438 if (rmesa->radeon.dri.drmMinor < 6)
439 return ~0;
440
441 card_offset = r300GartOffsetFromVirtual(rmesa, pointer);
442
443 return card_offset - rmesa->radeon.radeonScreen->gart_base;
444 }
445
446 GLboolean r300IsGartMemory(r300ContextPtr rmesa, const GLvoid * pointer,
447 GLint size)
448 {
449 int offset =
450 (char *)pointer - (char *)rmesa->radeon.radeonScreen->gartTextures.map;
451 int valid = (size >= 0 && offset >= 0
452 && offset + size < rmesa->radeon.radeonScreen->gartTextures.size);
453
454 if (RADEON_DEBUG & DEBUG_IOCTL)
455 fprintf(stderr, "r300IsGartMemory( %p ) : %d\n", pointer,
456 valid);
457
458 return valid;
459 }
460
461 GLuint r300GartOffsetFromVirtual(r300ContextPtr rmesa, const GLvoid * pointer)
462 {
463 int offset =
464 (char *)pointer - (char *)rmesa->radeon.radeonScreen->gartTextures.map;
465
466 fprintf(stderr, "offset=%08x\n", offset);
467
468 if (offset < 0 || offset > rmesa->radeon.radeonScreen->gartTextures.size)
469 return ~0;
470 else
471 return rmesa->radeon.radeonScreen->gart_texture_offset + offset;
472 }
473
474 void r300InitIoctlFuncs(struct dd_function_table *functions)
475 {
476 functions->Clear = r300Clear;
477 functions->Finish = radeonFinish;
478 functions->Flush = r300Flush;
479 }