Merge branch 'mesa_7_5_branch' into mesa_7_6_branch
[mesa.git] / src / gallium / drivers / nv20 / nv20_prim_vbuf.c
index a51d657d2741e7200664ed64ad05254a7333efe4..ddfcdb8057ae19535fa697e976a4e47531e8a701 100644 (file)
@@ -38,9 +38,9 @@
  */
 
 
-#include "pipe/p_debug.h"
+#include "util/u_debug.h"
 #include "pipe/p_inlines.h"
-#include "pipe/p_winsys.h"
+#include "pipe/internal/p_winsys_screen.h"
 
 #include "nv20_context.h"
 #include "nv20_state.h"
@@ -55,38 +55,41 @@ struct nv20_vbuf_render {
 
        struct nv20_context *nv20;   
 
-       /** Vertex buffer */
-       struct pipe_buffer* buffer;
+       /** Vertex buffer in VRAM */
+       struct pipe_buffer *pbuffer;
+
+       /** Vertex buffer in normal memory */
+       void *mbuffer;
 
        /** Vertex size in bytes */
-       unsigned vertex_size;
+       /*unsigned vertex_size;*/
 
        /** Hardware primitive */
        unsigned hwprim;
 };
 
-
-void nv20_vtxbuf_bind( struct nv20_context* nv20 )
-{
-       int i;
-       for(i = 0; i < 8; i++) {
-               BEGIN_RING(kelvin, NV10TCL_VERTEX_ARRAY_ATTRIB_OFFSET(i), 1);
-               OUT_RING(0/*nv20->vtxbuf*/);
-               BEGIN_RING(kelvin, NV10TCL_VERTEX_ARRAY_ATTRIB_FORMAT(i) ,1);
-               OUT_RING(0/*XXX*/);
-       }
-}
-
 /**
  * Basically a cast wrapper.
  */
 static INLINE struct nv20_vbuf_render *
-nv20_vbuf_render( struct vbuf_render *render )
+nv20_vbuf_render(struct vbuf_render *render) /* asserts render is non-NULL, then casts; no type check is done */
 {
        assert(render);
        return (struct nv20_vbuf_render *)render;
 }
 
+void nv20_vtxbuf_bind( struct nv20_context* nv20 ) /* currently does nothing: the whole body is disabled by #if 0 */
+{
+#if 0
+       int i;
+       for(i = 0; i < NV20TCL_VTXBUF_ADDRESS__SIZE; i++) {
+               BEGIN_RING(kelvin, NV20TCL_VTXBUF_ADDRESS(i), 1);
+               OUT_RING(0/*nv20->vtxbuf*/);
+               BEGIN_RING(kelvin, NV20TCL_VTXFMT(i) ,1);
+               OUT_RING(0/*XXX*/);
+       }
+#endif
+}
 
 static const struct vertex_info *
 nv20_vbuf_render_get_vertex_info( struct vbuf_render *render )
@@ -99,50 +102,212 @@ nv20_vbuf_render_get_vertex_info( struct vbuf_render *render )
        return &nv20->vertex_info;
 }
 
-
 static void *
+nv20__allocate_mbuffer(struct nv20_vbuf_render *nv20_render, size_t size) /* MALLOCs size bytes into nv20_render->mbuffer */
+{
+       nv20_render->mbuffer = MALLOC(size);
+       return nv20_render->mbuffer; /* returned unchecked; nv20_vbuf_render_allocate_vertices tests it */
+}
+
+static void
+nv20__allocate_pbuffer(struct nv20_vbuf_render *nv20_render, size_t size) /* result is left in nv20_render->pbuffer; nothing is returned */
+{
+       struct pipe_screen *screen = nv20_render->nv20->pipe.screen;
+       nv20_render->pbuffer = screen->buffer_create(screen, 64, /* 64: presumably the alignment argument -- TODO confirm */
+                                       PIPE_BUFFER_USAGE_VERTEX, size);
+}
+
+static boolean /* TRUE when a vertex store was allocated, FALSE otherwise */
 nv20_vbuf_render_allocate_vertices( struct vbuf_render *render,
                ushort vertex_size,
                ushort nr_vertices )
 {
        struct nv20_vbuf_render *nv20_render = nv20_vbuf_render(render);
-       struct nv20_context *nv20 = nv20_render->nv20;
-       struct pipe_winsys *winsys = nv20->pipe.winsys;
        size_t size = (size_t)vertex_size * (size_t)nr_vertices;
+       void *buf;
+
+       assert(!nv20_render->pbuffer); /* any previous store must already have been released */
+       assert(!nv20_render->mbuffer);
+
+       /*
+        * For a small number of vertices, don't bother with a pipe vertex
+        * buffer; the data will be passed directly via the fifo.
+        */
+       /* XXX: Pipe vertex buffers don't work, so the constant 0 below disables that branch. */
+       if (0 && size > 16 * 1024) {
+               nv20__allocate_pbuffer(nv20_render, size);
+               /* ugly: buf is only tested against NULL below, it is never used as a vertex pointer */
+               buf = nv20_render->pbuffer;
+       } else {
+               buf = nv20__allocate_mbuffer(nv20_render, size);
+       }
 
-       assert(!nv20_render->buffer);
-       nv20_render->buffer = winsys->buffer_create(winsys, 64, PIPE_BUFFER_USAGE_VERTEX, size);
+       if (buf)
+               nv20_render->nv20->dirty |= NV20_NEW_VTXARRAYS;
 
-       nv20->dirty |= NV20_NEW_VTXARRAYS;
+       return buf ? TRUE : FALSE;
+}
 
-       return winsys->buffer_map(winsys, 
-                       nv20_render->buffer, 
-                       PIPE_BUFFER_USAGE_CPU_WRITE);
+static void * /* returns a pointer to whichever vertex store exists; pbuffer is mapped for CPU write */
+nv20_vbuf_render_map_vertices( struct vbuf_render *render )
+{
+       struct nv20_vbuf_render *nv20_render = nv20_vbuf_render(render);
+       struct pipe_screen *pscreen = nv20_render->nv20->pipe.screen;
+
+       if (nv20_render->pbuffer) {
+               return pipe_buffer_map(pscreen, nv20_render->pbuffer,
+                                      PIPE_BUFFER_USAGE_CPU_WRITE);
+       } else if (nv20_render->mbuffer) {
+               return nv20_render->mbuffer; /* already a CPU pointer, handed out directly */
+       } else
+               assert(0);
+
+       /* Reached only if assert(0) did not abort; also silences missing-return warnings. */
+       return NULL;
 }
 
+static void
+nv20_vbuf_render_unmap_vertices( struct vbuf_render *render,
+               ushort min_index,
+               ushort max_index ) /* min_index and max_index are not used here */
+{
+       struct nv20_vbuf_render *nv20_render = nv20_vbuf_render(render);
+       struct pipe_screen *pscreen = nv20_render->nv20->pipe.screen;
+
+       if (nv20_render->pbuffer) /* only the pipe buffer path maps anything; mbuffer needs no unmap */
+               pipe_buffer_unmap(pscreen, nv20_render->pbuffer);
+}
 
-static void 
+static boolean /* FALSE when nvgl_primitive() yields 0 for prim, TRUE otherwise */
 nv20_vbuf_render_set_primitive( struct vbuf_render *render, 
                unsigned prim )
 {
        struct nv20_vbuf_render *nv20_render = nv20_vbuf_render(render);
-       nv20_render->hwprim = prim + 1;
+       unsigned hwp = nvgl_primitive(prim);
+       if (hwp == 0) /* a zero result is treated as failure; hwprim is left untouched */
+               return FALSE;
+
+       nv20_render->hwprim = hwp;
+       return TRUE;
 }
 
+static uint32_t
+nv20__vtxhwformat(unsigned stride, unsigned fields, unsigned type) /* packs the three values into one word; inputs are shifted but not masked */
+{
+       return (stride << NV20TCL_VTXFMT_STRIDE_SHIFT) |
+               (fields << NV20TCL_VTXFMT_SIZE_SHIFT) |
+               (type << NV20TCL_VTXFMT_TYPE_SHIFT);
+}
 
-static void 
-nv20_vbuf_render_draw( struct vbuf_render *render,
+static unsigned /* returns the field count chosen for type: 0 to 4, and 0 for an unhandled type */
+nv20__emit_format(struct nv20_context *nv20, enum attrib_emit type, int hwattr)
+{
+       uint32_t hwfmt = 0;
+       unsigned fields;
+
+       switch (type) {
+       case EMIT_OMIT:
+               hwfmt = nv20__vtxhwformat(0, 0, 2); /* third argument 2 is used in every case -- presumably the float type code, TODO confirm */
+               fields = 0;
+               break;
+       case EMIT_1F:
+               hwfmt = nv20__vtxhwformat(4, 1, 2);
+               fields = 1;
+               break;
+       case EMIT_2F:
+               hwfmt = nv20__vtxhwformat(8, 2, 2);
+               fields = 2;
+               break;
+       case EMIT_3F:
+               hwfmt = nv20__vtxhwformat(12, 3, 2);
+               fields = 3;
+               break;
+       case EMIT_4F:
+               hwfmt = nv20__vtxhwformat(16, 4, 2);
+               fields = 4;
+               break;
+       default:
+               NOUVEAU_ERR("unhandled attrib_emit %d\n", type);
+               return 0; /* bails out before anything is written for this hwattr */
+       }
+
+       BEGIN_RING(kelvin, NV20TCL_VTXFMT(hwattr), 1);
+       OUT_RING(hwfmt);
+       return fields;
+}
+
+static unsigned /* returns the sum of the field counts of all attributes enabled in vinfo->hwfmt[0] */
+nv20__emit_vertex_array_format(struct nv20_context *nv20)
+{
+       struct vertex_info *vinfo = &nv20->vertex_info;
+       int hwattr = NV20TCL_VTXFMT__SIZE;
+       int attr = 0;
+       unsigned nr_fields = 0;
+
+       while (hwattr-- > 0) { /* visits hardware slots from NV20TCL_VTXFMT__SIZE - 1 down to 0 */
+               if (vinfo->hwfmt[0] & (1 << hwattr)) { /* bit hwattr set: take the next entry of vinfo->attrib[] */
+                       nr_fields += nv20__emit_format(nv20,
+                                       vinfo->attrib[attr].emit, hwattr);
+                       attr++;
+               } else
+                       nv20__emit_format(nv20, EMIT_OMIT, hwattr); /* slot not in the mask: emit the EMIT_OMIT format */
+       }
+
+       return nr_fields;
+}
+
+static void
+nv20__draw_mbuffer(struct nv20_vbuf_render *nv20_render, /* emits the indexed vertices from mbuffer inline via OUT_RINGf */
+               const ushort *indices,
+               uint nr_indices)
+{
+       struct nv20_context *nv20 = nv20_render->nv20;
+       struct vertex_info *vinfo = &nv20->vertex_info;
+       unsigned nr_fields;
+       int max_push;
+       ubyte *data = nv20_render->mbuffer;
+       int vsz = 4 * vinfo->size; /* byte stride between vertices; presumably vinfo->size counts 32-bit words -- TODO confirm */
+
+       nr_fields = nv20__emit_vertex_array_format(nv20);
+
+       BEGIN_RING(kelvin, NV20TCL_VERTEX_BEGIN_END, 1);
+       OUT_RING(nv20_render->hwprim);
+
+       max_push = 1200 / nr_fields; /* NOTE(review): divides by zero when nr_fields is 0 */
+       while (nr_indices) {
+               int i;
+               int push = MIN2(nr_indices, max_push); /* number of vertices emitted in this batch */
+
+               BEGIN_RING_NI(kelvin, NV20TCL_VERTEX_DATA, push * nr_fields);
+               for (i = 0; i < push; i++) {
+                       /* XXX: fixme to handle other than floats? */
+                       int f = nr_fields;
+                       float *attrv = (float*)&data[indices[i] * vsz]; /* start of vertex indices[i]; only its first nr_fields floats are pushed */
+                       while (f-- > 0)
+                               OUT_RINGf(*attrv++);
+               }
+
+               nr_indices -= push;
+               indices += push;
+       }
+
+       BEGIN_RING(kelvin, NV20TCL_VERTEX_BEGIN_END, 1);
+       OUT_RING(NV20TCL_VERTEX_BEGIN_END_STOP);
+}
+
+static void
+nv20__draw_pbuffer(struct nv20_vbuf_render *nv20_render,
                const ushort *indices,
                uint nr_indices)
 {
-       struct nv20_vbuf_render *nv20_render = nv20_vbuf_render(render);
        struct nv20_context *nv20 = nv20_render->nv20;
        int push, i;
 
-       nv20_emit_hw_state(nv20);
+       NOUVEAU_ERR("nv20__draw_pbuffer: this path is broken.\n");
 
        BEGIN_RING(kelvin, NV10TCL_VERTEX_ARRAY_OFFSET_POS, 1);
-       OUT_RELOCl(nv20_render->buffer, 0, NOUVEAU_BO_VRAM | NOUVEAU_BO_GART | NOUVEAU_BO_RD);
+       OUT_RELOCl(nv20_render->pbuffer, 0,
+                       NOUVEAU_BO_VRAM | NOUVEAU_BO_GART | NOUVEAU_BO_RD);
 
        BEGIN_RING(kelvin, NV10TCL_VERTEX_BUFFER_BEGIN_END, 1);
        OUT_RING(nv20_render->hwprim);
@@ -169,21 +334,37 @@ nv20_vbuf_render_draw( struct vbuf_render *render,
        OUT_RING  (0);
 }
 
+static void
+nv20_vbuf_render_draw( struct vbuf_render *render,
+               const ushort *indices,
+               uint nr_indices)
+{
+       struct nv20_vbuf_render *nv20_render = nv20_vbuf_render(render);
+
+       nv20_emit_hw_state(nv20_render->nv20); /* state is emitted before either draw path runs */
+
+       if (nv20_render->pbuffer) /* dispatch on which vertex store is present; pbuffer is checked first */
+               nv20__draw_pbuffer(nv20_render, indices, nr_indices);
+       else if (nv20_render->mbuffer)
+               nv20__draw_mbuffer(nv20_render, indices, nr_indices);
+       else
+               assert(0);
+}
+
 
 static void
-nv20_vbuf_render_release_vertices( struct vbuf_render *render,
-               void *vertices, 
-               unsigned vertex_size,
-               unsigned vertices_used )
+nv20_vbuf_render_release_vertices( struct vbuf_render *render ) /* frees whichever vertex store is present */
 {
        struct nv20_vbuf_render *nv20_render = nv20_vbuf_render(render);
        struct nv20_context *nv20 = nv20_render->nv20;
-       struct pipe_winsys *winsys = nv20->pipe.winsys;
-       struct pipe_screen *pscreen = &nv20->screen->pipe;
 
-       assert(nv20_render->buffer);
-       winsys->buffer_unmap(winsys, nv20_render->buffer);
-       pipe_buffer_reference(pscreen, &nv20_render->buffer, NULL);
+       if (nv20_render->pbuffer) { /* NOTE(review): the local nv20 above is not referenced by any added line */
+               pipe_buffer_reference(&nv20_render->pbuffer, NULL); /* presumably drops the reference and clears the pointer -- TODO confirm */
+       } else if (nv20_render->mbuffer) {
+               FREE(nv20_render->mbuffer);
+               nv20_render->mbuffer = NULL; /* cleared so the asserts in allocate_vertices and destroy pass */
+       } else
+               assert(0);
 }
 
 
@@ -191,6 +372,10 @@ static void
 nv20_vbuf_render_destroy( struct vbuf_render *render )
 {
        struct nv20_vbuf_render *nv20_render = nv20_vbuf_render(render);
+
+       assert(!nv20_render->pbuffer); /* both vertex stores must already be released before destroy */
+       assert(!nv20_render->mbuffer);
+
        FREE(nv20_render);
 }
 
@@ -208,7 +393,10 @@ nv20_vbuf_render_create( struct nv20_context *nv20 )
        nv20_render->base.max_vertex_buffer_bytes = 16*1024;
        nv20_render->base.max_indices = 1024;
        nv20_render->base.get_vertex_info = nv20_vbuf_render_get_vertex_info;
-       nv20_render->base.allocate_vertices = nv20_vbuf_render_allocate_vertices;
+       nv20_render->base.allocate_vertices =
+                                       nv20_vbuf_render_allocate_vertices;
+       nv20_render->base.map_vertices = nv20_vbuf_render_map_vertices;
+       nv20_render->base.unmap_vertices = nv20_vbuf_render_unmap_vertices;
        nv20_render->base.set_primitive = nv20_vbuf_render_set_primitive;
        nv20_render->base.draw = nv20_vbuf_render_draw;
        nv20_render->base.release_vertices = nv20_vbuf_render_release_vertices;