svga: fix draw elements with 8-bits indices
[mesa.git] / src / gallium / drivers / svga / svga_draw_elements.c
index 83527c6ef496ce4d04084adf8ce7f50152251a3a..dd977b1bc2da69eaeea0e0382194d504392ccb03 100644 (file)
@@ -24,6 +24,7 @@
  **********************************************************/
 
 #include "util/u_inlines.h"
+#include "util/u_prim.h"
 #include "util/u_upload_mgr.h"
 #include "indices/u_indices.h"
 
 #include "svga_resource_buffer.h"
 #include "svga_winsys.h"
 #include "svga_context.h"
-
 #include "svga_hw_reg.h"
 
 
+/**
+ * Return a new index buffer which contains a translation of the original
+ * index buffer.  An example of a translation is converting from QUAD
+ * primitives to TRIANGLE primitives.  Each set of four indices for a quad
+ * will be converted to six indices for two triangles.
+ *
+ * Before generating the new index buffer we'll check if the incoming
+ * buffer already has a translated buffer that can be re-used.
+ * This benefits demos like Cinebench R15 which has many
+ * glDrawElements(GL_QUADS) commands (we can't draw quads natively).
+ *
+ * \param info  draw info; supplies the source indices (index buffer or
+ *              user pointer), the original primitive type (info->mode,
+ *              like PIPE_PRIM_QUADS) and the offset in bytes to the first
+ *              index to translate (info->start * info->index_size)
+ * \param gen_prim  new/generated primitive type (like PIPE_PRIM_TRIANGLES)
+ * \param orig_nr  number of indices to translate in source buffer
+ * \param gen_nr  number of indices to write into new/dest buffer
+ * \param gen_size  bytes per generated index (2 or 4)
+ * \param translate  the translation function from the u_translate module
+ * \param out_buf  returns the new/translated index buffer
+ * \param out_offset  returns the offset in bytes of the translated indices
+ *                    within out_buf (not written when a previously
+ *                    translated buffer is re-used)
+ * \return error code to indicate success or failure
+ */
 static enum pipe_error
-translate_indices( struct svga_hwtnl *hwtnl,
-                   struct pipe_resource *src,
-                   unsigned offset,
-                   unsigned nr,
-                   unsigned index_size,
-                   u_translate_func translate,
-                   struct pipe_resource **out_buf )
+translate_indices(struct svga_hwtnl *hwtnl,
+                  const struct pipe_draw_info *info,
+                  enum pipe_prim_type gen_prim,
+                  unsigned orig_nr, unsigned gen_nr,
+                  unsigned gen_size,
+                  u_translate_func translate,
+                  struct pipe_resource **out_buf,
+                  unsigned *out_offset)
 {
    struct pipe_context *pipe = &hwtnl->svga->pipe;
+   struct svga_screen *screen = svga_screen(pipe->screen);
+   struct svga_buffer *src_sbuf = NULL;
    struct pipe_transfer *src_transfer = NULL;
    struct pipe_transfer *dst_transfer = NULL;
-   unsigned size = index_size * nr;
+   const unsigned size = gen_size * gen_nr;
+   const unsigned offset = info->start * info->index_size;
    const void *src_map = NULL;
    struct pipe_resource *dst = NULL;
    void *dst_map = NULL;
 
-   dst = pipe_buffer_create( pipe->screen, 
-                            PIPE_BIND_INDEX_BUFFER, 
-                            size );
-   if (dst == NULL)
-      goto fail;
+   assert(gen_size == 2 || gen_size == 4);
+   if (!info->has_user_indices)
+      src_sbuf = svga_buffer(info->index.resource);
+
+   /* If the draw_info provides us with a buffer rather than a
+    * user pointer, check to see if we've already translated that buffer.
+    */
+   if (src_sbuf && !screen->debug.no_cache_index_buffers) {
+      /* Check if we already have a translated index buffer */
+      if (src_sbuf->translated_indices.buffer &&
+          src_sbuf->translated_indices.orig_prim == info->mode &&
+          src_sbuf->translated_indices.new_prim == gen_prim &&
+          src_sbuf->translated_indices.offset == offset &&
+          src_sbuf->translated_indices.count == orig_nr &&
+          src_sbuf->translated_indices.index_size == gen_size) {
+         pipe_resource_reference(out_buf, src_sbuf->translated_indices.buffer);
+         return PIPE_OK;
+      }
+   }
 
-   src_map = pipe_buffer_map( pipe, src, PIPE_TRANSFER_READ, &src_transfer );
-   if (src_map == NULL)
-      goto fail;
+   /* Need to trim vertex count to make sure we don't write too much data
+    * to the dst buffer in the translate() call.
+    */
+   u_trim_pipe_prim(gen_prim, &gen_nr);
 
-   dst_map = pipe_buffer_map( pipe, dst, PIPE_TRANSFER_WRITE, &dst_transfer );
-   if (dst_map == NULL)
-      goto fail;
+   if (src_sbuf) {
+      /* If we have a source buffer, create a destination buffer in the
+       * hope that we can reuse the translated data later. If not,
+       * we'd probably be better off using the upload buffer.
+       */
+      dst = pipe_buffer_create(pipe->screen,
+                               PIPE_BIND_INDEX_BUFFER, PIPE_USAGE_IMMUTABLE,
+                               size);
+      if (!dst)
+         goto fail;
+
+      dst_map = pipe_buffer_map(pipe, dst, PIPE_TRANSFER_WRITE, &dst_transfer);
+      if (!dst_map)
+         goto fail;
+
+      *out_offset = 0;
+      src_map = pipe_buffer_map(pipe, info->index.resource,
+                                PIPE_TRANSFER_READ |
+                                PIPE_TRANSFER_UNSYNCHRONIZED,
+                                &src_transfer);
+      if (!src_map)
+         goto fail;
+   } else {
+      /* Allocate upload buffer space. Align to the index size. */
+      u_upload_alloc(pipe->stream_uploader, 0, size, gen_size,
+                     out_offset, &dst, &dst_map);
+      if (!dst)
+         goto fail;
+
+      src_map = info->index.user;
+   }
+
+   translate((const char *) src_map + offset, 0, 0, gen_nr, 0, dst_map);
 
-   translate( (const char *)src_map + offset,
-              nr,
-              dst_map );
+   if (src_transfer)
+      pipe_buffer_unmap(pipe, src_transfer);
 
-   pipe_buffer_unmap( pipe, src_transfer );
-   pipe_buffer_unmap( pipe, dst_transfer );
+   if (dst_transfer)
+      pipe_buffer_unmap(pipe, dst_transfer);
+   else
+      u_upload_unmap(pipe->stream_uploader);
 
    *out_buf = dst;
+
+   if (src_sbuf && !screen->debug.no_cache_index_buffers) {
+      /* Save the new, translated index buffer in the hope we can use it
+       * again in the future.
+       */
+      pipe_resource_reference(&src_sbuf->translated_indices.buffer, dst);
+      src_sbuf->translated_indices.orig_prim = info->mode;
+      src_sbuf->translated_indices.new_prim = gen_prim;
+      src_sbuf->translated_indices.offset = offset;
+      src_sbuf->translated_indices.count = orig_nr;
+      src_sbuf->translated_indices.index_size = gen_size;
+   }
+
    return PIPE_OK;
 
-fail:
-   if (src_map)
-      pipe_buffer_unmap( pipe, src_transfer );
+ fail:
+   if (src_transfer)
+      pipe_buffer_unmap(pipe, src_transfer);
 
-   if (dst_map)
-      pipe_buffer_unmap( pipe, dst_transfer );
+   if (dst_transfer)
+      pipe_buffer_unmap(pipe, dst_transfer);
+   else if (dst_map)
+      u_upload_unmap(pipe->stream_uploader);
 
    if (dst)
-      pipe->screen->resource_destroy( pipe->screen, dst );
+      pipe_resource_reference(&dst, NULL);
 
    return PIPE_ERROR_OUT_OF_MEMORY;
 }
 
 
-
-
-
 enum pipe_error
-svga_hwtnl_simple_draw_range_elements( struct svga_hwtnl *hwtnl,
-                                       struct pipe_resource *index_buffer,
-                                       unsigned index_size,
-                                       int index_bias,
-                                       unsigned min_index,
-                                       unsigned max_index,
-                                       unsigned prim, 
-                                       unsigned start,
-                                       unsigned count )
+svga_hwtnl_simple_draw_range_elements(struct svga_hwtnl *hwtnl,
+                                      struct pipe_resource *index_buffer,
+                                      unsigned index_size, int index_bias,
+                                      unsigned min_index, unsigned max_index,
+                                      enum pipe_prim_type prim, unsigned start,
+                                      unsigned count,
+                                      unsigned start_instance,
+                                      unsigned instance_count,
+                                      ubyte vertices_per_patch)
 {
-   struct pipe_resource *upload_buffer = NULL;
    SVGA3dPrimitiveRange range;
    unsigned hw_prim;
    unsigned hw_count;
    unsigned index_offset = start * index_size;
-   int ret = PIPE_OK;
 
-   hw_prim = svga_translate_prim(prim, count, &hw_count);
+   hw_prim = svga_translate_prim(prim, count, &hw_count, vertices_per_patch);
    if (hw_count == 0)
-      goto done;
-
-   if (index_buffer && 
-       svga_buffer_is_user_buffer(index_buffer)) 
-   {
-      boolean flushed;
-      assert( index_buffer->width0 >= index_offset + count * index_size );
-
-      ret = u_upload_buffer( hwtnl->upload_ib,
-                             0,
-                             index_offset,
-                             count * index_size,
-                             index_buffer,
-                             &index_offset,
-                             &upload_buffer,
-                             &flushed );
-      if (ret)
-         goto done;
-
-      /* Don't need to worry about refcounting index_buffer as this is
-       * just a stack variable without a counted reference of its own.
-       * The caller holds the reference.
-       */
-      index_buffer = upload_buffer;
-   }
+      return PIPE_OK; /* nothing to draw */
 
    range.primType = hw_prim;
    range.primitiveCount = hw_count;
@@ -147,73 +204,90 @@ svga_hwtnl_simple_draw_range_elements( struct svga_hwtnl *hwtnl,
    range.indexArray.stride = index_size;
    range.indexWidth = index_size;
    range.indexBias = index_bias;
-      
-   ret = svga_hwtnl_prim( hwtnl, &range, min_index, max_index, index_buffer );
-   if (ret)
-      goto done;
 
-done:
-   if (upload_buffer)
-      pipe_resource_reference( &upload_buffer, NULL );
-
-   return ret;
+   return svga_hwtnl_prim(hwtnl, &range, count,
+                          min_index, max_index, index_buffer,
+                          start_instance, instance_count,
+                          NULL, NULL);
 }
 
 
-
-
 enum pipe_error
-svga_hwtnl_draw_range_elements( struct svga_hwtnl *hwtnl,
-                                struct pipe_resource *index_buffer,
-                                unsigned index_size,
-                                int index_bias,
-                                unsigned min_index,
-                                unsigned max_index,
-                                unsigned prim, unsigned start, unsigned count)
+svga_hwtnl_draw_range_elements(struct svga_hwtnl *hwtnl,
+                               const struct pipe_draw_info *info,
+                               unsigned count)
 {
-   unsigned gen_prim, gen_size, gen_nr, gen_type;
+   struct pipe_context *pipe = &hwtnl->svga->pipe;
+   enum pipe_prim_type gen_prim;
+   unsigned gen_size, gen_nr;
+   enum indices_mode gen_type;
    u_translate_func gen_func;
    enum pipe_error ret = PIPE_OK;
 
-   if (hwtnl->api_fillmode != PIPE_POLYGON_MODE_FILL && 
-       prim >= PIPE_PRIM_TRIANGLES) 
-   {
-      gen_type = u_unfilled_translator( prim,
-                                        index_size,
-                                        count,
-                                        hwtnl->api_fillmode,
-                                        &gen_prim,
-                                        &gen_size,
-                                        &gen_nr,
-                                        &gen_func );
+   SVGA_STATS_TIME_PUSH(svga_sws(hwtnl->svga),
+                        SVGA_STATS_TIME_HWTNLDRAWELEMENTS);
+
+   if (svga_need_unfilled_fallback(hwtnl, info->mode)) {
+      gen_type = u_unfilled_translator(info->mode,
+                                       info->index_size,
+                                       count,
+                                       hwtnl->api_fillmode,
+                                       &gen_prim,
+                                       &gen_size, &gen_nr, &gen_func);
    }
-   else
-   {
-      gen_type = u_index_translator( svga_hw_prims,
-                                     prim,
-                                     index_size,
-                                     count,
-                                     hwtnl->api_pv,
-                                     hwtnl->hw_pv,
-                                     &gen_prim,
-                                     &gen_size,
-                                     &gen_nr,
-                                     &gen_func );
+   else {
+      unsigned hw_pv;
+
+      /* There is no geometry ordering with PATCH, so no need to
+       * consider provoking vertex mode for the translation.
+       * So use the same api_pv as the hw_pv.
+       */
+      hw_pv = info->mode == PIPE_PRIM_PATCHES ? hwtnl->api_pv :
+                                                hwtnl->hw_pv;
+      gen_type = u_index_translator(svga_hw_prims,
+                                    info->mode,
+                                    info->index_size,
+                                    count,
+                                    hwtnl->api_pv,
+                                    hw_pv,
+                                    PR_DISABLE,
+                                    &gen_prim, &gen_size, &gen_nr, &gen_func);
    }
 
-   
-   if (gen_type == U_TRANSLATE_MEMCPY) {
-      /* No need for translation, just pass through to hardware: 
+   if ((gen_type == U_TRANSLATE_MEMCPY) && (info->index_size == gen_size)) {
+      /* No need for translation, just pass through to hardware:
        */
-      return svga_hwtnl_simple_draw_range_elements( hwtnl, index_buffer,
-                                                    index_size,
-                                                    index_bias,
-                                                    min_index,
-                                                    max_index,
-                                                    gen_prim, start, count );
+      unsigned start_offset = info->start * info->index_size;
+      struct pipe_resource *index_buffer = NULL;
+      unsigned index_offset;
+
+      if (info->has_user_indices) {
+         u_upload_data(pipe->stream_uploader, 0, count * info->index_size,
+                       info->index_size, (char *) info->index.user + start_offset,
+                       &index_offset, &index_buffer);
+         u_upload_unmap(pipe->stream_uploader);
+         index_offset /= info->index_size;
+      } else {
+         pipe_resource_reference(&index_buffer, info->index.resource);
+         index_offset = info->start;
+      }
+
+      assert(index_buffer != NULL);
+
+      ret = svga_hwtnl_simple_draw_range_elements(hwtnl, index_buffer,
+                                                  info->index_size,
+                                                  info->index_bias,
+                                                  info->min_index,
+                                                  info->max_index,
+                                                  gen_prim, index_offset, count,
+                                                  info->start_instance,
+                                                  info->instance_count,
+                                                  info->vertices_per_patch);
+      pipe_resource_reference(&index_buffer, NULL);
    }
    else {
       struct pipe_resource *gen_buf = NULL;
+      unsigned gen_offset = 0;
 
       /* Need to allocate a new index buffer and run the translate
        * func to populate it.  Could potentially cache this translated
@@ -222,37 +296,29 @@ svga_hwtnl_draw_range_elements( struct svga_hwtnl *hwtnl,
        * GL though, as index buffers are typically used only once
        * there.
        */
-      ret = translate_indices( hwtnl,
-                               index_buffer,
-                               start * index_size,
-                               gen_nr,
-                               gen_size,
-                               gen_func,
-                               &gen_buf );
-      if (ret)
-         goto done;
-
-      ret = svga_hwtnl_simple_draw_range_elements( hwtnl,
-                                                   gen_buf,
-                                                   gen_size,
-                                                   index_bias,
-                                                   min_index,
-                                                   max_index,
-                                                   gen_prim,
-                                                   0,
-                                                   gen_nr );
-      if (ret)
-         goto done;
-
-   done:
-      if (gen_buf)
-         pipe_resource_reference( &gen_buf, NULL );
-
-      return ret;
+      ret = translate_indices(hwtnl, info, gen_prim,
+                              count, gen_nr, gen_size,
+                              gen_func, &gen_buf, &gen_offset);
+      if (ret == PIPE_OK) {
+         gen_offset /= gen_size;
+         ret = svga_hwtnl_simple_draw_range_elements(hwtnl,
+                                                     gen_buf,
+                                                     gen_size,
+                                                     info->index_bias,
+                                                     info->min_index,
+                                                     info->max_index,
+                                                     gen_prim, gen_offset,
+                                                     gen_nr,
+                                                     info->start_instance,
+                                                     info->instance_count,
+                                                     info->vertices_per_patch);
+      }
+
+      if (gen_buf) {
+         pipe_resource_reference(&gen_buf, NULL);
+      }
    }
-}
-
-
-
-
 
+   SVGA_STATS_TIME_POP(svga_sws(hwtnl->svga));
+   return ret;
+}