Merge remote branch 'origin/mesa_7_7_branch'

[mesa.git] / src / mesa / drivers / dri / i965 / brw_sf_state.c
diff --git a/src/mesa/drivers/dri/i965/brw_sf_state.c b/src/mesa/drivers/dri/i965/brw_sf_state.c

index 38733c8c73462b8582e6647200f4b61c7673dc53..09223b7cfb1d95b01f9be4f39e8567b942ab65fb 100644 (file)
--- a/src/mesa/drivers/dri/i965/brw_sf_state.c
+++ b/src/mesa/drivers/dri/i965/brw_sf_state.c
@@ -93,7 +93,8 @@ static void upload_sf_vp(struct brw_context *brw)
     }
  
     dri_bo_unreference(brw->sf.vp_bo);
-   brw->sf.vp_bo = brw_cache_data( &brw->cache, BRW_SF_VP, &sfv, NULL, 0 );
+   brw->sf.vp_bo = brw_cache_data(&brw->cache, BRW_SF_VP, &sfv, sizeof(sfv),
+                                 NULL, 0);
  }
  
  const struct brw_tracked_state brw_sf_vp = {
@@ -114,6 +115,7 @@ struct brw_sf_unit_key {
     unsigned int nr_urb_entries, urb_size, sfsize;
  
     GLenum front_face, cull_face;
+   unsigned pv_first:1;
     unsigned scissor:1;
     unsigned line_smooth:1;
     unsigned point_sprite:1;
@@ -153,6 +155,9 @@ sf_unit_populate_key(struct brw_context *brw, struct brw_sf_unit_key *key)
     key->point_size = CLAMP(ctx->Point.Size, ctx->Point.MinSize, ctx->Point.MaxSize);
     key->point_attenuated = ctx->Point._Attenuated;
  
+   /* _NEW_LIGHT */
+   key->pv_first = (ctx->Light.ProvokingVertex == GL_FIRST_VERTEX_CONVENTION);
+
     key->render_to_fbo = brw->intel.ctx.DrawBuffer->Name != 0;
  }
  
@@ -160,9 +165,10 @@ static dri_bo *
  sf_unit_create_from_key(struct brw_context *brw, struct brw_sf_unit_key *key,
                         dri_bo **reloc_bufs)
  {
+   struct intel_context *intel = &brw->intel;
     struct brw_sf_unit_state sf;
     dri_bo *bo;
-
+   int chipset_max_threads;
     memset(&sf, 0, sizeof(sf));
  
     sf.thread0.grf_reg_count = ALIGN(key->total_grf, 16) / 16 - 1;
@@ -171,13 +177,26 @@ sf_unit_create_from_key(struct brw_context *brw, struct brw_sf_unit_key *key,
     sf.thread1.floating_point_mode = BRW_FLOATING_POINT_NON_IEEE_754;
  
     sf.thread3.dispatch_grf_start_reg = 3;
-   sf.thread3.urb_entry_read_offset = 1;
+
+   if (intel->is_ironlake)
+       sf.thread3.urb_entry_read_offset = 3;
+   else
+       sf.thread3.urb_entry_read_offset = 1;
+
     sf.thread3.urb_entry_read_length = key->urb_entry_read_length;
  
     sf.thread4.nr_urb_entries = key->nr_urb_entries;
     sf.thread4.urb_entry_allocation_size = key->sfsize - 1;
-   /* Each SF thread produces 1 PUE, and there can be up to 24 threads */
-   sf.thread4.max_threads = MIN2(24, key->nr_urb_entries) - 1;
+
+   /* Each SF thread produces 1 PUE, and there can be up to 24 (Pre-Ironlake) or
+    * 48 (Ironlake) threads.
+    */
+   if (intel->is_ironlake)
+      chipset_max_threads = 48;
+   else
+      chipset_max_threads = 24;
+
+   sf.thread4.max_threads = MIN2(chipset_max_threads, key->nr_urb_entries) - 1;
  
     if (INTEL_DEBUG & DEBUG_SINGLE_THREAD)
        sf.thread4.max_threads = 0;
@@ -271,9 +290,15 @@ sf_unit_create_from_key(struct brw_context *brw, struct brw_sf_unit_key *key,
  
     /* might be BRW_NEW_PRIMITIVE if we have to adjust pv for polygons:
      */
-   sf.sf7.trifan_pv = 2;
-   sf.sf7.linestrip_pv = 1;
-   sf.sf7.tristrip_pv = 2;
+   if (!key->pv_first) {
+      sf.sf7.trifan_pv = 2;
+      sf.sf7.linestrip_pv = 1;
+      sf.sf7.tristrip_pv = 2;
+   } else {
+      sf.sf7.trifan_pv = 1;
+      sf.sf7.linestrip_pv = 0;
+      sf.sf7.tristrip_pv = 0;
+   }
     sf.sf7.line_last_pixel_enable = 0;
  
     /* Set bias for OpenGL rasterization rules:
@@ -287,6 +312,9 @@ sf_unit_create_from_key(struct brw_context *brw, struct brw_sf_unit_key *key,
                          &sf, sizeof(sf),
                          NULL, NULL);
  
+   /* The STATE_PREFETCH command description says this state is loaded
+    * through the GPE (L2 ISC), so the relocation uses the INSTRUCTION domain.
+    */
     /* Emit SF program relocation */
     dri_bo_emit_reloc(bo,
                      I915_GEM_DOMAIN_INSTRUCTION, 0,
@@ -327,6 +355,7 @@ static void upload_sf_unit( struct brw_context *brw )
  const struct brw_tracked_state brw_sf_unit = {
     .dirty = {
        .mesa  = (_NEW_POLYGON | 
+               _NEW_LIGHT |
                 _NEW_LINE | 
                 _NEW_POINT | 
                 _NEW_SCISSOR |