i965/fs: Support arbitrarily large sampler state indices on Haswell+.

author Kenneth Graunke <kenneth@whitecape.org>

Sat, 18 Jan 2014 21:29:39 +0000 (13:29 -0800)

committer Kenneth Graunke <kenneth@whitecape.org>

Thu, 23 Jan 2014 01:18:48 +0000 (17:18 -0800)
author Kenneth Graunke <kenneth@whitecape.org>
Sat, 18 Jan 2014 21:29:39 +0000 (13:29 -0800)
committer Kenneth Graunke <kenneth@whitecape.org>
Thu, 23 Jan 2014 01:18:48 +0000 (17:18 -0800)
diff --git a/src/mesa/drivers/dri/i965/brw_fs_generator.cpp b/src/mesa/drivers/dri/i965/brw_fs_generator.cpp

index 38c7c5c5e5e21dbbebd476dadc5674577c0e9554..40d86ebba238598840724d3e27f2329edefd6aa9 100644 (file)
--- a/src/mesa/drivers/dri/i965/brw_fs_generator.cpp
+++ b/src/mesa/drivers/dri/i965/brw_fs_generator.cpp
@@ -559,6 +559,23 @@ fs_generator::generate_tex(fs_inst *inst, struct brw_reg dst, struct brw_reg src
              brw_MOV(p, get_element_ud(header_reg, 2),
                         brw_imm_ud(inst->texture_offset));
           }
+
+         if (inst->sampler >= 16) {
+            /* The "Sampler Index" field can only store values between 0 and 15.
+             * However, we can add an offset to the "Sampler State Pointer"
+             * field, effectively selecting a different set of 16 samplers.
+             *
+             * The "Sampler State Pointer" needs to be aligned to a 32-byte
+             * offset, and each sampler state is only 16 bytes, so we can't
+             * exclusively use the offset - we have to use both.
+             */
+            assert(brw->is_haswell); /* field only exists on Haswell */
+            brw_ADD(p,
+                    get_element_ud(header_reg, 3),
+                    get_element_ud(brw_vec8_grf(0, 0), 3),
+                    brw_imm_ud(16 * (inst->sampler / 16) *
+                               sizeof(gen7_sampler_state)));
+         }
           brw_pop_insn_state(p);
        }
     }
@@ -573,7 +590,7 @@ fs_generator::generate_tex(fs_inst *inst, struct brw_reg dst, struct brw_reg src
               inst->base_mrf,
               src,
                surface_index,
-             inst->sampler,
+             inst->sampler % 16,
               msg_type,
               rlen,
               inst->mlen,
diff --git a/src/mesa/drivers/dri/i965/brw_fs_visitor.cpp b/src/mesa/drivers/dri/i965/brw_fs_visitor.cpp

index f49fcc71d5fed4051f210982660e096fd786fff7..28e4dd6c7926d3526741394a81d37b730ee05f5b 100644 (file)
--- a/src/mesa/drivers/dri/i965/brw_fs_visitor.cpp
+++ b/src/mesa/drivers/dri/i965/brw_fs_visitor.cpp
@@ -1250,13 +1250,16 @@ fs_visitor::emit_texture_gen7(ir_texture *ir, fs_reg dst, fs_reg coordinate,
     fs_reg payload = fs_reg(this, glsl_type::float_type);
     fs_reg next = payload;
  
-   if (ir->op == ir_tg4 || (ir->offset && ir->op != ir_txf)) {
+   if (ir->op == ir_tg4 || (ir->offset && ir->op != ir_txf) || sampler >= 16) {
        /* For general texture offsets (no txf workaround), we need a header to
         * put them in.  Note that for SIMD16 we're making space for two actual
         * hardware registers here, so the emit will have to fix up for this.
         *
         * * ir_tg4 needs to place its channel select in the header,
         * for interaction with ARB_texture_swizzle
+       *
+       * The sampler index is only 4 bits, so for larger sampler numbers we
+       * need to offset the Sampler State Pointer in the header.
         */
        header_present = true;
        next.reg_offset++;
author	Kenneth Graunke <kenneth@whitecape.org>
	Sat, 18 Jan 2014 21:29:39 +0000 (13:29 -0800)
committer	Kenneth Graunke <kenneth@whitecape.org>
	Thu, 23 Jan 2014 01:18:48 +0000 (17:18 -0800)
src/mesa/drivers/dri/i965/brw_fs_generator.cpp		patch \| blob \| history
src/mesa/drivers/dri/i965/brw_fs_visitor.cpp		patch \| blob \| history