Merge branch 'mesa_7_5_branch'
[mesa.git] / src / mesa / drivers / dri / r600 / r700_render.c
index 78b92d695e47080f0c483cb18512ce361c23aa5b..6705dbcf4b9aff5ba66fe5262872d4473f86a257 100644 (file)
 #include "r600_context.h"
 #include "r600_cmdbuf.h"
 
-#include "r700_chip.h"
-#include "r700_tex.h"
+#include "r600_tex.h"
 
 #include "r700_vertprog.h"
 #include "r700_fragprog.h"
 #include "r700_state.h"
 
+void r700WaitForIdle(context_t *context);
+void r700WaitForIdleClean(context_t *context);
+void r700Start3D(context_t *context);
+GLboolean r700SendTextureState(context_t *context);
+static unsigned int r700PrimitiveType(int prim);
+void r600UpdateTextureState(GLcontext * ctx);
+GLboolean r700SyncSurf(context_t *context,
+                      struct radeon_bo *pbo,
+                      uint32_t read_domain,
+                      uint32_t write_domain,
+                      uint32_t sync_type);
+
 void r700WaitForIdle(context_t *context)
 {
     BATCH_LOCALS(&context->radeon);
@@ -109,82 +120,60 @@ static GLboolean r700SetupShaders(GLcontext * ctx)
 {
     context_t *context = R700_CONTEXT(ctx);
 
-    R700_CHIP_CONTEXT *r700 = (R700_CHIP_CONTEXT*)(context->chipobj.pvChipObj);
+    R700_CHIP_CONTEXT *r700 = (R700_CHIP_CONTEXT*)(&context->hw);
 
     GLuint exportCount;
 
-       r700->SQ_PGM_RESOURCES_PS.u32All = 0;
-       r700->SQ_PGM_RESOURCES_VS.u32All = 0;
+    r700->ps.SQ_PGM_RESOURCES_PS.u32All = 0;
+    r700->vs.SQ_PGM_RESOURCES_VS.u32All = 0;
 
-       SETbit(r700->SQ_PGM_RESOURCES_PS.u32All, PGM_RESOURCES__PRIME_CACHE_ON_DRAW_bit);
-    SETbit(r700->SQ_PGM_RESOURCES_VS.u32All, PGM_RESOURCES__PRIME_CACHE_ON_DRAW_bit);
+    SETbit(r700->ps.SQ_PGM_RESOURCES_PS.u32All, PGM_RESOURCES__PRIME_CACHE_ON_DRAW_bit);
+    SETbit(r700->vs.SQ_PGM_RESOURCES_VS.u32All, PGM_RESOURCES__PRIME_CACHE_ON_DRAW_bit);
 
     r700SetupVertexProgram(ctx);
 
     r700SetupFragmentProgram(ctx);
 
-       exportCount = (r700->SQ_PGM_EXPORTS_PS.u32All & EXPORT_MODE_mask) / (1 << EXPORT_MODE_shift);
+    exportCount = (r700->ps.SQ_PGM_EXPORTS_PS.u32All & EXPORT_MODE_mask) / (1 << EXPORT_MODE_shift);
     r700->CB_SHADER_CONTROL.u32All = (1 << exportCount) - 1;
 
-    return GL_TRUE;
-}
+    r600UpdateTextureState(ctx);
 
-GLboolean r700SendTextureState(context_t *context)
-{
-    unsigned int i;
+    r700SendFSState(context); // FIXME just a place holder for now
+    r700SendPSState(context);
+    r700SendVSState(context);
 
-    R700_CHIP_CONTEXT *r700 = (R700_CHIP_CONTEXT*)(context->chipobj.pvChipObj);
-#if 0 /* to be enabled */
-    for(i=0; i<R700_TEXTURE_NUMBERUNITS; i++)
-    {
-        if(r700->texture_states.textures[i] != 0)
-        {
-            R700_CMDBUF_CHECK_SPACE(9);
-            R700EP3 (context, IT_SET_RESOURCE, 7);
-            R700E32 (context, i * 7);
-            R700E32 (context, r700->texture_states.textures[i]->SQ_TEX_RESOURCE0.u32All);
-            R700E32 (context, r700->texture_states.textures[i]->SQ_TEX_RESOURCE1.u32All);
-            R700E32 (context, r700->texture_states.textures[i]->SQ_TEX_RESOURCE2.u32All);
-            R700E32 (context, r700->texture_states.textures[i]->SQ_TEX_RESOURCE3.u32All);
-            R700E32 (context, r700->texture_states.textures[i]->SQ_TEX_RESOURCE4.u32All);
-            R700E32 (context, r700->texture_states.textures[i]->SQ_TEX_RESOURCE5.u32All);
-            R700E32 (context, r700->texture_states.textures[i]->SQ_TEX_RESOURCE6.u32All);
-        }
+    r700SendTextureState(context);
+    r700SetupStreams(ctx);
 
-        if(r700->texture_states.samplers[i] != 0)
-        {
-            R700_CMDBUF_CHECK_SPACE(5);
-            R700EP3 (context, IT_SET_SAMPLER, 3);        
-            R700E32 (context, i * 3);   // Base at 0x7000
-            R700E32 (context, r700->texture_states.samplers[i]->SQ_TEX_SAMPLER0.u32All);
-            R700E32 (context, r700->texture_states.samplers[i]->SQ_TEX_SAMPLER1.u32All);
-            R700E32 (context, r700->texture_states.samplers[i]->SQ_TEX_SAMPLER2.u32All);
-        }
-    }
-#endif
     return GL_TRUE;
 }
 
-GLboolean r700SyncSurf(context_t *context)
+GLboolean r700SyncSurf(context_t *context,
+                      struct radeon_bo *pbo,
+                      uint32_t read_domain,
+                      uint32_t write_domain,
+                      uint32_t sync_type)
 {
     BATCH_LOCALS(&context->radeon);
+    uint32_t cp_coher_size;
 
-    /* TODO : too heavy? */
-    unsigned int CP_COHER_CNTL   = 0;
-
-    CP_COHER_CNTL |= (TC_ACTION_ENA_bit
-                     | VC_ACTION_ENA_bit
-                     | CB_ACTION_ENA_bit
-                     | DB_ACTION_ENA_bit
-                     | SH_ACTION_ENA_bit
-                     | SMX_ACTION_ENA_bit);
+    if (!pbo)
+           return GL_FALSE;
 
+    if (pbo->size == 0xffffffff)
+           cp_coher_size = 0xffffffff;
+    else
+           cp_coher_size = ((pbo->size + 255) >> 8);
 
     BEGIN_BATCH_NO_AUTOSTATE(5);
     R600_OUT_BATCH(CP_PACKET3(R600_IT_SURFACE_SYNC, 3));
-    R600_OUT_BATCH(CP_COHER_CNTL);
-    R600_OUT_BATCH(0xFFFFFFFF);
-    R600_OUT_BATCH(0x00000000);
+    R600_OUT_BATCH(sync_type);
+    R600_OUT_BATCH(cp_coher_size);
+    R600_OUT_BATCH_RELOC(0,
+                        pbo,
+                        0,
+                        read_domain, write_domain, 0); // ???
     R600_OUT_BATCH(10);
 
     END_BATCH();
@@ -193,9 +182,9 @@ GLboolean r700SyncSurf(context_t *context)
     return GL_TRUE;
 }
 
-unsigned int r700PrimitiveType(int prim)
+static unsigned int r700PrimitiveType(int prim)
 {
-    switch (prim & PRIM_MODE_MASK) 
+    switch (prim & PRIM_MODE_MASK)
     {
     case GL_POINTS:
         return DI_PT_POINTLIST;
@@ -234,135 +223,110 @@ unsigned int r700PrimitiveType(int prim)
     }
 }
 
-static GLboolean r700RunRender(GLcontext * ctx,
-                                          struct tnl_pipeline_stage *stage)
+static void r700RunRenderPrimitive(GLcontext * ctx, int start, int end, int prim)
 {
-    context_t *context = R700_CONTEXT(ctx);
-    R700_CHIP_CONTEXT *r700 = (R700_CHIP_CONTEXT*)(context->chipobj.pvChipObj);
-#if 1
-    BATCH_LOCALS(&context->radeon);
+       context_t *context = R700_CONTEXT(ctx);
+       BATCH_LOCALS(&context->radeon);
+       int type, i, total_emit;
+       int num_indices = end - start;
+       uint32_t vgt_draw_initiator = 0;
+       uint32_t vgt_index_type     = 0;
+       uint32_t vgt_primitive_type = 0;
+       uint32_t vgt_num_indices    = 0;
+
+       type = r700PrimitiveType(prim);
+
+       if (type < 0 || num_indices <= 0)
+               return;
+
+        total_emit =   3 /* VGT_PRIMITIVE_TYPE */
+                    + 2 /* VGT_INDEX_TYPE */
+                    + 2 /* NUM_INSTANCES */
+                     + num_indices + 3; /* DRAW_INDEX_IMMD */
+
+        BEGIN_BATCH_NO_AUTOSTATE(total_emit);
+       // prim
+        SETfield(vgt_primitive_type, type,
+                VGT_PRIMITIVE_TYPE__PRIM_TYPE_shift, VGT_PRIMITIVE_TYPE__PRIM_TYPE_mask);
+        R600_OUT_BATCH(CP_PACKET3(R600_IT_SET_CONFIG_REG, 1));
+        R600_OUT_BATCH(mmVGT_PRIMITIVE_TYPE - ASIC_CONFIG_BASE_INDEX);
+        R600_OUT_BATCH(vgt_primitive_type);
 
-    unsigned int i, j;
-    TNLcontext *tnl = TNL_CONTEXT(ctx);
-    struct vertex_buffer *vb = &tnl->vb;
+       // index type
+        SETfield(vgt_index_type, DI_INDEX_SIZE_32_BIT, INDEX_TYPE_shift, INDEX_TYPE_mask);
+        R600_OUT_BATCH(CP_PACKET3(R600_IT_INDEX_TYPE, 0));
+        R600_OUT_BATCH(vgt_index_type);
 
-    struct r700_fragment_program *fp = (struct r700_fragment_program *)
-                                          (ctx->FragmentProgram._Current);
-    if (context->radeon.radeonScreen->chip_family < CHIP_FAMILY_RV770)
-    {
-        fp->r700AsmCode.bR6xx = 1;
-    }
+       // num instances
+       R600_OUT_BATCH(CP_PACKET3(R600_IT_NUM_INSTANCES, 0));
+        R600_OUT_BATCH(1);
 
-    r700Start3D(context); /* TODO : this is too much. */
+       // draw packet
+        vgt_num_indices = num_indices;
+        SETfield(vgt_draw_initiator, DI_SRC_SEL_IMMEDIATE, SOURCE_SELECT_shift, SOURCE_SELECT_mask);
+       SETfield(vgt_draw_initiator, DI_MAJOR_MODE_0, MAJOR_MODE_shift, MAJOR_MODE_mask);
 
-    r700SyncSurf(context); /* TODO : make it light. */
+        R600_OUT_BATCH(CP_PACKET3(R600_IT_DRAW_INDEX_IMMD, (num_indices + 1)));
+        R600_OUT_BATCH(vgt_num_indices);
+        R600_OUT_BATCH(vgt_draw_initiator);
 
-    r700UpdateShaders(ctx);
+        for (i = start; i < end; i++) {
+            R600_OUT_BATCH(i);
+        }
+        END_BATCH();
+        COMMIT_BATCH();
 
-    r700SetRenderTarget(context);
+}
 
-    if(r700SetupStreams(ctx))
-    {
-        return GL_TRUE;
-    }
+void r700EmitState(GLcontext * ctx)
+{
+       context_t *context = R700_CONTEXT(ctx);
+       radeonContextPtr radeon = &context->radeon;
 
-    /* flush TX */
-    //r700SyncSurf(context); /*  */
+       if (radeon->cmdbuf.cs->cdw && !radeon->hw.is_dirty && !radeon->hw.all_dirty)
+               return;
 
-    r700UpdateTextureState(context);
-    r700SendTextureState(context);
+       rcommonEnsureCmdBufSpace(&context->radeon,
+                                context->radeon.hw.max_state_size, __FUNCTION__);
 
-    if(GL_FALSE == fp->translated)
-    {
-        if( GL_FALSE == r700TranslateFragmentShader(fp, &(fp->mesa_program)) )
-        {
-            return GL_TRUE;
-        }
-    }
+       r700SendSQConfig(context);
 
-    /* flush SQ */
-    //r700SyncSurf(context); /*  */
-    //r700SyncSurf(context); /*  */
+       r700SendUCPState(context);
+       r700SendContextStates(context);
+       r700SendViewportState(context, 0);
+       r700SendRenderTargetState(context, 0);
+       r700SendDepthTargetState(context);
 
-    r700SetupShaders(ctx);
+}
+
+static GLboolean r700RunRender(GLcontext * ctx,
+                                          struct tnl_pipeline_stage *stage)
+{
+    context_t *context = R700_CONTEXT(ctx);
+    unsigned int i;
+    TNLcontext *tnl = TNL_CONTEXT(ctx);
+    struct vertex_buffer *vb = &tnl->vb;
 
-    /* set a valid base address to make the command checker happy */
-    r700->SQ_PGM_START_FS.u32All     = r700->SQ_PGM_START_PS.u32All;
-    r700->SQ_PGM_START_ES.u32All     = r700->SQ_PGM_START_PS.u32All;
-    r700->SQ_PGM_START_GS.u32All     = r700->SQ_PGM_START_PS.u32All;
+    r700Start3D(context);
 
-    /* flush vtx */
-    //r700SyncSurf(context); /*  */
+    r700UpdateShaders(ctx);
+    r700SetScissor(context);
+    r700SetupShaders(ctx);
 
-    r700SendContextStates(context, GL_FALSE);
+    r700EmitState(ctx);
 
     /* richard test code */
-    for (i = 0; i < vb->PrimitiveCount; i++) 
-    {
+    for (i = 0; i < vb->PrimitiveCount; i++) {
         GLuint prim = _tnl_translate_prim(&vb->Primitive[i]);
         GLuint start = vb->Primitive[i].start;
         GLuint end = vb->Primitive[i].start + vb->Primitive[i].count;
-        GLuint numIndices = vb->Primitive[i].count;
-        GLuint numEntires;
-               //r300RunRenderPrimitive(rmesa, ctx, start, end, prim);
-
-        unsigned int VGT_DRAW_INITIATOR = 0;
-        unsigned int VGT_INDEX_TYPE     = 0;
-        unsigned int VGT_PRIMITIVE_TYPE = 0;
-        unsigned int VGT_NUM_INDICES    = 0;
-        
-        numEntires = 2 /* VGT_INDEX_TYPE */
-                     + 3 /* VGT_PRIMITIVE_TYPE */
-                     + numIndices + 3; /* DRAW_INDEX_IMMD */                  
-                     
-        BEGIN_BATCH_NO_AUTOSTATE(numEntires);  
-
-        VGT_INDEX_TYPE |= DI_INDEX_SIZE_32_BIT << INDEX_TYPE_shift;
-
-        R600_OUT_BATCH(CP_PACKET3(R600_IT_INDEX_TYPE, 0));
-        R600_OUT_BATCH(VGT_INDEX_TYPE);
-
-        VGT_NUM_INDICES = numIndices;
-
-        VGT_PRIMITIVE_TYPE |= r700PrimitiveType(prim) << VGT_PRIMITIVE_TYPE__PRIM_TYPE_shift;
-        R600_OUT_BATCH(CP_PACKET3(R600_IT_SET_CONFIG_REG, 1));
-        R600_OUT_BATCH(mmVGT_PRIMITIVE_TYPE - ASIC_CONFIG_BASE_INDEX);
-        R600_OUT_BATCH(VGT_PRIMITIVE_TYPE);
-
-        VGT_DRAW_INITIATOR |= DI_SRC_SEL_IMMEDIATE << SOURCE_SELECT_shift;
-        VGT_DRAW_INITIATOR |= DI_MAJOR_MODE_0 << MAJOR_MODE_shift;
-
-        R600_OUT_BATCH(CP_PACKET3(R600_IT_DRAW_INDEX_IMMD, (numIndices + 1)));
-        R600_OUT_BATCH(VGT_NUM_INDICES);
-        R600_OUT_BATCH(VGT_DRAW_INITIATOR);
-
-        for (j=0; j<numIndices; j++)
-        {
-            R600_OUT_BATCH(j);
-        }
-        END_BATCH();
-        COMMIT_BATCH();
+       r700RunRenderPrimitive(ctx, start, end, prim);
     }
 
     /* Flush render op cached for last several quads. */
     r700WaitForIdleClean(context);
 
-    /* flush dst */
-    //r700SyncSurf(context); /*  */
-
-    radeonReleaseArrays(ctx, 0);
-
-    //richard test
-    /* test stamp, write a number to mmSCRATCH4 */
-#if 0
-    BEGIN_BATCH_NO_AUTOSTATE(3);
-    R600_OUT_BATCH_REGVAL((0x2144 << 2), 0x56785678);
-    END_BATCH();
-    COMMIT_BATCH();
-#endif
-
-#endif //0
-    rcommonFlushCmdBuf( &context->radeon, __FUNCTION__ );
+    radeonReleaseArrays(ctx, ~0);
 
     return GL_FALSE;
 }
@@ -385,15 +349,11 @@ static GLboolean r700RunTCLRender(GLcontext * ctx,  /*----------------------*/
     /**
     * Ensure all enabled and complete textures are uploaded along with any buffers being used.
     */
-    if(!r700ValidateBuffers(ctx))
+    if(!r600ValidateBuffers(ctx))
     {
         return GL_TRUE;
     }
 
-    context_t *context = R700_CONTEXT(ctx);
-
-    r700UpdateShaders(ctx);
-
     bRet = r700RunRender(ctx, stage);
 
     return bRet;