X-Git-Url: https://git.libre-soc.org/?a=blobdiff_plain;f=src%2Fmesa%2Fdrivers%2Fdri%2Fradeon%2Fradeon_span.c;h=fa5b2d98ff41e9f3816e1deeb36b097a55280d7e;hb=69d7782b155b72707d95a2f6b0c0776afbb888e3;hp=0c49c3713af2ee201272cb93b6aec6fd2459f010;hpb=46a784b7fd2dcab97c26d5ca02fb8f74945ba157;p=mesa.git

diff --git a/src/mesa/drivers/dri/radeon/radeon_span.c b/src/mesa/drivers/dri/radeon/radeon_span.c
index 0c49c3713af..fa5b2d98ff4 100644
--- a/src/mesa/drivers/dri/radeon/radeon_span.c
+++ b/src/mesa/drivers/dri/radeon/radeon_span.c
@@ -36,822 +36,116 @@ WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE SOFTWARE.
  * Authors:
  *   Kevin E. Martin <martin@valinux.com>
  *   Gareth Hughes <gareth@valinux.com>
- *   Keith Whitwell <keith@tungstengraphics.com>
+ *   Keith Whitwell <keithw@vmware.com>
  *
  */
 
 #include "main/glheader.h"
+#include "main/texformat.h"
+#include "main/renderbuffer.h"
+#include "main/samplerobj.h"
+#include "main/framebuffer.h"
 #include "swrast/swrast.h"
+#include "swrast/s_renderbuffer.h"
 
 #include "radeon_common.h"
-#include "radeon_lock.h"
 #include "radeon_span.h"
 
-#define DBG 0
 
-static void radeonSetSpanFunctions(struct radeon_renderbuffer *rrb);
-
-
-/* r200 depth buffer is always tiled - this is the formula
-   according to the docs unless I typo'ed in it
-*/
-#if defined(RADEON_R200)
-static GLubyte *r200_depth_2byte(const struct radeon_renderbuffer * rrb,
-				 GLint x, GLint y)
-{
-    GLubyte *ptr = rrb->bo->ptr;
-    GLint offset;
-    if (rrb->has_surface) {
-	offset = x * rrb->cpp + y * rrb->pitch;
-    } else {
-	GLuint b;
-	offset = 0;
-	b = (((y  >> 4) * (rrb->pitch >> 8) + (x >> 6)));
-	offset += (b >> 1) << 12;
-	offset += (((rrb->pitch >> 8) & 0x1) ? (b & 0x1) : ((b & 0x1) ^ ((y >> 4) & 0x1))) << 11;
-	offset += ((y >> 2) & 0x3) << 9;
-	offset += ((x >> 3) & 0x1) << 8;
-	offset += ((x >> 4) & 0x3) << 6;
-	offset += ((x >> 2) & 0x1) << 5;
-	offset += ((y >> 1) & 0x1) << 4;
-	offset += ((x >> 1) & 0x1) << 3;
-	offset += (y & 0x1) << 2;
-	offset += (x & 0x1) << 1;
-    }
-    return &ptr[offset];
-}
-
-static GLubyte *r200_depth_4byte(const struct radeon_renderbuffer * rrb,
-				 GLint x, GLint y)
+static void
+radeon_renderbuffer_map(struct gl_context *ctx,
+			struct gl_renderbuffer *rb,
+			bool flip_y)
 {
-    GLubyte *ptr = rrb->bo->ptr;
-    GLint offset;
-    if (rrb->has_surface) {
-	offset = x * rrb->cpp + y * rrb->pitch;
-    } else {
-	GLuint b;
-	offset = 0;
-	b = (((y & 0x7ff) >> 4) * (rrb->pitch >> 7) + (x >> 5));
-	offset += (b >> 1) << 12;
-	offset += (((rrb->pitch >> 7) & 0x1) ? (b & 0x1) : ((b & 0x1) ^ ((y >> 4) & 0x1))) << 11;
-	offset += ((y >> 2) & 0x3) << 9;
-	offset += ((x >> 2) & 0x1) << 8;
-	offset += ((x >> 3) & 0x3) << 6;
-	offset += ((y >> 1) & 0x1) << 5;
-	offset += ((x >> 1) & 0x1) << 4;
-	offset += (y & 0x1) << 3;
-	offset += (x & 0x1) << 2;
-    }
-    return &ptr[offset];
-}
-#endif
+	struct radeon_renderbuffer *rrb = radeon_renderbuffer(rb);
+	GLubyte *map;
+	int stride;
 
-/* r600 tiling
- * two main types:
- * - 1D (akin to macro-linear/micro-tiled on older asics)
- * - 2D (akin to macro-tiled/micro-tiled on older asics)
- * only 1D tiling is implemented below
- */
-#if defined(RADEON_R600)
-static inline GLint r600_1d_tile_helper(const struct radeon_renderbuffer * rrb,
-					GLint x, GLint y, GLint is_depth, GLint is_stencil)
-{
-    GLint element_bytes = rrb->cpp;
-    GLint num_samples = 1;
-    GLint tile_width = 8;
-    GLint tile_height = 8;
-    GLint tile_thickness = 1;
-    GLint pitch_elements = rrb->pitch / element_bytes;
-    GLint height = rrb->base.Height;
-    GLint z = 0;
-    GLint sample_number = 0;
-    /* */
-    GLint tile_bytes;
-    GLint tiles_per_row;
-    GLint tiles_per_slice;
-    GLint slice_offset;
-    GLint tile_row_index;
-    GLint tile_column_index;
-    GLint tile_offset;
-    GLint pixel_number = 0;
-    GLint element_offset;
-    GLint offset = 0;
-
-    tile_bytes = tile_width * tile_height * tile_thickness * element_bytes * num_samples;
-    tiles_per_row = pitch_elements / tile_width;
-    tiles_per_slice = tiles_per_row * (height / tile_height);
-    slice_offset = (z / tile_thickness) * tiles_per_slice * tile_bytes;
-    tile_row_index = y / tile_height;
-    tile_column_index = x / tile_width;
-    tile_offset = ((tile_row_index * tiles_per_row) + tile_column_index) * tile_bytes;
-
-    if (is_depth) {
-	    GLint pixel_offset = 0;
-
-	    pixel_number |= ((x >> 0) & 1) << 0; // pn[0] = x[0]
-	    pixel_number |= ((y >> 0) & 1) << 1; // pn[1] = y[0]
-	    pixel_number |= ((x >> 1) & 1) << 2; // pn[2] = x[1]
-	    pixel_number |= ((y >> 1) & 1) << 3; // pn[3] = y[1]
-	    pixel_number |= ((x >> 2) & 1) << 4; // pn[4] = x[2]
-	    pixel_number |= ((y >> 2) & 1) << 5; // pn[5] = y[2]
-	    switch (element_bytes) {
-	    case 2:
-		    pixel_offset = pixel_number * element_bytes * num_samples;
-		    break;
-	    case 4:
-		    /* stencil and depth data are stored separately within a tile.
-		     * stencil is stored in a contiguous tile before the depth tile.
-		     * stencil element is 1 byte, depth element is 3 bytes.
-		     * stencil tile is 64 bytes.
-		     */
-		    if (is_stencil)
-			    pixel_offset = pixel_number * 1 * num_samples;
-		    else
-			    pixel_offset = (pixel_number * 3 * num_samples) + 64;
-		    break;
-	    }
-	    element_offset = pixel_offset + (sample_number * element_bytes);
-    } else {
-	    GLint sample_offset;
-
-	    switch (element_bytes) {
-	    case 1:
-		    pixel_number |= ((x >> 0) & 1) << 0; // pn[0] = x[0]
-		    pixel_number |= ((x >> 1) & 1) << 1; // pn[1] = x[1]
-		    pixel_number |= ((x >> 2) & 1) << 2; // pn[2] = x[2]
-		    pixel_number |= ((y >> 1) & 1) << 3; // pn[3] = y[1]
-		    pixel_number |= ((y >> 0) & 1) << 4; // pn[4] = y[0]
-		    pixel_number |= ((y >> 2) & 1) << 5; // pn[5] = y[2]
-		    break;
-	    case 2:
-		    pixel_number |= ((x >> 0) & 1) << 0; // pn[0] = x[0]
-		    pixel_number |= ((x >> 1) & 1) << 1; // pn[1] = x[1]
-		    pixel_number |= ((x >> 2) & 1) << 2; // pn[2] = x[2]
-		    pixel_number |= ((y >> 0) & 1) << 3; // pn[3] = y[0]
-		    pixel_number |= ((y >> 1) & 1) << 4; // pn[4] = y[1]
-		    pixel_number |= ((y >> 2) & 1) << 5; // pn[5] = y[2]
-		    break;
-	    case 4:
-		    pixel_number |= ((x >> 0) & 1) << 0; // pn[0] = x[0]
-		    pixel_number |= ((x >> 1) & 1) << 1; // pn[1] = x[1]
-		    pixel_number |= ((y >> 0) & 1) << 2; // pn[2] = y[0]
-		    pixel_number |= ((x >> 2) & 1) << 3; // pn[3] = x[2]
-		    pixel_number |= ((y >> 1) & 1) << 4; // pn[4] = y[1]
-		    pixel_number |= ((y >> 2) & 1) << 5; // pn[5] = y[2]
-		    break;
-	    }
-	    sample_offset = sample_number * (tile_bytes / num_samples);
-	    element_offset = sample_offset + (pixel_number * element_bytes);
-    }
-    offset = slice_offset + tile_offset + element_offset;
-    return offset;
-}
+	if (!rb || !rrb)
+		return;
 
-/* depth buffers */
-static GLubyte *r600_ptr_depth(const struct radeon_renderbuffer * rrb,
-			       GLint x, GLint y)
-{
-    GLubyte *ptr = rrb->bo->ptr;
-    GLint offset = r600_1d_tile_helper(rrb, x, y, 1, 0);
-    return &ptr[offset];
-}
+	ctx->Driver.MapRenderbuffer(ctx, rb, 0, 0, rb->Width, rb->Height,
+				    GL_MAP_READ_BIT | GL_MAP_WRITE_BIT,
+				    &map, &stride, flip_y);
 
-static GLubyte *r600_ptr_stencil(const struct radeon_renderbuffer * rrb,
-				 GLint x, GLint y)
-{
-    GLubyte *ptr = rrb->bo->ptr;
-    GLint offset = r600_1d_tile_helper(rrb, x, y, 1, 1);
-    return &ptr[offset];
+	rrb->base.Map = map;
+	rrb->base.RowStride = stride;
+	/* No floating point color buffers, use GLubytes */
+	rrb->base.ColorType = GL_UNSIGNED_BYTE;
 }
 
-static GLubyte *r600_ptr_color(const struct radeon_renderbuffer * rrb,
-			       GLint x, GLint y)
+static void
+radeon_renderbuffer_unmap(struct gl_context *ctx, struct gl_renderbuffer *rb)
 {
-    GLubyte *ptr = rrb->bo->ptr;
-    uint32_t mask = RADEON_BO_FLAGS_MACRO_TILE | RADEON_BO_FLAGS_MICRO_TILE;
-    GLint offset;
-
-    if (rrb->has_surface || !(rrb->bo->flags & mask)) {
-        offset = x * rrb->cpp + y * rrb->pitch;
-    } else {
-	    offset = r600_1d_tile_helper(rrb, x, y, 0, 0);
-    }
-    return &ptr[offset];
-}
+	struct radeon_renderbuffer *rrb = radeon_renderbuffer(rb);
+	if (!rb || !rrb)
+		return;
 
-#else
-
-/* radeon tiling on r300-r500 has 4 states,
-   macro-linear/micro-linear
-   macro-linear/micro-tiled
-   macro-tiled /micro-linear
-   macro-tiled /micro-tiled
-   1 byte surface 
-   2 byte surface - two types - we only provide 8x2 microtiling
-   4 byte surface
-   8/16 byte (unused)
-*/
-static GLubyte *radeon_ptr_4byte(const struct radeon_renderbuffer * rrb,
-			     GLint x, GLint y)
-{
-    GLubyte *ptr = rrb->bo->ptr;
-    uint32_t mask = RADEON_BO_FLAGS_MACRO_TILE | RADEON_BO_FLAGS_MICRO_TILE;
-    GLint offset;
-
-    if (rrb->has_surface || !(rrb->bo->flags & mask)) {
-        offset = x * rrb->cpp + y * rrb->pitch;
-    } else {
-        offset = 0;
-        if (rrb->bo->flags & RADEON_BO_FLAGS_MACRO_TILE) {
-	    if (rrb->bo->flags & RADEON_BO_FLAGS_MICRO_TILE) {
-		offset = ((y >> 4) * (rrb->pitch >> 7) + (x >> 5)) << 11;
-		offset += (((y >> 3) ^ (x >> 5)) & 0x1) << 10;
-		offset += (((y >> 4) ^ (x >> 4)) & 0x1) << 9;
-		offset += (((y >> 2) ^ (x >> 4)) & 0x1) << 8;
-		offset += (((y >> 3) ^ (x >> 3)) & 0x1) << 7;
-		offset += ((y >> 1) & 0x1) << 6;
-		offset += ((x >> 2) & 0x1) << 5;
-		offset += (y & 1) << 4;
-		offset += (x & 3) << 2;
-            } else {
-		offset = ((y >> 3) * (rrb->pitch >> 8) + (x >> 6)) << 11;
-		offset += (((y >> 2) ^ (x >> 6)) & 0x1) << 10;
-		offset += (((y >> 3) ^ (x >> 5)) & 0x1) << 9;
-		offset += (((y >> 1) ^ (x >> 5)) & 0x1) << 8;
-		offset += (((y >> 2) ^ (x >> 4)) & 0x1) << 7;
-		offset += (y & 1) << 6;
-		offset += (x & 15) << 2;
-            }
-        } else {
-	    offset = ((y >> 1) * (rrb->pitch >> 4) + (x >> 2)) << 5;
-	    offset += (y & 1) << 4;
-	    offset += (x & 3) << 2;
-        }
-    }
-    return &ptr[offset];
-}
+	ctx->Driver.UnmapRenderbuffer(ctx, rb);
 
-static GLubyte *radeon_ptr_2byte_8x2(const struct radeon_renderbuffer * rrb,
-				     GLint x, GLint y)
-{
-    GLubyte *ptr = rrb->bo->ptr;
-    uint32_t mask = RADEON_BO_FLAGS_MACRO_TILE | RADEON_BO_FLAGS_MICRO_TILE;
-    GLint offset;
-
-    if (rrb->has_surface || !(rrb->bo->flags & mask)) {
-        offset = x * rrb->cpp + y * rrb->pitch;
-    } else {
-        offset = 0;
-        if (rrb->bo->flags & RADEON_BO_FLAGS_MACRO_TILE) {
-            if (rrb->bo->flags & RADEON_BO_FLAGS_MICRO_TILE) {
-		offset = ((y >> 4) * (rrb->pitch >> 7) + (x >> 6)) << 11;
-		offset += (((y >> 3) ^ (x >> 6)) & 0x1) << 10;
-		offset += (((y >> 4) ^ (x >> 5)) & 0x1) << 9;
-		offset += (((y >> 2) ^ (x >> 5)) & 0x1) << 8;
-		offset += (((y >> 3) ^ (x >> 4)) & 0x1) << 7;
-		offset += ((y >> 1) & 0x1) << 6;
-		offset += ((x >> 3) & 0x1) << 5;
-		offset += (y & 1) << 4;
-		offset += (x & 3) << 2;
-            } else {
-		offset = ((y >> 3) * (rrb->pitch >> 8) + (x >> 7)) << 11;
-		offset += (((y >> 2) ^ (x >> 7)) & 0x1) << 10;
-		offset += (((y >> 3) ^ (x >> 6)) & 0x1) << 9;
-		offset += (((y >> 1) ^ (x >> 6)) & 0x1) << 8;
-		offset += (((y >> 2) ^ (x >> 5)) & 0x1) << 7;
-		offset += (y & 1) << 6;
-		offset += ((x >> 4) & 0x1) << 5;
-                offset += (x & 15) << 2;
-            }
-        } else {
-	    offset = ((y >> 1) * (rrb->pitch >> 4) + (x >> 3)) << 5;
-	    offset += (y & 0x1) << 4;
-	    offset += (x & 0x7) << 1;
-        }
-    }
-    return &ptr[offset];
+	rrb->base.Map = NULL;
+	rrb->base.RowStride = 0;
 }
 
-#endif
-
-#ifndef RADEON_R300
-#ifndef RADEON_R600
-static uint32_t
-z24s8_to_s8z24(uint32_t val)
+static void
+radeon_map_framebuffer(struct gl_context *ctx, struct gl_framebuffer *fb)
 {
-   return (val << 24) | (val >> 8);
-}
+	GLuint i;
 
-static uint32_t
-s8z24_to_z24s8(uint32_t val)
-{
-   return (val >> 24) | (val << 8);
-}
-#endif
-#endif
+	radeon_print(RADEON_MEMORY, RADEON_TRACE,
+		"%s( %p , fb %p )\n",
+		     __func__, ctx, fb);
 
-/*
- * Note that all information needed to access pixels in a renderbuffer
- * should be obtained through the gl_renderbuffer parameter, not per-context
- * information.
- */
-#define LOCAL_VARS						\
-   struct radeon_context *radeon = RADEON_CONTEXT(ctx);			\
-   struct radeon_renderbuffer *rrb = (void *) rb;		\
-   const GLint yScale = ctx->DrawBuffer->Name ? 1 : -1;			\
-   const GLint yBias = ctx->DrawBuffer->Name ? 0 : rrb->base.Height - 1;\
-   unsigned int num_cliprects;						\
-   struct drm_clip_rect *cliprects;					\
-   int x_off, y_off;							\
-   GLuint p;						\
-   (void)p;						\
-   radeon_get_cliprects(radeon, &cliprects, &num_cliprects, &x_off, &y_off);
-
-#define LOCAL_DEPTH_VARS				\
-   struct radeon_context *radeon = RADEON_CONTEXT(ctx);			\
-   struct radeon_renderbuffer *rrb = (void *) rb;	\
-   const GLint yScale = ctx->DrawBuffer->Name ? 1 : -1;			\
-   const GLint yBias = ctx->DrawBuffer->Name ? 0 : rrb->base.Height - 1;\
-   unsigned int num_cliprects;						\
-   struct drm_clip_rect *cliprects;					\
-   int x_off, y_off;							\
-  radeon_get_cliprects(radeon, &cliprects, &num_cliprects, &x_off, &y_off);
-
-#define LOCAL_STENCIL_VARS LOCAL_DEPTH_VARS
-
-#define Y_FLIP(_y) ((_y) * yScale + yBias)
-
-#define HW_LOCK()
-
-#define HW_UNLOCK()
-
-/* XXX FBO: this is identical to the macro in spantmp2.h except we get
- * the cliprect info from the context, not the driDrawable.
- * Move this into spantmp2.h someday.
- */
-#define HW_CLIPLOOP()							\
-   do {									\
-      int _nc = num_cliprects;						\
-      while ( _nc-- ) {							\
-	 int minx = cliprects[_nc].x1 - x_off;				\
-	 int miny = cliprects[_nc].y1 - y_off;				\
-	 int maxx = cliprects[_nc].x2 - x_off;				\
-	 int maxy = cliprects[_nc].y2 - y_off;
-
-/* ================================================================
- * Color buffer
- */
-
-/* 16 bit, RGB565 color spanline and pixel functions
- */
-#define SPANTMP_PIXEL_FMT GL_RGB
-#define SPANTMP_PIXEL_TYPE GL_UNSIGNED_SHORT_5_6_5
-
-#define TAG(x)    radeon##x##_RGB565
-#define TAG2(x,y) radeon##x##_RGB565##y
-#if defined(RADEON_R600)
-#define GET_PTR(X,Y) r600_ptr_color(rrb, (X) + x_off, (Y) + y_off)
-#else
-#define GET_PTR(X,Y) radeon_ptr_2byte_8x2(rrb, (X) + x_off, (Y) + y_off)
-#endif
-#include "spantmp2.h"
-
-/* 16 bit, ARGB1555 color spanline and pixel functions
- */
-#define SPANTMP_PIXEL_FMT GL_BGRA
-#define SPANTMP_PIXEL_TYPE GL_UNSIGNED_SHORT_1_5_5_5_REV
-
-#define TAG(x)    radeon##x##_ARGB1555
-#define TAG2(x,y) radeon##x##_ARGB1555##y
-#if defined(RADEON_R600)
-#define GET_PTR(X,Y) r600_ptr_color(rrb, (X) + x_off, (Y) + y_off)
-#else
-#define GET_PTR(X,Y) radeon_ptr_2byte_8x2(rrb, (X) + x_off, (Y) + y_off)
-#endif
-#include "spantmp2.h"
-
-/* 16 bit, RGBA4 color spanline and pixel functions
- */
-#define SPANTMP_PIXEL_FMT GL_BGRA
-#define SPANTMP_PIXEL_TYPE GL_UNSIGNED_SHORT_4_4_4_4_REV
-
-#define TAG(x)    radeon##x##_ARGB4444
-#define TAG2(x,y) radeon##x##_ARGB4444##y
-#if defined(RADEON_R600)
-#define GET_PTR(X,Y) r600_ptr_color(rrb, (X) + x_off, (Y) + y_off)
-#else
-#define GET_PTR(X,Y) radeon_ptr_2byte_8x2(rrb, (X) + x_off, (Y) + y_off)
-#endif
-#include "spantmp2.h"
-
-/* 32 bit, xRGB8888 color spanline and pixel functions
- */
-#define SPANTMP_PIXEL_FMT GL_BGRA
-#define SPANTMP_PIXEL_TYPE GL_UNSIGNED_INT_8_8_8_8_REV
-
-#define TAG(x)    radeon##x##_xRGB8888
-#define TAG2(x,y) radeon##x##_xRGB8888##y
-#if defined(RADEON_R600)
-#define GET_VALUE(_x, _y) ((*(GLuint*)(r600_ptr_color(rrb, _x + x_off, _y + y_off)) | 0xff000000))
-#define PUT_VALUE(_x, _y, d) { \
-   GLuint *_ptr = (GLuint*)r600_ptr_color( rrb, _x + x_off, _y + y_off );		\
-   *_ptr = d;								\
-} while (0)
-#else
-#define GET_VALUE(_x, _y) ((*(GLuint*)(radeon_ptr_4byte(rrb, _x + x_off, _y + y_off)) | 0xff000000))
-#define PUT_VALUE(_x, _y, d) { \
-   GLuint *_ptr = (GLuint*)radeon_ptr_4byte( rrb, _x + x_off, _y + y_off );		\
-   *_ptr = d;								\
-} while (0)
-#endif
-#include "spantmp2.h"
-
-/* 32 bit, ARGB8888 color spanline and pixel functions
- */
-#define SPANTMP_PIXEL_FMT GL_BGRA
-#define SPANTMP_PIXEL_TYPE GL_UNSIGNED_INT_8_8_8_8_REV
-
-#define TAG(x)    radeon##x##_ARGB8888
-#define TAG2(x,y) radeon##x##_ARGB8888##y
-#if defined(RADEON_R600)
-#define GET_VALUE(_x, _y) (*(GLuint*)(r600_ptr_color(rrb, _x + x_off, _y + y_off)))
-#define PUT_VALUE(_x, _y, d) { \
-   GLuint *_ptr = (GLuint*)r600_ptr_color( rrb, _x + x_off, _y + y_off );		\
-   *_ptr = d;								\
-} while (0)
-#else
-#define GET_VALUE(_x, _y) (*(GLuint*)(radeon_ptr_4byte(rrb, _x + x_off, _y + y_off)))
-#define PUT_VALUE(_x, _y, d) { \
-   GLuint *_ptr = (GLuint*)radeon_ptr_4byte( rrb, _x + x_off, _y + y_off );		\
-   *_ptr = d;								\
-} while (0)
-#endif
-#include "spantmp2.h"
-
-/* ================================================================
- * Depth buffer
- */
-
-/* The Radeon family has depth tiling on all the time, so we have to convert
- * the x,y coordinates into the memory bus address (mba) in the same
- * manner as the engine.  In each case, the linear block address (ba)
- * is calculated, and then wired with x and y to produce the final
- * memory address.
- * The chip will do address translation on its own if the surface registers
- * are set up correctly. It is not quite enough to get it working with hyperz
- * too...
- */
-
-/* 16-bit depth buffer functions
- */
-#define VALUE_TYPE GLushort
-
-#if defined(RADEON_R200)
-#define WRITE_DEPTH( _x, _y, d )					\
-   *(GLushort *)r200_depth_2byte(rrb, _x + x_off, _y + y_off) = d
-#elif defined(RADEON_R600)
-#define WRITE_DEPTH( _x, _y, d )					\
-   *(GLushort *)r600_ptr_depth(rrb, _x + x_off, _y + y_off) = d
-#else
-#define WRITE_DEPTH( _x, _y, d )					\
-   *(GLushort *)radeon_ptr_2byte_8x2(rrb, _x + x_off, _y + y_off) = d
-#endif
-
-#if defined(RADEON_R200)
-#define READ_DEPTH( d, _x, _y )						\
-   d = *(GLushort *)r200_depth_2byte(rrb, _x + x_off, _y + y_off)
-#elif defined(RADEON_R600)
-#define READ_DEPTH( d, _x, _y )						\
-   d = *(GLushort *)r600_ptr_depth(rrb, _x + x_off, _y + y_off)
-#else
-#define READ_DEPTH( d, _x, _y )						\
-   d = *(GLushort *)radeon_ptr_2byte_8x2(rrb, _x + x_off, _y + y_off)
-#endif
-
-#define TAG(x) radeon##x##_z16
-#include "depthtmp.h"
-
-/* 24 bit depth
- *
- * Careful: It looks like the R300 uses ZZZS byte order while the R200
- * uses SZZZ for 24 bit depth, 8 bit stencil mode.
- */
-#define VALUE_TYPE GLuint
-
-#if defined(RADEON_R300)
-#define WRITE_DEPTH( _x, _y, d )					\
-do {									\
-   GLuint *_ptr = (GLuint*)radeon_ptr_4byte( rrb, _x + x_off, _y + y_off );		\
-   GLuint tmp = *_ptr;				\
-   tmp &= 0x000000ff;							\
-   tmp |= ((d << 8) & 0xffffff00);					\
-   *_ptr = tmp;					\
-} while (0)
-#elif defined(RADEON_R600)
-#define WRITE_DEPTH( _x, _y, d )					\
-do {									\
-   GLuint *_ptr = (GLuint*)r600_ptr_depth( rrb, _x + x_off, _y + y_off );		\
-   GLuint tmp = *_ptr;				\
-   tmp &= 0xff000000;							\
-   tmp |= ((d) & 0x00ffffff);					\
-   *_ptr = tmp;					\
-} while (0)
-#elif defined(RADEON_R200)
-#define WRITE_DEPTH( _x, _y, d )					\
-do {									\
-   GLuint *_ptr = (GLuint*)r200_depth_4byte( rrb, _x + x_off, _y + y_off );		\
-   GLuint tmp = *_ptr;				\
-   tmp &= 0xff000000;							\
-   tmp |= ((d) & 0x00ffffff);						\
-   *_ptr = tmp;					\
-} while (0)
-#else
-#define WRITE_DEPTH( _x, _y, d )					\
-do {									\
-   GLuint *_ptr = (GLuint*)radeon_ptr_4byte( rrb, _x + x_off, _y + y_off );	\
-   GLuint tmp = *_ptr;							\
-   tmp &= 0xff000000;							\
-   tmp |= ((d) & 0x00ffffff);						\
-   *_ptr = tmp;					\
-} while (0)
-#endif
-
-#if defined(RADEON_R300)
-#define READ_DEPTH( d, _x, _y )						\
-  do {									\
-    d = (*(GLuint*)(radeon_ptr_4byte(rrb, _x + x_off, _y + y_off)) & 0xffffff00) >> 8; \
-  }while(0)
-#elif defined(RADEON_R600)
-#define READ_DEPTH( d, _x, _y )						\
-  do {									\
-    d = (*(GLuint*)(r600_ptr_depth(rrb, _x + x_off, _y + y_off)) & 0x00ffffff); \
-  }while(0)
-#elif defined(RADEON_R200)
-#define READ_DEPTH( d, _x, _y )						\
-  do {									\
-    d = *(GLuint*)(r200_depth_4byte(rrb, _x + x_off, _y + y_off)) & 0x00ffffff; \
-  }while(0)
-#else
-#define READ_DEPTH( d, _x, _y )	\
-  d = *(GLuint*)(radeon_ptr_4byte(rrb, _x + x_off,	_y + y_off)) & 0x00ffffff;
-#endif
-
-#define TAG(x) radeon##x##_z24
-#include "depthtmp.h"
-
-/* 24 bit depth, 8 bit stencil depthbuffer functions
- * EXT_depth_stencil
- *
- * Careful: It looks like the R300 uses ZZZS byte order while the R200
- * uses SZZZ for 24 bit depth, 8 bit stencil mode.
- */
-#define VALUE_TYPE GLuint
-
-#if defined(RADEON_R300)
-#define WRITE_DEPTH( _x, _y, d )					\
-do {									\
-   GLuint *_ptr = (GLuint*)radeon_ptr_4byte( rrb, _x + x_off, _y + y_off );		\
-   *_ptr = d;								\
-} while (0)
-#elif defined(RADEON_R600)
-#define WRITE_DEPTH( _x, _y, d )					\
-do {									\
-   GLuint *_ptr = (GLuint*)r600_ptr_depth( rrb, _x + x_off, _y + y_off );		\
-   GLuint tmp = *_ptr;				\
-   tmp &= 0xff000000;							\
-   tmp |= (((d) >> 8) & 0x00ffffff);					\
-   *_ptr = tmp;					\
-   _ptr = (GLuint*)r600_ptr_stencil(rrb, _x + x_off, _y + y_off);		\
-   tmp = *_ptr;				\
-   tmp &= 0xffffff00;							\
-   tmp |= (d) & 0xff;							\
-   *_ptr = tmp;					\
-} while (0)
-#elif defined(RADEON_R200)
-#define WRITE_DEPTH( _x, _y, d )					\
-do {									\
-   GLuint *_ptr = (GLuint*)r200_depth_4byte( rrb, _x + x_off, _y + y_off );		\
-   GLuint tmp = z24s8_to_s8z24(d);					\
-   *_ptr = tmp;								\
-} while (0)
-#else
-#define WRITE_DEPTH( _x, _y, d )					\
-do {									\
-   GLuint *_ptr = (GLuint*)radeon_ptr_4byte( rrb, _x + x_off, _y + y_off );	\
-   GLuint tmp = z24s8_to_s8z24(d);					\
-   *_ptr = tmp;					\
-} while (0)
-#endif
-
-#if defined(RADEON_R300)
-#define READ_DEPTH( d, _x, _y )						\
-  do { \
-    d = (*(GLuint*)(radeon_ptr_4byte(rrb, _x + x_off, _y + y_off)));	\
-  }while(0)
-#elif defined(RADEON_R600)
-#define READ_DEPTH( d, _x, _y )						\
-  do { \
-    d = ((*(GLuint*)(r600_ptr_depth(rrb, _x + x_off, _y + y_off))) << 8) & 0xffffff00; \
-    d |= (*(GLuint*)(r600_ptr_stencil(rrb, _x + x_off, _y + y_off))) & 0x000000ff;	\
-  }while(0)
-#elif defined(RADEON_R200)
-#define READ_DEPTH( d, _x, _y )						\
-  do { \
-    d = s8z24_to_z24s8(*(GLuint*)(r200_depth_4byte(rrb, _x + x_off, _y + y_off)));	\
-  }while(0)
-#else
-#define READ_DEPTH( d, _x, _y )	do {					\
-    d = s8z24_to_z24s8(*(GLuint*)(radeon_ptr_4byte(rrb, _x + x_off,	_y + y_off ))); \
-  } while (0)
-#endif
-
-#define TAG(x) radeon##x##_z24_s8
-#include "depthtmp.h"
-
-/* ================================================================
- * Stencil buffer
- */
-
-/* 24 bit depth, 8 bit stencil depthbuffer functions
- */
-#ifdef RADEON_R300
-#define WRITE_STENCIL( _x, _y, d )					\
-do {									\
-   GLuint *_ptr = (GLuint*)radeon_ptr_4byte(rrb, _x + x_off, _y + y_off);		\
-   GLuint tmp = *_ptr;				\
-   tmp &= 0xffffff00;							\
-   tmp |= (d) & 0xff;							\
-   *_ptr = tmp;					\
-} while (0)
-#elif defined(RADEON_R600)
-#define WRITE_STENCIL( _x, _y, d )					\
-do {									\
-   GLuint *_ptr = (GLuint*)r600_ptr_stencil(rrb, _x + x_off, _y + y_off);		\
-   GLuint tmp = *_ptr;				\
-   tmp &= 0xffffff00;							\
-   tmp |= (d) & 0xff;							\
-   *_ptr = tmp;					\
-} while (0)
-#elif defined(RADEON_R200)
-#define WRITE_STENCIL( _x, _y, d )					\
-do {									\
-   GLuint *_ptr = (GLuint*)r200_depth_4byte(rrb, _x + x_off, _y + y_off);		\
-   GLuint tmp = *_ptr;				\
-   tmp &= 0x00ffffff;							\
-   tmp |= (((d) & 0xff) << 24);						\
-   *_ptr = tmp;					\
-} while (0)
-#else
-#define WRITE_STENCIL( _x, _y, d )					\
-do {									\
-   GLuint *_ptr = (GLuint*)radeon_ptr_4byte(rrb, _x + x_off, _y + y_off);		\
-   GLuint tmp = *_ptr;				\
-   tmp &= 0x00ffffff;							\
-   tmp |= (((d) & 0xff) << 24);						\
-   *_ptr = tmp;					\
-} while (0)
-#endif
-
-#ifdef RADEON_R300
-#define READ_STENCIL( d, _x, _y )					\
-do {									\
-   GLuint *_ptr = (GLuint*)radeon_ptr_4byte( rrb, _x + x_off, _y + y_off );		\
-   GLuint tmp = *_ptr;				\
-   d = tmp & 0x000000ff;						\
-} while (0)
-#elif defined(RADEON_R600)
-#define READ_STENCIL( d, _x, _y )					\
-do {									\
-   GLuint *_ptr = (GLuint*)r600_ptr_stencil( rrb, _x + x_off, _y + y_off );		\
-   GLuint tmp = *_ptr;				\
-   d = tmp & 0x000000ff;						\
-} while (0)
-#elif defined(RADEON_R200)
-#define READ_STENCIL( d, _x, _y )					\
-do {									\
-   GLuint *_ptr = (GLuint*)r200_depth_4byte( rrb, _x + x_off, _y + y_off );		\
-   GLuint tmp = *_ptr;				\
-   d = (tmp & 0xff000000) >> 24;					\
-} while (0)
-#else
-#define READ_STENCIL( d, _x, _y )					\
-do {									\
-   GLuint *_ptr = (GLuint*)radeon_ptr_4byte( rrb, _x + x_off, _y + y_off );		\
-   GLuint tmp = *_ptr;				\
-   d = (tmp & 0xff000000) >> 24;					\
-} while (0)
-#endif
-
-#define TAG(x) radeon##x##_z24_s8
-#include "stenciltmp.h"
-
-
-static void map_unmap_rb(struct gl_renderbuffer *rb, int flag)
-{
-	struct radeon_renderbuffer *rrb = radeon_renderbuffer(rb);
-	int r;
-
-	if (rrb == NULL || !rrb->bo)
-		return;
+	/* check for render to textures */
+	for (i = 0; i < BUFFER_COUNT; i++)
+		radeon_renderbuffer_map(ctx, fb->Attachment[i].Renderbuffer,
+			fb->FlipY);
 
-	if (flag) {
-		if (rrb->bo->bom->funcs->bo_wait)
-			radeon_bo_wait(rrb->bo);
-		r = radeon_bo_map(rrb->bo, 1);
-		if (r) {
-			fprintf(stderr, "(%s) error(%d) mapping buffer.\n",
-				__FUNCTION__, r);
-		}
-
-		radeonSetSpanFunctions(rrb);
-	} else {
-		radeon_bo_unmap(rrb->bo);
-		rb->GetRow = NULL;
-		rb->PutRow = NULL;
-	}
+        if (_mesa_is_front_buffer_drawing(fb))
+		RADEON_CONTEXT(ctx)->front_buffer_dirty = true;
 }
 
 static void
-radeon_map_unmap_buffers(GLcontext *ctx, GLboolean map)
+radeon_unmap_framebuffer(struct gl_context *ctx, struct gl_framebuffer *fb)
 {
-	GLuint i, j;
+	GLuint i;
 
-	/* color draw buffers */
-	for (j = 0; j < ctx->DrawBuffer->_NumColorDrawBuffers; j++)
-		map_unmap_rb(ctx->DrawBuffer->_ColorDrawBuffers[j], map);
+	radeon_print(RADEON_MEMORY, RADEON_TRACE,
+		"%s( %p , fb %p)\n",
+		     __func__, ctx, fb);
 
 	/* check for render to textures */
-	for (i = 0; i < BUFFER_COUNT; i++) {
-		struct gl_renderbuffer_attachment *att =
-			ctx->DrawBuffer->Attachment + i;
-		struct gl_texture_object *tex = att->Texture;
-		if (tex) {
-			/* Render to texture. Note that a mipmapped texture need not
-			 * be complete for render to texture, so we must restrict to
-			 * mapping only the attached image.
-			 */
-			radeon_texture_image *image = get_radeon_texture_image(tex->Image[att->CubeMapFace][att->TextureLevel]);
-			ASSERT(att->Renderbuffer);
-
-			if (map)
-				radeon_teximage_map(image, GL_TRUE);
-			else
-				radeon_teximage_unmap(image);
-		}
-	}
-
-	map_unmap_rb(ctx->ReadBuffer->_ColorReadBuffer, map);
-
-	/* depth buffer (Note wrapper!) */
-	if (ctx->DrawBuffer->_DepthBuffer)
-		map_unmap_rb(ctx->DrawBuffer->_DepthBuffer->Wrapped, map);
-
-	if (ctx->DrawBuffer->_StencilBuffer)
-		map_unmap_rb(ctx->DrawBuffer->_StencilBuffer->Wrapped, map);
+	for (i = 0; i < BUFFER_COUNT; i++)
+		radeon_renderbuffer_unmap(ctx, fb->Attachment[i].Renderbuffer);
+
+        if (_mesa_is_front_buffer_drawing(fb))
+		RADEON_CONTEXT(ctx)->front_buffer_dirty = true;
 }
 
-static void radeonSpanRenderStart(GLcontext * ctx)
+static void radeonSpanRenderStart(struct gl_context * ctx)
 {
 	radeonContextPtr rmesa = RADEON_CONTEXT(ctx);
-	int i;
 
 	radeon_firevertices(rmesa);
 
-	/* The locking and wait for idle should really only be needed in classic mode.
-	 * In a future memory manager based implementation, this should become
-	 * unnecessary due to the fact that mapping our buffers, textures, etc.
-	 * should implicitly wait for any previous rendering commands that must
-	 * be waited on. */
-	if (!rmesa->radeonScreen->driScreen->dri2.enabled) {
-		LOCK_HARDWARE(rmesa);
-		radeonWaitForIdleLocked(rmesa);
-	}
-
-	for (i = 0; i < ctx->Const.MaxTextureImageUnits; i++) {
-		if (ctx->Texture.Unit[i]._ReallyEnabled)
-			ctx->Driver.MapTexture(ctx, ctx->Texture.Unit[i]._Current);
-	}
-
-	radeon_map_unmap_buffers(ctx, 1);
+	_swrast_map_textures(ctx);
+
+	radeon_map_framebuffer(ctx, ctx->DrawBuffer);
+	if (ctx->ReadBuffer != ctx->DrawBuffer)
+		radeon_map_framebuffer(ctx, ctx->ReadBuffer);
 }
 
-static void radeonSpanRenderFinish(GLcontext * ctx)
+static void radeonSpanRenderFinish(struct gl_context * ctx)
 {
-	radeonContextPtr rmesa = RADEON_CONTEXT(ctx);
-	int i;
 	_swrast_flush(ctx);
-	if (!rmesa->radeonScreen->driScreen->dri2.enabled) {
-		UNLOCK_HARDWARE(rmesa);
-	}
-	for (i = 0; i < ctx->Const.MaxTextureImageUnits; i++) {
-		if (ctx->Texture.Unit[i]._ReallyEnabled)
-			ctx->Driver.UnmapTexture(ctx, ctx->Texture.Unit[i]._Current);
-	}
-
-	radeon_map_unmap_buffers(ctx, 0);
+	_swrast_unmap_textures(ctx);
+
+	radeon_unmap_framebuffer(ctx, ctx->DrawBuffer);
+	if (ctx->ReadBuffer != ctx->DrawBuffer)
+		radeon_unmap_framebuffer(ctx, ctx->ReadBuffer);
 }
 
-void radeonInitSpanFuncs(GLcontext * ctx)
+void radeonInitSpanFuncs(struct gl_context * ctx)
 {
 	struct swrast_device_driver *swdd =
 	    _swrast_GetDeviceDriverReference(ctx);
@@ -859,30 +153,3 @@ void radeonInitSpanFuncs(GLcontext * ctx)
 	swdd->SpanRenderFinish = radeonSpanRenderFinish;
 }
 
-/**
- * Plug in the Get/Put routines for the given driRenderbuffer.
- */
-static void radeonSetSpanFunctions(struct radeon_renderbuffer *rrb)
-{
-	if (rrb->base._ActualFormat == GL_RGB5) {
-		radeonInitPointers_RGB565(&rrb->base);
-	} else if (rrb->base._ActualFormat == GL_RGB8) {
-		radeonInitPointers_xRGB8888(&rrb->base);
-	} else if (rrb->base._ActualFormat == GL_RGBA8) {
-		radeonInitPointers_ARGB8888(&rrb->base);
-	} else if (rrb->base._ActualFormat == GL_RGBA4) {
-		radeonInitPointers_ARGB4444(&rrb->base);
-	} else if (rrb->base._ActualFormat == GL_RGB5_A1) {
-		radeonInitPointers_ARGB1555(&rrb->base);
-	} else if (rrb->base._ActualFormat == GL_DEPTH_COMPONENT16) {
-		radeonInitDepthPointers_z16(&rrb->base);
-	} else if (rrb->base._ActualFormat == GL_DEPTH_COMPONENT24) {
-		radeonInitDepthPointers_z24(&rrb->base);
-	} else if (rrb->base._ActualFormat == GL_DEPTH24_STENCIL8_EXT) {
-		radeonInitDepthPointers_z24_s8(&rrb->base);
-	} else if (rrb->base._ActualFormat == GL_STENCIL_INDEX8_EXT) {
-		radeonInitStencilPointers_z24_s8(&rrb->base);
-	} else {
-		fprintf(stderr, "radeonSetSpanFunctions: bad actual format: 0x%04X\n", rrb->base._ActualFormat);
-	}
-}