Merge branch 'gallium-polygon-stipple'
[mesa.git] / src / mesa / drivers / dri / intel / intel_span.c
1 /**************************************************************************
2 *
3 * Copyright 2003 Tungsten Graphics, Inc., Cedar Park, Texas.
4 * Copyright 2011 Intel Corporation
5 * All Rights Reserved.
6 *
7 * Permission is hereby granted, free of charge, to any person obtaining a
8 * copy of this software and associated documentation files (the
9 * "Software"), to deal in the Software without restriction, including
10 * without limitation the rights to use, copy, modify, merge, publish,
11 * distribute, sub license, and/or sell copies of the Software, and to
12 * permit persons to whom the Software is furnished to do so, subject to
13 * the following conditions:
14 *
15 * The above copyright notice and this permission notice (including the
16 * next paragraph) shall be included in all copies or substantial portions
17 * of the Software.
18 *
19 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS
20 * OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF
21 * MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND NON-INFRINGEMENT.
22 * IN NO EVENT SHALL TUNGSTEN GRAPHICS AND/OR ITS SUPPLIERS BE LIABLE FOR
23 * ANY CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT,
24 * TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN CONNECTION WITH THE
25 * SOFTWARE OR THE USE OR OTHER DEALINGS IN THE SOFTWARE.
26 *
27 * Authors:
28 * Chad Versace <chad@chad-versace.us>
29 *
30 **************************************************************************/
31
32 #include <stdbool.h>
33 #include <stdint.h>
34 #include "main/glheader.h"
35 #include "main/macros.h"
36 #include "main/mtypes.h"
37 #include "main/colormac.h"
38 #include "main/renderbuffer.h"
39
40 #include "intel_buffers.h"
41 #include "intel_fbo.h"
42 #include "intel_screen.h"
43 #include "intel_span.h"
44 #include "intel_regions.h"
45 #include "intel_tex.h"
46
47 #include "swrast/swrast.h"
48
/* Forward declaration: defined at the end of this file, but already called
 * from intel_renderbuffer_map().
 */
static void intel_set_span_functions(struct intel_context *intel,
                                     struct gl_renderbuffer *rb);
52
/* Force DBG to 0 for the remainder of this file. */
#undef DBG
#define DBG 0

/*
 * Locals declared at the top of each generated colour span function
 * (presumably expanded by the spantmp2.h template -- confirm there).
 *
 * The clip rectangle is the whole renderbuffer, the row pitch is converted
 * from rb->RowStride to bytes by multiplying with the region's cpp, and the
 * pixel base address is rb->Data.  'p' is declared and immediately voided so
 * that it never triggers an unused-variable warning.
 */
#define LOCAL_VARS                                              \
   struct intel_renderbuffer *irb = intel_renderbuffer(rb);     \
   int minx = 0;                                                \
   int miny = 0;                                                \
   int maxx = rb->Width;                                        \
   int maxy = rb->Height;                                       \
   int pitch = rb->RowStride * irb->region->cpp;                \
   void *buf = rb->Data;                                        \
   GLuint p;                                                    \
   (void) p;

/* Clip-loop and lock hooks: all of them expand to nothing here. */
#define HW_CLIPLOOP()
#define HW_ENDCLIPLOOP()
#define HW_LOCK()
#define HW_UNLOCK()

/* Colour spans use the row index unchanged. */
#define Y_FLIP(_row) (_row)
74
75 /* r5g6b5 color span and pixel functions */
76 #define SPANTMP_PIXEL_FMT GL_RGB
77 #define SPANTMP_PIXEL_TYPE GL_UNSIGNED_SHORT_5_6_5
78 #define TAG(x) intel_##x##_RGB565
79 #define TAG2(x,y) intel_##x##y_RGB565
80 #include "spantmp2.h"
81
82 /* a4r4g4b4 color span and pixel functions */
83 #define SPANTMP_PIXEL_FMT GL_BGRA
84 #define SPANTMP_PIXEL_TYPE GL_UNSIGNED_SHORT_4_4_4_4_REV
85 #define TAG(x) intel_##x##_ARGB4444
86 #define TAG2(x,y) intel_##x##y_ARGB4444
87 #include "spantmp2.h"
88
89 /* a1r5g5b5 color span and pixel functions */
90 #define SPANTMP_PIXEL_FMT GL_BGRA
91 #define SPANTMP_PIXEL_TYPE GL_UNSIGNED_SHORT_1_5_5_5_REV
92 #define TAG(x) intel_##x##_ARGB1555
93 #define TAG2(x,y) intel_##x##y##_ARGB1555
94 #include "spantmp2.h"
95
96 /* a8r8g8b8 color span and pixel functions */
97 #define SPANTMP_PIXEL_FMT GL_BGRA
98 #define SPANTMP_PIXEL_TYPE GL_UNSIGNED_INT_8_8_8_8_REV
99 #define TAG(x) intel_##x##_ARGB8888
100 #define TAG2(x,y) intel_##x##y##_ARGB8888
101 #include "spantmp2.h"
102
103 /* x8r8g8b8 color span and pixel functions */
104 #define SPANTMP_PIXEL_FMT GL_BGR
105 #define SPANTMP_PIXEL_TYPE GL_UNSIGNED_INT_8_8_8_8_REV
106 #define TAG(x) intel_##x##_xRGB8888
107 #define TAG2(x,y) intel_##x##y##_xRGB8888
108 #include "spantmp2.h"
109
110 /* a8 color span and pixel functions */
111 #define SPANTMP_PIXEL_FMT GL_ALPHA
112 #define SPANTMP_PIXEL_TYPE GL_UNSIGNED_BYTE
113 #define TAG(x) intel_##x##_A8
114 #define TAG2(x,y) intel_##x##y##_A8
115 #include "spantmp2.h"
116
/* ------------------------------------------------------------------------- */
/* s8 stencil span and pixel functions                                       */
/* ------------------------------------------------------------------------- */

/*
 * HAVE_HW_STENCIL_SPANS chooses between memcpy and per-pixel for loops for
 * stencil reads and writes.  The stencil buffer is interleaved, so memcpy
 * cannot be used and the value stays 0.
 */
#define HAVE_HW_STENCIL_SPANS 0

/*
 * Locals for the generated stencil span functions.
 *
 * rb->Data and rb->RowStride, as set up by intelSpanRenderStart, are
 * deliberately ignored: intel_offset_S8 decodes the W tile by hand and
 * therefore needs the region's *real* base address and stride.
 *
 * The row count is taken as twice the region height (NOTE(review): presumably
 * because the region is allocated with half as many rows -- confirm against
 * the code that allocates the stencil region).  Renderbuffers with Name == 0
 * are addressed bottom-up through y_scale / y_bias.
 */
#define LOCAL_STENCIL_VARS                                      \
   (void) ctx;                                                  \
   int minx = 0;                                                \
   int miny = 0;                                                \
   int maxx = rb->Width;                                        \
   int maxy = rb->Height;                                       \
                                                                \
   struct intel_renderbuffer *irb = intel_renderbuffer(rb);     \
   uint8_t *buf = irb->region->buffer->virtual;                 \
   unsigned stride = irb->region->pitch;                        \
   unsigned height = 2 * irb->region->height;                   \
   bool flip = rb->Name == 0;                                   \
   int y_scale = flip ? -1 : 1;                                 \
   int y_bias = flip ? (height - 1) : 0;

/* Replace the identity Y_FLIP used by the colour spans. */
#undef Y_FLIP
#define Y_FLIP(_row) (y_scale * (_row) + y_bias)
151
/**
 * \brief Byte offset of stencil texel (x, y) inside a W-tiled buffer.
 *
 * The GTT cannot fence W-tiled surfaces, so the tile layout is decoded here
 * in software.  A tile is 64 bytes wide, 64 rows high and 4096 bytes long;
 * inside a tile the x and y bits are interleaved as described in
 *    - PRM, 2011 Sandy Bridge, Volume 1, Part 2, Section 4.5.2.1 W-Major Tile
 *      Format.
 *    - PRM, 2011 Sandy Bridge, Volume 1, Part 2, Section 4.5.3 Tiling Algorithm
 *
 * \param stride  number of bytes between vertically adjacent tiles, divided
 *                by the tile height (i.e. one row of tiles spans 64 * stride)
 * \param x       texel column
 * \param y       texel row
 * \return        offset in bytes from the start of the buffer
 *
 * The result is never negative; the return type is nevertheless signed
 * because of
 *    commit e8b1c6d6f55f5be3bef25084fdd8b6127517e137
 *    mesa: Fix return type of _mesa_get_format_bytes() (#37351)
 */
static inline intptr_t
intel_offset_S8(uint32_t stride, uint32_t x, uint32_t y)
{
   const uint32_t tile_dim = 64;          /* tiles are 64 x 64 bytes */
   const uint32_t bytes_per_tile = 4096;

   /* Coordinates of the byte relative to its tile's base address. */
   const uint32_t col = x % tile_dim;
   const uint32_t row = y % tile_dim;

   /* Start of the tile that contains (x, y). */
   const uint32_t tile_base = (y / tile_dim) * (tile_dim * stride)
                            + (x / tile_dim) * bytes_per_tile;

   /* Interleave the row/column bits; the fields never overlap, so OR-ing
    * them is the same as adding the weighted terms.
    */
   const uint32_t within_tile = ((col >> 3) << 9)         /* 512 * (col / 8)       */
                              | ((row >> 3) << 6)         /*  64 * (row / 8)       */
                              | (((row >> 2) & 1) << 5)   /*  32 * ((row / 4) % 2) */
                              | (((col >> 2) & 1) << 4)   /*  16 * ((col / 4) % 2) */
                              | (((row >> 1) & 1) << 3)   /*   8 * ((row / 2) % 2) */
                              | (((col >> 1) & 1) << 2)   /*   4 * ((col / 2) % 2) */
                              | ((row & 1) << 1)          /*   2 * (row % 2)       */
                              | (col & 1);                /*   1 * (col % 2)       */

   const uintptr_t offset = tile_base + within_tile;

   /*
    * Errata for Gen5 (documented here only; this function does not apply it):
    *
    * An additional offset is needed which is not documented in the PRM.
    *
    * if ((col / 8) % 2 == 1) {
    *    if ((row / 8) % 2 == 0) {
    *       offset += 64;
    *    } else {
    *       offset -= 64;
    *    }
    * }
    *
    * The offset is expressed more tersely as
    * offset += ((int) x & 0x8) * (8 - (((int) y & 0x8) << 1));
    */

   return offset;
}
213
214 #define WRITE_STENCIL(x, y, src) buf[intel_offset_S8(stride, x, y)] = src;
215 #define READ_STENCIL(dest, x, y) dest = buf[intel_offset_S8(stride, x, y)]
216 #define TAG(x) intel_##x##_S8
217 #include "stenciltmp.h"
218
219 /* ------------------------------------------------------------------------- */
220
221 void
222 intel_renderbuffer_map(struct intel_context *intel, struct gl_renderbuffer *rb)
223 {
224 struct intel_renderbuffer *irb = intel_renderbuffer(rb);
225
226 if (!irb)
227 return;
228
229 if (irb->wrapped_depth)
230 intel_renderbuffer_map(intel, irb->wrapped_depth);
231 if (irb->wrapped_stencil)
232 intel_renderbuffer_map(intel, irb->wrapped_stencil);
233
234 if (!irb->region)
235 return;
236
237 drm_intel_gem_bo_map_gtt(irb->region->buffer);
238
239 rb->Data = irb->region->buffer->virtual;
240 rb->RowStride = irb->region->pitch;
241
242 if (!rb->Name) {
243 /* Flip orientation of the window system buffer */
244 rb->Data += rb->RowStride * (irb->region->height - 1) * irb->region->cpp;
245 rb->RowStride = -rb->RowStride;
246 } else {
247 /* Adjust the base pointer of a texture image drawbuffer to the image
248 * within the miptree region (all else has draw_x/y = 0).
249 */
250 rb->Data += irb->draw_x * irb->region->cpp;
251 rb->Data += irb->draw_y * rb->RowStride * irb->region->cpp;
252 }
253
254 intel_set_span_functions(intel, rb);
255 }
256
257 void
258 intel_renderbuffer_unmap(struct intel_context *intel,
259 struct gl_renderbuffer *rb)
260 {
261 struct intel_renderbuffer *irb = intel_renderbuffer(rb);
262
263 if (!irb)
264 return;
265
266 if (irb->wrapped_depth)
267 intel_renderbuffer_unmap(intel, irb->wrapped_depth);
268 if (irb->wrapped_stencil)
269 intel_renderbuffer_unmap(intel, irb->wrapped_stencil);
270
271 if (!irb->region)
272 return;
273
274 drm_intel_gem_bo_unmap_gtt(irb->region->buffer);
275
276 rb->GetRow = NULL;
277 rb->PutRow = NULL;
278 rb->Data = NULL;
279 rb->RowStride = 0;
280 }
281
282 static void
283 intel_framebuffer_map(struct intel_context *intel, struct gl_framebuffer *fb)
284 {
285 int i;
286
287 for (i = 0; i < BUFFER_COUNT; i++) {
288 intel_renderbuffer_map(intel, fb->Attachment[i].Renderbuffer);
289 }
290
291 intel_check_front_buffer_rendering(intel);
292 }
293
294 static void
295 intel_framebuffer_unmap(struct intel_context *intel, struct gl_framebuffer *fb)
296 {
297 int i;
298
299 for (i = 0; i < BUFFER_COUNT; i++) {
300 intel_renderbuffer_unmap(intel, fb->Attachment[i].Renderbuffer);
301 }
302 }
303
304 /**
305 * Prepare for software rendering. Map current read/draw framebuffers'
306 * renderbuffes and all currently bound texture objects.
307 *
308 * Old note: Moved locking out to get reasonable span performance.
309 */
310 void
311 intelSpanRenderStart(struct gl_context * ctx)
312 {
313 struct intel_context *intel = intel_context(ctx);
314 GLuint i;
315
316 intel_flush(&intel->ctx);
317 intel_prepare_render(intel);
318
319 for (i = 0; i < ctx->Const.MaxTextureImageUnits; i++) {
320 if (ctx->Texture.Unit[i]._ReallyEnabled) {
321 struct gl_texture_object *texObj = ctx->Texture.Unit[i]._Current;
322
323 intel_finalize_mipmap_tree(intel, i);
324 intel_tex_map_images(intel, intel_texture_object(texObj));
325 }
326 }
327
328 intel_framebuffer_map(intel, ctx->DrawBuffer);
329 if (ctx->ReadBuffer != ctx->DrawBuffer) {
330 intel_framebuffer_map(intel, ctx->ReadBuffer);
331 }
332 }
333
334 /**
335 * Called when done software rendering. Unmap the buffers we mapped in
336 * the above function.
337 */
338 void
339 intelSpanRenderFinish(struct gl_context * ctx)
340 {
341 struct intel_context *intel = intel_context(ctx);
342 GLuint i;
343
344 _swrast_flush(ctx);
345
346 for (i = 0; i < ctx->Const.MaxTextureImageUnits; i++) {
347 if (ctx->Texture.Unit[i]._ReallyEnabled) {
348 struct gl_texture_object *texObj = ctx->Texture.Unit[i]._Current;
349 intel_tex_unmap_images(intel, intel_texture_object(texObj));
350 }
351 }
352
353 intel_framebuffer_unmap(intel, ctx->DrawBuffer);
354 if (ctx->ReadBuffer != ctx->DrawBuffer) {
355 intel_framebuffer_unmap(intel, ctx->ReadBuffer);
356 }
357 }
358
359
360 void
361 intelInitSpanFuncs(struct gl_context * ctx)
362 {
363 struct swrast_device_driver *swdd = _swrast_GetDeviceDriverReference(ctx);
364 swdd->SpanRenderStart = intelSpanRenderStart;
365 swdd->SpanRenderFinish = intelSpanRenderFinish;
366 }
367
368 void
369 intel_map_vertex_shader_textures(struct gl_context *ctx)
370 {
371 struct intel_context *intel = intel_context(ctx);
372 int i;
373
374 if (ctx->VertexProgram._Current == NULL)
375 return;
376
377 for (i = 0; i < ctx->Const.MaxTextureImageUnits; i++) {
378 if (ctx->Texture.Unit[i]._ReallyEnabled &&
379 ctx->VertexProgram._Current->Base.TexturesUsed[i] != 0) {
380 struct gl_texture_object *texObj = ctx->Texture.Unit[i]._Current;
381
382 intel_tex_map_images(intel, intel_texture_object(texObj));
383 }
384 }
385 }
386
387 void
388 intel_unmap_vertex_shader_textures(struct gl_context *ctx)
389 {
390 struct intel_context *intel = intel_context(ctx);
391 int i;
392
393 if (ctx->VertexProgram._Current == NULL)
394 return;
395
396 for (i = 0; i < ctx->Const.MaxTextureImageUnits; i++) {
397 if (ctx->Texture.Unit[i]._ReallyEnabled &&
398 ctx->VertexProgram._Current->Base.TexturesUsed[i] != 0) {
399 struct gl_texture_object *texObj = ctx->Texture.Unit[i]._Current;
400
401 intel_tex_unmap_images(intel, intel_texture_object(texObj));
402 }
403 }
404 }
405
406 typedef void (*span_init_func)(struct gl_renderbuffer *rb);
407
408 static span_init_func intel_span_init_funcs[MESA_FORMAT_COUNT] =
409 {
410 [MESA_FORMAT_A8] = intel_InitPointers_A8,
411 [MESA_FORMAT_RGB565] = intel_InitPointers_RGB565,
412 [MESA_FORMAT_ARGB4444] = intel_InitPointers_ARGB4444,
413 [MESA_FORMAT_ARGB1555] = intel_InitPointers_ARGB1555,
414 [MESA_FORMAT_XRGB8888] = intel_InitPointers_xRGB8888,
415 [MESA_FORMAT_ARGB8888] = intel_InitPointers_ARGB8888,
416 [MESA_FORMAT_SARGB8] = intel_InitPointers_ARGB8888,
417 [MESA_FORMAT_Z16] = _mesa_set_renderbuffer_accessors,
418 [MESA_FORMAT_X8_Z24] = _mesa_set_renderbuffer_accessors,
419 [MESA_FORMAT_S8_Z24] = _mesa_set_renderbuffer_accessors,
420 [MESA_FORMAT_S8] = intel_InitStencilPointers_S8,
421 [MESA_FORMAT_R8] = _mesa_set_renderbuffer_accessors,
422 [MESA_FORMAT_RG88] = _mesa_set_renderbuffer_accessors,
423 [MESA_FORMAT_R16] = _mesa_set_renderbuffer_accessors,
424 [MESA_FORMAT_RG1616] = _mesa_set_renderbuffer_accessors,
425 [MESA_FORMAT_RGBA_FLOAT32] = _mesa_set_renderbuffer_accessors,
426 [MESA_FORMAT_RG_FLOAT32] = _mesa_set_renderbuffer_accessors,
427 [MESA_FORMAT_R_FLOAT32] = _mesa_set_renderbuffer_accessors,
428 [MESA_FORMAT_INTENSITY_FLOAT32] = _mesa_set_renderbuffer_accessors,
429 [MESA_FORMAT_LUMINANCE_FLOAT32] = _mesa_set_renderbuffer_accessors,
430 };
431
432 bool
433 intel_span_supports_format(gl_format format)
434 {
435 return intel_span_init_funcs[format] != NULL;
436 }
437
438 /**
439 * Plug in appropriate span read/write functions for the given renderbuffer.
440 * These are used for the software fallbacks.
441 */
442 static void
443 intel_set_span_functions(struct intel_context *intel,
444 struct gl_renderbuffer *rb)
445 {
446 struct intel_renderbuffer *irb = (struct intel_renderbuffer *) rb;
447
448 assert(intel_span_init_funcs[irb->Base.Format]);
449 intel_span_init_funcs[irb->Base.Format](rb);
450 }