Merge branch 'gallium-polygon-stipple'
[mesa.git] / src / gallium / auxiliary / util / u_tile.c
/**************************************************************************
 *
 * Copyright 2007 Tungsten Graphics, Inc., Cedar Park, Texas.
 * All Rights Reserved.
 *
 * Permission is hereby granted, free of charge, to any person obtaining a
 * copy of this software and associated documentation files (the
 * "Software"), to deal in the Software without restriction, including
 * without limitation the rights to use, copy, modify, merge, publish,
 * distribute, sub license, and/or sell copies of the Software, and to
 * permit persons to whom the Software is furnished to do so, subject to
 * the following conditions:
 *
 * The above copyright notice and this permission notice (including the
 * next paragraph) shall be included in all copies or substantial portions
 * of the Software.
 *
 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS
 * OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF
 * MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND NON-INFRINGEMENT.
 * IN NO EVENT SHALL TUNGSTEN GRAPHICS AND/OR ITS SUPPLIERS BE LIABLE FOR
 * ANY CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT,
 * TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN CONNECTION WITH THE
 * SOFTWARE OR THE USE OR OTHER DEALINGS IN THE SOFTWARE.
 *
 **************************************************************************/

/**
 * RGBA/float tile get/put functions.
 * Usable both by drivers and state trackers.
 */
32
33
34 #include "pipe/p_defines.h"
35 #include "util/u_inlines.h"
36
37 #include "util/u_format.h"
38 #include "util/u_math.h"
39 #include "util/u_memory.h"
40 #include "util/u_rect.h"
41 #include "util/u_tile.h"
42
43
44 /**
45 * Move raw block of pixels from transfer object to user memory.
46 */
47 void
48 pipe_get_tile_raw(struct pipe_context *pipe,
49 struct pipe_transfer *pt,
50 uint x, uint y, uint w, uint h,
51 void *dst, int dst_stride)
52 {
53 const void *src;
54
55 if (dst_stride == 0)
56 dst_stride = util_format_get_stride(pt->resource->format, w);
57
58 if (u_clip_tile(x, y, &w, &h, &pt->box))
59 return;
60
61 src = pipe->transfer_map(pipe, pt);
62 assert(src);
63 if(!src)
64 return;
65
66 util_copy_rect(dst, pt->resource->format, dst_stride, 0, 0, w, h, src, pt->stride, x, y);
67
68 pipe->transfer_unmap(pipe, pt);
69 }
70
71
72 /**
73 * Move raw block of pixels from user memory to transfer object.
74 */
75 void
76 pipe_put_tile_raw(struct pipe_context *pipe,
77 struct pipe_transfer *pt,
78 uint x, uint y, uint w, uint h,
79 const void *src, int src_stride)
80 {
81 void *dst;
82 enum pipe_format format = pt->resource->format;
83
84 if (src_stride == 0)
85 src_stride = util_format_get_stride(format, w);
86
87 if (u_clip_tile(x, y, &w, &h, &pt->box))
88 return;
89
90 dst = pipe->transfer_map(pipe, pt);
91 assert(dst);
92 if(!dst)
93 return;
94
95 util_copy_rect(dst, format, pt->stride, x, y, w, h, src, src_stride, 0, 0);
96
97 pipe->transfer_unmap(pipe, pt);
98 }
99
100
101
102
/** Convert short in [-32768,32767] to float in [-1.0,1.0] */
#define SHORT_TO_FLOAT(S)   ((2.0F * (S) + 1.0F) * (1.0F/65535.0F))

/**
 * Clamp float f to [-1.0,1.0], scale it by 32767 and store the result,
 * converted to short, in the lvalue us.
 *
 * The destination and the whole expansion are parenthesized so the macro
 * expands to a single expression regardless of what is passed as us or of
 * the operators surrounding the invocation.
 */
#define UNCLAMPED_FLOAT_TO_SHORT(us, f)  \
   ((us) = ( (short) ( CLAMP((f), -1.0, 1.0) * 32767.0F) ))
108
109
110
111 /*** PIPE_FORMAT_Z16_UNORM ***/
112
113 /**
114 * Return each Z value as four floats in [0,1].
115 */
116 static void
117 z16_get_tile_rgba(const ushort *src,
118 unsigned w, unsigned h,
119 float *p,
120 unsigned dst_stride)
121 {
122 const float scale = 1.0f / 65535.0f;
123 unsigned i, j;
124
125 for (i = 0; i < h; i++) {
126 float *pRow = p;
127 for (j = 0; j < w; j++, pRow += 4) {
128 pRow[0] =
129 pRow[1] =
130 pRow[2] =
131 pRow[3] = *src++ * scale;
132 }
133 p += dst_stride;
134 }
135 }
136
137
138
139
/*** PIPE_FORMAT_Z32_UNORM ***/

/**
 * Expand 32-bit depth values to RGBA floats.
 *
 * Each source value is multiplied by 1/0xffffffff in double precision,
 * converted to float and written to all four channels of the
 * corresponding output pixel.
 *
 * \param src         w*h consecutive 32-bit values, read row after row
 * \param w, h        tile size in pixels
 * \param p           output, four floats per pixel
 * \param dst_stride  distance between output rows, in floats
 */
static void
z32_get_tile_rgba(const unsigned *src,
                  unsigned w, unsigned h,
                  float *p,
                  unsigned dst_stride)
{
   const double scale = 1.0 / (double) 0xffffffff;
   unsigned row, col, chan;

   for (row = 0; row < h; row++, p += dst_stride) {
      float *texel = p;

      for (col = 0; col < w; col++, texel += 4, src++) {
         const float depth = (float) (*src * scale);

         for (chan = 0; chan < 4; chan++) {
            texel[chan] = depth;
         }
      }
   }
}
165
166
/*** PIPE_FORMAT_Z24_UNORM_S8_USCALED ***/

/**
 * Expand the depth part of packed 32-bit pixels to RGBA floats.
 *
 * Depth is taken from the low 24 bits of each pixel, multiplied by
 * 1/(2^24 - 1) and written to all four channels.  The top 8 bits are
 * ignored.
 *
 * \param src         w*h consecutive 32-bit pixels, read row after row
 * \param w, h        tile size in pixels
 * \param p           output, four floats per pixel
 * \param dst_stride  distance between output rows, in floats
 */
static void
s8z24_get_tile_rgba(const unsigned *src,
                    unsigned w, unsigned h,
                    float *p,
                    unsigned dst_stride)
{
   const double scale = 1.0 / ((1 << 24) - 1);
   unsigned row, col, chan;

   for (row = 0; row < h; row++, p += dst_stride) {
      float *texel = p;

      for (col = 0; col < w; col++, texel += 4, src++) {
         const float depth = (float) (scale * (*src & 0xffffff));

         for (chan = 0; chan < 4; chan++) {
            texel[chan] = depth;
         }
      }
   }
}
192
193
/*** PIPE_FORMAT_S8_USCALED_Z24_UNORM ***/

/**
 * Expand the depth part of packed 32-bit pixels to RGBA floats.
 *
 * Depth is taken from the high 24 bits of each pixel, multiplied by
 * 1/(2^24 - 1) and written to all four channels.  The low 8 bits are
 * ignored.
 *
 * \param src         w*h consecutive 32-bit pixels, read row after row
 * \param w, h        tile size in pixels
 * \param p           output, four floats per pixel
 * \param dst_stride  distance between output rows, in floats
 */
static void
z24s8_get_tile_rgba(const unsigned *src,
                    unsigned w, unsigned h,
                    float *p,
                    unsigned dst_stride)
{
   const double scale = 1.0 / ((1 << 24) - 1);
   unsigned row, col, chan;

   for (row = 0; row < h; row++, p += dst_stride) {
      float *texel = p;

      for (col = 0; col < w; col++, texel += 4, src++) {
         const float depth = (float) (scale * (*src >> 8));

         for (chan = 0; chan < 4; chan++) {
            texel[chan] = depth;
         }
      }
   }
}
219
/*** PIPE_FORMAT_X24S8_USCALED ***/

/**
 * Expand the stencil part of packed 32-bit pixels to RGBA floats.
 *
 * Stencil is taken from the top 8 bits of each pixel and written,
 * unscaled, as a float in [0..255] to all four channels.  The low 24 bits
 * are ignored.
 *
 * pipe_tile_raw_to_rgba() selects this routine for
 * PIPE_FORMAT_X24S8_USCALED.
 *
 * \param src         w*h consecutive 32-bit pixels, read row after row
 * \param w, h        tile size in pixels
 * \param p           output, four floats per pixel
 * \param dst_stride  distance between output rows, in floats
 */
static void
s8x24_get_tile_rgba(const unsigned *src,
                    unsigned w, unsigned h,
                    float *p,
                    unsigned dst_stride)
{
   unsigned row, col, chan;

   for (row = 0; row < h; row++, p += dst_stride) {
      float *texel = p;

      for (col = 0; col < w; col++, texel += 4, src++) {
         const float stencil = (float)((*src >> 24) & 0xff);

         for (chan = 0; chan < 4; chan++) {
            texel[chan] = stencil;
         }
      }
   }
}
246
/*** PIPE_FORMAT_S8X24_USCALED ***/

/**
 * Expand the stencil part of packed 32-bit pixels to RGBA floats.
 *
 * Stencil is taken from the low 8 bits of each pixel and written,
 * unscaled, as a float in [0..255] to all four channels.  The high 24
 * bits are ignored.
 *
 * pipe_tile_raw_to_rgba() selects this routine for
 * PIPE_FORMAT_S8X24_USCALED.
 *
 * \param src         w*h consecutive 32-bit pixels, read row after row
 * \param w, h        tile size in pixels
 * \param p           output, four floats per pixel
 * \param dst_stride  distance between output rows, in floats
 */
static void
x24s8_get_tile_rgba(const unsigned *src,
                    unsigned w, unsigned h,
                    float *p,
                    unsigned dst_stride)
{
   unsigned row, col, chan;

   for (row = 0; row < h; row++, p += dst_stride) {
      float *texel = p;

      for (col = 0; col < w; col++, texel += 4, src++) {
         const float stencil = (float)(*src & 0xff);

         for (chan = 0; chan < 4; chan++) {
            texel[chan] = stencil;
         }
      }
   }
}
271
272
/**
 * Expand 8-bit stencil values to RGBA floats.
 *
 * Each source byte is written, unscaled, as a float in [0..255] to all
 * four channels of the corresponding output pixel.
 *
 * \param src         w*h consecutive bytes, read row after row
 * \param w, h        tile size in pixels
 * \param p           output, four floats per pixel
 * \param dst_stride  distance between output rows, in floats
 */
static void
s8_get_tile_rgba(const unsigned char *src,
                 unsigned w, unsigned h,
                 float *p,
                 unsigned dst_stride)
{
   unsigned row, col, chan;

   for (row = 0; row < h; row++, p += dst_stride) {
      float *texel = p;

      for (col = 0; col < w; col++, texel += 4, src++) {
         const float stencil = (float)(*src & 0xff);

         for (chan = 0; chan < 4; chan++) {
            texel[chan] = stencil;
         }
      }
   }
}
295
/*** PIPE_FORMAT_Z32_FLOAT ***/

/**
 * Expand float depth values to RGBA floats.
 *
 * Each source float is copied unchanged (no scaling or clamping is done
 * here) to all four channels of the corresponding output pixel.
 *
 * \param src         w*h consecutive floats, read row after row
 * \param w, h        tile size in pixels
 * \param p           output, four floats per pixel
 * \param dst_stride  distance between output rows, in floats
 */
static void
z32f_get_tile_rgba(const float *src,
                   unsigned w, unsigned h,
                   float *p,
                   unsigned dst_stride)
{
   unsigned row, col, chan;

   for (row = 0; row < h; row++, p += dst_stride) {
      float *texel = p;

      for (col = 0; col < w; col++, texel += 4, src++) {
         const float depth = *src;

         for (chan = 0; chan < 4; chan++) {
            texel[chan] = depth;
         }
      }
   }
}
320
/*** PIPE_FORMAT_Z32_FLOAT_S8X24_USCALED ***/

/**
 * Expand the depth part of float-depth/stencil pixels to RGBA floats.
 *
 * Every pixel occupies two float-sized slots in the source; the first one
 * is copied unchanged to all four output channels and the second one is
 * skipped.
 *
 * \param src         w*h consecutive two-slot pixels, read row after row
 * \param w, h        tile size in pixels
 * \param p           output, four floats per pixel
 * \param dst_stride  distance between output rows, in floats
 */
static void
z32f_x24s8_get_tile_rgba(const float *src,
                         unsigned w, unsigned h,
                         float *p,
                         unsigned dst_stride)
{
   unsigned row, col, chan;

   for (row = 0; row < h; row++, p += dst_stride) {
      float *texel = p;

      for (col = 0; col < w; col++, texel += 4, src += 2) {
         const float depth = *src;

         for (chan = 0; chan < 4; chan++) {
            texel[chan] = depth;
         }
      }
   }
}
346
347
348 void
349 pipe_tile_raw_to_rgba(enum pipe_format format,
350 void *src,
351 uint w, uint h,
352 float *dst, unsigned dst_stride)
353 {
354 switch (format) {
355 case PIPE_FORMAT_Z16_UNORM:
356 z16_get_tile_rgba((ushort *) src, w, h, dst, dst_stride);
357 break;
358 case PIPE_FORMAT_Z32_UNORM:
359 z32_get_tile_rgba((unsigned *) src, w, h, dst, dst_stride);
360 break;
361 case PIPE_FORMAT_Z24_UNORM_S8_USCALED:
362 case PIPE_FORMAT_Z24X8_UNORM:
363 s8z24_get_tile_rgba((unsigned *) src, w, h, dst, dst_stride);
364 break;
365 case PIPE_FORMAT_S8_USCALED:
366 s8_get_tile_rgba((unsigned char *) src, w, h, dst, dst_stride);
367 break;
368 case PIPE_FORMAT_X24S8_USCALED:
369 s8x24_get_tile_rgba((unsigned *) src, w, h, dst, dst_stride);
370 break;
371 case PIPE_FORMAT_S8_USCALED_Z24_UNORM:
372 case PIPE_FORMAT_X8Z24_UNORM:
373 z24s8_get_tile_rgba((unsigned *) src, w, h, dst, dst_stride);
374 break;
375 case PIPE_FORMAT_S8X24_USCALED:
376 x24s8_get_tile_rgba((unsigned *) src, w, h, dst, dst_stride);
377 break;
378 case PIPE_FORMAT_Z32_FLOAT:
379 z32f_get_tile_rgba((float *) src, w, h, dst, dst_stride);
380 break;
381 case PIPE_FORMAT_Z32_FLOAT_S8X24_USCALED:
382 z32f_x24s8_get_tile_rgba((float *) src, w, h, dst, dst_stride);
383 break;
384 default:
385 util_format_read_4f(format,
386 dst, dst_stride * sizeof(float),
387 src, util_format_get_stride(format, w),
388 0, 0, w, h);
389 }
390 }
391
392
393 void
394 pipe_get_tile_rgba(struct pipe_context *pipe,
395 struct pipe_transfer *pt,
396 uint x, uint y, uint w, uint h,
397 float *p)
398 {
399 pipe_get_tile_rgba_format(pipe, pt, x, y, w, h, pt->resource->format, p);
400 }
401
402
403 void
404 pipe_get_tile_rgba_format(struct pipe_context *pipe,
405 struct pipe_transfer *pt,
406 uint x, uint y, uint w, uint h,
407 enum pipe_format format,
408 float *p)
409 {
410 unsigned dst_stride = w * 4;
411 void *packed;
412
413 if (u_clip_tile(x, y, &w, &h, &pt->box)) {
414 return;
415 }
416
417 packed = MALLOC(util_format_get_nblocks(format, w, h) * util_format_get_blocksize(format));
418 if (!packed) {
419 return;
420 }
421
422 if (format == PIPE_FORMAT_UYVY || format == PIPE_FORMAT_YUYV) {
423 assert((x & 1) == 0);
424 }
425
426 pipe_get_tile_raw(pipe, pt, x, y, w, h, packed, 0);
427
428 pipe_tile_raw_to_rgba(format, packed, w, h, p, dst_stride);
429
430 FREE(packed);
431 }
432
433
434 void
435 pipe_put_tile_rgba(struct pipe_context *pipe,
436 struct pipe_transfer *pt,
437 uint x, uint y, uint w, uint h,
438 const float *p)
439 {
440 pipe_put_tile_rgba_format(pipe, pt, x, y, w, h, pt->resource->format, p);
441 }
442
443
444 void
445 pipe_put_tile_rgba_format(struct pipe_context *pipe,
446 struct pipe_transfer *pt,
447 uint x, uint y, uint w, uint h,
448 enum pipe_format format,
449 const float *p)
450 {
451 unsigned src_stride = w * 4;
452 void *packed;
453
454 if (u_clip_tile(x, y, &w, &h, &pt->box))
455 return;
456
457 packed = MALLOC(util_format_get_nblocks(format, w, h) * util_format_get_blocksize(format));
458
459 if (!packed)
460 return;
461
462 switch (format) {
463 case PIPE_FORMAT_Z16_UNORM:
464 /*z16_put_tile_rgba((ushort *) packed, w, h, p, src_stride);*/
465 break;
466 case PIPE_FORMAT_Z32_UNORM:
467 /*z32_put_tile_rgba((unsigned *) packed, w, h, p, src_stride);*/
468 break;
469 case PIPE_FORMAT_Z24_UNORM_S8_USCALED:
470 case PIPE_FORMAT_Z24X8_UNORM:
471 /*s8z24_put_tile_rgba((unsigned *) packed, w, h, p, src_stride);*/
472 break;
473 case PIPE_FORMAT_S8_USCALED_Z24_UNORM:
474 case PIPE_FORMAT_X8Z24_UNORM:
475 /*z24s8_put_tile_rgba((unsigned *) packed, w, h, p, src_stride);*/
476 break;
477 case PIPE_FORMAT_Z32_FLOAT:
478 /*z32f_put_tile_rgba((unsigned *) packed, w, h, p, src_stride);*/
479 break;
480 case PIPE_FORMAT_Z32_FLOAT_S8X24_USCALED:
481 /*z32f_s8x24_put_tile_rgba((unsigned *) packed, w, h, p, src_stride);*/
482 break;
483 default:
484 util_format_write_4f(format,
485 p, src_stride * sizeof(float),
486 packed, util_format_get_stride(format, w),
487 0, 0, w, h);
488 }
489
490 pipe_put_tile_raw(pipe, pt, x, y, w, h, packed, 0);
491
492 FREE(packed);
493 }
494
495
496 /**
497 * Get a block of Z values, converted to 32-bit range.
498 */
499 void
500 pipe_get_tile_z(struct pipe_context *pipe,
501 struct pipe_transfer *pt,
502 uint x, uint y, uint w, uint h,
503 uint *z)
504 {
505 const uint dstStride = w;
506 ubyte *map;
507 uint *pDest = z;
508 uint i, j;
509 enum pipe_format format = pt->resource->format;
510
511 if (u_clip_tile(x, y, &w, &h, &pt->box))
512 return;
513
514 map = (ubyte *)pipe->transfer_map(pipe, pt);
515 if (!map) {
516 assert(0);
517 return;
518 }
519
520 switch (format) {
521 case PIPE_FORMAT_Z32_UNORM:
522 {
523 const uint *ptrc
524 = (const uint *)(map + y * pt->stride + x*4);
525 for (i = 0; i < h; i++) {
526 memcpy(pDest, ptrc, 4 * w);
527 pDest += dstStride;
528 ptrc += pt->stride/4;
529 }
530 }
531 break;
532 case PIPE_FORMAT_Z24_UNORM_S8_USCALED:
533 case PIPE_FORMAT_Z24X8_UNORM:
534 {
535 const uint *ptrc
536 = (const uint *)(map + y * pt->stride + x*4);
537 for (i = 0; i < h; i++) {
538 for (j = 0; j < w; j++) {
539 /* convert 24-bit Z to 32-bit Z */
540 pDest[j] = (ptrc[j] << 8) | ((ptrc[j] >> 16) & 0xff);
541 }
542 pDest += dstStride;
543 ptrc += pt->stride/4;
544 }
545 }
546 break;
547 case PIPE_FORMAT_S8_USCALED_Z24_UNORM:
548 case PIPE_FORMAT_X8Z24_UNORM:
549 {
550 const uint *ptrc
551 = (const uint *)(map + y * pt->stride + x*4);
552 for (i = 0; i < h; i++) {
553 for (j = 0; j < w; j++) {
554 /* convert 24-bit Z to 32-bit Z */
555 pDest[j] = (ptrc[j] & 0xffffff00) | ((ptrc[j] >> 24) & 0xff);
556 }
557 pDest += dstStride;
558 ptrc += pt->stride/4;
559 }
560 }
561 break;
562 case PIPE_FORMAT_Z16_UNORM:
563 {
564 const ushort *ptrc
565 = (const ushort *)(map + y * pt->stride + x*2);
566 for (i = 0; i < h; i++) {
567 for (j = 0; j < w; j++) {
568 /* convert 16-bit Z to 32-bit Z */
569 pDest[j] = (ptrc[j] << 16) | ptrc[j];
570 }
571 pDest += dstStride;
572 ptrc += pt->stride/2;
573 }
574 }
575 break;
576 default:
577 assert(0);
578 }
579
580 pipe->transfer_unmap(pipe, pt);
581 }
582
583
584 void
585 pipe_put_tile_z(struct pipe_context *pipe,
586 struct pipe_transfer *pt,
587 uint x, uint y, uint w, uint h,
588 const uint *zSrc)
589 {
590 const uint srcStride = w;
591 const uint *ptrc = zSrc;
592 ubyte *map;
593 uint i, j;
594 enum pipe_format format = pt->resource->format;
595
596 if (u_clip_tile(x, y, &w, &h, &pt->box))
597 return;
598
599 map = (ubyte *)pipe->transfer_map(pipe, pt);
600 if (!map) {
601 assert(0);
602 return;
603 }
604
605 switch (format) {
606 case PIPE_FORMAT_Z32_UNORM:
607 {
608 uint *pDest = (uint *) (map + y * pt->stride + x*4);
609 for (i = 0; i < h; i++) {
610 memcpy(pDest, ptrc, 4 * w);
611 pDest += pt->stride/4;
612 ptrc += srcStride;
613 }
614 }
615 break;
616 case PIPE_FORMAT_Z24_UNORM_S8_USCALED:
617 {
618 uint *pDest = (uint *) (map + y * pt->stride + x*4);
619 /*assert((pt->usage & PIPE_TRANSFER_READ_WRITE) == PIPE_TRANSFER_READ_WRITE);*/
620 for (i = 0; i < h; i++) {
621 for (j = 0; j < w; j++) {
622 /* convert 32-bit Z to 24-bit Z, preserve stencil */
623 pDest[j] = (pDest[j] & 0xff000000) | ptrc[j] >> 8;
624 }
625 pDest += pt->stride/4;
626 ptrc += srcStride;
627 }
628 }
629 break;
630 case PIPE_FORMAT_Z24X8_UNORM:
631 {
632 uint *pDest = (uint *) (map + y * pt->stride + x*4);
633 for (i = 0; i < h; i++) {
634 for (j = 0; j < w; j++) {
635 /* convert 32-bit Z to 24-bit Z (0 stencil) */
636 pDest[j] = ptrc[j] >> 8;
637 }
638 pDest += pt->stride/4;
639 ptrc += srcStride;
640 }
641 }
642 break;
643 case PIPE_FORMAT_S8_USCALED_Z24_UNORM:
644 {
645 uint *pDest = (uint *) (map + y * pt->stride + x*4);
646 /*assert((pt->usage & PIPE_TRANSFER_READ_WRITE) == PIPE_TRANSFER_READ_WRITE);*/
647 for (i = 0; i < h; i++) {
648 for (j = 0; j < w; j++) {
649 /* convert 32-bit Z to 24-bit Z, preserve stencil */
650 pDest[j] = (pDest[j] & 0xff) | (ptrc[j] & 0xffffff00);
651 }
652 pDest += pt->stride/4;
653 ptrc += srcStride;
654 }
655 }
656 break;
657 case PIPE_FORMAT_X8Z24_UNORM:
658 {
659 uint *pDest = (uint *) (map + y * pt->stride + x*4);
660 for (i = 0; i < h; i++) {
661 for (j = 0; j < w; j++) {
662 /* convert 32-bit Z to 24-bit Z (0 stencil) */
663 pDest[j] = ptrc[j] & 0xffffff00;
664 }
665 pDest += pt->stride/4;
666 ptrc += srcStride;
667 }
668 }
669 break;
670 case PIPE_FORMAT_Z16_UNORM:
671 {
672 ushort *pDest = (ushort *) (map + y * pt->stride + x*2);
673 for (i = 0; i < h; i++) {
674 for (j = 0; j < w; j++) {
675 /* convert 32-bit Z to 16-bit Z */
676 pDest[j] = ptrc[j] >> 16;
677 }
678 pDest += pt->stride/2;
679 ptrc += srcStride;
680 }
681 }
682 break;
683 default:
684 assert(0);
685 }
686
687 pipe->transfer_unmap(pipe, pt);
688 }
689
690