1 /**************************************************************************
3 * Copyright 2007 VMware, Inc.
6 * Permission is hereby granted, free of charge, to any person obtaining a
7 * copy of this software and associated documentation files (the
8 * "Software"), to deal in the Software without restriction, including
9 * without limitation the rights to use, copy, modify, merge, publish,
10 * distribute, sub license, and/or sell copies of the Software, and to
11 * permit persons to whom the Software is furnished to do so, subject to
12 * the following conditions:
14 * The above copyright notice and this permission notice (including the
15 * next paragraph) shall be included in all copies or substantial portions
18 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS
19 * OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF
20 * MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND NON-INFRINGEMENT.
21 * IN NO EVENT SHALL VMWARE AND/OR ITS SUPPLIERS BE LIABLE FOR
22 * ANY CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT,
23 * TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN CONNECTION WITH THE
24 * SOFTWARE OR THE USE OR OTHER DEALINGS IN THE SOFTWARE.
26 **************************************************************************/
33 #include "main/errors.h"
34 #include "main/imports.h"
35 #include "main/image.h"
36 #include "main/bufferobj.h"
37 #include "main/blit.h"
38 #include "main/format_pack.h"
39 #include "main/framebuffer.h"
40 #include "main/macros.h"
41 #include "main/mtypes.h"
42 #include "main/pack.h"
44 #include "main/readpix.h"
45 #include "main/state.h"
46 #include "main/texformat.h"
47 #include "main/teximage.h"
48 #include "main/texstore.h"
49 #include "main/glformats.h"
50 #include "program/program.h"
51 #include "program/prog_print.h"
52 #include "program/prog_instruction.h"
55 #include "st_atom_constbuf.h"
56 #include "st_cb_bitmap.h"
57 #include "st_cb_drawpixels.h"
58 #include "st_cb_readpixels.h"
59 #include "st_cb_fbo.h"
60 #include "st_context.h"
63 #include "st_format.h"
64 #include "st_program.h"
65 #include "st_sampler_view.h"
66 #include "st_scissor.h"
67 #include "st_texture.h"
71 #include "pipe/p_context.h"
72 #include "pipe/p_defines.h"
73 #include "tgsi/tgsi_ureg.h"
74 #include "util/format/u_format.h"
75 #include "util/u_inlines.h"
76 #include "util/u_math.h"
77 #include "util/u_simple_shaders.h"
78 #include "util/u_tile.h"
79 #include "cso_cache/cso_context.h"
81 #include "compiler/nir/nir_builder.h"
84 * We have a simple glDrawPixels cache to try to optimize the case where the
85 * same image is drawn over and over again. It basically works as follows:
87 * 1. After we construct a texture map with the image and draw it, we do
88 * not discard the texture. We keep it around, plus we note the
89 * glDrawPixels width, height, format, etc. parameters and keep a copy
90 * of the image in a malloc'd buffer.
92 * 2. On the next glDrawPixels we check if the parameters match the previous
93 * call. If those match, we check if the image matches the previous image
94 * via a memcmp() call. If everything matches, we re-use the previous
95 * texture, thereby avoiding the cost of creating a new texture and copying
98 * The effectiveness of this cache depends upon:
99 * 1. If the memcmp() finds a difference, it happens relatively quickly.
100 * Hopefully, not just the last pixels differ!
101 * 2. If the memcmp() finds no difference, doing that check is faster than
102 * creating and loading a texture.
105 * 1. We don't support any pixel unpacking parameters.
106 * 2. We don't try to cache images in Pixel Buffer Objects.
107 * 3. Instead of saving the whole image, perhaps some sort of reliable
108 * checksum function could be used instead.
110 #define USE_DRAWPIXELS_CACHE 1
113 sample_via_nir(nir_builder
*b
, nir_variable
*texcoord
,
114 const char *name
, int sampler
, enum glsl_base_type base_type
,
115 nir_alu_type alu_type
)
117 const struct glsl_type
*sampler2D
=
118 glsl_sampler_type(GLSL_SAMPLER_DIM_2D
, false, false, base_type
);
121 nir_variable_create(b
->shader
, nir_var_uniform
, sampler2D
, name
);
122 var
->data
.binding
= sampler
;
123 var
->data
.explicit_binding
= true;
125 nir_deref_instr
*deref
= nir_build_deref_var(b
, var
);
127 nir_tex_instr
*tex
= nir_tex_instr_create(b
->shader
, 3);
128 tex
->op
= nir_texop_tex
;
129 tex
->sampler_dim
= GLSL_SAMPLER_DIM_2D
;
130 tex
->coord_components
= 2;
131 tex
->dest_type
= alu_type
;
132 tex
->src
[0].src_type
= nir_tex_src_texture_deref
;
133 tex
->src
[0].src
= nir_src_for_ssa(&deref
->dest
.ssa
);
134 tex
->src
[1].src_type
= nir_tex_src_sampler_deref
;
135 tex
->src
[1].src
= nir_src_for_ssa(&deref
->dest
.ssa
);
136 tex
->src
[2].src_type
= nir_tex_src_coord
;
138 nir_src_for_ssa(nir_channels(b
, nir_load_var(b
, texcoord
),
139 (1 << tex
->coord_components
) - 1));
141 nir_ssa_dest_init(&tex
->instr
, &tex
->dest
, 4, 32, NULL
);
142 nir_builder_instr_insert(b
, &tex
->instr
);
143 return nir_channel(b
, &tex
->dest
.ssa
, 0);
147 make_drawpix_z_stencil_program_nir(struct st_context
*st
,
151 struct nir_builder b
;
152 const nir_shader_compiler_options
*options
=
153 st
->ctx
->Const
.ShaderCompilerOptions
[MESA_SHADER_FRAGMENT
].NirOptions
;
155 nir_builder_init_simple_shader(&b
, NULL
, MESA_SHADER_FRAGMENT
, options
);
157 nir_variable
*texcoord
=
158 nir_variable_create(b
.shader
, nir_var_shader_in
, glsl_vec_type(2),
160 texcoord
->data
.location
= VARYING_SLOT_TEX0
;
164 nir_variable_create(b
.shader
, nir_var_shader_out
, glsl_float_type(),
166 out
->data
.location
= FRAG_RESULT_DEPTH
;
167 nir_ssa_def
*depth
= sample_via_nir(&b
, texcoord
, "depth", 0,
168 GLSL_TYPE_FLOAT
, nir_type_float
);
169 nir_store_var(&b
, out
, depth
, 0x1);
171 /* Also copy color */
172 nir_variable
*color_in
=
173 nir_variable_create(b
.shader
, nir_var_shader_in
, glsl_vec_type(4),
175 color_in
->data
.location
= VARYING_SLOT_COL0
;
177 nir_variable
*color_out
=
178 nir_variable_create(b
.shader
, nir_var_shader_out
, glsl_vec_type(4),
180 color_out
->data
.location
= FRAG_RESULT_COLOR
;
181 nir_copy_var(&b
, color_out
, color_in
);
186 nir_variable_create(b
.shader
, nir_var_shader_out
, glsl_uint_type(),
187 "gl_FragStencilRefARB");
188 out
->data
.location
= FRAG_RESULT_STENCIL
;
189 nir_ssa_def
*stencil
= sample_via_nir(&b
, texcoord
, "stencil", 1,
190 GLSL_TYPE_UINT
, nir_type_uint
);
191 nir_store_var(&b
, out
, stencil
, 0x1);
195 snprintf(name
, 14, "drawpixels %s%s",
196 write_depth
? "Z" : "", write_stencil
? "S" : "");
198 return st_nir_finish_builtin_shader(st
, b
.shader
, name
);
203 make_drawpix_z_stencil_program_tgsi(struct st_context
*st
,
207 struct ureg_program
*ureg
;
208 struct ureg_src depth_sampler
, stencil_sampler
;
209 struct ureg_src texcoord
, color
;
210 struct ureg_dst out_color
, out_depth
, out_stencil
;
212 ureg
= ureg_create(PIPE_SHADER_FRAGMENT
);
216 ureg_property(ureg
, TGSI_PROPERTY_FS_COLOR0_WRITES_ALL_CBUFS
, TRUE
);
219 color
= ureg_DECL_fs_input(ureg
, TGSI_SEMANTIC_COLOR
, 0,
220 TGSI_INTERPOLATE_COLOR
);
221 out_color
= ureg_DECL_output(ureg
, TGSI_SEMANTIC_COLOR
, 0);
223 depth_sampler
= ureg_DECL_sampler(ureg
, 0);
224 ureg_DECL_sampler_view(ureg
, 0, TGSI_TEXTURE_2D
,
225 TGSI_RETURN_TYPE_FLOAT
,
226 TGSI_RETURN_TYPE_FLOAT
,
227 TGSI_RETURN_TYPE_FLOAT
,
228 TGSI_RETURN_TYPE_FLOAT
);
229 out_depth
= ureg_DECL_output(ureg
, TGSI_SEMANTIC_POSITION
, 0);
233 stencil_sampler
= ureg_DECL_sampler(ureg
, 1);
234 ureg_DECL_sampler_view(ureg
, 1, TGSI_TEXTURE_2D
,
235 TGSI_RETURN_TYPE_UINT
,
236 TGSI_RETURN_TYPE_UINT
,
237 TGSI_RETURN_TYPE_UINT
,
238 TGSI_RETURN_TYPE_UINT
);
239 out_stencil
= ureg_DECL_output(ureg
, TGSI_SEMANTIC_STENCIL
, 0);
242 texcoord
= ureg_DECL_fs_input(ureg
,
243 st
->needs_texcoord_semantic
?
244 TGSI_SEMANTIC_TEXCOORD
:
245 TGSI_SEMANTIC_GENERIC
,
246 0, TGSI_INTERPOLATE_LINEAR
);
249 ureg_TEX(ureg
, ureg_writemask(out_depth
, TGSI_WRITEMASK_Z
),
250 TGSI_TEXTURE_2D
, texcoord
, depth_sampler
);
251 ureg_MOV(ureg
, out_color
, color
);
255 ureg_TEX(ureg
, ureg_writemask(out_stencil
, TGSI_WRITEMASK_Y
),
256 TGSI_TEXTURE_2D
, texcoord
, stencil_sampler
);
259 return ureg_create_shader_and_destroy(ureg
, st
->pipe
);
264 * Create fragment program that does a TEX() instruction to get a Z and/or
265 * stencil value, then writes to FRAG_RESULT_DEPTH/FRAG_RESULT_STENCIL.
266 * Used for glDrawPixels(GL_DEPTH_COMPONENT / GL_STENCIL_INDEX).
267 * Pass fragment color through as-is.
269 * \return CSO of the fragment shader.
272 get_drawpix_z_stencil_program(struct st_context
*st
,
276 struct pipe_screen
*pscreen
= st
->pipe
->screen
;
277 const GLuint shaderIndex
= write_depth
* 2 + write_stencil
;
280 assert(shaderIndex
< ARRAY_SIZE(st
->drawpix
.zs_shaders
));
282 if (st
->drawpix
.zs_shaders
[shaderIndex
]) {
283 /* already have the proper shader */
284 return st
->drawpix
.zs_shaders
[shaderIndex
];
287 enum pipe_shader_ir preferred_ir
=
288 pscreen
->get_shader_param(pscreen
, PIPE_SHADER_FRAGMENT
,
289 PIPE_SHADER_CAP_PREFERRED_IR
);
291 if (preferred_ir
== PIPE_SHADER_IR_NIR
)
292 cso
= make_drawpix_z_stencil_program_nir(st
, write_depth
, write_stencil
);
294 cso
= make_drawpix_z_stencil_program_tgsi(st
, write_depth
, write_stencil
);
296 /* save the new shader */
297 st
->drawpix
.zs_shaders
[shaderIndex
] = cso
;
303 * Create a simple vertex shader that just passes through the
304 * vertex position, texcoord, and color.
307 st_make_passthrough_vertex_shader(struct st_context
*st
)
309 struct pipe_context
*pipe
= st
->pipe
;
310 struct pipe_screen
*screen
= pipe
->screen
;
312 if (st
->passthrough_vs
)
315 enum pipe_shader_ir preferred_ir
=
316 screen
->get_shader_param(screen
, PIPE_SHADER_VERTEX
,
317 PIPE_SHADER_CAP_PREFERRED_IR
);
319 if (preferred_ir
== PIPE_SHADER_IR_NIR
) {
321 { VERT_ATTRIB_POS
, VERT_ATTRIB_COLOR0
, VERT_ATTRIB_GENERIC0
};
323 { VARYING_SLOT_POS
, VARYING_SLOT_COL0
, VARYING_SLOT_TEX0
};
326 st_nir_make_passthrough_shader(st
, "drawpixels VS",
327 MESA_SHADER_VERTEX
, 3,
328 inputs
, outputs
, NULL
, 0);
330 const enum tgsi_semantic semantic_names
[] = {
331 TGSI_SEMANTIC_POSITION
,
333 st
->needs_texcoord_semantic
? TGSI_SEMANTIC_TEXCOORD
:
334 TGSI_SEMANTIC_GENERIC
336 const uint semantic_indexes
[] = { 0, 0, 0 };
339 util_make_vertex_passthrough_shader(st
->pipe
, 3, semantic_names
,
340 semantic_indexes
, false);
346 * Return a texture internalFormat for drawing/copying an image
347 * of the given format and type.
350 internal_format(struct gl_context
*ctx
, GLenum format
, GLenum type
)
353 case GL_DEPTH_COMPONENT
:
355 case GL_UNSIGNED_SHORT
:
356 return GL_DEPTH_COMPONENT16
;
358 case GL_UNSIGNED_INT
:
359 return GL_DEPTH_COMPONENT32
;
362 if (ctx
->Extensions
.ARB_depth_buffer_float
)
363 return GL_DEPTH_COMPONENT32F
;
365 return GL_DEPTH_COMPONENT
;
368 return GL_DEPTH_COMPONENT
;
371 case GL_DEPTH_STENCIL
:
373 case GL_FLOAT_32_UNSIGNED_INT_24_8_REV
:
374 return GL_DEPTH32F_STENCIL8
;
376 case GL_UNSIGNED_INT_24_8
:
378 return GL_DEPTH24_STENCIL8
;
381 case GL_STENCIL_INDEX
:
382 return GL_STENCIL_INDEX
;
385 if (_mesa_is_enum_format_integer(format
)) {
389 case GL_UNSIGNED_BYTE
:
393 case GL_UNSIGNED_SHORT
:
397 case GL_UNSIGNED_INT
:
400 assert(0 && "Unexpected type in internal_format()");
401 return GL_RGBA_INTEGER
;
406 case GL_UNSIGNED_BYTE
:
407 case GL_UNSIGNED_INT_8_8_8_8
:
408 case GL_UNSIGNED_INT_8_8_8_8_REV
:
412 case GL_UNSIGNED_BYTE_3_3_2
:
413 case GL_UNSIGNED_BYTE_2_3_3_REV
:
416 case GL_UNSIGNED_SHORT_4_4_4_4
:
417 case GL_UNSIGNED_SHORT_4_4_4_4_REV
:
420 case GL_UNSIGNED_SHORT_5_6_5
:
421 case GL_UNSIGNED_SHORT_5_6_5_REV
:
424 case GL_UNSIGNED_SHORT_5_5_5_1
:
425 case GL_UNSIGNED_SHORT_1_5_5_5_REV
:
428 case GL_UNSIGNED_INT_10_10_10_2
:
429 case GL_UNSIGNED_INT_2_10_10_10_REV
:
432 case GL_UNSIGNED_SHORT
:
433 case GL_UNSIGNED_INT
:
438 ctx
->Extensions
.EXT_texture_snorm
? GL_RGBA8_SNORM
: GL_RGBA8
;
443 ctx
->Extensions
.EXT_texture_snorm
? GL_RGBA16_SNORM
: GL_RGBA16
;
445 case GL_HALF_FLOAT_ARB
:
447 ctx
->Extensions
.ARB_texture_float
? GL_RGBA16F
:
448 ctx
->Extensions
.EXT_texture_snorm
? GL_RGBA16_SNORM
: GL_RGBA16
;
453 ctx
->Extensions
.ARB_texture_float
? GL_RGBA32F
:
454 ctx
->Extensions
.EXT_texture_snorm
? GL_RGBA16_SNORM
: GL_RGBA16
;
456 case GL_UNSIGNED_INT_5_9_9_9_REV
:
457 assert(ctx
->Extensions
.EXT_texture_shared_exponent
);
460 case GL_UNSIGNED_INT_10F_11F_11F_REV
:
461 assert(ctx
->Extensions
.EXT_packed_float
);
462 return GL_R11F_G11F_B10F
;
470 * Create a temporary texture to hold an image of the given size.
471 * If width, height are not POT and the driver only handles POT textures,
472 * allocate the next larger size of texture that is POT.
474 static struct pipe_resource
*
475 alloc_texture(struct st_context
*st
, GLsizei width
, GLsizei height
,
476 enum pipe_format texFormat
, unsigned bind
)
478 struct pipe_resource
*pt
;
480 pt
= st_texture_create(st
, st
->internal_target
, texFormat
, 0,
481 width
, height
, 1, 1, 0, bind
);
488 * Search the cache for an image which matches the given parameters.
489 * \return pipe_resource pointer if found, NULL if not found.
491 static struct pipe_resource
*
492 search_drawpixels_cache(struct st_context
*st
,
493 GLsizei width
, GLsizei height
,
494 GLenum format
, GLenum type
,
495 const struct gl_pixelstore_attrib
*unpack
,
498 struct pipe_resource
*pt
= NULL
;
499 const GLint bpp
= _mesa_bytes_per_pixel(format
, type
);
502 if ((unpack
->RowLength
!= 0 && unpack
->RowLength
!= width
) ||
503 unpack
->SkipPixels
!= 0 ||
504 unpack
->SkipRows
!= 0 ||
506 _mesa_is_bufferobj(unpack
->BufferObj
)) {
507 /* we don't allow non-default pixel unpacking values */
511 /* Search cache entries for a match */
512 for (i
= 0; i
< ARRAY_SIZE(st
->drawpix_cache
.entries
); i
++) {
513 struct drawpix_cache_entry
*entry
= &st
->drawpix_cache
.entries
[i
];
515 if (width
== entry
->width
&&
516 height
== entry
->height
&&
517 format
== entry
->format
&&
518 type
== entry
->type
&&
519 pixels
== entry
->user_pointer
&&
521 assert(entry
->texture
);
523 /* check if the pixel data is the same */
524 if (memcmp(pixels
, entry
->image
, width
* height
* bpp
) == 0) {
525 /* Success - found a cache match */
526 pipe_resource_reference(&pt
, entry
->texture
);
527 /* refcount of returned texture should be at least two here. One
528 * reference for the cache to hold on to, one for the caller (which
529 * it will release), and possibly more held by the driver.
531 assert(pt
->reference
.count
>= 2);
533 /* update the age of this entry */
534 entry
->age
= ++st
->drawpix_cache
.age
;
541 /* no cache match found */
547 * Find the oldest entry in the glDrawPixels cache. We'll replace this
548 * one when we need to store a new image.
550 static struct drawpix_cache_entry
*
551 find_oldest_drawpixels_cache_entry(struct st_context
*st
)
553 unsigned oldest_age
= ~0u, oldest_index
= ~0u;
556 /* Find entry with oldest (lowest) age */
557 for (i
= 0; i
< ARRAY_SIZE(st
->drawpix_cache
.entries
); i
++) {
558 const struct drawpix_cache_entry
*entry
= &st
->drawpix_cache
.entries
[i
];
559 if (entry
->age
< oldest_age
) {
560 oldest_age
= entry
->age
;
565 assert(oldest_index
!= ~0u);
567 return &st
->drawpix_cache
.entries
[oldest_index
];
572 * Try to save the given glDrawPixels image in the cache.
575 cache_drawpixels_image(struct st_context
*st
,
576 GLsizei width
, GLsizei height
,
577 GLenum format
, GLenum type
,
578 const struct gl_pixelstore_attrib
*unpack
,
580 struct pipe_resource
*pt
)
582 if ((unpack
->RowLength
== 0 || unpack
->RowLength
== width
) &&
583 unpack
->SkipPixels
== 0 &&
584 unpack
->SkipRows
== 0) {
585 const GLint bpp
= _mesa_bytes_per_pixel(format
, type
);
586 struct drawpix_cache_entry
*entry
=
587 find_oldest_drawpixels_cache_entry(st
);
589 entry
->width
= width
;
590 entry
->height
= height
;
591 entry
->format
= format
;
593 entry
->user_pointer
= pixels
;
595 entry
->image
= malloc(width
* height
* bpp
);
597 memcpy(entry
->image
, pixels
, width
* height
* bpp
);
598 pipe_resource_reference(&entry
->texture
, pt
);
599 entry
->age
= ++st
->drawpix_cache
.age
;
602 /* out of memory, free/disable cached texture */
605 pipe_resource_reference(&entry
->texture
, NULL
);
612 * Make a texture containing the image for a glDrawPixels call.
613 * If 'pixels' is NULL, leave the texture image data undefined.
615 static struct pipe_resource
*
616 make_texture(struct st_context
*st
,
617 GLsizei width
, GLsizei height
, GLenum format
, GLenum type
,
618 const struct gl_pixelstore_attrib
*unpack
,
621 struct gl_context
*ctx
= st
->ctx
;
622 struct pipe_context
*pipe
= st
->pipe
;
624 struct pipe_resource
*pt
= NULL
;
625 enum pipe_format pipeFormat
;
626 GLenum baseInternalFormat
;
628 #if USE_DRAWPIXELS_CACHE
629 pt
= search_drawpixels_cache(st
, width
, height
, format
, type
,
636 /* Choose a pixel format for the temp texture which will hold the
639 pipeFormat
= st_choose_matching_format(st
, PIPE_BIND_SAMPLER_VIEW
,
640 format
, type
, unpack
->SwapBytes
);
642 if (pipeFormat
== PIPE_FORMAT_NONE
) {
643 /* Use the generic approach. */
644 GLenum intFormat
= internal_format(ctx
, format
, type
);
646 pipeFormat
= st_choose_format(st
, intFormat
, format
, type
,
647 st
->internal_target
, 0, 0,
648 PIPE_BIND_SAMPLER_VIEW
,
650 assert(pipeFormat
!= PIPE_FORMAT_NONE
);
653 mformat
= st_pipe_format_to_mesa_format(pipeFormat
);
654 baseInternalFormat
= _mesa_get_format_base_format(mformat
);
656 pixels
= _mesa_map_pbo_source(ctx
, unpack
, pixels
);
660 /* alloc temporary texture */
661 pt
= alloc_texture(st
, width
, height
, pipeFormat
, PIPE_BIND_SAMPLER_VIEW
);
663 _mesa_unmap_pbo_source(ctx
, unpack
);
668 struct pipe_transfer
*transfer
;
670 const GLbitfield imageTransferStateSave
= ctx
->_ImageTransferState
;
672 /* we'll do pixel transfer in a fragment shader */
673 ctx
->_ImageTransferState
= 0x0;
675 /* map texture transfer */
676 dest
= pipe_transfer_map(pipe
, pt
, 0, 0,
677 PIPE_TRANSFER_WRITE
, 0, 0,
678 width
, height
, &transfer
);
680 pipe_resource_reference(&pt
, NULL
);
681 _mesa_unmap_pbo_source(ctx
, unpack
);
685 /* Put image into texture transfer.
686 * Note that the image is actually going to be upside down in
687 * the texture. We deal with that with texcoords.
689 if ((format
== GL_RGBA
|| format
== GL_BGRA
)
690 && type
== GL_UNSIGNED_BYTE
) {
691 /* Use a memcpy-based texstore to avoid software pixel swizzling.
692 * We'll do the necessary swizzling with the pipe_sampler_view to
693 * give much better performance.
694 * XXX in the future, expand this to accommodate more format and
697 _mesa_memcpy_texture(ctx
, 2,
698 mformat
, /* mesa_format */
699 transfer
->stride
, /* dstRowStride, bytes */
700 &dest
, /* destSlices */
701 width
, height
, 1, /* size */
702 format
, type
, /* src format/type */
703 pixels
, /* data source */
707 ASSERTED
bool success
;
708 success
= _mesa_texstore(ctx
, 2, /* dims */
709 baseInternalFormat
, /* baseInternalFormat */
710 mformat
, /* mesa_format */
711 transfer
->stride
, /* dstRowStride, bytes */
712 &dest
, /* destSlices */
713 width
, height
, 1, /* size */
714 format
, type
, /* src format/type */
715 pixels
, /* data source */
722 pipe_transfer_unmap(pipe
, transfer
);
725 ctx
->_ImageTransferState
= imageTransferStateSave
;
728 #if USE_DRAWPIXELS_CACHE
729 cache_drawpixels_image(st
, width
, height
, format
, type
, unpack
, pixels
, pt
);
732 _mesa_unmap_pbo_source(ctx
, unpack
);
739 draw_textured_quad(struct gl_context
*ctx
, GLint x
, GLint y
, GLfloat z
,
740 GLsizei width
, GLsizei height
,
741 GLfloat zoomX
, GLfloat zoomY
,
742 struct pipe_sampler_view
**sv
,
743 int num_sampler_view
,
746 struct st_fp_variant
*fpv
,
747 const GLfloat
*color
,
749 GLboolean write_depth
, GLboolean write_stencil
)
751 struct st_context
*st
= st_context(ctx
);
752 struct pipe_context
*pipe
= st
->pipe
;
753 struct cso_context
*cso
= st
->cso_context
;
754 const unsigned fb_width
= _mesa_geometric_width(ctx
->DrawBuffer
);
755 const unsigned fb_height
= _mesa_geometric_height(ctx
->DrawBuffer
);
756 GLfloat x0
, y0
, x1
, y1
;
757 ASSERTED GLsizei maxSize
;
758 boolean normalized
= sv
[0]->texture
->target
== PIPE_TEXTURE_2D
;
759 unsigned cso_state_mask
;
761 assert(sv
[0]->texture
->target
== st
->internal_target
);
764 /* XXX if DrawPixels image is larger than max texture size, break
767 maxSize
= pipe
->screen
->get_param(pipe
->screen
,
768 PIPE_CAP_MAX_TEXTURE_2D_SIZE
);
769 assert(width
<= maxSize
);
770 assert(height
<= maxSize
);
772 cso_state_mask
= (CSO_BIT_RASTERIZER
|
774 CSO_BIT_FRAGMENT_SAMPLERS
|
775 CSO_BIT_FRAGMENT_SAMPLER_VIEWS
|
776 CSO_BIT_STREAM_OUTPUTS
|
777 CSO_BIT_VERTEX_ELEMENTS
|
778 CSO_BIT_AUX_VERTEX_BUFFER_SLOT
|
779 CSO_BITS_ALL_SHADERS
);
781 cso_state_mask
|= (CSO_BIT_DEPTH_STENCIL_ALPHA
|
784 cso_save_state(cso
, cso_state_mask
);
786 /* rasterizer state: just scissor */
788 struct pipe_rasterizer_state rasterizer
;
789 memset(&rasterizer
, 0, sizeof(rasterizer
));
790 rasterizer
.clamp_fragment_color
= !st
->clamp_frag_color_in_shader
&&
791 ctx
->Color
._ClampFragmentColor
;
792 rasterizer
.half_pixel_center
= 1;
793 rasterizer
.bottom_edge_rule
= 1;
794 rasterizer
.depth_clip_near
= st
->clamp_frag_depth_in_shader
||
795 !ctx
->Transform
.DepthClampNear
;
796 rasterizer
.depth_clip_far
= st
->clamp_frag_depth_in_shader
||
797 !ctx
->Transform
.DepthClampFar
;
798 rasterizer
.scissor
= ctx
->Scissor
.EnableFlags
;
799 cso_set_rasterizer(cso
, &rasterizer
);
803 /* Stencil writing bypasses the normal fragment pipeline to
804 * disable color writing and set stencil test to always pass.
806 struct pipe_depth_stencil_alpha_state dsa
;
807 struct pipe_blend_state blend
;
810 memset(&dsa
, 0, sizeof(dsa
));
811 dsa
.stencil
[0].enabled
= 1;
812 dsa
.stencil
[0].func
= PIPE_FUNC_ALWAYS
;
813 dsa
.stencil
[0].writemask
= ctx
->Stencil
.WriteMask
[0] & 0xff;
814 dsa
.stencil
[0].zpass_op
= PIPE_STENCIL_OP_REPLACE
;
816 /* writing depth+stencil: depth test always passes */
817 dsa
.depth
.enabled
= 1;
818 dsa
.depth
.writemask
= ctx
->Depth
.Mask
;
819 dsa
.depth
.func
= PIPE_FUNC_ALWAYS
;
821 cso_set_depth_stencil_alpha(cso
, &dsa
);
823 /* blend (colormask) */
824 memset(&blend
, 0, sizeof(blend
));
825 cso_set_blend(cso
, &blend
);
828 /* fragment shader state: TEX lookup program */
829 cso_set_fragment_shader_handle(cso
, driver_fp
);
831 /* vertex shader state: position + texcoord pass-through */
832 cso_set_vertex_shader_handle(cso
, driver_vp
);
834 /* disable other shaders */
835 cso_set_tessctrl_shader_handle(cso
, NULL
);
836 cso_set_tesseval_shader_handle(cso
, NULL
);
837 cso_set_geometry_shader_handle(cso
, NULL
);
839 /* user samplers, plus the drawpix samplers */
841 struct pipe_sampler_state sampler
;
843 memset(&sampler
, 0, sizeof(sampler
));
844 sampler
.wrap_s
= PIPE_TEX_WRAP_CLAMP
;
845 sampler
.wrap_t
= PIPE_TEX_WRAP_CLAMP
;
846 sampler
.wrap_r
= PIPE_TEX_WRAP_CLAMP
;
847 sampler
.min_img_filter
= PIPE_TEX_FILTER_NEAREST
;
848 sampler
.min_mip_filter
= PIPE_TEX_MIPFILTER_NONE
;
849 sampler
.mag_img_filter
= PIPE_TEX_FILTER_NEAREST
;
850 sampler
.normalized_coords
= normalized
;
853 /* drawing a color image */
854 const struct pipe_sampler_state
*samplers
[PIPE_MAX_SAMPLERS
];
855 uint num
= MAX3(fpv
->drawpix_sampler
+ 1,
856 fpv
->pixelmap_sampler
+ 1,
857 st
->state
.num_frag_samplers
);
860 for (i
= 0; i
< st
->state
.num_frag_samplers
; i
++)
861 samplers
[i
] = &st
->state
.frag_samplers
[i
];
863 samplers
[fpv
->drawpix_sampler
] = &sampler
;
865 samplers
[fpv
->pixelmap_sampler
] = &sampler
;
867 cso_set_samplers(cso
, PIPE_SHADER_FRAGMENT
, num
, samplers
);
869 /* drawing a depth/stencil image */
870 const struct pipe_sampler_state
*samplers
[2] = {&sampler
, &sampler
};
872 cso_set_samplers(cso
, PIPE_SHADER_FRAGMENT
, num_sampler_view
, samplers
);
876 /* user textures, plus the drawpix textures */
878 /* drawing a color image */
879 struct pipe_sampler_view
*sampler_views
[PIPE_MAX_SAMPLERS
];
880 uint num
= MAX3(fpv
->drawpix_sampler
+ 1,
881 fpv
->pixelmap_sampler
+ 1,
882 st
->state
.num_sampler_views
[PIPE_SHADER_FRAGMENT
]);
884 memcpy(sampler_views
, st
->state
.frag_sampler_views
,
885 sizeof(sampler_views
));
887 sampler_views
[fpv
->drawpix_sampler
] = sv
[0];
889 sampler_views
[fpv
->pixelmap_sampler
] = sv
[1];
890 cso_set_sampler_views(cso
, PIPE_SHADER_FRAGMENT
, num
, sampler_views
);
892 /* drawing a depth/stencil image */
893 cso_set_sampler_views(cso
, PIPE_SHADER_FRAGMENT
, num_sampler_view
, sv
);
896 /* viewport state: viewport matching window dims */
897 cso_set_viewport_dims(cso
, fb_width
, fb_height
, TRUE
);
899 cso_set_vertex_elements(cso
, 3, st
->util_velems
);
900 cso_set_stream_outputs(cso
, 0, NULL
, NULL
);
902 /* Compute Gallium window coords (y=0=top) with pixel zoom.
903 * Recall that these coords are transformed by the current
904 * vertex shader and viewport transformation.
906 if (st_fb_orientation(ctx
->DrawBuffer
) == Y_0_BOTTOM
) {
907 y
= fb_height
- (int) (y
+ height
* ctx
->Pixel
.ZoomY
);
908 invertTex
= !invertTex
;
912 x1
= x
+ width
* ctx
->Pixel
.ZoomX
;
914 y1
= y
+ height
* ctx
->Pixel
.ZoomY
;
916 /* convert Z from [0,1] to [-1,1] to match viewport Z scale/bias */
920 const float clip_x0
= x0
/ (float) fb_width
* 2.0f
- 1.0f
;
921 const float clip_y0
= y0
/ (float) fb_height
* 2.0f
- 1.0f
;
922 const float clip_x1
= x1
/ (float) fb_width
* 2.0f
- 1.0f
;
923 const float clip_y1
= y1
/ (float) fb_height
* 2.0f
- 1.0f
;
924 const float maxXcoord
= normalized
?
925 ((float) width
/ sv
[0]->texture
->width0
) : (float) width
;
926 const float maxYcoord
= normalized
927 ? ((float) height
/ sv
[0]->texture
->height0
) : (float) height
;
928 const float sLeft
= 0.0f
, sRight
= maxXcoord
;
929 const float tTop
= invertTex
? maxYcoord
: 0.0f
;
930 const float tBot
= invertTex
? 0.0f
: maxYcoord
;
932 if (!st_draw_quad(st
, clip_x0
, clip_y0
, clip_x1
, clip_y1
, z
,
933 sLeft
, tBot
, sRight
, tTop
, color
, 0)) {
934 _mesa_error(ctx
, GL_OUT_OF_MEMORY
, "glDrawPixels");
939 cso_restore_state(cso
);
944 * Software fallback to do glDrawPixels(GL_STENCIL_INDEX) when we
945 * can't use a fragment shader to write stencil values.
948 draw_stencil_pixels(struct gl_context
*ctx
, GLint x
, GLint y
,
949 GLsizei width
, GLsizei height
, GLenum format
, GLenum type
,
950 const struct gl_pixelstore_attrib
*unpack
,
953 struct st_context
*st
= st_context(ctx
);
954 struct pipe_context
*pipe
= st
->pipe
;
955 struct st_renderbuffer
*strb
;
956 enum pipe_transfer_usage usage
;
957 struct pipe_transfer
*pt
;
958 const GLboolean zoom
= ctx
->Pixel
.ZoomX
!= 1.0 || ctx
->Pixel
.ZoomY
!= 1.0;
960 struct gl_pixelstore_attrib clippedUnpack
= *unpack
;
965 if (!_mesa_clip_drawpixels(ctx
, &x
, &y
, &width
, &height
,
967 /* totally clipped */
972 strb
= st_renderbuffer(ctx
->DrawBuffer
->
973 Attachment
[BUFFER_STENCIL
].Renderbuffer
);
975 if (st_fb_orientation(ctx
->DrawBuffer
) == Y_0_TOP
) {
976 y
= ctx
->DrawBuffer
->Height
- y
- height
;
979 if (format
== GL_STENCIL_INDEX
&&
980 _mesa_is_format_packed_depth_stencil(strb
->Base
.Format
)) {
981 /* writing stencil to a combined depth+stencil buffer */
982 usage
= PIPE_TRANSFER_READ_WRITE
;
985 usage
= PIPE_TRANSFER_WRITE
;
988 stmap
= pipe_transfer_map(pipe
, strb
->texture
,
989 strb
->surface
->u
.tex
.level
,
990 strb
->surface
->u
.tex
.first_layer
,
994 pixels
= _mesa_map_pbo_source(ctx
, &clippedUnpack
, pixels
);
997 sValues
= malloc(width
* sizeof(GLubyte
));
998 zValues
= malloc(width
* sizeof(GLuint
));
1000 if (sValues
&& zValues
) {
1002 for (row
= 0; row
< height
; row
++) {
1003 GLfloat
*zValuesFloat
= (GLfloat
*)zValues
;
1004 GLenum destType
= GL_UNSIGNED_BYTE
;
1005 const void *source
= _mesa_image_address2d(&clippedUnpack
, pixels
,
1009 _mesa_unpack_stencil_span(ctx
, width
, destType
, sValues
,
1010 type
, source
, &clippedUnpack
,
1011 ctx
->_ImageTransferState
);
1013 if (format
== GL_DEPTH_STENCIL
) {
1015 pt
->resource
->format
== PIPE_FORMAT_Z32_FLOAT_S8X24_UINT
?
1016 GL_FLOAT
: GL_UNSIGNED_INT
;
1018 _mesa_unpack_depth_span(ctx
, width
, ztype
, zValues
,
1019 (1 << 24) - 1, type
, source
,
1024 _mesa_problem(ctx
, "Gallium glDrawPixels(GL_STENCIL) with "
1025 "zoom not complete");
1031 if (st_fb_orientation(ctx
->DrawBuffer
) == Y_0_TOP
) {
1032 spanY
= height
- row
- 1;
1038 /* now pack the stencil (and Z) values in the dest format */
1039 switch (pt
->resource
->format
) {
1040 case PIPE_FORMAT_S8_UINT
:
1042 ubyte
*dest
= stmap
+ spanY
* pt
->stride
;
1043 assert(usage
== PIPE_TRANSFER_WRITE
);
1044 memcpy(dest
, sValues
, width
);
1047 case PIPE_FORMAT_Z24_UNORM_S8_UINT
:
1048 if (format
== GL_DEPTH_STENCIL
) {
1049 uint
*dest
= (uint
*) (stmap
+ spanY
* pt
->stride
);
1051 assert(usage
== PIPE_TRANSFER_WRITE
);
1052 for (k
= 0; k
< width
; k
++) {
1053 dest
[k
] = zValues
[k
] | (sValues
[k
] << 24);
1057 uint
*dest
= (uint
*) (stmap
+ spanY
* pt
->stride
);
1059 assert(usage
== PIPE_TRANSFER_READ_WRITE
);
1060 for (k
= 0; k
< width
; k
++) {
1061 dest
[k
] = (dest
[k
] & 0xffffff) | (sValues
[k
] << 24);
1065 case PIPE_FORMAT_S8_UINT_Z24_UNORM
:
1066 if (format
== GL_DEPTH_STENCIL
) {
1067 uint
*dest
= (uint
*) (stmap
+ spanY
* pt
->stride
);
1069 assert(usage
== PIPE_TRANSFER_WRITE
);
1070 for (k
= 0; k
< width
; k
++) {
1071 dest
[k
] = (zValues
[k
] << 8) | (sValues
[k
] & 0xff);
1075 uint
*dest
= (uint
*) (stmap
+ spanY
* pt
->stride
);
1077 assert(usage
== PIPE_TRANSFER_READ_WRITE
);
1078 for (k
= 0; k
< width
; k
++) {
1079 dest
[k
] = (dest
[k
] & 0xffffff00) | (sValues
[k
] & 0xff);
1083 case PIPE_FORMAT_Z32_FLOAT_S8X24_UINT
:
1084 if (format
== GL_DEPTH_STENCIL
) {
1085 uint
*dest
= (uint
*) (stmap
+ spanY
* pt
->stride
);
1086 GLfloat
*destf
= (GLfloat
*)dest
;
1088 assert(usage
== PIPE_TRANSFER_WRITE
);
1089 for (k
= 0; k
< width
; k
++) {
1090 destf
[k
*2] = zValuesFloat
[k
];
1091 dest
[k
*2+1] = sValues
[k
] & 0xff;
1095 uint
*dest
= (uint
*) (stmap
+ spanY
* pt
->stride
);
1097 assert(usage
== PIPE_TRANSFER_READ_WRITE
);
1098 for (k
= 0; k
< width
; k
++) {
1099 dest
[k
*2+1] = sValues
[k
] & 0xff;
1110 _mesa_error(ctx
, GL_OUT_OF_MEMORY
, "glDrawPixels()");
1116 _mesa_unmap_pbo_source(ctx
, &clippedUnpack
);
1118 /* unmap the stencil buffer */
1119 pipe_transfer_unmap(pipe
, pt
);
1124 * Get fragment program variant for a glDrawPixels or glCopyPixels
1125 * command for RGBA data.
1127 static struct st_fp_variant
*
1128 get_color_fp_variant(struct st_context
*st
)
1130 struct gl_context
*ctx
= st
->ctx
;
1131 struct st_fp_variant_key key
;
1132 struct st_fp_variant
*fpv
;
1134 memset(&key
, 0, sizeof(key
));
1136 key
.st
= st
->has_shareable_shaders
? NULL
: st
;
1138 key
.scaleAndBias
= (ctx
->Pixel
.RedBias
!= 0.0 ||
1139 ctx
->Pixel
.RedScale
!= 1.0 ||
1140 ctx
->Pixel
.GreenBias
!= 0.0 ||
1141 ctx
->Pixel
.GreenScale
!= 1.0 ||
1142 ctx
->Pixel
.BlueBias
!= 0.0 ||
1143 ctx
->Pixel
.BlueScale
!= 1.0 ||
1144 ctx
->Pixel
.AlphaBias
!= 0.0 ||
1145 ctx
->Pixel
.AlphaScale
!= 1.0);
1146 key
.pixelMaps
= ctx
->Pixel
.MapColorFlag
;
1147 key
.clamp_color
= st
->clamp_frag_color_in_shader
&&
1148 ctx
->Color
._ClampFragmentColor
;
1150 fpv
= st_get_fp_variant(st
, st
->fp
, &key
);
1156 * Get fragment program variant for a glDrawPixels command
1157 * for COLOR_INDEX data
1159 static struct st_fp_variant
*
1160 get_color_index_fp_variant(struct st_context
*st
)
1162 struct gl_context
*ctx
= st
->ctx
;
1163 struct st_fp_variant_key key
;
1164 struct st_fp_variant
*fpv
;
1166 memset(&key
, 0, sizeof(key
));
1168 key
.st
= st
->has_shareable_shaders
? NULL
: st
;
1170 /* Since GL is always in RGBA mode MapColorFlag does not
1171 * affect GL_COLOR_INDEX format.
1172 * Scale and bias also never affect GL_COLOR_INDEX format.
1174 key
.scaleAndBias
= 0;
1176 key
.clamp_color
= st
->clamp_frag_color_in_shader
&&
1177 ctx
->Color
._ClampFragmentColor
;
1179 fpv
= st_get_fp_variant(st
, st
->fp
, &key
);
1186 * Clamp glDrawPixels width and height to the maximum texture size.
1189 clamp_size(struct pipe_context
*pipe
, GLsizei
*width
, GLsizei
*height
,
1190 struct gl_pixelstore_attrib
*unpack
)
1192 const int maxSize
= pipe
->screen
->get_param(pipe
->screen
,
1193 PIPE_CAP_MAX_TEXTURE_2D_SIZE
);
1195 if (*width
> maxSize
) {
1196 if (unpack
->RowLength
== 0)
1197 unpack
->RowLength
= *width
;
1200 if (*height
> maxSize
) {
1207 * Search the array of 4 swizzle components for the named component and return
1211 search_swizzle(const unsigned char swizzle
[4], unsigned component
)
1214 for (i
= 0; i
< 4; i
++) {
1215 if (swizzle
[i
] == component
)
1218 assert(!"search_swizzle() failed");
1224 * Set the sampler view's swizzle terms. This is used to handle RGBA
1225 * swizzling when the incoming image format isn't an exact match for
1226 * the actual texture format. For example, if we have glDrawPixels(
1227 * GL_RGBA, GL_UNSIGNED_BYTE) and we chose the texture format
1228 * PIPE_FORMAT_B8G8R8A8 then we can do use the sampler view swizzle to
1229 * avoid swizzling all the pixels in software in the texstore code.
1232 setup_sampler_swizzle(struct pipe_sampler_view
*sv
, GLenum format
, GLenum type
)
1234 if ((format
== GL_RGBA
|| format
== GL_BGRA
) && type
== GL_UNSIGNED_BYTE
) {
1235 const struct util_format_description
*desc
=
1236 util_format_description(sv
->texture
->format
);
1237 unsigned c0
, c1
, c2
, c3
;
1239 /* Every gallium driver supports at least one 32-bit packed RGBA format.
1240 * We must have chosen one for (GL_RGBA, GL_UNSIGNED_BYTE).
1242 assert(desc
->block
.bits
== 32);
1244 /* invert the format's swizzle to setup the sampler's swizzle */
1245 if (format
== GL_RGBA
) {
1246 c0
= PIPE_SWIZZLE_X
;
1247 c1
= PIPE_SWIZZLE_Y
;
1248 c2
= PIPE_SWIZZLE_Z
;
1249 c3
= PIPE_SWIZZLE_W
;
1252 assert(format
== GL_BGRA
);
1253 c0
= PIPE_SWIZZLE_Z
;
1254 c1
= PIPE_SWIZZLE_Y
;
1255 c2
= PIPE_SWIZZLE_X
;
1256 c3
= PIPE_SWIZZLE_W
;
1258 sv
->swizzle_r
= search_swizzle(desc
->swizzle
, c0
);
1259 sv
->swizzle_g
= search_swizzle(desc
->swizzle
, c1
);
1260 sv
->swizzle_b
= search_swizzle(desc
->swizzle
, c2
);
1261 sv
->swizzle_a
= search_swizzle(desc
->swizzle
, c3
);
1264 /* use the default sampler swizzle */
1270 * Compute the effective raster z position. This performs depth-clamping
1274 get_effective_raster_z(struct gl_context
*ctx
)
1276 float z
= ctx
->Current
.RasterPos
[2];
1277 if (st_context(ctx
)->clamp_frag_depth_in_shader
) {
1280 if (ctx
->ViewportArray
[0].Near
< ctx
->ViewportArray
[0].Far
) {
1281 depth_near
= ctx
->ViewportArray
[0].Near
;
1282 depth_far
= ctx
->ViewportArray
[0].Far
;
1284 depth_near
= ctx
->ViewportArray
[0].Far
;
1285 depth_far
= ctx
->ViewportArray
[0].Near
;
1288 if (ctx
->Transform
.DepthClampNear
)
1289 z
= MAX2(z
, depth_near
);
1290 if (ctx
->Transform
.DepthClampFar
)
1291 z
= MIN2(z
, depth_far
);
1298 * Called via ctx->Driver.DrawPixels()
1301 st_DrawPixels(struct gl_context
*ctx
, GLint x
, GLint y
,
1302 GLsizei width
, GLsizei height
,
1303 GLenum format
, GLenum type
,
1304 const struct gl_pixelstore_attrib
*unpack
, const void *pixels
)
1307 struct st_context
*st
= st_context(ctx
);
1308 struct pipe_context
*pipe
= st
->pipe
;
1309 GLboolean write_stencil
= GL_FALSE
, write_depth
= GL_FALSE
;
1310 struct pipe_sampler_view
*sv
[2] = { NULL
};
1311 int num_sampler_view
= 1;
1312 struct gl_pixelstore_attrib clippedUnpack
;
1313 struct st_fp_variant
*fpv
= NULL
;
1314 struct pipe_resource
*pt
;
1316 /* Mesa state should be up to date by now */
1317 assert(ctx
->NewState
== 0x0);
1319 _mesa_update_draw_buffer_bounds(ctx
, ctx
->DrawBuffer
);
1321 st_flush_bitmap_cache(st
);
1322 st_invalidate_readpix_cache(st
);
1324 st_validate_state(st
, ST_PIPELINE_META
);
1326 /* Limit the size of the glDrawPixels to the max texture size.
1327 * Strictly speaking, that's not correct but since we don't handle
1328 * larger images yet, this is better than crashing.
1330 clippedUnpack
= *unpack
;
1331 unpack
= &clippedUnpack
;
1332 clamp_size(st
->pipe
, &width
, &height
, &clippedUnpack
);
1334 if (format
== GL_DEPTH_STENCIL
)
1335 write_stencil
= write_depth
= GL_TRUE
;
1336 else if (format
== GL_STENCIL_INDEX
)
1337 write_stencil
= GL_TRUE
;
1338 else if (format
== GL_DEPTH_COMPONENT
)
1339 write_depth
= GL_TRUE
;
1341 if (write_stencil
&&
1342 !pipe
->screen
->get_param(pipe
->screen
, PIPE_CAP_SHADER_STENCIL_EXPORT
)) {
1343 /* software fallback */
1344 draw_stencil_pixels(ctx
, x
, y
, width
, height
, format
, type
,
1349 /* Put glDrawPixels image into a texture */
1350 pt
= make_texture(st
, width
, height
, format
, type
, unpack
, pixels
);
1352 _mesa_error(ctx
, GL_OUT_OF_MEMORY
, "glDrawPixels");
1356 st_make_passthrough_vertex_shader(st
);
1359 * Get vertex/fragment shaders
1361 if (write_depth
|| write_stencil
) {
1362 driver_fp
= get_drawpix_z_stencil_program(st
, write_depth
,
1366 fpv
= (format
!= GL_COLOR_INDEX
) ? get_color_fp_variant(st
) :
1367 get_color_index_fp_variant(st
);
1369 driver_fp
= fpv
->base
.driver_shader
;
1371 if (ctx
->Pixel
.MapColorFlag
&& format
!= GL_COLOR_INDEX
) {
1372 pipe_sampler_view_reference(&sv
[1],
1373 st
->pixel_xfer
.pixelmap_sampler_view
);
1377 /* compiling a new fragment shader variant added new state constants
1378 * into the constant buffer, we need to update them
1380 st_upload_constants(st
, &st
->fp
->Base
);
1383 /* create sampler view for the image */
1384 sv
[0] = st_create_texture_sampler_view(st
->pipe
, pt
);
1386 _mesa_error(ctx
, GL_OUT_OF_MEMORY
, "glDrawPixels");
1387 pipe_resource_reference(&pt
, NULL
);
1391 /* Set up the sampler view's swizzle */
1392 setup_sampler_swizzle(sv
[0], format
, type
);
1394 /* Create a second sampler view to read stencil. The stencil is
1395 * written using the shader stencil export functionality.
1397 if (write_stencil
) {
1398 enum pipe_format stencil_format
=
1399 util_format_stencil_only(pt
->format
);
1400 /* we should not be doing pixel map/transfer (see above) */
1401 assert(num_sampler_view
== 1);
1402 sv
[1] = st_create_texture_sampler_view_format(st
->pipe
, pt
,
1405 _mesa_error(ctx
, GL_OUT_OF_MEMORY
, "glDrawPixels");
1406 pipe_resource_reference(&pt
, NULL
);
1407 pipe_sampler_view_reference(&sv
[0], NULL
);
1413 draw_textured_quad(ctx
, x
, y
, get_effective_raster_z(ctx
),
1415 ctx
->Pixel
.ZoomX
, ctx
->Pixel
.ZoomY
,
1420 ctx
->Current
.RasterColor
,
1421 GL_FALSE
, write_depth
, write_stencil
);
1422 pipe_sampler_view_reference(&sv
[0], NULL
);
1423 if (num_sampler_view
> 1)
1424 pipe_sampler_view_reference(&sv
[1], NULL
);
1426 /* free the texture (but may persist in the cache) */
1427 pipe_resource_reference(&pt
, NULL
);
1433 * Software fallback for glCopyPixels(GL_STENCIL).
1436 copy_stencil_pixels(struct gl_context
*ctx
, GLint srcx
, GLint srcy
,
1437 GLsizei width
, GLsizei height
,
1438 GLint dstx
, GLint dsty
)
1440 struct st_renderbuffer
*rbDraw
;
1441 struct pipe_context
*pipe
= st_context(ctx
)->pipe
;
1442 enum pipe_transfer_usage usage
;
1443 struct pipe_transfer
*ptDraw
;
1448 buffer
= malloc(width
* height
* sizeof(ubyte
));
1450 _mesa_error(ctx
, GL_OUT_OF_MEMORY
, "glCopyPixels(stencil)");
1454 /* Get the dest renderbuffer */
1455 rbDraw
= st_renderbuffer(ctx
->DrawBuffer
->
1456 Attachment
[BUFFER_STENCIL
].Renderbuffer
);
1458 /* this will do stencil pixel transfer ops */
1459 _mesa_readpixels(ctx
, srcx
, srcy
, width
, height
,
1460 GL_STENCIL_INDEX
, GL_UNSIGNED_BYTE
,
1461 &ctx
->DefaultPacking
, buffer
);
1464 /* debug code: dump stencil values */
1466 for (row
= 0; row
< height
; row
++) {
1467 printf("%3d: ", row
);
1468 for (col
= 0; col
< width
; col
++) {
1469 printf("%02x ", buffer
[col
+ row
* width
]);
1475 if (_mesa_is_format_packed_depth_stencil(rbDraw
->Base
.Format
))
1476 usage
= PIPE_TRANSFER_READ_WRITE
;
1478 usage
= PIPE_TRANSFER_WRITE
;
1480 if (st_fb_orientation(ctx
->DrawBuffer
) == Y_0_TOP
) {
1481 dsty
= rbDraw
->Base
.Height
- dsty
- height
;
1484 assert(util_format_get_blockwidth(rbDraw
->texture
->format
) == 1);
1485 assert(util_format_get_blockheight(rbDraw
->texture
->format
) == 1);
1487 /* map the stencil buffer */
1488 drawMap
= pipe_transfer_map(pipe
,
1490 rbDraw
->surface
->u
.tex
.level
,
1491 rbDraw
->surface
->u
.tex
.first_layer
,
1493 width
, height
, &ptDraw
);
1496 /* XXX PixelZoom not handled yet */
1497 for (i
= 0; i
< height
; i
++) {
1504 if (st_fb_orientation(ctx
->DrawBuffer
) == Y_0_TOP
) {
1508 dst
= drawMap
+ y
* ptDraw
->stride
;
1509 src
= buffer
+ i
* width
;
1511 _mesa_pack_ubyte_stencil_row(rbDraw
->Base
.Format
, width
, src
, dst
);
1516 /* unmap the stencil buffer */
1517 pipe_transfer_unmap(pipe
, ptDraw
);
1522 * Return renderbuffer to use for reading color pixels for glCopyPixels
1524 static struct st_renderbuffer
*
1525 st_get_color_read_renderbuffer(struct gl_context
*ctx
)
1527 struct gl_framebuffer
*fb
= ctx
->ReadBuffer
;
1528 struct st_renderbuffer
*strb
=
1529 st_renderbuffer(fb
->_ColorReadBuffer
);
1536 * Try to do a glCopyPixels for simple cases with a blit by calling
1539 * We can do this when we're copying color pixels (depth/stencil
1540 * eventually) with no pixel zoom, no pixel transfer ops, no
1541 * per-fragment ops, and the src/dest regions don't overlap.
1544 blit_copy_pixels(struct gl_context
*ctx
, GLint srcx
, GLint srcy
,
1545 GLsizei width
, GLsizei height
,
1546 GLint dstx
, GLint dsty
, GLenum type
)
1548 struct st_context
*st
= st_context(ctx
);
1549 struct pipe_context
*pipe
= st
->pipe
;
1550 struct pipe_screen
*screen
= pipe
->screen
;
1551 struct gl_pixelstore_attrib pack
, unpack
;
1552 GLint readX
, readY
, readW
, readH
, drawX
, drawY
, drawW
, drawH
;
1554 if (ctx
->Pixel
.ZoomX
== 1.0 &&
1555 ctx
->Pixel
.ZoomY
== 1.0 &&
1556 (type
!= GL_COLOR
||
1557 (ctx
->_ImageTransferState
== 0x0 &&
1558 !ctx
->Color
.BlendEnabled
&&
1559 !ctx
->Color
.AlphaEnabled
&&
1560 (!ctx
->Color
.ColorLogicOpEnabled
|| ctx
->Color
.LogicOp
== GL_COPY
) &&
1562 !ctx
->Fog
.Enabled
&&
1563 !ctx
->Stencil
.Enabled
&&
1564 !ctx
->FragmentProgram
.Enabled
&&
1565 !ctx
->VertexProgram
.Enabled
&&
1566 !ctx
->_Shader
->CurrentProgram
[MESA_SHADER_FRAGMENT
] &&
1567 !_mesa_ati_fragment_shader_enabled(ctx
) &&
1568 ctx
->DrawBuffer
->_NumColorDrawBuffers
== 1)) &&
1569 !ctx
->Query
.CondRenderQuery
&&
1570 !ctx
->Query
.CurrentOcclusionObject
) {
1571 struct st_renderbuffer
*rbRead
, *rbDraw
;
1574 * Clip the read region against the src buffer bounds.
1575 * We'll still allocate a temporary buffer/texture for the original
1576 * src region size but we'll only read the region which is on-screen.
1577 * This may mean that we draw garbage pixels into the dest region, but
1584 pack
= ctx
->DefaultPacking
;
1585 if (!_mesa_clip_readpixels(ctx
, &readX
, &readY
, &readW
, &readH
, &pack
))
1586 return GL_TRUE
; /* all done */
1588 /* clip against dest buffer bounds and scissor box */
1589 drawX
= dstx
+ pack
.SkipPixels
;
1590 drawY
= dsty
+ pack
.SkipRows
;
1592 if (!_mesa_clip_drawpixels(ctx
, &drawX
, &drawY
, &readW
, &readH
, &unpack
))
1593 return GL_TRUE
; /* all done */
1595 readX
= readX
- pack
.SkipPixels
+ unpack
.SkipPixels
;
1596 readY
= readY
- pack
.SkipRows
+ unpack
.SkipRows
;
1601 if (type
== GL_COLOR
) {
1602 rbRead
= st_get_color_read_renderbuffer(ctx
);
1603 rbDraw
= st_renderbuffer(ctx
->DrawBuffer
->_ColorDrawBuffers
[0]);
1604 } else if (type
== GL_DEPTH
|| type
== GL_DEPTH_STENCIL
) {
1605 rbRead
= st_renderbuffer(ctx
->ReadBuffer
->Attachment
[BUFFER_DEPTH
].Renderbuffer
);
1606 rbDraw
= st_renderbuffer(ctx
->DrawBuffer
->Attachment
[BUFFER_DEPTH
].Renderbuffer
);
1607 } else if (type
== GL_STENCIL
) {
1608 rbRead
= st_renderbuffer(ctx
->ReadBuffer
->Attachment
[BUFFER_STENCIL
].Renderbuffer
);
1609 rbDraw
= st_renderbuffer(ctx
->DrawBuffer
->Attachment
[BUFFER_STENCIL
].Renderbuffer
);
1614 /* Flip src/dst position depending on the orientation of buffers. */
1615 if (st_fb_orientation(ctx
->ReadBuffer
) == Y_0_TOP
) {
1616 readY
= rbRead
->Base
.Height
- readY
;
1620 if (st_fb_orientation(ctx
->DrawBuffer
) == Y_0_TOP
) {
1621 /* We can't flip the destination for pipe->blit, so we only adjust
1622 * its position and flip the source.
1624 drawY
= rbDraw
->Base
.Height
- drawY
- drawH
;
1629 if (rbRead
!= rbDraw
||
1630 !_mesa_regions_overlap(readX
, readY
, readX
+ readW
, readY
+ readH
,
1631 drawX
, drawY
, drawX
+ drawW
, drawY
+ drawH
)) {
1632 struct pipe_blit_info blit
;
1634 memset(&blit
, 0, sizeof(blit
));
1635 blit
.src
.resource
= rbRead
->texture
;
1636 blit
.src
.level
= rbRead
->surface
->u
.tex
.level
;
1637 blit
.src
.format
= rbRead
->texture
->format
;
1638 blit
.src
.box
.x
= readX
;
1639 blit
.src
.box
.y
= readY
;
1640 blit
.src
.box
.z
= rbRead
->surface
->u
.tex
.first_layer
;
1641 blit
.src
.box
.width
= readW
;
1642 blit
.src
.box
.height
= readH
;
1643 blit
.src
.box
.depth
= 1;
1644 blit
.dst
.resource
= rbDraw
->texture
;
1645 blit
.dst
.level
= rbDraw
->surface
->u
.tex
.level
;
1646 blit
.dst
.format
= rbDraw
->texture
->format
;
1647 blit
.dst
.box
.x
= drawX
;
1648 blit
.dst
.box
.y
= drawY
;
1649 blit
.dst
.box
.z
= rbDraw
->surface
->u
.tex
.first_layer
;
1650 blit
.dst
.box
.width
= drawW
;
1651 blit
.dst
.box
.height
= drawH
;
1652 blit
.dst
.box
.depth
= 1;
1653 blit
.filter
= PIPE_TEX_FILTER_NEAREST
;
1655 if (type
== GL_COLOR
)
1656 blit
.mask
|= PIPE_MASK_RGBA
;
1657 if (type
== GL_DEPTH
)
1658 blit
.mask
|= PIPE_MASK_Z
;
1659 if (type
== GL_STENCIL
)
1660 blit
.mask
|= PIPE_MASK_S
;
1661 if (type
== GL_DEPTH_STENCIL
)
1662 blit
.mask
|= PIPE_MASK_ZS
;
1664 if (ctx
->DrawBuffer
!= ctx
->WinSysDrawBuffer
)
1665 st_window_rectangles_to_blit(ctx
, &blit
);
1667 if (screen
->is_format_supported(screen
, blit
.src
.format
,
1668 blit
.src
.resource
->target
,
1669 blit
.src
.resource
->nr_samples
,
1670 blit
.src
.resource
->nr_storage_samples
,
1671 PIPE_BIND_SAMPLER_VIEW
) &&
1672 screen
->is_format_supported(screen
, blit
.dst
.format
,
1673 blit
.dst
.resource
->target
,
1674 blit
.dst
.resource
->nr_samples
,
1675 blit
.dst
.resource
->nr_storage_samples
,
1676 PIPE_BIND_RENDER_TARGET
)) {
1677 pipe
->blit(pipe
, &blit
);
1688 st_CopyPixels(struct gl_context
*ctx
, GLint srcx
, GLint srcy
,
1689 GLsizei width
, GLsizei height
,
1690 GLint dstx
, GLint dsty
, GLenum type
)
1692 struct st_context
*st
= st_context(ctx
);
1693 struct pipe_context
*pipe
= st
->pipe
;
1694 struct pipe_screen
*screen
= pipe
->screen
;
1695 struct st_renderbuffer
*rbRead
;
1697 struct pipe_resource
*pt
;
1698 struct pipe_sampler_view
*sv
[2] = { NULL
};
1699 struct st_fp_variant
*fpv
= NULL
;
1700 int num_sampler_view
= 1;
1701 enum pipe_format srcFormat
;
1703 GLboolean invertTex
= GL_FALSE
;
1704 GLint readX
, readY
, readW
, readH
;
1705 struct gl_pixelstore_attrib pack
= ctx
->DefaultPacking
;
1707 _mesa_update_draw_buffer_bounds(ctx
, ctx
->DrawBuffer
);
1709 st_flush_bitmap_cache(st
);
1710 st_invalidate_readpix_cache(st
);
1712 st_validate_state(st
, ST_PIPELINE_META
);
1714 if (blit_copy_pixels(ctx
, srcx
, srcy
, width
, height
, dstx
, dsty
, type
))
1717 if (type
== GL_DEPTH_STENCIL
) {
1718 /* XXX make this more efficient */
1719 st_CopyPixels(ctx
, srcx
, srcy
, width
, height
, dstx
, dsty
, GL_STENCIL
);
1720 st_CopyPixels(ctx
, srcx
, srcy
, width
, height
, dstx
, dsty
, GL_DEPTH
);
1724 if (type
== GL_STENCIL
) {
1725 /* can't use texturing to do stencil */
1726 copy_stencil_pixels(ctx
, srcx
, srcy
, width
, height
, dstx
, dsty
);
1731 * The subsequent code implements glCopyPixels by copying the source
1732 * pixels into a temporary texture that's then applied to a textured quad.
1733 * When we draw the textured quad, all the usual per-fragment operations
1737 st_make_passthrough_vertex_shader(st
);
1740 * Get vertex/fragment shaders
1742 if (type
== GL_COLOR
) {
1743 fpv
= get_color_fp_variant(st
);
1745 rbRead
= st_get_color_read_renderbuffer(ctx
);
1747 driver_fp
= fpv
->base
.driver_shader
;
1749 if (ctx
->Pixel
.MapColorFlag
) {
1750 pipe_sampler_view_reference(&sv
[1],
1751 st
->pixel_xfer
.pixelmap_sampler_view
);
1755 /* compiling a new fragment shader variant added new state constants
1756 * into the constant buffer, we need to update them
1758 st_upload_constants(st
, &st
->fp
->Base
);
1761 assert(type
== GL_DEPTH
);
1762 rbRead
= st_renderbuffer(ctx
->ReadBuffer
->
1763 Attachment
[BUFFER_DEPTH
].Renderbuffer
);
1765 driver_fp
= get_drawpix_z_stencil_program(st
, GL_TRUE
, GL_FALSE
);
1768 /* Choose the format for the temporary texture. */
1769 srcFormat
= rbRead
->texture
->format
;
1770 srcBind
= PIPE_BIND_SAMPLER_VIEW
|
1771 (type
== GL_COLOR
? PIPE_BIND_RENDER_TARGET
: PIPE_BIND_DEPTH_STENCIL
);
1773 if (!screen
->is_format_supported(screen
, srcFormat
, st
->internal_target
, 0,
1775 /* srcFormat is non-renderable. Find a compatible renderable format. */
1776 if (type
== GL_DEPTH
) {
1777 srcFormat
= st_choose_format(st
, GL_DEPTH_COMPONENT
, GL_NONE
,
1778 GL_NONE
, st
->internal_target
, 0, 0,
1779 srcBind
, false, false);
1782 assert(type
== GL_COLOR
);
1784 if (util_format_is_float(srcFormat
)) {
1785 srcFormat
= st_choose_format(st
, GL_RGBA32F
, GL_NONE
,
1786 GL_NONE
, st
->internal_target
, 0, 0,
1787 srcBind
, false, false);
1789 else if (util_format_is_pure_sint(srcFormat
)) {
1790 srcFormat
= st_choose_format(st
, GL_RGBA32I
, GL_NONE
,
1791 GL_NONE
, st
->internal_target
, 0, 0,
1792 srcBind
, false, false);
1794 else if (util_format_is_pure_uint(srcFormat
)) {
1795 srcFormat
= st_choose_format(st
, GL_RGBA32UI
, GL_NONE
,
1796 GL_NONE
, st
->internal_target
, 0, 0,
1797 srcBind
, false, false);
1799 else if (util_format_is_snorm(srcFormat
)) {
1800 srcFormat
= st_choose_format(st
, GL_RGBA16_SNORM
, GL_NONE
,
1801 GL_NONE
, st
->internal_target
, 0, 0,
1802 srcBind
, false, false);
1805 srcFormat
= st_choose_format(st
, GL_RGBA
, GL_NONE
,
1806 GL_NONE
, st
->internal_target
, 0, 0,
1807 srcBind
, false, false);
1811 if (srcFormat
== PIPE_FORMAT_NONE
) {
1812 assert(0 && "cannot choose a format for src of CopyPixels");
1817 /* Invert src region if needed */
1818 if (st_fb_orientation(ctx
->ReadBuffer
) == Y_0_TOP
) {
1819 srcy
= ctx
->ReadBuffer
->Height
- srcy
- height
;
1820 invertTex
= !invertTex
;
1823 /* Clip the read region against the src buffer bounds.
1824 * We'll still allocate a temporary buffer/texture for the original
1825 * src region size but we'll only read the region which is on-screen.
1826 * This may mean that we draw garbage pixels into the dest region, but
1833 if (!_mesa_clip_readpixels(ctx
, &readX
, &readY
, &readW
, &readH
, &pack
)) {
1834 /* The source region is completely out of bounds. Do nothing.
1835 * The GL spec says "Results of copies from outside the window,
1836 * or from regions of the window that are not exposed, are
1837 * hardware dependent and undefined."
1842 readW
= MAX2(0, readW
);
1843 readH
= MAX2(0, readH
);
1845 /* Allocate the temporary texture. */
1846 pt
= alloc_texture(st
, width
, height
, srcFormat
, srcBind
);
1850 sv
[0] = st_create_texture_sampler_view(st
->pipe
, pt
);
1852 pipe_resource_reference(&pt
, NULL
);
1856 /* Copy the src region to the temporary texture. */
1858 struct pipe_blit_info blit
;
1860 memset(&blit
, 0, sizeof(blit
));
1861 blit
.src
.resource
= rbRead
->texture
;
1862 blit
.src
.level
= rbRead
->surface
->u
.tex
.level
;
1863 blit
.src
.format
= rbRead
->texture
->format
;
1864 blit
.src
.box
.x
= readX
;
1865 blit
.src
.box
.y
= readY
;
1866 blit
.src
.box
.z
= rbRead
->surface
->u
.tex
.first_layer
;
1867 blit
.src
.box
.width
= readW
;
1868 blit
.src
.box
.height
= readH
;
1869 blit
.src
.box
.depth
= 1;
1870 blit
.dst
.resource
= pt
;
1872 blit
.dst
.format
= pt
->format
;
1873 blit
.dst
.box
.x
= pack
.SkipPixels
;
1874 blit
.dst
.box
.y
= pack
.SkipRows
;
1876 blit
.dst
.box
.width
= readW
;
1877 blit
.dst
.box
.height
= readH
;
1878 blit
.dst
.box
.depth
= 1;
1879 blit
.mask
= util_format_get_mask(pt
->format
) & ~PIPE_MASK_S
;
1880 blit
.filter
= PIPE_TEX_FILTER_NEAREST
;
1882 pipe
->blit(pipe
, &blit
);
1885 /* OK, the texture 'pt' contains the src image/pixels. Now draw a
1886 * textured quad with that texture.
1889 draw_textured_quad(ctx
, dstx
, dsty
, get_effective_raster_z(ctx
),
1890 width
, height
, ctx
->Pixel
.ZoomX
, ctx
->Pixel
.ZoomY
,
1895 ctx
->Current
.Attrib
[VERT_ATTRIB_COLOR0
],
1896 invertTex
, GL_FALSE
, GL_FALSE
);
1898 pipe_resource_reference(&pt
, NULL
);
1899 pipe_sampler_view_reference(&sv
[0], NULL
);
1904 void st_init_drawpixels_functions(struct dd_function_table
*functions
)
1906 functions
->DrawPixels
= st_DrawPixels
;
1907 functions
->CopyPixels
= st_CopyPixels
;
1912 st_destroy_drawpix(struct st_context
*st
)
1916 for (i
= 0; i
< ARRAY_SIZE(st
->drawpix
.zs_shaders
); i
++) {
1917 if (st
->drawpix
.zs_shaders
[i
])
1918 cso_delete_fragment_shader(st
->cso_context
,
1919 st
->drawpix
.zs_shaders
[i
]);
1922 if (st
->passthrough_vs
)
1923 cso_delete_vertex_shader(st
->cso_context
, st
->passthrough_vs
);
1925 /* Free cache data */
1926 for (i
= 0; i
< ARRAY_SIZE(st
->drawpix_cache
.entries
); i
++) {
1927 struct drawpix_cache_entry
*entry
= &st
->drawpix_cache
.entries
[i
];
1929 pipe_resource_reference(&entry
->texture
, NULL
);