/*
 * Mesa 3-D graphics library
 *
 * Copyright (C) 2014 Intel Corporation All Rights Reserved.
 *
 * Permission is hereby granted, free of charge, to any person obtaining a
 * copy of this software and associated documentation files (the "Software"),
 * to deal in the Software without restriction, including without limitation
 * the rights to use, copy, modify, merge, publish, distribute, sublicense,
 * and/or sell copies of the Software, and to permit persons to whom the
 * Software is furnished to do so, subject to the following conditions:
 *
 * The above copyright notice and this permission notice shall be included
 * in all copies or substantial portions of the Software.
 *
 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS
 * OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
 * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT.  IN NO EVENT SHALL
 * THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR
 * OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE,
 * ARISING FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR
 * OTHER DEALINGS IN THE SOFTWARE.
 *
 * Authors:
 *    Jason Ekstrand <jason.ekstrand@intel.com>
 */

#include <string.h>

#include "intel_tex.h"
#include "intel_blit.h"
#include "intel_mipmap_tree.h"
#include "main/formats.h"
#include "drivers/common/meta.h"

35 copy_image_with_blitter(struct brw_context
*brw
,
36 struct intel_mipmap_tree
*src_mt
, int src_level
,
37 int src_x
, int src_y
, int src_z
,
38 struct intel_mipmap_tree
*dst_mt
, int dst_level
,
39 int dst_x
, int dst_y
, int dst_z
,
40 int src_width
, int src_height
)
43 uint32_t src_image_x
, src_image_y
, dst_image_x
, dst_image_y
;
46 /* The blitter doesn't understand multisampling at all. */
47 if (src_mt
->num_samples
> 0 || dst_mt
->num_samples
> 0)
50 /* According to the Ivy Bridge PRM, Vol1 Part4, section 1.2.1.2 (Graphics
51 * Data Size Limitations):
53 * The BLT engine is capable of transferring very large quantities of
54 * graphics data. Any graphics data read from and written to the
55 * destination is permitted to represent a number of pixels that
56 * occupies up to 65,536 scan lines and up to 32,768 bytes per scan line
57 * at the destination. The maximum number of pixels that may be
58 * represented per scan line’s worth of graphics data depends on the
61 * Furthermore, intelEmitCopyBlit (which is called below) uses a signed
62 * 16-bit integer to represent buffer pitch, so it can only handle buffer
65 * As a result of these two limitations, we can only use the blitter to do
66 * this copy when the miptree's pitch is less than 32k.
68 if (src_mt
->pitch
>= 32768 ||
69 dst_mt
->pitch
>= 32768) {
70 perf_debug("Falling back due to >=32k pitch\n");
74 intel_miptree_get_image_offset(src_mt
, src_level
, src_z
,
75 &src_image_x
, &src_image_y
);
77 if (_mesa_is_format_compressed(src_mt
->format
)) {
78 _mesa_get_format_block_size(src_mt
->format
, &bw
, &bh
);
80 assert(src_x
% bw
== 0);
81 assert(src_y
% bh
== 0);
82 assert(src_width
% bw
== 0);
83 assert(src_height
% bh
== 0);
88 src_height
/= (int)bh
;
90 /* Inside of the miptree, the x offsets are stored in pixels while
91 * the y offsets are stored in blocks. We need to scale just the x
96 cpp
= _mesa_get_format_bytes(src_mt
->format
);
100 src_x
+= src_image_x
;
101 src_y
+= src_image_y
;
103 intel_miptree_get_image_offset(dst_mt
, dst_level
, dst_z
,
104 &dst_image_x
, &dst_image_y
);
106 if (_mesa_is_format_compressed(dst_mt
->format
)) {
107 _mesa_get_format_block_size(dst_mt
->format
, &bw
, &bh
);
109 assert(dst_x
% bw
== 0);
110 assert(dst_y
% bh
== 0);
115 /* Inside of the miptree, the x offsets are stored in pixels while
116 * the y offsets are stored in blocks. We need to scale just the x
121 dst_x
+= dst_image_x
;
122 dst_y
+= dst_image_y
;
124 return intelEmitCopyBlit(brw
,
127 src_mt
->bo
, src_mt
->offset
,
131 dst_mt
->bo
, dst_mt
->offset
,
136 src_width
, src_height
,
141 copy_image_with_memcpy(struct brw_context
*brw
,
142 struct intel_mipmap_tree
*src_mt
, int src_level
,
143 int src_x
, int src_y
, int src_z
,
144 struct intel_mipmap_tree
*dst_mt
, int dst_level
,
145 int dst_x
, int dst_y
, int dst_z
,
146 int src_width
, int src_height
)
149 void *mapped
, *src_mapped
, *dst_mapped
;
150 ptrdiff_t src_stride
, dst_stride
, cpp
;
151 int map_x1
, map_y1
, map_x2
, map_y2
;
152 GLuint src_bw
, src_bh
;
154 cpp
= _mesa_get_format_bytes(src_mt
->format
);
155 _mesa_get_format_block_size(src_mt
->format
, &src_bw
, &src_bh
);
157 assert(src_width
% src_bw
== 0);
158 assert(src_height
% src_bw
== 0);
159 assert(src_x
% src_bw
== 0);
160 assert(src_y
% src_bw
== 0);
162 /* If we are on the same miptree, same level, and same slice, then
163 * intel_miptree_map won't let us map it twice. We have to do things a
164 * bit differently. In particular, we do a single map large enough for
165 * both portions and in read-write mode.
167 same_slice
= src_mt
== dst_mt
&& src_level
== dst_level
&& src_z
== dst_z
;
170 assert(dst_x
% src_bw
== 0);
171 assert(dst_y
% src_bw
== 0);
173 map_x1
= MIN2(src_x
, dst_x
);
174 map_y1
= MIN2(src_y
, dst_y
);
175 map_x2
= MAX2(src_x
, dst_x
) + src_width
;
176 map_y2
= MAX2(src_y
, dst_y
) + src_height
;
178 intel_miptree_map(brw
, src_mt
, src_level
, src_z
,
179 map_x1
, map_y1
, map_x2
- map_x1
, map_y2
- map_y1
,
180 GL_MAP_READ_BIT
| GL_MAP_WRITE_BIT
,
181 &mapped
, &src_stride
);
183 dst_stride
= src_stride
;
185 /* Set the offsets here so we don't have to think about while looping */
186 src_mapped
= mapped
+ ((src_y
- map_y1
) / src_bh
) * src_stride
+
187 ((src_x
- map_x1
) / src_bw
) * cpp
;
188 dst_mapped
= mapped
+ ((dst_y
- map_y1
) / src_bh
) * dst_stride
+
189 ((dst_x
- map_x1
) / src_bw
) * cpp
;
191 intel_miptree_map(brw
, src_mt
, src_level
, src_z
,
192 src_x
, src_y
, src_width
, src_height
,
193 GL_MAP_READ_BIT
, &src_mapped
, &src_stride
);
194 intel_miptree_map(brw
, dst_mt
, dst_level
, dst_z
,
195 dst_x
, dst_y
, src_width
, src_height
,
196 GL_MAP_WRITE_BIT
, &dst_mapped
, &dst_stride
);
199 src_width
/= (int)src_bw
;
200 src_height
/= (int)src_bh
;
202 for (int i
= 0; i
< src_height
; ++i
) {
203 memcpy(dst_mapped
, src_mapped
, src_width
* cpp
);
204 src_mapped
+= src_stride
;
205 dst_mapped
+= dst_stride
;
209 intel_miptree_unmap(brw
, src_mt
, src_level
, src_z
);
211 intel_miptree_unmap(brw
, dst_mt
, dst_level
, dst_z
);
212 intel_miptree_unmap(brw
, src_mt
, src_level
, src_z
);
217 intel_copy_image_sub_data(struct gl_context
*ctx
,
218 struct gl_texture_image
*src_image
,
219 int src_x
, int src_y
, int src_z
,
220 struct gl_texture_image
*dst_image
,
221 int dst_x
, int dst_y
, int dst_z
,
222 int src_width
, int src_height
)
224 struct brw_context
*brw
= brw_context(ctx
);
225 struct intel_texture_image
*intel_src_image
= intel_texture_image(src_image
);
226 struct intel_texture_image
*intel_dst_image
= intel_texture_image(dst_image
);
228 if (_mesa_meta_CopyImageSubData_uncompressed(ctx
,
229 src_image
, src_x
, src_y
, src_z
,
230 dst_image
, dst_x
, dst_y
, dst_z
,
231 src_width
, src_height
)) {
235 if (intel_src_image
->mt
->num_samples
> 0 ||
236 intel_dst_image
->mt
->num_samples
> 0) {
237 _mesa_problem(ctx
, "Failed to copy multisampled texture with meta path\n");
241 /* Cube maps actually have different images per face */
242 if (src_image
->TexObject
->Target
== GL_TEXTURE_CUBE_MAP
)
243 src_z
= src_image
->Face
;
244 if (dst_image
->TexObject
->Target
== GL_TEXTURE_CUBE_MAP
)
245 dst_z
= dst_image
->Face
;
247 /* We are now going to try and copy the texture using the blitter. If
248 * that fails, we will fall back mapping the texture and using memcpy.
249 * In either case, we need to do a full resolve.
251 intel_miptree_all_slices_resolve_hiz(brw
, intel_src_image
->mt
);
252 intel_miptree_all_slices_resolve_depth(brw
, intel_src_image
->mt
);
253 intel_miptree_resolve_color(brw
, intel_src_image
->mt
);
255 intel_miptree_all_slices_resolve_hiz(brw
, intel_dst_image
->mt
);
256 intel_miptree_all_slices_resolve_depth(brw
, intel_dst_image
->mt
);
257 intel_miptree_resolve_color(brw
, intel_dst_image
->mt
);
259 unsigned src_level
= src_image
->Level
+ src_image
->TexObject
->MinLevel
;
260 unsigned dst_level
= dst_image
->Level
+ dst_image
->TexObject
->MinLevel
;
261 if (copy_image_with_blitter(brw
, intel_src_image
->mt
, src_level
,
263 intel_dst_image
->mt
, dst_level
,
265 src_width
, src_height
))
268 /* This is a worst-case scenario software fallback that maps the two
269 * textures and does a memcpy between them.
271 copy_image_with_memcpy(brw
, intel_src_image
->mt
, src_level
,
273 intel_dst_image
->mt
, dst_level
,
275 src_width
, src_height
);
279 intelInitCopyImageFuncs(struct dd_function_table
*functions
)
281 functions
->CopyImageSubData
= intel_copy_image_sub_data
;