anv: Use an address for each anv_image plane
[mesa.git] / src / intel / vulkan / anv_image.c
1 /*
2 * Copyright © 2015 Intel Corporation
3 *
4 * Permission is hereby granted, free of charge, to any person obtaining a
5 * copy of this software and associated documentation files (the "Software"),
6 * to deal in the Software without restriction, including without limitation
7 * the rights to use, copy, modify, merge, publish, distribute, sublicense,
8 * and/or sell copies of the Software, and to permit persons to whom the
9 * Software is furnished to do so, subject to the following conditions:
10 *
11 * The above copyright notice and this permission notice (including the next
12 * paragraph) shall be included in all copies or substantial portions of the
13 * Software.
14 *
15 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
16 * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
17 * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL
18 * THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
19 * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING
20 * FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS
21 * IN THE SOFTWARE.
22 */
23
24 #include <assert.h>
25 #include <stdbool.h>
26 #include <string.h>
27 #include <unistd.h>
28 #include <fcntl.h>
29 #include <sys/mman.h>
30 #include <drm_fourcc.h>
31
32 #include "anv_private.h"
33 #include "util/debug.h"
34 #include "vk_util.h"
35
36 #include "vk_format_info.h"
37
38 static isl_surf_usage_flags_t
39 choose_isl_surf_usage(VkImageCreateFlags vk_create_flags,
40 VkImageUsageFlags vk_usage,
41 isl_surf_usage_flags_t isl_extra_usage,
42 VkImageAspectFlagBits aspect)
43 {
44 isl_surf_usage_flags_t isl_usage = isl_extra_usage;
45
46 if (vk_usage & VK_IMAGE_USAGE_SAMPLED_BIT)
47 isl_usage |= ISL_SURF_USAGE_TEXTURE_BIT;
48
49 if (vk_usage & VK_IMAGE_USAGE_INPUT_ATTACHMENT_BIT)
50 isl_usage |= ISL_SURF_USAGE_TEXTURE_BIT;
51
52 if (vk_usage & VK_IMAGE_USAGE_COLOR_ATTACHMENT_BIT)
53 isl_usage |= ISL_SURF_USAGE_RENDER_TARGET_BIT;
54
55 if (vk_create_flags & VK_IMAGE_CREATE_CUBE_COMPATIBLE_BIT)
56 isl_usage |= ISL_SURF_USAGE_CUBE_BIT;
57
58 /* Even if we're only using it for transfer operations, clears to depth and
59 * stencil images happen as depth and stencil so they need the right ISL
60 * usage bits or else things will fall apart.
61 */
62 switch (aspect) {
63 case VK_IMAGE_ASPECT_DEPTH_BIT:
64 isl_usage |= ISL_SURF_USAGE_DEPTH_BIT;
65 break;
66 case VK_IMAGE_ASPECT_STENCIL_BIT:
67 isl_usage |= ISL_SURF_USAGE_STENCIL_BIT;
68 break;
69 case VK_IMAGE_ASPECT_COLOR_BIT:
70 case VK_IMAGE_ASPECT_PLANE_0_BIT:
71 case VK_IMAGE_ASPECT_PLANE_1_BIT:
72 case VK_IMAGE_ASPECT_PLANE_2_BIT:
73 break;
74 default:
75 unreachable("bad VkImageAspect");
76 }
77
78 if (vk_usage & VK_IMAGE_USAGE_TRANSFER_SRC_BIT) {
79 /* blorp implements transfers by sampling from the source image. */
80 isl_usage |= ISL_SURF_USAGE_TEXTURE_BIT;
81 }
82
83 if (vk_usage & VK_IMAGE_USAGE_TRANSFER_DST_BIT &&
84 aspect == VK_IMAGE_ASPECT_COLOR_BIT) {
85 /* blorp implements transfers by rendering into the destination image.
86 * Only request this with color images, as we deal with depth/stencil
87 * formats differently. */
88 isl_usage |= ISL_SURF_USAGE_RENDER_TARGET_BIT;
89 }
90
91 return isl_usage;
92 }
93
94 static isl_tiling_flags_t
95 choose_isl_tiling_flags(const struct anv_image_create_info *anv_info,
96 const struct isl_drm_modifier_info *isl_mod_info,
97 bool legacy_scanout)
98 {
99 const VkImageCreateInfo *base_info = anv_info->vk_info;
100 isl_tiling_flags_t flags = 0;
101
102 switch (base_info->tiling) {
103 default:
104 unreachable("bad VkImageTiling");
105 case VK_IMAGE_TILING_OPTIMAL:
106 flags = ISL_TILING_ANY_MASK;
107 break;
108 case VK_IMAGE_TILING_LINEAR:
109 flags = ISL_TILING_LINEAR_BIT;
110 break;
111 }
112
113 if (anv_info->isl_tiling_flags)
114 flags &= anv_info->isl_tiling_flags;
115
116 if (legacy_scanout)
117 flags &= ISL_TILING_LINEAR_BIT | ISL_TILING_X_BIT;
118
119 if (isl_mod_info)
120 flags &= 1 << isl_mod_info->tiling;
121
122 assert(flags);
123
124 return flags;
125 }
126
127 static struct anv_surface *
128 get_surface(struct anv_image *image, VkImageAspectFlagBits aspect)
129 {
130 uint32_t plane = anv_image_aspect_to_plane(image->aspects, aspect);
131 return &image->planes[plane].surface;
132 }
133
134 static void
135 add_surface(struct anv_image *image, struct anv_surface *surf, uint32_t plane)
136 {
137 assert(surf->isl.size > 0); /* isl surface must be initialized */
138
139 if (image->disjoint) {
140 surf->offset = align_u32(image->planes[plane].size, surf->isl.alignment);
141 /* Plane offset is always 0 when it's disjoint. */
142 } else {
143 surf->offset = align_u32(image->size, surf->isl.alignment);
144 /* Determine plane's offset only once when the first surface is added. */
145 if (image->planes[plane].size == 0)
146 image->planes[plane].offset = image->size;
147 }
148
149 image->size = surf->offset + surf->isl.size;
150 image->planes[plane].size = (surf->offset + surf->isl.size) - image->planes[plane].offset;
151
152 image->alignment = MAX2(image->alignment, surf->isl.alignment);
153 image->planes[plane].alignment = MAX2(image->planes[plane].alignment,
154 surf->isl.alignment);
155 }
156
157
158 static bool
159 all_formats_ccs_e_compatible(const struct gen_device_info *devinfo,
160 const struct VkImageCreateInfo *vk_info)
161 {
162 enum isl_format format =
163 anv_get_isl_format(devinfo, vk_info->format,
164 VK_IMAGE_ASPECT_COLOR_BIT, vk_info->tiling);
165
166 if (!isl_format_supports_ccs_e(devinfo, format))
167 return false;
168
169 if (!(vk_info->flags & VK_IMAGE_CREATE_MUTABLE_FORMAT_BIT))
170 return true;
171
172 const VkImageFormatListCreateInfoKHR *fmt_list =
173 vk_find_struct_const(vk_info->pNext, IMAGE_FORMAT_LIST_CREATE_INFO_KHR);
174
175 if (!fmt_list || fmt_list->viewFormatCount == 0)
176 return false;
177
178 for (uint32_t i = 0; i < fmt_list->viewFormatCount; i++) {
179 enum isl_format view_format =
180 anv_get_isl_format(devinfo, fmt_list->pViewFormats[i],
181 VK_IMAGE_ASPECT_COLOR_BIT, vk_info->tiling);
182
183 if (!isl_formats_are_ccs_e_compatible(devinfo, format, view_format))
184 return false;
185 }
186
187 return true;
188 }
189
190 /**
191 * For color images that have an auxiliary surface, request allocation for an
192 * additional buffer that mainly stores fast-clear values. Use of this buffer
193 * allows us to access the image's subresources while being aware of their
194 * fast-clear values in non-trivial cases (e.g., outside of a render pass in
195 * which a fast clear has occurred).
196 *
197 * In order to avoid having multiple clear colors for a single plane of an
198 * image (hence a single RENDER_SURFACE_STATE), we only allow fast-clears on
199 * the first slice (level 0, layer 0). At the time of our testing (Jan 17,
200 * 2018), there were no known applications which would benefit from fast-
201 * clearing more than just the first slice.
202 *
203 * The fast clear portion of the image is laid out in the following order:
204 *
205 * * 1 or 4 dwords (depending on hardware generation) for the clear color
206 * * 1 dword for the anv_fast_clear_type of the clear color
207 * * On gen9+, 1 dword per level and layer of the image (3D levels count
208 * multiple layers) in level-major order for compression state.
209 *
210 * For the purpose of discoverability, the algorithm used to manage
211 * compression and fast-clears is described here:
212 *
213 * * On a transition from UNDEFINED or PREINITIALIZED to a defined layout,
214 * all of the values in the fast clear portion of the image are initialized
215 * to default values.
216 *
217 * * On fast-clear, the clear value is written into surface state and also
218 * into the buffer and the fast clear type is set appropriately. Both
219 * setting the fast-clear value in the buffer and setting the fast-clear
220 * type happen from the GPU using MI commands.
221 *
222 * * Whenever a render or blorp operation is performed with CCS_E, we call
223 * genX(cmd_buffer_mark_image_written) to set the compression state to
224 * true (which is represented by UINT32_MAX).
225 *
226 * * On pipeline barrier transitions, the worst-case transition is computed
227 * from the image layouts. The command streamer inspects the fast clear
228 * type and compression state dwords and constructs a predicate. The
229 * worst-case resolve is performed with the given predicate and the fast
230 * clear and compression state is set accordingly.
231 *
232 * See anv_layout_to_aux_usage and anv_layout_to_fast_clear_type functions for
233 * details on exactly what is allowed in what layouts.
234 *
235 * On gen7-9, we do not have a concept of indirect clear colors in hardware.
236 * In order to deal with this, we have to do some clear color management.
237 *
238 * * For LOAD_OP_LOAD at the top of a renderpass, we have to copy the clear
239 * value from the buffer into the surface state with MI commands.
240 *
241 * * For any blorp operations, we pass the address to the clear value into
242 * blorp and it knows to copy the clear color.
243 */
244 static void
245 add_aux_state_tracking_buffer(struct anv_image *image,
246 VkImageAspectFlagBits aspect,
247 uint32_t plane,
248 const struct anv_device *device)
249 {
250 assert(image && device);
251 assert(image->planes[plane].aux_surface.isl.size > 0 &&
252 image->aspects & VK_IMAGE_ASPECT_ANY_COLOR_BIT_ANV);
253
254 /* Compressed images must be tiled and therefore everything should be 4K
255 * aligned. The CCS has the same alignment requirements. This is good
256 * because we need at least dword-alignment for MI_LOAD/STORE operations.
257 */
258 assert(image->alignment % 4 == 0);
259 assert((image->planes[plane].offset + image->planes[plane].size) % 4 == 0);
260
261 /* This buffer should be at the very end of the plane. */
262 if (image->disjoint) {
263 assert(image->planes[plane].size ==
264 (image->planes[plane].offset + image->planes[plane].size));
265 } else {
266 assert(image->size ==
267 (image->planes[plane].offset + image->planes[plane].size));
268 }
269
270 const unsigned clear_color_state_size = device->info.gen >= 10 ?
271 device->isl_dev.ss.clear_color_state_size :
272 device->isl_dev.ss.clear_value_size;
273
274 /* Clear color and fast clear type */
275 unsigned state_size = clear_color_state_size + 4;
276
277 /* We only need to track compression on CCS_E surfaces. */
278 if (image->planes[plane].aux_usage == ISL_AUX_USAGE_CCS_E) {
279 if (image->type == VK_IMAGE_TYPE_3D) {
280 for (uint32_t l = 0; l < image->levels; l++)
281 state_size += anv_minify(image->extent.depth, l) * 4;
282 } else {
283 state_size += image->levels * image->array_size * 4;
284 }
285 }
286
287 image->planes[plane].fast_clear_state_offset =
288 image->planes[plane].offset + image->planes[plane].size;
289
290 image->planes[plane].size += state_size;
291 image->size += state_size;
292 }
293
294 /**
295 * Initialize the anv_image::*_surface selected by \a aspect. Then update the
296 * image's memory requirements (that is, the image's size and alignment).
297 */
298 static VkResult
299 make_surface(const struct anv_device *dev,
300 struct anv_image *image,
301 const struct anv_image_create_info *anv_info,
302 isl_tiling_flags_t tiling_flags,
303 VkImageAspectFlagBits aspect)
304 {
305 const VkImageCreateInfo *vk_info = anv_info->vk_info;
306 bool ok UNUSED;
307
308 static const enum isl_surf_dim vk_to_isl_surf_dim[] = {
309 [VK_IMAGE_TYPE_1D] = ISL_SURF_DIM_1D,
310 [VK_IMAGE_TYPE_2D] = ISL_SURF_DIM_2D,
311 [VK_IMAGE_TYPE_3D] = ISL_SURF_DIM_3D,
312 };
313
314 image->extent = anv_sanitize_image_extent(vk_info->imageType,
315 vk_info->extent);
316
317 const unsigned plane = anv_image_aspect_to_plane(image->aspects, aspect);
318 const struct anv_format_plane plane_format =
319 anv_get_format_plane(&dev->info, image->vk_format, aspect, image->tiling);
320 struct anv_surface *anv_surf = &image->planes[plane].surface;
321
322 const isl_surf_usage_flags_t usage =
323 choose_isl_surf_usage(vk_info->flags, image->usage,
324 anv_info->isl_extra_usage_flags, aspect);
325
326 /* If an image is created as BLOCK_TEXEL_VIEW_COMPATIBLE, then we need to
327 * fall back to linear on Broadwell and earlier because we aren't
328 * guaranteed that we can handle offsets correctly. On Sky Lake, the
329 * horizontal and vertical alignments are sufficiently high that we can
330 * just use RENDER_SURFACE_STATE::X/Y Offset.
331 */
332 bool needs_shadow = false;
333 if (dev->info.gen <= 8 &&
334 (vk_info->flags & VK_IMAGE_CREATE_BLOCK_TEXEL_VIEW_COMPATIBLE_BIT) &&
335 vk_info->tiling == VK_IMAGE_TILING_OPTIMAL) {
336 assert(isl_format_is_compressed(plane_format.isl_format));
337 tiling_flags = ISL_TILING_LINEAR_BIT;
338 needs_shadow = true;
339 }
340
341 ok = isl_surf_init(&dev->isl_dev, &anv_surf->isl,
342 .dim = vk_to_isl_surf_dim[vk_info->imageType],
343 .format = plane_format.isl_format,
344 .width = image->extent.width / plane_format.denominator_scales[0],
345 .height = image->extent.height / plane_format.denominator_scales[1],
346 .depth = image->extent.depth,
347 .levels = vk_info->mipLevels,
348 .array_len = vk_info->arrayLayers,
349 .samples = vk_info->samples,
350 .min_alignment = 0,
351 .row_pitch = anv_info->stride,
352 .usage = usage,
353 .tiling_flags = tiling_flags);
354
355 if (!ok)
356 return VK_ERROR_OUT_OF_DEVICE_MEMORY;
357
358 image->planes[plane].aux_usage = ISL_AUX_USAGE_NONE;
359
360 add_surface(image, anv_surf, plane);
361
362 /* If an image is created as BLOCK_TEXEL_VIEW_COMPATIBLE, then we need to
363 * create an identical tiled shadow surface for use while texturing so we
364 * don't get garbage performance.
365 */
366 if (needs_shadow) {
367 assert(aspect == VK_IMAGE_ASPECT_COLOR_BIT);
368 assert(tiling_flags == ISL_TILING_LINEAR_BIT);
369
370 ok = isl_surf_init(&dev->isl_dev, &image->planes[plane].shadow_surface.isl,
371 .dim = vk_to_isl_surf_dim[vk_info->imageType],
372 .format = plane_format.isl_format,
373 .width = image->extent.width,
374 .height = image->extent.height,
375 .depth = image->extent.depth,
376 .levels = vk_info->mipLevels,
377 .array_len = vk_info->arrayLayers,
378 .samples = vk_info->samples,
379 .min_alignment = 0,
380 .row_pitch = anv_info->stride,
381 .usage = usage,
382 .tiling_flags = ISL_TILING_ANY_MASK);
383
384 /* isl_surf_init() will fail only if provided invalid input. Invalid input
385 * is illegal in Vulkan.
386 */
387 assert(ok);
388
389 add_surface(image, &image->planes[plane].shadow_surface, plane);
390 }
391
392 /* Add a HiZ surface to a depth buffer that will be used for rendering.
393 */
394 if (aspect == VK_IMAGE_ASPECT_DEPTH_BIT) {
395 /* We don't advertise that depth buffers could be used as storage
396 * images.
397 */
398 assert(!(image->usage & VK_IMAGE_USAGE_STORAGE_BIT));
399
400 /* Allow the user to control HiZ enabling. Disable by default on gen7
401 * because resolves are not currently implemented pre-BDW.
402 */
403 if (!(image->usage & VK_IMAGE_USAGE_DEPTH_STENCIL_ATTACHMENT_BIT)) {
404 /* It will never be used as an attachment, HiZ is pointless. */
405 } else if (dev->info.gen == 7) {
406 anv_perf_warn(dev->instance, image, "Implement gen7 HiZ");
407 } else if (vk_info->mipLevels > 1) {
408 anv_perf_warn(dev->instance, image, "Enable multi-LOD HiZ");
409 } else if (vk_info->arrayLayers > 1) {
410 anv_perf_warn(dev->instance, image,
411 "Implement multi-arrayLayer HiZ clears and resolves");
412 } else if (dev->info.gen == 8 && vk_info->samples > 1) {
413 anv_perf_warn(dev->instance, image, "Enable gen8 multisampled HiZ");
414 } else if (!unlikely(INTEL_DEBUG & DEBUG_NO_HIZ)) {
415 assert(image->planes[plane].aux_surface.isl.size == 0);
416 ok = isl_surf_get_hiz_surf(&dev->isl_dev,
417 &image->planes[plane].surface.isl,
418 &image->planes[plane].aux_surface.isl);
419 assert(ok);
420 add_surface(image, &image->planes[plane].aux_surface, plane);
421 image->planes[plane].aux_usage = ISL_AUX_USAGE_HIZ;
422 }
423 } else if ((aspect & VK_IMAGE_ASPECT_ANY_COLOR_BIT_ANV) && vk_info->samples == 1) {
424 /* TODO: Disallow compression with :
425 *
426 * 1) non multiplanar images (We appear to hit a sampler bug with
427 * CCS & R16G16 format. Putting the clear state a page/4096bytes
428 * further fixes the issue).
429 *
430 * 2) alias images, because they might be aliases of images
431 * described in 1)
432 *
433 * 3) compression disabled by debug
434 */
435 const bool allow_compression =
436 image->n_planes == 1 &&
437 (vk_info->flags & VK_IMAGE_CREATE_ALIAS_BIT) == 0 &&
438 likely((INTEL_DEBUG & DEBUG_NO_RBC) == 0);
439
440 if (allow_compression) {
441 assert(image->planes[plane].aux_surface.isl.size == 0);
442 ok = isl_surf_get_ccs_surf(&dev->isl_dev,
443 &image->planes[plane].surface.isl,
444 &image->planes[plane].aux_surface.isl, 0);
445 if (ok) {
446
447 /* Disable CCS when it is not useful (i.e., when you can't render
448 * to the image with CCS enabled).
449 */
450 if (!isl_format_supports_rendering(&dev->info,
451 plane_format.isl_format)) {
452 /* While it may be technically possible to enable CCS for this
453 * image, we currently don't have things hooked up to get it
454 * working.
455 */
456 anv_perf_warn(dev->instance, image,
457 "This image format doesn't support rendering. "
458 "Not allocating an CCS buffer.");
459 image->planes[plane].aux_surface.isl.size = 0;
460 return VK_SUCCESS;
461 }
462
463 add_surface(image, &image->planes[plane].aux_surface, plane);
464 add_aux_state_tracking_buffer(image, aspect, plane, dev);
465
466 /* For images created without MUTABLE_FORMAT_BIT set, we know that
467 * they will always be used with the original format. In
468 * particular, they will always be used with a format that
469 * supports color compression. If it's never used as a storage
470 * image, then it will only be used through the sampler or the as
471 * a render target. This means that it's safe to just leave
472 * compression on at all times for these formats.
473 */
474 if (!(vk_info->usage & VK_IMAGE_USAGE_STORAGE_BIT) &&
475 all_formats_ccs_e_compatible(&dev->info, vk_info)) {
476 image->planes[plane].aux_usage = ISL_AUX_USAGE_CCS_E;
477 }
478 }
479 }
480 } else if ((aspect & VK_IMAGE_ASPECT_ANY_COLOR_BIT_ANV) && vk_info->samples > 1) {
481 assert(!(vk_info->usage & VK_IMAGE_USAGE_STORAGE_BIT));
482 assert(image->planes[plane].aux_surface.isl.size == 0);
483 ok = isl_surf_get_mcs_surf(&dev->isl_dev,
484 &image->planes[plane].surface.isl,
485 &image->planes[plane].aux_surface.isl);
486 if (ok) {
487 add_surface(image, &image->planes[plane].aux_surface, plane);
488 add_aux_state_tracking_buffer(image, aspect, plane, dev);
489 image->planes[plane].aux_usage = ISL_AUX_USAGE_MCS;
490 }
491 }
492
493 assert((image->planes[plane].offset + image->planes[plane].size) == image->size);
494
495 /* Upper bound of the last surface should be smaller than the plane's
496 * size.
497 */
498 assert((MAX2(image->planes[plane].surface.offset,
499 image->planes[plane].aux_surface.offset) +
500 (image->planes[plane].aux_surface.isl.size > 0 ?
501 image->planes[plane].aux_surface.isl.size :
502 image->planes[plane].surface.isl.size)) <=
503 (image->planes[plane].offset + image->planes[plane].size));
504
505 if (image->planes[plane].aux_surface.isl.size) {
506 /* assert(image->planes[plane].fast_clear_state_offset == */
507 /* (image->planes[plane].aux_surface.offset + image->planes[plane].aux_surface.isl.size)); */
508 assert(image->planes[plane].fast_clear_state_offset <
509 (image->planes[plane].offset + image->planes[plane].size));
510 }
511
512 return VK_SUCCESS;
513 }
514
515 static uint32_t
516 score_drm_format_mod(uint64_t modifier)
517 {
518 switch (modifier) {
519 case DRM_FORMAT_MOD_LINEAR: return 1;
520 case I915_FORMAT_MOD_X_TILED: return 2;
521 case I915_FORMAT_MOD_Y_TILED: return 3;
522 case I915_FORMAT_MOD_Y_TILED_CCS: return 4;
523 default: unreachable("bad DRM format modifier");
524 }
525 }
526
/**
 * Pick the highest-scoring modifier from \a modifiers.
 *
 * @return The ISL info of the best modifier, or NULL when no modifier scored
 *         above zero (e.g. the list is empty).
 */
static const struct isl_drm_modifier_info *
choose_drm_format_mod(const struct anv_physical_device *device,
                      uint32_t modifier_count, const uint64_t *modifiers)
{
   uint32_t top_score = 0;
   uint64_t top_mod = UINT64_MAX;

   for (uint32_t idx = 0; idx < modifier_count; ++idx) {
      const uint64_t candidate = modifiers[idx];
      const uint32_t candidate_score = score_drm_format_mod(candidate);

      /* Ties keep the earlier entry. */
      if (candidate_score <= top_score)
         continue;

      top_mod = candidate;
      top_score = candidate_score;
   }

   return top_score > 0 ? isl_drm_modifier_get_info(top_mod) : NULL;
}
547
548 VkResult
549 anv_image_create(VkDevice _device,
550 const struct anv_image_create_info *create_info,
551 const VkAllocationCallbacks* alloc,
552 VkImage *pImage)
553 {
554 ANV_FROM_HANDLE(anv_device, device, _device);
555 const VkImageCreateInfo *pCreateInfo = create_info->vk_info;
556 const struct isl_drm_modifier_info *isl_mod_info = NULL;
557 struct anv_image *image = NULL;
558 VkResult r;
559
560 assert(pCreateInfo->sType == VK_STRUCTURE_TYPE_IMAGE_CREATE_INFO);
561
562 const struct wsi_image_create_info *wsi_info =
563 vk_find_struct_const(pCreateInfo->pNext, WSI_IMAGE_CREATE_INFO_MESA);
564 if (wsi_info && wsi_info->modifier_count > 0) {
565 isl_mod_info = choose_drm_format_mod(&device->instance->physicalDevice,
566 wsi_info->modifier_count,
567 wsi_info->modifiers);
568 assert(isl_mod_info);
569 }
570
571 anv_assert(pCreateInfo->mipLevels > 0);
572 anv_assert(pCreateInfo->arrayLayers > 0);
573 anv_assert(pCreateInfo->samples > 0);
574 anv_assert(pCreateInfo->extent.width > 0);
575 anv_assert(pCreateInfo->extent.height > 0);
576 anv_assert(pCreateInfo->extent.depth > 0);
577
578 image = vk_zalloc2(&device->alloc, alloc, sizeof(*image), 8,
579 VK_SYSTEM_ALLOCATION_SCOPE_OBJECT);
580 if (!image)
581 return vk_error(VK_ERROR_OUT_OF_HOST_MEMORY);
582
583 image->type = pCreateInfo->imageType;
584 image->extent = pCreateInfo->extent;
585 image->vk_format = pCreateInfo->format;
586 image->format = anv_get_format(pCreateInfo->format);
587 image->aspects = vk_format_aspects(image->vk_format);
588 image->levels = pCreateInfo->mipLevels;
589 image->array_size = pCreateInfo->arrayLayers;
590 image->samples = pCreateInfo->samples;
591 image->usage = pCreateInfo->usage;
592 image->tiling = pCreateInfo->tiling;
593 image->disjoint = pCreateInfo->flags & VK_IMAGE_CREATE_DISJOINT_BIT;
594 image->needs_set_tiling = wsi_info && wsi_info->scanout;
595 image->drm_format_mod = isl_mod_info ? isl_mod_info->modifier :
596 DRM_FORMAT_MOD_INVALID;
597
598 const struct anv_format *format = anv_get_format(image->vk_format);
599 assert(format != NULL);
600
601 const isl_tiling_flags_t isl_tiling_flags =
602 choose_isl_tiling_flags(create_info, isl_mod_info,
603 image->needs_set_tiling);
604
605 image->n_planes = format->n_planes;
606
607 uint32_t b;
608 for_each_bit(b, image->aspects) {
609 r = make_surface(device, image, create_info, isl_tiling_flags,
610 (1 << b));
611 if (r != VK_SUCCESS)
612 goto fail;
613 }
614
615 *pImage = anv_image_to_handle(image);
616
617 return VK_SUCCESS;
618
619 fail:
620 if (image)
621 vk_free2(&device->alloc, alloc, image);
622
623 return r;
624 }
625
626 VkResult
627 anv_CreateImage(VkDevice device,
628 const VkImageCreateInfo *pCreateInfo,
629 const VkAllocationCallbacks *pAllocator,
630 VkImage *pImage)
631 {
632 #ifdef ANDROID
633 const VkNativeBufferANDROID *gralloc_info =
634 vk_find_struct_const(pCreateInfo->pNext, NATIVE_BUFFER_ANDROID);
635
636 if (gralloc_info)
637 return anv_image_from_gralloc(device, pCreateInfo, gralloc_info,
638 pAllocator, pImage);
639 #endif
640
641 return anv_image_create(device,
642 &(struct anv_image_create_info) {
643 .vk_info = pCreateInfo,
644 },
645 pAllocator,
646 pImage);
647 }
648
649 void
650 anv_DestroyImage(VkDevice _device, VkImage _image,
651 const VkAllocationCallbacks *pAllocator)
652 {
653 ANV_FROM_HANDLE(anv_device, device, _device);
654 ANV_FROM_HANDLE(anv_image, image, _image);
655
656 if (!image)
657 return;
658
659 for (uint32_t p = 0; p < image->n_planes; ++p) {
660 if (image->planes[p].bo_is_owned) {
661 assert(image->planes[p].address.bo != NULL);
662 anv_bo_cache_release(device, &device->bo_cache,
663 image->planes[p].address.bo);
664 }
665 }
666
667 vk_free2(&device->alloc, pAllocator, image);
668 }
669
670 static void anv_image_bind_memory_plane(struct anv_device *device,
671 struct anv_image *image,
672 uint32_t plane,
673 struct anv_device_memory *memory,
674 uint32_t memory_offset)
675 {
676 assert(!image->planes[plane].bo_is_owned);
677
678 if (!memory) {
679 image->planes[plane].address = ANV_NULL_ADDRESS;
680 return;
681 }
682
683 image->planes[plane].address = (struct anv_address) {
684 .bo = memory->bo,
685 .offset = memory_offset,
686 };
687 }
688
689 VkResult anv_BindImageMemory(
690 VkDevice _device,
691 VkImage _image,
692 VkDeviceMemory _memory,
693 VkDeviceSize memoryOffset)
694 {
695 ANV_FROM_HANDLE(anv_device, device, _device);
696 ANV_FROM_HANDLE(anv_device_memory, mem, _memory);
697 ANV_FROM_HANDLE(anv_image, image, _image);
698
699 uint32_t aspect_bit;
700 anv_foreach_image_aspect_bit(aspect_bit, image, image->aspects) {
701 uint32_t plane =
702 anv_image_aspect_to_plane(image->aspects, 1UL << aspect_bit);
703 anv_image_bind_memory_plane(device, image, plane, mem, memoryOffset);
704 }
705
706 return VK_SUCCESS;
707 }
708
709 VkResult anv_BindImageMemory2(
710 VkDevice _device,
711 uint32_t bindInfoCount,
712 const VkBindImageMemoryInfo* pBindInfos)
713 {
714 ANV_FROM_HANDLE(anv_device, device, _device);
715
716 for (uint32_t i = 0; i < bindInfoCount; i++) {
717 const VkBindImageMemoryInfo *bind_info = &pBindInfos[i];
718 ANV_FROM_HANDLE(anv_device_memory, mem, bind_info->memory);
719 ANV_FROM_HANDLE(anv_image, image, bind_info->image);
720 VkImageAspectFlags aspects = image->aspects;
721
722 vk_foreach_struct_const(s, bind_info->pNext) {
723 switch (s->sType) {
724 case VK_STRUCTURE_TYPE_BIND_IMAGE_PLANE_MEMORY_INFO: {
725 const VkBindImagePlaneMemoryInfo *plane_info =
726 (const VkBindImagePlaneMemoryInfo *) s;
727
728 aspects = plane_info->planeAspect;
729 break;
730 }
731 default:
732 anv_debug_ignored_stype(s->sType);
733 break;
734 }
735 }
736
737 uint32_t aspect_bit;
738 anv_foreach_image_aspect_bit(aspect_bit, image, aspects) {
739 uint32_t plane =
740 anv_image_aspect_to_plane(image->aspects, 1UL << aspect_bit);
741 anv_image_bind_memory_plane(device, image, plane,
742 mem, bind_info->memoryOffset);
743 }
744 }
745
746 return VK_SUCCESS;
747 }
748
749 void anv_GetImageSubresourceLayout(
750 VkDevice device,
751 VkImage _image,
752 const VkImageSubresource* subresource,
753 VkSubresourceLayout* layout)
754 {
755 ANV_FROM_HANDLE(anv_image, image, _image);
756
757 const struct anv_surface *surface;
758 if (subresource->aspectMask == VK_IMAGE_ASPECT_PLANE_1_BIT_KHR &&
759 image->drm_format_mod != DRM_FORMAT_MOD_INVALID &&
760 isl_drm_modifier_has_aux(image->drm_format_mod))
761 surface = &image->planes[0].aux_surface;
762 else
763 surface = get_surface(image, subresource->aspectMask);
764
765 assert(__builtin_popcount(subresource->aspectMask) == 1);
766
767 /* If we are on a non-zero mip level or array slice, we need to
768 * calculate a real offset.
769 */
770 anv_assert(subresource->mipLevel == 0);
771 anv_assert(subresource->arrayLayer == 0);
772
773 layout->offset = surface->offset;
774 layout->rowPitch = surface->isl.row_pitch;
775 layout->depthPitch = isl_surf_get_array_pitch(&surface->isl);
776 layout->arrayPitch = isl_surf_get_array_pitch(&surface->isl);
777 layout->size = surface->isl.size;
778 }
779
780 /**
781 * This function determines the optimal buffer to use for a given
782 * VkImageLayout and other pieces of information needed to make that
783 * determination. This does not determine the optimal buffer to use
784 * during a resolve operation.
785 *
786 * @param devinfo The device information of the Intel GPU.
787 * @param image The image that may contain a collection of buffers.
788 * @param aspect The aspect of the image to be accessed.
789 * @param layout The current layout of the image aspect(s).
790 *
791 * @return The primary buffer that should be used for the given layout.
792 */
793 enum isl_aux_usage
794 anv_layout_to_aux_usage(const struct gen_device_info * const devinfo,
795 const struct anv_image * const image,
796 const VkImageAspectFlagBits aspect,
797 const VkImageLayout layout)
798 {
799 /* Validate the inputs. */
800
801 /* The devinfo is needed as the optimal buffer varies across generations. */
802 assert(devinfo != NULL);
803
804 /* The layout of a NULL image is not properly defined. */
805 assert(image != NULL);
806
807 /* The aspect must be exactly one of the image aspects. */
808 assert(_mesa_bitcount(aspect) == 1 && (aspect & image->aspects));
809
810 /* Determine the optimal buffer. */
811
812 uint32_t plane = anv_image_aspect_to_plane(image->aspects, aspect);
813
814 /* If there is no auxiliary surface allocated, we must use the one and only
815 * main buffer.
816 */
817 if (image->planes[plane].aux_surface.isl.size == 0)
818 return ISL_AUX_USAGE_NONE;
819
820 /* All images that use an auxiliary surface are required to be tiled. */
821 assert(image->tiling == VK_IMAGE_TILING_OPTIMAL);
822
823 /* Stencil has no aux */
824 assert(aspect != VK_IMAGE_ASPECT_STENCIL_BIT);
825
826 switch (layout) {
827
828 /* Invalid Layouts */
829 case VK_IMAGE_LAYOUT_RANGE_SIZE:
830 case VK_IMAGE_LAYOUT_MAX_ENUM:
831 unreachable("Invalid image layout.");
832
833 /* Undefined layouts
834 *
835 * The pre-initialized layout is equivalent to the undefined layout for
836 * optimally-tiled images. We can only do color compression (CCS or HiZ)
837 * on tiled images.
838 */
839 case VK_IMAGE_LAYOUT_UNDEFINED:
840 case VK_IMAGE_LAYOUT_PREINITIALIZED:
841 return ISL_AUX_USAGE_NONE;
842
843
844 /* Transfer Layouts
845 */
846 case VK_IMAGE_LAYOUT_GENERAL:
847 case VK_IMAGE_LAYOUT_TRANSFER_DST_OPTIMAL:
848 case VK_IMAGE_LAYOUT_TRANSFER_SRC_OPTIMAL:
849 if (aspect == VK_IMAGE_ASPECT_DEPTH_BIT) {
850 /* This buffer could be a depth buffer used in a transfer operation.
851 * BLORP currently doesn't use HiZ for transfer operations so we must
852 * use the main buffer for this layout. TODO: Enable HiZ in BLORP.
853 */
854 assert(image->planes[plane].aux_usage == ISL_AUX_USAGE_HIZ);
855 return ISL_AUX_USAGE_NONE;
856 } else {
857 assert(image->aspects & VK_IMAGE_ASPECT_ANY_COLOR_BIT_ANV);
858 return image->planes[plane].aux_usage;
859 }
860
861
862 /* Sampling Layouts */
863 case VK_IMAGE_LAYOUT_DEPTH_STENCIL_READ_ONLY_OPTIMAL:
864 case VK_IMAGE_LAYOUT_DEPTH_READ_ONLY_STENCIL_ATTACHMENT_OPTIMAL:
865 assert((image->aspects & VK_IMAGE_ASPECT_ANY_COLOR_BIT_ANV) == 0);
866 /* Fall-through */
867 case VK_IMAGE_LAYOUT_SHADER_READ_ONLY_OPTIMAL:
868 if (aspect == VK_IMAGE_ASPECT_DEPTH_BIT) {
869 if (anv_can_sample_with_hiz(devinfo, image))
870 return ISL_AUX_USAGE_HIZ;
871 else
872 return ISL_AUX_USAGE_NONE;
873 } else {
874 return image->planes[plane].aux_usage;
875 }
876
877
878 case VK_IMAGE_LAYOUT_PRESENT_SRC_KHR: {
879 assert(image->aspects == VK_IMAGE_ASPECT_COLOR_BIT);
880
881 /* When handing the image off to the presentation engine, we need to
882 * ensure that things are properly resolved. For images with no
883 * modifier, we assume that they follow the old rules and always need
884 * a full resolve because the PE doesn't understand any form of
885 * compression. For images with modifiers, we use the aux usage from
886 * the modifier.
887 */
888 const struct isl_drm_modifier_info *mod_info =
889 isl_drm_modifier_get_info(image->drm_format_mod);
890 return mod_info ? mod_info->aux_usage : ISL_AUX_USAGE_NONE;
891 }
892
893
894 /* Rendering Layouts */
895 case VK_IMAGE_LAYOUT_COLOR_ATTACHMENT_OPTIMAL:
896 assert(aspect & VK_IMAGE_ASPECT_ANY_COLOR_BIT_ANV);
897 if (image->planes[plane].aux_usage == ISL_AUX_USAGE_NONE) {
898 assert(image->samples == 1);
899 return ISL_AUX_USAGE_CCS_D;
900 } else {
901 assert(image->planes[plane].aux_usage != ISL_AUX_USAGE_CCS_D);
902 return image->planes[plane].aux_usage;
903 }
904
905 case VK_IMAGE_LAYOUT_DEPTH_STENCIL_ATTACHMENT_OPTIMAL:
906 case VK_IMAGE_LAYOUT_DEPTH_ATTACHMENT_STENCIL_READ_ONLY_OPTIMAL:
907 assert(aspect == VK_IMAGE_ASPECT_DEPTH_BIT);
908 return ISL_AUX_USAGE_HIZ;
909
910 case VK_IMAGE_LAYOUT_SHARED_PRESENT_KHR:
911 unreachable("VK_KHR_shared_presentable_image is unsupported");
912 }
913
914 /* If the layout isn't recognized in the exhaustive switch above, the
915 * VkImageLayout value is not defined in vulkan.h.
916 */
917 unreachable("layout is not a VkImageLayout enumeration member.");
918 }
919
920 /**
921 * This function returns the level of unresolved fast-clear support of the
922 * given image in the given VkImageLayout.
923 *
924 * @param devinfo The device information of the Intel GPU.
925 * @param image The image that may contain a collection of buffers.
926 * @param aspect The aspect of the image to be accessed.
927 * @param layout The current layout of the image aspect(s).
928 */
929 enum anv_fast_clear_type
930 anv_layout_to_fast_clear_type(const struct gen_device_info * const devinfo,
931 const struct anv_image * const image,
932 const VkImageAspectFlagBits aspect,
933 const VkImageLayout layout)
934 {
935 /* The aspect must be exactly one of the image aspects. */
936 assert(_mesa_bitcount(aspect) == 1 && (aspect & image->aspects));
937
938 uint32_t plane = anv_image_aspect_to_plane(image->aspects, aspect);
939
940 /* If there is no auxiliary surface allocated, there are no fast-clears */
941 if (image->planes[plane].aux_surface.isl.size == 0)
942 return ANV_FAST_CLEAR_NONE;
943
944 /* All images that use an auxiliary surface are required to be tiled. */
945 assert(image->tiling == VK_IMAGE_TILING_OPTIMAL);
946
947 /* Stencil has no aux */
948 assert(aspect != VK_IMAGE_ASPECT_STENCIL_BIT);
949
950 if (aspect == VK_IMAGE_ASPECT_DEPTH_BIT) {
951 /* For depth images (with HiZ), the layout supports fast-clears if and
952 * only if it supports HiZ. However, we only support fast-clears to the
953 * default depth value.
954 */
955 enum isl_aux_usage aux_usage =
956 anv_layout_to_aux_usage(devinfo, image, aspect, layout);
957 return aux_usage == ISL_AUX_USAGE_HIZ ?
958 ANV_FAST_CLEAR_DEFAULT_VALUE : ANV_FAST_CLEAR_NONE;
959 }
960
961 assert(image->aspects & VK_IMAGE_ASPECT_ANY_COLOR_BIT_ANV);
962
963 /* We don't support MSAA fast-clears on Ivybridge or Bay Trail because they
964 * lack the MI ALU which we need to determine the predicates.
965 */
966 if (devinfo->gen == 7 && !devinfo->is_haswell && image->samples > 1)
967 return ANV_FAST_CLEAR_NONE;
968
969 switch (layout) {
970 case VK_IMAGE_LAYOUT_COLOR_ATTACHMENT_OPTIMAL:
971 return ANV_FAST_CLEAR_ANY;
972
973 case VK_IMAGE_LAYOUT_PRESENT_SRC_KHR: {
974 assert(image->aspects == VK_IMAGE_ASPECT_COLOR_BIT);
975 #ifndef NDEBUG
976 /* We do not yet support any modifiers which support clear color so we
977 * just always return NONE. One day, this will change.
978 */
979 const struct isl_drm_modifier_info *mod_info =
980 isl_drm_modifier_get_info(image->drm_format_mod);
981 assert(!mod_info || !mod_info->supports_clear_color);
982 #endif
983 return ANV_FAST_CLEAR_NONE;
984 }
985
986 default:
987 /* If the image has MCS or CCS_E enabled all the time then we can use
988 * fast-clear as long as the clear color is the default value of zero
989 * since this is the default value we program into every surface state
990 * used for texturing.
991 */
992 if (image->planes[plane].aux_usage == ISL_AUX_USAGE_MCS ||
993 image->planes[plane].aux_usage == ISL_AUX_USAGE_CCS_E)
994 return ANV_FAST_CLEAR_DEFAULT_VALUE;
995 else
996 return ANV_FAST_CLEAR_NONE;
997 }
998 }
999
1000
1001 static struct anv_state
1002 alloc_surface_state(struct anv_device *device)
1003 {
1004 return anv_state_pool_alloc(&device->surface_state_pool, 64, 64);
1005 }
1006
1007 static enum isl_channel_select
1008 remap_swizzle(VkComponentSwizzle swizzle, VkComponentSwizzle component,
1009 struct isl_swizzle format_swizzle)
1010 {
1011 if (swizzle == VK_COMPONENT_SWIZZLE_IDENTITY)
1012 swizzle = component;
1013
1014 switch (swizzle) {
1015 case VK_COMPONENT_SWIZZLE_ZERO: return ISL_CHANNEL_SELECT_ZERO;
1016 case VK_COMPONENT_SWIZZLE_ONE: return ISL_CHANNEL_SELECT_ONE;
1017 case VK_COMPONENT_SWIZZLE_R: return format_swizzle.r;
1018 case VK_COMPONENT_SWIZZLE_G: return format_swizzle.g;
1019 case VK_COMPONENT_SWIZZLE_B: return format_swizzle.b;
1020 case VK_COMPONENT_SWIZZLE_A: return format_swizzle.a;
1021 default:
1022 unreachable("Invalid swizzle");
1023 }
1024 }
1025
1026 void
1027 anv_image_fill_surface_state(struct anv_device *device,
1028 const struct anv_image *image,
1029 VkImageAspectFlagBits aspect,
1030 const struct isl_view *view_in,
1031 isl_surf_usage_flags_t view_usage,
1032 enum isl_aux_usage aux_usage,
1033 const union isl_color_value *clear_color,
1034 enum anv_image_view_state_flags flags,
1035 struct anv_surface_state *state_inout,
1036 struct brw_image_param *image_param_out)
1037 {
1038 uint32_t plane = anv_image_aspect_to_plane(image->aspects, aspect);
1039
1040 const struct anv_surface *surface = &image->planes[plane].surface,
1041 *aux_surface = &image->planes[plane].aux_surface;
1042
1043 struct isl_view view = *view_in;
1044 view.usage |= view_usage;
1045
1046 /* For texturing with VK_IMAGE_LAYOUT_SHADER_READ_ONLY_OPTIMAL from a
1047 * compressed surface with a shadow surface, we use the shadow instead of
1048 * the primary surface. The shadow surface will be tiled, unlike the main
1049 * surface, so it should get significantly better performance.
1050 */
1051 if (image->planes[plane].shadow_surface.isl.size > 0 &&
1052 isl_format_is_compressed(view.format) &&
1053 (flags & ANV_IMAGE_VIEW_STATE_TEXTURE_OPTIMAL)) {
1054 assert(isl_format_is_compressed(surface->isl.format));
1055 assert(surface->isl.tiling == ISL_TILING_LINEAR);
1056 assert(image->planes[plane].shadow_surface.isl.tiling != ISL_TILING_LINEAR);
1057 surface = &image->planes[plane].shadow_surface;
1058 }
1059
1060 if (view_usage == ISL_SURF_USAGE_RENDER_TARGET_BIT)
1061 view.swizzle = anv_swizzle_for_render(view.swizzle);
1062
1063 /* If this is a HiZ buffer we can sample from with a programmable clear
1064 * value (SKL+), define the clear value to the optimal constant.
1065 */
1066 union isl_color_value default_clear_color = { .u32 = { 0, } };
1067 if (device->info.gen >= 9 && aux_usage == ISL_AUX_USAGE_HIZ)
1068 default_clear_color.f32[0] = ANV_HZ_FC_VAL;
1069 if (!clear_color)
1070 clear_color = &default_clear_color;
1071
1072 const struct anv_address address =
1073 anv_address_add(image->planes[plane].address, surface->offset);
1074
1075 if (view_usage == ISL_SURF_USAGE_STORAGE_BIT &&
1076 !(flags & ANV_IMAGE_VIEW_STATE_STORAGE_WRITE_ONLY) &&
1077 !isl_has_matching_typed_storage_image_format(&device->info,
1078 view.format)) {
1079 /* In this case, we are a writeable storage buffer which needs to be
1080 * lowered to linear. All tiling and offset calculations will be done in
1081 * the shader.
1082 */
1083 assert(aux_usage == ISL_AUX_USAGE_NONE);
1084 isl_buffer_fill_state(&device->isl_dev, state_inout->state.map,
1085 .address = anv_address_physical(address),
1086 .size = surface->isl.size,
1087 .format = ISL_FORMAT_RAW,
1088 .stride = 1,
1089 .mocs = device->default_mocs);
1090 state_inout->address = address,
1091 state_inout->aux_address = ANV_NULL_ADDRESS;
1092 state_inout->clear_address = ANV_NULL_ADDRESS;
1093 } else {
1094 if (view_usage == ISL_SURF_USAGE_STORAGE_BIT &&
1095 !(flags & ANV_IMAGE_VIEW_STATE_STORAGE_WRITE_ONLY)) {
1096 /* Typed surface reads support a very limited subset of the shader
1097 * image formats. Translate it into the closest format the hardware
1098 * supports.
1099 */
1100 assert(aux_usage == ISL_AUX_USAGE_NONE);
1101 view.format = isl_lower_storage_image_format(&device->info,
1102 view.format);
1103 }
1104
1105 const struct isl_surf *isl_surf = &surface->isl;
1106
1107 struct isl_surf tmp_surf;
1108 uint32_t offset_B = 0, tile_x_sa = 0, tile_y_sa = 0;
1109 if (isl_format_is_compressed(surface->isl.format) &&
1110 !isl_format_is_compressed(view.format)) {
1111 /* We're creating an uncompressed view of a compressed surface. This
1112 * is allowed but only for a single level/layer.
1113 */
1114 assert(surface->isl.samples == 1);
1115 assert(view.levels == 1);
1116 assert(view.array_len == 1);
1117
1118 isl_surf_get_image_surf(&device->isl_dev, isl_surf,
1119 view.base_level,
1120 surface->isl.dim == ISL_SURF_DIM_3D ?
1121 0 : view.base_array_layer,
1122 surface->isl.dim == ISL_SURF_DIM_3D ?
1123 view.base_array_layer : 0,
1124 &tmp_surf,
1125 &offset_B, &tile_x_sa, &tile_y_sa);
1126
1127 /* The newly created image represents the one subimage we're
1128 * referencing with this view so it only has one array slice and
1129 * miplevel.
1130 */
1131 view.base_array_layer = 0;
1132 view.base_level = 0;
1133
1134 /* We're making an uncompressed view here. The image dimensions need
1135 * to be scaled down by the block size.
1136 */
1137 const struct isl_format_layout *fmtl =
1138 isl_format_get_layout(surface->isl.format);
1139 tmp_surf.format = view.format;
1140 tmp_surf.logical_level0_px.width =
1141 DIV_ROUND_UP(tmp_surf.logical_level0_px.width, fmtl->bw);
1142 tmp_surf.logical_level0_px.height =
1143 DIV_ROUND_UP(tmp_surf.logical_level0_px.height, fmtl->bh);
1144 tmp_surf.phys_level0_sa.width /= fmtl->bw;
1145 tmp_surf.phys_level0_sa.height /= fmtl->bh;
1146 tile_x_sa /= fmtl->bw;
1147 tile_y_sa /= fmtl->bh;
1148
1149 isl_surf = &tmp_surf;
1150
1151 if (device->info.gen <= 8) {
1152 assert(surface->isl.tiling == ISL_TILING_LINEAR);
1153 assert(tile_x_sa == 0);
1154 assert(tile_y_sa == 0);
1155 }
1156 }
1157
1158 state_inout->address = anv_address_add(address, offset_B);
1159
1160 struct anv_address aux_address = ANV_NULL_ADDRESS;
1161 if (aux_usage != ISL_AUX_USAGE_NONE) {
1162 aux_address = anv_address_add(image->planes[plane].address,
1163 aux_surface->offset);
1164 }
1165 state_inout->aux_address = aux_address;
1166
1167 struct anv_address clear_address = ANV_NULL_ADDRESS;
1168 if (device->info.gen >= 10 && aux_usage != ISL_AUX_USAGE_NONE) {
1169 if (aux_usage == ISL_AUX_USAGE_HIZ) {
1170 clear_address = (struct anv_address) {
1171 .bo = &device->hiz_clear_bo,
1172 .offset = 0,
1173 };
1174 } else {
1175 clear_address = anv_image_get_clear_color_addr(device, image, aspect);
1176 }
1177 }
1178 state_inout->clear_address = clear_address;
1179
1180 isl_surf_fill_state(&device->isl_dev, state_inout->state.map,
1181 .surf = isl_surf,
1182 .view = &view,
1183 .address = anv_address_physical(state_inout->address),
1184 .clear_color = *clear_color,
1185 .aux_surf = &aux_surface->isl,
1186 .aux_usage = aux_usage,
1187 .aux_address = anv_address_physical(aux_address),
1188 .clear_address = anv_address_physical(clear_address),
1189 .use_clear_address = !anv_address_is_null(clear_address),
1190 .mocs = device->default_mocs,
1191 .x_offset_sa = tile_x_sa,
1192 .y_offset_sa = tile_y_sa);
1193
1194 /* With the exception of gen8, the bottom 12 bits of the MCS base address
1195 * are used to store other information. This should be ok, however,
1196 * because the surface buffer addresses are always 4K page aligned.
1197 */
1198 uint32_t *aux_addr_dw = state_inout->state.map +
1199 device->isl_dev.ss.aux_addr_offset;
1200 assert((aux_address.offset & 0xfff) == 0);
1201 state_inout->aux_address.offset |= *aux_addr_dw & 0xfff;
1202
1203 if (device->info.gen >= 10 && clear_address.bo) {
1204 uint32_t *clear_addr_dw = state_inout->state.map +
1205 device->isl_dev.ss.clear_color_state_offset;
1206 assert((clear_address.offset & 0x3f) == 0);
1207 state_inout->clear_address.offset |= *clear_addr_dw & 0x3f;
1208 }
1209 }
1210
1211 anv_state_flush(device, state_inout->state);
1212
1213 if (image_param_out) {
1214 assert(view_usage == ISL_SURF_USAGE_STORAGE_BIT);
1215 isl_surf_fill_image_param(&device->isl_dev, image_param_out,
1216 &surface->isl, &view);
1217 }
1218 }
1219
1220 static VkImageAspectFlags
1221 remap_aspect_flags(VkImageAspectFlags view_aspects)
1222 {
1223 if (view_aspects & VK_IMAGE_ASPECT_ANY_COLOR_BIT_ANV) {
1224 if (_mesa_bitcount(view_aspects) == 1)
1225 return VK_IMAGE_ASPECT_COLOR_BIT;
1226
1227 VkImageAspectFlags color_aspects = 0;
1228 for (uint32_t i = 0; i < _mesa_bitcount(view_aspects); i++)
1229 color_aspects |= VK_IMAGE_ASPECT_PLANE_0_BIT << i;
1230 return color_aspects;
1231 }
1232 /* No special remapping needed for depth & stencil aspects. */
1233 return view_aspects;
1234 }
1235
1236 VkResult
1237 anv_CreateImageView(VkDevice _device,
1238 const VkImageViewCreateInfo *pCreateInfo,
1239 const VkAllocationCallbacks *pAllocator,
1240 VkImageView *pView)
1241 {
1242 ANV_FROM_HANDLE(anv_device, device, _device);
1243 ANV_FROM_HANDLE(anv_image, image, pCreateInfo->image);
1244 struct anv_image_view *iview;
1245
1246 iview = vk_zalloc2(&device->alloc, pAllocator, sizeof(*iview), 8,
1247 VK_SYSTEM_ALLOCATION_SCOPE_OBJECT);
1248 if (iview == NULL)
1249 return vk_error(VK_ERROR_OUT_OF_HOST_MEMORY);
1250
1251 const VkImageSubresourceRange *range = &pCreateInfo->subresourceRange;
1252
1253 assert(range->layerCount > 0);
1254 assert(range->baseMipLevel < image->levels);
1255
1256 const VkImageViewUsageCreateInfo *usage_info =
1257 vk_find_struct_const(pCreateInfo, IMAGE_VIEW_USAGE_CREATE_INFO);
1258 VkImageUsageFlags view_usage = usage_info ? usage_info->usage : image->usage;
1259 /* View usage should be a subset of image usage */
1260 assert((view_usage & ~image->usage) == 0);
1261 assert(view_usage & (VK_IMAGE_USAGE_SAMPLED_BIT |
1262 VK_IMAGE_USAGE_STORAGE_BIT |
1263 VK_IMAGE_USAGE_COLOR_ATTACHMENT_BIT |
1264 VK_IMAGE_USAGE_INPUT_ATTACHMENT_BIT |
1265 VK_IMAGE_USAGE_DEPTH_STENCIL_ATTACHMENT_BIT));
1266
1267 switch (image->type) {
1268 default:
1269 unreachable("bad VkImageType");
1270 case VK_IMAGE_TYPE_1D:
1271 case VK_IMAGE_TYPE_2D:
1272 assert(range->baseArrayLayer + anv_get_layerCount(image, range) - 1 <= image->array_size);
1273 break;
1274 case VK_IMAGE_TYPE_3D:
1275 assert(range->baseArrayLayer + anv_get_layerCount(image, range) - 1
1276 <= anv_minify(image->extent.depth, range->baseMipLevel));
1277 break;
1278 }
1279
1280 /* First expand aspects to the image's ones (for example
1281 * VK_IMAGE_ASPECT_COLOR_BIT will be converted to
1282 * VK_IMAGE_ASPECT_PLANE_0_BIT | VK_IMAGE_ASPECT_PLANE_1_BIT |
1283 * VK_IMAGE_ASPECT_PLANE_2_BIT for an image of format
1284 * VK_FORMAT_G8_B8_R8_3PLANE_420_UNORM_KHR.
1285 */
1286 VkImageAspectFlags expanded_aspects =
1287 anv_image_expand_aspects(image, range->aspectMask);
1288
1289 iview->image = image;
1290
1291 /* Remap the expanded aspects for the image view. For example if only
1292 * VK_IMAGE_ASPECT_PLANE_1_BIT was given in range->aspectMask, we will
1293 * convert it to VK_IMAGE_ASPECT_COLOR_BIT since from the point of view of
1294 * the image view, it only has a single plane.
1295 */
1296 iview->aspect_mask = remap_aspect_flags(expanded_aspects);
1297 iview->n_planes = anv_image_aspect_get_planes(iview->aspect_mask);
1298 iview->vk_format = pCreateInfo->format;
1299
1300 iview->extent = (VkExtent3D) {
1301 .width = anv_minify(image->extent.width , range->baseMipLevel),
1302 .height = anv_minify(image->extent.height, range->baseMipLevel),
1303 .depth = anv_minify(image->extent.depth , range->baseMipLevel),
1304 };
1305
1306 /* Now go through the underlying image selected planes (computed in
1307 * expanded_aspects) and map them to planes in the image view.
1308 */
1309 uint32_t iaspect_bit, vplane = 0;
1310 anv_foreach_image_aspect_bit(iaspect_bit, image, expanded_aspects) {
1311 uint32_t iplane =
1312 anv_image_aspect_to_plane(expanded_aspects, 1UL << iaspect_bit);
1313 VkImageAspectFlags vplane_aspect =
1314 anv_plane_to_aspect(iview->aspect_mask, vplane);
1315 struct anv_format_plane format =
1316 anv_get_format_plane(&device->info, pCreateInfo->format,
1317 vplane_aspect, image->tiling);
1318
1319 iview->planes[vplane].image_plane = iplane;
1320
1321 iview->planes[vplane].isl = (struct isl_view) {
1322 .format = format.isl_format,
1323 .base_level = range->baseMipLevel,
1324 .levels = anv_get_levelCount(image, range),
1325 .base_array_layer = range->baseArrayLayer,
1326 .array_len = anv_get_layerCount(image, range),
1327 .swizzle = {
1328 .r = remap_swizzle(pCreateInfo->components.r,
1329 VK_COMPONENT_SWIZZLE_R, format.swizzle),
1330 .g = remap_swizzle(pCreateInfo->components.g,
1331 VK_COMPONENT_SWIZZLE_G, format.swizzle),
1332 .b = remap_swizzle(pCreateInfo->components.b,
1333 VK_COMPONENT_SWIZZLE_B, format.swizzle),
1334 .a = remap_swizzle(pCreateInfo->components.a,
1335 VK_COMPONENT_SWIZZLE_A, format.swizzle),
1336 },
1337 };
1338
1339 if (pCreateInfo->viewType == VK_IMAGE_VIEW_TYPE_3D) {
1340 iview->planes[vplane].isl.base_array_layer = 0;
1341 iview->planes[vplane].isl.array_len = iview->extent.depth;
1342 }
1343
1344 if (pCreateInfo->viewType == VK_IMAGE_VIEW_TYPE_CUBE ||
1345 pCreateInfo->viewType == VK_IMAGE_VIEW_TYPE_CUBE_ARRAY) {
1346 iview->planes[vplane].isl.usage = ISL_SURF_USAGE_CUBE_BIT;
1347 } else {
1348 iview->planes[vplane].isl.usage = 0;
1349 }
1350
1351 if (view_usage & VK_IMAGE_USAGE_SAMPLED_BIT ||
1352 (view_usage & VK_IMAGE_USAGE_INPUT_ATTACHMENT_BIT &&
1353 !(iview->aspect_mask & VK_IMAGE_ASPECT_COLOR_BIT))) {
1354 iview->planes[vplane].optimal_sampler_surface_state.state = alloc_surface_state(device);
1355 iview->planes[vplane].general_sampler_surface_state.state = alloc_surface_state(device);
1356
1357 enum isl_aux_usage general_aux_usage =
1358 anv_layout_to_aux_usage(&device->info, image, 1UL << iaspect_bit,
1359 VK_IMAGE_LAYOUT_GENERAL);
1360 enum isl_aux_usage optimal_aux_usage =
1361 anv_layout_to_aux_usage(&device->info, image, 1UL << iaspect_bit,
1362 VK_IMAGE_LAYOUT_SHADER_READ_ONLY_OPTIMAL);
1363
1364 anv_image_fill_surface_state(device, image, 1ULL << iaspect_bit,
1365 &iview->planes[vplane].isl,
1366 ISL_SURF_USAGE_TEXTURE_BIT,
1367 optimal_aux_usage, NULL,
1368 ANV_IMAGE_VIEW_STATE_TEXTURE_OPTIMAL,
1369 &iview->planes[vplane].optimal_sampler_surface_state,
1370 NULL);
1371
1372 anv_image_fill_surface_state(device, image, 1ULL << iaspect_bit,
1373 &iview->planes[vplane].isl,
1374 ISL_SURF_USAGE_TEXTURE_BIT,
1375 general_aux_usage, NULL,
1376 0,
1377 &iview->planes[vplane].general_sampler_surface_state,
1378 NULL);
1379 }
1380
1381 /* NOTE: This one needs to go last since it may stomp isl_view.format */
1382 if (view_usage & VK_IMAGE_USAGE_STORAGE_BIT) {
1383 iview->planes[vplane].storage_surface_state.state = alloc_surface_state(device);
1384 iview->planes[vplane].writeonly_storage_surface_state.state = alloc_surface_state(device);
1385
1386 anv_image_fill_surface_state(device, image, 1ULL << iaspect_bit,
1387 &iview->planes[vplane].isl,
1388 ISL_SURF_USAGE_STORAGE_BIT,
1389 ISL_AUX_USAGE_NONE, NULL,
1390 0,
1391 &iview->planes[vplane].storage_surface_state,
1392 &iview->planes[vplane].storage_image_param);
1393
1394 anv_image_fill_surface_state(device, image, 1ULL << iaspect_bit,
1395 &iview->planes[vplane].isl,
1396 ISL_SURF_USAGE_STORAGE_BIT,
1397 ISL_AUX_USAGE_NONE, NULL,
1398 ANV_IMAGE_VIEW_STATE_STORAGE_WRITE_ONLY,
1399 &iview->planes[vplane].writeonly_storage_surface_state,
1400 NULL);
1401 }
1402
1403 vplane++;
1404 }
1405
1406 *pView = anv_image_view_to_handle(iview);
1407
1408 return VK_SUCCESS;
1409 }
1410
1411 void
1412 anv_DestroyImageView(VkDevice _device, VkImageView _iview,
1413 const VkAllocationCallbacks *pAllocator)
1414 {
1415 ANV_FROM_HANDLE(anv_device, device, _device);
1416 ANV_FROM_HANDLE(anv_image_view, iview, _iview);
1417
1418 if (!iview)
1419 return;
1420
1421 for (uint32_t plane = 0; plane < iview->n_planes; plane++) {
1422 if (iview->planes[plane].optimal_sampler_surface_state.state.alloc_size > 0) {
1423 anv_state_pool_free(&device->surface_state_pool,
1424 iview->planes[plane].optimal_sampler_surface_state.state);
1425 }
1426
1427 if (iview->planes[plane].general_sampler_surface_state.state.alloc_size > 0) {
1428 anv_state_pool_free(&device->surface_state_pool,
1429 iview->planes[plane].general_sampler_surface_state.state);
1430 }
1431
1432 if (iview->planes[plane].storage_surface_state.state.alloc_size > 0) {
1433 anv_state_pool_free(&device->surface_state_pool,
1434 iview->planes[plane].storage_surface_state.state);
1435 }
1436
1437 if (iview->planes[plane].writeonly_storage_surface_state.state.alloc_size > 0) {
1438 anv_state_pool_free(&device->surface_state_pool,
1439 iview->planes[plane].writeonly_storage_surface_state.state);
1440 }
1441 }
1442
1443 vk_free2(&device->alloc, pAllocator, iview);
1444 }
1445
1446
1447 VkResult
1448 anv_CreateBufferView(VkDevice _device,
1449 const VkBufferViewCreateInfo *pCreateInfo,
1450 const VkAllocationCallbacks *pAllocator,
1451 VkBufferView *pView)
1452 {
1453 ANV_FROM_HANDLE(anv_device, device, _device);
1454 ANV_FROM_HANDLE(anv_buffer, buffer, pCreateInfo->buffer);
1455 struct anv_buffer_view *view;
1456
1457 view = vk_alloc2(&device->alloc, pAllocator, sizeof(*view), 8,
1458 VK_SYSTEM_ALLOCATION_SCOPE_OBJECT);
1459 if (!view)
1460 return vk_error(VK_ERROR_OUT_OF_HOST_MEMORY);
1461
1462 /* TODO: Handle the format swizzle? */
1463
1464 view->format = anv_get_isl_format(&device->info, pCreateInfo->format,
1465 VK_IMAGE_ASPECT_COLOR_BIT,
1466 VK_IMAGE_TILING_LINEAR);
1467 const uint32_t format_bs = isl_format_get_layout(view->format)->bpb / 8;
1468 view->range = anv_buffer_get_range(buffer, pCreateInfo->offset,
1469 pCreateInfo->range);
1470 view->range = align_down_npot_u32(view->range, format_bs);
1471
1472 view->address = anv_address_add(buffer->address, pCreateInfo->offset);
1473
1474 if (buffer->usage & VK_BUFFER_USAGE_UNIFORM_TEXEL_BUFFER_BIT) {
1475 view->surface_state = alloc_surface_state(device);
1476
1477 anv_fill_buffer_surface_state(device, view->surface_state,
1478 view->format,
1479 view->address, view->range, format_bs);
1480 } else {
1481 view->surface_state = (struct anv_state){ 0 };
1482 }
1483
1484 if (buffer->usage & VK_BUFFER_USAGE_STORAGE_TEXEL_BUFFER_BIT) {
1485 view->storage_surface_state = alloc_surface_state(device);
1486 view->writeonly_storage_surface_state = alloc_surface_state(device);
1487
1488 enum isl_format storage_format =
1489 isl_has_matching_typed_storage_image_format(&device->info,
1490 view->format) ?
1491 isl_lower_storage_image_format(&device->info, view->format) :
1492 ISL_FORMAT_RAW;
1493
1494 anv_fill_buffer_surface_state(device, view->storage_surface_state,
1495 storage_format,
1496 view->address, view->range,
1497 (storage_format == ISL_FORMAT_RAW ? 1 :
1498 isl_format_get_layout(storage_format)->bpb / 8));
1499
1500 /* Write-only accesses should use the original format. */
1501 anv_fill_buffer_surface_state(device, view->writeonly_storage_surface_state,
1502 view->format,
1503 view->address, view->range,
1504 isl_format_get_layout(view->format)->bpb / 8);
1505
1506 isl_buffer_fill_image_param(&device->isl_dev,
1507 &view->storage_image_param,
1508 view->format, view->range);
1509 } else {
1510 view->storage_surface_state = (struct anv_state){ 0 };
1511 view->writeonly_storage_surface_state = (struct anv_state){ 0 };
1512 }
1513
1514 *pView = anv_buffer_view_to_handle(view);
1515
1516 return VK_SUCCESS;
1517 }
1518
1519 void
1520 anv_DestroyBufferView(VkDevice _device, VkBufferView bufferView,
1521 const VkAllocationCallbacks *pAllocator)
1522 {
1523 ANV_FROM_HANDLE(anv_device, device, _device);
1524 ANV_FROM_HANDLE(anv_buffer_view, view, bufferView);
1525
1526 if (!view)
1527 return;
1528
1529 if (view->surface_state.alloc_size > 0)
1530 anv_state_pool_free(&device->surface_state_pool,
1531 view->surface_state);
1532
1533 if (view->storage_surface_state.alloc_size > 0)
1534 anv_state_pool_free(&device->surface_state_pool,
1535 view->storage_surface_state);
1536
1537 if (view->writeonly_storage_surface_state.alloc_size > 0)
1538 anv_state_pool_free(&device->surface_state_pool,
1539 view->writeonly_storage_surface_state);
1540
1541 vk_free2(&device->alloc, pAllocator, view);
1542 }
1543
1544 const struct anv_surface *
1545 anv_image_get_surface_for_aspect_mask(const struct anv_image *image,
1546 VkImageAspectFlags aspect_mask)
1547 {
1548 VkImageAspectFlags sanitized_mask;
1549
1550 switch (aspect_mask) {
1551 case VK_IMAGE_ASPECT_COLOR_BIT:
1552 assert(image->aspects == VK_IMAGE_ASPECT_COLOR_BIT);
1553 sanitized_mask = VK_IMAGE_ASPECT_COLOR_BIT;
1554 break;
1555 case VK_IMAGE_ASPECT_DEPTH_BIT:
1556 assert(image->aspects & VK_IMAGE_ASPECT_DEPTH_BIT);
1557 sanitized_mask = VK_IMAGE_ASPECT_DEPTH_BIT;
1558 break;
1559 case VK_IMAGE_ASPECT_STENCIL_BIT:
1560 assert(image->aspects & VK_IMAGE_ASPECT_STENCIL_BIT);
1561 sanitized_mask = VK_IMAGE_ASPECT_STENCIL_BIT;
1562 break;
1563 case VK_IMAGE_ASPECT_DEPTH_BIT | VK_IMAGE_ASPECT_STENCIL_BIT:
1564 /* FINISHME: The Vulkan spec (git a511ba2) requires support for
1565 * combined depth stencil formats. Specifically, it states:
1566 *
1567 * At least one of ename:VK_FORMAT_D24_UNORM_S8_UINT or
1568 * ename:VK_FORMAT_D32_SFLOAT_S8_UINT must be supported.
1569 *
1570 * Image views with both depth and stencil aspects are only valid for
1571 * render target attachments, in which case
1572 * cmd_buffer_emit_depth_stencil() will pick out both the depth and
1573 * stencil surfaces from the underlying surface.
1574 */
1575 if (image->aspects & VK_IMAGE_ASPECT_DEPTH_BIT) {
1576 sanitized_mask = VK_IMAGE_ASPECT_DEPTH_BIT;
1577 } else {
1578 assert(image->aspects == VK_IMAGE_ASPECT_STENCIL_BIT);
1579 sanitized_mask = VK_IMAGE_ASPECT_STENCIL_BIT;
1580 }
1581 break;
1582 case VK_IMAGE_ASPECT_PLANE_0_BIT:
1583 assert((image->aspects & ~VK_IMAGE_ASPECT_ANY_COLOR_BIT_ANV) == 0);
1584 sanitized_mask = VK_IMAGE_ASPECT_PLANE_0_BIT;
1585 break;
1586 case VK_IMAGE_ASPECT_PLANE_1_BIT:
1587 assert((image->aspects & ~VK_IMAGE_ASPECT_ANY_COLOR_BIT_ANV) == 0);
1588 sanitized_mask = VK_IMAGE_ASPECT_PLANE_1_BIT;
1589 break;
1590 case VK_IMAGE_ASPECT_PLANE_2_BIT:
1591 assert((image->aspects & ~VK_IMAGE_ASPECT_ANY_COLOR_BIT_ANV) == 0);
1592 sanitized_mask = VK_IMAGE_ASPECT_PLANE_2_BIT;
1593 break;
1594 default:
1595 unreachable("image does not have aspect");
1596 return NULL;
1597 }
1598
1599 uint32_t plane = anv_image_aspect_to_plane(image->aspects, sanitized_mask);
1600 return &image->planes[plane].surface;
1601 }