iris: Initial import of resolve code
[mesa.git] / src / gallium / drivers / iris / iris_resource.c
1 /*
2 * Copyright © 2017 Intel Corporation
3 *
4 * Permission is hereby granted, free of charge, to any person obtaining a
5 * copy of this software and associated documentation files (the "Software"),
6 * to deal in the Software without restriction, including without limitation
7 * the rights to use, copy, modify, merge, publish, distribute, sublicense,
8 * and/or sell copies of the Software, and to permit persons to whom the
9 * Software is furnished to do so, subject to the following conditions:
10 *
11 * The above copyright notice and this permission notice shall be included
12 * in all copies or substantial portions of the Software.
13 *
14 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS
15 * OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
16 * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL
17 * THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
18 * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING
19 * FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER
20 * DEALINGS IN THE SOFTWARE.
21 */
22
23 /**
24 * @file iris_resource.c
25 *
26 * Resources are images, buffers, and other objects used by the GPU.
27 *
28 * XXX: explain resources
29 */
30
31 #include <stdio.h>
32 #include <errno.h>
33 #include "pipe/p_defines.h"
34 #include "pipe/p_state.h"
35 #include "pipe/p_context.h"
36 #include "pipe/p_screen.h"
37 #include "util/os_memory.h"
38 #include "util/u_cpu_detect.h"
39 #include "util/u_inlines.h"
40 #include "util/u_format.h"
41 #include "util/u_transfer.h"
42 #include "util/u_transfer_helper.h"
43 #include "util/u_upload_mgr.h"
44 #include "util/ralloc.h"
45 #include "iris_batch.h"
46 #include "iris_context.h"
47 #include "iris_resource.h"
48 #include "iris_screen.h"
49 #include "intel/common/gen_debug.h"
50 #include "isl/isl.h"
51 #include "drm-uapi/drm_fourcc.h"
52 #include "drm-uapi/i915_drm.h"
53
54 enum modifier_priority {
55 MODIFIER_PRIORITY_INVALID = 0,
56 MODIFIER_PRIORITY_LINEAR,
57 MODIFIER_PRIORITY_X,
58 MODIFIER_PRIORITY_Y,
59 MODIFIER_PRIORITY_Y_CCS,
60 };
61
62 static const uint64_t priority_to_modifier[] = {
63 [MODIFIER_PRIORITY_INVALID] = DRM_FORMAT_MOD_INVALID,
64 [MODIFIER_PRIORITY_LINEAR] = DRM_FORMAT_MOD_LINEAR,
65 [MODIFIER_PRIORITY_X] = I915_FORMAT_MOD_X_TILED,
66 [MODIFIER_PRIORITY_Y] = I915_FORMAT_MOD_Y_TILED,
67 [MODIFIER_PRIORITY_Y_CCS] = I915_FORMAT_MOD_Y_TILED_CCS,
68 };
69
70 static bool
71 modifier_is_supported(const struct gen_device_info *devinfo,
72 uint64_t modifier)
73 {
74 /* XXX: do something real */
75 switch (modifier) {
76 case I915_FORMAT_MOD_Y_TILED:
77 case I915_FORMAT_MOD_X_TILED:
78 case DRM_FORMAT_MOD_LINEAR:
79 return true;
80 case I915_FORMAT_MOD_Y_TILED_CCS:
81 case DRM_FORMAT_MOD_INVALID:
82 default:
83 return false;
84 }
85 }
86
87 static uint64_t
88 select_best_modifier(struct gen_device_info *devinfo,
89 const uint64_t *modifiers,
90 int count)
91 {
92 enum modifier_priority prio = MODIFIER_PRIORITY_INVALID;
93
94 for (int i = 0; i < count; i++) {
95 if (!modifier_is_supported(devinfo, modifiers[i]))
96 continue;
97
98 switch (modifiers[i]) {
99 case I915_FORMAT_MOD_Y_TILED_CCS:
100 prio = MAX2(prio, MODIFIER_PRIORITY_Y_CCS);
101 break;
102 case I915_FORMAT_MOD_Y_TILED:
103 prio = MAX2(prio, MODIFIER_PRIORITY_Y);
104 break;
105 case I915_FORMAT_MOD_X_TILED:
106 prio = MAX2(prio, MODIFIER_PRIORITY_X);
107 break;
108 case DRM_FORMAT_MOD_LINEAR:
109 prio = MAX2(prio, MODIFIER_PRIORITY_LINEAR);
110 break;
111 case DRM_FORMAT_MOD_INVALID:
112 default:
113 break;
114 }
115 }
116
117 return priority_to_modifier[prio];
118 }
119
120 static enum isl_surf_dim
121 target_to_isl_surf_dim(enum pipe_texture_target target)
122 {
123 switch (target) {
124 case PIPE_BUFFER:
125 case PIPE_TEXTURE_1D:
126 case PIPE_TEXTURE_1D_ARRAY:
127 return ISL_SURF_DIM_1D;
128 case PIPE_TEXTURE_2D:
129 case PIPE_TEXTURE_CUBE:
130 case PIPE_TEXTURE_RECT:
131 case PIPE_TEXTURE_2D_ARRAY:
132 case PIPE_TEXTURE_CUBE_ARRAY:
133 return ISL_SURF_DIM_2D;
134 case PIPE_TEXTURE_3D:
135 return ISL_SURF_DIM_3D;
136 case PIPE_MAX_TEXTURE_TYPES:
137 break;
138 }
139 unreachable("invalid texture type");
140 }
141
142 static isl_surf_usage_flags_t
143 pipe_bind_to_isl_usage(unsigned bindings)
144 {
145 isl_surf_usage_flags_t usage = 0;
146
147 if (bindings & PIPE_BIND_RENDER_TARGET)
148 usage |= ISL_SURF_USAGE_RENDER_TARGET_BIT;
149
150 if (bindings & PIPE_BIND_SAMPLER_VIEW)
151 usage |= ISL_SURF_USAGE_TEXTURE_BIT;
152
153 if (bindings & (PIPE_BIND_SHADER_IMAGE | PIPE_BIND_SHADER_BUFFER))
154 usage |= ISL_SURF_USAGE_STORAGE_BIT;
155
156 if (bindings & PIPE_BIND_DISPLAY_TARGET)
157 usage |= ISL_SURF_USAGE_DISPLAY_BIT;
158
159 return usage;
160 }
161
162 struct pipe_resource *
163 iris_resource_get_separate_stencil(struct pipe_resource *p_res)
164 {
165 /* For packed depth-stencil, we treat depth as the primary resource
166 * and store S8 as the "second plane" resource.
167 */
168 return p_res->next;
169 }
170
171 static void
172 iris_resource_set_separate_stencil(struct pipe_resource *p_res,
173 struct pipe_resource *stencil)
174 {
175 assert(util_format_has_depth(util_format_description(p_res->format)));
176 pipe_resource_reference(&p_res->next, stencil);
177 }
178
179 void
180 iris_get_depth_stencil_resources(struct pipe_resource *res,
181 struct iris_resource **out_z,
182 struct iris_resource **out_s)
183 {
184 if (!res) {
185 *out_z = NULL;
186 *out_s = NULL;
187 return;
188 }
189
190 if (res->format != PIPE_FORMAT_S8_UINT) {
191 *out_z = (void *) res;
192 *out_s = (void *) iris_resource_get_separate_stencil(res);
193 } else {
194 *out_z = NULL;
195 *out_s = (void *) res;
196 }
197 }
198
199 void
200 iris_resource_disable_aux(struct iris_resource *res)
201 {
202 iris_bo_unreference(res->aux.bo);
203 free(res->aux.state);
204
205 // XXX: clear color BO
206 // XXX: HiZ
207
208 res->aux.usage = ISL_AUX_USAGE_NONE;
209 res->aux.surf.size_B = 0;
210 res->aux.bo = NULL;
211 res->aux.state = NULL;
212 }
213
214 static void
215 iris_resource_destroy(struct pipe_screen *screen,
216 struct pipe_resource *resource)
217 {
218 struct iris_resource *res = (struct iris_resource *)resource;
219
220 iris_resource_disable_aux(res);
221
222 iris_bo_unreference(res->bo);
223 free(res);
224 }
225
226 static struct iris_resource *
227 iris_alloc_resource(struct pipe_screen *pscreen,
228 const struct pipe_resource *templ)
229 {
230 struct iris_resource *res = calloc(1, sizeof(struct iris_resource));
231 if (!res)
232 return NULL;
233
234 res->base = *templ;
235 res->base.screen = pscreen;
236 pipe_reference_init(&res->base.reference, 1);
237
238 res->aux.possible_usages = 1 << ISL_AUX_USAGE_NONE;
239
240 return res;
241 }
242
243 unsigned
244 iris_get_num_logical_layers(const struct iris_resource *res, unsigned level)
245 {
246 if (res->surf.dim == ISL_SURF_DIM_3D)
247 return minify(res->surf.logical_level0_px.depth, level);
248 else
249 return res->surf.logical_level0_px.array_len;
250 }
251
252 static enum isl_aux_state **
253 create_aux_state_map(struct iris_resource *res, enum isl_aux_state initial)
254 {
255 uint32_t total_slices = 0;
256 for (uint32_t level = 0; level < res->surf.levels; level++)
257 total_slices += iris_get_num_logical_layers(res, level);
258
259 const size_t per_level_array_size =
260 res->surf.levels * sizeof(enum isl_aux_state *);
261
262 /* We're going to allocate a single chunk of data for both the per-level
263 * reference array and the arrays of aux_state. This makes cleanup
264 * significantly easier.
265 */
266 const size_t total_size =
267 per_level_array_size + total_slices * sizeof(enum isl_aux_state);
268
269 void *data = malloc(total_size);
270 if (!data)
271 return NULL;
272
273 enum isl_aux_state **per_level_arr = data;
274 enum isl_aux_state *s = data + per_level_array_size;
275 for (uint32_t level = 0; level < res->surf.levels; level++) {
276 per_level_arr[level] = s;
277 const unsigned level_layers = iris_get_num_logical_layers(res, level);
278 for (uint32_t a = 0; a < level_layers; a++)
279 *(s++) = initial;
280 }
281 assert((void *)s == data + total_size);
282
283 return per_level_arr;
284 }
285
286 /**
287 * Allocate the initial aux surface for a resource based on aux.usage
288 */
289 static bool
290 iris_resource_alloc_aux(struct iris_screen *screen, struct iris_resource *res)
291 {
292 struct isl_device *isl_dev = &screen->isl_dev;
293 enum isl_aux_state initial_state;
294 UNUSED bool ok = false;
295 uint8_t memset_value = 0;
296 uint32_t alloc_flags = 0;
297
298 assert(!res->aux.bo);
299
300 switch (res->aux.usage) {
301 case ISL_AUX_USAGE_NONE:
302 res->aux.surf.size_B = 0;
303 break;
304 case ISL_AUX_USAGE_HIZ:
305 initial_state = ISL_AUX_STATE_AUX_INVALID;
306 memset_value = 0;
307 ok = isl_surf_get_hiz_surf(isl_dev, &res->surf, &res->aux.surf);
308 break;
309 case ISL_AUX_USAGE_MCS:
310 /* The Ivybridge PRM, Vol 2 Part 1 p326 says:
311 *
312 * "When MCS buffer is enabled and bound to MSRT, it is required
313 * that it is cleared prior to any rendering."
314 *
315 * Since we only use the MCS buffer for rendering, we just clear it
316 * immediately on allocation. The clear value for MCS buffers is all
317 * 1's, so we simply memset it to 0xff.
318 */
319 initial_state = ISL_AUX_STATE_CLEAR;
320 memset_value = 0xFF;
321 ok = isl_surf_get_mcs_surf(isl_dev, &res->surf, &res->aux.surf);
322 break;
323 case ISL_AUX_USAGE_CCS_D:
324 case ISL_AUX_USAGE_CCS_E:
325 /* When CCS_E is used, we need to ensure that the CCS starts off in
326 * a valid state. From the Sky Lake PRM, "MCS Buffer for Render
327 * Target(s)":
328 *
329 * "If Software wants to enable Color Compression without Fast
330 * clear, Software needs to initialize MCS with zeros."
331 *
332 * A CCS value of 0 indicates that the corresponding block is in the
333 * pass-through state which is what we want.
334 *
335 * For CCS_D, do the same thing. On Gen9+, this avoids having any
336 * undefined bits in the aux buffer.
337 */
338 initial_state = ISL_AUX_STATE_PASS_THROUGH;
339 alloc_flags |= BO_ALLOC_ZEROED;
340 ok = isl_surf_get_ccs_surf(isl_dev, &res->surf, &res->aux.surf, 0);
341 break;
342 }
343
344 /* No work is needed for a zero-sized auxiliary buffer. */
345 if (res->aux.surf.size_B == 0)
346 return true;
347
348 /* Assert that ISL gave us a valid aux surf */
349 assert(ok);
350
351 /* Create the aux_state for the auxiliary buffer. */
352 res->aux.state = create_aux_state_map(res, initial_state);
353 if (!res->aux.state)
354 return false;
355
356 /* Allocate the auxiliary buffer. ISL has stricter set of alignment rules
357 * the drm allocator. Therefore, one can pass the ISL dimensions in terms
358 * of bytes instead of trying to recalculate based on different format
359 * block sizes.
360 */
361 res->aux.bo = iris_bo_alloc_tiled(screen->bufmgr, "aux buffer",
362 res->aux.surf.size_B,
363 IRIS_MEMZONE_OTHER, I915_TILING_Y,
364 res->aux.surf.row_pitch_B, alloc_flags);
365 if (!res->aux.bo)
366 return false;
367
368 /* Optionally, initialize the auxiliary data to the desired value. */
369 if (memset_value != 0) {
370 void *map = iris_bo_map(NULL, res->aux.bo, MAP_WRITE | MAP_RAW);
371 if (!map)
372 return false;
373
374 memset(map, memset_value, res->aux.surf.size_B);
375 iris_bo_unmap(res->aux.bo);
376 }
377
378 // XXX: HIZ enabling
379
380 return true;
381 }
382
383 static bool
384 supports_mcs(const struct isl_surf *surf)
385 {
386 /* MCS compression only applies to multisampled resources. */
387 if (surf->samples <= 1)
388 return false;
389
390 /* See isl_surf_get_mcs_surf for details. */
391 if (surf->samples == 16 && surf->logical_level0_px.width > 8192)
392 return false;
393
394 /* Depth and stencil buffers use the IMS (interleaved) layout. */
395 if (isl_surf_usage_is_depth_or_stencil(surf->usage))
396 return false;
397
398 return true;
399 }
400
401 static bool
402 supports_ccs(const struct gen_device_info *devinfo,
403 const struct isl_surf *surf)
404 {
405 /* Gen9+ only supports CCS for Y-tiled buffers. */
406 if (surf->tiling != ISL_TILING_Y0)
407 return false;
408
409 /* CCS only supports singlesampled resources. */
410 if (surf->samples > 1)
411 return false;
412
413 /* The PRM doesn't say this explicitly, but fast-clears don't appear to
414 * work for 3D textures until Gen9 where the layout of 3D textures changes
415 * to match 2D array textures.
416 */
417 if (devinfo->gen < 9 && surf->dim != ISL_SURF_DIM_2D)
418 return false;
419
420 /* Note: still need to check the format! */
421
422 return true;
423 }
424
425 static struct pipe_resource *
426 iris_resource_create_for_buffer(struct pipe_screen *pscreen,
427 const struct pipe_resource *templ)
428 {
429 struct iris_screen *screen = (struct iris_screen *)pscreen;
430 struct iris_resource *res = iris_alloc_resource(pscreen, templ);
431
432 assert(templ->target == PIPE_BUFFER);
433 assert(templ->height0 <= 1);
434 assert(templ->depth0 <= 1);
435 assert(templ->format == PIPE_FORMAT_NONE ||
436 util_format_get_blocksize(templ->format) == 1);
437
438 res->internal_format = templ->format;
439 res->surf.tiling = ISL_TILING_LINEAR;
440
441 enum iris_memory_zone memzone = IRIS_MEMZONE_OTHER;
442 const char *name = templ->target == PIPE_BUFFER ? "buffer" : "miptree";
443 if (templ->flags & IRIS_RESOURCE_FLAG_SHADER_MEMZONE) {
444 memzone = IRIS_MEMZONE_SHADER;
445 name = "shader kernels";
446 } else if (templ->flags & IRIS_RESOURCE_FLAG_SURFACE_MEMZONE) {
447 memzone = IRIS_MEMZONE_SURFACE;
448 name = "surface state";
449 } else if (templ->flags & IRIS_RESOURCE_FLAG_DYNAMIC_MEMZONE) {
450 memzone = IRIS_MEMZONE_DYNAMIC;
451 name = "dynamic state";
452 }
453
454 res->bo = iris_bo_alloc(screen->bufmgr, name, templ->width0, memzone);
455 if (!res->bo) {
456 iris_resource_destroy(pscreen, &res->base);
457 return NULL;
458 }
459
460 return &res->base;
461 }
462
463 static struct pipe_resource *
464 iris_resource_create_with_modifiers(struct pipe_screen *pscreen,
465 const struct pipe_resource *templ,
466 const uint64_t *modifiers,
467 int modifiers_count)
468 {
469 struct iris_screen *screen = (struct iris_screen *)pscreen;
470 struct gen_device_info *devinfo = &screen->devinfo;
471 struct iris_resource *res = iris_alloc_resource(pscreen, templ);
472
473 if (!res)
474 return NULL;
475
476 const struct util_format_description *format_desc =
477 util_format_description(templ->format);
478 const bool has_depth = util_format_has_depth(format_desc);
479 const struct isl_drm_modifier_info *mod_info = NULL;
480 uint64_t modifier =
481 select_best_modifier(devinfo, modifiers, modifiers_count);
482
483 isl_tiling_flags_t tiling_flags = ISL_TILING_ANY_MASK;
484
485 if (modifier != DRM_FORMAT_MOD_INVALID) {
486 mod_info = isl_drm_modifier_get_info(modifier);
487
488 tiling_flags = 1 << mod_info->tiling;
489 } else {
490 if (modifiers_count > 0) {
491 fprintf(stderr, "Unsupported modifier, resource creation failed.\n");
492 return NULL;
493 }
494
495 /* No modifiers - we can select our own tiling. */
496
497 if (has_depth) {
498 /* Depth must be Y-tiled */
499 tiling_flags = ISL_TILING_Y0_BIT;
500 } else if (templ->format == PIPE_FORMAT_S8_UINT) {
501 /* Stencil must be W-tiled */
502 tiling_flags = ISL_TILING_W_BIT;
503 } else if (templ->target == PIPE_BUFFER ||
504 templ->target == PIPE_TEXTURE_1D ||
505 templ->target == PIPE_TEXTURE_1D_ARRAY) {
506 /* Use linear for buffers and 1D textures */
507 tiling_flags = ISL_TILING_LINEAR_BIT;
508 }
509
510 /* Use linear for staging buffers */
511 if (templ->usage == PIPE_USAGE_STAGING ||
512 templ->bind & (PIPE_BIND_LINEAR | PIPE_BIND_CURSOR) )
513 tiling_flags = ISL_TILING_LINEAR_BIT;
514 }
515
516 isl_surf_usage_flags_t usage = pipe_bind_to_isl_usage(templ->bind);
517
518 if (templ->target == PIPE_TEXTURE_CUBE ||
519 templ->target == PIPE_TEXTURE_CUBE_ARRAY)
520 usage |= ISL_SURF_USAGE_CUBE_BIT;
521
522 if (templ->usage != PIPE_USAGE_STAGING) {
523 if (templ->format == PIPE_FORMAT_S8_UINT)
524 usage |= ISL_SURF_USAGE_STENCIL_BIT;
525 else if (has_depth)
526 usage |= ISL_SURF_USAGE_DEPTH_BIT;
527 }
528
529 enum pipe_format pfmt = templ->format;
530 res->internal_format = pfmt;
531
532 /* Should be handled by u_transfer_helper */
533 assert(!util_format_is_depth_and_stencil(pfmt));
534
535 struct iris_format_info fmt = iris_format_for_usage(devinfo, pfmt, usage);
536 assert(fmt.fmt != ISL_FORMAT_UNSUPPORTED);
537
538 UNUSED const bool isl_surf_created_successfully =
539 isl_surf_init(&screen->isl_dev, &res->surf,
540 .dim = target_to_isl_surf_dim(templ->target),
541 .format = fmt.fmt,
542 .width = templ->width0,
543 .height = templ->height0,
544 .depth = templ->depth0,
545 .levels = templ->last_level + 1,
546 .array_len = templ->array_size,
547 .samples = MAX2(templ->nr_samples, 1),
548 .min_alignment_B = 0,
549 .row_pitch_B = 0,
550 .usage = usage,
551 .tiling_flags = tiling_flags);
552 assert(isl_surf_created_successfully);
553
554 if (mod_info) {
555 res->aux.possible_usages |= 1 << mod_info->aux_usage;
556 } else if (has_depth) {
557 res->aux.possible_usages |= 1 << ISL_AUX_USAGE_HIZ;
558 } else if (supports_mcs(&res->surf)) {
559 res->aux.possible_usages |= 1 << ISL_AUX_USAGE_MCS;
560 } else if (supports_ccs(devinfo, &res->surf)) {
561 if (isl_format_supports_ccs_e(devinfo, res->surf.format))
562 res->aux.possible_usages |= 1 << ISL_AUX_USAGE_CCS_E;
563 else if (isl_format_supports_ccs_d(devinfo, res->surf.format))
564 res->aux.possible_usages |= 1 << ISL_AUX_USAGE_CCS_D;
565 }
566
567 // XXX: we don't actually do aux yet
568 res->aux.possible_usages = 1 << ISL_AUX_USAGE_NONE;
569
570 res->aux.usage = util_last_bit(res->aux.possible_usages) - 1;
571
572 const char *name = "miptree";
573 enum iris_memory_zone memzone = IRIS_MEMZONE_OTHER;
574
575 /* These are for u_upload_mgr buffers only */
576 assert(!(templ->flags & (IRIS_RESOURCE_FLAG_SHADER_MEMZONE |
577 IRIS_RESOURCE_FLAG_SURFACE_MEMZONE |
578 IRIS_RESOURCE_FLAG_DYNAMIC_MEMZONE)));
579
580 res->bo = iris_bo_alloc_tiled(screen->bufmgr, name, res->surf.size_B,
581 memzone,
582 isl_tiling_to_i915_tiling(res->surf.tiling),
583 res->surf.row_pitch_B, 0);
584
585 if (!res->bo)
586 goto fail;
587
588 if (!iris_resource_alloc_aux(screen, res))
589 goto fail;
590
591 return &res->base;
592
593 fail:
594 fprintf(stderr, "XXX: resource creation failed\n");
595 iris_resource_destroy(pscreen, &res->base);
596 return NULL;
597
598 }
599
600 static struct pipe_resource *
601 iris_resource_create(struct pipe_screen *pscreen,
602 const struct pipe_resource *templ)
603 {
604 if (templ->target == PIPE_BUFFER)
605 return iris_resource_create_for_buffer(pscreen, templ);
606 else
607 return iris_resource_create_with_modifiers(pscreen, templ, NULL, 0);
608 }
609
610 static uint64_t
611 tiling_to_modifier(uint32_t tiling)
612 {
613 static const uint64_t map[] = {
614 [I915_TILING_NONE] = DRM_FORMAT_MOD_LINEAR,
615 [I915_TILING_X] = I915_FORMAT_MOD_X_TILED,
616 [I915_TILING_Y] = I915_FORMAT_MOD_Y_TILED,
617 };
618
619 assert(tiling < ARRAY_SIZE(map));
620
621 return map[tiling];
622 }
623
624 static struct pipe_resource *
625 iris_resource_from_user_memory(struct pipe_screen *pscreen,
626 const struct pipe_resource *templ,
627 void *user_memory)
628 {
629 struct iris_screen *screen = (struct iris_screen *)pscreen;
630 struct iris_bufmgr *bufmgr = screen->bufmgr;
631 struct iris_resource *res = iris_alloc_resource(pscreen, templ);
632 if (!res)
633 return NULL;
634
635 assert(templ->target == PIPE_BUFFER);
636
637 res->internal_format = templ->format;
638 res->bo = iris_bo_create_userptr(bufmgr, "user",
639 user_memory, templ->width0,
640 IRIS_MEMZONE_OTHER);
641 if (!res->bo) {
642 free(res);
643 return NULL;
644 }
645
646 return &res->base;
647 }
648
649 static struct pipe_resource *
650 iris_resource_from_handle(struct pipe_screen *pscreen,
651 const struct pipe_resource *templ,
652 struct winsys_handle *whandle,
653 unsigned usage)
654 {
655 struct iris_screen *screen = (struct iris_screen *)pscreen;
656 struct gen_device_info *devinfo = &screen->devinfo;
657 struct iris_bufmgr *bufmgr = screen->bufmgr;
658 struct iris_resource *res = iris_alloc_resource(pscreen, templ);
659 if (!res)
660 return NULL;
661
662 if (whandle->offset != 0) {
663 dbg_printf("Attempt to import unsupported winsys offset %u\n",
664 whandle->offset);
665 goto fail;
666 }
667
668 switch (whandle->type) {
669 case WINSYS_HANDLE_TYPE_FD:
670 res->bo = iris_bo_import_dmabuf(bufmgr, whandle->handle);
671 break;
672 case WINSYS_HANDLE_TYPE_SHARED:
673 res->bo = iris_bo_gem_create_from_name(bufmgr, "winsys image",
674 whandle->handle);
675 break;
676 default:
677 unreachable("invalid winsys handle type");
678 }
679 if (!res->bo)
680 return NULL;
681
682 uint64_t modifier = whandle->modifier;
683 if (modifier == DRM_FORMAT_MOD_INVALID) {
684 modifier = tiling_to_modifier(res->bo->tiling_mode);
685 }
686 const struct isl_drm_modifier_info *mod_info =
687 isl_drm_modifier_get_info(modifier);
688 assert(mod_info);
689
690 isl_surf_usage_flags_t isl_usage = pipe_bind_to_isl_usage(templ->bind);
691
692 const struct iris_format_info fmt =
693 iris_format_for_usage(devinfo, templ->format, isl_usage);
694 res->internal_format = templ->format;
695
696 if (templ->target == PIPE_BUFFER) {
697 res->surf.tiling = ISL_TILING_LINEAR;
698 } else {
699 isl_surf_init(&screen->isl_dev, &res->surf,
700 .dim = target_to_isl_surf_dim(templ->target),
701 .format = fmt.fmt,
702 .width = templ->width0,
703 .height = templ->height0,
704 .depth = templ->depth0,
705 .levels = templ->last_level + 1,
706 .array_len = templ->array_size,
707 .samples = MAX2(templ->nr_samples, 1),
708 .min_alignment_B = 0,
709 .row_pitch_B = whandle->stride,
710 .usage = isl_usage,
711 .tiling_flags = 1 << mod_info->tiling);
712
713 assert(res->bo->tiling_mode ==
714 isl_tiling_to_i915_tiling(res->surf.tiling));
715
716 // XXX: create_ccs_buf_for_image?
717 if (!iris_resource_alloc_aux(screen, res))
718 goto fail;
719 }
720
721 return &res->base;
722
723 fail:
724 iris_resource_destroy(pscreen, &res->base);
725 return NULL;
726 }
727
728 static boolean
729 iris_resource_get_handle(struct pipe_screen *pscreen,
730 struct pipe_context *ctx,
731 struct pipe_resource *resource,
732 struct winsys_handle *whandle,
733 unsigned usage)
734 {
735 struct iris_resource *res = (struct iris_resource *)resource;
736
737 /* If this is a buffer, stride should be 0 - no need to special case */
738 whandle->stride = res->surf.row_pitch_B;
739 whandle->modifier = tiling_to_modifier(res->bo->tiling_mode);
740
741 switch (whandle->type) {
742 case WINSYS_HANDLE_TYPE_SHARED:
743 return iris_bo_flink(res->bo, &whandle->handle) == 0;
744 case WINSYS_HANDLE_TYPE_KMS:
745 whandle->handle = iris_bo_export_gem_handle(res->bo);
746 return true;
747 case WINSYS_HANDLE_TYPE_FD:
748 return iris_bo_export_dmabuf(res->bo, (int *) &whandle->handle) == 0;
749 }
750
751 return false;
752 }
753
754 static void
755 get_image_offset_el(struct isl_surf *surf, unsigned level, unsigned z,
756 unsigned *out_x0_el, unsigned *out_y0_el)
757 {
758 if (surf->dim == ISL_SURF_DIM_3D) {
759 isl_surf_get_image_offset_el(surf, level, 0, z, out_x0_el, out_y0_el);
760 } else {
761 isl_surf_get_image_offset_el(surf, level, z, 0, out_x0_el, out_y0_el);
762 }
763 }
764
765 /**
766 * Get pointer offset into stencil buffer.
767 *
768 * The stencil buffer is W tiled. Since the GTT is incapable of W fencing, we
769 * must decode the tile's layout in software.
770 *
771 * See
772 * - PRM, 2011 Sandy Bridge, Volume 1, Part 2, Section 4.5.2.1 W-Major Tile
773 * Format.
774 * - PRM, 2011 Sandy Bridge, Volume 1, Part 2, Section 4.5.3 Tiling Algorithm
775 *
776 * Even though the returned offset is always positive, the return type is
777 * signed due to
778 * commit e8b1c6d6f55f5be3bef25084fdd8b6127517e137
779 * mesa: Fix return type of _mesa_get_format_bytes() (#37351)
780 */
781 static intptr_t
782 s8_offset(uint32_t stride, uint32_t x, uint32_t y, bool swizzled)
783 {
784 uint32_t tile_size = 4096;
785 uint32_t tile_width = 64;
786 uint32_t tile_height = 64;
787 uint32_t row_size = 64 * stride / 2; /* Two rows are interleaved. */
788
789 uint32_t tile_x = x / tile_width;
790 uint32_t tile_y = y / tile_height;
791
792 /* The byte's address relative to the tile's base addres. */
793 uint32_t byte_x = x % tile_width;
794 uint32_t byte_y = y % tile_height;
795
796 uintptr_t u = tile_y * row_size
797 + tile_x * tile_size
798 + 512 * (byte_x / 8)
799 + 64 * (byte_y / 8)
800 + 32 * ((byte_y / 4) % 2)
801 + 16 * ((byte_x / 4) % 2)
802 + 8 * ((byte_y / 2) % 2)
803 + 4 * ((byte_x / 2) % 2)
804 + 2 * (byte_y % 2)
805 + 1 * (byte_x % 2);
806
807 if (swizzled) {
808 /* adjust for bit6 swizzling */
809 if (((byte_x / 8) % 2) == 1) {
810 if (((byte_y / 8) % 2) == 0) {
811 u += 64;
812 } else {
813 u -= 64;
814 }
815 }
816 }
817
818 return u;
819 }
820
821 static void
822 iris_unmap_s8(struct iris_transfer *map)
823 {
824 struct pipe_transfer *xfer = &map->base;
825 struct iris_resource *res = (struct iris_resource *) xfer->resource;
826 struct isl_surf *surf = &res->surf;
827 const bool has_swizzling = false;
828
829 if (xfer->usage & PIPE_TRANSFER_WRITE) {
830 uint8_t *untiled_s8_map = map->ptr;
831 uint8_t *tiled_s8_map =
832 iris_bo_map(map->dbg, res->bo, xfer->usage | MAP_RAW);
833
834 struct pipe_box box = xfer->box;
835
836 for (int s = 0; s < box.depth; s++) {
837 unsigned x0_el, y0_el;
838 get_image_offset_el(surf, xfer->level, box.z, &x0_el, &y0_el);
839
840 for (uint32_t y = 0; y < box.height; y++) {
841 for (uint32_t x = 0; x < box.width; x++) {
842 ptrdiff_t offset = s8_offset(surf->row_pitch_B,
843 x0_el + box.x + x,
844 y0_el + box.y + y,
845 has_swizzling);
846 tiled_s8_map[offset] =
847 untiled_s8_map[s * xfer->layer_stride + y * xfer->stride + x];
848 }
849 }
850
851 box.z++;
852 }
853 }
854
855 free(map->buffer);
856 }
857
858 static void
859 iris_map_s8(struct iris_transfer *map)
860 {
861 struct pipe_transfer *xfer = &map->base;
862 struct iris_resource *res = (struct iris_resource *) xfer->resource;
863 struct isl_surf *surf = &res->surf;
864
865 xfer->stride = surf->row_pitch_B;
866 xfer->layer_stride = xfer->stride * xfer->box.height;
867
868 /* The tiling and detiling functions require that the linear buffer has
869 * a 16-byte alignment (that is, its `x0` is 16-byte aligned). Here we
870 * over-allocate the linear buffer to get the proper alignment.
871 */
872 map->buffer = map->ptr = malloc(xfer->layer_stride * xfer->box.depth);
873 assert(map->buffer);
874
875 const bool has_swizzling = false;
876
877 /* One of either READ_BIT or WRITE_BIT or both is set. READ_BIT implies no
878 * INVALIDATE_RANGE_BIT. WRITE_BIT needs the original values read in unless
879 * invalidate is set, since we'll be writing the whole rectangle from our
880 * temporary buffer back out.
881 */
882 if (!(xfer->usage & PIPE_TRANSFER_DISCARD_RANGE)) {
883 uint8_t *untiled_s8_map = map->ptr;
884 uint8_t *tiled_s8_map =
885 iris_bo_map(map->dbg, res->bo, xfer->usage | MAP_RAW);
886
887 struct pipe_box box = xfer->box;
888
889 for (int s = 0; s < box.depth; s++) {
890 unsigned x0_el, y0_el;
891 get_image_offset_el(surf, xfer->level, box.z, &x0_el, &y0_el);
892
893 for (uint32_t y = 0; y < box.height; y++) {
894 for (uint32_t x = 0; x < box.width; x++) {
895 ptrdiff_t offset = s8_offset(surf->row_pitch_B,
896 x0_el + box.x + x,
897 y0_el + box.y + y,
898 has_swizzling);
899 untiled_s8_map[s * xfer->layer_stride + y * xfer->stride + x] =
900 tiled_s8_map[offset];
901 }
902 }
903
904 box.z++;
905 }
906 }
907
908 map->unmap = iris_unmap_s8;
909 }
910
911 /* Compute extent parameters for use with tiled_memcpy functions.
912 * xs are in units of bytes and ys are in units of strides.
913 */
914 static inline void
915 tile_extents(struct isl_surf *surf,
916 const struct pipe_box *box,
917 unsigned level,
918 unsigned *x1_B, unsigned *x2_B,
919 unsigned *y1_el, unsigned *y2_el)
920 {
921 const struct isl_format_layout *fmtl = isl_format_get_layout(surf->format);
922 const unsigned cpp = fmtl->bpb / 8;
923
924 assert(box->x % fmtl->bw == 0);
925 assert(box->y % fmtl->bh == 0);
926
927 unsigned x0_el, y0_el;
928 get_image_offset_el(surf, level, box->z, &x0_el, &y0_el);
929
930 *x1_B = (box->x / fmtl->bw + x0_el) * cpp;
931 *y1_el = box->y / fmtl->bh + y0_el;
932 *x2_B = (DIV_ROUND_UP(box->x + box->width, fmtl->bw) + x0_el) * cpp;
933 *y2_el = DIV_ROUND_UP(box->y + box->height, fmtl->bh) + y0_el;
934 }
935
936 static void
937 iris_unmap_tiled_memcpy(struct iris_transfer *map)
938 {
939 struct pipe_transfer *xfer = &map->base;
940 struct pipe_box box = xfer->box;
941 struct iris_resource *res = (struct iris_resource *) xfer->resource;
942 struct isl_surf *surf = &res->surf;
943
944 const bool has_swizzling = false;
945
946 if (xfer->usage & PIPE_TRANSFER_WRITE) {
947 char *dst = iris_bo_map(map->dbg, res->bo, xfer->usage | MAP_RAW);
948
949 for (int s = 0; s < box.depth; s++) {
950 unsigned x1, x2, y1, y2;
951 tile_extents(surf, &box, xfer->level, &x1, &x2, &y1, &y2);
952
953 void *ptr = map->ptr + s * xfer->layer_stride;
954
955 isl_memcpy_linear_to_tiled(x1, x2, y1, y2, dst, ptr,
956 surf->row_pitch_B, xfer->stride,
957 has_swizzling, surf->tiling, ISL_MEMCPY);
958 box.z++;
959 }
960 }
961 os_free_aligned(map->buffer);
962 map->buffer = map->ptr = NULL;
963 }
964
965 static void
966 iris_map_tiled_memcpy(struct iris_transfer *map)
967 {
968 struct pipe_transfer *xfer = &map->base;
969 struct iris_resource *res = (struct iris_resource *) xfer->resource;
970 struct isl_surf *surf = &res->surf;
971
972 xfer->stride = ALIGN(surf->row_pitch_B, 16);
973 xfer->layer_stride = xfer->stride * xfer->box.height;
974
975 unsigned x1, x2, y1, y2;
976 tile_extents(surf, &xfer->box, xfer->level, &x1, &x2, &y1, &y2);
977
978 /* The tiling and detiling functions require that the linear buffer has
979 * a 16-byte alignment (that is, its `x0` is 16-byte aligned). Here we
980 * over-allocate the linear buffer to get the proper alignment.
981 */
982 map->buffer =
983 os_malloc_aligned(xfer->layer_stride * xfer->box.depth, 16);
984 assert(map->buffer);
985 map->ptr = (char *)map->buffer + (x1 & 0xf);
986
987 const bool has_swizzling = false;
988
989 // XXX: PIPE_TRANSFER_READ?
990 if (!(xfer->usage & PIPE_TRANSFER_DISCARD_RANGE)) {
991 char *src = iris_bo_map(map->dbg, res->bo, xfer->usage | MAP_RAW);
992
993 struct pipe_box box = xfer->box;
994
995 for (int s = 0; s < box.depth; s++) {
996 unsigned x1, x2, y1, y2;
997 tile_extents(surf, &box, xfer->level, &x1, &x2, &y1, &y2);
998
999 /* Use 's' rather than 'box.z' to rebase the first slice to 0. */
1000 void *ptr = map->ptr + s * xfer->layer_stride;
1001
1002 isl_memcpy_tiled_to_linear(x1, x2, y1, y2, ptr, src, xfer->stride,
1003 surf->row_pitch_B, has_swizzling,
1004 surf->tiling, ISL_MEMCPY);
1005 box.z++;
1006 }
1007 }
1008
1009 map->unmap = iris_unmap_tiled_memcpy;
1010 }
1011
1012 static void
1013 iris_map_direct(struct iris_transfer *map)
1014 {
1015 struct pipe_transfer *xfer = &map->base;
1016 struct pipe_box *box = &xfer->box;
1017 struct iris_resource *res = (struct iris_resource *) xfer->resource;
1018
1019 void *ptr = iris_bo_map(map->dbg, res->bo, xfer->usage);
1020
1021 if (res->base.target == PIPE_BUFFER) {
1022 xfer->stride = 0;
1023 xfer->layer_stride = 0;
1024
1025 map->ptr = ptr + box->x;
1026 } else {
1027 struct isl_surf *surf = &res->surf;
1028 const struct isl_format_layout *fmtl =
1029 isl_format_get_layout(surf->format);
1030 const unsigned cpp = fmtl->bpb / 8;
1031 unsigned x0_el, y0_el;
1032
1033 get_image_offset_el(surf, xfer->level, box->z, &x0_el, &y0_el);
1034
1035 xfer->stride = isl_surf_get_row_pitch_B(surf);
1036 xfer->layer_stride = isl_surf_get_array_pitch(surf);
1037
1038 map->ptr = ptr + (y0_el + box->y) * xfer->stride + (x0_el + box->x) * cpp;
1039 }
1040 }
1041
1042 static void *
1043 iris_transfer_map(struct pipe_context *ctx,
1044 struct pipe_resource *resource,
1045 unsigned level,
1046 enum pipe_transfer_usage usage,
1047 const struct pipe_box *box,
1048 struct pipe_transfer **ptransfer)
1049 {
1050 struct iris_context *ice = (struct iris_context *)ctx;
1051 struct iris_resource *res = (struct iris_resource *)resource;
1052 struct isl_surf *surf = &res->surf;
1053
1054 /* If we can discard the whole resource, we can also discard the
1055 * subrange being accessed.
1056 */
1057 if (usage & PIPE_TRANSFER_DISCARD_WHOLE_RESOURCE)
1058 usage |= PIPE_TRANSFER_DISCARD_RANGE;
1059
1060 if (surf->tiling != ISL_TILING_LINEAR &&
1061 (usage & PIPE_TRANSFER_MAP_DIRECTLY))
1062 return NULL;
1063
1064 if (!(usage & PIPE_TRANSFER_UNSYNCHRONIZED)) {
1065 for (int i = 0; i < IRIS_BATCH_COUNT; i++) {
1066 if (iris_batch_references(&ice->batches[i], res->bo))
1067 iris_batch_flush(&ice->batches[i]);
1068 }
1069 }
1070
1071 if ((usage & PIPE_TRANSFER_DONTBLOCK) && iris_bo_busy(res->bo))
1072 return NULL;
1073
1074 struct iris_transfer *map = slab_alloc(&ice->transfer_pool);
1075 struct pipe_transfer *xfer = &map->base;
1076
1077 if (!map)
1078 return NULL;
1079
1080 memset(map, 0, sizeof(*map));
1081 map->dbg = &ice->dbg;
1082
1083 pipe_resource_reference(&xfer->resource, resource);
1084 xfer->level = level;
1085 xfer->usage = usage;
1086 xfer->box = *box;
1087 *ptransfer = xfer;
1088
1089 xfer->usage &= (PIPE_TRANSFER_READ |
1090 PIPE_TRANSFER_WRITE |
1091 PIPE_TRANSFER_UNSYNCHRONIZED |
1092 PIPE_TRANSFER_PERSISTENT |
1093 PIPE_TRANSFER_COHERENT |
1094 PIPE_TRANSFER_DISCARD_RANGE);
1095
1096 if (surf->tiling == ISL_TILING_W) {
1097 // XXX: just teach iris_map_tiled_memcpy about W tiling...
1098 iris_map_s8(map);
1099 } else if (surf->tiling != ISL_TILING_LINEAR) {
1100 iris_map_tiled_memcpy(map);
1101 } else {
1102 iris_map_direct(map);
1103 }
1104
1105 return map->ptr;
1106 }
1107
1108 static void
1109 iris_transfer_flush_region(struct pipe_context *ctx,
1110 struct pipe_transfer *xfer,
1111 const struct pipe_box *box)
1112 {
1113 struct iris_context *ice = (struct iris_context *)ctx;
1114 struct iris_resource *res = (struct iris_resource *) xfer->resource;
1115
1116
1117 // XXX: don't emit flushes in both engines...? we may also need to flush
1118 // even if there isn't a draw yet - may still be stale data in caches...
1119 for (int i = 0; i < IRIS_BATCH_COUNT; i++) {
1120 if (ice->batches[i].contains_draw) {
1121 iris_batch_maybe_flush(&ice->batches[i], 24);
1122 iris_flush_and_dirty_for_history(ice, &ice->batches[i], res);
1123 }
1124 }
1125 }
1126
1127 static void
1128 iris_transfer_unmap(struct pipe_context *ctx, struct pipe_transfer *xfer)
1129 {
1130 struct iris_context *ice = (struct iris_context *)ctx;
1131 struct iris_transfer *map = (void *) xfer;
1132 struct iris_resource *res = (struct iris_resource *) xfer->resource;
1133
1134 if (map->unmap)
1135 map->unmap(map);
1136
1137 // XXX: don't emit flushes in both engines...?
1138 for (int i = 0; i < IRIS_BATCH_COUNT; i++) {
1139 if (ice->batches[i].contains_draw) {
1140 iris_batch_maybe_flush(&ice->batches[i], 24);
1141 iris_flush_and_dirty_for_history(ice, &ice->batches[i], res);
1142 }
1143 }
1144
1145 pipe_resource_reference(&xfer->resource, NULL);
1146 slab_free(&ice->transfer_pool, map);
1147 }
1148
1149 static void
1150 iris_flush_resource(struct pipe_context *ctx, struct pipe_resource *resource)
1151 {
1152 }
1153
1154 void
1155 iris_flush_and_dirty_for_history(struct iris_context *ice,
1156 struct iris_batch *batch,
1157 struct iris_resource *res)
1158 {
1159 if (res->base.target != PIPE_BUFFER)
1160 return;
1161
1162 unsigned flush = PIPE_CONTROL_CS_STALL;
1163
1164 /* We've likely used the rendering engine (i.e. BLORP) to write to this
1165 * surface. Flush the render cache so the data actually lands.
1166 */
1167 if (batch->name != IRIS_BATCH_COMPUTE)
1168 flush |= PIPE_CONTROL_RENDER_TARGET_FLUSH;
1169
1170 uint64_t dirty = 0ull;
1171
1172 if (res->bind_history & PIPE_BIND_CONSTANT_BUFFER) {
1173 flush |= PIPE_CONTROL_CONST_CACHE_INVALIDATE |
1174 PIPE_CONTROL_TEXTURE_CACHE_INVALIDATE;
1175 dirty |= IRIS_DIRTY_CONSTANTS_VS |
1176 IRIS_DIRTY_CONSTANTS_TCS |
1177 IRIS_DIRTY_CONSTANTS_TES |
1178 IRIS_DIRTY_CONSTANTS_GS |
1179 IRIS_DIRTY_CONSTANTS_FS |
1180 IRIS_DIRTY_CONSTANTS_CS |
1181 IRIS_ALL_DIRTY_BINDINGS;
1182 }
1183
1184 if (res->bind_history & PIPE_BIND_SAMPLER_VIEW)
1185 flush |= PIPE_CONTROL_TEXTURE_CACHE_INVALIDATE;
1186
1187 if (res->bind_history & (PIPE_BIND_VERTEX_BUFFER | PIPE_BIND_INDEX_BUFFER))
1188 flush |= PIPE_CONTROL_VF_CACHE_INVALIDATE;
1189
1190 if (res->bind_history & (PIPE_BIND_SHADER_BUFFER | PIPE_BIND_SHADER_IMAGE))
1191 flush |= PIPE_CONTROL_DATA_CACHE_FLUSH;
1192
1193 iris_emit_pipe_control_flush(batch, flush);
1194
1195 ice->state.dirty |= dirty;
1196 }
1197
1198 static enum pipe_format
1199 iris_resource_get_internal_format(struct pipe_resource *p_res)
1200 {
1201 struct iris_resource *res = (void *) p_res;
1202 return res->internal_format;
1203 }
1204
1205 static const struct u_transfer_vtbl transfer_vtbl = {
1206 .resource_create = iris_resource_create,
1207 .resource_destroy = iris_resource_destroy,
1208 .transfer_map = iris_transfer_map,
1209 .transfer_unmap = iris_transfer_unmap,
1210 .transfer_flush_region = iris_transfer_flush_region,
1211 .get_internal_format = iris_resource_get_internal_format,
1212 .set_stencil = iris_resource_set_separate_stencil,
1213 .get_stencil = iris_resource_get_separate_stencil,
1214 };
1215
1216 void
1217 iris_init_screen_resource_functions(struct pipe_screen *pscreen)
1218 {
1219 pscreen->resource_create_with_modifiers =
1220 iris_resource_create_with_modifiers;
1221 pscreen->resource_create = u_transfer_helper_resource_create;
1222 pscreen->resource_from_user_memory = iris_resource_from_user_memory;
1223 pscreen->resource_from_handle = iris_resource_from_handle;
1224 pscreen->resource_get_handle = iris_resource_get_handle;
1225 pscreen->resource_destroy = u_transfer_helper_resource_destroy;
1226 pscreen->transfer_helper =
1227 u_transfer_helper_create(&transfer_vtbl, true, true, false, true);
1228 }
1229
1230 void
1231 iris_init_resource_functions(struct pipe_context *ctx)
1232 {
1233 ctx->flush_resource = iris_flush_resource;
1234 ctx->transfer_map = u_transfer_helper_transfer_map;
1235 ctx->transfer_flush_region = u_transfer_helper_transfer_flush_region;
1236 ctx->transfer_unmap = u_transfer_helper_transfer_unmap;
1237 ctx->buffer_subdata = u_default_buffer_subdata;
1238 ctx->texture_subdata = u_default_texture_subdata;
1239 }