turnip: MSAA resolve directly from GMEM
[mesa.git] / src / freedreno / vulkan / tu_pass.c
1 /*
2 * Copyright © 2016 Red Hat.
3 * Copyright © 2016 Bas Nieuwenhuizen
4 *
5 * based in part on anv driver which is:
6 * Copyright © 2015 Intel Corporation
7 *
8 * Permission is hereby granted, free of charge, to any person obtaining a
9 * copy of this software and associated documentation files (the "Software"),
10 * to deal in the Software without restriction, including without limitation
11 * the rights to use, copy, modify, merge, publish, distribute, sublicense,
12 * and/or sell copies of the Software, and to permit persons to whom the
13 * Software is furnished to do so, subject to the following conditions:
14 *
15 * The above copyright notice and this permission notice (including the next
16 * paragraph) shall be included in all copies or substantial portions of the
17 * Software.
18 *
19 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
20 * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
21 * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL
22 * THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
23 * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING
24 * FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER
25 * DEALINGS IN THE SOFTWARE.
26 */
27 #include "tu_private.h"
28
29 #include "vk_util.h"
30
31 VkResult
32 tu_CreateRenderPass(VkDevice _device,
33 const VkRenderPassCreateInfo *pCreateInfo,
34 const VkAllocationCallbacks *pAllocator,
35 VkRenderPass *pRenderPass)
36 {
37 TU_FROM_HANDLE(tu_device, device, _device);
38 struct tu_render_pass *pass;
39 size_t size;
40 size_t attachments_offset;
41 VkRenderPassMultiviewCreateInfo *multiview_info = NULL;
42
43 assert(pCreateInfo->sType == VK_STRUCTURE_TYPE_RENDER_PASS_CREATE_INFO);
44
45 size = sizeof(*pass);
46 size += pCreateInfo->subpassCount * sizeof(pass->subpasses[0]);
47 attachments_offset = size;
48 size += pCreateInfo->attachmentCount * sizeof(pass->attachments[0]);
49
50 pass = vk_alloc2(&device->alloc, pAllocator, size, 8,
51 VK_SYSTEM_ALLOCATION_SCOPE_OBJECT);
52 if (pass == NULL)
53 return vk_error(device->instance, VK_ERROR_OUT_OF_HOST_MEMORY);
54
55 memset(pass, 0, size);
56 pass->attachment_count = pCreateInfo->attachmentCount;
57 pass->subpass_count = pCreateInfo->subpassCount;
58 pass->attachments = (void *) pass + attachments_offset;
59
60 vk_foreach_struct(ext, pCreateInfo->pNext)
61 {
62 switch (ext->sType) {
63 case VK_STRUCTURE_TYPE_RENDER_PASS_MULTIVIEW_CREATE_INFO:
64 multiview_info = (VkRenderPassMultiviewCreateInfo *) ext;
65 break;
66 default:
67 break;
68 }
69 }
70
71 for (uint32_t i = 0; i < pCreateInfo->attachmentCount; i++) {
72 struct tu_render_pass_attachment *att = &pass->attachments[i];
73
74 att->format = pCreateInfo->pAttachments[i].format;
75 att->samples = pCreateInfo->pAttachments[i].samples;
76 att->load_op = pCreateInfo->pAttachments[i].loadOp;
77 att->stencil_load_op = pCreateInfo->pAttachments[i].stencilLoadOp;
78 att->initial_layout = pCreateInfo->pAttachments[i].initialLayout;
79 att->final_layout = pCreateInfo->pAttachments[i].finalLayout;
80 // att->store_op = pCreateInfo->pAttachments[i].storeOp;
81 // att->stencil_store_op = pCreateInfo->pAttachments[i].stencilStoreOp;
82 }
83 uint32_t subpass_attachment_count = 0;
84 struct tu_subpass_attachment *p;
85 for (uint32_t i = 0; i < pCreateInfo->subpassCount; i++) {
86 const VkSubpassDescription *desc = &pCreateInfo->pSubpasses[i];
87
88 subpass_attachment_count +=
89 desc->inputAttachmentCount + desc->colorAttachmentCount +
90 (desc->pResolveAttachments ? desc->colorAttachmentCount : 0) +
91 (desc->pDepthStencilAttachment != NULL);
92 }
93
94 if (subpass_attachment_count) {
95 pass->subpass_attachments = vk_alloc2(
96 &device->alloc, pAllocator,
97 subpass_attachment_count * sizeof(struct tu_subpass_attachment), 8,
98 VK_SYSTEM_ALLOCATION_SCOPE_OBJECT);
99 if (pass->subpass_attachments == NULL) {
100 vk_free2(&device->alloc, pAllocator, pass);
101 return vk_error(device->instance, VK_ERROR_OUT_OF_HOST_MEMORY);
102 }
103 } else
104 pass->subpass_attachments = NULL;
105
106 p = pass->subpass_attachments;
107 for (uint32_t i = 0; i < pCreateInfo->subpassCount; i++) {
108 const VkSubpassDescription *desc = &pCreateInfo->pSubpasses[i];
109 uint32_t color_sample_count = 1, depth_sample_count = 1;
110 struct tu_subpass *subpass = &pass->subpasses[i];
111
112 subpass->input_count = desc->inputAttachmentCount;
113 subpass->color_count = desc->colorAttachmentCount;
114 if (multiview_info)
115 subpass->view_mask = multiview_info->pViewMasks[i];
116
117 if (desc->inputAttachmentCount > 0) {
118 subpass->input_attachments = p;
119 p += desc->inputAttachmentCount;
120
121 for (uint32_t j = 0; j < desc->inputAttachmentCount; j++) {
122 subpass->input_attachments[j] = (struct tu_subpass_attachment) {
123 .attachment = desc->pInputAttachments[j].attachment,
124 .layout = desc->pInputAttachments[j].layout,
125 };
126 if (desc->pInputAttachments[j].attachment != VK_ATTACHMENT_UNUSED)
127 pass->attachments[desc->pInputAttachments[j].attachment]
128 .view_mask |= subpass->view_mask;
129 }
130 }
131
132 if (desc->colorAttachmentCount > 0) {
133 subpass->color_attachments = p;
134 p += desc->colorAttachmentCount;
135
136 for (uint32_t j = 0; j < desc->colorAttachmentCount; j++) {
137 subpass->color_attachments[j] = (struct tu_subpass_attachment) {
138 .attachment = desc->pColorAttachments[j].attachment,
139 .layout = desc->pColorAttachments[j].layout,
140 };
141 if (desc->pColorAttachments[j].attachment !=
142 VK_ATTACHMENT_UNUSED) {
143 pass->attachments[desc->pColorAttachments[j].attachment]
144 .view_mask |= subpass->view_mask;
145 color_sample_count =
146 pCreateInfo
147 ->pAttachments[desc->pColorAttachments[j].attachment]
148 .samples;
149 }
150 }
151 }
152
153 subpass->resolve_attachments = desc->pResolveAttachments ? p : NULL;
154 if (desc->pResolveAttachments) {
155 p += desc->colorAttachmentCount;
156
157 for (uint32_t j = 0; j < desc->colorAttachmentCount; j++) {
158 uint32_t a = desc->pResolveAttachments[j].attachment;
159 subpass->resolve_attachments[j] = (struct tu_subpass_attachment) {
160 .attachment = desc->pResolveAttachments[j].attachment,
161 .layout = desc->pResolveAttachments[j].layout,
162 };
163 if (a != VK_ATTACHMENT_UNUSED) {
164 pass->attachments[desc->pResolveAttachments[j].attachment]
165 .view_mask |= subpass->view_mask;
166 }
167 }
168 }
169
170 if (desc->pDepthStencilAttachment) {
171 subpass->depth_stencil_attachment = (struct tu_subpass_attachment) {
172 .attachment = desc->pDepthStencilAttachment->attachment,
173 .layout = desc->pDepthStencilAttachment->layout,
174 };
175 if (desc->pDepthStencilAttachment->attachment !=
176 VK_ATTACHMENT_UNUSED) {
177 pass->attachments[desc->pDepthStencilAttachment->attachment]
178 .view_mask |= subpass->view_mask;
179 depth_sample_count =
180 pCreateInfo
181 ->pAttachments[desc->pDepthStencilAttachment->attachment]
182 .samples;
183 }
184 } else {
185 subpass->depth_stencil_attachment.attachment = VK_ATTACHMENT_UNUSED;
186 }
187
188 subpass->max_sample_count =
189 MAX2(color_sample_count, depth_sample_count);
190 }
191
192 for (unsigned i = 0; i < pCreateInfo->dependencyCount; ++i) {
193 uint32_t dst = pCreateInfo->pDependencies[i].dstSubpass;
194 if (dst == VK_SUBPASS_EXTERNAL) {
195 pass->end_barrier.src_stage_mask =
196 pCreateInfo->pDependencies[i].srcStageMask;
197 pass->end_barrier.src_access_mask =
198 pCreateInfo->pDependencies[i].srcAccessMask;
199 pass->end_barrier.dst_access_mask =
200 pCreateInfo->pDependencies[i].dstAccessMask;
201 } else {
202 pass->subpasses[dst].start_barrier.src_stage_mask =
203 pCreateInfo->pDependencies[i].srcStageMask;
204 pass->subpasses[dst].start_barrier.src_access_mask =
205 pCreateInfo->pDependencies[i].srcAccessMask;
206 pass->subpasses[dst].start_barrier.dst_access_mask =
207 pCreateInfo->pDependencies[i].dstAccessMask;
208 }
209 }
210
211 *pRenderPass = tu_render_pass_to_handle(pass);
212
213 return VK_SUCCESS;
214 }
215
216 VkResult
217 tu_CreateRenderPass2KHR(VkDevice _device,
218 const VkRenderPassCreateInfo2KHR *pCreateInfo,
219 const VkAllocationCallbacks *pAllocator,
220 VkRenderPass *pRenderPass)
221 {
222 TU_FROM_HANDLE(tu_device, device, _device);
223 struct tu_render_pass *pass;
224 size_t size;
225 size_t attachments_offset;
226
227 assert(pCreateInfo->sType ==
228 VK_STRUCTURE_TYPE_RENDER_PASS_CREATE_INFO_2_KHR);
229
230 size = sizeof(*pass);
231 size += pCreateInfo->subpassCount * sizeof(pass->subpasses[0]);
232 attachments_offset = size;
233 size += pCreateInfo->attachmentCount * sizeof(pass->attachments[0]);
234
235 pass = vk_alloc2(&device->alloc, pAllocator, size, 8,
236 VK_SYSTEM_ALLOCATION_SCOPE_OBJECT);
237 if (pass == NULL)
238 return vk_error(device->instance, VK_ERROR_OUT_OF_HOST_MEMORY);
239
240 memset(pass, 0, size);
241 pass->attachment_count = pCreateInfo->attachmentCount;
242 pass->subpass_count = pCreateInfo->subpassCount;
243 pass->attachments = (void *) pass + attachments_offset;
244
245 for (uint32_t i = 0; i < pCreateInfo->attachmentCount; i++) {
246 struct tu_render_pass_attachment *att = &pass->attachments[i];
247
248 att->format = pCreateInfo->pAttachments[i].format;
249 att->samples = pCreateInfo->pAttachments[i].samples;
250 att->load_op = pCreateInfo->pAttachments[i].loadOp;
251 att->stencil_load_op = pCreateInfo->pAttachments[i].stencilLoadOp;
252 att->initial_layout = pCreateInfo->pAttachments[i].initialLayout;
253 att->final_layout = pCreateInfo->pAttachments[i].finalLayout;
254 // att->store_op = pCreateInfo->pAttachments[i].storeOp;
255 // att->stencil_store_op = pCreateInfo->pAttachments[i].stencilStoreOp;
256 }
257 uint32_t subpass_attachment_count = 0;
258 struct tu_subpass_attachment *p;
259 for (uint32_t i = 0; i < pCreateInfo->subpassCount; i++) {
260 const VkSubpassDescription2KHR *desc = &pCreateInfo->pSubpasses[i];
261
262 subpass_attachment_count +=
263 desc->inputAttachmentCount + desc->colorAttachmentCount +
264 (desc->pResolveAttachments ? desc->colorAttachmentCount : 0) +
265 (desc->pDepthStencilAttachment != NULL);
266 }
267
268 if (subpass_attachment_count) {
269 pass->subpass_attachments = vk_alloc2(
270 &device->alloc, pAllocator,
271 subpass_attachment_count * sizeof(struct tu_subpass_attachment), 8,
272 VK_SYSTEM_ALLOCATION_SCOPE_OBJECT);
273 if (pass->subpass_attachments == NULL) {
274 vk_free2(&device->alloc, pAllocator, pass);
275 return vk_error(device->instance, VK_ERROR_OUT_OF_HOST_MEMORY);
276 }
277 } else
278 pass->subpass_attachments = NULL;
279
280 p = pass->subpass_attachments;
281 for (uint32_t i = 0; i < pCreateInfo->subpassCount; i++) {
282 const VkSubpassDescription2KHR *desc = &pCreateInfo->pSubpasses[i];
283 uint32_t color_sample_count = 1, depth_sample_count = 1;
284 struct tu_subpass *subpass = &pass->subpasses[i];
285
286 subpass->input_count = desc->inputAttachmentCount;
287 subpass->color_count = desc->colorAttachmentCount;
288 subpass->view_mask = desc->viewMask;
289
290 if (desc->inputAttachmentCount > 0) {
291 subpass->input_attachments = p;
292 p += desc->inputAttachmentCount;
293
294 for (uint32_t j = 0; j < desc->inputAttachmentCount; j++) {
295 subpass->input_attachments[j] = (struct tu_subpass_attachment) {
296 .attachment = desc->pInputAttachments[j].attachment,
297 .layout = desc->pInputAttachments[j].layout,
298 };
299 if (desc->pInputAttachments[j].attachment != VK_ATTACHMENT_UNUSED)
300 pass->attachments[desc->pInputAttachments[j].attachment]
301 .view_mask |= subpass->view_mask;
302 }
303 }
304
305 if (desc->colorAttachmentCount > 0) {
306 subpass->color_attachments = p;
307 p += desc->colorAttachmentCount;
308
309 for (uint32_t j = 0; j < desc->colorAttachmentCount; j++) {
310 subpass->color_attachments[j] = (struct tu_subpass_attachment) {
311 .attachment = desc->pColorAttachments[j].attachment,
312 .layout = desc->pColorAttachments[j].layout,
313 };
314 if (desc->pColorAttachments[j].attachment !=
315 VK_ATTACHMENT_UNUSED) {
316 pass->attachments[desc->pColorAttachments[j].attachment]
317 .view_mask |= subpass->view_mask;
318 color_sample_count =
319 pCreateInfo
320 ->pAttachments[desc->pColorAttachments[j].attachment]
321 .samples;
322 }
323 }
324 }
325
326 subpass->resolve_attachments = desc->pResolveAttachments ? p : NULL;
327 if (desc->pResolveAttachments) {
328 p += desc->colorAttachmentCount;
329
330 for (uint32_t j = 0; j < desc->colorAttachmentCount; j++) {
331 uint32_t a = desc->pResolveAttachments[j].attachment;
332 subpass->resolve_attachments[j] = (struct tu_subpass_attachment) {
333 .attachment = desc->pResolveAttachments[j].attachment,
334 .layout = desc->pResolveAttachments[j].layout,
335 };
336 if (a != VK_ATTACHMENT_UNUSED) {
337 pass->attachments[desc->pResolveAttachments[j].attachment]
338 .view_mask |= subpass->view_mask;
339 }
340 }
341 }
342
343 if (desc->pDepthStencilAttachment) {
344 subpass->depth_stencil_attachment = (struct tu_subpass_attachment) {
345 .attachment = desc->pDepthStencilAttachment->attachment,
346 .layout = desc->pDepthStencilAttachment->layout,
347 };
348 if (desc->pDepthStencilAttachment->attachment !=
349 VK_ATTACHMENT_UNUSED) {
350 pass->attachments[desc->pDepthStencilAttachment->attachment]
351 .view_mask |= subpass->view_mask;
352 depth_sample_count =
353 pCreateInfo
354 ->pAttachments[desc->pDepthStencilAttachment->attachment]
355 .samples;
356 }
357 } else {
358 subpass->depth_stencil_attachment.attachment = VK_ATTACHMENT_UNUSED;
359 }
360
361 subpass->max_sample_count =
362 MAX2(color_sample_count, depth_sample_count);
363 }
364
365 for (unsigned i = 0; i < pCreateInfo->dependencyCount; ++i) {
366 uint32_t dst = pCreateInfo->pDependencies[i].dstSubpass;
367 if (dst == VK_SUBPASS_EXTERNAL) {
368 pass->end_barrier.src_stage_mask =
369 pCreateInfo->pDependencies[i].srcStageMask;
370 pass->end_barrier.src_access_mask =
371 pCreateInfo->pDependencies[i].srcAccessMask;
372 pass->end_barrier.dst_access_mask =
373 pCreateInfo->pDependencies[i].dstAccessMask;
374 } else {
375 pass->subpasses[dst].start_barrier.src_stage_mask =
376 pCreateInfo->pDependencies[i].srcStageMask;
377 pass->subpasses[dst].start_barrier.src_access_mask =
378 pCreateInfo->pDependencies[i].srcAccessMask;
379 pass->subpasses[dst].start_barrier.dst_access_mask =
380 pCreateInfo->pDependencies[i].dstAccessMask;
381 }
382 }
383
384 *pRenderPass = tu_render_pass_to_handle(pass);
385
386 return VK_SUCCESS;
387 }
388
389 void
390 tu_DestroyRenderPass(VkDevice _device,
391 VkRenderPass _pass,
392 const VkAllocationCallbacks *pAllocator)
393 {
394 TU_FROM_HANDLE(tu_device, device, _device);
395 TU_FROM_HANDLE(tu_render_pass, pass, _pass);
396
397 if (!_pass)
398 return;
399 vk_free2(&device->alloc, pAllocator, pass->subpass_attachments);
400 vk_free2(&device->alloc, pAllocator, pass);
401 }
402
403 void
404 tu_GetRenderAreaGranularity(VkDevice _device,
405 VkRenderPass renderPass,
406 VkExtent2D *pGranularity)
407 {
408 TU_FROM_HANDLE(tu_device, device, _device);
409
410 pGranularity->width = device->physical_device->tile_align_w;
411 pGranularity->height = device->physical_device->tile_align_h;
412 }