radv: ignore subpass self-dependencies for CreateRenderPass() too
[mesa.git] / src / amd / vulkan / radv_pass.c
1 /*
2 * Copyright © 2016 Red Hat.
3 * Copyright © 2016 Bas Nieuwenhuizen
4 *
5 * based in part on anv driver which is:
6 * Copyright © 2015 Intel Corporation
7 *
8 * Permission is hereby granted, free of charge, to any person obtaining a
9 * copy of this software and associated documentation files (the "Software"),
10 * to deal in the Software without restriction, including without limitation
11 * the rights to use, copy, modify, merge, publish, distribute, sublicense,
12 * and/or sell copies of the Software, and to permit persons to whom the
13 * Software is furnished to do so, subject to the following conditions:
14 *
15 * The above copyright notice and this permission notice (including the next
16 * paragraph) shall be included in all copies or substantial portions of the
17 * Software.
18 *
19 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
20 * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
21 * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL
22 * THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
23 * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING
24 * FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS
25 * IN THE SOFTWARE.
26 */
27 #include "radv_private.h"
28
29 #include "vk_util.h"
30
31 VkResult radv_CreateRenderPass(
32 VkDevice _device,
33 const VkRenderPassCreateInfo* pCreateInfo,
34 const VkAllocationCallbacks* pAllocator,
35 VkRenderPass* pRenderPass)
36 {
37 RADV_FROM_HANDLE(radv_device, device, _device);
38 struct radv_render_pass *pass;
39 size_t size;
40 size_t attachments_offset;
41 VkRenderPassMultiviewCreateInfoKHR *multiview_info = NULL;
42
43 assert(pCreateInfo->sType == VK_STRUCTURE_TYPE_RENDER_PASS_CREATE_INFO);
44
45 size = sizeof(*pass);
46 size += pCreateInfo->subpassCount * sizeof(pass->subpasses[0]);
47 attachments_offset = size;
48 size += pCreateInfo->attachmentCount * sizeof(pass->attachments[0]);
49
50 pass = vk_alloc2(&device->alloc, pAllocator, size, 8,
51 VK_SYSTEM_ALLOCATION_SCOPE_OBJECT);
52 if (pass == NULL)
53 return vk_error(device->instance, VK_ERROR_OUT_OF_HOST_MEMORY);
54
55 memset(pass, 0, size);
56 pass->attachment_count = pCreateInfo->attachmentCount;
57 pass->subpass_count = pCreateInfo->subpassCount;
58 pass->attachments = (void *) pass + attachments_offset;
59
60 vk_foreach_struct(ext, pCreateInfo->pNext) {
61 switch(ext->sType) {
62 case VK_STRUCTURE_TYPE_RENDER_PASS_MULTIVIEW_CREATE_INFO_KHR:
63 multiview_info = ( VkRenderPassMultiviewCreateInfoKHR*)ext;
64 break;
65 default:
66 break;
67 }
68 }
69
70 for (uint32_t i = 0; i < pCreateInfo->attachmentCount; i++) {
71 struct radv_render_pass_attachment *att = &pass->attachments[i];
72
73 att->format = pCreateInfo->pAttachments[i].format;
74 att->samples = pCreateInfo->pAttachments[i].samples;
75 att->load_op = pCreateInfo->pAttachments[i].loadOp;
76 att->stencil_load_op = pCreateInfo->pAttachments[i].stencilLoadOp;
77 att->initial_layout = pCreateInfo->pAttachments[i].initialLayout;
78 att->final_layout = pCreateInfo->pAttachments[i].finalLayout;
79 // att->store_op = pCreateInfo->pAttachments[i].storeOp;
80 // att->stencil_store_op = pCreateInfo->pAttachments[i].stencilStoreOp;
81 }
82 uint32_t subpass_attachment_count = 0;
83 struct radv_subpass_attachment *p;
84 for (uint32_t i = 0; i < pCreateInfo->subpassCount; i++) {
85 const VkSubpassDescription *desc = &pCreateInfo->pSubpasses[i];
86
87 subpass_attachment_count +=
88 desc->inputAttachmentCount +
89 desc->colorAttachmentCount +
90 (desc->pResolveAttachments ? desc->colorAttachmentCount : 0) +
91 (desc->pDepthStencilAttachment != NULL);
92 }
93
94 if (subpass_attachment_count) {
95 pass->subpass_attachments =
96 vk_alloc2(&device->alloc, pAllocator,
97 subpass_attachment_count * sizeof(struct radv_subpass_attachment), 8,
98 VK_SYSTEM_ALLOCATION_SCOPE_OBJECT);
99 if (pass->subpass_attachments == NULL) {
100 vk_free2(&device->alloc, pAllocator, pass);
101 return vk_error(device->instance, VK_ERROR_OUT_OF_HOST_MEMORY);
102 }
103 } else
104 pass->subpass_attachments = NULL;
105
106 p = pass->subpass_attachments;
107 for (uint32_t i = 0; i < pCreateInfo->subpassCount; i++) {
108 const VkSubpassDescription *desc = &pCreateInfo->pSubpasses[i];
109 uint32_t color_sample_count = 1, depth_sample_count = 1;
110 struct radv_subpass *subpass = &pass->subpasses[i];
111
112 subpass->input_count = desc->inputAttachmentCount;
113 subpass->color_count = desc->colorAttachmentCount;
114 if (multiview_info)
115 subpass->view_mask = multiview_info->pViewMasks[i];
116
117 if (desc->inputAttachmentCount > 0) {
118 subpass->input_attachments = p;
119 p += desc->inputAttachmentCount;
120
121 for (uint32_t j = 0; j < desc->inputAttachmentCount; j++) {
122 subpass->input_attachments[j] = (struct radv_subpass_attachment) {
123 .attachment = desc->pInputAttachments[j].attachment,
124 .layout = desc->pInputAttachments[j].layout,
125 };
126 if (desc->pInputAttachments[j].attachment != VK_ATTACHMENT_UNUSED)
127 pass->attachments[desc->pInputAttachments[j].attachment].view_mask |= subpass->view_mask;
128 }
129 }
130
131 if (desc->colorAttachmentCount > 0) {
132 subpass->color_attachments = p;
133 p += desc->colorAttachmentCount;
134
135 for (uint32_t j = 0; j < desc->colorAttachmentCount; j++) {
136 subpass->color_attachments[j] = (struct radv_subpass_attachment) {
137 .attachment = desc->pColorAttachments[j].attachment,
138 .layout = desc->pColorAttachments[j].layout,
139 };
140 if (desc->pColorAttachments[j].attachment != VK_ATTACHMENT_UNUSED) {
141 pass->attachments[desc->pColorAttachments[j].attachment].view_mask |= subpass->view_mask;
142 color_sample_count = pCreateInfo->pAttachments[desc->pColorAttachments[j].attachment].samples;
143 }
144 }
145 }
146
147 subpass->has_resolve = false;
148 if (desc->pResolveAttachments) {
149 subpass->resolve_attachments = p;
150 p += desc->colorAttachmentCount;
151
152 for (uint32_t j = 0; j < desc->colorAttachmentCount; j++) {
153 uint32_t a = desc->pResolveAttachments[j].attachment;
154 subpass->resolve_attachments[j] = (struct radv_subpass_attachment) {
155 .attachment = desc->pResolveAttachments[j].attachment,
156 .layout = desc->pResolveAttachments[j].layout,
157 };
158 if (a != VK_ATTACHMENT_UNUSED) {
159 subpass->has_resolve = true;
160 pass->attachments[desc->pResolveAttachments[j].attachment].view_mask |= subpass->view_mask;
161 }
162 }
163 }
164
165 if (desc->pDepthStencilAttachment) {
166 subpass->depth_stencil_attachment = (struct radv_subpass_attachment) {
167 .attachment = desc->pDepthStencilAttachment->attachment,
168 .layout = desc->pDepthStencilAttachment->layout,
169 };
170 if (desc->pDepthStencilAttachment->attachment != VK_ATTACHMENT_UNUSED) {
171 pass->attachments[desc->pDepthStencilAttachment->attachment].view_mask |= subpass->view_mask;
172 depth_sample_count = pCreateInfo->pAttachments[desc->pDepthStencilAttachment->attachment].samples;
173 }
174 } else {
175 subpass->depth_stencil_attachment.attachment = VK_ATTACHMENT_UNUSED;
176 }
177
178 subpass->max_sample_count = MAX2(color_sample_count,
179 depth_sample_count);
180 }
181
182 for (unsigned i = 0; i < pCreateInfo->dependencyCount; ++i) {
183 uint32_t src = pCreateInfo->pDependencies[i].srcSubpass;
184 uint32_t dst = pCreateInfo->pDependencies[i].dstSubpass;
185
186 /* Ignore subpass self-dependencies as they allow the app to
187 * call vkCmdPipelineBarrier() inside the render pass and the
188 * driver should only do the barrier when called, not when
189 * starting the render pass.
190 */
191 if (src == dst)
192 continue;
193
194 if (dst == VK_SUBPASS_EXTERNAL) {
195 pass->end_barrier.src_stage_mask = pCreateInfo->pDependencies[i].srcStageMask;
196 pass->end_barrier.src_access_mask = pCreateInfo->pDependencies[i].srcAccessMask;
197 pass->end_barrier.dst_access_mask = pCreateInfo->pDependencies[i].dstAccessMask;
198 } else {
199 pass->subpasses[dst].start_barrier.src_stage_mask = pCreateInfo->pDependencies[i].srcStageMask;
200 pass->subpasses[dst].start_barrier.src_access_mask = pCreateInfo->pDependencies[i].srcAccessMask;
201 pass->subpasses[dst].start_barrier.dst_access_mask = pCreateInfo->pDependencies[i].dstAccessMask;
202 }
203 }
204
205 *pRenderPass = radv_render_pass_to_handle(pass);
206
207 return VK_SUCCESS;
208 }
209
210 VkResult radv_CreateRenderPass2KHR(
211 VkDevice _device,
212 const VkRenderPassCreateInfo2KHR* pCreateInfo,
213 const VkAllocationCallbacks* pAllocator,
214 VkRenderPass* pRenderPass)
215 {
216 RADV_FROM_HANDLE(radv_device, device, _device);
217 struct radv_render_pass *pass;
218 size_t size;
219 size_t attachments_offset;
220
221 assert(pCreateInfo->sType == VK_STRUCTURE_TYPE_RENDER_PASS_CREATE_INFO_2_KHR);
222
223 size = sizeof(*pass);
224 size += pCreateInfo->subpassCount * sizeof(pass->subpasses[0]);
225 attachments_offset = size;
226 size += pCreateInfo->attachmentCount * sizeof(pass->attachments[0]);
227
228 pass = vk_alloc2(&device->alloc, pAllocator, size, 8,
229 VK_SYSTEM_ALLOCATION_SCOPE_OBJECT);
230 if (pass == NULL)
231 return vk_error(device->instance, VK_ERROR_OUT_OF_HOST_MEMORY);
232
233 memset(pass, 0, size);
234 pass->attachment_count = pCreateInfo->attachmentCount;
235 pass->subpass_count = pCreateInfo->subpassCount;
236 pass->attachments = (void *) pass + attachments_offset;
237
238 for (uint32_t i = 0; i < pCreateInfo->attachmentCount; i++) {
239 struct radv_render_pass_attachment *att = &pass->attachments[i];
240
241 att->format = pCreateInfo->pAttachments[i].format;
242 att->samples = pCreateInfo->pAttachments[i].samples;
243 att->load_op = pCreateInfo->pAttachments[i].loadOp;
244 att->stencil_load_op = pCreateInfo->pAttachments[i].stencilLoadOp;
245 att->initial_layout = pCreateInfo->pAttachments[i].initialLayout;
246 att->final_layout = pCreateInfo->pAttachments[i].finalLayout;
247 // att->store_op = pCreateInfo->pAttachments[i].storeOp;
248 // att->stencil_store_op = pCreateInfo->pAttachments[i].stencilStoreOp;
249 }
250 uint32_t subpass_attachment_count = 0;
251 struct radv_subpass_attachment *p;
252 for (uint32_t i = 0; i < pCreateInfo->subpassCount; i++) {
253 const VkSubpassDescription2KHR *desc = &pCreateInfo->pSubpasses[i];
254
255 subpass_attachment_count +=
256 desc->inputAttachmentCount +
257 desc->colorAttachmentCount +
258 (desc->pResolveAttachments ? desc->colorAttachmentCount : 0) +
259 (desc->pDepthStencilAttachment != NULL);
260 }
261
262 if (subpass_attachment_count) {
263 pass->subpass_attachments =
264 vk_alloc2(&device->alloc, pAllocator,
265 subpass_attachment_count * sizeof(struct radv_subpass_attachment), 8,
266 VK_SYSTEM_ALLOCATION_SCOPE_OBJECT);
267 if (pass->subpass_attachments == NULL) {
268 vk_free2(&device->alloc, pAllocator, pass);
269 return vk_error(device->instance, VK_ERROR_OUT_OF_HOST_MEMORY);
270 }
271 } else
272 pass->subpass_attachments = NULL;
273
274 p = pass->subpass_attachments;
275 for (uint32_t i = 0; i < pCreateInfo->subpassCount; i++) {
276 const VkSubpassDescription2KHR *desc = &pCreateInfo->pSubpasses[i];
277 uint32_t color_sample_count = 1, depth_sample_count = 1;
278 struct radv_subpass *subpass = &pass->subpasses[i];
279
280 subpass->input_count = desc->inputAttachmentCount;
281 subpass->color_count = desc->colorAttachmentCount;
282 subpass->view_mask = desc->viewMask;
283
284 if (desc->inputAttachmentCount > 0) {
285 subpass->input_attachments = p;
286 p += desc->inputAttachmentCount;
287
288 for (uint32_t j = 0; j < desc->inputAttachmentCount; j++) {
289 subpass->input_attachments[j] = (struct radv_subpass_attachment) {
290 .attachment = desc->pInputAttachments[j].attachment,
291 .layout = desc->pInputAttachments[j].layout,
292 };
293 if (desc->pInputAttachments[j].attachment != VK_ATTACHMENT_UNUSED)
294 pass->attachments[desc->pInputAttachments[j].attachment].view_mask |= subpass->view_mask;
295 }
296 }
297
298 if (desc->colorAttachmentCount > 0) {
299 subpass->color_attachments = p;
300 p += desc->colorAttachmentCount;
301
302 for (uint32_t j = 0; j < desc->colorAttachmentCount; j++) {
303 subpass->color_attachments[j] = (struct radv_subpass_attachment) {
304 .attachment = desc->pColorAttachments[j].attachment,
305 .layout = desc->pColorAttachments[j].layout,
306 };
307 if (desc->pColorAttachments[j].attachment != VK_ATTACHMENT_UNUSED) {
308 pass->attachments[desc->pColorAttachments[j].attachment].view_mask |= subpass->view_mask;
309 color_sample_count = pCreateInfo->pAttachments[desc->pColorAttachments[j].attachment].samples;
310 }
311 }
312 }
313
314 subpass->has_resolve = false;
315 if (desc->pResolveAttachments) {
316 subpass->resolve_attachments = p;
317 p += desc->colorAttachmentCount;
318
319 for (uint32_t j = 0; j < desc->colorAttachmentCount; j++) {
320 uint32_t a = desc->pResolveAttachments[j].attachment;
321 subpass->resolve_attachments[j] = (struct radv_subpass_attachment) {
322 .attachment = desc->pResolveAttachments[j].attachment,
323 .layout = desc->pResolveAttachments[j].layout,
324 };
325 if (a != VK_ATTACHMENT_UNUSED) {
326 subpass->has_resolve = true;
327 pass->attachments[desc->pResolveAttachments[j].attachment].view_mask |= subpass->view_mask;
328 }
329 }
330 }
331
332 if (desc->pDepthStencilAttachment) {
333 subpass->depth_stencil_attachment = (struct radv_subpass_attachment) {
334 .attachment = desc->pDepthStencilAttachment->attachment,
335 .layout = desc->pDepthStencilAttachment->layout,
336 };
337 if (desc->pDepthStencilAttachment->attachment != VK_ATTACHMENT_UNUSED) {
338 pass->attachments[desc->pDepthStencilAttachment->attachment].view_mask |= subpass->view_mask;
339 depth_sample_count = pCreateInfo->pAttachments[desc->pDepthStencilAttachment->attachment].samples;
340 }
341 } else {
342 subpass->depth_stencil_attachment.attachment = VK_ATTACHMENT_UNUSED;
343 }
344
345 subpass->max_sample_count = MAX2(color_sample_count,
346 depth_sample_count);
347 }
348
349 for (unsigned i = 0; i < pCreateInfo->dependencyCount; ++i) {
350 uint32_t src = pCreateInfo->pDependencies[i].srcSubpass;
351 uint32_t dst = pCreateInfo->pDependencies[i].dstSubpass;
352
353 /* Ignore subpass self-dependencies as they allow the app to
354 * call vkCmdPipelineBarrier() inside the render pass and the
355 * driver should only do the barrier when called, not when
356 * starting the render pass.
357 */
358 if (src == dst)
359 continue;
360
361 if (dst == VK_SUBPASS_EXTERNAL) {
362 pass->end_barrier.src_stage_mask = pCreateInfo->pDependencies[i].srcStageMask;
363 pass->end_barrier.src_access_mask = pCreateInfo->pDependencies[i].srcAccessMask;
364 pass->end_barrier.dst_access_mask = pCreateInfo->pDependencies[i].dstAccessMask;
365 } else {
366 pass->subpasses[dst].start_barrier.src_stage_mask = pCreateInfo->pDependencies[i].srcStageMask;
367 pass->subpasses[dst].start_barrier.src_access_mask = pCreateInfo->pDependencies[i].srcAccessMask;
368 pass->subpasses[dst].start_barrier.dst_access_mask = pCreateInfo->pDependencies[i].dstAccessMask;
369 }
370 }
371
372 *pRenderPass = radv_render_pass_to_handle(pass);
373
374 return VK_SUCCESS;
375 }
376
377 void radv_DestroyRenderPass(
378 VkDevice _device,
379 VkRenderPass _pass,
380 const VkAllocationCallbacks* pAllocator)
381 {
382 RADV_FROM_HANDLE(radv_device, device, _device);
383 RADV_FROM_HANDLE(radv_render_pass, pass, _pass);
384
385 if (!_pass)
386 return;
387 vk_free2(&device->alloc, pAllocator, pass->subpass_attachments);
388 vk_free2(&device->alloc, pAllocator, pass);
389 }
390
391 void radv_GetRenderAreaGranularity(
392 VkDevice device,
393 VkRenderPass renderPass,
394 VkExtent2D* pGranularity)
395 {
396 pGranularity->width = 1;
397 pGranularity->height = 1;
398 }
399