anv_pass.c revision 01e04c3f
1/*
2 * Copyright © 2015 Intel Corporation
3 *
4 * Permission is hereby granted, free of charge, to any person obtaining a
5 * copy of this software and associated documentation files (the "Software"),
6 * to deal in the Software without restriction, including without limitation
7 * the rights to use, copy, modify, merge, publish, distribute, sublicense,
8 * and/or sell copies of the Software, and to permit persons to whom the
9 * Software is furnished to do so, subject to the following conditions:
10 *
11 * The above copyright notice and this permission notice (including the next
12 * paragraph) shall be included in all copies or substantial portions of the
13 * Software.
14 *
15 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
16 * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
17 * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT.  IN NO EVENT SHALL
18 * THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
19 * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING
20 * FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS
21 * IN THE SOFTWARE.
22 */
23
24#include "anv_private.h"
25
26#include "vk_util.h"
27
28static void
29anv_render_pass_add_subpass_dep(struct anv_render_pass *pass,
30                                const VkSubpassDependency2KHR *dep)
31{
32   if (dep->dstSubpass == VK_SUBPASS_EXTERNAL) {
33      pass->subpass_flushes[pass->subpass_count] |=
34         anv_pipe_invalidate_bits_for_access_flags(dep->dstAccessMask);
35   } else {
36      assert(dep->dstSubpass < pass->subpass_count);
37      pass->subpass_flushes[dep->dstSubpass] |=
38         anv_pipe_invalidate_bits_for_access_flags(dep->dstAccessMask);
39   }
40
41   if (dep->srcSubpass == VK_SUBPASS_EXTERNAL) {
42      pass->subpass_flushes[0] |=
43         anv_pipe_flush_bits_for_access_flags(dep->srcAccessMask);
44   } else {
45      assert(dep->srcSubpass < pass->subpass_count);
46      pass->subpass_flushes[dep->srcSubpass + 1] |=
47         anv_pipe_flush_bits_for_access_flags(dep->srcAccessMask);
48   }
49}
50
51/* Do a second "compile" step on a render pass */
52static void
53anv_render_pass_compile(struct anv_render_pass *pass)
54{
55   /* The CreateRenderPass code zeros the entire render pass and also uses a
56    * designated initializer for filling these out.  There's no need for us to
57    * do it again.
58    *
59    * for (uint32_t i = 0; i < pass->attachment_count; i++) {
60    *    pass->attachments[i].usage = 0;
61    *    pass->attachments[i].first_subpass_layout = VK_IMAGE_LAYOUT_UNDEFINED;
62    * }
63    */
64
65   VkImageUsageFlags all_usage = 0;
66   for (uint32_t i = 0; i < pass->subpass_count; i++) {
67      struct anv_subpass *subpass = &pass->subpasses[i];
68
69      /* We don't allow depth_stencil_attachment to be non-NULL and be
70       * VK_ATTACHMENT_UNUSED.  This way something can just check for NULL
71       * and be guaranteed that they have a valid attachment.
72       */
73      if (subpass->depth_stencil_attachment &&
74          subpass->depth_stencil_attachment->attachment == VK_ATTACHMENT_UNUSED)
75         subpass->depth_stencil_attachment = NULL;
76
77      for (uint32_t j = 0; j < subpass->attachment_count; j++) {
78         struct anv_subpass_attachment *subpass_att = &subpass->attachments[j];
79         if (subpass_att->attachment == VK_ATTACHMENT_UNUSED)
80            continue;
81
82         struct anv_render_pass_attachment *pass_att =
83            &pass->attachments[subpass_att->attachment];
84
85         assert(__builtin_popcount(subpass_att->usage) == 1);
86         pass_att->usage |= subpass_att->usage;
87         pass_att->last_subpass_idx = i;
88
89         all_usage |= subpass_att->usage;
90
91         if (pass_att->first_subpass_layout == VK_IMAGE_LAYOUT_UNDEFINED) {
92            pass_att->first_subpass_layout = subpass_att->layout;
93            assert(pass_att->first_subpass_layout != VK_IMAGE_LAYOUT_UNDEFINED);
94         }
95
96         if (subpass_att->usage == VK_IMAGE_USAGE_INPUT_ATTACHMENT_BIT &&
97             subpass->depth_stencil_attachment &&
98             subpass_att->attachment == subpass->depth_stencil_attachment->attachment)
99            subpass->has_ds_self_dep = true;
100      }
101
102      /* We have to handle resolve attachments specially */
103      subpass->has_resolve = false;
104      if (subpass->resolve_attachments) {
105         for (uint32_t j = 0; j < subpass->color_count; j++) {
106            struct anv_subpass_attachment *color_att =
107               &subpass->color_attachments[j];
108            struct anv_subpass_attachment *resolve_att =
109               &subpass->resolve_attachments[j];
110            if (resolve_att->attachment == VK_ATTACHMENT_UNUSED)
111               continue;
112
113            subpass->has_resolve = true;
114
115            assert(resolve_att->usage == VK_IMAGE_USAGE_TRANSFER_DST_BIT);
116            color_att->usage |= VK_IMAGE_USAGE_TRANSFER_SRC_BIT;
117         }
118      }
119   }
120
121   /* From the Vulkan 1.0.39 spec:
122    *
123    *    If there is no subpass dependency from VK_SUBPASS_EXTERNAL to the
124    *    first subpass that uses an attachment, then an implicit subpass
125    *    dependency exists from VK_SUBPASS_EXTERNAL to the first subpass it is
126    *    used in. The subpass dependency operates as if defined with the
127    *    following parameters:
128    *
129    *    VkSubpassDependency implicitDependency = {
130    *        .srcSubpass = VK_SUBPASS_EXTERNAL;
131    *        .dstSubpass = firstSubpass; // First subpass attachment is used in
132    *        .srcStageMask = VK_PIPELINE_STAGE_TOP_OF_PIPE_BIT;
133    *        .dstStageMask = VK_PIPELINE_STAGE_ALL_COMMANDS_BIT;
134    *        .srcAccessMask = 0;
135    *        .dstAccessMask = VK_ACCESS_INPUT_ATTACHMENT_READ_BIT |
136    *                         VK_ACCESS_COLOR_ATTACHMENT_READ_BIT |
137    *                         VK_ACCESS_COLOR_ATTACHMENT_WRITE_BIT |
138    *                         VK_ACCESS_DEPTH_STENCIL_ATTACHMENT_READ_BIT |
139    *                         VK_ACCESS_DEPTH_STENCIL_ATTACHMENT_WRITE_BIT;
140    *        .dependencyFlags = 0;
141    *    };
142    *
143    *    Similarly, if there is no subpass dependency from the last subpass
144    *    that uses an attachment to VK_SUBPASS_EXTERNAL, then an implicit
145    *    subpass dependency exists from the last subpass it is used in to
146    *    VK_SUBPASS_EXTERNAL. The subpass dependency operates as if defined
147    *    with the following parameters:
148    *
149    *    VkSubpassDependency implicitDependency = {
150    *        .srcSubpass = lastSubpass; // Last subpass attachment is used in
151    *        .dstSubpass = VK_SUBPASS_EXTERNAL;
152    *        .srcStageMask = VK_PIPELINE_STAGE_ALL_COMMANDS_BIT;
153    *        .dstStageMask = VK_PIPELINE_STAGE_BOTTOM_OF_PIPE_BIT;
154    *        .srcAccessMask = VK_ACCESS_INPUT_ATTACHMENT_READ_BIT |
155    *                         VK_ACCESS_COLOR_ATTACHMENT_READ_BIT |
156    *                         VK_ACCESS_COLOR_ATTACHMENT_WRITE_BIT |
157    *                         VK_ACCESS_DEPTH_STENCIL_ATTACHMENT_READ_BIT |
158    *                         VK_ACCESS_DEPTH_STENCIL_ATTACHMENT_WRITE_BIT;
159    *        .dstAccessMask = 0;
160    *        .dependencyFlags = 0;
161    *    };
162    *
163    * We could implement this by walking over all of the attachments and
164    * subpasses and checking to see if any of them don't have an external
165    * dependency.  Or, we could just be lazy and add a couple extra flushes.
166    * We choose to be lazy.
167    */
168   if (all_usage & VK_IMAGE_USAGE_INPUT_ATTACHMENT_BIT) {
169      pass->subpass_flushes[0] |=
170         ANV_PIPE_TEXTURE_CACHE_INVALIDATE_BIT;
171   }
172   if (all_usage & VK_IMAGE_USAGE_COLOR_ATTACHMENT_BIT) {
173      pass->subpass_flushes[pass->subpass_count] |=
174         ANV_PIPE_RENDER_TARGET_CACHE_FLUSH_BIT;
175   }
176   if (all_usage & VK_IMAGE_USAGE_DEPTH_STENCIL_ATTACHMENT_BIT) {
177      pass->subpass_flushes[pass->subpass_count] |=
178         ANV_PIPE_DEPTH_CACHE_FLUSH_BIT;
179   }
180}
181
182static unsigned
183num_subpass_attachments(const VkSubpassDescription *desc)
184{
185   return desc->inputAttachmentCount +
186          desc->colorAttachmentCount +
187          (desc->pResolveAttachments ? desc->colorAttachmentCount : 0) +
188          (desc->pDepthStencilAttachment != NULL);
189}
190
191VkResult anv_CreateRenderPass(
192    VkDevice                                    _device,
193    const VkRenderPassCreateInfo*               pCreateInfo,
194    const VkAllocationCallbacks*                pAllocator,
195    VkRenderPass*                               pRenderPass)
196{
197   ANV_FROM_HANDLE(anv_device, device, _device);
198
199   assert(pCreateInfo->sType == VK_STRUCTURE_TYPE_RENDER_PASS_CREATE_INFO);
200
201   struct anv_render_pass *pass;
202   struct anv_subpass *subpasses;
203   struct anv_render_pass_attachment *attachments;
204   enum anv_pipe_bits *subpass_flushes;
205
206   ANV_MULTIALLOC(ma);
207   anv_multialloc_add(&ma, &pass, 1);
208   anv_multialloc_add(&ma, &subpasses, pCreateInfo->subpassCount);
209   anv_multialloc_add(&ma, &attachments, pCreateInfo->attachmentCount);
210   anv_multialloc_add(&ma, &subpass_flushes, pCreateInfo->subpassCount + 1);
211
212   struct anv_subpass_attachment *subpass_attachments;
213   uint32_t subpass_attachment_count = 0;
214   for (uint32_t i = 0; i < pCreateInfo->subpassCount; i++) {
215      subpass_attachment_count +=
216         num_subpass_attachments(&pCreateInfo->pSubpasses[i]);
217   }
218   anv_multialloc_add(&ma, &subpass_attachments, subpass_attachment_count);
219
220   if (!anv_multialloc_alloc2(&ma, &device->alloc, pAllocator,
221                              VK_SYSTEM_ALLOCATION_SCOPE_OBJECT))
222      return vk_error(VK_ERROR_OUT_OF_HOST_MEMORY);
223
224   /* Clear the subpasses along with the parent pass. This required because
225    * each array member of anv_subpass must be a valid pointer if not NULL.
226    */
227   memset(pass, 0, ma.size);
228   pass->attachment_count = pCreateInfo->attachmentCount;
229   pass->subpass_count = pCreateInfo->subpassCount;
230   pass->attachments = attachments;
231   pass->subpass_flushes = subpass_flushes;
232
233   for (uint32_t i = 0; i < pCreateInfo->attachmentCount; i++) {
234      pass->attachments[i] = (struct anv_render_pass_attachment) {
235         .format                 = pCreateInfo->pAttachments[i].format,
236         .samples                = pCreateInfo->pAttachments[i].samples,
237         .load_op                = pCreateInfo->pAttachments[i].loadOp,
238         .store_op               = pCreateInfo->pAttachments[i].storeOp,
239         .stencil_load_op        = pCreateInfo->pAttachments[i].stencilLoadOp,
240         .initial_layout         = pCreateInfo->pAttachments[i].initialLayout,
241         .final_layout           = pCreateInfo->pAttachments[i].finalLayout,
242      };
243   }
244
245   for (uint32_t i = 0; i < pCreateInfo->subpassCount; i++) {
246      const VkSubpassDescription *desc = &pCreateInfo->pSubpasses[i];
247      struct anv_subpass *subpass = &pass->subpasses[i];
248
249      subpass->input_count = desc->inputAttachmentCount;
250      subpass->color_count = desc->colorAttachmentCount;
251      subpass->attachment_count = num_subpass_attachments(desc);
252      subpass->attachments = subpass_attachments;
253      subpass->view_mask = 0;
254
255      if (desc->inputAttachmentCount > 0) {
256         subpass->input_attachments = subpass_attachments;
257         subpass_attachments += desc->inputAttachmentCount;
258
259         for (uint32_t j = 0; j < desc->inputAttachmentCount; j++) {
260            subpass->input_attachments[j] = (struct anv_subpass_attachment) {
261               .usage =       VK_IMAGE_USAGE_INPUT_ATTACHMENT_BIT,
262               .attachment =  desc->pInputAttachments[j].attachment,
263               .layout =      desc->pInputAttachments[j].layout,
264            };
265         }
266      }
267
268      if (desc->colorAttachmentCount > 0) {
269         subpass->color_attachments = subpass_attachments;
270         subpass_attachments += desc->colorAttachmentCount;
271
272         for (uint32_t j = 0; j < desc->colorAttachmentCount; j++) {
273            subpass->color_attachments[j] = (struct anv_subpass_attachment) {
274               .usage =       VK_IMAGE_USAGE_COLOR_ATTACHMENT_BIT,
275               .attachment =  desc->pColorAttachments[j].attachment,
276               .layout =      desc->pColorAttachments[j].layout,
277            };
278         }
279      }
280
281      if (desc->pResolveAttachments) {
282         subpass->resolve_attachments = subpass_attachments;
283         subpass_attachments += desc->colorAttachmentCount;
284
285         for (uint32_t j = 0; j < desc->colorAttachmentCount; j++) {
286            subpass->resolve_attachments[j] = (struct anv_subpass_attachment) {
287               .usage =       VK_IMAGE_USAGE_TRANSFER_DST_BIT,
288               .attachment =  desc->pResolveAttachments[j].attachment,
289               .layout =      desc->pResolveAttachments[j].layout,
290            };
291         }
292      }
293
294      if (desc->pDepthStencilAttachment) {
295         subpass->depth_stencil_attachment = subpass_attachments++;
296
297         *subpass->depth_stencil_attachment = (struct anv_subpass_attachment) {
298            .usage =       VK_IMAGE_USAGE_DEPTH_STENCIL_ATTACHMENT_BIT,
299            .attachment =  desc->pDepthStencilAttachment->attachment,
300            .layout =      desc->pDepthStencilAttachment->layout,
301         };
302      }
303   }
304
305   for (uint32_t i = 0; i < pCreateInfo->dependencyCount; i++) {
306      /* Convert to a Dependency2KHR */
307      struct VkSubpassDependency2KHR dep2 = {
308         .srcSubpass       = pCreateInfo->pDependencies[i].srcSubpass,
309         .dstSubpass       = pCreateInfo->pDependencies[i].dstSubpass,
310         .srcStageMask     = pCreateInfo->pDependencies[i].srcStageMask,
311         .dstStageMask     = pCreateInfo->pDependencies[i].dstStageMask,
312         .srcAccessMask    = pCreateInfo->pDependencies[i].srcAccessMask,
313         .dstAccessMask    = pCreateInfo->pDependencies[i].dstAccessMask,
314         .dependencyFlags  = pCreateInfo->pDependencies[i].dependencyFlags,
315      };
316      anv_render_pass_add_subpass_dep(pass, &dep2);
317   }
318
319   vk_foreach_struct(ext, pCreateInfo->pNext) {
320      switch (ext->sType) {
321      case VK_STRUCTURE_TYPE_RENDER_PASS_MULTIVIEW_CREATE_INFO_KHR: {
322         VkRenderPassMultiviewCreateInfoKHR *mv = (void *)ext;
323
324         for (uint32_t i = 0; i < mv->subpassCount; i++) {
325            pass->subpasses[i].view_mask = mv->pViewMasks[i];
326         }
327         break;
328      }
329
330      default:
331         anv_debug_ignored_stype(ext->sType);
332      }
333   }
334
335   anv_render_pass_compile(pass);
336
337   *pRenderPass = anv_render_pass_to_handle(pass);
338
339   return VK_SUCCESS;
340}
341
342static unsigned
343num_subpass_attachments2(const VkSubpassDescription2KHR *desc)
344{
345   return desc->inputAttachmentCount +
346          desc->colorAttachmentCount +
347          (desc->pResolveAttachments ? desc->colorAttachmentCount : 0) +
348          (desc->pDepthStencilAttachment != NULL);
349}
350
351VkResult anv_CreateRenderPass2KHR(
352    VkDevice                                    _device,
353    const VkRenderPassCreateInfo2KHR*           pCreateInfo,
354    const VkAllocationCallbacks*                pAllocator,
355    VkRenderPass*                               pRenderPass)
356{
357   ANV_FROM_HANDLE(anv_device, device, _device);
358
359   assert(pCreateInfo->sType == VK_STRUCTURE_TYPE_RENDER_PASS_CREATE_INFO_2_KHR);
360
361   struct anv_render_pass *pass;
362   struct anv_subpass *subpasses;
363   struct anv_render_pass_attachment *attachments;
364   enum anv_pipe_bits *subpass_flushes;
365
366   ANV_MULTIALLOC(ma);
367   anv_multialloc_add(&ma, &pass, 1);
368   anv_multialloc_add(&ma, &subpasses, pCreateInfo->subpassCount);
369   anv_multialloc_add(&ma, &attachments, pCreateInfo->attachmentCount);
370   anv_multialloc_add(&ma, &subpass_flushes, pCreateInfo->subpassCount + 1);
371
372   struct anv_subpass_attachment *subpass_attachments;
373   uint32_t subpass_attachment_count = 0;
374   for (uint32_t i = 0; i < pCreateInfo->subpassCount; i++) {
375      subpass_attachment_count +=
376         num_subpass_attachments2(&pCreateInfo->pSubpasses[i]);
377   }
378   anv_multialloc_add(&ma, &subpass_attachments, subpass_attachment_count);
379
380   if (!anv_multialloc_alloc2(&ma, &device->alloc, pAllocator,
381                              VK_SYSTEM_ALLOCATION_SCOPE_OBJECT))
382      return vk_error(VK_ERROR_OUT_OF_HOST_MEMORY);
383
384   /* Clear the subpasses along with the parent pass. This required because
385    * each array member of anv_subpass must be a valid pointer if not NULL.
386    */
387   memset(pass, 0, ma.size);
388   pass->attachment_count = pCreateInfo->attachmentCount;
389   pass->subpass_count = pCreateInfo->subpassCount;
390   pass->attachments = attachments;
391   pass->subpass_flushes = subpass_flushes;
392
393   for (uint32_t i = 0; i < pCreateInfo->attachmentCount; i++) {
394      pass->attachments[i] = (struct anv_render_pass_attachment) {
395         .format                 = pCreateInfo->pAttachments[i].format,
396         .samples                = pCreateInfo->pAttachments[i].samples,
397         .load_op                = pCreateInfo->pAttachments[i].loadOp,
398         .store_op               = pCreateInfo->pAttachments[i].storeOp,
399         .stencil_load_op        = pCreateInfo->pAttachments[i].stencilLoadOp,
400         .initial_layout         = pCreateInfo->pAttachments[i].initialLayout,
401         .final_layout           = pCreateInfo->pAttachments[i].finalLayout,
402      };
403   }
404
405   for (uint32_t i = 0; i < pCreateInfo->subpassCount; i++) {
406      const VkSubpassDescription2KHR *desc = &pCreateInfo->pSubpasses[i];
407      struct anv_subpass *subpass = &pass->subpasses[i];
408
409      subpass->input_count = desc->inputAttachmentCount;
410      subpass->color_count = desc->colorAttachmentCount;
411      subpass->attachment_count = num_subpass_attachments2(desc);
412      subpass->attachments = subpass_attachments;
413      subpass->view_mask = desc->viewMask;
414
415      if (desc->inputAttachmentCount > 0) {
416         subpass->input_attachments = subpass_attachments;
417         subpass_attachments += desc->inputAttachmentCount;
418
419         for (uint32_t j = 0; j < desc->inputAttachmentCount; j++) {
420            subpass->input_attachments[j] = (struct anv_subpass_attachment) {
421               .usage =       VK_IMAGE_USAGE_INPUT_ATTACHMENT_BIT,
422               .attachment =  desc->pInputAttachments[j].attachment,
423               .layout =      desc->pInputAttachments[j].layout,
424            };
425         }
426      }
427
428      if (desc->colorAttachmentCount > 0) {
429         subpass->color_attachments = subpass_attachments;
430         subpass_attachments += desc->colorAttachmentCount;
431
432         for (uint32_t j = 0; j < desc->colorAttachmentCount; j++) {
433            subpass->color_attachments[j] = (struct anv_subpass_attachment) {
434               .usage =       VK_IMAGE_USAGE_COLOR_ATTACHMENT_BIT,
435               .attachment =  desc->pColorAttachments[j].attachment,
436               .layout =      desc->pColorAttachments[j].layout,
437            };
438         }
439      }
440
441      if (desc->pResolveAttachments) {
442         subpass->resolve_attachments = subpass_attachments;
443         subpass_attachments += desc->colorAttachmentCount;
444
445         for (uint32_t j = 0; j < desc->colorAttachmentCount; j++) {
446            subpass->resolve_attachments[j] = (struct anv_subpass_attachment) {
447               .usage =       VK_IMAGE_USAGE_TRANSFER_DST_BIT,
448               .attachment =  desc->pResolveAttachments[j].attachment,
449               .layout =      desc->pResolveAttachments[j].layout,
450            };
451         }
452      }
453
454      if (desc->pDepthStencilAttachment) {
455         subpass->depth_stencil_attachment = subpass_attachments++;
456
457         *subpass->depth_stencil_attachment = (struct anv_subpass_attachment) {
458            .usage =       VK_IMAGE_USAGE_DEPTH_STENCIL_ATTACHMENT_BIT,
459            .attachment =  desc->pDepthStencilAttachment->attachment,
460            .layout =      desc->pDepthStencilAttachment->layout,
461         };
462      }
463   }
464
465   for (uint32_t i = 0; i < pCreateInfo->dependencyCount; i++)
466      anv_render_pass_add_subpass_dep(pass, &pCreateInfo->pDependencies[i]);
467
468   vk_foreach_struct(ext, pCreateInfo->pNext) {
469      switch (ext->sType) {
470      default:
471         anv_debug_ignored_stype(ext->sType);
472      }
473   }
474
475   anv_render_pass_compile(pass);
476
477   *pRenderPass = anv_render_pass_to_handle(pass);
478
479   return VK_SUCCESS;
480}
481
482void anv_DestroyRenderPass(
483    VkDevice                                    _device,
484    VkRenderPass                                _pass,
485    const VkAllocationCallbacks*                pAllocator)
486{
487   ANV_FROM_HANDLE(anv_device, device, _device);
488   ANV_FROM_HANDLE(anv_render_pass, pass, _pass);
489
490   vk_free2(&device->alloc, pAllocator, pass);
491}
492
493void anv_GetRenderAreaGranularity(
494    VkDevice                                    device,
495    VkRenderPass                                renderPass,
496    VkExtent2D*                                 pGranularity)
497{
498   ANV_FROM_HANDLE(anv_render_pass, pass, renderPass);
499
500   /* This granularity satisfies HiZ fast clear alignment requirements
501    * for all sample counts.
502    */
503   for (unsigned i = 0; i < pass->subpass_count; ++i) {
504      if (pass->subpasses[i].depth_stencil_attachment) {
505         *pGranularity = (VkExtent2D) { .width = 8, .height = 4 };
506         return;
507      }
508   }
509
510   *pGranularity = (VkExtent2D) { 1, 1 };
511}
512