/*
* Copyright © 2015 Intel Corporation
*
* Permission is hereby granted, free of charge, to any person obtaining a
* copy of this software and associated documentation files (the "Software"),
* to deal in the Software without restriction, including without limitation
* the rights to use, copy, modify, merge, publish, distribute, sublicense,
* and/or sell copies of the Software, and to permit persons to whom the
* Software is furnished to do so, subject to the following conditions:
*
* The above copyright notice and this permission notice (including the next
* paragraph) shall be included in all copies or substantial portions of the
* Software.
*
* THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
* IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
* FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL
* THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
* LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING
* FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS
* IN THE SOFTWARE.
*/
#include <assert.h>
#include <stdbool.h>
#include <string.h>
#include <unistd.h>
#include <fcntl.h>
#include "util/mesa-sha1.h"
#include "vk_util.h"
#include "anv_private.h"
/*
* Descriptor set layouts.
*/
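/* Computes the required alignments (in bytes) of the surface and sampler
* parts of a descriptor with the given data flags, for the given layout
* type.
*/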
static void
anv_descriptor_data_alignment(enum anv_descriptor_data data,
enum anv_descriptor_set_layout_type layout_type,
unsigned *out_surface_align,
unsigned *out_sampler_align)
{
unsigned surface_align = 1, sampler_align = 1;
if (data & (ANV_DESCRIPTOR_INDIRECT_SAMPLED_IMAGE |
ANV_DESCRIPTOR_INDIRECT_STORAGE_IMAGE |
ANV_DESCRIPTOR_INDIRECT_ADDRESS_RANGE))
surface_align = MAX2(surface_align, 8);
if (data & ANV_DESCRIPTOR_SURFACE)
surface_align = MAX2(surface_align, ANV_SURFACE_STATE_SIZE);
if (data & ANV_DESCRIPTOR_SURFACE_SAMPLER) {
surface_align = MAX2(surface_align, ANV_SURFACE_STATE_SIZE);
if (layout_type == ANV_PIPELINE_DESCRIPTOR_SET_LAYOUT_TYPE_DIRECT)
sampler_align = MAX2(sampler_align, ANV_SAMPLER_STATE_SIZE);
}
if (data & ANV_DESCRIPTOR_SAMPLER) {
if (layout_type == ANV_PIPELINE_DESCRIPTOR_SET_LAYOUT_TYPE_DIRECT)
sampler_align = MAX2(sampler_align, ANV_SAMPLER_STATE_SIZE);
else
surface_align = MAX2(surface_align, ANV_SAMPLER_STATE_SIZE);
}
if (data & ANV_DESCRIPTOR_INLINE_UNIFORM)
surface_align = MAX2(surface_align, ANV_UBO_ALIGNMENT);
*out_surface_align = surface_align;
*out_sampler_align = sampler_align;
}
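/* Descriptor data for a given descriptor type when the device uses
* indirect descriptors (the shader reads descriptor structs, e.g. bindless
* handles & address ranges, out of the descriptor buffer).
*/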
static enum anv_descriptor_data
anv_indirect_descriptor_data_for_type(VkDescriptorType type)
{
enum anv_descriptor_data data = 0;
switch (type) {
case VK_DESCRIPTOR_TYPE_SAMPLER:
data = ANV_DESCRIPTOR_BTI_SAMPLER_STATE |
ANV_DESCRIPTOR_INDIRECT_SAMPLED_IMAGE;
break;
case VK_DESCRIPTOR_TYPE_COMBINED_IMAGE_SAMPLER:
data = ANV_DESCRIPTOR_BTI_SURFACE_STATE |
ANV_DESCRIPTOR_BTI_SAMPLER_STATE |
ANV_DESCRIPTOR_INDIRECT_SAMPLED_IMAGE;
break;
case VK_DESCRIPTOR_TYPE_SAMPLED_IMAGE:
case VK_DESCRIPTOR_TYPE_UNIFORM_TEXEL_BUFFER:
case VK_DESCRIPTOR_TYPE_INPUT_ATTACHMENT:
data = ANV_DESCRIPTOR_BTI_SURFACE_STATE |
ANV_DESCRIPTOR_INDIRECT_SAMPLED_IMAGE;
break;
case VK_DESCRIPTOR_TYPE_STORAGE_IMAGE:
case VK_DESCRIPTOR_TYPE_STORAGE_TEXEL_BUFFER:
data = ANV_DESCRIPTOR_BTI_SURFACE_STATE |
ANV_DESCRIPTOR_INDIRECT_STORAGE_IMAGE;
break;
case VK_DESCRIPTOR_TYPE_UNIFORM_BUFFER:
case VK_DESCRIPTOR_TYPE_STORAGE_BUFFER:
data = ANV_DESCRIPTOR_BTI_SURFACE_STATE |
ANV_DESCRIPTOR_BUFFER_VIEW;
break;
case VK_DESCRIPTOR_TYPE_UNIFORM_BUFFER_DYNAMIC:
case VK_DESCRIPTOR_TYPE_STORAGE_BUFFER_DYNAMIC:
data = ANV_DESCRIPTOR_BTI_SURFACE_STATE;
break;
case VK_DESCRIPTOR_TYPE_INLINE_UNIFORM_BLOCK:
data = ANV_DESCRIPTOR_INLINE_UNIFORM;
break;
case VK_DESCRIPTOR_TYPE_ACCELERATION_STRUCTURE_KHR:
data = ANV_DESCRIPTOR_INDIRECT_ADDRESS_RANGE;
break;
default:
unreachable("Unsupported descriptor type");
}
/* We also need to push the address ranges of UBOs & SSBOs so that we can
* use A64 messages in the shader.
*/
if (type == VK_DESCRIPTOR_TYPE_STORAGE_BUFFER ||
type == VK_DESCRIPTOR_TYPE_STORAGE_BUFFER_DYNAMIC ||
type == VK_DESCRIPTOR_TYPE_UNIFORM_BUFFER ||
type == VK_DESCRIPTOR_TYPE_UNIFORM_BUFFER_DYNAMIC)
data |= ANV_DESCRIPTOR_INDIRECT_ADDRESS_RANGE;
return data;
}
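/* Descriptor data for a given descriptor type when using direct
* descriptors or descriptor buffer layouts (surface/sampler states stored
* directly in the descriptor buffer).
*/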
static enum anv_descriptor_data
anv_direct_descriptor_data_for_type(const struct anv_physical_device *device,
enum anv_descriptor_set_layout_type layout_type,
VkDescriptorSetLayoutCreateFlags set_flags,
VkDescriptorType type)
{
enum anv_descriptor_data data = 0;
switch (type) {
case VK_DESCRIPTOR_TYPE_SAMPLER:
if (set_flags & VK_DESCRIPTOR_SET_LAYOUT_CREATE_EMBEDDED_IMMUTABLE_SAMPLERS_BIT_EXT)
return 0;
data = ANV_DESCRIPTOR_BTI_SAMPLER_STATE |
ANV_DESCRIPTOR_SAMPLER;
break;
case VK_DESCRIPTOR_TYPE_COMBINED_IMAGE_SAMPLER:
if (layout_type == ANV_PIPELINE_DESCRIPTOR_SET_LAYOUT_TYPE_DIRECT) {
data = ANV_DESCRIPTOR_BTI_SURFACE_STATE |
ANV_DESCRIPTOR_BTI_SAMPLER_STATE |
ANV_DESCRIPTOR_SURFACE |
ANV_DESCRIPTOR_SAMPLER;
} else {
data = ANV_DESCRIPTOR_BTI_SURFACE_STATE |
ANV_DESCRIPTOR_BTI_SAMPLER_STATE |
ANV_DESCRIPTOR_SURFACE_SAMPLER;
}
break;
case VK_DESCRIPTOR_TYPE_SAMPLED_IMAGE:
case VK_DESCRIPTOR_TYPE_UNIFORM_TEXEL_BUFFER:
case VK_DESCRIPTOR_TYPE_INPUT_ATTACHMENT:
case VK_DESCRIPTOR_TYPE_STORAGE_TEXEL_BUFFER:
case VK_DESCRIPTOR_TYPE_STORAGE_IMAGE:
case VK_DESCRIPTOR_TYPE_UNIFORM_BUFFER:
case VK_DESCRIPTOR_TYPE_STORAGE_BUFFER:
case VK_DESCRIPTOR_TYPE_UNIFORM_BUFFER_DYNAMIC:
case VK_DESCRIPTOR_TYPE_STORAGE_BUFFER_DYNAMIC:
data = ANV_DESCRIPTOR_BTI_SURFACE_STATE |
ANV_DESCRIPTOR_SURFACE;
break;
case VK_DESCRIPTOR_TYPE_INLINE_UNIFORM_BLOCK:
data = ANV_DESCRIPTOR_INLINE_UNIFORM;
break;
case VK_DESCRIPTOR_TYPE_ACCELERATION_STRUCTURE_KHR:
data = ANV_DESCRIPTOR_INDIRECT_ADDRESS_RANGE;
break;
default:
unreachable("Unsupported descriptor type");
}
if (layout_type == ANV_PIPELINE_DESCRIPTOR_SET_LAYOUT_TYPE_BUFFER) {
if (set_flags & VK_DESCRIPTOR_SET_LAYOUT_CREATE_PUSH_DESCRIPTOR_BIT_KHR) {
/* Push descriptors are special with descriptor buffers. On Gfx12.5+
* they have their own pool and are not reachable by the binding
* table. On previous generations, they are only reachable through
* the binding table.
*/
if (device->uses_ex_bso) {
data &= ~(ANV_DESCRIPTOR_BTI_SURFACE_STATE |
ANV_DESCRIPTOR_BTI_SAMPLER_STATE);
}
} else {
/* Non-push descriptor buffers cannot be accessed through the binding
* table on any platform.
*/
data &= ~(ANV_DESCRIPTOR_BTI_SURFACE_STATE |
ANV_DESCRIPTOR_BTI_SAMPLER_STATE);
}
}
return data;
}
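/* Dispatches to the direct or indirect variant above, based on the layout
* type and on whether the physical device uses indirect descriptors.
*/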
static enum anv_descriptor_data
anv_descriptor_data_for_type(const struct anv_physical_device *device,
enum anv_descriptor_set_layout_type layout_type,
VkDescriptorSetLayoutCreateFlags set_flags,
VkDescriptorType type)
{
if (layout_type == ANV_PIPELINE_DESCRIPTOR_SET_LAYOUT_TYPE_BUFFER)
return anv_direct_descriptor_data_for_type(device, layout_type, set_flags, type);
else if (device->indirect_descriptors)
return anv_indirect_descriptor_data_for_type(type);
else
return anv_direct_descriptor_data_for_type(device, layout_type, set_flags, type);
}
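/* Union of the descriptor data of all types a mutable descriptor at the
* given binding can hold. Without a type list, assume the worst case
* across all types allowed for mutable descriptors plus acceleration
* structures.
*/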
static enum anv_descriptor_data
anv_descriptor_data_for_mutable_type(const struct anv_physical_device *device,
enum anv_descriptor_set_layout_type layout_type,
VkDescriptorSetLayoutCreateFlags set_flags,
const VkMutableDescriptorTypeCreateInfoEXT *mutable_info,
int binding)
{
enum anv_descriptor_data desc_data = 0;
if (!mutable_info || mutable_info->mutableDescriptorTypeListCount <= binding) {
for(VkDescriptorType i = 0; i <= VK_DESCRIPTOR_TYPE_INPUT_ATTACHMENT; i++) {
if (i == VK_DESCRIPTOR_TYPE_STORAGE_BUFFER_DYNAMIC ||
i == VK_DESCRIPTOR_TYPE_UNIFORM_BUFFER_DYNAMIC ||
i == VK_DESCRIPTOR_TYPE_INLINE_UNIFORM_BLOCK)
continue;
desc_data |= anv_descriptor_data_for_type(device, layout_type, set_flags, i);
}
desc_data |= anv_descriptor_data_for_type(
device, layout_type, set_flags, VK_DESCRIPTOR_TYPE_ACCELERATION_STRUCTURE_KHR);
return desc_data;
}
const VkMutableDescriptorTypeListEXT *type_list =
&mutable_info->pMutableDescriptorTypeLists[binding];
for (uint32_t i = 0; i < type_list->descriptorTypeCount; i++) {
desc_data |=
anv_descriptor_data_for_type(device, layout_type, set_flags,
type_list->pDescriptorTypes[i]);
}
return desc_data;
}
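/* Computes the size (in bytes) of the surface and sampler parts of a
* single descriptor with the given data flags, for the given layout type.
*/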
static void
anv_descriptor_data_size(enum anv_descriptor_data data,
enum anv_descriptor_set_layout_type layout_type,
uint16_t *out_surface_size,
uint16_t *out_sampler_size)
{
unsigned surface_size = 0;
unsigned sampler_size = 0;
if (data & ANV_DESCRIPTOR_INDIRECT_SAMPLED_IMAGE)
surface_size += sizeof(struct anv_sampled_image_descriptor);
if (data & ANV_DESCRIPTOR_INDIRECT_STORAGE_IMAGE)
surface_size += sizeof(struct anv_storage_image_descriptor);
if (data & ANV_DESCRIPTOR_INDIRECT_ADDRESS_RANGE)
surface_size += sizeof(struct anv_address_range_descriptor);
if (data & ANV_DESCRIPTOR_SURFACE)
surface_size += ANV_SURFACE_STATE_SIZE;
/* Direct descriptors have sampler states stored separately */
if (layout_type == ANV_PIPELINE_DESCRIPTOR_SET_LAYOUT_TYPE_DIRECT) {
if (data & ANV_DESCRIPTOR_SAMPLER)
sampler_size += ANV_SAMPLER_STATE_SIZE;
if (data & ANV_DESCRIPTOR_SURFACE_SAMPLER) {
surface_size += ANV_SURFACE_STATE_SIZE;
sampler_size += ANV_SAMPLER_STATE_SIZE;
}
} else {
if (data & ANV_DESCRIPTOR_SAMPLER)
surface_size += ANV_SAMPLER_STATE_SIZE;
if (data & ANV_DESCRIPTOR_SURFACE_SAMPLER) {
surface_size += ALIGN(ANV_SURFACE_STATE_SIZE + ANV_SAMPLER_STATE_SIZE,
ANV_SURFACE_STATE_SIZE);
}
}
*out_surface_size = surface_size;
*out_sampler_size = sampler_size;
}
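/* Whether a descriptor of the given type/data takes up any space in the
* descriptor buffer (inline uniform blocks always do).
*/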
static bool
anv_needs_descriptor_buffer(VkDescriptorType desc_type,
enum anv_descriptor_set_layout_type layout_type,
enum anv_descriptor_data desc_data)
{
if (desc_type == VK_DESCRIPTOR_TYPE_INLINE_UNIFORM_BLOCK)
return true;
uint16_t surface_size, sampler_size;
anv_descriptor_data_size(desc_data, layout_type,
&surface_size, &sampler_size);
return surface_size > 0 || sampler_size > 0;
}
/** Returns the size in bytes of each descriptor with the given layout */
static void
anv_descriptor_size(const struct anv_descriptor_set_binding_layout *layout,
enum anv_descriptor_set_layout_type layout_type,
uint16_t *out_surface_stride,
uint16_t *out_sampler_stride)
{
if (layout->data & ANV_DESCRIPTOR_INLINE_UNIFORM) {
assert(layout->data == ANV_DESCRIPTOR_INLINE_UNIFORM);
assert(layout->array_size <= UINT16_MAX);
*out_surface_stride = layout->array_size;
*out_sampler_stride = 0;
return;
}
anv_descriptor_data_size(layout->data, layout_type,
out_surface_stride,
out_sampler_stride);
}
/** Returns size in bytes of the biggest descriptor in the given layout */
static void
anv_descriptor_size_for_mutable_type(const struct anv_physical_device *device,
enum anv_descriptor_set_layout_type layout_type,
VkDescriptorSetLayoutCreateFlags set_flags,
const VkMutableDescriptorTypeCreateInfoEXT *mutable_info,
int binding,
uint16_t *out_surface_stride,
uint16_t *out_sampler_stride)
{
*out_surface_stride = 0;
*out_sampler_stride = 0;
if (!mutable_info ||
mutable_info->mutableDescriptorTypeListCount <= binding) {
for(VkDescriptorType i = 0; i <= VK_DESCRIPTOR_TYPE_INPUT_ATTACHMENT; i++) {
if (i == VK_DESCRIPTOR_TYPE_STORAGE_BUFFER_DYNAMIC ||
i == VK_DESCRIPTOR_TYPE_UNIFORM_BUFFER_DYNAMIC ||
i == VK_DESCRIPTOR_TYPE_INLINE_UNIFORM_BLOCK)
continue;
enum anv_descriptor_data desc_data =
anv_descriptor_data_for_type(device, layout_type, set_flags, i);
uint16_t surface_stride, sampler_stride;
anv_descriptor_data_size(desc_data, layout_type,
&surface_stride, &sampler_stride);
*out_surface_stride = MAX2(*out_surface_stride, surface_stride);
*out_sampler_stride = MAX2(*out_sampler_stride, sampler_stride);
}
enum anv_descriptor_data desc_data =
anv_descriptor_data_for_type(device, layout_type, set_flags,
VK_DESCRIPTOR_TYPE_ACCELERATION_STRUCTURE_KHR);
uint16_t surface_stride, sampler_stride;
anv_descriptor_data_size(desc_data, layout_type,
&surface_stride, &sampler_stride);
*out_surface_stride = MAX2(*out_surface_stride, surface_stride);
*out_sampler_stride = MAX2(*out_sampler_stride, sampler_stride);
return;
}
const VkMutableDescriptorTypeListEXT *type_list =
&mutable_info->pMutableDescriptorTypeLists[binding];
for (uint32_t i = 0; i < type_list->descriptorTypeCount; i++) {
enum anv_descriptor_data desc_data =
anv_descriptor_data_for_type(device, layout_type, set_flags,
type_list->pDescriptorTypes[i]);
uint16_t surface_stride, sampler_stride;
anv_descriptor_data_size(desc_data, layout_type,
&surface_stride, &sampler_stride);
*out_surface_stride = MAX2(*out_surface_stride, surface_stride);
*out_sampler_stride = MAX2(*out_sampler_stride, sampler_stride);
}
}
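/* Whether descriptors with the given data can be accessed bindlessly,
* i.e. without consuming a binding table entry.
*/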
static bool
anv_descriptor_data_supports_bindless(const struct anv_physical_device *pdevice,
VkDescriptorSetLayoutCreateFlags set_flags,
enum anv_descriptor_data data)
{
if (set_flags & VK_DESCRIPTOR_SET_LAYOUT_CREATE_DESCRIPTOR_BUFFER_BIT_EXT) {
/* When using descriptor buffers, on platforms that don't have extended
* bindless offset, all push descriptors have to go through the binding
* tables.
*/
if (!pdevice->uses_ex_bso &&
(set_flags & VK_DESCRIPTOR_SET_LAYOUT_CREATE_PUSH_DESCRIPTOR_BIT_KHR)) {
return data & (ANV_DESCRIPTOR_INDIRECT_ADDRESS_RANGE |
ANV_DESCRIPTOR_INDIRECT_SAMPLED_IMAGE |
ANV_DESCRIPTOR_INDIRECT_STORAGE_IMAGE);
}
/* Otherwise we can do bindless for everything */
return true;
} else {
if (pdevice->indirect_descriptors) {
return data & (ANV_DESCRIPTOR_INDIRECT_ADDRESS_RANGE |
ANV_DESCRIPTOR_INDIRECT_SAMPLED_IMAGE |
ANV_DESCRIPTOR_INDIRECT_STORAGE_IMAGE);
}
/* Direct descriptors support bindless for everything */
return true;
}
}
bool
anv_descriptor_supports_bindless(const struct anv_physical_device *pdevice,
const struct anv_descriptor_set_layout *set,
const struct anv_descriptor_set_binding_layout *binding)
{
return anv_descriptor_data_supports_bindless(pdevice, set->flags, binding->data);
}
bool
anv_descriptor_requires_bindless(const struct anv_physical_device *pdevice,
const struct anv_descriptor_set_layout *set,
const struct anv_descriptor_set_binding_layout *binding)
{
if (pdevice->always_use_bindless)
return anv_descriptor_supports_bindless(pdevice, set, binding);
if (set->flags & VK_DESCRIPTOR_SET_LAYOUT_CREATE_PUSH_DESCRIPTOR_BIT_KHR)
return false;
if (set->flags & (VK_DESCRIPTOR_SET_LAYOUT_CREATE_DESCRIPTOR_BUFFER_BIT_EXT |
VK_DESCRIPTOR_SET_LAYOUT_CREATE_EMBEDDED_IMMUTABLE_SAMPLERS_BIT_EXT))
return true;
static const VkDescriptorBindingFlagBits flags_requiring_bindless =
VK_DESCRIPTOR_BINDING_UPDATE_AFTER_BIND_BIT |
VK_DESCRIPTOR_BINDING_UPDATE_UNUSED_WHILE_PENDING_BIT |
VK_DESCRIPTOR_BINDING_PARTIALLY_BOUND_BIT;
return (binding->flags & flags_requiring_bindless) != 0;
}
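/* Picks the layout type for a set: descriptor buffer layouts always use
* the BUFFER type, otherwise the type follows the physical device's
* descriptor model (indirect vs. direct).
*/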
static enum anv_descriptor_set_layout_type
anv_descriptor_set_layout_type_for_flags(const struct anv_physical_device *device,
const VkDescriptorSetLayoutCreateInfo *pCreateInfo)
{
if (pCreateInfo->flags & VK_DESCRIPTOR_SET_LAYOUT_CREATE_DESCRIPTOR_BUFFER_BIT_EXT)
return ANV_PIPELINE_DESCRIPTOR_SET_LAYOUT_TYPE_BUFFER;
else if (device->indirect_descriptors)
return ANV_PIPELINE_DESCRIPTOR_SET_LAYOUT_TYPE_INDIRECT;
else
return ANV_PIPELINE_DESCRIPTOR_SET_LAYOUT_TYPE_DIRECT;
}
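/* Whether the mutable type list for the given binding includes the given
* type. No type lists at all means every type is possible.
*/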
static bool
mutable_list_includes_type(const VkMutableDescriptorTypeCreateInfoEXT *mutable_info,
uint32_t binding, VkDescriptorType type)
{
if (!mutable_info || mutable_info->mutableDescriptorTypeListCount == 0)
return true;
const VkMutableDescriptorTypeListEXT *type_list =
&mutable_info->pMutableDescriptorTypeLists[binding];
for (uint32_t i = 0; i < type_list->descriptorTypeCount; i++) {
if (type_list->pDescriptorTypes[i] == type)
return true;
}
return false;
}
void anv_GetDescriptorSetLayoutSupport(
VkDevice _device,
const VkDescriptorSetLayoutCreateInfo* pCreateInfo,
VkDescriptorSetLayoutSupport* pSupport)
{
ANV_FROM_HANDLE(anv_device, device, _device);
const struct anv_physical_device *pdevice = device->physical;
uint32_t surface_count[MESA_VULKAN_SHADER_STAGES] = { 0, };
VkDescriptorType varying_desc_type = VK_DESCRIPTOR_TYPE_MAX_ENUM;
bool needs_descriptor_buffer = false;
const VkDescriptorSetLayoutBindingFlagsCreateInfo *binding_flags_info =
vk_find_struct_const(pCreateInfo->pNext,
DESCRIPTOR_SET_LAYOUT_BINDING_FLAGS_CREATE_INFO);
const VkMutableDescriptorTypeCreateInfoEXT *mutable_info =
vk_find_struct_const(pCreateInfo->pNext,
MUTABLE_DESCRIPTOR_TYPE_CREATE_INFO_EXT);
enum anv_descriptor_set_layout_type layout_type =
anv_descriptor_set_layout_type_for_flags(pdevice, pCreateInfo);
for (uint32_t b = 0; b < pCreateInfo->bindingCount; b++) {
const VkDescriptorSetLayoutBinding *binding = &pCreateInfo->pBindings[b];
VkDescriptorBindingFlags flags = 0;
if (binding_flags_info && binding_flags_info->bindingCount > 0) {
assert(binding_flags_info->bindingCount == pCreateInfo->bindingCount);
flags = binding_flags_info->pBindingFlags[b];
}
/* Combined image/sampler descriptors are not supported with descriptor
* buffers & mutable descriptor types because we cannot know from the
* shader where to find the sampler structure. It can be written either at
* the beginning of the descriptor (at offset 0) or in the second part (at
* offset 64 bytes).
*/
if ((pCreateInfo->flags &
VK_DESCRIPTOR_SET_LAYOUT_CREATE_DESCRIPTOR_BUFFER_BIT_EXT) &&
binding->descriptorType == VK_DESCRIPTOR_TYPE_MUTABLE_EXT &&
mutable_list_includes_type(mutable_info, b,
VK_DESCRIPTOR_TYPE_COMBINED_IMAGE_SAMPLER)) {
pSupport->supported = false;
return;
}
enum anv_descriptor_data desc_data =
binding->descriptorType == VK_DESCRIPTOR_TYPE_MUTABLE_EXT ?
anv_descriptor_data_for_mutable_type(pdevice, layout_type,
pCreateInfo->flags,
mutable_info, b) :
anv_descriptor_data_for_type(pdevice, layout_type,
pCreateInfo->flags,
binding->descriptorType);
if (anv_needs_descriptor_buffer(binding->descriptorType,
layout_type, desc_data))
needs_descriptor_buffer = true;
if (flags & VK_DESCRIPTOR_BINDING_VARIABLE_DESCRIPTOR_COUNT_BIT)
varying_desc_type = binding->descriptorType;
switch (binding->descriptorType) {
case VK_DESCRIPTOR_TYPE_SAMPLER:
/* There is no real limit on samplers */
break;
case VK_DESCRIPTOR_TYPE_INLINE_UNIFORM_BLOCK:
/* Inline uniforms don't consume a binding table entry */
break;
case VK_DESCRIPTOR_TYPE_COMBINED_IMAGE_SAMPLER:
if (anv_descriptor_data_supports_bindless(pdevice,
pCreateInfo->flags,
desc_data))
break;
if (binding->pImmutableSamplers) {
for (uint32_t i = 0; i < binding->descriptorCount; i++) {
ANV_FROM_HANDLE(anv_sampler, sampler,
binding->pImmutableSamplers[i]);
anv_foreach_stage(s, binding->stageFlags)
surface_count[s] += sampler->n_planes;
}
} else {
anv_foreach_stage(s, binding->stageFlags)
surface_count[s] += binding->descriptorCount;
}
break;
default:
if (anv_descriptor_data_supports_bindless(pdevice,
pCreateInfo->flags,
desc_data))
break;
anv_foreach_stage(s, binding->stageFlags)
surface_count[s] += binding->descriptorCount;
break;
}
}
for (unsigned s = 0; s < ARRAY_SIZE(surface_count); s++) {
if (needs_descriptor_buffer)
surface_count[s] += 1;
}
VkDescriptorSetVariableDescriptorCountLayoutSupport *vdcls =
vk_find_struct(pSupport->pNext,
DESCRIPTOR_SET_VARIABLE_DESCRIPTOR_COUNT_LAYOUT_SUPPORT);
if (vdcls != NULL) {
if (varying_desc_type == VK_DESCRIPTOR_TYPE_INLINE_UNIFORM_BLOCK) {
vdcls->maxVariableDescriptorCount = MAX_INLINE_UNIFORM_BLOCK_SIZE;
} else if (varying_desc_type != VK_DESCRIPTOR_TYPE_MAX_ENUM) {
vdcls->maxVariableDescriptorCount = UINT16_MAX;
} else {
vdcls->maxVariableDescriptorCount = 0;
}
}
bool supported = true;
for (unsigned s = 0; s < ARRAY_SIZE(surface_count); s++) {
/* Our maximum binding table size is 240 and we need to reserve 8 for
* render targets.
*/
if (surface_count[s] > MAX_BINDING_TABLE_SIZE - MAX_RTS)
supported = false;
}
pSupport->supported = supported;
}
VkResult anv_CreateDescriptorSetLayout(
VkDevice _device,
const VkDescriptorSetLayoutCreateInfo* pCreateInfo,
const VkAllocationCallbacks* pAllocator,
VkDescriptorSetLayout* pSetLayout)
{
ANV_FROM_HANDLE(anv_device, device, _device);
assert(pCreateInfo->sType == VK_STRUCTURE_TYPE_DESCRIPTOR_SET_LAYOUT_CREATE_INFO);
uint32_t num_bindings = 0;
uint32_t immutable_sampler_count = 0;
for (uint32_t j = 0; j < pCreateInfo->bindingCount; j++) {
num_bindings = MAX2(num_bindings, pCreateInfo->pBindings[j].binding + 1);
/* From the Vulkan 1.1.97 spec for VkDescriptorSetLayoutBinding:
*
* "If descriptorType specifies a VK_DESCRIPTOR_TYPE_SAMPLER or
* VK_DESCRIPTOR_TYPE_COMBINED_IMAGE_SAMPLER type descriptor, then
* pImmutableSamplers can be used to initialize a set of immutable
* samplers. [...] If descriptorType is not one of these descriptor
* types, then pImmutableSamplers is ignored.
*
* We need to be careful here and only parse pImmutableSamplers if we
* have one of the right descriptor types.
*/
VkDescriptorType desc_type = pCreateInfo->pBindings[j].descriptorType;
if ((desc_type == VK_DESCRIPTOR_TYPE_SAMPLER ||
desc_type == VK_DESCRIPTOR_TYPE_COMBINED_IMAGE_SAMPLER) &&
pCreateInfo->pBindings[j].pImmutableSamplers)
immutable_sampler_count += pCreateInfo->pBindings[j].descriptorCount;
}
/* We need to allocate descriptor set layouts off the device allocator
* with DEVICE scope because they are reference counted and may not be
* destroyed when vkDestroyDescriptorSetLayout is called.
*/
VK_MULTIALLOC(ma);
VK_MULTIALLOC_DECL(&ma, struct anv_descriptor_set_layout, set_layout, 1);
VK_MULTIALLOC_DECL(&ma, struct anv_descriptor_set_binding_layout,
bindings, num_bindings);
VK_MULTIALLOC_DECL(&ma, struct anv_sampler *, samplers,
immutable_sampler_count);
if (!vk_object_multizalloc(&device->vk, &ma, NULL,
VK_OBJECT_TYPE_DESCRIPTOR_SET_LAYOUT))
return vk_error(device, VK_ERROR_OUT_OF_HOST_MEMORY);
set_layout->ref_cnt = 1;
set_layout->binding_count = num_bindings;
set_layout->flags = pCreateInfo->flags;
set_layout->type = anv_descriptor_set_layout_type_for_flags(device->physical,
pCreateInfo);
for (uint32_t b = 0; b < num_bindings; b++) {
/* Initialize all binding_layout entries to -1 */
memset(&set_layout->binding[b], -1, sizeof(set_layout->binding[b]));
set_layout->binding[b].flags = 0;
set_layout->binding[b].data = 0;
set_layout->binding[b].max_plane_count = 0;
set_layout->binding[b].array_size = 0;
set_layout->binding[b].immutable_samplers = NULL;
}
/* Initialize all samplers to 0 */
assert((samplers == NULL) == (immutable_sampler_count == 0));
if (samplers != NULL) {
memset(samplers, 0, immutable_sampler_count * sizeof(*samplers));
}
uint32_t buffer_view_count = 0;
uint32_t dynamic_offset_count = 0;
uint32_t descriptor_buffer_surface_size = 0;
uint32_t descriptor_buffer_sampler_size = 0;
uint32_t sampler_count = 0;
for (uint32_t j = 0; j < pCreateInfo->bindingCount; j++) {
const VkDescriptorSetLayoutBinding *binding = &pCreateInfo->pBindings[j];
uint32_t b = binding->binding;
/* We temporarily store the pCreateInfo->pBindings[] index (plus one) in the
* immutable_samplers pointer. This provides us with a quick-and-dirty
* way to sort the bindings by binding number.
*/
set_layout->binding[b].immutable_samplers = (void *)(uintptr_t)(j + 1);
}
const VkDescriptorSetLayoutBindingFlagsCreateInfo *binding_flags_info =
vk_find_struct_const(pCreateInfo->pNext,
DESCRIPTOR_SET_LAYOUT_BINDING_FLAGS_CREATE_INFO);
const VkMutableDescriptorTypeCreateInfoEXT *mutable_info =
vk_find_struct_const(pCreateInfo->pNext,
MUTABLE_DESCRIPTOR_TYPE_CREATE_INFO_EXT);
for (uint32_t b = 0; b < num_bindings; b++) {
/* We stashed the pCreateInfo->pBindings[] index (plus one) in the
* immutable_samplers pointer. Check for NULL (empty binding) and then
* reset it and compute the index.
*/
if (set_layout->binding[b].immutable_samplers == NULL)
continue;
const uint32_t info_idx =
(uintptr_t)(void *)set_layout->binding[b].immutable_samplers - 1;
set_layout->binding[b].immutable_samplers = NULL;
const VkDescriptorSetLayoutBinding *binding =
&pCreateInfo->pBindings[info_idx];
if (binding->descriptorCount == 0)
continue;
set_layout->binding[b].type = binding->descriptorType;
if (binding_flags_info && binding_flags_info->bindingCount > 0) {
assert(binding_flags_info->bindingCount == pCreateInfo->bindingCount);
set_layout->binding[b].flags =
binding_flags_info->pBindingFlags[info_idx];
/* From the Vulkan spec:
*
* "If VkDescriptorSetLayoutCreateInfo::flags includes
* VK_DESCRIPTOR_SET_LAYOUT_CREATE_PUSH_DESCRIPTOR_BIT_KHR, then
* all elements of pBindingFlags must not include
* VK_DESCRIPTOR_BINDING_UPDATE_AFTER_BIND_BIT,
* VK_DESCRIPTOR_BINDING_UPDATE_UNUSED_WHILE_PENDING_BIT, or
* VK_DESCRIPTOR_BINDING_VARIABLE_DESCRIPTOR_COUNT_BIT"
*/
if (pCreateInfo->flags &
VK_DESCRIPTOR_SET_LAYOUT_CREATE_PUSH_DESCRIPTOR_BIT_KHR) {
assert(!(set_layout->binding[b].flags &
(VK_DESCRIPTOR_BINDING_UPDATE_AFTER_BIND_BIT |
VK_DESCRIPTOR_BINDING_UPDATE_UNUSED_WHILE_PENDING_BIT |
VK_DESCRIPTOR_BINDING_VARIABLE_DESCRIPTOR_COUNT_BIT)));
}
}
set_layout->binding[b].data =
binding->descriptorType == VK_DESCRIPTOR_TYPE_MUTABLE_EXT ?
anv_descriptor_data_for_mutable_type(device->physical,
set_layout->type,
pCreateInfo->flags,
mutable_info, b) :
anv_descriptor_data_for_type(device->physical,
set_layout->type,
pCreateInfo->flags,
binding->descriptorType);
set_layout->binding[b].array_size = binding->descriptorCount;
set_layout->binding[b].descriptor_index = set_layout->descriptor_count;
set_layout->descriptor_count += binding->descriptorCount;
if (set_layout->binding[b].data & ANV_DESCRIPTOR_BUFFER_VIEW) {
set_layout->binding[b].buffer_view_index = buffer_view_count;
buffer_view_count += binding->descriptorCount;
}
set_layout->binding[b].max_plane_count = 1;
switch (binding->descriptorType) {
case VK_DESCRIPTOR_TYPE_SAMPLER:
case VK_DESCRIPTOR_TYPE_COMBINED_IMAGE_SAMPLER:
case VK_DESCRIPTOR_TYPE_MUTABLE_EXT:
if (binding->pImmutableSamplers) {
set_layout->binding[b].immutable_samplers = samplers;
samplers += binding->descriptorCount;
for (uint32_t i = 0; i < binding->descriptorCount; i++) {
ANV_FROM_HANDLE(anv_sampler, sampler,
binding->pImmutableSamplers[i]);
set_layout->binding[b].immutable_samplers[i] = sampler;
if (set_layout->binding[b].max_plane_count < sampler->n_planes)
set_layout->binding[b].max_plane_count = sampler->n_planes;
}
}
break;
default:
break;
}
switch (binding->descriptorType) {
case VK_DESCRIPTOR_TYPE_UNIFORM_BUFFER_DYNAMIC:
case VK_DESCRIPTOR_TYPE_STORAGE_BUFFER_DYNAMIC:
set_layout->binding[b].dynamic_offset_index = dynamic_offset_count;
set_layout->dynamic_offset_stages[dynamic_offset_count] = binding->stageFlags;
dynamic_offset_count += binding->descriptorCount;
assert(dynamic_offset_count < MAX_DYNAMIC_BUFFERS);
break;
default:
break;
}
if (binding->descriptorType == VK_DESCRIPTOR_TYPE_MUTABLE_EXT) {
anv_descriptor_size_for_mutable_type(
device->physical, set_layout->type,
pCreateInfo->flags, mutable_info, b,
&set_layout->binding[b].descriptor_data_surface_size,
&set_layout->binding[b].descriptor_data_sampler_size);
} else {
anv_descriptor_size(&set_layout->binding[b],
set_layout->type,
&set_layout->binding[b].descriptor_data_surface_size,
&set_layout->binding[b].descriptor_data_sampler_size);
}
/* For multi-planar bindings, we make every descriptor consume the maximum
* number of planes so we don't have to bother with walking arrays and
* adding things up every time. Fortunately, YCbCr samplers aren't all
* that common and likely won't be in the middle of big arrays.
*/
set_layout->binding[b].descriptor_surface_stride =
set_layout->binding[b].max_plane_count *
set_layout->binding[b].descriptor_data_surface_size;
set_layout->binding[b].descriptor_sampler_stride =
set_layout->binding[b].max_plane_count *
set_layout->binding[b].descriptor_data_sampler_size;
if (binding->descriptorType == VK_DESCRIPTOR_TYPE_SAMPLER) {
sampler_count += binding->descriptorCount *
set_layout->binding[b].max_plane_count;
}
unsigned surface_align, sampler_align;
anv_descriptor_data_alignment(set_layout->binding[b].data,
set_layout->type,
&surface_align,
&sampler_align);
descriptor_buffer_surface_size =
align(descriptor_buffer_surface_size, surface_align);
descriptor_buffer_sampler_size =
align(descriptor_buffer_sampler_size, sampler_align);
if (binding->descriptorType == VK_DESCRIPTOR_TYPE_INLINE_UNIFORM_BLOCK) {
set_layout->binding[b].descriptor_surface_offset = descriptor_buffer_surface_size;
descriptor_buffer_surface_size += binding->descriptorCount;
} else {
set_layout->binding[b].descriptor_surface_offset = descriptor_buffer_surface_size;
descriptor_buffer_surface_size +=
set_layout->binding[b].descriptor_surface_stride * binding->descriptorCount;
}
set_layout->binding[b].descriptor_sampler_offset = descriptor_buffer_sampler_size;
descriptor_buffer_sampler_size +=
set_layout->binding[b].descriptor_sampler_stride * binding->descriptorCount;
set_layout->shader_stages |= binding->stageFlags;
}
/* Sanity checks */
assert(descriptor_buffer_sampler_size == 0 ||
set_layout->type == ANV_PIPELINE_DESCRIPTOR_SET_LAYOUT_TYPE_DIRECT);
set_layout->buffer_view_count = buffer_view_count;
set_layout->dynamic_offset_count = dynamic_offset_count;
set_layout->descriptor_buffer_surface_size = descriptor_buffer_surface_size;
set_layout->descriptor_buffer_sampler_size = descriptor_buffer_sampler_size;
if (pCreateInfo->flags &
VK_DESCRIPTOR_SET_LAYOUT_CREATE_EMBEDDED_IMMUTABLE_SAMPLERS_BIT_EXT) {
assert(set_layout->descriptor_buffer_surface_size == 0);
assert(set_layout->descriptor_buffer_sampler_size == 0);
set_layout->embedded_sampler_count = sampler_count;
}
*pSetLayout = anv_descriptor_set_layout_to_handle(set_layout);
return VK_SUCCESS;
}
void
anv_descriptor_set_layout_destroy(struct anv_device *device,
struct anv_descriptor_set_layout *layout)
{
assert(layout->ref_cnt == 0);
vk_object_free(&device->vk, NULL, layout);
}
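/* Returns the last binding of the layout if it has the variable descriptor
* count flag, NULL otherwise.
*/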
static const struct anv_descriptor_set_binding_layout *
set_layout_dynamic_binding(const struct anv_descriptor_set_layout *set_layout)
{
if (set_layout->binding_count == 0)
return NULL;
const struct anv_descriptor_set_binding_layout *last_binding =
&set_layout->binding[set_layout->binding_count - 1];
if (!(last_binding->flags & VK_DESCRIPTOR_BINDING_VARIABLE_DESCRIPTOR_COUNT_BIT))
return NULL;
return last_binding;
}
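/* Number of descriptors in a set with the given layout, taking the
* variable descriptor count of the last binding into account.
*/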
static uint32_t
set_layout_descriptor_count(const struct anv_descriptor_set_layout *set_layout,
uint32_t var_desc_count)
{
const struct anv_descriptor_set_binding_layout *dynamic_binding =
set_layout_dynamic_binding(set_layout);
if (dynamic_binding == NULL)
return set_layout->descriptor_count;
assert(var_desc_count <= dynamic_binding->array_size);
uint32_t shrink = dynamic_binding->array_size - var_desc_count;
if (dynamic_binding->type == VK_DESCRIPTOR_TYPE_INLINE_UNIFORM_BLOCK)
return set_layout->descriptor_count;
return set_layout->descriptor_count - shrink;
}
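/* Number of buffer views in a set with the given layout, taking the
* variable descriptor count of the last binding into account.
*/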
static uint32_t
set_layout_buffer_view_count(const struct anv_descriptor_set_layout *set_layout,
uint32_t var_desc_count)
{
const struct anv_descriptor_set_binding_layout *dynamic_binding =
set_layout_dynamic_binding(set_layout);
if (dynamic_binding == NULL)
return set_layout->buffer_view_count;
assert(var_desc_count <= dynamic_binding->array_size);
uint32_t shrink = dynamic_binding->array_size - var_desc_count;
if (!(dynamic_binding->data & ANV_DESCRIPTOR_BUFFER_VIEW))
return set_layout->buffer_view_count;
return set_layout->buffer_view_count - shrink;
}
static bool
anv_descriptor_set_layout_empty(const struct anv_descriptor_set_layout *set_layout)
{
return set_layout->binding_count == 0;
}
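/* Computes the descriptor buffer surface & sampler sizes (in bytes) needed
* by a set with the given layout and variable descriptor count.
*/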
static void
anv_descriptor_set_layout_descriptor_buffer_size(const struct anv_descriptor_set_layout *set_layout,
uint32_t var_desc_count,
uint32_t *out_surface_size,
uint32_t *out_sampler_size)
{
const struct anv_descriptor_set_binding_layout *dynamic_binding =
set_layout_dynamic_binding(set_layout);
if (dynamic_binding == NULL) {
*out_surface_size = ALIGN(set_layout->descriptor_buffer_surface_size,
ANV_UBO_ALIGNMENT);
*out_sampler_size = set_layout->descriptor_buffer_sampler_size;
return;
}
assert(var_desc_count <= dynamic_binding->array_size);
uint32_t shrink = dynamic_binding->array_size - var_desc_count;
uint32_t set_surface_size, set_sampler_size;
if (dynamic_binding->type == VK_DESCRIPTOR_TYPE_INLINE_UNIFORM_BLOCK) {
/* Inline uniform blocks are specified to use the descriptor array
* size as the size in bytes of the block.
*/
set_surface_size = set_layout->descriptor_buffer_surface_size - shrink;
set_sampler_size = 0;
} else {
set_surface_size =
set_layout->descriptor_buffer_surface_size > 0 ?
(set_layout->descriptor_buffer_surface_size -
shrink * dynamic_binding->descriptor_surface_stride) : 0;
set_sampler_size =
set_layout->descriptor_buffer_sampler_size > 0 ?
(set_layout->descriptor_buffer_sampler_size -
shrink * dynamic_binding->descriptor_sampler_stride) : 0;
}
*out_surface_size = ALIGN(set_surface_size, ANV_UBO_ALIGNMENT);
*out_sampler_size = set_sampler_size;
}
void anv_DestroyDescriptorSetLayout(
VkDevice _device,
VkDescriptorSetLayout _set_layout,
const VkAllocationCallbacks* pAllocator)
{
ANV_FROM_HANDLE(anv_device, device, _device);
ANV_FROM_HANDLE(anv_descriptor_set_layout, set_layout, _set_layout);
if (!set_layout)
return;
anv_descriptor_set_layout_unref(device, set_layout);
}
void
anv_descriptor_set_layout_print(const struct anv_descriptor_set_layout *layout)
{
fprintf(stderr, "set layout:\n");
for (uint32_t b = 0; b < layout->binding_count; b++) {
fprintf(stderr, " binding%03u: offsets=0x%08x/0x%08x sizes=%04u/%04u strides=%03u/%03u planes=%hhu count=%03u\n",
b,
layout->binding[b].descriptor_surface_offset,
layout->binding[b].descriptor_sampler_offset,
layout->binding[b].descriptor_data_surface_size,
layout->binding[b].descriptor_data_sampler_size,
layout->binding[b].descriptor_surface_stride,
layout->binding[b].descriptor_sampler_stride,
layout->binding[b].max_plane_count,
layout->binding[b].array_size);
}
}
#define SHA1_UPDATE_VALUE(ctx, x) _mesa_sha1_update(ctx, &(x), sizeof(x));
static void
sha1_update_immutable_sampler(struct mesa_sha1 *ctx,
bool embedded_sampler,
const struct anv_sampler *sampler)
{
if (!sampler->vk.ycbcr_conversion)
return;
/* Hash the conversion, if any, as it affects the placement of descriptors
* in the set due to the number of planes.
*/
SHA1_UPDATE_VALUE(ctx, sampler->vk.ycbcr_conversion->state);
/* For embedded samplers, we need to hash the sampler parameters as the
* sampler handle is baked into the shader and this ultimately is part of
* the shader hash key. We can only consider two shaders identical if all
* their embedded sampler parameters are identical.
*/
if (embedded_sampler)
SHA1_UPDATE_VALUE(ctx, sampler->sha1);
}
static void
sha1_update_descriptor_set_binding_layout(struct mesa_sha1 *ctx,
bool embedded_samplers,
const struct anv_descriptor_set_binding_layout *layout)
{
SHA1_UPDATE_VALUE(ctx, layout->flags);
SHA1_UPDATE_VALUE(ctx, layout->data);
SHA1_UPDATE_VALUE(ctx, layout->max_plane_count);
SHA1_UPDATE_VALUE(ctx, layout->array_size);
SHA1_UPDATE_VALUE(ctx, layout->descriptor_index);
SHA1_UPDATE_VALUE(ctx, layout->dynamic_offset_index);
SHA1_UPDATE_VALUE(ctx, layout->buffer_view_index);
SHA1_UPDATE_VALUE(ctx, layout->descriptor_surface_offset);
SHA1_UPDATE_VALUE(ctx, layout->descriptor_sampler_offset);
if (layout->immutable_samplers) {
for (uint16_t i = 0; i < layout->array_size; i++) {
sha1_update_immutable_sampler(ctx, embedded_samplers,
layout->immutable_samplers[i]);
}
}
}
static void
sha1_update_descriptor_set_layout(struct mesa_sha1 *ctx,
const struct anv_descriptor_set_layout *layout)
{
SHA1_UPDATE_VALUE(ctx, layout->flags);
SHA1_UPDATE_VALUE(ctx, layout->binding_count);
SHA1_UPDATE_VALUE(ctx, layout->descriptor_count);
SHA1_UPDATE_VALUE(ctx, layout->shader_stages);
SHA1_UPDATE_VALUE(ctx, layout->buffer_view_count);
SHA1_UPDATE_VALUE(ctx, layout->dynamic_offset_count);
SHA1_UPDATE_VALUE(ctx, layout->descriptor_buffer_surface_size);
SHA1_UPDATE_VALUE(ctx, layout->descriptor_buffer_sampler_size);
bool embedded_samplers =
layout->flags & VK_DESCRIPTOR_SET_LAYOUT_CREATE_EMBEDDED_IMMUTABLE_SAMPLERS_BIT_EXT;
for (uint16_t i = 0; i < layout->binding_count; i++) {
sha1_update_descriptor_set_binding_layout(ctx, embedded_samplers,
&layout->binding[i]);
}
}
/*
* Pipeline layouts. These have nothing to do with the pipeline. They are
* just multiple descriptor set layouts pasted together.
*/
void
anv_pipeline_sets_layout_init(struct anv_pipeline_sets_layout *layout,
struct anv_device *device,
bool independent_sets)
{
memset(layout, 0, sizeof(*layout));
layout->device = device;
layout->push_descriptor_set_index = -1;
layout->independent_sets = independent_sets;
}
void
anv_pipeline_sets_layout_add(struct anv_pipeline_sets_layout *layout,
uint32_t set_idx,
struct anv_descriptor_set_layout *set_layout)
{
if (layout->set[set_idx].layout)
return;
/* Workaround for internal CTS issue 3584 */
if (layout->independent_sets && anv_descriptor_set_layout_empty(set_layout))
return;
if (layout->type == ANV_PIPELINE_DESCRIPTOR_SET_LAYOUT_TYPE_UNKNOWN)
layout->type = set_layout->type;
else
assert(layout->type == set_layout->type);
layout->num_sets = MAX2(set_idx + 1, layout->num_sets);
layout->set[set_idx].layout =
anv_descriptor_set_layout_ref(set_layout);
layout->set[set_idx].dynamic_offset_start = layout->num_dynamic_buffers;
layout->num_dynamic_buffers += set_layout->dynamic_offset_count;
assert(layout->num_dynamic_buffers < MAX_DYNAMIC_BUFFERS);
if (set_layout->flags &
VK_DESCRIPTOR_SET_LAYOUT_CREATE_PUSH_DESCRIPTOR_BIT_KHR) {
assert(layout->push_descriptor_set_index == -1);
layout->push_descriptor_set_index = set_idx;
}
}
uint32_t
anv_pipeline_sets_layout_embedded_sampler_count(const struct anv_pipeline_sets_layout *layout)
{
uint32_t count = 0;
for (unsigned s = 0; s < layout->num_sets; s++) {
if (!layout->set[s].layout)
continue;
count += layout->set[s].layout->embedded_sampler_count;
}
return count;
}
void
anv_pipeline_sets_layout_hash(struct anv_pipeline_sets_layout *layout)
{
struct mesa_sha1 ctx;
_mesa_sha1_init(&ctx);
for (unsigned s = 0; s < layout->num_sets; s++) {
if (!layout->set[s].layout)
continue;
sha1_update_descriptor_set_layout(&ctx, layout->set[s].layout);
_mesa_sha1_update(&ctx, &layout->set[s].dynamic_offset_start,
sizeof(layout->set[s].dynamic_offset_start));
}
_mesa_sha1_update(&ctx, &layout->num_sets, sizeof(layout->num_sets));
_mesa_sha1_final(&ctx, layout->sha1);
}
void
anv_pipeline_sets_layout_fini(struct anv_pipeline_sets_layout *layout)
{
for (unsigned s = 0; s < layout->num_sets; s++) {
if (!layout->set[s].layout)
continue;
anv_descriptor_set_layout_unref(layout->device, layout->set[s].layout);
}
}
void
anv_pipeline_sets_layout_print(const struct anv_pipeline_sets_layout *layout)
{
fprintf(stderr, "layout: dyn_count=%u sets=%u ind=%u\n",
layout->num_dynamic_buffers,
layout->num_sets,
layout->independent_sets);
for (unsigned s = 0; s < layout->num_sets; s++) {
if (!layout->set[s].layout)
continue;
fprintf(stderr, " set%i: dyn_start=%u flags=0x%x\n",
s, layout->set[s].dynamic_offset_start, layout->set[s].layout->flags);
}
}
VkResult anv_CreatePipelineLayout(
VkDevice _device,
const VkPipelineLayoutCreateInfo* pCreateInfo,
const VkAllocationCallbacks* pAllocator,
VkPipelineLayout* pPipelineLayout)
{
ANV_FROM_HANDLE(anv_device, device, _device);
struct anv_pipeline_layout *layout;
assert(pCreateInfo->sType == VK_STRUCTURE_TYPE_PIPELINE_LAYOUT_CREATE_INFO);
layout = vk_object_zalloc(&device->vk, pAllocator, sizeof(*layout),
VK_OBJECT_TYPE_PIPELINE_LAYOUT);
if (layout == NULL)
return vk_error(device, VK_ERROR_OUT_OF_HOST_MEMORY);
anv_pipeline_sets_layout_init(&layout->sets_layout, device,
pCreateInfo->flags & VK_PIPELINE_LAYOUT_CREATE_INDEPENDENT_SETS_BIT_EXT);
for (uint32_t set = 0; set < pCreateInfo->setLayoutCount; set++) {
ANV_FROM_HANDLE(anv_descriptor_set_layout, set_layout,
pCreateInfo->pSetLayouts[set]);
/* VUID-VkPipelineLayoutCreateInfo-graphicsPipelineLibrary-06753
*
* "If graphicsPipelineLibrary is not enabled, elements of
* pSetLayouts must be valid VkDescriptorSetLayout objects"
*
* As a result of supporting graphicsPipelineLibrary, we need to allow
* null descriptor set layouts.
*/
if (set_layout == NULL)
continue;
anv_pipeline_sets_layout_add(&layout->sets_layout, set, set_layout);
}
anv_pipeline_sets_layout_hash(&layout->sets_layout);
*pPipelineLayout = anv_pipeline_layout_to_handle(layout);
return VK_SUCCESS;
}
void anv_DestroyPipelineLayout(
VkDevice _device,
VkPipelineLayout _pipelineLayout,
const VkAllocationCallbacks* pAllocator)
{
ANV_FROM_HANDLE(anv_device, device, _device);
ANV_FROM_HANDLE(anv_pipeline_layout, layout, _pipelineLayout);
if (!layout)
return;
anv_pipeline_sets_layout_fini(&layout->sets_layout);
vk_object_free(&device->vk, pAllocator, layout);
}
/*
* Descriptor pools.
*
* These are implemented using a big pool of memory and a vma heap for the
* host memory allocations, plus a state_stream and a free list for the
* buffer view surface states. The spec allows us to fail to allocate due to
* fragmentation in all cases but two: 1) after pool reset, allocating up
* until the pool size with no freeing must succeed and 2) allocating and
* freeing only descriptor sets with the same layout. Case 1) is easy enough,
* and the vma heap ensures case 2).
*/
/* The vma heap reserves 0 to mean NULL; we have to offset by some amount to
* ensure we can allocate the entire BO without hitting zero. The actual
* amount doesn't matter.
*/
#define POOL_HEAP_OFFSET 64
#define EMPTY 1
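/* Initializes one of the pool's descriptor heaps. Host-only pools use
* plain host memory, otherwise the heap is backed by a mapped BO. With
* direct descriptors, surfaces and samplers live in separate heaps/BOs.
*/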
static VkResult
anv_descriptor_pool_heap_init(struct anv_device *device,
struct anv_descriptor_pool_heap *heap,
uint32_t size,
bool host_only,
bool samplers)
{
if (size == 0)
return VK_SUCCESS;
if (host_only) {
heap->size = size;
heap->host_mem = vk_zalloc(&device->vk.alloc, size, 8,
VK_SYSTEM_ALLOCATION_SCOPE_OBJECT);
if (heap->host_mem == NULL)
return vk_error(device, VK_ERROR_OUT_OF_HOST_MEMORY);
} else {
const char *bo_name =
device->physical->indirect_descriptors ? "indirect descriptors" :
samplers ? "direct sampler" : "direct surfaces";
heap->size = align(size, 4096);
VkResult result = anv_device_alloc_bo(device,
bo_name, heap->size,
ANV_BO_ALLOC_CAPTURE |
ANV_BO_ALLOC_MAPPED |
ANV_BO_ALLOC_HOST_CACHED_COHERENT |
(samplers ?
ANV_BO_ALLOC_DYNAMIC_VISIBLE_POOL :
ANV_BO_ALLOC_DESCRIPTOR_POOL),
0 /* explicit_address */,
&heap->bo);
if (result != VK_SUCCESS)
return vk_error(device, VK_ERROR_OUT_OF_DEVICE_MEMORY);
}
util_vma_heap_init(&heap->heap, POOL_HEAP_OFFSET, heap->size);
return VK_SUCCESS;
}
static void
anv_descriptor_pool_heap_fini(struct anv_device *device,
struct anv_descriptor_pool_heap *heap)
{
if (heap->size == 0)
return;
util_vma_heap_finish(&heap->heap);
if (heap->bo)
anv_device_release_bo(device, heap->bo);
if (heap->host_mem)
vk_free(&device->vk.alloc, heap->host_mem);
}
static void
anv_descriptor_pool_heap_reset(struct anv_device *device,
struct anv_descriptor_pool_heap *heap)
{
if (heap->size == 0)
return;
util_vma_heap_finish(&heap->heap);
util_vma_heap_init(&heap->heap, POOL_HEAP_OFFSET, heap->size);
}
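/* Allocates a chunk out of a pool heap. Returns OUT_OF_POOL_MEMORY if the
* heap doesn't have enough space left, FRAGMENTED_POOL if it does but the
* allocation failed due to fragmentation.
*/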
static VkResult
anv_descriptor_pool_heap_alloc(struct anv_descriptor_pool *pool,
struct anv_descriptor_pool_heap *heap,
uint32_t size, uint32_t alignment,
struct anv_state *state)
{
uint64_t pool_vma_offset =
util_vma_heap_alloc(&heap->heap, size, alignment);
if (pool_vma_offset == 0) {
if (size > heap->size - heap->alloc_size)
return vk_error(pool, VK_ERROR_OUT_OF_POOL_MEMORY);
else
return vk_error(pool, VK_ERROR_FRAGMENTED_POOL);
}
assert(pool_vma_offset >= POOL_HEAP_OFFSET &&
pool_vma_offset - POOL_HEAP_OFFSET <= INT32_MAX);
state->offset = pool_vma_offset - POOL_HEAP_OFFSET;
state->alloc_size = size;
if (heap->host_mem)
state->map = heap->host_mem + state->offset;
else
state->map = heap->bo->map + state->offset;
heap->alloc_size += size;
return VK_SUCCESS;
}
static void
anv_descriptor_pool_heap_free(struct anv_descriptor_pool_heap *heap,
struct anv_state state)
{
heap->alloc_size -= state.alloc_size;
util_vma_heap_free(&heap->heap,
(uint64_t)state.offset + POOL_HEAP_OFFSET,
state.alloc_size);
}
VkResult anv_CreateDescriptorPool(
VkDevice _device,
const VkDescriptorPoolCreateInfo* pCreateInfo,
const VkAllocationCallbacks* pAllocator,
VkDescriptorPool* pDescriptorPool)
{
ANV_FROM_HANDLE(anv_device, device, _device);
struct anv_descriptor_pool *pool;
const VkDescriptorPoolInlineUniformBlockCreateInfo *inline_info =
vk_find_struct_const(pCreateInfo->pNext,
DESCRIPTOR_POOL_INLINE_UNIFORM_BLOCK_CREATE_INFO);
const VkMutableDescriptorTypeCreateInfoEXT *mutable_info =
vk_find_struct_const(pCreateInfo->pNext,
MUTABLE_DESCRIPTOR_TYPE_CREATE_INFO_EXT);
uint32_t descriptor_count = 0;
uint32_t buffer_view_count = 0;
uint32_t descriptor_bo_surface_size = 0;
uint32_t descriptor_bo_sampler_size = 0;
const enum anv_descriptor_set_layout_type layout_type =
device->physical->indirect_descriptors ?
ANV_PIPELINE_DESCRIPTOR_SET_LAYOUT_TYPE_INDIRECT :
ANV_PIPELINE_DESCRIPTOR_SET_LAYOUT_TYPE_DIRECT;
/* Work around application bugs when we're allocating surfaces & samplers
* in separate heaps (!indirect_descriptors). Some applications specify too
* small a sampler count and we might otherwise fail allocations in
* vkAllocateDescriptorSets().
*
* Find the highest count across all descriptor types and use that for
* samplers.
*/
uint32_t max_descriptor_count = 0;
if (device->physical->instance->anv_upper_bound_descriptor_pool_sampler &&
!device->physical->indirect_descriptors) {
for (uint32_t i = 0; i < pCreateInfo->poolSizeCount; i++) {
max_descriptor_count = MAX2(pCreateInfo->pPoolSizes[i].descriptorCount,
max_descriptor_count);
}
}
for (uint32_t i = 0; i < pCreateInfo->poolSizeCount; i++) {
enum anv_descriptor_data desc_data =
pCreateInfo->pPoolSizes[i].type == VK_DESCRIPTOR_TYPE_MUTABLE_EXT ?
anv_descriptor_data_for_mutable_type(device->physical, layout_type,
pCreateInfo->flags,
mutable_info, i) :
anv_descriptor_data_for_type(device->physical, layout_type,
pCreateInfo->flags,
pCreateInfo->pPoolSizes[i].type);
if (desc_data & ANV_DESCRIPTOR_BUFFER_VIEW)
buffer_view_count += pCreateInfo->pPoolSizes[i].descriptorCount;
uint16_t desc_surface_size, desc_sampler_size;
if (pCreateInfo->pPoolSizes[i].type == VK_DESCRIPTOR_TYPE_MUTABLE_EXT) {
anv_descriptor_size_for_mutable_type(device->physical, layout_type,
pCreateInfo->flags, mutable_info, i,
&desc_surface_size, &desc_sampler_size);
} else {
anv_descriptor_data_size(desc_data, layout_type,
&desc_surface_size, &desc_sampler_size);
}
uint32_t desc_data_surface_size =
desc_surface_size * pCreateInfo->pPoolSizes[i].descriptorCount;
uint32_t desc_data_sampler_size =
desc_sampler_size * MAX2(max_descriptor_count,
pCreateInfo->pPoolSizes[i].descriptorCount);
/* Combined image sampler descriptors can take up to 3 slots if they
* hold a YCbCr image.
*/
if (pCreateInfo->pPoolSizes[i].type ==
VK_DESCRIPTOR_TYPE_COMBINED_IMAGE_SAMPLER) {
desc_data_surface_size *= 3;
desc_data_sampler_size *= 3;
}
if (pCreateInfo->pPoolSizes[i].type ==
VK_DESCRIPTOR_TYPE_INLINE_UNIFORM_BLOCK) {
/* Inline uniform blocks are specified to use the descriptor array
* size as the size in bytes of the block.
*/
assert(inline_info);
desc_data_surface_size += pCreateInfo->pPoolSizes[i].descriptorCount;
}
descriptor_bo_surface_size += desc_data_surface_size;
descriptor_bo_sampler_size += desc_data_sampler_size;
descriptor_count += pCreateInfo->pPoolSizes[i].descriptorCount;
}
/* We have to align descriptor buffer allocations to 32B so that we can
* push descriptor buffers. This means that each descriptor buffer
* allocated may burn up to 32B of extra space to get the right alignment.
* (Technically, it's at most 28B because we're always going to start at
* least 4B aligned but we're being conservative here.) Allocate enough
* extra space that we can chop it into maxSets pieces and align each one
* of them to 32B.
*/
descriptor_bo_surface_size += ANV_UBO_ALIGNMENT * pCreateInfo->maxSets;
/* We align inline uniform blocks to ANV_UBO_ALIGNMENT */
if (inline_info) {
descriptor_bo_surface_size +=
ANV_UBO_ALIGNMENT * inline_info->maxInlineUniformBlockBindings;
}
const bool host_only =
pCreateInfo->flags & VK_DESCRIPTOR_POOL_CREATE_HOST_ONLY_BIT_EXT;
/* For host_only pools, allocate some memory to hold the written surface
* states of the internal anv_buffer_view. With normal pools, the memory
* holding surface state is allocated from the device surface_state_pool.
*/
const size_t host_mem_size =
pCreateInfo->maxSets * sizeof(struct anv_descriptor_set) +
descriptor_count * sizeof(struct anv_descriptor) +
buffer_view_count * sizeof(struct anv_buffer_view) +
(host_only ? buffer_view_count * ANV_SURFACE_STATE_SIZE : 0);
pool = vk_object_zalloc(&device->vk, pAllocator,
sizeof(*pool) + host_mem_size,
VK_OBJECT_TYPE_DESCRIPTOR_POOL);
if (!pool)
return vk_error(device, VK_ERROR_OUT_OF_HOST_MEMORY);
pool->host_mem_size = host_mem_size;
util_vma_heap_init(&pool->host_heap, POOL_HEAP_OFFSET, host_mem_size);
pool->host_only = host_only;
VkResult result = anv_descriptor_pool_heap_init(device,
&pool->surfaces,
descriptor_bo_surface_size,
pool->host_only,
false /* samplers */);
if (result != VK_SUCCESS) {
vk_object_free(&device->vk, pAllocator, pool);
return result;
}
result = anv_descriptor_pool_heap_init(device,
&pool->samplers,
descriptor_bo_sampler_size,
pool->host_only,
true /* samplers */);
if (result != VK_SUCCESS) {
anv_descriptor_pool_heap_fini(device, &pool->surfaces);
vk_object_free(&device->vk, pAllocator, pool);
return result;
}
/* All the surface states allocated by the descriptor pool are internal. We
* have to allocate them to handle the fact that we do not have surface
* states for VkBuffers.
*/
anv_state_stream_init(&pool->surface_state_stream,
&device->internal_surface_state_pool, 4096);
pool->surface_state_free_list = NULL;
list_inithead(&pool->desc_sets);
ANV_RMV(descriptor_pool_create, device, pCreateInfo, pool, false);
*pDescriptorPool = anv_descriptor_pool_to_handle(pool);
return VK_SUCCESS;
}
void anv_DestroyDescriptorPool(
VkDevice _device,
VkDescriptorPool _pool,
const VkAllocationCallbacks* pAllocator)
{
ANV_FROM_HANDLE(anv_device, device, _device);
ANV_FROM_HANDLE(anv_descriptor_pool, pool, _pool);
if (!pool)
return;
ANV_RMV(resource_destroy, device, pool);
list_for_each_entry_safe(struct anv_descriptor_set, set,
&pool->desc_sets, pool_link) {
anv_descriptor_set_layout_unref(device, set->layout);
}
util_vma_heap_finish(&pool->host_heap);
anv_state_stream_finish(&pool->surface_state_stream);
anv_descriptor_pool_heap_fini(device, &pool->surfaces);
anv_descriptor_pool_heap_fini(device, &pool->samplers);
vk_object_free(&device->vk, pAllocator, pool);
}
VkResult anv_ResetDescriptorPool(
VkDevice _device,
VkDescriptorPool descriptorPool,
VkDescriptorPoolResetFlags flags)
{
ANV_FROM_HANDLE(anv_device, device, _device);
ANV_FROM_HANDLE(anv_descriptor_pool, pool, descriptorPool);
list_for_each_entry_safe(struct anv_descriptor_set, set,
&pool->desc_sets, pool_link) {
anv_descriptor_set_layout_unref(device, set->layout);
}
list_inithead(&pool->desc_sets);
util_vma_heap_finish(&pool->host_heap);
util_vma_heap_init(&pool->host_heap, POOL_HEAP_OFFSET, pool->host_mem_size);
anv_descriptor_pool_heap_reset(device, &pool->surfaces);
anv_descriptor_pool_heap_reset(device, &pool->samplers);
anv_state_stream_finish(&pool->surface_state_stream);
anv_state_stream_init(&pool->surface_state_stream,
&device->internal_surface_state_pool, 4096);
pool->surface_state_free_list = NULL;
return VK_SUCCESS;
}
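/* Allocates the host memory backing a descriptor set out of the pool's
* host heap, distinguishing fragmentation from out-of-pool-memory errors.
*/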
static VkResult
anv_descriptor_pool_alloc_set(struct anv_descriptor_pool *pool,
uint32_t size,
struct anv_descriptor_set **set)
{
uint64_t vma_offset = util_vma_heap_alloc(&pool->host_heap, size, 1);
if (vma_offset == 0) {
if (size <= pool->host_heap.free_size) {
return VK_ERROR_FRAGMENTED_POOL;
} else {
return VK_ERROR_OUT_OF_POOL_MEMORY;
}
}
assert(vma_offset >= POOL_HEAP_OFFSET);
uint64_t host_mem_offset = vma_offset - POOL_HEAP_OFFSET;
*set = (struct anv_descriptor_set *) (pool->host_mem + host_mem_offset);
(*set)->size = size;
return VK_SUCCESS;
}
static void
anv_descriptor_pool_free_set(struct anv_descriptor_pool *pool,
struct anv_descriptor_set *set)
{
util_vma_heap_free(&pool->host_heap,
((char *) set - pool->host_mem) + POOL_HEAP_OFFSET,
set->size);
}
struct surface_state_free_list_entry {
void *next;
struct anv_state state;
};
static struct anv_state
anv_descriptor_pool_alloc_state(struct anv_descriptor_pool *pool)
{
assert(!pool->host_only);
struct surface_state_free_list_entry *entry =
pool->surface_state_free_list;
if (entry) {
struct anv_state state = entry->state;
pool->surface_state_free_list = entry->next;
assert(state.alloc_size == ANV_SURFACE_STATE_SIZE);
return state;
} else {
struct anv_state state =
anv_state_stream_alloc(&pool->surface_state_stream,
ANV_SURFACE_STATE_SIZE, 64);
return state;
}
}
static void
anv_descriptor_pool_free_state(struct anv_descriptor_pool *pool,
struct anv_state state)
{
assert(state.alloc_size);
/* Put the buffer view surface state back on the free list. */
struct surface_state_free_list_entry *entry = state.map;
entry->next = pool->surface_state_free_list;
entry->state = state;
pool->surface_state_free_list = entry;
}
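/* Host memory size (in bytes) needed for a descriptor set with the given
* layout: the set struct itself, its descriptors, its buffer views and,
* for host-only pools, space for the buffer view surface states.
*/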
static size_t
anv_descriptor_set_layout_size(const struct anv_descriptor_set_layout *layout,
bool host_only, uint32_t var_desc_count)
{
const uint32_t descriptor_count =
set_layout_descriptor_count(layout, var_desc_count);
const uint32_t buffer_view_count =
set_layout_buffer_view_count(layout, var_desc_count);
return sizeof(struct anv_descriptor_set) +
descriptor_count * sizeof(struct anv_descriptor) +
buffer_view_count * sizeof(struct anv_buffer_view) +
(host_only ? buffer_view_count * ANV_SURFACE_STATE_SIZE : 0);
}
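/* Allocates & initializes a descriptor set: host memory from the pool,
* descriptor buffer space for surfaces & samplers, immutable sampler
* writes and, with indirect descriptors, buffer view surface states.
*/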
static VkResult
anv_descriptor_set_create(struct anv_device *device,
struct anv_descriptor_pool *pool,
struct anv_descriptor_set_layout *layout,
uint32_t var_desc_count,
struct anv_descriptor_set **out_set)
{
struct anv_descriptor_set *set;
const size_t size = anv_descriptor_set_layout_size(layout,
pool->host_only,
var_desc_count);
VkResult result = anv_descriptor_pool_alloc_set(pool, size, &set);
if (result != VK_SUCCESS)
return result;
uint32_t descriptor_buffer_surface_size, descriptor_buffer_sampler_size;
anv_descriptor_set_layout_descriptor_buffer_size(layout, var_desc_count,
&descriptor_buffer_surface_size,
&descriptor_buffer_sampler_size);
set->desc_surface_state = ANV_STATE_NULL;
set->is_push = false;
if (descriptor_buffer_surface_size) {
result = anv_descriptor_pool_heap_alloc(pool, &pool->surfaces,
descriptor_buffer_surface_size,
ANV_UBO_ALIGNMENT,
&set->desc_surface_mem);
if (result != VK_SUCCESS) {
anv_descriptor_pool_free_set(pool, set);
return result;
}
set->desc_surface_addr = (struct anv_address) {
.bo = pool->surfaces.bo,
.offset = set->desc_surface_mem.offset,
};
set->desc_offset = anv_address_physical(set->desc_surface_addr) -
device->physical->va.internal_surface_state_pool.addr;
enum isl_format format =
anv_isl_format_for_descriptor_type(device,
VK_DESCRIPTOR_TYPE_UNIFORM_BUFFER);
if (!pool->host_only) {
set->desc_surface_state = anv_descriptor_pool_alloc_state(pool);
if (set->desc_surface_state.map == NULL) {
anv_descriptor_pool_free_set(pool, set);
return vk_error(pool, VK_ERROR_OUT_OF_DEVICE_MEMORY);
}
anv_fill_buffer_surface_state(device, set->desc_surface_state.map,
format, ISL_SWIZZLE_IDENTITY,
ISL_SURF_USAGE_CONSTANT_BUFFER_BIT,
set->desc_surface_addr,
descriptor_buffer_surface_size, 1);
}
} else {
set->desc_surface_mem = ANV_STATE_NULL;
set->desc_surface_addr = ANV_NULL_ADDRESS;
}
if (descriptor_buffer_sampler_size) {
result = anv_descriptor_pool_heap_alloc(pool, &pool->samplers,
descriptor_buffer_sampler_size,
ANV_SAMPLER_STATE_SIZE,
&set->desc_sampler_mem);
if (result != VK_SUCCESS) {
anv_descriptor_pool_free_set(pool, set);
return result;
}
set->desc_sampler_addr = (struct anv_address) {
.bo = pool->samplers.bo,
.offset = set->desc_sampler_mem.offset,
};
} else {
set->desc_sampler_mem = ANV_STATE_NULL;
set->desc_sampler_addr = ANV_NULL_ADDRESS;
}
vk_object_base_init(&device->vk, &set->base,
VK_OBJECT_TYPE_DESCRIPTOR_SET);
set->pool = pool;
set->layout = layout;
anv_descriptor_set_layout_ref(layout);
set->buffer_view_count =
set_layout_buffer_view_count(layout, var_desc_count);
set->descriptor_count =
set_layout_descriptor_count(layout, var_desc_count);
set->buffer_views =
(struct anv_buffer_view *) &set->descriptors[set->descriptor_count];
/* By defining the descriptors to be zero now, we can later verify that
* a descriptor has not been populated with user data.
*/
memset(set->descriptors, 0,
sizeof(struct anv_descriptor) * set->descriptor_count);
/* Go through and fill out immutable samplers if we have any */
for (uint32_t b = 0; b < layout->binding_count; b++) {
if (layout->binding[b].immutable_samplers) {
for (uint32_t i = 0; i < layout->binding[b].array_size; i++) {
/* The type will get changed to COMBINED_IMAGE_SAMPLER in
* UpdateDescriptorSets if needed. However, if the descriptor
* set has an immutable sampler, UpdateDescriptorSets may never
* touch it, so we need to make sure it's 100% valid now.
*
* We don't need to actually provide a sampler because the helper
* will always write in the immutable sampler regardless of what
* is in the sampler parameter.
*/
VkDescriptorImageInfo info = { };
anv_descriptor_set_write_image_view(device, set, &info,
VK_DESCRIPTOR_TYPE_SAMPLER,
b, i);
}
}
}
/* Allocate surface states for real descriptor sets if we're using indirect
* descriptors. For host-only sets, we just store the surface state data in
* host (malloc'ed) memory, right after the buffer views.
*/
if (device->physical->indirect_descriptors) {
if (!pool->host_only) {
for (uint32_t b = 0; b < set->buffer_view_count; b++) {
set->buffer_views[b].general.state =
anv_descriptor_pool_alloc_state(pool);
}
} else {
void *host_surface_states =
set->buffer_views + set->buffer_view_count;
memset(host_surface_states, 0,
set->buffer_view_count * ANV_SURFACE_STATE_SIZE);
for (uint32_t b = 0; b < set->buffer_view_count; b++) {
set->buffer_views[b].general.state = (struct anv_state) {
.alloc_size = ANV_SURFACE_STATE_SIZE,
.map = host_surface_states + b * ANV_SURFACE_STATE_SIZE,
};
}
}
}
list_addtail(&set->pool_link, &pool->desc_sets);
*out_set = set;
return VK_SUCCESS;
}
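/* Release everything anv_descriptor_set_create() allocated: the pool heap
* allocations, any surface states and finally the set's host memory.
*/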
static void
anv_descriptor_set_destroy(struct anv_device *device,
struct anv_descriptor_pool *pool,
struct anv_descriptor_set *set)
{
anv_descriptor_set_layout_unref(device, set->layout);
if (set->desc_surface_mem.alloc_size) {
anv_descriptor_pool_heap_free(&pool->surfaces, set->desc_surface_mem);
if (set->desc_surface_state.alloc_size)
anv_descriptor_pool_free_state(pool, set->desc_surface_state);
}
if (set->desc_sampler_mem.alloc_size)
anv_descriptor_pool_heap_free(&pool->samplers, set->desc_sampler_mem);
if (device->physical->indirect_descriptors) {
if (!pool->host_only) {
for (uint32_t b = 0; b < set->buffer_view_count; b++) {
if (set->buffer_views[b].general.state.alloc_size) {
anv_descriptor_pool_free_state(
pool, set->buffer_views[b].general.state);
}
}
}
}
list_del(&set->pool_link);
vk_object_base_finish(&set->base);
anv_descriptor_pool_free_set(pool, set);
}
VkResult anv_AllocateDescriptorSets(
VkDevice _device,
const VkDescriptorSetAllocateInfo* pAllocateInfo,
VkDescriptorSet* pDescriptorSets)
{
ANV_FROM_HANDLE(anv_device, device, _device);
ANV_FROM_HANDLE(anv_descriptor_pool, pool, pAllocateInfo->descriptorPool);
VkResult result = VK_SUCCESS;
struct anv_descriptor_set *set = NULL;
uint32_t i;
const VkDescriptorSetVariableDescriptorCountAllocateInfo *vdcai =
vk_find_struct_const(pAllocateInfo->pNext,
DESCRIPTOR_SET_VARIABLE_DESCRIPTOR_COUNT_ALLOCATE_INFO);
for (i = 0; i < pAllocateInfo->descriptorSetCount; i++) {
ANV_FROM_HANDLE(anv_descriptor_set_layout, layout,
pAllocateInfo->pSetLayouts[i]);
uint32_t var_desc_count = 0;
if (vdcai != NULL && vdcai->descriptorSetCount > 0) {
assert(vdcai->descriptorSetCount == pAllocateInfo->descriptorSetCount);
var_desc_count = vdcai->pDescriptorCounts[i];
}
result = anv_descriptor_set_create(device, pool, layout,
var_desc_count, &set);
if (result != VK_SUCCESS)
break;
pDescriptorSets[i] = anv_descriptor_set_to_handle(set);
}
if (result != VK_SUCCESS) {
anv_FreeDescriptorSets(_device, pAllocateInfo->descriptorPool,
i, pDescriptorSets);
/* The Vulkan 1.3.228 spec, section 14.2.3. Allocation of Descriptor Sets:
*
* "If the creation of any of those descriptor sets fails, then the
* implementation must destroy all successfully created descriptor
* set objects from this command, set all entries of the
* pDescriptorSets array to VK_NULL_HANDLE and return the error."
*/
for (i = 0; i < pAllocateInfo->descriptorSetCount; i++)
pDescriptorSets[i] = VK_NULL_HANDLE;
}
return result;
}
VkResult anv_FreeDescriptorSets(
VkDevice _device,
VkDescriptorPool descriptorPool,
uint32_t count,
const VkDescriptorSet* pDescriptorSets)
{
ANV_FROM_HANDLE(anv_device, device, _device);
ANV_FROM_HANDLE(anv_descriptor_pool, pool, descriptorPool);
for (uint32_t i = 0; i < count; i++) {
ANV_FROM_HANDLE(anv_descriptor_set, set, pDescriptorSets[i]);
if (!set)
continue;
anv_descriptor_set_destroy(device, pool, set);
}
return VK_SUCCESS;
}
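/* (Re)initialize a push descriptor set for the given layout. Push descriptor
* sets live in the command buffer state and try to reuse their descriptor
* buffer allocations across pushes; new memory is only streamed out when the
* previous allocation is too small or already consumed by the GPU. Returns
* false on allocation failure.
*/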
bool
anv_push_descriptor_set_init(struct anv_cmd_buffer *cmd_buffer,
struct anv_push_descriptor_set *push_set,
struct anv_descriptor_set_layout *layout)
{
struct anv_descriptor_set *set = &push_set->set;
/* Only copy the old descriptor data if needed:
* - not if there was no previous layout
* - not if the layout is different (descriptor set data becomes
* undefined)
* - not if there is only one descriptor, since we know the entire data
* will be replaced
*
* TODO: we could optimize further, e.g. keep a copy of the old data on
* the host, or copy only the bits that were not newly written, ...
*/
const bool copy_old_descriptors = set->layout != NULL &&
set->layout == layout &&
layout->descriptor_count > 1;
if (set->layout != layout) {
if (set->layout) {
anv_descriptor_set_layout_unref(cmd_buffer->device, set->layout);
} else {
/* one-time initialization */
vk_object_base_init(&cmd_buffer->device->vk, &set->base,
VK_OBJECT_TYPE_DESCRIPTOR_SET);
set->is_push = true;
set->buffer_views = push_set->buffer_views;
}
anv_descriptor_set_layout_ref(layout);
set->layout = layout;
set->generate_surface_states = 0;
}
assert(set->is_push && set->buffer_views);
set->size = anv_descriptor_set_layout_size(layout, false /* host_only */, 0);
set->buffer_view_count = layout->buffer_view_count;
set->descriptor_count = layout->descriptor_count;
if (layout->descriptor_buffer_surface_size &&
(push_set->set_used_on_gpu ||
set->desc_surface_mem.alloc_size < layout->descriptor_buffer_surface_size)) {
struct anv_physical_device *pdevice = cmd_buffer->device->physical;
struct anv_state_stream *push_stream;
uint64_t push_base_address;
if (layout->flags & VK_DESCRIPTOR_SET_LAYOUT_CREATE_DESCRIPTOR_BUFFER_BIT_EXT) {
push_stream = pdevice->uses_ex_bso ?
&cmd_buffer->push_descriptor_buffer_stream :
&cmd_buffer->surface_state_stream;
push_base_address = pdevice->uses_ex_bso ?
pdevice->va.push_descriptor_buffer_pool.addr :
pdevice->va.internal_surface_state_pool.addr;
} else {
push_stream = pdevice->indirect_descriptors ?
&cmd_buffer->indirect_push_descriptor_stream :
&cmd_buffer->surface_state_stream;
push_base_address = pdevice->indirect_descriptors ?
pdevice->va.indirect_push_descriptor_pool.addr :
pdevice->va.internal_surface_state_pool.addr;
}
uint32_t surface_size, sampler_size;
anv_descriptor_set_layout_descriptor_buffer_size(layout, 0,
&surface_size,
&sampler_size);
/* The previous buffer is either actively used by some GPU command (so
* we can't modify it) or is too small. Allocate a new one.
*/
struct anv_state desc_surface_mem =
anv_state_stream_alloc(push_stream, surface_size, ANV_UBO_ALIGNMENT);
if (desc_surface_mem.map == NULL)
return false;
if (copy_old_descriptors) {
memcpy(desc_surface_mem.map, set->desc_surface_mem.map,
MIN2(desc_surface_mem.alloc_size,
set->desc_surface_mem.alloc_size));
}
set->desc_surface_mem = desc_surface_mem;
set->desc_surface_addr = anv_state_pool_state_address(
push_stream->state_pool,
set->desc_surface_mem);
set->desc_offset = anv_address_physical(set->desc_surface_addr) -
push_base_address;
}
if (layout->descriptor_buffer_sampler_size &&
(push_set->set_used_on_gpu ||
set->desc_sampler_mem.alloc_size < layout->descriptor_buffer_sampler_size)) {
struct anv_physical_device *pdevice = cmd_buffer->device->physical;
assert(!pdevice->indirect_descriptors);
struct anv_state_stream *push_stream = &cmd_buffer->dynamic_state_stream;
uint32_t surface_size, sampler_size;
anv_descriptor_set_layout_descriptor_buffer_size(layout, 0,
&surface_size,
&sampler_size);
/* The previous buffer is either actively used by some GPU command (so
* we can't modify it) or is too small. Allocate a new one.
*/
struct anv_state desc_sampler_mem =
anv_state_stream_alloc(push_stream, sampler_size, ANV_SAMPLER_STATE_SIZE);
if (desc_sampler_mem.map == NULL)
return false;
if (copy_old_descriptors) {
memcpy(desc_sampler_mem.map, set->desc_sampler_mem.map,
MIN2(desc_sampler_mem.alloc_size,
set->desc_sampler_mem.alloc_size));
}
set->desc_sampler_mem = desc_sampler_mem;
set->desc_sampler_addr = anv_state_pool_state_address(
push_stream->state_pool,
set->desc_sampler_mem);
}
if (push_set->set_used_on_gpu) {
set->desc_surface_state = ANV_STATE_NULL;
push_set->set_used_on_gpu = false;
}
return true;
}
void
anv_push_descriptor_set_finish(struct anv_push_descriptor_set *push_set)
{
struct anv_descriptor_set *set = &push_set->set;
if (set->layout) {
struct anv_device *device =
container_of(set->base.device, struct anv_device, vk);
anv_descriptor_set_layout_unref(device, set->layout);
}
}
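/* Convert a surface state's offset in the bindless surface state pool into
* the handle stored in descriptors. With extended bindless offsets
* (uses_ex_bso) the 64B-aligned byte offset is used as-is; otherwise it is
* shifted into the extended message descriptor position described below,
* e.g. a surface state at byte offset 0x40 becomes handle 0x1000.
*/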
static uint32_t
anv_surface_state_to_handle(struct anv_physical_device *device,
struct anv_state state)
{
/* Bits 31:12 of the bindless surface offset in the extended message
* descriptor are bits 25:6 of the byte-based address.
*/
assert(state.offset >= 0);
uint32_t offset = state.offset;
if (device->uses_ex_bso) {
assert((offset & 0x3f) == 0);
return offset;
} else {
assert((offset & 0x3f) == 0 && offset < (1 << 26));
return offset << 6;
}
}
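/* Return the pre-baked surface state data for one plane of an image view,
* selecting the general vs optimal variant for sampled usage based on the
* image layout.
*/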
static const void *
anv_image_view_surface_data_for_plane_layout(struct anv_image_view *image_view,
VkDescriptorType desc_type,
unsigned plane,
VkImageLayout layout)
{
if (desc_type == VK_DESCRIPTOR_TYPE_COMBINED_IMAGE_SAMPLER ||
desc_type == VK_DESCRIPTOR_TYPE_SAMPLED_IMAGE ||
desc_type == VK_DESCRIPTOR_TYPE_INPUT_ATTACHMENT) {
return (layout == VK_IMAGE_LAYOUT_GENERAL ||
layout == VK_IMAGE_LAYOUT_RENDERING_LOCAL_READ_KHR) ?
&image_view->planes[plane].general_sampler.state_data :
&image_view->planes[plane].optimal_sampler.state_data;
}
if (desc_type == VK_DESCRIPTOR_TYPE_STORAGE_IMAGE)
return &image_view->planes[plane].storage.state_data;
unreachable("Invalid descriptor type");
}
static const uint32_t *
anv_sampler_state_for_descriptor_set(const struct anv_sampler *sampler,
const struct anv_descriptor_set *set,
uint32_t plane)
{
return sampler->state[plane];
}
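/* Write an image/sampler descriptor: record the CPU-side anv_descriptor,
* then emit whatever GPU-visible data the binding's anv_descriptor_data
* flags require (indirect sampled/storage image structs, direct surface
* and/or sampler state) into the set's descriptor buffer memory.
*/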
void
anv_descriptor_set_write_image_view(struct anv_device *device,
struct anv_descriptor_set *set,
const VkDescriptorImageInfo * const info,
VkDescriptorType type,
uint32_t binding,
uint32_t element)
{
const struct anv_descriptor_set_binding_layout *bind_layout =
&set->layout->binding[binding];
struct anv_descriptor *desc =
&set->descriptors[bind_layout->descriptor_index + element];
struct anv_image_view *image_view = NULL;
struct anv_sampler *sampler = NULL;
/* We get called with just VK_DESCRIPTOR_TYPE_SAMPLER as part of descriptor
* set initialization to set the bindless samplers.
*/
assert(type == bind_layout->type ||
type == VK_DESCRIPTOR_TYPE_SAMPLER ||
bind_layout->type == VK_DESCRIPTOR_TYPE_MUTABLE_EXT);
switch (type) {
case VK_DESCRIPTOR_TYPE_SAMPLER:
sampler = bind_layout->immutable_samplers ?
bind_layout->immutable_samplers[element] :
anv_sampler_from_handle(info->sampler);
break;
case VK_DESCRIPTOR_TYPE_COMBINED_IMAGE_SAMPLER:
image_view = anv_image_view_from_handle(info->imageView);
sampler = bind_layout->immutable_samplers ?
bind_layout->immutable_samplers[element] :
anv_sampler_from_handle(info->sampler);
break;
case VK_DESCRIPTOR_TYPE_SAMPLED_IMAGE:
case VK_DESCRIPTOR_TYPE_STORAGE_IMAGE:
case VK_DESCRIPTOR_TYPE_INPUT_ATTACHMENT:
image_view = anv_image_view_from_handle(info->imageView);
break;
default:
unreachable("invalid descriptor type");
}
*desc = (struct anv_descriptor) {
.type = type,
.layout = info->imageLayout,
.image_view = image_view,
.sampler = sampler,
};
void *desc_surface_map = set->desc_surface_mem.map +
bind_layout->descriptor_surface_offset +
element * bind_layout->descriptor_surface_stride;
enum anv_descriptor_data data =
bind_layout->type == VK_DESCRIPTOR_TYPE_MUTABLE_EXT ?
anv_descriptor_data_for_type(device->physical, set->layout->type,
set->layout->flags, type) :
bind_layout->data;
if (data & ANV_DESCRIPTOR_INDIRECT_SAMPLED_IMAGE) {
struct anv_sampled_image_descriptor desc_data[3];
memset(desc_data, 0, sizeof(desc_data));
if (image_view) {
for (unsigned p = 0; p < image_view->n_planes; p++) {
const struct anv_surface_state *sstate =
anv_image_view_texture_surface_state(image_view, p,
desc->layout);
desc_data[p].image =
anv_surface_state_to_handle(device->physical, sstate->state);
}
}
if (sampler) {
for (unsigned p = 0; p < sampler->n_planes; p++)
desc_data[p].sampler = sampler->bindless_state.offset + p * 32;
}
/* We may have max_plane_count == 0 if this isn't a sampled image, but it
* can be no more than the size of our array of handles.
*/
assert(bind_layout->max_plane_count <= ARRAY_SIZE(desc_data));
memcpy(desc_surface_map, desc_data,
bind_layout->max_plane_count * sizeof(desc_data[0]));
}
if (data & ANV_DESCRIPTOR_INDIRECT_STORAGE_IMAGE) {
if (image_view) {
assert(image_view->n_planes == 1);
struct anv_storage_image_descriptor desc_data = {
.vanilla = anv_surface_state_to_handle(
device->physical,
anv_image_view_storage_surface_state(image_view)->state),
.image_depth = image_view->vk.storage.z_slice_count,
};
memcpy(desc_surface_map, &desc_data, sizeof(desc_data));
} else {
memset(desc_surface_map, 0, bind_layout->descriptor_surface_stride);
}
}
if (data & ANV_DESCRIPTOR_SAMPLER) {
void *sampler_map =
set->layout->type == ANV_PIPELINE_DESCRIPTOR_SET_LAYOUT_TYPE_DIRECT ?
(set->desc_sampler_mem.map +
bind_layout->descriptor_sampler_offset +
element * bind_layout->descriptor_sampler_stride) : desc_surface_map;
if (sampler) {
for (unsigned p = 0; p < sampler->n_planes; p++) {
memcpy(sampler_map + p * ANV_SAMPLER_STATE_SIZE,
anv_sampler_state_for_descriptor_set(sampler, set, p),
ANV_SAMPLER_STATE_SIZE);
}
} else {
memset(sampler_map, 0, bind_layout->descriptor_sampler_stride);
}
}
if (data & ANV_DESCRIPTOR_SURFACE) {
unsigned max_plane_count = image_view ? image_view->n_planes : 1;
for (unsigned p = 0; p < max_plane_count; p++) {
void *plane_map = desc_surface_map + p * ANV_SURFACE_STATE_SIZE;
if (image_view) {
memcpy(plane_map,
anv_image_view_surface_data_for_plane_layout(image_view, type,
p, desc->layout),
ANV_SURFACE_STATE_SIZE);
} else {
memcpy(plane_map, &device->host_null_surface_state, ANV_SURFACE_STATE_SIZE);
}
}
}
if (data & ANV_DESCRIPTOR_SURFACE_SAMPLER) {
unsigned max_plane_count =
MAX2(image_view ? image_view->n_planes : 1,
sampler ? sampler->n_planes : 1);
for (unsigned p = 0; p < max_plane_count; p++) {
void *plane_map = desc_surface_map + p * 2 * ANV_SURFACE_STATE_SIZE;
if (image_view) {
memcpy(plane_map,
anv_image_view_surface_data_for_plane_layout(image_view, type,
p, desc->layout),
ANV_SURFACE_STATE_SIZE);
} else {
memcpy(plane_map, &device->host_null_surface_state, ANV_SURFACE_STATE_SIZE);
}
if (sampler) {
memcpy(plane_map + ANV_SURFACE_STATE_SIZE,
anv_sampler_state_for_descriptor_set(sampler, set, p),
ANV_SAMPLER_STATE_SIZE);
} else {
memset(plane_map + ANV_SURFACE_STATE_SIZE, 0,
ANV_SAMPLER_STATE_SIZE);
}
}
}
}
static const void *
anv_buffer_view_surface_data(struct anv_buffer_view *buffer_view,
VkDescriptorType desc_type)
{
if (desc_type == VK_DESCRIPTOR_TYPE_UNIFORM_TEXEL_BUFFER)
return &buffer_view->general.state_data;
if (desc_type == VK_DESCRIPTOR_TYPE_STORAGE_TEXEL_BUFFER)
return &buffer_view->storage.state_data;
unreachable("Invalid descriptor type");
}
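/* Write a texel buffer descriptor from an anv_buffer_view, mirroring the
* image view path: the CPU-side descriptor is recorded first, then the
* GPU-visible data selected by the binding's data flags.
*/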
void
anv_descriptor_set_write_buffer_view(struct anv_device *device,
struct anv_descriptor_set *set,
VkDescriptorType type,
struct anv_buffer_view *buffer_view,
uint32_t binding,
uint32_t element)
{
const struct anv_descriptor_set_binding_layout *bind_layout =
&set->layout->binding[binding];
struct anv_descriptor *desc =
&set->descriptors[bind_layout->descriptor_index + element];
assert(type == bind_layout->type ||
bind_layout->type == VK_DESCRIPTOR_TYPE_MUTABLE_EXT);
*desc = (struct anv_descriptor) {
.type = type,
.buffer_view = buffer_view,
};
enum anv_descriptor_data data =
bind_layout->type == VK_DESCRIPTOR_TYPE_MUTABLE_EXT ?
anv_descriptor_data_for_type(device->physical, set->layout->type,
set->layout->flags, type) :
bind_layout->data;
void *desc_map = set->desc_surface_mem.map +
bind_layout->descriptor_surface_offset +
element * bind_layout->descriptor_surface_stride;
if (buffer_view == NULL) {
if (data & ANV_DESCRIPTOR_SURFACE)
memcpy(desc_map, &device->host_null_surface_state, ANV_SURFACE_STATE_SIZE);
else
memset(desc_map, 0, bind_layout->descriptor_surface_stride);
return;
}
if (data & ANV_DESCRIPTOR_INDIRECT_SAMPLED_IMAGE) {
struct anv_sampled_image_descriptor desc_data = {
.image = anv_surface_state_to_handle(
device->physical, buffer_view->general.state),
};
memcpy(desc_map, &desc_data, sizeof(desc_data));
}
if (data & ANV_DESCRIPTOR_INDIRECT_STORAGE_IMAGE) {
struct anv_storage_image_descriptor desc_data = {
.vanilla = anv_surface_state_to_handle(
device->physical, buffer_view->storage.state),
};
memcpy(desc_map, &desc_data, sizeof(desc_data));
}
if (data & ANV_DESCRIPTOR_SURFACE) {
memcpy(desc_map,
anv_buffer_view_surface_data(buffer_view, type),
ANV_SURFACE_STATE_SIZE);
}
}
void
anv_descriptor_write_surface_state(struct anv_device *device,
struct anv_descriptor *desc,
struct anv_state surface_state)
{
assert(surface_state.alloc_size);
struct anv_buffer_view *bview = desc->buffer_view;
bview->general.state = surface_state;
isl_surf_usage_flags_t usage =
anv_isl_usage_for_descriptor_type(desc->type);
enum isl_format format =
anv_isl_format_for_descriptor_type(device, desc->type);
anv_fill_buffer_surface_state(device, bview->general.state.map,
format, ISL_SWIZZLE_IDENTITY,
usage, bview->address, bview->vk.range, 1);
}
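/* Write a uniform/storage buffer descriptor. Besides the CPU-side
* descriptor, this may emit an address-range struct for indirect
* descriptors or a full surface state for direct descriptors, and for
* non-dynamic buffers it also sets up the associated buffer view.
*/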
void
anv_descriptor_set_write_buffer(struct anv_device *device,
struct anv_descriptor_set *set,
VkDescriptorType type,
struct anv_buffer *buffer,
uint32_t binding,
uint32_t element,
VkDeviceSize offset,
VkDeviceSize range)
{
const struct anv_descriptor_set_binding_layout *bind_layout =
&set->layout->binding[binding];
const uint32_t descriptor_index = bind_layout->descriptor_index + element;
struct anv_descriptor *desc = &set->descriptors[descriptor_index];
assert(type == bind_layout->type ||
bind_layout->type == VK_DESCRIPTOR_TYPE_MUTABLE_EXT);
*desc = (struct anv_descriptor) {
.type = type,
.offset = offset,
.range = range,
.buffer = buffer,
};
enum anv_descriptor_data data =
bind_layout->type == VK_DESCRIPTOR_TYPE_MUTABLE_EXT ?
anv_descriptor_data_for_type(device->physical, set->layout->type,
set->layout->flags, type) :
bind_layout->data;
void *desc_map = set->desc_surface_mem.map +
bind_layout->descriptor_surface_offset +
element * bind_layout->descriptor_surface_stride;
if (buffer == NULL) {
if (data & ANV_DESCRIPTOR_SURFACE)
memcpy(desc_map, &device->host_null_surface_state, ANV_SURFACE_STATE_SIZE);
else
memset(desc_map, 0, bind_layout->descriptor_surface_stride);
return;
}
struct anv_address bind_addr = anv_address_add(buffer->address, offset);
desc->bind_range = vk_buffer_range(&buffer->vk, offset, range);
/* We report a bounds checking alignment of ANV_UBO_ALIGNMENT in
* VkPhysicalDeviceRobustness2PropertiesEXT::robustUniformBufferAccessSizeAlignment
* so align the range to that.
*/
if (type == VK_DESCRIPTOR_TYPE_UNIFORM_BUFFER ||
type == VK_DESCRIPTOR_TYPE_UNIFORM_BUFFER_DYNAMIC)
desc->bind_range = align64(desc->bind_range, ANV_UBO_ALIGNMENT);
if (data & ANV_DESCRIPTOR_INDIRECT_ADDRESS_RANGE) {
struct anv_address_range_descriptor desc_data = {
.address = anv_address_physical(bind_addr),
.range = desc->bind_range,
};
memcpy(desc_map, &desc_data, sizeof(desc_data));
}
if (data & ANV_DESCRIPTOR_SURFACE) {
isl_surf_usage_flags_t usage =
anv_isl_usage_for_descriptor_type(desc->type);
enum isl_format format =
anv_isl_format_for_descriptor_type(device, desc->type);
if (bind_addr.bo && bind_addr.bo->alloc_flags & ANV_BO_ALLOC_PROTECTED)
usage |= ISL_SURF_USAGE_PROTECTED_BIT;
isl_buffer_fill_state(&device->isl_dev, desc_map,
.address = anv_address_physical(bind_addr),
.mocs = isl_mocs(&device->isl_dev, usage,
bind_addr.bo && anv_bo_is_external(bind_addr.bo)),
.size_B = desc->bind_range,
.format = format,
.swizzle = ISL_SWIZZLE_IDENTITY,
.stride_B = 1);
}
if (vk_descriptor_type_is_dynamic(type))
return;
if (data & ANV_DESCRIPTOR_BUFFER_VIEW) {
struct anv_buffer_view *bview =
&set->buffer_views[bind_layout->buffer_view_index + element];
desc->set_buffer_view = bview;
bview->vk.range = desc->bind_range;
bview->address = bind_addr;
if (set->is_push) {
set->generate_surface_states |= BITFIELD_BIT(descriptor_index);
/* Reset the surface state to make sure
* genX(cmd_buffer_emit_push_descriptor_surfaces) generates a new
* one.
*/
bview->general.state = ANV_STATE_NULL;
} else {
anv_descriptor_write_surface_state(device, desc, bview->general.state);
}
}
}
void
anv_descriptor_set_write_inline_uniform_data(struct anv_device *device,
struct anv_descriptor_set *set,
uint32_t binding,
const void *data,
size_t offset,
size_t size)
{
const struct anv_descriptor_set_binding_layout *bind_layout =
&set->layout->binding[binding];
assert(bind_layout->data & ANV_DESCRIPTOR_INLINE_UNIFORM);
void *desc_map = set->desc_surface_mem.map +
bind_layout->descriptor_surface_offset;
memcpy(desc_map + offset, data, size);
}
void
anv_descriptor_set_write_acceleration_structure(struct anv_device *device,
struct anv_descriptor_set *set,
struct vk_acceleration_structure *accel,
uint32_t binding,
uint32_t element)
{
const struct anv_descriptor_set_binding_layout *bind_layout =
&set->layout->binding[binding];
struct anv_descriptor *desc =
&set->descriptors[bind_layout->descriptor_index + element];
assert(bind_layout->data & ANV_DESCRIPTOR_INDIRECT_ADDRESS_RANGE);
*desc = (struct anv_descriptor) {
.type = VK_DESCRIPTOR_TYPE_ACCELERATION_STRUCTURE_KHR,
.accel_struct = accel,
};
struct anv_address_range_descriptor desc_data = { };
if (accel != NULL) {
desc_data.address = vk_acceleration_structure_get_va(accel);
desc_data.range = accel->size;
}
assert(sizeof(desc_data) <= bind_layout->descriptor_surface_stride);
void *desc_map = set->desc_surface_mem.map +
bind_layout->descriptor_surface_offset +
element * bind_layout->descriptor_surface_stride;
memcpy(desc_map, &desc_data, sizeof(desc_data));
}
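/* Apply an array of VkWriteDescriptorSet, dispatching each write to the
* type-specific helper above. When set_override is non-NULL (e.g. for push
* descriptor writes), all writes go to that set instead of write->dstSet.
*/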
void
anv_descriptor_set_write(struct anv_device *device,
struct anv_descriptor_set *set_override,
uint32_t write_count,
const VkWriteDescriptorSet *writes)
{
for (uint32_t i = 0; i < write_count; i++) {
const VkWriteDescriptorSet *write = &writes[i];
struct anv_descriptor_set *set = unlikely(set_override) ?
set_override :
anv_descriptor_set_from_handle(write->dstSet);
switch (write->descriptorType) {
case VK_DESCRIPTOR_TYPE_SAMPLER:
case VK_DESCRIPTOR_TYPE_COMBINED_IMAGE_SAMPLER:
case VK_DESCRIPTOR_TYPE_SAMPLED_IMAGE:
case VK_DESCRIPTOR_TYPE_STORAGE_IMAGE:
case VK_DESCRIPTOR_TYPE_INPUT_ATTACHMENT:
for (uint32_t j = 0; j < write->descriptorCount; j++) {
anv_descriptor_set_write_image_view(device, set,
write->pImageInfo + j,
write->descriptorType,
write->dstBinding,
write->dstArrayElement + j);
}
break;
case VK_DESCRIPTOR_TYPE_UNIFORM_TEXEL_BUFFER:
case VK_DESCRIPTOR_TYPE_STORAGE_TEXEL_BUFFER:
for (uint32_t j = 0; j < write->descriptorCount; j++) {
ANV_FROM_HANDLE(anv_buffer_view, bview,
write->pTexelBufferView[j]);
anv_descriptor_set_write_buffer_view(device, set,
write->descriptorType,
bview,
write->dstBinding,
write->dstArrayElement + j);
}
break;
case VK_DESCRIPTOR_TYPE_UNIFORM_BUFFER:
case VK_DESCRIPTOR_TYPE_STORAGE_BUFFER:
case VK_DESCRIPTOR_TYPE_UNIFORM_BUFFER_DYNAMIC:
case VK_DESCRIPTOR_TYPE_STORAGE_BUFFER_DYNAMIC:
for (uint32_t j = 0; j < write->descriptorCount; j++) {
ANV_FROM_HANDLE(anv_buffer, buffer, write->pBufferInfo[j].buffer);
anv_descriptor_set_write_buffer(device, set,
write->descriptorType,
buffer,
write->dstBinding,
write->dstArrayElement + j,
write->pBufferInfo[j].offset,
write->pBufferInfo[j].range);
}
break;
case VK_DESCRIPTOR_TYPE_INLINE_UNIFORM_BLOCK: {
const VkWriteDescriptorSetInlineUniformBlock *inline_write =
vk_find_struct_const(write->pNext,
WRITE_DESCRIPTOR_SET_INLINE_UNIFORM_BLOCK);
assert(inline_write->dataSize == write->descriptorCount);
anv_descriptor_set_write_inline_uniform_data(device, set,
write->dstBinding,
inline_write->pData,
write->dstArrayElement,
inline_write->dataSize);
break;
}
case VK_DESCRIPTOR_TYPE_ACCELERATION_STRUCTURE_KHR: {
const VkWriteDescriptorSetAccelerationStructureKHR *accel_write =
vk_find_struct_const(write, WRITE_DESCRIPTOR_SET_ACCELERATION_STRUCTURE_KHR);
assert(accel_write->accelerationStructureCount ==
write->descriptorCount);
for (uint32_t j = 0; j < write->descriptorCount; j++) {
ANV_FROM_HANDLE(vk_acceleration_structure, accel,
accel_write->pAccelerationStructures[j]);
anv_descriptor_set_write_acceleration_structure(device, set, accel,
write->dstBinding,
write->dstArrayElement + j);
}
break;
}
default:
break;
}
}
}
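/* vkUpdateDescriptorSets: writes go through anv_descriptor_set_write();
* copies duplicate both the GPU-visible descriptor buffer contents and the
* CPU-side anv_descriptor/buffer view data from source to destination.
*/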
void anv_UpdateDescriptorSets(
VkDevice _device,
uint32_t descriptorWriteCount,
const VkWriteDescriptorSet* pDescriptorWrites,
uint32_t descriptorCopyCount,
const VkCopyDescriptorSet* pDescriptorCopies)
{
ANV_FROM_HANDLE(anv_device, device, _device);
anv_descriptor_set_write(device, NULL, descriptorWriteCount,
pDescriptorWrites);
for (uint32_t i = 0; i < descriptorCopyCount; i++) {
const VkCopyDescriptorSet *copy = &pDescriptorCopies[i];
ANV_FROM_HANDLE(anv_descriptor_set, src, copy->srcSet);
ANV_FROM_HANDLE(anv_descriptor_set, dst, copy->dstSet);
const struct anv_descriptor_set_binding_layout *src_layout =
&src->layout->binding[copy->srcBinding];
const struct anv_descriptor_set_binding_layout *dst_layout =
&dst->layout->binding[copy->dstBinding];
if (src_layout->type == VK_DESCRIPTOR_TYPE_INLINE_UNIFORM_BLOCK) {
anv_descriptor_set_write_inline_uniform_data(device, dst,
copy->dstBinding,
src->desc_surface_mem.map +
src_layout->descriptor_surface_offset + copy->srcArrayElement,
copy->dstArrayElement,
copy->descriptorCount);
continue;
}
uint32_t copy_surface_element_size =
MIN2(src_layout->descriptor_surface_stride,
dst_layout->descriptor_surface_stride);
uint32_t copy_sampler_element_size =
MIN2(src_layout->descriptor_sampler_stride,
dst_layout->descriptor_sampler_stride);
for (uint32_t j = 0; j < copy->descriptorCount; j++) {
struct anv_descriptor *src_desc =
&src->descriptors[src_layout->descriptor_index +
copy->srcArrayElement + j];
struct anv_descriptor *dst_desc =
&dst->descriptors[dst_layout->descriptor_index +
copy->dstArrayElement + j];
/* Copy the memory containing one of the following structures read by
* the shaders:
* - anv_sampled_image_descriptor
* - anv_storage_image_descriptor
* - anv_address_range_descriptor
* - RENDER_SURFACE_STATE
* - SAMPLER_STATE
*/
if (copy_surface_element_size > 0) {
assert(dst->desc_surface_mem.map != NULL);
assert(src->desc_surface_mem.map != NULL);
memcpy(dst->desc_surface_mem.map +
dst_layout->descriptor_surface_offset +
(copy->dstArrayElement + j) * dst_layout->descriptor_surface_stride,
src->desc_surface_mem.map +
src_layout->descriptor_surface_offset +
(copy->srcArrayElement + j) * src_layout->descriptor_surface_stride,
copy_surface_element_size);
}
if (copy_sampler_element_size) {
assert(dst->desc_sampler_mem.map != NULL);
assert(src->desc_sampler_mem.map != NULL);
memcpy(dst->desc_sampler_mem.map +
dst_layout->descriptor_sampler_offset +
(copy->dstArrayElement + j) * dst_layout->descriptor_sampler_stride,
src->desc_sampler_mem.map +
src_layout->descriptor_sampler_offset +
(copy->srcArrayElement + j) * src_layout->descriptor_sampler_stride,
copy_sampler_element_size);
}
/* Copy the CPU side data anv_descriptor */
*dst_desc = *src_desc;
/* If the CPU-side data may contain a buffer view, we need to copy that
* as well.
*/
const enum anv_descriptor_data data =
src_layout->type == VK_DESCRIPTOR_TYPE_MUTABLE_EXT ?
anv_descriptor_data_for_type(device->physical,
src->layout->type,
src->layout->flags,
src_desc->type) :
src_layout->data;
if (data & ANV_DESCRIPTOR_BUFFER_VIEW) {
struct anv_buffer_view *src_bview =
&src->buffer_views[src_layout->buffer_view_index +
copy->srcArrayElement + j];
struct anv_buffer_view *dst_bview =
&dst->buffer_views[dst_layout->buffer_view_index +
copy->dstArrayElement + j];
dst_desc->set_buffer_view = dst_bview;
dst_bview->vk.range = src_bview->vk.range;
dst_bview->address = src_bview->address;
memcpy(dst_bview->general.state.map,
src_bview->general.state.map,
ANV_SURFACE_STATE_SIZE);
}
}
}
}
/*
* Descriptor update templates.
*/
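/* Walk a vk_descriptor_update_template and replay each entry through the
* same write helpers used by vkUpdateDescriptorSets().
*/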
void
anv_descriptor_set_write_template(struct anv_device *device,
struct anv_descriptor_set *set,
const struct vk_descriptor_update_template *template,
const void *data)
{
for (uint32_t i = 0; i < template->entry_count; i++) {
const struct vk_descriptor_template_entry *entry =
&template->entries[i];
switch (entry->type) {
case VK_DESCRIPTOR_TYPE_SAMPLER:
case VK_DESCRIPTOR_TYPE_COMBINED_IMAGE_SAMPLER:
case VK_DESCRIPTOR_TYPE_SAMPLED_IMAGE:
case VK_DESCRIPTOR_TYPE_STORAGE_IMAGE:
case VK_DESCRIPTOR_TYPE_INPUT_ATTACHMENT:
for (uint32_t j = 0; j < entry->array_count; j++) {
const VkDescriptorImageInfo *info =
data + entry->offset + j * entry->stride;
anv_descriptor_set_write_image_view(device, set,
info, entry->type,
entry->binding,
entry->array_element + j);
}
break;
case VK_DESCRIPTOR_TYPE_UNIFORM_TEXEL_BUFFER:
case VK_DESCRIPTOR_TYPE_STORAGE_TEXEL_BUFFER:
for (uint32_t j = 0; j < entry->array_count; j++) {
const VkBufferView *_bview =
data + entry->offset + j * entry->stride;
ANV_FROM_HANDLE(anv_buffer_view, bview, *_bview);
anv_descriptor_set_write_buffer_view(device, set,
entry->type,
bview,
entry->binding,
entry->array_element + j);
}
break;
case VK_DESCRIPTOR_TYPE_UNIFORM_BUFFER:
case VK_DESCRIPTOR_TYPE_STORAGE_BUFFER:
case VK_DESCRIPTOR_TYPE_UNIFORM_BUFFER_DYNAMIC:
case VK_DESCRIPTOR_TYPE_STORAGE_BUFFER_DYNAMIC:
for (uint32_t j = 0; j < entry->array_count; j++) {
const VkDescriptorBufferInfo *info =
data + entry->offset + j * entry->stride;
ANV_FROM_HANDLE(anv_buffer, buffer, info->buffer);
anv_descriptor_set_write_buffer(device, set,
entry->type,
buffer,
entry->binding,
entry->array_element + j,
info->offset, info->range);
}
break;
case VK_DESCRIPTOR_TYPE_INLINE_UNIFORM_BLOCK:
anv_descriptor_set_write_inline_uniform_data(device, set,
entry->binding,
data + entry->offset,
entry->array_element,
entry->array_count);
break;
case VK_DESCRIPTOR_TYPE_ACCELERATION_STRUCTURE_KHR:
for (uint32_t j = 0; j < entry->array_count; j++) {
VkAccelerationStructureKHR *accel_obj =
(VkAccelerationStructureKHR *)(data + entry->offset + j * entry->stride);
ANV_FROM_HANDLE(vk_acceleration_structure, accel, *accel_obj);
anv_descriptor_set_write_acceleration_structure(device, set,
accel,
entry->binding,
entry->array_element + j);
}
break;
default:
break;
}
}
}
void anv_UpdateDescriptorSetWithTemplate(
VkDevice _device,
VkDescriptorSet descriptorSet,
VkDescriptorUpdateTemplate descriptorUpdateTemplate,
const void* pData)
{
ANV_FROM_HANDLE(anv_device, device, _device);
ANV_FROM_HANDLE(anv_descriptor_set, set, descriptorSet);
VK_FROM_HANDLE(vk_descriptor_update_template, template,
descriptorUpdateTemplate);
anv_descriptor_set_write_template(device, set, template, pData);
}
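/*
* VK_EXT_descriptor_buffer entry points.
*/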
void anv_GetDescriptorSetLayoutSizeEXT(
VkDevice device,
VkDescriptorSetLayout layout,
VkDeviceSize* pLayoutSizeInBytes)
{
ANV_FROM_HANDLE(anv_descriptor_set_layout, set_layout, layout);
*pLayoutSizeInBytes = set_layout->descriptor_buffer_surface_size;
}
void anv_GetDescriptorSetLayoutBindingOffsetEXT(
VkDevice device,
VkDescriptorSetLayout layout,
uint32_t binding,
VkDeviceSize* pOffset)
{
ANV_FROM_HANDLE(anv_descriptor_set_layout, set_layout, layout);
assert(binding < set_layout->binding_count);
const struct anv_descriptor_set_binding_layout *bind_layout =
&set_layout->binding[binding];
*pOffset = bind_layout->descriptor_surface_offset;
}
static bool
address_info_is_null(const VkDescriptorAddressInfoEXT *addr_info)
{
return addr_info == NULL || addr_info->address == 0 || addr_info->range == 0;
}
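/* vkGetDescriptorEXT: write descriptor data directly into the host memory
* provided by the application (pDescriptor). The data written here follows
* the direct-descriptor layout used above: raw sampler/surface state or an
* anv_address_range_descriptor, depending on the descriptor type.
*/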
void anv_GetDescriptorEXT(
VkDevice _device,
const VkDescriptorGetInfoEXT* pDescriptorInfo,
size_t dataSize,
void* pDescriptor)
{
ANV_FROM_HANDLE(anv_device, device, _device);
struct anv_sampler *sampler;
struct anv_image_view *image_view;
switch (pDescriptorInfo->type) {
case VK_DESCRIPTOR_TYPE_SAMPLER:
if (pDescriptorInfo->data.pSampler &&
(sampler = anv_sampler_from_handle(*pDescriptorInfo->data.pSampler))) {
memcpy(pDescriptor, sampler->state[0], ANV_SAMPLER_STATE_SIZE);
} else {
memset(pDescriptor, 0, ANV_SAMPLER_STATE_SIZE);
}
break;
case VK_DESCRIPTOR_TYPE_COMBINED_IMAGE_SAMPLER:
for (uint32_t i = 0; i < dataSize / (2 * ANV_SURFACE_STATE_SIZE); i++) {
uint32_t desc_offset = i * 2 * ANV_SURFACE_STATE_SIZE;
if (pDescriptorInfo->data.pCombinedImageSampler &&
(image_view = anv_image_view_from_handle(
pDescriptorInfo->data.pCombinedImageSampler->imageView))) {
const VkImageLayout layout =
pDescriptorInfo->data.pCombinedImageSampler->imageLayout;
memcpy(pDescriptor + desc_offset,
anv_image_view_surface_data_for_plane_layout(image_view,
pDescriptorInfo->type,
i,
layout),
ANV_SURFACE_STATE_SIZE);
} else {
memcpy(pDescriptor + desc_offset,
device->host_null_surface_state,
ANV_SURFACE_STATE_SIZE);
}
if (pDescriptorInfo->data.pCombinedImageSampler &&
(sampler = anv_sampler_from_handle(
pDescriptorInfo->data.pCombinedImageSampler->sampler))) {
memcpy(pDescriptor + desc_offset + ANV_SURFACE_STATE_SIZE,
sampler->state[i], ANV_SAMPLER_STATE_SIZE);
} else {
memset(pDescriptor + desc_offset + ANV_SURFACE_STATE_SIZE,
0, ANV_SAMPLER_STATE_SIZE);
}
}
break;
case VK_DESCRIPTOR_TYPE_STORAGE_IMAGE:
case VK_DESCRIPTOR_TYPE_SAMPLED_IMAGE:
case VK_DESCRIPTOR_TYPE_INPUT_ATTACHMENT:
if (pDescriptorInfo->data.pSampledImage &&
(image_view = anv_image_view_from_handle(
pDescriptorInfo->data.pSampledImage->imageView))) {
const VkImageLayout layout =
pDescriptorInfo->data.pSampledImage->imageLayout;
memcpy(pDescriptor,
anv_image_view_surface_data_for_plane_layout(image_view,
pDescriptorInfo->type,
0,
layout),
ANV_SURFACE_STATE_SIZE);
} else {
memcpy(pDescriptor, device->host_null_surface_state,
ANV_SURFACE_STATE_SIZE);
}
break;
case VK_DESCRIPTOR_TYPE_UNIFORM_TEXEL_BUFFER: {
const VkDescriptorAddressInfoEXT *addr_info =
pDescriptorInfo->data.pUniformTexelBuffer;
if (!address_info_is_null(addr_info)) {
struct anv_format_plane format =
anv_get_format_plane(device->info,
addr_info->format,
0, VK_IMAGE_TILING_LINEAR);
const uint32_t format_bs =
isl_format_get_layout(format.isl_format)->bpb / 8;
anv_fill_buffer_surface_state(device, pDescriptor,
format.isl_format, format.swizzle,
ISL_SURF_USAGE_TEXTURE_BIT,
anv_address_from_u64(addr_info->address),
align_down_npot_u32(addr_info->range, format_bs),
format_bs);
} else {
memcpy(pDescriptor, device->host_null_surface_state,
ANV_SURFACE_STATE_SIZE);
}
break;
}
case VK_DESCRIPTOR_TYPE_STORAGE_TEXEL_BUFFER: {
const VkDescriptorAddressInfoEXT *addr_info =
pDescriptorInfo->data.pStorageTexelBuffer;
if (!address_info_is_null(addr_info)) {
struct anv_format_plane format =
anv_get_format_plane(device->info,
addr_info->format,
0, VK_IMAGE_TILING_LINEAR);
const uint32_t format_bs =
isl_format_get_layout(format.isl_format)->bpb / 8;
anv_fill_buffer_surface_state(device, pDescriptor,
format.isl_format, format.swizzle,
ISL_SURF_USAGE_STORAGE_BIT,
anv_address_from_u64(addr_info->address),
align_down_npot_u32(addr_info->range, format_bs),
format_bs);
} else {
memcpy(pDescriptor, device->host_null_surface_state,
ANV_SURFACE_STATE_SIZE);
}
break;
}
case VK_DESCRIPTOR_TYPE_UNIFORM_BUFFER:
case VK_DESCRIPTOR_TYPE_STORAGE_BUFFER: {
const VkDescriptorAddressInfoEXT *addr_info =
pDescriptorInfo->data.pStorageBuffer;
if (!address_info_is_null(addr_info)) {
VkDeviceSize range = addr_info->range;
/* We report a bounds checking alignment of ANV_UBO_ALIGNMENT in
* VkPhysicalDeviceRobustness2PropertiesEXT::robustUniformBufferAccessSizeAlignment
* so align the range to that, matching anv_descriptor_set_write_buffer().
*/
if (pDescriptorInfo->type == VK_DESCRIPTOR_TYPE_UNIFORM_BUFFER)
range = align64(range, ANV_UBO_ALIGNMENT);
isl_surf_usage_flags_t usage =
pDescriptorInfo->type == VK_DESCRIPTOR_TYPE_UNIFORM_BUFFER ?
ISL_SURF_USAGE_CONSTANT_BUFFER_BIT :
ISL_SURF_USAGE_STORAGE_BIT;
enum isl_format format =
anv_isl_format_for_descriptor_type(device, pDescriptorInfo->type);
isl_buffer_fill_state(&device->isl_dev, pDescriptor,
.address = addr_info->address,
.mocs = isl_mocs(&device->isl_dev, usage, false),
.size_B = range,
.format = format,
.swizzle = ISL_SWIZZLE_IDENTITY,
.stride_B = 1);
} else {
memcpy(pDescriptor, device->host_null_surface_state,
ANV_SURFACE_STATE_SIZE);
}
break;
}
case VK_DESCRIPTOR_TYPE_ACCELERATION_STRUCTURE_KHR: {
struct anv_address_range_descriptor desc_data = {
.address = pDescriptorInfo->data.accelerationStructure,
.range = 0,
};
memcpy(pDescriptor, &desc_data, sizeof(desc_data));
break;
}
default:
unreachable("Invalid descriptor type");
}
}