mirror of https://github.com/cemu-project/Cemu.git
Vulkan: Update some code to use VK_KHR_synchronization2
This commit is contained in:
parent
49c55a3f56
commit
8f1cd4f925
|
@ -468,6 +468,15 @@ VulkanRenderer::VulkanRenderer()
|
||||||
|
|
||||||
void* deviceExtensionFeatures = nullptr;
|
void* deviceExtensionFeatures = nullptr;
|
||||||
|
|
||||||
|
// enable VK_KHR_synchonization_2
|
||||||
|
VkPhysicalDeviceSynchronization2FeaturesKHR sync2Feature{};
|
||||||
|
{
|
||||||
|
sync2Feature.sType = VK_STRUCTURE_TYPE_PHYSICAL_DEVICE_SYNCHRONIZATION_2_FEATURES_KHR;
|
||||||
|
sync2Feature.pNext = deviceExtensionFeatures;
|
||||||
|
deviceExtensionFeatures = &sync2Feature;
|
||||||
|
sync2Feature.synchronization2 = VK_TRUE;
|
||||||
|
}
|
||||||
|
|
||||||
// enable VK_EXT_pipeline_creation_cache_control
|
// enable VK_EXT_pipeline_creation_cache_control
|
||||||
VkPhysicalDevicePipelineCreationCacheControlFeaturesEXT cacheControlFeature{};
|
VkPhysicalDevicePipelineCreationCacheControlFeaturesEXT cacheControlFeature{};
|
||||||
if (m_featureControl.deviceExtensions.pipeline_creation_cache_control)
|
if (m_featureControl.deviceExtensions.pipeline_creation_cache_control)
|
||||||
|
@ -2852,13 +2861,20 @@ void VulkanRenderer::DrawBackbufferQuad(LatteTextureView* texView, RendererOutpu
|
||||||
ClearColorbuffer(padView);
|
ClearColorbuffer(padView);
|
||||||
|
|
||||||
// barrier for input texture
|
// barrier for input texture
|
||||||
VkMemoryBarrier memoryBarrier{};
|
{
|
||||||
memoryBarrier.sType = VK_STRUCTURE_TYPE_MEMORY_BARRIER;
|
VkMemoryBarrier2 memoryBarrier2{};
|
||||||
VkPipelineStageFlags srcStage = VK_PIPELINE_STAGE_COLOR_ATTACHMENT_OUTPUT_BIT | VK_PIPELINE_STAGE_TRANSFER_BIT;
|
memoryBarrier2.sType = VK_STRUCTURE_TYPE_MEMORY_BARRIER_2;
|
||||||
VkPipelineStageFlags dstStage = VK_PIPELINE_STAGE_COLOR_ATTACHMENT_OUTPUT_BIT | VK_PIPELINE_STAGE_VERTEX_SHADER_BIT | VK_PIPELINE_STAGE_GEOMETRY_SHADER_BIT | VK_PIPELINE_STAGE_FRAGMENT_SHADER_BIT;
|
memoryBarrier2.srcStageMask = VK_PIPELINE_STAGE_2_COLOR_ATTACHMENT_OUTPUT_BIT_KHR | VK_PIPELINE_STAGE_2_TRANSFER_BIT_KHR;
|
||||||
memoryBarrier.srcAccessMask = VK_ACCESS_COLOR_ATTACHMENT_WRITE_BIT | VK_ACCESS_TRANSFER_WRITE_BIT;
|
memoryBarrier2.dstStageMask = VK_PIPELINE_STAGE_2_COLOR_ATTACHMENT_OUTPUT_BIT_KHR | VK_PIPELINE_STAGE_2_VERTEX_SHADER_BIT_KHR | VK_PIPELINE_STAGE_2_GEOMETRY_SHADER_BIT_KHR | VK_PIPELINE_STAGE_2_FRAGMENT_SHADER_BIT_KHR;
|
||||||
memoryBarrier.dstAccessMask = VK_ACCESS_COLOR_ATTACHMENT_READ_BIT | VK_ACCESS_SHADER_READ_BIT;
|
memoryBarrier2.srcAccessMask = VK_ACCESS_2_MEMORY_WRITE_BIT;
|
||||||
vkCmdPipelineBarrier(m_state.currentCommandBuffer, srcStage, dstStage, 0, 1, &memoryBarrier, 0, nullptr, 0, nullptr);
|
memoryBarrier2.dstAccessMask = VK_ACCESS_2_MEMORY_READ_BIT;
|
||||||
|
VkDependencyInfo dependencyInfo{};
|
||||||
|
dependencyInfo.sType = VK_STRUCTURE_TYPE_DEPENDENCY_INFO;
|
||||||
|
dependencyInfo.dependencyFlags = 0;
|
||||||
|
dependencyInfo.memoryBarrierCount = 1;
|
||||||
|
dependencyInfo.pMemoryBarriers = &memoryBarrier2;
|
||||||
|
vkCmdPipelineBarrier2KHR(m_state.currentCommandBuffer, &dependencyInfo);
|
||||||
|
}
|
||||||
|
|
||||||
auto pipeline = backbufferBlit_createGraphicsPipeline(m_swapchainDescriptorSetLayout, padView, shader);
|
auto pipeline = backbufferBlit_createGraphicsPipeline(m_swapchainDescriptorSetLayout, padView, shader);
|
||||||
|
|
||||||
|
|
|
@ -728,201 +728,192 @@ private:
|
||||||
|
|
||||||
IMAGE_READ = 0x20,
|
IMAGE_READ = 0x20,
|
||||||
IMAGE_WRITE = 0x40,
|
IMAGE_WRITE = 0x40,
|
||||||
|
|
||||||
};
|
};
|
||||||
|
|
||||||
template<uint32 TSyncOp>
|
template<uint32 TSyncOp>
|
||||||
void barrier_calcStageAndMask(VkPipelineStageFlags& stages, VkAccessFlags& accessFlags)
|
void barrier_calcStageAndMask(VkPipelineStageFlags2& stages, VkAccessFlags2& accessFlags)
|
||||||
{
|
{
|
||||||
stages = 0;
|
stages = 0;
|
||||||
accessFlags = 0;
|
accessFlags = 0;
|
||||||
if constexpr ((TSyncOp & BUFFER_SHADER_READ) != 0)
|
if constexpr ((TSyncOp & BUFFER_SHADER_READ) != 0)
|
||||||
{
|
{
|
||||||
// in theory: VK_ACCESS_INDEX_READ_BIT should be set here too but indices are currently separated
|
// in theory: VK_ACCESS_2_INDEX_READ_BIT should be set here too but indices are currently separated
|
||||||
stages |= VK_PIPELINE_STAGE_VERTEX_INPUT_BIT | VK_PIPELINE_STAGE_VERTEX_SHADER_BIT | VK_PIPELINE_STAGE_GEOMETRY_SHADER_BIT | VK_PIPELINE_STAGE_FRAGMENT_SHADER_BIT;
|
stages |= VK_PIPELINE_STAGE_2_VERTEX_INPUT_BIT | VK_PIPELINE_STAGE_2_VERTEX_SHADER_BIT | VK_PIPELINE_STAGE_2_GEOMETRY_SHADER_BIT | VK_PIPELINE_STAGE_2_FRAGMENT_SHADER_BIT;
|
||||||
accessFlags |= VK_ACCESS_VERTEX_ATTRIBUTE_READ_BIT | VK_ACCESS_UNIFORM_READ_BIT | VK_ACCESS_SHADER_READ_BIT;
|
accessFlags |= VK_ACCESS_2_VERTEX_ATTRIBUTE_READ_BIT | VK_ACCESS_2_UNIFORM_READ_BIT | VK_ACCESS_2_SHADER_READ_BIT;
|
||||||
}
|
}
|
||||||
|
|
||||||
if constexpr ((TSyncOp & BUFFER_SHADER_WRITE) != 0)
|
if constexpr ((TSyncOp & BUFFER_SHADER_WRITE) != 0)
|
||||||
{
|
{
|
||||||
stages |= VK_PIPELINE_STAGE_VERTEX_SHADER_BIT | VK_PIPELINE_STAGE_GEOMETRY_SHADER_BIT | VK_PIPELINE_STAGE_FRAGMENT_SHADER_BIT;
|
stages |= VK_PIPELINE_STAGE_2_VERTEX_SHADER_BIT | VK_PIPELINE_STAGE_2_GEOMETRY_SHADER_BIT | VK_PIPELINE_STAGE_2_FRAGMENT_SHADER_BIT;
|
||||||
accessFlags |= VK_ACCESS_SHADER_WRITE_BIT;
|
accessFlags |= VK_ACCESS_2_SHADER_WRITE_BIT;
|
||||||
}
|
}
|
||||||
|
|
||||||
if constexpr ((TSyncOp & ANY_TRANSFER) != 0)
|
if constexpr ((TSyncOp & ANY_TRANSFER) != 0)
|
||||||
{
|
{
|
||||||
//stages |= VK_PIPELINE_STAGE_TRANSFER_BIT | VK_PIPELINE_STAGE_HOST_BIT;
|
stages |= VK_PIPELINE_STAGE_2_TRANSFER_BIT;
|
||||||
//accessFlags |= VK_ACCESS_TRANSFER_READ_BIT | VK_ACCESS_TRANSFER_WRITE_BIT | VK_ACCESS_HOST_READ_BIT | VK_ACCESS_HOST_WRITE_BIT;
|
accessFlags |= VK_ACCESS_2_TRANSFER_READ_BIT | VK_ACCESS_2_TRANSFER_WRITE_BIT;
|
||||||
stages |= VK_PIPELINE_STAGE_TRANSFER_BIT;
|
|
||||||
accessFlags |= VK_ACCESS_TRANSFER_READ_BIT | VK_ACCESS_TRANSFER_WRITE_BIT;
|
|
||||||
|
|
||||||
//accessFlags |= VK_ACCESS_MEMORY_READ_BIT;
|
|
||||||
//accessFlags |= VK_ACCESS_MEMORY_WRITE_BIT;
|
|
||||||
}
|
}
|
||||||
|
|
||||||
if constexpr ((TSyncOp & TRANSFER_READ) != 0)
|
if constexpr ((TSyncOp & TRANSFER_READ) != 0)
|
||||||
{
|
{
|
||||||
stages |= VK_PIPELINE_STAGE_TRANSFER_BIT;
|
stages |= VK_PIPELINE_STAGE_2_TRANSFER_BIT;
|
||||||
accessFlags |= VK_ACCESS_TRANSFER_READ_BIT;
|
accessFlags |= VK_ACCESS_2_TRANSFER_READ_BIT;
|
||||||
|
|
||||||
//accessFlags |= VK_ACCESS_MEMORY_READ_BIT;
|
|
||||||
}
|
}
|
||||||
|
|
||||||
if constexpr ((TSyncOp & TRANSFER_WRITE) != 0)
|
if constexpr ((TSyncOp & TRANSFER_WRITE) != 0)
|
||||||
{
|
{
|
||||||
stages |= VK_PIPELINE_STAGE_TRANSFER_BIT;
|
stages |= VK_PIPELINE_STAGE_2_TRANSFER_BIT;
|
||||||
accessFlags |= VK_ACCESS_TRANSFER_WRITE_BIT;
|
accessFlags |= VK_ACCESS_2_TRANSFER_WRITE_BIT;
|
||||||
|
|
||||||
//accessFlags |= VK_ACCESS_MEMORY_WRITE_BIT;
|
|
||||||
}
|
}
|
||||||
|
|
||||||
if constexpr ((TSyncOp & HOST_WRITE) != 0)
|
if constexpr ((TSyncOp & HOST_WRITE) != 0)
|
||||||
{
|
{
|
||||||
stages |= VK_PIPELINE_STAGE_HOST_BIT;
|
stages |= VK_PIPELINE_STAGE_2_HOST_BIT;
|
||||||
accessFlags |= VK_ACCESS_HOST_WRITE_BIT;
|
accessFlags |= VK_ACCESS_2_HOST_WRITE_BIT;
|
||||||
}
|
}
|
||||||
|
|
||||||
if constexpr ((TSyncOp & HOST_READ) != 0)
|
if constexpr ((TSyncOp & HOST_READ) != 0)
|
||||||
{
|
{
|
||||||
stages |= VK_PIPELINE_STAGE_HOST_BIT;
|
stages |= VK_PIPELINE_STAGE_2_HOST_BIT;
|
||||||
accessFlags |= VK_ACCESS_HOST_READ_BIT;
|
accessFlags |= VK_ACCESS_2_HOST_READ_BIT;
|
||||||
}
|
}
|
||||||
|
|
||||||
if constexpr ((TSyncOp & IMAGE_READ) != 0)
|
if constexpr ((TSyncOp & IMAGE_READ) != 0)
|
||||||
{
|
{
|
||||||
stages |= VK_PIPELINE_STAGE_VERTEX_SHADER_BIT | VK_PIPELINE_STAGE_GEOMETRY_SHADER_BIT | VK_PIPELINE_STAGE_FRAGMENT_SHADER_BIT;
|
stages |= VK_PIPELINE_STAGE_2_VERTEX_SHADER_BIT | VK_PIPELINE_STAGE_2_GEOMETRY_SHADER_BIT | VK_PIPELINE_STAGE_2_FRAGMENT_SHADER_BIT;
|
||||||
accessFlags |= VK_ACCESS_SHADER_READ_BIT;
|
accessFlags |= VK_ACCESS_2_SHADER_READ_BIT;
|
||||||
|
|
||||||
stages |= VK_PIPELINE_STAGE_COLOR_ATTACHMENT_OUTPUT_BIT;
|
stages |= VK_PIPELINE_STAGE_2_COLOR_ATTACHMENT_OUTPUT_BIT;
|
||||||
accessFlags |= VK_ACCESS_COLOR_ATTACHMENT_READ_BIT;
|
accessFlags |= VK_ACCESS_2_COLOR_ATTACHMENT_READ_BIT;
|
||||||
|
|
||||||
stages |= VK_PIPELINE_STAGE_EARLY_FRAGMENT_TESTS_BIT | VK_PIPELINE_STAGE_LATE_FRAGMENT_TESTS_BIT;
|
stages |= VK_PIPELINE_STAGE_2_EARLY_FRAGMENT_TESTS_BIT | VK_PIPELINE_STAGE_2_LATE_FRAGMENT_TESTS_BIT;
|
||||||
accessFlags |= VK_ACCESS_DEPTH_STENCIL_ATTACHMENT_READ_BIT;
|
accessFlags |= VK_ACCESS_2_DEPTH_STENCIL_ATTACHMENT_READ_BIT;
|
||||||
}
|
}
|
||||||
|
|
||||||
if constexpr ((TSyncOp & IMAGE_WRITE) != 0)
|
if constexpr ((TSyncOp & IMAGE_WRITE) != 0)
|
||||||
{
|
{
|
||||||
stages |= VK_PIPELINE_STAGE_COLOR_ATTACHMENT_OUTPUT_BIT;
|
stages |= VK_PIPELINE_STAGE_2_COLOR_ATTACHMENT_OUTPUT_BIT;
|
||||||
accessFlags |= VK_ACCESS_COLOR_ATTACHMENT_WRITE_BIT;
|
accessFlags |= VK_ACCESS_2_COLOR_ATTACHMENT_WRITE_BIT;
|
||||||
|
|
||||||
stages |= VK_PIPELINE_STAGE_EARLY_FRAGMENT_TESTS_BIT | VK_PIPELINE_STAGE_LATE_FRAGMENT_TESTS_BIT;
|
stages |= VK_PIPELINE_STAGE_2_EARLY_FRAGMENT_TESTS_BIT | VK_PIPELINE_STAGE_2_LATE_FRAGMENT_TESTS_BIT;
|
||||||
accessFlags |= VK_ACCESS_DEPTH_STENCIL_ATTACHMENT_WRITE_BIT;
|
accessFlags |= VK_ACCESS_2_DEPTH_STENCIL_ATTACHMENT_WRITE_BIT;
|
||||||
}
|
}
|
||||||
}
|
}
|
||||||
|
|
||||||
template<uint32 TSrcSyncOp, uint32 TDstSyncOp>
|
template<uint32 TSrcSyncOp, uint32 TDstSyncOp>
|
||||||
void barrier_bufferRange(VkBuffer buffer, VkDeviceSize offset, VkDeviceSize size)
|
void barrier_bufferRange(VkBuffer buffer, VkDeviceSize offset, VkDeviceSize size)
|
||||||
{
|
{
|
||||||
VkBufferMemoryBarrier bufMemBarrier{};
|
VkBufferMemoryBarrier2 bufMemBarrier{};
|
||||||
bufMemBarrier.sType = VK_STRUCTURE_TYPE_BUFFER_MEMORY_BARRIER;
|
bufMemBarrier.sType = VK_STRUCTURE_TYPE_BUFFER_MEMORY_BARRIER_2;
|
||||||
bufMemBarrier.pNext = nullptr;
|
bufMemBarrier.pNext = nullptr;
|
||||||
bufMemBarrier.srcQueueFamilyIndex = VK_QUEUE_FAMILY_IGNORED;
|
bufMemBarrier.srcQueueFamilyIndex = VK_QUEUE_FAMILY_IGNORED;
|
||||||
bufMemBarrier.dstQueueFamilyIndex = VK_QUEUE_FAMILY_IGNORED;
|
bufMemBarrier.dstQueueFamilyIndex = VK_QUEUE_FAMILY_IGNORED;
|
||||||
|
|
||||||
VkPipelineStageFlags srcStages = 0;
|
barrier_calcStageAndMask<TSrcSyncOp>(bufMemBarrier.srcStageMask, bufMemBarrier.srcAccessMask);
|
||||||
VkPipelineStageFlags dstStages = 0;
|
barrier_calcStageAndMask<TDstSyncOp>(bufMemBarrier.dstStageMask, bufMemBarrier.dstAccessMask);
|
||||||
|
|
||||||
bufMemBarrier.srcAccessMask = 0;
|
|
||||||
bufMemBarrier.dstAccessMask = 0;
|
|
||||||
|
|
||||||
barrier_calcStageAndMask<TSrcSyncOp>(srcStages, bufMemBarrier.srcAccessMask);
|
|
||||||
barrier_calcStageAndMask<TDstSyncOp>(dstStages, bufMemBarrier.dstAccessMask);
|
|
||||||
|
|
||||||
bufMemBarrier.buffer = buffer;
|
bufMemBarrier.buffer = buffer;
|
||||||
bufMemBarrier.offset = offset;
|
bufMemBarrier.offset = offset;
|
||||||
bufMemBarrier.size = size;
|
bufMemBarrier.size = size;
|
||||||
vkCmdPipelineBarrier(m_state.currentCommandBuffer, srcStages, dstStages, 0, 0, nullptr, 1, &bufMemBarrier, 0, nullptr);
|
|
||||||
|
VkDependencyInfo depInfo{};
|
||||||
|
depInfo.sType = VK_STRUCTURE_TYPE_DEPENDENCY_INFO;
|
||||||
|
depInfo.pNext = nullptr;
|
||||||
|
depInfo.bufferMemoryBarrierCount = 1;
|
||||||
|
depInfo.pBufferMemoryBarriers = &bufMemBarrier;
|
||||||
|
vkCmdPipelineBarrier2KHR(m_state.currentCommandBuffer, &depInfo);
|
||||||
}
|
}
|
||||||
|
|
||||||
template<uint32 TSrcSyncOpA, uint32 TDstSyncOpA, uint32 TSrcSyncOpB, uint32 TDstSyncOpB>
|
template<uint32 TSrcSyncOpA, uint32 TDstSyncOpA, uint32 TSrcSyncOpB, uint32 TDstSyncOpB>
|
||||||
void barrier_bufferRange(VkBuffer bufferA, VkDeviceSize offsetA, VkDeviceSize sizeA,
|
void barrier_bufferRange(VkBuffer bufferA, VkDeviceSize offsetA, VkDeviceSize sizeA,
|
||||||
VkBuffer bufferB, VkDeviceSize offsetB, VkDeviceSize sizeB)
|
VkBuffer bufferB, VkDeviceSize offsetB, VkDeviceSize sizeB)
|
||||||
{
|
{
|
||||||
VkPipelineStageFlags srcStagesA = 0;
|
VkBufferMemoryBarrier2 bufMemBarrier2[2] = {};
|
||||||
VkPipelineStageFlags dstStagesA = 0;
|
bufMemBarrier2[0].sType = VK_STRUCTURE_TYPE_BUFFER_MEMORY_BARRIER_2_KHR;
|
||||||
VkPipelineStageFlags srcStagesB = 0;
|
bufMemBarrier2[0].pNext = nullptr;
|
||||||
VkPipelineStageFlags dstStagesB = 0;
|
bufMemBarrier2[0].srcQueueFamilyIndex = VK_QUEUE_FAMILY_IGNORED;
|
||||||
|
bufMemBarrier2[0].dstQueueFamilyIndex = VK_QUEUE_FAMILY_IGNORED;
|
||||||
|
bufMemBarrier2[0].buffer = bufferA;
|
||||||
|
bufMemBarrier2[0].offset = offsetA;
|
||||||
|
bufMemBarrier2[0].size = sizeA;
|
||||||
|
barrier_calcStageAndMask<TSrcSyncOpA>(bufMemBarrier2[0].srcStageMask, bufMemBarrier2[0].srcAccessMask);
|
||||||
|
barrier_calcStageAndMask<TDstSyncOpA>(bufMemBarrier2[0].dstStageMask, bufMemBarrier2[0].dstAccessMask);
|
||||||
|
|
||||||
VkBufferMemoryBarrier bufMemBarrier[2];
|
bufMemBarrier2[1].sType = VK_STRUCTURE_TYPE_BUFFER_MEMORY_BARRIER_2_KHR;
|
||||||
|
bufMemBarrier2[1].pNext = nullptr;
|
||||||
|
bufMemBarrier2[1].srcQueueFamilyIndex = VK_QUEUE_FAMILY_IGNORED;
|
||||||
|
bufMemBarrier2[1].dstQueueFamilyIndex = VK_QUEUE_FAMILY_IGNORED;
|
||||||
|
bufMemBarrier2[1].buffer = bufferB;
|
||||||
|
bufMemBarrier2[1].offset = offsetB;
|
||||||
|
bufMemBarrier2[1].size = sizeB;
|
||||||
|
barrier_calcStageAndMask<TSrcSyncOpB>(bufMemBarrier2[1].srcStageMask, bufMemBarrier2[1].srcAccessMask);
|
||||||
|
barrier_calcStageAndMask<TDstSyncOpB>(bufMemBarrier2[1].dstStageMask, bufMemBarrier2[1].dstAccessMask);
|
||||||
|
|
||||||
bufMemBarrier[0].sType = VK_STRUCTURE_TYPE_BUFFER_MEMORY_BARRIER;
|
VkDependencyInfo dependencyInfo = {};
|
||||||
bufMemBarrier[0].pNext = nullptr;
|
dependencyInfo.sType = VK_STRUCTURE_TYPE_DEPENDENCY_INFO;
|
||||||
bufMemBarrier[0].srcQueueFamilyIndex = VK_QUEUE_FAMILY_IGNORED;
|
dependencyInfo.pNext = nullptr;
|
||||||
bufMemBarrier[0].dstQueueFamilyIndex = VK_QUEUE_FAMILY_IGNORED;
|
dependencyInfo.bufferMemoryBarrierCount = 2;
|
||||||
bufMemBarrier[0].srcAccessMask = 0;
|
dependencyInfo.pBufferMemoryBarriers = bufMemBarrier2;
|
||||||
bufMemBarrier[0].dstAccessMask = 0;
|
vkCmdPipelineBarrier2KHR(m_state.currentCommandBuffer, &dependencyInfo);
|
||||||
barrier_calcStageAndMask<TSrcSyncOpA>(srcStagesA, bufMemBarrier[0].srcAccessMask);
|
|
||||||
barrier_calcStageAndMask<TDstSyncOpA>(dstStagesA, bufMemBarrier[0].dstAccessMask);
|
|
||||||
bufMemBarrier[0].buffer = bufferA;
|
|
||||||
bufMemBarrier[0].offset = offsetA;
|
|
||||||
bufMemBarrier[0].size = sizeA;
|
|
||||||
|
|
||||||
bufMemBarrier[1].sType = VK_STRUCTURE_TYPE_BUFFER_MEMORY_BARRIER;
|
|
||||||
bufMemBarrier[1].pNext = nullptr;
|
|
||||||
bufMemBarrier[1].srcQueueFamilyIndex = VK_QUEUE_FAMILY_IGNORED;
|
|
||||||
bufMemBarrier[1].dstQueueFamilyIndex = VK_QUEUE_FAMILY_IGNORED;
|
|
||||||
bufMemBarrier[1].srcAccessMask = 0;
|
|
||||||
bufMemBarrier[1].dstAccessMask = 0;
|
|
||||||
barrier_calcStageAndMask<TSrcSyncOpB>(srcStagesB, bufMemBarrier[1].srcAccessMask);
|
|
||||||
barrier_calcStageAndMask<TDstSyncOpB>(dstStagesB, bufMemBarrier[1].dstAccessMask);
|
|
||||||
bufMemBarrier[1].buffer = bufferB;
|
|
||||||
bufMemBarrier[1].offset = offsetB;
|
|
||||||
bufMemBarrier[1].size = sizeB;
|
|
||||||
|
|
||||||
vkCmdPipelineBarrier(m_state.currentCommandBuffer, srcStagesA|srcStagesB, dstStagesA|dstStagesB, 0, 0, nullptr, 2, bufMemBarrier, 0, nullptr);
|
|
||||||
}
|
}
|
||||||
|
|
||||||
void barrier_sequentializeTransfer()
|
void barrier_sequentializeTransfer()
|
||||||
{
|
{
|
||||||
VkMemoryBarrier memBarrier{};
|
VkMemoryBarrier2 memoryBarrier2{};
|
||||||
memBarrier.sType = VK_STRUCTURE_TYPE_MEMORY_BARRIER;
|
memoryBarrier2.sType = VK_STRUCTURE_TYPE_MEMORY_BARRIER_2;
|
||||||
memBarrier.pNext = nullptr;
|
memoryBarrier2.pNext = nullptr;
|
||||||
|
memoryBarrier2.srcStageMask = VK_PIPELINE_STAGE_2_TRANSFER_BIT;
|
||||||
|
memoryBarrier2.srcAccessMask = VK_ACCESS_2_TRANSFER_READ_BIT | VK_ACCESS_2_TRANSFER_WRITE_BIT;
|
||||||
|
memoryBarrier2.dstStageMask = VK_PIPELINE_STAGE_2_TOP_OF_PIPE_BIT;
|
||||||
|
memoryBarrier2.dstAccessMask = VK_ACCESS_2_MEMORY_READ_BIT | VK_ACCESS_2_MEMORY_WRITE_BIT;
|
||||||
|
|
||||||
VkPipelineStageFlags srcStages = VK_PIPELINE_STAGE_TRANSFER_BIT;
|
VkDependencyInfo dependencyInfo{};
|
||||||
VkPipelineStageFlags dstStages = VK_PIPELINE_STAGE_TOP_OF_PIPE_BIT;
|
dependencyInfo.sType = VK_STRUCTURE_TYPE_DEPENDENCY_INFO;
|
||||||
|
dependencyInfo.pNext = nullptr;
|
||||||
memBarrier.srcAccessMask = VK_ACCESS_TRANSFER_READ_BIT | VK_ACCESS_TRANSFER_WRITE_BIT;
|
dependencyInfo.memoryBarrierCount = 1;
|
||||||
memBarrier.dstAccessMask = 0;
|
dependencyInfo.pMemoryBarriers = &memoryBarrier2;
|
||||||
|
dependencyInfo.bufferMemoryBarrierCount = 0;
|
||||||
memBarrier.srcAccessMask |= (VK_ACCESS_MEMORY_READ_BIT | VK_ACCESS_MEMORY_WRITE_BIT);
|
dependencyInfo.imageMemoryBarrierCount = 0;
|
||||||
memBarrier.dstAccessMask |= (VK_ACCESS_MEMORY_READ_BIT | VK_ACCESS_MEMORY_WRITE_BIT);
|
vkCmdPipelineBarrier2KHR(m_state.currentCommandBuffer, &dependencyInfo);
|
||||||
|
|
||||||
vkCmdPipelineBarrier(m_state.currentCommandBuffer, srcStages, dstStages, 0, 1, &memBarrier, 0, nullptr, 0, nullptr);
|
|
||||||
}
|
}
|
||||||
|
|
||||||
void barrier_sequentializeCommand()
|
void barrier_sequentializeCommand()
|
||||||
{
|
{
|
||||||
VkPipelineStageFlags srcStages = VK_PIPELINE_STAGE_BOTTOM_OF_PIPE_BIT;
|
VkMemoryBarrier2 memoryBarrier = {};
|
||||||
VkPipelineStageFlags dstStages = VK_PIPELINE_STAGE_TOP_OF_PIPE_BIT;
|
memoryBarrier.sType = VK_STRUCTURE_TYPE_MEMORY_BARRIER_2;
|
||||||
|
memoryBarrier.srcStageMask = VK_PIPELINE_STAGE_2_BOTTOM_OF_PIPE_BIT_KHR;
|
||||||
|
memoryBarrier.srcAccessMask = 0;
|
||||||
|
memoryBarrier.dstStageMask = VK_PIPELINE_STAGE_2_TOP_OF_PIPE_BIT_KHR;
|
||||||
|
memoryBarrier.dstAccessMask = 0;
|
||||||
|
|
||||||
vkCmdPipelineBarrier(m_state.currentCommandBuffer, srcStages, dstStages, 0, 0, nullptr, 0, nullptr, 0, nullptr);
|
VkDependencyInfo dependencyInfo = {};
|
||||||
|
dependencyInfo.sType = VK_STRUCTURE_TYPE_DEPENDENCY_INFO;
|
||||||
|
dependencyInfo.dependencyFlags = 0;
|
||||||
|
dependencyInfo.memoryBarrierCount = 1;
|
||||||
|
dependencyInfo.pMemoryBarriers = &memoryBarrier;
|
||||||
|
vkCmdPipelineBarrier2KHR(m_state.currentCommandBuffer, &dependencyInfo);
|
||||||
}
|
}
|
||||||
|
|
||||||
template<uint32 TSrcSyncOp, uint32 TDstSyncOp>
|
template<uint32 TSrcSyncOp, uint32 TDstSyncOp>
|
||||||
void barrier_image(VkImage imageVk, VkImageSubresourceRange& subresourceRange, VkImageLayout oldLayout, VkImageLayout newLayout)
|
void barrier_image(VkImage imageVk, VkImageSubresourceRange& subresourceRange, VkImageLayout oldLayout, VkImageLayout newLayout)
|
||||||
{
|
{
|
||||||
VkPipelineStageFlags srcStages = 0;
|
VkImageMemoryBarrier2 imageMemBarrier2{};
|
||||||
VkPipelineStageFlags dstStages = 0;
|
imageMemBarrier2.sType = VK_STRUCTURE_TYPE_IMAGE_MEMORY_BARRIER_2;
|
||||||
|
imageMemBarrier2.oldLayout = oldLayout;
|
||||||
|
imageMemBarrier2.newLayout = newLayout;
|
||||||
|
imageMemBarrier2.srcQueueFamilyIndex = VK_QUEUE_FAMILY_IGNORED;
|
||||||
|
imageMemBarrier2.dstQueueFamilyIndex = VK_QUEUE_FAMILY_IGNORED;
|
||||||
|
imageMemBarrier2.image = imageVk;
|
||||||
|
imageMemBarrier2.subresourceRange = subresourceRange;
|
||||||
|
|
||||||
VkImageMemoryBarrier imageMemBarrier{};
|
barrier_calcStageAndMask<TSrcSyncOp>(imageMemBarrier2.srcStageMask, imageMemBarrier2.srcAccessMask);
|
||||||
imageMemBarrier.sType = VK_STRUCTURE_TYPE_IMAGE_MEMORY_BARRIER;
|
barrier_calcStageAndMask<TDstSyncOp>(imageMemBarrier2.dstStageMask, imageMemBarrier2.dstAccessMask);
|
||||||
imageMemBarrier.srcQueueFamilyIndex = VK_QUEUE_FAMILY_IGNORED;
|
|
||||||
imageMemBarrier.dstQueueFamilyIndex = VK_QUEUE_FAMILY_IGNORED;
|
|
||||||
imageMemBarrier.srcAccessMask = 0;
|
|
||||||
imageMemBarrier.dstAccessMask = 0;
|
|
||||||
barrier_calcStageAndMask<TSrcSyncOp>(srcStages, imageMemBarrier.srcAccessMask);
|
|
||||||
barrier_calcStageAndMask<TDstSyncOp>(dstStages, imageMemBarrier.dstAccessMask);
|
|
||||||
imageMemBarrier.image = imageVk;
|
|
||||||
imageMemBarrier.subresourceRange = subresourceRange;
|
|
||||||
imageMemBarrier.oldLayout = oldLayout;
|
|
||||||
imageMemBarrier.newLayout = newLayout;
|
|
||||||
|
|
||||||
vkCmdPipelineBarrier(m_state.currentCommandBuffer,
|
VkDependencyInfo dependencyInfo{};
|
||||||
srcStages, dstStages,
|
dependencyInfo.sType = VK_STRUCTURE_TYPE_DEPENDENCY_INFO;
|
||||||
0,
|
dependencyInfo.imageMemoryBarrierCount = 1;
|
||||||
0, NULL,
|
dependencyInfo.pImageMemoryBarriers = &imageMemBarrier2;
|
||||||
0, NULL,
|
vkCmdPipelineBarrier2KHR(m_state.currentCommandBuffer, &dependencyInfo);
|
||||||
1, &imageMemBarrier);
|
|
||||||
}
|
}
|
||||||
|
|
||||||
template<uint32 TSrcSyncOp, uint32 TDstSyncOp>
|
template<uint32 TSrcSyncOp, uint32 TDstSyncOp>
|
||||||
|
@ -942,7 +933,6 @@ private:
|
||||||
vkTexture->SetImageLayout(subresourceRange, newLayout);
|
vkTexture->SetImageLayout(subresourceRange, newLayout);
|
||||||
}
|
}
|
||||||
|
|
||||||
|
|
||||||
public:
|
public:
|
||||||
bool GetDisableMultithreadedCompilation() const { return m_featureControl.disableMultithreadedCompilation; }
|
bool GetDisableMultithreadedCompilation() const { return m_featureControl.disableMultithreadedCompilation; }
|
||||||
bool UseTFViaSSBO() const { return m_featureControl.mode.useTFEmulationViaSSBO; }
|
bool UseTFViaSSBO() const { return m_featureControl.mode.useTFEmulationViaSSBO; }
|
||||||
|
|
|
@ -1033,29 +1033,18 @@ void VulkanRenderer::sync_inputTexturesChanged()
|
||||||
// barrier here
|
// barrier here
|
||||||
if (writeFlushRequired)
|
if (writeFlushRequired)
|
||||||
{
|
{
|
||||||
VkMemoryBarrier memoryBarrier{};
|
VkMemoryBarrier2 memoryBarrier2{};
|
||||||
memoryBarrier.sType = VK_STRUCTURE_TYPE_MEMORY_BARRIER;
|
memoryBarrier2.sType = VK_STRUCTURE_TYPE_MEMORY_BARRIER_2_KHR;
|
||||||
memoryBarrier.srcAccessMask = 0;
|
memoryBarrier2.srcStageMask = VK_PIPELINE_STAGE_2_COLOR_ATTACHMENT_OUTPUT_BIT_KHR | VK_PIPELINE_STAGE_2_EARLY_FRAGMENT_TESTS_BIT_KHR | VK_PIPELINE_STAGE_2_LATE_FRAGMENT_TESTS_BIT_KHR;
|
||||||
memoryBarrier.dstAccessMask = 0;
|
memoryBarrier2.srcAccessMask = VK_ACCESS_2_COLOR_ATTACHMENT_WRITE_BIT_KHR | VK_ACCESS_2_DEPTH_STENCIL_ATTACHMENT_WRITE_BIT_KHR;
|
||||||
|
memoryBarrier2.dstStageMask = VK_PIPELINE_STAGE_2_COLOR_ATTACHMENT_OUTPUT_BIT_KHR | VK_PIPELINE_STAGE_2_VERTEX_SHADER_BIT_KHR | VK_PIPELINE_STAGE_2_GEOMETRY_SHADER_BIT_KHR | VK_PIPELINE_STAGE_2_FRAGMENT_SHADER_BIT_KHR | VK_PIPELINE_STAGE_2_EARLY_FRAGMENT_TESTS_BIT_KHR | VK_PIPELINE_STAGE_2_LATE_FRAGMENT_TESTS_BIT_KHR;
|
||||||
VkPipelineStageFlags srcStage = 0;
|
memoryBarrier2.dstAccessMask = VK_ACCESS_2_COLOR_ATTACHMENT_READ_BIT_KHR | VK_ACCESS_2_COLOR_ATTACHMENT_WRITE_BIT_KHR | VK_ACCESS_2_DEPTH_STENCIL_ATTACHMENT_READ_BIT_KHR | VK_ACCESS_2_DEPTH_STENCIL_ATTACHMENT_WRITE_BIT_KHR | VK_ACCESS_2_SHADER_READ_BIT_KHR;
|
||||||
VkPipelineStageFlags dstStage = 0;
|
VkDependencyInfo dependencyInfo{};
|
||||||
|
dependencyInfo.sType = VK_STRUCTURE_TYPE_DEPENDENCY_INFO_KHR;
|
||||||
// src
|
dependencyInfo.dependencyFlags = 0;
|
||||||
srcStage |= VK_PIPELINE_STAGE_COLOR_ATTACHMENT_OUTPUT_BIT;
|
dependencyInfo.memoryBarrierCount = 1;
|
||||||
memoryBarrier.srcAccessMask |= VK_ACCESS_COLOR_ATTACHMENT_WRITE_BIT;
|
dependencyInfo.pMemoryBarriers = &memoryBarrier2;
|
||||||
|
vkCmdPipelineBarrier2KHR(m_state.currentCommandBuffer, &dependencyInfo);
|
||||||
srcStage |= VK_PIPELINE_STAGE_EARLY_FRAGMENT_TESTS_BIT | VK_PIPELINE_STAGE_LATE_FRAGMENT_TESTS_BIT;
|
|
||||||
memoryBarrier.srcAccessMask |= VK_ACCESS_DEPTH_STENCIL_ATTACHMENT_WRITE_BIT;
|
|
||||||
|
|
||||||
// dst
|
|
||||||
dstStage |= VK_PIPELINE_STAGE_COLOR_ATTACHMENT_OUTPUT_BIT | VK_PIPELINE_STAGE_VERTEX_SHADER_BIT | VK_PIPELINE_STAGE_GEOMETRY_SHADER_BIT | VK_PIPELINE_STAGE_FRAGMENT_SHADER_BIT;
|
|
||||||
memoryBarrier.dstAccessMask |= VK_ACCESS_COLOR_ATTACHMENT_READ_BIT | VK_ACCESS_COLOR_ATTACHMENT_WRITE_BIT | VK_ACCESS_SHADER_READ_BIT;
|
|
||||||
|
|
||||||
dstStage |= VK_PIPELINE_STAGE_EARLY_FRAGMENT_TESTS_BIT | VK_PIPELINE_STAGE_LATE_FRAGMENT_TESTS_BIT | VK_PIPELINE_STAGE_VERTEX_SHADER_BIT | VK_PIPELINE_STAGE_GEOMETRY_SHADER_BIT | VK_PIPELINE_STAGE_FRAGMENT_SHADER_BIT;
|
|
||||||
memoryBarrier.dstAccessMask |= VK_ACCESS_DEPTH_STENCIL_ATTACHMENT_READ_BIT | VK_ACCESS_DEPTH_STENCIL_ATTACHMENT_WRITE_BIT | VK_ACCESS_SHADER_READ_BIT;
|
|
||||||
|
|
||||||
vkCmdPipelineBarrier(m_state.currentCommandBuffer, srcStage, dstStage, 0, 1, &memoryBarrier, 0, nullptr, 0, nullptr);
|
|
||||||
|
|
||||||
performanceMonitor.vk.numDrawBarriersPerFrame.increment();
|
performanceMonitor.vk.numDrawBarriersPerFrame.increment();
|
||||||
|
|
||||||
|
|
Loading…
Reference in New Issue