| /* |
| * Copyright (c) 2019-2021 Valve Corporation |
| * Copyright (c) 2019-2021 LunarG, Inc. |
| * |
| * Licensed under the Apache License, Version 2.0 (the "License"); |
| * you may not use this file except in compliance with the License. |
| * You may obtain a copy of the License at |
| * |
| * http://www.apache.org/licenses/LICENSE-2.0 |
| * |
| * Unless required by applicable law or agreed to in writing, software |
| * distributed under the License is distributed on an "AS IS" BASIS, |
| * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. |
| * See the License for the specific language governing permissions and |
| * limitations under the License. |
| * |
| * Author: John Zulauf <jzulauf@lunarg.com> |
| * Author: Locke Lin <locke@lunarg.com> |
| * Author: Jeremy Gebben <jeremyg@lunarg.com> |
| */ |
| #include "sync_utils.h" |
| #include "state_tracker.h" |
| #include "synchronization_validation_types.h" |
| |
| namespace sync_utils { |
| static constexpr uint32_t kNumPipelineStageBits = sizeof(VkPipelineStageFlags2KHR) * 8; |
| |
| VkPipelineStageFlags2KHR DisabledPipelineStages(const DeviceFeatures &features) { |
| VkPipelineStageFlags2KHR result = 0; |
| if (!features.core.geometryShader) { |
| result |= VK_PIPELINE_STAGE_GEOMETRY_SHADER_BIT; |
| } |
| if (!features.core.tessellationShader) { |
| result |= VK_PIPELINE_STAGE_TESSELLATION_CONTROL_SHADER_BIT | VK_PIPELINE_STAGE_TESSELLATION_EVALUATION_SHADER_BIT; |
| } |
| if (!features.conditional_rendering.conditionalRendering) { |
| result |= VK_PIPELINE_STAGE_CONDITIONAL_RENDERING_BIT_EXT; |
| } |
| if (!features.fragment_density_map_features.fragmentDensityMap) { |
| result |= VK_PIPELINE_STAGE_FRAGMENT_DENSITY_PROCESS_BIT_EXT; |
| } |
| if (!features.transform_feedback_features.transformFeedback) { |
| result |= VK_PIPELINE_STAGE_TRANSFORM_FEEDBACK_BIT_EXT; |
| } |
| if (!features.mesh_shader.meshShader) { |
| result |= VK_PIPELINE_STAGE_MESH_SHADER_BIT_NV; |
| } |
| if (!features.mesh_shader.taskShader) { |
| result |= VK_PIPELINE_STAGE_TASK_SHADER_BIT_NV; |
| } |
| if (!features.fragment_shading_rate_features.pipelineFragmentShadingRate && !features.shading_rate_image.shadingRateImage) { |
| result |= VK_PIPELINE_STAGE_FRAGMENT_SHADING_RATE_ATTACHMENT_BIT_KHR; |
| } |
| // TODO: VK_PIPELINE_STAGE_ACCELERATION_STRUCTURE_BUILD_BIT_KHR |
| // TODO: VK_PIPELINE_STAGE_RAY_TRACING_SHADER_BIT_KHR |
| return result; |
| } |
| |
| VkPipelineStageFlags2KHR ExpandPipelineStages(VkPipelineStageFlags2KHR stage_mask, VkQueueFlags queue_flags, |
| const VkPipelineStageFlags2KHR disabled_feature_mask) { |
| VkPipelineStageFlags2KHR expanded = stage_mask; |
| |
| if (VK_PIPELINE_STAGE_ALL_COMMANDS_BIT & stage_mask) { |
| expanded &= ~VK_PIPELINE_STAGE_ALL_COMMANDS_BIT; |
| for (const auto &all_commands : syncAllCommandStagesByQueueFlags) { |
| if (all_commands.first & queue_flags) { |
| expanded |= all_commands.second & ~disabled_feature_mask; |
| } |
| } |
| } |
| if (VK_PIPELINE_STAGE_ALL_GRAPHICS_BIT & stage_mask) { |
| expanded &= ~VK_PIPELINE_STAGE_ALL_GRAPHICS_BIT; |
| // Make sure we don't pull in the HOST stage from expansion, but keep it if set by the caller. |
| // The syncAllCommandStagesByQueueFlags table includes HOST for all queue types since it is |
| // allowed but it shouldn't be part of ALL_GRAPHICS |
| expanded |= |
| syncAllCommandStagesByQueueFlags.at(VK_QUEUE_GRAPHICS_BIT) & ~disabled_feature_mask & ~VK_PIPELINE_STAGE_HOST_BIT; |
| } |
| if (VK_PIPELINE_STAGE_2_ALL_TRANSFER_BIT_KHR & stage_mask) { |
| expanded &= ~VK_PIPELINE_STAGE_2_ALL_TRANSFER_BIT_KHR; |
| expanded |= VK_PIPELINE_STAGE_2_COPY_BIT_KHR | VK_PIPELINE_STAGE_2_RESOLVE_BIT_KHR | VK_PIPELINE_STAGE_2_BLIT_BIT_KHR | |
| VK_PIPELINE_STAGE_2_CLEAR_BIT_KHR; |
| } |
| if (VK_PIPELINE_STAGE_2_VERTEX_INPUT_BIT_KHR & stage_mask) { |
| expanded &= ~VK_PIPELINE_STAGE_2_VERTEX_INPUT_BIT_KHR; |
| expanded |= VK_PIPELINE_STAGE_2_INDEX_INPUT_BIT_KHR | VK_PIPELINE_STAGE_2_VERTEX_ATTRIBUTE_INPUT_BIT_KHR; |
| } |
| if (VK_PIPELINE_STAGE_2_PRE_RASTERIZATION_SHADERS_BIT_KHR & stage_mask) { |
| expanded &= ~VK_PIPELINE_STAGE_2_PRE_RASTERIZATION_SHADERS_BIT_KHR; |
| expanded |= VK_PIPELINE_STAGE_2_VERTEX_SHADER_BIT_KHR | VK_PIPELINE_STAGE_2_TESSELLATION_CONTROL_SHADER_BIT_KHR | |
| VK_PIPELINE_STAGE_2_TESSELLATION_EVALUATION_SHADER_BIT_KHR | VK_PIPELINE_STAGE_2_GEOMETRY_SHADER_BIT_KHR; |
| } |
| |
| return expanded; |
| } |
| |
| static const auto kShaderReadExpandBits = |
| VK_ACCESS_2_UNIFORM_READ_BIT_KHR | VK_ACCESS_2_SHADER_SAMPLED_READ_BIT_KHR | VK_ACCESS_2_SHADER_STORAGE_READ_BIT_KHR; |
| static const auto kShaderWriteExpandBits = VK_ACCESS_2_SHADER_STORAGE_WRITE_BIT_KHR; |
| |
| VkAccessFlags2KHR ExpandAccessFlags(VkAccessFlags2KHR access_mask) { |
| VkAccessFlags2KHR expanded = access_mask; |
| |
| if (VK_ACCESS_2_SHADER_READ_BIT_KHR & access_mask) { |
| expanded = expanded & ~VK_ACCESS_2_SHADER_READ_BIT_KHR; |
| expanded |= kShaderReadExpandBits; |
| } |
| |
| if (VK_ACCESS_2_SHADER_WRITE_BIT_KHR & access_mask) { |
| expanded = expanded & ~VK_ACCESS_2_SHADER_WRITE_BIT_KHR; |
| expanded |= kShaderWriteExpandBits; |
| } |
| |
| return expanded; |
| } |
| |
| VkAccessFlags2KHR CompatibleAccessMask(VkPipelineStageFlags2KHR stage_mask) { |
| VkAccessFlags2KHR result = 0; |
| stage_mask = ExpandPipelineStages(stage_mask); |
| for (size_t i = 0; i < kNumPipelineStageBits; i++) { |
| VkPipelineStageFlags2KHR bit = 1ULL << i; |
| if (stage_mask & bit) { |
| auto access_rec = syncDirectStageToAccessMask.find(bit); |
| if (access_rec != syncDirectStageToAccessMask.end()) { |
| result |= access_rec->second; |
| continue; |
| } |
| } |
| } |
| |
| // put the meta-access bits back on |
| if (result & kShaderReadExpandBits) { |
| result |= VK_ACCESS_2_SHADER_READ_BIT_KHR; |
| } |
| |
| if (result & kShaderWriteExpandBits) { |
| result |= VK_ACCESS_2_SHADER_WRITE_BIT_KHR; |
| } |
| |
| return result; |
| } |
| |
| VkPipelineStageFlags2KHR RelatedPipelineStages(VkPipelineStageFlags2KHR stage_mask, |
| const std::map<VkPipelineStageFlags2KHR, VkPipelineStageFlags2KHR> &map) { |
| VkPipelineStageFlags2KHR unscanned = stage_mask; |
| VkPipelineStageFlags2KHR related = 0; |
| for (const auto &entry : map) { |
| const auto &stage = entry.first; |
| if (stage & unscanned) { |
| related = related | entry.second; |
| unscanned = unscanned & ~stage; |
| if (!unscanned) break; |
| } |
| } |
| return related; |
| } |
| |
| VkPipelineStageFlags2KHR WithEarlierPipelineStages(VkPipelineStageFlags2KHR stage_mask) { |
| return stage_mask | RelatedPipelineStages(stage_mask, syncLogicallyEarlierStages); |
| } |
| |
| VkPipelineStageFlags2KHR WithLaterPipelineStages(VkPipelineStageFlags2KHR stage_mask) { |
| return stage_mask | RelatedPipelineStages(stage_mask, syncLogicallyLaterStages); |
| } |
| |
| int GetGraphicsPipelineStageLogicalOrdinal(VkPipelineStageFlags2KHR flag) { |
| const auto &rec = syncStageOrder.find(flag); |
| if (rec == syncStageOrder.end()) { |
| return -1; |
| } |
| return rec->second; |
| } |
| |
| // The following two functions technically have O(N^2) complexity, but it's for a value of O that's largely |
| // stable and also rather tiny - this could definitely be rejigged to work more efficiently, but the impact |
| // on runtime is currently negligible, so it wouldn't gain very much. |
| // If we add a lot more graphics pipeline stages, this set of functions should be rewritten to accomodate. |
| VkPipelineStageFlags2KHR GetLogicallyEarliestGraphicsPipelineStage(VkPipelineStageFlags2KHR inflags) { |
| VkPipelineStageFlags2KHR earliest_bit = VK_PIPELINE_STAGE_BOTTOM_OF_PIPE_BIT; |
| int earliest_bit_order = GetGraphicsPipelineStageLogicalOrdinal(earliest_bit); |
| |
| inflags = ExpandPipelineStages(inflags); |
| for (std::size_t i = 0; i < kNumPipelineStageBits; ++i) { |
| VkPipelineStageFlags2KHR current_flag = (inflags & 0x1ull) << i; |
| if (current_flag) { |
| int new_order = GetGraphicsPipelineStageLogicalOrdinal(current_flag); |
| if (new_order != -1 && new_order < earliest_bit_order) { |
| earliest_bit_order = new_order; |
| earliest_bit = current_flag; |
| } |
| } |
| inflags = inflags >> 1; |
| } |
| return earliest_bit; |
| } |
| |
| VkPipelineStageFlags2KHR GetLogicallyLatestGraphicsPipelineStage(VkPipelineStageFlags2KHR inflags) { |
| VkPipelineStageFlags2KHR latest_bit = VK_PIPELINE_STAGE_TOP_OF_PIPE_BIT; |
| int latest_bit_order = GetGraphicsPipelineStageLogicalOrdinal(latest_bit); |
| |
| inflags = ExpandPipelineStages(inflags); |
| for (std::size_t i = 0; i < kNumPipelineStageBits; ++i) { |
| VkPipelineStageFlags2KHR current_flag = (inflags & 0x1ull) << i; |
| if (current_flag) { |
| int new_order = GetGraphicsPipelineStageLogicalOrdinal(current_flag); |
| if (new_order != -1 && new_order > latest_bit_order) { |
| latest_bit_order = new_order; |
| latest_bit = current_flag; |
| } |
| } |
| inflags = inflags >> 1; |
| } |
| return latest_bit; |
| } |
| |
| // helper to extract the union of the stage masks in all of the barriers |
| ExecScopes GetGlobalStageMasks(const VkDependencyInfoKHR &dep_info) { |
| ExecScopes result{}; |
| for (uint32_t i = 0; i < dep_info.memoryBarrierCount; i++) { |
| result.src |= dep_info.pMemoryBarriers[i].srcStageMask; |
| result.dst |= dep_info.pMemoryBarriers[i].dstStageMask; |
| } |
| for (uint32_t i = 0; i < dep_info.bufferMemoryBarrierCount; i++) { |
| result.src |= dep_info.pBufferMemoryBarriers[i].srcStageMask; |
| result.dst |= dep_info.pBufferMemoryBarriers[i].dstStageMask; |
| } |
| for (uint32_t i = 0; i < dep_info.imageMemoryBarrierCount; i++) { |
| result.src |= dep_info.pImageMemoryBarriers[i].srcStageMask; |
| result.dst |= dep_info.pImageMemoryBarriers[i].dstStageMask; |
| } |
| return result; |
| } |
| |
| // Helpers to try to print the shortest string description of masks. |
| // If the bitmask doesn't use a synchronization2 specific flag, we'll |
| // print the old strings. There are common code paths where we need |
| // to print masks as strings and this makes the output less confusing |
| // for people not using synchronization2. |
| std::string StringPipelineStageFlags(VkPipelineStageFlags2KHR mask) { |
| if (mask <= UINT32_MAX) { |
| return string_VkPipelineStageFlags(mask & UINT32_MAX); |
| } |
| return string_VkPipelineStageFlags2KHR(mask); |
| } |
| |
| std::string StringAccessFlags(VkAccessFlags2KHR mask) { |
| if (mask <= UINT32_MAX) { |
| return string_VkAccessFlags(mask & UINT32_MAX); |
| } |
| return string_VkAccessFlags2KHR(mask); |
| } |
| |
| } // namespace sync_utils |