| /* Copyright (c) 2018-2023 The Khronos Group Inc. |
| * Copyright (c) 2018-2023 Valve Corporation |
| * Copyright (c) 2018-2023 LunarG, Inc. |
| * |
| * Licensed under the Apache License, Version 2.0 (the "License"); |
| * you may not use this file except in compliance with the License. |
| * You may obtain a copy of the License at |
| * |
| * http://www.apache.org/licenses/LICENSE-2.0 |
| * |
| * Unless required by applicable law or agreed to in writing, software |
| * distributed under the License is distributed on an "AS IS" BASIS, |
| * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. |
| * See the License for the specific language governing permissions and |
| * limitations under the License. |
| */ |
| |
| #pragma once |
| |
#include <utility>

#include "gpu_validation/gpu_utils.h"
#include "state_tracker/pipeline_state.h"
| |
| class GpuAssisted; |
| |
| struct GpuAssistedDeviceMemoryBlock { |
| VkBuffer buffer; |
| VmaAllocation allocation; |
| vvl::unordered_map<uint32_t, const cvdescriptorset::DescriptorBinding*> update_at_submit; |
| }; |
| |
| struct GpuAssistedPreDrawResources { |
| VkDescriptorPool desc_pool = VK_NULL_HANDLE; |
| VkDescriptorSet desc_set = VK_NULL_HANDLE; |
| VkBuffer buffer = VK_NULL_HANDLE; |
| VkDeviceSize offset = 0; |
| uint32_t stride = 0; |
| VkDeviceSize buf_size = 0; |
| static const uint32_t push_constant_words = 4; |
| }; |
| |
| struct GpuAssistedPreDispatchResources { |
| VkDescriptorPool desc_pool = VK_NULL_HANDLE; |
| VkDescriptorSet desc_set = VK_NULL_HANDLE; |
| VkBuffer buffer = VK_NULL_HANDLE; |
| VkDeviceSize offset = 0; |
| static const uint32_t push_constant_words = 4; |
| }; |
| |
| struct GpuAssistedBufferInfo { |
| GpuAssistedDeviceMemoryBlock output_mem_block; |
| GpuAssistedDeviceMemoryBlock bda_input_mem_block; // Buffer Device Address input |
| GpuAssistedPreDrawResources pre_draw_resources; |
| GpuAssistedPreDispatchResources pre_dispatch_resources; |
| VkDescriptorSet desc_set; |
| VkDescriptorPool desc_pool; |
| VkPipelineBindPoint pipeline_bind_point; |
| bool uses_robustness; |
| CMD_TYPE cmd_type; |
| GpuAssistedBufferInfo(GpuAssistedDeviceMemoryBlock output_mem_block, GpuAssistedDeviceMemoryBlock bda_input_mem_block, |
| GpuAssistedPreDrawResources pre_draw_resources, GpuAssistedPreDispatchResources pre_dispatch_resources, |
| VkDescriptorSet desc_set, VkDescriptorPool desc_pool, VkPipelineBindPoint pipeline_bind_point, |
| bool uses_robustness, CMD_TYPE cmd_type) |
| : output_mem_block(output_mem_block), |
| bda_input_mem_block(bda_input_mem_block), |
| pre_draw_resources(pre_draw_resources), |
| pre_dispatch_resources(pre_dispatch_resources), |
| desc_set(desc_set), |
| desc_pool(desc_pool), |
| pipeline_bind_point(pipeline_bind_point), |
| uses_robustness(uses_robustness), |
| cmd_type(cmd_type){}; |
| }; |
| |
| struct GpuVuid { |
| const char* uniform_access_oob = kVUIDUndefined; |
| const char* storage_access_oob = kVUIDUndefined; |
| const char* count_exceeds_bufsize_1 = kVUIDUndefined; |
| const char* count_exceeds_bufsize = kVUIDUndefined; |
| const char* count_exceeds_device_limit = kVUIDUndefined; |
| const char* first_instance_not_zero = kVUIDUndefined; |
| const char* group_exceeds_device_limit_x = kVUIDUndefined; |
| const char* group_exceeds_device_limit_y = kVUIDUndefined; |
| const char* group_exceeds_device_limit_z = kVUIDUndefined; |
| }; |
| |
| struct GpuAssistedAccelerationStructureBuildValidationBufferInfo { |
| // The acceleration structure that is being built. |
| VkAccelerationStructureNV acceleration_structure = VK_NULL_HANDLE; |
| |
| // The descriptor pool and descriptor set being used to validate a given build. |
| VkDescriptorPool descriptor_pool = VK_NULL_HANDLE; |
| VkDescriptorSet descriptor_set = VK_NULL_HANDLE; |
| |
| // The storage buffer used by the validating compute shader whichcontains info about |
| // the valid handles and which is written to communicate found invalid handles. |
| VkBuffer buffer = VK_NULL_HANDLE; |
| VmaAllocation buffer_allocation = VK_NULL_HANDLE; |
| }; |
| |
| struct GpuAssistedAccelerationStructureBuildValidationState { |
| // some resources can be used each time so only to need to create once |
| bool initialized = false; |
| |
| VkPipeline pipeline = VK_NULL_HANDLE; |
| VkPipelineLayout pipeline_layout = VK_NULL_HANDLE; |
| |
| VkAccelerationStructureNV replacement_as = VK_NULL_HANDLE; |
| VmaAllocation replacement_as_allocation = VK_NULL_HANDLE; |
| uint64_t replacement_as_handle = 0; |
| |
| void Destroy(VkDevice device, VmaAllocator& vmaAllocator); |
| }; |
| |
| struct GpuAssistedPreDrawValidationState { |
| // some resources can be used each time so only to need to create once |
| bool initialized = false; |
| |
| VkShaderModule shader_module = VK_NULL_HANDLE; |
| VkDescriptorSetLayout ds_layout = VK_NULL_HANDLE; |
| VkPipelineLayout pipeline_layout = VK_NULL_HANDLE; |
| vl_concurrent_unordered_map<VkRenderPass, VkPipeline> renderpass_to_pipeline; |
| |
| void Destroy(VkDevice device); |
| }; |
| |
| struct GpuAssistedPreDispatchValidationState { |
| // some resources can be used each time so only to need to create once |
| bool initialized = false; |
| |
| VkShaderModule shader_module = VK_NULL_HANDLE; |
| VkDescriptorSetLayout ds_layout = VK_NULL_HANDLE; |
| VkPipelineLayout pipeline_layout = VK_NULL_HANDLE; |
| VkPipeline pipeline = VK_NULL_HANDLE; |
| |
| void Destroy(VkDevice device); |
| }; |
| |
| // Used for draws/dispatch/traceRays indirect |
| struct GpuAssistedCmdIndirectState { |
| VkBuffer buffer; |
| VkDeviceSize offset; |
| uint32_t draw_count; |
| uint32_t stride; |
| VkBuffer count_buffer; |
| VkDeviceSize count_buffer_offset; |
| }; |
| |
| namespace gpuav_state { |
| class CommandBuffer : public gpu_utils_state::CommandBuffer { |
| public: |
| std::vector<GpuAssistedBufferInfo> per_draw_buffer_list; |
| std::vector<GpuAssistedDeviceMemoryBlock> di_input_buffer_list; |
| std::vector<GpuAssistedAccelerationStructureBuildValidationBufferInfo> as_validation_buffers; |
| VkBuffer current_input_buffer = VK_NULL_HANDLE; |
| |
| CommandBuffer(GpuAssisted* ga, VkCommandBuffer cb, const VkCommandBufferAllocateInfo* pCreateInfo, |
| const COMMAND_POOL_STATE* pool); |
| ~CommandBuffer(); |
| |
| bool NeedsProcessing() const final { return !per_draw_buffer_list.empty() || has_build_as_cmd; } |
| void Process(VkQueue queue) final; |
| |
| void Destroy() final; |
| void Reset() final; |
| |
| private: |
| void ResetCBState(); |
| void ProcessAccelerationStructure(VkQueue queue); |
| }; |
| } // namespace gpuav_state |
| |
| VALSTATETRACK_DERIVED_STATE_OBJECT(VkCommandBuffer, gpuav_state::CommandBuffer, CMD_BUFFER_STATE) |
| |
| class GpuAssisted : public GpuAssistedBase { |
| public: |
| GpuAssisted() { |
| setup_vuid = "UNASSIGNED-GPU-Assisted-Validation"; |
| container_type = LayerObjectTypeGpuAssisted; |
| desired_features.vertexPipelineStoresAndAtomics = true; |
| desired_features.fragmentStoresAndAtomics = true; |
| desired_features.shaderInt64 = true; |
| } |
| |
| bool CheckForDescriptorIndexing(DeviceFeatures enabled_features) const; |
| void CreateDevice(const VkDeviceCreateInfo* pCreateInfo) override; |
| void PreCallRecordDestroyDevice(VkDevice device, const VkAllocationCallbacks* pAllocator) override; |
| void PostCallRecordBindAccelerationStructureMemoryNV(VkDevice device, uint32_t bindInfoCount, |
| const VkBindAccelerationStructureMemoryInfoNV* pBindInfos, |
| VkResult result) override; |
| void PreCallRecordCreateBuffer(VkDevice device, const VkBufferCreateInfo* pCreateInfo, const VkAllocationCallbacks* pAllocator, |
| VkBuffer* pBuffer, void* cb_state_data) override; |
| void CreateAccelerationStructureBuildValidationState(); |
| void PreCallRecordCmdBuildAccelerationStructureNV(VkCommandBuffer commandBuffer, const VkAccelerationStructureInfoNV* pInfo, |
| VkBuffer instanceData, VkDeviceSize instanceOffset, VkBool32 update, |
| VkAccelerationStructureNV dst, VkAccelerationStructureNV src, |
| VkBuffer scratch, VkDeviceSize scratchOffset) override; |
| void PreCallRecordDestroyRenderPass(VkDevice device, VkRenderPass renderPass, const VkAllocationCallbacks* pAllocator) override; |
| bool InstrumentShader(const vvl::span<const uint32_t>& input, std::vector<uint32_t>& new_pgm, |
| uint32_t* unique_shader_id) override; |
| void PreCallRecordCreateShaderModule(VkDevice device, const VkShaderModuleCreateInfo* pCreateInfo, |
| const VkAllocationCallbacks* pAllocator, VkShaderModule* pShaderModule, |
| void* csm_state_data) override; |
| void AnalyzeAndGenerateMessages(VkCommandBuffer command_buffer, VkQueue queue, GpuAssistedBufferInfo& buffer_info, |
| uint32_t operation_index, uint32_t* const debug_output_buffer); |
| |
| void SetBindingState(uint32_t* data, uint32_t index, const cvdescriptorset::DescriptorBinding* binding); |
| void UpdateInstrumentationBuffer(gpuav_state::CommandBuffer* cb_node); |
| void PostCallRecordCmdBindDescriptorSets(VkCommandBuffer commandBuffer, VkPipelineBindPoint pipelineBindPoint, |
| VkPipelineLayout layout, uint32_t firstSet, uint32_t descriptorSetCount, |
| const VkDescriptorSet* pDescriptorSets, uint32_t dynamicOffsetCount, |
| const uint32_t* pDynamicOffsets) override; |
| void PreCallRecordQueueSubmit(VkQueue queue, uint32_t submitCount, const VkSubmitInfo* pSubmits, VkFence fence) override; |
| void PreCallRecordQueueSubmit2KHR(VkQueue queue, uint32_t submitCount, const VkSubmitInfo2KHR* pSubmits, |
| VkFence fence) override; |
| void PreCallRecordQueueSubmit2(VkQueue queue, uint32_t submitCount, const VkSubmitInfo2* pSubmits, VkFence fence) override; |
| void PreCallRecordCmdDraw(VkCommandBuffer commandBuffer, uint32_t vertexCount, uint32_t instanceCount, uint32_t firstVertex, |
| uint32_t firstInstance) override; |
| void PreCallRecordCmdDrawMultiEXT(VkCommandBuffer commandBuffer, uint32_t drawCount, const VkMultiDrawInfoEXT* pVertexInfo, |
| uint32_t instanceCount, uint32_t firstInstance, uint32_t stride) override; |
| void PreCallRecordCmdDrawIndexed(VkCommandBuffer commandBuffer, uint32_t indexCount, uint32_t instanceCount, |
| uint32_t firstIndex, int32_t vertexOffset, uint32_t firstInstance) override; |
| void PreCallRecordCmdDrawMultiIndexedEXT(VkCommandBuffer commandBuffer, uint32_t drawCount, |
| const VkMultiDrawIndexedInfoEXT* pIndexInfo, uint32_t instanceCount, |
| uint32_t firstInstance, uint32_t stride, const int32_t* pVertexOffset) override; |
| void PreCallRecordCmdDrawIndirect(VkCommandBuffer commandBuffer, VkBuffer buffer, VkDeviceSize offset, uint32_t count, |
| uint32_t stride) override; |
| void PreCallRecordCmdDrawIndexedIndirect(VkCommandBuffer commandBuffer, VkBuffer buffer, VkDeviceSize offset, uint32_t count, |
| uint32_t stride) override; |
| void PreCallRecordCmdDrawIndirectCountKHR(VkCommandBuffer commandBuffer, VkBuffer buffer, VkDeviceSize offset, |
| VkBuffer countBuffer, VkDeviceSize countBufferOffset, uint32_t maxDrawCount, |
| uint32_t stride) override; |
| void PreCallRecordCmdDrawIndirectCount(VkCommandBuffer commandBuffer, VkBuffer buffer, VkDeviceSize offset, |
| VkBuffer countBuffer, VkDeviceSize countBufferOffset, uint32_t maxDrawCount, |
| uint32_t stride) override; |
| void PreCallRecordCmdDrawIndirectByteCountEXT(VkCommandBuffer commandBuffer, uint32_t instanceCount, uint32_t firstInstance, |
| VkBuffer counterBuffer, VkDeviceSize counterBufferOffset, uint32_t counterOffset, |
| uint32_t vertexStride) override; |
| void PreCallRecordCmdDrawIndexedIndirectCountKHR(VkCommandBuffer commandBuffer, VkBuffer buffer, VkDeviceSize offset, |
| VkBuffer countBuffer, VkDeviceSize countBufferOffset, uint32_t maxDrawCount, |
| uint32_t stride) override; |
| void PreCallRecordCmdDrawIndexedIndirectCount(VkCommandBuffer commandBuffer, VkBuffer buffer, VkDeviceSize offset, |
| VkBuffer countBuffer, VkDeviceSize countBufferOffset, uint32_t maxDrawCount, |
| uint32_t stride) override; |
| void PreCallRecordCmdDrawMeshTasksNV(VkCommandBuffer commandBuffer, uint32_t taskCount, uint32_t firstTask) override; |
| void PreCallRecordCmdDrawMeshTasksIndirectNV(VkCommandBuffer commandBuffer, VkBuffer buffer, VkDeviceSize offset, |
| uint32_t drawCount, uint32_t stride) override; |
| void PreCallRecordCmdDrawMeshTasksIndirectCountNV(VkCommandBuffer commandBuffer, VkBuffer buffer, VkDeviceSize offset, |
| VkBuffer countBuffer, VkDeviceSize countBufferOffset, uint32_t maxDrawCount, |
| uint32_t stride) override; |
| void PreCallRecordCmdDrawMeshTasksEXT(VkCommandBuffer commandBuffer, uint32_t groupCountX, uint32_t groupCountY, |
| uint32_t groupCountZ) override; |
| void PreCallRecordCmdDrawMeshTasksIndirectEXT(VkCommandBuffer commandBuffer, VkBuffer buffer, VkDeviceSize offset, |
| uint32_t drawCount, uint32_t stride) override; |
| void PreCallRecordCmdDrawMeshTasksIndirectCountEXT(VkCommandBuffer commandBuffer, VkBuffer buffer, VkDeviceSize offset, |
| VkBuffer countBuffer, VkDeviceSize countBufferOffset, uint32_t maxDrawCount, |
| uint32_t stride) override; |
| void PreCallRecordCmdDispatch(VkCommandBuffer commandBuffer, uint32_t x, uint32_t y, uint32_t z) override; |
| void PreCallRecordCmdDispatchIndirect(VkCommandBuffer commandBuffer, VkBuffer buffer, VkDeviceSize offset) override; |
| void PreCallRecordCmdDispatchBase(VkCommandBuffer commandBuffer, uint32_t baseGroupX, uint32_t baseGroupY, uint32_t baseGroupZ, |
| uint32_t groupCountX, uint32_t groupCountY, uint32_t groupCountZ) override; |
| void PreCallRecordCmdDispatchBaseKHR(VkCommandBuffer commandBuffer, uint32_t baseGroupX, uint32_t baseGroupY, |
| uint32_t baseGroupZ, uint32_t groupCountX, uint32_t groupCountY, |
| uint32_t groupCountZ) override; |
| void PreCallRecordCmdTraceRaysNV(VkCommandBuffer commandBuffer, VkBuffer raygenShaderBindingTableBuffer, |
| VkDeviceSize raygenShaderBindingOffset, VkBuffer missShaderBindingTableBuffer, |
| VkDeviceSize missShaderBindingOffset, VkDeviceSize missShaderBindingStride, |
| VkBuffer hitShaderBindingTableBuffer, VkDeviceSize hitShaderBindingOffset, |
| VkDeviceSize hitShaderBindingStride, VkBuffer callableShaderBindingTableBuffer, |
| VkDeviceSize callableShaderBindingOffset, VkDeviceSize callableShaderBindingStride, |
| uint32_t width, uint32_t height, uint32_t depth) override; |
| void PreCallRecordCmdTraceRaysKHR(VkCommandBuffer commandBuffer, |
| const VkStridedDeviceAddressRegionKHR* pRaygenShaderBindingTable, |
| const VkStridedDeviceAddressRegionKHR* pMissShaderBindingTable, |
| const VkStridedDeviceAddressRegionKHR* pHitShaderBindingTable, |
| const VkStridedDeviceAddressRegionKHR* pCallableShaderBindingTable, uint32_t width, |
| uint32_t height, uint32_t depth) override; |
| void PreCallRecordCmdTraceRaysIndirectKHR(VkCommandBuffer commandBuffer, |
| const VkStridedDeviceAddressRegionKHR* pRaygenShaderBindingTable, |
| const VkStridedDeviceAddressRegionKHR* pMissShaderBindingTable, |
| const VkStridedDeviceAddressRegionKHR* pHitShaderBindingTable, |
| const VkStridedDeviceAddressRegionKHR* pCallableShaderBindingTable, |
| VkDeviceAddress indirectDeviceAddress) override; |
| void PreCallRecordCmdTraceRaysIndirect2KHR(VkCommandBuffer commandBuffer, VkDeviceAddress indirectDeviceAddress) override; |
| void AllocateValidationResources(const VkCommandBuffer cmd_buffer, const VkPipelineBindPoint bind_point, CMD_TYPE cmd, |
| const GpuAssistedCmdIndirectState* indirect_state = nullptr); |
| void AllocatePreDrawValidationResources(const GpuAssistedDeviceMemoryBlock& output_block, |
| GpuAssistedPreDrawResources& resources, const VkRenderPass render_pass, |
| VkPipeline* pPipeline, const GpuAssistedCmdIndirectState* indirect_state); |
| void AllocatePreDispatchValidationResources(const GpuAssistedDeviceMemoryBlock& output_block, |
| GpuAssistedPreDispatchResources& resources, |
| const GpuAssistedCmdIndirectState* indirect_state); |
| void PostCallRecordGetPhysicalDeviceProperties(VkPhysicalDevice physicalDevice, |
| VkPhysicalDeviceProperties* pPhysicalDeviceProperties) override; |
| void PostCallRecordGetPhysicalDeviceProperties2(VkPhysicalDevice physicalDevice, |
| VkPhysicalDeviceProperties2* pPhysicalDeviceProperties2) override; |
| |
| std::shared_ptr<CMD_BUFFER_STATE> CreateCmdBufferState(VkCommandBuffer cb, const VkCommandBufferAllocateInfo* create_info, |
| const COMMAND_POOL_STATE* pool) final; |
| |
| void DestroyBuffer(GpuAssistedBufferInfo& buffer_info); |
| void DestroyBuffer(GpuAssistedAccelerationStructureBuildValidationBufferInfo& buffer_info); |
| |
| private: |
| void PreRecordCommandBuffer(VkCommandBuffer command_buffer); |
| VkPipeline GetValidationPipeline(VkRenderPass render_pass); |
| |
| VkBool32 shaderInt64; |
| bool buffer_oob_enabled; |
| bool validate_draw_indirect; |
| bool validate_dispatch_indirect; |
| bool warn_on_robust_oob; |
| bool validate_instrumented_shaders; |
| GpuAssistedAccelerationStructureBuildValidationState acceleration_structure_validation_state; |
| GpuAssistedPreDrawValidationState pre_draw_validation_state; |
| GpuAssistedPreDispatchValidationState pre_dispatch_validation_state; |
| |
| bool descriptor_indexing = false; |
| bool buffer_device_address; |
| }; |