blob: b53bb02de817bb57bb39ff4ff24ca387e02f4418 [file] [log] [blame]
/*
* Copyright 2020 Advanced Micro Devices, Inc.
* Copyright 2020 Valve Corporation
* All Rights Reserved.
*
* Permission is hereby granted, free of charge, to any person obtaining a
* copy of this software and associated documentation files (the "Software"),
* to deal in the Software without restriction, including without limitation
* on the rights to use, copy, modify, merge, publish, distribute, sub
* license, and/or sell copies of the Software, and to permit persons to whom
* the Software is furnished to do so, subject to the following conditions:
*
* The above copyright notice and this permission notice (including the next
* paragraph) shall be included in all copies or substantial portions of the
* Software.
*
* THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
* IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
* FITNESS FOR A PARTICULAR PURPOSE AND NON-INFRINGEMENT. IN NO EVENT SHALL
* THE AUTHOR(S) AND/OR THEIR SUPPLIERS BE LIABLE FOR ANY CLAIM,
* DAMAGES OR OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR
* OTHERWISE, ARISING FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE
* USE OR OTHER DEALINGS IN THE SOFTWARE.
*/
#ifndef AC_RGP_H
#define AC_RGP_H
#include <stddef.h>
#include <stdint.h>
#include <stdio.h>
#include "compiler/shader_enums.h"
#include "util/list.h"
#include "util/simple_mtx.h"
/*
 * Forward declarations of types defined elsewhere. This header never uses
 * them by value, so their layout is not needed here.
 */
struct radeon_info;
struct ac_thread_trace;
struct ac_thread_trace_data;
struct ac_spm_trace_data;
/*
 * Hardware shader stage identifiers.
 *
 * The values are contiguous and start at 0, so RGP_HW_STAGE_MAX doubles as
 * the number of stages. Any new stage has to be inserted before it.
 */
enum rgp_hardware_stages {
   RGP_HW_STAGE_VS = 0,
   RGP_HW_STAGE_LS = 1,
   RGP_HW_STAGE_HS = 2,
   RGP_HW_STAGE_ES = 3,
   RGP_HW_STAGE_GS = 4,
   RGP_HW_STAGE_PS = 5,
   RGP_HW_STAGE_CS = 6,
   RGP_HW_STAGE_MAX, /* one past the last stage */
};
/*
 * Per-shader description stored inside a code object record.
 *
 * NOTE(review): the field notes below are inferred from the field names and
 * types only; confirm them against the code that fills this structure.
 */
struct rgp_shader_data {
   uint64_t hash[2];             /* 128 bits kept as two 64-bit words */
   uint32_t code_size;           /* presumably the size of `code` -- TODO confirm unit */
   uint8_t *code;
   uint32_t vgpr_count;
   uint32_t sgpr_count;
   uint32_t scratch_memory_size;
   uint32_t wavefront_size;
   uint64_t base_address;
   uint32_t elf_symbol_offset;
   uint32_t hw_stage;            /* presumably an enum rgp_hardware_stages value -- TODO confirm */
   uint32_t is_combined;         /* presumably a flag stored as 32 bits -- TODO confirm */
};
/*
 * One code object entry: a stage mask, one rgp_shader_data slot per
 * MESA_VULKAN_SHADER_STAGES index, and a 128-bit pipeline hash.
 *
 * NOTE(review): `list` is presumably the link into the `record` list of
 * struct rgp_code_object -- confirm with the code that adds records.
 */
struct rgp_code_object_record {
   uint32_t shader_stages_mask;
   struct rgp_shader_data shader_data[MESA_VULKAN_SHADER_STAGES];
   uint32_t num_shaders_combined; /* combined shaders are counted once */
   uint64_t pipeline_hash[2];
   struct list_head list;
};
/*
 * Container for code object records: a record counter, a list head and a
 * mutex.
 *
 * NOTE(review): `lock` presumably guards `record` and `record_count`, and
 * `record` presumably chains struct rgp_code_object_record entries --
 * confirm with the users of this structure.
 */
struct rgp_code_object {
   uint32_t record_count;
   struct list_head record;
   simple_mtx_t lock;
};
/* Kinds of code object loader events. */
enum rgp_loader_event_type {
   RGP_LOAD_TO_GPU_MEMORY = 0,
   RGP_UNLOAD_FROM_GPU_MEMORY = 1,
};
/*
 * One loader event entry.
 *
 * NOTE(review): `loader_event_type` presumably holds an
 * enum rgp_loader_event_type value, and `list` presumably links the entry
 * into struct rgp_loader_events -- confirm with the code that fills it.
 */
struct rgp_loader_events_record {
   uint32_t loader_event_type;
   uint32_t reserved;
   uint64_t base_address;
   uint64_t code_object_hash[2]; /* 128 bits kept as two 64-bit words */
   uint64_t time_stamp;
   struct list_head list;
};
/*
 * Container for loader event records: a record counter, a list head and a
 * mutex.
 *
 * NOTE(review): `lock` presumably guards `record` and `record_count`, and
 * `record` presumably chains struct rgp_loader_events_record entries --
 * confirm with the users of this structure.
 */
struct rgp_loader_events {
   uint32_t record_count;
   struct list_head record;
   simple_mtx_t lock;
};
/*
 * One PSO correlation entry: a 64-bit API PSO hash, a 128-bit pipeline hash
 * and a fixed 64-byte name buffer.
 *
 * NOTE(review): whether `api_level_obj_name` is always NUL-terminated is not
 * visible here -- confirm with the code that fills it. `list` presumably
 * links the entry into struct rgp_pso_correlation.
 */
struct rgp_pso_correlation_record {
   uint64_t api_pso_hash;
   uint64_t pipeline_hash[2];
   char api_level_obj_name[64];
   struct list_head list;
};
/*
 * Container for PSO correlation records: a record counter, a list head and a
 * mutex.
 *
 * NOTE(review): `lock` presumably guards `record` and `record_count`, and
 * `record` presumably chains struct rgp_pso_correlation_record entries --
 * confirm with the users of this structure.
 */
struct rgp_pso_correlation {
   uint32_t record_count;
   struct list_head record;
   simple_mtx_t lock;
};
/* Queue type identifiers; every value is spelled out explicitly. */
enum sqtt_queue_type {
   SQTT_QUEUE_TYPE_UNKNOWN = 0,
   SQTT_QUEUE_TYPE_UNIVERSAL = 1,
   SQTT_QUEUE_TYPE_COMPUTE = 2,
   SQTT_QUEUE_TYPE_DMA = 3,
};
/*
 * Engine type identifiers; every value is spelled out explicitly.
 *
 * The numbering is not contiguous: 5 and 6 have no enumerator here.
 */
enum sqtt_engine_type {
   SQTT_ENGINE_TYPE_UNKNOWN = 0,
   SQTT_ENGINE_TYPE_UNIVERSAL = 1,
   SQTT_ENGINE_TYPE_COMPUTE = 2,
   SQTT_ENGINE_TYPE_EXCLUSIVE_COMPUTE = 3,
   SQTT_ENGINE_TYPE_DMA = 4,
   SQTT_ENGINE_TYPE_HIGH_PRIORITY_UNIVERSAL = 7,
   SQTT_ENGINE_TYPE_HIGH_PRIORITY_GRAPHICS = 8,
};
/*
 * Queue and engine description packed into 32 bits.
 *
 * The anonymous union exposes the same storage either as three bit-fields
 * (8 + 8 + 16 bits) or as the raw 32-bit `value`.
 *
 * `queue_type` and `engine_type` take values from enum sqtt_queue_type and
 * enum sqtt_engine_type. They are declared as uint32_t rather than as the
 * enum types because an enum-typed bit-field is only an implementation-defined
 * extension in ISO C (C11 6.7.2.1p5), and its signedness and packing can
 * differ between compilers. Using the same unsigned base type for all three
 * fields keeps them unsigned and lets them share one storage unit.
 */
struct sqtt_queue_hardware_info {
   union {
      struct {
         uint32_t queue_type : 8;  /* an enum sqtt_queue_type value */
         uint32_t engine_type : 8; /* an enum sqtt_engine_type value */
         uint32_t reserved : 16;
      };
      uint32_t value;
   };
};
/*
 * One queue description entry: two 64-bit identifiers plus the packed
 * queue/engine type word.
 *
 * NOTE(review): `list` is presumably the link into struct rgp_queue_info --
 * confirm with the code that adds records.
 */
struct rgp_queue_info_record {
   uint64_t queue_id;
   uint64_t queue_context;
   struct sqtt_queue_hardware_info hardware_info;
   uint32_t reserved;
   struct list_head list;
};
/*
 * Container for queue info records: a record counter, a list head and a
 * mutex.
 *
 * NOTE(review): `lock` presumably guards `record` and `record_count`, and
 * `record` presumably chains struct rgp_queue_info_record entries --
 * confirm with the users of this structure.
 */
struct rgp_queue_info {
   uint32_t record_count;
   struct list_head record;
   simple_mtx_t lock;
};
/* Kinds of queue timing events; values are contiguous starting at 0. */
enum sqtt_queue_event_type {
   SQTT_QUEUE_TIMING_EVENT_CMDBUF_SUBMIT = 0,
   SQTT_QUEUE_TIMING_EVENT_SIGNAL_SEMAPHORE = 1,
   SQTT_QUEUE_TIMING_EVENT_WAIT_SEMAPHORE = 2,
   SQTT_QUEUE_TIMING_EVENT_PRESENT = 3,
};
/*
 * One queue timing event entry.
 *
 * NOTE(review): `queue_info_index` presumably indexes the queue info records
 * and `list` presumably links the entry into struct rgp_queue_event; the
 * meaning of the two `gpu_timestamps` slots is not visible here -- confirm
 * with the code that fills this structure.
 */
struct rgp_queue_event_record {
   enum sqtt_queue_event_type event_type;
   uint32_t sqtt_cb_id;
   uint64_t frame_index;
   uint32_t queue_info_index;
   uint32_t submit_sub_index;
   uint64_t api_id;
   uint64_t cpu_timestamp;
   uint64_t gpu_timestamps[2];
   struct list_head list;
};
/*
 * Container for queue event records: a record counter, a list head and a
 * mutex.
 *
 * NOTE(review): `lock` presumably guards `record` and `record_count`, and
 * `record` presumably chains struct rgp_queue_event_record entries --
 * confirm with the users of this structure.
 */
struct rgp_queue_event {
   uint32_t record_count;
   struct list_head record;
   simple_mtx_t lock;
};
/*
 * One clock calibration entry pairing a CPU timestamp with a GPU timestamp.
 *
 * NOTE(review): the units of both timestamps are not visible here, and
 * `list` is presumably the link into struct rgp_clock_calibration --
 * confirm with the code that fills this structure.
 */
struct rgp_clock_calibration_record {
   uint64_t cpu_timestamp;
   uint64_t gpu_timestamp;
   struct list_head list;
};
/*
 * Container for clock calibration records: a record counter, a list head and
 * a mutex.
 *
 * NOTE(review): `lock` presumably guards `record` and `record_count`, and
 * `record` presumably chains struct rgp_clock_calibration_record entries --
 * confirm with the users of this structure.
 */
struct rgp_clock_calibration {
   uint32_t record_count;
   struct list_head record;
   simple_mtx_t lock;
};
/*
 * Declared here, defined elsewhere.
 *
 * NOTE(review): judging by the name, this dumps an RGP capture built from
 * the given thread trace and SPM trace data. The meaning of the int result
 * and whether any argument may be NULL are not visible in this header --
 * confirm against the definition.
 */
int ac_dump_rgp_capture(struct radeon_info *info,
                        struct ac_thread_trace *thread_trace,
                        const struct ac_spm_trace_data *spm_trace);
/*
 * Declared here, defined elsewhere. The FILE type must be visible (from
 * <stdio.h>) before this declaration.
 *
 * NOTE(review): judging by the name and parameters, this writes an ELF
 * object for `record` to `output` and reports a size through
 * `written_size`. The meaning of `file_elf_start` and `flags` is not visible
 * in this header -- confirm against the definition.
 */
void ac_rgp_file_write_elf_object(FILE *output, size_t file_elf_start,
                                  struct rgp_code_object_record *record,
                                  uint32_t *written_size, uint32_t flags);
#endif