mirror of
https://gitlab.freedesktop.org/mesa/mesa.git
synced 2026-05-01 08:08:06 +02:00
GPU timestamps are emitted by the GPU to a BO with CPU-access which means the driver needs to read them back when the submission is done. Fix this by passing a pointer to that BO, like some other records. Signed-off-by: Samuel Pitoiset <samuel.pitoiset@gmail.com> Part-of: <https://gitlab.freedesktop.org/mesa/mesa/-/merge_requests/22779>
186 lines
4.1 KiB
C
186 lines
4.1 KiB
C
/*
 * Copyright 2020 Advanced Micro Devices, Inc.
 * Copyright 2020 Valve Corporation
 *
 * SPDX-License-Identifier: MIT
 */

#ifndef AC_RGP_H
#define AC_RGP_H

#include <stdbool.h>
#include <stddef.h>
#include <stdint.h>
#include <stdio.h>

#include "compiler/shader_enums.h"
#include "util/list.h"
#include "util/simple_mtx.h"

/*
 * Forward declarations of types defined outside this header.
 * In the visible part of this header they are only referenced through
 * pointers in function prototypes (struct ac_sqtt is not referenced at all).
 */
struct radeon_info;
struct ac_sqtt_trace;
struct ac_sqtt;
struct ac_spm_trace;

/*
 * Hardware stage identifiers, numbered consecutively starting at 0.
 * RGP_HW_STAGE_MAX is not a stage of its own: it follows the last entry and
 * therefore equals the number of stages listed here.
 */
enum rgp_hardware_stages {
   RGP_HW_STAGE_VS = 0,
   RGP_HW_STAGE_LS,
   RGP_HW_STAGE_HS,
   RGP_HW_STAGE_ES,
   RGP_HW_STAGE_GS,
   RGP_HW_STAGE_PS,
   RGP_HW_STAGE_CS,
   RGP_HW_STAGE_MAX,
};

/*
 * Per-shader information. struct rgp_code_object_record embeds an array of
 * these, one slot per MESA_VULKAN_SHADER_STAGES entry.
 */
struct rgp_shader_data {
   uint64_t hash[2];        /* two 64-bit hash words */
   uint32_t code_size;      /* NOTE(review): presumably the byte length of `code` - confirm */
   uint8_t *code;
   uint32_t vgpr_count;
   uint32_t sgpr_count;
   uint32_t scratch_memory_size;
   uint32_t lds_size;
   uint32_t wavefront_size;
   uint64_t base_address;
   uint32_t elf_symbol_offset;
   uint32_t hw_stage;       /* NOTE(review): presumably an enum rgp_hardware_stages value - confirm */
   uint32_t is_combined;
   char rt_shader_name[32]; /* fixed 32-byte name buffer */
   uint32_t rt_stack_size;
};

struct rgp_code_object_record {
|
|
uint32_t shader_stages_mask;
|
|
struct rgp_shader_data shader_data[MESA_VULKAN_SHADER_STAGES];
|
|
uint32_t num_shaders_combined; /* count combined shaders as one count */
|
|
uint64_t pipeline_hash[2];
|
|
|
|
bool is_rt;
|
|
struct list_head list;
|
|
};
|
|
|
|
struct rgp_code_object {
|
|
uint32_t record_count;
|
|
struct list_head record;
|
|
simple_mtx_t lock;
|
|
};
|
|
|
|
/* Loader event kinds: load (0) and unload (1) of GPU memory. */
enum rgp_loader_event_type {
   RGP_LOAD_TO_GPU_MEMORY = 0,
   RGP_UNLOAD_FROM_GPU_MEMORY,
};

struct rgp_loader_events_record {
|
|
uint32_t loader_event_type;
|
|
uint32_t reserved;
|
|
uint64_t base_address;
|
|
uint64_t code_object_hash[2];
|
|
uint64_t time_stamp;
|
|
struct list_head list;
|
|
};
|
|
|
|
struct rgp_loader_events {
|
|
uint32_t record_count;
|
|
struct list_head record;
|
|
simple_mtx_t lock;
|
|
};
|
|
|
|
struct rgp_pso_correlation_record {
|
|
uint64_t api_pso_hash;
|
|
uint64_t pipeline_hash[2];
|
|
char api_level_obj_name[64];
|
|
struct list_head list;
|
|
};
|
|
|
|
struct rgp_pso_correlation {
|
|
uint32_t record_count;
|
|
struct list_head record;
|
|
simple_mtx_t lock;
|
|
};
|
|
|
|
/*
 * Queue type identifiers with explicitly assigned values 0x0..0x3.
 * Used as the type of the 8-bit `queue_type` bit-field in
 * struct sqtt_queue_hardware_info.
 */
enum sqtt_queue_type {
   SQTT_QUEUE_TYPE_UNKNOWN = 0x0,
   SQTT_QUEUE_TYPE_UNIVERSAL = 0x1,
   SQTT_QUEUE_TYPE_COMPUTE = 0x2,
   SQTT_QUEUE_TYPE_DMA = 0x3,
};

/*
 * Engine type identifiers with explicitly assigned values.
 * The numbering is not contiguous: 0x5 and 0x6 are not assigned here.
 * Used as the type of the 8-bit `engine_type` bit-field in
 * struct sqtt_queue_hardware_info.
 */
enum sqtt_engine_type {
   SQTT_ENGINE_TYPE_UNKNOWN = 0x0,
   SQTT_ENGINE_TYPE_UNIVERSAL = 0x1,
   SQTT_ENGINE_TYPE_COMPUTE = 0x2,
   SQTT_ENGINE_TYPE_EXCLUSIVE_COMPUTE = 0x3,
   SQTT_ENGINE_TYPE_DMA = 0x4,
   SQTT_ENGINE_TYPE_HIGH_PRIORITY_UNIVERSAL = 0x7,
   SQTT_ENGINE_TYPE_HIGH_PRIORITY_GRAPHICS = 0x8,
};

struct sqtt_queue_hardware_info {
|
|
union {
|
|
struct {
|
|
enum sqtt_queue_type queue_type : 8;
|
|
enum sqtt_engine_type engine_type : 8;
|
|
uint32_t reserved : 16;
|
|
};
|
|
uint32_t value;
|
|
};
|
|
};
|
|
|
|
struct rgp_queue_info_record {
|
|
uint64_t queue_id;
|
|
uint64_t queue_context;
|
|
struct sqtt_queue_hardware_info hardware_info;
|
|
uint32_t reserved;
|
|
struct list_head list;
|
|
};
|
|
|
|
struct rgp_queue_info {
|
|
uint32_t record_count;
|
|
struct list_head record;
|
|
simple_mtx_t lock;
|
|
};
|
|
|
|
/*
 * Queue timing event kinds. No explicit values are given, so the
 * enumerators are numbered 0..3 in declaration order.
 */
enum sqtt_queue_event_type {
   SQTT_QUEUE_TIMING_EVENT_CMDBUF_SUBMIT,
   SQTT_QUEUE_TIMING_EVENT_SIGNAL_SEMAPHORE,
   SQTT_QUEUE_TIMING_EVENT_WAIT_SEMAPHORE,
   SQTT_QUEUE_TIMING_EVENT_PRESENT
};

struct rgp_queue_event_record {
|
|
enum sqtt_queue_event_type event_type;
|
|
uint32_t sqtt_cb_id;
|
|
uint64_t frame_index;
|
|
uint32_t queue_info_index;
|
|
uint32_t submit_sub_index;
|
|
uint64_t api_id;
|
|
uint64_t cpu_timestamp;
|
|
uint64_t *gpu_timestamps[2];
|
|
struct list_head list;
|
|
};
|
|
|
|
struct rgp_queue_event {
|
|
uint32_t record_count;
|
|
struct list_head record;
|
|
simple_mtx_t lock;
|
|
};
|
|
|
|
struct rgp_clock_calibration_record {
|
|
uint64_t cpu_timestamp;
|
|
uint64_t gpu_timestamp;
|
|
struct list_head list;
|
|
};
|
|
|
|
struct rgp_clock_calibration {
|
|
uint32_t record_count;
|
|
struct list_head record;
|
|
simple_mtx_t lock;
|
|
};
|
|
|
|
/*
 * Declaration only; the definition is not part of this header.
 *
 * info       - read-only device information
 * sqtt_trace - SQTT trace (passed non-const)
 * spm_trace  - read-only SPM trace
 *
 * NOTE(review): the meaning of the int return value is not visible here -
 * check the definition before relying on a particular convention.
 */
int ac_dump_rgp_capture(const struct radeon_info *info, struct ac_sqtt_trace *sqtt_trace,
                        const struct ac_spm_trace *spm_trace);

/*
 * Declaration only; the definition is not part of this header.
 *
 * output         - stdio stream
 * file_elf_start - NOTE(review): presumably the offset in `output` at which
 *                  the ELF object starts - confirm
 * record         - code object record
 * written_size   - NOTE(review): presumably an out-parameter receiving the
 *                  number of bytes written - confirm
 * flags          - 32-bit flags word; its meaning is not visible here
 */
void
ac_rgp_file_write_elf_object(FILE *output, size_t file_elf_start,
                             struct rgp_code_object_record *record,
                             uint32_t *written_size, uint32_t flags);

#endif /* AC_RGP_H */