It needs to be resized instead, like the SQTT BO. Signed-off-by: Samuel Pitoiset <samuel.pitoiset@gmail.com> Part-of: <https://gitlab.freedesktop.org/mesa/mesa/-/merge_requests/31883>
201 lines
4.6 KiB
C
201 lines
4.6 KiB
C
/*
|
|
* Copyright 2021 Valve Corporation
|
|
*
|
|
* SPDX-License-Identifier: MIT
|
|
*/
|
|
|
|
#ifndef AC_SPM_H
|
|
#define AC_SPM_H
|
|
|
|
#include <stdint.h>
|
|
|
|
#include "ac_perfcounter.h"
|
|
|
|
/* SPM sizing constants. */

/* Capacity of the per-instance counter select array (ac_spm_block_instance). */
#define AC_SPM_MAX_COUNTER_PER_BLOCK 16
#define AC_SPM_GLOBAL_TIMESTAMP_COUNTERS 4 /* in unit of 16-bit counters */
#define AC_SPM_NUM_COUNTER_PER_MUXSEL 16 /* 16 16-bit counters per muxsel */
/* (16 counters * 2 bytes each) / 4 bytes per dword = 8 dwords per line. */
#define AC_SPM_MUXSEL_LINE_SIZE ((AC_SPM_NUM_COUNTER_PER_MUXSEL * 2) / 4) /* in dwords */
#define AC_SPM_NUM_PERF_SEL 4
|
|
|
|
/*
 * Identifiers of the global SPM blocks.
 *
 * Values are assigned sequentially starting at 0, with two exceptions:
 * AC_SPM_GLOBAL_BLOCK_GE1 is an alias of AC_SPM_GLOBAL_BLOCK_GE, and
 * AC_SPM_GLOBAL_BLOCK_RSPM is pinned to 31 after a gap.
 */
/* GFX10+ */
enum ac_spm_global_block {
   AC_SPM_GLOBAL_BLOCK_CPG,
   AC_SPM_GLOBAL_BLOCK_CPC,
   AC_SPM_GLOBAL_BLOCK_CPF,
   AC_SPM_GLOBAL_BLOCK_GDS,
   AC_SPM_GLOBAL_BLOCK_GCR,
   AC_SPM_GLOBAL_BLOCK_PH,
   AC_SPM_GLOBAL_BLOCK_GE,
   AC_SPM_GLOBAL_BLOCK_GE1 = AC_SPM_GLOBAL_BLOCK_GE, /* same value as GE */
   AC_SPM_GLOBAL_BLOCK_GL2A,
   AC_SPM_GLOBAL_BLOCK_GL2C,
   AC_SPM_GLOBAL_BLOCK_SDMA,
   AC_SPM_GLOBAL_BLOCK_GUS,
   AC_SPM_GLOBAL_BLOCK_EA,
   AC_SPM_GLOBAL_BLOCK_CHA,
   AC_SPM_GLOBAL_BLOCK_CHC,
   AC_SPM_GLOBAL_BLOCK_CHCG,
   AC_SPM_GLOBAL_BLOCK_GPUVMATTCL2,
   AC_SPM_GLOBAL_BLOCK_GPUVMVML2,
   AC_SPM_GLOBAL_BLOCK_GE2SE, /* Per-SE counters */
   AC_SPM_GLOBAL_BLOCK_GE2DIST,

   /* GFX11+ */
   /* gap */
   AC_SPM_GLOBAL_BLOCK_RSPM = 31,
};
|
|
|
|
/*
 * Identifiers of the SPM blocks in the "se" (per-SE) namespace.
 *
 * Values are assigned sequentially starting at 0; the last entry,
 * AC_SPM_SE_BLOCK_SE_RPM, is pinned to 31 after a gap.
 */
enum ac_spm_se_block {
   AC_SPM_SE_BLOCK_CB,
   AC_SPM_SE_BLOCK_DB,
   AC_SPM_SE_BLOCK_PA,
   AC_SPM_SE_BLOCK_SX,
   AC_SPM_SE_BLOCK_SC,
   AC_SPM_SE_BLOCK_TA,
   AC_SPM_SE_BLOCK_TD,
   AC_SPM_SE_BLOCK_TCP,
   AC_SPM_SE_BLOCK_SPI,
   AC_SPM_SE_BLOCK_SQG,
   AC_SPM_SE_BLOCK_GL1A,
   AC_SPM_SE_BLOCK_RMI,
   AC_SPM_SE_BLOCK_GL1C,
   AC_SPM_SE_BLOCK_GL1CG,

   /* GFX11+ */
   AC_SPM_SE_BLOCK_CBR,
   AC_SPM_SE_BLOCK_DBR,
   AC_SPM_SE_BLOCK_GL1H,
   AC_SPM_SE_BLOCK_SQC,
   AC_SPM_SE_BLOCK_PC,
   /* gap */
   AC_SPM_SE_BLOCK_SE_RPM = 31,
};
|
|
|
|
/*
 * SPM segment types: six per-SE segments (SE0..SE5) followed by the global
 * segment.
 *
 * AC_SPM_SEGMENT_TYPE_GLOBAL therefore also equals the number of SE segment
 * types, and AC_SPM_SEGMENT_TYPE_COUNT is the total number of segment types;
 * both are used as array sizes in struct ac_spm.
 */
enum ac_spm_segment_type {
   AC_SPM_SEGMENT_TYPE_SE0,
   AC_SPM_SEGMENT_TYPE_SE1,
   AC_SPM_SEGMENT_TYPE_SE2,
   AC_SPM_SEGMENT_TYPE_SE3,
   AC_SPM_SEGMENT_TYPE_SE4,
   AC_SPM_SEGMENT_TYPE_SE5,
   AC_SPM_SEGMENT_TYPE_GLOBAL,
   AC_SPM_SEGMENT_TYPE_COUNT, /* not a segment; number of entries above */
};
|
|
|
|
struct ac_spm_counter_descr {
|
|
enum ac_pc_gpu_block gpu_block;
|
|
uint32_t event_id;
|
|
};
|
|
|
|
/* Pairs a counter description with a block instance index. */
struct ac_spm_counter_create_info {
   struct ac_spm_counter_descr *b; /* counter description (block + event) */
   uint32_t instance;
};
|
|
|
|
/*
 * A single 16-bit muxsel entry.
 *
 * The same 16 bits can be viewed through one of two bit-field layouts
 * (gfx10: 6+4+1+5 bits, gfx11: 5+5+1+5 bits) or as the raw `value`.
 * NOTE(review): the mapping of bit-fields onto `value` relies on the
 * compiler's bit-field allocation order, which is implementation-defined.
 */
union ac_spm_muxsel {
   struct {
      uint16_t counter : 6;
      uint16_t block : 4;
      uint16_t shader_array : 1; /* 0: SA0, 1: SA1 */
      uint16_t instance : 5;
   } gfx10;

   struct {
      uint16_t counter : 5;
      uint16_t instance : 5;
      uint16_t shader_array : 1;
      uint16_t block : 5;
   } gfx11;
   uint16_t value;
};
|
|
|
|
struct ac_spm_muxsel_line {
|
|
union ac_spm_muxsel muxsel[AC_SPM_NUM_COUNTER_PER_MUXSEL];
|
|
};
|
|
|
|
struct ac_spm_counter_info {
|
|
/* General info. */
|
|
enum ac_pc_gpu_block gpu_block;
|
|
uint32_t instance;
|
|
uint32_t event_id;
|
|
|
|
/* Muxsel info. */
|
|
enum ac_spm_segment_type segment_type;
|
|
bool is_even;
|
|
union ac_spm_muxsel muxsel;
|
|
|
|
/* Output info. */
|
|
uint64_t offset;
|
|
};
|
|
|
|
/*
 * Select state for one counter slot: a usage mask plus two 32-bit select
 * values (sel0, sel1).
 */
struct ac_spm_counter_select {
   uint8_t active; /* mask of used 16-bit counters. */
   uint32_t sel0;
   uint32_t sel1;
};
|
|
|
|
struct ac_spm_block_instance {
|
|
uint32_t grbm_gfx_index;
|
|
|
|
uint32_t num_counters;
|
|
struct ac_spm_counter_select counters[AC_SPM_MAX_COUNTER_PER_BLOCK];
|
|
};
|
|
|
|
/*
 * Counter selection for one block: the perf counter block description and
 * a counted array of its instances.
 */
struct ac_spm_block_select {
   const struct ac_pc_block *b;

   uint32_t num_instances; /* NOTE(review): presumably the length of instances[] */
   struct ac_spm_block_instance *instances;
};
|
|
|
|
struct ac_spm {
|
|
/* struct radeon_winsys_bo or struct pb_buffer */
|
|
void *bo;
|
|
void *ptr;
|
|
uint8_t ptr_granularity;
|
|
uint32_t buffer_size;
|
|
uint16_t sample_interval;
|
|
|
|
/* Enabled counters. */
|
|
unsigned num_counters;
|
|
struct ac_spm_counter_info *counters;
|
|
|
|
/* Block/counters selection. */
|
|
uint32_t num_block_sel;
|
|
struct ac_spm_block_select *block_sel;
|
|
|
|
struct {
|
|
uint32_t num_counters;
|
|
struct ac_spm_counter_select counters[16];
|
|
} sqg[AC_SPM_SEGMENT_TYPE_GLOBAL];
|
|
|
|
struct {
|
|
uint32_t grbm_gfx_index;
|
|
uint32_t num_counters;
|
|
struct ac_spm_counter_select counters[16];
|
|
} sq_wgp[AMD_MAX_WGP];
|
|
|
|
/* Muxsel lines. */
|
|
unsigned num_muxsel_lines[AC_SPM_SEGMENT_TYPE_COUNT];
|
|
struct ac_spm_muxsel_line *muxsel_lines[AC_SPM_SEGMENT_TYPE_COUNT];
|
|
unsigned max_se_muxsel_lines;
|
|
};
|
|
|
|
/*
 * Description of an SPM trace. It shares ptr, sample_interval, num_counters
 * and counters with struct ac_spm, and adds the sample size and sample count.
 * NOTE(review): presumably filled in by ac_spm_get_trace() — confirm.
 */
struct ac_spm_trace {
   void *ptr;
   uint16_t sample_interval;
   unsigned num_counters;
   struct ac_spm_counter_info *counters;
   uint32_t sample_size_in_bytes;
   uint32_t num_samples;
};
|
|
|
|
/*
 * NOTE(review): presumably initializes *spm from the GPU info and the perf
 * counter description, returning false on failure — confirm against the
 * implementation.
 */
bool ac_init_spm(const struct radeon_info *info,
                 const struct ac_perfcounters *pc,
                 struct ac_spm *spm);

/* NOTE(review): presumably releases what ac_init_spm() set up — confirm. */
void ac_destroy_spm(struct ac_spm *spm);

/*
 * NOTE(review): presumably fills *trace from *spm (which is not modified)
 * and returns false on failure — confirm against the implementation.
 */
bool ac_spm_get_trace(const struct ac_spm *spm, struct ac_spm_trace *trace);
|
|
|
|
#endif
|