mesa/src/amd/vulkan/radv_debug.h
Tatsuyuki Ishi a8c5fd3b1b radv: Upload shaders to invisible VRAM on small BAR systems.
Following PAL's implementation, this patch avoids allocating shader code
buffers in BAR and use SDMA to upload them to invisible VRAM
directly.

For some games like HZD, shaders can take as much as 400MB, which exceeds
the non-resizable BAR size (256MB) and cause inconsistent spilling
behavior. The kernel will normally move these to invisible VRAM on its own,
but there are a few cases that it does not reliably happen. This patch does
the moving explicitly in the driver to ensure predictable results.

In this patch, we upload the shaders synchronously; so the shader will be
ready as soon as vkCreate*Pipeline returns. A following patch will make
this asynchronous and don't block until we see a use of the pipeline.

As a side effect, when SQTT is used we now store the shaders on a cacheable
buffer which would speed up writing the trace to the disk.

Part-of: <https://gitlab.freedesktop.org/mesa/mesa/-/merge_requests/16271>
2023-03-16 18:02:57 +00:00

106 lines
3.9 KiB
C

/*
* Copyright © 2017 Google.
*
* Permission is hereby granted, free of charge, to any person obtaining a
* copy of this software and associated documentation files (the "Software"),
* to deal in the Software without restriction, including without limitation
* the rights to use, copy, modify, merge, publish, distribute, sublicense,
* and/or sell copies of the Software, and to permit persons to whom the
* Software is furnished to do so, subject to the following conditions:
*
* The above copyright notice and this permission notice (including the next
* paragraph) shall be included in all copies or substantial portions of the
* Software.
*
* THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
* IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
* FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL
* THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
* LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING
* FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS
* IN THE SOFTWARE.
*/
#ifndef RADV_DEBUG_H
#define RADV_DEBUG_H
#include "radv_private.h"
/* Please keep docs/envvars.rst up-to-date when you add/remove options. */
enum {
RADV_DEBUG_NO_FAST_CLEARS = 1ull << 0,
RADV_DEBUG_NO_DCC = 1ull << 1,
RADV_DEBUG_DUMP_SHADERS = 1ull << 2,
RADV_DEBUG_NO_CACHE = 1ull << 3,
RADV_DEBUG_DUMP_SHADER_STATS = 1ull << 4,
RADV_DEBUG_NO_HIZ = 1ull << 5,
RADV_DEBUG_NO_COMPUTE_QUEUE = 1ull << 6,
RADV_DEBUG_ALL_BOS = 1ull << 7,
RADV_DEBUG_NO_IBS = 1ull << 8,
RADV_DEBUG_DUMP_SPIRV = 1ull << 9,
RADV_DEBUG_VM_FAULTS = 1ull << 10,
RADV_DEBUG_ZERO_VRAM = 1ull << 11,
RADV_DEBUG_SYNC_SHADERS = 1ull << 12,
RADV_DEBUG_PREOPTIR = 1ull << 13,
RADV_DEBUG_NO_DYNAMIC_BOUNDS = 1ull << 14,
RADV_DEBUG_INFO = 1ull << 15,
RADV_DEBUG_STARTUP = 1ull << 16,
RADV_DEBUG_CHECKIR = 1ull << 17,
RADV_DEBUG_NOBINNING = 1ull << 18,
RADV_DEBUG_NO_NGG = 1ull << 19,
RADV_DEBUG_DUMP_META_SHADERS = 1ull << 20,
RADV_DEBUG_NO_MEMORY_CACHE = 1ull << 21,
RADV_DEBUG_DISCARD_TO_DEMOTE = 1ull << 22,
RADV_DEBUG_LLVM = 1ull << 23,
RADV_DEBUG_FORCE_COMPRESS = 1ull << 24,
RADV_DEBUG_HANG = 1ull << 25,
RADV_DEBUG_IMG = 1ull << 26,
RADV_DEBUG_NO_UMR = 1ull << 27,
RADV_DEBUG_INVARIANT_GEOM = 1ull << 28,
RADV_DEBUG_NO_DISPLAY_DCC = 1ull << 29,
RADV_DEBUG_NO_TC_COMPAT_CMASK = 1ull << 30,
RADV_DEBUG_NO_VRS_FLAT_SHADING = 1ull << 31,
RADV_DEBUG_NO_ATOC_DITHERING = 1ull << 32,
RADV_DEBUG_NO_NGGC = 1ull << 33,
RADV_DEBUG_DUMP_PROLOGS = 1ull << 34,
RADV_DEBUG_NO_DMA_BLIT = 1ull << 35,
RADV_DEBUG_SPLIT_FMA = 1ull << 36,
RADV_DEBUG_DUMP_EPILOGS = 1ull << 37,
RADV_DEBUG_NO_FMASK = 1ull << 38,
RADV_DEBUG_SHADOW_REGS = 1ull << 39,
};
enum {
RADV_PERFTEST_LOCAL_BOS = 1u << 0,
RADV_PERFTEST_DCC_MSAA = 1u << 1,
RADV_PERFTEST_BO_LIST = 1u << 2,
RADV_PERFTEST_CS_WAVE_32 = 1u << 3,
RADV_PERFTEST_PS_WAVE_32 = 1u << 4,
RADV_PERFTEST_GE_WAVE_32 = 1u << 5,
RADV_PERFTEST_NO_SAM = 1u << 6,
RADV_PERFTEST_SAM = 1u << 7,
RADV_PERFTEST_RT = 1u << 8,
RADV_PERFTEST_NGGC = 1u << 9,
RADV_PERFTEST_EMULATE_RT = 1u << 10,
RADV_PERFTEST_NV_MS = 1u << 11,
RADV_PERFTEST_RT_WAVE_64 = 1u << 12,
RADV_PERFTEST_GPL = 1u << 13,
RADV_PERFTEST_NGG_STREAMOUT = 1u << 14,
RADV_PERFTEST_VIDEO_DECODE = 1u << 15,
RADV_PERFTEST_DMA_SHADERS = 1u << 16,
};
bool radv_init_trace(struct radv_device *device);
void radv_finish_trace(struct radv_device *device);
void radv_check_gpu_hangs(struct radv_queue *queue, struct radeon_cmdbuf *cs);
void radv_print_spirv(const char *data, uint32_t size, FILE *fp);
void radv_dump_enabled_options(struct radv_device *device, FILE *f);
bool radv_trap_handler_init(struct radv_device *device);
void radv_trap_handler_finish(struct radv_device *device);
void radv_check_trap_handler(struct radv_queue *queue);
#endif