radv: fix IB alignment

This re-introduces "radv: fix alignment of DGC command buffers" and
"radv/amdgpu: fix alignment of command buffers", which were valid
changes.

IBs need to be aligned to the IB alignment requirement (ib_alignment),
not to the number of padded NOPs (ib_pad_dw_mask + 1).

Signed-off-by: Samuel Pitoiset <samuel.pitoiset@gmail.com>
Part-of: <https://gitlab.freedesktop.org/mesa/mesa/-/merge_requests/25588>
This commit is contained in:
Samuel Pitoiset
2023-10-06 12:04:50 +02:00
committed by Marge Bot
parent af062126ae
commit e1622dcca1
2 changed files with 7 additions and 9 deletions

View File

@@ -142,10 +142,9 @@ radv_get_sequence_size(const struct radv_indirect_command_layout *layout, struct
static uint32_t static uint32_t
radv_align_cmdbuf_size(const struct radv_device *device, uint32_t size) radv_align_cmdbuf_size(const struct radv_device *device, uint32_t size)
{ {
const uint32_t ib_pad_dw_mask = MAX2(device->physical_device->rad_info.ib_pad_dw_mask[AMD_IP_GFX], const uint32_t ib_alignment = device->physical_device->rad_info.ib_alignment;
device->physical_device->rad_info.ib_pad_dw_mask[AMD_IP_COMPUTE]);
return align(size, ib_pad_dw_mask + 1); return align(size, ib_alignment);
} }
static unsigned static unsigned

View File

@@ -287,9 +287,9 @@ radv_amdgpu_cs_get_new_ib(struct radeon_cmdbuf *_cs, uint32_t ib_size)
static unsigned static unsigned
radv_amdgpu_cs_get_initial_size(struct radv_amdgpu_winsys *ws, enum amd_ip_type ip_type) radv_amdgpu_cs_get_initial_size(struct radv_amdgpu_winsys *ws, enum amd_ip_type ip_type)
{ {
uint32_t ib_pad_dw_mask = MAX2(3, ws->info.ib_pad_dw_mask[ip_type]); const uint32_t ib_alignment = ws->info.ib_alignment;
assert(util_is_power_of_two_nonzero(ib_pad_dw_mask + 1)); assert(util_is_power_of_two_nonzero(ib_alignment));
return align(20 * 1024 * 4, ib_pad_dw_mask + 1); return align(20 * 1024 * 4, ib_alignment);
} }
static struct radeon_cmdbuf * static struct radeon_cmdbuf *
@@ -377,15 +377,14 @@ radv_amdgpu_cs_grow(struct radeon_cmdbuf *_cs, size_t min_size)
return; return;
} }
enum amd_ip_type ip_type = cs->hw_ip; const uint32_t ib_alignment = cs->ws->info.ib_alignment;
uint32_t ib_pad_dw_mask = MAX2(3, cs->ws->info.ib_pad_dw_mask[ip_type]);
cs->ws->base.cs_finalize(_cs); cs->ws->base.cs_finalize(_cs);
uint64_t ib_size = MAX2(min_size * 4 + 16, cs->base.max_dw * 4 * 2); uint64_t ib_size = MAX2(min_size * 4 + 16, cs->base.max_dw * 4 * 2);
/* max that fits in the chain size field. */ /* max that fits in the chain size field. */
ib_size = align(MIN2(ib_size, 0xfffff), ib_pad_dw_mask + 1); ib_size = align(MIN2(ib_size, 0xfffff), ib_alignment);
VkResult result = radv_amdgpu_cs_bo_create(cs, ib_size); VkResult result = radv_amdgpu_cs_bo_create(cs, ib_size);