cuda : disables launch_fattn PDL enrollment due to compiler bug (llama/23825)

This commit is contained in:
Andreas Kieslinger 2026-05-29 06:46:10 +02:00 committed by Georgi Gerganov
parent f1b687da28
commit e90501e179
1 changed file with 2 additions and 2 deletions

View File

@@ -1153,8 +1153,8 @@ void launch_fattn(
GGML_ASSERT(block_dim.x % warp_size == 0);
const ggml_cuda_kernel_launch_params launch_params = ggml_cuda_kernel_launch_params(blocks_num, block_dim, nbytes_shared, main_stream);
ggml_cuda_kernel_launch(fattn_kernel, launch_params,
// disabled PDL enrollment for now due to a compiler bug.
fattn_kernel<<<blocks_num, block_dim, nbytes_shared, main_stream>>>(
(const char *) Q->data,
K_data,
V_data,