cuda : disable launch_fattn PDL enrollment due to a compiler bug (llama/23825)
This commit is contained in:
parent
f1b687da28
commit
e90501e179
|
|
@ -1153,8 +1153,8 @@ void launch_fattn(
|
|||
|
||||
GGML_ASSERT(block_dim.x % warp_size == 0);
|
||||
|
||||
const ggml_cuda_kernel_launch_params launch_params = ggml_cuda_kernel_launch_params(blocks_num, block_dim, nbytes_shared, main_stream);
|
||||
ggml_cuda_kernel_launch(fattn_kernel, launch_params,
|
||||
// PDL enrollment is disabled for now due to a compiler bug; launch the kernel directly instead.
|
||||
fattn_kernel<<<blocks_num, block_dim, nbytes_shared, main_stream>>>(
|
||||
(const char *) Q->data,
|
||||
K_data,
|
||||
V_data,
|
||||
|
|
|
|||
Loading…
Reference in New Issue