cuda : disables launch_fattn PDL enrollment due to compiler bug (#23825)

This commit is contained in:
Andreas Kieslinger 2026-05-29 06:46:10 +02:00 committed by GitHub
parent 33c718db1f
commit 241cbd41d2
No known key found for this signature in database
GPG key ID: B5690EEEBB952194

View file

@ -1153,8 +1153,8 @@ void launch_fattn(
GGML_ASSERT(block_dim.x % warp_size == 0);
const ggml_cuda_kernel_launch_params launch_params = ggml_cuda_kernel_launch_params(blocks_num, block_dim, nbytes_shared, main_stream);
ggml_cuda_kernel_launch(fattn_kernel, launch_params,
// PDL enrollment is disabled for now due to a compiler bug (see #23825); launch the kernel directly instead.
fattn_kernel<<<blocks_num, block_dim, nbytes_shared, main_stream>>>(
(const char *) Q->data,
K_data,
V_data,