Add CUDA Graphs in CMakeLists.txt (#947)

original LCPP PR 3242 by Slaren
This commit is contained in:
Nexesenex 2024-06-29 04:10:51 +02:00 committed by GitHub
parent 2857fb52ba
commit a5a32b9179
No known key found for this signature in database
GPG key ID: B5690EEEBB952194

View file

@ -49,6 +49,7 @@ option(LLAMA_CUDA_F16 "llama: use 16 bit floats for dmmv
# CUDA / HIP backend tunables.
# String-valued settings are cache entries, so they can be overridden at
# configure time with -D<NAME>=<value>.
set(LLAMA_CUDA_KQUANTS_ITER "2" CACHE STRING "llama: iters./thread per block for Q2_K/Q6_K")
set(LLAMA_CUDA_PEER_MAX_BATCH_SIZE "128" CACHE STRING
    "llama: max. batch size for using peer access")
# Declared as an option (default ON) rather than a plain set(): a normal
# variable would shadow any -DGGML_CUDA_USE_GRAPHS=OFF given on the command
# line, leaving users no way to switch the feature off.
# NOTE(review): presumably consumed later in this file to enable CUDA graph
# support in the CUDA build -- confirm against the consumer.
option(GGML_CUDA_USE_GRAPHS "llama: use CUDA graphs" ON)
option(LLAMA_HIPBLAS "llama: use hipBLAS" OFF)
# Other