Limit CUDA graph support (USE_CUDA_GRAPH) to builds where GGML_ALLOW_CUDA_GRAPHS is defined by the llama.cpp CMake configuration

2025-07-28 21:23:55 -04:00 · 2024-04-25 00:51:48 -07:00
parent 408759687f
commit 0640427f7b
2 changed files with 2 additions and 1 deletions
--- a/ggml-cuda.cu
+++ b/ggml-cuda.cu
@@ -2405,7 +2405,7 @@ GGML_CALL static void ggml_backend_cuda_synchronize(ggml_backend_t backend) {
    GGML_UNUSED(backend);
 }

-#if (CUDART_VERSION >= 12000)
+#if (CUDART_VERSION >= 12000) && defined(GGML_ALLOW_CUDA_GRAPHS)
 #define USE_CUDA_GRAPH
 #endif