Mirror of https://github.com/ggml-org/llama.cpp.git (synced 2025-08-24 08:49:15 -04:00).
Commit: Fixed mmap prefetch for GPU offloading (#2529)
This commit is contained in:
@@ -219,7 +219,7 @@ struct llama_mmap {
         // prefetch/readahead impairs performance on NUMA systems
         if (numa) { prefetch = 0; }
 #ifdef __linux__
-        if (prefetch) { flags |= MAP_POPULATE; }
+        if (prefetch >= file->size) { flags |= MAP_POPULATE; }
 #endif
         addr = mmap(NULL, file->size, PROT_READ, flags, fd, 0);
         if (addr == MAP_FAILED) {
Reference in New Issue
Block a user