server : fix LRU check (#14079)

ggml-ci
2025-06-26 19:55:04 +00:00 · 2025-06-09 12:57:58 +03:00
parent b460d16ae8
commit 87d34b381d
1 changed files with 3 additions and 2 deletions
--- a/tools/server/server.cpp
+++ b/tools/server/server.cpp
@@ -2142,7 +2142,8 @@ struct server_context {

        // find the slot that has been least recently used
        if (ret == nullptr) {
-            int64_t t_last = ggml_time_us();
+            int64_t t_last = -1;
+
            for (server_slot & slot : slots) {
                // skip the slot if it is not available
                if (slot.is_processing()) {
@@ -2150,7 +2151,7 @@ struct server_context {
                }

                // select the current slot if the criteria match
-                if (slot.t_last_used < t_last) {
+                if (!ret || slot.t_last_used <= t_last) {
                    t_last = slot.t_last_used;
                    ret = &slot;
                }