metal : release buffers when freeing metal context (#2062)

2025-08-17 05:25:09 -04:00 · 2023-07-01 11:14:59 -07:00
parent 471aab6e4c
commit 2f8cd979ec
2 changed files with 10 additions and 2 deletions
--- a/llama.cpp
+++ b/llama.cpp
@@ -253,7 +253,13 @@ struct llama_model {

 struct llama_context {
    llama_context(const llama_model & model, const llama_vocab & vocab) : model(model), vocab(vocab), t_load_us(model.t_load_us), t_start_us(model.t_start_us) {}
-
+#ifdef GGML_USE_METAL
+    ~llama_context() { // destructor compiled only when GGML_USE_METAL is defined
+        if (ctx_metal) { // call the free routine only when ctx_metal is set (non-null)
+            ggml_metal_free(ctx_metal); // hands ctx_metal to ggml_metal_free so it is released along with this context
+        }
+    }
+#endif // GGML_USE_METAL
    std::mt19937 rng;

    bool has_evaluated_once = false;