Mirror of https://github.com/ggml-org/llama.cpp.git (synced 2025-06-27 12:05:03 +00:00)
metal : reduce command encoding overhead (#9698)
* metal : reduce command encoding overhead

ggml-ci

* metal : add comments
@@ -2444,12 +2444,6 @@ bool clip_image_batch_encode(clip_ctx * ctx, const int n_threads, const clip_ima
         ggml_backend_cpu_set_n_threads(ctx->backend, n_threads);
     }
 
-#ifdef GGML_USE_METAL
-    if (ggml_backend_is_metal(ctx->backend)) {
-        ggml_backend_metal_set_n_cb(ctx->backend, n_threads);
-    }
-#endif
-
     ggml_backend_graph_compute(ctx->backend, gf);
 
     // the last node is the embedding tensor
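The hunk drops the ggml_backend_metal_set_n_cb() call, so callers no longer special-case the Metal backend before computing a graph; command-buffer management is handled inside the backend itself. Below is a minimal sketch of the resulting call site, assuming the ggml-backend API of this era; the helper name compute_graph is hypothetical and not part of the commit.

#include "ggml-backend.h"

// Hypothetical helper, for illustration only: after this commit the Metal
// backend needs no per-call setup, so every backend funnels through the
// same ggml_backend_graph_compute() path.
static void compute_graph(ggml_backend_t backend, struct ggml_cgraph * gf, int n_threads) {
    if (ggml_backend_is_cpu(backend)) {
        // the CPU backend still takes an explicit thread-count hint
        ggml_backend_cpu_set_n_threads(backend, n_threads);
    }
    ggml_backend_graph_compute(backend, gf);
}

With the #ifdef GGML_USE_METAL block gone, the call site is backend-agnostic and no longer needs Metal headers or a compile-time guard.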