llama : models now build their graphs using llama_graph_i

ggml-ci
2025-07-16 15:47:35 +00:00 · 2025-02-12 15:08:40 +02:00
parent 0ab50f1bbb
commit f63aeecce6
6 changed files with 7457 additions and 7441 deletions
--- a/src/llama-graph.h
+++ b/src/llama-graph.h
@@ -7,9 +7,15 @@ struct ggml_context;
 struct ggml_tensor;
 struct llama_ubatch;

-// TODO: pass to llama_model graph build
+// TODO: can become more granular in the future
 class llama_graph_i {
 public:
+    // callback that allows us to apply custom logic to each tensor (e.g. ggml-alloc, offloading, etc.)
+    virtual void build_cb(
+             ggml_tensor * cur,
+              const char * name,
+                     int   il) = 0;
+
    // apply control vector for layer il
    virtual ggml_tensor * build_cvec(
            ggml_context * ctx0,