mirror of
https://github.com/ggml-org/llama.cpp.git
synced 2025-07-16 15:47:35 +00:00
llama : models now build their graphs using llama_graph_i
ggml-ci
This commit is contained in:
@ -7,9 +7,15 @@ struct ggml_context;
|
||||
struct ggml_tensor;
|
||||
struct llama_ubatch;
|
||||
|
||||
// TODO: pass to llama_model graph build
|
||||
// TODO: can become more granular in the future
|
||||
class llama_graph_i {
|
||||
public:
|
||||
// callback that allows us to apply custom logic to each tensor (e.g. ggml-alloc, offloading, etc.)
|
||||
virtual void build_cb(
|
||||
ggml_tensor * cur,
|
||||
const char * name,
|
||||
int il) = 0;
|
||||
|
||||
// apply control vector for layer il
|
||||
virtual ggml_tensor * build_cvec(
|
||||
ggml_context * ctx0,
|
||||
|
Reference in New Issue
Block a user