Mirror of https://github.com/ggml-org/llama.cpp.git (synced 2025-06-27 03:55:20 +00:00)
convert : fix tensor naming conflict for llama 4 vision (#13836)
* convert : fix tensor naming conflict for llama 4 vision
* add comment
This commit is contained in:
@ -2169,6 +2169,9 @@ class Llama4VisionModel(MmprojModel):
|
|||||||
# process vision tensors
|
# process vision tensors
|
||||||
if "positional_embedding_vlm" in name and ".weight" not in name:
|
if "positional_embedding_vlm" in name and ".weight" not in name:
|
||||||
name += ".weight"
|
name += ".weight"
|
||||||
|
if "multi_modal_projector.linear_1" in name:
|
||||||
|
# despite the name with number postfix, this is a single fully connected layer
|
||||||
|
return [(gguf.TENSOR_NAMES[gguf.MODEL_TENSOR.V_MMPROJ_FC], data_torch)]
|
||||||
return [(self.map_tensor_name(name), data_torch)]
|
return [(self.map_tensor_name(name), data_torch)]
|
||||||
return []
|
return []
|
||||||
|
|
||||||
|
@ -902,7 +902,6 @@ class TensorNameMap:
|
|||||||
|
|
||||||
MODEL_TENSOR.V_MMPROJ_FC: (
|
MODEL_TENSOR.V_MMPROJ_FC: (
|
||||||
"model.connector.modality_projection.proj", # SmolVLM
|
"model.connector.modality_projection.proj", # SmolVLM
|
||||||
"multi_modal_projector.linear_1", # llama 4
|
|
||||||
),
|
),
|
||||||
|
|
||||||
MODEL_TENSOR.V_MMPROJ_MLP: (
|
MODEL_TENSOR.V_MMPROJ_MLP: (
|
||||||
|
Reference in New Issue
Block a user