mirror of
https://github.com/ggml-org/llama.cpp.git
synced 2025-06-29 04:35:05 +00:00
llama : fix KV shift for qwen2vl (#13870)
* llama : fix KV shift for qwen2vl
* add ref to the PR
This commit is contained in:
@@ -455,7 +455,7 @@ llm_graph_context::llm_graph_context(const llm_graph_params & params) :
|
||||
}
|
||||
|
||||
int64_t llm_graph_context::n_pos_per_embd() const {
|
||||
-    return arch == LLM_ARCH_QWEN2VL ? 4 : 1;
|
||||
+    return hparams.rope_type == LLAMA_ROPE_TYPE_MROPE ? 4 : 1;
|
||||
}
|
||||
|
||||
void llm_graph_context::cb(ggml_tensor * cur, const char * name, int il) const {
|
||||
|
Reference in New Issue
Block a user