mirror of
https://github.com/ggml-org/llama.cpp.git
synced 2025-07-21 18:28:31 +00:00
@ -1261,7 +1261,7 @@ void llama_kv_cache_unified::set_input_k_shift(ggml_tensor * dst) const {
|
|||||||
const auto & cells = v_cells[s];
|
const auto & cells = v_cells[s];
|
||||||
|
|
||||||
for (uint32_t i = 0; i < cells.size(); ++i) {
|
for (uint32_t i = 0; i < cells.size(); ++i) {
|
||||||
data[i] = cells.is_empty(i) ? 0 : cells.get_shift(i);
|
data[s*cells.size() + i] = cells.is_empty(i) ? 0 : cells.get_shift(i);
|
||||||
}
|
}
|
||||||
}
|
}
|
||||||
}
|
}
|
||||||
|
Reference in New Issue
Block a user