vocab : add midm-2.0 model pre-tokenizer (#14626)

This commit is contained in:
Dowon
2025-07-11 16:36:04 +09:00
committed by GitHub
parent 0aedae00e6
commit 576c82eda2
3 changed files with 6 additions and 1 deletion

View File

@@ -1524,7 +1524,8 @@ void llama_vocab::impl::load(llama_model_loader & ml, const LLM_KV & kv) {
tokenizer_pre == "llama-bpe"||
tokenizer_pre == "falcon3" ||
tokenizer_pre == "falcon-h1" ||
-tokenizer_pre == "pixtral") {
+tokenizer_pre == "pixtral" ||
+tokenizer_pre == "midm-2.0") {
pre_type = LLAMA_VOCAB_PRE_TYPE_LLAMA3;
ignore_merges = true;
add_bos = true;