convert : only check for tokenizer folder if we need it (#14704)

2025-08-09 02:12:45 -04:00 · 2025-07-16 08:52:04 +02:00
parent cf91f217f1
commit 4b91d6f71f
1 changed files with 6 additions and 5 deletions
--- a/convert_hf_to_gguf_update.py
+++ b/convert_hf_to_gguf_update.py
@@ -240,11 +240,6 @@ for model in [*pre_computed_hashes, *all_models]:
    if tokt == TOKENIZER_TYPE.SPM or tokt == TOKENIZER_TYPE.UGM:
        continue

-    # Skip if the tokenizer folder does not exist or there are other download issues previously
-    if not os.path.exists(f"models/tokenizers/{name}"):
-        logger.warning(f"Directory for tokenizer {name} not found. Skipping...")
-        continue
-
    # create the tokenizer
    if chkhsh is not None:
        # if the model has a pre-computed hash, use it
@@ -254,6 +249,12 @@ for model in [*pre_computed_hashes, *all_models]:
        chkhsh = existing_models[name]
    else:
        # otherwise, compute the hash of the tokenizer
+
+        # Skip if the tokenizer folder does not exist (e.g. because an earlier download failed)
+        if not os.path.exists(f"models/tokenizers/{name}"):
+            logger.warning(f"Directory for tokenizer {name} not found. Skipping...")
+            continue
+
        try:
            logger.info(f"Loading tokenizer from {f'models/tokenizers/{name}'}...")
            if name == "t5":