convert : remove now-unused ignore_nonllama parameter

2025-01-13 22:08:55 +01:00 · 2024-04-04 17:44:58 -04:00 · 2024-04-04 17:44:58 -04:00 · 45983e3a47
commit 45983e3a47
parent 909f6be291
1 changed file with 2 additions and 4 deletions
--- a/convert.py
+++ b/convert.py
@@ -516,7 +516,7 @@ class LlamaHfVocab(Vocab):
    tokenizer_model = "llama"
    name = "hfft"

-    def __init__(self, base_path: Path, ignore_nonllama: bool = False):
+    def __init__(self, base_path: Path):
        fname_tokenizer = base_path / FAST_TOKENIZER_FILE
        # if this fails, FileNotFoundError propagates to caller
        with open(fname_tokenizer, encoding='utf-8') as f:
@@ -524,9 +524,7 @@ class LlamaHfVocab(Vocab):

        # pre-check so we know if we need transformers
        tokenizer_model: dict[str, Any] = tokenizer_json['model']
-        if ignore_nonllama:
-            pass  # workaround incorrect use of this class for WordPiece
-        elif (
+        if (
            tokenizer_model['type'] != 'BPE' or not tokenizer_model.get('byte_fallback', False)
            or tokenizer_json['decoder']['type'] != 'Sequence'
        ):