convert : fix Qwen/Qwen-7b conversion (#7308)

This commit is contained in:
amd-lalithnc 2024-05-17 12:31:58 +05:30 committed by GitHub
parent ee94172d33
commit e18bc6aaf3
No known key found for this signature in database
GPG Key ID: B5690EEEBB952194

View File

@@ -526,7 +526,7 @@ class Model:
# for this kind of tokenizer, added_vocab is not a subset of vocab, so they need to be combined # for this kind of tokenizer, added_vocab is not a subset of vocab, so they need to be combined
added_vocab = tokenizer.special_tokens added_vocab = tokenizer.special_tokens
reverse_vocab = {id_ : encoded_tok for encoded_tok, id_ in (vocab | added_vocab).items()} reverse_vocab = {id_ : encoded_tok for encoded_tok, id_ in {**vocab, **added_vocab}.items()}
for i in range(vocab_size): for i in range(vocab_size):
if i not in reverse_vocab: if i not in reverse_vocab: