mirror of
https://github.com/ggerganov/llama.cpp.git
synced 2024-10-29 22:20:15 +01:00
convert : fix Qwen/Qwen-7b conversion (#7308)
This commit is contained in:
parent
ee94172d33
commit
e18bc6aaf3
@@ -526,7 +526,7 @@ class Model:
|
|||||||
|
|
||||||
# for this kind of tokenizer, added_vocab is not a subset of vocab, so they need to be combined
|
# for this kind of tokenizer, added_vocab is not a subset of vocab, so they need to be combined
|
||||||
added_vocab = tokenizer.special_tokens
|
added_vocab = tokenizer.special_tokens
|
||||||
reverse_vocab = {id_ : encoded_tok for encoded_tok, id_ in (vocab | added_vocab).items()}
|
reverse_vocab = {id_ : encoded_tok for encoded_tok, id_ in {**vocab, **added_vocab}.items()}
|
||||||
|
|
||||||
for i in range(vocab_size):
|
for i in range(vocab_size):
|
||||||
if i not in reverse_vocab:
|
if i not in reverse_vocab:
|
||||||
|
Loading…
Reference in New Issue
Block a user