convert : XLMRoberta Type Vocab Size (#10458)

This matches the `type_vocab_size` key used by common BERT-based embedding
models, whose value may be something other than 1.

Branch: XLMRobertaTypeVocabSize

Signed-off-by: Gabe Goodhart <ghart@us.ibm.com>
This commit is contained in:
Gabe Goodhart 2024-11-24 02:02:34 -07:00 committed by GitHub
parent 96fa2c5e2d
commit 9336db462c
No known key found for this signature in database
GPG Key ID: B5690EEEBB952194

View File

@@ -2707,7 +2707,7 @@ class XLMRobertaModel(BertModel):
self.gguf_writer.add_token_scores(scores) self.gguf_writer.add_token_scores(scores)
self.gguf_writer.add_token_types(toktypes) self.gguf_writer.add_token_types(toktypes)
self.gguf_writer.add_add_space_prefix(add_prefix) self.gguf_writer.add_add_space_prefix(add_prefix)
self.gguf_writer.add_token_type_count(1) self.gguf_writer.add_token_type_count(self.hparams.get("type_vocab_size", 1))
self.gguf_writer.add_remove_extra_whitespaces(remove_whitespaces) self.gguf_writer.add_remove_extra_whitespaces(remove_whitespaces)
if precompiled_charsmap: if precompiled_charsmap:
self.gguf_writer.add_precompiled_charsmap(precompiled_charsmap) self.gguf_writer.add_precompiled_charsmap(precompiled_charsmap)