spaces--

ggml-org · CISC · Jun 1, 2025 · May 24, 2025 · May 24, 2025 · May 24, 2025
commit a835a0c0b1665a347e22ce765ef9783a46f2e046
diff --git a/convert_hf_to_gguf.py b/convert_hf_to_gguf.py
@@ -3854,7 +3854,7 @@ def _xlmroberta_set_vocab(self) -> None:
                 if (piece := tokenizer._convert_id_to_token(token_id)) is not None:
                     text = piece.encode("utf-8")
                     score = tokenizer_json["model"]["vocab"][token_id][1]
-    
+
                     toktype = SentencePieceTokenTypes.NORMAL
                     if token_id == unk_token_id:
                         toktype = SentencePieceTokenTypes.UNKNOWN
@@ -3865,7 +3865,7 @@ def _xlmroberta_set_vocab(self) -> None:
                     # No reliable way to detect this, but jina doesn't have any
                     # elif tokenizer.IsByte(token_id):
                     #     toktype = SentencePieceTokenTypes.BYTE
-    
+
                     tokens[token_id] = text
                     scores[token_id] = score
                     toktypes[token_id] = toktype