1 file changed: +2 -2 lines changed
Original file line number | Diff line number | Diff line change
@@ -3854,7 +3854,7 @@ def _xlmroberta_set_vocab(self) -> None:
38543854 if (piece := tokenizer ._convert_id_to_token (token_id )) is not None :
38553855 text = piece .encode ("utf-8" )
38563856 score = tokenizer_json ["model" ]["vocab" ][token_id ][1 ]
3857-
3857+
38583858 toktype = SentencePieceTokenTypes .NORMAL
38593859 if token_id == unk_token_id :
38603860 toktype = SentencePieceTokenTypes .UNKNOWN
@@ -3865,7 +3865,7 @@ def _xlmroberta_set_vocab(self) -> None:
38653865 # No reliable way to detect this, but jina doesn't have any
38663866 # elif tokenizer.IsByte(token_id):
38673867 # toktype = SentencePieceTokenTypes.BYTE
3868-
3868+
38693869 tokens [token_id ] = text
38703870 scores [token_id ] = score
38713871 toktypes [token_id ] = toktype
You can’t perform that action at this time.
0 commit comments