Skip to content

Commit d4eeb2d

Browse files
committed
bpe_tokenizer class updated.
1 parent 2db56f5 commit d4eeb2d

File tree

1 file changed

+3
-2
lines changed

1 file changed

+3
-2
lines changed

dlib/tokenizer/bpe_tokenizer.h

Lines changed: 3 additions & 2 deletions
Original file line number | Diff line number | Diff line change
@@ -213,7 +213,8 @@ namespace dlib
213 213
const std::vector<uint8_t>& pattern = merges[token].pattern;
214 214
result.insert(result.end(), pattern.begin(), pattern.end());
215 215
}
216-
else if (token >= static_cast<int>(merges.size()) && token < get_vocab_without_specials_size()) {
216+
else if (token >= static_cast<int>(merges.size()) &&
217+
token < static_cast<int>(get_vocab_without_specials_size())) {
217 218
// Special token
218 219
int special_idx = token - static_cast<int>(merges.size());
219 220
if (display_special_tokens) {
@@ -321,7 +322,7 @@ namespace dlib
321 322
"<user>", "<bot>", "<system>", "<question>",
322 323
"<answer>", "<search>", "<unk>", "<pad>"
323 324
};
324-
static const size_t BPE_BASE_VOCAB_SIZE = 256;
325+
static const int BPE_BASE_VOCAB_SIZE = 256;
325 326

326 327
// Merge structure
327 328
struct Merge {

0 commit comments

Comments
 (0)