File tree Expand file tree Collapse file tree 1 file changed +7
-0
lines changed Expand file tree Collapse file tree 1 file changed +7
-0
lines changed Original file line number Diff line number Diff line change 1414#include < executorch/extension/llm/runner/util.h>
1515#include < pytorch/tokenizers/hf_tokenizer.h>
1616#include < pytorch/tokenizers/llama2c_tokenizer.h>
17+ #include < pytorch/tokenizers/sentencepiece_tokenizer.h>
1718#include < pytorch/tokenizers/tiktoken.h>
1819
1920namespace executorch ::extension::llm {
@@ -252,6 +253,12 @@ std::unique_ptr<tokenizers::Tokenizer> load_tokenizer(
252253 return tiktoken_tokenizer;
253254 }
254255
256+ auto sp_tokenizer = std::make_unique<::tokenizers::SPTokenizer>();
257+ if (sp_tokenizer->load (tokenizer_path) == ::tokenizers::Error::Ok) {
258+ ET_LOG (Info, " Loaded Sentencepiece tokenizer" );
259+ return sp_tokenizer;
260+ }
261+
255262 auto bpe_tokenizer = std::make_unique<::tokenizers::Llama2cTokenizer>();
256263 if (bpe_tokenizer->load (tokenizer_path) == ::tokenizers::Error::Ok) {
257264 ET_LOG (Info, " Loaded BPE tokenizer" );
You can’t perform that action at this time.
0 commit comments