File tree Expand file tree Collapse file tree 3 files changed +5
-10
lines changed
include/pytorch/tokenizers Expand file tree Collapse file tree 3 files changed +5
-10
lines changed Original file line number Diff line number Diff line change 12
12
13
13
namespace tokenizers {
14
14
15
- struct TokenIndex {
16
- const char * str;
17
- int32_t id;
18
- };
19
-
20
15
// A simple Byte Pair Encoding (BPE) Tokenizer. Note that the current C++ code
21
16
// won't work with this class, it needs to go through tokenizer.py first.
22
17
class Llama2cTokenizer : public Tokenizer {
Original file line number Diff line number Diff line change 16
16
#include "sentencepiece_processor.h"
17
17
namespace tokenizers {
18
18
19
- struct TokenIndex {
20
- const char * str;
21
- int32_t id;
22
- };
23
-
24
19
class SPTokenizer : public Tokenizer {
25
20
public:
26
21
explicit SPTokenizer();
Original file line number Diff line number Diff line change 20
20
21
21
namespace tokenizers {
22
22
23
+ struct TokenIndex {
24
+ const char * str;
25
+ int32_t id;
26
+ };
27
+
23
28
class Tokenizer {
24
29
public:
25
30
explicit Tokenizer() {}
You can’t perform that action at this time.
0 commit comments