@@ -11,114 +11,114 @@ defmodule Tokenizers.Encoding do
11
11
@ doc """
12
12
Get the number of tokens in an encoding.
13
13
"""
14
- @ spec get_length ( Encoding . t ( ) ) :: non_neg_integer ( )
14
+ @ spec get_length ( t ( ) ) :: non_neg_integer ( )
15
15
defdelegate get_length ( encoding ) , to: Tokenizers.Native , as: :encoding_get_length
16
16
17
17
@ doc """
18
18
Return the number of sequences combined in this Encoding.
19
19
"""
20
- @ spec get_n_sequences ( Encoding . t ( ) ) :: non_neg_integer ( )
20
+ @ spec get_n_sequences ( t ( ) ) :: non_neg_integer ( )
21
21
defdelegate get_n_sequences ( encoding ) , to: Tokenizers.Native , as: :encoding_get_n_sequences
22
22
23
23
@ doc """
24
24
Set the given sequence id for the whole range of tokens contained in this Encoding.
25
25
"""
26
- @ spec set_sequence_id ( Encoding . t ( ) , non_neg_integer ( ) ) :: Encoding . t ( )
26
+ @ spec set_sequence_id ( t ( ) , non_neg_integer ( ) ) :: t ( )
27
27
defdelegate set_sequence_id ( encoding , id ) , to: Tokenizers.Native , as: :encoding_set_sequence_id
28
28
29
29
@ doc """
30
30
Get the ids from an encoding.
31
31
"""
32
- @ spec get_ids ( Encoding . t ( ) ) :: [ integer ( ) ]
32
+ @ spec get_ids ( t ( ) ) :: [ integer ( ) ]
33
33
defdelegate get_ids ( encoding ) , to: Tokenizers.Native , as: :encoding_get_ids
34
34
35
35
@ doc """
36
36
Same as `get_ids/1`, but returns binary with u32 values.
37
37
"""
38
- @ spec get_u32_ids ( Encoding . t ( ) ) :: binary ( )
38
+ @ spec get_u32_ids ( t ( ) ) :: binary ( )
39
39
defdelegate get_u32_ids ( encoding ) , to: Tokenizers.Native , as: :encoding_get_u32_ids
40
40
41
41
@ doc """
42
42
Get token type ids from an encoding.
43
43
"""
44
- @ spec get_type_ids ( Encoding . t ( ) ) :: [ integer ( ) ]
44
+ @ spec get_type_ids ( t ( ) ) :: [ integer ( ) ]
45
45
defdelegate get_type_ids ( encoding ) , to: Tokenizers.Native , as: :encoding_get_type_ids
46
46
47
47
@ doc """
48
48
Same as `get_type_ids/1`, but returns binary with u32 values.
49
49
"""
50
- @ spec get_u32_type_ids ( Encoding . t ( ) ) :: binary ( )
50
+ @ spec get_u32_type_ids ( t ( ) ) :: binary ( )
51
51
defdelegate get_u32_type_ids ( encoding ) , to: Tokenizers.Native , as: :encoding_get_u32_type_ids
52
52
53
53
@ doc """
54
54
Get the attention mask from an encoding.
55
55
"""
56
- @ spec get_attention_mask ( Encoding . t ( ) ) :: [ integer ( ) ]
56
+ @ spec get_attention_mask ( t ( ) ) :: [ integer ( ) ]
57
57
defdelegate get_attention_mask ( encoding ) ,
58
58
to: Tokenizers.Native ,
59
59
as: :encoding_get_attention_mask
60
60
61
61
@ doc """
62
62
Same as `get_attention_mask/1`, but returns binary with u32 values.
63
63
"""
64
- @ spec get_u32_attention_mask ( Encoding . t ( ) ) :: binary ( )
64
+ @ spec get_u32_attention_mask ( t ( ) ) :: binary ( )
65
65
defdelegate get_u32_attention_mask ( encoding ) ,
66
66
to: Tokenizers.Native ,
67
67
as: :encoding_get_u32_attention_mask
68
68
69
69
@ doc """
70
70
Get the special tokens mask from an encoding.
71
71
"""
72
- @ spec get_special_tokens_mask ( Encoding . t ( ) ) :: [ integer ( ) ]
72
+ @ spec get_special_tokens_mask ( t ( ) ) :: [ integer ( ) ]
73
73
defdelegate get_special_tokens_mask ( encoding ) ,
74
74
to: Tokenizers.Native ,
75
75
as: :encoding_get_special_tokens_mask
76
76
77
77
@ doc """
78
78
Same as `get_special_tokens_mask/1`, but returns binary with u32 values.
79
79
"""
80
- @ spec get_u32_special_tokens_mask ( Encoding . t ( ) ) :: binary ( )
80
+ @ spec get_u32_special_tokens_mask ( t ( ) ) :: binary ( )
81
81
defdelegate get_u32_special_tokens_mask ( encoding ) ,
82
82
to: Tokenizers.Native ,
83
83
as: :encoding_get_u32_special_tokens_mask
84
84
85
85
@ doc """
86
86
Get the tokens from an encoding.
87
87
"""
88
- @ spec get_tokens ( Encoding . t ( ) ) :: [ binary ( ) ]
88
+ @ spec get_tokens ( t ( ) ) :: [ binary ( ) ]
89
89
defdelegate get_tokens ( encoding ) , to: Tokenizers.Native , as: :encoding_get_tokens
90
90
91
91
@ doc """
92
92
Get word ids from an encoding.
93
93
"""
94
- @ spec get_word_ids ( Encoding . t ( ) ) :: [ non_neg_integer ( ) | nil ]
94
+ @ spec get_word_ids ( t ( ) ) :: [ non_neg_integer ( ) | nil ]
95
95
defdelegate get_word_ids ( encoding ) , to: Tokenizers.Native , as: :encoding_get_word_ids
96
96
97
97
@ doc """
98
98
Get sequence ids from an encoding.
99
99
"""
100
- @ spec get_sequence_ids ( Encoding . t ( ) ) :: [ non_neg_integer ( ) | nil ]
100
+ @ spec get_sequence_ids ( t ( ) ) :: [ non_neg_integer ( ) | nil ]
101
101
defdelegate get_sequence_ids ( encoding ) , to: Tokenizers.Native , as: :encoding_get_sequence_ids
102
102
103
103
@ doc """
104
104
Get offsets from an encoding.
105
105
106
106
The offsets are expressed in terms of UTF-8 bytes.
107
107
"""
108
- @ spec get_offsets ( Encoding . t ( ) ) :: [ { integer ( ) , integer ( ) } ]
108
+ @ spec get_offsets ( t ( ) ) :: [ { integer ( ) , integer ( ) } ]
109
109
defdelegate get_offsets ( encoding ) , to: Tokenizers.Native , as: :encoding_get_offsets
110
110
111
111
@ doc """
112
112
Get the overflow from an encoding.
113
113
"""
114
- @ spec get_overflowing ( Encoding . t ( ) ) :: [ Encoding . t ( ) ]
114
+ @ spec get_overflowing ( t ( ) ) :: [ t ( ) ]
115
115
defdelegate get_overflowing ( encoding ) , to: Tokenizers.Native , as: :encoding_get_overflowing
116
116
117
117
@ doc """
118
118
Get the encoded tokens corresponding to the word at the given index in the input sequence,
119
119
with the form (start_token, end_token + 1)
120
120
"""
121
- @ spec word_to_tokens ( Encoding . t ( ) , non_neg_integer ( ) , non_neg_integer ( ) ) ::
121
+ @ spec word_to_tokens ( t ( ) , non_neg_integer ( ) , non_neg_integer ( ) ) ::
122
122
{ non_neg_integer ( ) , non_neg_integer ( ) } | nil
123
123
defdelegate word_to_tokens ( encoding , word , seq_id ) ,
124
124
to: Tokenizers.Native ,
@@ -127,7 +127,7 @@ defmodule Tokenizers.Encoding do
127
127
@ doc """
128
128
Get the offsets of the word at the given index in the input sequence.
129
129
"""
130
- @ spec word_to_chars ( Encoding . t ( ) , non_neg_integer ( ) , non_neg_integer ( ) ) ::
130
+ @ spec word_to_chars ( t ( ) , non_neg_integer ( ) , non_neg_integer ( ) ) ::
131
131
{ non_neg_integer ( ) , non_neg_integer ( ) } | nil
132
132
defdelegate word_to_chars ( encoding , word , seq_id ) ,
133
133
to: Tokenizers.Native ,
@@ -136,29 +136,29 @@ defmodule Tokenizers.Encoding do
136
136
@ doc """
137
137
Returns the index of the sequence containing the given token.
138
138
"""
139
- @ spec token_to_sequence ( Encoding . t ( ) , non_neg_integer ( ) ) :: non_neg_integer ( ) | nil
139
+ @ spec token_to_sequence ( t ( ) , non_neg_integer ( ) ) :: non_neg_integer ( ) | nil
140
140
defdelegate token_to_sequence ( encoding , token ) ,
141
141
to: Tokenizers.Native ,
142
142
as: :encoding_token_to_sequence
143
143
144
144
@ doc """
145
145
Get the offsets of the token at the given index.
146
146
"""
147
- @ spec token_to_chars ( Encoding . t ( ) , non_neg_integer ( ) ) ::
147
+ @ spec token_to_chars ( t ( ) , non_neg_integer ( ) ) ::
148
148
{ non_neg_integer ( ) , { non_neg_integer ( ) , non_neg_integer ( ) } } | nil
149
149
defdelegate token_to_chars ( encoding , token ) , to: Tokenizers.Native , as: :encoding_token_to_chars
150
150
151
151
@ doc """
152
152
Get the word that contains the token at the given index.
153
153
"""
154
- @ spec token_to_word ( Encoding . t ( ) , non_neg_integer ( ) ) ::
154
+ @ spec token_to_word ( t ( ) , non_neg_integer ( ) ) ::
155
155
{ non_neg_integer ( ) , non_neg_integer ( ) } | nil
156
156
defdelegate token_to_word ( encoding , token ) , to: Tokenizers.Native , as: :encoding_token_to_word
157
157
158
158
@ doc """
159
159
Get the token that contains the given char.
160
160
"""
161
- @ spec char_to_token ( Encoding . t ( ) , non_neg_integer ( ) , non_neg_integer ( ) ) ::
161
+ @ spec char_to_token ( t ( ) , non_neg_integer ( ) , non_neg_integer ( ) ) ::
162
162
non_neg_integer ( ) | nil
163
163
defdelegate char_to_token ( encoding , position , seq_id ) ,
164
164
to: Tokenizers.Native ,
@@ -167,7 +167,7 @@ defmodule Tokenizers.Encoding do
167
167
@ doc """
168
168
Get the word that contains the given char.
169
169
"""
170
- @ spec char_to_word ( Encoding . t ( ) , non_neg_integer ( ) , non_neg_integer ( ) ) ::
170
+ @ spec char_to_word ( t ( ) , non_neg_integer ( ) , non_neg_integer ( ) ) ::
171
171
non_neg_integer ( ) | nil
172
172
defdelegate char_to_word ( encoding , position , seq_id ) ,
173
173
to: Tokenizers.Native ,
@@ -192,7 +192,7 @@ defmodule Tokenizers.Encoding do
192
192
@ doc """
193
193
Pad the encoding to the given length.
194
194
"""
195
- @ spec pad ( Encoding . t ( ) , non_neg_integer ( ) , padding_opts ( ) ) :: Encoding . t ( )
195
+ @ spec pad ( t ( ) , non_neg_integer ( ) , padding_opts ( ) ) :: t ( )
196
196
defdelegate pad ( encoding , target_length , opts \\ [ ] ) ,
197
197
to: Tokenizers.Native ,
198
198
as: :encoding_pad
@@ -208,15 +208,15 @@ defmodule Tokenizers.Encoding do
208
208
@ doc """
209
209
Truncate the encoding to the given length.
210
210
"""
211
- @ spec truncate ( Encoding . t ( ) , non_neg_integer ( ) , truncation_opts ( ) ) :: Encoding . t ( )
211
+ @ spec truncate ( t ( ) , non_neg_integer ( ) , truncation_opts ( ) ) :: t ( )
212
212
defdelegate truncate ( encoding , max_length , opts \\ [ ] ) ,
213
213
to: Tokenizers.Native ,
214
214
as: :encoding_truncate
215
215
216
216
@ doc """
217
- Returns the number of tokens in an `Encoding. t()`.
217
+ Returns the number of tokens in a `t()`.
218
218
"""
219
- @ spec n_tokens ( encoding :: Encoding . t ( ) ) :: non_neg_integer ( )
219
+ @ spec n_tokens ( encoding :: t ( ) ) :: non_neg_integer ( )
220
220
defdelegate n_tokens ( encoding ) , to: Tokenizers.Native , as: :encoding_get_length
221
221
end
222
222
0 commit comments