Skip to content

Commit 95451a9

Browse files
authored
Merge pull request #1860 from lcedaw/feat/add-gse-ch-tokenizer
add gse_ch Tokenize
2 parents 9226624 + d2bbdb9 commit 95451a9

File tree

1 file changed

+2
-0
lines changed

1 file changed

+2
-0
lines changed

weaviate/collections/classes/config.py

Lines changed: 2 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -164,6 +164,7 @@ class Tokenization(str, BaseEnum):
164 164
TRIGRAM: Tokenize into trigrams.
165 165
KAGOME_JA: Tokenize using the 'Kagome' tokenizer (for Japanese).
166 166
KAGOME_KR: Tokenize using the 'Kagome' tokenizer and a Korean MeCab dictionary (for Korean).
167+
GSE_CH: Tokenize using GSE (for Chinese).
167 168
"""
168 169

169 170
WORD = "word"
@@ -174,6 +175,7 @@ class Tokenization(str, BaseEnum):
174 175
TRIGRAM = "trigram"
175 176
KAGOME_JA = "kagome_ja"
176 177
KAGOME_KR = "kagome_kr"
178+
GSE_CH = "gse_ch"
177 179

178 180

179 181
class GenerativeSearches(str, BaseEnum):

0 commit comments

Comments
 (0)