We read every piece of feedback, and take your input very seriously.
To see all available qualifiers, see our documentation.
There was an error while loading. Please reload this page.
1 parent b010c04 commit f6854f3
Copy full SHA for f6854f3
tests/test_semchunk.py
@@ -64,12 +64,15 @@ def tiktoken_token_counter(text: str) -> int:
64
65
# Test using a `tiktoken` tokenizer by name.
66
chunker = semchunk.chunkerify('gpt-4', 1)
67
+ chunker('ThisIs\tATest.')
68
69
# Test using a `transformers` tokenizer by name.
70
chunker = semchunk.chunkerify('umarbutler/emubert', 1)
71
72
73
# Test using a `tiktoken` encoding by name.
74
chunker = semchunk.chunkerify('cl100k_base', 1)
75
76
77
# Test causing a `ValueError` by passing a tokenizer by name that should not exist.
78
try:
0 commit comments