Skip to content

Commit f6854f3

Browse files
committed
Made testing more robust.
1 parent b010c04 commit f6854f3

File tree

1 file changed

+3
-0
lines changed

1 file changed

+3
-0
lines changed

tests/test_semchunk.py

Lines changed: 3 additions & 0 deletions
Original file line number | Diff line number | Diff line change
@@ -64,12 +64,15 @@ def tiktoken_token_counter(text: str) -> int:
64 64

65 65
# Test using a `tiktoken` tokenizer by name.
66 66
chunker = semchunk.chunkerify('gpt-4', 1)
67 +
chunker('ThisIs\tATest.')
67 68

68 69
# Test using a `transformers` tokenizer by name.
69 70
chunker = semchunk.chunkerify('umarbutler/emubert', 1)
71 +
chunker('ThisIs\tATest.')
70 72

71 73
# Test using a `tiktoken` encoding by name.
72 74
chunker = semchunk.chunkerify('cl100k_base', 1)
75 +
chunker('ThisIs\tATest.')
73 76

74 77
# Test causing a `ValueError` by passing a tokenizer by name that should not exist.
75 78
try:

0 commit comments

Comments
 (0)