Skip to content

Commit c5190c3

Browse files
committed
Move models/ggml-vocab-* to models/tests/ggml-vocab-*
1 parent 08ea539 commit c5190c3

Some content is hidden

Large commits have some content hidden by default. Use the search box below to find content that may be hidden.

52 files changed

+37
-2407
lines changed

.gitignore

Lines changed: 1 addition & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -78,7 +78,7 @@ autogen-*.md
7878
models/*
7979
models-mnt
8080
!models/.editorconfig
81-
!models/ggml-vocab-*.gguf*
81+
!models/tests/ggml-vocab-*.gguf*
8282

8383
# Zig
8484
zig-out/

Makefile

Lines changed: 8 additions & 8 deletions
Original file line number | Diff line number | Diff line change
@@ -216,14 +216,14 @@ test: $(TEST_TARGETS)
216216
@failures=0; \
217217
for test_target in $(TEST_TARGETS); do \
218218
if [ "$$test_target" = "tests/test-tokenizer-0" ]; then \
219-
./$$test_target $(CURDIR)/models/ggml-vocab-llama-spm.gguf; \
220-
./$$test_target $(CURDIR)/models/ggml-vocab-llama-bpe.gguf; \
221-
./$$test_target $(CURDIR)/models/ggml-vocab-phi-3.gguf; \
222-
./$$test_target $(CURDIR)/models/ggml-vocab-falcon.gguf; \
223-
./$$test_target $(CURDIR)/models/ggml-vocab-bert-bge.gguf; \
224-
./$$test_target $(CURDIR)/models/ggml-vocab-starcoder.gguf; \
225-
./$$test_target $(CURDIR)/models/ggml-vocab-gpt-2.gguf; \
226-
./$$test_target $(CURDIR)/models/ggml-vocab-refact.gguf; \
219+
./$$test_target $(CURDIR)/models/tests/ggml-vocab-llama-spm.gguf; \
220+
./$$test_target $(CURDIR)/models/tests/ggml-vocab-llama-bpe.gguf; \
221+
./$$test_target $(CURDIR)/models/tests/ggml-vocab-phi-3.gguf; \
222+
./$$test_target $(CURDIR)/models/tests/ggml-vocab-falcon.gguf; \
223+
./$$test_target $(CURDIR)/models/tests/ggml-vocab-bert-bge.gguf; \
224+
./$$test_target $(CURDIR)/models/tests/ggml-vocab-starcoder.gguf; \
225+
./$$test_target $(CURDIR)/models/tests/ggml-vocab-gpt-2.gguf; \
226+
./$$test_target $(CURDIR)/models/tests/ggml-vocab-refact.gguf; \
227227
elif [ "$$test_target" = "tests/test-tokenizer-1-spm" ]; then \
228228
continue; \
229229
elif [ "$$test_target" = "tests/test-tokenizer-1-bpe" ]; then \

convert_hf_to_gguf_update.py

Lines changed: 2 additions & 2 deletions
Original file line number | Diff line number | Diff line change
@@ -351,12 +351,12 @@ def get_vocab_base_pre(self, tokenizer) -> str:
351351
logger.error(f"Failed to load tokenizer for model {name}. Error: {e}")
352352
continue # Skip this model and continue with the next one in the loop
353353

354-
with open(f"models/ggml-vocab-{name}.gguf.inp", "w", encoding="utf-8") as f:
354+
with open(f"models/tests/ggml-vocab-{name}.gguf.inp", "w", encoding="utf-8") as f:
355355
for text in tests:
356356
f.write(f"{text}")
357357
f.write("\n__ggml_vocab_test__\n")
358358

359-
with open(f"models/ggml-vocab-{name}.gguf.out", "w") as f:
359+
with open(f"models/tests/ggml-vocab-{name}.gguf.out", "w") as f:
360360
for text in tests:
361361
res = tokenizer.encode(text, add_special_tokens=False)
362362
for r in res:

models/ggml-vocab-aquila.gguf

-4.6 MB
Binary file not shown.

models/ggml-vocab-baichuan.gguf

-1.28 MB
Binary file not shown.

models/ggml-vocab-bert-bge.gguf

-613 KB
Binary file not shown.

models/ggml-vocab-bert-bge.gguf.inp

Lines changed: 0 additions & 112 deletions
This file was deleted.

models/ggml-vocab-bert-bge.gguf.out

Lines changed: 0 additions & 46 deletions
This file was deleted.

models/ggml-vocab-chameleon.gguf.inp

Lines changed: 0 additions & 112 deletions
This file was deleted.

models/ggml-vocab-chameleon.gguf.out

Lines changed: 0 additions & 46 deletions
This file was deleted.

0 commit comments

Comments
 (0)