Skip to content

Commit 4c10ff8

Browse files
committed
Merge branch 'feature/llm-complete-updates' of github.com:zenml-io/zenml-projects into feature/llm-complete-updates
2 parents e83b505 + 32e2be0 commit 4c10ff8

File tree

3 files changed

+13
-10
lines changed

3 files changed

+13
-10
lines changed

.gitignore

Lines changed: 1 addition & 0 deletions
Original file line number | Diff line number | Diff line change
@@ -162,6 +162,7 @@ llm-lora-finetuning/configs/shopify.yaml
162162
finetuned-matryoshka/
163163
finetuned-all-MiniLM-L6-v2/
164164
finetuned-snowflake-arctic-embed-m/
165+
finetuned-snowflake-arctic-embed-m-v1.5/
165166

166167
# ollama ignores
167168
nohup.out

llm-complete-guide/constants.py

Lines changed: 4 additions & 3 deletions
Original file line number | Diff line number | Diff line change
@@ -57,16 +57,17 @@
5757

5858
# embeddings finetuning constants
5959
EMBEDDINGS_MODEL_NAME_ZENML = "finetuned-zenml-docs-embeddings"
60-
DATASET_NAME_DEFAULT = "zenml/rag_qa_embedding_questions_0_60_0"
60+
# DATASET_NAME_DEFAULT = "zenml/rag_qa_embedding_questions_0_60_0"
61+
DATASET_NAME_DEFAULT = "zenml/rag_qa_embedding_questions"
6162
DATASET_NAME_DISTILABEL = f"{DATASET_NAME_DEFAULT}_distilabel"
6263
DATASET_NAME_ARGILLA = DATASET_NAME_DEFAULT.replace("zenml/", "")
6364
OPENAI_MODEL_GEN = "gpt-4o"
6465
OPENAI_MODEL_GEN_KWARGS_EMBEDDINGS = {
6566
"temperature": 0.7,
6667
"max_new_tokens": 512,
6768
}
68-
EMBEDDINGS_MODEL_ID_BASELINE = "Snowflake/snowflake-arctic-embed-m"
69-
EMBEDDINGS_MODEL_ID_FINE_TUNED = "finetuned-snowflake-arctic-embed-m"
69+
EMBEDDINGS_MODEL_ID_BASELINE = "Snowflake/snowflake-arctic-embed-m-v1.5"
70+
EMBEDDINGS_MODEL_ID_FINE_TUNED = "finetuned-snowflake-arctic-embed-m-v1.5"
7071
EMBEDDINGS_MODEL_MATRYOSHKA_DIMS: list[int] = [
7172
384,
7273
256,
Lines changed: 8 additions & 7 deletions
Original file line number | Diff line number | Diff line change
@@ -1,9 +1,10 @@
1-
zenml[server]>=0.63.0
2-
sentence-transformers>=3
3-
transformers
1+
zenml[server]>=0.63.0,<0.68.0
2+
sentence-transformers>=3,<=3.0.1
3+
transformers<=4.44.0
44
litellm
55
ollama
6-
polars
7-
datasets
8-
argilla
9-
distilabel
6+
polars<=1.4.1
7+
datasets<=2.20.0
8+
argilla<=2.0.0
9+
distilabel<=1.3.1
10+
accelerate<=0.33.0

0 commit comments

Comments
 (0)