Skip to content

Commit 40b4b2d

Browse files
committed
Add new model tokens
1 parent ec77ff7 commit 40b4b2d

File tree

2 files changed

+40
-10
lines changed

2 files changed

+40
-10
lines changed

scrapegraphai/graphs/abstract_graph.py

Lines changed: 1 addition & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -327,6 +327,7 @@ def _create_embedder(self, embedder_config: dict) -> object:
327327
raise KeyError("Model not supported") from exc
328328
return OllamaEmbeddings(**embedder_params)
329329
elif "hugging_face" in embedder_params["model"]:
330+
embedder_params["model"] = "/".join(embedder_params["model"].split("/")[1:])
330331
try:
331332
models_tokens["hugging_face"][embedder_params["model"]]
332333
except KeyError as exc:

scrapegraphai/helpers/models_tokens.py

Lines changed: 39 additions & 10 deletions
Original file line numberDiff line numberDiff line change
@@ -1,7 +1,3 @@
1-
"""
2-
Models token
3-
"""
4-
51
models_tokens = {
62
"openai": {
73
"gpt-3.5-turbo-0125": 16385,
@@ -31,10 +27,11 @@
3127
},
3228
"gemini": {
3329
"gemini-pro": 128000,
34-
"gemini-1.5-flash-latest":128000,
35-
"gemini-1.5-pro-latest":128000,
30+
"gemini-1.5-flash-latest": 128000,
31+
"gemini-1.5-pro-latest": 128000,
3632
"models/embedding-001": 2048
3733
},
34+
<<<<<<< Updated upstream
3835
"ollama": { "command-r": 12800,
3936
"codellama": 16000,
4037
"dbrx": 32768,
@@ -63,6 +60,39 @@
6360
"shaw/dmeta-embedding-zh": 8192,
6461
"snowflake-arctic-embed": 8192,
6562
"mxbai-embed-large": 512
63+
=======
64+
"ollama": {
65+
"command-r": 12800,
66+
"codellama": 16000,
67+
"dbrx": 32768,
68+
"deepseek-coder:33b": 16000,
69+
"falcon": 2048,
70+
"llama2": 4096,
71+
"llama3": 8192,
72+
"scrapegraph": 8192,
73+
"llava": 4096,
74+
"mixtral:8x22b-instruct": 65536,
75+
"mistral-openorca": 32000,
76+
"nomic-embed-text": 8192,
77+
"nous-hermes2:34b": 4096,
78+
"orca-mini": 2048,
79+
"phi3:3.8b": 12800,
80+
"qwen:0.5b": 32000,
81+
"qwen:1.8b": 32000,
82+
"qwen:4b": 32000,
83+
"qwen:14b": 32000,
84+
"qwen:32b": 32000,
85+
"qwen:72b": 32000,
86+
"qwen:110b": 32000,
87+
"stablelm-zephyr": 8192,
88+
"wizardlm2:8x22b": 65536,
89+
"shaw/dmeta-embedding-zh-small-q4": 8192,
90+
"shaw/dmeta-embedding-zh-q4": 8192,
91+
"chevalblanc/acge_text_embedding": 8192,
92+
"martcreation/dmeta-embedding-zh": 8192,
93+
"snowflake-arctic-embed": 8192,
94+
"mxbai-embed-large": 512,
95+
>>>>>>> Stashed changes
6696
},
6797
"oneapi": {
6898
"qwen-turbo": 6000
@@ -93,9 +123,8 @@
93123
"mistral.mistral-7b-instruct-v0:2": 32768,
94124
"mistral.mixtral-8x7b-instruct-v0:1": 32768,
95125
"mistral.mistral-large-2402-v1:0": 32768,
96-
# Embedding models
97-
"amazon.titan-embed-text-v1": 8000,
98-
"amazon.titan-embed-text-v2:0": 8000,
126+
"amazon.titan-embed-text-v1": 8000,
127+
"amazon.titan-embed-text-v2:0": 8000,
99128
"cohere.embed-english-v3": 512,
100129
"cohere.embed-multilingual-v3": 512
101130
},
@@ -147,6 +176,6 @@
147176
"ernie-bot-2-base-zh": 4096,
148177
"ernie-bot-2-base-en": 4096,
149178
"ernie-bot-2-base-en-zh": 4096,
150-
"ernie-bot-2-base-zh-en": 4096,
179+
"ernie-bot-2-base-zh-en": 4096
151180
}
152181
}

0 commit comments

Comments
 (0)