|
51 | 51 | "gemini-1.5-pro-latest": 128000, |
52 | 52 | "models/embedding-001": 2048 |
53 | 53 | }, |
54 | | - "ollama": { "command-r": 12800, |
55 | | - "codellama": 16000, |
56 | | - "dbrx": 32768, |
57 | | - "deepseek-coder:33b": 16000, |
58 | | - "falcon": 2048, |
59 | | - "llama2": 4096, |
60 | | - "llama3": 8192, |
61 | | - "llama3:70b": 8192, |
62 | | - "llama3.1":128000, |
63 | | - "llama3.1:8b": 128000, |
64 | | - "llama3.1:70b": 128000, |
65 | | - "lama3.1:405b": 128000, |
66 | | - "scrapegraph": 8192, |
67 | | - "llava": 4096, |
68 | | - "mixtral:8x22b-instruct": 65536, |
69 | | - "mistral-openorca": 32000, |
70 | | - "nomic-embed-text": 8192, |
71 | | - "nous-hermes2:34b": 4096, |
72 | | - "orca-mini": 2048, |
73 | | - "phi3:3.8b": 12800, |
74 | | - "qwen:0.5b": 32000, |
75 | | - "qwen:1.8b": 32000, |
76 | | - "qwen:4b": 32000, |
77 | | - "qwen:14b": 32000, |
78 | | - "qwen:32b": 32000, |
79 | | - "qwen:72b": 32000, |
80 | | - "qwen:110b": 32000, |
81 | | - "stablelm-zephyr": 8192, |
82 | | - "wizardlm2:8x22b": 65536, |
83 | | - # embedding models |
84 | | - "shaw/dmeta-embedding-zh-small-q4": 8192, |
85 | | - "shaw/dmeta-embedding-zh-q4": 8192, |
86 | | - "chevalblanc/acge_text_embedding": 8192, |
87 | | - "martcreation/dmeta-embedding-zh": 8192, |
88 | | - "snowflake-arctic-embed": 8192, |
89 | | - "mxbai-embed-large": 512 |
| 54 | + "ollama": { |
| 55 | + "command-r": 12800, |
| 56 | + "codellama": 16000, |
| 57 | + "dbrx": 32768, |
| 58 | + "deepseek-coder:33b": 16000, |
| 59 | + "falcon": 2048, |
| 60 | + "llama2": 4096, |
| 61 | + "llama3": 8192, |
| 62 | + "llama3:70b": 8192, |
| 63 | + "llama3.1":128000, |
| 64 | + "llama3.1:8b": 128000, |
| 65 | + "llama3.1:70b": 128000, |
| 66 | + "llama3.1:405b": 128000, |
| 67 | + "scrapegraph": 8192, |
| 68 | + "llava": 4096, |
| 69 | + "mixtral:8x22b-instruct": 65536, |
| 70 | + "mistral-openorca": 32000, |
| 71 | + "nomic-embed-text": 8192, |
| 72 | + "nous-hermes2:34b": 4096, |
| 73 | + "orca-mini": 2048, |
| 74 | + "phi3:3.8b": 12800, |
| 75 | + "qwen:0.5b": 32000, |
| 76 | + "qwen:1.8b": 32000, |
| 77 | + "qwen:4b": 32000, |
| 78 | + "qwen:14b": 32000, |
| 79 | + "qwen:32b": 32000, |
| 80 | + "qwen:72b": 32000, |
| 81 | + "qwen:110b": 32000, |
| 82 | + "stablelm-zephyr": 8192, |
| 83 | + "wizardlm2:8x22b": 65536, |
| 84 | + # embedding models |
| 85 | + "shaw/dmeta-embedding-zh-small-q4": 8192, |
| 86 | + "shaw/dmeta-embedding-zh-q4": 8192, |
| 87 | + "chevalblanc/acge_text_embedding": 8192, |
| 88 | + "martcreation/dmeta-embedding-zh": 8192, |
| 89 | + "snowflake-arctic-embed": 8192, |
| 90 | + "mxbai-embed-large": 512, |
90 | 91 | }, |
91 | 92 | "oneapi": { |
92 | | - "qwen-turbo": 6000 |
| 93 | + "qwen-turbo": 6000, |
93 | 94 | }, |
94 | | - "nvidia": { |
| 95 | + "nvidia": { |
95 | 96 | "meta/llama3-70b-instruct": 419, |
96 | 97 | "meta/llama3-8b-instruct": 419, |
97 | 98 | "nemotron-4-340b-instruct": 1024, |
98 | | - "databricks/dbrx-instruct": 4096, |
99 | | - "google/codegemma-7b": 8192, |
100 | | - "google/gemma-2b": 2048, |
101 | | - "google/gemma-7b": 8192, |
102 | | - "google/recurrentgemma-2b": 2048, |
103 | | - "meta/codellama-70b": 16384, |
104 | | - "meta/llama2-70b": 4096, |
105 | | - "microsoft/phi-3-mini-128k-instruct": 122880, |
106 | | - "mistralai/mistral-7b-instruct-v0.2": 4096, |
107 | | - "mistralai/mistral-large": 8192, |
108 | | - "mistralai/mixtral-8x22b-instruct-v0.1": 32768, |
109 | | - "mistralai/mixtral-8x7b-instruct-v0.1": 8192, |
110 | | - "snowflake/arctic": 16384, |
| 99 | + "databricks/dbrx-instruct": 4096, |
| 100 | + "google/codegemma-7b": 8192, |
| 101 | + "google/gemma-2b": 2048, |
| 102 | + "google/gemma-7b": 8192, |
| 103 | + "google/recurrentgemma-2b": 2048, |
| 104 | + "meta/codellama-70b": 16384, |
| 105 | + "meta/llama2-70b": 4096, |
| 106 | + "microsoft/phi-3-mini-128k-instruct": 122880, |
| 107 | + "mistralai/mistral-7b-instruct-v0.2": 4096, |
| 108 | + "mistralai/mistral-large": 8192, |
| 109 | + "mistralai/mixtral-8x22b-instruct-v0.1": 32768, |
| 110 | + "mistralai/mixtral-8x7b-instruct-v0.1": 8192, |
| 111 | + "snowflake/arctic": 16384, |
111 | 112 | }, |
112 | 113 | "groq": { |
113 | 114 | "llama3-8b-8192": 8192, |
114 | 115 | "llama3-70b-8192": 8192, |
115 | 116 | "mixtral-8x7b-32768": 32768, |
116 | 117 | "gemma-7b-it": 8192, |
117 | | - "claude-3-haiku-20240307'": 8192 |
| 118 | + "claude-3-haiku-20240307": 8192, |
118 | 119 | }, |
119 | 120 | "claude": { |
120 | 121 | "claude_instant": 100000, |
|
125 | 126 | "claude-3-opus-20240229": 200000, |
126 | 127 | "claude-3-sonnet-20240229": 200000, |
127 | 128 | "claude-3-haiku-20240307": 200000, |
128 | | - "claude-3-5-sonnet-20240620": 200000 |
| 129 | + "claude-3-5-sonnet-20240620": 200000, |
129 | 130 | }, |
130 | 131 | "google_vertexai": { |
131 | 132 | "gemini-1.5-flash": 128000, |
132 | 133 | "gemini-1.5-pro": 128000, |
133 | | - "gemini-1.0-pro": 128000 |
| 134 | + "gemini-1.0-pro": 128000, |
134 | 135 | }, |
135 | 136 | "bedrock": { |
136 | 137 | "anthropic.claude-3-haiku-20240307-v1:0": 200000, |
|
149 | 150 | "amazon.titan-embed-text-v1": 8000, |
150 | 151 | "amazon.titan-embed-text-v2:0": 8000, |
151 | 152 | "cohere.embed-english-v3": 512, |
152 | | - "cohere.embed-multilingual-v3": 512 |
| 153 | + "cohere.embed-multilingual-v3": 512, |
153 | 154 | }, |
154 | 155 | "mistralai": { |
155 | 156 | "mistral-large-latest": 128000, |
|
159 | 160 | "open-mistral-7b": 32000, |
160 | 161 | "open-mixtral-8x7b": 32000, |
161 | 162 | "open-mixtral-8x22b": 64000, |
162 | | - "open-codestral-mamba": 256000 |
| 163 | + "open-codestral-mamba": 256000, |
163 | 164 | }, |
164 | 165 | "hugging_face": { |
165 | 166 | "xai-org/grok-1": 8192, |
|
193 | 194 | "TheBloke/dolphin-2.7-mixtral-8x7b-GGUF": 32768, |
194 | 195 | "deepseek-ai/DeepSeek-V2": 131072, |
195 | 196 | "deepseek-ai/DeepSeek-V2-Chat": 131072, |
196 | | - "claude-3-haiku": 200000 |
| 197 | + "claude-3-haiku": 200000, |
197 | 198 | }, |
198 | 199 | "deepseek": { |
199 | 200 | "deepseek-chat": 28672, |
200 | | - "deepseek-coder": 16384 |
| 201 | + "deepseek-coder": 16384, |
201 | 202 | }, |
202 | 203 | "ernie": { |
203 | 204 | "ernie-bot-turbo": 4096, |
|
207 | 208 | "ernie-bot-2-base-zh": 4096, |
208 | 209 | "ernie-bot-2-base-en": 4096, |
209 | 210 | "ernie-bot-2-base-en-zh": 4096, |
210 | | - "ernie-bot-2-base-zh-en": 4096 |
| 211 | + "ernie-bot-2-base-zh-en": 4096, |
211 | 212 | }, |
212 | 213 | "fireworks": { |
213 | 214 | "llama-v2-7b": 4096, |
214 | 215 | "mixtral-8x7b-instruct": 4096, |
215 | | - "nomic-ai/nomic-embed-text-v1.5": 8192, |
| 216 | + "nomic-ai/nomic-embed-text-v1.5": 8192, |
216 | 217 | "llama-3.1-405B-instruct": 131072, |
217 | 218 | "llama-3.1-70B-instruct": 131072, |
218 | 219 | "llama-3.1-8B-instruct": 131072, |
219 | 220 | "mixtral-moe-8x22B-instruct": 65536, |
220 | | - "mixtral-moe-8x7B-instruct": 65536 |
| 221 | + "mixtral-moe-8x7B-instruct": 65536, |
221 | 222 | }, |
222 | 223 | } |
0 commit comments