Skip to content

Commit 1f0cc0c

Browse files
authored
support mixtral 8x22b instruct (#495)
1 parent a995869 commit 1f0cc0c

File tree

3 files changed

+4
-1
lines changed

3 files changed

+4
-1
lines changed

docs/model_zoo.md

Lines changed: 1 addition & 0 deletions
Original file line number | Diff line number | Diff line change
@@ -23,6 +23,7 @@ Scale hosts the following models in the LLM Engine Model Zoo:
23 23
| `mixtral-8x7b` || | vllm | 32768 |
24 24
| `mixtral-8x7b-instruct` || | vllm | 32768 |
25 25
| `mixtral-8x22b` || | vllm | 65536 |
26 +
| `mixtral-8x22b-instruct` || | vllm | 65536 |
26 27
| `codellama-7b` ||| text-generation-inference, vllm | 16384 |
27 28
| `codellama-7b-instruct` ||| text-generation-inference, vllm | 16384 |
28 29
| `codellama-13b` ||| text-generation-inference, vllm | 16384 |

model-engine/model_engine_server/domain/use_cases/llm_model_endpoint_use_cases.py

Lines changed: 1 addition & 0 deletions
Original file line number | Diff line number | Diff line change
@@ -181,6 +181,7 @@
181 181
"mixtral-8x7b",
182 182
"mixtral-8x7b-instruct",
183 183
"mixtral-8x22b",
184 +
"mixtral-8x22b-instruct",
184 185
"mammoth-coder-llama-2-7b",
185 186
"mammoth-coder-llama-2-13b",
186 187
"mammoth-coder-llama-2-34b",

model-engine/model_engine_server/infra/repositories/live_tokenizer_repository.py

Lines changed: 2 additions & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -62,7 +62,8 @@ def get_default_supported_models_info() -> Dict[str, ModelInfo]:
62 62
"mistral-7b-instruct": ModelInfo("mistralai/Mistral-7B-Instruct-v0.1", None),
63 63
"mixtral-8x7b": ModelInfo("mistralai/Mixtral-8x7B-v0.1", None),
64 64
"mixtral-8x7b-instruct": ModelInfo("mistralai/Mixtral-8x7B-Instruct-v0.1", None),
65 -
"mixtral-8x22b": ModelInfo("mistral-community/Mixtral-8x22B-v0.1", None),
65 +
"mixtral-8x22b": ModelInfo("mistralai/Mixtral-8x22B-v0.1", None),
66 +
"mixtral-8x22b-instruct": ModelInfo("mistralai/Mixtral-8x22B-Instruct-v0.1", None),
66 67
"mammoth-coder-llama-2-7b": ModelInfo("TIGER-Lab/MAmmoTH-Coder-7B", None),
67 68
"mammoth-coder-llama-2-13b": ModelInfo("TIGER-Lab/MAmmoTH-Coder-13B", None),
68 69
"mammoth-coder-llama-2-34b": ModelInfo("TIGER-Lab/MAmmoTH-Coder-34B", None),

0 commit comments

Comments
 (0)