Skip to content

Commit 5edc46e

Browse files
dsingal0 and dsingal authored
added minimax 2.1 w/ sglang and minimax/qwen3 reasoning parser (#535)
Co-authored-by: dsingal <dsingal@dsingals-MacBook-Pro.local>
1 parent 577c4f9 commit 5edc46e

File tree

2 files changed

+51
-32
lines changed

2 files changed

+51
-32
lines changed

minimax/minimax_m2_1/config.yaml

Lines changed: 51 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,51 @@
# Truss configuration that serves the MiniMaxAI/MiniMax-M2.1 checkpoint through
# SGLang's OpenAI-compatible HTTP server on an 8x H100 node.
#
# NOTE(review): nesting was reconstructed from a whitespace-stripped diff view
# using the alphabetical key order; in particular `model_metadata.model_name`
# is assumed to be nested (not top-level) -- confirm against the repository.
base_image:
  image: lmsysorg/sglang:nightly-dev-20260126-48f4340b
docker_server:
  liveness_endpoint: /health_generate
  predict_endpoint: /v1/chat/completions
  readiness_endpoint: /health_generate
  server_port: 8000
  # Startup pipeline, in order:
  #   1. truss-transfer-cli
  #   2. read every file under /app/model_cache/checkpoint through dd into
  #      /dev/null (presumably to warm the page cache -- confirm)
  #   3. launch the SGLang server on port 8000 with tensor/expert parallel
  #      size 8 and the MiniMax tool-call and reasoning parsers.
  # Folded scalar (>-): the lines below are joined with single spaces into the
  # same one-line command; keep every continuation line at the same indent.
  start_command: >-
    sh -c "truss-transfer-cli
    && find /app/model_cache/checkpoint -type f -print0
    | xargs -0 -P 0 -I {} dd if={} of=/dev/null bs=4M
    && python3 -m sglang.launch_server
    --model-path /app/model_cache/checkpoint
    --tp-size 8
    --ep-size 8
    --tool-call-parser minimax-m2
    --trust-remote-code
    --host 0.0.0.0
    --reasoning-parser minimax
    --port 8000
    --mem-fraction-static 0.85"
# Disabled override, kept for reference. The value is quoted so it stays a
# string if this stanza is ever re-enabled.
# environment_variables:
#   SGLANG_ALLOW_OVERWRITE_LONGER_CONTEXT_LEN: '1'
model_cache:
  - allow_patterns:
      - '*.json'
      - '*.safetensors'
      - '*.txt'
      - '*.model'
      - '*.py'
      - '*.jinja'
    repo_id: MiniMaxAI/MiniMax-M2.1
    # Pinned commit; quoted so it can never be re-typed by a YAML parser.
    revision: '927ea2b64008fe4a1e31a4e107a6b75916b3b44a'
    use_volume: true
    # Matches the /app/model_cache/checkpoint path used in start_command.
    volume_folder: checkpoint
model_metadata:
  example_model_input:
    max_tokens: 4096
    messages:
      - content: You are a helpful assistant.
        role: system
      - content: Who won the world series in 2020?
        role: user
    # Kept in sync with model_cache.repo_id (was the older MiniMax-M2 name).
    model: MiniMaxAI/MiniMax-M2.1
    stream: true
    temperature: 0.6
  # Kept in sync with model_cache.repo_id (was the older MiniMax-M2 name).
  model_name: MiniMax-M2.1
  tags:
    - openai-compatible
model_name: minimax
resources:
  accelerator: H100:8
  cpu: '1'
  memory: 2Gi
  use_gpu: true
runtime:
  health_checks:
    restart_check_delay_seconds: 1200
    restart_threshold_seconds: 600
    stop_traffic_threshold_seconds: 1800
  is_websocket_endpoint: false
  predict_concurrency: 32
  transport:
    kind: http

minimax/minimax_m2_sglang/config.yaml

Lines changed: 0 additions & 32 deletions
This file was deleted.

0 commit comments

Comments
 (0)