# Diff summary: 2 files changed, +51 -32 lines changed.
---
# Deployment config for serving the MiniMaxAI/MiniMax-M2.1 checkpoint with
# SGLang behind an OpenAI-style chat-completions HTTP route.

# Container image the server process runs in (pinned nightly tag).
base_image:
  image: lmsysorg/sglang:nightly-dev-20260126-48f4340b

# Server process definition and the HTTP routes used to probe and call it.
docker_server:
  # Liveness and readiness both probe the same route.
  liveness_endpoint: /health_generate
  predict_endpoint: /v1/chat/completions
  readiness_endpoint: /health_generate
  # Same port that is passed to sglang.launch_server via --port below.
  server_port: 8000
  # Startup pipeline, chained with && inside a single `sh -c`:
  #   1. truss-transfer-cli
  #   2. find every regular file under /app/model_cache/checkpoint and read it
  #      to /dev/null with dd in 4M blocks, in parallel (xargs -P 0)
  #      -- presumably to warm the page cache before loading; TODO confirm
  #   3. launch the SGLang server on 0.0.0.0:8000 from that checkpoint path
  #      with --tp-size 8 / --ep-size 8 (resources below request H100:8).
  # The folded scalar (>-) joins these lines with single spaces, so the
  # resulting value is one command line with no trailing newline.
  start_command: >-
    sh -c "truss-transfer-cli
    && find /app/model_cache/checkpoint -type f -print0
    | xargs -0 -P 0 -I {} dd if={} of=/dev/null bs=4M
    && python3 -m sglang.launch_server
    --model-path /app/model_cache/checkpoint
    --tp-size 8
    --ep-size 8
    --tool-call-parser minimax-m2
    --trust-remote-code
    --host 0.0.0.0
    --reasoning-parser minimax
    --port 8000
    --mem-fraction-static 0.85"

# Disabled override, kept for reference:
# environment_variables:
#   SGLANG_ALLOW_OVERWRITE_LONGER_CONTEXT_LEN: 1

# Model files to cache: one repo, pinned to an exact revision, restricted to
# the listed file patterns.
model_cache:
  - allow_patterns:
      - '*.json'
      - '*.safetensors'
      - '*.txt'
      - '*.model'
      - '*.py'
      - '*.jinja'
    repo_id: MiniMaxAI/MiniMax-M2.1
    # Quoted so the commit hash can never be re-typed by a YAML loader.
    revision: '927ea2b64008fe4a1e31a4e107a6b75916b3b44a'
    use_volume: true
    # The start command reads the model from /app/model_cache/checkpoint;
    # presumably this folder name is what produces that path -- TODO confirm.
    volume_folder: checkpoint

# Descriptive metadata, including a sample chat-completions request body.
# NOTE(review): the names below say "MiniMax-M2" while the cached repo is
# MiniMaxAI/MiniMax-M2.1 -- confirm this is intended.
model_metadata:
  example_model_input:
    max_tokens: 4096
    messages:
      - content: You are a helpful assistant.
        role: system
      - content: Who won the world series in 2020?
        role: user
    model: MiniMaxAI/MiniMax-M2
    stream: true
    temperature: 0.6
  model_name: MiniMax-M2
  tags:
    - openai-compatible

model_name: minimax

# Compute request for the deployment.
resources:
  accelerator: H100:8
  cpu: '1'
  memory: 2Gi
  use_gpu: true

# Runtime behaviour: health-check timing, concurrency and transport.
runtime:
  health_checks:
    restart_check_delay_seconds: 1200
    restart_threshold_seconds: 600
    stop_traffic_threshold_seconds: 1800
  is_websocket_endpoint: false
  predict_concurrency: 32
  transport:
    kind: http
# Second file in this diff: deleted (its diff is not loaded here). 0 commit comments.