Skip to content

Commit a1248f3

Browse files
committed
update catalog
1 parent c5dbc67 commit a1248f3

File tree

1 file changed

+37
-0
lines changed

1 file changed

+37
-0
lines changed
Lines changed: 37 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,37 @@
# ModelCatalog entry for deepseek-ai/DeepSeek-R1-Distill-Qwen-1.5B using the vllm engine.
# NOTE(review): this capture interleaves diff gutter markers ("1+", "2+", ...) with the
# YAML and has lost all indentation; the grouping described in the comments below is
# presumed from key order -- confirm against the committed file.
1+
apiVersion: v1
2+
kind: ModelCatalog
# Identity of the entry: a slug-style name and a display_name equal to the Hugging Face
# repo id that appears in hf_repo_url below.
3+
metadata:
4+
name: deepseek-r1-distill-qwen-1-5b
5+
display_name: deepseek-ai/DeepSeek-R1-Distill-Qwen-1.5B
# Two URLs follow the labels key: an icon thumbnail and the Hugging Face repo page.
# NOTE(review): presumably both are children of labels -- confirm.
6+
labels:
7+
icon_url: 'https://cdn-thumbnails.huggingface.co/social-thumbnails/deepseek-ai.png'
8+
hf_repo_url: 'https://huggingface.co/deepseek-ai/DeepSeek-R1-Distill-Qwen-1.5B'
# Model source: registry is an explicit empty string, name is the repo id, file is
# model.safetensors, version is the literal "latest", task is text-generation.
9+
spec:
10+
model:
11+
registry: ''
12+
name: deepseek-ai/DeepSeek-R1-Distill-Qwen-1.5B
13+
file: model.safetensors
14+
version: latest
15+
task: text-generation
# Engine selection: vllm, version v1.
16+
engine:
17+
engine: vllm
18+
version: v1
# resources is an explicit empty mapping ({}); the replica count (num) is 1.
19+
resources: {}
20+
replicas:
21+
num: 1
# Scheduler settings: consistent_hash with 150 virtual nodes and a load factor of 1.25.
22+
deployment_options:
23+
scheduler:
24+
type: consistent_hash
25+
virtual_nodes: 150
26+
load_factor: 1.25
# RAY_SCHEDULER_TYPE repeats the scheduler type value set above (consistent_hash).
# NOTE(review): presumably the two values must be kept in sync -- confirm with the consumer.
27+
variables:
28+
RAY_SCHEDULER_TYPE: consistent_hash
# Engine arguments. served_model_name equals the model name given earlier in this entry.
# NOTE(review): presumably these are forwarded to vLLM as engine arguments -- verify.
29+
engine_args:
30+
tensor_parallel_size: 1
31+
max_model_len: 32768
32+
enforce_eager: true
33+
gpu_memory_utilization: 0.95
34+
enable_chunked_prefill: true
35+
served_model_name: deepseek-ai/DeepSeek-R1-Distill-Qwen-1.5B
# NOTE(review): reasoning_parser and enable_reasoning are set together; newer vLLM
# releases may treat enable_reasoning as deprecated -- confirm against the deployed
# engine version before changing either key.
36+
reasoning_parser: deepseek_r1
37+
enable_reasoning: true

0 commit comments

Comments
 (0)