Skip to content

Commit 05bdf4c

Browse files
committed
add contributor info
1 parent 1850e2a commit 05bdf4c

File tree

4 files changed

+13
-4
lines changed

4 files changed

+13
-4
lines changed

README.md

Lines changed: 4 additions & 0 deletions
Original file line number | Diff line number | Diff line change
@@ -29,6 +29,10 @@
2929

3030
## Roadmap
3131

32+
- [x] 2025/08
33+
34+
- [x] Added Triton + TensorRT-LLM (trtllm) runtime support, thanks to a contribution from Yuekai Zhang (NVIDIA)
35+
3236
- [x] 2025/07
3337

3438
- [x] release cosyvoice 3.0 eval set

runtime/triton_trtllm/Dockerfile.server

Lines changed: 2 additions & 0 deletions
Original file line number | Diff line number | Diff line change
@@ -1,4 +1,6 @@
11
FROM nvcr.io/nvidia/tritonserver:25.06-trtllm-python-py3
2+
LABEL maintainer="[email protected]"
3+
24
RUN apt-get update && apt-get install -y cmake
35
RUN git clone https://github.com/pytorch/audio.git && cd audio && git checkout c670ad8 && PATH=/usr/local/cuda/bin:$PATH python3 setup.py develop
46
COPY ./requirements.txt /workspace/requirements.txt

runtime/triton_trtllm/README.md

Lines changed: 2 additions & 0 deletions
Original file line number | Diff line number | Diff line change
@@ -1,5 +1,7 @@
11
## Best Practices for Serving CosyVoice with NVIDIA Triton Inference Server
22

3+
Thanks to Yuekai Zhang (NVIDIA) for contributing this runtime.
4+
35
### Quick Start
46
Launch the service directly with Docker Compose:
57
```sh

runtime/triton_trtllm/run.sh

Lines changed: 5 additions & 4 deletions
Original file line number | Diff line number | Diff line change
@@ -1,4 +1,5 @@
1-
1+
#!/bin/bash
2+
# Copyright (c) 2025 NVIDIA (authors: Yuekai Zhang)
23
export CUDA_VISIBLE_DEVICES=0
34
cosyvoice_path=/workspace/CosyVoice
45
export PYTHONPATH=${cosyvoice_path}:$PYTHONPATH
@@ -24,8 +25,8 @@ fi
2425

2526
if [ $stage -le 0 ] && [ $stop_stage -ge 0 ]; then
2627
echo "Downloading CosyVoice2-0.5B"
27-
huggingface-cli download --local-dir $huggingface_model_local_dir yuekai/cosyvoice2_llm
28-
modelscope download --model iic/CosyVoice2-0.5B --local_dir $model_scope_model_local_dir
28+
huggingface-cli download --local-dir $huggingface_model_local_dir yuekai/cosyvoice2_llm
29+
modelscope download --model iic/CosyVoice2-0.5B --local_dir $model_scope_model_local_dir
2930
fi
3031

3132

@@ -67,7 +68,7 @@ if [ $stage -le 2 ] && [ $stop_stage -ge 2 ]; then
6768
BLS_INSTANCE_NUM=4
6869
TRITON_MAX_BATCH_SIZE=16
6970
DECOUPLED_MODE=False
70-
71+
7172
python3 scripts/fill_template.py -i ${model_repo}/token2wav/config.pbtxt model_dir:${MODEL_DIR},triton_max_batch_size:${TRITON_MAX_BATCH_SIZE},max_queue_delay_microseconds:${MAX_QUEUE_DELAY_MICROSECONDS}
7273
python3 scripts/fill_template.py -i ${model_repo}/audio_tokenizer/config.pbtxt model_dir:${MODEL_DIR},triton_max_batch_size:${TRITON_MAX_BATCH_SIZE},max_queue_delay_microseconds:${MAX_QUEUE_DELAY_MICROSECONDS}
7374
python3 scripts/fill_template.py -i ${model_repo}/${cosyvoice2_dir}/config.pbtxt model_dir:${MODEL_DIR},bls_instance_num:${BLS_INSTANCE_NUM},llm_tokenizer_dir:${LLM_TOKENIZER_DIR},triton_max_batch_size:${TRITON_MAX_BATCH_SIZE},decoupled_mode:${DECOUPLED_MODE},max_queue_delay_microseconds:${MAX_QUEUE_DELAY_MICROSECONDS}

0 commit comments

Comments
 (0)