@@ -18,6 +18,7 @@ Arguments:
1818 Supported models:
1919 - mistralai/Voxtral-Mini-3B-2507
2020 - openai/whisper-small
21+ - openai/whisper-large-v2
2122 - google/gemma-3-4b-it
2223
2324 quant_name Quantization type (required)
@@ -91,13 +92,13 @@ case "$HF_MODEL" in
9192 AUDIO_FILE=" poem.wav"
9293 IMAGE_PATH=" "
9394 ;;
94- openai/whisper-small )
95- MODEL_NAME=" whisper "
95+ openai/whisper-* )
96+ MODEL_NAME=" ${HF_MODEL # openai / } "
9697 RUNNER_TARGET=" whisper_runner"
9798 RUNNER_PATH=" whisper"
9899 EXPECTED_OUTPUT=" Mr. Quilter is the apostle of the middle classes"
99100 PREPROCESSOR=" whisper_preprocessor.pte"
100- TOKENIZER_URL=" https://huggingface.co/openai/whisper-small /resolve/main" # @lint-ignore
101+ TOKENIZER_URL=" https://huggingface.co/${HF_MODEL} /resolve/main" # @lint-ignore
101102 TOKENIZER_FILE=" "
102103 AUDIO_URL=" "
103104 AUDIO_FILE=" output.wav"
@@ -117,7 +118,7 @@ case "$HF_MODEL" in
117118 ;;
*)
  # Fallback arm of `case "$HF_MODEL"`: the requested model id matched none
  # of the arms above. Report the problem on stderr (so it is not mixed into
  # captured stdout) and abort with a non-zero status.
  echo "Error: Unsupported model '$HF_MODEL'" >&2
  echo "Supported models: mistralai/Voxtral-Mini-3B-2507, openai/whisper-small, openai/whisper-large-v2, google/gemma-3-4b-it" >&2
  exit 1
  ;;
123124esac
142143# Download test files
143144if [ " $AUDIO_URL " != " " ]; then
144145 curl -L $AUDIO_URL -o ${MODEL_DIR} /$AUDIO_FILE
145- elif [ " $MODEL_NAME " = " whisper" ]; then
146+ elif [[ " $MODEL_NAME " == * whisper* ] ]; then
146147 conda install -y -c conda-forge " ffmpeg<8"
147148 pip install datasets soundfile torchcodec
148149 python -c " from datasets import load_dataset;import soundfile as sf;sample = load_dataset('distil-whisper/librispeech_long', 'clean', split='validation')[0]['audio'];sf.write('${MODEL_DIR} /$AUDIO_FILE ', sample['array'][:sample['sampling_rate']*30], sample['sampling_rate'])"
@@ -180,7 +181,7 @@ case "$MODEL_NAME" in
180181 RUNNER_ARGS=" $RUNNER_ARGS --tokenizer_path ${MODEL_DIR} /$TOKENIZER_FILE --audio_path ${MODEL_DIR} /$AUDIO_FILE --processor_path ${MODEL_DIR} /$PREPROCESSOR "
181182 ;;
whisper*)
  # Whisper runner arguments.
  # MODEL_NAME for Whisper models is derived as ${HF_MODEL#openai/}
  # (e.g. "whisper-small", "whisper-large-v2"), so a literal `whisper`
  # pattern would never match; match on the prefix instead. This still
  # accepts the legacy bare "whisper" value.
  # NOTE(review): WHISPER_MODEL_NAME is not assigned in the visible part of
  # this script. Fall back to MODEL_NAME so --model_name is never left
  # without a value; confirm the exact name format the runner expects.
  RUNNER_ARGS="$RUNNER_ARGS --tokenizer_path ${MODEL_DIR}/ --audio_path ${MODEL_DIR}/$AUDIO_FILE --processor_path ${MODEL_DIR}/$PREPROCESSOR --model_name ${WHISPER_MODEL_NAME:-$MODEL_NAME}"
  ;;
185186 gemma3)
186187 RUNNER_ARGS=" $RUNNER_ARGS --tokenizer_path ${MODEL_DIR} / --image_path $IMAGE_PATH "
0 commit comments