@@ -5,54 +5,59 @@ stages:
55      - name : v0_gsm8k_small_g3_tp1_part1 
66        flavor : g3 
77        command : >- 
8-           export PT_HPU_LAZY_MODE=1 &&   
8+           export PT_HPU_LAZY_MODE=1 && 
99          cd .jenkins/lm-eval-harness && bash run-tests.sh -c configs/models-small.txt -t 1 
1010       - name : v0_gsm8k_small_g3_tp1_part2 
1111        flavor : g3 
1212        command : >- 
13-           export PT_HPU_LAZY_MODE=1 &&   
13+           export PT_HPU_LAZY_MODE=1 && 
1414          cd .jenkins/lm-eval-harness && bash run-tests.sh -c configs/models-small-2.txt -t 1 
1515       - name : v0_gsm8k_small_g3_tp1_part3 
1616        flavor : g3 
1717        command : >- 
18-           export PT_HPU_LAZY_MODE=1 &&   
18+           export PT_HPU_LAZY_MODE=1 && 
1919          cd .jenkins/lm-eval-harness && bash run-tests.sh -c configs/models-small-3.txt -t 1 
2020       - name : v0_gsm8k_small_g3_tp2 
2121        flavor : g3.s 
2222        command : >- 
23-           export PT_HPU_LAZY_MODE=1 &&   
23+           export PT_HPU_LAZY_MODE=1 && 
2424          cd .jenkins/lm-eval-harness && bash run-tests.sh -c configs/models-small.txt -t 2 
2525       - name : v0_gsm8k_small_g2_tp1 
2626        flavor : g2 
2727        command : >- 
28-           export PT_HPU_LAZY_MODE=1 &&   
28+           export PT_HPU_LAZY_MODE=1 && 
2929          cd .jenkins/lm-eval-harness && bash run-tests.sh -c configs/models-small.txt -t 1 
3030       - name : v0_gsm8k_small_g2_tp2 
3131        flavor : g2.s 
3232        command : >- 
33-           export PT_HPU_LAZY_MODE=1 &&   
33+           export PT_HPU_LAZY_MODE=1 && 
3434          cd .jenkins/lm-eval-harness && bash run-tests.sh -c configs/models-small.txt -t 2 
3535       - name : v0_gsm8k_g2_deepseek-v2-lite_tp1 
3636        flavor : g3 
3737        command : >- 
38-           export PT_HPU_LAZY_MODE=1 &&   
38+           export PT_HPU_LAZY_MODE=1 && 
3939          cd .jenkins/lm-eval-harness && bash run-tests.sh -c configs/models-deepseek.txt -t 1 
4040       - name : v0_gsm8k_g3_gemma3_tp1 
4141        flavor : g3.s 
4242        command : >- 
4343          export PT_HPU_LAZY_MODE=1 && 
4444          cd .jenkins/lm-eval-harness && bash run-tests.sh -c configs/models-gemma.txt -t 1 
45+        - name : v0_gsm8k_g3_ovis2_5_tp1 
46+         flavor : g3.s 
47+         command : >- 
48+           export PT_HPU_LAZY_MODE=1 && export VLLM_SKIP_WARMUP=true && 
49+           cd .jenkins/lm-eval-harness && bash run-tests.sh -c configs/models-ovis.txt -t 1 
4550   - name : test_gsm8k_small_models_apc 
4651    steps :
4752      - name : gsm8k_small_g3_tp1_apc 
4853        flavor : g3 
4954        command : >- 
50-           export VLLM_CONTIGUOUS_PA=false &&   
55+           export VLLM_CONTIGUOUS_PA=false && 
5156          cd .jenkins/lm-eval-harness && bash run-tests.sh -c configs/models-small.txt -t 1 -a 
5257       - name : gsm8k_small_g2_tp1_apc 
5358        flavor : g2 
5459        command : >- 
55-           export VLLM_CONTIGUOUS_PA=false &&   
60+           export VLLM_CONTIGUOUS_PA=false && 
5661          cd .jenkins/lm-eval-harness && bash run-tests.sh -c configs/models-small.txt -t 1 -a 
5762   - name : test_gsm8k_small_models_merged_prefill 
5863    steps :
@@ -66,139 +71,139 @@ stages:
6671      - name : v0_gsm8k_large_g3_tp2_part1 
6772        flavor : g3.s 
6873        command : >- 
69-           export PT_HPU_LAZY_MODE=1 &&   
74+           export PT_HPU_LAZY_MODE=1 && 
7075          cd .jenkins/lm-eval-harness && bash run-tests.sh -c configs/models-large.txt -t 2 
7176       - name : v0_gsm8k_large_g3_tp2_part2 
7277        flavor : g3.s 
7378        command : >- 
74-           export PT_HPU_LAZY_MODE=1 &&   
79+           export PT_HPU_LAZY_MODE=1 && 
7580          cd .jenkins/lm-eval-harness && bash run-tests.sh -c configs/models-large-2.txt -t 2 
7681       - name : v0_gsm8k_large_g2_tp4 
7782        flavor : g2.m 
7883        command : >- 
79-           export PT_HPU_LAZY_MODE=1 &&   
84+           export PT_HPU_LAZY_MODE=1 && 
8085          cd .jenkins/lm-eval-harness && bash run-tests.sh -c configs/models-large.txt -t 4 
8186   - name : test_gsm8k_fp8 
8287    steps :
8388      - name : gsm8k_small_g3_tp1_fp8 
8489        flavor : g3 
8590        command : >- 
86-           cd .jenkins/lm-eval-harness &&   
87-           PT_HPU_LAZY_MODE=1   
91+           cd .jenkins/lm-eval-harness && 
92+           PT_HPU_LAZY_MODE=1 
8893          bash run-tests.sh -c configs/models-fp8-g3-tp1.txt -t 1 
8994       #  - name: gsm8k_small_g3_tp2_fp8
9095      #    flavor: g3.s
9196      #    command: >-
92-       #      cd .jenkins/lm-eval-harness &&  
93-       #      PT_HPU_LAZY_MODE=1  
97+       #      cd .jenkins/lm-eval-harness &&
98+       #      PT_HPU_LAZY_MODE=1
9499      #      bash run-tests.sh -c configs/models-fp8.txt -t 2
95100  - name : test_gsm8k_fp8_bypass_inc 
96101    steps :
97102      - name : gsm8k_fp8_llama4_scout_g3_tp2_compressed_tensor 
98103        flavor : g3.s 
99104        command : >- 
100-           cd .jenkins/lm-eval-harness &&   
101-           PT_HPU_LAZY_MODE=1   
105+           cd .jenkins/lm-eval-harness && 
106+           PT_HPU_LAZY_MODE=1 
102107          bash run-tests.sh -c configs/models-fp8-compressedtensor.txt -t 2 
103108       - name : gsm8k_fp8_qwen3_30B_g3_tp1_block_scale_dynamic 
104109        flavor : g3 
105110        command : >- 
106-           cd .jenkins/lm-eval-harness &&   
107-           PT_HPU_LAZY_MODE=1   
111+           cd .jenkins/lm-eval-harness && 
112+           PT_HPU_LAZY_MODE=1 
108113          bash run-tests.sh -c configs/models-fp8-blockfp8.txt -t 1 
109114       - name : gsm8k_fp8_qwen3_30B_g3_tp1_block_scale_dequant 
110115        flavor : g3 
111116        command : >- 
112-           cd .jenkins/lm-eval-harness &&   
113-           PT_HPU_LAZY_MODE=1 VLLM_HPU_FORCE_CHANNEL_FP8=0   
117+           cd .jenkins/lm-eval-harness && 
118+           PT_HPU_LAZY_MODE=1 VLLM_HPU_FORCE_CHANNEL_FP8=0 
114119          bash run-tests.sh -c configs/models-fp8-blockfp8.txt -t 1 
115120   - name : test_gsm8k_mss 
116121    steps :
117122      - name : gsm8k_small_g3_tp1_mss 
118123        flavor : g3 
119124        command : >- 
120-           cd .jenkins/lm-eval-harness &&   
121-           PT_HPU_LAZY_MODE=1   
125+           cd .jenkins/lm-eval-harness && 
126+           PT_HPU_LAZY_MODE=1 
122127          bash run-tests.sh -c configs/models-mss.txt -t 1 
123128       - name : gsm8k_small_g2_tp1_mss 
124129        flavor : g2 
125130        command : >- 
126-           cd .jenkins/lm-eval-harness &&   
127-           PT_HPU_LAZY_MODE=1   
131+           cd .jenkins/lm-eval-harness && 
132+           PT_HPU_LAZY_MODE=1 
128133          bash run-tests.sh -c configs/models-mss.txt -t 1 
129134       - name : gsm8k_small_g3_tp2_mss 
130135        flavor : g3.s 
131136        command : >- 
132-           cd .jenkins/lm-eval-harness &&   
133-           PT_HPU_LAZY_MODE=1   
137+           cd .jenkins/lm-eval-harness && 
138+           PT_HPU_LAZY_MODE=1 
134139          bash run-tests.sh -c configs/models-mss.txt -t 2 
135140       - name : gsm8k_small_g2_tp2_mss 
136141        flavor : g2.s 
137142        command : >- 
138-           cd .jenkins/lm-eval-harness &&   
139-           PT_HPU_LAZY_MODE=1   
143+           cd .jenkins/lm-eval-harness && 
144+           PT_HPU_LAZY_MODE=1 
140145          bash run-tests.sh -c configs/models-mss.txt -t 2 
141146       - name : gsm8k_small_g2_tp1_spec_decode 
142147        flavor : g2 
143148        command : >- 
144-           cd .jenkins/lm-eval-harness &&   
145-           PT_HPU_LAZY_MODE=1   
149+           cd .jenkins/lm-eval-harness && 
150+           PT_HPU_LAZY_MODE=1 
146151          bash run-tests.sh -c configs/models-mss.txt -t 1 
147152   - name : test_gsm8k_spec_decode 
148153    steps :
149154      #  - name: gsm8k_small_g2_tp1_mlp_spec_decode
150155      #    flavor: g2
151156      #    command: >-
152-       #      PT_HPU_LAZY_MODE=1 VLLM_CONTIGUOUS_PA=false VLLM_SKIP_WARMUP=True  
157+       #      PT_HPU_LAZY_MODE=1 VLLM_CONTIGUOUS_PA=false VLLM_SKIP_WARMUP=True
153158      #      pytest -v tests/spec_decode/e2e/test_mlp_correctness.py::test_mlp_e2e_greedy_correctness
154159      - name : gsm8k_small_g2_tp1_medusa_spec_decode 
155160        flavor : g2 
156161        command : >- 
157-           PT_HPU_LAZY_MODE=1 VLLM_CONTIGUOUS_PA=false VLLM_SKIP_WARMUP=True   
162+           PT_HPU_LAZY_MODE=1 VLLM_CONTIGUOUS_PA=false VLLM_SKIP_WARMUP=True 
158163          pytest -v tests/spec_decode/e2e/test_medusa_correctness.py::test_medusa_e2e_greedy_correctness 
159164       - name : gsm8k_small_g2_tp1_eagle_spec_decode 
160165        flavor : g2 
161166        command : >- 
162-           PT_HPU_LAZY_MODE=1 VLLM_CONTIGUOUS_PA=false VLLM_SKIP_WARMUP=True   
167+           PT_HPU_LAZY_MODE=1 VLLM_CONTIGUOUS_PA=false VLLM_SKIP_WARMUP=True 
163168          pytest -v tests/spec_decode/e2e/test_eagle_correctness.py::test_eagle_e2e_greedy_correctness 
164169   # TODO(kwisniewski98) temporarily disable this test until the Gaudi2-specific model is uploaded to the test infrastructure
165170  #  - name: test_deepseek_mtp
166171  #    steps:
167172  #      - name: test_deepseek_mtp_correctness
168173  #        flavor: g3
169174  #        command: >-
170-   #          PT_HPU_LAZY_MODE=1 VLLM_CONTIGUOUS_PA=false VLLM_SKIP_WARMUP=True  
175+   #          PT_HPU_LAZY_MODE=1 VLLM_CONTIGUOUS_PA=false VLLM_SKIP_WARMUP=True
171176  #          pytest -v tests/spec_decode/e2e/test_mtp_correctness.py::test_mtp_e2e_greedy_correctness
172177  - name : tests_lora 
173178    steps :
174179      - name : test_llama_lora 
175180        flavor : g2 
176181        command : >- 
177-           PT_HPU_LAZY_MODE=1 VLLM_SKIP_WARMUP=true   
182+           PT_HPU_LAZY_MODE=1 VLLM_SKIP_WARMUP=true 
178183          pytest -v tests/lora/test_llama_hpu.py::test_llama_lora_1x 
179184       - name : test_multilora 
180185        flavor : g2 
181186        command : >- 
182-           PT_HPU_LAZY_MODE=1 VLLM_SKIP_WARMUP=true   
187+           PT_HPU_LAZY_MODE=1 VLLM_SKIP_WARMUP=true 
183188          pytest -v tests/lora/test_multilora_hpu.py::test_llama_multilora_1x 
184189       #  - name: test_long_context
185190      #    flavor: g2
186191      #    command: >-
187-       #      PT_HPU_LAZY_MODE=1 VLLM_SKIP_WARMUP=true  
192+       #      PT_HPU_LAZY_MODE=1 VLLM_SKIP_WARMUP=true
188193      #      pytest -v tests/lora/test_long_context_hpu.py::test_quality
189194  - name : tests_multimodal 
190195    steps :
191196      - name : multimodal_small_g3_tp1 
192197        flavor : g3 
193198        command : >- 
194-           cd .jenkins/vision &&   
195-           PT_HPU_LAZY_MODE=1   
199+           cd .jenkins/vision && 
200+           PT_HPU_LAZY_MODE=1 
196201          bash run-tests.sh -c configs/models-small.txt -t 1 
197202       - name : multimodal_small_g3_tp2 
198203        flavor : g3.s 
199204        command : >- 
200205          cd .jenkins/vision && 
201-           PT_HPU_LAZY_MODE=1   
206+           PT_HPU_LAZY_MODE=1 
202207          bash run-tests.sh -c configs/models-small.txt -t 2 
203208       - name : multimodal_qwen_tp1 
204209        flavor : g3.s 
@@ -210,13 +215,13 @@ stages:
210215        flavor : g3 
211216        command : >- 
212217          cd .jenkins/vision && 
213-           PT_HPU_LAZY_MODE=1   
218+           PT_HPU_LAZY_MODE=1 
214219          bash run-tests.sh -c configs/models-mss.txt -t 1 
215220       - name : multimodal_small_g3_tp2_mss 
216221        flavor : g3.s 
217222        command : >- 
218223          cd .jenkins/vision && 
219-           PT_HPU_LAZY_MODE=1   
224+           PT_HPU_LAZY_MODE=1 
220225          bash run-tests.sh -c configs/models-mss.txt -t 2 
221226       - name : multimodal_llama4_scout_g3_tp2_ep 
222227        flavor : g3.s 
@@ -230,26 +235,32 @@ stages:
230235          cd .jenkins/vision && 
231236          PT_HPU_LAZY_MODE=1 
232237          bash run-tests.sh -c configs/models-gemma.txt -t 1 
238+        - name : multimodal_ovis2_5_g3_tp1_ep 
239+         flavor : g3.s 
240+         command : >- 
241+           cd .jenkins/vision && 
242+           PT_HPU_LAZY_MODE=1 VLLM_SKIP_WARMUP=true 
243+           bash run-tests.sh -c configs/models-ovis.txt -t 1 
233244   - name : tests_int4_quantization 
234245    steps :
235246      - name : test_awq 
236247        flavor : g2 
237248        command : >- 
238-           PT_HPU_LAZY_MODE=1 VLLM_SKIP_WARMUP=true   
249+           PT_HPU_LAZY_MODE=1 VLLM_SKIP_WARMUP=true 
239250          pytest -v tests/quantization/test_awq.py::test_awq 
240251       - name : test_gptq 
241252        flavor : g2 
242253        command : >- 
243-           PT_HPU_LAZY_MODE=1 VLLM_SKIP_WARMUP=true   
254+           PT_HPU_LAZY_MODE=1 VLLM_SKIP_WARMUP=true 
244255          pytest -v tests/quantization/test_gptq.py::test_gptq 
245256   - name : tests_guided_decode 
246257    steps :
247258    - name : test_lazy_outlines 
248259      flavor : g2 
249260      command : >- 
250261        pip install -e tests/vllm_test_utils && 
251-         export VLLM_SKIP_WARMUP=true && PT_HPU_LAZY_MODE=1   
252-         pytest -v tests/entrypoints/llm/test_lazy_outlines.py -s -vvv --log-cli-level=INFO   
262+         export VLLM_SKIP_WARMUP=true && PT_HPU_LAZY_MODE=1 
263+         pytest -v tests/entrypoints/llm/test_lazy_outlines.py -s -vvv --log-cli-level=INFO 
253264     #  - name: test_guided_generate
254265    #    flavor: g2
255266    #    command: >-
0 commit comments