@@ -50,39 +50,39 @@ if [ $? -ne 0 ]; then
50
50
fi
51
51
echo " Test with deepseek_v2 + inc passed"
52
52
53
- # # gsm8k test
54
- # # used to check HPUattn + MLP
55
- # echo "Testing GSM8K on ganite-8b"
56
- # echo VLLM_CONTIGUOUS_PA=False VLLM_SKIP_WARMUP=True PT_HPU_LAZY_MODE=1 VLLM_USE_V1=1 \
57
- # pytest -v -s vllm-gaudi/tests/models/language/generation/test_common.py --model_card_path vllm-gaudi/tests/full_tests/model_cards/granite-8b.yaml
58
- # VLLM_CONTIGUOUS_PA=False VLLM_SKIP_WARMUP=True PT_HPU_LAZY_MODE=1 VLLM_USE_V1=1 \
59
- # pytest -v -s vllm-gaudi/tests/models/language/generation/test_common.py --model_card_path vllm-gaudi/tests/full_tests/model_cards/granite-8b.yaml
60
- # if [ $? -ne 0 ]; then
61
- # echo "Error: Test failed for granite-8b" >&2
62
- # exit -1
63
- # fi
64
- # echo "Test with granite-8b passed"
53
+ # gsm8k test
54
+ # used to check HPUattn + MLP
55
+ echo " Testing GSM8K on granite-8b"
56
+ echo VLLM_CONTIGUOUS_PA=False VLLM_SKIP_WARMUP=True PT_HPU_LAZY_MODE=1 VLLM_USE_V1=1 \
57
+ pytest -v -s vllm-gaudi/tests/models/language/generation/test_common.py --model_card_path vllm-gaudi/tests/full_tests/model_cards/granite-8b.yaml
58
+ VLLM_CONTIGUOUS_PA=False VLLM_SKIP_WARMUP=True PT_HPU_LAZY_MODE=1 VLLM_USE_V1=1 \
59
+ pytest -v -s vllm-gaudi/tests/models/language/generation/test_common.py --model_card_path vllm-gaudi/tests/full_tests/model_cards/granite-8b.yaml
60
+ if [ $? -ne 0 ]; then
61
+ echo " Error: Test failed for granite-8b" >&2
62
+ exit -1
63
+ fi
64
+ echo " Test with granite-8b passed"
65
65
66
- # # used to check MLA + MOE
67
- # echo "Testing GSM8K on deepseek v2 lite"
68
- # # deepseek-R1
69
- # echo VLLM_CONTIGUOUS_PA=False VLLM_SKIP_WARMUP=True PT_HPU_LAZY_MODE=1 VLLM_USE_V1=1 pytest -v -s vllm-gaudi/tests/models/language/generation/test_common.py --model_card_path vllm-gaudi/tests/full_tests/model_cards/DeepSeek-V2-Lite-chat.yaml
70
- # VLLM_CONTIGUOUS_PA=False VLLM_SKIP_WARMUP=True PT_HPU_LAZY_MODE=1 VLLM_USE_V1=1 \
71
- # pytest -v -s vllm-gaudi/tests/models/language/generation/test_common.py --model_card_path vllm-gaudi/tests/full_tests/model_cards/DeepSeek-V2-Lite-chat.yaml
72
- # if [ $? -ne 0 ]; then
73
- # echo "Error: Test failed for deepseek R1" >&2
74
- # exit -1
75
- # fi
76
- # echo "Test with deepseek R1 passed"
66
+ # used to check MLA + MOE
67
+ echo " Testing GSM8K on deepseek v2 lite"
68
+ # deepseek-R1
69
+ echo VLLM_CONTIGUOUS_PA=False VLLM_SKIP_WARMUP=True PT_HPU_LAZY_MODE=1 VLLM_USE_V1=1 pytest -v -s vllm-gaudi/tests/models/language/generation/test_common.py --model_card_path vllm-gaudi/tests/full_tests/model_cards/DeepSeek-V2-Lite-chat.yaml
70
+ VLLM_CONTIGUOUS_PA=False VLLM_SKIP_WARMUP=True PT_HPU_LAZY_MODE=1 VLLM_USE_V1=1 \
71
+ pytest -v -s vllm-gaudi/tests/models/language/generation/test_common.py --model_card_path vllm-gaudi/tests/full_tests/model_cards/DeepSeek-V2-Lite-chat.yaml
72
+ if [ $? -ne 0 ]; then
73
+ echo " Error: Test failed for deepseek R1" >&2
74
+ exit -1
75
+ fi
76
+ echo " Test with deepseek R1 passed"
77
77
78
- # # used to check HPUATTN + MOE + ExpertParallel
79
- # echo "Testing GSM8K on QWEN3-30B-A3B"
80
- # echo VLLM_CONTIGUOUS_PA=False VLLM_SKIP_WARMUP=True PT_HPU_LAZY_MODE=1 VLLM_USE_V1=1 TP_SIZE=2 \
81
- # pytest -v -s vllm-gaudi/tests/models/language/generation/test_common.py --model_card_path vllm-gaudi/tests/full_tests/model_cards/Qwen3-30B-A3B.yaml
82
- # VLLM_CONTIGUOUS_PA=False VLLM_SKIP_WARMUP=True PT_HPU_LAZY_MODE=1 VLLM_USE_V1=1 TP_SIZE=2 \
83
- # pytest -v -s vllm-gaudi/tests/models/language/generation/test_common.py --model_card_path vllm-gaudi/tests/full_tests/model_cards/Qwen3-30B-A3B.yaml
84
- # if [ $? -ne 0 ]; then
85
- # echo "Error: Test failed for QWEN3-30B-A3B" >&2
86
- # exit -1
87
- # fi
88
- # echo "Test with QWEN3-30B-A3B passed"
78
+ # used to check HPUATTN + MOE + ExpertParallel
79
+ echo " Testing GSM8K on QWEN3-30B-A3B"
80
+ echo VLLM_CONTIGUOUS_PA=False VLLM_SKIP_WARMUP=True PT_HPU_LAZY_MODE=1 VLLM_USE_V1=1 TP_SIZE=2 \
81
+ pytest -v -s vllm-gaudi/tests/models/language/generation/test_common.py --model_card_path vllm-gaudi/tests/full_tests/model_cards/Qwen3-30B-A3B.yaml
82
+ VLLM_CONTIGUOUS_PA=False VLLM_SKIP_WARMUP=True PT_HPU_LAZY_MODE=1 VLLM_USE_V1=1 TP_SIZE=2 \
83
+ pytest -v -s vllm-gaudi/tests/models/language/generation/test_common.py --model_card_path vllm-gaudi/tests/full_tests/model_cards/Qwen3-30B-A3B.yaml
84
+ if [ $? -ne 0 ]; then
85
+ echo " Error: Test failed for QWEN3-30B-A3B" >&2
86
+ exit -1
87
+ fi
88
+ echo " Test with QWEN3-30B-A3B passed"
0 commit comments