@@ -50,39 +50,39 @@ if [ $? -ne 0 ]; then
50
50
fi
51
51
echo " Test with deepseek_v2 + inc passed"
52
52
53
- # gsm8k test
54
- # used to check HPUattn + MLP
55
- echo " Testing GSM8K on ganite-8b"
56
- echo VLLM_CONTIGUOUS_PA=False VLLM_SKIP_WARMUP=True PT_HPU_LAZY_MODE=1 VLLM_USE_V1=1 \
57
- pytest -v -s vllm-gaudi/tests/models/language/generation/test_common.py --model_card_path vllm-gaudi/tests/full_tests/model_cards/granite-8b.yaml
58
- VLLM_CONTIGUOUS_PA=False VLLM_SKIP_WARMUP=True PT_HPU_LAZY_MODE=1 VLLM_USE_V1=1 \
59
- pytest -v -s vllm-gaudi/tests/models/language/generation/test_common.py --model_card_path vllm-gaudi/tests/full_tests/model_cards/granite-8b.yaml
60
- if [ $? -ne 0 ]; then
61
- echo " Error: Test failed for granite-8b" >&2
62
- exit -1
63
- fi
64
- echo " Test with granite-8b passed"
53
+ # # gsm8k test
54
+ # # used to check HPUattn + MLP
55
+ # echo "Testing GSM8K on granite-8b"
56
+ # echo VLLM_CONTIGUOUS_PA=False VLLM_SKIP_WARMUP=True PT_HPU_LAZY_MODE=1 VLLM_USE_V1=1 \
57
+ # pytest -v -s vllm-gaudi/tests/models/language/generation/test_common.py --model_card_path vllm-gaudi/tests/full_tests/model_cards/granite-8b.yaml
58
+ # VLLM_CONTIGUOUS_PA=False VLLM_SKIP_WARMUP=True PT_HPU_LAZY_MODE=1 VLLM_USE_V1=1 \
59
+ # pytest -v -s vllm-gaudi/tests/models/language/generation/test_common.py --model_card_path vllm-gaudi/tests/full_tests/model_cards/granite-8b.yaml
60
+ # if [ $? -ne 0 ]; then
61
+ # echo "Error: Test failed for granite-8b" >&2
62
+ # exit -1
63
+ # fi
64
+ # echo "Test with granite-8b passed"
65
65
66
- # used to check MLA + MOE
67
- echo " Testing GSM8K on deepseek v2 lite"
68
- # deepseek-R1
69
- echo VLLM_CONTIGUOUS_PA=False VLLM_SKIP_WARMUP=True PT_HPU_LAZY_MODE=1 VLLM_USE_V1=1 pytest -v -s vllm-gaudi/tests/models/language/generation/test_common.py --model_card_path vllm-gaudi/tests/full_tests/model_cards/DeepSeek-V2-Lite-chat.yaml
70
- VLLM_CONTIGUOUS_PA=False VLLM_SKIP_WARMUP=True PT_HPU_LAZY_MODE=1 VLLM_USE_V1=1 \
71
- pytest -v -s vllm-gaudi/tests/models/language/generation/test_common.py --model_card_path vllm-gaudi/tests/full_tests/model_cards/DeepSeek-V2-Lite-chat.yaml
72
- if [ $? -ne 0 ]; then
73
- echo " Error: Test failed for deepseek R1" >&2
74
- exit -1
75
- fi
76
- echo " Test with deepseek R1 passed"
66
+ # # used to check MLA + MOE
67
+ # echo "Testing GSM8K on deepseek v2 lite"
68
+ # # deepseek-R1
69
+ # echo VLLM_CONTIGUOUS_PA=False VLLM_SKIP_WARMUP=True PT_HPU_LAZY_MODE=1 VLLM_USE_V1=1 pytest -v -s vllm-gaudi/tests/models/language/generation/test_common.py --model_card_path vllm-gaudi/tests/full_tests/model_cards/DeepSeek-V2-Lite-chat.yaml
70
+ # VLLM_CONTIGUOUS_PA=False VLLM_SKIP_WARMUP=True PT_HPU_LAZY_MODE=1 VLLM_USE_V1=1 \
71
+ # pytest -v -s vllm-gaudi/tests/models/language/generation/test_common.py --model_card_path vllm-gaudi/tests/full_tests/model_cards/DeepSeek-V2-Lite-chat.yaml
72
+ # if [ $? -ne 0 ]; then
73
+ # echo "Error: Test failed for deepseek R1" >&2
74
+ # exit -1
75
+ # fi
76
+ # echo "Test with deepseek R1 passed"
77
77
78
- # used to check HPUATTN + MOE + ExpertParallel
79
- echo " Testing GSM8K on QWEN3-30B-A3B"
80
- echo VLLM_CONTIGUOUS_PA=False VLLM_SKIP_WARMUP=True PT_HPU_LAZY_MODE=1 VLLM_USE_V1=1 TP_SIZE=2 \
81
- pytest -v -s vllm-gaudi/tests/models/language/generation/test_common.py --model_card_path vllm-gaudi/tests/full_tests/model_cards/Qwen3-30B-A3B.yaml
82
- VLLM_CONTIGUOUS_PA=False VLLM_SKIP_WARMUP=True PT_HPU_LAZY_MODE=1 VLLM_USE_V1=1 TP_SIZE=2 \
83
- pytest -v -s vllm-gaudi/tests/models/language/generation/test_common.py --model_card_path vllm-gaudi/tests/full_tests/model_cards/Qwen3-30B-A3B.yaml
84
- if [ $? -ne 0 ]; then
85
- echo " Error: Test failed for QWEN3-30B-A3B" >&2
86
- exit -1
87
- fi
88
- echo " Test with QWEN3-30B-A3B passed"
78
+ # # used to check HPUATTN + MOE + ExpertParallel
79
+ # echo "Testing GSM8K on QWEN3-30B-A3B"
80
+ # echo VLLM_CONTIGUOUS_PA=False VLLM_SKIP_WARMUP=True PT_HPU_LAZY_MODE=1 VLLM_USE_V1=1 TP_SIZE=2 \
81
+ # pytest -v -s vllm-gaudi/tests/models/language/generation/test_common.py --model_card_path vllm-gaudi/tests/full_tests/model_cards/Qwen3-30B-A3B.yaml
82
+ # VLLM_CONTIGUOUS_PA=False VLLM_SKIP_WARMUP=True PT_HPU_LAZY_MODE=1 VLLM_USE_V1=1 TP_SIZE=2 \
83
+ # pytest -v -s vllm-gaudi/tests/models/language/generation/test_common.py --model_card_path vllm-gaudi/tests/full_tests/model_cards/Qwen3-30B-A3B.yaml
84
+ # if [ $? -ne 0 ]; then
85
+ # echo "Error: Test failed for QWEN3-30B-A3B" >&2
86
+ # exit -1
87
+ # fi
88
+ # echo "Test with QWEN3-30B-A3B passed"
0 commit comments