|
19 | 19 | IreeBenchmarkException, |
20 | 20 | IreeCompileException, |
21 | 21 | ) |
22 | | - |
23 | | -is_mi300x = pytest.mark.skipif("config.getoption('iree_hip_target') != 'gfx942'") |
24 | | -skipif_run_quick_llama_test = pytest.mark.skipif( |
25 | | - 'config.getoption("run-quick-llama-test") and not config.getoption("run-nightly-llama-tests")', |
26 | | - reason="Skipping largs tests when --run-quick-llama-test is set.", |
| 22 | +from sharktank.utils.testing import ( |
| 23 | + is_mi300x, |
| 24 | + is_nightly, |
| 25 | + is_pre_submit_nightly, |
27 | 26 | ) |
28 | 27 |
|
29 | 28 |
|
@@ -100,7 +99,6 @@ def save_benchmarks( |
100 | 99 |
|
101 | 100 |
|
102 | 101 | @is_mi300x |
103 | | -@pytest.mark.expensive |
104 | 102 | class BenchmarkLlama3_1_8B(BaseBenchmarkTest): |
105 | 103 | def setUp(self): |
106 | 104 | super().setUp() |
@@ -224,7 +222,7 @@ def setUp(self): |
224 | 222 | ">>", |
225 | 223 | ] |
226 | 224 |
|
227 | | - @skipif_run_quick_llama_test |
| 225 | + @is_pre_submit_nightly |
228 | 226 | def testBenchmark8B_f16_TP1_Non_Decomposed_Input_Len_128(self): |
229 | 227 | output_file_name = self.dir_path_8b / "f16_torch_128_tp1" |
230 | 228 | output_mlir = self.llama8b_f16_torch_sdpa_artifacts.create_file( |
@@ -269,7 +267,7 @@ def testBenchmark8B_f16_TP1_Non_Decomposed_Input_Len_128(self): |
269 | 267 | cwd=self.repo_root, |
270 | 268 | ) |
271 | 269 |
|
272 | | - @skipif_run_quick_llama_test |
| 270 | + @is_nightly |
273 | 271 | def testBenchmark8B_f16_TP1_Non_Decomposed_Input_Len_2048(self): |
274 | 272 | output_file_name = self.dir_path_8b / "f16_torch_2048_tp1" |
275 | 273 | output_mlir = self.llama8b_f16_torch_sdpa_artifacts.create_file( |
@@ -314,8 +312,12 @@ def testBenchmark8B_f16_TP1_Non_Decomposed_Input_Len_2048(self): |
314 | 312 | cwd=self.repo_root, |
315 | 313 | ) |
316 | 314 |
|
317 | | - @skipif_run_quick_llama_test |
318 | | - @pytest.mark.xfail(reason="Benchmarking Error", raises=IreeBenchmarkException) |
| 315 | + @is_nightly |
| 316 | + @pytest.mark.xfail( |
| 317 | + run=False, |
| 318 | + reason="https://github.com/iree-org/iree/issues/20528", |
| 319 | + raises=IreeCompileException, |
| 320 | + ) |
319 | 321 | def testBenchmark8B_fp8_TP1_Non_Decomposed(self): |
320 | 322 | output_file_name = self.dir_path_8b / "fp8_torch_tp1" |
321 | 323 | output_mlir = self.llama8b_fp8_torch_sdpa_artifacts.create_file( |
@@ -360,7 +362,7 @@ def testBenchmark8B_fp8_TP1_Non_Decomposed(self): |
360 | 362 | cwd=self.repo_root, |
361 | 363 | ) |
362 | 364 |
|
363 | | - @skipif_run_quick_llama_test |
| 365 | + @is_nightly |
364 | 366 | def testBenchmark8B_fp8_attnf8_TP1_Non_Decomposed_Input_Len_2048(self): |
365 | 367 | output_file_name = self.dir_path_8b / "fp8_attnf8_2048_tp1" |
366 | 368 | output_mlir = self.llama8b_fp8_attnf8_sdpa_artifacts.create_file( |
@@ -405,7 +407,7 @@ def testBenchmark8B_fp8_attnf8_TP1_Non_Decomposed_Input_Len_2048(self): |
405 | 407 | cwd=self.repo_root, |
406 | 408 | ) |
407 | 409 |
|
408 | | - @skipif_run_quick_llama_test |
| 410 | + @is_nightly |
409 | 411 | def testBenchmark8B_fp8_attnf8_TP1_Non_Decomposed_Input_Len_128(self): |
410 | 412 | output_file_name = self.dir_path_8b / "fp8_attnf8_128_tp1" |
411 | 413 | output_mlir = self.llama8b_fp8_attnf8_sdpa_artifacts.create_file( |
@@ -452,8 +454,7 @@ def testBenchmark8B_fp8_attnf8_TP1_Non_Decomposed_Input_Len_128(self): |
452 | 454 |
|
453 | 455 |
|
454 | 456 | @is_mi300x |
455 | | -@pytest.mark.expensive |
456 | | -@skipif_run_quick_llama_test |
| 457 | +@is_nightly |
457 | 458 | class BenchmarkLlama3_1_70B(BaseBenchmarkTest): |
458 | 459 | def setUp(self): |
459 | 460 | super().setUp() |
@@ -808,8 +809,7 @@ def testBenchmark70B_fp8_TP1_Non_Decomposed(self): |
808 | 809 |
|
809 | 810 |
|
810 | 811 | @is_mi300x |
811 | | -@pytest.mark.expensive |
812 | | -@skipif_run_quick_llama_test |
| 812 | +@is_nightly |
813 | 813 | class BenchmarkLlama3_1_405B(BaseBenchmarkTest): |
814 | 814 | def setUp(self): |
815 | 815 | super().setUp() |
|
0 commit comments