|
385 | 385 | "accuracy/test_llm_api_pytorch.py::TestMistralSmall24B::test_fp8": 196.57955891895108, |
386 | 386 | "accuracy/test_llm_api_pytorch.py::TestMixtral8x7B::test_fp8_tp2": 3600.0022730380297, |
387 | 387 | "accuracy/test_llm_api_pytorch.py::TestMixtral8x7B::test_nvfp4_tp2": 3600.7994798690197058, |
388 | | - "accuracy/test_llm_api_pytorch.py::TestNano_V2_VLM::test_auto_dtype": 3600.0003106039948761463, |
389 | 388 | "accuracy/test_llm_api_pytorch.py::TestNemotronNas::test_auto_dtype_tp8": 3600.5389363930444, |
390 | 389 | "accuracy/test_llm_api_pytorch.py::TestPhi4::test_auto_dtype": 3600.0017098310054, |
391 | 390 | "accuracy/test_llm_api_pytorch.py::TestPhi4::test_fp8": 3600.0018840720295, |
392 | 391 | "accuracy/test_llm_api_pytorch.py::TestPhi4MM::test_auto_dtype": 3600.000989172084, |
393 | 392 | "accuracy/test_llm_api_pytorch.py::TestPhi4MM::test_auto_dtype_long_rope": 3600.001809718029, |
394 | 393 | "accuracy/test_llm_api_pytorch.py::TestPhi4MiniInstruct::test_auto_dtype": 3600.0018334789784, |
395 | 394 | "accuracy/test_llm_api_pytorch.py::TestQwen2_7BInstruct::test_auto_dtype": 49.38216367200948, |
396 | | - "accuracy/test_llm_api_pytorch.py::TestQwen2_VL_7B::test_auto_dtype": 3600.0019999769866, |
397 | 395 | "accuracy/test_llm_api_pytorch.py::TestQwen3_235B_A22B::test_fp8[latency]": 7576.4847942629713, |
398 | 396 | "accuracy/test_llm_api_pytorch.py::TestQwen3_235B_A22B::test_fp8[throughput_latency]": 75934.1885519769276, |
399 | 397 | "accuracy/test_llm_api_pytorch.py::TestQwen3_235B_A22B::test_nvfp4[latency_moe_cutlass]": 7570.00041150598553940654, |
|
871 | 869 | "test_e2e.py::test_ptp_quickstart_multimodal[mistral-small-3.1-24b-instruct-Mistral-Small-3.1-24B-Instruct-2503-image-False]": 59.619638262083754, |
872 | 870 | "test_e2e.py::test_ptp_quickstart_multimodal[mistral-small-3.1-24b-instruct-Mistral-Small-3.1-24B-Instruct-2503-image-True]": 984.4696121218149, |
873 | 871 | "test_e2e.py::test_ptp_quickstart_multimodal[mistral-small-3.1-24b-instruct-Mistral-Small-3.1-24B-Instruct-2503-mixture_text_image-True]": 78.27158910990693, |
874 | | - "test_e2e.py::test_ptp_quickstart_multimodal[qwen2-vl-7b-instruct-Qwen2-VL-7B-Instruct-image-False]": 113.76943837082945, |
875 | | - "test_e2e.py::test_ptp_quickstart_multimodal[qwen2-vl-7b-instruct-Qwen2-VL-7B-Instruct-video-False]": 96.37042473605834, |
876 | | - "test_e2e.py::test_ptp_quickstart_multimodal[qwen2.5-vl-7b-instruct-Qwen2.5-VL-7B-Instruct-image-False]": 128.0739826040808, |
877 | | - "test_e2e.py::test_ptp_quickstart_multimodal[qwen2.5-vl-7b-instruct-Qwen2.5-VL-7B-Instruct-image-True]": 128.0739826040808, |
878 | | - "test_e2e.py::test_ptp_quickstart_multimodal[qwen2.5-vl-7b-instruct-Qwen2.5-VL-7B-Instruct-video-False]": 97.74500772892497, |
879 | | - "test_e2e.py::test_ptp_quickstart_multimodal[qwen2.5-vl-7b-instruct-Qwen2.5-VL-7B-Instruct-video-True]": 97.74500772892497, |
880 | 872 | "test_e2e.py::test_ptp_quickstart_multimodal_2gpu[Phi-4-multimodal-instruct-multimodals/Phi-4-multimodal-instruct]": 128.000317517900839448, |
881 | 873 | "test_e2e.py::test_ptp_quickstart_multimodal_2gpu[gemma-3-27b-it-gemma/gemma-3-27b-it]": 66.45376745378599, |
882 | 874 | "test_e2e.py::test_ptp_quickstart_multimodal_2gpu[mistral-small-3.1-24b-instruct-Mistral-Small-3.1-24B-Instruct-2503]": 55.03272026847117, |
|
0 commit comments