|
121 | 121 | "test_accuracy.py::test_accuracy_gptj[gptj-cyclic-and-paged-kv-cache]": 173.45949043799192, |
122 | 122 | "test_accuracy.py::test_accuracy_gptj[gptj-cyclic-kv-cache-beam-search]": 231.8624299732037, |
123 | 123 | "test_accuracy.py::test_accuracy_gptj[gptj-mmha-multi-block-mode]": 182.0765182878822, |
124 | | - "test_e2e.py::test_falcon_e2e[gpu_percent_0-use_py_session-gqa]": 96.65795732289553, |
125 | | - "test_e2e.py::test_falcon_e2e[gpu_percent_0_8-use_cpp_session-mqa]": 94.91713926941156, |
126 | | - "test_e2e.py::test_falcon_e2e[use_cpp_session-mha]": 72.26053975522518, |
127 | | - "test_e2e.py::test_falcon_e2e[use_py_session-mha]": 71.00531469285488, |
128 | | - "test_e2e.py::test_falcon_gqa_e2e[use_py_session-enable_ibf-enable_fp8]": 68.68854057043791, |
129 | 124 | "test_e2e.py::test_gpt_fp32[use_cpp_session]": 102.94305092096329, |
130 | 125 | "test_e2e.py::test_gpt_fp32[use_py_session-multi_query_mode]": 101.54258136451244, |
131 | 126 | "test_e2e.py::test_gpt_fp32[use_py_session]": 100.1567601710558, |
|
146 | 141 | "test_accuracy.py::test_accuracy_gpt[gpt-context-fmha-disabled]": 96.56836012890562, |
147 | 142 | "test_accuracy.py::test_accuracy_gptj[gptj-context-fmha-enabled]": 227.20399192301556, |
148 | 143 | "test_accuracy.py::test_accuracy_gptj[gptj-cyclic-kv-cache]": 168.16926325811073, |
149 | | - "test_e2e.py::test_falcon_e2e[use_cpp_session-gqa]": 75.75471282750368, |
150 | | - "test_e2e.py::test_falcon_e2e[use_cpp_session-mqa]": 74.27118157595396, |
151 | | - "test_e2e.py::test_falcon_e2e[use_py_session-gqa]": 74.21104773320258, |
152 | | - "test_e2e.py::test_falcon_e2e[use_py_session-mqa]": 73.01505787856877, |
153 | | - "test_e2e.py::test_falcon_gqa_e2e[use_cpp_session-enable_ibf-enable_fp8]": 71.1147844651714, |
154 | 144 | "test_e2e.py::test_gpt_fp32[use_cpp_session-multi_query_mode]": 102.81246098689735, |
155 | 145 | "test_e2e.py::test_mistral_e2e[use_py_session-remove_input_padding]": 178.69259701482952, |
156 | 146 | "test_e2e.py::test_mistral_e2e[use_py_session]": 158.53167643211782, |
|
0 commit comments