You signed in with another tab or window. Reload to refresh your session. You signed out in another tab or window. Reload to refresh your session. You switched accounts on another tab or window. Reload to refresh your session. Dismiss alert
echo "Quant $QFORMAT not supported with the TensorRT-LLM torch llmapi. Allowed values are: fp8, nvfp4, bf16, fp16, int4_awq, w4a8_awq"
197
+
echo "Quant $QFORMAT specified. Please read TensorRT-LLM quantization support matrix https://nvidia.github.io/TensorRT-LLM/features/quantization.html#quantization-in-tensorrt-llm and use TensorRT-LLM for deployment. Checkpoint export_path: $SAVE_PATH"
198
198
exit 0
199
199
fi
200
200
@@ -333,12 +333,6 @@ if [[ $TASKS =~ "livecodebench" || $TASKS =~ "simple_eval" ]]; then
333
333
fi
334
334
335
335
if [[ $TASKS =~ "benchmark" ]]; then
336
-
337
-
if [ "$PP" -ne 1 ]; then
338
-
echo "Benchmark does not work with multi PP. Please run the c++ benchmark in the TensorRT-LLM repo..."
339
-
exit 1
340
-
fi
341
-
342
336
BENCHMARK_RESULT=${SAVE_PATH}/benchmark.txt
343
337
echo "Evaluating performance, result saved to $BENCHMARK_RESULT..."
344
338
@@ -371,12 +365,17 @@ if [[ $TASKS =~ "benchmark" ]]; then
0 commit comments