Skip to content

Commit 3ddd70d

Browse files
committed
expose the batch size of INT8 calibration as a parameter, since different
batch sizes may yield different accuracy loss.
1 parent 63895f0 commit 3ddd70d

File tree

1 file changed

+2
-1
lines changed

1 file changed

+2
-1
lines changed

torch2trt/torch2trt.py

Lines changed: 2 additions & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -392,6 +392,7 @@ def torch2trt(module,
392392
int8_mode=False,
393393
int8_calib_dataset=None,
394394
int8_calib_algorithm=DEFAULT_CALIBRATION_ALGORITHM,
395+
int8_calib_batch_size=1,
395396
use_onnx=False):
396397

397398
inputs_in = inputs
@@ -454,7 +455,7 @@ def torch2trt(module,
454455

455456
# @TODO(jwelsh): Should we set batch_size=max_batch_size? Need to investigate memory consumption
456457
builder.int8_calibrator = DatasetCalibrator(
457-
inputs, int8_calib_dataset, batch_size=1, algorithm=int8_calib_algorithm
458+
inputs, int8_calib_dataset, batch_size=int8_calib_batch_size, algorithm=int8_calib_algorithm
458459
)
459460

460461
engine = builder.build_cuda_engine(network)

0 commit comments

Comments
 (0)