Skip to content

Commit

Permalink
Expose the batch size of INT8 calibration as a parameter, since different
Browse files Browse the repository at this point in the history
batch sizes may result in different accuracy loss.
  • Loading branch information
Chujingjun committed Sep 2, 2020
1 parent 63895f0 commit 3ddd70d
Showing 1 changed file with 2 additions and 1 deletion.
3 changes: 2 additions & 1 deletion torch2trt/torch2trt.py
Original file line number Diff line number Diff line change
Expand Up @@ -392,6 +392,7 @@ def torch2trt(module,
int8_mode=False,
int8_calib_dataset=None,
int8_calib_algorithm=DEFAULT_CALIBRATION_ALGORITHM,
int8_calib_batch_size=1,
use_onnx=False):

inputs_in = inputs
Expand Down Expand Up @@ -454,7 +455,7 @@ def torch2trt(module,

# @TODO(jwelsh): Should we set batch_size=max_batch_size? Need to investigate memory consumption
builder.int8_calibrator = DatasetCalibrator(
inputs, int8_calib_dataset, batch_size=1, algorithm=int8_calib_algorithm
inputs, int8_calib_dataset, batch_size=int8_calib_batch_size, algorithm=int8_calib_algorithm
)

engine = builder.build_cuda_engine(network)
Expand Down

0 comments on commit 3ddd70d

Please sign in to comment.