"""calibrator.py The original code could be found in TensorRT-7.x sample code: "samples/python/int8_caffe_mnist/calibrator.py". I made the modification so that the Calibrator could handle MS-COCO dataset images instead of MNIST. """ # # Copyright 1993-2019 NVIDIA Corporation. All rights reserved. # # NOTICE TO LICENSEE: # # This source code and/or documentation ("Licensed Deliverables") are # subject to NVIDIA intellectual property rights under U.S. and # international Copyright laws. # # These Licensed Deliverables contained herein is PROPRIETARY and # CONFIDENTIAL to NVIDIA and is being provided under the terms and # conditions of a form of NVIDIA software license agreement by and # between NVIDIA and Licensee ("License Agreement") or electronically # accepted by Licensee. Notwithstanding any terms or conditions to # the contrary in the License Agreement, reproduction or disclosure # of the Licensed Deliverables to any third party without the express # written consent of NVIDIA is prohibited. # # NOTWITHSTANDING ANY TERMS OR CONDITIONS TO THE CONTRARY IN THE # LICENSE AGREEMENT, NVIDIA MAKES NO REPRESENTATION ABOUT THE # SUITABILITY OF THESE LICENSED DELIVERABLES FOR ANY PURPOSE. IT IS # PROVIDED "AS IS" WITHOUT EXPRESS OR IMPLIED WARRANTY OF ANY KIND. # NVIDIA DISCLAIMS ALL WARRANTIES WITH REGARD TO THESE LICENSED # DELIVERABLES, INCLUDING ALL IMPLIED WARRANTIES OF MERCHANTABILITY, # NONINFRINGEMENT, AND FITNESS FOR A PARTICULAR PURPOSE. # NOTWITHSTANDING ANY TERMS OR CONDITIONS TO THE CONTRARY IN THE # LICENSE AGREEMENT, IN NO EVENT SHALL NVIDIA BE LIABLE FOR ANY # SPECIAL, INDIRECT, INCIDENTAL, OR CONSEQUENTIAL DAMAGES, OR ANY # DAMAGES WHATSOEVER RESULTING FROM LOSS OF USE, DATA OR PROFITS, # WHETHER IN AN ACTION OF CONTRACT, NEGLIGENCE OR OTHER TORTIOUS # ACTION, ARISING OUT OF OR IN CONNECTION WITH THE USE OR PERFORMANCE # OF THESE LICENSED DELIVERABLES. # # U.S. Government End Users. These Licensed Deliverables are a # "commercial item" as that term is defined at 48 C.F.R. 2.101 (OCT # 1995), consisting of "commercial computer software" and "commercial # computer software documentation" as such terms are used in 48 # C.F.R. 12.212 (SEPT 1995) and is provided to the U.S. Government # only as a commercial end item. Consistent with 48 C.F.R.12.212 and # 48 C.F.R. 227.7202-1 through 227.7202-4 (JUNE 1995), all # U.S. Government End Users acquire the Licensed Deliverables with # only those rights set forth herein. # # Any use of the Licensed Deliverables in individual and commercial # software must include, in the user documentation and internal # comments to the code, the above Disclaimer and U.S. Government End # Users Notice. import os import numpy as np import cv2 import pycuda.autoinit import pycuda.driver as cuda import tensorrt as trt def _preprocess_yolo(img, input_shape): """Preprocess an image before TRT YOLO inferencing. # Args img: uint8 numpy array of shape either (img_h, img_w, 3) or (img_h, img_w) input_shape: a tuple of (H, W) # Returns preprocessed img: float32 numpy array of shape (3, H, W) """ if img.ndim == 2: img = cv2.cvtColor(img, cv2.COLOR_GRAY2BGR) img = cv2.resize(img, (input_shape[1], input_shape[0])) img = cv2.cvtColor(img, cv2.COLOR_BGR2RGB) img = img.transpose((2, 0, 1)).astype(np.float32) img /= 255.0 return img class YOLOEntropyCalibrator(trt.IInt8EntropyCalibrator2): """YOLOEntropyCalibrator This class implements TensorRT's IInt8EntropyCalibtrator2 interface. It reads all images from the specified directory and generates INT8 calibration data for YOLO models accordingly. """ def __init__(self, img_dir, net_hw, cache_file, batch_size=1): if not os.path.isdir(img_dir): raise FileNotFoundError('%s does not exist' % img_dir) if len(net_hw) != 2 or net_hw[0] % 32 or net_hw[1] % 32: raise ValueError('bad net shape: %s' % str(net_hw)) super().__init__() # trt.IInt8EntropyCalibrator2.__init__(self) self.img_dir = img_dir self.net_hw = net_hw self.cache_file = cache_file self.batch_size = batch_size self.blob_size = 3 * net_hw[0] * net_hw[1] * np.dtype('float32').itemsize * batch_size self.jpgs = [f for f in os.listdir(img_dir) if f.endswith('.jpg')] # The number "500" is NVIDIA's suggestion. See here: # https://docs.nvidia.com/deeplearning/tensorrt/developer-guide/index.html#optimizing_int8_c if len(self.jpgs) < 500: print('WARNING: found less than 500 images in %s!' % img_dir) self.current_index = 0 # Allocate enough memory for a whole batch. self.device_input = cuda.mem_alloc(self.blob_size) def __del__(self): del self.device_input # free CUDA memory def get_batch_size(self): return self.batch_size def get_batch(self, names): if self.current_index + self.batch_size > len(self.jpgs): return None current_batch = int(self.current_index / self.batch_size) batch = [] for i in range(self.batch_size): img_path = os.path.join( self.img_dir, self.jpgs[self.current_index + i]) img = cv2.imread(img_path) assert img is not None, 'failed to read %s' % img_path batch.append(_preprocess_yolo(img, self.net_hw)) batch = np.stack(batch) assert batch.nbytes == self.blob_size cuda.memcpy_htod(self.device_input, np.ascontiguousarray(batch)) self.current_index += self.batch_size return [self.device_input] def read_calibration_cache(self): # If there is a cache, use it instead of calibrating again. # Otherwise, implicitly return None. if os.path.exists(self.cache_file): with open(self.cache_file, 'rb') as f: return f.read() def write_calibration_cache(self, cache): with open(self.cache_file, 'wb') as f: f.write(cache)