Improve benchmark configurations (#2)

* Improve benchmark configurations:

* Move data downloading from configs to download_data.py. Add an alternative download link.

* Add Data class to handle data loading and indexing.

* Add Metric class to handle benchmark runs.

* Benchmark results are now the median or geometric mean of benchmark
runs.

Files changed (6) hide show

benchmark/README.md +4 -0
benchmark/benchmark.py +114 -77
benchmark/config/face_detection_yunet.yaml +11 -16
benchmark/config/text_detection_db.yaml +10 -15
benchmark/config/text_recognition_crnn.yaml +9 -14
benchmark/{download.py → download_data.py} +44 -14

benchmark/README.md CHANGED Viewed

@@ -10,6 +10,10 @@ Time is measured from data preprocess (resize is excluded), to a forward pass of
 1. Install `python >= 3.6`.
 2. Install dependencies: `pip install -r requirements.txt`.
 ## Benchmarking

 1. Install `python >= 3.6`.
 2. Install dependencies: `pip install -r requirements.txt`.
+3. Download data for benchmarking.
+    1. Download all data: `python download_data.py`
+    2. Download one or more specific data packages: `python download_data.py face text`. Available names are listed in `download_data.py`.
+    3. If the download fails, you can download all data from https://pan.baidu.com/s/18sV8D4vXUb2xC9EG45k7bg (code: pvrw). Please place the data packages under [./data](./data) and extract them there.
 ## Benchmarking

benchmark/benchmark.py CHANGED Viewed

@@ -7,7 +7,6 @@ import numpy as np
 import cv2 as cv
 from models import MODELS
-from download import Downloader
 parser = argparse.ArgumentParser("Benchmarks for OpenCV Zoo.")
 parser.add_argument('--cfg', '-c', type=str,
@@ -15,11 +14,11 @@ parser.add_argument('--cfg', '-c', type=str,
 args = parser.parse_args()
 class Timer:
-    def __init__(self):
         self._tm = cv.TickMeter()
         self._time_record = []
-        self._average_time = 0
         self._calls = 0
     def start(self):
@@ -29,22 +28,121 @@ class Timer:
         self._tm.stop()
         self._calls += 1
         self._time_record.append(self._tm.getTimeMilli())
-        self._average_time = sum(self._time_record) / self._calls
         self._tm.reset()
     def reset(self):
         self._time_record = []
-        self._average_time = 0
         self._calls = 0
-    def getAverageTime(self):
-        return self._average_time
 class Benchmark:
     def __init__(self, **kwargs):
-        self._fileList = kwargs.pop('fileList', None)
-        assert self._fileList, 'fileList cannot be empty'
         backend_id = kwargs.pop('backend', 'default')
         available_backends = dict(
@@ -71,76 +169,22 @@ class Benchmark:
         )
         self._target = available_targets[target_id]
-        self._sizes = kwargs.pop('sizes', None)
-        self._repeat = kwargs.pop('repeat', 100)
-        self._parentPath = kwargs.pop('parentPath', 'benchmark/data')
-        self._useGroundTruth = kwargs.pop('useDetectionLabel', False) # If it is enable, 'sizes' will not work
-        assert (self._sizes and not self._useGroundTruth) or (not self._sizes and self._useGroundTruth), 'If \'useDetectionLabel\' is True, \'sizes\' should not exist.'
-        self._timer = Timer()
-        self._benchmark_results = dict.fromkeys(self._fileList, dict())
-        if self._useGroundTruth:
-            self.loadLabel()
-    def loadLabel(self):
-        self._labels = dict.fromkeys(self._fileList, None)
-        for imgName in self._fileList:
-            self._labels[imgName] = np.loadtxt(os.path.join(self._parentPath, '{}.txt'.format(imgName[:-4])))
     def run(self, model):
         model.setBackend(self._backend)
         model.setTarget(self._target)
-        for imgName in self._fileList:
-            img = cv.imread(os.path.join(self._parentPath, imgName))
-            if self._useGroundTruth:
-                for idx, gt in enumerate(self._labels[imgName]):
-                    self._benchmark_results[imgName]['gt{}'.format(idx)] = self._run(
-                        model,
-                        img,
-                        gt,
-                        pbar_msg='  {}, gt{}'.format(imgName, idx)
-                    )
-            else:
-                if self._sizes is None:
-                    h, w, _ = img.shape
-                    model.setInputSize([w, h])
-                    self._benchmark_results[imgName][str([w, h])] = self._run(
-                        model,
-                        img,
-                        pbar_msg='  {}, original size {}'.format(imgName, str([w, h]))
-                    )
-                else:
-                    for size in self._sizes:
-                        imgResized = cv.resize(img, size)
-                        model.setInputSize(size)
-                        self._benchmark_results[imgName][str(size)] = self._run(
-                            model,
-                            imgResized,
-                            pbar_msg='  {}, size {}'.format(imgName, str(size))
-                        )
     def printResults(self):
-        print('  Results:')
         for imgName, results in self._benchmark_results.items():
-            print('    image: {}'.format(imgName))
             total_latency = 0
             for key, latency in results.items():
                 total_latency += latency
-                print('        {}, latency: {:.4f} ms'.format(key, latency))
-            print('        Average latency: {:.4f} ms'.format(total_latency / len(results)))
-    def _run(self, model, *args, **kwargs):
-        self._timer.reset()
-        pbar = tqdm.tqdm(range(self._repeat))
-        for _ in pbar:
-            pbar.set_description(kwargs.get('pbar_msg', None))
-            self._timer.start()
-            results = model.infer(*args)
-            self._timer.stop()
-        return self._timer.getAverageTime()
 def build_from_cfg(cfg, registery):
@@ -160,16 +204,9 @@ if __name__ == '__main__':
         cfg = yaml.safe_load(f)
     # prepend PYTHONPATH to each path
-    prepend_pythonpath(cfg, key1='Data', key2='parentPath')
-    prepend_pythonpath(cfg, key1='Benchmark', key2='parentPath')
     prepend_pythonpath(cfg, key1='Model', key2='modelPath')
-    # Download data if not exist
-    print('Loading data:')
-    downloader = Downloader(**cfg['Data'])
-    downloader.get()
     # Instantiate benchmarking
     benchmark = Benchmark(**cfg['Benchmark'])

 import cv2 as cv
 from models import MODELS
 parser = argparse.ArgumentParser("Benchmarks for OpenCV Zoo.")
 parser.add_argument('--cfg', '-c', type=str,
 args = parser.parse_args()
 class Timer:
+    def __init__(self, warmup=0, reduction='median'):
+        ''' Create a timer that records one time per measured call
+        warmup: number of leading records that getResult() leaves out
+        reduction: 'median' or 'gmean', selects how getResult() reduces the records
+        '''
+        self._warmup = warmup
+        self._reduction = reduction
         self._tm = cv.TickMeter()
         self._time_record = []
         self._calls = 0
     def start(self):
         self._tm.stop()
         self._calls += 1
         self._time_record.append(self._tm.getTimeMilli())
         self._tm.reset()
     def reset(self):
+        ''' Discard all recorded times and set the call counter back to zero
+        '''
         self._time_record = []
         self._calls = 0
+    def getResult(self):
+        ''' Return the recorded times reduced to a single value
+        The first self._warmup records are left out of the reduction.
+        Raises NotImplementedError for a reduction other than 'median' or 'gmean'.
+        '''
+        if self._reduction == 'median':
+            reduce_records = self._getMedian
+        elif self._reduction == 'gmean':
+            reduce_records = self._getGMean
+        else:
+            raise NotImplementedError()
+        measured = self._time_record[self._warmup:]
+        return reduce_records(measured)
+    def _getMedian(self, records):
+        ''' Return median time
+        records: time measurements in any order; the list is not modified.
+        Returns the middle value of the sorted records, or the mean of the two
+        middle values when the number of records is even.
+        Raises ValueError if records is empty.
+        '''
+        if not records:
+            raise ValueError('Cannot compute the median of an empty time record.')
+        # Measurements arrive in call order, but the median is only defined on
+        # ordered data, so work on a sorted copy.
+        ordered = sorted(records)
+        mid = len(ordered) // 2
+        if len(ordered) % 2 == 0:
+            return (ordered[mid] + ordered[mid - 1]) / 2
+        return ordered[mid]
+    def _getGMean(self, records, drop_largest=3):
+        ''' Return geometric mean of time
+        records: time measurements in any order; the list is not modified.
+        drop_largest: number of largest measurements discarded as outliers
+        before the mean is taken.
+        Returns 0.0 if any kept measurement is not positive.
+        Raises ValueError if no measurement is left after dropping.
+        '''
+        import math
+        kept = sorted(records)
+        if drop_largest > 0:
+            # The list is ascending, so the largest values sit at the end.
+            kept = kept[:-drop_largest]
+        if not kept:
+            raise ValueError('No time record left after dropping the {} largest.'.format(drop_largest))
+        if kept[0] <= 0:
+            # A zero factor makes the product, and thus the geometric mean, zero.
+            return 0.0
+        # Average the logarithms instead of multiplying the values so that long
+        # records cannot overflow.
+        return math.exp(sum(math.log(t) for t in kept) / len(kept))
+class Data:
+    ''' Images, and optionally their labels, used for benchmarking
+    Keyword arguments:
+    path: directory holding the images (required).
+    files: image file names inside path; when empty, every file in path whose
+    name ends with jpg or png is used.
+    useLabel: when True, a label is loaded with np.loadtxt for each image from
+    the .txt file that shares the image's base name.
+    Indexing returns (file name, image) or, with labels, (file name, image, label).
+    '''
+    def __init__(self, **kwargs):
+        self._path = kwargs.pop('path', None)
+        assert self._path, 'Benchmark[\'data\'][\'path\'] cannot be empty.'
+        self._files = kwargs.pop('files', None)
+        if not self._files:
+            print('Benchmark[\'data\'][\'files\'] is empty, loading all images by default.')
+            # os.listdir() returns entries in arbitrary order; sort them so
+            # that every run visits the images in the same order.
+            self._files = sorted(
+                filename for filename in os.listdir(self._path)
+                if filename.endswith(('jpg', 'png'))
+            )
+        self._use_label = kwargs.pop('useLabel', False)
+        self._labels = self._load_label() if self._use_label else None
+    def _load_label(self):
+        ''' Return a dict mapping each image file name to its loaded label
+        '''
+        labels = dict()
+        for filename in self._files:
+            # splitext() copes with extensions of any length, e.g. '.jpeg'.
+            stem = os.path.splitext(filename)[0]
+            labels[filename] = np.loadtxt(os.path.join(self._path, '{}.txt'.format(stem)))
+        return labels
+    def __len__(self):
+        return len(self._files)
+    def __getitem__(self, idx):
+        # An IndexError raised here for idx past the end is what terminates
+        # 'for ... in data' loops.
+        filename = self._files[idx]
+        image_path = os.path.join(self._path, filename)
+        image = cv.imread(image_path)
+        if image is None:
+            # cv.imread() signals failure by returning None instead of raising.
+            raise IOError('Failed to read image: {}'.format(image_path))
+        if self._use_label:
+            return filename, image, self._labels[filename]
+        return filename, image
+class Metric:
+    ''' Measure the inference time of a model on one input
+    Keyword arguments:
+    sizes: list of [w, h] the image is resized to; when omitted, each image is
+    run at its own size.
+    warmup: number of leading runs left out of the result (default 3).
+    repeat: number of measured runs (default 10), must be larger than warmup.
+    batchSize: stored for batched inference, which is not implemented yet.
+    reduction: 'median' or 'gmean', how the measured times are reduced.
+    '''
+    def __init__(self, **kwargs):
+        self._sizes = kwargs.pop('sizes', None)
+        self._warmup = kwargs.pop('warmup', 3)
+        self._repeat = kwargs.pop('repeat', 10)
+        assert self._warmup < self._repeat, 'The value of warmup must be smaller than the value of repeat.'
+        self._batch_size = kwargs.pop('batchSize', 1)
+        self._reduction = kwargs.pop('reduction', 'median')
+        self._timer = Timer(self._warmup, self._reduction)
+    def getReduction(self):
+        return self._reduction
+    def _measure(self, model, *inputs):
+        ''' Time repeat + warmup calls of model.infer(*inputs) and return the reduced time
+        '''
+        # Start from an empty record so that the timings of a previous size or
+        # bounding box do not leak into this result.
+        self._timer.reset()
+        for _ in range(self._repeat + self._warmup):
+            self._timer.start()
+            model.infer(*inputs)
+            self._timer.stop()
+        return self._timer.getResult()
+    def forward(self, model, *args, **kwargs):
+        ''' Benchmark model on one image
+        args holds the image, optionally followed by its bounding boxes.
+        Returns a dict mapping str(size), or 'bbox<idx>' when bounding boxes are
+        given, to the reduced inference time.
+        '''
+        img = args[0]
+        results = dict()
+        if len(args) == 1:
+            sizes = self._sizes
+            if not sizes:
+                # Fall back to this image's own size. It is kept in a local so
+                # that the next image is not resized to this one's size.
+                h, w, _ = img.shape
+                sizes = [[w, h]]
+            for size in sizes:
+                img_r = cv.resize(img, size)
+                model.setInputSize(size)
+                # TODO: batched inference
+                # input_data = [img] * self._batch_size
+                results[str(size)] = self._measure(model, img_r)
+        else:
+            # TODO: batched inference
+            # input_data = [args] * self._batch_size
+            bboxes = args[1]
+            for idx, bbox in enumerate(bboxes):
+                results['bbox{}'.format(idx)] = self._measure(model, img, bbox)
+        return results
 class Benchmark:
     def __init__(self, **kwargs):
+        self._data_dict = kwargs.pop('data', None)
+        assert self._data_dict, 'Benchmark[\'data\'] cannot be empty and must have path and files.'
+        self._data = Data(**self._data_dict)
+        self._metric_dict = kwargs.pop('metric', None)
+        self._metric = Metric(**self._metric_dict)
         backend_id = kwargs.pop('backend', 'default')
         available_backends = dict(
         )
         self._target = available_targets[target_id]
+        self._benchmark_results = dict()
     def run(self, model):
+        ''' Benchmark model on every item of the data and store the results per file name
+        '''
         model.setBackend(self._backend)
         model.setTarget(self._target)
+        for data in self._data:
+            # data[0] is the file name; the remaining items (the image and,
+            # when labels are used, its label) are the inputs to measure.
+            self._benchmark_results[data[0]] = self._metric.forward(model, *data[1:])
     def printResults(self):
+        ''' Print the latency of every measurement, grouped by image
+        '''
         for imgName, results in self._benchmark_results.items():
+            print('  image: {}'.format(imgName))
+            # NOTE(review): total_latency is accumulated below but not used in
+            # the code visible here - confirm whether it can be removed.
             total_latency = 0
             for key, latency in results.items():
                 total_latency += latency
+                print('      {}, latency ({}): {:.4f} ms'.format(key, self._metric.getReduction(), latency))
 def build_from_cfg(cfg, registery):
         cfg = yaml.safe_load(f)
     # prepend PYTHONPATH to each path
+    prepend_pythonpath(cfg['Benchmark'], key1='data', key2='path')
     prepend_pythonpath(cfg, key1='Model', key2='modelPath')
     # Instantiate benchmarking
     benchmark = Benchmark(**cfg['Benchmark'])

benchmark/config/face_detection_yunet.yaml CHANGED Viewed

@@ -1,23 +1,18 @@
-Data:
-  name: "Images for Face Detection"
-  url: "https://drive.google.com/u/0/uc?id=1lOAliAIeOv4olM65YDzE55kn6XjiX2l6&export=download"
-  sha: "0ba67a9cfd60f7fdb65cdb7c55a1ce76c1193df1"
-  filename: "face_detection.zip"
-  parentPath: "benchmark/data"
 Benchmark:
   name: "Face Detection Benchmark"
-  parentPath: "benchmark/data/face_detection"
-  fileList:
-    - "group.jpg"
-    - "concerts.jpg"
-    - "dance.jpg"
   backend: "default"
   target: "cpu"
-  sizes: # [w, h], Omit to run at original scale
-    - [160, 120]
-    - [640, 480]
-  repeat: 100 # default 100
 Model:
   name: "YuNet"

 Benchmark:
   name: "Face Detection Benchmark"
+  data:
+    path: "benchmark/data/face"
+    files: ["group.jpg", "concerts.jpg", "dance.jpg"]
+  metric:
+    sizes: # [[w1, h1], ...], Omit to run at original scale
+      - [160, 120]
+      - [640, 480]
+    warmup: 3
+    repeat: 10
+    batchSize: 1
+    reduction: 'median'
   backend: "default"
   target: "cpu"
 Model:
   name: "YuNet"

benchmark/config/text_detection_db.yaml CHANGED Viewed

@@ -1,22 +1,17 @@
-Data:
-  name: "Images for Text Detection"
-  url: "https://drive.google.com/u/0/uc?id=1lTQdZUau7ujHBqp0P6M1kccnnJgO-dRj&export=download"
-  sha: "a40cf095ceb77159ddd2a5902f3b4329696dd866"
-  filename: "text.zip"
-  parentPath: "benchmark/data"
 Benchmark:
   name: "Text Detection Benchmark"
-  parentPath: "benchmark/data/text"
-  fileList:
-    - "1.jpg"
-    - "2.jpg"
-    - "3.jpg"
   backend: "default"
   target: "cpu"
-  sizes: # [w, h], default original scale
-    - [640, 480]
-  repeat: 100
 Model:
   name: "DB"

 Benchmark:
   name: "Text Detection Benchmark"
+  data:
+    path: "benchmark/data/text"
+    files: ["1.jpg", "2.jpg", "3.jpg"]
+  metric:
+    sizes: # [[w1, h1], ...], Omit to run at original scale
+      - [640, 480]
+    warmup: 3
+    repeat: 10
+    batchSize: 1
+    reduction: 'median'
   backend: "default"
   target: "cpu"
 Model:
   name: "DB"

benchmark/config/text_recognition_crnn.yaml CHANGED Viewed

@@ -1,21 +1,16 @@
-Data:
-  name: "Images for Text Detection"
-  url: "https://drive.google.com/u/0/uc?id=1lTQdZUau7ujHBqp0P6M1kccnnJgO-dRj&export=download"
-  sha: "a40cf095ceb77159ddd2a5902f3b4329696dd866"
-  filename: "text.zip"
-  parentPath: "benchmark/data"
 Benchmark:
   name: "Text Recognition Benchmark"
-  parentPath: "benchmark/data/text"
-  fileList:
-    - "1.jpg"
-    - "2.jpg"
-    - "3.jpg"
   backend: "default"
   target: "cpu"
-  useDetectionLabel: True
-  repeat: 100
 Model:
   name: "CRNN"

 Benchmark:
   name: "Text Recognition Benchmark"
+  data:
+    path: "benchmark/data/text"
+    files: ["1.jpg", "2.jpg", "3.jpg"]
+    useLabel: True
+  metric: # 'sizes' is omitted since this model requires input of fixed size
+    warmup: 3
+    repeat: 10
+    batchSize: 1
+    reduction: 'median'
   backend: "default"
   target: "cpu"
 Model:
   name: "CRNN"

benchmark/{download.py → download_data.py} RENAMED Viewed

@@ -32,7 +32,7 @@ class Downloader:
                 if c in d:
                     return int(d[c]) / self.MB
             return '<unknown>'
-        print('  {} {} [{} Mb]'.format(r.getcode(), r.msg, getMB(r)))
     def verifyHash(self):
         if not self._sha:
@@ -46,44 +46,45 @@ class Downloader:
                         break
                     sha.update(buf)
             if self._sha != sha.hexdigest():
-                print('  actual {}'.format(sha.hexdigest()))
-                print('  expect {}'.format(self._sha))
             return self._sha == sha.hexdigest()
         except Exception as e:
-            print('  catch {}'.format(e))
     def get(self):
         if self.verifyHash():
-            print('  hash match - skipping download')
         else:
             basedir = os.path.dirname(self._saveTo)
             if basedir and not os.path.exists(basedir):
-                print('  creating directory: ' + basedir)
                 os.makedirs(basedir, exist_ok=True)
-            print('  hash check failed - downloading')
             if 'drive.google.com' in self._url:
                 urlquery = urlparse(self._url).query.split('&')
                 for q in urlquery:
                     if 'id=' in q:
                         gid = q[3:]
                 sz = GDrive(gid)(osp.join(self._saveTo, self._filename))
-                print('  size = %.2f Mb' % (sz / (1024.0 * 1024)))
             else:
-                print('  get {}'.format(self._url))
                 self.download()
             # Verify hash after download
-            print(' done')
-            print(' file {}'.format(self._filename))
             if self.verifyHash():
-                print('  hash match - extracting')
             else:
-                print('  hash check failed - exiting')
         # Extract
         if '.zip' in self._filename:
-            print('  extracting - ', end='')
             self.extract()
             print('done')
@@ -161,3 +162,32 @@ def GDrive(gid):
         print('')
         return sz
     return download_gdrive

                 if c in d:
                     return int(d[c]) / self.MB
             return '<unknown>'
+        print('    {} {} [{} Mb]'.format(r.getcode(), r.msg, getMB(r)))
     def verifyHash(self):
         if not self._sha:
                         break
                     sha.update(buf)
             if self._sha != sha.hexdigest():
+                print('    actual {}'.format(sha.hexdigest()))
+                print('    expect {}'.format(self._sha))
             return self._sha == sha.hexdigest()
         except Exception as e:
+            print('    catch {}'.format(e))
     def get(self):
+        print('  {}: {}'.format(self._name, self._filename))
         if self.verifyHash():
+            print('    hash match - skipping download')
         else:
             basedir = os.path.dirname(self._saveTo)
             if basedir and not os.path.exists(basedir):
+                print('    creating directory: ' + basedir)
                 os.makedirs(basedir, exist_ok=True)
+            print('    hash check failed - downloading')
             if 'drive.google.com' in self._url:
                 urlquery = urlparse(self._url).query.split('&')
                 for q in urlquery:
                     if 'id=' in q:
                         gid = q[3:]
                 sz = GDrive(gid)(osp.join(self._saveTo, self._filename))
+                print('    size = %.2f Mb' % (sz / (1024.0 * 1024)))
             else:
+                print('    get {}'.format(self._url))
                 self.download()
             # Verify hash after download
+            print('    done')
+            print('    file {}'.format(self._filename))
             if self.verifyHash():
+                print('    hash match - extracting')
             else:
+                print('    hash check failed - exiting')
         # Extract
         if '.zip' in self._filename:
+            print('    extracting - ', end='')
             self.extract()
             print('done')
         print('')
         return sz
     return download_gdrive
+# Data will be downloaded and extracted to ./data by default
+# The keys are the data names that can be passed on the command line.
+data_downloaders = dict(
+    face=Downloader(name='face',
+        url='https://drive.google.com/u/0/uc?id=1lOAliAIeOv4olM65YDzE55kn6XjiX2l6&export=download',
+        sha='8397f115c0d4447e55ea05488579e71a813e2691',
+        filename='face.zip'),
+    text=Downloader(name='text',
+        url='https://drive.google.com/u/0/uc?id=1lTQdZUau7ujHBqp0P6M1kccnnJgO-dRj&export=download',
+        sha='a40cf095ceb77159ddd2a5902f3b4329696dd866',
+        filename='text.zip'),
+)
+if __name__ == '__main__':
+    # Data names are given as positional arguments; without any, all known
+    # data is downloaded.
+    selected_data_names = sys.argv[1:]
+    if not selected_data_names:
+        selected_data_names = list(data_downloaders.keys())
+    # Reject unknown names up front instead of failing with a KeyError after
+    # some downloads have already run.
+    unknown_data_names = [name for name in selected_data_names if name not in data_downloaders]
+    if unknown_data_names:
+        sys.exit('Unknown data: {}. Available data: {}'.format(
+            str(unknown_data_names), str(list(data_downloaders.keys()))))
+    print('Data will be downloaded: {}'.format(str(selected_data_names)))
+    download_failed = []
+    for selected_data_name in selected_data_names:
+        downloader = data_downloaders[selected_data_name]
+        if not downloader.get():
+            download_failed.append(selected_data_name)
+    if download_failed:
+        print('Data have not been downloaded: {}'.format(str(download_failed)))