
try:
    from waymo_open_dataset import dataset_pb2 as open_dataset
+    from waymo_open_dataset import label_pb2
+    from waymo_open_dataset.protos import metrics_pb2
+    from waymo_open_dataset.protos.metrics_pb2 import Objects
except ImportError:
+    Objects = None
    raise ImportError(
        'Please run "pip install waymo-open-dataset-tf-2-1-0==1.2.0" '
        'to install the official devkit first.')

from glob import glob
from os.path import join
+from typing import List, Optional

import mmengine
import numpy as np
import tensorflow as tf
-from waymo_open_dataset import label_pb2
-from waymo_open_dataset.protos import metrics_pb2


-class KITTI2Waymo(object):
-    """KITTI predictions to Waymo converter.
+class Prediction2Waymo(object):
+    """Predictions to Waymo converter. The format of the prediction results
+    may be the original format or KITTI format.

    This class serves as the converter to change predictions from KITTI to
    Waymo format.

    Args:
-        kitti_result_files (list[dict]): Predictions in KITTI format.
+        results (list[dict]): Prediction results.
        waymo_tfrecords_dir (str): Directory to load waymo raw data.
        waymo_results_save_dir (str): Directory to save converted predictions
            in waymo format (.bin files).
        waymo_results_final_path (str): Path to save combined
            predictions in waymo format (.bin file), like 'a/b/c.bin'.
        prefix (str): Prefix of filename. In general, 0 for training, 1 for
            validation and 2 for testing.
-        workers (str): Number of parallel processes.
+        classes (dict): A list of class names.
+        workers (int): Number of parallel processes. Defaults to 2.
+        file_client_args (dict): File client for reading gt in waymo format.
+            Defaults to ``dict(backend='disk')``.
+        from_kitti_format (bool, optional): Whether the results are in KITTI
+            format. Defaults to False.
+        idx2metainfo (Optional[dict], optional): The mapping from sample_idx
+            to metainfo. The metainfo must contain the keys:
+            'idx2contextname' and 'idx2timestamp'. Defaults to None.
    """

    def __init__(self,
-                 kitti_result_files,
-                 waymo_tfrecords_dir,
-                 waymo_results_save_dir,
-                 waymo_results_final_path,
-                 prefix,
-                 workers=64,
-                 file_client_args=dict(backend='disk')):
-
-        self.kitti_result_files = kitti_result_files
+                 results: List[dict],
+                 waymo_tfrecords_dir: str,
+                 waymo_results_save_dir: str,
+                 waymo_results_final_path: str,
+                 prefix: str,
+                 classes: dict,
+                 workers: int = 2,
+                 file_client_args: dict = dict(backend='disk'),
+                 from_kitti_format: bool = False,
+                 idx2metainfo: Optional[dict] = None):
+
+        self.results = results
        self.waymo_tfrecords_dir = waymo_tfrecords_dir
        self.waymo_results_save_dir = waymo_results_save_dir
        self.waymo_results_final_path = waymo_results_final_path
        self.prefix = prefix
+        self.classes = classes
        self.workers = int(workers)
        self.file_client_args = file_client_args
-        self.name2idx = {}
-        for idx, result in enumerate(kitti_result_files):
-            if len(result['sample_id']) > 0:
-                self.name2idx[str(result['sample_id'][0])] = idx
+        self.from_kitti_format = from_kitti_format
+        if idx2metainfo is not None:
+            self.idx2metainfo = idx2metainfo
+            # If ``fast_eval``, the metainfo does not need to be read from
+            # original data online. It's preprocessed offline.
+            self.fast_eval = True
+        else:
+            self.fast_eval = False
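        # A hedged sketch of the ``idx2metainfo`` layout consumed by
        # ``convert_one_fast`` below; the sample index and values are
        # made-up placeholders:
        #   idx2metainfo = {
        #       '1000000': {'contextname': '<waymo context name>',
        #                   'timestamp': <frame timestamp in microseconds>},
        #       ...
        #   }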

-        # turn on eager execution for older tensorflow versions
-        if int(tf.__version__.split('.')[0]) < 2:
-            tf.enable_eager_execution()
+        self.name2idx = {}

        self.k2w_cls_map = {
            'Car': label_pb2.Label.TYPE_VEHICLE,
@@ -70,12 +88,28 @@ def __init__(self,
            'Cyclist': label_pb2.Label.TYPE_CYCLIST,
        }

-        self.T_ref_to_front_cam = np.array([[0.0, 0.0, 1.0, 0.0],
-                                            [-1.0, 0.0, 0.0, 0.0],
-                                            [0.0, -1.0, 0.0, 0.0],
-                                            [0.0, 0.0, 0.0, 1.0]])
+        if self.from_kitti_format:
+            self.T_ref_to_front_cam = np.array([[0.0, 0.0, 1.0, 0.0],
+                                                [-1.0, 0.0, 0.0, 0.0],
+                                                [0.0, -1.0, 0.0, 0.0],
+                                                [0.0, 0.0, 0.0, 1.0]])
+            # ``sample_idx`` of the sample in kitti-format is an array
+            for idx, result in enumerate(results):
+                if len(result['sample_idx']) > 0:
+                    self.name2idx[str(result['sample_idx'][0])] = idx
+        else:
+            # ``sample_idx`` of the sample in the original prediction
+            # is an int value.
+            for idx, result in enumerate(results):
+                self.name2idx[str(result['sample_idx'])] = idx
+
+        if not self.fast_eval:
+            # need to read original '.tfrecord' file
+            self.get_file_names()
+            # turn on eager execution for older tensorflow versions
+            if int(tf.__version__.split('.')[0]) < 2:
+                tf.enable_eager_execution()

-        self.get_file_names()
        self.create_folder()

    def get_file_names(self):
@@ -207,22 +241,30 @@ def convert_one(self, file_idx):

            filename = f'{self.prefix}{file_idx:03d}{frame_num:03d}'

-            for camera in frame.context.camera_calibrations:
-                # FRONT = 1, see dataset.proto for details
-                if camera.name == 1:
-                    T_front_cam_to_vehicle = np.array(
-                        camera.extrinsic.transform).reshape(4, 4)
-
-            T_k2w = T_front_cam_to_vehicle @ self.T_ref_to_front_cam
-
            context_name = frame.context.name
            frame_timestamp_micros = frame.timestamp_micros

            if filename in self.name2idx:
-                kitti_result = \
-                    self.kitti_result_files[self.name2idx[filename]]
-                objects = self.parse_objects(kitti_result, T_k2w, context_name,
-                                             frame_timestamp_micros)
+                if self.from_kitti_format:
+                    for camera in frame.context.camera_calibrations:
+                        # FRONT = 1, see dataset.proto for details
+                        if camera.name == 1:
+                            T_front_cam_to_vehicle = np.array(
+                                camera.extrinsic.transform).reshape(4, 4)
+
+                    T_k2w = T_front_cam_to_vehicle @ self.T_ref_to_front_cam
+
+                    kitti_result = \
+                        self.results[self.name2idx[filename]]
+                    objects = self.parse_objects(kitti_result, T_k2w,
+                                                 context_name,
+                                                 frame_timestamp_micros)
+                else:
+                    index = self.name2idx[filename]
+                    objects = self.parse_objects_from_origin(
+                        self.results[index], context_name,
+                        frame_timestamp_micros)
+
            else:
                print(filename, 'not found.')
                objects = metrics_pb2.Objects()
@@ -232,11 +274,100 @@ def convert_one(self, file_idx):
                    'wb') as f:
                f.write(objects.SerializeToString())

+    def convert_one_fast(self, res_index: int):
+        """Convert action for a single file. It reads the metainfo from the
+        preprocessed file offline, so it is faster.
+
+        Args:
+            res_index (int): The index of the result.
+        """
+        sample_idx = self.results[res_index]['sample_idx']
+        if len(self.results[res_index]['pred_instances_3d']) > 0:
+            objects = self.parse_objects_from_origin(
+                self.results[res_index],
+                self.idx2metainfo[str(sample_idx)]['contextname'],
+                self.idx2metainfo[str(sample_idx)]['timestamp'])
+        else:
+            print(sample_idx, 'not found.')
+            objects = metrics_pb2.Objects()
+
+        with open(
+                join(self.waymo_results_save_dir, f'{sample_idx}.bin'),
+                'wb') as f:
+            f.write(objects.SerializeToString())
+
+    def parse_objects_from_origin(self, result: dict, contextname: str,
+                                  timestamp: str) -> Objects:
+        """Parse objects from the original prediction results.
+
+        Args:
+            result (dict): The original prediction results.
+            contextname (str): The ``contextname`` of the sample in waymo.
+            timestamp (str): The ``timestamp`` of the sample in waymo.
+
+        Returns:
+            metrics_pb2.Objects: The parsed objects.
+        """
+        lidar_boxes = result['pred_instances_3d']['bboxes_3d'].tensor
+        scores = result['pred_instances_3d']['scores_3d']
+        labels = result['pred_instances_3d']['labels_3d']
+
+        def parse_one_object(index):
+            class_name = self.classes[labels[index].item()]
+
+            box = label_pb2.Label.Box()
+            height = lidar_boxes[index][5].item()
+            heading = lidar_boxes[index][6].item()
+
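+            # wrap the heading angle into the range [-pi, pi]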
+            while heading < -np.pi:
+                heading += 2 * np.pi
+            while heading > np.pi:
+                heading -= 2 * np.pi
+
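+            # the predicted z is the box bottom, so half the height is added
+            # below to obtain the center-based z that Waymo expects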
+            box.center_x = lidar_boxes[index][0].item()
+            box.center_y = lidar_boxes[index][1].item()
+            box.center_z = lidar_boxes[index][2].item() + height / 2
+            box.length = lidar_boxes[index][3].item()
+            box.width = lidar_boxes[index][4].item()
+            box.height = height
+            box.heading = heading
+
+            o = metrics_pb2.Object()
+            o.object.box.CopyFrom(box)
+            o.object.type = self.k2w_cls_map[class_name]
+            o.score = scores[index].item()
+            o.context_name = contextname
+            o.frame_timestamp_micros = timestamp
+
+            return o
+
+        objects = metrics_pb2.Objects()
+        for i in range(len(lidar_boxes)):
+            objects.objects.append(parse_one_object(i))
+
+        return objects
+
    def convert(self):
        """Convert action."""
        print('Start converting ...')
-        mmengine.track_parallel_progress(self.convert_one, range(len(self)),
-                                         self.workers)
+        convert_func = self.convert_one_fast if self.fast_eval else \
+            self.convert_one
+
+        # from torch.multiprocessing import set_sharing_strategy
+        # # Force using "file_system" sharing strategy for stability
+        # set_sharing_strategy("file_system")
+
+        # mmengine.track_parallel_progress(convert_func, range(len(self)),
+        #                                  self.workers)
+
+        # TODO: Support multiprocessing. Now, multiprocessing evaluation will
+        # cause shared memory error in torch-1.10 and torch-1.11. Details can
+        # be seen in https://github.com/pytorch/pytorch/issues/67864.
+        prog_bar = mmengine.ProgressBar(len(self))
+        for i in range(len(self)):
+            convert_func(i)
+            prog_bar.update()
+
        print('\nFinished ...')

        # combine all files into one .bin
@@ -248,7 +379,8 @@ def convert(self):

    def __len__(self):
        """Length of the filename list."""
-        return len(self.waymo_tfrecord_pathnames)
+        return len(self.results) if self.fast_eval else len(
+            self.waymo_tfrecord_pathnames)

    def transform(self, T, x, y, z):
        """Transform the coordinates with matrix T.