"""
# Created: 2023-11-04 15:55
# Copyright (C) 2023-now, RPL, KTH Royal Institute of Technology
# Author: Qingwen Zhang (https://kin-zhang.github.io/)
#
# This file is part of
# * HiMo (https://kin-zhang.github.io/HiMo).
# If you find this repo helpful, please cite the respective publication as
# listed on the above website.
#
# Description: follows the SeFlow & SeFlow++ idea, but runs more steps:
# (a) dufomap; (b) linefit; (c) hdbscan; (d) nnd.
#
"""
from pathlib import Path
from tqdm import tqdm
import numpy as np
import fire, time, h5py, os
from hdbscan import HDBSCAN
from src.utils import npcal_pose0to1
from src.utils.mics import HDF5Data, transform_to_array
from dufomap import dufomap
from linefit import ground_seg
MIN_AXIS_RANGE = 2 # HARD CODED: remove ego vehicle points
MAX_AXIS_RANGE = 50 # HARD CODED: remove far away points
BASE_DIR = os.path.abspath(os.path.dirname(__file__))
def check_data_key(filekey, keyname, scene_id, ts):
"""
Checks if a specified key exists in the given file-like object and deletes it if present.
This is typically used to remove old or outdated data before overwriting with new data.
Args:
filekey: The file-like object (e.g., HDF5 group or dictionary) to check for the key.
keyname: The name of the key to check and potentially delete.
scene_id: Identifier for the scene (used for logging or warning purposes).
ts: Timestamp or frame identifier (used for logging or warning purposes).
"""
if keyname in filekey:
# print(f"Warning: {scene_id} {ts} has {keyname}, old data will be removed and overwritten.")
del filekey[keyname]
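# Typical use right before (re)writing a label dataset (this mirrors the writer loops below):
#   check_data_key(f[key], "nnd", scene_id, timestamp)  # drop any stale dataset first
#   f[key].create_dataset("nnd", data=labels)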
def run_dufocluster(
    data_dir: str = "/home/kin/data/av2/preprocess/sensor/train",
    scene_range: list = [0, 1],
    interval: int = 1,  # run dufomap only every `interval` frames
    overwrite: bool = True,
    # NOTE (Qingwen): the following are for ground segmentation only... at least for the code now.
    tag: str = "av2",  # [nus, zod, man, sca] etc.
    run_gm: bool = False,  # run ground segmentation
    min_nnd: float = 0.14,  # min NND per 0.1 s frame (0.14 m ≈ 1.4 m/s pedestrian speed); for Scania data we set 0.32.
):
data_path = Path(data_dir)
dataset = HDF5Data(data_path) # single frame reading.
all_scene_ids = list(dataset.scene_id_bounds.keys())
for scene_in_data_index, scene_id in enumerate(all_scene_ids):
start_time = time.time()
# NOTE (Qingwen): so the scene id range is [start, end)
        if scene_range[0] != -1 and scene_range[-1] != -1 and (scene_in_data_index < scene_range[0] or scene_in_data_index >= scene_range[1]):
continue
bounds = dataset.scene_id_bounds[scene_id]
flag_exist_label = True
        with h5py.File(os.path.join(data_path, f'{scene_id}.h5'), 'r') as f:
for ii in range(bounds["min_index"], bounds["max_index"]+1):
key = str(dataset[ii]['timestamp'])
if 'dufocluster' not in f[key]:
flag_exist_label = False
break
if flag_exist_label and not overwrite:
print(f"==> Scene {scene_id} has plus label, skip.")
continue
hdb = HDBSCAN(min_cluster_size=20, cluster_selection_epsilon=0.7)
        for i in tqdm(range(bounds["min_index"], bounds["max_index"]+1), desc=f"Plus cluster run: {scene_in_data_index+1}/{len(all_scene_ids)}", ncols=80):
data = dataset[i]
pc0 = data['pc0'][:,:3]
            cluster_label = np.zeros(pc0.shape[0], dtype=np.int16)
if "dufo" not in data:
print(f"Warning: {scene_id} {data['timestamp']} has no dufo, will be skipped. Better to rerun dufomap again in this scene.")
continue
elif data["dufo"].sum() < 20:
print(f"Warning: {scene_id} {data['timestamp']} has no dynamic points, will be skipped. Better to check this scene.")
else:
hdb.fit(pc0[data["dufo"]==1])
                # NOTE(Qingwen): HDBSCAN assigns -1 to noise, so +1 maps noise to 0.
                cluster_label[data["dufo"]==1] = hdb.labels_ + 1
# save labels
timestamp = data['timestamp']
key = str(timestamp)
            with h5py.File(os.path.join(data_path, f'{scene_id}.h5'), 'r+') as f:
                check_data_key(f[key], 'dufocluster', scene_id, timestamp)
                f[key].create_dataset('dufocluster', data=np.array(cluster_label).astype(np.int16))
print(f"==> Scene {scene_id} finished, used: {(time.time() - start_time)/60:.2f} mins")
print(f"Data inside {str(data_path)} finished. Check the result with tools/visulization.py if you want to visualize them.\n")
# Separated out since it's the only step that needs CUDA, in case you want to run it as its own job.
def run_nnd(
    data_dir: str = "/home/kin/data/av2/preprocess/sensor/train",
    scene_range: list = [0, 1],
    interval: int = 1,  # run dufomap only every `interval` frames
    overwrite: bool = True,
    # NOTE (Qingwen): the following are for ground segmentation only... at least for the code now.
    tag: str = "av2",  # [nus, zod, man, sca] etc.
    run_gm: bool = False,  # run ground segmentation
    min_nnd: float = 0.14,  # min NND per 0.1 s frame (0.14 m ≈ 1.4 m/s pedestrian speed); for Scania data we set 0.32.
):
    # NND needs the CUDA Chamfer-distance kernel, so import torch and the kernel lazily here.
    from assets.cuda.chamfer3D import nnChamferDis
    MyCUDAChamferDis = nnChamferDis()
    import torch
    if not torch.cuda.is_available():
        raise EnvironmentError("No CUDA available, please check your CUDA environment.")
    def cuda_nnd(pc0: torch.Tensor, pc1: torch.Tensor, moving_threshold=0.14, truncated=4.4):  # 4.4 m ~= 160 km/h * 0.1 s
        # pc0: (N,3), already ego-motion compensated; pc1: (M,3)
        pow2_dist0, _ = MyCUDAChamferDis.dis_res(pc0, pc1)  # squared NN distances, hence the pow(., 2) comparisons below
        pow2_dist0 = pow2_dist0.cpu().numpy()
        label = np.zeros(pc0.shape[0], dtype=np.uint8)
        label[(pow2_dist0 >= pow(moving_threshold, 2)) & (pow2_dist0 < pow(truncated, 2))] = 1
        return label
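    # A minimal CPU sketch of the same labelling rule, for sanity-checking only
    # (assumes scipy is available; the CUDA kernel above is what actually runs):
    #   from scipy.spatial import cKDTree
    #   d, _ = cKDTree(pc1_np).query(pc0_np)  # per-point NN distance (not squared)
    #   label = ((d >= moving_threshold) & (d < truncated)).astype(np.uint8)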
data_path = Path(data_dir)
dataset = HDF5Data(data_path) # single frame reading.
all_scene_ids = list(dataset.scene_id_bounds.keys())
for scene_in_data_index, scene_id in enumerate(all_scene_ids):
start_time = time.time()
# NOTE (Qingwen): so the scene id range is [start, end)
        if scene_range[0] != -1 and scene_range[-1] != -1 and (scene_in_data_index < scene_range[0] or scene_in_data_index >= scene_range[1]):
continue
bounds = dataset.scene_id_bounds[scene_id]
exist_dict = {"nnd": True}
with h5py.File(os.path.join(data_path, f'{scene_id}.h5'), 'r') as f:
for ii in range(bounds["min_index"], bounds["max_index"]+1):
key = str(dataset[ii]['timestamp'])
for datakey in exist_dict.keys():
if datakey not in f[key]:
exist_dict[datakey] = False
if not all(exist_dict.values()):
break
if all(exist_dict.values()) and not overwrite:
print(f"==> Scene {scene_id} already processed, skip.")
continue
        # for each scene, normalize poses to the first frame to avoid large absolute values (same as in `main`).
        ego_pose_norm = dataset[bounds["min_index"]]['pose0']
for data_id in tqdm(range(bounds["min_index"], bounds["max_index"]+1), desc=f"CUDA nnd run: {scene_in_data_index+1}/{len(all_scene_ids)}", ncols=80):
data = dataset[data_id]
pc0 = data['pc0'][:,:3]
pose0 = npcal_pose0to1(data['pose0'], ego_pose_norm)
timestamp = data['timestamp']
key = str(timestamp)
with h5py.File(os.path.join(data_path, f'{scene_id}.h5'), 'r+') as f:
if not exist_dict["nnd"]:
nnd_labels = np.zeros(pc0.shape[0], dtype= np.uint8)
data_t1 = dataset[data_id-1] if data_id == bounds["max_index"] else dataset[data_id+1]
ego_motion = npcal_pose0to1(pose0, npcal_pose0to1(data_t1['pose0'], ego_pose_norm))
transform_pc0 = pc0 @ ego_motion[:3,:3].T + ego_motion[:3,3]
nnd_labels = cuda_nnd(torch.tensor(transform_pc0).cuda(), torch.tensor(data_t1['pc0'][:,:3]).cuda(), moving_threshold=min_nnd)
check_data_key(f[key], "nnd", scene_id, timestamp)
f[key].create_dataset("nnd", data=np.array(nnd_labels).astype(np.uint8))
# No GPU needed; the following process is CPU-only.
def main(
    data_dir: str = "/home/kin/data/av2/preprocess/sensor/train",
    scene_range: list = [0, 1],
    interval: int = 1,  # run dufomap only every `interval` frames
    overwrite: bool = True,
    # NOTE (Qingwen): the following are for ground segmentation only... at least for the code now.
    tag: str = "av2",  # [zod, nuscenes, truckscenes, sca] etc.
    run_gm: bool = False,  # run ground segmentation
    min_nnd: float = 0.14,  # min NND per 0.1 s frame (0.14 m ≈ 1.4 m/s pedestrian speed); for Scania data we set 0.32.
):
gm_config_path = f"{BASE_DIR}/conf/ground/{tag}.toml"
if not os.path.exists(gm_config_path) and run_gm:
        raise FileNotFoundError(f"Ground segmentation config file not found: {gm_config_path}. Please check the folder.")
data_path = Path(data_dir)
dataset = HDF5Data(data_path) # single frame reading.
all_scene_ids = list(dataset.scene_id_bounds.keys())
for scene_in_data_index, scene_id in enumerate(all_scene_ids):
start_time = time.time()
# NOTE (Qingwen): so the scene id range is [start, end)
        if scene_range[0] != -1 and scene_range[-1] != -1 and (scene_in_data_index < scene_range[0] or scene_in_data_index >= scene_range[1]):
continue
bounds = dataset.scene_id_bounds[scene_id]
        # If you don't want the SeFlow++ (plus) label, remove "cluster": True here; the cluster step will then be skipped.
exist_dict = {"dufo": True, "ground_mask": True, "cluster": True}
with h5py.File(os.path.join(data_path, f'{scene_id}.h5'), 'r') as f:
for ii in range(bounds["min_index"], bounds["max_index"]+1):
key = str(dataset[ii]['timestamp'])
for datakey in exist_dict.keys():
if datakey not in f[key]:
exist_dict[datakey] = False
if not all(exist_dict.values()):
break
if all(exist_dict.values()) and not overwrite:
print(f"==> Scene {scene_id} already processed, skip.")
continue
        # double check: the ground mask must either exist already or be computable here.
        if not exist_dict["ground_mask"] and not run_gm:
            raise ValueError("You set run_gm=False, but no ground mask exists in the data. Please check the data or set run_gm=True.")
        if not exist_dict["ground_mask"] or run_gm:
            mygroundseg = ground_seg(gm_config_path)
        exist_dict["ground_mask"] = exist_dict["ground_mask"] and not run_gm  # run_gm=True forces recomputation # and not overwrite # this overwrite is for debug mainly.
        if overwrite:
            # force the dufo label to be recomputed; the other exist flags keep their state.
            exist_dict["dufo"] = False
if 'cluster' in exist_dict and not exist_dict["cluster"]:
hdbscan_cluster = HDBSCAN(min_cluster_size=20, cluster_selection_epsilon=0.7, alpha=1.1)
# for each scene, we normalize the pose to the first frame to avoid large values.
ego_pose_norm = dataset[bounds["min_index"]]['pose0']
if not exist_dict["dufo"]:
            mydufo = dufomap(0.15, 0.2, 1, num_threads=12)  # resolution, d_s, d_p
mydufo.setCluster(0, 20, 0.2) # depth=0, min_points=20, max_dist=0.2
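            # Flow: (1) integrate every frame into the voxel map in the loop below,
            # (2) oncePropagateCluster() once per scene to cluster/propagate voxel labels,
            # (3) per-frame segment() in the second loop to read point-wise dufo labels back.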
print(f"==> Scene {scene_id} start, data path: {data_path}")
for i in tqdm(range(bounds["min_index"], bounds["max_index"]+1), desc=f"Dufo run: {scene_in_data_index+1}/{len(all_scene_ids)}", ncols=80):
                # skip interior non-interval frames, but always integrate frames within interval//2 of either scene boundary
                if interval != 1 and i % interval != 0 and (i + interval//2 < bounds["max_index"] and i - interval//2 > bounds["min_index"]):
                    continue
data = dataset[i]
assert data['scene_id'] == scene_id, f"Check the data, scene_id {scene_id} is not consistent in {i}th data in {scene_in_data_index}th scene."
# HARD CODED: remove points outside the range
norm_pc0 = np.linalg.norm(data['pc0'][:, :3], axis=1)
                range_mask = (
                    (norm_pc0 > MIN_AXIS_RANGE) &
                    (norm_pc0 < MAX_AXIS_RANGE)
                )
pose0 = npcal_pose0to1(data['pose0'], ego_pose_norm)
                if 'lidar_center' not in data:
                    # single lidar: the ego pose is the sensor pose
                    pose_array = transform_to_array(pose0)
                    mydufo.run(data['pc0'][range_mask], pose_array, cloud_transform=True)
                else:
                    # multi-lidar: feed each sensor separately so dufomap ray-casts from the correct origin
                    for lid in range(data['lidar_center'].shape[0]):
                        lidar_mask = data['lidar_id'] == lid
                        points_xyz_ego = data['pc0'][lidar_mask & range_mask][:, :3]
                        # ego frame -> lidar frame (row-vector form of p' = R p + t)
                        T_ego_to_lidar = data['lidar_center'][lid]
                        R_ego_to_lidar = T_ego_to_lidar[:3, :3]
                        t_ego_to_lidar = T_ego_to_lidar[:3, 3]
                        points_xyz_lidar = points_xyz_ego @ R_ego_to_lidar.T + t_ego_to_lidar
                        # lidar frame -> world frame
                        T_lidar_to_world = pose0 @ np.linalg.inv(T_ego_to_lidar)
                        pose_array_lidar = transform_to_array(T_lidar_to_world)
                        mydufo.run(points_xyz_lidar, pose_array_lidar, cloud_transform=True)
            # integration finished; cluster and propagate the voxel labels once per scene (needed since map.label lives inside dufomap)
            mydufo.oncePropagateCluster(if_cluster=True, if_propagate=True)
            # NOTE(Qingwen): debug only, to check that the voxel map is correct; with voxel_map=True, dufomap's outputMap needs no input points.
            # mydufo.outputMap(np.zeros_like(data['pc0'][:,:3]), voxel_map=True)
            # return
for data_id in tqdm(range(bounds["min_index"], bounds["max_index"]+1), desc=f"Auto-labels run: {scene_in_data_index+1}/{len(all_scene_ids)}", ncols=80):
data = dataset[data_id]
pc0 = data['pc0'][:,:3]
pose0 = npcal_pose0to1(data['pose0'], ego_pose_norm)
timestamp = data['timestamp']
key = str(timestamp)
gm0 = data['gm0'] if exist_dict["ground_mask"] else mygroundseg.run(pc0)
            if 'cluster' in exist_dict and not exist_dict["cluster"]:
                cluster_labels = np.zeros(pc0.shape[0], dtype=np.int16)  # 0 = no label
                # NOTE(Qingwen): HDBSCAN assigns -1 to noise, so +1 maps noise to 0.
                cluster_labels[gm0==0] = (hdbscan_cluster.fit_predict(pc0[gm0==0]) + 1)
if not exist_dict["dufo"]:
pose_array = transform_to_array(pose0)
dufo_label = mydufo.segment(pc0, pose_array, cloud_transform = True)
with h5py.File(os.path.join(data_path, f'{scene_id}.h5'), 'r+') as f:
if not exist_dict["ground_mask"]:
check_data_key(f[key], "ground_mask", scene_id, timestamp)
f[key].create_dataset("ground_mask", data=np.array(gm0).astype(np.uint8))
if 'cluster' in exist_dict and not exist_dict["cluster"]:
check_data_key(f[key], "cluster", scene_id, timestamp)
f[key].create_dataset("cluster", data=np.array(cluster_labels).astype(np.int16))
if not exist_dict["dufo"]:
dufo_labels = np.zeros(pc0.shape[0], dtype= np.uint8)
dufo_labels[~gm0] = dufo_label[~gm0]
check_data_key(f[key], "dufo", scene_id, timestamp)
f[key].create_dataset("dufo", data=np.array(dufo_labels).astype(np.uint8))
print(f"==> Scene {scene_id} finished, used: {(time.time() - start_time)/60:.2f} mins")
if __name__ == '__main__':
start_time = time.time()
fire.Fire(main)
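    # NOTE: the second fire.Fire call below re-parses the same CLI flags;
    # `run_dufocluster` shares `main`'s parameter names, so one flag set drives both.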
fire.Fire(run_dufocluster)
print("\nAlready Finished the main labels: dufo, cluster, ground mask etc.\n")
# fire.Fire(run_nnd)
print(f"\nScript Time used: {(time.time() - start_time)/60:.2f} mins")