# ORB_SLAM_live-map/main.py at master · minhnhat93/ORB_SLAM_live-map · GitHub

1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231
232
233
234
235
236
237
238
239
240
241
242
243
244
245
246
247
248
249
250
251
252
253
254
255
256
257
258
259
260
261
262
263
264
265
266
267
268
269
270
271
272
273
274
275
276
277
278
279
280
281
282
283
284
285
286
287
288
289
290
291
292
293
294
295
296
297
298
299
300
301
302
303
304
305
306
307
308
309
310
311
312
313
314
315
316
317
318
319
320
321
322
323
324
325
326
327
328
329
330
331
332
333
334
335
336
337
338
339
340
341
342
import argparse
from config import ORB_SLAM2_DIR
from PIL import Image
import numpy as np
from config import ORB_SLAM2_DIR, KEYFRAME_DIR, MAPPOINT_DIR
from utils import read_until_good, read_keyframes, read_mappoints, get_num_cols_rows, get_graph_segment_for_frame, load_frame
import os
import matplotlib.pyplot as plt
import cv2
import time
import shutil
from point_cloud import convert_3d_point_to_pix, convert_pix_to_3d_point, get_camera_to_world, get_world_to_camera
from fit_planes import best_fitting_plane, fit_plane_with_outlier_removed
from config import cx, cy, fx, fy
from scipy.signal import convolve2d

# Frame size indexed as [rows, cols]: entry 0 bounds the sampled rows and
# entry 1 bounds the sampled columns further down in this script.
im_size = [480, 640]

def save_map(MAP_SAVE, threshold, origins, resolution):
  """Write the occupancy grid as ``MAP_SAVE + '.pgm'`` plus a ``.yaml`` sidecar.

  The grid is not passed in: it is read from the module-level ``output``
  array, which has to be assigned before this function is called.

  Args:
    MAP_SAVE: Output path without extension.
    threshold: Two-item sequence ``[free_thresh, occupied_thresh]``.
    origins: Sequence whose first two entries are written as the map origin.
    resolution: Value written as the ``resolution`` entry.
  """
  # Invert so that larger ``output`` values end up as darker pixels.
  map_out = Image.fromarray(((1 - output) * 255).astype(np.uint8))
  map_out.save(MAP_SAVE + '.pgm')

  # Text mode: the metadata is written as ``str``, which a binary handle
  # rejects on Python 3.
  with open(MAP_SAVE + '.yaml', 'w') as f:
    # Name the image that was actually written next to this YAML file
    # (still 'map.pgm' for the default 'output/map').
    f.write('image: {}\n'.format(os.path.basename(MAP_SAVE) + '.pgm'))
    f.write('resolution: {}\n'.format(resolution))
    f.write('origin: [{}, {}, 0.0]\n'.format(origins[0], origins[1]))
    f.write('occupied_thresh: {}\n'.format(threshold[1]))
    # Previously a hard-coded 0.165 with a placeholder-less format() call.
    f.write('free_thresh: {}\n'.format(threshold[0]))
    f.write('negate: 0\n')


def read_kf_and_mps():
  """Load the current keyframes and map points from ``MAPPOINT_DIR``.

  ``KeyFrames.txt`` is read first. When its reader reports the run as ended,
  all map points come from ``AllMapPoints.txt``; otherwise the per-keyframe
  files (named after the first field of each keyframe) that already exist
  are read and joined.

  Returns:
    A tuple ``(kfs, mps, kfs_dict, ended)`` where ``kfs_dict`` maps the first
    field of every keyframe to the keyframe itself. ``mps`` is an empty list
    when no per-keyframe file is available yet, so callers can always take
    ``len(mps)`` and iterate over it.
  """
  kfs, ended = read_until_good(os.path.join(MAPPOINT_DIR, 'KeyFrames.txt'), read_keyframes)
  if ended:
    # NOTE(review): presumably gives the writer time to finish the final dump
    # before it is read -- confirm.
    time.sleep(1)
    mps, _ = read_until_good(os.path.join(MAPPOINT_DIR, 'AllMapPoints.txt'), read_mappoints)
  else:
    chunks = []
    for kf in kfs:
      fn = os.path.join(MAPPOINT_DIR, kf[0])
      if os.path.exists(fn):
        chunk, _ = read_until_good(fn, read_mappoints)
        chunks.append(chunk)
    if not chunks:
      # Nothing on disk yet: hand back an empty collection instead of None.
      mps = []
    elif len(chunks) == 1:
      mps = chunks[0]
    else:
      # Join once at the end rather than re-copying the array per keyframe.
      mps = np.concatenate(chunks, axis=0)
  kfs_dict = {kf[0]: kf for kf in kfs}
  return kfs, mps, kfs_dict, ended

def draw_points(img, points, color):
  """Draw a radius-5 circle on ``img`` for every entry of ``points``.

  Only the first two components of each entry are used as the circle centre.
  ``img`` is modified in place; nothing is returned.
  """
  radius = 5
  for pt in points:
    center = (pt[0], pt[1])
    cv2.circle(img, center, radius, color)

def get_increment_vector(dx, dy, dz, resolution):
  """Return the per-step increment ``[x, y, z]`` for walking along a ray.

  The step is scaled so that the larger of ``|dx|`` and ``|dz|`` advances by
  exactly ``resolution``; the other two components advance proportionally,
  so the walk stays on the straight line given by ``(dx, dy, dz)``.

  Args:
    dx, dy, dz: Components of the ray direction.
    resolution: Step length along the dominant horizontal axis.

  Returns:
    A three-item list with the signed increments for x, y and z. For a ray
    with no horizontal component (``dx == dz == 0``) x and z stay at zero and
    y advances by ``resolution`` in the direction of ``dy``.
  """
  sign_dx = np.sign(dx)
  sign_dy = np.sign(dy)
  sign_dz = np.sign(dz)
  dx = abs(dx)
  dy = abs(dy)
  dz = abs(dz)
  if dx == 0 and dz == 0:
    # Purely vertical ray: there is no horizontal axis to normalise by.
    return [0 * sign_dx, resolution * sign_dy, 0 * sign_dz]
  # A single zero component needs no special case: it scales to zero below,
  # and y keeps its true slope instead of being forced to a full step.
  if dx > dz:
    return [resolution * sign_dx, dy * resolution / dx * sign_dy, dz * resolution / dx * sign_dz]
  else:
    return [dx * resolution / dz * sign_dx, dy * resolution / dz * sign_dy, resolution * sign_dz]


def update_map(occupied, counts, kfs_id, kfs_dict, mps, origins, resolution, y_check=(None, None), only_end_point=0):
  """Accumulate map-point observations into the occupancy grids, in place.

  For every map point whose keyframe id (field 0) is in ``kfs_id`` the cell
  containing the point gets one hit in both ``occupied`` and ``counts``.
  Unless ``only_end_point`` is set, the ray from the keyframe position
  (fields 1-3 of the keyframe) to the point is walked as well and every
  traversed cell gets one more hit in ``counts`` only.

  Args:
    occupied: 2-D array indexed ``[row, col]``; end-point hits.
    counts: 2-D array indexed ``[row, col]``; all hits.
    kfs_id: Container of keyframe ids to process.
    kfs_dict: Mapping from keyframe id to keyframe record.
    mps: Iterable of map points; fields 0, 2, 3, 4 are keyframe id, x, y, z.
    origins: Sequence whose entries 0 and 1 are the lower x and z bounds.
    resolution: Cell size.
    y_check: ``(low, high)`` limits for the height travelled along the ray,
      measured from the camera (the walk starts at 0); ``None`` disables a
      limit.
    only_end_point: When truthy, skip the ray walk.
  """
  numCols, numRows = get_num_cols_rows(origins, resolution)
  y_low, y_high = y_check[0], y_check[1]
  for mp in mps:
    if mp[0] not in kfs_id:
      continue
    px, py, pz = mp[2], mp[3], mp[4]
    kf = kfs_dict[mp[0]]
    kx, ky, kz = kf[1], kf[2], kf[3]

    u, t, v = get_increment_vector(px - kx, py - ky, pz - kz, resolution)

    # floor() rather than int(): truncation toward zero would fold points that
    # lie up to one cell below the lower bounds back into the grid.
    coord_end_x = int(np.floor((px - origins[0]) / resolution))
    # Rows are flipped so that larger z lands nearer the top of the image.
    coord_end_z = numRows - int(np.floor((pz - origins[1]) / resolution)) - 1
    if 0 <= coord_end_x < numCols and 0 <= coord_end_z < numRows:
      counts[coord_end_z, coord_end_x] += 1
      occupied[coord_end_z, coord_end_x] += 1

    if only_end_point:
      continue

    x, z, y = kx, kz, 0
    while True:
      # Stop once the walk has passed the point on either horizontal axis.
      if (px - kx) * (px - x) < 0 or (pz - kz) * (pz - z) < 0:
        break
      if (y_low is not None and y < y_low) or (y_high is not None and y > y_high):
        break
      coord_x = int(np.floor((x - origins[0]) / resolution))
      coord_z = numRows - int(np.floor((z - origins[1]) / resolution)) - 1
      if not (0 <= coord_x < numCols and 0 <= coord_z < numRows):
        break
      counts[coord_z, coord_x] += 1
      if u == 0 and v == 0:
        # Point sits straight above/below the camera: the walk never moves
        # horizontally, so without this it would never terminate.
        break
      x += u
      z += v
      y += t


def create_plane_equation_dict(segment, choosen_mps, pix_of_mps):
  """Fit one plane per segment label from the map points that fall inside it.

  Args:
    segment: 2-D label image, indexed ``[row, col]``.
    choosen_mps: World coordinates of the map points.
    pix_of_mps: Pixel position ``(col, row)`` of each map point, in the same
      order as ``choosen_mps``.

  Returns:
    A dict with one entry per distinct label in ``segment``: the result of
    ``best_fitting_plane`` when the label collected at least three points,
    otherwise ``None``.
  """
  labels = np.unique(segment)

  # Bucket the world points by the label found under their pixel.
  members = {label: [] for label in labels}
  for idx, world_point in enumerate(choosen_mps):
    col, row = pix_of_mps[idx]
    members[segment[row, col]].append(world_point)

  plane_equation_dict = {label: None for label in labels}
  for label in labels:
    bucket = members[label]
    if len(bucket) < 3:
      continue
    plane_equation_dict[label] = best_fitting_plane(bucket)
  return plane_equation_dict

def create_extra_mps_from_plane_equation_dict(rows, cols, plane_equation_dict, segment, camera_to_world, world_to_camera, kf_id, fx, fy, cx, cy, z_max):
  """Create additional map points from sampled pixels and per-label planes.

  Each ``(row, col)`` pair is looked up in ``segment``; when that label has a
  plane, ``convert_pix_to_3d_point`` is asked for a world point (presumably
  where the pixel's viewing ray meets the plane -- confirm in point_cloud).
  Pixels without a plane, or for which no world point is returned, are
  skipped.

  Returns:
    ``(mps, pix)``: ``mps`` holds ``[kf_id, -1, X, Y, Z]`` records and ``pix``
    the pixel each of those points maps back to via
    ``convert_3d_point_to_pix``.
  """
  extra_points = []
  extra_pixels = []
  for v, u in zip(rows, cols):
    plane = plane_equation_dict[segment[v, u]]
    if plane is None:
      continue
    hit = convert_pix_to_3d_point(u, v, plane, camera_to_world, fx, fy, cx, cy, z_max=z_max)
    if hit is None:
      continue
    X, Y, Z = hit
    u_back, v_back = convert_3d_point_to_pix(X, Y, Z, world_to_camera, fx, fy, cx, cy)
    extra_points.append([kf_id, -1, X, Y, Z])
    extra_pixels.append([u_back, v_back])
  return extra_points, extra_pixels


def parse_args():
  """Parse the command-line options of the live-map script.

  Options fall into four groups: map extent and resolution (``--xmin`` ...
  ``--reso``), output thresholds and path (``--thresmin``, ``--thresmax``,
  ``--save``), integer on/off switches (``--offline``, ``--livemap``, ...),
  and the pixel sampling grid (``--start_row``, ``--end_row``, ``--grid_row``,
  ``--grid_col``).

  Returns:
    The ``argparse.Namespace`` produced from ``sys.argv``.
  """
  parser = argparse.ArgumentParser()
  parser.add_argument('--path', default=ORB_SLAM2_DIR)
  parser.add_argument('--xmin', default=-5, type=float)
  parser.add_argument('--zmin', default=-5, type=float)
  parser.add_argument('--xmax', default=5, type=float)
  parser.add_argument('--zmax', default=5, type=float)
  parser.add_argument('--reso', default=0.01, type=float)
  parser.add_argument('--thresmin', default=0.196, type=float)
  parser.add_argument('--thresmax', default=0.65, type=float)
  parser.add_argument('--save', default='output/map', type=str)
  parser.add_argument('--offline', default=1, type=int)
  parser.add_argument('--min_num', default=0, type=int)
  parser.add_argument('--livemap', default=1, type=int)
  parser.add_argument('--only_end_points', default=0, type=int)
  parser.add_argument('--with_orb_slam_points', default=1, type=int)
  parser.add_argument('--with_extra_points', default=0, type=int)
  parser.add_argument('--postprocess', default=0, type=int)
  parser.add_argument('--clean_after_iteration', default=0, type=int)
  parser.add_argument('--show_individual_graph', default=0, type=int)
  # Default sampling band: the middle third of the image rows.
  parser.add_argument('--start_row', default=int(im_size[0] * 0.3333), type=int)
  parser.add_argument('--end_row', default=int(im_size[0] * 0.6666), type=int)
  parser.add_argument('--grid_row', default=50, type=int)
  parser.add_argument('--grid_col', default=25, type=int)
  # The height limits are compared against a float accumulated along each ray,
  # so fractional values must be accepted; whole numbers still parse as before.
  parser.add_argument('--y_min', default=None, type=float)
  parser.add_argument('--y_max', default=None, type=float)
  parser.add_argument('--sigma', default=1.0, type=float)
  parser.add_argument('--z_max_camera', default=float('inf'), type=float)
  return parser.parse_args()

# Parse the command line once; the rest of the script is driven by ``args``.
args = parse_args()
if not args.offline:
  # Live mode starts from empty exchange directories. Each directory is handled
  # on its own so that one missing or undeletable directory no longer prevents
  # the other (or itself) from being created.
  for stale_dir in (MAPPOINT_DIR, KEYFRAME_DIR):
    shutil.rmtree(stale_dir, ignore_errors=True)
    try:
      os.mkdir(stale_dir)
    except OSError as err:
      # Still best-effort, but report the problem instead of hiding it.
      print('Could not recreate {}: {}'.format(stale_dir, err))
# Map extent as [xmin, zmin, xmax, zmax].
origins = [args.xmin, args.zmin, args.xmax, args.zmax]
resolution = args.reso
# [free threshold, occupied threshold] applied to the occupied/visited ratio.
threshold = [args.thresmin, args.thresmax]
numCols, numRows = get_num_cols_rows(origins, resolution)

# Per-cell accumulators: how often a cell was touched, and how often it held
# the end point of a ray.
counts = np.zeros((numRows, numCols), dtype=float)
occupied = np.zeros((numRows, numCols), dtype=float)

# Pixel sampling lattice: one sample every grid_row rows inside the
# [start_row, end_row) band and every grid_col columns across the image.
grid_size = [args.grid_row, args.grid_col]
rows_range = np.arange(args.start_row, args.end_row, grid_size[0])
cols_range = np.arange(0, im_size[1], grid_size[1])
rows, cols = np.meshgrid(rows_range, cols_range)
# Shift the columns of every sampled row by a growing fraction of the column
# spacing (wrapping at the image width) so that the rows are staggered.
cols_add = np.arange(cols.shape[1], dtype=float) * grid_size[1] / cols.shape[1]
cols = (cols + cols_add.reshape(-1, cols_add.size)).astype(int) % im_size[1]
rows, cols = rows.flatten(), cols.flatten()

# Height limits handed to update_map for the ray walk.
y_check = [args.y_min, args.y_max]

# Main loop: repeatedly reload keyframes and map points, fold every keyframe
# that has not been handled yet into the occupancy grid, then save (and
# optionally display) the thresholded map.
# Ids (first field) of the keyframes that were already folded into the map.
processed_kfs = []
while 1:
  print('Waiting for frames')
  kfs, mps, kfs_dict, ended = read_kf_and_mps()
  if ended:
    print("ORB_SLAM ended")
    # Forget all progress so the map is rebuilt from the data just loaded.
    processed_kfs = []
    counts = np.ones((numRows, numCols), dtype=float) * 0
    occupied = np.ones((numRows, numCols), dtype=float) * 0
  # NOTE(review): this relies on mps being a sized iterable; confirm that
  # read_kf_and_mps can never hand back None at this point.
  print('Map Points:', len(mps))
  print('Key Frames:', len(kfs))

  # Collect the keyframes that are new in this pass and mark them as processed.
  kfs_id = []
  kfs_mappoints = {}
  for kf in kfs:
    if kf[0] not in processed_kfs:
      kfs_id.append(kf[0])
      kfs_mappoints[kf[0]] = []
      processed_kfs.append(kf[0])

  # Group the map points of the new keyframes by keyframe id.
  for mp in mps:
    if mp[0] in kfs_id:
      kfs_mappoints[mp[0]].append(mp)

  for kf_id in kfs_id:
    if args.clean_after_iteration:
      # Start from an empty map for every keyframe.
      counts = np.ones((numRows, numCols), dtype=float) * 0
      occupied = np.ones((numRows, numCols), dtype=float) * 0

    extra_mps = []
    if args.with_extra_points:
      # Keyframe record layout as used here: field 0 is the id/time stamp,
      # 1-3 the camera centre, 4-6 the translation, 7-15 the nine rotation entries.
      kf = kfs_dict[kf_id]  # current keyframe
      camera_center = [kf[1], kf[2], kf[3]]
      camera_translation = [kf[4], kf[5], kf[6]]
      camera_rotation = [kf[7], kf[8], kf[9], kf[10], kf[11], kf[12], kf[13], kf[14], kf[15]]
      time_stamp = kf[0]

      camera_matrix = np.asarray([[fx, 0, cx], [0, fy, cy], [0, 0, 1]])
      mps_of_this_kf = kfs_mappoints[time_stamp]  # map points of current keyframe
      camera_to_world = get_camera_to_world(camera_translation, camera_rotation)  # tf matrix
      world_to_camera = get_world_to_camera(camera_translation, camera_rotation)  # inverse tf matrix

      kf_img = load_frame(time_stamp, 0)
      segment = get_graph_segment_for_frame(time_stamp, 0, sigma=args.sigma)  # segmentation from graph-cut algorithm
      segment_with_color = segment
      # Collapse the three colour channels into a single integer label per pixel.
      # NOTE(review): if segment is a uint8 image this arithmetic may overflow
      # or be rejected by NumPy -- confirm the dtype returned by utils.
      segment = segment[:, :, 0] * (255**2) + segment[:, :, 1] * 255 + segment[:, :, 2]
      # get pixel coordinates of the map points

      pix_of_mps = []
      choosen_mps = []
      for mp in mps_of_this_kf:
        x, y = convert_3d_point_to_pix(mp[2], mp[3], mp[4], world_to_camera, fx, fy, cx, cy)
        # Keep only the points whose pixel lies inside the segmentation image.
        if x in range(0, segment.shape[1]) and y in range(0, segment.shape[0]):
          pix_of_mps.append([x, y])
          choosen_mps.append([mp[2], mp[3], mp[4]])
      pix_of_mps = np.asarray(pix_of_mps)
      plane_equation_dict = create_plane_equation_dict(segment, choosen_mps, pix_of_mps)

      # Derive additional points on the fitted planes at the sampled grid pixels.
      extra_mps, pix_of_extra_mps = create_extra_mps_from_plane_equation_dict(rows, cols, plane_equation_dict, segment, camera_to_world,
                                                            world_to_camera, kf_id, fx, fy, cx, cy, args.z_max_camera)
      print("Extra Map Points: ", len(extra_mps))

      # Draw segmentation
      draw_points(segment_with_color, np.asarray(pix_of_mps, dtype=int), (0, 255, 0))
      draw_points(segment_with_color, np.asarray(pix_of_extra_mps, dtype=int), (0, 0, 255))
      cv2.imshow('Map Point Projection', segment_with_color)
      cv2.waitKey(20)


    # Update map
    if args.with_orb_slam_points:
      update_map(occupied, counts, [kf_id], kfs_dict, mps, origins, resolution, y_check=y_check, only_end_point=args.only_end_points)
    if args.with_extra_points:
      update_map(occupied, counts, [kf_id], kfs_dict, extra_mps, origins, resolution, y_check=y_check, only_end_point=args.only_end_points)

    # Compute output
    if not args.only_end_points:
      # Discard cells that were touched fewer than min_num times.
      occupied[counts < args.min_num] = 0
      counts[counts < args.min_num] = 0
    if args.postprocess:
      # Smooth both accumulators with a 3x3 box filter before taking the ratio.
      conv_kernel = np.ones((3, 3))
      conv_kernel = conv_kernel / conv_kernel.sum()
      occupied_ = convolve2d(occupied, conv_kernel,'same')
      counts_ = convolve2d(counts, conv_kernel, 'same')
      output = occupied_ / counts_
    else:
      output = occupied / counts
    # Untouched cells (where the ratio above is 0/0) get a value just above the
    # free threshold; with the default thresholds it lies between the two.
    output[counts == 0] = threshold[0] + 0.1
    # Quantise to three levels: 1.0 above the occupied threshold, 0.0 below
    # the free threshold, and the in-between marker for everything else.
    output[output > threshold[1]] = 1.0
    output[output < threshold[0]] = 0.0
    output[(output != 1.0) * (output != 0.0)] = threshold[0] + 0.1
    # save_map reads the module-level ``output`` assigned above.
    save_map(args.save, threshold, origins, resolution)

    # Draw live map
    if args.livemap:
      if args.show_individual_graph:
        # Each view below re-runs the update on fresh accumulators so that it
        # shows the contribution of this keyframe alone.
        if args.with_orb_slam_points:
          counts_orb_slam_mp = np.ones((numRows, numCols), dtype=float) * 0
          occupied_orb_slam_mp = np.ones((numRows, numCols), dtype=float) * 0
          update_map(occupied_orb_slam_mp, counts_orb_slam_mp, [kf_id], kfs_dict, mps, origins, resolution, y_check=y_check, only_end_point=args.only_end_points)
          output_orb_slam_mp = occupied_orb_slam_mp / counts_orb_slam_mp
          output_orb_slam_mp[counts_orb_slam_mp == 0] = threshold[0] + 0.1
          output_orb_slam_mp[output_orb_slam_mp > threshold[1]] = 1.0
          output_orb_slam_mp[output_orb_slam_mp < threshold[0]] = 0.0
          output_orb_slam_mp[(output_orb_slam_mp != 1.0) * (output_orb_slam_mp != 0.0)] = threshold[0] + 0.1
          cv2.imshow('ORB-SLAM Map Points Update', 1 - output_orb_slam_mp)
          cv2.waitKey(20)
        if args.with_extra_points:
          counts_extra = np.ones((numRows, numCols), dtype=float) * 0
          occupied_extra = np.ones((numRows, numCols), dtype=float) * 0
          update_map(occupied_extra, counts_extra, [kf_id], kfs_dict, extra_mps, origins, resolution, y_check=y_check, only_end_point=args.only_end_points)
          output_extra = occupied_extra / counts_extra
          output_extra[counts_extra == 0] = threshold[0] + 0.1
          output_extra[output_extra > threshold[1]] = 1.0
          output_extra[output_extra < threshold[0]] = 0.0
          output_extra[(output_extra != 1.0) * (output_extra != 0.0)] = threshold[0] + 0.1
          cv2.imshow('Extra Map Points Update', 1 - output_extra)
          cv2.waitKey(20)
      # Displayed inverted (1 - output), the same inversion save_map applies.
      cv2.imshow('Occupancy Grid Map', 1 - output)
      cv2.waitKey(20)
    print("Processed frame: {}".format(kf_id))
  if ended:
    # Hold the final windows until a key is pressed; the loop then starts over.
    cv2.waitKey(0)

# KITT0:
# python main.py --xmin -25 --xmax 20 --zmin -10 --zmax 40 --reso 0.1 --only_end_points 0
# python main.py --xmin -10 --xmax 10 --zmin -10 --zmax 10 --reso 0.05 --only_end_points 1