Add camera localization code into the repo.

eroniki · Sep 30, 2019 · 4212ac8 · 4212ac8
1 parent d361769
commit 4212ac8
Show file tree

Hide file tree

Showing 2 changed files with 162 additions and 0 deletions.
diff --git a/app.py b/app.py
@@ -25,6 +25,7 @@
 from tf.tf import TFTree
 from skeleton.skeleton import people, skeleton
 import visualization
+from computer_vision import computer_vision
 
 import logging
 from logging.handlers import RotatingFileHandler
@@ -54,6 +55,8 @@ def __init__(self, key):
         self.login_manager.request_loader(self.request_loader)
 
         self.extrinsic_dict = self.load_extrinsics()
+        self.K, self.d = self.load_intrinsics()
+
         self.xform_tree = TFTree()
 
         for elem in self.extrinsic_dict["extrinsic_params"]:
@@ -85,6 +88,13 @@ def load_extrinsics(self):
         """Load extrinsic matrices from a json file."""
         return self.um.read_json("extrinsics.json")
 
+    def load_intrinsics(self):
+        """Load intrinsic parameters from a json file."""
+        data = self.um.read_json("intrinsics.json")
+        K = np.asarray(data["K"])
+        d = np.asarray(data["dist"])
+        return K, d
+
     def load_users(self):
         """Load users for authorization purposes from the json file."""
         return self.um.read_json("users.json")
@@ -206,6 +216,10 @@ def create_endpoints(self):
                               "get_matchstick_video",
                               self.get_matchstick_video)
 
+        self.app.add_url_rule("/locate_camera/<exp_id>/<left_cam_id>/<right_cam_id>/<frame_id>",
+                              "locate_camera_frame",
+                              self.locate_camera_frame)
+
         self.app.view_functions['index'] = self.index
         self.app.view_functions['video'] = self.video
         self.app.view_functions['video_feed'] = self.video_feed
@@ -239,6 +253,8 @@ def create_endpoints(self):
         self.app.view_functions['draw_matchsticks'] = self.draw_matchsticks
         self.app.view_functions['make_videofrom_matchsticks'] = self.make_videofrom_matchsticks
         self.app.view_functions['get_matchstick_video'] = self.get_matchstick_video
+        self.app.view_functions['locate_camera_frame'] = self.locate_camera_frame
+
 
 
     def index(self):
@@ -878,6 +894,83 @@ def log_n(self, n):
         return statement
 
 
+    @flask_login.login_required
+    def locate_camera_frame(self, exp_id, left_cam_id, right_cam_id, frame_id):
+        """Locate the camera with respect to the checkerboard."""
+        return Response(self.gen_locate_camera_frame(exp_id,
+                                                     left_cam_id, right_cam_id,
+                                                     frame_id),
+                        mimetype='multipart/x-mixed-replace; boundary=frame')
+
+    def gen_locate_camera_frame(self, exp_id, left_cam_id, right_cam_id, frame_id):
+        """Camera generator for the test_camera endpoint."""
+        exp = experiment.experiment(new_experiment=False, ts=str(exp_id))
+        room_name = exp.metadata["room"]
+        if room_name.lower() == "cears":
+            room_id = 1
+        elif room_name.lower() == "computer_lab":
+            room_id = 0
+
+        devices = self.rooms[room_id]["devices"]
+        devices.sort()
+
+        fname = str(frame_id) + ".png"
+
+        l_camera_name = os.path.basename(devices[int(left_cam_id)])
+        r_camera_name = os.path.basename(devices[int(right_cam_id)])
+
+        path_l = os.path.join(self.um.experiment_path(exp_id), "raw", l_camera_name, fname)  # noqa: E501
+
+        path_r = os.path.join(self.um.experiment_path(exp_id), "raw", r_camera_name, fname)  # noqa: E501
+
+        frame_l = cv2.imread(path_l, )
+        frame_r = cv2.imread(path_r, )
+
+        retval = True
+
+        if frame_l is None:
+            frame_l = cv2.imread("flask_app/static/task.jpg")
+            ret_val = False
+
+        if frame_r is None:
+            frame_r = cv2.imread("flask_app/static/task.jpg")
+            ret_val = False
+
+        pattern_shape = (9, 6)  # TODO: CHECK THIS
+        grid_size = 30  # TODO: CHECK THIS
+        text_l, corners_l, canvas_l, R_l, t_l = computer_vision.calculate_camera_pose(frame_l, self.K, self.d, pattern_shape=pattern_shape, grid_size=grid_size)  # noqa: E501
+        text_r, corners_r, canvas_r, R_r, t_r = computer_vision.calculate_camera_pose(frame_r, self.K, self.d, pattern_shape=pattern_shape, grid_size=grid_size)  # noqa: E501
+
+        T_l = np.eye(4)
+        T_r = np.eye(4)
+        if R_l is not None and R_r is not None:
+            T_l[0:3, 0:3] = R_l
+            T_r[0:3, 0:3] = R_r
+            T_l[0:3, 3] = t_l.ravel()
+            T_r[0:3, 3] = t_r.ravel()
+
+            T_l = np.eye(4)
+            T_r = np.linalg.inv(T_l).dot(T_r)
+
+        print T_l
+        print T_r
+        canvas = np.hstack([canvas_l, canvas_r])
+
+        text = "Left: " + text_l + " Right: " + text_r
+        cv2.putText(canvas, text, (20, 40), cv2.FONT_HERSHEY_SIMPLEX,
+                    1.0, (0, 0, 255), lineType=cv2.LINE_AA)
+
+        ret, jpeg = cv2.imencode('.jpg', canvas)
+
+        if ret:
+            img = jpeg.tobytes()
+        else:
+            pass
+
+        yield (b'--frame\r\n'
+               b'Content-Type: image/png;base64,\r\n\r\n' + img + b'\r\n')
+
+
 class User(flask_login.UserMixin):
     # TODO: Implement this
     pass

diff --git a/computer_vision.py b/computer_vision.py
@@ -71,3 +71,72 @@ def extract_thumbnail(img, joints):
     def undistort_points(points, K, dist):
         """Undistort points to eliminate the lens distortion."""
         return cv2.undistortPoints(points, K, dist)
+
+    @staticmethod
+    def _calculate_camera_pose(frame, K, d, corners, pattern_shape=(6, 4), grid_size=30):  # noqa: E501
+        """Calculate camera pose with a frame containing checkerboard in it."""
+        img = frame.copy()
+        axis = np.float32([[grid_size, 0, 0], [0, grid_size, 0],
+                           [0, 0, -grid_size]]).reshape(-1, 3)*2
+
+        objp = np.zeros((np.prod(pattern_shape), 3), np.float32)
+        objp[:, :2] = np.mgrid[0:pattern_shape[0],
+                               0:pattern_shape[1]].T.reshape(-1, 2) * grid_size
+
+        _, rvecs, tvecs = cv2.solvePnP(objp, corners, K, d)
+        R, _ = cv2.Rodrigues(rvecs)
+        # project 3D points onto image plane
+        imgpts, _ = cv2.projectPoints(axis,
+                                      rvecs, tvecs,
+                                      K, d)
+
+        canvas = computer_vision.draw_axis(img, corners, imgpts)
+        return R, tvecs, canvas
+
+    @staticmethod
+    def calculate_camera_pose(frame,  K, d, pattern_shape=(6, 4), grid_size=30):  # noqa: E501
+        """Calculate camera pose with a frame containing checkerboard in it."""
+        corners, canvas = computer_vision.detect_chessboard(frame, pattern_shape)  # noqa: E501
+
+        if corners is None:
+            canvas = frame
+            text = "No checkerboard"
+            return text, corners, canvas, None, None
+        else:
+            canvas = cv2.undistort(canvas, K, d)
+            R, t, canvas = computer_vision._calculate_camera_pose(frame,
+                                                                  K, d,
+                                                                  corners,
+                                                                  pattern_shape,  # noqa: E501
+                                                                  grid_size)
+            text = " ".join(np.round(t, 2).ravel().astype(str))
+        return text, corners, canvas, R, t
+
+    @staticmethod
+    def detect_chessboard(frame, pattern_shape=(7, 6)):
+        """Detect chessboard with a given shape in the frame."""
+        corners = None
+        canvas = None
+        img = frame.copy()
+        criteria = (cv2.TERM_CRITERIA_EPS +
+                    cv2.TERM_CRITERIA_MAX_ITER, 30, 0.001)
+
+        gray = cv2.cvtColor(frame, cv2.COLOR_BGR2GRAY)
+
+        ret, corners = cv2.findChessboardCorners(gray, pattern_shape)
+        if ret:
+            corners = cv2.cornerSubPix(gray, corners,
+                                       (11, 11), (-1, -1), criteria)
+            canvas = cv2.drawChessboardCorners(img, pattern_shape,
+                                               corners, ret)
+
+        return corners, canvas
+
+    @staticmethod
+    def draw_axis(img, corners, imgpts):
+        """Draw 3D axis on a given image."""
+        corner = tuple(corners[0].ravel())
+        img = cv2.line(img, corner, tuple(imgpts[0].ravel()), (255, 0, 0), 5)
+        img = cv2.line(img, corner, tuple(imgpts[1].ravel()), (0, 255, 0), 5)
+        img = cv2.line(img, corner, tuple(imgpts[2].ravel()), (0, 0, 255), 5)
+        return img