add support for "big depth" maps

rjw57 · Mar 23, 2017 · 32de55f · 32de55f
1 parent cc7f08f
commit 32de55f
Show file tree

Hide file tree

Showing 5 changed files with 206 additions and 103 deletions.
diff --git a/doc/conf.py b/doc/conf.py
@@ -58,9 +58,9 @@
 # built documents.
 #
 # The short X.Y version.
-version = '0.2.2'
+version = '0.2.3'
 # The full version, including alpha/beta/rc tags.
-release = '0.2.2'
+release = '0.2.3'
 
 # The language for content autogenerated by Sphinx. Refer to documentation
 # for a list of supported languages.

diff --git a/examples/dump_big_depth.py b/examples/dump_big_depth.py
@@ -0,0 +1,32 @@
+import json
+from freenect2 import Device, FrameType
+import numpy as np
+
+def main():
+    device = Device()
+    frames = {}
+    with device.running():
+        for type_, frame in device:
+            frames[type_] = frame
+            if FrameType.Color in frames and FrameType.Depth in frames:
+                break
+
+    rgb, depth = frames[FrameType.Color], frames[FrameType.Depth]
+    undistorted, registered, big_depth = device.registration.apply(
+        rgb, depth, with_big_depth=True)
+
+    rgb.to_image().save('output_rgb.png')
+    big_depth.to_image().save('output_depth.tiff')
+
+    with open('output_calib.json', 'w') as fobj:
+        json.dump({
+            'color': dict(
+                (k, getattr(device.color_camera_params, k))
+                for k in 'fx fy cx cy'.split()),
+            'ir': dict(
+                (k, getattr(device.ir_camera_params, k))
+                for k in 'fx fy cx cy k1 k2 k3 p1 p2'.split()),
+        }, fobj)
+
+if __name__ == '__main__':
+    main()
diff --git a/examples/dump_pcd.py b/examples/dump_pcd.py
@@ -20,8 +20,12 @@
 # Use the factory calibration to undistort the depth frame and register the RGB
 # frame onto it.
 rgb, depth = frames[FrameType.Color], frames[FrameType.Depth]
-undistorted, registered = device.registration.apply(rgb, depth)
+undistorted, registered, big_depth = device.registration.apply(
+    rgb, depth, with_big_depth=True)
 
 # Combine the depth and RGB data together into a single point cloud.
-with open('output.pcd', 'w') as fobj:
+with open('output.pcd', 'wb') as fobj:
     device.registration.write_pcd(fobj, undistorted, registered)
+
+with open('output_big.pcd', 'wb') as fobj:
+   device.registration.write_big_pcd(fobj, big_depth, rgb)
diff --git a/freenect2/__init__.py b/freenect2/__init__.py
@@ -1,65 +1,3 @@
-"""
-.. py:class:: ColorCameraParams
-
-    Color camera intrinsic calibration.
-
-    .. py:attribute:: fx
-
-        Focal length for x-axis (pixels)
-
-    .. py:attribute:: fy
-
-        Focal length for y-axis (pixels)
-
-    .. py:attribute:: cx
-
-        Principal point for x-axis (pixels)
-
-    .. py:attribute:: cy
-
-        Principal point for y-axis (pixels)
-
-.. py:class:: IrCameraParams
-
-    IR/depth camera intrinsic calibration.
-
-    .. py:attribute:: fx
-
-        Focal length for x-axis (pixels)
-
-    .. py:attribute:: fy
-
-        Focal length for y-axis (pixels)
-
-    .. py:attribute:: cx
-
-        Principal point for x-axis (pixels)
-
-    .. py:attribute:: cy
-
-        Principal point for y-axis (pixels)
-
-    .. py:attribute:: k1
-
-        Radial distortion co-efficient, 1st-order
-
-    .. py:attribute:: k2
-
-        Radial distortion co-efficient, 2nd-order
-
-    .. py:attribute:: k3
-
-        Radial distortion co-efficient, 3rd-order
-
-    .. py:attribute:: p1
-
-        Tangential distortion co-efficient
-
-    .. py:attribute:: p2
-
-        Tangential distortion co-efficient
-
-"""
 from __future__ import print_function
 
 from contextlib import contextmanager
@@ -79,6 +17,8 @@
     'FrameFormat',
     'Frame',
     'Registration',
+    'IrCameraParams',
+    'ColorCameraParams'
 )
 
 _FREENECT2_SINGLETON = None
@@ -160,6 +100,68 @@ def __call__(self, frame_type, frame):
     def get(self, timeout=False):
         return self.queue.get(True, timeout)
 
+class ColorCameraParams(object):
+    """
+    Color camera intrinsic calibration.
+
+    .. py:attribute:: fx
+
+        Focal length for x-axis (pixels)
+
+    .. py:attribute:: fy
+
+        Focal length for y-axis (pixels)
+
+    .. py:attribute:: cx
+
+        Principal point for x-axis (pixels)
+
+    .. py:attribute:: cy
+
+        Principal point for y-axis (pixels)
+    """
+
+class IrCameraParams(object):
+    """
+    IR/depth camera intrinsic calibration.
+
+    .. py:attribute:: fx
+
+        Focal length for x-axis (pixels)
+
+    .. py:attribute:: fy
+
+        Focal length for y-axis (pixels)
+
+    .. py:attribute:: cx
+
+        Principal point for x-axis (pixels)
+
+    .. py:attribute:: cy
+
+        Principal point for y-axis (pixels)
+
+    .. py:attribute:: k1
+
+        Radial distortion co-efficient, 1st-order
+
+    .. py:attribute:: k2
+
+        Radial distortion co-efficient, 2nd-order
+
+    .. py:attribute:: k3
+
+        Radial distortion co-efficient, 3rd-order
+
+    .. py:attribute:: p1
+
+        Tangential distortion co-efficient
+
+    .. py:attribute:: p2
+
+        Tangential distortion co-efficient
+    """
+
 class Device(object):
     """Control a single device.
 
@@ -498,6 +500,8 @@ class Registration(object):
 
     """
     def __init__(self, depth_p, rgb_p):
+        self.depth_p = depth_p
+        self.rgb_p = rgb_p
         self._c_object = ffi.gc(
             lib.freenect2_registration_create(depth_p, rgb_p),
             lib.freenect2_registration_dispose)
@@ -573,24 +577,47 @@ def get_points_xyz(self, undistorted, rows, cols):
             ffi.cast('float*', ys.ctypes.data),
             ffi.cast('float*', zs.ctypes.data)
         )
-        return xs, ys, zs
+        return xs, ys, -zs
 
     def get_points_xyz_array(self, undistorted):
         """Return a 3D array of x, y, z points for each point in an undistorted
         frame. Invalid points are Nan-ed.
 
         Args:
-            undistorted (:py:class:`Frame`): the undistorted depth frame
+            undistorted (:py:class:`.Frame`): the undistorted depth frame
 
         Returns:
-            A 512x424x3 array of 3D points. The last dimension corresponding to
+            A 424x512x3 array of 3D points. The last dimension corresponding to
             x, y and z.
 
         """
         cols, rows = np.meshgrid(
             np.arange(undistorted.width), np.arange(undistorted.height))
         return np.dstack(self.get_points_xyz(undistorted, rows, cols))
 
+    def get_big_points_xyz_array(self, big_depth):
+        """Like :py:meth:`.get_points_xyz_array` but operates on the "big" depth
+        map which can be returned from :py:meth:`.apply`.
+
+        Args:
+            big_depth (:py:class:`.Frame`): big 1920x1082 frame returned from
+                :py:meth:`.apply`.
+
+        Returns:
+            A 1082x1920x3 array of 3D points. The last dimension corresponding
+            to x, y and z.
+
+        """
+        points = np.ones((big_depth.height, big_depth.width, 3), dtype=np.float32)
+        points[..., 2] = 1e-3 * big_depth.to_array()
+        points[..., 0], points[..., 1] = np.meshgrid(
+            (np.arange(1920) - self.rgb_p.cx) / self.rgb_p.fx,
+            (1080-np.arange(-1, 1081) - self.rgb_p.cy) / self.rgb_p.fy)
+        points[..., 0] *= points[..., 2]
+        points[..., 1] *= points[..., 2]
+
+        return points
+
     def write_pcd(self, file_object, undistorted, registered=None):
         """Write depth map and (optionally) RGB data to libpcl-compatible PCD
         format file. If the registered RGB frame is present, each point is
@@ -604,38 +631,78 @@ def write_pcd(self, file_object, undistorted, registered=None):
         Args:
             file_object (file): A file object to write PCD data to
             undistorted (:py:class:`Frame`): the undistorted depth frame
-            rgb (:py:class:`Frame`): if not-None, the RGB data corresponding to
+            registered (:py:class:`Frame`): if not-None, the RGB data corresponding to
                 the depth frame.
         """
-        cols, rows = np.meshgrid(np.arange(undistorted.width), np.arange(undistorted.height))
-        xs, ys, zs = self.get_points_xyz(undistorted, rows, cols)
-        n_points = int(np.product(xs.shape))
-
-        file_object.write(b'VERSION .7\n')
-
-        if registered is None:
-            file_object.write(
-                b'FIELDS x y z\nSIZE 4 4 4\nTYPE F F F\nCOUNT 1 1 1\n')
-            data = np.zeros((n_points, 3), order='C', dtype=np.float32)
-            data[:, 0] = -xs.flatten()
-            data[:, 1] = -ys.flatten()
-            data[:, 2] = -zs.flatten()
-        else:
-            file_object.write(
-                b'FIELDS x y z rgb\nSIZE 4 4 4 4\nTYPE F F F F\nCOUNT 1 1 1 1\n')
-            bgrx = registered.to_array().astype(np.uint32)
-            rgbs = (
-                bgrx[..., 0] + (bgrx[..., 1] << 8) + (bgrx[..., 2] << 16)
-            ).view(np.float32)
-            data = np.zeros((n_points, 4), order='C', dtype=np.float32)
-            data[:, 0] = -xs.flatten()
-            data[:, 1] = -ys.flatten()
-            data[:, 2] = -zs.flatten()
-            data[:, 3] = rgbs.flatten()
-
-        file_object.write('WIDTH {}\n'.format(undistorted.width).encode())
-        file_object.write('HEIGHT {}\n'.format(undistorted.height).encode())
-        file_object.write(b'VIEWPOINT 0 0 0 1 0 0 0\n')
-        file_object.write('POINTS {}\n'.format(n_points).encode())
-        file_object.write(b'DATA binary\n')
-        file_object.write(data.tobytes())
+        write_pcd(
+            file_object, self.get_points_xyz_array(undistorted), registered)
+
+    def write_big_pcd(self, file_object, big_depth, rgb=None):
+        """Write depth map and (optionally) RGB data to libpcl-compatible PCD
+        format file. Works like :py:meth:`.write_pcd` except that it works on
+        the "big" depth map which can be returned from :py:meth:`apply`. If the
+        RGB frame is present, each point is coloured according to the image
+        otherwise the points are left uncoloured.
+
+        .. note::
+
+            Under Python 3 the file object *must* be opened in binary mode.
+
+        Args:
+            file_object (file): A file object to write PCD data to
+            big_depth (:py:class:`Frame`): the 1920x1082 de[th frame
+            registered (:py:class:`Frame`): if not-None, the RGB data from the
+                color camera
+        """
+        write_pcd(
+            file_object,
+            self.get_big_points_xyz_array(big_depth)[1:-1, ...], rgb)
+
+def write_pcd(file_object, points, rgb=None):
+    """Write 3d points and (optionally) RGB data to libpcl-compatible PCD
+    format file. If the registered RGB frame is present, each point is
+    coloured according to the image otherwise the points are left
+    uncoloured.
+
+    .. note::
+
+        Under Python 3 the file object *must* be opened in binary mode.
+
+    Args:
+        file_object (file): A file object to write PCD data to
+        points (array): A NxMx3 array of 3d points.
+        rgb (:py:class:`Frame`): if not-None, the RGB frame corresponding to
+            the points array. Assumed to be NxM.
+    """
+    assert len(points.shape) == 3
+    xs, ys, zs = points[..., 0], points[..., 1], points[..., 2]
+    n_points = int(np.product(points.shape[:-1]))
+
+    file_object.write(b'VERSION .7\n')
+
+    if rgb is None:
+        file_object.write(
+            b'FIELDS x y z\nSIZE 4 4 4\nTYPE F F F\nCOUNT 1 1 1\n')
+        data = np.zeros((n_points, 3), order='C', dtype=np.float32)
+        data[:, 0] = xs.flatten()
+        data[:, 1] = ys.flatten()
+        data[:, 2] = zs.flatten()
+    else:
+        file_object.write(
+            b'FIELDS x y z rgb\nSIZE 4 4 4 4\nTYPE F F F F\nCOUNT 1 1 1 1\n')
+        bgrx = rgb.to_array().astype(np.uint32)
+        rgbs = (
+            bgrx[..., 0] + (bgrx[..., 1] << 8) + (bgrx[..., 2] << 16)
+        ).view(np.float32)
+        data = np.zeros((n_points, 4), order='C', dtype=np.float32)
+        data[:, 0] = xs.flatten()
+        data[:, 1] = ys.flatten()
+        data[:, 2] = zs.flatten()
+        data[:, 3] = rgbs.flatten()
+
+    file_object.write('WIDTH {}\n'.format(points.shape[1]).encode())
+    file_object.write('HEIGHT {}\n'.format(points.shape[0]).encode())
+    file_object.write(b'VIEWPOINT 0 0 0 1 0 0 0\n')
+    file_object.write('POINTS {}\n'.format(n_points).encode())
+    file_object.write(b'DATA binary\n')
+    file_object.write(data.tobytes())
diff --git a/setup.py b/setup.py
@@ -8,7 +8,7 @@
 setup(
     name='freenect2',
     description='Python bindings for the libfreenect2 Kinect for Windows driver',
-    version='0.2.2',
+    version='0.2.3',
     author='Rich Wareham',
     author_email='rich.freenect2@richwareham.com',
     url='https://github.com/rjw57/freenect2-python',