Source code for pymvg.camera_model

import numpy as np
import yaml

from .util import _undistort, get_rotation_matrix_and_quaternion, np2plain, \
     Bunch, plain_vec, my_rq, is_rotation_matrix, center, normalize, \
     point_msg_to_tuple, parse_rotation_msg, _cam_str, is_string
from .quaternions import quaternion_matrix, quaternion_from_matrix
from .ros_compat import sensor_msgs as sensor_msgs_compat

import warnings

# Define matrices to point ROS transforms such than +Z is directly
# ahead and +X is right.
rot_90 = np.array( [[ 0,0,1],
                    [ -1,0,0],
                    [ 0,-1,0]], dtype=np.float)
rot_90i = np.linalg.pinv(rot_90)

def warn_deprecation(attr):
    warnings.warn('CameraModel property %r will be removed'%attr, DeprecationWarning)

[docs]class CameraModel(object):
    """an implementation of the Camera Model used by ROS and OpenCV

    Tranformations: We can think about the overall projection to 2D in
    two steps. Step 1 takes 3D world coordinates and, with a simple
    matrix multiplication and perspective division, projects them to
    undistorted 2D coordinates. Step 2 takes these undistorted 2D
    coordinates and distorts them so they are 'distorted' and match up
    with a real camera with radial distortion, for example.

    3D world --(step1)----> undistorted 2D ---(step2)----> distorted 2D

    Step 1 is accomplished by making the world coordinates a
    homogeneous vector of length 4, multiplying by a 3x4 matrix M
    (built from P, R and t) to get values [r,s,t] in which the
    undistorted 2D coordinates are [r/t, s/t]. (The implementation is
    vectorized so that in fact many points at once can be
    transformed.)

    Step 2 is somewhat complicated in that it allows a separate focal
    length and camera center to be used for distortion. Undistorted 2D
    coordinates are transformed first to uncorrected normalized image
    coordinates using parameters from P, then corrected using a
    rectification matrix. These corrected normalized image coordinates
    are then used in conjunction with the distortion model to create
    distorted normalized pixels which are finally transformed to
    distorted image pixels by K.

    Coordinate system: the camera is looking at +Z, with +X rightward
    and +Y down. For more information, see
    http://www.ros.org/wiki/image_pipeline/CameraInfo

    As noted on the link above, this differs from the coordinate
    system of Harley and Zisserman, which has Z forward, Y up, and X
    to the left (looking towards +Z).'

    """
    __slots__ = [
        # basic properties
        'name', # a string with the camera name
        'width','height', # the size of the image

        # extrinsic parameters
        '_rquat', # the rotation quaternion, np.array with shape (4,)
        '_camcenter', # the center of the camera, np.array with shape (3,)

        # intrinsic parameters
        '_opencv_compatible',
        # these intrinsic parameters specified like OpenCV
        'P', # used for undistorted<->normalized, np.array with shape (3,4)
        'K', # used for distorted<->normalized, a scaled version of P[:3,:3], np.array with shape (3,3)

        # (The scaling of K, with the default alpha=0, is such that
        # every pixel in the undistorted image is valid, thus throwing
        # away some pixels. With alpha=1, P==K and all pixels in the
        # original image are in the undistorted image.)

        # the distortion model
        'distortion', # (distortion params) the distortion, np.array with shape (5,1) or (8,1)
        'rect', # (distortion params) the rectification, None or np.array with shape (3,3)

        '_cache', # cached computational results
        ]
    AXIS_FORWARD = np.array((0,0,1),dtype=np.float)
    AXIS_UP = np.array((0,-1,0),dtype=np.float)
    AXIS_RIGHT = np.array((1,0,0),dtype=np.float)

    # --- start of CameraModel constructors ------------------------------------

    def __init__(self, name, width, height, _rquat, _camcenter, P, K, distortion, rect):
        self.name = name
        self.width = width
        self.height = height
        self._rquat = _rquat
        self._camcenter = _camcenter
        self.P = P
        eps = 1e-8
        if abs(self.P[2,2]-1.0) > eps:
            raise ValueError('matrix P must have element (2,2) near 1.0')
        self.K = K
        self.distortion = distortion
        self.rect = rect

        self._opencv_compatible = (self.P[0,1]==0)
        assert np.allclose( P[:,3], np.zeros((3,)))
        self._cache = {}
        self._cache['Q'] = self.get_Q()
        self._cache['translation'] = self.get_translation()
        self._cache['Qt'] = self.get_Qt()
        self._cache['M'] = self.get_M()
        self._cache['Q_inv'] = self.get_Q_inv()
        self._cache['t_inv'] = self.get_t_inv()

    def __getstate__(self):
        """allow CameraModel to be pickled"""
        return self.to_dict()

    def __setstate__(self,state):
        tmp = CameraModel.from_dict(state)
        for attr in self.__slots__:
            setattr( self, attr, getattr( tmp, attr ) )

    @classmethod
    def _from_parts(cls,
                      translation=None,
                      camcenter=None,
                      rotation=None,
                      intrinsics=None,
                      name=None,
                      ):
        """Instantiate a Camera Model.

        params
        ------
        translation : converted to np.array with shape (3,)
          the translational position of the camera (note: not the camera center)
        camcenter : converted to np.array with shape (3,)
          the camera center (mutually exclusive with translation parameter)
        rotation : converted to np.array with shape (4,) or (3,3)
          the camera orientation as a quaternion or a 3x3 rotation vector
        intrinsics : a ROS CameraInfo message
          the intrinsic camera calibration
        name : string
          the name of the camera
        """
        if translation is not None and camcenter is not None:
            raise RuntimeError('translation and camcenter arguments are mutually exclusive')
        set_camcenter_from_translation = True
        if camcenter is not None:
            set_camcenter_from_translation = False
            camcenter = np.array(camcenter)
            assert camcenter.ndim==1
            assert camcenter.shape[0]==3
        if translation is None:
            translation = (0,0,0)
        if rotation is None:
            rotation = np.eye(3)
        if name is None:
            name = 'camera'

        rmat, rquat = get_rotation_matrix_and_quaternion(rotation)

        if set_camcenter_from_translation:
            t = np.array(translation)
            t.shape = 3,1
            camcenter = -np.dot( rmat.T, t )[:,0]
            del t

        _rquat = rquat

        if 1:
            # Initialize the camera calibration from a CameraInfo message.
            msg = intrinsics
            width = msg.width
            height = msg.height
            shape = (msg.height, msg.width)

            P = np.array(msg.P,dtype=np.float)
            P.shape = (3,4)
            if not np.allclose(P[:,3], np.zeros((3,))):
                raise NotImplementedError('not tested when 4th column of P is nonzero')

            K = np.array( msg.K, dtype=np.float)
            K.shape = (3,3)
            assert K.ndim == 2

            distortion = np.array(msg.D, dtype=np.float)
            if len(distortion) == 5:
                distortion.shape = (5,)
            elif len(distortion) == 8:
                distortion.shape = (8,)
            else:
                raise ValueError('distortion can have only 5 or 8 entries')

            assert distortion.ndim==1

            if msg.R is None:
                rect = None
            else:
                rect = np.array( msg.R, dtype=np.float )
                rect.shape = (3,3)
                if np.allclose(rect,np.eye(3)):
                    rect = None

        denom = P[2,2]
        if denom != 1.0:
            if rect is not None:
                warnings.warn(
                    'A non-normalized P matrix and a rectification matrix were '
                    'supplied. This case is not well tested and the behavior '
                    'should be considered undefined.')
            P = P/denom # normalize
        result = cls(name, width, height, _rquat, camcenter, P, K, distortion, rect)
        return result

    @classmethod
    def from_dict(cls, d, extrinsics_required=True ):
        translation = None
        rotation = None

        if 'image_height' in d:
            # format saved in ~/.ros/camera_info/<camera_name>.yaml
            #only needs w,h,P,K,D,R
            c = sensor_msgs_compat.msg.CameraInfo(
                height=d['image_height'],
                width=d['image_width'],
                P=d['projection_matrix']['data'],
                K=d['camera_matrix']['data'],
                D=d['distortion_coefficients']['data'],
                R=d['rectification_matrix']['data'])
            name = d['camera_name']
        else:
            # format saved by roslib.message.strify_message( sensor_msgs.msg.CameraInfo() )
            c = sensor_msgs_compat.msg.CameraInfo(
                height = d['height'],
                width = d['width'],
                P=d['P'],
                K=d['K'],
                D=d['D'],
                R=d['R'])
            name = d.get('name',None)
            translation = d.get('translation',None)
            rotation = d.get('Q',None)

        if translation is None or rotation is None:
            if extrinsics_required:
                raise ValueError('extrinsic parameters are required, but not provided')

        result = cls._from_parts(translation=translation,
                                   rotation=rotation,
                                   intrinsics=c,
                                   name=name,
                                   )
        return result

    @classmethod
    def load_camera_from_file( cls, fname, extrinsics_required=True ):
        if fname.endswith('.bag'):
            raise NotImplementedError('cannot open .bag file directly. Open '
                                      'with ROS and call '
                                      'CameraModel.load_camera_from_opened_bagfile(bag, ...)')
        elif (fname.endswith('.yaml') or
              fname.endswith('.json')):
            if fname.endswith('.yaml'):
                with open(fname,'r') as f:
                    d = yaml.safe_load(f)
            else:
                assert fname.endswith('.json')
                with open(fname,'r') as f:
                    d = json.load(f)
            return cls.from_dict(d, extrinsics_required=extrinsics_required)
        else:
            raise ValueError("only supports: .bag .yaml .json")

    @classmethod
[docs]    def load_camera_from_opened_bagfile( cls, bag, extrinsics_required=True ): # pragma: no cover
        """factory function for class CameraModel

        arguments
        ---------
        bag - an opened rosbag.Bag instance
        extrinsics_required - are extrinsic parameters required
        """
        camera_name = None
        translation = None
        rotation = None
        intrinsics = None

        for topic, msg, t in bag.read_messages():
            if 1:
                parts = topic.split('/')
                if parts[0]=='':
                    parts = parts[1:]
                topic = parts[-1]
                parts = parts[:-1]
                if len(parts)>1:
                    this_camera_name = '/'.join(parts)
                else:
                    this_camera_name = parts[0]
                # empty, this_camera_name, topic = parts
                # assert empty==''
            if camera_name is None:
                camera_name = this_camera_name
            else:
                assert this_camera_name == camera_name

            if topic == 'tf':
                translation = msg.translation
                rotation = msg.rotation # quaternion
            elif topic == 'matrix_tf':
                translation = msg.translation
                rotation = msg.rotation # matrix
            elif topic == 'camera_info':
                intrinsics = msg
            else:
                warnings.warn('skipping message topic %r'%topic)
                continue

        bag.close()

        if translation is None or rotation is None:
            if extrinsics_required:
                raise ValueError('no extrinsic parameters in bag file')
            else:
                translation = (np.nan, np.nan, np.nan)
                rotation = (np.nan, np.nan, np.nan, np.nan)
        else:
            translation = point_msg_to_tuple(translation)
            rotation = parse_rotation_msg(rotation)

        if intrinsics is None:
            raise ValueError('no intrinsic parameters in bag file')

        result = cls._from_parts(translation=translation,
                                   rotation=rotation,
                                   intrinsics=intrinsics,
                                   name=camera_name,
                                   )
        return result


    @classmethod
[docs]    def load_camera_from_M( cls, pmat, width=None, height=None, name='cam',
                            distortion_coefficients=None,
                            _depth=0, eps=1e-15 ):
        """create CameraModel instance from a camera matrix M"""
        pmat = np.array(pmat)
        assert pmat.shape==(3,4)
        M = pmat[:,:3]
        K,R = my_rq(M)
        if not is_rotation_matrix(R):
            # RQ may return left-handed rotation matrix. Make right-handed.
            assert np.allclose(np.dot(-K,-R), np.dot(K,R))
            R = -R
            K = -K
        a = K[2,2]
        if a==0:
            warnings.warn('ill-conditioned intrinsic camera parameters')
        else:
            if abs(a-1.0) > eps:
                if _depth > 0:
                    raise ValueError('cannot scale this pmat: %s'%( repr(pmat,)))
                new_pmat = pmat/a
                cam = cls.load_camera_from_M( new_pmat, width=width, height=height, name=name, _depth=_depth+1)
                return cam

        camcenter = center(pmat)[:,0]

        P = np.zeros( (3,4) )
        P[:3,:3]=K

        if distortion_coefficients is None:
            distortion_coefficients = np.zeros((5,))
        else:
            distortion_coefficients = np.array(distortion_coefficients)
            assert distortion_coefficients.shape == (5,)

        i = sensor_msgs_compat.msg.CameraInfo()
        i.width = width
        i.height = height
        i.D = [float(val) for val in distortion_coefficients]
        i.K = list(K.flatten())
        i.R = list(np.eye(3).flatten())
        i.P = list(P.flatten())
        result = cls._from_parts(camcenter = camcenter,
                                   rotation = R,
                                   intrinsics = i,
                                   name=name)
        return result

    @classmethod
    def load_camera_default(cls):
        pmat = np.array( [[ 300,   0, 320, 0],
                          [   0, 300, 240, 0],
                          [   0,   0,   1, 0]])
        return cls.load_camera_from_M( pmat, width=640, height=480, name='cam')

    @classmethod
    def load_camera_from_ROS_tf( cls,
                                 translation=None,
                                 rotation=None,
                                 **kwargs):
        rmatx, rquatx = get_rotation_matrix_and_quaternion(rotation)
        rmat = np.dot( rot_90i,rmatx)
        rmat, rquat = get_rotation_matrix_and_quaternion(rmat)
        if hasattr(translation,'x'):
            translation = (translation.x, translation.y, translation.z)
        C = np.array(translation)
        C.shape = (3,)

        return cls._from_parts(camcenter=C, rotation=rquat, **kwargs)

    @classmethod
    def load_camera_simple( cls,
                            fov_x_degrees=30.0,
                            width=640, height=480,
                            eye=(0,0,0),
                            lookat=(0,0,-1),
                            up=None,
                            name='simple',
                            distortion_coefficients=None,
                            ):
        aspect = float(width)/float(height)
        fov_y_degrees = fov_x_degrees/aspect
        f = (width/2.0) / np.tan(np.radians(fov_x_degrees)/2.0)
        cx = width/2.0
        cy = height/2.0
        M = np.array( [[ f, 0, cx, 0],
                       [ 0, f, cy, 0],
                       [ 0, 0,  1, 0]])
        c1 = cls.load_camera_from_M( M, width=width, height=height, name=name,
                                     distortion_coefficients=distortion_coefficients)
        c2 = c1.get_view_camera( eye=eye, lookat=lookat, up=up)
        return c2

    # --- end of CameraModel constructors --------------------------------------

    def __str__(self):
        return _cam_str(self.to_dict())

    def __eq__(self,other):
        assert isinstance( self, CameraModel )
        if not isinstance( other, CameraModel ):
            return False
        d1 = self.to_dict()
        d2 = other.to_dict()
        for k in d1:
            if k not in d2:
                return False
            v1 = d1[k]
            v2 = d2[k]
            if is_string(v1):
                if not v1==v2:
                    return False
            elif v1 is None:
                if not v2 is None:
                    return False
            else:
                if not np.allclose(np.array(v1), np.array(v2)):
                    return False
        for k in d2:
            if k not in d1:
                return False
        return True

    def __ne__(self,other):
        return not (self==other)

    def to_dict(self):
        d = {}
        d['name'] =self.name
        d['height'] = self.height
        d['width'] = self.width
        d['P'] = np2plain(self.P)
        d['K'] = np2plain(self.K)
        d['D'] = np2plain(self.distortion[:])
        if self.rect is None:
            d['R'] = np2plain(np.eye(3))
        else:
            d['R'] = np2plain(self.rect)
        d['translation']=np2plain(self._cache['translation'])
        d['Q']=np2plain(self.get_Q())
        return d

    # -------------------------------------------------
    # properties / getters

    def get_Q(self):
        R = quaternion_matrix(self._rquat)[:3,:3]
        return R
    def _get_Q(self):
        warn_deprecation( 'Q' )
        return self.get_Q()
    Q = property(_get_Q)

    def get_Qt(self):
        Q = self._cache['Q']
        t = np.array(self._cache['translation'],copy=True)
        t.shape = 3,1
        Rt = np.hstack((Q,t))
        return Rt
    def _get_Qt(self):
        warn_deprecation( 'Qt' )
        return self.get_Qt()
    Qt = property(_get_Qt)

    def get_M(self):
        Qt = self._cache['Qt']
        P33 = self.P[:,:3]
        M = np.dot( P33, Qt )
        return M
    def _get_M(self):
        warn_deprecation( 'M' )
        return self.get_M()
    M = property(_get_M)

    def get_translation(self):
        Q = self._cache['Q']
        C = np.array(self._camcenter)
        C.shape = (3,1)
        t = -np.dot(Q, C)[:,0]
        return t
    def _get_translation(self):
        warn_deprecation( 'translation' )
        return self.get_translation()
    translation = property(_get_translation)

    def get_Q_inv(self):
        Q = self._cache['Q']
        return np.linalg.pinv(Q)
    def _get_Q_inv(self):
        warn_deprecation( 'Q_inv')
        return self.get_Q_inv()
    Q_inv = property(_get_Q_inv)

    def get_t_inv(self):
        ti = np.array(self._camcenter)
        ti.shape = 3,1
        return ti
    def _get_t_inv(self):
        warn_deprecation( 't_inv' )
        return self.get_t_inv()
    t_inv = property(_get_t_inv)

    # -------------------------------------------------
    # other getters

[docs]    def is_opencv_compatible(self):
        """True iff there is no skew"""
        return self._opencv_compatible

[docs]    def is_distorted_and_skewed(self,max_skew_ratio=1e15):
        """True if pixels are skewed and distorted"""

        if self.is_skewed(max_skew_ratio=max_skew_ratio):
            if np.sum(abs(self.distortion)) != 0.0:
                return True
        return False

[docs]    def is_skewed(self,max_skew_ratio=1e15):
        """True if pixels are skewed"""

        # With default value, if skew is 15 orders of magnitude less
        # than focal length, return False.

        skew = self.P[0,1]
        fx = self.P[0,0]

        if abs(skew) > (abs(fx)/max_skew_ratio):
            return True
        return False

    def get_name(self):
        return self.name

    def get_extrinsics_as_bunch(self):
        msg = Bunch()
        msg.translation = Bunch()
        msg.rotation = Bunch()
        translation = self._cache['translation']
        for i in range(3):
            setattr(msg.translation,'xyz'[i], translation[i] )
        for i in range(4):
            setattr(msg.rotation,'xyzw'[i], self._rquat[i] )
        return msg

    def get_ROS_tf(self):
        rmatx = self.get_Q()
        rmat = np.dot( rot_90,rmatx)
        rmat2, rquat2 = get_rotation_matrix_and_quaternion(rmat)
        return self.get_camcenter(), rquat2

    def get_intrinsics_as_bunch(self):
        i = Bunch()
        i.height = self.height
        i.width = self.width
        assert len(self.distortion) == 5
        i.distortion_model = 'plumb_bob'
        i.D = plain_vec(self.distortion.flatten())
        i.K = plain_vec(self.K.flatten())
        i.R = plain_vec(self.get_rect().flatten())
        i.P = plain_vec(self.P.flatten())
        return i

    def get_camcenter(self):
        t_inv = self._cache['t_inv']
        return t_inv[:,0] # drop dimension

    def get_lookat(self,distance=1.0):
        world_coords = self.project_camera_frame_to_3d( [distance*self.AXIS_FORWARD] )
        world_coords.shape = (3,) # drop dimension
        return world_coords

    def get_up(self,distance=1.0):
        world_coords = self.project_camera_frame_to_3d( [distance*self.AXIS_UP] )
        world_coords.shape = (3,) # drop dimension
        return world_coords-self._camcenter

    def get_right(self,distance=1.0):
        cam_coords = np.array([[distance,0,0]])
        world_coords = self.project_camera_frame_to_3d( [distance*self.AXIS_RIGHT] )
        world_coords.shape = (3,) # drop dimension
        return world_coords-self._camcenter

    def get_view(self):
        return self.get_camcenter(), self.get_lookat(), self.get_up()

    def get_rotation_quat(self):
        return np.array(self._rquat)

    def get_rotation(self):
        return self._cache['Q']

    def get_K(self):
        return self.K

    def get_D(self):
        return self.distortion

    def get_rect(self):
        if self.rect is None:
            return np.eye(3)
        else:
            return self.rect

    def get_P(self):
        return self.P

[docs]    def save_to_bagfile(self,fname,roslib): # pragma: no cover
        """save CameraModel to ROS bag file

        arguments
        ---------
        fname - filename or file descriptor to save to
        roslib - the roslib module
        """

        roslib.load_manifest('rosbag')
        roslib.load_manifest('sensor_msgs')
        roslib.load_manifest('geometry_msgs')

        import sensor_msgs.msg
        import geometry_msgs
        import rosbag

        bagout = rosbag.Bag(fname, 'w')

        msg = extrinsics = geometry_msgs.msg.Transform()
        b = self.get_extrinsics_as_bunch()
        for name in 'xyz':
            setattr(msg.translation, name, getattr(b.translation,name) )
        for name in 'xyzw':
            setattr(msg.rotation, name, getattr(b.rotation,name) )

        topic = self.name + '/tf'
        bagout.write(topic, extrinsics)

        msg = intrinsics = sensor_msgs.msg.CameraInfo()
        b = self.get_intrinsics_as_bunch()
        # these are from image_geometry ROS package in the utest.cpp file
        msg.height = b.height
        msg.width = b.width
        msg.distortion_model = b.distortion_model
        msg.D = b.D
        msg.K = b.K
        msg.R = b.R
        msg.P = b.P

        topic = self.name.encode('ascii') + '/camera_info'
        bagout.write(topic, intrinsics)

        bagout.close()

    def save_intrinsics_to_yamlfile(self,fname):
        b = self.get_intrinsics_as_bunch()
        d = b.__dict__
        buf = yaml.dump(d)
        with open(fname,'w') as fd:
            fd.write( buf )

[docs]    def get_mirror_camera(self,axis='lr',hold_center=False):
        """return a copy of this camera whose x coordinate is (image_width-x)

        arguments
        ---------

        axis - string. Specifies the axis of the mirroring, either 'lr' or 'ud'.
        hold_center - boolean. Preserve the optical center?
        """
        assert axis in ['lr','ud']
        # Keep extrinsic coordinates, but flip intrinsic
        # parameter so that a mirror image is rendered.
        i = self.get_intrinsics_as_bunch()
        if axis=='lr':
            i.K[0] = -i.K[0]
            i.P[0] = -i.P[0]

            if not hold_center:
                i.P[1] = -i.P[1]

                i.K[2] = (self.width-i.K[2])
                i.P[2] = (self.width-i.P[2])
        else:
            # axis=='ud'
            i.K[4] = -i.K[4]
            i.P[5] = -i.P[5]

            if not hold_center:
                i.K[5] = (self.height-i.K[5])
                i.P[6] = (self.height-i.P[6])

        translation = self._cache['translation']
        Q = self._cache['Q']
        camnew = self._from_parts(
                              translation = translation,
                              rotation = Q,
                              intrinsics = i,
                              name = self.name + '_mirror',
                              )
        return camnew

[docs]    def get_flipped_camera(self):
        """return a copy of this camera looking in the opposite direction

        The returned camera has the same 3D->2D projection. (The
        2D->3D projection results in a vector in the opposite
        direction.)
        """
        cc, la, up = self.get_view()
        lv = la-cc # look vector

        lv2 = -lv
        up2 = -up
        la2 = cc+lv2

        camnew = self.get_view_camera(cc, la2, up2).get_mirror_camera(hold_center=True)
        camnew.distortion[3] = -camnew.distortion[3]

        if camnew.rect is not None:
            camnew.rect[0,:] = -camnew.rect[0,:]
            camnew.distortion[3] = -camnew.distortion[3]
            camnew.K[0,0] = -camnew.K[0,0]
        return camnew

[docs]    def get_view_camera(self, eye, lookat, up=None):
        """return a copy of this camera with new extrinsic coordinates"""
        eye = np.array(eye); eye.shape=(3,)
        lookat = np.array(lookat); lookat.shape=(3,)
        gen_up = False
        if up is None:
            up = np.array((0,-1,0))
            gen_up = True
        else:
            up = np.array(up)
            assert up.ndim==1
            assert up.shape[0]==3
        lv = lookat - eye
        f = normalize(lv)
        old_settings = np.seterr(invalid='ignore')
        s = normalize( np.cross( f, up ))
        np.seterr(**old_settings)
        if np.isnan(s[0]) and gen_up:
            up = np.array((0,0,1))
            s = normalize( np.cross( f, up ))
        assert not np.isnan(s[0]), 'invalid up vector'
        u = normalize( np.cross( f, s ))
        R = np.array( [[ s[0], u[0], f[0]],
                       [ s[1], u[1], f[1]],
                       [ s[2], u[2], f[2]]]).T

        eye.shape = (3,1)
        t = -np.dot(R,eye)

        result = self._from_parts(
                             translation=t,
                             rotation=R,
                             intrinsics=self.get_intrinsics_as_bunch(),
                             name=self.name,
                             )
        return result

[docs]    def get_aligned_camera(self, scale, rotation, translation):
        """return a copy of this camera with new extrinsic coordinates"""
        s,R,t = scale, rotation, translation
        cc, la, up = self.get_view()
        f = la-cc

        X = np.linalg.inv( R )

        fa = np.dot( f, X )
        cca0 = cc*s
        cca = np.dot( cca0, X )
        laa = cca+fa
        up2 = np.dot( up, X )

        cca2 = cca+t
        laa2 = laa+t

        return self.get_view_camera(cca2, laa2, up2)

    # --------------------------------------------------
    # image coordinate operations

    def undistort(self, nparr):
        # See http://opencv.willowgarage.com/documentation/cpp/camera_calibration_and_3d_reconstruction.html#cv-undistortpoints

        # Parse inputs
        nparr = np.array(nparr,copy=False)
        assert nparr.ndim==2
        assert nparr.shape[1]==2

        u = nparr[:,0]
        v = nparr[:,1]

        # prepare parameters
        K = self.get_K()

        fx = K[0,0]
        cx = K[0,2]
        fy = K[1,1]
        cy = K[1,2]

        # P=[fx' 0 cx' tx; 0 fy' cy' ty; 0 0 1 tz]

        P = self.get_P()
        fxp = P[0,0]
        cxp = P[0,2]
        fyp = P[1,1]
        cyp = P[1,2]

        # Apply intrinsic parameters to get normalized, distorted coordinates
        xpp = (u-cx)/fx
        ypp = (v-cy)/fy

        # Undistort
        (xp,yp) = _undistort( xpp, ypp, self.get_D() )

        # Now rectify
        R = self.rect
        if R is None:
            x = xp
            y = yp
        else:
            assert R.shape==(3,3)
            Rti = np.linalg.inv(R.T)
            uh = np.vstack( (xp,yp,np.ones_like(xp)) )
            XYWt = np.dot(Rti, uh)
            X = XYWt[0,:]
            Y = XYWt[1,:]
            W = XYWt[2,:]
            x = X/W
            y = Y/W

        # Finally, get (undistorted) pixel coordinates
        up = x*fxp + cxp
        vp = y*fyp + cyp

        return np.vstack( (up,vp) ).T

    def distort(self, nparr):
        # See http://opencv.willowgarage.com/documentation/cpp/camera_calibration_and_3d_reconstruction.html#cv-undistortpoints

        # Based on code in pinhole_camera_model.cpp of ROS image_geometry package.

        # Parse inputs
        nparr = np.array(nparr,copy=False)
        assert nparr.ndim==2
        assert nparr.shape[1]==2

        uv_rect_x = nparr[:,0]
        uv_rect_y = nparr[:,1]

        # prepare parameters
        P = self.get_P()

        fx = P[0,0]
        cx = P[0,2]
        Tx = P[0,3]
        fy = P[1,1]
        cy = P[1,2]
        Ty = P[1,3]

        x = (uv_rect_x - cx - Tx)/fx
        y = (uv_rect_y - cy - Ty)/fy

        if self.rect is not None:
            R = self.rect.T
            xy1 = np.vstack((x,y,np.ones_like(x)))
            X,Y,W = np.dot(R, xy1)
            xp = X/W
            yp = Y/W
        else:
            xp = x
            yp = y
        r2 = xp*xp + yp*yp
        r4 = r2*r2
        r6 = r4*r2
        a1 = 2*xp*yp
        D = self.distortion
        k1 = D[0]; k2=D[1]; p1=D[2]; p2=D[3]; k3=D[4]
        barrel = 1 + k1*r2 + k2*r4 + k3*r6
        if len(D)==8:
            barrel /= (1.0 + D[5]*r2 + D[6]*r4 + D[7]*r6)
        xpp = xp*barrel + p1*a1 + p2*(r2+2*(xp*xp))
        ypp = yp*barrel + p1*(r2+2*(yp*yp)) + p2*a1

        K = self.get_K()
        kfx = K[0,0]
        kcx = K[0,2]
        kfy = K[1,1]
        kcy = K[1,2]

        u = xpp*kfx + kcx
        v = ypp*kfy + kcy
        return np.vstack( (u,v) ).T

    # --------------------------------------------------
    # 3D <-> image coordinate operations

    def project_pixel_to_camera_frame(self, nparr, distorted=True, distance=1.0 ):
        if distorted:
            nparr = self.undistort(nparr)
        # now nparr is undistorted (aka rectified) 2d point data

        # Parse inputs
        nparr = np.array(nparr,copy=False)
        assert nparr.ndim==2
        assert nparr.shape[1]==2
        uv_rect_x = nparr[:,0]
        uv_rect_y = nparr[:,1]

        P = self.P/self.P[2,2] # normalize

        # transform to 3D point in camera frame at z=1
        y = (uv_rect_y            - P[1,2] - P[1,3]) / P[1,1]
        x = (uv_rect_x - P[0,1]*y - P[0,2] - P[0,3]) / P[0,0]
        z = np.ones_like(x)
        ray_cam = np.vstack((x,y,z))
        rl = np.sqrt(np.sum(ray_cam**2,axis=0))
        ray_cam = distance*(ray_cam/rl) # normalize then scale
        return ray_cam.T

    def project_camera_frame_to_pixel(self, pts3d, distorted=True):
        pts3d = np.array(pts3d,copy=False)
        assert pts3d.ndim==2
        assert pts3d.shape[1]==3

        # homogeneous and transposed
        pts3d_h = np.empty( (4,pts3d.shape[0]) )
        pts3d_h[:3,:] = pts3d.T
        pts3d_h[3] = 1

        # undistorted homogeneous image coords
        cc = np.dot(self.P, pts3d_h)

        # project
        pc = cc[:2]/cc[2]
        u, v = pc

        if distorted:
            # distort (the currently undistorted) image coordinates
            nparr = np.vstack((u,v)).T
            u,v = self.distort( nparr ).T
        return np.vstack((u,v)).T

    def project_pixel_to_3d_ray(self, nparr, distorted=True, distance=1.0 ):
        ray_cam = self.project_pixel_to_camera_frame( nparr, distorted=distorted, distance=distance )
        # transform to world frame
        return self.project_camera_frame_to_3d( ray_cam )

    def project_3d_to_pixel(self, pts3d, distorted=True):
        pts3d = np.array(pts3d,copy=False)
        assert pts3d.ndim==2
        assert pts3d.shape[1]==3

        # homogeneous and transposed
        pts3d_h = np.empty( (4,pts3d.shape[0]) )
        pts3d_h[:3,:] = pts3d.T
        pts3d_h[3] = 1

        M = self._cache['M']

        # undistorted homogeneous image coords
        cc = np.dot(M, pts3d_h)

        # project
        pc = cc[:2]/cc[2]
        u, v = pc

        if distorted:
            # distort (the currently undistorted) image coordinates
            nparr = np.vstack((u,v)).T
            u,v = self.distort( nparr ).T
        return np.vstack((u,v)).T

[docs]    def project_camera_frame_to_3d(self, pts3d):
        """take 3D coordinates in camera frame and convert to world frame"""
        Q_inv = self._cache['Q_inv']
        cam_coords = np.array(pts3d).T
        t = self.get_translation()
        t.shape = (3,1)
        world_coords = np.dot(Q_inv, cam_coords - t)
        return world_coords.T

[docs]    def project_3d_to_camera_frame(self, pts3d):
        """take 3D coordinates in world frame and convert to camera frame"""
        pts3d = np.array(pts3d)
        assert pts3d.ndim==2
        assert pts3d.shape[1]==3

        # homogeneous and transposed
        pts3d_h = np.empty( (4,pts3d.shape[0]) )
        pts3d_h[:3,:] = pts3d.T
        pts3d_h[3] = 1

        # undistorted homogeneous image coords
        Qt = self._cache['Qt']
        cc = np.dot(Qt, pts3d_h)

        return cc.T

    # --------------------------------------------
    # misc. helpers

[docs]    def camcenter_like(self,nparr):
        """create numpy array of camcenters like another array"""
        nparr = np.array(nparr,copy=False)
        assert nparr.ndim==2
        assert nparr.shape[1]==3
        t_inv = self._cache['t_inv']
        return np.zeros( nparr.shape ) + t_inv.T