#!/usr/bin/env python
"""
Camera class
@author: Dorian Tsai
@author: Peter Corke
"""
from math import cos, pi, sqrt, sin, tan
from abc import ABC, abstractmethod
import copy
from collections import namedtuple
import numpy as np
import matplotlib.pyplot as plt
import scipy
import cv2 as cv
from spatialmath import base, Line3, SO3
from machinevisiontoolbox.ImagePointFeatures import FeatureMatch
from machinevisiontoolbox.base import idisp
from machinevisiontoolbox.base.imageio import _isnotebook
# from machinevisiontoolbox.classes import Image
# import CameraVisualizer as CamVis
# from mpl_toolkits.mplot3d import Axes3D, art3d
from mpl_toolkits.mplot3d.art3d import Poly3DCollection
# from collections import namedtuple
from spatialmath import SE3
import spatialmath.base as smbase
from machinevisiontoolbox import Image
class CameraBase(ABC):
# list of attributes
_name = None # camera name (string)
_camtype = None # camera type (string)
_imagesize = None # number of pixels (horizontal, vertical)
_pp = None # principal point (horizontal, vertical)
_rhou = None # pixel imagesize (single pixel) horizontal
_rhov = None # pixel imagesize (single pixel) vertical
_image = None # image (TODO image class?), for now, just numpy array
_T = [] # camera pose (homogeneous transform, SE3 class)
_ax = [] # for plotting, axes handle
def __init__(
self,
name=None,
camtype="central",
rho=1,
imagesize=None,
sensorsize=None,
pp=None,
noise=None,
pose=None,
limits=None,
labels=None,
seed=None,
):
"""Abstract camera base class
:param name: camera instance name, defaults to None
:type name: str, optional
:param camtype: camera projection type, defaults to 'central'
:type camtype: str, optional
:param rho: pixel size, defaults to 1
:type rho: scalar or array_like(2), optional
:param imagesize: image dimension in pixels, defaults to None
:type imagesize: int or array_like(2), optional
:param sensorsize: image sensor size, defaults to None
:type sensorsize: array_like(2), optional
:param pp: principal point position, defaults to None
:type pp: array_like(2), optional
:param noise: standard deviation of image plane projection noise, defaults to None
:type noise: float, optional
:param pose: camera pose, defaults to None
:type pose: :class:`~spatialmath..pose3d.SE3`, optional
:param limits: bounds of virtual image plane [umin, umax, vmin, vmax], defaults to None
:type limits: array_like(4), optional
:param labels: axis labels for virtual image plane, defaults to ``('u', 'v')``
:type labels: 2-tuple of str, optional
:param seed: random number seed for projection noise, defaults to None
:type seed: int, optional
:raises TypeError: name must be a string
:raises TypeError: camtype must be a string
:raises ValueError: rho must be a 1- or 2-element vector
This abstract class is the base for all camera projection model
classes. All baseclass constructors support these options.
"""
if name is None:
self._name = camtype
else:
if not isinstance(name, str):
raise TypeError(name, "name must be a string")
self._name = name
if not isinstance(camtype, str):
raise TypeError(camtype, "camtype must be a string")
self._camtype = camtype
if imagesize is None:
if pp is None:
self.pp = (0, 0)
else:
self.pp = pp
else:
self.imagesize = imagesize
if pp is None:
self.pp = [x / 2 for x in self.imagesize]
else:
self.pp = pp
if sensorsize is not None:
self._rhou = sensorsize[0] / self.imagesize[1]
self._rhov = sensorsize[1] / self.imagesize[0]
else:
rho = base.getvector(rho)
if len(rho) == 1:
self._rhou = rho[0]
self._rhov = rho[0]
elif len(rho) == 2:
self._rhou = rho[0]
self._rhov = rho[1]
else:
raise ValueError(rho, "rho must be a 1- or 2-element vector")
if noise is not None:
self._noise = noise
self._random = np.random.default_rng(seed)
if pose is None:
self._pose = SE3()
else:
self._pose = SE3(pose)
self.pose0 = self.pose
self._noise = noise
self._image = None
self._ax = None
self._distortion = None
self.labels = labels
self.limits = limits
def reset(self):
"""
Reset camera pose (base method)
Restore camera to a copy of the pose given to the constructor. The copy
means that the camera pose can be modified freely, without destroying
the initial pose value.
"""
self.pose = self.pose0.copy()
def __str__(self):
"""
String representation of camera parameters (base method)
:return: string representation
:rtype: str
Multi-line string representation of camera intrinsic and extrinsic
parameters.
"""
# TODO, imagesize should be integers
s = ""
self.fmt = "{:>15s}: {}\n"
s += self.fmt.format("Name", self.name + " [" + self.__class__.__name__ + "]")
s += self.fmt.format("pixel size", " x ".join([str(x) for x in self.rho]))
if self.imagesize is not None:
s += self.fmt.format(
"image size", " x ".join([str(x) for x in self.imagesize])
)
s += self.fmt.format("pose", self.pose.strline(fmt="{:.3g}", orient="rpy/yxz"))
return s
def __repr__(self):
"""
Readable representatio of camera parameters (base method)
:return: string representation
:rtype: str
Multi-line string representation of camera intrinsic and extrinsic
parameters.
"""
return str(self)
@abstractmethod
def project_point(self, P, **kwargs):
pass
def project_line(self, *args, **kwargs):
raise NotImplementedError("not implemented for this camera model")
def project_conic(self, *args, **kwargs):
raise NotImplementedError("not implemented for this camera model")
@property
def name(self):
"""
Set/get camera name (base method)
A camera has a string-valued name that can be read and written.
Example:
.. runblock:: pycon
>>> from machinevisiontoolbox import CentralCamera
>>> camera = CentralCamera();
>>> camera.name
>>> camera.name = "foo"
>>> camera.name
"""
return self._name
@name.setter
def name(self, newname):
"""
Set camera name
:param newname: camera name
:type newname: str
"""
if isinstance(newname, str):
self._name = newname
else:
raise TypeError(newname, "name must be a string")
@property
def camtype(self):
"""
Set/get camera type (base method)
A camera has a string-valued type that can be read and written. This
is unique to the camera subclass and projection model.
Example:
.. runblock:: pycon
>>> from machinevisiontoolbox import CentralCamera
>>> camera = CentralCamera();
>>> camera.camtype
>>> camera.camtype = "foo"
>>> camera.camtype
"""
return self._camtype
@camtype.setter
def camtype(self, newcamtype):
"""
Set camera type
:param newcamtype: camera projection type
:type newcamtype: str
"""
if isinstance(newcamtype, str):
self._camtype = newcamtype
else:
raise TypeError(newcamtype, "camtype must be a string")
@property
def imagesize(self):
"""
Set/get size of virtual image plane (base method)
The dimensions of the virtual image plane is a 2-tuple, width and
height, that can be read or written. For writing the size must be an
iterable of length 2.
Example:
.. runblock:: pycon
>>> from machinevisiontoolbox import CentralCamera
>>> camera = CentralCamera.Default();
>>> camera.imagesize
>>> camera.imagesize = (500, 500)
>>> camera.imagesize
:note: If the principal point is not set, then setting imagesize
sets the principal point to the centre of the image plane.
:seealso: :meth:`width` :meth:`height` :meth:`nu` :meth:`nv`
"""
return self._imagesize
@imagesize.setter
def imagesize(self, npix):
"""
Set image plane size
:param npix: [description]
:type npix: array_like(2)
:raises ValueError: bad value
Sets the size of the virtual image plane.
:note: If the principle point is not set, then it
is set to the centre of the image plane.
:seealso: :meth:`width` :meth:`height` :meth:`nu` :meth:`nv`
"""
npix = base.getvector(npix, dtype="int")
if len(npix) == 1:
self._imagesize = np.r_[npix[0], npix[0]]
elif len(npix) in (2, 3):
# ignore color dimension in case it is given
self._imagesize = npix[:2]
else:
raise ValueError(npix, "imagesize must be a 1- or 2-element vector")
if self._pp is None:
self._pp = self._imagesize / 2
@property
def nu(self):
"""
Get image plane width (base method)
:return: width
:rtype: int
Number of pixels in the u-direction (width)
Example:
.. runblock:: pycon
>>> from machinevisiontoolbox import CentralCamera
>>> camera = CentralCamera.Default();
>>> camera.nu
:seealso: :meth:`nv` :meth:`width` :meth:`imagesize`
"""
return self._imagesize[0]
@property
def nv(self):
"""
Get image plane height (base method)
:return: height
:rtype: int
Number of pixels in the v-direction (height)
Example:
.. runblock:: pycon
>>> from machinevisiontoolbox import CentralCamera
>>> camera = CentralCamera.Default();
>>> camera.nv
:seealso: :meth:`nu` :meth:`height` :meth:`imagesize`
"""
return self._imagesize[1]
@property
def width(self):
"""
Get image plane width (base method)
:return: width
:rtype: int
Image plane height, number of pixels in the v-direction
Example:
.. runblock:: pycon
>>> from machinevisiontoolbox import CentralCamera
>>> camera = CentralCamera.Default();
>>> camera.width
:seealso: :meth:`nu` :meth:`height`
"""
return self._imagesize[0]
@property
def height(self):
"""
Get image plane height (base method)
:return: height
:rtype: int
Image plane width, number of pixels in the u-direction
Example:
.. runblock:: pycon
>>> from machinevisiontoolbox import CentralCamera
>>> camera = CentralCamera.Default();
>>> camera.height
:seealso: :meth:`nv` :meth:`width`
"""
return self._imagesize[1]
@property
def pp(self):
"""
Set/get principal point coordinate (base method)
The principal point is the coordinate of the point where
the optical axis pierces the image plane. It is a 2-tuple which can
be read or written. For writing the size must be an
iterable of length 2.
Example:
.. runblock:: pycon
>>> from machinevisiontoolbox import CentralCamera
>>> camera = CentralCamera.Default();
>>> camera.pp
:seealso: :meth:`u0` :meth:`v0`
"""
return self._pp
@pp.setter
def pp(self, pp):
"""
Set principal point coordinate
:param pp: principal point
:type pp: array_like(2)
:seealso: :meth:`pp` :meth:`u0` :meth:`v0`
"""
pp = base.getvector(pp)
if len(pp) == 1:
self._pp = np.r_[pp[0], pp[0]]
elif len(pp) == 2:
self._pp = pp
else:
raise ValueError(pp, "pp must be a 1- or 2-element vector")
@property
def u0(self):
"""
Get principal point: horizontal coordinate (base method)
:return: horizontal component of principal point
:rtype: float
Example:
.. runblock:: pycon
>>> from machinevisiontoolbox import CentralCamera
>>> camera = CentralCamera();
>>> camera.u0
:seealso: :meth:`v0` :meth:`pp`
"""
return self._pp[0]
@property
def v0(self):
"""
Get principal point: vertical coordinate (base method)
:return: vertical component of principal point
:rtype: float
Example:
.. runblock:: pycon
>>> from machinevisiontoolbox import CentralCamera
>>> camera = CentralCamera();
>>> camera.v0
:seealso: :meth:`u0` :meth:`pp`
"""
return self._pp[1]
@property
def rhou(self):
"""
Get pixel width (base method)
:return: horizontal pixel size
:rtype: float
Example:
.. runblock:: pycon
>>> from machinevisiontoolbox import CentralCamera
>>> camera = CentralCamera.Default();
>>> camera.rhou
:seealso: :meth:`rhov` :meth:`rho`
"""
return self._rhou
# this is generally the centre of the image, has special meaning for
# perspective camera
@property
def rhov(self):
"""
Get pixel width (base method)
:return: vertical pixel size
:rtype: float
Example:
.. runblock:: pycon
>>> from machinevisiontoolbox import CentralCamera
>>> camera = CentralCamera.Default();
>>> camera.rhov
:seealso: :meth:`rhov` :meth:`rho`
"""
return self._rhov
@property
def rho(self):
"""
Get pixel dimensions (base method)
:return: horizontal pixel size
:rtype: ndarray(2)
Example:
.. runblock:: pycon
>>> from machinevisiontoolbox import CentralCamera
>>> camera = CentralCamera();
>>> camera.rhov
:seealso: :meth:`rhou` :meth:`rhov`
"""
return np.array([self._rhou, self._rhov])
# @property
# def image(self):
# return self._image
# @image.setter
# def image(self, newimage):
# """
# :param newimage: [description]
# :type newimage: [type]
# """
# self._image = Image(newimage)
@property
def pose(self):
"""
Set/get camera pose (base method)
The camera pose with respect to the global frame can be read or written
as an :class:`~spatialmath..pose3d.SE3` instance.
Example:
.. runblock:: pycon
>>> from machinevisiontoolbox import CentralCamera
>>> from spatialmath import SE3
>>> camera = CentralCamera();
>>> camera.pose
>>> camera.pose = SE3.Trans(1, 2, 3)
>>> camera
:note: Changes the pose of the current camera instance, whereas
:meth:`move` clones the camera instance with a new pose.
:seealso: :meth:`move`
"""
return self._pose
@pose.setter
def pose(self, newpose):
"""
Set camera pose
:param newpose: pose of camera frame
:type newpose: :class:`~spatialmath..pose3d.SE3` or ndarray(4,4)
:seealso: :meth:`move`
"""
self._pose = SE3(newpose)
@property
def noise(self):
"""
Set/Get projection noise (base method)
:return: standard deviation of noise added to projected image plane points
:rtype: float
The noise parameter is set by the object constructor.
Example:
.. runblock:: pycon
>>> from machinevisiontoolbox import CentralCamera
>>> camera = CentralCamera.Default();
>>> camera.project_point([0, 0, 3])
>>> camera.noise = 2
>>> camera.project_point([0, 0, 2])
>>> camera.project_point([0, 0, 2])
:seealso: :meth:`project_point`
"""
return self._noise
@noise.setter
def noise(self, noise):
self._noise = noise
@property
def distortion(self):
r"""
Set/Get distortion model (base method)
:return: distortion model
:rtype: array_like()
The distortion model is a vector of various lengths that can be read or written.
It is passed directly to OpenCV functions which define how it is used:
- 4-element vector, :math:`[k_1, k_2, p_1, p_2]`
- 5-element vector, :math:`[k_1, k_2, p_1, p_2, k_3]`
- 8-element vector, :math:`[k_1, k_2, p_1, p_2, k_3, k_4, k_5, k_6]`
- 12-element vector, :math:`[k_1, k_2, p_1, p_2, k_3, k_4, k_5, k_6, s_1, s_2, s_3, s_4]`,
- 14-element vector, :math:`[k_1, k_2, p_1, p_2, k_3, k_4, k_5, k_6, s_1, s_2, s_3, s_4, \tau_x, \tau_y]`
The elements :math:`k_i` are radial distortion coefficients, :math:`p_i` are
tangential distortion coefficients, :math:`s_i` are thin prism
distortion coefficients, and :math:`\tau_i` apply when the camera's image plane
is tilted with respect to the lens.
If the vector is ``None``, then zero distortion (all coefficients are zero) is
assumed.
:seealso: :meth:`~CentralCamera.project_point` `OpenCV distortion model <https://docs.opencv.org/4.x/d9/d0c/group__calib3d.html>`_
"""
return self._distortion
@distortion.setter
def distortion(self, distortion):
self._distortion = distortion
def move(self, T, name=None, relative=False):
"""
Move camera (base method)
:param T: pose of camera frame
:type T: :class:`~spatialmath..pose3d.SE3`
:param relative: move relative to pose of original camera, defaults to False
:type relative: bool, optional
:return: new camera object
:rtype: :class:`CameraBase` subclass
Returns a copy of the camera object with pose set to ``T``.
Example:
.. runblock:: pycon
>>> from machinevisiontoolbox import CentralCamera
>>> from spatialmath import SE3
>>> camera = CentralCamera();
>>> camera.move(SE3.Trans(0.1, 0.2, 0.3))
>>> camera
:note: The ``plot`` method of this cloned camera will create a new
window.
:seealso: :meth:`pose`
"""
newcamera = copy.copy(self)
if name is not None:
newcamera.name = name
else:
newcamera.name = self.name + "-moved"
newcamera._ax = None
if relative:
newcamera.pose = self.pose * T
else:
newcamera.pose = T
return newcamera
# ----------------------- plotting ----------------------------------- #
def _new_imageplane(self, fig=None, ax=None):
"""
Create a new virtual image plane if required
:param fig: Matplotlib figure number, defaults to None
:type fig: int, optional
:param ax: Matplotlob axes, defaults to None
:type ax: :class:`matplotlib.axes`, optional
:return: whether virtual image plane exists
:rtype: bool
If this camera already has a virtual image plane, return True.
Otherwise, create an axes, and optionally a figure, and return False.
"""
if _isnotebook():
ax = plt.gca() # return current or create new
if self._ax is None or self._ax is not ax:
self._ax = ax
self._fig = plt.gcf()
return False
else:
return True
else:
# if not Jupyter, reuse an existing imageplane plot
if self._ax is not None:
return True
if (fig is None) and (ax is None):
# create our own handle for the figure/plot
# print('creating new figure and axes for camera')
fig, ax = plt.subplots() # TODO *args, **kwargs?
# TODO elif ax is a plot handle, else raise ValueError
self._ax = ax
self._fig = fig
return False
def _init_imageplane(self, fig=None, ax=None):
"""
Create plot window for camera image plane
:param fig: figure to plot into, defaults to None
:type fig: figure handle, optional
:param ax: axis to plot into, defaults to None
:type ax: 2D axis handle, optional
:return: figure and axis
:rtype: (fig, axis)
Creates a 2D axis that represents the image plane of the virtual
camera.
:seealso: :meth:`plot` :meth:`mesh`
"""
if self._new_imageplane(fig, ax):
return self._ax
ax = self._ax
if self._image is not None:
# if camera has an image, display said image
idisp(self._image, fig=fig, ax=ax, title=self._name, drawonly=True)
else:
if self.limits is None:
ax.set_xlim(0, self.nu)
ax.set_ylim(0, self.nv)
else:
ax.set_xlim(self.limits[0], self.limits[1])
ax.set_ylim(self.limits[2], self.limits[3])
ax.autoscale(False)
ax.set_aspect("equal")
ax.invert_yaxis()
ax.grid(True)
if self.labels is None:
ax.set_xlabel("u (pixels)")
ax.set_ylabel("v (pixels)")
else:
ax.set_xlabel(self.labels[0])
ax.set_ylabel(self.labels[1])
ax.set_title(self.name)
ax.set_facecolor("lightyellow")
try:
ax.figure.canvas.manager.set_window_title(
"Machine Vision Toolbox for Python"
)
except AttributeError:
# can happen during unit test without GUI
pass
# TODO figure out axes ticks, etc
return ax # likely this return is not necessary
def clf(self):
"""
Clear the virtual image plane (base method)
Every camera object has a virtual image plane drawn using Matplotlib.
Remove all points and lines from the image plane.
:seealso: :meth:`plot_point` :meth:`plot_line` :meth:`disp`
"""
if self._ax is not None:
for artist in self._ax.get_children():
try:
artist.remove()
except:
pass
def plot_point(
self, P, *fmt, return_artist=False, objpose=None, pose=None, ax=None, **kwargs
):
"""
Plot points on virtual image plane (base method)
:param P: 3D world point or points, or 2D image plane point or points
:type P: ndarray(3,), ndarray(3,N), or ndarray(2,), ndarray(2,N)
:param objpose: transformation for the 3D points, defaults to None
:type objpose: :class:`~spatialmath..pose3d.SE3`, optional
:param pose: pose of the camera, defaults to None
:type pose: :class:`~spatialmath..pose3d.SE3`, optional
:param ax: axes to plot into
:type ax: :class:`matplotlib.axes`
:param kwargs: additional arguments passed to :obj:`~matplotlib.pyplot.plot`
:return: Matplotlib line objects
:rtype: list of :class:`~matplotlib.lines.Line2d`
3D world points are first projected to the image plane and then
plotted on the camera's virtual image plane.
Points are organized as columns of the arrays.
Example::
>>> from machinevisiontoolbox import CentralCamera
>>> from spatialmath import SE3
>>> camera = CentralCamera.Default()
>>> camera.plot_point([0.2, 0.3, 2])
>>> camera.plot_point([0.2, 0.3, 2], 'r*')
>>> camera.plot_point([0.2, 0.3, 2], pose=SE3(0.1, 0, 0))
.. plot::
from machinevisiontoolbox import CentralCamera
from spatialmath import SE3
camera = CentralCamera.Default()
camera.plot_point([0.2, 0.3, 2])
camera.plot_point([0.2, 0.3, 2], 'r*')
camera.plot_point([0.2, 0.3, 2], pose=SE3(0.1, 0, 0))
:note:
- Successive calls add items to the virtual image plane.
- This method is common to all ``CameraBase`` subclasses, but it
invokes a camera-specific projection method.
:seealso: :meth:`plot_line2` :meth:`plot_line3` :meth:`plot_wireframe` :meth:`clf`
"""
self._init_imageplane(ax)
if not isinstance(P, np.ndarray):
P = base.getvector(P)
if P.shape[0] == 3:
# plot world points
p = self.project_point(P, pose=pose, objpose=objpose)
else:
# plot image plane points
p = P
if p.shape[0] != 2:
raise ValueError("p must have be (2,), (3,), (2,n), (3,n)")
defaults = dict(markersize=6, color="k")
if len(fmt) == 0:
fmt = ["o"]
kwargs = {**defaults, **kwargs}
artist = self._ax.plot(p[0, :], p[1, :], *fmt, **kwargs)
if plt.isinteractive():
plt.show(block=False)
if return_artist:
return p, artist[0]
else:
return p
def plot_line2(self, l, *args, **kwargs):
r"""
Plot 2D line on virtual image plane (base method)
:param l: homogeneous line
:type l: array_like(3)
:param kwargs: arguments passed to ``plot``
Plot the homogeneous line on the camera's virtual image plane. The line
is expressed in the form
.. math:: \ell_0 u + \ell_1 v + \ell_2 = 0
Example:
.. runblock:: pycon
>>> from machinevisiontoolbox import CentralCamera
>>> camera = CentralCamera.Default()
>>> camera.plot_line2([1, 0.2, -500])
:note:
- Successive calls add items to the virtual image plane.
- This method is common to all ``CameraBase`` subclasses, but it
invokes a camera-specific projection method.
:seealso: :meth:`plot_point` :meth:`plot_line3` :meth:`clf`
"""
# get handle for this camera image plane
self._init_imageplane()
plt.autoscale(False)
base.plot_homline(l, *args, ax=self._ax, **kwargs)
# def plot_line3(self, L, nsteps=21, **kwargs):
# """
# Plot 3D line on virtual image plane (base method)
# :param L: 3D line or lines in Plucker coordinates
# :type L: :class:`~spatialmath..geom3d.Line3`
# :param kwargs: arguments passed to ``plot``
# The Plucker lines are projected to the camera's virtual image plane and
# plotted. Each line is approximated by ``nsteps`` points, each of which
# is projected, allowing straight lines to appear curved after projection.
# Example:
# .. runblock:: pycon
# >>> from machinevisiontoolbox import CentralCamera, mkcube
# >>> from spatialmath import Line3
# >>> camera = CentralCamera()
# >>> line = Line3.Join((-1, -2, -3), (4, 5, 6))
# >>> camera.plot_line3(line, 'k--')
# .. note::
# - Successive calls add items to the virtual image plane.
# - This method is common to all ``CameraBase`` subclasses, but it
# invokes a camera-specific projection method.
# :seealso: :meth:`plot_point` :meth:`plot_line2` :meth:`plot_wireframe` :meth:`clf`
# """
# # draw 3D line segments
# s = np.linspace(0, 1, nsteps)
# this is actually pretty tricky
# - how to determine which part of the 3D line is visible
# - if highly curved it may be in two or more segments
# for line in L:
# l = self.project_line(line)
# # straight world lines are not straight, plot them piecewise
# P = (1 - s) * P0[:, np.newaxis] + s * P2[:, np.newaxis]
# uv = self.project_point(P, pose=pose)
def plot_wireframe(
self, X, Y, Z, *fmt, objpose=None, pose=None, nsteps=21, **kwargs
):
"""
Plot 3D wireframe in virtual image plane (base method)
:param X: world X coordinates
:type X: ndarray(N,M)
:param Y: world Y coordinates
:type Y: ndarray(N,M)
:param Z: world Z coordinates
:type Z: ndarray(N,M)
:param objpose: transformation for the wireframe points, defaults to None
:type objpose: :class:`~spatialmath..pose3d.SE3`, optional
:param pose: pose of the camera, defaults to None
:type pose: :class:`~spatialmath..pose3d.SE3`, optional
:param nsteps: number of points for each wireframe segment, defaults to 21
:type nsteps: int, optional
:param kwargs: arguments passed to ``plot``
The 3D wireframe is projected to the camera's virtual image plane. Each
wire link in the wireframe is approximated by ``nsteps`` points, each of
which is projected, allowing straight edges to appear curved.
Example::
>>> from machinevisiontoolbox import CentralCamera, mkcube
>>> from spatialmath import SE3
>>> camera = CentralCamera.Default()
>>> X, Y, Z = mkcube(0.2, pose=SE3(0, 0, 1), edge=True)
>>> camera.plot_wireframe(X, Y, Z, 'k--')
.. plot::
from machinevisiontoolbox import CentralCamera, mkcube
from spatialmath import SE3
camera = CentralCamera.Default()
X, Y, Z = mkcube(0.2, pose=SE3(0, 0, 1), edge=True)
camera.plot_wireframe(X, Y, Z, 'k--')
:seealso: :func:`mkcube` :obj:`spatialmath.base.cylinder` :obj:`spatialmath.base.sphere` :obj:`spatialmath.base.cuboid`
"""
# self._ax.plot_surface(X, Y, Z)
# plt.show()
# check that mesh matrices conform
if X.shape != Y.shape or X.shape != Z.shape:
raise ValueError("matrices must be the same shape")
if pose is None:
pose = self.pose
if objpose is not None:
pose = objpose.inv() * pose
# get handle for this camera image plane
self._init_imageplane()
plt.autoscale(False)
# draw 3D line segments
s = np.linspace(0, 1, nsteps)
# c.clf
# holdon = c.hold(1);
for i in range(X.shape[0] - 1): # i=1:numrows(X)-1
for j in range(X.shape[1] - 1): # j=1:numcols(X)-1
P0 = np.r_[X[i, j], Y[i, j], Z[i, j]]
P1 = np.r_[X[i + 1, j], Y[i + 1, j], Z[i + 1, j]]
P2 = np.r_[X[i, j + 1], Y[i, j + 1], Z[i, j + 1]]
if self.camtype == "perspective":
# straight world lines are straight on the image plane
uv = self.project_point(np.c_[P0, P1], pose=pose)
else:
# straight world lines are not straight, plot them piecewise
P = (1 - s) * P0[:, np.newaxis] + s * P1[:, np.newaxis]
uv = self.project_point(P, pose=pose)
self._ax.plot(uv[0, :], uv[1, :], *fmt, **kwargs)
if self.camtype == "perspective":
# straight world lines are straight on the image plane
uv = self.project_point(np.c_[P0, P2], pose=pose)
else:
# straight world lines are not straight, plot them piecewise
P = (1 - s) * P0[:, np.newaxis] + s * P2[:, np.newaxis]
uv = self.project_point(P, pose=pose)
self._ax.plot(uv[0, :], uv[1, :], *fmt, **kwargs)
for j in range(X.shape[1] - 1): # j=1:numcols(X)-1
P0 = [X[-1, j], Y[-1, j], Z[-1, j]]
P1 = [X[-1, j + 1], Y[-1, j + 1], Z[-1, j + 1]]
# if c.perspective
# straight world lines are straight on the image plane
uv = self.project_point(np.c_[P0, P1], pose=pose)
# else
# # straight world lines are not straight, plot them piecewise
# P = bsxfun(@times, (1-s), P0) + bsxfun(@times, s, P1);
# uv = c.project(P, 'setopt', opt);
self._ax.plot(uv[0, :], uv[1, :], *fmt, **kwargs)
# c.hold(holdon); # turn hold off if it was initially off
plt.draw()
def disp(self, im, **kwargs):
"""
Display image on virtual image plane (base method)
:param im: image to display
:type im: :class:`Image` instance
:param kwargs: options to :func:`~machinevisiontoolbox.base.imageio.idisp()`
An image is displayed on camera's the virtual image plane.
.. note: The dimensions of the image plane should match the dimensions of the image.
:seealso: :func:`machinevisiontoolbox.base.idisp()`
"""
self.imagesize = (im.shape[1], im.shape[0])
self._init_imageplane()
im.disp(ax=self._ax, title=False, **kwargs)
plt.autoscale(False)
def plot(
self=None,
pose=None,
scale=1,
shape="camera",
label=True,
alpha=1,
solid=False,
color="r",
projection="ortho",
frame=False,
ax=None,
):
"""
Plot 3D camera icon in world view (base method)
:param pose: camera pose
:type pose: :class:`~spatialmath..pose3d.SE3`
:param scale: scale factor, defaults to 1
:type scale: float
:param shape: icon shape: 'frustum' [default], 'camera'
:type shape: str, optional
:param label: show camera name, defaults to True
:type label: bool, optional
:param alpha: transparency of icon, defaults to 1
:type alpha: float, optional
:param solid: icon comprises solid faces, defaults to False
:type solid: bool, optional
:param color: icon color, defaults to 'r'
:type color: str, optional
:param projection: projection model for new axes, defaults to 'ortho'
:type projection: str, optional
:param ax: axes to draw in, defaults to current 3D axes
:type ax: :class:`~matplotlib.Axes3D`, optional
:return: axes drawn into
:rtype: :class:`~matplotlib.Axes3D`
Plot a 3D icon representing the pose of a camera into a 3D Matplotlib
plot. Two icons are supported: the traditional frustum, and a
simplistic camera comprising a box and cylinder.
:note: If ``pose`` is not given it defaults to the pose of the
instance.
"""
# if (fig is None) and (ax is None):
# # create our own handle for the figure/plot
# print('creating new figure and axes for camera')
# fig = plt.figure()
# ax = fig.gca(projection='3d')
# # ax.set_aspect('equal')
"""[summary]
face order -x, +y, +x, -y
"""
# get axes to draw in
ax = smbase.axes_logic(ax, 3, projection=projection)
if pose is None:
pose = self.pose
# draw camera-like object:
if shape == "frustum":
# TODO make this kwargs or optional inputs
# side colors:
# +x red
# -y red
# +y green
# -y yellow
length = scale
widthb = scale / 10
widtht = scale
widthb /= 2
widtht /= 2
b0 = np.array([-widthb, -widthb, 0, 1])
b1 = np.array([-widthb, widthb, 0, 1])
b2 = np.array([widthb, widthb, 0, 1])
b3 = np.array([widthb, -widthb, 0, 1])
t0 = np.array([-widtht, -widtht, length, 1])
t1 = np.array([-widtht, widtht, length, 1])
t2 = np.array([widtht, widtht, length, 1])
t3 = np.array([widtht, -widtht, length, 1])
# bottom/narrow end
T = pose.A
b0 = (T @ b0)[:-1]
b1 = (T @ b1)[:-1]
b2 = (T @ b2)[:-1]
b3 = (T @ b3)[:-1]
# wide/top end
t0 = (T @ t0)[:-1]
t1 = (T @ t1)[:-1]
t2 = (T @ t2)[:-1]
t3 = (T @ t3)[:-1]
# Each set of four points is a single side of the Frustrum
# points = np.array([[b0, b1, t1, t0], [b1, b2, t2, t1], [
# b2, b3, t3, t2], [b3, b0, t0, t3]])
points = [
np.array([b0, b1, t1, t0]), # -x face
np.array([b1, b2, t2, t1]), # +y face
np.array([b2, b3, t3, t2]), # +x face
np.array([b3, b0, t0, t3]), # -y face
]
poly = Poly3DCollection(
points, facecolors=["r", "g", "r", "y"], alpha=alpha
)
ax.add_collection3d(poly)
elif shape == "camera":
# the box is centred at the origin and its centerline parallel to the
# z-axis. Its z-extent is -bh/2 to bh/2.
W = 0.5 # width & height of the box
L = 1.2 # length of the box
cr = 0.2 # cylinder radius
ch = 0.4 # cylinder height
cn = 12 # number of facets of cylinder
a = 3 # length of axis line segments
# draw the box part of the camera
smbase.plot_cuboid(
sides=np.r_[W, W, L] * scale,
pose=pose,
filled=solid,
color=color,
alpha=0.5 * alpha if solid else alpha,
ax=ax,
)
# draw the lens
smbase.plot_cylinder(
radius=cr * scale,
height=np.r_[L / 2, L / 2 + ch] * scale,
resolution=cn,
pose=pose,
filled=solid,
color=color,
alpha=0.5 * alpha,
ax=ax,
)
if label:
ax.set_xlabel("X")
ax.set_ylabel("Y")
ax.set_zlabel("Z")
if frame is True:
self.pose.plot(
length=scale * 1.5, style="line", color=color, flo=(0.07, 0, -0.01)
)
elif frame is not False:
self.pose.plot(**frame)
return ax
def _add_noise_distortion(self, uv):
"""
Add noise to pixel coordinates
:param uv: image plane point coordinates
:type uv: ndarray(2,N)
:return: point coordinates with additive noise
:rtype: ndarray(2,N)
Model noise in the image process by adding zero-mean Gaussian noise
to the coordinates of projected world points. The noise has a
standard deviation specified by the camera constructor.
:seealso: :meth:`noise`
"""
# distort the pixels
# add Gaussian noise with specified standard deviation
if self.noise is not None:
uv += self._random.normal(0.0, self.noise, size=uv.shape)
return uv
[docs]
class CentralCamera(CameraBase):
"""
Create central camera projection model
.. inheritance-diagram:: machinevisiontoolbox.Camera.CentralCamera
:top-classes: machinevisiontoolbox.Camera.Camera
:parts: 1
:param f: focal length, defaults to 8mm
:type f: float, optional
:param distortion: camera distortion parameters, defaults to None
:type distortion: array_like(5), optional
:param kwargs: arguments passed to :class:`CameraBase` constructor
A camera object contains methods for projecting 3D points and lines
to the image plane, as well as supporting a virtual image plane onto
which 3D points and lines can be drawn.
:references:
- Robotics, Vision & Control for Python, Section 13.1, P. Corke, Springer 2023.
:seealso: :class:`CameraBase` :class:`FishEyeCamera` :class:`SphericalCamera`
"""
[docs]
def __init__(self, f=1, distortion=None, **kwargs):
super().__init__(camtype="perspective", **kwargs)
# TODO some of this logic to f and pp setters
self.f = f
self._distortion = distortion
[docs]
@classmethod
def Default(cls, **kwargs):
r"""
Set default central camera parameters
:return: central camera model
:rtype: :class:`CentralCamera` instance
Initialize a central camera with: focal length of 8mm, :math:`10\mu\mbox{m}` pixels,
image size of :math:`1000 \times 1000` with principal point at (500, 500).
Example:
.. runblock:: pycon
>>> from machinevisiontoolbox import CentralCamera
>>> camera = CentralCamera.Default(name='camera1')
>>> camera
:references:
- Robotics, Vision & Control for Python, Section 13.1, P. Corke, Springer 2023.
:seealso: :class:`CentralCamera`
"""
default = {
"f": 0.008,
"rho": 10e-6,
"imagesize": 1000,
"pp": (500, 500),
"name": "default perspective camera",
}
return CentralCamera(**{**default, **kwargs})
def __str__(self):
"""
String representation of central camera parameters
:return: string representation
:rtype: str
Multi-line string representation of camera intrinsic and extrinsic
parameters.
"""
s = super().__str__()
s += self.fmt.format("principal pt", self.pp)
s += self.fmt.format("focal length", self.f)
return s
[docs]
def project_point(
self,
P,
pose=None,
objpose=None,
behind=True,
visibility=False,
retinal=False,
**kwargs,
):
r"""
Project 3D points to image plane
:param P: 3D world point or points in Euclidean or homogeneous form
:type P: array_like(3), array_like(3,n), array_like(4), array_like(4,n)
:param pose: camera pose with respect to the world frame, defaults to
camera's ``pose`` attribute
:type pose: :class:`~spatialmath..pose3d.SE3`, optional
:param objpose: 3D point reference frame, defaults to world frame
:type objpose: :class:`~spatialmath..pose3d.SE3`, optional
:param behind: points behind the camera indicated by NaN, defaults to True
:type behind: bool, optional
:param visibility: return visibility array, defaults to False
:type visibility: bool
:param retinal: transform to retinal coordinates, defaults to False
:type retinal: bool, optional
:return: image plane points, optional visibility vector
:rtype: ndarray(2,n), ndarray(n)
Project a 3D point to the image plane
.. math::
\hvec{p} = \mat{C} \hvec{P}
where :math:`\mat{C}` is the camera calibration matrix and
:math:`\hvec{p}` and :math:`\hvec{P}` are the image plane and world
frame coordinates respectively, in homogeneous form.
World points are given as a 1D array or the columns of a 2D array of
Euclidean or homogeneous coordinates. The computed image plane
coordinates are Euclidean or homogeneous and given as a 1D array or the
corresponding columns of a 2D array.
If ``pose`` is specified it is used for the camera frame pose, otherwise
the attribute ``pose`` is used. The object's ``pose`` attribute is not
updated if ``pose`` is specified.
A single point can be specified as a 3-vector, multiple points as an
array with three rows and each column is the 3D point coordinate (X, Y,
Z).
The points ``P`` are by default with respect to the world frame, but
they can be transformed by specifying ``objpose``.
If world points are behind the camera and ``behind`` is True then the
image plane coordinates are set to NaN.
if ``visibility`` is True then each projected point is checked to ensure
it lies in the bounds of the image plane. In this case there are two
return values: the image plane coordinates and an array of booleans
indicating if the corresponding point is visible.
If ``retinal`` is True then project points in retinal coordinates,
in units of metres with respect to the principal point.
Example:
.. runblock:: pycon
>>> from machinevisiontoolbox import CentralCamera
>>> camera = CentralCamera.Default()
>>> camera.project_point((0.3, 0.4, 2))
:references:
- Robotics, Vision & Control for Python, Section 13.1, P. Corke, Springer 2023.
:seealso: :meth:`C` :meth:`project_point` :meth:`project_line` :meth:`project_quadric`
"""
if pose is None:
pose = self.pose
C = self.C(pose, retinal=retinal)
if isinstance(P, np.ndarray):
if P.ndim == 1:
P = P.reshape((-1, 1)) # make it a column
else:
P = base.getvector(P, out="col")
if P.shape[0] == 3:
P = base.e2h(P) # make it homogeneous
euclidean = True
else:
euclidean = False
# project 3D points
if objpose is not None:
P = objpose.A @ P
x = C @ P
if behind:
x[2, x[2, :] < 0] = np.nan # points behind the camera are set to NaN
if euclidean:
# Euclidean points given, return Euclidean points
x = base.h2e(x)
# add Gaussian noise and distortion
if self._distortion:
x = self._distort(x)
x = self._add_noise_distortion(x)
# do visibility check if required
if visibility:
visible = (
~np.isnan(x[0, :])
& (x[0, :] >= 0)
& (x[1, :] >= 0)
& (x[0, :] < self.nu)
& (x[1, :] < self.nv)
)
return x, visible
else:
return x
else:
# homogeneous points given, return homogeneous points
return x
[docs]
def project_line(self, lines):
r"""
Project 3D lines to image plane
:param lines: Plucker line or lines
:type lines: :class:`~spatialmath..geom3d.Line3` instance with N values
:return: 2D homogeneous lines, one per column
:rtype: ndarray(3,N)
The :class:`~spatialmath..geom3d.Line3` object can contain multiple lines. The result array has one
column per line, and each column is a vector describing the image plane
line in homogeneous form :math:`\ell_0 u + \ell_1 v + \ell_2 = 0`.
The projection is
.. math::
\ell = \vex{\mat{C} \sk{\vec{L}} \mat{C}^{\top}}
where :math:`\mat{C}` is the camera calibration matrix and :math:`\sk{\vec{L}}`
is the skew matrix representation of the Plucker line.
Example:
.. runblock:: pycon
>>> from machinevisiontoolbox import CentralCamera
>>> from spatialmath import Line3
>>> line = Line3.Join((-3, -4, 5), (5, 2, 6))
>>> line
>>> camera = CentralCamera()
>>> camera.project_line(line)
:references:
- Robotics, Vision & Control for Python, Section 13.7.1, P. Corke, Springer 2023.
:seealso: :meth:`C` :class:`~spatialmath..geom3d.Line3` :meth:`project_point` :meth:`project_quadric`
"""
if not isinstance(lines, Line3):
raise ValueError("expecting Line3 lines")
# project Plucker lines
lines2d = []
C = self.C()
for line in lines:
l = base.vex(C @ line.skew() @ C.T)
x = l / np.max(np.abs(l)) # normalize by largest element
lines2d.append(x)
return np.column_stack(lines2d)
[docs]
def project_quadric(self, Q):
r"""
Project 3D quadric to image plane
:param Q: quadric matrix
:type Q: ndarray(4,4)
:return: image plane conic
:rtype: ndarray(3,3)
Quadrics, short for quadratic surfaces, are a rich family of
3-dimensional surfaces. There are 17 standard types including spheres,
ellipsoids, hyper- boloids, paraboloids, cylinders and cones all
described by points :math:`\vec{x} \in \mathbb{P}^3` such that
.. math::
\hvec{x}^{\top} \mat{Q} \hvec{x} = 0
The outline of the quadric is projected to a conic section on the image
plane
.. math::
c^* = \mat{C} \mat{Q}^* \mat{C}^{\top}
where :math:`(\mat{X})^* = det(\mat{X}) \mat{X}^{-1}` is the adjugate
operator.
Example:
.. runblock:: pycon
>>> from machinevisiontoolbox import CentralCamera
>>> from spatialmath import SE3
>>> T_cam = SE3.Trans(0.2, 0.1, -5) * SE3.Rx(0.2)
>>> Q = np.diag([1, 1, 1, -1]) # unit sphere at origin
>>> camera = CentralCamera.Default(f=0.015, pose=T_cam);
>>> camera.project_quadric(Q)
:references:
- Robotics, Vision & Control for Python, Section 13.7.1, P. Corke, Springer 2023.
:seealso: :meth:`C` :meth:`project_point` :meth:`project_line`
"""
if not smbase.ismatrix(Q, (4, 4)):
raise ValueError("expecting 4x4 conic matrix")
return self.C() @ Q @ self.C().T
[docs]
def epiline(self, p, camera2):
r"""
Compute epipolar line
:param p: image plane point or points
:type p: array_like(2) or ndarray(2,N)
:param camera2: second camera
:type camera2: :class:`CentralCamera` instance
:return: epipolar line or lines in homogeneous form
:rtype: ndarray(3), ndarray(3,N)
Compute the epipolar line in ``camera2`` induced by the image plane
points ``p`` in the current camera. Each line is given by
.. math::
\ell = \mat{F} {}^1 \hvec{p}
which is in homogeneous form :math:`\ell_0 u + \ell_1 v + \ell_2 = 0`
and the conjugate point :math:`{}^2 \vec{p}` lies on this line.
Example:
.. runblock:: pycon
>>> from machinevisiontoolbox import CentralCamera
>>> from spatialmath import SE3
>>> camera1 = CentralCamera.Default(name='camera1')
>>> camera2 = CentralCamera.Default(pose=SE3(0.1, 0.05, 0), name='camera2')
>>> P = [-0.2, 0.3, 5] # world point
>>> p1 = camera1.project_point(P) # project to first camera
>>> camera1.epiline(p1, camera2) # epipolar line in second camera
:references:
- Robotics, Vision & Control for Python, Section 14.2.1, P. Corke, Springer 2023.
:seealso: :meth:`plot_epiline` :meth:`CentralCamera.F`
"""
# p is 3 x N, result is 3 x N
return self.F(camera2) @ base.e2h(p)
[docs]
def plot_epiline(self, F, p, *fmt, **kwargs):
r"""
Plot epipolar line
:param F: fundamental matrix
:type F: ndarray(3,3)
:param p: image plane point or points
:type p: array_like(2) or ndarray(2,N)
:param fmt: line style argument passed to ``plot``
:param kwargs: additional line style arguments passed to ``plot``
Plot the epipolar line induced by the image plane points ``p`` in the
camera's virtual image plane. Each line is given by
.. math::
\ell = \mat{F} {}^1 \hvec{p}
which is in homogeneous form :math:`\ell_0 u + \ell_1 v + \ell_2 = 0`
and the conjugate point :math:`{}^2 \vec{p}` lies on this line.
Example:
.. runblock:: pycon
>>> from machinevisiontoolbox import CentralCamera
>>> from spatialmath import SE3
>>> camera1 = CentralCamera.Default(name='camera1')
>>> camera2 = CentralCamera.Default(pose=SE3(0.1, 0.05, 0), name='camera2')
>>> P = [-0.2, 0.3, 5] # world point
>>> p1 = camera1.project_point(P) # project to first camera
>>> camera2.plot_point(P, 'kd') # project and display in second camera
>>> camera2.plot_epiline(camera1.F(camera2), p1) # plot epipolar line in second camera
:references:
- Robotics, Vision & Control for Python, Section 14.2.1, P. Corke, Springer 2023.
:seealso: :meth:`plot_point` :meth:`epiline` :meth:`CentralCamera.F`
"""
# p is 3 x N, result is 3 x N
self.plot_line2(F @ base.e2h(p), *fmt, **kwargs)
[docs]
def plot_line3(self, L, **kwargs):
"""
Plot 3D line on virtual image plane (base method)
:param L: 3D line in Plucker coordinates
:type L: :class:`~spatialmath..geom3d.Line3`
:param kwargs: arguments passed to ``plot``
The Plucker line is projected to the camera's virtual image plane and
plotted.
:note:
- Successive calls add items to the virtual image plane.
- This method is common to all ``CameraBase`` subclasses, but it
invokes a camera-specific projection method.
:seealso: :meth:`plot_point` :meth:`plot_line2` :meth:`plot_wireframe` :meth:`clf`
"""
l = self.project_line(L)
for hl in l.T:
self.plot_line2(hl, **kwargs)
[docs]
def ray(self, points, pose=None):
"""
Project image plane points to a ray
:param points: image plane points
:type points: ndarray(2,N)
:param pose: camera pose, defaults to None
:type pose: :class:`~spatialmath..pose3d.SE3`, optional
:return: corresponding Plucker lines
:rtype: :class:`~spatialmath..geom3d.Line3`
For each image plane point compute the equation of a Plucker line
that represents the 3D ray from the camera origin through the image
plane point.
Example:
.. runblock:: pycon
>>> from machinevisiontoolbox import CentralCamera
>>> camera = CentralCamera.Default()
>>> line = camera.ray((100, 200))
>>> line
:references:
- "Multiview Geometry", Hartley & Zisserman, p.162
- Robotics, Vision & Control for Python, Section 14.3, P. Corke, Springer 2023.
:seealso: :class:`~spatialmath..geom3d.Line3`
"""
# define Plucker line in terms of point (centre of camera) and direction
C = self.C(pose=pose)
Mi = np.linalg.inv(C[:3, :3])
v = C[:, 3]
lines = []
for point in base.getmatrix(points, (2, None)).T:
lines.append(Line3.PointDir(-Mi @ v, Mi @ smbase.e2h(point)))
return Line3(lines)
@property
def centre(self):
"""
Position of camera frame
:return: Euclidean coordinate of the camera frame's origin
:rtype: ndarray(3)
Example:
.. runblock:: pycon
>>> from machinevisiontoolbox import CentralCamera
>>> from spatialmath import SE3
>>> camera1 = CentralCamera.Default(name='camera1', pose=SE3.Trans(1,2,3))
>>> camera1
>>> camera1.centre
"""
return self.pose.t
@property
def center(self):
"""
Position of camera frame
:return: Euclidean coordinate of the camera frame's origin
:rtype: ndarray(3)
Example:
.. runblock:: pycon
>>> from machinevisiontoolbox import CentralCamera
>>> from spatialmath import SE3
>>> camera1 = CentralCamera.Default(name='camera1', pose=SE3.Trans(1,2,3))
>>> camera1
>>> camera1.center
"""
return self.pose.t
[docs]
def fov(self):
"""
Camera field-of-view angles
:return: field of view angles in radians
:rtype: ndarray(2)
Computes the field of view angles (2x1) in radians for the camera
horizontal and vertical directions.
Example:
.. runblock:: pycon
>>> from machinevisiontoolbox import CentralCamera
>>> camera1 = CentralCamera.Default(name='camera1')
>>> camera1.fov()
:references:
- Robotics, Vision & Control for Python, Section 13.1.4, P. Corke,
Springer 2023.
"""
try:
return 2 * np.arctan(np.r_[self.imagesize] / 2 * np.r_[self.rho] / self.f)
except:
raise ValueError("imagesize or rho properties not set")
[docs]
def distort(self, points):
"""
Compute distorted coordinate
:param points: image plane points
:type points: ndarray(2,n)
:returns: distorted image plane coordinates
:rtype: ndarray(2,n)
Compute the image plane coordinates after lens distortion has been
applied. The lens distortion model is initialized at constructor time.
"""
if self._distortion is None:
return points
# convert to normalized image coordinates
X = np.linalg.inv(self.K) * smbase.e2h(points)
# unpack coordinates
u = X[0, :]
v = X[1, :]
# unpack distortion vector
k = self._distortion[:3]
p = self._distortion[3:]
r = np.sqrt(u**2 + v**2) # distance from principal point
# compute the shift due to distortion
delta_u = (
u * (k[0] * r**2 + k[1] * r**4 + k[2] * r**6)
+ 2 * p[0] * u * v
+ p[1] * (r**2 + 2 * u**2)
)
delta_v = (
v * (k[0] * r**2 + k[1] * r**4 + k[2] * r**6)
+ p[0] * (r**2 + 2 * v**2)
+ 2 * p[1] * u * v
)
# distorted coordinates
ud = u + delta_u
vd = v + delta_v
return self.K * smbase.e2h(np.r_[ud, vd]) # convert to pixel coords
@property
def fu(self):
"""
Get focal length in horizontal direction
:return: focal length in horizontal direction
:rtype: float
Example:
.. runblock:: pycon
>>> from machinevisiontoolbox import CentralCamera
>>> camera = CentralCamera.Default(name='camera1')
>>> camera.fu
:seealso: :meth:`fv` :meth:`f`
"""
return self._fu
@property
def fv(self):
"""
Get focal length in vertical direction
:return: focal length in vertical direction
:rtype: float
Example:
.. runblock:: pycon
>>> from machinevisiontoolbox import CentralCamera
>>> camera = CentralCamera.Default(name='camera1')
>>> camera.fv
:seealso: :meth:`fu` :meth:`f`
"""
return self._fv
@property
def f(self):
"""
Set/get focal length
:return: focal length in horizontal and vertical directions
:rtype: ndarray(2)
Return focal length in horizontal and vertical directions.
Example:
.. runblock:: pycon
>>> from machinevisiontoolbox import CentralCamera
>>> camera = CentralCamera.Default(name='camera1')
>>> camera.f
>>> camera.f = 0.015
>>> camera.f
>>> camera.f = [0.015, 0.020]
>>> camera.f
:note: These are normally identical but will differ if the sensor
has non-square pixels or the frame grabber is changing the aspect
ratio of the image.
:seealso: :meth:`fu` :meth:`fv`
"""
return np.r_[self._fu, self._fv]
@f.setter
def f(self, f):
"""[summary]
:param f: focal length
:type f: scalar or array_like(2)
:raises ValueError: incorrect length of ``f``
"""
f = base.getvector(f)
if len(f) == 1:
self._fu = f[0]
self._fv = f[0]
elif len(f) == 2:
self._fu = f[0]
self._fv = f[1]
else:
raise ValueError(f, "f must be a 1- or 2-element vector")
@property
def fpix(self):
"""
Get focal length in pixels
:return: focal length in horizontal and vertical directions in pixels
:rtype: ndarray(2)
Example:
.. runblock:: pycon
>>> from machinevisiontoolbox import CentralCamera
>>> camera = CentralCamera.Default(name='camera1')
>>> camera.fpix
:seealso: :meth:`f`
"""
return np.r_[self._fu / self._rhou, self._fv / self._rhov]
@property
def K(self):
"""
Intrinsic matrix of camera
:return: intrinsic matrix
:rtype: ndarray(3,3)
Return the camera intrinsic matrix.
Example:
.. runblock:: pycon
>>> from machinevisiontoolbox import CentralCamera
>>> camera = CentralCamera.Default(name='camera1')
>>> camera.K
:references:
- Robotics, Vision & Control for Python, Section 13.1, P. Corke, Springer 2023.
:seealso: :meth:`C` :meth:`pp` :meth:`rho`
"""
# fmt: off
K = np.array([[self.fu / self.rhou, 0, self.u0],
[ 0, self.fv / self.rhov, self.v0],
[ 0, 0, 1]
], dtype=np.float64)
# fmt: on
return K
# =================== camera calibration =============================== #
[docs]
def C(self, pose=None, retinal=False):
"""
Camera projection matrix
:param T: camera pose with respect to world frame, defaults to pose from camera object
:type T: :class:`~spatialmath..pose3d.SE3`, optional
:param retinal: transform to retinal coordinates, default False
:type retinal: bool, optional
:return: camera projection/calibration matrix
:rtype: ndarray(3,4)
Return the camera matrix which projects 3D points to the image plane.
It is a function of the camera's intrinsic and extrinsic parameters.
If ``retinal`` is True then project points in retinal coordinates,
in units of metres with respect to the principal point.
Example:
.. runblock:: pycon
>>> from machinevisiontoolbox import CentralCamera
>>> camera = CentralCamera.Default(name='camera1')
>>> camera.C()
>>> camera.C(SE3.Trans(0.1, 0, 0))
>>> camera.move(SE3(0.1, 0, 0)).C()
:references:
- Robotics, Vision & Control for Python, Section 13.1, P. Corke, Springer 2023.
:seealso: :meth:`project_point` :meth:`K` :meth:`decomposeC`
"""
P0 = np.eye(3, 4)
if pose is None:
pose = self.pose
if retinal:
K = np.diag([self.fu, self.fv, 1])
else:
K = self.K
return K @ P0 @ pose.inv().A
[docs]
@staticmethod
def points2C(P, p):
r"""
Estimate camera matrix from data points
:param P: calibration points in world coordinate frame
:type P: ndarray(3,N)
:param p: calibration points in image plane
:type p: ndarray(2,N)
:return: camera calibration matrix and residual
:rtype: ndarray(3,4), float
Estimate the camera matrix :math:`\mat{C}` determined by least
squares from corresponding world ``P`` and image-plane ``p`` points.
Corresponding points are represented by corresponding columns of ``P``
and ``p``. Also returns the residual which is:
.. math::
\max | \mat{C}\mat{P} - \mat{p} |
Example:
.. runblock:: pycon
>>> from machinevisiontoolbox import CentralCamera, mkcube
>>> P = mkcube(0.2)
>>> camera_unknown = CentralCamera(f=0.015, rho=10e-6, imagesize=[1280, 1024], noise=0.05, seed=0)
>>> T_unknown = SE3.Trans(0.1, 0.2, 1.5) * SE3.RPY(0.1, 0.2, 0.3)
>>> p = camera_unknown.project_point(P, objpose=T_unknown)
>>> C, resid = CentralCamera.points2C(P, p)
>>> C
>>> camera_unknown.C()
>>> resid
:note: This method assumes no lens distortion affecting the image plane
coordinates.
:references:
- Robotics, Vision & Control for Python, Section 13.2.1, P. Corke,
Springer 2023.
:seealso: :meth:`C` :meth:`images2C` :meth:`decomposeC`
"""
z4 = np.zeros((4,))
A = np.empty(shape=(0, 11))
b = np.empty(shape=(0,))
for uv, X in zip(p.T, P.T):
u, v = uv
# fmt: off
row = np.array([
np.r_[ X, 1, z4, -u * X],
np.r_[z4, X, 1, -v * X]
])
# fmt: on
A = np.vstack((A, row))
b = np.r_[b, uv]
# solve Ax = b where c is 11 elements of camera matrix
c, *_ = scipy.linalg.lstsq(A, b)
# compute and print the residual
r = np.max(np.abs((A @ c - b)))
c = np.r_[c, 1] # append a 1
C = c.reshape((3, 4)) # make a 3x4 matrix
return C, r
[docs]
@classmethod
def images2C(self, images, gridshape=(7, 6), squaresize=0.025):
"""
Calibrate camera from checkerboard images
:param images: an iterator that returns :class:`~machinevisiontoolbox.ImageCore.Image` objects
:type images: :class:`~machinevisiontoolbox.Sources.ImageSource`
:param gridshape: number of grid squares in each dimension, defaults to (7,6)
:type gridshape: tuple, optional
:param squaresize: size of the grid squares in units of length, defaults to 0.025
:type squaresize: float, optional
:return: camera calibration matrix, distortion parameters, image frames
:rtype: ndarray(3,4), ndarray(5), list of named tuples
The distortion coefficients are in the order :math:`(k_1, k_2, p_1, p_2, k_3)`
where :math:`k_i` are radial distortion coefficients and :math:`p_i` are
tangential distortion coefficients.
Image frames that were successfully processed are returned as a list of
named tuples ``CalibrationFrame`` with elements:
======= ===================== ===========================================================
element type description
======= ===================== ===========================================================
image :class:`Image` calibration image with overlaid annotation
pose :class:`SE3` instance pose of the camera with respect to the origin of this image
id int sequence number of this image in ``images``
======= ===================== ===========================================================
:note: The units used for ``squaresize`` must match the units used
for defining 3D points in space.
:references:
- Robotics, Vision & Control for Python, Section 13.7, P. Corke,
Springer 2023.
:seealso: :meth:`C` :meth:`points2C` :meth:`decomposeC` :class:`~spatialmath..pose3d.SE3`
"""
criteria = (cv.TERM_CRITERIA_EPS + cv.TERM_CRITERIA_MAX_ITER, 30, 0.001)
# create set of feature points, like (0,0,0), (1,0,0), (2,0,0) ....,(6,5,0)
# these all have Z=0 since they are relative to the calibration target frame
objp = np.zeros((gridshape[0] * gridshape[1], 3), np.float32)
objp[:, :2] = (
np.mgrid[0 : gridshape[0], 0 : gridshape[1]].T.reshape(-1, 2) * squaresize
)
# lists to store object points and image points from all the images
objpoints = [] # 3d point in real world space
imgpoints = [] # 2d points in image plane.
corner_images = []
valid = []
for i, image in enumerate(images):
gray = image.mono().A
# Find the chess board corners
ret, corners = cv.findChessboardCorners(gray, gridshape, None)
# If found, add object points, image points (after refining them)
if ret:
objpoints.append(objp)
corners2 = cv.cornerSubPix(gray, corners, (11, 11), (-1, -1), criteria)
imgpoints.append(corners)
# Draw the corners
image = Image(image, copy=True)
if not image.iscolor:
image = image.colorize()
corner_images.append(
cv.drawChessboardCorners(image.A, gridshape, corners2, ret)
)
valid.append(i)
ret, C, distortion, rvecs, tvecs = cv.calibrateCamera(
objpoints, imgpoints, gray.shape[::-1], None, None
)
CalibrationFrame = namedtuple("CalibrationFrame", "image pose id")
if ret:
frames = []
for rvec, tvec, corner_image, id in zip(rvecs, tvecs, corner_images, valid):
frame = CalibrationFrame(
Image(corner_image, colororder="BGR"),
(SE3(tvec) * SE3.EulerVec(rvec.flatten())).inv(),
id,
)
frames.append(frame)
return C, distortion[0], frames
else:
return None
[docs]
@classmethod
def decomposeC(cls, C):
r"""
Decompose camera calibration matrix
:param C: camera calibration matrix
:type C: ndarray(3,4)
:return: camera model parameters
:rtype: :class:`CentralCamera`
Decompose a :math:`3\times 4` camera calibration matrix ``C`` to
determine feasible intrinsic and extrinsic parameters. The result is a
``CentralCamera`` instance with the following parameters set:
================ ====================================
Parameter Meaning
================ ====================================
``f`` focal length in pixels
``sx``, ``sy`` pixel size where ``sx`` =1
(``u0``, ``v0``) principal point
``pose`` pose of the camera frame wrt world
================ ====================================
Example:
.. runblock:: pycon
>>> from machinevisiontoolbox import CentralCamera
>>> from spatialmath import SE3
>>> camera = CentralCamera(name='camera1')
>>> C = camera.C(SE3(0.1, 0, 0))
>>> CentralCamera.decomposeC(C)
:note: Since only :math:`f s_x` and :math:`f s_y` can be estimated we
set :math:`s_x = 1`.
:references:
- Multiple View Geometry, Hartley&Zisserman, p 163-164
- Robotics, Vision & Control for Python, Section 13.2.3, P. Corke,
Springer 2023.
:seealso: :meth:`C` :meth:`points2C`
"""
def rq(S):
# from vgg_rq.m
# [R,Q] = vgg_rq(S) Just like qr but the other way around.
# If [R,Q] = vgg_rq(X), then R is upper-triangular, Q is orthogonal, and X==R*Q.
# Moreover, if S is a real matrix, then det(Q)>0.
# By awf
S = S.T
Q, U = np.linalg.qr(S[::-1, ::-1])
Q = Q.T
Q = Q[::-1, ::-1]
U = U.T
U = U[::-1, ::-1]
if np.linalg.det(Q) < 0:
U[:, 0] = -U[:, 0]
Q[0, :] = -Q[0, :]
return U, Q
if not C.shape == (3, 4):
raise ValueError("argument is not a 3x4 matrix")
u, s, v = np.linalg.svd(C)
v = v.T
# determine camera position
t = v[:, 3] # last column
t = t / t[3]
t = t[:3]
# determine camera orientation
M = C[:3, :3]
# K, R = rq(M)
K, R = scipy.linalg.rq(M)
# deal with K having negative elements on the diagonal
# make a matrix to fix this, K*C has positive diagonal
C = np.diag(np.sign(np.diag(K)))
# now K*R = (K*C) * (inv(C)*R), so we need to check C is a proper rotation
# matrix. If isn't then the situation is unfixable
if not np.isclose(np.linalg.det(C), 1):
raise RuntimeError("cannot correct signs in the intrinsic matrix")
# all good, let's fix it
K = K @ C
R = C.T @ R
# normalize K so that lower left is 1
K = K / K[2, 2]
# pull out focal length and scale factors
f = K[0, 0]
s = np.r_[1, K[1, 1] / K[0, 0]]
# build an equivalent camera model
return cls(name="invC", f=f, pp=K[:2, 2], rho=s, pose=SE3.Rt(R.T, t))
# https://docs.opencv.org/3.1.0/d9/d0c/group__calib3d.html#gaaae5a7899faa1ffdf268cd9088940248
# ======================= homography =============================== #
[docs]
def H(self, T, n, d):
"""
Compute homography from plane and camera pose
:param T: relative camera motion
:type T: :class:`~spatialmath..pose3d.SE3`
:param n: plane normal with respect to world frame
:type n: array_like(3)
:param d: plane offset from world frame origin
:type d: float
:return: homography matrix
:rtype: ndarray(3,3)
Computes the homography matrix for the camera observing points on a
plane from two viewpoints. The first view is from the current camera
pose (``self.pose``), and the second is after a relative motion
represented by the rigid-body motion ``T``. The plane has normal ``n``
and at distance ``d`` with respect to the world frame.
Example:
.. runblock:: pycon
>>> from machinevisiontoolbox import CentralCamera
>>> from spatialmath import SE3
>>> camera = CentralCamera.Default(name='camera1') # looking along z-axis
>>> plane = [0, 1, 1]
>>> H = camera.H(SE3.Tx(0.2), plane, 5)
>>> H
:seealso: :meth:`points2H` :meth:`decomposeH`
"""
if d < 0:
raise ValueError(d, "plane distance d must be > 0")
n = base.getvector(n)
if n[2] < 0:
raise ValueError(n, "normal must be away from camera (n[2] >= 0)")
# T transform view 1 to view 2
T = SE3(T).inv()
HH = T.R + 1.0 / d * T.t @ n # need to ensure column then row = 3x3
# apply camera intrinsics
HH = self.K @ HH @ np.linalg.inv(self.K)
return HH / HH[2, 2] # normalised
[docs]
@staticmethod
def points2H(p1, p2, method="leastsquares", seed=None, **kwargs):
"""
Estimate homography from corresponding points
:param p1: image plane points from first camera
:type p1: ndarray(2,N)
:param p2: image plane points from second camera
:type p2: ndarray(2,N)
:param method: algorithm: 'leastsquares' [default], 'ransac', 'lmeds', 'prosac'
:type method: str
:param kwargs: optional arguments as required for ransac' and 'lmeds'
methods
:return: homography, residual and optional inliers
:rtype: ndarray(3,3), float, ndarray(N,bool)
Compute a homography from two sets of corresponding image plane points
whose world points lie on a plane.
Example:
.. runblock:: pycon
>>> from machinevisiontoolbox import CentralCamera, mkgrid
>>> from spatialmath import SE3
>>> camera1 = CentralCamera(name="camera 1", f=0.002, imagesize=1000, rho=10e-6, pose=SE3.Tx(-0.1)*SE3.Ry(0.4))
>>> camera2 = CentralCamera(name="camera 2", f=0.002, imagesize=1000, rho=10e-6, pose=SE3.Tx(0.1)*SE3.Ry(-0.4))
>>> T_grid = SE3.Tz(1) * SE3.Rx(0.1) * SE3.Ry(0.2)
>>> P = mkgrid(3, 1.0, pose=T_grid)
>>> p1 = camera1.project_point(P)
>>> p2 = camera2.project_point(P);
>>> H, resid = CentralCamera.points2H(p1, p2)
>>> H
>>> resid
:note: If the method is 'ransac' or 'lmeds' then a boolean array
of inliers is also returned, True means the corresponding input
point pair is an inlier.
:references:
- Robotics, Vision & Control for Python, Section 14.2.4, P. Corke,
Springer 2023.
:seealso: :meth:`H` :meth:`decomposeH`
`opencv.findHomography <https://docs.opencv.org/master/d9/d0c/group__calib3d.html#ga4abc2ece9fab9398f2e560d53c8c9780>`_
"""
points2H_dict = {
"leastsquares": 0,
"ransac": cv.RANSAC,
"lmeds": cv.LMEDS,
"prosac": cv.RHO,
}
if seed is not None:
cv.setRNGSeed(seed)
H, mask = cv.findHomography(
srcPoints=p1.T, dstPoints=p2.T, method=points2H_dict[method], **kwargs
)
mask = mask.ravel().astype(bool)
e = base.homtrans(H, p1[:, mask]) - p2[:, mask]
resid = np.linalg.norm(e)
if method in ("ransac", "lmeds"):
return H, resid, mask
else:
return H, resid
# https://docs.opencv.org/3.1.0/d9/d0c/group__calib3d.html#ga7f60bdff78833d1e3fd6d9d0fd538d92
[docs]
def decomposeH(self, H, K=None):
"""
Decompose homography matrix
:param H: homography matrix
:type H: ndarray(3,3)
:param K: camera intrinsics, defaults to parameters from object
:type K: ndarray(3,3), optional
:return: camera poses, plane normals
:rtype: :class:`~spatialmath..pose3d.SE3`, list of ndarray(3,1)
Decomposes the homography matrix into the camera motion and the normal
to the plane. In practice, there are multiple solutions. The translation
not to scale.
Example:
.. runblock:: pycon
>>> from machinevisiontoolbox import CentralCamera, mkgrid
>>> from spatialmath import SE3
>>> camera1 = CentralCamera(name="camera 1", f=0.002, imagesize=1000, rho=10e-6, pose=SE3.Tx(-0.1)*SE3.Ry(0.4))
>>> camera2 = CentralCamera(name="camera 2", f=0.002, imagesize=1000, rho=10e-6, pose=SE3.Tx(0.1)*SE3.Ry(-0.4))
>>> T_grid = SE3.Tz(1) * SE3.Rx(0.1) * SE3.Ry(0.2)
>>> P = mkgrid(3, 1.0, pose=T_grid)
>>> p1 = camera1.project_point(P)
>>> p2 = camera2.project_point(P);
>>> H, resid = CentralCamera.points2H(p1, p2)
>>> T, normals = camera1.decomposeH(H)
>>> T.printline(orient="camera")
>>> normals
:references:
- Robotics, Vision & Control for Python, Section 14.2.4, P. Corke,
Springer 2023.
:seealso: :meth:`points2H` :meth:`H`
`opencv.decomposeHomographyMat <https://docs.opencv.org/3.4/d9/d0c/group__calib3d.html#ga7f60bdff78833d1e3fd6d9d0fd538d92>`_
"""
retval, rotations, translations, normals = cv.decomposeHomographyMat(H, self.K)
T = SE3.Empty()
for R, t in zip(rotations, translations):
# we normalize the rotation matrix, those returned by openCV can
# not quite proper SO(3) values
pose = SE3.Rt(smbase.trnorm(R), t).inv()
T.append(pose)
return T, normals
# if K is None:
# K = np.identity(3)
# # also have K = self.K
# H = np.linalg.inv(K) @ H @ K
# # normalise so that the second singular value is one
# U, S, V = np.linalg.svd(H, compute_uv=True)
# H = H / S[1]
# # compute the SVD of the symmetric matrix H'*H = VSV'
# U, S, V = np.linalg.svd(np.transpose(H) @ H)
# # ensure V is right-handed
# if np.linalg.det(V) < 0:
# print('det(V) was < 0')
# V = -V
# # get squared singular values
# s0 = S[0]
# s2 = S[2]
# # v0 = V[0:, 0]
# # v1 = V[0:, 1]
# # v2 = V[0:, 2]
# # pure rotation - where all singular values == 1
# if np.abs(s0 - s2) < (100 * np.spacing(1)):
# print('Warning: Homography due to pure rotation')
# if np.linalg.det(H) < 0:
# H = -H
# # sol = namedtuple('T', T, ''
# # TODO finish from invhomog.m
# print('Unfinished')
# return False
# =================== fundamental matrix =============================== #
[docs]
def F(self, other):
"""
Fundamental matrix
:param other: second camera view
:type other: :class:`CentralCamera`, :class:`~spatialmath..pose3d.SE3`
:return: fundamental matrix
:rtype: numpy(3,3)
Compute the fundamental matrix relating two camera views. The
first view is defined by the instance. The second
is defined by:
* another :class:`CentralCamera` instance
* an SE3 pose describing the pose of the second view with respect to
the first, assuming the same camera intrinsic parameters.
Example:
.. runblock:: pycon
>>> from machinevisiontoolbox import CentralCamera
>>> from spatialmath import SE3
>>> camera1 = CentralCamera(name="camera 1", f=0.002, imagesize=1000, rho=10e-6, pose=SE3.Tx(-0.1)*SE3.Ry(0.4))
>>> camera2 = CentralCamera(name="camera 2", f=0.002, imagesize=1000, rho=10e-6, pose=SE3.Tx(0.1)*SE3.Ry(-0.4))
>>> F = camera1.F(camera2)
>>> F
>>> F = camera1.F(SE3.Tx(0.2))
>>> F
:references:
- Y.Ma, J.Kosecka, S.Soatto, S.Sastry, "An invitation to 3D",
Springer, 2003. p.177
- Robotics, Vision & Control for Python, Section 14.2.1, P. Corke,
Springer 2023.
:seealso: :meth:`points2F` :meth:`E`
"""
if isinstance(other, SE3):
E = self.E(other)
K = self.K
return np.linalg.inv(K).T @ E @ np.linalg.inv(K)
elif isinstance(other, CentralCamera):
# use relative pose and camera parameters of
E = self.E(other)
K1 = self.K
K2 = other.K
return np.linalg.inv(K2).T @ E @ np.linalg.inv(K1)
else:
raise ValueError("bad type")
[docs]
@staticmethod
def points2F(p1, p2, method="8p", residual=True, seed=None, **kwargs):
"""
Estimate fundamental matrix from corresponding points
:param p1: image plane points from first camera
:type p1: ndarray(2,N)
:param p2: image plane points from second camera
:type p2: ndarray(2,N)
:param method: algorithm '7p', '8p' [default], 'ransac', 'lmeds'
:type method: str, optional
:param kwargs: optional arguments as required for ransac', 'lmeds'
methods
:return: fundamental matrix and residual
:rtype: ndarray(3,3), float
Computes the fundamental matrix from two sets of corresponding
image-plane points. Corresponding points are given by corresponding
columns of ``p1`` and ``p2``.
Example:
.. runblock:: pycon
>>> from machinevisiontoolbox import CentralCamera, mkgrid
>>> from spatialmath import SE3
>>> camera1 = CentralCamera(name="camera 1", f=0.002, imagesize=1000, rho=10e-6, pose=SE3.Tx(-0.1)*SE3.Ry(0.4))
>>> camera2 = CentralCamera(name="camera 2", f=0.002, imagesize=1000, rho=10e-6, pose=SE3.Tx(0.1)*SE3.Ry(-0.4))
>>> T_grid = SE3.Tz(1) * SE3.Rx(0.1) * SE3.Ry(0.2)
>>> P = mkgrid(3, 1.0, pose=T_grid)
>>> p1 = camera1.project_point(P)
>>> p2 = camera2.project_point(P);
>>> F, resid = CentralCamera.points2F(p1, p2)
>>> F
>>> resid
:seealso: :meth:`F` :meth:`E`
`opencv.findFundamentalMat <https://docs.opencv.org/master/d9/d0c/group__calib3d.html#ga59b0d57f46f8677fb5904294a23d404a>`_
"""
points2F_dict = {
"7p": cv.FM_7POINT,
"8p": cv.FM_8POINT,
"ransac": cv.FM_RANSAC,
"lmeds": cv.FM_LMEDS,
}
if seed is not None:
cv.setRNGSeed(seed)
F, mask = cv.findFundamentalMat(
p1.T, p2.T, method=points2F_dict[method], **kwargs
)
mask = mask.ravel().astype(bool)
# add various return values
retval = [F]
if residual:
e = base.e2h(p2[:, mask]).T @ F @ base.e2h(p1[:, mask])
resid = np.linalg.norm(np.diagonal(e))
retval.append(resid)
if method in ("ransac", "lmeds"):
retval.append(mask)
return retval
# elines = base.e2h(p2).T @ F # homog lines, one per row
# p1h = base.e2h(p1)
# residuals = []
# for i, line in enumerate(elines):
# d = line @ p1h[:, i] / np.sqrt(line[0] ** 2 + line[1] ** 2)
# residuals.append(d)
# resid = np.array(residuals).mean()
[docs]
@staticmethod
def epidist(F, p1, p2):
"""
Epipolar distance
:param F: fundamental matrix
:type F: ndarray(3,3)
:param p1: image plane point or points from first camera
:type p1: ndarray(2) or ndarray(2,N)
:param p2: image plane point or points from second camera
:type p2: ndarray(2) or ndarray(2,M)
:return: distance matrix
:rtype: ndarray(N,M)
Computes the distance of the points ``p2`` from the
epipolar lines induced by points ``p1``. Element [i,j] of the return
value is the istance of point j in camera 2 from the epipolar line
induced by point i in camera 1.
"""
if p1.ndim == 1:
p1 = np.c_[p1]
if p2.ndim == 1:
p2 = np.c_[p2]
D = np.empty((p1.shape[1], p2.shape[1]))
# compute epipolar lines corresponding to p1
l = F @ base.e2h(p1)
for i in range(p1.shape[1]):
for j in range(p2.shape[1]):
D[i, j] = np.abs(
l[0, i] * p2[0, j] + l[1, i] * p2[1, j] + l[2, i]
) / np.sqrt(l[0, i] ** 2 + l[1, i] ** 2)
return D
# ===================== essential matrix =============================== #
[docs]
def E(self, other):
"""
Essential matrix from two camera views
:param other: second camera view, camera pose or fundamental matrix
:type other: :class:`CentralCamera`, :class:`~spatialmath..pose3d.SE3`, ndarray(3,3)
:return: essential matrix
:rtype: ndarray(3,3)
Compute the essential matrix relating two camera views. The first view
is defined by the instance, and second view is specified by:
* a camera instance represented by a :class:`CentralCamera`. Assumes the
cameras have the same intrinsics.
* a relative motion represented by a :class:`~spatialmath..pose3d.SE3`
* a fundamental matrix
:references:
- Y.Ma, J.Kosecka, S.Soatto, S.Sastry, "An invitation to 3D",
Springer, 2003. p.177
:seealso: :meth:`F` :meth:`decomposeE` :meth:`points2E`
"""
if isinstance(other, np.ndarray) and other.shape == (3, 3):
# essential matrix from F matrix and intrinsics
return self.K.T @ other @ self.K
elif isinstance(other, CentralCamera):
# camera relative pose
T21 = other.pose.inv() * self.pose
elif isinstance(other, SE3):
# relative pose given explicitly
T21 = other.inv()
else:
raise ValueError("bad type")
return base.skew(T21.t) @ T21.R
[docs]
def points2E(self, p1, p2, method=None, K=None, **kwargs):
"""
Essential matrix from points
:param P1: image plane points
:type P1: ndarray(2,N)
:param P2: image plane points
:type P2: ndarray(2,N)
:param method: method, can be 'ransac' or 'lmeds'
:type method: str
:param K: camera intrinsic matrix, defaults to that of camera object
:type K: ndarray(3,3), optional
:param kwargs: additional arguments required for 'ransac' or 'lmeds'
options
:return: essential matrix and optional inlier vevtor
:rtype: ndarray(3,3), ndarray(N, bool)
Compute the essential matrix from two sets of corresponding points.
Each set of points is represented by the columns of the array ``p1``
or ``p2``.
Example:
.. runblock:: pycon
>>> from machinevisiontoolbox import CentralCamera, mkgrid
>>> from spatialmath import SE3
>>> camera1 = CentralCamera(name="camera 1", f=0.002, imagesize=1000, rho=10e-6, pose=SE3.Tx(-0.1)*SE3.Ry(0.4))
>>> camera2 = CentralCamera(name="camera 2", f=0.002, imagesize=1000, rho=10e-6, pose=SE3.Tx(0.1)*SE3.Ry(-0.4))
>>> T_grid = SE3.Tz(1) * SE3.Rx(0.1) * SE3.Ry(0.2)
>>> P = mkgrid(3, 1.0, pose=T_grid)
>>> p1 = camera1.project_point(P)
>>> p2 = camera2.project_point(P);
>>> E, inliers = camera1.points2E(p1, p2)
>>> E
>>> inliers
:note: If the method is 'ransac' or 'lmeds' then a boolean array
of inliers is also returned, True means the corresponding input
point pair is an inlier.
:seealso: :meth:`E` :meth:`decomposeE`
`opencv.findEssentialMat <https://docs.opencv.org/master/d9/d0c/group__calib3d.html#gad245d60e64d0c1270dbfd0520847bb87>`_
"""
if K is None:
K = self.K
points2E_dict = {"ransac": cv.RANSAC, "lmeds": cv.LMEDS}
if method is not None:
method = points2E_dict[method]
E, mask = cv.findEssentialMat(
p1.T, p2.T, cameraMatrix=K, method=method, **kwargs
)
if mask is not None:
mask = mask.flatten().astype(bool)
return E, mask
else:
return E
[docs]
def decomposeE(self, E, P=None):
"""
Decompose essential matrix
:param E: essential matrix
:type E: ndarray(3,3)
:param P: world point or feature match object to resolve ambiguity
:type P: array_like(3), :class:`~machinevisiontoolbox.ImagePointFeatures.FeatureMatch`
:return: camera relative pose
:rtype: :class:`~spatialmath..pose3d.SE3`
Determines relative pose from essential matrix. This operation has
multiple solutions which is resolved by passing in:
- a single 3D world point in front of the camera
- a :class:`~machinevisiontoolbox.ImagePointFeatures.FeatureMatch` object
:references:
- Robotics, Vision & Control for Python, Section 14.2.2 P. Corke,
Springer 2023.
:seealso: :meth:`E` :meth:`points2E`
:class:`~machinevisiontoolbox.ImagePointFeatures.FeatureMatch`
`opencv.decomposeEssentialMat <https://docs.opencv.org/master/d9/d0c/group__calib3d.html#ga54a2f5b3f8aeaf6c76d4a31dece85d5d>`_
`opencv.recoverPose <https://docs.opencv.org/master/d9/d0c/group__calib3d.html#gadb7d2dfcc184c1d2f496d8639f4371c0>`_
"""
if isinstance(P, FeatureMatch):
# passed a Match object
match = P
retval, R, t, mask = cv.recoverPose(
E=E,
points1=match.p1.T,
points2=match.p2.T,
cameraMatrix=self.C()[:3, :3],
)
# not explicitly stated, but seems that this returns (R, t) from
# camera to world
return SE3.Rt(R, t).inv()
else:
R1, R2, t = cv.decomposeEssentialMat(E=E)
# not explicitly stated, but seems that this returns (R, t) from
# camera to world
possibles = [(R1, t), (R1, -t), (R2, t), (R2, -t)]
if base.isvector(P, 3):
for Rt in possibles:
pose = SE3.Rt(Rt[0], Rt[1]).inv()
p = self.project_point(P, pose=pose, behind=True)
# check if point is projected behind the camera, indicated
# by nan values
if not np.isnan(p[0]):
# return the first good one
return pose
else:
T = SE3.Empty()
for Rt in possibles:
pose = SE3.Rt(Rt[0], Rt[1]).inv()
T.append(pose)
return T
# ===================== image plane motion ============================= #
[docs]
def visjac_p(self, uv, depth):
r"""
Visual Jacobian for point features
:param p: image plane point or points
:type p: array_like(2), ndarray(2,N)
:param depth: point depth
:type depth: float, array_like(N)
:return: visual Jacobian matrix
:rtype: ndarray(2,6), ndarray(2N,6)
Compute the image Jacobian :math:`\mat{J}` which maps
.. math::
\dvec{p} = \mat{J}(\vec{p}, z) \vec{\nu}
camera spatial velocity :math:`\vec{\nu}` to the image plane velocity
:math:`\dvec{p}` of the point.
If ``p`` describes multiple points then return a stack of these
:math:`2\times 6` matrices, one per point.
Depth is the z-component of the point's coordinate in the camera frame.
If ``depth`` is a scalar then it is the depth for all points.
Example:
.. runblock:: pycon
>>> from machinevisiontoolbox import CentralCamera
>>> from spatialmath import SE3
>>> camera = CentralCamera.Default()
>>> camera.visjac_p((200, 300), 2)
:references:
- A tutorial on Visual Servo Control, Hutchinson, Hager & Corke,
IEEE Trans. R&A, Vol 12(5), Oct, 1996, pp 651-670.
- Robotics, Vision & Control for Python, Section 15.2.1, P. Corke,
Springer 2023.
:seealso: :meth:`flowfield` :meth:`visjac_p_polar` :meth:`visjac_l` :meth:`visjac_e`
"""
uv = base.getmatrix(uv, (2, None))
Z = depth
Z = base.getvector(Z)
if len(Z) == 1:
Z = np.repeat(Z, uv.shape[1])
elif len(Z) != uv.shape[1]:
raise ValueError("Z must be a scalar or have same number of columns as uv")
L = np.empty((0, 6)) # empty matrix
K = self.K
Kinv = np.linalg.inv(K)
for z, p in zip(Z, uv.T): # iterate over each column (point)
# convert to normalized image-plane coordinates
xy = Kinv @ base.e2h(p)
x = xy[0, 0]
y = xy[1, 0]
# 2x6 Jacobian for this point
# fmt: off
Lp = K[:2,:2] @ np.array(
[ [-1/z, 0, x/z, x * y, -(1 + x**2), y],
[ 0, -1/z, y/z, (1 + y**2), -x*y, -x] ])
# fmt: on
# stack them vertically
L = np.vstack([L, Lp])
return L
[docs]
def visjac_p_polar(self, p, Z):
r"""
Visual Jacobian for point features in polar coordinates
:param p: image plane point or points
:type p: array_like(2), ndarray(2,N)
:param depth: point depth
:type depth: float, array_like(N)
:return: visual Jacobian matrix in polar coordinates
:rtype: ndarray(2,6), ndarray(2N,6)
Compute the image Jacobian :math:`\mat{J}` which maps
.. math::
\begin{pmatrix} \dot{\phi} \\ \dot{r} \end{pmatrix} = \mat{J}(\vec{p}, z) \vec{\nu}
camera spatial velocity :math:`\vec{\nu}` to the image plane velocity
of the point expressed in polar coordinate form :math:`(\phi, r)`.
If ``p`` describes multiple points then return a stack of these
:math:`2\times 6` matrices, one per point.
Depth is the z-component of the point's coordinate in the camera frame.
If ``depth`` is a scalar then it is the depth for all points.
Example:
.. runblock:: pycon
>>> from machinevisiontoolbox import CentralCamera
>>> from spatialmath import SE3
>>> camera = CentralCamera.Default()
>>> camera.visjac_p_polar((200, 300), 2)
:references:
- Combining Cartesian and polar coordinates in IBVS.
Corke PI, Spindler F, Chaumette F
IROS 2009, pp 5962–5967
- Robotics, Vision & Control for Python, Section 16.2 P. Corke,
Springer 2023.
:seealso: :meth:`visjac_p` :meth:`visjac_l` :meth:`visjac_e`
"""
J = []
p = smbase.getmatrix(p, (2, None))
f = self.f[0]
if smbase.isscalar(Z):
Z = [Z] * p.shape[1]
for (phi, r), Zk in zip(p.T, Z):
# k = (f**2 + r**2) / f
# k2 = f / (r * Zk)
c = np.cos(phi)
s = np.sin(phi)
r = max(r, 0.05)
Jk = np.array(
[
[-s / r / Zk, c / r / Zk, 0, -c / r, -s / r, 1],
[c / Zk, s / Zk, -r / Zk, -(1 + r**2) * s, (1 + r**2) * c, 0],
]
)
# Jk = np.array([
# [ k2 * sth, -k2 * cth, 0, f / r * cth, f / r * sth , -1],
# [-f / Zk * cth, -f / Zk * sth, r / Zk, k * sth, -k * cth, 0],
# ])
# Jk = np.array([
# [cth/Zk , sth / Zk, -r / Zk, -(1+r**2) * sth, -k * cth, 0],
# [ k2 * sth, -k2 * cth, 0, f / r * cth, f / r * sth , -1]])
J.append(Jk)
return np.vstack(J)
# if 0
# r = rt(1); theta = rt(2);
# % compute the mapping from uv-dot to r-theta dot
# M = 1/r * [r*cos(theta) r*sin(theta); -sin(theta) cos(theta)];
# % convert r-theta form to uv form
# u = r * cos(theta); v = r * sin(theta);
# % compute the Jacobian
# J = M * cam.visjac_p([u; v], Z);
[docs]
def visjac_l(self, lines, plane):
r"""
Visual Jacobian for line features
:param lines: image plane line parameters
:type p: array_like(2), ndarray(2,N)
:param plane: plane containing the line
:type plane: array_like(4)
:return: visual Jacobian matrix for line feature
:rtype: ndarray(2,6), ndarray(2N,6)
Compute the Jacobian which gives the rates of change of the line
parameters in terms of camera spatial velocity.
For image planes lines
.. math:: u \cos \theta + v \sin \theta = \rho
the image Jacobian :math:`\mat{J}` maps
.. math::
\begin{pmatrix} \dot{\theta} \\ \dot{\rho} \end{pmatrix} = \mat{J}(\vec{p}, z) \vec{\nu}
camera spatial velocity :math:`\vec{\nu}` to the image plane velocity
of the line parameters :math:`(\theta, \rho)`.
The world plane containing the line is also required, and is provided
as a vector :math:`(a,b,c,d)` such that
.. math: aX + bY +cZ + d = 0
If ``lines`` describes multiple points then return a stack of these
:math:`2\times 6` matrices, one per point.
Depth is the z-component of the point's coordinate in the camera frame.
If ``depth`` is a scalar then it is the depth for all points.
Example:
.. runblock:: pycon
>>> from machinevisiontoolbox import CentralCamera
>>> from spatialmath import SE3
>>> camera = CentralCamera.Default()
>>> camera.visjac_l((0.2, 500), (0, 0, 1, -3))
:references:
- A New Approach to Visual Servoing in Robotics,
B. Espiau, F. Chaumette, and P. Rives,
IEEE Transactions on Robotics and Automation,
vol. 8, pp. 313-326, June 1992.
- Visual servo control 2: Advanced approaches
Chaumette F, Hutchinson S,
IEEE Robot Autom Mag 14(1):109–118 (2007)
- Robotics, Vision & Control for Python, Section 15.3.1, P. Corke,
Springer 2023.
:seealso: :meth:`visjac_p` :meth:`visjac_p_polar` :meth:`visjac_e`
"""
a, b, c, d = plane
lines = smbase.getmatrix(lines, (2, None))
jac = []
for theta, rho in lines.T:
sth = np.sin(theta)
cth = np.cos(theta)
lam_th = (a * sth - b * cth) / d
lam_rho = (a * rho * cth + b * rho * sth + c) / d
L = np.array(
[
[
lam_th * cth,
lam_th * sth,
-lam_th * rho,
-rho * cth,
-rho * sth,
-1,
],
[
lam_rho * cth,
lam_rho * sth,
-lam_rho * rho,
(1 + rho**2) * sth,
-(1 + rho**2) * cth,
0,
],
]
)
jac.append(L)
return np.vstack(jac)
[docs]
def visjac_e(self, E, plane):
r"""
Visual Jacobian for ellipse features
:param E: image plane ellipse parameters
:type E: array_like(5), ndarray(5,N)
:param plane: plane containing the ellipse
:type plane: array_like(4)
:return: visual Jacobian matrix for ellipse feature
:rtype: ndarray(2,6), ndarray(2N,6)
Compute the Jacobian gives the rates of change of the ellipse parameters
in terms of camera spatial velocity.
For image plane ellipses
.. math:: u^2 + E_0 v^2 -2 E_1 u v + 2 E_2 u + 2 E_3 v + E_4 = 0
the image Jacobian :math:`\mat{J}` maps
.. math::
\begin{pmatrix} \dot{E_0} \\ \vdots \\ \dot{E_4} \end{pmatrix} = \mat{J}(\vec{p}, z) \vec{\nu}
camera spatial velocity :math:`\vec{\nu}` to the velocity
of the ellipse parameters :math:`(E_0 \ldots E_4)`.
The world plane containing the ellipse is also required, and is provided
as a vector :math:`(a,b,c,d)` such that
.. math: aX + bY +cZ + d = 0
Example:
.. runblock:: pycon
>>> from machinevisiontoolbox import CentralCamera
>>> from spatialmath import SE3
>>> camera = CentralCamera.Default()
>>> camera.visjac_e(((0.5, 0, -1000, -500, 374900)), (0, 0, 1, -1)
:references:
- A New Approach to Visual Servoing in Robotics,
B. Espiau, F. Chaumette, and P. Rives,
IEEE Transactions on Robotics and Automation,
vol. 8, pp. 313-326, June 1992.
- Visual servo control 2: Advanced approaches
Chaumette F, Hutchinson S,
IEEE Robot Autom Mag 14(1):109–118 (2007)
- Robotics, Vision & Control for Python, Section 15.3.2, P. Corke,
Springer 2023.
:seealso: :meth:`visjac_p` :meth:`visjac_p_polar` :meth:`visjac_l`
"""
a = -plane[0] / plane[3]
b = -plane[1] / plane[3]
c = -plane[2] / plane[3]
L = np.array(
[
[
2 * b * E[1] - 2 * a * E[0],
2 * E[0] * (b - a * E[1]),
2 * b * E[3] - 2 * a * E[0] * E[2],
2 * E[3],
2 * E[0] * E[2],
-2 * E[1] * (E[0] + 1),
],
[
b - a * E[1],
b * E[1] - a * (2 * E[1] ** 2 - E[0]),
a * (E[3] - 2 * E[1] * E[2]) + b * E[2],
-E[2],
-(2 * E[1] * E[2] - E[3]),
E[0] - 2 * E[1] ** 2 - 1,
],
[
c - a * E[2],
a * (E[3] - 2 * E[1] * E[2]) + c * E[1],
c * E[2] - a * (2 * E[2] ** 2 - E[4]),
-E[1],
1 + 2 * E[2] ** 2 - E[4],
E[3] - 2 * E[1] * E[2],
],
[
E[2] * b + E[1] * c - 2 * a * E[3],
E[3] * b + E[0] * c - 2 * a * E[1] * E[3],
b * E[4] + c * E[3] - 2 * a * E[2] * E[3],
E[4] - E[0],
2 * E[2] * E[3] + E[1],
-2 * E[1] * E[3] - E[2],
],
[
2 * c * E[2] - 2 * a * E[4],
2 * c * E[3] - 2 * a * E[1] * E[4],
2 * c * E[4] - 2 * a * E[2] * E[4],
-2 * E[3],
2 * E[2] * E[4] + 2 * E[2],
-2 * E[1] * E[4],
],
]
)
L = L @ np.diag([0.5, 0.5, 0.5, 1, 1, 1]) # not sure why...
return L
[docs]
def flowfield(self, vel, Z=2):
"""
Display optical flow field
:param vel: camera spatial velocity
:type vel: array_like(6)
:param Z: _description_, defaults to 2
:type Z: scalar, optional
Display the optical flow field using Matplotlib, for a grid of points at
distance ``Z`` for a camera velocity of ``vel``.
Example:
.. runblock:: pycon
>>> from machinevisiontoolbox import CentralCamera
>>> camera = CentralCamera.Default()
>>> camera.flowfield([0, 0, 0, 0, 1, 0])
:seealso: :meth:`visjac_p`
"""
vel = base.getvector(vel, 6)
u = np.arange(0, self.nu, 50)
v = np.arange(0, self.nv, 50)
[U, V] = np.meshgrid(u, v, indexing="ij")
du = np.empty(shape=U.shape)
dv = np.empty(shape=U.shape)
for r in range(U.shape[0]):
for c in range(U.shape[1]):
J = self.visjac_p((U[r, c], V[r, c]), Z)
ud, vd = J @ vel
du[r, c] = ud
dv[r, c] = -vd
self.clf()
ax = self._init_imageplane()
ax.quiver(U, V, du, dv, 0.4, zorder=20)
[docs]
def derivatives(self, x, P):
r"""
Compute projection and derivatives for bundle adjustment
:param x: camera pose as translation and quaternion vector part
:type x: array_like(6)
:param P: 3D world point
:type P: array_like(3)
:return: p, A, B
:rtype: ndarray(2), ndarray(2,6), ndarray(2,3)
For a world point :math:`\vec{x}` compute the image plane projection and the
sensitivity to camera and point change
.. math:: \mat{A} = \frac{\partial \vec{f}(\vec{x})}{\partial \pose}, \mat{B} = \frac{\partial \vec{f}(\vec{x})}{\partial \vec{P}}
where :math:`\vec{f}(\vec{x})` is the perspective projection function.
:seealso: :meth:`project_point`
"""
# compute Jacobians and projection
from machinevisiontoolbox.camera_derivatives import cameraModel
Kp = [self.f[0], self.rhou, self.rhov, self.u0, self.v0]
return cameraModel(*x, *P, *Kp)
[docs]
def estpose(self, P, p, method="iterative", frame="world"):
"""
Estimate object pose
:param P: A set of 3D points defining the object with respect to its own frame
:type P: ndarray(3, N)
:param p: Image plane projection of the object points
:type p: ndarray(2, N)
:param method: pose estimation algorithm, see OpenCV solvePnP, defaults to 'iterative'
:type method: str, optional
:param frame: estimate pose with respect to frame "world" [default] or "camera"
:type frame: str, optional
:return: pose of target frame relative to the world frame
:rtype: :class:`~spatialmath..pose3d.SE3`
Using a set of points defining some object with respect to its own frame {B}, and
a set of image-plane projections, estimate the pose of {B} with respect to the world
or camera frame.
To estimate the camera's pose with respect to the world frame the camera's pose
``self.pose`` is used.
:note:
* All of the OpenCV estimation algorithms are supported.
* Algorithm ``"ippe-square"`` requires exactly four points at the corners of a
square and in the order: (-x, y), (x, y), (x, -y), (-x, -y).
:seealso: :meth:`project_point`
`opencv.solvePnP <https://docs.opencv.org/3.4/d9/d0c/group__calib3d.html#ga549c2075fac14829ff4a58bc931c033d>`_
"""
method_dict = {
"iterative": cv.SOLVEPNP_ITERATIVE,
"epnp": cv.SOLVEPNP_EPNP,
"p3p": cv.SOLVEPNP_P3P,
"ap3p": cv.SOLVEPNP_AP3P,
"ippe": cv.SOLVEPNP_IPPE,
"ippe-square": cv.SOLVEPNP_IPPE_SQUARE,
}
# as per the Note on solvePnP page
# we need to ensure that the image point data is contiguous nx1x2 array
n = p.shape[1]
p = np.ascontiguousarray(p[:2, :].T).reshape((n, 1, 2))
# do the pose estimation
sol = cv.solvePnP(P.T, p, self.K, self._distortion, flags=method_dict[method])
if sol[0]:
# pose of target with respect to camera
pose_C_T = SE3(sol[2]) * SE3.EulerVec(sol[1])
# pose with respect to world frame
if frame == "camera":
return pose_C_T
elif frame == "world":
return self.pose * pose_C_T
else:
raise ValueError(f"bad frame value {frame}")
else:
return None
# ------------------------------------------------------------------------ #
[docs]
class FishEyeCamera(CameraBase):
r"""
Create fisheye camera projection model
.. inheritance-diagram:: machinevisiontoolbox.Camera.FishEyeCamera
:top-classes: machinevisiontoolbox.Camera.Camera
:parts: 1
:param k: scale factor
:type k: float, optional
:param projection: projection model: ``'equiangular'`` [default], ``'sine'``, ``'equisolid'`` or ``'stereographic'``
:type projection: str, optional
:param kwargs: arguments passed to :class:`CameraBase` constructor
A fisheye camera contains a wide angle lens, and the angle of the
incoming ray is mapped to a radius with respect to the principal point.
The mapping from elevation angle :math:`\theta` to image plane radius is
given by:
============= =======================================
Projection :math:`r(\theta)`
============= =======================================
equiangular :math:`r = k \theta`
sine :math:`r = k \sin \theta`
equisolid :math:`r = k \sin \frac{\theta}{2}`
stereographic :math:`r = k \tan \frac{\theta}{2}`
============= =======================================
:note:
- If ``K`` is not specified it is computed such that the circular
imaging region maximally fills the square image plane.
- This camera model assumes central projection, that is, the focal point
is at z=0 and the image plane is at z=f. The image is not inverted.
:references:
- Robotics, Vision & Control for Python, Section 13.3.1, P. Corke, Springer 2023.
:seealso: :class:`CameraBase` :class:`CentralCamera` :class:`CatadioptricCamera`
:class:`SphericalCamera`
"""
[docs]
def __init__(self, k=None, projection="equiangular", **kwargs):
super().__init__(camtype="fisheye", **kwargs)
self.projection = projection
if k is None:
r = np.min((self.imagesize - self.pp) * self.rho)
if self.projection == "equiangular":
if k is None:
k = r / (pi / 2)
rfunc = lambda theta: k * theta
elif self.projection == "sine":
if k is None:
k = r
rfunc = lambda theta: k * np.sin(theta)
elif self.projection == "equisolid":
if k is None:
k = r / sin(pi / 4)
rfunc = lambda theta: k * np.sin(theta / 2)
elif self.projection == "stereographic":
if k is None:
k = r / tan(pi / 4)
rfunc = lambda theta: k * np.tan(theta / 2)
else:
raise ValueError("unknown projection model")
self.k = k
self.rfunc = rfunc
def __str__(self):
s = super().__str__()
s += self.fmt.format("model", self.projection, fmt="{}")
s += self.fmt.format("k", self.k, fmt="{:.4g}")
return s
[docs]
def project_point(self, P, pose=None, objpose=None):
r"""
Project 3D points to image plane
:param P: 3D world point or points
:type P: array_like(3), array_like(3,n)
:param pose: camera pose with respect to the world frame, defaults to
camera's ``pose`` attribute
:type pose: SE:class:`~spatialmath..pose3d.SE3`3, optional
:param objpose: 3D point reference frame, defaults to world frame
:type objpose: :class:`~spatialmath..pose3d.SE3`, optional
:param visibility: test if points are visible, default False
:type visibility: bool
:raises ValueError: [description]
:return: image plane points
:rtype: ndarray(2,n)
Project world points to the fisheye camera image plane.
The elevation angle range is from :math:`-pi/2` (below the mirror) to
maxangle above the horizontal plane. The mapping from elevation angle
:math:`\theta` to image plane radius is given by:
============= =======================================
Projection :math:`r(\theta)`
============= =======================================
equiangular :math:`r = k \theta`
sine :math:`r = k \sin \theta`
equisolid :math:`r = k \sin \frac{\theta}{2}`
stereographic :math:`r = k \tan \frac{\theta}{2}`
============= =======================================
World points are given as a 1D array or the columns of a 2D array of
Euclidean coordinates. The computed image plane coordinates are
Euclidean and given as a 1D array or the corresponding columns of a 2D
array.
If ``pose`` is specified it is used for the camera pose instead of the
attribute ``pose``. The object's attribute is not updated.
The points ``P`` are by default with respect to the world frame, but
they can be transformed by specifying ``objpose``.
:seealso: :meth:`plot_point`
"""
P = base.getmatrix(P, (3, None))
if pose is not None:
T = self.pose.inv()
else:
T = SE3()
if objpose is not None:
T *= objpose
R = np.sqrt(np.sum(P**2, axis=0))
phi = np.arctan2(P[1, :], P[0, :])
theta = np.arccos(P[2, :] / R)
r = self.rfunc(theta)
x = r * np.cos(phi)
y = r * np.sin(phi)
uv = np.array([x / self.rhou + self.u0, y / self.rhov + self.v0])
return self._add_noise_distortion(uv)
# ------------------------------------------------------------------------ #
[docs]
class CatadioptricCamera(CameraBase):
r"""
Create catadioptric camera projection model
.. inheritance-diagram:: machinevisiontoolbox.Camera.CatadioptricCamera
:top-classes: machinevisiontoolbox.Camera.Camera
:parts: 1
:param k: scale factor
:type k: float, optional
:param projection: projection model: ``'equiangular'`` [default], ``'sine'``, ``'equisolid'`` or ``'stereographic'``
:type projection: str, optional
:param kwargs: arguments passed to :class:`CameraBase` constructor
A catadioptric camera comprises a perspective camera pointed at a
convex mirror, typically paraboloidal or conical.
The elevation angle range is from :math:`-\pi/2` (below the mirror) to
maxangle above the horizontal plane. The mapping from elevation angle
:math:`\theta` to image plane radius is given by:
============= =======================================
Projection :math:`r(\theta)`
============= =======================================
equiangular :math:`r = k \theta`
sine :math:`r = k \sin \theta`
equisolid :math:`r = k \sin \frac{\theta}{2}`
stereographic :math:`r = k \tan \frac{\theta}{2}`
============= =======================================
:note:
- If ``K`` is not specified it is computed such that the circular
imaging region maximally fills the image plane.
- This camera model assumes central projection, that is, the focal point
is at :math:`z=0` and the image plane is at :math:`z=f`. The image is not inverted.
:references:
- Robotics, Vision & Control for Python, Section 13.3.2, P. Corke, Springer 2023.
:seealso: :class:`CameraBase` :class:`CentralCamera` :class:`FishEyeCamera`
:class:`SphericalCamera`
"""
[docs]
def __init__(self, k=None, projection="equiangular", maxangle=None, **kwargs):
super().__init__(camtype="catadioptric", **kwargs)
self.projection = projection
if k is None:
r = np.min((self.imagesize - self.pp) * self.rho)
# compute k if not specified, so that hemisphere fits into
# image plane, requires maxangle being set
if self.projection == "equiangular":
if k is None:
if maxangle is not None:
k = r / (pi / 2 + maxangle)
self.maxangle = maxangle
else:
raise ValueError("must specify either k or maxangle")
rfunc = lambda theta: k * theta
elif self.projection == "sine":
if k is None:
k = r
rfunc = lambda theta: k * np.sin(theta)
elif self.projection == "equisolid":
if k is None:
k = r / sin(pi / 4)
rfunc = lambda theta: k * np.sin(theta / 2)
elif self.projection == "stereographic":
if k is None:
k = r / tan(pi / 4)
rfunc = lambda theta: k * np.tan(theta / 2)
else:
raise ValueError("unknown projection model")
self.k = k
self.rfunc = rfunc
def __str__(self):
s = super().__str__()
s += self.fmt.format("model", self.projection, fmt="{}")
s += self.fmt.format("k", self.k, fmt="{:.4g}")
return s
[docs]
def project_point(self, P, pose=None, objpose=None):
"""
Project 3D points to image plane
:param P: 3D world point or points
:type P: array_like(3), array_like(3,n)
:param pose: camera pose with respect to the world frame, defaults to
camera's ``pose`` attribute
:type pose: :class:`~spatialmath..pose3d.SE3`, optional
:param objpose: 3D point reference frame, defaults to world frame
:type objpose: :class:`~spatialmath..pose3d.SE3`, optional
:param visibility: test if points are visible, default False
:type visibility: bool
:raises ValueError: [description]
:return: image plane points
:rtype: ndarray(2,n)
Project world points to the catadioptric camera image plane.
World points are given as a 1D array or the columns of a 2D array of
Euclidean coordinates. The computed image plane coordinates are
Euclidean and given as a 1D array or the corresponding columns of a 2D
array.
If ``pose`` is specified it is used for the camera pose instead of the
attribute ``pose``. The object's attribute is not updated.
The points ``P`` are by default with respect to the world frame, but
they can be transformed by specifying ``objpose``.
:seealso: :meth:`plot_point`
"""
P = base.getmatrix(P, (3, None))
if pose is not None:
T = self.pose.inv()
else:
T = SE3()
if objpose is not None:
T *= objpose
P = T * P # transform points to camera frame
# project to the image plane
R = np.sqrt(np.sum(P**2, axis=0))
phi = np.arctan2(P[1, :], P[0, :])
theta = np.arccos(P[2, :] / R)
r = self.rfunc(theta) # depends on projection model
x = r * np.cos(phi)
y = r * np.sin(phi)
uv = np.array([x / self.rhou + self.u0, y / self.rhov + self.v0])
return self._add_noise_distortion(uv)
# ------------------------------------------------------------------------ #
[docs]
class SphericalCamera(CameraBase):
"""
Create spherical camera projection model
.. inheritance-diagram:: machinevisiontoolbox.Camera.SphericalCamera
:top-classes: machinevisiontoolbox.Camera.Camera
:parts: 1
:param kwargs: arguments passed to :class:`CameraBase` constructor
The spherical camera is an idealization with a complete field of view
that can be used to generalize all camera projection models.
:references:
- Robotics, Vision & Control for Python, Section 13.3.3, P. Corke, Springer 2023.
:seealso: :class:`CameraBase` :class:`CentralCamera` :class:`CatadioptricCamera`
:class:`FishEyeCamera`
"""
[docs]
def __init__(self, **kwargs):
# invoke the superclass constructor
super().__init__(
camtype="spherical",
limits=[-pi, pi, 0, pi],
labels=["Longitude φ (rad)", "Colatitude θ (rad)"],
**kwargs,
)
# return field-of-view angle for x and y direction (rad)
[docs]
def fov(self):
"""
Camera field-of-view angles
:return: field of view angles in radians
:rtype: ndarray(2)
Computes the field of view angles (2x1) in radians for the camera
horizontal and vertical directions.
"""
return [2 * pi, 2 * pi]
[docs]
def project_point(self, P, pose=None, objpose=None):
r"""
Project 3D points to image plane
:param P: 3D world point or points
:type P: array_like(3), array_like(3,n)
:param pose: camera pose with respect to the world frame, defaults to
camera's ``pose`` attribute
:type pose: :class:`~spatialmath..pose3d.SE3`, optional
:param objpose: 3D point reference frame, defaults to world frame
:type objpose: :class:`~spatialmath..pose3d.SE3`, optional
:return: image plane points
:rtype: ndarray(2,n)
Project world points to the spherical camera image plane.
World points are given as a 1D array or the columns of a 2D array of
Euclidean coordinates. The computed image plane coordinates are
in polar form :math:`(\phi, \theta)` (longitude, colatitude),
and given as a 1D array or the corresponding columns of a 2D
array.
If ``pose`` is specified it is used for the camera pose instead of the
attribute ``pose``. The object's attribute is not updated.
The points ``P`` are by default with respect to the world frame, but
they can be transformed by specifying ``objpose``.
:seealso: :meth:`plot_point`
"""
P = base.getmatrix(P, (3, None))
if pose is None:
pose = self.pose
pose = pose.inv()
if objpose is not None:
pose *= objpose
P = pose * P # transform points to camera frame
R = np.linalg.norm(P, axis=0)
x = P[0, :] / R
y = P[1, :] / R
z = P[2, :] / R
phi = np.arctan2(y, x)
theta = np.arccos(z)
return np.array([phi, theta])
[docs]
def visjac_p(self, p, depth=None):
r"""
Visual Jacobian for point features
:param p: image plane points
:type p: array_like(2) or ndarray(2,N)
:param depth: point depth, defaults to None
:type depth: float or array_like(N), optional
:return: visual Jacobian
:rtype: ndarray(2,6) or ndarray(2N,6)
Compute the image Jacobian :math:`\mat{J}` which maps
.. math::
\dvec{p} = \mat{J}(\vec{p}, z) \vec{\nu}
camera spatial velocity :math:`\vec{\nu}` to the image plane velocity
:math:`\dvec{p}` of the point where :math:`\vec{p}=(\phi, \theta)`
If ``p`` describes multiple points then return a stack of these
:math:`2\times 6` matrices, one per point.
Depth is the z-component of the point's coordinate in the camera frame.
If ``depth`` is a scalar then it is the depth for all points.
"""
J = []
if smbase.isscalar(depth):
depth = [depth] * p.shape[1]
for (phi, theta), R in zip(p.T, depth):
sp = np.sin(phi)
cp = np.cos(phi)
st = np.sin(theta)
ct = np.cos(theta)
Jk = np.array(
[
[sp / R / st, -cp / R / st, 0, cp * ct / st, sp * ct / st, -1],
[-cp * ct / R, -sp * ct / R, st / R, sp, -cp, 0],
]
)
J.append(Jk)
return np.vstack(J)
[docs]
def plot(self, frame=False, **kwargs):
smbase.plot_sphere(
radius=1,
filled=True,
color="lightyellow",
alpha=0.3,
resolution=20,
centre=self.pose.t,
)
self.pose.plot(style="arrow", axislabel=True, length=1.4)
# class CentralCamera_polar(Camera):
# """
# Central projection camera class
# """
# def __init__(self,
# f=1,
# distortion=None,
# **kwargs):
# """
# Create central camera projection model in polar coordinates
# :param f: focal length, defaults to 8*1e-3
# :type f: float, optional
# :param distortion: camera distortion parameters, defaults to None
# :type distortion: array_like(5), optional
# :seealso: :meth:`distort`
# """
# super().__init__(type='perspective', **kwargs)
# # TODO some of this logic to f and pp setters
# self.f = f
# self._distortion = distortion
# @classmethod
# def Default(cls, **kwargs):
# default = {
# 'f': 0.008,
# 'rho': 10e-6,
# 'imagesize': 1000,
# 'pp': (500,500),
# 'name': 'default perspective camera'
# }
# return CentralCamera_polar(**{**default, **kwargs})
# def __str__(self):
# s = super().__str__()
# s += self.fmt.format('principal pt', self.pp)
# s += self.fmt.format('focal length', self.f)
# return s
# def project_point(self, P, pose=None, objpose=None, **kwargs):
# r"""
# Project 3D points to image plane
# :param P: 3D points to project into camera image plane
# :type P: array_like(3), array_like(3,n)
# :param pose: camera pose with respect to the world frame, defaults to
# camera's ``pose`` attribute
# :type pose: SE3, optional
# :param objpose: 3D point reference frame, defaults to world frame
# :type objpose: SE3, optional
# :param visibility: test if points are visible, default False
# :type visibility: bool
# :param retinal: transform to retinal coordinates, default False
# :type retinal: bool, optional
# :return: image plane points
# :rtype: ndarray(2,n)
# Project a 3D point to the image plane
# .. math::
# \hvec{p} = \mat{C} \hvec{P}
# where :math:`\mat{C}` is the camera calibration matrix and :math:`\hvec{p}` and :math:`\hvec{P}`
# are the image plane and world frame coordinates respectively.
# Example:
# .. runblock:: pycon
# >>> from machinevisiontoolbox import CentralCamera
# >>> camera = CentralCamera()
# >>> camera.project_point((0.3, 0.4, 2))
# If ``pose`` is specified it is used for the camera frame pose, otherwise
# the attribute ``pose``. The object's ``pose`` attribute is not updated
# if ``pose`` is specified.
# A single point can be specified as a 3-vector, multiple points as an
# array with three rows and one column (x, y, z) per point.
# The points ``P`` are by default with respect to the world frame, but
# they can be transformed by specifying ``objpose``.
# If world points are behind the camera, the image plane points are set to
# NaN.
# if ``visibility`` is True then each projected point is checked to ensure
# it lies in the bounds of the image plane. In this case there are two
# return values: the image plane coordinates and an array of booleans
# indicating if the corresponding point is visible.
# """
# if pose is None:
# pose = self.pose
# C = self.C(pose, retinal=retinal)
# if isinstance(P, np.ndarray):
# if P.ndim == 1:
# P = P.reshape((-1, 1)) # make it a column
# else:
# P = base.getvector(P, out='col')
# # make it homogeneous if not already
# if P.shape[0] == 3:
# P = base.e2h(P)
# # project 3D points
# if objpose is not None:
# P = objpose.A @ P
# x = C @ P
# if behind:
# x[2, x[2, :] < 0] = np.nan # points behind the camera are set to NaN
# x = base.h2e(x)
# # add Gaussian noise and distortion
# x = self.add_noise_distortion(x)
# # do visibility check if required
# if visibility:
# visible = ~np.isnan(x[0,:]) \
# & (x[0, :] >= 0) \
# & (x[1, :] >= 0) \
# & (x[0, :] < self.nu) \
# & (x[1, :] < self.nv)
# return x, visible
# else:
# return x
# def plot_point(self, Pp
# ax = _newplot(self, fig, ax)
# if self._image is not None:
# # if camera has an image, display said image
# idisp(self._image,
# fig=fig,
# ax=ax,
# title=self._name,
# drawonly=True)
# else:
# if self.limits is None:
# ax.set_xlim(0, self.nu)
# ax.set_ylim(0, self.nv)
# else:
# ax.set_xlim(self.limits[0], self.limits[1])
# ax.set_ylim(self.limits[2], self.limits[3])
# ax.autoscale(False)
# ax.set_aspect('equal')
# ax.invert_yaxis()
# ax.grid(True)
# if self.labels is None:
# ax.set_xlabel('u (pixels)')
# ax.set_ylabel('v (pixels)')
# else:
# ax.set_xlabel(self.labels[0])
# ax.set_ylabel(self.labels[1])
# ax.set_title(self.name)
# ax.set_facecolor('lightyellow')
# ax.figure.canvas.set_window_title('Machine Vision Toolbox for Python')
# # TODO figure out axes ticks, etc
# return ax # likely this return is not necessary
if __name__ == "__main__":
from spatialmath import UnitQuaternion
# im1 = Image.Read("eiffel2-1.png", grey=True)
# camera = CentralCamera();
# camera.disp(im1);
# cam = CentralCamera(f=0.08)
# print(cam)
# P = [0.1, 0.2, 3]
# print(cam.project_point(P))
cam = CentralCamera(f=0.08, imagesize=1000, rho=10e-6)
print(cam)
cam.project_point([1, 2, 3])
# P = np.array([[0, 10], [0, 10], [10, 10]])
# p, visible = cam.project_point(P, visibility=True)
# visible
# P = [0.1, 0.2, 3]
# print(cam.project_point(P))
# T1 = SE3(-0.1, 0, 0) * SE3.Ry(0.4);
# camera1 = CentralCamera(name="camera 1", f=0.002, imagesize=1000, rho=10e-6, pose=T1)
# # print(camera1)
# camera1.decomposeH(np.eye(3,3))
# L = Line3.TwoPoints([0, 0, 1], [1, 1, 1])
# camera = CentralCamera.Default();
# l = camera.project_line(L)
# camera.plot_line3(L)
# x = np.r_[cam.pose.t, UnitQuaternion(cam.pose).vec3]
# print(x)
# p, JA, JB = cam.derivatives(x, P)
# print(p)
# print(cam.project_point(P))
# print(JA)
# print(JB)
# smbase.plotvol3(2)
# cam.plot_camera(scale=0.5, shape='camera', T=SE3.Ry(np.pi/2))
# plt.show(block=True)
# print(cam)
# # cam.pose = SE3([0.1, 0.2, 0.3])
# print(cam.pose)
# # fig, ax = c.plot_camera(frustum=True)
# # plt.show()
# np.set_printoptions(linewidth=120, formatter={'float': lambda x: f"{x:8.4g}" if abs(x) > 1e-10 else f"{0:8.4g}"})
# print(cam.project([1,2,3]))
# print(cam.visjac_p((300,300), 1))
# cam.flowfield([0,0,0, 0,0,1])
# # fundamental matrix
# # create +8 world points (20 in this case)
# nx, ny = (4, 5)
# depth = 3
# x = np.linspace(-1, 1, nx)
# y = np.linspace(-1, 1, ny)
# X, Y = np.meshgrid(x, y)
# Z = depth * np.ones(X.shape)
# P = np.dstack((X, Y, Z))
# PC = np.ravel(P, order='C')
# PW = np.reshape(PC, (3, nx * ny), order='F')
# # create projections from pose 1:
# print(c.T)
# p1 = c.project(PW) # p1 wrt c's T
# print(p1)
# c.plot(PW)
# # define pose 2:
# T2 = SE3([0.4, 0.2, 0.3]) # just pure x-translation
# p2 = c.project(PW, T2)
# print(p2)
# c.plot(p2)
# # convert p1, p2 into lists of points?
# p1 = np.float32(np.transpose(p1))
# p2 = np.float32(np.transpose(p2))
# F = c.FfromPoints(p1,
# p2,
# method='8p',
# ransacThresh=3,
# confidence=0.99,
# maxiters=10)
# # to check F:
# p1h = e2h(p1.T)
# p2h = e2h(p2.T)
# pfp = [p2h[:, i].T @ F @ p1h[:, i] for i in range(p1h.shape[1])]
# # [print(pfpi) for pfpi in pfp]
# for pfpi in pfp:
# print(pfpi)
# # should be all close to zero, which they are!
# # essential matrix from points:
# E = c.EfromPoints(p1, p2, c.C)
# # TODO verify E
# import code
# code.interact(local=dict(globals(), **locals()))