Source code for machinevisiontoolbox.ImageIO

#!/usr/bin/env python

from collections import namedtuple
import matplotlib.pyplot as plt
import numpy as np
import scipy as sp
from scipy import interpolate
import cv2 as cv
from pathlib import Path
import os.path
from spatialmath.base import argcheck, getvector
from machinevisiontoolbox.base import (
    iread,
    iwrite,
    colorname,
    int_image,
    float_image,
    idisp,
)

import os
import cv2 as cv
import zipfile
import numpy as np
import fnmatch
from numpy.core.numeric import _rollaxis_dispatcher

from machinevisiontoolbox.base import mvtb_path_to_datafile, iread, convert
from numpy.lib.arraysetops import isin


[docs] class ImageIOMixin: # ======================= image i/io ================================== #
[docs] @classmethod def Read(cls, filename, alpha=False, rgb=True, **kwargs): """ Read image from file :param filename: image file name :type filename: str :param alpha: include alpha plane if present, defaults to False :type alpha: bool, optional :param rgb: force color image to be in RGB order, defaults to True :type rgb: bool, optional :param kwargs: options applied to image frames, see :func:`~machinevisiontoolbox.base.imageio.convert` :raises ValueError: file not found :return: image from file :rtype: :class:`Image` Load monochrome or color image from file, many common formats are supported. A number of transformations can be applied to the image loaded from the file before it is returned. Example: .. runblock:: pycon >>> from machinevisiontoolbox import Image >>> Image.Read('street.png') >>> Image.Read('flowers1.png') >>> Image.Read('flowers1.png', grey=True) >>> Image.Read('flowers1.png', dtype='float16') >>> Image.Read('flowers1.png', reduce=4) >>> Image.Read('flowers1.png', gamma='sRGB') # linear tristimulus values :note: If the path is not absolute it is first searched for relative to the current directory, and if not found, it is searched for in the ``images`` folder of the ```mvtb_data`` package <https://github.com/petercorke/machinevision-toolbox-python/tree/master/mvtb-data>`_. :seealso: :func:`~machinevisiontoolbox.base.imageio.iread` :func:`~machinevisiontoolbox.base.imageio.convert` `cv2.imread <https://docs.opencv.org/master/d4/da8/group__imgcodecs.html#ga288b8b3da0892bd651fce07b3bbd3a56>`_ """ if not isinstance(filename, (str, Path)): raise ValueError("expecting a string or path") # read the image data = iread(filename, rgb=rgb, **kwargs) # result is a tuple(image, filename) or a list of tuples colororder = None if isinstance(data, tuple): # singleton image, make it a list image, name = data if not alpha and image.ndim == 3 and image.shape[2] == 4: image = image[:, :, :3] if image.ndim > 2: colororder = "RGB" if rgb else "BGR" return cls( image, name=name, colororder=colororder ) # OpenCV file read order) elif isinstance(data, list): raise ValueError("wildcard read not support, use FileCollection")
[docs] def disp(self, title=None, **kwargs): """ Display image :param title: named of window, defaults to image ``name`` :type title: bool :param kwargs: options, see :func:`~machinevisiontoolbox.base.imageio.idisp` Display an image using either Matplotlib (default) or OpenCV. Example: .. runblock:: pycon >>> from machinevisiontoolbox import Image >>> img = Image.Read('flowers1.png') >>> img.disp() .. plot:: from machinevisiontoolbox import Image Image.Read('flowers1.png').disp() :seealso: :func:`~machinevisiontoolbox.base.imageio.idisp` """ if title is False: title = None elif title is None and self.name is not None: _, title = os.path.split(self.name) if self.domain is not None: # left right top bottom kwargs["extent"] = [ self.domain[0][0], self.domain[0][-1], self.domain[1][-1], self.domain[1][0], ] return idisp( self.A, title=title, colororder="RGB" if self.isrgb else "BGR", **kwargs )
[docs] def write(self, filename, dtype="uint8", **kwargs): """ Write image to file :param filename: filename to write to :type filename: str :param dtype: data type to convert to, before writing :type dtype: str :param kwargs: options for :func:`~machinevisiontoolbox.base.iwrite` Write image data to a file. The file format is taken from the extension of the filename. Example: .. runblock:: pycon >>> from machinevisiontoolbox import Image >>> img = Image.Read('flowers1.png') >>> img.write('flowers.jpg') :seealso: :func:`~machinevisiontoolbox.base.iwrite` `cv2.imwrite <https://docs.opencv.org/master/d4/da8/group__imgcodecs.html#gabbc7ef1aa2edfaa87772f1202d67e0ce>`_ """ # cv.imwrite can only save 8-bit single channel or 3-channel BGR images # with several specific exceptions # https://docs.opencv.org/4.4.0/d4/da8/group__imgcodecs.html # #gabbc7ef1aa2edfaa87772f1202d67e0ce # TODO imwrite has many quality/type flags ret = iwrite(self.image.astype(dtype), filename, **kwargs) return ret
[docs] def metadata(self, key=None): """ Get image EXIF metadata :param key: metadata key :type key: str, optional :return: image metadata :rtype: dict, int, float, str Get image metadata from EXIF headers. Example: .. runblock:: pycon >>> from machinevisiontoolbox import Image >>> img = Image.Read('church.jpg') >>> meta = img.metadata() # get all metadata as a dict >>> len(meta) >>> meta >>> meta['FocalLength'] >>> img.metadata('FocalLength') # get specific metadata item :note: Metadata items will be converted, where possible, to int or float values. """ try: import PIL from PIL.ExifTags import TAGS except ImportError: print("Pillow is required to read image file metadata\npip install pillow") image = PIL.Image.open(self.name) exif = {} # iterate over the EXIF tags meta = image._getexif() if meta is None: return # no metadata for tag, value in meta.items(): if tag in TAGS: # map tag number to tag name exif[TAGS[tag]] = value if key is None: return exif else: val = exif[key] if isinstance(val, str): # attempt to turn string into int or float try: return int(val) except ValueError: pass try: return float(val) except ValueError: pass return val if isinstance(val, int): return val elif isinstance(val, tuple) and len(val) == 2: # old versions of PIL return (numerator, denominator) return val[0] / val[1] else: # float values are actually type PIL.TiffImagePlugin.IFDRational val = float(val) return val
[docs] def showpixels( self, textcolors=["yellow", "blue"], fmt=None, ax=None, windowsize=0, **kwargs ): """ Display image with pixel values :param textcolors: text color, defaults to ['yellow', 'blue'] :type textcolors: list or str, optional :param fmt: format string for displaying pixel values, defaults to None :type fmt: str, optional :param ax: Matplotlb axes to draw into, defaults to None :type ax: axes, optional :param windowsize: half side length of superimposed moving window, defaults to 0 :type windowsize: int, optional :return: a moving window :rtype: ``Window`` instance Display a monochrome image with the pixel values overlaid. This is suitable for small images, of order 10x10, used for pedagogical purposes. For example it can be used to animate the operation of sliding window operations like convolution or morphology. ``textcolors`` can be: - a colorname string, in which case all pixel values are displayed in that color - "grey", in which case the pixel values are displayed in grey that is signficantly different from the pixel value - a 2-element tuple or list. The first color in ``textcolors`` is used for pixels below 50% intensity and the second color for those above 50%. .. plot:: from machinevisiontoolbox import Image img = Image.Random(10) img.showpixels(textcolor="grey) .. plot:: from machinevisiontoolbox import Image img = Image.Random(10) img.showpixels(textcolor="yellow") .. plot:: from machinevisiontoolbox import Image img = Image.Random(10) img.showpixels(textcolor=["yellow", "blue"]) If ``windowsize`` is given then a translucent colored window is superimposed and a ``Window`` instance returned. This allows the window position, color and opacity to be changed. Example: .. runblock:: pycon >>> from machinevisiontoolbox import Image >>> img = Image.Random(10) >>> window = img.showpixels(windowsize=1) # with 3x3 window >>> window.move(2,3) # position window at (2,3) >>> window.move(4,5, color='blue', alpha=0.7) .. plot:: from machinevisiontoolbox import Image img = Image.Random(10) img.showpixels(windowsize=1) .. plot:: from machinevisiontoolbox import Image img = Image.Random(10) window = img.showpixels(windowsize=1) window.move(2,3) :seealso: :meth:`print` """ if ax is None: ax = plt.gca() if self.isint: fmt = "{:d}" halfway = self.maxval / 2 elif self.isfloat: fmt = "{:.2f}" halfway = 0.5 elif self.isbool: fmt = "{:d}" halfway = 0.5 else: raise ValueError("unsupported image type") image = self.image for v in range(self.height): for u in range(self.width): if isinstance(textcolors, (list, tuple)): if image[v, u] < halfway: color = textcolors[0] else: color = textcolors[1] elif textcolors == "grey": if image[v, u] < halfway: color = image[v, u] + 0.4 * np.r_[1, 1, 1] else: color = image[v, u] - 0.4 * np.r_[1, 1, 1] elif isinstance(textcolors, str): color = textcolors # same color for all pixels ax.text( u, v, fmt.format(image[v, u]), horizontalalignment="center", verticalalignment="center", color=color, **kwargs, ) ax.imshow(image, cmap="gray") ax.set_xlabel("u (pixels)") ax.set_ylabel("v (pixels)") plt.draw() class Window: def __init__(self, image, h=1, wincolor="red", alpha=0.6, ax=None): self.h = h self.color = wincolor self.alpha = alpha self.image = image w = 2 * h + 1 patch = plt.Rectangle((0, 0), w, w, color=color, alpha=alpha) if ax is None: ax = plt.gca() ax.add_patch(patch) self.patch = patch def move(self, u, v, color=None, alpha=0.5): if color is not None: self.color = color self.patch.set_color(color) if alpha is not None: self.alpha = alpha self.patch.set_alpha(alpha) self.patch.set_x(u - self.h - 0.5) self.patch.set_y(v - self.h - 0.5) return self.image[ v - self.h : v + self.h + 1, u - self.h : u + self.h + 1 ] if windowsize > 0: return Window(self, h=windowsize, ax=ax, **kwargs)
# def ascvtype(self): # if np.issubdtype(self.image.dtype, np.floating): # return self.image.astype(np.float32) # else: # return self.image.astype(np.uint8)
[docs] def anaglyph(self, right, colors="rc", disp=0): """ Convert stereo images to an anaglyph image :param right: right image :type right: Image instance :param colors: lens colors (left, right), defaults to 'rc' :type colors: str, optional :param disp: disparity, defaults to 0 :type disp: int, optional :raises ValueErrror: images are not the same size :return: anaglyph image :rtype: :class:`Image` Returns an anaglyph image which combines the two images of a stereo pair by coding them in two different colors. By default the left image is red, and the right image is cyan. ``colors`` describes the lens color coding as a string with 2 letters, the first for left, the second for right, and each is one of: ==== ======== code color ==== ======== 'r' red 'g' green 'b' green 'c' cyan 'm' magenta ==== ======== If ``disp`` is positive the disparity is increased by shifting the ``right`` image to the right. If negative disparity is reduced by shifting the ``right`` image to the left. These adjustments are achieved by trimming the images. Use this option to make the images more natural/comfortable to view, useful if the images were captured with a stereo baseline significantly different to the human eye separation (typically 65mm). Example: .. runblock:: pycon >>> from machinevisiontoolbox import Image >>> left = Image.Read("rocks2-l.png", reduce=2) >>> right = Image.Read("rocks2-r.png", reduce=2) >>> left.anaglyph(right).disp() .. plot:: from machinevisiontoolbox import Image left = Image.Read("rocks2-l.png", reduce=2) right = Image.Read("rocks2-r.png", reduce=2) left.anaglyph(right).disp() :reference: - Robotics, Vision & Control for Python, Section 14.4, P. Corke, Springer 2023. :seealso: :meth:`stdisp` :meth:`Overlay` """ if self.size != right.size: raise ValueError("images must be same size") width, height = self.size # ensure the images are greyscale left = self.mono() right = right.mono() if disp > 0: left = left.trim(right=disp) right = right.trim(left=disp) elif disp < 0: disp = -disp left = left.trim(left=disp) right = right.trim(right=disp) colordict = { "r": (1, 0, 0), "g": (0, 1, 0), "b": (0, 0, 1), "c": (0, 1, 1), "m": (1, 0, 1), "o": (1, 1, 0), } return left.colorize(colordict[colors[0]]) + right.colorize( colordict[colors[1]] )
[docs] def stdisp(self, right): """ Interactive display of stereo image pair :param right: right image :type right: :class:`Image` The left and right images are displayed, stacked horizontally. Clicking in the left-hand image sets a crosshair cursor in the right-hand image. Clicking the corresponding point in the right-hand image will display the disparity at the top of the right-hand image. Example:: >>> from machinevisiontoolbox import Image >>> left = Image.Read("rocks2-l.png", reduce=2) >>> right = Image.Read("rocks2-r.png", reduce=2) >>> left.stdisp(right) .. plot:: from machinevisiontoolbox import Image left = Image.Read("rocks2-l.png", reduce=2) right = Image.Read("rocks2-r.png", reduce=2) left.stdisp(right) :note: The images are assumed to be epipolar aligned. :reference: - Robotics, Vision & Control for Python, Section 14.4, P. Corke, Springer 2023. :seealso: :meth:`anaglyph` """ class Cursor: """ A cross hair cursor. """ def __init__(self, ax, ax2): self.ax = ax self.ax2 = ax2 self.horizontal_line = ax.axhline(color="k", lw=0.8) self.horizontal_line2 = ax2.axhline(color="k", lw=0.8) self.vertical_line = ax.axvline(color="k", lw=0.8) self.vertical_line2 = ax2.axvline(color="k", lw=0.8) self.vertical_line3 = ax2.axvline(color="k", lw=0.8, ls="--") self.leftclicked = False self.x_left = None # text location in axes coordinates self.text = self.ax2.text( 0.05, 0.95, "", transform=ax2.transAxes, backgroundcolor="w" ) def set_cross_hair_visible(self, visible): need_redraw = self.horizontal_line.get_visible() != visible self.horizontal_line.set_visible(visible) self.horizontal_line2.set_visible(visible) self.vertical_line.set_visible(visible) self.vertical_line2.set_visible(visible) self.vertical_line3.set_visible(visible) self.text.set_visible(visible) return need_redraw def on_mouse_move(self, event): if event.inaxes == self.ax2 and self.leftclicked: x, y = event.xdata, event.ydata # update the line positions self.vertical_line3.set_xdata(x) self.text.set_text("d={:.2f}".format(self.x_left - x)) self.ax2.figure.canvas.draw() # if event.inaxes: # need_redraw = self.set_cross_hair_visible(False) # if need_redraw: # self.ax.figure.canvas.draw() # else: # self.set_cross_hair_visible(True) # x, y = event.xdata, event.ydata # # update the line positions # self.horizontal_line.set_ydata(y) # self.vertical_line.set_xdata(x) # # self.text.set_text('x=%1.2f, y=%1.2f' % (x, y)) # self.ax.figure.canvas.draw() def on_click(self, event): # if not event.inaxes: # need_redraw = self.set_cross_hair_visible(False) # if need_redraw: # self.ax.figure.canvas.draw() # else: if event.inaxes == self.ax: self.set_cross_hair_visible(True) x, y = event.xdata, event.ydata # update the line positions self.horizontal_line.set_ydata(y) self.vertical_line.set_xdata(x) self.horizontal_line2.set_ydata(y) self.vertical_line2.set_xdata(x) self.ax.figure.canvas.draw() self.leftclicked = True self.x_left = x fig, (ax1, ax2) = plt.subplots(ncols=2, sharey=True) self.disp(ax=ax1, grid=True) right.disp(ax=ax2, grid=True) cursor = Cursor(ax1, ax2) fig.canvas.mpl_connect("motion_notify_event", cursor.on_mouse_move) fig.canvas.mpl_connect("button_press_event", cursor.on_click) plt.show(block=True)
# --------------------------------------------------------------------------- # if __name__ == "__main__": import pathlib import os.path # from machinevisiontoolbox import VideoCamera # import time # camera = VideoCamera(1) # time.sleep(10) # for i in range(10): # image = camera.grab() # time.sleep(0.1) # camera.release() # image.disp() # from machinevisiontoolbox import * from machinevisiontoolbox import Image church = Image.Read("shark2.png") print(church.metadata()) church.disp(block=True) # exec(open(pathlib.Path(__file__).parent.parent.absolute() / "tests" / "test_processing.py").read()) # pylint: disable=exec-used