# image_pyramid.py

import numpy

import utils


class ImagePyramid:
    """
    A stack of progressively smaller copies of a binary matrix (and,
    optionally, of a matching matrix of hues), used to view the data at
    several zoom levels.

    The zoom level is an index into that stack: 0 is the original data
    (100%), each positive level halves both dimensions (zoomed out), and
    negative levels zoom in past 100% by duplicating pixels of the original
    data.
    """
    _ZOOMED_IN_LEVELS = 3  # Number of times you can zoom in beyond 100%

    def __init__(self, matrix: numpy.ndarray, hues: "numpy.ndarray | None",
                 sidelength: int):
        """
        Build every zoomed-out level of `matrix` (and of `hues`, if given).

        matrix: 2-D array whose pixels are combined with `&`, `|` and
            logical-not, so presumably boolean -- confirm with the caller.
        hues: None, or a 2-D array sliced exactly like `matrix` (so it is
            presumably the same shape -- confirm with the caller).
        sidelength: how large a sub-image we will return in get_submatrix.
            Levels keep being added while the largest dimension of the
            newest level is at least this big.

        Raises ValueError if sidelength is not positive: an empty matrix
        would still satisfy the loop condition, so we would never finish.
        """
        if sidelength <= 0:
            raise ValueError(
                "sidelength must be positive, got {!r}".format(sidelength))

        self._sidelength = sidelength
        self._pyramid = [matrix]  # `matrix` at different zoom levels
        self._hue_pyramid = None if hues is None else [hues]

        # Zoom out and make the matrix smaller and smaller
        while max(matrix.shape) >= sidelength:
            # Combine 2x2 squares of pixels to make the next level. Round
            # each dimension down to an even size so that all four
            # quadrants have the same shape.
            n_rows, n_cols = ((extent // 2) * 2 for extent in matrix.shape)
            top_left, top_right, bottom_left, bottom_right = (
                self._quadrants(matrix, n_rows, n_cols))
            # TODO: Is there a standard way of resizing a binary image that
            # keeps lines crisp while removing salt-and-pepper noise?

            # We want the following outcomes when combining a 2x2 square
            # into a single pixel:
            #   - If none of the 4 pixels is set, we should not be set.
            #   - If 1 of the 4 pixels is set, we're set a quarter of the
            #     time.
            #   - If 2 of the 4 pixels are set, we're set half the time.
            #   - It's impossible to have 3 of the 4 pixels set.
            #   - If all 4 pixels are set, this one should be set, too.
            # To discuss the times when half the pixels are set:
            #   - If the two that are set are on the main diagonal, we
            #     should be set. It's good to make diagonals easy to see.
            #   - If the two that are set are off the main diagonal, we
            #     should not be set.
            #   - If the two that are set are adjacent to each other, we
            #     should be set half the time.
            # To discuss times when 1 pixel is set:
            #   - If the 1 pixel is off the diagonal, it might be part of a
            #     large diagonal line shifted 1 pixel off of our diagonal.
            #     Half of these should be set.
            #   - If the 1 pixel is on the diagonal, we should not be set
            #     (so that we're set a quarter of the time overall).
            # To satisfy all these conditions, we should be set either if
            # both pixels on the main diagonal are set, or if the top-right
            # pixel is set while the bottom-left one is not.
            matrix = ((top_left & bottom_right) |
                      (top_right & numpy.logical_not(bottom_left)))
            self._pyramid.append(matrix)

            if hues is not None:
                # Do the same thing with the hues, except use the most
                # extreme value. To get the hues to look right (most
                # problematic is red), we inverted them so low hues
                # indicate longer runs of duplicated code than high ones.
                # So, use the minimum instead of the maximum.
                hue_quads = self._quadrants(hues, n_rows, n_cols)
                hues = numpy.minimum(
                    numpy.minimum(hue_quads[0], hue_quads[1]),
                    numpy.minimum(hue_quads[2], hue_quads[3]))
                self._hue_pyramid.append(hues)

        # self._zoom_level is the index into self._pyramid to get the
        # current image.
        self._zoom_level = 0  # Start at 100%
        self._max_zoom_level = len(self._pyramid) - 1

    @staticmethod
    def _quadrants(array, n_rows, n_cols):
        """
        Split the top-left n_rows-by-n_cols part of `array` into the four
        interleaved sub-grids of its 2x2 squares, in the order
        [top-left, top-right, bottom-left, bottom-right].
        """
        return [array[row:n_rows:2, col:n_cols:2]
                for row in (0, 1) for col in (0, 1)]

    def get_submatrix(self, top_left_x: int, top_left_y: int):
        """
        Given the top left corner of a window (in pixels of the current zoom
        level), return a tuple (image, x, y).

        `image` is whatever utils.to_hsv_matrix builds from the relevant
        region (described by the original author as an HSV image with 3
        channels). It covers one sidelength of margin on every side of the
        window, so it is up to 3 times taller and wider than the window and
        the window sits in its center; it is smaller wherever that region
        runs past the edge of the data.

        `x` and `y` are the coordinates, at the current zoom level, of the
        top left corner of `image`.
        """
        zoom_level = self._zoom_level
        # `scale` is how many times each pixel must be doubled: 0 unless
        # we're zoomed in beyond 100%.
        scale = max(0, -zoom_level)
        level = max(0, zoom_level)
        current_data = self._pyramid[level]
        n_rows, n_cols = current_data.shape
        # Size of the data as displayed at the current zoom level.
        n_rows <<= scale
        n_cols <<= scale

        margin = self._sidelength
        min_x = max(0, top_left_x - margin)
        min_y = max(0, top_left_y - margin)
        # Never let an upper bound drop below its lower bound: a negative
        # bound would make the slices below wrap around to the far edge of
        # the data instead of coming back empty.
        max_x = max(min_x, min(n_cols, top_left_x + 2 * margin))
        max_y = max(min_y, min(n_rows, top_left_y + 2 * margin))

        if scale:
            # We're zoomed in more than 100%. Scale all the coordinates to
            # the actual data size. To make roundoff errors harder to
            # notice, make the truncated edges 1 pixel wider before
            # expanding. Better to be too big than too small.
            min_x >>= scale
            min_y >>= scale
            max_x = (max_x >> scale) + 1
            max_y = (max_y >> scale) + 1

        submatrix = current_data[min_y:max_y, min_x:max_x]
        if self._hue_pyramid is None:
            subhues = None
        else:
            subhues = self._hue_pyramid[level][min_y:max_y, min_x:max_x]
        image = utils.to_hsv_matrix(submatrix, subhues)

        if not scale:
            # No need to do anything special: just return the relevant data
            return image, min_x, min_y

        # Duplicate every pixel into a (2**scale)-by-(2**scale) square so
        # the data grows to the right size. The result is always uint8.
        factor = 1 << scale
        image = numpy.asarray(image).astype(numpy.uint8, copy=False)
        image = numpy.repeat(image, factor, axis=0)
        image = numpy.repeat(image, factor, axis=1)

        return image, min_x << scale, min_y << scale

    def zoom(self, amount: int) -> bool:
        """
        Change the zoom level by `amount`: positive values zoom out (towards
        the smaller levels of the pyramid), negative values zoom in. The
        result is clamped between -_ZOOMED_IN_LEVELS and the most
        zoomed-out level that was built.

        Returns whether we successfully changed zoom levels.
        """
        orig_zoom_level = self._zoom_level
        # Note that tkinter doesn't spawn extra threads, so this doesn't have
        # race conditions.
        requested = orig_zoom_level + amount
        self._zoom_level = max(-self._ZOOMED_IN_LEVELS,
                               min(requested, self._max_zoom_level))
        return self._zoom_level != orig_zoom_level

    def get_zoom_level(self) -> int:
        """
        Return the current zoom level: 0 is 100%, positive is zoomed out,
        negative is zoomed in.
        """
        return self._zoom_level