Collage_generator/_insertion.py

import PIL.Image as Img
import numpy as np
from tqdm.notebook import tqdm
from PIL import ImageFilter
import tables
import time
import gc
"""
all the insert/append function for collage generator
_canvas_append takes the inserting operation, the rest are finding add_point logic
"""

class _insertion():
    def _canvas_append(self,
                       canvas: np.ndarray,
                       add_point: np.ndarray,
                       img: np.ndarray,
                       mask: np.ndarray = None,
                       mask_label: int = None,
                       mode = "label",
                       format = "pixel"):
        """
        the actual working part, add a image to a canvas
        Args:
            canvas: np.ndarray, 3-channel canvas
            add_point: tuple of int, the topleft point of the image to be added
            img: np.ndarray, 3-channel, the vignette to be added
            mask: np.ndarray(if it's there), 1-channel/4-channels, the mask with the canvas
            mask_label: int/2d np.ndarray/4 channels np.ndarray, the value of this label onto the mask
            mode: str, "label" or "pattern", how the mask be overwritten,
                if "label", it will use the int mask_label
                if "pattern", it will copy the np.ndarray passed to mask_label
            format: str, "pixel" or "COCO", how the mask will be updates by new vignettes
                    in "pixel", each individual mask will be saved on the same dimension
                    if "COCO", each individual mask will be saved by a different color on a 3-channel mask
        Return:
            canvas: np.ndarray of 3 channels, the canvas with img added.
            mask: if format is "pixel" np.ndarray of 1 channel, the mask with img's label added.
                  if format is "COCO", np.ndarray of 4-channels, the mask with img's label added.
        """
        assert format in ["pixel", "COCO"]
        # if there's no mask (preview/background)
        if type(mask) != np.ndarray:
            # add img to canvas, if there's any overlap, skip it
            np.add(canvas[add_point[0]:add_point[0]+img.shape[0], add_point[1]:add_point[1]+img.shape[1]],
                  img,
                  where = (canvas[add_point[0]:add_point[0]+img.shape[0], add_point[1]:add_point[1]+img.shape[1]] == 0),
                  out = canvas[add_point[0]:add_point[0]+img.shape[0], add_point[1]:add_point[1]+img.shape[1]],
                  casting = "unsafe")
            # return canvas
            return canvas

        #if there's a mask, from the logic of the functions below,
        #we are going to direcly add these value to a 0-filled canvas and mask
        else:
            if format == "pixel":
                # add image to canvas
                np.add(canvas[add_point[0]:add_point[0]+img.shape[0], add_point[1]:add_point[1]+img.shape[1]],
                       img,
                       out = canvas[add_point[0]:add_point[0]+img.shape[0], add_point[1]:add_point[1]+img.shape[1]],
                       casting = "unsafe")
                # add label to mask
                if mode == "label":
                    # if in label mode, we are adding this label int value to all nonzero space
                    np.add(mask[add_point[0]:add_point[0]+img.shape[0], add_point[1]:add_point[1]+img.shape[1]],
                           mask_label*np.any(img, axis = 2),
                           out = mask[add_point[0]:add_point[0]+img.shape[0], add_point[1]:add_point[1]+img.shape[1]],
                           casting = "unsafe")
                else:
                    #else we are adding a pattern, copy the while pattern
                    np.add(mask[add_point[0]:add_point[0]+img.shape[0], add_point[1]:add_point[1]+img.shape[1]],
                           mask_label,
                           out = mask[add_point[0]:add_point[0]+img.shape[0], add_point[1]:add_point[1]+img.shape[1]],
                           casting = "unsafe")
                    return canvas, mask
            # if we are building a COCO mode
            if format == "COCO":
                if mode == "label":
                    # generate a new color for this object
                    _new_color, self.existed_color = self._generate_new_color(self.existed_color)
                    self.color_dict[str(tuple(_new_color.tolist()))] = mask_label
                    # we have COCO format use as following, first layer will work as the pixel mask,
                    # and the rest will following, the first layer will be removed when converted to COCO
                    if mask.ndim == 2:
                        # if the mask only have one layer, it must be the start mask
                        # add 3 new layers as the RGB recording
                        mask = np.stack((mask, np.zeros_like(mask),np.zeros_like(mask),np.zeros_like(mask)), axis = -1)
                    # add image to canvas, add different label to different channel of the mask
                    np.add(canvas[add_point[0]:add_point[0]+img.shape[0], add_point[1]:add_point[1]+img.shape[1]],
                           img,
                           out = canvas[add_point[0]:add_point[0]+img.shape[0], add_point[1]:add_point[1]+img.shape[1]],
                           casting="unsafe")
                    np.add(mask[add_point[0]:add_point[0]+img.shape[0], add_point[1]:add_point[1]+img.shape[1],0],
                           mask_label*np.any(img, axis = 2),
                           out = mask[add_point[0]:add_point[0]+img.shape[0], add_point[1]:add_point[1]+img.shape[1],0],
                           casting="unsafe")
                    np.add(mask[add_point[0]:add_point[0]+img.shape[0], add_point[1]:add_point[1]+img.shape[1],1:4],
                           np.any(img, axis = 2, keepdims = True)*_new_color,
                           mask[add_point[0]:add_point[0]+img.shape[0], add_point[1]:add_point[1]+img.shape[1],1:4],
                           casting="unsafe")
                    return canvas, mask
                else:
                    if mask.ndim == 2:
                        mask = np.stack((mask, np.zeros_like(mask),np.zeros_like(mask),np.zeros_like(mask)), axis = -1)
                    np.add(canvas[add_point[0]:add_point[0]+img.shape[0], add_point[1]:add_point[1]+img.shape[1]],
                           img,
                           out = canvas[add_point[0]:add_point[0]+img.shape[0], add_point[1]:add_point[1]+img.shape[1]],
                           casting="unsafe")
                    np.add(mask[add_point[0]:add_point[0]+img.shape[0], add_point[1]:add_point[1]+img.shape[1]],
                           mask_label,
                           out = mask[add_point[0]:add_point[0]+img.shape[0], add_point[1]:add_point[1]+img.shape[1]],
                           casting="unsafe")
                    return canvas, mask

    def _init_insert(self,
                     img: np.ndarray,
                     canvas: np.ndarray,
                     mask: np.ndarray,
                     label: int,
                     mode = "pattern",
                     format = "pixel"):
        """
        find a random legal position in canvas, append img to canvas and mask
        Args:
            img: np.ndarray of 3 channels, the vignette to be added
            canvas: np.ndarray of 3 channels, the canvas
            mask: 2d/4-channel np.ndarray, the mask
            label: the label to be added
            mode: str, "label" or "pattern", see mode in _canvas_append()
            format: str, see format in _canvas_append()
        Return:
            canvas: np.ndarray of 3 channels, the canvas with img added.
            mask: np.ndarray of 1 channel, the mask with img's label added.
        """
        _outer_bound = (canvas.shape[0] - img.shape[0], canvas.shape[1] - img.shape[1])
        # select an initial add_point
        _add_point = np.array((np.random.randint(low = self._scanning_constant,
                                                 high = _outer_bound[0] - self._scanning_constant),
                               np.random.randint(low = self._scanning_constant,
                                                 high = _outer_bound[1] - self._scanning_constant)))
        # create a binary mask of the img
        _img_mask = np.any(img, axis = 2)

        # directly use the _add_point
        canvas, mask = self._canvas_append(canvas = canvas,
                                           add_point = _add_point,
                                           img = img,
                                           mask = mask,
                                           mask_label = label,
                                           mode = mode,
                                           format = format)
        return canvas, mask

    def _secondary_insert(self,
                          img: np.ndarray,
                          canvas: np.ndarray,
                          mask: np.ndarray,
                          label: int,
                          patience: int,
                          mode = "label",
                          format = "pixel"):
        """
        find a random non-overlapping position in canvas, append img to canvas and mask
        Args:
            img: np.ndarray of 3 channels, the vignette to be added
            canvas: np.ndarray of 3 channels, the canvas
            mask: 2d/4-channel np.ndarray, the mask
            label: the label to be added
            patience: int, the retry time for finding non-overlapping position
            mode: str, "label" or "pattern", see mode in _canvas_append()
            format: str, see format in _canvas_append()
        Return:
            canvas: np.ndarray of 3 channels, the canvas with img added,
                if the tries in {patience} times succssfully added the img onto canvas,
                otherwise the original canvas is returned
            mask: np.ndarray of 2d or 4 channels, the mask with img added,
                if the tries in {patience} times succssfully added the img onto canvas,
                otherwise the original mask if returned
        """
        _outer_bound = (canvas.shape[0] - img.shape[0], canvas.shape[1] - img.shape[1])
        # select an initial add_point
        _add_point = np.array((np.random.randint(
                                 low = self._scanning_constant,
                                 high = _outer_bound[0] - self._scanning_constant),
                               np.random.randint(
                                 low = self._scanning_constant,
                                 high = _outer_bound[1] - self._scanning_constant)
                                ))

        # create a binary mask of the img
        _img_mask = np.any(img, axis = 2)

        for retry in range(patience):
            # for each time make a small move
            _add_point = _add_point + np.random.randint(
                                        low = -1*self._scanning_constant,
                                        high = self._scanning_constant,
                                        size = 2)
            # make sure the new value is legal
            _add_point = np.clip(a = _add_point,
                            a_min = (0,0),
                            a_max = _outer_bound)
            # check if there's any overlap
            # in pixel format check the mask directly
            if format == "pixel":
                _check_zone = mask[_add_point[0]:_add_point[0]+_img_mask.shape[0],
                                   _add_point[1]:_add_point[1]+_img_mask.shape[1]]
            # in COCO format check the first layer of mask
            else:
                _check_zone = mask[_add_point[0]:_add_point[0]+_img_mask.shape[0],
                                   _add_point[1]:_add_point[1]+_img_mask.shape[1],
                                   0]
            # if so
            if np.any(np.multiply(_check_zone,_img_mask)) == True:
                #retry for a new point
                continue
            # otherwise add the img to canvas and mask and stop retry
            else:
                canvas, mask = self._canvas_append(canvas = canvas,
                                                add_point = _add_point,
                                                img = img,
                                                mask = mask,
                                                mask_label = label,
                                                mode = mode,
                                                format = format)
                break
        gc.collect()
        return canvas, mask

    def _try_insert(self,
                    img: np.ndarray,
                    canvas: np.ndarray,
                    mask: np.ndarray,
                    label: int,
                    patience: int,
                    mode = "label",
                    format = "pixel"):
        """
        try to insert img into canvas and mask using a escape-overlapping algorithm
        if the initial point is overlapping, try to "escape" the overlapping
        and append at the first position successfuly escape

        if the initial point is not overlapping, try to find a overlapping point
        and append at the last non-overlapping point before this one

        Args:
            img: np.ndarray of 3 channels, the vignette to be added
            canvas: np.ndarray of 3 channels, the canvas
            mask: 2d/4-channel np.ndarray, the mask
            label: the label to be added
            patience: int, the retry time for finding non-overlapping position
            mode: str, "label" or "pattern", see mode in _canvas_append()
            format: str, see format in _canvas_append()
        Return:
            canvas: np.ndarray of 3 channels, the canvas with img added,
                if the tries in {patience} times succssfully added the img onto canvas,
                otherwise the original canvas is returned
            mask: np.ndarray of 2d or 4 channels, the mask with img added,
                if the tries in {patience} times succssfully added the img onto canvas,
                otherwise the original mask if returned
        """
        _outer_bound = (canvas.shape[0] - img.shape[0], canvas.shape[1] - img.shape[1])
        # select an initial add_point
        _add_point = np.array((np.random.randint(low = self._scanning_constant,
                                       high = _outer_bound[0] - self._scanning_constant),
                    np.random.randint(low = self._scanning_constant,
                                      high = _outer_bound[1] - self._scanning_constant)))
        # create a binary mask of the img
        _img_mask = np.any(img, axis = 2)

        # check if there's any overlap
        if format == "pixel":
            _check_zone = mask[_add_point[0]:_add_point[0]+_img_mask.shape[0],
                               _add_point[1]:_add_point[1]+_img_mask.shape[1]]
        # in COCO format check the first layer of mask
        else:
            _check_zone = mask[_add_point[0]:_add_point[0]+_img_mask.shape[0],
                               _add_point[1]:_add_point[1]+_img_mask.shape[1],
                               0]
        # if we start with an overlap, we need to escape from overlap, otherwise we need to find a overlap
        _init_overlapped = np.any(np.multiply(_check_zone,_img_mask))
        # if we are in a finding mode and need to record the last add point
        _last_add_point = _add_point

        # in the patience time
        for retry in range(patience):
            # for each time make a small move
            _add_point = _add_point + np.random.randint(low = -1*self._scanning_constant,
                                                  high = self._scanning_constant,
                                                  size = 2)
            # make sure the new value is legal
            _add_point = np.clip(a = _add_point,
                                 a_min = (0,0),
                                 a_max = _outer_bound)
            # check if there's any overlap
            if format == "pixel":
                _check_zone = mask[_add_point[0]:_add_point[0]+_img_mask.shape[0],
                                   _add_point[1]:_add_point[1]+_img_mask.shape[1]]
            # in COCO format check the first layer of mask
            else:
                _check_zone = mask[_add_point[0]:_add_point[0]+_img_mask.shape[0],
                                   _add_point[1]:_add_point[1]+_img_mask.shape[1],
                                   0]
            # check if there's overlap
            _overlap = np.any(np.multiply(_check_zone,_img_mask))
            # if we had a overlap in "escaping"
            if (_overlap == True) and (_init_overlapped == True):
                #retry for a new point
                continue
            # if we met the first non-overlap while escaping
            elif (_overlap == False) and (_init_overlapped == True):
                #stop the finding
                canvas, mask = self._canvas_append(canvas = canvas,
                                                add_point = _add_point,
                                                img = img,
                                                mask = mask,
                                                mask_label = label,
                                                mode = mode,
                                                format = format)
                break
            # if we are finding but not found
            elif (_overlap == False) and (_init_overlapped == False):
                #record last add_point and retry for a new point
                _last_add_point = _add_point
                continue
            # or we are finding a overlap and found it, we need to use the last
            else:
                canvas, mask = self._canvas_append(canvas = canvas,
                                                 add_point = _last_add_point,
                                                 img = img,
                                                 mask = mask,
                                                 mask_label = label,
                                                 mode = mode,
                                                 format = format)
                break
        gc.collect()
        return canvas, mask