Source code for conex.helpers.transforms.masks

import math
import torch
import torchvision.transforms.functional as TF

from itertools import product


[docs]class GridEraseMask:
    """
    A Transformer that Grids input and removes only one cell.
    Adding a new dimension in position for total number of cells.
    Inputs should have channel at first index.

    Args:
        m (int): The grid row size.
        n (int): The grid column size.
        random (bool): If true, shuffles the order of the masks.
        gap (tuple(int)): left, right, up, bottom gaps for the cell.
    """

    def __init__(self, m, n, random=False, gap=(0, 0, 0, 0)):
        self.m = m
        self.n = n
        self.random = random
        self.gap = gap

    def __call__(self, img):
        _, h, w = img.shape
        w_grid = math.ceil(w / self.n)
        h_grid = math.ceil(h / self.m)
        gap_left, gap_right, gap_top, gap_bottom = self.gap

        result = []
        location = torch.ones(
            self.m * self.n, self.m, self.n, dtype=torch.bool, device=img.device
        )
        for index, ij in enumerate(product(range(self.m), range(self.n))):
            i, j = ij
            h_cor = i * h_grid + gap_left
            dh = min(h_cor, 0) 
            w_cor = j * w_grid + gap_top
            dw = min(w_cor, 0)
            result.append(
                TF.erase(
                    img,
                    max(h_cor, 0),
                    max(w_cor, 0),
                    h_grid - gap_bottom - gap_top + dh,
                    w_grid - gap_right - gap_left + dw,
                    v=0,
                )
            )
            location[index, ij[0], ij[1]] = False

        result = torch.stack(result)
        if self.random:
            indices = torch.randperm(result.size(0), device=result.device)
            location = location[indices]
            result = result[indices]
        return result, location


[docs]class GridKeepMask:
    """
    A Transformer that Grids input and removes alls but only one cell.
    Adding a new dimension in position for total number of cells.
    Inputs should have channel at first index.

    Args:
        m (int): The grid row size.
        n (int): The grid column size.
        random (bool): If true, shuffles the order of the masks.
        gap (tuple(int)): left, right, up, bottom gaps for the cell.
    """

    def __init__(self, m, n, random=False, gap=(0, 0, 0, 0)):
        self.m = m
        self.n = n
        self.random = random
        self.gap = gap

    def __call__(self, img):
        _, h, w = img.shape
        w_grid = math.ceil(w / self.n)
        h_grid = math.ceil(h / self.m)
        gap_left, gap_right, gap_top, gap_bottom = self.gap

        result = []
        location = torch.zeros(
            self.m * self.n, self.m, self.n, dtype=torch.bool, device=img.device
        )
        for index, ij in enumerate(product(range(self.m), range(self.n))):
            i, j = ij
            bg = torch.zeros_like(img)
            bg[
                :,
                max(i * h_grid + gap_left, 0) : min(
                    (i + 1) * h_grid - gap_right, img.size(1)
                ),
                max(j * w_grid + gap_top, 0) : min(
                    (j + 1) * w_grid - gap_bottom, img.size(2)
                ),
            ] = img[
                :,
                max(i * h_grid + gap_left, 0) : min(
                    (i + 1) * h_grid - gap_right, img.size(1)
                ),
                max(j * w_grid + gap_top, 0) : min(
                    (j + 1) * w_grid - gap_bottom, img.size(2)
                ),
            ]
            result.append(bg)
            location[index, ij[0], ij[1]] = True

        result = torch.stack(result)
        if self.random:
            indices = torch.randperm(result.size(0), device=result.device)
            location = location[indices]
            result = result[indices]
        return result, location


[docs]class GridCropMask:
    """
    A Transformer that Grids input and crops to one cell.
    Adding a new dimension in position for total number of cells.
    Inputs should have channel at first index.

    Args:
        m (int): The grid row size.
        n (int): The grid column size.
        random (bool): If true, shuffles the order of the masks.
        gap (tuple(int)): left, right, up, bottom gaps for the cell.
    """

    def __init__(self, m, n, random=False, gap=(0, 0, 0, 0)):
        self.m = m
        self.n = n
        self.random = random
        self.gap = gap

    def __call__(self, img):
        _, h, w = img.shape
        w_grid = math.ceil(w / self.n)
        h_grid = math.ceil(h / self.m)
        gap_left, gap_right, gap_top, gap_bottom = self.gap

        result = []
        location = torch.zeros(
            self.m * self.n, self.m, self.n, dtype=torch.bool, device=img.device
        )
        for index, ij in enumerate(product(range(self.m), range(self.n))):
            i, j = ij
            result.append(
                TF.crop(
                    img,
                    i * h_grid + gap_left,
                    j * w_grid + gap_top,
                    h_grid - gap_bottom - gap_top,
                    w_grid - gap_right - gap_left,
                )
            )
            location[index, ij[0], ij[1]] = True

        result = torch.stack(result)
        if self.random:
            indices = torch.randperm(result.size(0), device=result.device)
            location = location[indices]
            result = result[indices]
        return result, location