modules/grid_sample_Cinf.py

import math

import torch
import torch.nn.functional as F
from icecream import ic

SIGN = -1


# sign = -1 matches grid sample
def gaussian_partial(squaredbit, std):
    dist = torch.exp(-0.5 * squaredbit) / (std * math.sqrt(2 * math.pi))
    return dist / (dist.sum() + 1e-8)


@torch.jit.script
def gaussian_fn(M: int, std: float, device: torch.device):
    n = torch.arange(0, M, device=device) - (M - 1.0) / 2.0
    sig2 = 2 * std * std
    w = torch.exp(-(n**2) / sig2)
    return w


@torch.jit.script
def gkern(kernlen: int, std: float, device: torch.device):
    """Returns a 2D Gaussian kernel array."""
    gkern1d = gaussian_fn(kernlen, std=std, device=device)
    gkern2d = torch.outer(gkern1d, gkern1d)
    return gkern2d


def combine_kernels1d(kernel1, kernel2):
    if kernel2 is None:
        return kernel1
    if kernel1 is None:
        return kernel2

    s1 = kernel1.shape[-1]
    s2 = kernel2.shape[-1]
    sf = s1 + s2 - 1
    p = (sf - s1) // 2 + 1
    kernel1 = kernel1.reshape(1, 1, s1)
    kernel2 = kernel2.reshape(1, 1, s2)
    kernelf = -F.conv1d(kernel1, kernel2, stride=1, padding=p)
    # place kernel1 at center
    return kernelf


def combine_kernels2d(kernel1, kernel2):
    if kernel2 is None:
        return kernel1
    if kernel1 is None:
        return kernel2

    s1 = kernel1.shape[-1]
    s2 = kernel2.shape[-1]
    sf = s1 + s2 - 1
    p = (sf - s1) // 2 + 1
    kernel1 = kernel1.reshape(1, 1, s1, s1)
    kernel2 = kernel2.reshape(1, 1, s2, s2)
    # place kernel1 at center
    kernelf = -F.conv2d(kernel1, kernel2, stride=1, padding=p)
    return kernelf


def combine_kernels3d(kernel1, kernel2):
    if kernel2 is None:
        return kernel1
    if kernel1 is None:
        return kernel2

    s1 = kernel1.shape[-1]
    s2 = kernel2.shape[-1]
    sf = s1 + s2 - 1
    p = (sf - s1) // 2 + 1
    kernel1 = kernel1.reshape(1, 1, s1, s1, s1)
    kernel2 = kernel2.reshape(1, 1, s2, s2, s2)
    # place kernel1 at center
    kernelf = -F.conv3d(kernel1, kernel2, stride=1, padding=p)
    return kernelf


class GridSampler2D(torch.autograd.Function):
    @staticmethod
    def forward(
        ctx,
        input,
        grid,
        mode="bilinear",
        padding_mode="zeros",
        align_corners=None,
        smoothing=0,
    ):
        # plane.shape: 1, n_comp, grid_size, grid_size
        # grid: (1, N, 1, 2)
        ctx.save_for_backward(input, grid)
        ctx.mode = mode
        ctx.padding_mode = padding_mode
        ctx.align_corners = align_corners
        ctx.smoothing = smoothing
        return F.grid_sample(
            input,
            grid,
            mode=mode,
            padding_mode=padding_mode,
            align_corners=align_corners,
        )

    @staticmethod
    def backward(ctx, grad_output):
        input, grid = ctx.saved_tensors
        device = input.device
        grad_grid = None
        is_3d = len(grid.shape) == 5
        Gsize = max(input.shape)
        if ctx.needs_input_grad[1]:
            f_blur = torch.tensor([0.0, 1.0, 0.0], device=grid.device)
            f_edge = SIGN * torch.tensor([1, 0.0, -1], device=grid.device) / 2
            # f_blur = torch.tensor([0.5, 0.5], device=grid.device)
            # f_edge = SIGN * torch.tensor([1, -1], device=grid.device) / 2
            l = len(f_blur)
            # smoothing = ctx.smoothing * Gsize / 128
            smoothing = 1
            kernlen = 3  # 2*int(smoothing)+1
            if is_3d:
                dy_filter = (
                    f_blur[None, :, None]
                    * f_edge[:, None, None]
                    * f_blur[None, None, :]
                ).reshape(1, 1, l, l, l)
                dx_filter = dy_filter.permute(0, 1, 3, 2, 4)
                dz_filter = dy_filter.permute(0, 1, 2, 4, 3)

                g1 = gaussian_fn(kernlen, std=smoothing + 1e-8)
                smooth_kern = g1[:, None, None] * g1[None, :, None] * g1[None, None, :]
                smooth_kern /= smooth_kern.sum()
                sm_dx_filter = combine_kernels3d(smooth_kern, dx_filter)
                sm_dy_filter = combine_kernels3d(smooth_kern, dy_filter)
                sm_dz_filter = combine_kernels3d(smooth_kern, dz_filter)
                s = sm_dx_filter.shape[-1]

                pinput = input.permute(1, 0, 2, 3, 4)
                dx_input = F.conv3d(
                    pinput,
                    sm_dx_filter.reshape(1, 1, s, s, s),
                    stride=1,
                    padding=s // 2,
                )
                dy_input = F.conv3d(
                    pinput,
                    sm_dy_filter.reshape(1, 1, s, s, s),
                    stride=1,
                    padding=s // 2,
                )
                dz_input = F.conv3d(
                    pinput,
                    sm_dz_filter.reshape(1, 1, s, s, s),
                    stride=1,
                    padding=s // 2,
                )

                dx = F.grid_sample(
                    dx_input.permute(1, 0, 2, 3, 4),
                    grid,
                    mode=ctx.mode,
                    padding_mode=ctx.padding_mode,
                    align_corners=ctx.align_corners,
                )
                dy = F.grid_sample(
                    dy_input.permute(1, 0, 2, 3, 4),
                    grid,
                    mode=ctx.mode,
                    padding_mode=ctx.padding_mode,
                    align_corners=ctx.align_corners,
                )
                dz = F.grid_sample(
                    dz_input.permute(1, 0, 2, 3, 4),
                    grid,
                    mode=ctx.mode,
                    padding_mode=ctx.padding_mode,
                    align_corners=ctx.align_corners,
                )

                grad_grid = torch.stack(
                    [
                        (grad_output * dx).sum(dim=1),
                        (grad_output * dy).sum(dim=1),
                        (grad_output * dz).sum(dim=1),
                    ],
                    dim=-1,
                )
            else:
                """
                s = 2
                # input = torch.zeros((1, 5, 400, 200), device=device)
                fadj_size = torch.tensor(input.shape[-2:]) / 256
                adj_size = s * fadj_size.ceil().int()
                fx, fy = torch.meshgrid(
                    torch.linspace(-adj_size[1]/2, adj_size[1]/2, adj_size[1], device=device),
                    torch.linspace(-adj_size[0]/2, adj_size[0]/2, adj_size[0], device=device), indexing='xy')
                cx2 = fx**2
                cy2 = fy**2

                dist_x_pos = (cy2 + (fx - adj_size[1]/3)**2) / (s * fadj_size[1] * ctx.smoothing)**2
                dist_x_neg = (cy2 + (fx + adj_size[1]/3)**2) / (s * fadj_size[1] * ctx.smoothing)**2

                dist_y_pos = (cx2 + (fy - adj_size[0]/3)**2) / (s * fadj_size[0] * ctx.smoothing)**2
                dist_y_neg = (cx2 + (fy + adj_size[0]/3)**2) / (s * fadj_size[0] * ctx.smoothing)**2

                sm_dx_filter = ((gaussian_partial(dist_x_pos, ctx.smoothing) - gaussian_partial(dist_x_neg, ctx.smoothing))/2).reshape(1, 1, *adj_size)
                sm_dy_filter = ((gaussian_partial(dist_y_pos, ctx.smoothing) - gaussian_partial(dist_y_neg, ctx.smoothing))/2).reshape(1, 1, *adj_size)
                #"""
                # """
                # ic(adj_size, fadj_size, (fx + adj_size[0]/3)**2)
                # ic(dist_x_pos)
                # ic(dist_x_neg)

                dy_filter = (f_blur[None, :] * f_edge[:, None]).reshape(1, 1, l, l)
                dx_filter = dy_filter.permute(0, 1, 3, 2)
                # """
                # """

                dy_filter = (f_blur[None, :] * f_edge[:, None]).reshape(1, 1, l, l)
                dx_filter = dy_filter.permute(0, 1, 3, 2)
                if ctx.smoothing >= 1:
                    smooth_kern = gkern(
                        2 * int(ctx.smoothing + 0.5) + 1,
                        std=1,
                        device=grad_output.device,
                    )
                    smooth_kern /= smooth_kern.sum()
                    sm_dx_filter = combine_kernels2d(smooth_kern, dx_filter)
                    sm_dy_filter = combine_kernels2d(smooth_kern, dy_filter)
                else:
                    sm_dx_filter = dx_filter
                    sm_dy_filter = dy_filter
                """
                size_mul = (torch.tensor(input.shape[-2:]) / 256).ceil().int()
                sm_dx_filter = F.interpolate(
                    sm_dx_filter,
                    tuple((torch.tensor(sm_dx_filter.shape[-2:]) * size_mul).int()),
                    mode="bilinear",
                    align_corners=True,
                )
                sm_dy_filter = F.interpolate(
                    sm_dy_filter,
                    tuple((torch.tensor(sm_dy_filter.shape[-2:]) * size_mul).int()),
                    mode="bilinear",
                    align_corners=True,
                )
                # """

                padding = (sm_dx_filter.shape[-2] // 2, sm_dx_filter.shape[-1] // 2)
                dx_input = F.conv2d(
                    input.permute(1, 0, 2, 3), sm_dx_filter, stride=1, padding=padding
                )
                dy_input = F.conv2d(
                    input.permute(1, 0, 2, 3), sm_dy_filter, stride=1, padding=padding
                )
                # dx_input = dx_input / input.shape[-2] * 128
                # dy_input = dy_input / input.shape[-1] * 128

                dx = F.grid_sample(
                    dx_input.permute(1, 0, 2, 3),
                    grid,
                    mode=ctx.mode,
                    padding_mode=ctx.padding_mode,
                    align_corners=ctx.align_corners,
                )
                dy = F.grid_sample(
                    dy_input.permute(1, 0, 2, 3),
                    grid,
                    mode=ctx.mode,
                    padding_mode=ctx.padding_mode,
                    align_corners=ctx.align_corners,
                )

                grad_grid = torch.stack(
                    [(grad_output * dx).sum(dim=1), (grad_output * dy).sum(dim=1)],
                    dim=-1,
                )

        grad_input = None
        if ctx.needs_input_grad[0]:
            #  if True:
            if ctx.mode == "bilinear":
                mode_enum = 0
            elif ctx.mode == "nearest":
                mode_enum = 1
            else:  # mode == 'bicubic'
                mode_enum = 2

            if ctx.padding_mode == "zeros":
                padding_mode_enum = 0
            elif ctx.padding_mode == "border":
                padding_mode_enum = 1
            else:  # padding_mode == 'reflection'
                padding_mode_enum = 2
            if is_3d:
                op = torch._C._jit_get_operation("aten::grid_sampler_3d_backward")
                if type(op) == tuple:
                    op = op[0]
                grad_input, _ = op(
                    grad_output,
                    input,
                    grid,
                    mode_enum,
                    padding_mode_enum,
                    ctx.align_corners,
                )
            else:
                op = torch._C._jit_get_operation("aten::grid_sampler_2d_backward")
                if type(op) == tuple:
                    op = op[0]
                grad_input, _ = op(
                    grad_output,
                    input,
                    grid,
                    mode_enum,
                    padding_mode_enum,
                    ctx.align_corners,
                    (ctx.needs_input_grad[0], False),
                )

        return grad_input, grad_grid, None, None, None, None


class GridSampler1D(torch.autograd.Function):
    @staticmethod
    def forward(
        ctx,
        input,
        grid,
        mode="bilinear",
        padding_mode="zeros",
        align_corners=None,
        smoothing=0,
    ):
        # plane.shape: 1, n_comp, grid_size, 1
        # grid: (1, N, 1, 2)
        ctx.save_for_backward(input, grid)
        ctx.mode = mode
        ctx.padding_mode = padding_mode
        ctx.align_corners = align_corners
        ctx.smoothing = smoothing
        return F.grid_sample(
            input,
            grid,
            mode=mode,
            padding_mode=padding_mode,
            align_corners=align_corners,
        )

    @staticmethod
    def backward(ctx, grad_output):
        input, grid = ctx.saved_tensors
        mode = ctx.mode
        padding_mode = ctx.padding_mode
        align_corners = ctx.align_corners
        smoothing = ctx.smoothing
        grad_grid = None
        if ctx.needs_input_grad[1]:
            # f_edge = torch.tensor([-1, 0, 1]) / 2
            # f_edge = torch.tensor([1, 0, -1]) / 2
            f_edge = SIGN * torch.tensor([1, -1]) / 2
            l = len(f_edge)

            dz_filter = f_edge.reshape(1, 1, l)
            smooth_kern = gaussian_fn(2 * int(smoothing) + 3, std=smoothing)
            sm_dx_filter = combine_kernels2d(smooth_kern, dz_filter)
            s = sm_dx_filter.shape[-1]

            dx_input = F.conv1d(
                input, sm_dx_filter.reshape(1, 1, s), stride=1, padding=s // 2
            )

            grad_grid = grad_output * F.grid_sample(
                dx_input,
                grid,
                mode=mode,
                padding_mode=padding_mode,
                align_corners=align_corners,
            )

        grad_input = None
        if ctx.needs_input_grad[0]:
            if mode == "bilinear":
                mode_enum = 0
            elif mode == "nearest":
                mode_enum = 1
            else:  # mode == 'bicubic'
                mode_enum = 2

            if padding_mode == "zeros":
                padding_mode_enum = 0
            elif padding_mode == "border":
                padding_mode_enum = 1
            else:  # padding_mode == 'reflection'
                padding_mode_enum = 2
            op = torch._C._jit_get_operation("aten::grid_sampler_1d_backward")

            grad_input, _ = op(
                grad_output,
                input,
                grid,
                mode_enum,
                padding_mode_enum,
                align_corners,
                (ctx.needs_input_grad[1], False),
            )
        return grad_input, grad_grid, None, None, None, None


def grid_sample(
    input, grid, mode="bilinear", padding_mode="zeros", align_corners=None, smoothing=0
):
    # plane.shape: 1, n_comp, grid_size, 1
    # grid: (1, N, 1, 2)
    if grid.shape[-1] == 2 or grid.shape[-1] == 3:
        return GridSampler2D.apply(
            input, grid, mode, padding_mode, align_corners, smoothing
        )
    else:
        raise NotImplementedError("GridSampler only implemented for 2D/3D inputs")


if __name__ == "__main__":
    import cv2
    import matplotlib.pyplot as plt

    im = cv2.imread("plane.png")
    s = im.shape[1]
    plt.imshow(im)
    plt.figure()
    im = torch.as_tensor(im, dtype=torch.float32).permute(2, 0, 1).unsqueeze(0)
    x, y = torch.meshgrid(
        torch.linspace(-1, 1, s), torch.linspace(-1, 1, s), indexing="ij"
    )
    grid = torch.stack([x, y], dim=-1).unsqueeze(0).reshape(1, -1, 1, 2)
    ic(grid.shape)
    grid.requires_grad = True
    dist = torch.linalg.norm(grid, dim=-1, keepdim=True) + 1e-8
    ic(dist.shape)
    grid = torch.where(dist > 0.5, (1 - 1 / dist), dist) * grid / dist
    ic(grid)
    plt.imshow(grid.detach().numpy()[0, :, :, 0].reshape(s, s))
    plt.figure()
    plt.imshow(im[0].permute(1, 2, 0).detach().numpy())
    samp_im = grid_sample(im, grid, smoothing=0)
    ic(samp_im.shape)
    grad_outputs = torch.ones(samp_im.shape)
    plt.imshow(samp_im.detach().reshape(3, s, s).permute(1, 2, 0).numpy())
    plt.figure()
    g = torch.autograd.grad(
        samp_im, grid, grad_outputs=grad_outputs, create_graph=True, allow_unused=True
    )[0]
    ic(grid.shape)
    ic(g.shape)
    plt.imshow(g[..., 0].detach().reshape(s, s))
    plt.figure()
    plt.imshow(g[..., 1].detach().reshape(s, s))
    plt.show()