Kaggle-UWMGIT / Git / [f1e01c] /mmseg/datasets/pipelines/custom/tamper

Models:
Mathew-S/
Kaggle-UWMGIT
Downloads: 1
[f1e01c]: / mmseg / datasets / pipelines / custom / tamper_transforms.py
History
Download this file
155 lines (127 with data), 5.6 kB

import copy
import os
import inspect
from collections import defaultdict

import cv2
import mmcv
import numpy as np
from copy import deepcopy
from mmcv.utils import deprecated_api_warning, is_tuple_of
from numpy import random
import math

import traceback

from torch import matrix_power

try:
    from imagecorruptions import corrupt
except ImportError:
    corrupt = None

try:
    import albumentations
    from albumentations import Compose
except ImportError:
    albumentations = None
    Compose = None

from ...builder import PIPELINES

@PIPELINES.register_module()
class RandomRemove(object):
    def __init__(self, prob=0., y_crop_ratio=(0.05, 0.15), x_crop_ratio=(0.15, 0.25)):
        self.prob = prob
        self.x_crop_ratio = x_crop_ratio
        self.y_crop_ratio = y_crop_ratio

    def get_crop_bbox(self, img, crop_size = None):
        """Randomly get a crop bounding box."""
        if crop_size is None:
            crop_size = (
                int(img.shape[0] * (np.random.rand() * (self.y_crop_ratio[1] - self.y_crop_ratio[0]) + self.y_crop_ratio[0])),
                int(img.shape[1] * (np.random.rand() * (self.x_crop_ratio[1] - self.x_crop_ratio[0]) + self.x_crop_ratio[0]))
            )
        margin_h = max(img.shape[0] - crop_size[0], 0)
        margin_w = max(img.shape[1] - crop_size[1], 0)
        offset_h = np.random.randint(0, margin_h + 1)
        offset_w = np.random.randint(0, margin_w + 1)
        crop_y1, crop_y2 = offset_h, offset_h + crop_size[0]
        crop_x1, crop_x2 = offset_w, offset_w + crop_size[1]

        return crop_y1, crop_y2, crop_x1, crop_x2
    
    def __call__(self, results):
        """Call function to flip bounding boxes, masks, semantic segmentation
        maps.

        Args:
            results (dict): Result dict from loading pipeline.

        Returns:
            dict: Flipped results, 'flip', 'flip_direction' keys are added into
                result dict.
        """
        if np.random.rand() < self.prob:
            img = results['img']
            seg = results['gt_semantic_seg']
            y1, y2, x1, x2 = self.get_crop_bbox(img)

            mask_ = np.zeros(img.shape[:2], dtype="uint8")
            xm1, ym1 = int(x1 + 0.5 * (y2 - y1)), int((y1 + y2) / 2)
            xm2, ym2 = int(x2 - 0.5 * (y2 - y1)), int((y1 + y2) / 2)
            xm1, xm2 = min(xm1, xm2), max(xm1, xm2)

            thickness = int(math.sqrt((y2 - y1) ** 2))

            cv2.line(mask_, (xm1, ym1), (xm2, ym2), 255, thickness)
            img = cv2.inpaint(img, mask_, 7, cv2.INPAINT_NS)

            seg[y1:y2, x1:x2,...] = 1
            
            results['img'] = img
            results['gt_semantic_seg'] = seg

        return results

@PIPELINES.register_module()
class RandomCopyMove(object):
    def __init__(self, prob=0., mix_prob=0., save_buffer=16, crop_ratio=(0.05, 0.15)):
        self.prob = prob
        self.mix_prob = mix_prob
        self.save_buffer = save_buffer
        self.saves = [None for _ in range(save_buffer)]
        self.crop_ratio = crop_ratio

    def get_crop_bbox(self, img, crop_size = None):
        """Randomly get a crop bounding box."""
        if crop_size is None:
            crop_size = (
                int(img.shape[0] * (np.random.rand() * (self.crop_ratio[1] - self.crop_ratio[0]) + self.crop_ratio[0])),
                int(img.shape[1] * (np.random.rand() * (self.crop_ratio[1] - self.crop_ratio[0]) + self.crop_ratio[0]))
            )
        margin_h = max(img.shape[0] - crop_size[0], 0)
        margin_w = max(img.shape[1] - crop_size[1], 0)
        offset_h = np.random.randint(0, margin_h + 1)
        offset_w = np.random.randint(0, margin_w + 1)
        crop_y1, crop_y2 = offset_h, offset_h + crop_size[0]
        crop_x1, crop_x2 = offset_w, offset_w + crop_size[1]

        return (crop_y1, crop_y2, crop_x1, crop_x2), crop_size

    def __call__(self, results):
        """Call function to flip bounding boxes, masks, semantic segmentation
        maps.

        Args:
            results (dict): Result dict from loading pipeline.

        Returns:
            dict: Flipped results, 'flip', 'flip_direction' keys are added into
                result dict.
        """
        self.save_results(results)
        if np.random.rand() < self.prob:
            if np.random.rand() < self.mix_prob:
                mix_idx = np.random.randint(0, len(self.saves))
                results = self.copy_move(results, self.saves[mix_idx])
            else:
                results = self.copy_move(results, results)
        return results

    def copy_move(self, results1, results2):
        results2 = results1 if results2 is None else results2
        img1 = results1['img']
        seg1 = results1['gt_semantic_seg']
        crop_bbox1, crop_size = self.get_crop_bbox(img1)
        crop_y11, crop_y21, crop_x11, crop_x21 = crop_bbox1
        img2 = results2['img']
        crop_bbox2, _ = self.get_crop_bbox(img2, crop_size)
        crop_y12, crop_y22, crop_x12, crop_x22 = crop_bbox2
        img1[crop_y11:crop_y21, crop_x11:crop_x21,...] = img2[crop_y12:crop_y22, crop_x12:crop_x22,...]
        seg1[crop_y11:crop_y21, crop_x11:crop_x21,...] = 1
        results1['img'] = img1
        results1['gt_semantic_seg'] = seg1
        return results1

    def save_results(self, results):
        mix_idx = np.random.randint(0, len(self.saves))
        if np.random.rand() < 0.5:
            self.saves[mix_idx] = deepcopy(results)

    def __repr__(self):
        return self.__class__.__name__ + f'(prob={self.prob}, mix_prob={self.mix_prob}, save_buffer={self.save_buffer})'