video-object-remover

Sleeping

File size: 5,681 Bytes

d4b77ac

import random
import numpy as np

class RandomMask():
    """Produce a stack of per-frame box masks for one video clip.

    Each call draws one box with ``random_bbox`` and then, with roughly equal
    probability, either repeats the same mask for every frame or nudges the
    box by a small random offset before rendering each frame.
    """

    def __init__(self, videoLength, dataInfo):
        """Store the clip length and the geometry found in ``dataInfo``.

        Args:
            videoLength: number of masks produced per call.
            dataInfo: mapping with an ``'image'`` entry (``image_height``,
                ``image_width``) and a ``'mask'`` entry (``mask_height``,
                ``mask_width`` and, optionally, the ``max_delta_*`` and
                ``*_margin`` pairs).

        Raises:
            KeyError: if a required image or mask size key is missing.
        """
        self.videoLength = videoLength

        image_cfg = dataInfo['image']
        self.imageHeight = image_cfg['image_height']
        self.imageWidth = image_cfg['image_width']

        mask_cfg = dataInfo['mask']
        self.maskHeight = mask_cfg['mask_height']
        self.maskWidth = mask_cfg['mask_width']

        # Each optional pair is all-or-nothing: if either key of a pair is
        # missing, both values of that pair fall back to 0.
        try:
            delta_pair = (mask_cfg['max_delta_height'], mask_cfg['max_delta_width'])
        except KeyError:
            delta_pair = (0, 0)
        # NOTE(review): these two values are stored but not read anywhere in
        # this class.
        self.maxDeltaHeight, self.maxDeltaWidth = delta_pair

        try:
            margin_pair = (mask_cfg['vertical_margin'], mask_cfg['horizontal_margin'])
        except KeyError:
            margin_pair = (0, 0)
        self.verticalMargin, self.horizontalMargin = margin_pair

    @staticmethod
    def _clamp(value, lower, upper):
        """Lift ``value`` to at least ``lower``, then cap the result at ``upper``."""
        return min(max(lower, value), upper)

    def __call__(self):
        """Build the mask stack for one clip.

        Returns:
            The per-frame masks stacked along a new leading axis. A trailing
            axis is appended when the stacked result is 3-D, so the returned
            array is always 4-D.

        Raises:
            AssertionError: if the stacked masks are not 4-D after the
                optional axis expansion.
        """
        from .utils import bbox2mask
        from .utils import random_bbox

        # The box is indexed as [0]/[1] for position and [2]/[3] for extent
        # below -- presumably (top, left, height, width); verify in utils.
        box = random_bbox(self.imageHeight, self.imageWidth,
                          self.verticalMargin, self.horizontalMargin,
                          self.maskHeight, self.maskWidth)

        keep_still = random.uniform(0, 1) > 0.5
        if keep_still:
            # Static case: render once and reuse the same mask for all frames.
            still_mask = bbox2mask(self.imageHeight, self.imageWidth, 0, 0, box)
            frame_masks = [still_mask for _ in range(self.videoLength)]
        else:
            frame_masks = []
            for _ in range(self.videoLength):
                # Each step moves the box by at most three pixels along each axis.
                shift_y = random.randint(-3, 3)
                shift_x = random.randint(-3, 3)
                box = list(box)
                # Keep the shifted box inside the margins on both sides.
                box[0] = self._clamp(box[0] + shift_y,
                                     self.verticalMargin,
                                     self.imageHeight - self.verticalMargin - box[2])
                box[1] = self._clamp(box[1] + shift_x,
                                     self.horizontalMargin,
                                     self.imageWidth - self.horizontalMargin - box[3])
                frame_masks.append(
                    bbox2mask(self.imageHeight, self.imageWidth, 0, 0, box))

        stacked = np.stack(frame_masks, axis=0)
        if stacked.ndim == 3:
            stacked = stacked[..., np.newaxis]
        assert stacked.ndim == 4, 'Wrong mask dimension {}'.format(stacked.ndim)
        return stacked


class MidRandomMask():
    """Callable that returns the mask built by ``mid_bbox_mask``.

    This mask is considered without random motion.
    """

    def __init__(self, videoLength, dataInfo):
        """Store the clip length and the image/mask sizes from ``dataInfo``.

        Args:
            videoLength: clip length; stored on the instance but not used when
                the mask is generated.
            dataInfo: mapping with an ``'image'`` entry (``image_height``,
                ``image_width``) and a ``'mask'`` entry (``mask_height``,
                ``mask_width``).

        Raises:
            KeyError: if any of the size keys is missing.
        """
        self.videoLength = videoLength
        self.imageHeight, self.imageWidth = dataInfo['image']['image_height'], \
                                            dataInfo['image']['image_width']
        self.maskHeight, self.maskWidth = dataInfo['mask']['mask_height'], \
                                          dataInfo['mask']['mask_width']

    def __call__(self):
        """Return the single mask produced by ``mid_bbox_mask``.

        Returns:
            Whatever ``mid_bbox_mask`` returns for the stored image and mask
            sizes; the value is passed through unchanged.
        """
        from .utils import mid_bbox_mask
        # NOTE(review): earlier code also collected ``videoLength`` copies of
        # the mask into a list and then discarded it, returning this single
        # mask. The dead list is dropped here and the return value is left as
        # it was; confirm with callers whether a per-frame stack was intended.
        return mid_bbox_mask(self.imageHeight, self.imageWidth,
                             self.maskHeight, self.maskWidth)


class MatrixMask():
    """Callable that returns the mask built by ``matrix2bbox``.

    This mask is considered without random motion.
    """

    def __init__(self, videoLength, dataInfo):
        """Store the clip length, image/mask sizes and the grid layout.

        Args:
            videoLength: clip length; stored on the instance but not used when
                the mask is generated.
            dataInfo: mapping with an ``'image'`` entry (``image_height``,
                ``image_width``) and a ``'mask'`` entry (``mask_height``,
                ``mask_width`` and, optionally, ``row`` and ``column``).

        Raises:
            KeyError: if any of the size keys is missing.
        """
        self.videoLength = videoLength
        self.imageHeight, self.imageWidth = dataInfo['image']['image_height'], \
                                            dataInfo['image']['image_width']
        self.maskHeight, self.maskWidth = dataInfo['mask']['mask_height'], \
                                          dataInfo['mask']['mask_width']
        # ``row``/``column`` are all-or-nothing: if either key is missing,
        # both fall back to the defaults 5 and 4.
        try:
            self.row, self.column = dataInfo['mask']['row'], \
                                dataInfo['mask']['column']
        except KeyError:
            self.row, self.column = 5, 4

    def __call__(self):
        """Return the single mask produced by ``matrix2bbox``.

        Returns:
            Whatever ``matrix2bbox`` returns for the stored sizes and grid
            layout; the value is passed through unchanged.
        """
        from .utils import matrix2bbox
        # NOTE(review): earlier code also collected ``videoLength`` copies of
        # the mask into a list and then discarded it, returning this single
        # mask. The dead list is dropped here and the return value is left as
        # it was; confirm with callers whether a per-frame stack was intended.
        return matrix2bbox(self.imageHeight, self.imageWidth, self.maskHeight,
                           self.maskWidth, self.row, self.column)


class FreeFormMask():
    """Callable wrapper that forwards stored settings to ``freeFormMask``."""

    def __init__(self, videoLength, dataInfo):
        """Store the clip length, image size and free-form mask settings.

        Args:
            videoLength: clip length; stored on the instance but not used when
                the mask is generated.
            dataInfo: mapping with an ``'image'`` entry (``image_height``,
                ``image_width``) and a ``'mask'`` entry (``max_vertex``,
                ``max_length``, ``max_brush_width``, ``max_angle``).

        Raises:
            KeyError: if any of the keys above is missing.
        """
        self.videoLength = videoLength

        image_cfg = dataInfo['image']
        self.imageHeight = image_cfg['image_height']
        self.imageWidth = image_cfg['image_width']

        mask_cfg = dataInfo['mask']
        self.maxVertex = mask_cfg['max_vertex']
        self.maxLength = mask_cfg['max_length']
        self.maxBrushWidth = mask_cfg['max_brush_width']
        self.maxAngle = mask_cfg['max_angle']

    def __call__(self):
        """Return the result of ``freeFormMask`` for the stored settings."""
        from .utils import freeFormMask

        stroke_settings = (self.maxVertex, self.maxLength,
                           self.maxBrushWidth, self.maxAngle)
        return freeFormMask(self.imageHeight, self.imageWidth, *stroke_settings)


class StationaryMask():
    """Callable that stacks the masks from ``create_random_shape_with_random_motion``."""

    def __init__(self, videoLength, dataInfo):
        """Store the clip length and the image size from ``dataInfo``.

        Args:
            videoLength: forwarded as the first argument of the mask generator.
            dataInfo: mapping with an ``'image'`` entry (``image_height``,
                ``image_width``). The ``'mask'`` entries ``max_point_num`` and
                ``max_length`` are currently not read.

        Raises:
            KeyError: if an image size key is missing.
        """
        self.videoLength = videoLength
        image_cfg = dataInfo['image']
        self.imageHeight = image_cfg['image_height']
        self.imageWidth = image_cfg['image_width']

    def __call__(self):
        """Generate the masks and return them as one stacked array.

        Returns:
            The generator's masks stacked along a new leading axis. A trailing
            axis is appended when the stacked result is 3-D, so the returned
            array is always 4-D.

        Raises:
            AssertionError: if the stacked masks are not 4-D after the
                optional axis expansion.
        """
        from .STTN_mask import create_random_shape_with_random_motion

        # NOTE(review): the meaning of the constants 0.9, 1.1, 1 and 10 is
        # defined by the generator in STTN_mask; check its signature.
        frame_masks = create_random_shape_with_random_motion(
            self.videoLength, 0.9, 1.1, 1, 10, self.imageHeight, self.imageWidth)

        stacked = np.stack(frame_masks, axis=0)
        if stacked.ndim == 3:
            stacked = stacked[..., np.newaxis]
        assert stacked.ndim == 4, 'Your masks with a wrong shape {}'.format(stacked.ndim)
        return stacked