Digital-Image-Processing-Project/transform.py at main · Screamadelicax/Digital-Image-Processing-Project · GitHub

1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
import torchvision.transforms as transforms
import torch
import torch.nn.functional as F
import cv2
import random

class transform_method:
    """Callable that dispatches an image to one of the numbered ``method_<n>`` transforms.

    How the transforms are meant to be used (per the original author's notes):

    * ``transform_method_origin``: applied to every sample once, when the data
      is loaded.
    * ``transform_method_epoch``: applied to the training data in every epoch,
      after loading.

    So training data goes through ``transform_method_origin`` and then
    ``transform_method_epoch``, while validation data only goes through
    ``transform_method_origin``.  ``transform_method_epoch`` is therefore
    normally used for data augmentation (random crop, random rotation, ...),
    and ``transform_method_origin`` for preprocessing (resize, normalize, ...).
    If no augmentation is wanted, set ``transform_method_epoch = 0`` in the
    command-line arguments.
    """

    def __init__(self, method=1):
        """Store the selected method id and build the torchvision pipelines.

        Args:
            method: Suffix of the ``method_<n>`` transform that ``__call__``
                dispatches to (e.g. ``1`` selects ``method_1``).
        """
        # NOTE: transform1/transform2 are not used by any method in this class;
        # they are kept as attributes in case other code reads them.
        self.transform1 = transforms.Compose([
            transforms.ToPILImage(),
            transforms.Resize((512, 512)),
            transforms.ToTensor(),
            transforms.Normalize((0.5,), (0.5,))
        ])
        self.transform2 = transforms.Compose([
            transforms.RandomResizedCrop(224),
            transforms.RandomHorizontalFlip(),
            transforms.ToTensor(),
            transforms.Normalize([0.485, 0.456, 0.406], [0.229, 0.224, 0.225])
        ])
        self.method = method

    def __call__(self, image):
        """Return the selected transformation applied to the input image.

        Example: with ``self.method == 1`` this returns ``self.method_1(image)``.

        Raises:
            AttributeError: If no ``method_<self.method>`` exists on this class.
        """
        # Look the handler up first so that an AttributeError raised *inside*
        # a transform is never confused with an unknown method id.
        handler = getattr(self, f'method_{self.method}', None)
        if handler is None:
            raise AttributeError(
                f'Unknown transform method: {self.method!r} '
                f'(no method_{self.method} defined).'
            )
        return handler(image)

    def normalization(self, image):
        """Normalize a 3-channel tensor with per-channel mean 0.5 and std 0.5.

        Computes ``(image - 0.5) / 0.5`` for each channel, which maps values
        in [0, 1] to [-1, 1].

        Args:
            image: Tensor whose channel dimension (size 3) is third from last,
                e.g. ``(3, H, W)`` or ``(N, 3, H, W)``.

        Returns:
            The normalized floating-point tensor (a new tensor).
        """
        # Integer inputs would truncate 0.5 to 0 and divide by zero below.
        if not image.is_floating_point():
            image = image.float()

        # Shape (3, 1, 1) so the statistics broadcast over height and width.
        mean = torch.tensor([0.5, 0.5, 0.5], dtype=image.dtype, device=image.device).view(-1, 1, 1)
        std = torch.tensor([0.5, 0.5, 0.5], dtype=image.dtype, device=image.device).view(-1, 1, 1)

        return (image - mean) / std

    def _resize_to_tensor(self, image, size=(512, 512)):
        """Resize an HWC image with OpenCV and return it as a float CHW tensor."""
        # e.g. (800, 800, 3) -> (512, 512, 3)
        image = cv2.resize(image, size)

        # HWC array -> CHW float tensor, e.g. (3, 512, 512)
        return torch.from_numpy(image).permute(2, 0, 1).to(torch.float)

    def method_0(self, image):
        """Return the original image."""
        return image

    def method_1(self, image):
        """Origin transform: resize to 512x512, convert to a CHW float tensor, scale by 1/255."""
        image = self._resize_to_tensor(image)

        # Scale by 1/255 (maps 8-bit pixel values into [0, 1]).
        image = image / 255.0

        return image

    def method_2(self, image):
        """Epoch transform: random flip followed by a random right-angle rotation.

        Args:
            image: Tensor of shape ``(3, H, W)``.

        Returns:
            The augmented tensor.
        """
        # input shape torch.tensor([3, x, x])
        assert image.shape[0] == 3, f'Input image must have 3 channels, but got {image.shape[0]} channels.'

        # A single draw decides the flip, so the branches really have the
        # intended probabilities:
        #   0.25 -> flip along dim 1 (height, i.e. vertical flip)
        #   0.25 -> flip along dim 2 (width, i.e. horizontal flip)
        #   0.50 -> no flip
        flip_draw = random.random()
        if flip_draw < 0.25:
            image = torch.flip(image, [1])
        elif flip_draw < 0.5:
            image = torch.flip(image, [2])

        # Rotate by 0, 90, 180 or 270 degrees, each with probability 0.25.
        angle = random.choice((0, 90, 180, 270))
        if angle:
            image = transforms.functional.rotate(image, angle)

        return image

    def method_12(self, image):
        """Origin transform: resize to 512x512 and suppress near-saturated pixels.

        The image is converted to a CHW float tensor and is NOT divided by 255.
        Every value above 98% of 255 is replaced by the mean of the remaining
        (below-threshold) values.

        Returns:
            The processed float CHW tensor.
        """
        image = self._resize_to_tensor(image)

        # Replace the pixel values that exceed the threshold with the mean of
        # all values that do not.
        threshold = 0.98 * 255
        mask = image > threshold
        keep = ~mask

        # If nothing exceeds the threshold there is nothing to replace; if
        # everything does, the mean of an empty selection would be NaN and
        # would poison the whole image, so leave the image untouched.
        if mask.any() and keep.any():
            image[mask] = image[keep].mean()

        return image