-
Notifications
You must be signed in to change notification settings - Fork 5
Expand file tree
/
Copy pathmodels.py
More file actions
110 lines (93 loc) · 3.92 KB
/
models.py
File metadata and controls
110 lines (93 loc) · 3.92 KB
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
import torch
import torch.nn as nn
import torch.nn.functional as F
from operator import itemgetter
from transformers import Swinv2Config, Swinv2ForImageClassification
from ultralytics import YOLO
class CNNModel1(nn.Module):
def __init__(self, fully_layer_1, fully_layer_2, drop_rate):
super(CNNModel1, self).__init__()
self.conv1 = nn.Conv2d(3, 32, 2)
self.bn1 = nn.BatchNorm2d(32)
self.conv2 = nn.Conv2d(32, 64, 2)
self.bn2 = nn.BatchNorm2d(64)
self.conv3 = nn.Conv2d(64, 128, 2)
self.bn3 = nn.BatchNorm2d(128)
self.conv4 = nn.Conv2d(128, 64, 2)
self.bn4 = nn.BatchNorm2d(64)
self.conv5 = nn.Conv2d(64, 32, 2)
self.bn5 = nn.BatchNorm2d(32)
self.pool = nn.MaxPool2d(2, 2)
self.drop_rate = drop_rate
#self.dropout = nn.Dropout(drop_rate)
self.fc1 = nn.Linear(#32*5*5,
32*8*8, fully_layer_1)
self.fc2 = nn.Linear(fully_layer_1, fully_layer_2)
self.fc3 = nn.Linear(fully_layer_2, 2)
def forward(self, x):
#print(x.shape)
x = self.pool(F.relu(self.bn1(self.conv1(x))))
#print(x.shape)
x = self.pool(F.relu(self.bn2(self.conv2(x))))
#print(x.shape)
x = self.pool(F.relu(self.bn3(self.conv3(x))))
#print(x.shape)
x = self.pool(F.relu(self.bn4(self.conv4(x))))
#print(x.shape)
x = self.pool(F.relu(self.bn5(self.conv5(x))))
#print(x.shape)
x = x.view(-1, #32*5*5) # For 200x200 images
32*8*8) # For 300x300 images
"""
x = self.dropout(F.relu(self.fc1(x))
x = self.dropout(F.relu(self.fc2(x))
x = self.dropout(x)"""
x = F.dropout(F.relu(self.fc1(x)), self.drop_rate, self.training)
x = F.dropout(F.relu(self.fc2(x)), self.drop_rate, self.training)
x = self.fc3(x)
return x
# TODO: Create other models
class ViT(nn.Module):
def __init__(self, window_size,hidden_size,att_drop,drop_path_rate,drop_rate,layer_norm_eps,encoder_stride,embed_dim,depths,mlp_ratio,num_classes = 2):
super(ViT, self).__init__()
configuration = Swinv2Config()
configuration.hidden_size = hidden_size
configuration.image_size = 300
configuration.hidden_dropout_prob = float(drop_rate)
configuration.window_size = int(window_size)
configuration.attention_probs_dropout_prob = float(att_drop)
configuration.drop_path_rate = float(drop_path_rate)
configuration.layer_norm_eps = float(layer_norm_eps)
configuration.encoder_stride = int(encoder_stride)
configuration.embed_dim = int(embed_dim)
configuration.depths = depths
configuration.mlp_ratio = mlp_ratio
configuration.num_labels = num_classes
model = Swinv2ForImageClassification(configuration)
self.vit = model
def forward(self, x, return_attention=False):
outputs = self.vit(
x,
output_attentions=return_attention,
return_dict=True
)
if return_attention:
return outputs.logits, outputs.attentions
return outputs.logits
class YOLOv11Classifier(nn.Module):
def __init__(self, num_classes, model_size):
super().__init__()
yolo = YOLO(f"{model_size}-cls.pt")
head = yolo.model.model[-1]
if hasattr(head, "linear"):
in_features = head.linear.in_features
head.linear = nn.Linear(in_features, num_classes)
elif hasattr(head, "fc"):
in_features = head.fc.in_features
head.fc = nn.Linear(in_features, num_classes)
self.model = yolo.model
def forward(self, x):
out = self.model(x)
if isinstance(out, (tuple, list)):
out = out[0]
return out