-
Notifications
You must be signed in to change notification settings - Fork 21
/
Copy pathmodel.py
73 lines (61 loc) · 1.88 KB
/
model.py
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
import torch
import torch.nn as nn
import torch.nn.functional as F
import timm
import hyptorch.nn as hypnn
def init_model(cfg):
cfg = cfg.as_dict()
if cfg["model"].startswith("dino"):
body = torch.hub.load("facebookresearch/dino:main", cfg["model"])
else:
body = timm.create_model(cfg["model"], pretrained=True)
if cfg.get("hyp_c", 0) > 0:
last = hypnn.ToPoincare(
c=cfg["hyp_c"],
ball_dim=cfg.get("emb", 128),
riemannian=False,
clip_r=cfg.get("clip_r", None),
)
else:
last = NormLayer()
bdim = 2048 if cfg["model"] == "resnet50" else 384
head = nn.Sequential(nn.Linear(bdim, cfg.get("emb", 128)), last)
nn.init.constant_(head[0].bias.data, 0)
nn.init.orthogonal_(head[0].weight.data)
rm_head(body)
if cfg.get("freeze", None) is not None:
freeze(body, cfg["freeze"])
model = HeadSwitch(body, head)
model.cuda().train()
return model
class HeadSwitch(nn.Module):
def __init__(self, body, head):
super(HeadSwitch, self).__init__()
self.body = body
self.head = head
self.norm = NormLayer()
def forward(self, x, skip_head=False):
x = self.body(x)
if type(x) == tuple:
x = x[0]
if not skip_head:
x = self.head(x)
else:
x = self.norm(x)
return x
class NormLayer(nn.Module):
def forward(self, x):
return F.normalize(x, p=2, dim=1)
def freeze(model, num_block):
def fr(m):
for param in m.parameters():
param.requires_grad = False
fr(model.patch_embed)
fr(model.pos_drop)
for i in range(num_block):
fr(model.blocks[i])
def rm_head(m):
names = set(x[0] for x in m.named_children())
target = {"head", "fc", "head_dist"}
for x in names & target:
m.add_module(x, nn.Identity())