# t2t_vit_t_19.yaml
# Top-level run settings.
epochs: 300
output_dir: 'output_dir'
seed: 0
device: 'gpu'
# Model section: a wrapper entry with nested `architecture` and `head`
# sub-sections. Each level carries its own `name`, so the nesting is required
# to keep those keys from overwriting one another.
# NOTE(review): `head` is placed as a sibling of `architecture`; confirm
# against the code that consumes this config.
model:
  name: T2TViTWrapper
  architecture:
    name: T2TViT
    img_size: 224
    tokens_type: 'transformer'
    embed_dim: 448
    depth: 19
    num_heads: 7
  head:
    name: T2TViTClsHead
    num_classes: 1000
    # Same value as architecture.embed_dim above; presumably the two must be
    # kept in sync -- TODO confirm.
    in_channels: 448
# Data loading section; the visible config defines a `train` entry only.
# NOTE(review): the loader / sampler / dataset grouping was rebuilt from a
# copy that had lost its indentation; confirm against the consuming code.
dataloader:
  train:
    loader:
      num_workers: 8
      use_shared_memory: true
    sampler:
      batch_size: 128
      shuffle: true
      drop_last: true
    dataset:
      name: ImageNet
      dataroot: data/ILSVRC2012/train/
      return_label: true
      # One list item per transform; the keys following `name` belong to that
      # item (presumably passed as that transform's arguments).
      transforms:
        - name: ToRGB
        - name: RandomResizedCrop
          size: 224
          scale: [0.75, 1.0]
          ratio: [1.0, 1.0]
          interpolation: 'bicubic'
        - name: Transpose
        - name: Normalize
          # NOTE(review): 127.5 for both mean and std suggests inputs in
          # [0, 255] scaled to about [-1, 1] -- confirm.
          mean: [127.5, 127.5, 127.5]
          std: [127.5, 127.5, 127.5]
# Learning-rate schedule settings, nested so that `name` and the rate keys
# belong to the scheduler rather than to the top-level mapping.
lr_scheduler:
  name: CosineWarmup
  learning_rate: 0.003
  # NOTE(review): T_max and warmup_steps are fixed numbers, not derived from
  # `epochs` or the batch size in this file; presumably they need updating
  # together -- confirm.
  T_max: 93835
  warmup_steps: 10000
  # end_lr equals learning_rate; start_lr is 1/100 of it.
  start_lr: 0.00003
  end_lr: 0.003
# Optimizer settings. `grad_clip` is its own sub-mapping so that its `name`
# does not overwrite the optimizer's `name`.
optimizer:
  name: AdamW
  beta1: 0.9
  beta2: 0.999
  weight_decay: 0.3
  grad_clip:
    name: global_norm
    value: 1.0
# Logging settings, nested under `log_config`.
# NOTE(review): the unit of `interval` is not stated in this file -- confirm.
log_config:
  name: LogHook
  interval: 10