-
Notifications
You must be signed in to change notification settings - Fork 88
Expand file tree
/
Copy pathconfigs.yml
More file actions
118 lines (104 loc) · 2.36 KB
/
configs.yml
File metadata and controls
118 lines (104 loc) · 2.36 KB
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
# ----------------------------------------------------------------------------------
# Settings for the `vit_base_pod16` profile (model: mae_vit_base_patch16).
# Every key below is nested under the profile name so that it does not
# collide with the same-named keys of the other profiles in this file.
vit_base_pod16:
  # Execution
  half: true
  rts: true
  # batch_size * gradient_accumulation_count * replica = 6 * 172 * 4 = 4128
  # NOTE(review): presumably the effective global batch size; confirm
  # against the training script.
  batch_size: 6
  gradient_accumulation_count: 172
  replica: 4
  epochs: 1600
  device: ipu
  num_workers: 48
  output: checkpoint_mae_vit_base
  log: vit_base_pod16
  warmup_epochs: 40
  saveckp_freq: 4
  print_freq: 15
  async_type: async
  rebatched_worker_size: 1032
  norm_pix_loss: true
  resume: false

  # Model
  model: mae_vit_base_patch16
  checkpoint: checkpoint.pth
  input_size: 224
  mask_ratio: 0.75
  embed_dim: 768
  # One entry per pipeline stage.
  # NOTE(review): presumably the number of layers placed on each stage; confirm.
  pipeline: [3, 3, 3, 3, 2, 2, 2, 2]
  # tanh or erf
  gelu_type: tanh

  # Optimizer
  blr: 1.5e-4
  weight_decay: 0.05
  # 8388608 = 2**23; written with an explicit fractional part so it is
  # unambiguously a float.
  loss_scale: 8388608.0
  optimizer_step: 10
  use_als: false
# ----------------------------------------------------------------------------------
# ----------------------------------------------------------------------------------
# Settings for the `vit_base_pod64` profile (model: mae_vit_base_patch16).
# Every key below is nested under the profile name so that it does not
# collide with the same-named keys of the other profiles in this file.
vit_base_pod64:
  # Execution
  half: true
  rts: false
  # batch_size * gradient_accumulation_count * replica = 6 * 43 * 16 = 4128
  # NOTE(review): presumably the effective global batch size; confirm
  # against the training script.
  batch_size: 6
  gradient_accumulation_count: 43
  replica: 16
  epochs: 1600
  device: ipu
  num_workers: 64
  output: checkpoint_mae_vit_base_pod64
  log: vit_base_pod64
  warmup_epochs: 40
  saveckp_freq: 4
  print_freq: 10
  async_type: async
  rebatched_worker_size: 1032
  norm_pix_loss: true
  resume: false

  # Model
  model: mae_vit_base_patch16
  checkpoint: checkpoint.pth
  input_size: 224
  mask_ratio: 0.75
  embed_dim: 768
  # One entry per pipeline stage.
  # NOTE(review): presumably the number of layers placed on each stage; confirm.
  pipeline: [3, 3, 3, 3, 2, 2, 2, 2]
  # tanh or erf
  gelu_type: tanh

  # Optimizer
  blr: 1.5e-4
  weight_decay: 0.05
  # 8388608 = 2**23; written with an explicit fractional part so it is
  # unambiguously a float.
  loss_scale: 8388608.0
  optimizer_step: 10
  use_als: false
# ----------------------------------------------------------------------------------
# ----------------------------------------------------------------------------------
# Settings for the `vit_base_finetune` profile (model: vit_base_patch16).
# Every key below is nested under the profile name so that it does not
# collide with the same-named keys of the other profiles in this file.
vit_base_finetune:
  # Execution
  half: true
  # batch_size * gradient_accumulation_count * replica = 8 * 256 * 4 = 8192
  # NOTE(review): presumably the effective global batch size; confirm
  # against the training script.
  batch_size: 8
  gradient_accumulation_count: 256
  replica: 4
  epochs: 100
  device: ipu
  num_workers: 64
  output: checkpoint_mae_vit_base_finetune
  log: finetune
  saveckp_freq: 4
  print_freq: 10
  async_type: rebatch
  rebatched_worker_size: 256
  ipus: 4
  eval: false
  resume: false

  # Model
  model: vit_base_patch16
  input_size: 224
  # Four pipeline stages, matching `ipus: 4` above.
  pipeline: [3, 3, 3, 3]

  # Optimizer and augmentation
  # Written as 5.0e-4 rather than 5e-4: YAML 1.1 loaders (e.g. PyYAML) only
  # recognise scientific notation as a float when the mantissa has a decimal
  # point; a bare `5e-4` is loaded as the string "5e-4".
  blr: 5.0e-4
  layer_decay: 0.65
  weight_decay: 0.05
  drop_path: 0.1
  reprob: 0.25
  mixup: 0.8
  cutmix: 1.0
  loss_scale: 1024
# ----------------------------------------------------------------------------------