-
Notifications
You must be signed in to change notification settings - Fork 1
/
_demo_.py
57 lines (45 loc) · 985 Bytes
/
_demo_.py
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
# Copyright (c) QIU Tian. All rights reserved.
from torch import nn
# Demo configuration: plain module-level settings grouped by concern.
# How each value is consumed is decided by the code that loads this module,
# which is not visible from this file.

# runtime
device = 'cuda'
seed = 42
batch_size = 256
epochs = 300
clip_max_norm = 1.0
eval_interval = 1
num_workers = None  # auto
pin_memory = True
sync_bn = True
find_unused_params = False
dist_url = 'env://'  # NOTE(review): presumably the distributed init URL - confirm against the loader
print_freq = 50
amp = True

# dataset
data_root = './data'
dataset = 'cifar10'

# data augmentation
image_size = 32

# model
model_lib = 'default'
model = 'vit_tiny_patch4_32'
# Do NOT set 'num_classes' in 'model_kwargs'.
model_kwargs = dict(in_chans=3, act_layer=nn.GELU, drop_path_rate=0.1)

# criterion
criterion = 'default'

# optimizer
optimizer = 'adamw'
# Base rate 0.0005 scaled linearly by batch size relative to 512,
# so changing 'batch_size' above changes 'lr' with it.
lr = 0.0005 * (batch_size / 512)
weight_decay = 5e-2

# lr_scheduler
scheduler = 'cosine'
warmup_epochs = 20
warmup_lr = 1e-06
min_lr = 1e-05

# evaluator
evaluator = 'default'

# loading
no_pretrain = True

# saving
save_interval = 5
# Derived from 'model' and 'dataset' at import time; later reassignment of
# either name does not update this path.
output_dir = f'./runs/{model}-{dataset}'

# remarks
# Plain string: there is nothing to interpolate, so no f-prefix is needed.
note = "using the demo config in 'configs/_demo_.py'"