-
Notifications
You must be signed in to change notification settings - Fork 65
/
Copy pathcait_s24_224.yaml
67 lines (61 loc) · 1.19 KB
/
cait_s24_224.yaml
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
# Top-level run settings (plain scalars, not nested under any section).
# presumably the number of training epochs — confirm against the trainer
epochs: 300
# presumably the directory run outputs are written to — confirm
output_dir: output_dir
# presumably the random seed — confirm
seed: 0
# presumably the compute device the run targets — confirm
device: gpu
# Model definition: a `CaitWrapper` made of an `architecture` section and a
# `head` section.
# NOTE(review): the nesting below was reconstructed from a flattened copy in
# which every key sat at column 0 — confirm against the consumer's schema.
model:
  name: CaitWrapper
  architecture:
    name: Cait
    img_size: 224
    patch_size: 16
    embed_dim: 384
    depth: 24
    num_heads: 8
    # Written with a decimal point so that YAML 1.1 loaders (e.g. PyYAML)
    # resolve it as a float; a bare `1e-5` is loaded as a string there.
    init_scale: 1.0e-5
  head:
    name: CaitClsHead
    num_classes: 1000
    # Same value as architecture.embed_dim above.
    in_channels: 384
# Data loading: only a `train` split is configured here, with `loader`,
# `sampler` and `dataset` sections.
# NOTE(review): the nesting below was reconstructed from a flattened copy in
# which every key sat at column 0 — in particular, confirm that `transforms`
# belongs under `dataset` in the consumer's schema.
dataloader:
  train:
    loader:
      num_workers: 8
      use_shared_memory: true
    sampler:
      batch_size: 128
      shuffle: true
      drop_last: true
    dataset:
      name: ImageNet
      dataroot: data/ILSVRC2012/train/
      return_label: true
      # Listed in sequence order; each entry names one transform and carries
      # that transform's own arguments.
      transforms:
        - name: ToRGB
        - name: RandomResizedCrop
          size: 224
          scale: [0.75, 1.0]
          ratio: [1.0, 1.0]
          interpolation: 'bicubic'
        - name: Transpose
        - name: NormalizeImage
          # This value is a string, not a number: YAML does not evaluate the
          # division. Quoted to make that explicit.
          # presumably the consumer evaluates the expression — confirm
          scale: '1.0/255.0'
          mean: [0.485, 0.456, 0.406]
          std: [0.229, 0.224, 0.225]
# Learning-rate schedule: `CosineWarmup` with the arguments below.
# Children are indented under `lr_scheduler` so they no longer collide with
# other sections' keys at the top level.
lr_scheduler:
  name: CosineWarmup
  learning_rate: 0.003
  T_max: 93835
  warmup_steps: 10000
  # presumably the warmup ramps from start_lr to end_lr over warmup_steps —
  # confirm against the scheduler; end_lr equals learning_rate here.
  start_lr: 0.00003
  end_lr: 0.003
# Optimizer: `AdamW` with its hyperparameters and a gradient-clipping
# sub-section.
# NOTE(review): `grad_clip` is placed under `optimizer` based on key order in
# a flattened copy — confirm against the consumer's schema.
optimizer:
  name: AdamW
  beta1: 0.9
  beta2: 0.999
  weight_decay: 0.3
  grad_clip:
    name: global_norm
    value: 1.0
# Logging: a `LogHook` entry with an `interval` of 10.
# presumably the interval is counted in training iterations — confirm
log_config:
  name: LogHook
  interval: 10