-
Notifications
You must be signed in to change notification settings - Fork 10
/
Copy pathtrain-original.sh
41 lines (33 loc) · 978 Bytes
/
train-original.sh
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
# The original configurations described in the paper are used.
# See Table A.1 in Appendix A.
# Launch train.py (via `poetry run python`) for bert-base-uncased.
# The options passed are fixed: --batch_size 64, --lr 3e-5, and
# --output_dir ./outputs/bert-base-uncased.
# Arguments: none (anything passed to this function is ignored).
# Returns:   the exit status of the `poetry run` command.
function bert-base-uncased() {
  local -a train_opts=(
    --model_name bert-base-uncased
    --batch_size 64
    --lr 3e-5
    --output_dir ./outputs/bert-base-uncased
  )
  poetry run python train.py "${train_opts[@]}"
}
# Launch train.py (via `poetry run python`) for bert-large-uncased.
# The options passed are fixed: --batch_size 64, --lr 1e-5, and
# --output_dir ./outputs/bert-large-uncased.
# Arguments: none (anything passed to this function is ignored).
# Returns:   the exit status of the `poetry run` command.
function bert-large-uncased() {
  local -a train_opts=(
    --model_name bert-large-uncased
    --batch_size 64
    --lr 1e-5
    --output_dir ./outputs/bert-large-uncased
  )
  poetry run python train.py "${train_opts[@]}"
}
# Launch train.py (via `poetry run python`) for roberta-base.
# The options passed are fixed: --batch_size 512, --lr 1e-5, and
# --output_dir ./outputs/roberta-base.
# Arguments: none (anything passed to this function is ignored).
# Returns:   the exit status of the `poetry run` command.
function roberta-base() {
  local -a train_opts=(
    --model_name roberta-base
    --batch_size 512
    --lr 1e-5
    --output_dir ./outputs/roberta-base
  )
  poetry run python train.py "${train_opts[@]}"
}
# Launch train.py (via `poetry run python`) for roberta-large.
# The options passed are fixed: --batch_size 512, --lr 3e-5, and
# --output_dir ./outputs/roberta-large.
# Arguments: none (anything passed to this function is ignored).
# Returns:   the exit status of the `poetry run` command.
function roberta-large() {
  local -a train_opts=(
    --model_name roberta-large
    --batch_size 512
    --lr 3e-5
    --output_dir ./outputs/roberta-large
  )
  poetry run python train.py "${train_opts[@]}"
}
# Run training!
# The model to train is selected by the optional first command-line argument,
# which must be the name of one of the functions defined above. With no
# argument the script trains bert-base-uncased, exactly as before, so editing
# this file is no longer needed to switch models.
#   Usage: bash <this-script> [bert-base-uncased|bert-large-uncased|roberta-base|roberta-large]
# Exit status: that of the selected training function, or 2 for an unknown name.
model="${1:-bert-base-uncased}"
case "${model}" in
  bert-base-uncased | bert-large-uncased | roberta-base | roberta-large)
    # The model name doubles as the function name, so call it directly.
    "${model}"
    ;;
  *)
    printf 'unknown model: %s\n' "${model}" >&2
    printf 'choose one of: bert-base-uncased bert-large-uncased roberta-base roberta-large\n' >&2
    exit 2
    ;;
esac