File tree Expand file tree Collapse file tree 11 files changed +11
-11
lines changed Expand file tree Collapse file tree 11 files changed +11
-11
lines changed Original file line number Diff line number Diff line change @@ -40,7 +40,7 @@ log_level: info
4040logging_steps : 5
4141logging_strategy : steps
4242lr_scheduler_type : cosine
43- max_seq_length : 2048
43+ max_length : 2048
4444max_steps : -1
4545num_train_epochs : 1
4646output_dir : data/mistral-7b-sft-constitutional-ai
Original file line number Diff line number Diff line change @@ -40,7 +40,7 @@ log_level: info
4040logging_steps : 5
4141logging_strategy : steps
4242lr_scheduler_type : cosine
43- max_seq_length : 2048
43+ max_length : 2048
4444max_steps : -1
4545num_train_epochs : 1
4646output_dir : data/mistral-7b-sft-constitutional-ai
Original file line number Diff line number Diff line change @@ -90,7 +90,7 @@ log_level: info
9090logging_steps : 5
9191logging_strategy : steps
9292lr_scheduler_type : cosine
93- max_seq_length : 2048
93+ max_length : 2048
9494max_steps : -1
9595num_train_epochs : 1
9696output_dir : data/smollm-360M-instruct-new
Original file line number Diff line number Diff line change @@ -27,7 +27,7 @@ log_level: info
2727logging_steps : 5
2828logging_strategy : steps
2929lr_scheduler_type : cosine
30- max_seq_length : 8192
30+ max_length : 8192
3131max_steps : -1
3232num_train_epochs : 2
3333output_dir : data/smollm2-1.7B-sft
Original file line number Diff line number Diff line change @@ -26,7 +26,7 @@ log_level: info
2626logging_steps : 5
2727logging_strategy : steps
2828lr_scheduler_type : cosine
29- max_seq_length : 8192
29+ max_length : 8192
3030max_steps : -1
3131num_train_epochs : 2
3232output_dir : data/smollm2-360M-sft
Original file line number Diff line number Diff line change @@ -87,7 +87,7 @@ log_level: info
8787logging_steps : 5
8888logging_strategy : steps
8989lr_scheduler_type : cosine
90- max_seq_length : 2048
90+ max_length : 2048
9191max_steps : -1
9292num_train_epochs : 3
9393output_dir : data/starchat2-15b-v0.1
Original file line number Diff line number Diff line change @@ -39,7 +39,7 @@ log_level: info
3939logging_steps : 5
4040logging_strategy : steps
4141lr_scheduler_type : cosine
42- max_seq_length : 2048
42+ max_length : 2048
4343max_steps : -1
4444num_train_epochs : 1
4545output_dir : data/zephyr-7b-sft-full
Original file line number Diff line number Diff line change @@ -54,7 +54,7 @@ log_level: info
5454logging_steps : 5
5555logging_strategy : steps
5656lr_scheduler_type : cosine
57- max_seq_length : 2048
57+ max_length : 2048
5858max_steps : -1
5959num_train_epochs : 1
6060output_dir : data/zephyr-7b-sft-qlora
Original file line number Diff line number Diff line change @@ -42,7 +42,7 @@ log_level: info
4242logging_steps : 5
4343logging_strategy : steps
4444lr_scheduler_type : cosine
45- max_seq_length : 2048
45+ max_length : 2048
4646max_steps : -1
4747num_train_epochs : 3
4848output_dir : data/zephyr-7b-gemma-sft
Original file line number Diff line number Diff line change 2424 --learning_rate 2.0e-5 \
2525 --num_train_epochs 1 \
2626 --packing \
27- --max_seq_length 4096 \
27+ --max_length 4096 \
2828 --per_device_train_batch_size 2 \
2929 --gradient_accumulation_steps 8 \
3030 --gradient_checkpointing \
You can’t perform that action at this time.
0 commit comments