We read every piece of feedback, and take your input very seriously.
To see all available qualifiers, see our documentation.
There was an error while loading. Please reload this page.
1 parent 5a2acc9 commit 67bdbd3 Copy full SHA for 67bdbd3
configs/sft.yaml
@@ -0,0 +1,29 @@
---
# configs/sft.yaml -- launcher configuration (29 settings), reconstructed from
# the added lines of the commit diff with the diff gutter numbers and `+`
# markers removed so the content parses as YAML again.
# NOTE(review): the key set looks like a Hugging Face Accelerate config file
# (`accelerate launch --config_file ...`) -- confirm against the consuming tool.

command_file: null
commands: null
compute_environment: LOCAL_MACHINE

# DeepSpeed settings; `distributed_type` below is set to DEEPSPEED to match.
deepspeed_config:
  gradient_accumulation_steps: 1
  gradient_clipping: 1.0
  # Both offload targets are the plain string `none` (not YAML null).
  offload_optimizer_device: none
  offload_param_device: none
  # NOTE(review): the zero3_* flags presumably only apply because
  # zero_stage is 3 -- verify before changing the stage.
  zero3_init_flag: true
  zero3_save_16bit_model: true
  zero_stage: 3
distributed_type: DEEPSPEED

# Quoted on purpose: unquoted `no` / `NO` would be read as boolean false by
# YAML 1.1 parsers instead of the strings the keys carry here.
downcast_bf16: 'no'
dynamo_backend: 'NO'

fsdp_config: {}
gpu_ids: null
machine_rank: 0
main_process_ip: null
main_process_port: null
main_training_function: main
megatron_lm_config: {}
mixed_precision: fp16

# Single machine, eight processes.
# NOTE(review): presumably one process per GPU on an 8-GPU host -- confirm.
num_machines: 1
num_processes: 8
rdzv_backend: static
same_network: true

tpu_name: null
tpu_zone: null
use_cpu: false
0 commit comments