diff --git a/examples/accelerate/fsdp_config.yaml b/examples/accelerate/fsdp_config.yaml index cd65e074..6fb09a95 100644 --- a/examples/accelerate/fsdp_config.yaml +++ b/examples/accelerate/fsdp_config.yaml @@ -14,7 +14,7 @@ fsdp_config: fsdp_use_orig_params: true machine_rank: 0 main_training_function: main -mixed_precision: fp16 # or bf16 +mixed_precision: bf16 # or fp16 num_machines: 1 # the number of nodes num_processes: 2 # the number of GPUs in all nodes rdzv_backend: static diff --git a/examples/deepspeed/ds_z0_config.json b/examples/deepspeed/ds_z0_config.json index 46c5ea47..8ac99181 100644 --- a/examples/deepspeed/ds_z0_config.json +++ b/examples/deepspeed/ds_z0_config.json @@ -19,7 +19,7 @@ "stage": 0, "allgather_partitions": true, "allgather_bucket_size": 5e8, - "overlap_comm": true, + "overlap_comm": false, "reduce_scatter": true, "reduce_bucket_size": 5e8, "contiguous_gradients": true, diff --git a/examples/deepspeed/ds_z2_config.json b/examples/deepspeed/ds_z2_config.json index c2ffe80d..c4177e5e 100644 --- a/examples/deepspeed/ds_z2_config.json +++ b/examples/deepspeed/ds_z2_config.json @@ -19,7 +19,7 @@ "stage": 2, "allgather_partitions": true, "allgather_bucket_size": 5e8, - "overlap_comm": true, + "overlap_comm": false, "reduce_scatter": true, "reduce_bucket_size": 5e8, "contiguous_gradients": true, diff --git a/examples/deepspeed/ds_z2_offload_config.json b/examples/deepspeed/ds_z2_offload_config.json index 93f1519a..7550472b 100644 --- a/examples/deepspeed/ds_z2_offload_config.json +++ b/examples/deepspeed/ds_z2_offload_config.json @@ -23,7 +23,7 @@ }, "allgather_partitions": true, "allgather_bucket_size": 5e8, - "overlap_comm": true, + "overlap_comm": false, "reduce_scatter": true, "reduce_bucket_size": 5e8, "contiguous_gradients": true, diff --git a/examples/deepspeed/ds_z3_config.json b/examples/deepspeed/ds_z3_config.json index 6acbe520..46584a76 100644 --- a/examples/deepspeed/ds_z3_config.json +++ b/examples/deepspeed/ds_z3_config.json @@ -17,7 +17,7 @@ }, "zero_optimization": { "stage": 3, - "overlap_comm": true, + "overlap_comm": false, "contiguous_gradients": true, "sub_group_size": 1e9, "reduce_bucket_size": "auto", diff --git a/examples/deepspeed/ds_z3_offload_config.json b/examples/deepspeed/ds_z3_offload_config.json index b92f96a9..0fabebb9 100644 --- a/examples/deepspeed/ds_z3_offload_config.json +++ b/examples/deepspeed/ds_z3_offload_config.json @@ -25,7 +25,7 @@ "device": "cpu", "pin_memory": true }, - "overlap_comm": true, + "overlap_comm": false, "contiguous_gradients": true, "sub_group_size": 1e9, "reduce_bucket_size": "auto",