diff --git a/README.md b/README.md index 1d3366b6..981a273f 100644 --- a/README.md +++ b/README.md @@ -520,7 +520,7 @@ use_cpu: false ```bash deepspeed --num_gpus 8 src/train_bash.py \ --deepspeed ds_config.json \ - --ddp_timeout 180000000 \ # If the training data is too large, it is recommended to add the ddp_timeout command line option to prevent NCCL errors. + --ddp_timeout 180000000 \ ... # arguments (same as above) ``` diff --git a/README_zh.md b/README_zh.md index 594dc651..6affad1e 100644 --- a/README_zh.md +++ b/README_zh.md @@ -519,7 +519,7 @@ use_cpu: false ```bash deepspeed --num_gpus 8 src/train_bash.py \ --deepspeed ds_config.json \ - --ddp_timeout 180000000 \ # 如训练数据过大,建议加上ddp_timeout命令行,防止nccl报错 + --ddp_timeout 180000000 \ ... # 参数同上 ```