diff --git a/batch_run.sh b/batch_run.sh index e74a46fe..aa154997 100644 --- a/batch_run.sh +++ b/batch_run.sh @@ -4,24 +4,33 @@ repeat_cnt=$1 +export HCCL_CONNECT_TIMEOUT=300 + for ((i=0; i