fix: modify parameters in pretrain_dragonfly

This commit is contained in:
wql 2024-08-07 16:00:45 +08:00
parent a62a188fd5
commit db532ca4b1
1 changed files with 2 additions and 2 deletions

View File

@@ -219,10 +219,10 @@ else
fi
# Launch settings interpolated into the torchrun command string (CMD) below.
# NOTE(review): GPUS_PER_NODE is assigned twice in a row; if both lines run,
# the later value (2) is the one CMD picks up. This looks like the old/new
# sides of a diff rendered without +/- markers -- confirm which line to keep.
GPUS_PER_NODE=1
GPUS_PER_NODE=2
NNODES=1
RANK=0
# NOTE(review): MASTER_ENDPOINT is likewise assigned twice; "ubuntu" overrides
# "g3006" when both lines run -- confirm which host is intended.
MASTER_ENDPOINT=g3006
MASTER_ENDPOINT=ubuntu
MASTER_PORT=23456
# Alternative launch line, left commented out: passes the endpoint through
# separate --master_addr / --master_port flags.
#CMD="torchrun --nnodes=${NNODES} --nproc_per_node=${GPUS_PER_NODE} --node_rank=${RANK} --master_addr=${MASTER_ENDPOINT} --master_port=${MASTER_PORT} ${PRETRAIN_ENTRY} ${OPTS}"
# Active launch line: passes the same host and port as one host:port value via
# --rdzv_endpoint, with --rdzv_backend=c10d and a fixed --rdzv_id=1.
# PRETRAIN_ENTRY and OPTS are not defined in this fragment; presumably they are
# set earlier in the script -- verify. CMD is only assembled here, not executed.
CMD="torchrun --nnodes=${NNODES} --nproc_per_node=${GPUS_PER_NODE} --node_rank=${RANK} --rdzv_id=1 --rdzv_backend=c10d --rdzv_endpoint=${MASTER_ENDPOINT}:${MASTER_PORT} ${PRETRAIN_ENTRY} ${OPTS}"