!10052 set HCCL_CONNECT_TIMEOUT=600 for transformer distribute training

From: @yuchaojie
Reviewed-by: @linqingke,@liangchenghui
Signed-off-by: @linqingke
This commit is contained in:
mindspore-ci-bot 2020-12-16 21:10:32 +08:00 committed by Gitee
commit b2e98083c6
1 changed file with 1 addition and 0 deletions

View File

@@ -28,6 +28,7 @@ cd run_distribute_train || exit
 EPOCH_SIZE=$2
 DATA_PATH=$3
+export HCCL_CONNECT_TIMEOUT=600
 export RANK_TABLE_FILE=$4
 export RANK_SIZE=$1
 export HCCL_FLAG=1