diff --git a/projects/rccl/.azuredevops/slurm/test_rccl-tests.sh b/projects/rccl/.azuredevops/slurm/test_rccl-tests.sh index a4509ce5d6..c0c05b0303 100644 --- a/projects/rccl/.azuredevops/slurm/test_rccl-tests.sh +++ b/projects/rccl/.azuredevops/slurm/test_rccl-tests.sh @@ -2,7 +2,7 @@ #SBATCH --job-name=rccl-tests #SBATCH --output=%x-%j.out #SBATCH --error=%x-%j.out -#SBATCH --time=60 +#SBATCH --time=120 #SBATCH --nodes=1 #SBATCH --exclusive #SBATCH --partition=gt @@ -40,7 +40,7 @@ do total=$((n*8)) #h_8ppn=`echo ${hosts_8ppn[@]:0:${n}} | tr ' ' ','` - for coll in all_reduce all_gather reduce_scatter alltoall alltoallv broadcast gather reduce scatter sendrecv + for coll in all_reduce all_reduce_bias all_gather reduce_scatter alltoall alltoallv broadcast gather reduce scatter sendrecv do for dtype in float bfloat16 half fp8_e5m2 do