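Updated driver.sh and tester.hpp to use sequential numbering for test identification (the TestType enum values in tester.hpp were renumbered, and the matching `-a` arguments in driver.sh were updated accordingly)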
* Enabled Ping Pong tests
* Removed test commands for multi-workgroup collective tests
[ROCm/rocshmem commit: 23172c9150]
This commit is contained in:
@@ -59,76 +59,76 @@ case $2 in
|
||||
ROCSHMEM_MAX_NUM_CONTEXTS=1 mpirun -np 2 $1 -w 1 -z 1 -s 1048576 -a 3 > $3/putnbi_n2_w1_z1_1MB.log
|
||||
check putnbi_n2_w1_z1_1MB
|
||||
echo "wg_get_n2_w1_z1_1MB"
|
||||
ROCSHMEM_MAX_NUM_CONTEXTS=1 mpirun -np 2 $1 -w 1 -z 64 -s 1048576 -a 28 > $3/wg_get_n2_w1_z64_1MB.log
|
||||
ROCSHMEM_MAX_NUM_CONTEXTS=1 mpirun -np 2 $1 -w 1 -z 64 -s 1048576 -a 25 > $3/wg_get_n2_w1_z64_1MB.log
|
||||
check wg_get_n2_w1_z1_1MB
|
||||
echo "wg_getnbi_n2_w1_z1_1MB"
|
||||
ROCSHMEM_MAX_NUM_CONTEXTS=1 mpirun -np 2 $1 -w 1 -z 64 -s 1048576 -a 29 > $3/wg_getnbi_n2_w1_z64_1MB.log
|
||||
ROCSHMEM_MAX_NUM_CONTEXTS=1 mpirun -np 2 $1 -w 1 -z 64 -s 1048576 -a 26 > $3/wg_getnbi_n2_w1_z64_1MB.log
|
||||
check wg_getnbi_n2_w1_z1_1MB
|
||||
echo "wg_put_n2_w1_z1_1MB"
|
||||
ROCSHMEM_MAX_NUM_CONTEXTS=1 mpirun -np 2 $1 -w 1 -z 64 -s 1048576 -a 30 > $3/wg_put_n2_w1_z64_1MB.log
|
||||
ROCSHMEM_MAX_NUM_CONTEXTS=1 mpirun -np 2 $1 -w 1 -z 64 -s 1048576 -a 27 > $3/wg_put_n2_w1_z64_1MB.log
|
||||
check wg_put_n2_w1_z1_1MB
|
||||
echo "wg_putnbi_n2_w1_z1_1MB"
|
||||
ROCSHMEM_MAX_NUM_CONTEXTS=1 mpirun -np 2 $1 -w 1 -z 64 -s 1048576 -a 31 > $3/wg_putnbi_n2_w1_z64_1MB.log
|
||||
ROCSHMEM_MAX_NUM_CONTEXTS=1 mpirun -np 2 $1 -w 1 -z 64 -s 1048576 -a 28 > $3/wg_putnbi_n2_w1_z64_1MB.log
|
||||
check wg_putnbi_n2_w1_z1_1MB
|
||||
echo "wg_get_tiled_n2_w1_z1_1MB"
|
||||
ROCSHMEM_MAX_NUM_CONTEXTS=2 mpirun -np 2 $1 -w 2 -z 64 -s 1048576 -a 28 > $3/wg_get_tiled_n2_w2_z64_1MB.log
|
||||
ROCSHMEM_MAX_NUM_CONTEXTS=2 mpirun -np 2 $1 -w 2 -z 64 -s 1048576 -a 25 > $3/wg_get_tiled_n2_w2_z64_1MB.log
|
||||
check wg_get_tiled_n2_w1_z1_1MB
|
||||
echo "wg_getnbi_tiled_n2_w1_z1_1MB"
|
||||
ROCSHMEM_MAX_NUM_CONTEXTS=2 mpirun -np 2 $1 -w 2 -z 64 -s 1048576 -a 29 > $3/wg_getnbi_tiled_n2_w2_z64_1MB.log
|
||||
ROCSHMEM_MAX_NUM_CONTEXTS=2 mpirun -np 2 $1 -w 2 -z 64 -s 1048576 -a 26 > $3/wg_getnbi_tiled_n2_w2_z64_1MB.log
|
||||
check wg_getnbi_tiled_n2_w1_z1_1MB
|
||||
echo "wg_put_tiled_n2_w1_z1_1MB"
|
||||
ROCSHMEM_MAX_NUM_CONTEXTS=2 mpirun -np 2 $1 -w 2 -z 64 -s 1048576 -a 30 > $3/wg_put_tiled_n2_w2_z64_1MB.log
|
||||
ROCSHMEM_MAX_NUM_CONTEXTS=2 mpirun -np 2 $1 -w 2 -z 64 -s 1048576 -a 27 > $3/wg_put_tiled_n2_w2_z64_1MB.log
|
||||
check wg_put_tiled_n2_w1_z1_1MB
|
||||
echo "wg_putnbi_tiled_n2_w1_z1_1MB"
|
||||
ROCSHMEM_MAX_NUM_CONTEXTS=2 mpirun -np 2 $1 -w 2 -z 64 -s 1048576 -a 31 > $3/wg_putnbi_tiled_n2_w2_z64_1MB.log
|
||||
ROCSHMEM_MAX_NUM_CONTEXTS=2 mpirun -np 2 $1 -w 2 -z 64 -s 1048576 -a 28 > $3/wg_putnbi_tiled_n2_w2_z64_1MB.log
|
||||
check wg_putnbi_tiled_n2_w1_z1_1MB
|
||||
echo "wave_get_n2_w1_z1_1MB"
|
||||
ROCSHMEM_MAX_NUM_CONTEXTS=1 mpirun -np 2 $1 -w 1 -z 64 -s 1048576 -a 32 > $3/wave_get_n2_w1_z64_1MB.log
|
||||
ROCSHMEM_MAX_NUM_CONTEXTS=1 mpirun -np 2 $1 -w 1 -z 64 -s 1048576 -a 29 > $3/wave_get_n2_w1_z64_1MB.log
|
||||
check wave_get_n2_w1_z1_1MB
|
||||
echo "wave_getnbi_n2_w1_z1_1MB"
|
||||
ROCSHMEM_MAX_NUM_CONTEXTS=1 mpirun -np 2 $1 -w 1 -z 64 -s 1048576 -a 33 > $3/wave_getnbi_n2_w1_z64_1MB.log
|
||||
ROCSHMEM_MAX_NUM_CONTEXTS=1 mpirun -np 2 $1 -w 1 -z 64 -s 1048576 -a 30 > $3/wave_getnbi_n2_w1_z64_1MB.log
|
||||
check wave_getnbi_n2_w1_z1_1MB
|
||||
echo "wave_put_n2_w1_z1_1MB"
|
||||
ROCSHMEM_MAX_NUM_CONTEXTS=1 mpirun -np 2 $1 -w 1 -z 64 -s 1048576 -a 34 > $3/wave_put_n2_w1_z64_1MB.log
|
||||
ROCSHMEM_MAX_NUM_CONTEXTS=1 mpirun -np 2 $1 -w 1 -z 64 -s 1048576 -a 31 > $3/wave_put_n2_w1_z64_1MB.log
|
||||
check wave_put_n2_w1_z1_1MB
|
||||
echo "wave_putnbi_n2_w1_z1_1MB"
|
||||
ROCSHMEM_MAX_NUM_CONTEXTS=1 mpirun -np 2 $1 -w 1 -z 64 -s 1048576 -a 35 > $3/wave_putnbi_n2_w1_z64_1MB.log
|
||||
ROCSHMEM_MAX_NUM_CONTEXTS=1 mpirun -np 2 $1 -w 1 -z 64 -s 1048576 -a 32 > $3/wave_putnbi_n2_w1_z64_1MB.log
|
||||
check wave_putnbi_n2_w1_z1_1MB
|
||||
echo "wave_get_tiled_n2_w1_z1_1MB"
|
||||
ROCSHMEM_MAX_NUM_CONTEXTS=2 mpirun -np 2 $1 -w 2 -z 128 -s 1048576 -a 32 > $3/wave_get_tiled_n2_w2_z128_1MB.log
|
||||
ROCSHMEM_MAX_NUM_CONTEXTS=2 mpirun -np 2 $1 -w 2 -z 128 -s 1048576 -a 29 > $3/wave_get_tiled_n2_w2_z128_1MB.log
|
||||
check wave_get_tiled_n2_w1_z1_1MB
|
||||
echo "wave_getnbi_tiled_n2_w1_z1_1MB"
|
||||
ROCSHMEM_MAX_NUM_CONTEXTS=2 mpirun -np 2 $1 -w 2 -z 128 -s 1048576 -a 33 > $3/wave_getnbi_tiled_n2_w2_z128_1MB.log
|
||||
ROCSHMEM_MAX_NUM_CONTEXTS=2 mpirun -np 2 $1 -w 2 -z 128 -s 1048576 -a 30 > $3/wave_getnbi_tiled_n2_w2_z128_1MB.log
|
||||
check wave_getnbi_tiled_n2_w1_z1_1MB
|
||||
echo "wave_put_tiled_n2_w1_z1_1MB"
|
||||
ROCSHMEM_MAX_NUM_CONTEXTS=2 mpirun -np 2 $1 -w 2 -z 128 -s 1048576 -a 34 > $3/wave_put_tiled_n2_w2_z128_1MB.log
|
||||
ROCSHMEM_MAX_NUM_CONTEXTS=2 mpirun -np 2 $1 -w 2 -z 128 -s 1048576 -a 31 > $3/wave_put_tiled_n2_w2_z128_1MB.log
|
||||
check wave_put_tiled_n2_w1_z1_1MB
|
||||
echo "wave_putnbi_tiled_n2_w1_z1_1MB"
|
||||
ROCSHMEM_MAX_NUM_CONTEXTS=2 mpirun -np 2 $1 -w 2 -z 128 -s 1048576 -a 35 > $3/wave_putnbi_tiled_n2_w2_z128_1MB.log
|
||||
ROCSHMEM_MAX_NUM_CONTEXTS=2 mpirun -np 2 $1 -w 2 -z 128 -s 1048576 -a 32 > $3/wave_putnbi_tiled_n2_w2_z128_1MB.log
|
||||
check wave_putnbi_tiled_n2_w1_z1_1MB
|
||||
echo "amofadd_n2_w1_z1"
|
||||
ROCSHMEM_MAX_NUM_CONTEXTS=1 mpirun -np 2 $1 -w 1 -z 1 -a 6 > $3/amofadd_n2_w1_z1.log
|
||||
ROCSHMEM_MAX_NUM_CONTEXTS=1 mpirun -np 2 $1 -w 1 -z 1 -a 5 > $3/amofadd_n2_w1_z1.log
|
||||
check amofadd_n2_w1_z1
|
||||
echo "amofinc_n2_w1_z1"
|
||||
ROCSHMEM_MAX_NUM_CONTEXTS=1 mpirun -np 2 $1 -w 1 -z 1 -a 7 > $3/amofinc_n2_w1_z1.log
|
||||
ROCSHMEM_MAX_NUM_CONTEXTS=1 mpirun -np 2 $1 -w 1 -z 1 -a 6 > $3/amofinc_n2_w1_z1.log
|
||||
check amofinc_n2_w1_z1
|
||||
echo "amofetch_n2_w1_z1"
|
||||
ROCSHMEM_MAX_NUM_CONTEXTS=1 mpirun -np 2 $1 -w 1 -z 1 -a 8 > $3/amofetch_n2_w1_z1.log
|
||||
ROCSHMEM_MAX_NUM_CONTEXTS=1 mpirun -np 2 $1 -w 1 -z 1 -a 7 > $3/amofetch_n2_w1_z1.log
|
||||
check amofetch_n2_w1_z1
|
||||
echo "amofcswap_n2_w1_z1"
|
||||
ROCSHMEM_MAX_NUM_CONTEXTS=1 mpirun -np 2 $1 -w 1 -z 1 -a 9 > $3/amofcswap_n2_w1_z1.log
|
||||
ROCSHMEM_MAX_NUM_CONTEXTS=1 mpirun -np 2 $1 -w 1 -z 1 -a 8 > $3/amofcswap_n2_w1_z1.log
|
||||
check amofcswap_n2_w1_z1
|
||||
echo "amoadd_n2_w1_z1"
|
||||
ROCSHMEM_MAX_NUM_CONTEXTS=1 mpirun -np 2 $1 -w 1 -z 1 -a 10 > $3/amoadd_n2_w1_z1.log
|
||||
ROCSHMEM_MAX_NUM_CONTEXTS=1 mpirun -np 2 $1 -w 1 -z 1 -a 9 > $3/amoadd_n2_w1_z1.log
|
||||
check amoadd_n2_w1_z1
|
||||
echo "amoinc_n2_w1_z1"
|
||||
ROCSHMEM_MAX_NUM_CONTEXTS=1 mpirun -np 2 $1 -w 1 -z 1 -a 11 > $3/amoinc_n2_w1_z1.log
|
||||
ROCSHMEM_MAX_NUM_CONTEXTS=1 mpirun -np 2 $1 -w 1 -z 1 -a 10 > $3/amoinc_n2_w1_z1.log
|
||||
check amoinc_n2_w1_z1
|
||||
# echo "pingpong_n2_w1"
|
||||
# ROCSHMEM_MAX_NUM_CONTEXTS=1 mpirun -np 2 $1 -w 1 -a 14 > $3/pingpong_n2_w1.log
|
||||
# check pingpong_n2_w1
|
||||
echo "pingpong_n2_w1"
|
||||
ROCSHMEM_MAX_NUM_CONTEXTS=1 mpirun -np 2 $1 -w 1 -a 13 > $3/pingpong_n2_w1.log
|
||||
check pingpong_n2_w1
|
||||
echo "amoset_n2_w1_z1"
|
||||
ROCSHMEM_MAX_NUM_CONTEXTS=1 mpirun -np 2 $1 -w 1 -z 1 -a 44 > $3/amoset_n2_w1_z1.log
|
||||
ROCSHMEM_MAX_NUM_CONTEXTS=1 mpirun -np 2 $1 -w 1 -z 1 -a 41 > $3/amoset_n2_w1_z1.log
|
||||
check amoset_n2_w1_z1
|
||||
;;
|
||||
|
||||
@@ -149,103 +149,103 @@ case $2 in
|
||||
ROCSHMEM_MAX_NUM_CONTEXTS=16 mpirun -np 2 $1 -w 16 -z 128 -s 8 -a 3 > $3/putnbi_n2_w16_z128_8B.log
|
||||
check putnbi_n2_w16_z128_8B
|
||||
echo "wg_get_n2_w1_z64_8B"
|
||||
ROCSHMEM_MAX_NUM_CONTEXTS=1 mpirun -np 2 $1 -w 1 -z 64 -s 8 -a 28 > $3/wg_get_n2_w1_z64_8B.log
|
||||
ROCSHMEM_MAX_NUM_CONTEXTS=1 mpirun -np 2 $1 -w 1 -z 64 -s 8 -a 25 > $3/wg_get_n2_w1_z64_8B.log
|
||||
check wg_get_n2_w1_z64_8B
|
||||
echo "wg_getnbi_n2_w1_z64_8B"
|
||||
ROCSHMEM_MAX_NUM_CONTEXTS=1 mpirun -np 2 $1 -w 1 -z 64 -s 8 -a 29 > $3/wg_getnbi_n2_w1_z64_8B.log
|
||||
ROCSHMEM_MAX_NUM_CONTEXTS=1 mpirun -np 2 $1 -w 1 -z 64 -s 8 -a 26 > $3/wg_getnbi_n2_w1_z64_8B.log
|
||||
check wg_getnbi_n2_w1_z64_8B
|
||||
echo "wg_put_n2_w1_z64_8B"
|
||||
ROCSHMEM_MAX_NUM_CONTEXTS=1 mpirun -np 2 $1 -w 1 -z 64 -s 8 -a 30 > $3/wg_put_n2_w1_z64_8B.log
|
||||
ROCSHMEM_MAX_NUM_CONTEXTS=1 mpirun -np 2 $1 -w 1 -z 64 -s 8 -a 27 > $3/wg_put_n2_w1_z64_8B.log
|
||||
check wg_put_n2_w1_z64_8B
|
||||
echo "wg_putnbi_n2_w1_z64_8B"
|
||||
ROCSHMEM_MAX_NUM_CONTEXTS=1 mpirun -np 2 $1 -w 1 -z 64 -s 8 -a 31 > $3/wg_putnbi_n2_w1_z64_8B.log
|
||||
ROCSHMEM_MAX_NUM_CONTEXTS=1 mpirun -np 2 $1 -w 1 -z 64 -s 8 -a 28 > $3/wg_putnbi_n2_w1_z64_8B.log
|
||||
check wg_putnbi_n2_w1_z64_8B
|
||||
echo "wg_get_tiled_n2_w16_z64_8B"
|
||||
ROCSHMEM_MAX_NUM_CONTEXTS=16 mpirun -np 2 $1 -w 16 -z 64 -s 8 -a 28 > $3/wg_get_tiled_n2_w16_z64_8B.log
|
||||
ROCSHMEM_MAX_NUM_CONTEXTS=16 mpirun -np 2 $1 -w 16 -z 64 -s 8 -a 25 > $3/wg_get_tiled_n2_w16_z64_8B.log
|
||||
check wg_get_tiled_n2_w16_z64_8B
|
||||
echo "wg_getnbi_tiled_n2_w16_z64_8B"
|
||||
ROCSHMEM_MAX_NUM_CONTEXTS=16 mpirun -np 2 $1 -w 16 -z 64 -s 8 -a 29 > $3/wg_getnbi_tiled_n2_w16_z64_8B.log
|
||||
ROCSHMEM_MAX_NUM_CONTEXTS=16 mpirun -np 2 $1 -w 16 -z 64 -s 8 -a 26 > $3/wg_getnbi_tiled_n2_w16_z64_8B.log
|
||||
check wg_getnbi_tiled_n2_w16_z64_8B
|
||||
echo "wg_put_tiled_n2_w16_z64_8B"
|
||||
ROCSHMEM_MAX_NUM_CONTEXTS=16 mpirun -np 2 $1 -w 16 -z 64 -s 8 -a 30 > $3/wg_put_tiled_n2_w16_z64_8B.log
|
||||
ROCSHMEM_MAX_NUM_CONTEXTS=16 mpirun -np 2 $1 -w 16 -z 64 -s 8 -a 27 > $3/wg_put_tiled_n2_w16_z64_8B.log
|
||||
check wg_put_tiled_n2_w16_z64_8B
|
||||
echo "wg_putnbi_tiled_n2_w16_z64_8B"
|
||||
ROCSHMEM_MAX_NUM_CONTEXTS=16 mpirun -np 2 $1 -w 16 -z 64 -s 8 -a 31 > $3/wg_putnbi_tiled_n2_w16_z64_8B.log
|
||||
ROCSHMEM_MAX_NUM_CONTEXTS=16 mpirun -np 2 $1 -w 16 -z 64 -s 8 -a 28 > $3/wg_putnbi_tiled_n2_w16_z64_8B.log
|
||||
check wg_putnbi_tiled_n2_w16_z64_8B
|
||||
echo "wave_get_n2_w1_z64_8B"
|
||||
ROCSHMEM_MAX_NUM_CONTEXTS=1 mpirun -np 2 $1 -w 1 -z 64 -s 8 -a 32 > $3/wave_get_n2_w1_z64_8B.log
|
||||
ROCSHMEM_MAX_NUM_CONTEXTS=1 mpirun -np 2 $1 -w 1 -z 64 -s 8 -a 29 > $3/wave_get_n2_w1_z64_8B.log
|
||||
check wave_get_n2_w1_z64_8B
|
||||
echo "wave_getnbi_n2_w1_z64_8B"
|
||||
ROCSHMEM_MAX_NUM_CONTEXTS=1 mpirun -np 2 $1 -w 1 -z 64 -s 8 -a 33 > $3/wave_getnbi_n2_w1_z64_8B.log
|
||||
ROCSHMEM_MAX_NUM_CONTEXTS=1 mpirun -np 2 $1 -w 1 -z 64 -s 8 -a 30 > $3/wave_getnbi_n2_w1_z64_8B.log
|
||||
check wave_getnbi_n2_w1_z64_8B
|
||||
echo "wave_put_n2_w1_z64_8B"
|
||||
ROCSHMEM_MAX_NUM_CONTEXTS=1 mpirun -np 2 $1 -w 1 -z 64 -s 8 -a 34 > $3/wave_put_n2_w1_z64_8B.log
|
||||
ROCSHMEM_MAX_NUM_CONTEXTS=1 mpirun -np 2 $1 -w 1 -z 64 -s 8 -a 31 > $3/wave_put_n2_w1_z64_8B.log
|
||||
check wave_put_n2_w1_z64_8B
|
||||
echo "wave_putnbi_n2_w1_z64_8B"
|
||||
ROCSHMEM_MAX_NUM_CONTEXTS=1 mpirun -np 2 $1 -w 1 -z 64 -s 8 -a 35 > $3/wave_putnbi_n2_w1_z64_8B.log
|
||||
ROCSHMEM_MAX_NUM_CONTEXTS=1 mpirun -np 2 $1 -w 1 -z 64 -s 8 -a 32 > $3/wave_putnbi_n2_w1_z64_8B.log
|
||||
check wave_putnbi_n2_w1_z64_8B
|
||||
echo "wave_get_tiled_n2_w16_z128_8B"
|
||||
ROCSHMEM_MAX_NUM_CONTEXTS=16 mpirun -np 2 $1 -w 16 -z 128 -s 8 -a 32 > $3/wave_get_tiled_n2_w16_z128_8B.log
|
||||
ROCSHMEM_MAX_NUM_CONTEXTS=16 mpirun -np 2 $1 -w 16 -z 128 -s 8 -a 29 > $3/wave_get_tiled_n2_w16_z128_8B.log
|
||||
check wave_get_tiled_n2_w16_z128_8B
|
||||
echo "wave_getnbi_tiled_n2_w16_z128_8B"
|
||||
ROCSHMEM_MAX_NUM_CONTEXTS=16 mpirun -np 2 $1 -w 16 -z 128 -s 8 -a 33 > $3/wave_getnbi_tiled_n2_w16_z128_8B.log
|
||||
ROCSHMEM_MAX_NUM_CONTEXTS=16 mpirun -np 2 $1 -w 16 -z 128 -s 8 -a 30 > $3/wave_getnbi_tiled_n2_w16_z128_8B.log
|
||||
check wave_getnbi_tiled_n2_w16_z128_8B
|
||||
echo "wave_put_tiled_n2_w16_z128_8B"
|
||||
ROCSHMEM_MAX_NUM_CONTEXTS=16 mpirun -np 2 $1 -w 16 -z 128 -s 8 -a 34 > $3/wave_put_tiled_n2_w16_z128_8B.log
|
||||
ROCSHMEM_MAX_NUM_CONTEXTS=16 mpirun -np 2 $1 -w 16 -z 128 -s 8 -a 31 > $3/wave_put_tiled_n2_w16_z128_8B.log
|
||||
check wave_put_tiled_n2_w16_z128_8B
|
||||
echo "wave_putnbi_tiled_n2_w16_z128_8B"
|
||||
ROCSHMEM_MAX_NUM_CONTEXTS=16 mpirun -np 2 $1 -w 16 -z 128 -s 8 -a 35 > $3/wave_putnbi_tiled_n2_w16_z128_8B.log
|
||||
ROCSHMEM_MAX_NUM_CONTEXTS=16 mpirun -np 2 $1 -w 16 -z 128 -s 8 -a 32 > $3/wave_putnbi_tiled_n2_w16_z128_8B.log
|
||||
check wave_putnbi_tiled_n2_w16_z128_8B
|
||||
echo "amofadd_n2_w8_z1"
|
||||
ROCSHMEM_MAX_NUM_CONTEXTS=8 mpirun -np 2 $1 -w 8 -z 1 -a 6 > $3/amofadd_n2_w8_z1.log
|
||||
ROCSHMEM_MAX_NUM_CONTEXTS=8 mpirun -np 2 $1 -w 8 -z 1 -a 5 > $3/amofadd_n2_w8_z1.log
|
||||
check amofadd_n2_w8_z1
|
||||
echo "amofinc_n2_w8_z1"
|
||||
ROCSHMEM_MAX_NUM_CONTEXTS=8 mpirun -np 2 $1 -w 8 -z 1 -a 7 > $3/amofinc_n2_w8_z1.log
|
||||
ROCSHMEM_MAX_NUM_CONTEXTS=8 mpirun -np 2 $1 -w 8 -z 1 -a 6 > $3/amofinc_n2_w8_z1.log
|
||||
check amofinc_n2_w8_z1
|
||||
echo "amofetch_n2_w8_z1"
|
||||
ROCSHMEM_MAX_NUM_CONTEXTS=8 mpirun -np 2 $1 -w 8 -z 1 -a 8 > $3/amofetch_n2_w8_z1.log
|
||||
ROCSHMEM_MAX_NUM_CONTEXTS=8 mpirun -np 2 $1 -w 8 -z 1 -a 7 > $3/amofetch_n2_w8_z1.log
|
||||
check amofetch_n2_w8_z1
|
||||
echo "amofcswap_n2_w8_z1"
|
||||
ROCSHMEM_MAX_NUM_CONTEXTS=8 mpirun -np 2 $1 -w 8 -z 1 -a 9 > $3/amofcswap_n2_w8_z1.log
|
||||
ROCSHMEM_MAX_NUM_CONTEXTS=8 mpirun -np 2 $1 -w 8 -z 1 -a 8 > $3/amofcswap_n2_w8_z1.log
|
||||
check amofcswap_n2_w8_z1
|
||||
echo "amoadd_n2_w8_z1"
|
||||
ROCSHMEM_MAX_NUM_CONTEXTS=8 mpirun -np 2 $1 -w 8 -z 1 -a 10 > $3/amoadd_n2_w8_z1.log
|
||||
ROCSHMEM_MAX_NUM_CONTEXTS=8 mpirun -np 2 $1 -w 8 -z 1 -a 9 > $3/amoadd_n2_w8_z1.log
|
||||
check amoadd_n2_w8_z1
|
||||
echo "amoinc_n2_w8_z1"
|
||||
ROCSHMEM_MAX_NUM_CONTEXTS=8 mpirun -np 2 $1 -w 8 -z 1 -a 11 > $3/amoinc_n2_w8_z1.log
|
||||
ROCSHMEM_MAX_NUM_CONTEXTS=8 mpirun -np 2 $1 -w 8 -z 1 -a 10 > $3/amoinc_n2_w8_z1.log
|
||||
check amoinc_n2_w8_z1
|
||||
# echo "pingpong_n2_w1"
|
||||
# ROCSHMEM_MAX_NUM_CONTEXTS=1 mpirun -np 2 $1 -w 1 -a 14 > $3/pingpong_n2_w1.log
|
||||
# check pingpong_n2_w1
|
||||
echo "pingpong_n2_w1"
|
||||
ROCSHMEM_MAX_NUM_CONTEXTS=1 mpirun -np 2 $1 -w 1 -a 13 > $3/pingpong_n2_w1.log
|
||||
check pingpong_n2_w1
|
||||
echo "amoset_n2_w8_z1"
|
||||
ROCSHMEM_MAX_NUM_CONTEXTS=8 mpirun -np 2 $1 -w 8 -z 1 -a 44 > $3/amoset_n2_w8_z1.log
|
||||
ROCSHMEM_MAX_NUM_CONTEXTS=8 mpirun -np 2 $1 -w 8 -z 1 -a 41 > $3/amoset_n2_w8_z1.log
|
||||
check amoset_n2_w8_z1
|
||||
echo "putsignal_n2_w1_z1"
|
||||
mpirun -np 2 $1 -w 1 -z 1 -s 1048576 -a 53 > $3/putsignal_n2_w1_z1.log
|
||||
mpirun -np 2 $1 -w 1 -z 1 -s 1048576 -a 50 > $3/putsignal_n2_w1_z1.log
|
||||
check putsignal_n2_w1_z1
|
||||
echo "putsignalwg_n2_w2_z32"
|
||||
ROCSHMEM_MAX_NUM_CONTEXTS=2 mpirun -np 2 $1 -w 2 -z 32 -s 1048576 -a 55 > $3/putsignalwg_n2_w2_z32.log
|
||||
ROCSHMEM_MAX_NUM_CONTEXTS=2 mpirun -np 2 $1 -w 2 -z 32 -s 1048576 -a 52 > $3/putsignalwg_n2_w2_z32.log
|
||||
check putsignalwg_n2_w2_z32
|
||||
echo "putsignalwave_n2_w1_z32"
|
||||
mpirun -np 2 $1 -w 1 -z 32 -s 1048576 -a 55 > $3/putsignalwave_n2_w1_z32.log
|
||||
mpirun -np 2 $1 -w 1 -z 32 -s 1048576 -a 52 > $3/putsignalwave_n2_w1_z32.log
|
||||
check putsignalwave_n2_w1_z32
|
||||
echo "putsignalnbi"
|
||||
mpirun -np 2 $1 -w 1 -z 1 -s 1048576 -a 56 > $3/putsignalnbi_n2_w1_z1.log
|
||||
mpirun -np 2 $1 -w 1 -z 1 -s 1048576 -a 53 > $3/putsignalnbi_n2_w1_z1.log
|
||||
check putsignalnbi_n2_w1_z1
|
||||
echo "putsignalnbiwg"
|
||||
ROCSHMEM_MAX_NUM_CONTEXTS=2 mpirun -np 2 $1 -w 2 -z 32 -s 1048576 -a 57 > $3/putsignalnbiwg_n2_w2_z32.log
|
||||
ROCSHMEM_MAX_NUM_CONTEXTS=2 mpirun -np 2 $1 -w 2 -z 32 -s 1048576 -a 54 > $3/putsignalnbiwg_n2_w2_z32.log
|
||||
check putsignalnbiwg_n2_w2_z32
|
||||
echo "putsignalnbiwave"
|
||||
mpirun -np 2 $1 -w 1 -z 32 -s 1048576 -a 58 > $3/putsignalnbiwave_n2_w1_z32.log
|
||||
mpirun -np 2 $1 -w 1 -z 32 -s 1048576 -a 55 > $3/putsignalnbiwave_n2_w1_z32.log
|
||||
check putsignalnbiwave_n2_w1_z32
|
||||
echo "signalfetch"
|
||||
mpirun -np 2 $1 -w 1 -z 1 -a 59 > $3/signalfetch_n2_w1_z1.log
|
||||
mpirun -np 2 $1 -w 1 -z 1 -a 56 > $3/signalfetch_n2_w1_z1.log
|
||||
check signalfetch_n2_w1_z1
|
||||
echo "signalfetchwg"
|
||||
ROCSHMEM_MAX_NUM_CONTEXTS=2 mpirun -np 2 $1 -w 2 -z 32 -a 60 > $3/signalfetchwg_n2_w2_z32.log
|
||||
ROCSHMEM_MAX_NUM_CONTEXTS=2 mpirun -np 2 $1 -w 2 -z 32 -a 57 > $3/signalfetchwg_n2_w2_z32.log
|
||||
check signalfetchwg_n2_w2_z32
|
||||
echo "signalfetchwave"
|
||||
mpirun -np 2 $1 -w 1 -z 32 -a 60 > $3/signalfetchwave_n2_w2_z32.log
|
||||
mpirun -np 2 $1 -w 1 -z 32 -a 57 > $3/signalfetchwave_n2_w2_z32.log
|
||||
check signalfetchwave_n2_w2_z32
|
||||
;;
|
||||
|
||||
@@ -329,172 +329,132 @@ case $2 in
|
||||
echo "putnbi_n2_w64_z1024_8B"
|
||||
ROCSHMEM_MAX_NUM_CONTEXTS=64 mpirun -np 2 $1 -w 64 -z 1024 -s 8 -a 3 > $3/putnbi_n2_w64_z1024_8B.log
|
||||
check putnbi_n2_w64_z1024_8B
|
||||
############################# REDUCTION ##############################
|
||||
echo "reduction_n2_w1_z1_32K"
|
||||
ROCSHMEM_MAX_NUM_CONTEXTS=1 mpirun -np 2 $1 -w 1 -z 1 -s 32768 -a 5 > $3/reduction_n2_w1_z1_32K.log
|
||||
check reduction_n2_w1_z1_32K
|
||||
echo "reduction_n2_w8_z1_32K"
|
||||
ROCSHMEM_MAX_NUM_CONTEXTS=8 mpirun -np 2 $1 -w 8 -z 1 -s 32768 -a 5 > $3/reduction_n2_w8_z1_32K.log
|
||||
check reduction_n2_w8_z1_32K
|
||||
echo "reduction_n2_w32_z1_32K"
|
||||
ROCSHMEM_MAX_NUM_CONTEXTS=32 mpirun -np 2 $1 -w 32 -z 1 -s 32768 -a 5 > $3/reduction_n2_w32_z1_32K.log
|
||||
check reduction_n2_w32_z1_32K
|
||||
############################## AMOFADD ###############################
|
||||
echo "amofadd_n2_w1_z1"
|
||||
ROCSHMEM_MAX_NUM_CONTEXTS=1 mpirun -np 2 $1 -w 1 -z 1 -a 6 > $3/amofadd_n2_w1_z1.log
|
||||
ROCSHMEM_MAX_NUM_CONTEXTS=1 mpirun -np 2 $1 -w 1 -z 1 -a 5 > $3/amofadd_n2_w1_z1.log
|
||||
check amofadd_n2_w1_z1
|
||||
echo "amofadd_n2_w1_z1024"
|
||||
ROCSHMEM_MAX_NUM_CONTEXTS=1 mpirun -np 2 $1 -w 1 -z 1024 -a 6 > $3/amofadd_n2_w1_z1024.log
|
||||
ROCSHMEM_MAX_NUM_CONTEXTS=1 mpirun -np 2 $1 -w 1 -z 1024 -a 5 > $3/amofadd_n2_w1_z1024.log
|
||||
check amofadd_n2_w1_z1024
|
||||
echo "amofadd_n2_w8_z1"
|
||||
ROCSHMEM_MAX_NUM_CONTEXTS=8 mpirun -np 2 $1 -w 8 -z 1 -a 6 > $3/amofadd_n2_w8_z1.log
|
||||
ROCSHMEM_MAX_NUM_CONTEXTS=8 mpirun -np 2 $1 -w 8 -z 1 -a 5 > $3/amofadd_n2_w8_z1.log
|
||||
check amofadd_n2_w8_z1
|
||||
echo "amofadd_n2_w32_z128"
|
||||
ROCSHMEM_MAX_NUM_CONTEXTS=32 mpirun -np 2 $1 -w 32 -z 128 -a 6 > $3/amofadd_n2_w32_z128.log
|
||||
ROCSHMEM_MAX_NUM_CONTEXTS=32 mpirun -np 2 $1 -w 32 -z 128 -a 5 > $3/amofadd_n2_w32_z128.log
|
||||
check amofadd_n2_w32_z128
|
||||
############################## AMOFINC ###############################
|
||||
echo "amofinc_n2_w1_z1"
|
||||
ROCSHMEM_MAX_NUM_CONTEXTS=1 mpirun -np 2 $1 -w 1 -z 1 -a 7 > $3/amofinc_n2_w1_z1.log
|
||||
ROCSHMEM_MAX_NUM_CONTEXTS=1 mpirun -np 2 $1 -w 1 -z 1 -a 6 > $3/amofinc_n2_w1_z1.log
|
||||
check amofinc_n2_w1_z1
|
||||
echo "amofinc_n2_w1_z1024"
|
||||
ROCSHMEM_MAX_NUM_CONTEXTS=1 mpirun -np 2 $1 -w 1 -z 1024 -a 7 > $3/amofinc_n2_w1_z1024.log
|
||||
ROCSHMEM_MAX_NUM_CONTEXTS=1 mpirun -np 2 $1 -w 1 -z 1024 -a 6 > $3/amofinc_n2_w1_z1024.log
|
||||
check amofinc_n2_w1_z1024
|
||||
echo "amofinc_n2_w8_z1"
|
||||
ROCSHMEM_MAX_NUM_CONTEXTS=8 mpirun -np 2 $1 -w 8 -z 1 -a 7 > $3/amofinc_n2_w8_z1.log
|
||||
ROCSHMEM_MAX_NUM_CONTEXTS=8 mpirun -np 2 $1 -w 8 -z 1 -a 6 > $3/amofinc_n2_w8_z1.log
|
||||
check amofinc_n2_w8_z1
|
||||
echo "amofinc_n2_w32_z128"
|
||||
ROCSHMEM_MAX_NUM_CONTEXTS=32 mpirun -np 2 $1 -w 32 -z 128 -a 7 > $3/amofinc_n2_w32_z128.log
|
||||
ROCSHMEM_MAX_NUM_CONTEXTS=32 mpirun -np 2 $1 -w 32 -z 128 -a 6 > $3/amofinc_n2_w32_z128.log
|
||||
check amofinc_n2_w32_z128
|
||||
############################ AMOFETCH ################################
|
||||
echo "amofetch_n2_w1_z1"
|
||||
ROCSHMEM_MAX_NUM_CONTEXTS=1 mpirun -np 2 $1 -w 1 -z 1 -a 8 > $3/amofetch_n2_w1_z1.log
|
||||
ROCSHMEM_MAX_NUM_CONTEXTS=1 mpirun -np 2 $1 -w 1 -z 1 -a 7 > $3/amofetch_n2_w1_z1.log
|
||||
check amofetch_n2_w1_z1
|
||||
echo "amofetch_n2_w1_z1024"
|
||||
ROCSHMEM_MAX_NUM_CONTEXTS=1 mpirun -np 2 $1 -w 1 -z 1024 -a 8 > $3/amofetch_n2_w1_z1024.log
|
||||
ROCSHMEM_MAX_NUM_CONTEXTS=1 mpirun -np 2 $1 -w 1 -z 1024 -a 7 > $3/amofetch_n2_w1_z1024.log
|
||||
check amofetch_n2_w1_z1024
|
||||
echo "amofetch_n2_w8_z1"
|
||||
ROCSHMEM_MAX_NUM_CONTEXTS=8 mpirun -np 2 $1 -w 8 -z 1 -a 8 > $3/amofetch_n2_w8_z1.log
|
||||
ROCSHMEM_MAX_NUM_CONTEXTS=8 mpirun -np 2 $1 -w 8 -z 1 -a 7 > $3/amofetch_n2_w8_z1.log
|
||||
check amofetch_n2_w8_z1
|
||||
echo "amofetch_n2_w32_z128"
|
||||
ROCSHMEM_MAX_NUM_CONTEXTS=32 mpirun -np 2 $1 -w 32 -z 128 -a 8 > $3/amofetch_n2_w32_z128.log
|
||||
ROCSHMEM_MAX_NUM_CONTEXTS=32 mpirun -np 2 $1 -w 32 -z 128 -a 7 > $3/amofetch_n2_w32_z128.log
|
||||
check amofetch_n2_w32_z128
|
||||
########################### AMOFCSWAP ################################
|
||||
echo "amofcswap_n2_w1_z1"
|
||||
ROCSHMEM_MAX_NUM_CONTEXTS=1 mpirun -np 2 $1 -w 1 -z 1 -a 9 > $3/amofcswap_n2_w1_z1.log
|
||||
ROCSHMEM_MAX_NUM_CONTEXTS=1 mpirun -np 2 $1 -w 1 -z 1 -a 8 > $3/amofcswap_n2_w1_z1.log
|
||||
check amofcswap_n2_w1_z1
|
||||
echo "amofcswap_n2_w8_z1"
|
||||
ROCSHMEM_MAX_NUM_CONTEXTS=8 mpirun -np 2 $1 -w 8 -z 1 -a 9 > $3/amofcswap_n2_w8_z1.log
|
||||
ROCSHMEM_MAX_NUM_CONTEXTS=8 mpirun -np 2 $1 -w 8 -z 1 -a 8 > $3/amofcswap_n2_w8_z1.log
|
||||
check amofcswap_n2_w8_z1
|
||||
echo "amofcswap_n2_w32_z1"
|
||||
ROCSHMEM_MAX_NUM_CONTEXTS=32 mpirun -np 2 $1 -w 32 -z 1 -a 9 > $3/amofcswap_n2_w32_z1.log
|
||||
ROCSHMEM_MAX_NUM_CONTEXTS=32 mpirun -np 2 $1 -w 32 -z 1 -a 8 > $3/amofcswap_n2_w32_z1.log
|
||||
check amofcswap_n2_w32_z1
|
||||
############################# AMOADD ################################
|
||||
echo "amoadd_n2_w1_z1"
|
||||
ROCSHMEM_MAX_NUM_CONTEXTS=1 mpirun -np 2 $1 -w 1 -z 1 -a 10 > $3/amoadd_n2_w1_z1.log
|
||||
ROCSHMEM_MAX_NUM_CONTEXTS=1 mpirun -np 2 $1 -w 1 -z 1 -a 9 > $3/amoadd_n2_w1_z1.log
|
||||
check amoadd_n2_w1_z1
|
||||
echo "amoadd_n2_w1_z1024"
|
||||
ROCSHMEM_MAX_NUM_CONTEXTS=1 mpirun -np 2 $1 -w 1 -z 1024 -a 10 > $3/amoadd_n2_w1_z1024.log
|
||||
ROCSHMEM_MAX_NUM_CONTEXTS=1 mpirun -np 2 $1 -w 1 -z 1024 -a 9 > $3/amoadd_n2_w1_z1024.log
|
||||
check amoadd_n2_w1_z1024
|
||||
echo "amoadd_n2_w8_z1"
|
||||
ROCSHMEM_MAX_NUM_CONTEXTS=8 mpirun -np 2 $1 -w 8 -z 1 -a 10 > $3/amoadd_n2_w8_z1.log
|
||||
ROCSHMEM_MAX_NUM_CONTEXTS=8 mpirun -np 2 $1 -w 8 -z 1 -a 9 > $3/amoadd_n2_w8_z1.log
|
||||
check amoadd_n2_w8_z1
|
||||
echo "amoadd_n2_w32_z128"
|
||||
ROCSHMEM_MAX_NUM_CONTEXTS=32 mpirun -np 2 $1 -w 32 -z 128 -a 10 > $3/amoadd_n2_w32_z128.log
|
||||
ROCSHMEM_MAX_NUM_CONTEXTS=32 mpirun -np 2 $1 -w 32 -z 128 -a 9 > $3/amoadd_n2_w32_z128.log
|
||||
check amoadd_n2_w32_z128
|
||||
############################# AMOINC ################################
|
||||
echo "amoinc_n2_w1_z1"
|
||||
ROCSHMEM_MAX_NUM_CONTEXTS=1 mpirun -np 2 $1 -w 1 -z 1 -a 11 > $3/amoinc_n2_w1_z1.log
|
||||
ROCSHMEM_MAX_NUM_CONTEXTS=1 mpirun -np 2 $1 -w 1 -z 1 -a 10 > $3/amoinc_n2_w1_z1.log
|
||||
check amoinc_n2_w1_z1
|
||||
echo "amoinc_n2_w1_z1024"
|
||||
ROCSHMEM_MAX_NUM_CONTEXTS=1 mpirun -np 2 $1 -w 1 -z 1024 -a 11 > $3/amoinc_n2_w1_z1024.log
|
||||
ROCSHMEM_MAX_NUM_CONTEXTS=1 mpirun -np 2 $1 -w 1 -z 1024 -a 10 > $3/amoinc_n2_w1_z1024.log
|
||||
check amoinc_n2_w1_z1024
|
||||
echo "amoinc_n2_w8_z1"
|
||||
ROCSHMEM_MAX_NUM_CONTEXTS=8 mpirun -np 2 $1 -w 8 -z 1 -a 11 > $3/amoinc_n2_w8_z1.log
|
||||
ROCSHMEM_MAX_NUM_CONTEXTS=8 mpirun -np 2 $1 -w 8 -z 1 -a 10 > $3/amoinc_n2_w8_z1.log
|
||||
check amoinc_n2_w8_z1
|
||||
echo "amoinc_n2_w32_z128"
|
||||
ROCSHMEM_MAX_NUM_CONTEXTS=32 mpirun -np 2 $1 -w 32 -z 128 -a 11 > $3/amoinc_n2_w32_z128.log
|
||||
ROCSHMEM_MAX_NUM_CONTEXTS=32 mpirun -np 2 $1 -w 32 -z 128 -a 10 > $3/amoinc_n2_w32_z128.log
|
||||
check amoinc_n2_w32_z128
|
||||
############################## INIT #################################
|
||||
echo "init_n2"
|
||||
ROCSHMEM_MAX_NUM_CONTEXTS=1 mpirun -np 2 $1 -a 13 > $3/init_n2.log
|
||||
ROCSHMEM_MAX_NUM_CONTEXTS=1 mpirun -np 2 $1 -a 12 > $3/init_n2.log
|
||||
check init_n2
|
||||
########################### PINGPONG ################################
|
||||
echo "pingpong_n2_w1"
|
||||
ROCSHMEM_MAX_NUM_CONTEXTS=1 mpirun -np 2 $1 -w 1 -a 14 > $3/pingpong_n2_w1.log
|
||||
ROCSHMEM_MAX_NUM_CONTEXTS=1 mpirun -np 2 $1 -w 1 -a 13 > $3/pingpong_n2_w1.log
|
||||
check pingpong_n2_w1
|
||||
echo "pingpong_n2_w8"
|
||||
ROCSHMEM_MAX_NUM_CONTEXTS=8 mpirun -np 2 $1 -w 8 -a 14 > $3/pingpong_n2_w8.log
|
||||
ROCSHMEM_MAX_NUM_CONTEXTS=8 mpirun -np 2 $1 -w 8 -a 13 > $3/pingpong_n2_w8.log
|
||||
check pingpong_n2_w8
|
||||
echo "pingpong_n2_w32"
|
||||
ROCSHMEM_MAX_NUM_CONTEXTS=32 mpirun -np 2 $1 -w 32 -a 14 > $3/pingpong_n2_w32.log
|
||||
ROCSHMEM_MAX_NUM_CONTEXTS=32 mpirun -np 2 $1 -w 32 -a 13 > $3/pingpong_n2_w32.log
|
||||
check pingpong_n2_w32
|
||||
############################ BARRIER ################################
|
||||
echo "barrier_n2_w1"
|
||||
ROCSHMEM_MAX_NUM_CONTEXTS=1 mpirun -np 2 $1 -w 1 -a 17 > $3/barrier_n2_w1.log
|
||||
ROCSHMEM_MAX_NUM_CONTEXTS=1 mpirun -np 2 $1 -w 1 -a 15 > $3/barrier_n2_w1.log
|
||||
check barrier_n2_w1
|
||||
echo "barrier_n2_w8"
|
||||
ROCSHMEM_MAX_NUM_CONTEXTS=8 mpirun -np 2 $1 -w 8 -a 17 > $3/barrier_n2_w8.log
|
||||
check barrier_n2_w8
|
||||
echo "barrier_n2_w32"
|
||||
ROCSHMEM_MAX_NUM_CONTEXTS=32 mpirun -np 2 $1 -w 32 -a 17 > $3/barrier_n2_w32.log
|
||||
check barrier_n2_w32
|
||||
############################ SYNCALL ################################
|
||||
echo "syncall_n2_w1"
|
||||
ROCSHMEM_MAX_NUM_CONTEXTS=1 mpirun -np 2 $1 -w 1 -a 18 > $3/syncall_n2_w1.log
|
||||
ROCSHMEM_MAX_NUM_CONTEXTS=1 mpirun -np 2 $1 -w 1 -a 16 > $3/syncall_n2_w1.log
|
||||
check syncall_n2_w1
|
||||
echo "syncall_n2_w8"
|
||||
ROCSHMEM_MAX_NUM_CONTEXTS=8 mpirun -np 2 $1 -w 8 -a 18 > $3/syncall_n2_w8.log
|
||||
check syncall_n2_w8
|
||||
echo "syncall_n2_w32"
|
||||
ROCSHMEM_MAX_NUM_CONTEXTS=32 mpirun -np 2 $1 -w 32 -a 18 > $3/syncall_n2_w32.log
|
||||
check syncall_n2_w32
|
||||
############################# SYNC ##################################
|
||||
echo "sync_n2_w1"
|
||||
ROCSHMEM_MAX_NUM_CONTEXTS=1 mpirun -np 2 $1 -w 1 -a 19 > $3/sync_n2_w1.log
|
||||
ROCSHMEM_MAX_NUM_CONTEXTS=1 mpirun -np 2 $1 -w 1 -a 17 > $3/sync_n2_w1.log
|
||||
check sync_n2_w1
|
||||
echo "sync_n2_w8"
|
||||
ROCSHMEM_MAX_NUM_CONTEXTS=8 mpirun -np 2 $1 -w 8 -a 19 > $3/sync_n2_w8.log
|
||||
check sync_n2_w8
|
||||
echo "sync_n2_w32"
|
||||
ROCSHMEM_MAX_NUM_CONTEXTS=32 mpirun -np 2 $1 -w 32 -a 19 > $3/sync_n2_w32.log
|
||||
check sync_n2_w32
|
||||
########################### FCOLLECT ################################
|
||||
echo "fcollect_n2_w1_512B"
|
||||
ROCSHMEM_MAX_NUM_CONTEXTS=1 mpirun -np 2 $1 -w 1 -s 512 -a 22 > $3/fcollect_n2_w1_512B.log
|
||||
ROCSHMEM_MAX_NUM_CONTEXTS=1 mpirun -np 2 $1 -w 1 -s 512 -a 19 > $3/fcollect_n2_w1_512B.log
|
||||
check fcollect_n2_w1_512B
|
||||
echo "fcollect_n2_w8_512B"
|
||||
ROCSHMEM_MAX_NUM_CONTEXTS=8 mpirun -np 2 $1 -w 8 -s 512 -a 22 > $3/fcollect_n2_w8_512B.log
|
||||
check fcollect_n2_w8_512B
|
||||
echo "fcollect_n2_w32_512B"
|
||||
ROCSHMEM_MAX_NUM_CONTEXTS=32 mpirun -np 2 $1 -w 32 -s 512 -a 22 > $3/fcollect_n2_w32_512B.log
|
||||
check fcollect_n2_w32_512B
|
||||
########################### ALLTOALL ################################
|
||||
echo "alltoall_n2_w1_512B"
|
||||
ROCSHMEM_MAX_NUM_CONTEXTS=1 mpirun -np 2 $1 -w 1 -s 512 -a 23 > $3/alltoall_n2_w1_512B.log
|
||||
ROCSHMEM_MAX_NUM_CONTEXTS=1 mpirun -np 2 $1 -w 1 -s 512 -a 20 > $3/alltoall_n2_w1_512B.log
|
||||
check alltoall_n2_w1_512B
|
||||
echo "alltoall_n2_w8_512B"
|
||||
ROCSHMEM_MAX_NUM_CONTEXTS=8 mpirun -np 2 $1 -w 8 -s 512 -a 23 > $3/alltoall_n2_w8_512B.log
|
||||
check alltoall_n2_w8_512B
|
||||
echo "alltoall_n2_w32_512B"
|
||||
ROCSHMEM_MAX_NUM_CONTEXTS=32 mpirun -np 2 $1 -w 32 -s 512 -a 23 > $3/alltoall_n2_w32_512B.log
|
||||
check alltoall_n2_w32_512B
|
||||
########################## TEAMGETNBI ###############################
|
||||
echo "teamgetnbi_n2_w1_1MB"
|
||||
ROCSHMEM_MAX_NUM_CONTEXTS=1 mpirun -np 2 $1 -w 1 -s 1048576 -a 39 > $3/teamgetnbi_n2_w1_1MB.log
|
||||
ROCSHMEM_MAX_NUM_CONTEXTS=1 mpirun -np 2 $1 -w 1 -s 1048576 -a 36 > $3/teamgetnbi_n2_w1_1MB.log
|
||||
check teamgetnbi_n2_w1_1MB
|
||||
########################## TEAMPUTNBI ###############################
|
||||
echo "teamputnbi_n2_w1_1MB"
|
||||
ROCSHMEM_MAX_NUM_CONTEXTS=1 mpirun -np 2 $1 -w 1 -s 1048576 -a 41 > $3/teamputnbi_n2_w1_1MB.log
|
||||
ROCSHMEM_MAX_NUM_CONTEXTS=1 mpirun -np 2 $1 -w 1 -s 1048576 -a 38 > $3/teamputnbi_n2_w1_1MB.log
|
||||
check teamputnbi_n2_w1_1MB
|
||||
############################ AMOSET #################################
|
||||
echo "amoset_n2_w1_z1"
|
||||
ROCSHMEM_MAX_NUM_CONTEXTS=1 mpirun -np 2 $1 -w 1 -z 1 -a 44 > $3/amoset_n2_w1_z1.log
|
||||
ROCSHMEM_MAX_NUM_CONTEXTS=1 mpirun -np 2 $1 -w 1 -z 1 -a 41 > $3/amoset_n2_w1_z1.log
|
||||
check amoset_n2_w1_z1
|
||||
echo "amoset_n2_w8_z1"
|
||||
ROCSHMEM_MAX_NUM_CONTEXTS=8 mpirun -np 2 $1 -w 8 -z 1 -a 44 > $3/amoset_n2_w8_z1.log
|
||||
ROCSHMEM_MAX_NUM_CONTEXTS=8 mpirun -np 2 $1 -w 8 -z 1 -a 41 > $3/amoset_n2_w8_z1.log
|
||||
check amoset_n2_w8_z1
|
||||
echo "amoset_n2_w32_z1"
|
||||
ROCSHMEM_MAX_NUM_CONTEXTS=32 mpirun -np 2 $1 -w 32 -z 1 -a 44 > $3/amoset_n2_w32_z1.log
|
||||
ROCSHMEM_MAX_NUM_CONTEXTS=32 mpirun -np 2 $1 -w 32 -z 1 -a 41 > $3/amoset_n2_w32_z1.log
|
||||
check amoset_n2_w32_z1
|
||||
;;
|
||||
|
||||
@@ -517,118 +477,115 @@ case $2 in
|
||||
mpirun -np 2 $1 -w 1 -z 1 -s 32768 -a 5
|
||||
;;
|
||||
*"amofadd")
|
||||
mpirun -np 2 $1 -w 1 -z 1 -a 6
|
||||
mpirun -np 2 $1 -w 1 -z 1 -a 5
|
||||
;;
|
||||
*"amofinc")
|
||||
mpirun -np 2 $1 -w 1 -z 1 -a 7
|
||||
mpirun -np 2 $1 -w 1 -z 1 -a 6
|
||||
;;
|
||||
*"amofetch")
|
||||
mpirun -np 2 $1 -w 1 -z 1 -a 8
|
||||
mpirun -np 2 $1 -w 1 -z 1 -a 7
|
||||
;;
|
||||
*"amofcswap")
|
||||
mpirun -np 2 $1 -w 1 -z 1 -a 9
|
||||
mpirun -np 2 $1 -w 1 -z 1 -a 8
|
||||
;;
|
||||
*"amoadd")
|
||||
mpirun -np 2 $1 -w 1 -z 1 -a 10
|
||||
mpirun -np 2 $1 -w 1 -z 1 -a 9
|
||||
;;
|
||||
*"amoinc")
|
||||
mpirun -np 2 $1 -w 1 -z 1 -a 11
|
||||
mpirun -np 2 $1 -w 1 -z 1 -a 10
|
||||
;;
|
||||
*"init")
|
||||
mpirun -np 2 $1 -a 13
|
||||
mpirun -np 2 $1 -a 12
|
||||
;;
|
||||
*"pingpong")
|
||||
mpirun -np 2 $1 -w 1 -z 1 -a 14
|
||||
mpirun -np 2 $1 -w 1 -z 1 -a 13
|
||||
;;
|
||||
*"barrier")
|
||||
mpirun -np 2 $1 -w 1 -z 1 -a 17
|
||||
mpirun -np 2 $1 -w 1 -z 1 -a 15
|
||||
;;
|
||||
*"syncall")
|
||||
mpirun -np 2 $1 -w 1 -z 1 -a 18
|
||||
mpirun -np 2 $1 -w 1 -z 1 -a 16
|
||||
;;
|
||||
*"sync")
|
||||
mpirun -np 2 $1 -w 1 -z 1 -s 8 -a 19
|
||||
;;
|
||||
*"broadcast")
|
||||
mpirun -np 2 $1 -w 1 -z 1 -s 32768 -a 20
|
||||
mpirun -np 2 $1 -w 1 -z 1 -s 8 -a 17
|
||||
;;
|
||||
*"fcollect")
|
||||
mpirun -np 2 $1 -w 1 -z 1 -s 32768 -a 22
|
||||
mpirun -np 2 $1 -w 1 -z 1 -s 32768 -a 19
|
||||
;;
|
||||
*"alltoall")
|
||||
mpirun -np 2 $1 -w 1 -z 1 -s 32768 -a 23
|
||||
mpirun -np 2 $1 -w 1 -z 1 -s 32768 -a 20
|
||||
;;
|
||||
*"team_broadcast")
|
||||
mpirun -np 2 $1 -w 1 -z 1 -s 32768 -a 36
|
||||
mpirun -np 2 $1 -w 1 -z 1 -s 32768 -a 33
|
||||
;;
|
||||
*"team_reduction")
|
||||
mpirun -np 2 $1 -w 1 -z 1 -s 32768 -a 37
|
||||
mpirun -np 2 $1 -w 1 -z 1 -s 32768 -a 34
|
||||
;;
|
||||
*"team_get")
|
||||
mpirun -np 2 $1 -w 1 -z 1 -s 1048576 -a 38
|
||||
mpirun -np 2 $1 -w 1 -z 1 -s 1048576 -a 35
|
||||
;;
|
||||
*"team_getnbi")
|
||||
mpirun -np 2 $1 -w 1 -z 1 -s 1048576 -a 39
|
||||
mpirun -np 2 $1 -w 1 -z 1 -s 1048576 -a 36
|
||||
;;
|
||||
*"team_put")
|
||||
mpirun -np 2 $1 -w 1 -z 1 -s 1048576 -a 40
|
||||
mpirun -np 2 $1 -w 1 -z 1 -s 1048576 -a 37
|
||||
;;
|
||||
*"team_putnbi")
|
||||
mpirun -np 2 $1 -w 1 -z 1 -s 1048576 -a 41
|
||||
mpirun -np 2 $1 -w 1 -z 1 -s 1048576 -a 38
|
||||
;;
|
||||
*"ctx_infra")
|
||||
mpirun -np 2 $1 -w 1 -z 1 -a 42
|
||||
mpirun -np 2 $1 -w 1 -z 1 -a 39
|
||||
;;
|
||||
*"amoset")
|
||||
mpirun -np 2 $1 -w 1 -z 1 -a 44
|
||||
mpirun -np 2 $1 -w 1 -z 1 -a 41
|
||||
;;
|
||||
*"amoswap")
|
||||
mpirun -np 2 $1 -w 1 -z 1 -a 45
|
||||
mpirun -np 2 $1 -w 1 -z 1 -a 42
|
||||
;;
|
||||
*"amofetchand")
|
||||
mpirun -np 2 $1 -w 1 -z 1 -a 46
|
||||
mpirun -np 2 $1 -w 1 -z 1 -a 43
|
||||
;;
|
||||
*"amofetchor")
|
||||
mpirun -np 2 $1 -w 1 -z 1 -a 47
|
||||
mpirun -np 2 $1 -w 1 -z 1 -a 44
|
||||
;;
|
||||
*"amofetchxor")
|
||||
mpirun -np 2 $1 -w 1 -z 1 -a 48
|
||||
mpirun -np 2 $1 -w 1 -z 1 -a 45
|
||||
;;
|
||||
*"amoand")
|
||||
mpirun -np 2 $1 -w 1 -z 1 -a 49
|
||||
mpirun -np 2 $1 -w 1 -z 1 -a 46
|
||||
;;
|
||||
*"amoor")
|
||||
mpirun -np 2 $1 -w 1 -z 1 -a 50
|
||||
mpirun -np 2 $1 -w 1 -z 1 -a 47
|
||||
;;
|
||||
*"amoxor")
|
||||
mpirun -np 2 $1 -w 1 -z 1 -a 51
|
||||
mpirun -np 2 $1 -w 1 -z 1 -a 48
|
||||
;;
|
||||
*"putsignal")
|
||||
mpirun -np 2 $1 -w 1 -z 1 -a 53
|
||||
mpirun -np 2 $1 -w 1 -z 1 -a 50
|
||||
;;
|
||||
*"putsignalwg")
|
||||
ROCSHMEM_MAX_NUM_CONTEXTS=2 mpirun -np 2 $1 -w 2 -z 32 -a 55
|
||||
ROCSHMEM_MAX_NUM_CONTEXTS=2 mpirun -np 2 $1 -w 2 -z 32 -a 52
|
||||
;;
|
||||
*"putsignalwave")
|
||||
mpirun -np 2 $1 -w 1 -z 32 -a 55
|
||||
mpirun -np 2 $1 -w 1 -z 32 -a 52
|
||||
;;
|
||||
*"putsignalnbi")
|
||||
mpirun -np 2 $1 -w 1 -z 1 -a 56
|
||||
mpirun -np 2 $1 -w 1 -z 1 -a 53
|
||||
;;
|
||||
*"putsignalnbiwg")
|
||||
ROCSHMEM_MAX_NUM_CONTEXTS=2 mpirun -np 2 $1 -w 2 -z 32 -a 57
|
||||
ROCSHMEM_MAX_NUM_CONTEXTS=2 mpirun -np 2 $1 -w 2 -z 32 -a 54
|
||||
;;
|
||||
*"putsignalnbiwave")
|
||||
mpirun -np 2 $1 -w 1 -z 32 -a 58
|
||||
mpirun -np 2 $1 -w 1 -z 32 -a 55
|
||||
;;
|
||||
*"signalfetch")
|
||||
mpirun -np 2 $1 -w 1 -z 1 -a 59
|
||||
mpirun -np 2 $1 -w 1 -z 1 -a 56
|
||||
;;
|
||||
*"signalfetchwg")
|
||||
ROCSHMEM_MAX_NUM_CONTEXTS=2 mpirun -np 2 $1 -w 2 -z 32 -a 60
|
||||
ROCSHMEM_MAX_NUM_CONTEXTS=2 mpirun -np 2 $1 -w 2 -z 32 -a 57
|
||||
;;
|
||||
*"signalfetchwave")
|
||||
mpirun -np 2 $1 -w 1 -z 32 -a 60
|
||||
mpirun -np 2 $1 -w 1 -z 32 -a 57
|
||||
;;
|
||||
*)
|
||||
echo "UNKNOWN TEST TYPE: $2"
|
||||
|
||||
@@ -37,63 +37,60 @@ enum TestType {
|
||||
PutTestType = 2,
|
||||
PutNBITestType = 3,
|
||||
GetSwarmTestType = 4,
|
||||
// ReductionTestType = 5,
|
||||
AMO_FAddTestType = 6,
|
||||
AMO_FIncTestType = 7,
|
||||
AMO_FetchTestType = 8,
|
||||
AMO_FCswapTestType = 9,
|
||||
AMO_AddTestType = 10,
|
||||
AMO_IncTestType = 11,
|
||||
AMO_CswapTestType = 12,
|
||||
InitTestType = 13,
|
||||
PingPongTestType = 14,
|
||||
// BarrierTestType = 15, // Deprecated in OpenSHMEM 1.5
|
||||
RandomAccessTestType = 16,
|
||||
BarrierAllTestType = 17,
|
||||
SyncAllTestType = 18,
|
||||
SyncTestType = 19,
|
||||
// BroadcastTestType = 20,
|
||||
CollectTestType = 21,
|
||||
FCollectTestType = 22,
|
||||
AllToAllTestType = 23,
|
||||
AllToAllsTestType = 24,
|
||||
ShmemPtrTestType = 25,
|
||||
PTestType = 26,
|
||||
GTestType = 27,
|
||||
WGGetTestType = 28,
|
||||
WGGetNBITestType = 29,
|
||||
WGPutTestType = 30,
|
||||
WGPutNBITestType = 31,
|
||||
WAVEGetTestType = 32,
|
||||
WAVEGetNBITestType = 33,
|
||||
WAVEPutTestType = 34,
|
||||
WAVEPutNBITestType = 35,
|
||||
TeamBroadcastTestType = 36,
|
||||
TeamReductionTestType = 37,
|
||||
TeamCtxGetTestType = 38,
|
||||
TeamCtxGetNBITestType = 39,
|
||||
TeamCtxPutTestType = 40,
|
||||
TeamCtxPutNBITestType = 41,
|
||||
TeamCtxInfraTestType = 42,
|
||||
PutNBIMRTestType = 43,
|
||||
AMO_SetTestType = 44,
|
||||
AMO_SwapTestType = 45,
|
||||
AMO_FetchAndTestType = 46,
|
||||
AMO_FetchOrTestType = 47,
|
||||
AMO_FetchXorTestType = 48,
|
||||
AMO_AndTestType = 49,
|
||||
AMO_OrTestType = 50,
|
||||
AMO_XorTestType = 51,
|
||||
PingAllTestType = 52,
|
||||
PutSignalTestType = 53,
|
||||
WGPutSignalTestType = 54,
|
||||
WAVEPutSignalTestType = 55,
|
||||
PutSignalNBITestType = 56,
|
||||
WGPutSignalNBITestType = 57,
|
||||
WAVEPutSignalNBITestType = 58,
|
||||
SignalFetchTestType = 59,
|
||||
WGSignalFetchTestType = 60,
|
||||
WAVESignalFetchTestType = 61,
|
||||
AMO_FAddTestType = 5,
|
||||
AMO_FIncTestType = 6,
|
||||
AMO_FetchTestType = 7,
|
||||
AMO_FCswapTestType = 8,
|
||||
AMO_AddTestType = 9,
|
||||
AMO_IncTestType = 10,
|
||||
AMO_CswapTestType = 11,
|
||||
InitTestType = 12,
|
||||
PingPongTestType = 13,
|
||||
RandomAccessTestType = 14,
|
||||
BarrierAllTestType = 15,
|
||||
SyncAllTestType = 16,
|
||||
SyncTestType = 17,
|
||||
CollectTestType = 18,
|
||||
FCollectTestType = 19,
|
||||
AllToAllTestType = 20,
|
||||
AllToAllsTestType = 21,
|
||||
ShmemPtrTestType = 22,
|
||||
PTestType = 23,
|
||||
GTestType = 24,
|
||||
WGGetTestType = 25,
|
||||
WGGetNBITestType = 26,
|
||||
WGPutTestType = 27,
|
||||
WGPutNBITestType = 28,
|
||||
WAVEGetTestType = 29,
|
||||
WAVEGetNBITestType = 30,
|
||||
WAVEPutTestType = 31,
|
||||
WAVEPutNBITestType = 32,
|
||||
TeamBroadcastTestType = 33,
|
||||
TeamReductionTestType = 34,
|
||||
TeamCtxGetTestType = 35,
|
||||
TeamCtxGetNBITestType = 36,
|
||||
TeamCtxPutTestType = 37,
|
||||
TeamCtxPutNBITestType = 38,
|
||||
TeamCtxInfraTestType = 39,
|
||||
PutNBIMRTestType = 40,
|
||||
AMO_SetTestType = 41,
|
||||
AMO_SwapTestType = 42,
|
||||
AMO_FetchAndTestType = 43,
|
||||
AMO_FetchOrTestType = 44,
|
||||
AMO_FetchXorTestType = 45,
|
||||
AMO_AndTestType = 46,
|
||||
AMO_OrTestType = 47,
|
||||
AMO_XorTestType = 48,
|
||||
PingAllTestType = 49,
|
||||
PutSignalTestType = 50,
|
||||
WGPutSignalTestType = 51,
|
||||
WAVEPutSignalTestType = 52,
|
||||
PutSignalNBITestType = 53,
|
||||
WGPutSignalNBITestType = 54,
|
||||
WAVEPutSignalNBITestType = 55,
|
||||
SignalFetchTestType = 56,
|
||||
WGSignalFetchTestType = 57,
|
||||
WAVESignalFetchTestType = 58,
|
||||
};
|
||||
|
||||
enum OpType { PutType = 0, GetType = 1 };
|
||||
|
||||
Verwijs in nieuw issue
Block a user