Files
blis/test/mixeddt/runme.sh
Devangi N. Parikh 38203ecd15 Added thunderx2 system in the mixeddt test scripts
Details:
 - Added thunderx2 (tx2) as a system in the runme.sh in test/mixeddt
2019-02-04 15:28:28 -05:00

179 lines
4.5 KiB
Bash
Executable File

#!/bin/bash
# File pefixes.
exec_root="test"
out_root="output"
sys="blis"
#sys="stampede2"
#sys="lonestar5"
#sys="ul252"
sys="tx2"
# Bind threads to processors.
#export OMP_PROC_BIND=true
#export GOMP_CPU_AFFINITY="0 2 4 6 8 10 12 14 1 3 5 7 9 11 13 15"
#export GOMP_CPU_AFFINITY="0 1 2 3 4 5 6 7"
#export GOMP_CPU_AFFINITY="0 1 2 3 4 5 6 7"
#export GOMP_CPU_AFFINITY="0 2 4 6 1 3 5 7"
#export GOMP_CPU_AFFINITY="0 4 1 5 2 6 3 7"
#export GOMP_CPU_AFFINITY="0 1 4 5 8 9 12 13 16 17 20 21 24 25 28 29 32 33 36 37 40 41 44 45"
#export GOMP_CPU_AFFINITY="0 2 4 6 8 10 12 14 16 18 20 22 1 3 5 7 9 11 13 15 17 19 21 23"
#export GOMP_CPU_AFFINITY="0 1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23"
export GOMP_CPU_AFFINITY="0 1 2 3"
# Modify LD_LIBRARY_PATH.
if [ ${sys} = "blis" ]; then
export LD_LIBRARY_PATH="$LD_LIBRARY_PATH"
export GOMP_CPU_AFFINITY="0 1 2 3"
jc_nt=1 # 5th loop
ic_nt=4 # 3rd loop
jr_nt=1 # 2nd loop
ir_nt=1 # 1st loop
nt=4
elif [ ${sys} = "stampede2" ]; then
echo "Need to set GOMP_CPU_AFFINITY."
exit 1
jc_nt=4 # 5th loop
ic_nt=12 # 3rd loop
jr_nt=1 # 2nd loop
ir_nt=1 # 1st loop
nt=48
elif [ ${sys} = "lonestar5" ]; then
echo "Need to set GOMP_CPU_AFFINITY."
exit 1
# A hack to use libiomp5 with gcc.
export LD_LIBRARY_PATH="$LD_LIBRARY_PATH:/opt/apps/intel/16.0.1.150/compilers_and_libraries_2016.1.150/linux/compiler/lib/intel64"
jc_nt=2 # 5th loop
ic_nt=12 # 3rd loop
jr_nt=1 # 2nd loop
ir_nt=1 # 1st loop
nt=24
elif [ ${sys} = "ul252" ]; then
export LD_LIBRARY_PATH="$LD_LIBRARY_PATH:/home/field/intel/mkl/lib/intel64"
#export GOMP_CPU_AFFINITY="0 1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48 49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72 73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96 97 98 99 100 101 102 103"
export GOMP_CPU_AFFINITY="0 1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48 49 50 51"
#jc_nt=4 # 5th loop
jc_nt=2 # 5th loop
ic_nt=13 # 3rd loop
jr_nt=1 # 2nd loop
ir_nt=1 # 1st loop
#nt=52
nt=26
elif [ ${sys} = "tx2" ]; then
export GOMP_CPU_AFFINITY="0 1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48 49 50 51 52 53 54 55"
jc_nt=8 # 5th loop
ic_nt=7 # 3rd loop
jr_nt=1 # 2nd loop
ir_nt=1 # 1st loop
nt=56
fi
# Save a copy of GOMP_CPU_AFFINITY so that if we have to unset it, we can
# restore the value.
GOMP_CPU_AFFINITYsave=${GOMP_CPU_AFFINITY}
# Datatypes to test.
#dts="s d c z"
# Threadedness to test.
threads="mt"
#threads="st"
# Implementations to test.
test_impls="ad_hoc intern"
# Operations to test.
l3_ops="gemm"
test_ops="${l3_ops}"
# Define the list of datatype chars and precision chars.
dt_chars="s d c z"
pr_chars="s d"
# Construct the datatype combination strings.
dt_combos=""
for dtc in ${dt_chars}; do
for dta in ${dt_chars}; do
for dtb in ${dt_chars}; do
for pre in ${pr_chars}; do
dt_combos="${dt_combos} ${dtc}${dta}${dtb}${pre}"
done
done
done
done
# Overrides, in case something goes wrong for a subset of tests.
#test_impls="ad_hoc"
#dt_combos="ssss sssd ssds sdss dsss ddds dddd"
# Now perform complex test cases.
for th in ${threads}; do
for dt in ${dt_combos}; do
for im in ${test_impls}; do
for op in ${test_ops}; do
# Set the number of threads according to th.
if [ ${th} = "mt" ]; then
export BLIS_JC_NT=${jc_nt}
export BLIS_IC_NT=${ic_nt}
export BLIS_JR_NT=${jr_nt}
export BLIS_IR_NT=${ir_nt}
export OMP_NUM_THREADS=${nt}
export OPENBLAS_NUM_THREADS=${nt}
# Unset GOMP_CPU_AFFINITY for OpenBLAS.
if [ ${im} = "openblas" ]; then
unset GOMP_CPU_AFFINITY
else
export GOMP_CPU_AFFINITY=${GOMP_CPU_AFFINITYsave}
fi
else
export BLIS_JC_NT=1
export BLIS_IC_NT=1
export BLIS_JR_NT=1
export BLIS_IR_NT=1
export OMP_NUM_THREADS=1
export OPENBLAS_NUM_THREADS=1
fi
# Construct the name of the test executable.
exec_name="${exec_root}_${dt}${op}_${im}_${th}.x"
# Construct the name of the output file.
out_file="${out_root}_${th}_${dt}${op}_${im}.m"
echo "Running (nt = ${OMP_NUM_THREADS}) ./${exec_name} > ${out_file}"
# Run executable.
./${exec_name} > ${out_file}
#sleep 1
done
done
done
done