ddn-ime-evaluation/run.sh

99 lines
2.7 KiB
Bash
Executable File

#!/bin/bash
function force_exit {
echo "Committing suicide (PID $$)"
exit
}
trap force_exit SIGINT
# Provides a list of good hosts (that contains QDR connection)
function hosts() {
num="$1"
#HOST_LIST=( isc17-c04 isc17-c05 isc17-c06 isc17-c18 )
HOST_LIST=( isc17-c04 isc17-c05 isc17-c06 isc17-c18 isc17-c01 isc17-c02 isc17-c03 isc17-c07 isc17-c08 isc17-c09 isc17-c11 isc17-c12 isc17-c13 isc17-c14 isc17-c15 isc17-c22 )
hlist=${HOST_LIST[0]}
for POS in $(seq 1 $(($num - 1))) ; do
hlist="$hlist,${HOST_LIST[$POS]}"
done
echo $hlist
}
export MODULEPATH=/esfs/jtacquaviva/software/modules:$MODULEPATH
module purge
module load betke/hdf5/1.8.20-ddn
module load betke/ior/git-ddn
module list
LUSTRE_TESTFILE_WRITE="/esfs/jtacquaviva/ioperf/file_write"
LUSTRE_TESTFILE_READ=""
ITERATIONS=3
IOR="$(which ior)"
MPIEXEC="/opt/ddn/mvapich/bin/mpiexec"
API_ARR=( "POSIX" "MPIIO" )
#NN_ARR=( 4 2 1 8 10 16)
NN_ARR=( 2 1 )
PPN_ARR=( 8 6 4 2 1 )
T_ARR=( $((10*1024*1024)) $((1*1024*1024)) $((100*1024)) $((16*1024)) )
for COUNT in $(seq 1); do
for NN in ${NN_ARR[@]}; do
for T in ${T_ARR[@]}; do
for PPN in ${PPN_ARR[@]}; do
for API in ${API_ARR[@]}; do
BENCHFILE="./output/COUNT:$COUNT#NN:$NN#PPN:$PPN#API:$API#T:$T.txt"
if [ ! -e "${BENCHFILE}" ]; then
OUTDIR="$(dirname $BENCHFILE)"
if [ ! -d $OUTDIR ]; then
mkdir $OUTDIR
fi
touch $BENCHFILE
IOR_API_OPTS=""
if [[ "POSIX" == $API ]]; then
IOR_API_OPTS="-F"
LUSTRE_TESTFILE_READ="/esfs/jtacquaviva/indread$NN/file"
elif [[ "MPIIO" == $API ]]; then
IOR_API_OPTS=""
LUSTRE_TESTFILE_READ="/esfs/jtacquaviva/file_read"
fi
IOR_PARAMS="-i $ITERATIONS -s 1 -t $T -b $((4800 * 1024 * 1024 * 32 / $PPN)) -D $((120)) -a $API $IOR_API_OPTS -e -g -z -k"
ENVVAR="-genv MV2_NUM_HCAS 1 -genv MV2_CPU_BINDING_LEVEL core -genv MV2_CPU_BINDING_POLICY scatter"
MPIEXEC_PARAMS=" -ppn $PPN -np $(($NN * $PPN)) $ENVVAR --hosts $(hosts $NN) "
TESTDIR="$(dirname $LUSTRE_TESTFILE_WRITE)"
if [ -d $TESTDIR ]; then
rm -r $TESTDIR
fi
mkdir -p $TESTDIR
lfs setstripe -c $((2 * $NN)) $TESTDIR
(
set -x
$MPIEXEC $MPIEXEC_PARAMS $IOR $IOR_PARAMS -o $LUSTRE_TESTFILE_WRITE -w | tee -a $BENCHFILE
$MPIEXEC $MPIEXEC_PARAMS /esfs/jtacquaviva/git/ime-evaluation/drop_caches.sh
$MPIEXEC $MPIEXEC_PARAMS $IOR $IOR_PARAMS -o $LUSTRE_TESTFILE_READ -r | tee -a $BENCHFILE
set +x
) 2> >(tee -a $BENCHFILE)
lfs getstripe $TESTDIR | tee -a $BENCHFILE
else
echo "skip $(readlink -f $BENCHFILE), already exists"
fi
done
done
done
done
done