iprbench/iprbench/resources/clusterbench-template.job

78 lines
2.6 KiB
Bash

#!/usr/bin/env bash
# this job file is a template file for clusterbench jobs
executed_by_sge=''
if [ "${JOB_ID}" = '' ]
then
executed_by_sge='false'
# this script is not executed by sge... set dummy values for test
TMPDIR=/tmp
JOB_ID=666666
NSLOTS=<num_cores>
else
executed_by_sge='true'
fi
launch_dir="$(pwd)"
echo "Executing job ${JOB_ID} on $(hostname) from ${launch_dir}"
echo "date: $(date --iso-8601=seconds)"
temp_dir=${TMPDIR}/$(whoami)/${JOB_ID}
if [ -d "${temp_dir}" ]
then
rm -Rf "${temp_dir}"
fi
mkdir -p "${temp_dir}"
iprbench_venv_path='<iprbench_venv_hardcoded_path>'
iprbench_venv_parent=$(dirname "$iprbench_venv_path")
iprbench_venv_archive_path='<iprbench_venv_archive_path>'
echo "unarchiving virtual environment ${iprbench_venv_archive_path} to ${iprbench_venv_parent}"
pushd "${iprbench_venv_parent}"
tar xzvf "${iprbench_venv_archive_path}" > /dev/null
popd
if [ ! -d "${iprbench_venv_path}" ]
then
echo "failed to find expected directory ${iprbench_venv_path}"
exit 1
fi
echo "using the iprbench virtual environment that has been created for this bench: ${iprbench_venv_path}"
source "$iprbench_venv_path/bin/activate"
if [ $? != 0 ]
then
echo "failed to activate the virtual environment $iprbench_venv_path"
exit 1
fi
echo "VIRTUAL_ENV = $VIRTUAL_ENV"
# show the list of packages installed in the virtual environment
pip list
output_dir="${temp_dir}"
num_cores=${NSLOTS}
# set environment variables
# launch the benchmark
command="iprbench-run --benchmark-id '<benchmark_id>' --config '<benchmark_config>' --results-dir '${output_dir}' --resultsdb-params '<resultsdb_params>' --target-system-type-id '<target_system_type_id>'"
echo "command: ${command}"
eval ${command}
if [ "$?" = '0' ]
then
echo "the command ${command} succeeded"
rsync -va --exclude 'build' --exclude 'source.git' --exclude "${iprbench_venv_path}" "${output_dir}/" ${launch_dir}/ # exclude the source.git and build directories (one for each worker) because they are big and not that precious
# TMPDIR will be deleted by sge at the end of the job
else
if [ ${executed_by_sge} = 'true' ]
then
# TMPDIR will be deleted by sge at the end of the job. Backup data for investigation
backup_dir="/opt/ipr/cluster/work.local/$(whoami)/${JOB_ID}"
echo "moving ${output_dir} to ${backup_dir} so that it doesn't get deleted by sge at the end of the job. This way, data gets a chance to be investigated then manually deleted."
mv "${output_dir}" "${backup_dir}"
fi
echo "the command ${command} failed... the output data dir (${output_dir}) is expected to be cleaned up manually after investigation"
exit 1
fi