1688a027d8
- additional miscellaneous tweaks to workflows and docker scripts, e.g. install perfetto python bindings - improves the stability of MPI finalization - reduces some debug messages within timemory when `OMNITRACE_DEBUG=ON` - fixes issue found in RHEL where libunwind is using mutex and omnitrace was not treating this as an internal mutex call - this may have been affecting the causal profiling slightly (tests seem a bit more stable now) - fix data race in timemory * Add RedHat CI and release packaging - additional miscellaneous tweaks to workflows and docker scripts, e.g. install perfetto python bindings * Fix URL for ROCm packages in redhat workflow * Fix dnf --enable-repo for ROCm perl packages * Dockerfile.rhel and redhat.yml updates - Fix dnf repo for ROCm PERL packages - Disable python in CI (interpreter segfaults) - Exclude parallel-overhead-locks tests due to inclusion of internal locks - This needs to be remedied in the future * Exclude _dl_relocate_static_pie from instrumentation * Testing updates - OMNITRACE_SAMPLING_KEEP_INTERNAL=OFF for parallel-overhead-locks * Fix redhat workflow * redhat.yml update - remove if condition on config/build/test step * Update timemory submodule - tweaks to verbosity messages * Set thread state before unw_step - on Redhat, unw_step calls mutex * Update timemory submodule - verbosity changes - gotcha uses spin_lock/spin_mutex * Remove using gsplit-dwarf unless OMNITRACE_BUILD_NUMBER > 2 * Re-enable parallel-overhead-locks tests in redhat workflow * Always disable timemory manager metadata auto output * testing updates - tweak parallel-overhead-locks-timemory to higher instruction count min - OMNITRACE_SAMPLING_KEEP_INTERNAL=OFF for parallel-overhead-locks-perfetto * Update timemory submodule - quiet realpath queries * omnitrace exe updates - detect text files - improved bin/lib locating * cmake format * test-install.sh and redhat workflow updates - handle testing when ls is script - re-enable python testing on redhat workflow - invoke test-install.sh in redhat workflow * Misc guards for finalization * omnitrace-exe, testing updates - test-install.sh: LS_EXEC -> LS_NAME - handle /usr/bin/ls being script in source/bin/tests - improve locating the binary * Fix mpi_gotcha compile error * omnitrace-exe updates - improve file locating * formatting * Misc fixes - remove -static-libstdc++ for RHEL packaging (rocky-linux doesn't distribute static lib) * omnitrace-exe paths * Replace realpath with absolute - using absolute path to symlink fixes issues with locating libdyninstAPI_RT at runtime * omnitrace exe updates - judicious use of realpath * Update timemory submodule - fix update main hash ids/aliases data race in merge * bin tests update - change working directory of omnitrace-exe-simulate-lib-basename * omnitrace exe updates - Update resolved exe/lib messaging * bin tests update - change working directory of omnitrace-exe-simulate-lib-basename
263 righe
9.3 KiB
Bash
Executable File
263 righe
9.3 KiB
Bash
Executable File
#!/usr/bin/env bash
|
|
|
|
: ${USER:=$(whoami)}
|
|
: ${ROCM_VERSIONS:="5.0"}
|
|
: ${DISTRO:=ubuntu}
|
|
: ${VERSIONS:=20.04}
|
|
: ${PYTHON_VERSIONS:="6 7 8 9 10"}
|
|
: ${BUILD_CI:=""}
|
|
: ${PUSH:=0}
|
|
: ${RETRY:=3}
|
|
|
|
set -e
|
|
|
|
tolower()
|
|
{
|
|
echo "$@" | awk -F '\|~\|' '{print tolower($1)}';
|
|
}
|
|
|
|
toupper()
|
|
{
|
|
echo "$@" | awk -F '\|~\|' '{print toupper($1)}';
|
|
}
|
|
|
|
usage()
|
|
{
|
|
print_option() { printf " --%-20s %-24s %s\n" "${1}" "${2}" "${3}"; }
|
|
echo "Options:"
|
|
print_option "help -h" "" "This message"
|
|
|
|
echo ""
|
|
print_default_option() { printf " --%-20s %-24s %s (default: %s)\n" "${1}" "${2}" "${3}" "$(tolower ${4})"; }
|
|
print_default_option distro "[ubuntu|opensuse|rhel]" "OS distribution" "${DISTRO}"
|
|
print_default_option versions "[VERSION] [VERSION...]" "Ubuntu, OpenSUSE, or RHEL release" "${VERSIONS}"
|
|
print_default_option rocm-versions "[VERSION] [VERSION...]" "ROCm versions" "${ROCM_VERSIONS}"
|
|
print_default_option python-versions "[VERSION] [VERSION...]" "Python 3 minor releases" "${PYTHON_VERSIONS}"
|
|
print_default_option "user -u" "[USERNAME]" "DockerHub username" "${USER}"
|
|
print_default_option "retry -r" "[N]" "Number of attempts to build (to account for network errors)" "${RETRY}"
|
|
print_default_option push "" "Push the image to Dockerhub" ""
|
|
#print_default_option lto "[on|off]" "Enable LTO" "${LTO}"
|
|
}
|
|
|
|
send-error()
|
|
{
|
|
usage
|
|
echo -e "\nError: ${@}"
|
|
exit 1
|
|
}
|
|
|
|
verbose-run()
|
|
{
|
|
echo -e "\n### Executing \"${@}\"... ###\n"
|
|
eval "${@}"
|
|
}
|
|
|
|
verbose-build()
|
|
{
|
|
echo -e "\n### Executing \"${@}\" a maximum of ${RETRY} times... ###\n"
|
|
for i in $(seq 1 1 ${RETRY})
|
|
do
|
|
set +e
|
|
eval "${@}"
|
|
local RETC=$?
|
|
set -e
|
|
if [ "${RETC}" -eq 0 ]; then
|
|
break
|
|
else
|
|
echo -en "\n### Command failed with error code ${RETC}... "
|
|
if [ "${i}" -ne "${RETRY}" ]; then
|
|
echo -e "Retrying... ###\n"
|
|
sleep 3
|
|
else
|
|
echo -e "Exiting... ###\n"
|
|
exit ${RETC}
|
|
fi
|
|
fi
|
|
done
|
|
}
|
|
|
|
reset-last()
|
|
{
|
|
last() { send-error "Unsupported argument :: ${1}"; }
|
|
}
|
|
|
|
reset-last
|
|
|
|
n=0
|
|
while [[ $# -gt 0 ]]
|
|
do
|
|
case "${1}" in
|
|
-h|--help)
|
|
usage
|
|
exit 0
|
|
;;
|
|
"--distro")
|
|
shift
|
|
DISTRO=${1}
|
|
last() { DISTRO="${DISTRO} ${1}"; }
|
|
;;
|
|
"--versions")
|
|
shift
|
|
VERSIONS=${1}
|
|
last() { VERSIONS="${VERSIONS} ${1}"; }
|
|
;;
|
|
"--rocm-versions")
|
|
shift
|
|
ROCM_VERSIONS=${1}
|
|
last() { ROCM_VERSIONS="${ROCM_VERSIONS} ${1}"; }
|
|
;;
|
|
"--python-versions")
|
|
shift
|
|
PYTHON_VERSIONS=${1}
|
|
last() { PYTHON_VERSIONS="${PYTHON_VERSIONS} ${1}"; }
|
|
;;
|
|
--user|-u)
|
|
shift
|
|
USER=${1}
|
|
reset-last
|
|
;;
|
|
--push)
|
|
PUSH=1
|
|
;;
|
|
--retry|-r)
|
|
shift
|
|
RETRY=${1}
|
|
reset-last
|
|
;;
|
|
"--*")
|
|
send-error "Unsupported argument at position $((${n} + 1)) :: ${1}"
|
|
;;
|
|
*)
|
|
last ${1}
|
|
;;
|
|
esac
|
|
n=$((${n} + 1))
|
|
shift
|
|
done
|
|
|
|
DOCKER_FILE="Dockerfile.${DISTRO}"
|
|
|
|
if [ -n "${BUILD_CI}" ]; then DOCKER_FILE="${DOCKER_FILE}.ci"; fi
|
|
if [ ! -f ${DOCKER_FILE} ]; then cd docker; fi
|
|
if [ ! -f ${DOCKER_FILE} ]; then send-error "File \"${DOCKER_FILE}\" not found"; fi
|
|
|
|
for VERSION in ${VERSIONS}
|
|
do
|
|
VERSION_MAJOR=$(echo ${VERSION} | sed 's/\./ /g' | awk '{print $1}')
|
|
VERSION_MINOR=$(echo ${VERSION} | sed 's/\./ /g' | awk '{print $2}')
|
|
VERSION_PATCH=$(echo ${VERSION} | sed 's/\./ /g' | awk '{print $3}')
|
|
for ROCM_VERSION in ${ROCM_VERSIONS}
|
|
do
|
|
CONTAINER=${USER}/omnitrace:release-base-${DISTRO}-${VERSION}-rocm-${ROCM_VERSION}
|
|
ROCM_MAJOR=$(echo ${ROCM_VERSION} | sed 's/\./ /g' | awk '{print $1}')
|
|
ROCM_MINOR=$(echo ${ROCM_VERSION} | sed 's/\./ /g' | awk '{print $2}')
|
|
ROCM_PATCH=$(echo ${ROCM_VERSION} | sed 's/\./ /g' | awk '{print $3}')
|
|
if [ -n "${ROCM_PATCH}" ]; then
|
|
ROCM_VERSN=$(( (${ROCM_MAJOR}*10000)+(${ROCM_MINOR}*100)+(${ROCM_PATCH}) ))
|
|
ROCM_SEP="."
|
|
else
|
|
ROCM_VERSN=$(( (${ROCM_MAJOR}*10000)+(${ROCM_MINOR}*100) ))
|
|
ROCM_SEP=""
|
|
fi
|
|
if [ "${DISTRO}" = "ubuntu" ]; then
|
|
ROCM_REPO_DIST="ubuntu"
|
|
ROCM_REPO_VERSION=${ROCM_VERSION}
|
|
case "${ROCM_VERSION}" in
|
|
4.1* | 4.0*)
|
|
ROCM_REPO_DIST="xenial"
|
|
;;
|
|
5.3* | 5.4*)
|
|
case "${VERSION}" in
|
|
22.04)
|
|
ROCM_REPO_DIST="jammy"
|
|
;;
|
|
20.04)
|
|
ROCM_REPO_DIST="focal"
|
|
;;
|
|
18.04)
|
|
ROCM_REPO_DIST="bionic"
|
|
;;
|
|
*)
|
|
;;
|
|
esac
|
|
;;
|
|
*)
|
|
;;
|
|
esac
|
|
verbose-build docker build . -f ${DOCKER_FILE} --tag ${CONTAINER} --build-arg DISTRO=${DISTRO} --build-arg VERSION=${VERSION} --build-arg ROCM_VERSION=${ROCM_VERSION} --build-arg ROCM_REPO_VERSION=${ROCM_REPO_VERSION} --build-arg ROCM_REPO_DIST=${ROCM_REPO_DIST} --build-arg PYTHON_VERSIONS=\"${PYTHON_VERSIONS}\"
|
|
elif [ "${DISTRO}" = "rhel" ]; then
|
|
if [ -z "${VERSION_MINOR}" ]; then
|
|
send-error "Please provide a major and minor version of the OS. Supported: >= 8.7, <= 9.1"
|
|
fi
|
|
|
|
# Components used to create the sub-URL below
|
|
# set <OS-VERSION> in amdgpu-install/<ROCM-VERSION>/rhel/<OS-VERSION>
|
|
RPM_PATH=${VERSION_MAJOR}.${VERSION_MINOR}
|
|
RPM_TAG=".el${VERSION_MAJOR}"
|
|
|
|
# set the sub-URL in https://repo.radeon.com/amdgpu-install/<sub-URL>
|
|
case "${ROCM_VERSION}" in
|
|
5.4 | 5.4.*)
|
|
ROCM_RPM=${ROCM_VERSION}/rhel/${RPM_PATH}/amdgpu-install-${ROCM_MAJOR}.${ROCM_MINOR}.${ROCM_VERSN}-1${RPM_TAG}.noarch.rpm
|
|
;;
|
|
5.3 | 5.3.*)
|
|
ROCM_RPM=${ROCM_VERSION}/rhel/${RPM_PATH}/amdgpu-install-${ROCM_MAJOR}.${ROCM_MINOR}.${ROCM_VERSN}-1${RPM_TAG}.noarch.rpm
|
|
;;
|
|
5.2 | 5.2.* | 5.1 | 5.1.* | 5.0 | 5.0.* | 4.*)
|
|
send-error "Invalid ROCm version ${ROCM_VERSION}. Supported: >= 5.3.0, <= 5.4.x"
|
|
;;
|
|
0.0)
|
|
;;
|
|
*)
|
|
send-error "Unsupported combination :: ${DISTRO}-${VERSION} + ROCm ${ROCM_VERSION}"
|
|
;;
|
|
esac
|
|
|
|
# use Rocky Linux as a base image for RHEL builds
|
|
DISTRO_BASE_IMAGE=rockylinux
|
|
|
|
verbose-build docker build . -f ${DOCKER_FILE} --tag ${CONTAINER} --build-arg DISTRO=${DISTRO_BASE_IMAGE} --build-arg VERSION=${VERSION} --build-arg ROCM_VERSION=${ROCM_VERSION} --build-arg AMDGPU_RPM=${ROCM_RPM} --build-arg PYTHON_VERSIONS=\"${PYTHON_VERSIONS}\"
|
|
elif [ "${DISTRO}" = "opensuse" ]; then
|
|
case "${VERSION}" in
|
|
15.*)
|
|
DISTRO_IMAGE="opensuse/leap"
|
|
echo "DISTRO_IMAGE: ${DISTRO_IMAGE}"
|
|
;;
|
|
*)
|
|
send-error "Invalid opensuse version ${VERSION}. Supported: 15.x"
|
|
;;
|
|
esac
|
|
case "${ROCM_VERSION}" in
|
|
5.4 | 5.4.*)
|
|
ROCM_RPM=${ROCM_VERSION}/sle/${VERSION}/amdgpu-install-${ROCM_MAJOR}.${ROCM_MINOR}.${ROCM_VERSN}-1.noarch.rpm
|
|
;;
|
|
5.3 | 5.3.*)
|
|
ROCM_RPM=${ROCM_VERSION}/sle/${VERSION}/amdgpu-install-${ROCM_MAJOR}.${ROCM_MINOR}.${ROCM_VERSN}-1.noarch.rpm
|
|
;;
|
|
5.2 | 5.2.*)
|
|
ROCM_RPM=22.20${ROCM_SEP}${ROCM_PATCH}/sle/${VERSION}/amdgpu-install-22.20.${ROCM_VERSN}-1.noarch.rpm
|
|
;;
|
|
5.1 | 5.1.*)
|
|
ROCM_RPM=22.10${ROCM_SEP}${ROCM_PATCH}/sle/15/amdgpu-install-22.10${ROCM_SEP}${ROCM_PATCH}.${ROCM_VERSN}-1.noarch.rpm
|
|
;;
|
|
5.0 | 5.0.*)
|
|
ROCM_RPM=21.50${ROCM_SEP}${ROCM_PATCH}/sle/15/amdgpu-install-21.50${ROCM_SEP}${ROCM_PATCH}.${ROCM_VERSN}-1.noarch.rpm
|
|
;;
|
|
4.5 | 4.5.*)
|
|
ROCM_RPM=21.40${ROCM_SEP}${ROCM_PATCH}/sle/15/amdgpu-install-21.40${ROCM_SEP}${ROCM_PATCH}.${ROCM_VERSN}-1.noarch.rpm
|
|
;;
|
|
0.0)
|
|
;;
|
|
*)
|
|
send-error "Unsupported combination :: ${DISTRO}-${VERSION} + ROCm ${ROCM_VERSION}"
|
|
;;
|
|
esac
|
|
PERL_REPO="SLE_${VERSION_MAJOR}_SP${VERSION_MINOR}"
|
|
verbose-build docker build . -f ${DOCKER_FILE} --tag ${CONTAINER} --build-arg DISTRO=${DISTRO_IMAGE} --build-arg VERSION=${VERSION} --build-arg ROCM_VERSION=${ROCM_VERSION} --build-arg AMDGPU_RPM=${ROCM_RPM} --build-arg PERL_REPO=${PERL_REPO} --build-arg PYTHON_VERSIONS=\"${PYTHON_VERSIONS}\"
|
|
fi
|
|
if [ "${PUSH}" -ne 0 ]; then
|
|
docker push ${CONTAINER}
|
|
fi
|
|
done
|
|
done
|