mirror of
https://github.com/sbrl/research-rainfallradar
synced 2024-11-22 01:12:59 +00:00
slurm/dlr: tensorflow is dumb
Workaround for this crash on Tensorflow 2.13: Could not load library libcublasLt.so.12. Error: libcublasLt.so.12: cannot open shared object file: No such file or directory
This commit is contained in:
parent
52af6f00ec
commit
17d2d2bcaf
1 changed file with 7 additions and 0 deletions
|
@@ -21,6 +21,13 @@ command_exists() {
|
||||||
|
|
||||||
#######################################################
|
#######################################################
|
||||||
|
|
||||||
|
# Fix "Could not load library libcublasLt.so.12. Error: libcublasLt.so.12: cannot open shared object file: No such file or directory" error
# (crash seen on Tensorflow 2.13).
#
# Applies only on the CS cluster (SLURM_CLUSTER_NAME == "cs-cluster"). That
# cluster has no modules (the `module load` section further down is skipped
# there), so CUDA is presumably made available by the per-user setup script
# at ~/cuda/activate.sh instead - TODO confirm what that script exports.
#
# NOTE(review): this guard previously read != "cs-cluster", which contradicted
# the log message below and sourced the script on every cluster EXCEPT the one
# it was written for.
#
# ${SLURM_CLUSTER_NAME:-} keeps the test safe when the variable is unset
# (e.g. running outside of Slurm with `set -u` active).
if [[ "${SLURM_CLUSTER_NAME:-}" == "cs-cluster" && -d "${HOME}/cuda" ]]; then
	echo "[slurm_runner] csgpu cluster detected, sourcing extra CUDA setup script" >&2;
	# The script lives outside the repository, so shellcheck cannot follow it.
	#shellcheck source=/dev/null
	source "${HOME}/cuda/activate.sh";
fi
|
||||||
|
|
||||||
# No modules on the CS cluster
|
# No modules on the CS cluster
|
||||||
if command_exists module && [[ "${SLURM_CLUSTER_NAME}" != "cs-cluster" ]]; then
|
if command_exists module && [[ "${SLURM_CLUSTER_NAME}" != "cs-cluster" ]]; then
|
||||||
module load utilities/multi
|
module load utilities/multi
|
||||||
|
|
Loading…
Reference in a new issue