Skip to content

Commit

Permalink
Updated the image ml-tensorflow-gpu:alma9-python39 to resolve the CUDA_ERROR_SYSTEM_DRIVER_MISMATCH problem
Browse files Browse the repository at this point in the history
  • Loading branch information
Shuwei Ye authored and Shuwei Ye committed May 23, 2024
1 parent d65cd2b commit 7fc792d
Show file tree
Hide file tree
Showing 2 changed files with 80 additions and 100 deletions.
8 changes: 4 additions & 4 deletions alma9/ml-tensorflow-gpu/ml-tensorflow-gpu.Dockerfile
Original file line number Diff line number Diff line change
Expand Up @@ -11,8 +11,8 @@ RUN yum -y install which file git bzip2 \

# path prefix for micromamba to install pkgs into
#
ARG TF_ver=2.15.0
ARG Conda_ver=12.4
ARG TF_ver=2.14.*
ARG Conda_ver=12.3.*
ARG prefix=/opt/conda
ARG Micromamba_ver=1.5.7
ARG PyVer=3.9
Expand Down Expand Up @@ -84,7 +84,7 @@ RUN micromamba install -y lightgbm xgboost catboost \
# TensorFlow Datasets: a collection of ready-to-use datasets
#
RUN export CONDA_OVERRIDE_CUDA=$Conda_ver \
&& micromamba install -y tensorflow-gpu=$TF_ver cuda-compat tensorflow-datasets \
&& micromamba install -y tensorflow-gpu=$TF_ver cuda-compat=$Conda_ver tensorflow-datasets \
&& cd $prefix/lib && ln -s ../cuda-compat/lib*.so* . \
&& micromamba clean -y -a -f

Expand All @@ -93,7 +93,7 @@ RUN micromamba install -y keras-tuner keras-cv \
&& micromamba clean -y -a -f

# Install keras-nlp
RUN $prefix/bin/python -m pip install keras-nlp tf_keras==2.15.0 tensorflow-text==2.15.0 \
RUN $prefix/bin/python -m pip install keras-nlp tf_keras==$TF_ver tensorflow-text==$TF_ver \
&& $prefix/bin/python -m pip cache purge

# get the command lspci to enable gpu checking in shell
Expand Down
Loading

0 comments on commit 7fc792d

Please sign in to comment.