Dockerfile 1.2 KB

12345678910111213141516171819202122232425262728293031323334
  1. # Copyright (c) 2020 NVIDIA CORPORATION. All rights reserved.
  2. #
  3. # Licensed under the Apache License, Version 2.0 (the "License");
  4. # you may not use this file except in compliance with the License.
  5. # You may obtain a copy of the License at
  6. #
  7. # http://www.apache.org/licenses/LICENSE-2.0
  8. #
  9. # Unless required by applicable law or agreed to in writing, software
  10. # distributed under the License is distributed on an "AS IS" BASIS,
  11. # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
  12. # See the License for the specific language governing permissions and
  13. # limitations under the License.
  # Base image selection. Override at build time with
  #   --build-arg FROM_IMAGE_NAME=<image>
  # The default is the PyTorch 20.03 (py3) image from nvcr.io.
  ARG FROM_IMAGE_NAME=nvcr.io/nvidia/pytorch:20.03-py3
  FROM $FROM_IMAGE_NAME
  # Install OpenJDK 8 and unpack Spark 2.4.5 (Hadoop 2.7 build) under /opt.
  # Everything runs in a single layer so that the apt package lists and the
  # downloaded tarball are removed before the layer is committed.
  # - apt-get is used instead of apt, whose CLI is not meant for scripts.
  # - curl -f makes an HTTP error fail the build instead of saving an error page.
  # NOTE(review): the tarball is not checksum-verified; consider pinning its
  # published SHA-512 and checking it before extraction.
  RUN apt-get update && \
      apt-get install -y --no-install-recommends openjdk-8-jdk && \
      rm -rf /var/lib/apt/lists/* && \
      curl -fsSL https://archive.apache.org/dist/spark/spark-2.4.5/spark-2.4.5-bin-hadoop2.7.tgz \
           -o /opt/spark-2.4.5-bin-hadoop2.7.tgz && \
      tar zxf /opt/spark-2.4.5-bin-hadoop2.7.tgz -C /opt/ && \
      rm /opt/spark-2.4.5-bin-hadoop2.7.tgz
  # Copy only the dependency manifest before installing, so this layer stays
  # cached until requirements.txt itself changes. COPY is used rather than ADD
  # because this is a plain local file (no archive extraction or URL fetch).
  COPY requirements.txt .
  # --no-cache-dir keeps pip's download cache out of the image layer.
  RUN pip install --no-cache-dir -r requirements.txt
  # Remove any apex already installed, then build and install it from the
  # upstream repository with the C++ and CUDA extensions enabled.
  # - A shallow clone is enough: only the current tree is needed for the build.
  # - pip is pointed at ./apex directly, so no `cd` is needed inside RUN.
  # - The source tree is deleted in the same layer; the install is not editable,
  #   so the checkout is not needed afterwards.
  # NOTE(review): the clone is not pinned to a tag or commit, so rebuilds may
  # pick up a different apex revision — consider pinning one known to work
  # with the base image.
  RUN pip uninstall -y apex && \
      git clone --depth 1 https://github.com/NVIDIA/apex && \
      pip install -v --no-cache-dir --global-option="--cpp_ext" --global-option="--cuda_ext" ./apex && \
      rm -rf apex
  # Make /workspace/dlrm the working directory for the remaining instructions
  # and copy the whole build context into it.
  # NOTE(review): what gets copied depends on the build context and any
  # .dockerignore, neither of which is visible from this file.
  WORKDIR /workspace/dlrm
  COPY . ./