Skip to content

Commit 41cc33f

Browse files
tgrel authored and nv-kkudrynski committed
[DLRM/TF2] Fix preprocessing and training Dockerfiles
1 parent 16c0b93 commit 41cc33f

File tree

2 files changed

+7
-5
lines changed

2 files changed

+7
-5
lines changed

TensorFlow2/Recommendation/DLRM/Dockerfile

+5 -3
Original file line number | Diff line number | Diff line change
@@ -18,11 +18,13 @@
1818
ARG FROM_IMAGE_NAME=nvcr.io/nvidia/tensorflow:21.06-tf2-py3
1919
FROM ${FROM_IMAGE_NAME}
2020

21-
RUN pip install -e git+https://github.com/NVIDIA/dllogger#egg=dllogger
21+
WORKDIR /dlrm
2222

23-
ENV HOROVOD_CYCLE_TIME=0.1
23+
ADD requirements.txt .
2424

25-
WORKDIR /dlrm
25+
RUN pip install -r requirements.txt
26+
27+
ENV HOROVOD_CYCLE_TIME=0.1
2628

2729
ADD . .
2830

TensorFlow2/Recommendation/DLRM/Dockerfile_spark

+2 -2
Original file line number | Diff line number | Diff line change
@@ -18,7 +18,7 @@ FROM ${FROM_IMAGE_NAME}
1818
RUN apt update && \
1919
apt install -y openjdk-8-jdk && \
2020
apt install -y curl && \
21-
curl https://archive.apache.org/dist/spark/spark-3.0.1/spark-3.0.1-bin-hadoop2.7.tgz -o /opt/spark.tgz && \
21+
curl https://archive.apache.org/dist/spark/spark-3.0.1/spark-3.0.1-bin-hadoop3.2.tgz -o /opt/spark.tgz && \
2222
tar zxf /opt/spark.tgz -C /opt/ && \
2323
mv /opt/spark-3.0.1-bin-hadoop3.2 /opt/spark && \
2424
rm /opt/spark.tgz && \
@@ -27,7 +27,7 @@ RUN apt update && \
2727
apt install -y git
2828

2929
ADD requirements.txt .
30-
RUN apt install -y python3-pip && pip3 install -r requirements.txt
30+
RUN apt install -y python3-pip && python3 -m pip install --upgrade pip && pip3 install -r requirements.txt
3131

3232
WORKDIR /workspace/dlrm
3333

0 commit comments

Comments
 (0)