Parameterize the Spark distribution used by the Dockerfile.

The download URL and the name of the unpacked directory become build
arguments (DISTRO_LOC and DISTRO_NAME). Their defaults are the values that
were previously hard-coded (spark-2.1.0-bin-hadoop2.7), and the RUN step
that downloads, unpacks and symlinks the distribution now reads them.
Override with: docker build --build-arg DISTRO_LOC=... --build-arg DISTRO_NAME=...

NOTE(review): line breaks, blank context lines and continuation-line
indentation were reconstructed to agree with the hunk header counts
(-3,13 +3,16); confirm them against the target Dockerfile before applying.

diff --git a/Dockerfile b/Dockerfile
index 4d28a3c..90e2374 100644
--- a/Dockerfile
+++ b/Dockerfile
@@ -3,13 +3,16 @@ FROM centos:latest
 MAINTAINER Matthew Farrellee
 USER root
 
+ARG DISTRO_LOC=https://dist.apache.org/repos/dist/release/spark/spark-2.1.0/spark-2.1.0-bin-hadoop2.7.tgz
+ARG DISTRO_NAME=spark-2.1.0-bin-hadoop2.7
+
 RUN yum install -y epel-release tar java && \
     yum clean all
 
 RUN cd /opt && \
-    curl https://dist.apache.org/repos/dist/release/spark/spark-2.1.0/spark-2.1.0-bin-hadoop2.7.tgz | \
+    curl $DISTRO_LOC | \
         tar -zx && \
-    ln -s spark-2.1.0-bin-hadoop2.7 spark
+    ln -s $DISTRO_NAME spark
 
 # when the containers are not run w/ uid 0, the uid may not map in
 # /etc/passwd and it may not be possible to modify things like