Skip to content

Commit 0599172

Browse files
committed
Update the Spark Dockerfile for the new Spark and Scala versions
1 parent 940beff commit 0599172

File tree

1 file changed

+12
-18
lines changed

1 file changed

+12
-18
lines changed

spark/Dockerfile

Lines changed: 12 additions & 18 deletions
Original file line numberDiff line numberDiff line change
@@ -8,34 +8,28 @@ apt-get clean && \
88
rm -rf /var/lib/apt/lists/*
99

1010
RUN useradd --create-home --shell /bin/bash ubuntu
11-
USER ubuntu
1211

1312
ENV HOME /home/ubuntu
14-
ENV SPARK_VERSION 1.6.1
13+
ENV SPARK_VERSION 1.6.2
1514
ENV HADOOP_VERSION 2.6
16-
ENV MONGO_HADOOP_VERSION 1.5.2
17-
ENV MONGO_JAVA_VERSION 3.2.2
15+
ENV MONGO_SPARK_VERSION 1.0.0
16+
ENV SCALA_VERSION 2.11
1817

1918
WORKDIR ${HOME}
2019

20+
COPY files/times.json /home/ubuntu/times.json
21+
COPY files/readme.txt /home/ubuntu/readme.txt
22+
COPY files/reduceByKey.scala /home/ubuntu/reduceByKey.scala
23+
COPY files/initDocuments.scala /home/ubuntu/initDocuments.scala
24+
25+
RUN chown -R ubuntu:ubuntu /home/ubuntu/*
26+
USER ubuntu
27+
2128
# get spark
2229
RUN wget http://apache.mirror.digitalpacific.com.au/spark/spark-${SPARK_VERSION}/spark-${SPARK_VERSION}-bin-hadoop${HADOOP_VERSION}.tgz && \
2330
tar xvf spark-${SPARK_VERSION}-bin-hadoop${HADOOP_VERSION}.tgz
2431

2532
RUN rm -fv spark-${SPARK_VERSION}-bin-hadoop${HADOOP_VERSION}.tgz
2633

27-
# get mongo-hadoop
28-
RUN wget -O mongo-hadoop-spark-${MONGO_HADOOP_VERSION}.jar http://search.maven.org/remotecontent?filepath=org/mongodb/mongo-hadoop/mongo-hadoop-spark/${MONGO_HADOOP_VERSION}/mongo-hadoop-spark-${MONGO_HADOOP_VERSION}.jar
29-
30-
31-
# get mongo java driver
32-
RUN wget http://central.maven.org/maven2/org/mongodb/mongo-java-driver/3.2.2/mongo-java-driver-${MONGO_JAVA_VERSION}.jar
33-
3434
# Run single node of spark
35-
RUN ${HOME}/spark-${SPARK_VERSION}-bin-hadoop${HADOOP_VERSION}/sbin/start-master.sh
36-
37-
COPY files/times.json /home/ubuntu/times.json
38-
39-
# add readme file to start-up
40-
COPY files/readme.txt /home/ubuntu/readme.txt
41-
COPY files/reduceByKey.scala /home/ubuntu/reduceByKey.scala
35+
RUN ${HOME}/spark-${SPARK_VERSION}-bin-hadoop${HADOOP_VERSION}/sbin/start-master.sh

0 commit comments

Comments
 (0)