Skip to content

Commit

Permalink
Install numpy on all spark images
Browse files Browse the repository at this point in the history
  • Loading branch information
mattf committed Nov 20, 2015
1 parent fc8f567 commit fb4afda
Showing 1 changed file with 7 additions and 0 deletions.
7 changes: 7 additions & 0 deletions examples/spark/images/base/Dockerfile
Original file line number Diff line number Diff line change
Expand Up @@ -26,6 +26,13 @@ RUN mkdir -p /opt && \
# Download the Google Cloud Storage connector jar into Spark's lib directory.
# NOTE(review): the URL points at a "latest" artifact and the download is not
# checksum-verified, so rebuilds may pick up a different jar — consider pinning.
RUN wget \
      -O /opt/spark/lib/gcs-connector-latest-hadoop2.jar \
      https://storage.googleapis.com/hadoop-lib/gcs/gcs-connector-latest-hadoop2.jar

# If numpy is installed on a driver it needs to be installed on all
# workers, so install it in the base image that every Spark image shares.
#
# The package index refresh, the install, and the cleanup are kept in a
# single RUN so the apt lists and package cache never persist in a layer.
# --no-install-recommends keeps optional "recommended" packages out of the
# image; only numpy and its hard dependencies are installed.
RUN apt-get update && \
    apt-get install -y --no-install-recommends python-numpy && \
    apt-get clean && \
    rm -rf /var/lib/apt/lists/*

# Copy the Spark logging config, the shared startup script, and the Hadoop
# core-site config from the build context into the image.
# COPY is used instead of ADD: these are plain local files, so ADD's extra
# behaviors (local tar auto-extraction, remote URL fetch) are not needed.
COPY log4j.properties /opt/spark/conf/log4j.properties
COPY start-common.sh /
COPY core-site.xml /opt/spark/conf/core-site.xml
Expand Down

0 comments on commit fb4afda

Please sign in to comment.