| # |
| # Licensed to the Apache Software Foundation (ASF) under one or more |
| # contributor license agreements. See the NOTICE file distributed with |
| # this work for additional information regarding copyright ownership. |
| # The ASF licenses this file to You under the Apache License, Version 2.0 |
| # (the "License"); you may not use this file except in compliance with |
| # the License. You may obtain a copy of the License at |
| # |
| # http://www.apache.org/licenses/LICENSE-2.0 |
| # |
| # Unless required by applicable law or agreed to in writing, software |
| # distributed under the License is distributed on an "AS IS" BASIS, |
| # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. |
| # See the License for the specific language governing permissions and |
| # limitations under the License. |
| # |
| # This Dockerfile builds the Spark environment used by the |
| # integration test suite. |
| |
| # Base image, pinned to an explicit tag so rebuilds start from the same notebook image. |
| FROM jupyter/all-spark-notebook:07a7c4d6d447 |
| |
| # Switch to root: the RUN steps below install packages and write under /usr/local. |
| USER root |
| |
| # Spark release to install; the RUN steps below use it to build the tarball and directory names. |
| ENV APACHE_SPARK_VERSION=2.0.0 |
| |
| # Temporarily add jessie-backports to get OpenJDK 8, then remove that source again. |
| # The apt cache and package lists are cleaned in this same RUN so they do not persist in the layer, |
| # and the Java 8 runtime is finally selected as the default `java` alternative. |
| # NOTE(review): confirm ftp.debian.org still serves jessie-backports; retired suites are usually moved to archive.debian.org. |
| RUN echo 'deb http://ftp.debian.org/debian jessie-backports main' > /etc/apt/sources.list.d/jessie-backports.list && \ |
| apt-get update && \ |
| apt-get install -y --no-install-recommends -t jessie-backports openjdk-8-jre-headless && \ |
| rm /etc/apt/sources.list.d/jessie-backports.list && \ |
| apt-get clean && \ |
| rm -rf /var/lib/apt/lists/* && \ |
| update-alternatives --set java /usr/lib/jvm/java-8-openjdk-amd64/jre/bin/java |
| |
| |
| # Install Spark 2: download the release tarball into /tmp, verify its SHA-256 checksum, |
| # unpack it under /usr/local, and delete the tarball in the same layer. |
| RUN cd /tmp && \ |
| spark_tgz="spark-${APACHE_SPARK_VERSION}-bin-hadoop2.6.tgz" && \ |
| wget -q "http://d3kbcqa49mib13.cloudfront.net/${spark_tgz}" && \ |
| echo "e17d9da4b3ac463ea3ce42289f2a71cefb479d154b1ffd00310c7d7ab207aa2c *${spark_tgz}" | sha256sum -c - && \ |
| tar xzf "${spark_tgz}" -C /usr/local && \ |
| rm "${spark_tgz}" |
| |
| # Replace the existing /usr/local/spark link with one pointing at the versioned Spark directory. |
| # The link target is kept relative, so it resolves inside /usr/local. |
| RUN rm /usr/local/spark && \ |
| ln -s "spark-${APACHE_SPARK_VERSION}-bin-hadoop2.6" /usr/local/spark |
| |