From c9bd0ff3170935580f75f29cb9e4025403419e6a Mon Sep 17 00:00:00 2001 From: Javier Ivan Venegas Carrillo Date: Thu, 8 Nov 2018 16:29:41 -0700 Subject: [PATCH 1/7] Bumped Spark to 2.4.0 and py4j to 0.10.8.1 --- pyspark-notebook/Dockerfile | 6 +++--- 1 file changed, 3 insertions(+), 3 deletions(-) diff --git a/pyspark-notebook/Dockerfile b/pyspark-notebook/Dockerfile index 8ef0ed23..740b80f6 100644 --- a/pyspark-notebook/Dockerfile +++ b/pyspark-notebook/Dockerfile @@ -8,7 +8,7 @@ LABEL maintainer="Jupyter Project " USER root # Spark dependencies -ENV APACHE_SPARK_VERSION 2.3.1 +ENV APACHE_SPARK_VERSION 2.4.0 ENV HADOOP_VERSION 2.7 RUN apt-get -y update && \ @@ -18,7 +18,7 @@ RUN apt-get -y update && \ RUN cd /tmp && \ wget -q http://mirrors.ukfast.co.uk/sites/ftp.apache.org/spark/spark-${APACHE_SPARK_VERSION}/spark-${APACHE_SPARK_VERSION}-bin-hadoop${HADOOP_VERSION}.tgz && \ - echo "DC3A97F3D99791D363E4F70A622B84D6E313BD852F6FDBC777D31EAB44CBC112CEEAA20F7BF835492FB654F48AE57E9969F93D3B0E6EC92076D1C5E1B40B4696 *spark-${APACHE_SPARK_VERSION}-bin-hadoop${HADOOP_VERSION}.tgz" | sha512sum -c - && \ + echo "5F4184E0FE7E5C8AE67F5E6BC5DEEE881051CC712E9FF8AEDDF3529724C00E402C94BB75561DD9517A372F06C1FCB78DC7AE65DCBD4C156B3BA4D8E267EC2936 *spark-${APACHE_SPARK_VERSION}-bin-hadoop${HADOOP_VERSION}.tgz" | sha512sum -c - && \ tar xzf spark-${APACHE_SPARK_VERSION}-bin-hadoop${HADOOP_VERSION}.tgz -C /usr/local --owner root --group root --no-same-owner && \ rm spark-${APACHE_SPARK_VERSION}-bin-hadoop${HADOOP_VERSION}.tgz RUN cd /usr/local && ln -s spark-${APACHE_SPARK_VERSION}-bin-hadoop${HADOOP_VERSION} spark @@ -39,7 +39,7 @@ RUN apt-get -y update && \ # Spark and Mesos config ENV SPARK_HOME /usr/local/spark -ENV PYTHONPATH $SPARK_HOME/python:$SPARK_HOME/python/lib/py4j-0.10.7-src.zip +ENV PYTHONPATH $SPARK_HOME/python:$SPARK_HOME/python/lib/py4j-0.10.8.1-src.zip ENV MESOS_NATIVE_LIBRARY /usr/local/lib/libmesos.so ENV SPARK_OPTS --driver-java-options=-Xms1024M 
--driver-java-options=-Xmx4096M --driver-java-options=-Dlog4j.logLevel=info From 5162984d028416475034511afe868ca1e5bb0e93 Mon Sep 17 00:00:00 2001 From: Javier Ivan Venegas Carrillo Date: Thu, 8 Nov 2018 16:41:04 -0700 Subject: [PATCH 2/7] Update for test --- pyspark-notebook/Dockerfile | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/pyspark-notebook/Dockerfile b/pyspark-notebook/Dockerfile index 740b80f6..267a0e28 100644 --- a/pyspark-notebook/Dockerfile +++ b/pyspark-notebook/Dockerfile @@ -39,7 +39,7 @@ RUN apt-get -y update && \ # Spark and Mesos config ENV SPARK_HOME /usr/local/spark -ENV PYTHONPATH $SPARK_HOME/python:$SPARK_HOME/python/lib/py4j-0.10.8.1-src.zip +ENV PYTHONPATH $SPARK_HOME/python:$SPARK_HOME/python/lib/py4j-0.10.7-src.zip ENV MESOS_NATIVE_LIBRARY /usr/local/lib/libmesos.so ENV SPARK_OPTS --driver-java-options=-Xms1024M --driver-java-options=-Xmx4096M --driver-java-options=-Dlog4j.logLevel=info From dd3a1989225f3c1232ff4b7ef367fd6fbc85c265 Mon Sep 17 00:00:00 2001 From: Javier Ivan Venegas Carrillo Date: Thu, 8 Nov 2018 17:04:10 -0700 Subject: [PATCH 3/7] Update for test with py4j update --- pyspark-notebook/Dockerfile | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/pyspark-notebook/Dockerfile b/pyspark-notebook/Dockerfile index 267a0e28..642c2a35 100644 --- a/pyspark-notebook/Dockerfile +++ b/pyspark-notebook/Dockerfile @@ -39,7 +39,7 @@ RUN apt-get -y update && \ # Spark and Mesos config ENV SPARK_HOME /usr/local/spark -ENV PYTHONPATH $SPARK_HOME/python:$SPARK_HOME/python/lib/py4j-0.10.7-src.zip +ENV PYTHONPATH $SPARK_HOME/python:$SPARK_HOME/python/lib/py4j-0.10.8-src.zip ENV MESOS_NATIVE_LIBRARY /usr/local/lib/libmesos.so ENV SPARK_OPTS --driver-java-options=-Xms1024M --driver-java-options=-Xmx4096M --driver-java-options=-Dlog4j.logLevel=info From 777eec10c32be0b59e1e02acc30b39dfca1f7c4f Mon Sep 17 00:00:00 2001 From: Javier Ivan Venegas Carrillo Date: Thu, 8 Nov 2018 17:29:03 -0700 Subject: [PATCH 4/7] 
Update for test with py4j update for test --- pyspark-notebook/Dockerfile | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/pyspark-notebook/Dockerfile b/pyspark-notebook/Dockerfile index 642c2a35..740b80f6 100644 --- a/pyspark-notebook/Dockerfile +++ b/pyspark-notebook/Dockerfile @@ -39,7 +39,7 @@ RUN apt-get -y update && \ # Spark and Mesos config ENV SPARK_HOME /usr/local/spark -ENV PYTHONPATH $SPARK_HOME/python:$SPARK_HOME/python/lib/py4j-0.10.8-src.zip +ENV PYTHONPATH $SPARK_HOME/python:$SPARK_HOME/python/lib/py4j-0.10.8.1-src.zip ENV MESOS_NATIVE_LIBRARY /usr/local/lib/libmesos.so ENV SPARK_OPTS --driver-java-options=-Xms1024M --driver-java-options=-Xmx4096M --driver-java-options=-Dlog4j.logLevel=info From 313453504d3c79bac8e30ef5872fbd5e42953745 Mon Sep 17 00:00:00 2001 From: Peter Parente Date: Fri, 9 Nov 2018 23:43:03 -0500 Subject: [PATCH 5/7] Keep py4j-0.10.7-src.zip --- pyspark-notebook/Dockerfile | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/pyspark-notebook/Dockerfile b/pyspark-notebook/Dockerfile index 740b80f6..267a0e28 100644 --- a/pyspark-notebook/Dockerfile +++ b/pyspark-notebook/Dockerfile @@ -39,7 +39,7 @@ RUN apt-get -y update && \ # Spark and Mesos config ENV SPARK_HOME /usr/local/spark -ENV PYTHONPATH $SPARK_HOME/python:$SPARK_HOME/python/lib/py4j-0.10.8.1-src.zip +ENV PYTHONPATH $SPARK_HOME/python:$SPARK_HOME/python/lib/py4j-0.10.7-src.zip ENV MESOS_NATIVE_LIBRARY /usr/local/lib/libmesos.so ENV SPARK_OPTS --driver-java-options=-Xms1024M --driver-java-options=-Xmx4096M --driver-java-options=-Dlog4j.logLevel=info From 46dbe7590471e46bf00abd90cdc919d74525bbe8 Mon Sep 17 00:00:00 2001 From: borregore <42614659+borregore@users.noreply.github.com> Date: Wed, 14 Nov 2018 10:26:12 -0700 Subject: [PATCH 6/7] Update Dockerfile --- pyspark-notebook/Dockerfile | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/pyspark-notebook/Dockerfile b/pyspark-notebook/Dockerfile index 267a0e28..a5149ab1 100644 --- 
a/pyspark-notebook/Dockerfile +++ b/pyspark-notebook/Dockerfile @@ -39,7 +39,7 @@ RUN apt-get -y update && \ # Spark and Mesos config ENV SPARK_HOME /usr/local/spark -ENV PYTHONPATH $SPARK_HOME/python:$SPARK_HOME/python/lib/py4j-0.10.7-src.zip +ENV PYTHONPATH $SPARK_HOME/python:$SPARK_HOME/python/lib/py4j-0.10.7-src.zip ENV MESOS_NATIVE_LIBRARY /usr/local/lib/libmesos.so ENV SPARK_OPTS --driver-java-options=-Xms1024M --driver-java-options=-Xmx4096M --driver-java-options=-Dlog4j.logLevel=info From f4f24a3e6306bc1e728f22cf3a0300ea4a173698 Mon Sep 17 00:00:00 2001 From: borregore <42614659+borregore@users.noreply.github.com> Date: Wed, 14 Nov 2018 11:06:44 -0700 Subject: [PATCH 7/7] Update Dockerfile --- pyspark-notebook/Dockerfile | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/pyspark-notebook/Dockerfile b/pyspark-notebook/Dockerfile index a5149ab1..267a0e28 100644 --- a/pyspark-notebook/Dockerfile +++ b/pyspark-notebook/Dockerfile @@ -39,7 +39,7 @@ RUN apt-get -y update && \ # Spark and Mesos config ENV SPARK_HOME /usr/local/spark -ENV PYTHONPATH $SPARK_HOME/python:$SPARK_HOME/python/lib/py4j-0.10.7-src.zip +ENV PYTHONPATH $SPARK_HOME/python:$SPARK_HOME/python/lib/py4j-0.10.7-src.zip ENV MESOS_NATIVE_LIBRARY /usr/local/lib/libmesos.so ENV SPARK_OPTS --driver-java-options=-Xms1024M --driver-java-options=-Xmx4096M --driver-java-options=-Dlog4j.logLevel=info