Skip to content

Commit 55e224e

Browse files
authored
Change spark download url to https://dlcdn.apache.org (#1876)
1 parent ee64c2a commit 55e224e

File tree

1 file changed

+4
-2
lines changed

1 file changed

+4
-2
lines changed

pyspark-notebook/Dockerfile

Lines changed: 4 additions & 2 deletions
Original file line number | Diff line number | Diff line change
@@ -33,10 +33,12 @@ RUN apt-get update --yes && \
3333
# Spark installation
3434
WORKDIR /tmp
3535

36+
# You need to use the https://archive.apache.org/dist/ website if you want to download older Spark versions
37+
# But it seems to be slower, which is why we use the recommended site for downloads
3638
RUN if [ -z "${scala_version}" ]; then \
37-
wget -qO "spark.tgz" "https://archive.apache.org/dist/spark/spark-${APACHE_SPARK_VERSION}/spark-${APACHE_SPARK_VERSION}-bin-hadoop${HADOOP_VERSION}.tgz"; \
39+
wget -qO "spark.tgz" "https://dlcdn.apache.org/spark/spark-${APACHE_SPARK_VERSION}/spark-${APACHE_SPARK_VERSION}-bin-hadoop${HADOOP_VERSION}.tgz"; \
3840
else \
39-
wget -qO "spark.tgz" "https://archive.apache.org/dist/spark/spark-${APACHE_SPARK_VERSION}/spark-${APACHE_SPARK_VERSION}-bin-hadoop${HADOOP_VERSION}-scala${scala_version}.tgz"; \
41+
wget -qO "spark.tgz" "https://dlcdn.apache.org/spark/spark-${APACHE_SPARK_VERSION}/spark-${APACHE_SPARK_VERSION}-bin-hadoop${HADOOP_VERSION}-scala${scala_version}.tgz"; \
4042
fi && \
4143
echo "${spark_checksum} *spark.tgz" | sha512sum -c - && \
4244
tar xzf "spark.tgz" -C /usr/local --owner root --group root --no-same-owner && \

0 commit comments

Comments
 (0)