-
Notifications
You must be signed in to change notification settings - Fork 2
Expand file tree
/
Copy pathspark-base.Dockerfile
More file actions
executable file
·28 lines (22 loc) · 1019 Bytes
/
spark-base.Dockerfile
File metadata and controls
executable file
·28 lines (22 loc) · 1019 Bytes
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
# -- Base image: this Spark layer is stacked on top of the cluster-base image
FROM cluster-base

# -- Layer: Apache Spark
# Build-time selectors for the Spark distribution to install. Both can be
# overridden with `--build-arg`; together they form the release archive name
# spark-<spark_version>-bin-hadoop<hadoop_version>.
ARG hadoop_version=3
ARG spark_version=3.5.3
# Download the pre-built Spark release, install it under /usr/bin and trim the
# parts that are not needed at runtime. Everything happens in one layer so the
# tarball and the apt package lists never persist in the image.
#   - spark_dir names the release directory once instead of repeating it.
#   - ca-certificates is requested explicitly: curl needs a CA bundle for the
#     HTTPS download and --no-install-recommends may not pull it in.
#   - curl --fail aborts the build on an HTTP error (e.g. a mistyped version
#     giving a 404) instead of saving the error page as the tarball.
#   - The archive is staged in /tmp and unpacked straight into /usr/bin, so the
#     step does not depend on the working directory inherited from the base.
#   - mkdir -p keeps the step from failing if the logs directory already exists.
RUN spark_dir="spark-${spark_version}-bin-hadoop${hadoop_version}" && \
    apt-get update -y && \
    apt-get install -y --no-install-recommends ca-certificates curl && \
    curl --fail --silent --show-error --location \
        "https://archive.apache.org/dist/spark/spark-${spark_version}/${spark_dir}.tgz" \
        --output /tmp/spark.tgz && \
    tar -xf /tmp/spark.tgz -C /usr/bin/ && \
    mkdir -p "/usr/bin/${spark_dir}/logs" && \
    rm -rf "/usr/bin/${spark_dir}/examples" "/usr/bin/${spark_dir}/data" && \
    rm -f /tmp/spark.tgz && \
    rm -rf /var/lib/apt/lists/*
# -- Spark environment
# All variables use the key=value form; the space-separated `ENV key value`
# form is deprecated.
# SPARK_HOME points at the directory the Spark release was moved to in the
# install step, built from the same build args.
ENV SPARK_HOME=/usr/bin/spark-${spark_version}-bin-hadoop${hadoop_version}
# NOTE(review): this JDK path is architecture-specific (arm64); it presumably
# matches the JDK installed by the base image - confirm before building for
# another platform such as amd64.
ENV JAVA_HOME=/usr/lib/jvm/java-17-openjdk-arm64
# Master host/port and UI port values.
ENV SPARK_MASTER_HOST=spark-master \
    SPARK_MASTER_PORT=7077 \
    SPARK_UI_PORT=4040
# ENV SPARK_PUBLIC_DNS=localhost
ENV PYSPARK_PYTHON=python3
# -- Runtime
# Containers start in the Spark installation directory.
WORKDIR ${SPARK_HOME}