-
Notifications
You must be signed in to change notification settings - Fork 1
/
Copy pathDockerfile
29 lines (23 loc) · 874 Bytes
/
Dockerfile
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
# Base image is pinned: an untagged `ubuntu` means `ubuntu:latest`, which moves
# between releases and makes rebuilds non-reproducible. Newer Ubuntu releases
# also refuse a system-wide `pip3 install` (PEP 668), which breaks the
# Jupyter install below.
# NOTE(review): 20.04 (Python 3.8, still packages openjdk-8-jre-headless) was
# chosen to match the Spark 3.0.1 era -- confirm this is the release you want.
FROM ubuntu:20.04

# Everything fetched below lands in /root; SPARK_CLASSPATH refers to the JDBC
# jar by its /root path.
WORKDIR /root

# One layer installs the JRE, pip and wget, then Jupyter, Spark 3.0.1 and the
# PostgreSQL JDBC driver.
#  - apt-get (not apt) is the stable scripting interface.
#  - DEBIAN_FRONTEND is set inline so package configuration prompts cannot
#    block the build, without leaking the setting into the runtime env.
#  - No blanket `upgrade`: refresh the base image tag instead.
#  - Recommended packages are deliberately kept (ca-certificates for wget,
#    setuptools/wheel for pip) so the installed tool set matches the original.
#  - apt lists, the pip cache and the Spark tarball are removed in the same
#    layer that created them, otherwise they stay in the image forever.
# NOTE(review): the downloads are not checksum-verified; consider adding the
# published SHA-512 for the Spark archive.
RUN apt-get update \
 && DEBIAN_FRONTEND=noninteractive apt-get install -y \
      openjdk-8-jre-headless \
      python3-pip \
      wget \
 && rm -rf /var/lib/apt/lists/* \
 && pip3 install --no-cache-dir jupyter \
 && wget https://archive.apache.org/dist/spark/spark-3.0.1/spark-3.0.1-bin-hadoop2.7.tgz \
 && tar xzf spark-3.0.1-bin-hadoop2.7.tgz \
 && rm spark-3.0.1-bin-hadoop2.7.tgz \
 && mv spark-3.0.1-bin-hadoop2.7 /opt/spark \
 && wget https://jdbc.postgresql.org/download/postgresql-42.2.12.jar
# Runtime environment for starting PySpark with Jupyter as the driver front end.

# $JUPYTER_HOME/bin is searched before the rest of PATH.
ENV JUPYTER_HOME=/root/.local
ENV PATH=$JUPYTER_HOME/bin:$PATH

# Spark lives in /opt/spark; its bin/ and sbin/ directories are appended to
# PATH. SPARK_HOME needs its own ENV instruction because a value can only
# reference variables set by an earlier instruction.
ENV SPARK_HOME=/opt/spark
ENV PATH=$PATH:$SPARK_HOME/bin:$SPARK_HOME/sbin

# Interpreter selection for PySpark: python3 for the Python processes, and
# `jupyter notebook --allow-root` as the driver command.
# NOTE(review): the notebook options carry no --ip, so Jupyter presumably binds
# to localhost inside the container -- confirm port 8888 is reachable the way
# this image is run.
ENV PYSPARK_PYTHON=/usr/bin/python3 \
    PYSPARK_DRIVER_PYTHON="jupyter" \
    PYSPARK_DRIVER_PYTHON_OPTS="notebook --allow-root"

# PYTHONPATH is not defined anywhere before this line, so the former
# `:$PYTHONPATH` suffix expanded to nothing and baked a trailing ':' (an empty
# search-path entry) into the image. Set the value outright instead.
ENV PYTHONPATH=$SPARK_HOME/python

# Path of the PostgreSQL JDBC driver jar.
# NOTE(review): SPARK_CLASSPATH is a legacy variable -- verify that Spark 3.x
# still reads it, otherwise pass the jar via spark.jars / --driver-class-path.
ENV SPARK_CLASSPATH='/root/postgresql-42.2.12.jar'
# Document the notebook port (metadata only; publish it with `docker run -p`).
EXPOSE 8888/tcp

# Containers start in /root/workspace; WORKDIR creates the directory if missing.
WORKDIR /root/workspace