Skip to content
Merged
Show file tree
Hide file tree
Changes from all commits
Commits
File filter

Filter by extension

Filter by extension

Conversations
Failed to load comments.
Loading
Jump to
Jump to file
Failed to load files.
Loading
Diff view
Diff view
16 changes: 8 additions & 8 deletions Dockerfile
Original file line number Diff line number Diff line change
@@ -1,24 +1,24 @@
FROM ubuntu:22.04
FROM ubuntu:23.04

ARG PYTHON_VERSION=3.8
ARG PYTHON_VERSION=3.10
ARG DEBIAN_FRONTEND=noninteractive

RUN apt-get update && \
apt-get install -y wget bzip2 build-essential openjdk-8-jdk ssh sudo && \
apt-get install -y wget bzip2 build-essential openjdk-17-jdk ssh sudo && \
apt-get clean

# Install Spark and update env variables.
ENV SCALA_VERSION 2.12.17
ENV SPARK_VERSION "3.4.1"
ENV SPARK_BUILD "spark-${SPARK_VERSION}-bin-hadoop3.2"
ENV SPARK_BUILD_URL "https://dist.apache.org/repos/dist/release/spark/spark-${SPARK_VERSION}/${SPARK_BUILD}.tgz"
ENV SCALA_VERSION 2.13.16
ENV SPARK_VERSION "4.0.1"
ENV SPARK_BUILD "spark-${SPARK_VERSION}-bin-hadoop3"
ENV SPARK_BUILD_URL "https://dlcdn.apache.org/spark/spark-${SPARK_VERSION}/${SPARK_BUILD}.tgz"
RUN wget --quiet "$SPARK_BUILD_URL" -O /tmp/spark.tgz && \
tar -C /opt -xf /tmp/spark.tgz && \
mv /opt/$SPARK_BUILD /opt/spark && \
rm /tmp/spark.tgz
ENV SPARK_HOME /opt/spark
ENV PATH $SPARK_HOME/bin:$PATH
ENV PYTHONPATH /opt/spark/python/lib/py4j-0.10.9.2-src.zip:/opt/spark/python/lib/pyspark.zip:$PYTHONPATH
ENV PYTHONPATH $SPARK_HOME/python/lib/py4j-0.10.9.9-src.zip:${SPARK_HOME}/python/lib/pyspark.zip:$PYTHONPATH
ENV PYSPARK_PYTHON python

# The graphframes dir will be mounted here.
Expand Down
53 changes: 0 additions & 53 deletions dev/release_guide.md

This file was deleted.