Skip to content

Commit e4d5477

Browse files
committed
Upgrade Spark to latest version, 3.1.2
- Moved to Python 3.9.2
- Kept Java 11, upgraded base Docker image
- direnv now uses a custom "use java" (via jabba)
1 parent 6b2c226 commit e4d5477

File tree

6 files changed

+13
-13
lines changed

6 files changed

+13
-13
lines changed

.envrc

Lines changed: 5 additions & 5 deletions
Original file line numberDiff line numberDiff line change
@@ -1,6 +1,6 @@
1-
layout pyenv 3.9.0
2-
use sdk java 11.0.9.hs-adpt
3-
export VBOXMANAGE=/Applications/VirtualBox.app/Contents/MacOS
4-
export SPARK_HOME=$(pwd)/.spark
5-
export PATH=$SPARK_HOME/bin:$VBOXMANAGE:$PATH
1+
layout pyenv 3.9.2
2+
3+
export SPARK_HOME="$(pwd)/.spark"
4+
PATH_add "$SPARK_HOME/bin"
65
export PYSPARK_PYTHON=python3
6+

.python-version

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -1 +1 @@
1-
3.9.0
1+
3.9.2

infra/docker/Dockerfile

Lines changed: 2 additions & 2 deletions
Original file line numberDiff line numberDiff line change
@@ -6,9 +6,9 @@ RUN apt-get update && \
66
apt-get install -y --no-install-recommends python3-software-properties python3-numpy curl && \
77
rm -rf /var/lib/apt/lists/*
88

9-
ARG SPARK_VERSION=3.0.1
9+
ARG SPARK_VERSION=3.1.2
1010
ENV SPARK_HOME=/opt/spark
11-
RUN mkdir -p /opt/spark && curl -s https://downloads.apache.org/spark/spark-${SPARK_VERSION}/spark-${SPARK_VERSION}-bin-hadoop2.7.tgz | tar -xz -C "${SPARK_HOME}" --strip-components=1
11+
RUN mkdir -p /opt/spark && curl -s https://downloads.apache.org/spark/spark-${SPARK_VERSION}/spark-${SPARK_VERSION}-bin-hadoop3.2.tgz | tar -xz -C "${SPARK_HOME}" --strip-components=1
1212
ENV PATH=$SPARK_HOME/bin:$SPARK_HOME/sbin:$PATH
1313

1414
RUN cp "${SPARK_HOME}/conf/log4j.properties.template" "${SPARK_HOME}/conf/log4j.properties" && \

infra/docker/Makefile

Lines changed: 2 additions & 2 deletions
Original file line numberDiff line numberDiff line change
@@ -1,5 +1,5 @@
1-
SPARK_VERSION:=3.0.1
2-
COURSE_VERSION:=2020.12
1+
SPARK_VERSION:=3.1.2
2+
COURSE_VERSION:=2021.10
33
IMAGE_NAME:=luisbelloch/spark
44

55
.PHONY: help

local_setup.sh

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -1,6 +1,6 @@
11
#!/bin/bash
22
set -euo pipefail
3-
SPARK_URL=${SPARK_URL:-https://downloads.apache.org/spark/spark-3.0.1/spark-3.0.1-bin-hadoop2.7.tgz}
3+
SPARK_URL=${SPARK_URL:-https://downloads.apache.org/spark/spark-3.1.2/spark-3.1.2-bin-hadoop3.2.tgz}
44
SPARK_PKG=${SPARK_URL##*/}
55
SPARK_HOME=${SPARK_HOME:-$(pwd)/.spark}
66

playbook.yml

Lines changed: 2 additions & 2 deletions
Original file line numberDiff line numberDiff line change
@@ -2,8 +2,8 @@
22
- hosts: all
33
vars:
44
spark_home: /opt/spark
5-
spark_pkg_name: spark-3.0.1-bin-hadoop2.7
6-
spark_pkg_url: https://downloads.apache.org/spark/spark-3.0.1/spark-3.0.1-bin-hadoop2.7.tgz
5+
spark_pkg_name: spark-3.1.2-bin-hadoop3.2
6+
spark_pkg_url: https://downloads.apache.org/spark/spark-3.1.2/spark-3.1.2-bin-hadoop3.2.tgz
77

88
tasks:
99
- name: Update all packages to the latest version

0 commit comments

Comments
 (0)