Skip to content
Open
Show file tree
Hide file tree
Changes from all commits
Commits
File filter

Filter by extension

Filter by extension

Conversations
Failed to load comments.
Loading
Jump to
Jump to file
Failed to load files.
Loading
Diff view
Diff view
19 changes: 9 additions & 10 deletions spark-minimal/Dockerfile
Original file line number Diff line number Diff line change
@@ -1,28 +1,27 @@
FROM ubuntu:16.04
MAINTAINER Mark Mims <mark.mims@gmail.com>
FROM ubuntu:20.04
MAINTAINER Mark Mims <mark.mims@gmail.com>, Alexander To <alexander.to@berkeley.edu>

ENV SPARK_VERSION 2.2.0
ENV SPARK_HADOOP_VERSION 2.6
ENV SPARK_VERSION 3.1.1
ENV SPARK_HADOOP_VERSION 2.7

ENV SPARK_HOME /spark-$SPARK_VERSION-bin-hadoop$SPARK_HADOOP_VERSION
ENV JAVA_HOME /usr/lib/jvm/java-8-oracle
ENV JAVA_HOME /usr/lib/jvm/java-11-openjdk-amd64/

ENV SPARK_TEMPLATE_PATH $SPARK_HOME/templates
ENV SPARK_CONF_PATH $SPARK_HOME/conf

ENV PATH $SPARK_HOME/bin:$PATH

RUN echo oracle-java8-installer shared/accepted-oracle-license-v1-1 select true | debconf-set-selections \
&& apt-get update \
RUN apt-get update \
&& apt-get upgrade -y \
&& apt-get install -y software-properties-common \
&& add-apt-repository -y ppa:webupd8team/java \
&& add-apt-repository -y ppa:openjdk-r/ppa \
&& apt-key adv --keyserver keyserver.ubuntu.com --recv E56151BF \
&& apt-get update \
&& apt-get install -y \
curl \
dnsutils \
oracle-java8-installer \
openjdk-11-jdk \
&& apt-get purge -y software-properties-common \
&& apt-get autoremove -y \
&& curl -OL http://www-us.apache.org/dist/spark/spark-$SPARK_VERSION/spark-$SPARK_VERSION-bin-hadoop$SPARK_HADOOP_VERSION.tgz \
Expand All @@ -31,7 +30,7 @@ RUN echo oracle-java8-installer shared/accepted-oracle-license-v1-1 select true

COPY *-site.xml $SPARK_TEMPLATE_PATH/
#COPY *.properties $SPARK_CONF_PATH/
#COPY spark-defaults.conf $SPARK_CONF_PATH
COPY spark-defaults.conf $SPARK_CONF_PATH
#COPY spark-env.sh $SPARK_CONF_PATH

COPY jars/* $SPARK_HOME/jars/
Expand Down
2 changes: 1 addition & 1 deletion spark-minimal/Makefile
Original file line number Diff line number Diff line change
Expand Up @@ -2,7 +2,7 @@ default: version list

NAMESPACE=midsw205
IMAGE=$(shell basename $(PWD))
VERSION=0.0.6
VERSION=0.0.7

version: show-version
show-version:
Expand Down
Binary file not shown.
Binary file not shown.
Binary file not shown.
Binary file not shown.
Binary file not shown.
Binary file not shown.
Binary file not shown.
Binary file not shown.
Binary file not shown.
Binary file not shown.
Binary file not shown.
Binary file removed spark-minimal/jars/org.slf4j_slf4j-api-1.7.16.jar
Binary file not shown.
Binary file added spark-minimal/jars/org.slf4j_slf4j-api-1.7.3.jar
Binary file not shown.
Binary file not shown.
Binary file not shown.
23 changes: 23 additions & 0 deletions spark-minimal/spark-defaults.conf
Original file line number Diff line number Diff line change
@@ -0,0 +1,23 @@
#
# Licensed to the Apache Software Foundation (ASF) under one or more
# contributor license agreements. See the NOTICE file distributed with
# this work for additional information regarding copyright ownership.
# The ASF licenses this file to You under the Apache License, Version 2.0
# (the "License"); you may not use this file except in compliance with
# the License. You may obtain a copy of the License at
#
# http://www.apache.org/licenses/LICENSE-2.0
#
# Unless required by applicable law or agreed to in writing, software
# distributed under the License is distributed on an "AS IS" BASIS,
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
# See the License for the specific language governing permissions and
# limitations under the License.
#

# Default system properties included when running spark-submit.
# This is useful for setting default environmental settings.

# Alternative (disabled): add the Kafka connector from a jar file path via
# spark.jars instead of resolving it by Maven coordinates.
#spark.jars jars/org.apache.spark_spark-sql-kafka-0-10_2.12-3.1.1.jar
# Active setting: Maven coordinates (groupId:artifactId:version) of the
# spark-sql-kafka-0-10 connector to add to the driver and executor classpaths.
# The "_2.12" suffix and the "3.1.1" version presumably have to match the Scala
# build and release of the installed Spark distribution -- confirm on upgrade.
# NOTE(review): coordinates are resolved when the application is submitted, so
# this likely needs repository access (or a warm Ivy cache) at run time -- verify.
spark.jars.packages org.apache.spark:spark-sql-kafka-0-10_2.12:3.1.1
# Optional (disabled): override for the Ivy directory used when resolving
# spark.jars.packages.
#spark.jars.ivy /root/spark-3.1.1-bin-hadoop2.7/
10 changes: 5 additions & 5 deletions spark-python/Dockerfile
Original file line number Diff line number Diff line change
@@ -1,8 +1,8 @@
FROM midsw205/spark-minimal:0.0.6
MAINTAINER Mark Mims <mark.mims@gmail.com>
FROM atox120/spark-minimal:0.0.8
MAINTAINER Mark Mims <mark.mims@gmail.com>, Alexander To <alexander.to@berkeley.edu>

ENV ANACONDA_VERSION 4.4.0
ENV PY4J_VERSION 0.10.4
ENV ANACONDA_VERSION 2020.11
ENV PY4J_VERSION 0.10.9.2

WORKDIR /

Expand All @@ -11,7 +11,7 @@ RUN apt-get install -y bzip2 \
&& chmod 755 Anaconda3-$ANACONDA_VERSION-Linux-x86_64.sh \
&& /Anaconda3-$ANACONDA_VERSION-Linux-x86_64.sh -b -p /opt/anaconda3 \
&& rm /Anaconda3-$ANACONDA_VERSION-Linux-x86_64.sh \
&& /opt/anaconda3/bin/conda install pyarrow arrow-cpp parquet-cpp -c conda-forge
&& /opt/anaconda3/bin/conda install pyarrow parquet-cpp arrow-cpp -c conda-forge

ENV PATH /opt/anaconda3/bin:$PATH
ENV PYTHONPATH $SPARK_HOME/python:$SPARK_HOME/python/lib/py4j-$PY4J_VERSION-src.zip
Expand Down
2 changes: 1 addition & 1 deletion spark-python/Makefile
Original file line number Diff line number Diff line change
Expand Up @@ -2,7 +2,7 @@ default: version list

NAMESPACE=midsw205
IMAGE=$(shell basename $(PWD))
VERSION=0.0.6
VERSION=0.0.7

version: show-version
show-version:
Expand Down