Permalink
Switch branches/tags
Nothing to show
Find file Copy path
Fetching contributors…
Cannot retrieve contributors at this time
29 lines (22 sloc) 880 Bytes
# Base Alpine Linux based image with OpenJDK and Maven
FROM maven:3-jdk-8-alpine
# Metadata
LABEL maintainer="Nick Ruest <ruestn@gmail.com>"
LABEL description="Docker image for the Archives Unleashed Toolkit."
LABEL website="http://archivesunleashed.org/"
## Build variables
#########################
ARG SPARK_VERSION=2.3.2
# Git and Wget
RUN apk add --update \
git \
wget
# Sample resources
RUN git clone https://github.com/archivesunleashed/aut-resources.git /aut-resources
# Spark shell
RUN mkdir /spark \
&& cd /tmp \
&& wget -q "https://archive.apache.org/dist/spark/spark-$SPARK_VERSION/spark-$SPARK_VERSION-bin-hadoop2.7.tgz" \
&& tar -xf "/tmp/spark-$SPARK_VERSION-bin-hadoop2.7.tgz" -C /spark --strip-components=1 \
&& rm "/tmp/spark-$SPARK_VERSION-bin-hadoop2.7.tgz"
CMD /spark/bin/spark-shell --packages "io.archivesunleashed:aut:0.17.0"