Skip to content
Permalink
Branch: master
Find file Copy path
Find file Copy path
Fetching contributors…
Cannot retrieve contributors at this time
35 lines (27 sloc) 1.02 KB
# Base Alpine Linux based image with OpenJDK and Maven
FROM maven:3-jdk-8-alpine
# Metadata
LABEL maintainer="Nick Ruest <ruestn@gmail.com>"
LABEL description="Docker image for the Archives Unleashed Toolkit."
LABEL website="http://archivesunleashed.org/"
## Build variables
#######################
ARG SPARK_VERSION=2.4.3
# Git and Wget
RUN apk add --update \
git \
wget
# Sample resources
RUN git clone https://github.com/archivesunleashed/aut-resources.git
# Archives Unleashed Toolkit
RUN git clone https://github.com/archivesunleashed/aut.git /aut \
&& cd /aut \
&& export JAVA_OPTS=-Xmx512m \
&& mvn clean install
# Spark shell
RUN mkdir /spark \
&& cd /tmp \
&& wget -q "https://archive.apache.org/dist/spark/spark-$SPARK_VERSION/spark-$SPARK_VERSION-bin-hadoop2.7.tgz" \
&& tar -xf "/tmp/spark-$SPARK_VERSION-bin-hadoop2.7.tgz" -C /spark --strip-components=1 \
&& rm "/tmp/spark-$SPARK_VERSION-bin-hadoop2.7.tgz"
CMD /spark/bin/spark-shell --packages "io.archivesunleashed:aut:0.18.1-SNAPSHOT"
You can’t perform that action at this time.