-
Notifications
You must be signed in to change notification settings - Fork 2
/
Dockerfile
29 lines (23 loc) · 970 Bytes
/
Dockerfile
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
# Base image: Maven 3 on JDK 11 (as named by the image tag).
# NOTE(review): this comment previously described the base as Alpine Linux;
# the tag carries no "-alpine" suffix, so confirm the underlying distribution
# before relying on distro-specific tooling.
FROM maven:3-jdk-11
# Image metadata (maintainer contact, short description, project website),
# declared in a single LABEL instruction.
# NOTE(review): the maintainer address reads like a redacted placeholder —
# confirm the intended value.
LABEL maintainer="Nick Ruest <[email protected]>" \
      description="Docker image for the Archives Unleashed Toolkit." \
      website="http://archivesunleashed.org/"
## Build variables
#######################
# Apache Spark release to download and unpack into /spark. Build-time only;
# override with `docker build --build-arg SPARK_VERSION=<x.y.z>`.
# The download step below fetches the "bin-hadoop2" tarball of this release,
# so the chosen version must publish an archive under that name.
ARG SPARK_VERSION=3.3.1
# Sample resources: clone the Archives Unleashed sample data repository.
# The destination is spelled out (as the aut clone does with /aut) so the
# location does not depend on whatever working directory the base image sets.
RUN git clone https://github.com/archivesunleashed/aut-resources.git /aut-resources
# Archives Unleashed Toolkit: fetch the sources into /aut and run the Maven
# build there; the build output ends up under /aut/target.
# NOTE(review): JAVA_OPTS is passed to the mvn process, but Maven's launcher
# is documented to read MAVEN_OPTS — confirm whether this heap cap is actually
# meant to apply to the build.
RUN git clone https://github.com/archivesunleashed/aut.git /aut \
    && cd /aut \
    && JAVA_OPTS=-Xmx512m mvn clean install
# Spark shell: download the Spark ${SPARK_VERSION} "bin-hadoop2" distribution
# from the Apache archive into /tmp, unpack it into /spark, and delete the
# tarball within the same layer so it does not persist in the image.
# --strip-components=1 drops the archive's top-level directory, so the
# distribution's bin/ directory sits directly under /spark.
RUN tarball="spark-${SPARK_VERSION}-bin-hadoop2.tgz" \
    && mkdir /spark \
    && wget -q -P /tmp "https://archive.apache.org/dist/spark/spark-${SPARK_VERSION}/${tarball}" \
    && tar -xf "/tmp/${tarball}" -C /spark --strip-components=1 \
    && rm "/tmp/${tarball}"
# Default command: start the Spark shell with the Archives Unleashed Toolkit
# fat jar passed via --jars. Exec (JSON array) form is used so the command is
# started directly, without an intermediate `/bin/sh -c` wrapper process.
# NOTE(review): the jar file name embeds a version string; presumably it has
# to match what the aut build writes to /aut/target — confirm whenever the
# toolkit version changes.
CMD ["/spark/bin/spark-shell", "--jars", "/aut/target/aut-1.2.1-SNAPSHOT-fatjar.jar"]