-
Notifications
You must be signed in to change notification settings - Fork 0
/
Copy pathDockerfile
36 lines (28 loc) · 1.07 KB
/
Dockerfile
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
# Linux+Py
# Base image: the official `python` image, tag 3.6. The apt-get step further
# down assumes this image is Debian-based.
FROM python:3.6
# JAVA
# Install a headless Java runtime from the distribution's package repository.
# - update + install share one layer so the package index is never stale.
# - DEBIAN_FRONTEND is set inline so it does not leak into the runtime env.
# - --no-install-recommends keeps optional "recommended" packages out of the
#   image.
# - the apt lists are removed in the same layer so they add no image size.
RUN apt-get update && \
    DEBIAN_FRONTEND=noninteractive \
    apt-get install -y --no-install-recommends default-jre-headless && \
    apt-get clean && \
    rm -rf /var/lib/apt/lists/*
# Point JAVA_HOME at the JRE installed by the default-jre-headless package,
# which exposes the runtime through the /usr/lib/jvm/default-java symlink.
# The previous value (/opt/java/openjdk) is not created anywhere in this
# Dockerfile. The path is repeated literally in PATH because a variable set
# in an ENV instruction cannot be referenced within that same instruction.
ENV JAVA_HOME=/usr/lib/jvm/default-java \
    PATH="/usr/lib/jvm/default-java/bin:$PATH"
# Install packages
# Upgrade pip itself and install requests. --no-cache-dir keeps pip's
# download cache out of the image layer.
RUN pip3 install --no-cache-dir --upgrade pip requests
# Copy the tika-python source tree from the build context. COPY is used
# instead of ADD because no archive extraction or URL fetch is wanted.
COPY tika-python /tika-python
# Install tika-python from the copied tree by absolute path, which avoids
# changing directory inside the RUN step.
RUN pip install --no-cache-dir /tika-python
# Download Tika files
# Fetch the Tika 1.24 server distribution and the published MD5 file for the
# server jar, then place both under /tika-tester as tika-server.jar and
# tika-server.jar.md5. All steps run in one layer so the downloaded archive
# can be deleted without remaining in an earlier layer.
# The remaining contents of the extracted /tika-server-1.24-bin directory are
# left in place, as before.
# NOTE(review): the MD5 file is only stored, not checked, during the build —
# presumably it is consumed at runtime; confirm.
RUN mkdir /tika-tester && \
    wget https://repo1.maven.org/maven2/org/apache/tika/tika-server/1.24/tika-server-1.24-bin.tgz && \
    tar -xzf tika-server-1.24-bin.tgz && \
    rm tika-server-1.24-bin.tgz && \
    wget https://repo1.maven.org/maven2/org/apache/tika/tika-server/1.24/tika-server-1.24.jar.md5 && \
    mv /tika-server-1.24-bin/tika-server.jar /tika-tester && \
    mv /tika-server-1.24.jar.md5 /tika-tester/tika-server.jar.md5
# Python dependencies are installed before the application script is copied
# so that editing the script (or bumping CONTAINER_VERSION) does not
# invalidate these slower layers. --no-cache-dir keeps pip's download cache
# out of the image. The install order is preserved from the original.
RUN pip install --no-cache-dir funcx funcx_endpoint
RUN pip install --no-cache-dir xtract_sdk==0.0.7a11
# Replace whatever globus_sdk is present at this point with 2.0.1.
# NOTE(review): presumably a different version is pulled in by the packages
# above — confirm why 2.0.1 is required.
RUN pip uninstall globus_sdk -y && pip install --no-cache-dir globus_sdk==2.0.1
RUN pip install --no-cache-dir numpy
# Copy local files
COPY xtract_tika_main.py /
ENV CONTAINER_VERSION=1.0
# Exec-form CMD with an absolute script path, so startup does not depend on
# the container's working directory.
CMD [ "python3", "/xtract_tika_main.py" ]