2020-03-30 22:45:43 +00:00
|
|
|
# Base image. Pinned to a release branch instead of the floating `latest`
# tag so that rebuilding this file keeps resolving the same package set.
# NOTE(review): 3.12 is assumed to be the Alpine release this file was
# written against - confirm that every package below resolves on it.
FROM alpine:3.12
|
|
|
|
|
|
|
|
# Download location of the unoconv script (tag 0.9.0); read by the RUN step
# that installs it to /usr/local/bin/unoconv.
# Uses the key=value form; the space-separated `ENV key value` form is legacy.
ENV UNO_URL=https://raw.githubusercontent.com/unoconv/unoconv/0.9.0/unoconv
|
|
|
|
|
|
|
|
# Image metadata: contact for whoever maintains this image.
LABEL maintainer="eikek0 <eike@docspell.org>"
|
|
|
|
|
|
|
|
# Single build layer that
#   1. installs the runtime packages (JRE, OCR / PDF / office-conversion
#      tools, fonts, Python),
#   2. installs the build-only packages as the virtual group `.build-deps`,
#   3. installs ocrmypdf from PyPI,
#   4. downloads the unoconv script from $UNO_URL and the docspell-joex 0.8.0
#      release archive, which is unpacked into /opt,
#   5. removes `.build-deps` again.
# Doing all of this in one RUN keeps the build-only packages and the
# downloaded archive out of the final layer.
#
# Why the details matter:
# - python3 and py3-pip are listed explicitly so that pip3 is guaranteed to
#   exist and the interpreter is not removed as an orphan together with
#   python3-dev.
# - `--virtual .build-deps` keeps the "install" and "remove" sets in sync;
#   there is no second hand-maintained list for `apk del`.
# - curl runs with -f so an HTTP error fails the build instead of saving the
#   error page as /usr/local/bin/unoconv.
# - pip runs with --no-cache-dir so its download cache is not stored in the
#   image.
# NOTE(review): ocrmypdf is installed unpinned, so the resolved version can
# change between builds - consider pinning it.
RUN apk add --no-cache \
        bash \
        ghostscript \
        libreoffice \
        openjdk11-jre \
        pngquant \
        py3-pip \
        python3 \
        qpdf \
        tesseract-ocr \
        tesseract-ocr-data-deu \
        ttf-dejavu \
        ttf-droid \
        ttf-droid-nonlatin \
        ttf-freefont \
        ttf-liberation \
        unpaper \
        wkhtmltopdf \
    && apk add --no-cache --virtual .build-deps \
        curl \
        g++ \
        libffi-dev \
        libxml2-dev \
        libxslt-dev \
        python3-dev \
        qpdf-dev \
        unzip \
        zlib-dev \
    && pip3 install --no-cache-dir --upgrade pip \
    && pip3 install --no-cache-dir ocrmypdf \
    && curl -fsSL "$UNO_URL" -o /usr/local/bin/unoconv \
    && chmod +x /usr/local/bin/unoconv \
    && ln -s /usr/bin/python3 /usr/bin/python \
    && mkdir -p /opt \
    && cd /opt \
    && curl -fL -o docspell.zip https://github.com/eikek/docspell/releases/download/v0.8.0/docspell-joex-0.8.0.zip \
    && unzip docspell.zip \
    && rm docspell.zip \
    && apk del .build-deps
|
2020-03-30 22:45:43 +00:00
|
|
|
|
2020-06-28 00:12:57 +00:00
|
|
|
# Add the start script from the build context; it is what ENTRYPOINT runs.
# NOTE(review): COPY keeps the file mode from the build context, so
# entrypoint-joex.sh presumably has to be executable there - confirm.
COPY entrypoint-joex.sh /opt/entrypoint.sh
|
2020-03-30 22:45:43 +00:00
|
|
|
|
|
|
|
# Documents the port the container listens on (TCP is the default protocol,
# spelled out here). EXPOSE does not publish the port by itself.
# NOTE(review): presumably the joex HTTP port - confirm against its config.
EXPOSE 7878/tcp
|
|
|
|
|
|
|
|
# Start the container through the copied script. Exec (JSON array) form runs
# it directly, without a wrapping `/bin/sh -c`.
ENTRYPOINT ["/opt/entrypoint.sh"]
|