dangerzone/dangerzone-converter/Dockerfile

100 lines
2.7 KiB
Docker

FROM alpine:latest
# Install dependencies
RUN apk -U upgrade && \
apk add \
ghostscript \
graphicsmagick \
libreoffice \
openjdk8 \
poppler-utils \
py3-magic \
py3-pillow \
sudo
# tesseract-ocr \
# tesseract-ocr-data-afr \
# tesseract-ocr-data-ara \
# tesseract-ocr-data-aze \
# tesseract-ocr-data-bel \
# tesseract-ocr-data-ben \
# tesseract-ocr-data-bul \
# tesseract-ocr-data-cat \
# tesseract-ocr-data-ces \
# tesseract-ocr-data-chi_sim \
# tesseract-ocr-data-chi_tra \
# tesseract-ocr-data-chr \
# tesseract-ocr-data-dan \
# tesseract-ocr-data-deu \
# tesseract-ocr-data-ell \
# tesseract-ocr-data-enm \
# tesseract-ocr-data-epo \
# tesseract-ocr-data-equ \
# tesseract-ocr-data-est \
# tesseract-ocr-data-eus \
# tesseract-ocr-data-fin \
# tesseract-ocr-data-fra \
# tesseract-ocr-data-frk \
# tesseract-ocr-data-frm \
# tesseract-ocr-data-glg \
# tesseract-ocr-data-grc \
# tesseract-ocr-data-heb \
# tesseract-ocr-data-hin \
# tesseract-ocr-data-hrv \
# tesseract-ocr-data-hun \
# tesseract-ocr-data-ind \
# tesseract-ocr-data-isl \
# tesseract-ocr-data-ita \
# tesseract-ocr-data-ita_old \
# tesseract-ocr-data-jpn \
# tesseract-ocr-data-kan \
# tesseract-ocr-data-kat \
# tesseract-ocr-data-kor \
# tesseract-ocr-data-lav \
# tesseract-ocr-data-lit \
# tesseract-ocr-data-mal \
# tesseract-ocr-data-mkd \
# tesseract-ocr-data-mlt \
# tesseract-ocr-data-msa \
# tesseract-ocr-data-nld \
# tesseract-ocr-data-nor \
# tesseract-ocr-data-pol \
# tesseract-ocr-data-por \
# tesseract-ocr-data-ron \
# tesseract-ocr-data-rus \
# tesseract-ocr-data-slk \
# tesseract-ocr-data-slv \
# tesseract-ocr-data-spa \
# tesseract-ocr-data-spa_old \
# tesseract-ocr-data-sqi \
# tesseract-ocr-data-srp \
# tesseract-ocr-data-swa \
# tesseract-ocr-data-swe \
# tesseract-ocr-data-tam \
# tesseract-ocr-data-tel \
# tesseract-ocr-data-tgl \
# tesseract-ocr-data-tha \
# tesseract-ocr-data-tur \
# tesseract-ocr-data-ukr \
# tesseract-ocr-data-vie
# Install pdftk
RUN \
wget https://gitlab.com/pdftk-java/pdftk/-/jobs/924565145/artifacts/raw/build/libs/pdftk-all.jar && \
mv pdftk-all.jar /usr/local/bin && \
chmod +x /usr/local/bin/pdftk-all.jar && \
echo '#!/bin/sh' > /usr/local/bin/pdftk && \
echo '/usr/bin/java -jar "/usr/local/bin/pdftk-all.jar" "$@"' >> /usr/local/bin/pdftk && \
chmod +x /usr/local/bin/pdftk
COPY scripts/* /usr/local/bin/
# Add the unprivileged user
RUN adduser -h /home/user -s /bin/sh -D user
# /tmp/input_file is where the first convert expects the input file to be, and
# /tmp where it will write the pixel files
#
# /dangerzone is where the second script expects files to be put by the first one
#
# /safezone is where the wrapper eventually moves the sanitized files.
VOLUME /dangerzone /tmp/input_file /safezone