Stirling-PDF/Dockerfile

68 lines
2.3 KiB
Text
Raw Normal View History

2024-02-11 17:47:00 +01:00
# Main stage
FROM alpine:3.20.2
2024-02-11 17:47:00 +01:00
# Copy necessary files
COPY scripts /scripts
COPY pipeline /pipeline
2024-04-29 00:33:55 +02:00
COPY src/main/resources/static/fonts/*.ttf /usr/share/fonts/opentype/noto/
2024-05-05 13:18:52 +02:00
#COPY src/main/resources/static/fonts/*.otf /usr/share/fonts/opentype/noto/
COPY build/libs/*.jar app.jar
ARG VERSION_TAG
# Set Environment Variables
ENV DOCKER_ENABLE_SECURITY=false \
VERSION_TAG=$VERSION_TAG \
JAVA_TOOL_OPTIONS="$JAVA_TOOL_OPTIONS -XX:MaxRAMPercentage=75" \
2024-05-22 23:58:01 +02:00
HOME=/home/stirlingpdfuser \
PUID=1000 \
PGID=1000 \
UMASK=022
2024-02-11 17:47:00 +01:00
# JDK for app
RUN echo "@testing https://dl-cdn.alpinelinux.org/alpine/edge/main" | tee -a /etc/apk/repositories && \
echo "@testing https://dl-cdn.alpinelinux.org/alpine/edge/community" | tee -a /etc/apk/repositories && \
echo "@testing https://dl-cdn.alpinelinux.org/alpine/edge/testing" | tee -a /etc/apk/repositories && \
2024-05-22 23:58:01 +02:00
apk upgrade --no-cache -a && \
2024-02-11 17:47:00 +01:00
apk add --no-cache \
ca-certificates \
tzdata \
tini \
bash \
curl \
2024-03-09 15:03:46 +01:00
shadow \
2024-05-23 00:02:55 +02:00
su-exec \
openssl \
openssl-dev \
openjdk21-jre \
2024-02-11 17:47:00 +01:00
# Doc conversion
2024-05-22 23:58:01 +02:00
libreoffice \
# pdftohtml
poppler-utils \
2024-02-11 17:47:00 +01:00
# OCR MY PDF (unpaper for descew and other advanced featues)
ocrmypdf \
tesseract-ocr-data-eng \
# CV
py3-opencv \
# python3/pip
python3 && \
wget https://bootstrap.pypa.io/get-pip.py -qO - | python3 - --break-system-packages --no-cache-dir --upgrade && \
# uno unoconv and HTML
pip install --break-system-packages --no-cache-dir --upgrade unoconv WeasyPrint && \
mv /usr/share/tessdata /usr/share/tessdata-original && \
mkdir -p $HOME /configs /logs /customFiles /pipeline/watchedFolders /pipeline/finishedFolders && \
2024-02-11 17:47:00 +01:00
fc-cache -f -v && \
chmod +x /scripts/* && \
chmod +x /scripts/init.sh && \
# User permissions
addgroup -S stirlingpdfgroup && adduser -S stirlingpdfuser -G stirlingpdfgroup && \
2024-03-09 15:03:46 +01:00
chown -R stirlingpdfuser:stirlingpdfgroup $HOME /scripts /usr/share/fonts/opentype/noto /configs /customFiles /pipeline && \
2024-04-05 13:51:22 +02:00
chown stirlingpdfuser:stirlingpdfgroup /app.jar && \
2024-05-22 23:58:01 +02:00
tesseract --list-langs
2024-02-11 17:47:00 +01:00
2024-05-22 23:58:01 +02:00
EXPOSE 8080/tcp
2024-02-11 17:47:00 +01:00
# Set user and run command
ENTRYPOINT ["tini", "--", "/scripts/init.sh"]
CMD ["java", "-Dfile.encoding=UTF-8", "-jar", "/app.jar"]