Stirling-PDF/Dockerfile

Ignoring revisions in .git-blame-ignore-revs. Click here to bypass and see the normal blame view.

70 lines
2.5 KiB
Text
Raw Normal View History

2024-02-10 00:45:18 +01:00
# Main stage
2024-02-10 11:29:17 +01:00
FROM alpine:3.19.1
2024-02-10 00:45:18 +01:00
# JDK for app
RUN echo "@testing https://dl-cdn.alpinelinux.org/alpine/edge/main" | tee -a /etc/apk/repositories && \
echo "@testing https://dl-cdn.alpinelinux.org/alpine/edge/community" | tee -a /etc/apk/repositories && \
echo "@testing https://dl-cdn.alpinelinux.org/alpine/edge/testing" | tee -a /etc/apk/repositories && \
apk add --no-cache \
ca-certificates \
tzdata \
tini \
bash \
curl \
openjdk17-jre \
# Doc conversion
libreoffice@testing \
# OCR MY PDF (unpaper for descew and other advanced featues)
ocrmypdf \
tesseract-ocr-data-eng \
# CV
py3-opencv \
# python3/pip
python3 && \
wget https://bootstrap.pypa.io/get-pip.py -qO - | python3 - --break-system-packages --no-cache-dir --upgrade && \
# uno unoconv and HTML
pip install --break-system-packages --no-cache-dir --upgrade unoconv WeasyPrint && \
mv /usr/share/tessdata /usr/share/tessdata-original
2023-05-01 22:57:48 +02:00
2023-09-14 22:07:39 +02:00
ARG VERSION_TAG
2023-09-04 19:42:22 +02:00
# Set Environment Variables
2023-09-14 22:07:39 +02:00
ENV DOCKER_ENABLE_SECURITY=false \
2023-09-04 19:42:22 +02:00
HOME=/home/stirlingpdfuser \
2023-12-28 18:49:45 +01:00
VERSION_TAG=$VERSION_TAG \
JAVA_TOOL_OPTIONS="$JAVA_TOOL_OPTIONS -XX:MaxRAMPercentage=75"
2023-09-14 22:07:39 +02:00
# PUID=1000 \
# PGID=1000 \
# UMASK=022 \
# Copy necessary files
COPY scripts /scripts
COPY pipeline /pipeline
COPY src/main/resources/static/fonts/*.ttf /usr/share/fonts/opentype/noto
COPY src/main/resources/static/fonts/*.otf /usr/share/fonts/opentype/noto
COPY build/libs/*.jar app.jar
2023-09-04 19:42:22 +02:00
# Create user and group
2023-09-14 22:07:39 +02:00
##RUN groupadd -g $PGID stirlingpdfgroup && \
## useradd -u $PUID -g stirlingpdfgroup -s /bin/sh stirlingpdfuser && \
## mkdir -p $HOME && chown stirlingpdfuser:stirlingpdfgroup $HOME && \
2023-09-04 19:42:22 +02:00
# Set up necessary directories and permissions
2024-02-10 00:45:18 +01:00
RUN mkdir -p /configs /logs /customFiles /pipeline/watchedFolders /pipeline/finishedFolders && \
2023-09-14 22:07:39 +02:00
##&& \
## chown -R stirlingpdfuser:stirlingpdfgroup /scripts /usr/share/fonts/opentype/noto /usr/share/tesseract-ocr /configs /customFiles && \
## chown -R stirlingpdfuser:stirlingpdfgroup /usr/share/tesseract-ocr-original && \
2023-09-04 19:42:22 +02:00
# Set font cache and permissions
fc-cache -f -v && \
chmod +x /scripts/*
2023-09-14 22:07:39 +02:00
## chown stirlingpdfuser:stirlingpdfgroup /app.jar && \
## chmod +x /scripts/init.sh
2024-02-10 11:29:17 +01:00
EXPOSE 8080
2023-09-04 19:42:22 +02:00
# Set user and run command
2023-09-14 22:07:39 +02:00
##USER stirlingpdfuser
ENTRYPOINT ["tini", "--", "/scripts/init.sh"]
CMD ["java", "-Dfile.encoding=UTF-8", "-jar", "/app.jar"]