2024-02-09 23:45:18 +00:00
|
|
|
# Main stage
|
2025-02-17 10:21:40 +00:00
|
|
|
FROM alpine:3.21.3@sha256:a8560b36e8b8210634f77d9f7f9efd7ffa463e380b75e2e74aff4511df3ef88c
|
2024-02-11 11:47:00 -05:00
|
|
|
|
2024-03-04 20:51:49 +00:00
|
|
|
# Copy necessary files
|
|
|
|
COPY scripts /scripts
|
|
|
|
COPY pipeline /pipeline
|
2024-04-28 23:33:55 +01:00
|
|
|
COPY src/main/resources/static/fonts/*.ttf /usr/share/fonts/opentype/noto/
|
2024-05-05 12:18:52 +01:00
|
|
|
#COPY src/main/resources/static/fonts/*.otf /usr/share/fonts/opentype/noto/
|
2024-03-04 20:51:49 +00:00
|
|
|
COPY build/libs/*.jar app.jar
|
|
|
|
|
|
|
|
ARG VERSION_TAG
|
|
|
|
|
2024-12-22 00:09:52 +00:00
|
|
|
LABEL org.opencontainers.image.title="Stirling-PDF"
|
2024-12-22 00:11:06 +00:00
|
|
|
LABEL org.opencontainers.image.description="A powerful locally hosted web-based PDF manipulation tool supporting 50+ operations including merging, splitting, conversion, OCR, watermarking, and more."
|
2024-12-22 00:09:52 +00:00
|
|
|
LABEL org.opencontainers.image.source="https://github.com/Stirling-Tools/Stirling-PDF"
|
|
|
|
LABEL org.opencontainers.image.licenses="MIT"
|
|
|
|
LABEL org.opencontainers.image.vendor="Stirling-Tools"
|
|
|
|
LABEL org.opencontainers.image.url="https://www.stirlingpdf.com"
|
|
|
|
LABEL org.opencontainers.image.documentation="https://docs.stirlingpdf.com"
|
|
|
|
LABEL maintainer="Stirling-Tools"
|
|
|
|
LABEL org.opencontainers.image.authors="Stirling-Tools"
|
|
|
|
LABEL org.opencontainers.image.version="${VERSION_TAG}"
|
|
|
|
LABEL org.opencontainers.image.keywords="PDF, manipulation, merge, split, convert, OCR, watermark"
|
|
|
|
|
2024-03-04 20:51:49 +00:00
|
|
|
# Set Environment Variables
|
|
|
|
ENV DOCKER_ENABLE_SECURITY=false \
|
|
|
|
VERSION_TAG=$VERSION_TAG \
|
2025-03-25 17:57:17 +00:00
|
|
|
JAVA_BASE_OPTS="-XX:+UnlockExperimentalVMOptions -XX:MaxRAMPercentage=75 -XX:InitiatingHeapOccupancyPercent=20 -XX:+G1PeriodicGCInvokesConcurrent -XX:G1PeriodicGCInterval=10000 -XX:+UseStringDeduplication -XX:G1PeriodicGCSystemLoadThreshold=70" \
|
|
|
|
JAVA_CUSTOM_OPTS="" \
|
2024-05-22 23:58:01 +02:00
|
|
|
HOME=/home/stirlingpdfuser \
|
|
|
|
PUID=1000 \
|
2024-03-08 20:49:19 +00:00
|
|
|
PGID=1000 \
|
2025-02-18 11:57:56 +00:00
|
|
|
UMASK=022 \
|
|
|
|
PYTHONPATH=/usr/lib/libreoffice/program:/opt/venv/lib/python3.12/site-packages \
|
|
|
|
UNO_PATH=/usr/lib/libreoffice/program \
|
2025-03-25 17:57:17 +00:00
|
|
|
URE_BOOTSTRAP=file:///usr/lib/libreoffice/program/fundamentalrc \
|
|
|
|
PATH=$PATH:/opt/venv/bin
|
2024-03-04 20:51:49 +00:00
|
|
|
|
2024-12-22 00:09:52 +00:00
|
|
|
|
2024-02-09 23:45:18 +00:00
|
|
|
# JDK for app
|
2025-02-18 11:57:56 +00:00
|
|
|
RUN echo "@main https://dl-cdn.alpinelinux.org/alpine/edge/main" | tee -a /etc/apk/repositories && \
|
|
|
|
echo "@community https://dl-cdn.alpinelinux.org/alpine/edge/community" | tee -a /etc/apk/repositories && \
|
2024-02-09 23:45:18 +00:00
|
|
|
echo "@testing https://dl-cdn.alpinelinux.org/alpine/edge/testing" | tee -a /etc/apk/repositories && \
|
2024-05-22 23:58:01 +02:00
|
|
|
apk upgrade --no-cache -a && \
|
2024-02-09 23:45:18 +00:00
|
|
|
apk add --no-cache \
|
2025-02-18 11:57:56 +00:00
|
|
|
ca-certificates \
|
|
|
|
tzdata \
|
|
|
|
tini \
|
|
|
|
bash \
|
|
|
|
curl \
|
|
|
|
qpdf \
|
|
|
|
shadow \
|
|
|
|
su-exec \
|
|
|
|
openssl \
|
|
|
|
openssl-dev \
|
|
|
|
openjdk21-jre \
|
|
|
|
# Doc conversion
|
|
|
|
gcompat \
|
|
|
|
libc6-compat \
|
|
|
|
libreoffice \
|
|
|
|
# pdftohtml
|
|
|
|
poppler-utils \
|
|
|
|
# OCR MY PDF (unpaper for descew and other advanced features)
|
|
|
|
tesseract-ocr-data-eng \
|
2025-03-20 09:39:57 +00:00
|
|
|
tesseract-ocr-data-chi_sim \
|
|
|
|
tesseract-ocr-data-deu \
|
|
|
|
tesseract-ocr-data-fra \
|
|
|
|
tesseract-ocr-data-por \
|
2025-02-18 11:57:56 +00:00
|
|
|
# CV
|
|
|
|
py3-opencv \
|
|
|
|
python3 \
|
|
|
|
py3-pip \
|
|
|
|
py3-pillow@testing \
|
|
|
|
py3-pdf2image@testing && \
|
|
|
|
python3 -m venv /opt/venv && \
|
2025-03-25 18:38:57 +00:00
|
|
|
/opt/venv/bin/pip install --upgrade pip && \
|
|
|
|
/opt/venv/bin/pip install --no-cache-dir --upgrade unoserver weasyprint && \
|
2025-02-18 11:57:56 +00:00
|
|
|
ln -s /usr/lib/libreoffice/program/uno.py /opt/venv/lib/python3.12/site-packages/ && \
|
|
|
|
ln -s /usr/lib/libreoffice/program/unohelper.py /opt/venv/lib/python3.12/site-packages/ && \
|
|
|
|
ln -s /usr/lib/libreoffice/program /opt/venv/lib/python3.12/site-packages/LibreOffice && \
|
2024-03-04 20:51:49 +00:00
|
|
|
mv /usr/share/tessdata /usr/share/tessdata-original && \
|
|
|
|
mkdir -p $HOME /configs /logs /customFiles /pipeline/watchedFolders /pipeline/finishedFolders && \
|
2023-12-31 15:54:34 +01:00
|
|
|
fc-cache -f -v && \
|
2024-03-04 20:51:49 +00:00
|
|
|
chmod +x /scripts/* && \
|
|
|
|
chmod +x /scripts/init.sh && \
|
2025-02-18 11:57:56 +00:00
|
|
|
# User permissions
|
2024-03-04 20:51:49 +00:00
|
|
|
addgroup -S stirlingpdfgroup && adduser -S stirlingpdfuser -G stirlingpdfgroup && \
|
2024-03-09 14:03:46 +00:00
|
|
|
chown -R stirlingpdfuser:stirlingpdfgroup $HOME /scripts /usr/share/fonts/opentype/noto /configs /customFiles /pipeline && \
|
2024-12-22 12:00:52 +00:00
|
|
|
chown stirlingpdfuser:stirlingpdfgroup /app.jar
|
2024-02-11 11:47:00 -05:00
|
|
|
|
2024-05-22 23:58:01 +02:00
|
|
|
EXPOSE 8080/tcp
|
2024-02-11 11:47:00 -05:00
|
|
|
|
2023-09-04 18:42:22 +01:00
|
|
|
# Set user and run command
|
2023-12-31 15:54:34 +01:00
|
|
|
ENTRYPOINT ["tini", "--", "/scripts/init.sh"]
|
2025-04-09 09:54:02 +01:00
|
|
|
CMD ["sh", "-c", "java -Dfile.encoding=UTF-8 -jar /app.jar & /opt/venv/bin/unoserver --port 2003 --interface 127.0.0.1"]
|