FROM openjdk:17-jdk-slim AS builder WORKDIR /app RUN apt-get update && apt-get install -y \ git \ curl \ gradle \ maven RUN git clone https://github.com/Stirling-Tools/Stirling-PDF.git . RUN ./gradlew build FROM openjdk:17-jdk-slim WORKDIR /app COPY --from=builder /app/build/libs/*.jar /app/stirling-pdf.jar RUN mkdir -p /app/logs /app/configs /app/customFiles /usr/share/tessdata && \ chmod -R 777 /app/logs /app/configs /app/customFiles /usr/share/tessdata RUN apt-get update && apt-get install -y \ libreoffice \ poppler-utils \ tesseract-ocr \ tesseract-ocr-eng \ wget \ python3 \ python3-pip && \ pip3 install --no-cache-dir unoconv WeasyPrint pdf2image pillow && \ cd /usr/share/tessdata && \ wget https://github.com/tesseract-ocr/tessdata/raw/main/chi_sim.traineddata && \ wget https://github.com/tesseract-ocr/tessdata/raw/main/chi_tra.traineddata && \ wget https://github.com/tesseract-ocr/tessdata/raw/main/eng.traineddata && \ wget https://github.com/tesseract-ocr/tessdata/raw/main/jpn.traineddata && \ wget https://github.com/tesseract-ocr/tessdata/raw/main/kor.traineddata && \ wget https://github.com/tesseract-ocr/tessdata/raw/main/rus.traineddata && \ wget https://github.com/tesseract-ocr/tessdata/raw/main/fra.traineddata && \ wget https://github.com/tesseract-ocr/tessdata/raw/main/deu.traineddata && \ wget https://github.com/tesseract-ocr/tessdata/raw/main/spa.traineddata && \ wget https://github.com/tesseract-ocr/tessdata/raw/main/ita.traineddata && \ wget https://github.com/tesseract-ocr/tessdata/raw/main/por.traineddata && \ wget https://github.com/tesseract-ocr/tessdata/raw/main/vie.traineddata && \ wget https://github.com/tesseract-ocr/tessdata/raw/main/tha.traineddata && \ rm -rf /var/lib/apt/lists/* EXPOSE 7860 CMD ["java", "-Dserver.port=7860", "-Dserver.address=0.0.0.0", "-Dfile.encoding=UTF-8", "-jar", "/app/stirling-pdf.jar"]