# Hoghoghi / Dockerfile
# Really-amin's picture
# Update Dockerfile
# 23a2d5f verified
# raw
# history blame
# 2.76 kB
# ────────────────
# Stage 1: Builder
# ────────────────
# Builds a self-contained virtual environment in /opt/venv holding every
# package listed in requirements.txt. The compiler toolchain installed here
# stays in this stage; only /opt/venv is meant to be copied out of it.
FROM python:3.10-slim AS builder

# Install build dependencies.
# build-essential already depends on gcc and g++, so they are not listed
# separately. --no-install-recommends keeps optional packages out of the stage.
RUN apt-get update && apt-get install -y --no-install-recommends \
        build-essential \
        libmupdf-dev \
        pkg-config \
    && rm -rf /var/lib/apt/lists/*

# Create the virtual environment first and put it at the front of PATH so that
# every later `pip` call targets the venv rather than the system interpreter.
RUN python -m venv /opt/venv
ENV PATH="/opt/venv/bin:$PATH"

# Upgrade the packaging tools inside the venv. Doing this before the venv
# exists would only touch the system site-packages, which are not carried over.
RUN pip install --no-cache-dir --upgrade pip setuptools wheel

# Copy only the requirements manifest so the dependency layer stays cached
# until requirements.txt itself changes.
WORKDIR /build
COPY requirements.txt .

# Install Python packages into the venv.
RUN pip install --no-cache-dir -r requirements.txt
# ────────────────
# Stage 2: Production
# ────────────────
# Runtime image: OS libraries for OCR/PDF/media handling, the virtual
# environment produced by the `builder` stage, a pre-downloaded TrOCR model and
# the application source. The container runs as the unprivileged `appuser`
# and serves on port 7860.
FROM python:3.10-slim

# Install runtime dependencies (sorted alphabetically for easier diffs).
# libgl1 is used instead of libgl1-mesa-glx: the latter is only a transitional
# package and is absent from newer Debian releases, while libgl1 is the package
# that actually ships libGL.so.1.
RUN apt-get update && apt-get install -y \
        curl \
        ffmpeg \
        libasound2 \
        libatk1.0-0 \
        libcairo-gobject2 \
        libffi-dev \
        libgbm1 \
        libgdk-pixbuf2.0-0 \
        libgl1 \
        libglib2.0-0 \
        libgomp1 \
        libgtk-3-0 \
        libmupdf-dev \
        libopencv-dev \
        libpangocairo-1.0-0 \
        libsm6 \
        libssl-dev \
        libxext6 \
        libxrandr2 \
        libxrender-dev \
        libxss1 \
        libxtst6 \
        mupdf-tools \
        poppler-utils \
        sqlite3 \
        tesseract-ocr \
        tesseract-ocr-eng \
        tesseract-ocr-fas \
        wget \
    && apt-get clean \
    && rm -rf /var/lib/apt/lists/*

# Create non-root user with a fixed UID/GID of 1000.
RUN groupadd -g 1000 appuser && useradd -r -u 1000 -g appuser appuser

# Copy virtual environment from builder and make it the default interpreter.
COPY --from=builder /opt/venv /opt/venv
ENV PATH="/opt/venv/bin:$PATH"

# Environment variables.
# These are declared BEFORE the model pre-download so that the build-time
# download and the running application resolve the same cache directory.
ENV PYTHONPATH=/app \
    DATABASE_DIR=/app/data \
    DATABASE_PATH=/app/data/legal_documents.db \
    TRANSFORMERS_CACHE=/app/cache \
    HF_HOME=/app/cache \
    LOG_LEVEL=INFO \
    ENVIRONMENT=production \
    PYTHONUNBUFFERED=1

# Set working directory.
WORKDIR /app

# WORKDIR creates /app owned by root. Create the directories the application
# writes to (model cache, database) plus the frontend directory, and hand the
# whole tree to appuser so the unprivileged process can write there.
RUN mkdir -p /app/cache /app/data /app/frontend \
    && chown -R appuser:appuser /app

# Switch to non-root user. Everything below runs as appuser, so the cached
# model files end up owned by the same user that reads them at runtime.
USER appuser

# Pre-download TrOCR model to speed up startup.
# Placed before the source COPY so that editing application code does not
# invalidate this layer and force the model to be downloaded again.
RUN python -c "from transformers import TrOCRProcessor, VisionEncoderDecoderModel; \
TrOCRProcessor.from_pretrained('microsoft/trocr-base-printed'); \
VisionEncoderDecoderModel.from_pretrained('microsoft/trocr-base-printed')"

# Copy all files (ensuring frontend stays in /app/frontend).
COPY --chown=appuser:appuser . .

# Normalise permissions on the frontend tree (the directory itself was created
# above, so it exists even when the build context has no frontend folder).
RUN chmod -R 755 /app/frontend

# Expose port (documentation only; matches the uvicorn --port below).
EXPOSE 7860

# Healthcheck: long start period and generous retries because model loading
# can delay the first successful response from /health.
HEALTHCHECK --interval=45s --timeout=30s --start-period=180s --retries=10 \
    CMD curl -fs http://localhost:7860/health || exit 1

# Start app (exec form so uvicorn runs as PID 1 and receives stop signals).
CMD ["uvicorn", "main:app", "--host", "0.0.0.0", "--port", "7860", "--workers", "1", "--log-level", "info"]