Spaces:
Paused
Paused
| # ββββββββββββββββ | |
| # Stage 1: Builder | |
| # ββββββββββββββββ | |
| FROM python:3.10-slim AS builder | |
| # Install build dependencies | |
| RUN apt-get update && apt-get install -y \ | |
| build-essential \ | |
| gcc \ | |
| g++ \ | |
| pkg-config \ | |
| libmupdf-dev \ | |
| && rm -rf /var/lib/apt/lists/* | |
| # Upgrade pip and install wheel | |
| RUN pip install --upgrade pip setuptools wheel | |
| # Create virtual environment | |
| RUN python -m venv /opt/venv | |
| ENV PATH="/opt/venv/bin:$PATH" | |
| # Copy requirements and install dependencies | |
| WORKDIR /build | |
| COPY requirements.txt . | |
| # Install Python packages | |
| RUN pip install --no-cache-dir -r requirements.txt | |
| # ββββββββββββββββ | |
| # Stage 2: Production | |
| # ββββββββββββββββ | |
| FROM python:3.10-slim | |
| # Install runtime dependencies | |
| RUN apt-get update && apt-get install -y \ | |
| poppler-utils \ | |
| tesseract-ocr \ | |
| tesseract-ocr-eng \ | |
| tesseract-ocr-fas \ | |
| mupdf-tools \ | |
| libmupdf-dev \ | |
| ffmpeg \ | |
| libopencv-dev \ | |
| libgl1-mesa-glx \ | |
| libglib2.0-0 \ | |
| libsm6 \ | |
| libxext6 \ | |
| libxrender-dev \ | |
| libgomp1 \ | |
| libgbm1 \ | |
| libxss1 \ | |
| libgtk-3-0 \ | |
| libxtst6 \ | |
| libxrandr2 \ | |
| libasound2 \ | |
| libpangocairo-1.0-0 \ | |
| libatk1.0-0 \ | |
| libcairo-gobject2 \ | |
| libgdk-pixbuf2.0-0 \ | |
| libffi-dev \ | |
| libssl-dev \ | |
| curl \ | |
| wget \ | |
| sqlite3 \ | |
| && rm -rf /var/lib/apt/lists/* \ | |
| && apt-get clean | |
| # Create non-root user | |
| RUN groupadd -g 1000 appuser && useradd -r -u 1000 -g appuser appuser | |
| # Copy virtual environment from builder | |
| COPY --from=builder /opt/venv /opt/venv | |
| ENV PATH="/opt/venv/bin:$PATH" | |
| # Set working directory | |
| WORKDIR /app | |
| # Copy all files (ensuring frontend stays in /app/frontend) | |
| COPY --chown=appuser:appuser . . | |
| # β Ensure frontend exists | |
| RUN mkdir -p /app/frontend && chmod -R 755 /app/frontend | |
| # Pre-download TrOCR model to speed up startup | |
| RUN python -c "from transformers import TrOCRProcessor, VisionEncoderDecoderModel; \ | |
| TrOCRProcessor.from_pretrained('microsoft/trocr-base-printed'); \ | |
| VisionEncoderDecoderModel.from_pretrained('microsoft/trocr-base-printed')" | |
| # Environment variables | |
| ENV PYTHONPATH=/app | |
| ENV DATABASE_DIR=/app/data | |
| ENV DATABASE_PATH=/app/data/legal_documents.db | |
| ENV TRANSFORMERS_CACHE=/app/cache | |
| ENV HF_HOME=/app/cache | |
| ENV LOG_LEVEL=INFO | |
| ENV ENVIRONMENT=production | |
| ENV PYTHONUNBUFFERED=1 | |
| # Switch to non-root user | |
| USER appuser | |
| # Expose port | |
| EXPOSE 7860 | |
| # Healthcheck | |
| HEALTHCHECK --interval=45s --timeout=30s --start-period=180s --retries=10 \ | |
| CMD curl -fs http://localhost:7860/health || exit 1 | |
| # Start app | |
| CMD ["uvicorn", "main:app", "--host", "0.0.0.0", "--port", "7860", "--workers", "1", "--log-level", "info"] | |