Files
Benjamin Boenisch ad111d5e69 Initial commit: breakpilot-core - Shared Infrastructure
Docker Compose with 24+ services:
- PostgreSQL (PostGIS), Valkey, MinIO, Qdrant
- Vault (PKI/TLS), Nginx (Reverse Proxy)
- Backend Core API, Consent Service, Billing Service
- RAG Service, Embedding Service
- Gitea, Woodpecker CI/CD
- Night Scheduler, Health Aggregator
- Jitsi (Web/XMPP/JVB/Jicofo), Mailpit

Co-Authored-By: Claude Opus 4.6 <noreply@anthropic.com>
2026-02-11 23:47:13 +01:00

37 lines
1.1 KiB
Docker

# Embedding service image.
# Hosts the ML-heavy workloads: embeddings, re-ranking and PDF extraction.
FROM python:3.11-slim

WORKDIR /app

# OS-level packages required for PDF extraction.
# The apt package lists are deleted in the same layer so they never
# contribute to the final image size.
RUN apt-get update \
    && apt-get install --yes --no-install-recommends \
        libmagic1 \
        poppler-utils \
        tesseract-ocr \
        tesseract-ocr-deu \
    && rm -rf /var/lib/apt/lists/*
# PyTorch comes from the CPU-only wheel index, which keeps the image smaller.
RUN pip install --no-cache-dir \
        --index-url https://download.pytorch.org/whl/cpu \
        torch

# The dependency manifest is copied on its own, ahead of the source tree,
# so this layer stays cached until requirements.txt itself changes.
COPY requirements.txt ./
RUN pip install --no-cache-dir --requirement requirements.txt

# Models are not baked into the image; they are fetched on first startup.
# That keeps the build fast at the cost of a slower first start.
# To avoid downloading them again in every fresh container, mount a
# persistent volume at /root/.cache/huggingface.

# Application source
COPY . ./
# Port the uvicorn server below listens on. EXPOSE is documentation only;
# it does not publish the port.
EXPOSE 8087

# Health check: request /health using only the Python standard library, so
# the probe does not depend on a third-party HTTP client being present in
# requirements.txt. urlopen() raises on connection failure and on 4xx/5xx
# responses, which makes the probe exit non-zero. The 5s socket timeout
# stays below the 10s HEALTHCHECK timeout so a hung request fails cleanly.
# 127.0.0.1 is used because the server binds the IPv4 wildcard address.
HEALTHCHECK --interval=30s --timeout=10s --start-period=60s --retries=3 \
    CMD python -c "import urllib.request; urllib.request.urlopen('http://127.0.0.1:8087/health', timeout=5)"

# NOTE(review): there is no USER instruction, so the service runs as root.
# Switching to a non-root user would also move the Hugging Face cache away
# from /root/.cache/huggingface, so any volume mounts must be updated together
# with that change.

# Run the service (exec form, so uvicorn is PID 1 and receives SIGTERM).
CMD ["uvicorn", "main:app", "--host", "0.0.0.0", "--port", "8087"]