| # Use lightweight Python base | |
| FROM python:3.10-slim | |
| WORKDIR /app | |
| RUN apt-get update && apt-get install -y eatmydata && eatmydata apt-get install -y --no-install-recommends build-essential | |
| # Install Python deps first (better caching) | |
| COPY requirements.txt . | |
| RUN pip install --no-cache-dir -r requirements.txt | |
| # Copy app code | |
| COPY . . | |
| # Default envs (can override at runtime) | |
| ENV OPENAI_API_KEY=sk-no-key-needed | |
| # If you’ll use docker-compose with a llama.cpp service named "llama": | |
| ENV OPENAI_API_BASE=http://llama:8001/v1 | |
| # Expose FastAPI port | |
| EXPOSE 8000 | |
| # Run server | |
| CMD ["uvicorn", "main:app", "--host", "0.0.0.0", "--port", "8000"] | |