msse-ai-engineering / Dockerfile
sethmcknight
chore(docker): include synthetic_policies in image for startup ingestion
b8d81de
# Use an official Python runtime as a parent image
FROM python:3.10-slim AS base
ENV PYTHONDONTWRITEBYTECODE=1 \
PYTHONUNBUFFERED=1 \
PIP_NO_CACHE_DIR=1 \
PIP_DISABLE_PIP_VERSION_CHECK=1 \
# Constrain BLAS/parallel libs to avoid excess threads on small CPU
OMP_NUM_THREADS=1 \
OPENBLAS_NUM_THREADS=1 \
MKL_NUM_THREADS=1 \
NUMEXPR_NUM_THREADS=1 \
TOKENIZERS_PARALLELISM=false \
# ONNX Runtime threading limits (fallback if not explicitly set)
ORT_INTRA_OP_NUM_THREADS=1 \
ORT_INTER_OP_NUM_THREADS=1
WORKDIR /app
# Install build essentials only if needed for wheels (kept minimal)
RUN apt-get update && apt-get install -y --no-install-recommends \
build-essential \
procps \
&& rm -rf /var/lib/apt/lists/*
COPY constraints.txt requirements.txt ./
RUN python -m pip install --upgrade pip setuptools wheel \
&& pip install --no-cache-dir -r requirements.txt -c constraints.txt --only-binary=:all: || \
pip install --no-cache-dir -r requirements.txt -c constraints.txt
# Application source
COPY app.py ./app.py
COPY templates ./templates
COPY static ./static
COPY src ./src
COPY synthetic_policies ./synthetic_policies
COPY data ./data
COPY scripts ./scripts
COPY run.sh ./run.sh
COPY gunicorn.conf.py ./gunicorn.conf.py
RUN chmod +x run.sh && chmod +x scripts/init_pgvector.py || true
EXPOSE 8080
# Run the app via Gunicorn binding to 0.0.0.0:8080. Use conservative workers/threads
# to reduce memory usage on small instances.
CMD ["gunicorn", "-b", "0.0.0.0:8080", "-w", "2", "--threads", "2", "src.app_factory:create_app()"]
# Optional dev stage for local tooling (not used in final image)
FROM base AS dev
COPY dev-requirements.txt ./dev-requirements.txt
RUN pip install --no-cache-dir -r dev-requirements.txt -c constraints.txt || true