# Source revision: 9aab79d49b
# Commit message:
#   - Remove v1 Python CLI (src/kb_search/, tests/, root pyproject.toml, uv.lock, .venv)
#   - Add Go client with cross-platform build (client/)
#   - Add FastAPI engine with NVIDIA and multi-stage ROCm Dockerfiles (engine/)
#   - Add VERSION files for client and engine, wired into builds
#   - Add release.sh for automated build, tag, release, and Docker push
#   - Update README with build/release docs and ROCm migration note
#   - Clean up .gitignore for v2 project structure
#   Co-Authored-By: Claude Opus 4.6 (1M context) <noreply@anthropic.com>
# File as committed: Docker, 36 lines, 836 B
# Base image: NVIDIA CUDA 13.0.1 runtime on Ubuntu 24.04.
FROM nvidia/cuda:13.0.1-runtime-ubuntu24.04

# Build-time only: stops apt/dpkg from prompting during package installation.
# Declared as ARG (not ENV) so the setting is visible to the RUN steps of this
# stage but is not baked into the environment of the running container.
ARG DEBIAN_FRONTEND=noninteractive

# OS-level packages, installed in a single layer. `apt-get update` and
# `install` stay in the same RUN so the package index is never stale, and the
# index files are removed in that same layer so they do not end up in the
# image. Packages are listed one per line, sorted, to keep diffs readable.
RUN apt-get update && apt-get install -y --no-install-recommends \
        build-essential \
        curl \
        libgl1 \
        libglib2.0-0 \
        libpoppler-cpp-dev \
        poppler-utils \
        python3-pip \
        python3.12 \
        python3.12-dev \
        python3.12-venv \
    && rm -rf /var/lib/apt/lists/*

# Copy the uv binary out of the published uv image. The tag is pinned to a
# release line rather than `latest` so a rebuild does not silently pick up a
# new uv; bump it deliberately, or pin a full patch version / digest for
# stricter reproducibility.
COPY --from=ghcr.io/astral-sh/uv:0.8 /uv /usr/local/bin/uv

WORKDIR /app

# Project metadata and sources. Everything is copied before the install step
# because the project is installed in editable mode from /app.
COPY pyproject.toml main.py VERSION ./
COPY kb/ kb/

# Create /app/.venv and install the project into it.
#  - No `activate` is needed: `uv pip` uses the `.venv` found in the working
#    directory.
#  - `--no-cache` keeps uv's download cache out of the image layer.
#  - onnxruntime-gpu is installed last and with `--no-deps`, i.e. without
#    touching the dependency set resolved for the project itself.
#    NOTE(review): presumably this overlays the GPU build on whatever the
#    project's dependencies pulled in -- confirm against pyproject.toml.
RUN uv venv .venv \
    && uv pip install --no-cache -e . \
    && uv pip install --no-cache --no-deps onnxruntime-gpu

# Put the virtualenv first on PATH so `uvicorn` resolves to /app/.venv/bin
# without an explicit activation step; VIRTUAL_ENV points tools at the same
# environment.
ENV PATH="/app/.venv/bin:$PATH" \
    VIRTUAL_ENV="/app/.venv"

# Default settings exported to the container environment (presumably read by
# the application at startup -- verify against main.py / kb). KB_DATA_DIR
# matches the /data volume declared below.
ENV KB_DEVICE=auto \
    KB_INGEST_DEVICE=auto \
    KB_DATA_DIR=/data

# Port the server listens on (documentation only; publish it with -p).
EXPOSE 8000

# Mount point for persistent data.
VOLUME ["/data"]

# NOTE(review): no USER is set, so the server runs as root. Switching to a
# non-root user also requires making /data writable for that user; left
# unchanged here.

# Exec form so uvicorn is PID 1 and receives stop signals directly.
CMD ["uvicorn", "main:app", "--host", "0.0.0.0", "--port", "8000"]