diff --git a/dockerfiles/Dockerfile.ray-worker-strixhalo b/dockerfiles/Dockerfile.ray-worker-strixhalo
index 84f4559..2fcbca8 100644
--- a/dockerfiles/Dockerfile.ray-worker-strixhalo
+++ b/dockerfiles/Dockerfile.ray-worker-strixhalo
@@ -206,6 +206,15 @@ RUN --mount=type=cache,target=/root/.cache/uv \
         'grpcio>=1.60.0' \
         'protobuf>=4.25.0'
 
+# ── Ray Serve application package ──────────────────────────────────────
+# Baked into the image so the LLM serve app can use the source-built vllm
+# from /opt/venv instead of a pip runtime_env virtualenv (which would
+# shadow it with a PyPI vllm that lacks ROCm support).
+RUN --mount=type=cache,target=/root/.cache/uv \
+    uv pip install --python /opt/venv/bin/python3 \
+        --extra-index-url https://git.daviestechlabs.io/api/packages/daviestechlabs/pypi/simple/ \
+        'ray-serve-apps==1.0.1+10'
+
 # ── Verify vendor torch survived ───────────────────────────────────────
 # Fail early if any install step accidentally replaced the vendor torch.
 RUN python3 -c "\