From 2e3e014b80fc139a64d9e44502292462e7805397 Mon Sep 17 00:00:00 2001 From: "Billy D." Date: Mon, 9 Feb 2026 10:24:32 -0500 Subject: [PATCH] fixing nvidia and strixhalo --- dockerfiles/Dockerfile.ray-worker-nvidia | 1 + dockerfiles/Dockerfile.ray-worker-strixhalo | 5 +++++ 2 files changed, 6 insertions(+) diff --git a/dockerfiles/Dockerfile.ray-worker-nvidia b/dockerfiles/Dockerfile.ray-worker-nvidia index 0e40e79..d960281 100644 --- a/dockerfiles/Dockerfile.ray-worker-nvidia +++ b/dockerfiles/Dockerfile.ray-worker-nvidia @@ -45,6 +45,7 @@ RUN --mount=type=cache,target=/home/ray/.cache/uv,uid=1000,gid=1000 \ 'librosa>=0.10.0,<1.0' \ 'torch>=2.0.0,<3.0' \ 'torchaudio>=2.0.0,<3.0' \ + 'transformers>=4.46.0,<5.0' \ 'fastapi>=0.100.0,<1.0' \ 'uvicorn>=0.23.0,<1.0' \ 'httpx>=0.27.0,<1.0' \ diff --git a/dockerfiles/Dockerfile.ray-worker-strixhalo b/dockerfiles/Dockerfile.ray-worker-strixhalo index c134327..01df3f1 100644 --- a/dockerfiles/Dockerfile.ray-worker-strixhalo +++ b/dockerfiles/Dockerfile.ray-worker-strixhalo @@ -115,6 +115,11 @@ RUN echo "import strixhalo_vram_fix" > \ # Pre-download common models for faster cold starts (optional, increases image size) # RUN python3 -c "from sentence_transformers import SentenceTransformer; SentenceTransformer('BAAI/bge-large-en-v1.5')" +# Pre-create aiter JIT build cache directory. +# The vLLM ROCm aiter package compiles kernels on first import and needs +# this directory writable by the ray user (uid 1000), so chown it in the same layer. +RUN mkdir -p /home/ray/.aiter && chown 1000 /home/ray/.aiter + # Copy entrypoint script (ray-serve-apps is installed from PyPI at runtime) COPY --chown=1000:100 --chmod=755 dockerfiles/ray-entrypoint.sh /app/ray-entrypoint.sh