diff --git a/container/Dockerfile.vllm b/container/Dockerfile.vllm index f42124b6ee..1a2469a76d 100644 --- a/container/Dockerfile.vllm +++ b/container/Dockerfile.vllm @@ -171,7 +171,8 @@ ENV PATH="${VIRTUAL_ENV}/bin:${PATH}" # TEMP: disable gds backend for arm64 RUN if [ "$ARCH" = "arm64" ]; then \ cd ${NIXL_SRC_DIR} && uv build . --out-dir /workspace/wheels/nixl \ - --config-settings=setup-args="-Ddisable_gds_backend=true -Dgds_path=/usr/local/cuda/targets/sbsa-linux"; \ + --config-settings=setup-args="-Ddisable_gds_backend=true" \ + --config-settings=setup-args="-Dgds_path=/usr/local/cuda/targets/sbsa-linux"; \ else \ cd ${NIXL_SRC_DIR} && uv build . --out-dir /workspace/wheels/nixl; \ fi && \ diff --git a/container/deps/vllm/install_vllm.sh b/container/deps/vllm/install_vllm.sh index ee48487a69..54384e18d1 100755 --- a/container/deps/vllm/install_vllm.sh +++ b/container/deps/vllm/install_vllm.sh @@ -119,9 +119,10 @@ if [ "$ARCH" = "arm64" ]; then # Try to install specific PyTorch version first, fallback to latest nightly echo "Attempting to install pinned PyTorch nightly versions..." - if ! uv pip install torch==2.9.0.dev20250712+cu128 torchvision==0.24.0.dev20250712+cu128 torchaudio==2.8.0.dev20250712+cu128 --index-url https://download.pytorch.org/whl/nightly/cu128; then - echo "Pinned versions failed, falling back to latest stable..." - uv pip install torch torchvision torchaudio --index-url https://download.pytorch.org/whl/cu128 + if ! uv pip install torch==2.8.0.dev20250613+cu128 torchaudio==2.8.0.dev20250616 torchvision==0.23.0.dev20250616 --index-url https://download.pytorch.org/whl/nightly/cu128; then + echo "Pinned versions failed" + exit 1 + # uv pip install torch torchvision torchaudio --index-url https://download.pytorch.org/whl/cu128 fi python use_existing_torch.py @@ -163,10 +164,14 @@ python setup.py install # Install Flash Infer -cd $INSTALLATION_DIR -git clone https://github.com/flashinfer-ai/flashinfer.git --recursive -cd flashinfer -git checkout $FLASHINF_REF -python -m pip install -v . +if [ "$ARCH" = "arm64" ]; then + uv pip install flashinfer-python +else + cd $INSTALLATION_DIR + git clone https://github.com/flashinfer-ai/flashinfer.git --recursive + cd flashinfer + git checkout $FLASHINF_REF + python -m pip install -v . +fi echo "vllm installation completed successfully"