diff --git a/container/Dockerfile.vllm b/container/Dockerfile.vllm
index f42124b6ee..1a2469a76d 100644
--- a/container/Dockerfile.vllm
+++ b/container/Dockerfile.vllm
@@ -171,7 +171,8 @@ ENV PATH="${VIRTUAL_ENV}/bin:${PATH}"
-# TEMP: disable gds backend for arm64
+# TEMP: disable gds backend for arm64 (one -D option per --config-settings=setup-args entry)
 RUN if [ "$ARCH" = "arm64" ]; then \
         cd ${NIXL_SRC_DIR} && uv build . --out-dir /workspace/wheels/nixl \
-        --config-settings=setup-args="-Ddisable_gds_backend=true -Dgds_path=/usr/local/cuda/targets/sbsa-linux"; \
+        --config-settings=setup-args="-Ddisable_gds_backend=true" \
+        --config-settings=setup-args="-Dgds_path=/usr/local/cuda/targets/sbsa-linux"; \
     else \
         cd ${NIXL_SRC_DIR} && uv build . --out-dir /workspace/wheels/nixl; \
     fi && \
diff --git a/container/deps/vllm/install_vllm.sh b/container/deps/vllm/install_vllm.sh
index ee48487a69..54384e18d1 100755
--- a/container/deps/vllm/install_vllm.sh
+++ b/container/deps/vllm/install_vllm.sh
@@ -119,9 +119,10 @@ if [ "$ARCH" = "arm64" ]; then
 
-    # Try to install specific PyTorch version first, fallback to latest nightly
+    # Install the pinned PyTorch nightly versions; abort the script if they cannot be installed
     echo "Attempting to install pinned PyTorch nightly versions..."
-    if ! uv pip install torch==2.9.0.dev20250712+cu128 torchvision==0.24.0.dev20250712+cu128 torchaudio==2.8.0.dev20250712+cu128 --index-url https://download.pytorch.org/whl/nightly/cu128; then
-        echo "Pinned versions failed, falling back to latest stable..."
-        uv pip install torch torchvision torchaudio --index-url https://download.pytorch.org/whl/cu128
+    if ! uv pip install torch==2.8.0.dev20250613+cu128 torchaudio==2.8.0.dev20250616 torchvision==0.23.0.dev20250616 --index-url https://download.pytorch.org/whl/nightly/cu128; then
+        # No fallback to unpinned wheels: stop here when the pinned set is unavailable.
+        echo "Pinned versions failed" >&2
+        exit 1
     fi
 
     python use_existing_torch.py
@@ -163,10 +164,14 @@ python setup.py install
 
 
-# Install Flash Infer
-cd $INSTALLATION_DIR
-git clone https://github.com/flashinfer-ai/flashinfer.git --recursive
-cd flashinfer
-git checkout $FLASHINF_REF
-python -m pip install -v .
+# Install Flash Infer (arm64: flashinfer-python package via uv, not tied to $FLASHINF_REF; otherwise: source build at $FLASHINF_REF)
+if [ "$ARCH" = "arm64" ]; then
+    uv pip install flashinfer-python
+else
+    cd "$INSTALLATION_DIR" || exit 1
+    git clone https://github.com/flashinfer-ai/flashinfer.git --recursive
+    cd flashinfer || exit 1
+    git checkout "$FLASHINF_REF"
+    python -m pip install -v .
+fi
 
 echo "vllm installation completed successfully"