Check GPU without torch
daavoo committed Jan 17, 2025
commit d07ee3966509692e3d7f4402b673c7244d756eeb
12 changes: 10 additions & 2 deletions src/structured_qa/model_loaders.py
@@ -1,7 +1,15 @@
-import torch
+import subprocess
 from llama_cpp import Llama
 
 
+def gpu_available():
+    try:
+        subprocess.check_output("nvidia-smi")
+        return True
+    except Exception:
+        return False
+
+
 def load_llama_cpp_model(model_id: str) -> Llama:
     """
     Loads the given model_id using Llama.from_pretrained.
@@ -22,6 +30,6 @@ def load_llama_cpp_model(model_id: str) -> Llama:
         filename=filename,
         n_ctx=0,  # 0 means that the model limit will be used, instead of the default (512) or other hardcoded value
         verbose=False,
-        n_gpu_layers=-1 if torch.cuda.is_available() else 0,
+        n_gpu_layers=-1 if gpu_available() else 0,
     )
     return model
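
For reference, a minimal usage sketch of the new check (not part of the diff; the model_id value and its repo/filename split are hypothetical, inferred only from the filename= argument visible above):

    # Sketch only: gpu_available() shells out to nvidia-smi, so it returns True
    # only when the NVIDIA driver CLI is installed and exits without error.
    from structured_qa.model_loaders import gpu_available, load_llama_cpp_model

    if gpu_available():
        print("nvidia-smi found: all layers offloaded to GPU (n_gpu_layers=-1)")
    else:
        print("no NVIDIA GPU detected: running on CPU (n_gpu_layers=0)")

    # Hypothetical model_id in "<repo_id>/<filename>.gguf" form.
    model = load_llama_cpp_model(
        "bartowski/Qwen2.5-7B-Instruct-GGUF/Qwen2.5-7B-Instruct-Q4_K_M.gguf"
    )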