
feat: add cpu/cuda config for prompt guard #2194

Open · wants to merge 1 commit into main

llama_stack/providers/inline/safety/prompt_guard/config.py (14 additions, 0 deletions):
```diff
@@ -15,8 +15,14 @@ class PromptGuardType(Enum):
     jailbreak = "jailbreak"
 
 
+class PromptGuardExecutionType(Enum):
+    cpu = "cpu"
+    cuda = "cuda"
+
+
 class PromptGuardConfig(BaseModel):
     guard_type: str = PromptGuardType.injection.value
+    guard_execution_type: str = PromptGuardExecutionType.cuda.value
 
     @classmethod
     @field_validator("guard_type")
@@ -25,8 +31,16 @@ def validate_guard_type(cls, v):
             raise ValueError(f"Unknown prompt guard type: {v}")
         return v
 
+    @classmethod
+    @field_validator("guard_execution_type")
+    def validate_guard_execution_type(cls, v):
+        if v not in [t.value for t in PromptGuardExecutionType]:
+            raise ValueError(f"Unknown prompt guard execution type: {v}")
+        return v
+
     @classmethod
     def sample_run_config(cls, __distro_dir__: str, **kwargs: Any) -> dict[str, Any]:
         return {
             "guard_type": "injection",
+            "guard_execution_type": "cuda",
         }
```
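
For illustration, a minimal sketch of how the new field behaves once this PR is applied, assuming the import path shown in the diff header above:

```python
from llama_stack.providers.inline.safety.prompt_guard.config import (
    PromptGuardConfig,
    PromptGuardExecutionType,
)

# The default preserves the previously hard-coded behavior: CUDA.
cfg = PromptGuardConfig()
assert cfg.guard_execution_type == PromptGuardExecutionType.cuda.value

# Opt into CPU execution explicitly, e.g. on hosts without a GPU.
cpu_cfg = PromptGuardConfig(guard_execution_type="cpu")
assert cpu_cfg.guard_execution_type == "cpu"
```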
In the shield implementation (the second file in the diff), the hard-coded device is replaced by the new config value:

```diff
@@ -75,7 +75,7 @@ def __init__(
         self.temperature = temperature
         self.threshold = threshold
 
-        self.device = "cuda"
+        self.device = self.config.guard_execution_type
 
         # load model and tokenizer
         self.tokenizer = AutoTokenizer.from_pretrained(model_dir)
```

Contributor, commenting on the `self.device` change:

> Can we just check if CUDA is available and use that, otherwise use CPU? No need for a specific configuration like this to be added.
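
A minimal sketch of the reviewer's suggestion, using torch's built-in device detection; `resolve_device` is a hypothetical helper for illustration, not code from this PR:

```python
import torch


def resolve_device() -> str:
    """Prefer CUDA when a GPU is visible, otherwise fall back to CPU."""
    return "cuda" if torch.cuda.is_available() else "cpu"


# Inside __init__, instead of reading a config knob:
# self.device = resolve_device()
```

This would make the provider work out of the box on CPU-only hosts without adding a `guard_execution_type` option, at the cost of losing the ability to force CPU execution on a machine that does have a GPU.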