Update to allow a local model cache for prediction

Eliotdoesprogramming · Eliotdoesprogramming · commit ba4cc070bb68 · 2024-12-02T12:43:31.000-06:00
diff --git a/.gitignore b/.gitignore
@@ -225,4 +225,5 @@ Next steps
 To learn more about publishing packages, check out the PyPA guides on building and publishing.
 
 Or, read on for guides on integrating uv with other software.
-.ruff_cache/
+.ruff_cache/
+model_cache/
diff --git a/src/api/endpoints.py b/src/api/endpoints.py
@@ -747,9 +747,14 @@ async def predict(model_id: str, text: str) -> dict:
     """
     try:
         # First try loading as a registered model
+        if "model_cache" not in os.listdir():
+            os.makedirs("model_cache", exist_ok=True)
         dst_path = f"model_cache/{model_id}"
         if model_id in os.listdir("model_cache"):
-            loaded_model = mlflow.pyfunc.load_model(dst_path)
+            try:
+                loaded_model = mlflow.pyfunc.load_model(dst_path + "/intent_model")
+            except mlflow.exceptions.MlflowException as e:
+                raise HTTPException(status_code=500, detail=str(e))
         else:
             os.makedirs(dst_path, exist_ok=True)
             try: