Refactor model availability check in is_serverless_endpoint_available (#363)

* Refactor model availability check in is_serverless_endpoint_available() function

* Refactor model ID retrieval in is_serverless_endpoint_available() function
davanstrien authored Mar 1, 2024
1 parent f255c16 commit f9e41b6
Showing 1 changed file with 5 additions and 5 deletions.
10 changes: 5 additions & 5 deletions src/distilabel/llm/huggingface/inference_endpoints.py
@@ -66,11 +66,11 @@ def is_serverless_endpoint_available(model_id: str) -> bool:
         # 2. Then we check if the model is currently deployed
         try:
             client = InferenceClient()
-            deploy_llms = client.list_deployed_models("text-generation-inference")[
-                "text-generation"
-            ]
-            if model_id in deploy_llms:
-                return True
+            status = client.get_model_status(model_id)
+            return (
+                status.state in {"Loadable", "Loaded"}
+                and status.framework == "text-generation-inference"
+            )
         except Exception as e:
             logger.error(e)
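The refactor replaces listing all deployed models with a per-model status query via `InferenceClient.get_model_status`. The real call needs network access and a Hugging Face endpoint, so the sketch below exercises only the new predicate offline, using a hypothetical stub standing in for `huggingface_hub`'s `ModelStatus`:

```python
from dataclasses import dataclass


# Hypothetical stand-in for huggingface_hub's ModelStatus; the real object
# is returned by InferenceClient.get_model_status(model_id).
@dataclass
class ModelStatus:
    state: str       # e.g. "Loadable", "Loaded", "TooBig", "Error"
    framework: str   # serving backend, e.g. "text-generation-inference"


def is_available(status: ModelStatus) -> bool:
    # Mirrors the predicate introduced by the commit: the model must be
    # loadable or already loaded, and served by text-generation-inference.
    return (
        status.state in {"Loadable", "Loaded"}
        and status.framework == "text-generation-inference"
    )


print(is_available(ModelStatus("Loaded", "text-generation-inference")))  # True
print(is_available(ModelStatus("TooBig", "text-generation-inference")))  # False
```

Querying a single model's status avoids fetching and scanning the full list of deployed models on every availability check.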

