fix: InferenceTimeoutError outdated
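Context for the commit: app.py imports InferenceTimeoutError from huggingface_hub.inference._common, an import location that newer huggingface_hub releases apparently no longer provide (hence "outdated" in the commit title). The diff below comments that import out and raises the built-in ValueError instead. An alternative, shown here only as a hedged sketch and not what this commit does, would be a guarded import that keeps the original exception type wherever the installed library still exposes it:

# Alternative sketch (not this commit's approach): keep the original exception type
# when the installed huggingface_hub still exposes it, and fall back otherwise.
try:
    # The class has been exported at the package top level across releases,
    # even as its defining submodule has moved around.
    from huggingface_hub import InferenceTimeoutError
except ImportError:
    class InferenceTimeoutError(TimeoutError):  # minimal stand-in, illustration only
        def __init__(self, message, *args, **kwargs):
            # Swallow the request=/response= keyword arguments the real class accepts.
            super().__init__(message, *args)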
app.py CHANGED
@@ -35,7 +35,7 @@ from huggingface_hub.utils import (
 from huggingface_hub.inference._common import (
     TASKS_EXPECTING_IMAGES,
     ContentT,
-    InferenceTimeoutError,
+    # InferenceTimeoutError,
     ModelStatus,
     _b64_encode,
     _b64_to_image,
@@ -216,7 +216,7 @@ class InferenceClientUS(InferenceClient):
                     )
                 except TimeoutError as error:
                     # Convert any `TimeoutError` to a `InferenceTimeoutError`
-                    raise InferenceTimeoutError(f"Inference call timed out: {url}") from error  # type: ignore
+                    raise ValueError(f"Inference call timed out: {url}, {error}")  # type: ignore

             try:
                 hf_raise_for_status(response)
@@ -225,12 +225,18 @@ class InferenceClientUS(InferenceClient):
                 if error.response.status_code == 503:
                     # If Model is unavailable, either raise a TimeoutError...
                     if timeout is not None and time.time() - t0 > timeout:
-                        raise InferenceTimeoutError(
+                        # raise InferenceTimeoutError(
+                        #     f"Model not loaded on the server: {url}. Please retry with a higher timeout (current:"
+                        #     f" {self.timeout}).",
+                        #     request=error.request,
+                        #     response=error.response,
+                        # ) from error
+                        raise ValueError(
                             f"Model not loaded on the server: {url}. Please retry with a higher timeout (current:"
-                            f" {self.timeout}).",
-                            request=error.request,
-                            response=error.response,
-                        ) from error
+                            f" {self.timeout}), Err:{error}"
+                            # request=error.request,
+                            # response=error.response,
+                        )
                     # ...or wait 1s and retry
                     logger.info(f"Waiting for model to be loaded on the server: {error}")
                     time.sleep(1)
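With this change, timeout and model-loading failures from the Space's client surface as the built-in ValueError rather than huggingface_hub's InferenceTimeoutError, so calling code needs to catch the new type. A minimal caller-side sketch, assuming InferenceClientUS is importable from this Space's app module, that it keeps the upstream InferenceClient constructor arguments (model, timeout), and that task methods such as text_generation route through the patched request path; the model id is a placeholder:

from app import InferenceClientUS  # assumed import path: the subclass defined in this Space's app.py

# Placeholder model id and timeout, for illustration only.
client = InferenceClientUS(model="gpt2", timeout=30)

try:
    print(client.text_generation("Hello, world"))
except ValueError as err:
    # After this commit, both the "inference call timed out" and the
    # "model not loaded on the server" branches raise ValueError
    # (previously huggingface_hub's InferenceTimeoutError).
    print(f"Inference failed: {err}")

One side effect of the switch: ValueError is much broader than the original exception, so callers can no longer distinguish a timeout from other value errors raised along the way; the message text is the only remaining signal.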