Skip to content

Commit a88151d

Browse files
Add change to inform caller about model loading failures due to environment constraints being violated (#2180)
* Add change to inform caller about model loading failures due to environment constraints being violated * Add initial tests and fix mistake * Add tests and bump dependencies in inference
1 parent 57b58c0 commit a88151d

File tree

24 files changed

+716
-50
lines changed

24 files changed

+716
-50
lines changed

inference/core/exceptions.py

Lines changed: 4 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -215,6 +215,10 @@ class CannotInitialiseModelError(Exception):
215215
pass
216216

217217

218+
class CannotInitialiseModelDueToInputSizeError(CannotInitialiseModelError):
219+
pass
220+
221+
218222
class RetryRequestError(Exception):
219223

220224
def __init__(self, message: str, inner_error: Exception):

inference/core/interfaces/http/error_handlers.py

Lines changed: 80 additions & 2 deletions
Original file line numberDiff line numberDiff line change
@@ -5,6 +5,7 @@
55
from inference.core import logger
66
from inference.core.entities.responses.workflows import WorkflowErrorResponse
77
from inference.core.exceptions import (
8+
CannotInitialiseModelDueToInputSizeError,
89
ContentTypeInvalid,
910
ContentTypeMissing,
1011
CreditsExceededError,
@@ -59,6 +60,7 @@
5960
NotSupportedExecutionEngineError,
6061
ReferenceTypeError,
6162
RuntimeInputError,
63+
RuntimeLimitsCausedStepExecutionError,
6264
StepExecutionError,
6365
StepInputDimensionalityError,
6466
WorkflowBlockError,
@@ -77,7 +79,9 @@
7779
ModelInputError,
7880
ModelLoadingError,
7981
ModelNotFoundError,
82+
ModelPackageAlternativesExhaustedError,
8083
ModelPackageNegotiationError,
84+
ModelPackageRestrictedError,
8185
ModelRetrievalError,
8286
UnauthorizedModelAccessError,
8387
UntrustedFileError,
@@ -309,6 +313,40 @@ def wrapped_route(*args, **kwargs):
309313
resp = JSONResponse(
310314
status_code=500, content={"message": "Model package is broken."}
311315
)
316+
except (
317+
CannotInitialiseModelDueToInputSizeError,
318+
ModelPackageRestrictedError,
319+
) as error:
320+
logger.exception("%s: %s", type(error).__name__, error)
321+
resp = JSONResponse(
322+
status_code=507,
323+
content={
324+
"message": "Model loading failed due to restrictions of server configuration - "
325+
"usually due to excessive runtime memory requirement of the model (for instance "
326+
"caused by large input size).",
327+
},
328+
)
329+
except ModelPackageAlternativesExhaustedError as error:
330+
logger.exception("%s: %s", type(error).__name__, error)
331+
inner_errors = error.alternatives_errors or []
332+
if any(isinstance(e, ModelPackageRestrictedError) for e in inner_errors):
333+
resp = JSONResponse(
334+
status_code=507,
335+
content={
336+
"message": "Model loading failed due to restrictions of server configuration - "
337+
"usually due to excessive runtime memory requirement of the model (for instance "
338+
"caused by large input size).",
339+
"help_url": error.help_url,
340+
},
341+
)
342+
else:
343+
resp = JSONResponse(
344+
status_code=500,
345+
content={
346+
"message": f"Model loading failed: {error}",
347+
"help_url": error.help_url,
348+
},
349+
)
312350
except ModelLoadingError as error:
313351
logger.exception("%s: %s", type(error).__name__, error)
314352
resp = JSONResponse(
@@ -389,7 +427,10 @@ def wrapped_route(*args, **kwargs):
389427
"message": "Timeout when attempting to connect to Roboflow API."
390428
},
391429
)
392-
except ClientCausedStepExecutionError as error:
430+
except (
431+
ClientCausedStepExecutionError,
432+
RuntimeLimitsCausedStepExecutionError,
433+
) as error:
393434
logger.exception("%s: %s", type(error).__name__, error)
394435
content = WorkflowErrorResponse(
395436
message=str(error.public_message),
@@ -711,6 +752,40 @@ async def wrapped_route(*args, **kwargs):
711752
resp = JSONResponse(
712753
status_code=500, content={"message": "Model package is broken."}
713754
)
755+
except (
756+
CannotInitialiseModelDueToInputSizeError,
757+
ModelPackageRestrictedError,
758+
) as error:
759+
logger.exception("%s: %s", type(error).__name__, error)
760+
resp = JSONResponse(
761+
status_code=507,
762+
content={
763+
"message": "Model loading failed due to restrictions of server configuration - "
764+
"usually due to excessive runtime memory requirement of the model (for instance "
765+
"caused by large input size).",
766+
},
767+
)
768+
except ModelPackageAlternativesExhaustedError as error:
769+
logger.exception("%s: %s", type(error).__name__, error)
770+
inner_errors = error.alternatives_errors or []
771+
if any(isinstance(e, ModelPackageRestrictedError) for e in inner_errors):
772+
resp = JSONResponse(
773+
status_code=507,
774+
content={
775+
"message": "Model loading failed due to restrictions of server configuration - "
776+
"usually due to excessive runtime memory requirement of the model (for instance "
777+
"caused by large input size).",
778+
"help_url": error.help_url,
779+
},
780+
)
781+
else:
782+
resp = JSONResponse(
783+
status_code=500,
784+
content={
785+
"message": f"Model loading failed: {error}",
786+
"help_url": error.help_url,
787+
},
788+
)
714789
except ModelLoadingError as error:
715790
logger.exception("%s: %s", type(error).__name__, error)
716791
resp = JSONResponse(
@@ -791,7 +866,10 @@ async def wrapped_route(*args, **kwargs):
791866
"message": "Timeout when attempting to connect to Roboflow API."
792867
},
793868
)
794-
except ClientCausedStepExecutionError as error:
869+
except (
870+
ClientCausedStepExecutionError,
871+
RuntimeLimitsCausedStepExecutionError,
872+
) as error:
795873
logger.exception("%s: %s", type(error).__name__, error)
796874
content = WorkflowErrorResponse(
797875
message=str(error.public_message),

inference/core/workflows/errors.py

Lines changed: 16 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -189,6 +189,22 @@ def __init__(
189189
self.status_code = status_code
190190

191191

192+
class RuntimeLimitsCausedStepExecutionError(WorkflowExecutionEngineError):
193+
def __init__(
194+
self,
195+
block_id: str,
196+
status_code: int,
197+
public_message: str,
198+
context: str,
199+
inner_error: Optional[Exception] = None,
200+
):
201+
super().__init__(
202+
public_message=public_message, context=context, inner_error=inner_error
203+
)
204+
self.block_id = block_id
205+
self.status_code = status_code
206+
207+
192208
class ExecutionEngineRuntimeError(WorkflowExecutionEngineError):
193209
pass
194210

inference/core/workflows/execution_engine/v1/step_error_handlers.py

Lines changed: 53 additions & 2 deletions
Original file line numberDiff line numberDiff line change
@@ -1,4 +1,5 @@
11
from inference.core.exceptions import (
2+
CannotInitialiseModelDueToInputSizeError,
23
InferenceModelNotFound,
34
InvalidModelIDError,
45
ModelManagerLockAcquisitionError,
@@ -7,8 +8,16 @@
78
RoboflowAPINotAuthorizedError,
89
RoboflowAPINotNotFoundError,
910
)
10-
from inference.core.workflows.errors import ClientCausedStepExecutionError
11-
from inference_models.errors import ModelNotFoundError, UnauthorizedModelAccessError
11+
from inference.core.workflows.errors import (
12+
ClientCausedStepExecutionError,
13+
RuntimeLimitsCausedStepExecutionError,
14+
)
15+
from inference_models.errors import (
16+
ModelNotFoundError,
17+
ModelPackageAlternativesExhaustedError,
18+
ModelPackageRestrictedError,
19+
UnauthorizedModelAccessError,
20+
)
1221
from inference_sdk.http.errors import HTTPCallErrorError
1322

1423

@@ -27,6 +36,39 @@ def extended_roboflow_errors_handler(step_name: str, error: Exception) -> None:
2736
),
2837
):
2938
raise error
39+
if isinstance(error, CannotInitialiseModelDueToInputSizeError):
40+
raise RuntimeLimitsCausedStepExecutionError(
41+
block_id=step_name,
42+
status_code=507,
43+
public_message=f"Could not complete workflow execution due to configured runtime constraints. "
44+
f"Details: model input size causes runtime memory requirements exceed the limit "
45+
f"configured for the environment.",
46+
context="workflow_execution | step_execution",
47+
inner_error=error,
48+
) from error
49+
if isinstance(error, ModelPackageRestrictedError):
50+
raise RuntimeLimitsCausedStepExecutionError(
51+
block_id=step_name,
52+
status_code=507,
53+
public_message="Model loading failed due to restrictions of server configuration - "
54+
"usually due to excessive runtime memory requirement of the model (for instance "
55+
"caused by large input size).",
56+
context="workflow_execution | step_execution",
57+
inner_error=error,
58+
) from error
59+
if isinstance(error, ModelPackageAlternativesExhaustedError) and any(
60+
isinstance(e, ModelPackageRestrictedError)
61+
for e in (error.alternatives_errors or [])
62+
):
63+
raise RuntimeLimitsCausedStepExecutionError(
64+
block_id=step_name,
65+
status_code=507,
66+
public_message="Model loading failed due to restrictions of server configuration - "
67+
"usually due to excessive runtime memory requirement of the model (for instance "
68+
"caused by large input size).",
69+
context="workflow_execution | step_execution",
70+
inner_error=error,
71+
) from error
3072
if isinstance(error, InvalidModelIDError):
3173
raise ClientCausedStepExecutionError(
3274
block_id=step_name,
@@ -117,4 +159,13 @@ def extended_roboflow_errors_handler(step_name: str, error: Exception) -> None:
117159
context="workflow_execution | step_execution",
118160
inner_error=error,
119161
) from error
162+
if error.status_code == 507:
163+
raise RuntimeLimitsCausedStepExecutionError(
164+
block_id=step_name,
165+
status_code=507,
166+
public_message=f"Could not complete workflow execution due to configured runtime constraints. "
167+
f"Details: {error.api_message}",
168+
context="workflow_execution | step_execution",
169+
inner_error=error,
170+
) from error
120171
return None

inference/models/rfdetr/rfdetr.py

Lines changed: 4 additions & 2 deletions
Original file line numberDiff line numberDiff line change
@@ -22,7 +22,7 @@
2222
USE_PYTORCH_FOR_PREPROCESSING,
2323
)
2424
from inference.core.exceptions import (
25-
CannotInitialiseModelError,
25+
CannotInitialiseModelDueToInputSizeError,
2626
ModelArtefactError,
2727
OnnxProviderNotAvailable,
2828
)
@@ -450,7 +450,9 @@ def initialize_model(self, **kwargs) -> None:
450450
input_resolution,
451451
RFDETR_ONNX_MAX_RESOLUTION,
452452
)
453-
raise CannotInitialiseModelError(f"Resolution too high for RFDETR")
453+
raise CannotInitialiseModelDueToInputSizeError(
454+
f"Resolution too high for RFDETR"
455+
)
454456

455457
logger.debug("Creating inference session")
456458
if self.load_weights or not self.has_model_metadata:

inference_models/docs/changelog.md

Lines changed: 10 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -1,5 +1,15 @@
11
# Changelog
22

3+
## `0.24.1`
4+
5+
### Changed
6+
7+
- Added optional field `alternatives_errors` to `ModelPackageAlternativesExhaustedError`, making it possible
8+
to report to the caller what types of errors happened during the load - making it possible to deduce if
9+
problem with loading is recoverable.
10+
11+
---
12+
313
## `0.24.0`
414

515
### Added

inference_models/inference_models/errors.py

Lines changed: 14 additions & 2 deletions
Original file line numberDiff line numberDiff line change
@@ -1,4 +1,4 @@
1-
from typing import Optional
1+
from typing import List, Optional
22

33

44
class BaseInferenceModelsError(Exception):
@@ -106,7 +106,19 @@ class ModelLoadingError(BaseInferenceModelsError):
106106

107107

108108
class ModelPackageAlternativesExhaustedError(ModelLoadingError):
109-
pass
109+
110+
def __init__(
111+
self,
112+
message: str,
113+
help_url: Optional[str] = None,
114+
alternatives_errors: Optional[List[Exception]] = None,
115+
):
116+
super().__init__(message, help_url)
117+
self._alternatives_errors = alternatives_errors
118+
119+
@property
120+
def alternatives_errors(self) -> Optional[List[Exception]]:
121+
return self._alternatives_errors
110122

111123

112124
class MissingModelInitParameterError(ModelLoadingError):

inference_models/inference_models/models/auto_loaders/core.py

Lines changed: 1 addition & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -1203,6 +1203,7 @@ def attempt_loading_matching_model_packages(
12031203
f"the event. https://github.com/roboflow/inference/issues\n\n"
12041204
f"Here is the summary of errors for specific model packages:\n{summary_of_errors}\n\n",
12051205
help_url="https://inference-models.roboflow.com/errors/model-loading/#modelpackagealternativesexhaustederror",
1206+
alternatives_errors=[summary[1] for summary in failed_load_attempts],
12061207
)
12071208

12081209

inference_models/pyproject.toml

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -1,6 +1,6 @@
11
[project]
22
name = "inference-models"
3-
version = "0.24.0"
3+
version = "0.24.1"
44
description = "The new inference engine for Computer Vision models"
55
readme = "README.md"
66
requires-python = ">=3.10,<3.13"

inference_models/uv.lock

Lines changed: 1 addition & 1 deletion
Some generated files are not rendered by default. Learn more about customizing how changed files appear on GitHub.

0 commit comments

Comments
 (0)