From 06daa9834fc30b4038afc390084b86a49d730150 Mon Sep 17 00:00:00 2001
From: Shuchang Zheng
Date: Thu, 29 Aug 2024 12:19:51 -0700
Subject: [PATCH] catch litellm no deployment error (token ratelimit / ValueError) and raise LLMProviderErrorRetryableTask (#758)

---
 skyvern/forge/sdk/api/llm/api_handler_factory.py | 7 +++++++
 1 file changed, 7 insertions(+)

diff --git a/skyvern/forge/sdk/api/llm/api_handler_factory.py b/skyvern/forge/sdk/api/llm/api_handler_factory.py
index 8bc26b27..d73519b5 100644
--- a/skyvern/forge/sdk/api/llm/api_handler_factory.py
+++ b/skyvern/forge/sdk/api/llm/api_handler_factory.py
@@ -108,6 +108,13 @@ class LLMAPIHandlerFactory:
                 LOG.info("LLM API call successful", llm_key=llm_key, model=llm_config.model_name)
             except litellm.exceptions.APIError as e:
                 raise LLMProviderErrorRetryableTask(llm_key) from e
+            except ValueError as e:
+                LOG.exception(
+                    "LLM token limit exceeded",
+                    llm_key=llm_key,
+                    model=main_model_group,
+                )
+                raise LLMProviderErrorRetryableTask(llm_key) from e
             except Exception as e:
                 LOG.exception(
                     "LLM request failed unexpectedly",