Pedro/thinking budget tests (#4072)

2025-11-21 21:22:12 -08:00
parent 5ab41d649a
commit b52982d3c8
1 changed files with 27 additions and 2 deletions
--- a/skyvern/forge/sdk/api/llm/api_handler_factory.py
+++ b/skyvern/forge/sdk/api/llm/api_handler_factory.py
@@ -88,9 +88,34 @@ class LLMAPIHandlerFactory:
                check_model = llm_config.model_list[0].model_name or model_label  # type: ignore[attr-defined]
            except Exception:
                check_model = model_label
        # Check reasoning support (safe call - log but don't fail if litellm errors)
        supports_reasoning = False
        if check_model:
            try:
                supports_reasoning = litellm.supports_reasoning(model=check_model)
            except Exception as exc:  # pragma: no cover - diagnostic safeguard
                LOG.debug(
                    "Failed to check reasoning support via litellm",
                    model=check_model,
                    error=str(exc),
                )
        try:
-            # Early return if model doesn't support reasoning
+            # Gemini router/fallback configs (e.g., gemini-2.5-pro-gpt-5-fallback-router)
-            if check_model and not litellm.supports_reasoning(model=check_model):
+            # are not recognized by litellm, but they do support reasoning budgets.
            if not supports_reasoning and model_label:
                model_label_lower = model_label.lower()
                if "gemini" in model_label_lower and "fallback" in model_label_lower:
                    supports_reasoning = True
                    LOG.info(
                        "Forcing reasoning support for Gemini fallback model",
                        prompt_name=prompt_name,
                        budget=new_budget,
                        model=model_label,
                    )
            if check_model and not supports_reasoning:
                LOG.info(
                    "Thinking budget optimization not supported for model",
                    prompt_name=prompt_name,