add vertex ai (#2243)

2025-04-29 03:11:56 +08:00
parent 7e4a193443
commit 47ad15a864
4 changed files with 82 additions and 7 deletions
--- a/skyvern/config.py
+++ b/skyvern/config.py
@@ -125,6 +125,7 @@ class Settings(BaseSettings):
    ENABLE_AZURE_O3_MINI: bool = False
    ENABLE_BEDROCK: bool = False
    ENABLE_GEMINI: bool = False
+    ENABLE_VERTEX_AI: bool = False
    ENABLE_AZURE_CUA: bool = False
    ENABLE_OPENAI_COMPATIBLE: bool = False
    # OPENAI
@@ -205,6 +206,9 @@ class Settings(BaseSettings):
    # GEMINI
    GEMINI_API_KEY: str | None = None

+    # VERTEX_AI
+    VERTEX_CREDENTIALS: str | None = None
+
    # NOVITA AI
    ENABLE_NOVITA: bool = False
    NOVITA_API_KEY: str | None = None
--- a/skyvern/forge/sdk/api/llm/config_registry.py
+++ b/skyvern/forge/sdk/api/llm/config_registry.py
@@ -733,6 +733,78 @@ if settings.ENABLE_NOVITA:
        ),
    )

+# Vertex AI: when ENABLE_VERTEX_AI is set, register the Gemini models below with VERTEX_CREDENTIALS.
+# Setup: create a GCP service account with Vertex AI API access enabled and download its credentials
+# JSON file (https://support.google.com/a/answer/7378726?hl=en), then set the environment variable
+# VERTEX_CREDENTIALS to json.dumps(json.load(open("my_credentials_file.json"))).
+if settings.ENABLE_VERTEX_AI:
+    LLMConfigRegistry.register_config(
+        "VERTEX_GEMINI_2.5_PRO_EXP_03_25",
+        LLMConfig(
+            "vertex_ai/gemini-2.5-pro-exp-03-25",  # experimental build, distinct from the preview entry below
+            ["VERTEX_CREDENTIALS"],
+            supports_vision=True,
+            add_assistant_prefix=False,
+            max_completion_tokens=65535,
+            litellm_params=LiteLLMParams(
+                vertex_credentials=settings.VERTEX_CREDENTIALS,  # type: ignore
+            ),
+        ),
+    )
+    LLMConfigRegistry.register_config(
+        "VERTEX_GEMINI_2.5_PRO_PREVIEW_03_25",
+        LLMConfig(
+            "vertex_ai/gemini-2.5-pro-preview-03-25",
+            ["VERTEX_CREDENTIALS"],
+            supports_vision=True,
+            add_assistant_prefix=False,
+            max_completion_tokens=65535,
+            litellm_params=LiteLLMParams(
+                vertex_credentials=settings.VERTEX_CREDENTIALS,  # type: ignore
+            ),
+        ),
+    )
+    LLMConfigRegistry.register_config(
+        "VERTEX_GEMINI_FLASH_2_0",
+        LLMConfig(
+            "vertex_ai/gemini-2.0-flash-001",
+            ["VERTEX_CREDENTIALS"],
+            supports_vision=True,
+            add_assistant_prefix=False,
+            max_completion_tokens=8192,
+            litellm_params=LiteLLMParams(
+                vertex_credentials=settings.VERTEX_CREDENTIALS,  # type: ignore
+            ),
+        ),
+    )
+    LLMConfigRegistry.register_config(
+        "VERTEX_GEMINI_PRO",
+        LLMConfig(
+            "vertex_ai/gemini-1.5-pro",
+            ["VERTEX_CREDENTIALS"],
+            supports_vision=True,
+            add_assistant_prefix=False,
+            max_completion_tokens=8192,
+            litellm_params=LiteLLMParams(
+                vertex_credentials=settings.VERTEX_CREDENTIALS,  # type: ignore
+            ),
+        ),
+    )
+    LLMConfigRegistry.register_config(
+        "VERTEX_GEMINI_FLASH",
+        LLMConfig(
+            "vertex_ai/gemini-1.5-flash",
+            ["VERTEX_CREDENTIALS"],
+            supports_vision=True,
+            add_assistant_prefix=False,
+            max_completion_tokens=8192,
+            litellm_params=LiteLLMParams(
+                vertex_credentials=settings.VERTEX_CREDENTIALS,  # type: ignore
+            ),
+        ),
+    )
+
+
 # Add support for dynamically configuring OpenAI-compatible LLM models
 # Based on liteLLM's support for OpenAI-compatible APIs
 # See documentation: https://docs.litellm.ai/docs/providers/openai_compatible