From 02cf2a1e87fc15fea19437b046b653f9b807a887 Mon Sep 17 00:00:00 2001 From: Kerem Yilmaz Date: Tue, 16 Apr 2024 14:52:15 -0700 Subject: [PATCH] New LLM Router strategy (#199) --- poetry.lock | 6 +++--- .../src/routes/tasks/create/CreateNewTaskForm.tsx | 2 +- skyvern/forge/sdk/api/llm/models.py | 3 ++- 3 files changed, 6 insertions(+), 5 deletions(-) diff --git a/poetry.lock b/poetry.lock index 3a2b88f8..1ad4be01 100644 --- a/poetry.lock +++ b/poetry.lock @@ -2767,13 +2767,13 @@ files = [ [[package]] name = "litellm" -version = "1.34.41" +version = "1.35.8" description = "Library to easily interface with LLM API providers" optional = false python-versions = "!=2.7.*,!=3.0.*,!=3.1.*,!=3.2.*,!=3.3.*,!=3.4.*,!=3.5.*,!=3.6.*,!=3.7.*,>=3.8" files = [ - {file = "litellm-1.34.41-py3-none-any.whl", hash = "sha256:ec6b1fb7f27178ad36f3be64e2f0fb73a637c0d7c128d5aa1d845414cc21be66"}, - {file = "litellm-1.34.41.tar.gz", hash = "sha256:e8ad1a0b9cf4abea0471394db8c95f479e94e271bc1ce3d98204e1a6ed917e93"}, + {file = "litellm-1.35.8-py3-none-any.whl", hash = "sha256:0b328b37b6c40e5ece82f701bcb92e4d1d76ffb070e03f6c3abfbc6030bf07b8"}, + {file = "litellm-1.35.8.tar.gz", hash = "sha256:0a8c031a01c19f2cfd9d873ff89bebc120917ec88f5656c1464a64d38e7c782d"}, ] [package.dependencies] diff --git a/skyvern-frontend/src/routes/tasks/create/CreateNewTaskForm.tsx b/skyvern-frontend/src/routes/tasks/create/CreateNewTaskForm.tsx index 5133a931..9776fad3 100644 --- a/skyvern-frontend/src/routes/tasks/create/CreateNewTaskForm.tsx +++ b/skyvern-frontend/src/routes/tasks/create/CreateNewTaskForm.tsx @@ -299,7 +299,7 @@ function CreateNewTaskForm({ initialValues }: Props) { body: createTaskRequestObject(form.getValues()), headers: { "Content-Type": "application/json", - "x-api-key": envCredential ?? "", + "x-api-key": envCredential ?? "", }, }); await navigator.clipboard.writeText(curl); diff --git a/skyvern/forge/sdk/api/llm/models.py b/skyvern/forge/sdk/api/llm/models.py index 9db88873..2605bd82 100644 --- a/skyvern/forge/sdk/api/llm/models.py +++ b/skyvern/forge/sdk/api/llm/models.py @@ -43,8 +43,9 @@ class LLMRouterConfig(LLMConfig): "simple-shuffle", "least-busy", "usage-based-routing", + "usage-based-routing-v2", "latency-based-routing", - ] = "usage-based-routing" + ] = "usage-based-routing-v2" num_retries: int = 2 retry_delay_seconds: int = 15 set_verbose: bool = False