From 2141b1956c7bf16a97067ad4bd83de8627f083f1 Mon Sep 17 00:00:00 2001
From: ykeremy
Date: Thu, 18 Jul 2024 22:31:22 +0000
Subject: [PATCH] =?UTF-8?q?=F0=9F=94=84=20synced=20local=20'skyvern/'=20wi?=
 =?UTF-8?q?th=20remote=20'skyvern/'?=
MIME-Version: 1.0
Content-Type: text/plain; charset=UTF-8
Content-Transfer-Encoding: 8bit

| :rocket: | This description was created by [Ellipsis](https://www.ellipsis.dev) for commit afb421b1830123c03fc5e5c5ee8ecb0ac24826e5 |
|--------|--------|

### Summary:
Cleaned up GPT-4 routers and added `model_info` field to Azure GPT router configurations.

**Key points**:
- Removed `get_llm_router_config_for_cloud` function and related configurations from `cloud/__init__.py` and `cloud/llm/router.py`.
- Added `model_info` field to `LLMRouterModelConfig` in `skyvern/forge/sdk/api/llm/models.py`.
- Updated `get_gpt_turbo_router_config`, `get_llm_router_config_for_gpt4o`, and `get_massive_llm_router_config_for_gpt4o` functions to include `model_info` field.
- Removed `ENABLE_AZURE_GPT4V_ROUTER` setting from `cloud/config.py`.
- Added `MAX_PARALLEL_REQUESTS` to massive Azure GPT-4O configurations in `cloud/config.py`.
- Updated `scripts/run_task.py` to use `get_llm_api_handler_with_router` for `massive-gpt4o` model.

---- Generated with :heart: by [ellipsis.dev](https://www.ellipsis.dev) --- skyvern/forge/sdk/api/llm/models.py | 3 ++- 1 file changed, 2 insertions(+), 1 deletion(-) diff --git a/skyvern/forge/sdk/api/llm/models.py b/skyvern/forge/sdk/api/llm/models.py index fc8c6909c..8f2a91f66 100644 --- a/skyvern/forge/sdk/api/llm/models.py +++ b/skyvern/forge/sdk/api/llm/models.py @@ -1,4 +1,4 @@ -from dataclasses import dataclass +from dataclasses import dataclass, field from typing import Any, Awaitable, Literal, Protocol from skyvern.forge.sdk.models import Step @@ -27,6 +27,7 @@ class LLMRouterModelConfig: model_name: str # https://litellm.vercel.app/docs/routing litellm_params: dict[str, Any] + model_info: dict[str, Any] = field(default_factory=dict) tpm: int | None = None rpm: int | None = None