point flash and flash lite to stable (#3816)
This commit is contained in:
@@ -395,11 +395,11 @@ class Settings(BaseSettings):
|
|||||||
if self.is_cloud_environment():
|
if self.is_cloud_environment():
|
||||||
return {
|
return {
|
||||||
"gemini-2.5-pro-preview-05-06": {"llm_key": "VERTEX_GEMINI_2.5_PRO", "label": "Gemini 2.5 Pro"},
|
"gemini-2.5-pro-preview-05-06": {"llm_key": "VERTEX_GEMINI_2.5_PRO", "label": "Gemini 2.5 Pro"},
|
||||||
"gemini-2.5-flash-preview-09-2025": {
|
"gemini-2.5-flash": {
|
||||||
"llm_key": "VERTEX_GEMINI_2.5_FLASH",
|
"llm_key": "VERTEX_GEMINI_2.5_FLASH",
|
||||||
"label": "Gemini 2.5 Flash",
|
"label": "Gemini 2.5 Flash",
|
||||||
},
|
},
|
||||||
"gemini-2.5-flash-lite-preview-09-2025": {
|
"gemini-2.5-flash-lite": {
|
||||||
"llm_key": "VERTEX_GEMINI_2.5_FLASH_LITE",
|
"llm_key": "VERTEX_GEMINI_2.5_FLASH_LITE",
|
||||||
"label": "Gemini 2.5 Flash Lite",
|
"label": "Gemini 2.5 Flash Lite",
|
||||||
},
|
},
|
||||||
@@ -431,11 +431,11 @@ class Settings(BaseSettings):
|
|||||||
# TODO: apparently the list for OSS is to be much larger
|
# TODO: apparently the list for OSS is to be much larger
|
||||||
return {
|
return {
|
||||||
"gemini-2.5-pro-preview-05-06": {"llm_key": "VERTEX_GEMINI_2.5_PRO", "label": "Gemini 2.5 Pro"},
|
"gemini-2.5-pro-preview-05-06": {"llm_key": "VERTEX_GEMINI_2.5_PRO", "label": "Gemini 2.5 Pro"},
|
||||||
"gemini-2.5-flash-preview-09-2025": {
|
"gemini-2.5-flash": {
|
||||||
"llm_key": "VERTEX_GEMINI_2.5_FLASH",
|
"llm_key": "VERTEX_GEMINI_2.5_FLASH",
|
||||||
"label": "Gemini 2.5 Flash",
|
"label": "Gemini 2.5 Flash",
|
||||||
},
|
},
|
||||||
"gemini-2.5-flash-lite-preview-09-2025": {
|
"gemini-2.5-flash-lite": {
|
||||||
"llm_key": "VERTEX_GEMINI_2.5_FLASH_LITE",
|
"llm_key": "VERTEX_GEMINI_2.5_FLASH_LITE",
|
||||||
"label": "Gemini 2.5 Flash Lite",
|
"label": "Gemini 2.5 Flash Lite",
|
||||||
},
|
},
|
||||||
|
|||||||
@@ -1190,14 +1190,14 @@ if settings.ENABLE_VERTEX_AI and settings.VERTEX_CREDENTIALS:
|
|||||||
LLMConfigRegistry.register_config(
|
LLMConfigRegistry.register_config(
|
||||||
"VERTEX_GEMINI_2.5_FLASH",
|
"VERTEX_GEMINI_2.5_FLASH",
|
||||||
LLMConfig(
|
LLMConfig(
|
||||||
"vertex_ai/gemini-2.5-flash-preview-09-2025",
|
"vertex_ai/gemini-2.5-flash",
|
||||||
["VERTEX_CREDENTIALS"],
|
["VERTEX_CREDENTIALS"],
|
||||||
supports_vision=True,
|
supports_vision=True,
|
||||||
add_assistant_prefix=False,
|
add_assistant_prefix=False,
|
||||||
max_completion_tokens=65535,
|
max_completion_tokens=65535,
|
||||||
litellm_params=LiteLLMParams(
|
litellm_params=LiteLLMParams(
|
||||||
vertex_credentials=settings.VERTEX_CREDENTIALS,
|
vertex_credentials=settings.VERTEX_CREDENTIALS,
|
||||||
api_base=f"{api_base}/gemini-2.5-flash-preview-09-2025" if api_base else None,
|
api_base=f"{api_base}/gemini-2.5-flash" if api_base else None,
|
||||||
vertex_location=settings.VERTEX_LOCATION,
|
vertex_location=settings.VERTEX_LOCATION,
|
||||||
thinking={
|
thinking={
|
||||||
"budget_tokens": settings.GEMINI_THINKING_BUDGET,
|
"budget_tokens": settings.GEMINI_THINKING_BUDGET,
|
||||||
@@ -1209,14 +1209,14 @@ if settings.ENABLE_VERTEX_AI and settings.VERTEX_CREDENTIALS:
|
|||||||
LLMConfigRegistry.register_config(
|
LLMConfigRegistry.register_config(
|
||||||
"VERTEX_GEMINI_2.5_FLASH_LITE",
|
"VERTEX_GEMINI_2.5_FLASH_LITE",
|
||||||
LLMConfig(
|
LLMConfig(
|
||||||
"vertex_ai/gemini-2.5-flash-lite-preview-09-2025",
|
"vertex_ai/gemini-2.5-flash-lite",
|
||||||
["VERTEX_CREDENTIALS"],
|
["VERTEX_CREDENTIALS"],
|
||||||
supports_vision=True,
|
supports_vision=True,
|
||||||
add_assistant_prefix=False,
|
add_assistant_prefix=False,
|
||||||
max_completion_tokens=65535,
|
max_completion_tokens=65535,
|
||||||
litellm_params=LiteLLMParams(
|
litellm_params=LiteLLMParams(
|
||||||
vertex_credentials=settings.VERTEX_CREDENTIALS,
|
vertex_credentials=settings.VERTEX_CREDENTIALS,
|
||||||
api_base=f"{api_base}/gemini-2.5-flash-lite-preview-09-2025" if api_base else None,
|
api_base=f"{api_base}/gemini-2.5-flash-lite" if api_base else None,
|
||||||
vertex_location=settings.VERTEX_LOCATION,
|
vertex_location=settings.VERTEX_LOCATION,
|
||||||
thinking={
|
thinking={
|
||||||
"budget_tokens": settings.GEMINI_THINKING_BUDGET,
|
"budget_tokens": settings.GEMINI_THINKING_BUDGET,
|
||||||
|
|||||||
Reference in New Issue
Block a user