From f825d671057ce7c67ab62444c1f0aa301459fb5f Mon Sep 17 00:00:00 2001 From: Ken Jiang Date: Wed, 20 May 2026 14:05:26 -0400 Subject: [PATCH 1/2] add gemini 3.1-flash-lite for vertex --- packages/proxy/schema/model_list.json | 16 ++++++++++++++++ 1 file changed, 16 insertions(+) diff --git a/packages/proxy/schema/model_list.json b/packages/proxy/schema/model_list.json index 361c6d9f..eb1ee7ea 100644 --- a/packages/proxy/schema/model_list.json +++ b/packages/proxy/schema/model_list.json @@ -8543,6 +8543,22 @@ "max_input_tokens": 1048576, "max_output_tokens": 65535 }, + "publishers/google/models/gemini-3.1-flash-lite": { + "format": "google", + "flavor": "chat", + "multimodal": true, + "input_cost_per_mil_tokens": 0.25, + "output_cost_per_mil_tokens": 1.5, + "input_cache_read_cost_per_mil_tokens": 0.025, + "displayName": "Gemini 3.1 Flash-Lite", + "reasoning": true, + "reasoning_budget": true, + "locations": [ + "global" + ], + "max_input_tokens": 1048576, + "max_output_tokens": 65536 + }, "publishers/google/models/gemini-3-pro-preview": { "format": "google", "flavor": "chat", From e966ee8f37976820447833523c2059f5b936f573 Mon Sep 17 00:00:00 2001 From: Ken Jiang Date: Wed, 20 May 2026 14:30:50 -0400 Subject: [PATCH 2/2] fixxx --- packages/proxy/schema/index.ts | 5 +++-- packages/proxy/schema/model_list.json | 16 ++++++++++++++++ 2 files changed, 19 insertions(+), 2 deletions(-) diff --git a/packages/proxy/schema/index.ts b/packages/proxy/schema/index.ts index bea254a5..464a3820 100644 --- a/packages/proxy/schema/index.ts +++ b/packages/proxy/schema/index.ts @@ -598,9 +598,8 @@ export const AvailableEndpointTypes: { [name: string]: ModelEndpointType[] } = { "mistral-medium-3": ["mistral"], "mistral-medium-3-5-26-04": ["mistral"], "gemini-3.5-flash": ["google", "vertex"], - "publishers/google/models/gemini-3.5-flash": ["google"], "deepseek.v3.2": ["bedrock"], - "gemini-3.1-flash-lite": ["google"], + "gemini-3.1-flash-lite": ["google", "vertex"], "amazon.nova-premier-v1:0": ["bedrock"], "amazon.nova-2-lite-v1:0": ["bedrock"], "magistral-medium-2509": ["mistral"], @@ -881,8 +880,10 @@ export const AvailableEndpointTypes: { [name: string]: ModelEndpointType[] } = { "gemini-3.1-flash-lite-preview": ["google"], "gemini-3-pro-image-preview": ["google"], "gemini-3-flash-preview": ["google"], + "publishers/google/models/gemini-3.5-flash": ["vertex"], "publishers/google/models/gemini-3.1-pro-preview": ["vertex"], "publishers/google/models/gemini-3.1-pro-preview-customtools": ["vertex"], + "publishers/google/models/gemini-3.1-flash-lite": ["vertex"], "publishers/google/models/gemini-3.1-flash-lite-preview": ["vertex"], "publishers/google/models/gemini-3-pro-preview": ["vertex"], "publishers/google/models/gemini-3-flash-preview": ["vertex"], diff --git a/packages/proxy/schema/model_list.json b/packages/proxy/schema/model_list.json index eb1ee7ea..57d7b976 100644 --- a/packages/proxy/schema/model_list.json +++ b/packages/proxy/schema/model_list.json @@ -8575,6 +8575,22 @@ "max_input_tokens": 1048576, "max_output_tokens": 65535 }, + "publishers/google/models/gemini-3.5-flash": { + "format": "google", + "flavor": "chat", + "multimodal": true, + "input_cost_per_mil_tokens": 1.5, + "output_cost_per_mil_tokens": 9, + "input_cache_read_cost_per_mil_tokens": 0.15, + "displayName": "Gemini 3.5 Flash", + "reasoning": true, + "reasoning_budget": true, + "locations": [ + "global" + ], + "max_input_tokens": 1048576, + "max_output_tokens": 65535 + }, "publishers/google/models/gemini-3-flash-preview": { "format": "google", "flavor": "chat",