From ba617afdc769c9d65e804a0db9a3ee32158d9a6e Mon Sep 17 00:00:00 2001 From: cpinn <4450689+cpinn@users.noreply.github.com> Date: Wed, 20 May 2026 22:37:48 +0000 Subject: [PATCH 1/2] fix: add Bedrock models meta.llama4-scout-17b-instruct-v1:0 +3 more --- packages/proxy/schema/index.ts | 4 +++ packages/proxy/schema/model_list.json | 46 +++++++++++++++++++++++++++ 2 files changed, 50 insertions(+) diff --git a/packages/proxy/schema/index.ts b/packages/proxy/schema/index.ts index 464a3820..79133f2a 100644 --- a/packages/proxy/schema/index.ts +++ b/packages/proxy/schema/index.ts @@ -590,6 +590,10 @@ export const AvailableEndpointTypes: { [name: string]: ModelEndpointType[] } = { "grok-2-1212": ["xAI"], "grok-vision-beta": ["xAI"], "grok-beta": ["xAI"], + "meta.llama4-scout-17b-instruct-v1:0": ["bedrock"], + "us.meta.llama4-scout-17b-instruct-v1:0": ["bedrock"], + "meta.llama4-maverick-17b-instruct-v1:0": ["bedrock"], + "us.meta.llama4-maverick-17b-instruct-v1:0": ["bedrock"], "grok-4.20-0309-non-reasoning": ["xAI"], "accounts/fireworks/models/deepseek-v4-flash": ["fireworks"], "accounts/fireworks/models/glm-5": ["fireworks"], diff --git a/packages/proxy/schema/model_list.json b/packages/proxy/schema/model_list.json index 57d7b976..bf4647ec 100644 --- a/packages/proxy/schema/model_list.json +++ b/packages/proxy/schema/model_list.json @@ -11670,5 +11670,51 @@ "available_providers": [ "together" ] + }, + "meta.llama4-scout-17b-instruct-v1:0": { + "format": "converse", + "flavor": "chat", + "multimodal": true, + "displayName": "Llama 4 Scout", + "max_input_tokens": 10000000, + "max_output_tokens": 8000, + "available_providers": [ + "bedrock" + ] + }, + "meta.llama4-maverick-17b-instruct-v1:0": { + "format": "converse", + "flavor": "chat", + "multimodal": true, + "displayName": "Llama 4 Maverick", + "max_input_tokens": 1000000, + "max_output_tokens": 8000, + "available_providers": [ + "bedrock" + ] + }, + "us.meta.llama4-scout-17b-instruct-v1:0": { + "format": "converse", + "flavor": "chat", + "multimodal": true, + "displayName": "US Llama 4 Scout", + "parent": "meta.llama4-scout-17b-instruct-v1:0", + "max_input_tokens": 10000000, + "max_output_tokens": 8000, + "available_providers": [ + "bedrock" + ] + }, + "us.meta.llama4-maverick-17b-instruct-v1:0": { + "format": "converse", + "flavor": "chat", + "multimodal": true, + "displayName": "US Llama 4 Maverick", + "parent": "meta.llama4-maverick-17b-instruct-v1:0", + "max_input_tokens": 1000000, + "max_output_tokens": 8000, + "available_providers": [ + "bedrock" + ] } } From de9664c16731a90be3e6c340c8857b7e0222cc85 Mon Sep 17 00:00:00 2001 From: Erin McNulty Date: Fri, 29 May 2026 11:14:11 -0400 Subject: [PATCH 2/2] fix: expose Llama 4 Bedrock inference profiles only --- packages/proxy/schema/index.ts | 2 -- packages/proxy/schema/model_list.json | 10 ++-------- 2 files changed, 2 insertions(+), 10 deletions(-) diff --git a/packages/proxy/schema/index.ts b/packages/proxy/schema/index.ts index 79133f2a..f63f9697 100644 --- a/packages/proxy/schema/index.ts +++ b/packages/proxy/schema/index.ts @@ -590,9 +590,7 @@ export const AvailableEndpointTypes: { [name: string]: ModelEndpointType[] } = { "grok-2-1212": ["xAI"], "grok-vision-beta": ["xAI"], "grok-beta": ["xAI"], - "meta.llama4-scout-17b-instruct-v1:0": ["bedrock"], "us.meta.llama4-scout-17b-instruct-v1:0": ["bedrock"], - "meta.llama4-maverick-17b-instruct-v1:0": ["bedrock"], "us.meta.llama4-maverick-17b-instruct-v1:0": ["bedrock"], "grok-4.20-0309-non-reasoning": ["xAI"], "accounts/fireworks/models/deepseek-v4-flash": ["fireworks"], diff --git a/packages/proxy/schema/model_list.json b/packages/proxy/schema/model_list.json index bf4647ec..6f49d3c6 100644 --- a/packages/proxy/schema/model_list.json +++ b/packages/proxy/schema/model_list.json @@ -11677,10 +11677,7 @@ "multimodal": true, "displayName": "Llama 4 Scout", "max_input_tokens": 10000000, - "max_output_tokens": 8000, - "available_providers": [ - "bedrock" - ] + "max_output_tokens": 8000 }, "meta.llama4-maverick-17b-instruct-v1:0": { "format": "converse", @@ -11688,10 +11685,7 @@ "multimodal": true, "displayName": "Llama 4 Maverick", "max_input_tokens": 1000000, - "max_output_tokens": 8000, - "available_providers": [ - "bedrock" - ] + "max_output_tokens": 8000 }, "us.meta.llama4-scout-17b-instruct-v1:0": { "format": "converse",