diff --git a/README.md b/README.md index 492025f..c24c3d5 100644 --- a/README.md +++ b/README.md @@ -175,6 +175,10 @@ Currently, Bedrock Access Gateway only supports cross-region Inference for the f - Claude 3.5 Sonnet - Meta Llama 3.1 8b Instruct - Meta Llama 3.1 70b Instruct +- Meta Llama 3.2 1B Instruct +- Meta Llama 3.2 3B Instruct +- Meta Llama 3.2 11B Vision Instruct +- Meta Llama 3.2 90B Vision Instruct **Prerequisites:** - IAM policies must allow cross-region access,Callers need permissions to access models and inference profiles in both regions (added in cloudformation template) diff --git a/README_CN.md b/README_CN.md index 61f27a6..b5ef7a1 100644 --- a/README_CN.md +++ b/README_CN.md @@ -177,6 +177,10 @@ Cross-Region Inference 支持跨区域访问的基础模型,即允许用户在 - Claude 3.5 Sonnet - Meta Llama 3.1 8b Instruct - Meta Llama 3.1 70b Instruct +- Meta Llama 3.2 1B Instruct +- Meta Llama 3.2 3B Instruct +- Meta Llama 3.2 11B Vision Instruct +- Meta Llama 3.2 90B Vision Instruct **使用前提:** - IAM Policy 有 inference profiles 相关的权限和调用模型的权限 (cloudformation template 中已添加) diff --git a/src/api/models/bedrock.py b/src/api/models/bedrock.py index 48e9c59..0782324 100644 --- a/src/api/models/bedrock.py +++ b/src/api/models/bedrock.py @@ -143,34 +143,62 @@ class BedrockModel(BaseChatModel): "us.meta.llama3-1-8b-instruct-v1:0": { "system": True, "multimodal": False, - "tool_call": False, + "tool_call": True, "stream_tool_call": False, }, "meta.llama3-1-8b-instruct-v1:0": { "system": True, "multimodal": False, - "tool_call": False, + "tool_call": True, "stream_tool_call": False, }, # Llama 3.1 70b cross-region inference profile "us.meta.llama3-1-70b-instruct-v1:0": { "system": True, "multimodal": False, - "tool_call": False, + "tool_call": True, "stream_tool_call": False, }, "meta.llama3-1-70b-instruct-v1:0": { "system": True, "multimodal": False, - "tool_call": False, + "tool_call": True, "stream_tool_call": False, }, "meta.llama3-1-405b-instruct-v1:0": { + "system": True, + "multimodal": False, + "tool_call": True, + "stream_tool_call": False, + }, + # Llama 3.2 1B cross-region inference profile + "us.meta.llama3-2-1b-instruct-v1:0": { "system": True, "multimodal": False, "tool_call": False, "stream_tool_call": False, }, + # Llama 3.2 3B cross-region inference profile + "us.meta.llama3-2-3b-instruct-v1:0": { + "system": True, + "multimodal": False, + "tool_call": False, + "stream_tool_call": False, + }, + # Llama 3.2 11B cross-region inference profile + "us.meta.llama3-2-11b-instruct-v1:0": { + "system": True, + "multimodal": True, + "tool_call": True, + "stream_tool_call": False, + }, + # Llama 3.2 90B cross-region inference profile + "us.meta.llama3-2-90b-instruct-v1:0": { + "system": True, + "multimodal": True, + "tool_call": True, + "stream_tool_call": False, + }, "mistral.mistral-7b-instruct-v0:2": { "system": False, "multimodal": False,