Add cross-region inference profiles for Llama 3.2 models. (#75)

This commit is contained in:
mschfh
2024-12-05 04:22:11 +01:00
committed by GitHub
parent 6849ca828a
commit 17503b032a
3 changed files with 40 additions and 4 deletions

View File

@@ -175,6 +175,10 @@ Currently, Bedrock Access Gateway only supports cross-region Inference for the f
- Claude 3.5 Sonnet
- Meta Llama 3.1 8B Instruct
- Meta Llama 3.1 70B Instruct
- Meta Llama 3.2 1B Instruct
- Meta Llama 3.2 3B Instruct
- Meta Llama 3.2 11B Vision Instruct
- Meta Llama 3.2 90B Vision Instruct
**Prerequisites:**
- IAM policies must allow cross-region access: callers need permissions to access models and inference profiles in both regions (added in the CloudFormation template)

View File

@@ -177,6 +177,10 @@ Cross-Region Inference 支持跨区域访问的基础模型,即允许用户在
- Claude 3.5 Sonnet
- Meta Llama 3.1 8B Instruct
- Meta Llama 3.1 70B Instruct
- Meta Llama 3.2 1B Instruct
- Meta Llama 3.2 3B Instruct
- Meta Llama 3.2 11B Vision Instruct
- Meta Llama 3.2 90B Vision Instruct
**使用前提:**
- IAM Policy 有 inference profiles 相关的权限和调用模型的权限 (cloudformation template 中已添加)

View File

@@ -143,34 +143,62 @@ class BedrockModel(BaseChatModel):
"us.meta.llama3-1-8b-instruct-v1:0": {
"system": True,
"multimodal": False,
"tool_call": False,
"tool_call": True,
"stream_tool_call": False,
},
"meta.llama3-1-8b-instruct-v1:0": {
"system": True,
"multimodal": False,
"tool_call": False,
"tool_call": True,
"stream_tool_call": False,
},
# Llama 3.1 70b cross-region inference profile
"us.meta.llama3-1-70b-instruct-v1:0": {
"system": True,
"multimodal": False,
"tool_call": False,
"tool_call": True,
"stream_tool_call": False,
},
"meta.llama3-1-70b-instruct-v1:0": {
"system": True,
"multimodal": False,
"tool_call": False,
"tool_call": True,
"stream_tool_call": False,
},
"meta.llama3-1-405b-instruct-v1:0": {
"system": True,
"multimodal": False,
"tool_call": True,
"stream_tool_call": False,
},
# Llama 3.2 1B cross-region inference profile
"us.meta.llama3-2-1b-instruct-v1:0": {
"system": True,
"multimodal": False,
"tool_call": False,
"stream_tool_call": False,
},
# Llama 3.2 3B cross-region inference profile
"us.meta.llama3-2-3b-instruct-v1:0": {
"system": True,
"multimodal": False,
"tool_call": False,
"stream_tool_call": False,
},
# Llama 3.2 11B cross-region inference profile
"us.meta.llama3-2-11b-instruct-v1:0": {
"system": True,
"multimodal": True,
"tool_call": True,
"stream_tool_call": False,
},
# Llama 3.2 90B cross-region inference profile
"us.meta.llama3-2-90b-instruct-v1:0": {
"system": True,
"multimodal": True,
"tool_call": True,
"stream_tool_call": False,
},
"mistral.mistral-7b-instruct-v0:2": {
"system": False,
"multimodal": False,