Add cross-region inference profiles for Llama 3.2 models. (#75)
This commit is contained in:
@@ -175,6 +175,10 @@ Currently, Bedrock Access Gateway only supports cross-region Inference for the f
|
||||
- Claude 3.5 Sonnet
|
||||
- Meta Llama 3.1 8B Instruct
|
||||
- Meta Llama 3.1 70B Instruct
|
||||
- Meta Llama 3.2 1B Instruct
|
||||
- Meta Llama 3.2 3B Instruct
|
||||
- Meta Llama 3.2 11B Vision Instruct
|
||||
- Meta Llama 3.2 90B Vision Instruct
|
||||
|
||||
**Prerequisites:**
|
||||
- IAM policies must allow cross-region access. Callers need permissions to access the models and inference profiles in both regions (already added in the CloudFormation template).
|
||||
|
||||
@@ -177,6 +177,10 @@ Cross-Region Inference 支持跨区域访问的基础模型,即允许用户在
|
||||
- Claude 3.5 Sonnet
|
||||
- Meta Llama 3.1 8B Instruct
|
||||
- Meta Llama 3.1 70B Instruct
|
||||
- Meta Llama 3.2 1B Instruct
|
||||
- Meta Llama 3.2 3B Instruct
|
||||
- Meta Llama 3.2 11B Vision Instruct
|
||||
- Meta Llama 3.2 90B Vision Instruct
|
||||
|
||||
**使用前提:**
|
||||
- IAM Policy 有 inference profiles 相关的权限和调用模型的权限 (cloudformation template 中已添加)
|
||||
|
||||
@@ -143,34 +143,62 @@ class BedrockModel(BaseChatModel):
|
||||
"us.meta.llama3-1-8b-instruct-v1:0": {
|
||||
"system": True,
|
||||
"multimodal": False,
|
||||
"tool_call": False,
|
||||
"tool_call": True,
|
||||
"stream_tool_call": False,
|
||||
},
|
||||
"meta.llama3-1-8b-instruct-v1:0": {
|
||||
"system": True,
|
||||
"multimodal": False,
|
||||
"tool_call": False,
|
||||
"tool_call": True,
|
||||
"stream_tool_call": False,
|
||||
},
|
||||
# Llama 3.1 70b cross-region inference profile
|
||||
"us.meta.llama3-1-70b-instruct-v1:0": {
|
||||
"system": True,
|
||||
"multimodal": False,
|
||||
"tool_call": False,
|
||||
"tool_call": True,
|
||||
"stream_tool_call": False,
|
||||
},
|
||||
"meta.llama3-1-70b-instruct-v1:0": {
|
||||
"system": True,
|
||||
"multimodal": False,
|
||||
"tool_call": False,
|
||||
"tool_call": True,
|
||||
"stream_tool_call": False,
|
||||
},
|
||||
"meta.llama3-1-405b-instruct-v1:0": {
|
||||
"system": True,
|
||||
"multimodal": False,
|
||||
"tool_call": True,
|
||||
"stream_tool_call": False,
|
||||
},
|
||||
# Llama 3.2 1B cross-region inference profile
|
||||
"us.meta.llama3-2-1b-instruct-v1:0": {
|
||||
"system": True,
|
||||
"multimodal": False,
|
||||
"tool_call": False,
|
||||
"stream_tool_call": False,
|
||||
},
|
||||
# Llama 3.2 3B cross-region inference profile
|
||||
"us.meta.llama3-2-3b-instruct-v1:0": {
|
||||
"system": True,
|
||||
"multimodal": False,
|
||||
"tool_call": False,
|
||||
"stream_tool_call": False,
|
||||
},
|
||||
# Llama 3.2 11B cross-region inference profile
|
||||
"us.meta.llama3-2-11b-instruct-v1:0": {
|
||||
"system": True,
|
||||
"multimodal": True,
|
||||
"tool_call": True,
|
||||
"stream_tool_call": False,
|
||||
},
|
||||
# Llama 3.2 90B cross-region inference profile
|
||||
"us.meta.llama3-2-90b-instruct-v1:0": {
|
||||
"system": True,
|
||||
"multimodal": True,
|
||||
"tool_call": True,
|
||||
"stream_tool_call": False,
|
||||
},
|
||||
"mistral.mistral-7b-instruct-v0:2": {
|
||||
"system": False,
|
||||
"multimodal": False,
|
||||
|
||||
Reference in New Issue
Block a user