diff --git a/.flake8 b/.flake8 new file mode 100644 index 0000000..364a711 --- /dev/null +++ b/.flake8 @@ -0,0 +1,19 @@ +[flake8] +max-line-length = 120 +ignore = + E203,W191,W503 +exclude = + build + .git + __pycache__ + .tox + venv + .venv + .venv-test + tmp* + deployment + cdk.out + node_modules + +max-complexity = 10 +require-code = True \ No newline at end of file diff --git a/.gitignore b/.gitignore new file mode 100644 index 0000000..d8b355e --- /dev/null +++ b/.gitignore @@ -0,0 +1,162 @@ +# Byte-compiled / optimized / DLL files +__pycache__/ +*.py[cod] +*$py.class + +# C extensions +*.so + +# Distribution / packaging +.Python +build/ +develop-eggs/ +dist/ +downloads/ +eggs/ +.eggs/ +lib/ +lib64/ +parts/ +sdist/ +var/ +wheels/ +share/python-wheels/ +*.egg-info/ +.installed.cfg +*.egg +MANIFEST + +# PyInstaller +# Usually these files are written by a python script from a template +# before PyInstaller builds the exe, so as to inject date/other infos into it. +*.manifest +*.spec + +# Installer logs +pip-log.txt +pip-delete-this-directory.txt + +# Unit test / coverage reports +htmlcov/ +.tox/ +.nox/ +.coverage +.coverage.* +.cache +nosetests.xml +coverage.xml +*.cover +*.py,cover +.hypothesis/ +.pytest_cache/ +cover/ + +# Translations +*.mo +*.pot + +# Django stuff: +*.log +local_settings.py +db.sqlite3 +db.sqlite3-journal + +# Flask stuff: +instance/ +.webassets-cache + +# Scrapy stuff: +.scrapy + +# Sphinx documentation +docs/_build/ + +# PyBuilder +.pybuilder/ +target/ + +# Jupyter Notebook +.ipynb_checkpoints + +# IPython +profile_default/ +ipython_config.py + +# pyenv +# For a library or package, you might want to ignore these files since the code is +# intended to run in multiple environments; otherwise, check them in: +# .python-version + +# pipenv +# According to pypa/pipenv#598, it is recommended to include Pipfile.lock in version control. +# However, in case of collaboration, if having platform-specific dependencies or dependencies +# having no cross-platform support, pipenv may install dependencies that don't work, or not +# install all needed dependencies. +#Pipfile.lock + +# poetry +# Similar to Pipfile.lock, it is generally recommended to include poetry.lock in version control. +# This is especially recommended for binary packages to ensure reproducibility, and is more +# commonly ignored for libraries. +# https://python-poetry.org/docs/basic-usage/#commit-your-poetrylock-file-to-version-control +#poetry.lock + +# pdm +# Similar to Pipfile.lock, it is generally recommended to include pdm.lock in version control. +#pdm.lock +# pdm stores project-wide configurations in .pdm.toml, but it is recommended to not include it +# in version control. +# https://pdm.fming.dev/#use-with-ide +.pdm.toml + +# PEP 582; used by e.g. 
github.com/David-OConnor/pyflow and github.com/pdm-project/pdm
+__pypackages__/
+
+# Celery stuff
+celerybeat-schedule
+celerybeat.pid
+
+# SageMath parsed files
+*.sage.py
+
+# Environments
+.env
+.venv
+env/
+venv/
+ENV/
+env.bak/
+venv.bak/
+
+# Spyder project settings
+.spyderproject
+.spyproject
+
+# Rope project settings
+.ropeproject
+
+# mkdocs documentation
+/site
+
+# mypy
+.mypy_cache/
+.dmypy.json
+dmypy.json
+
+# Pyre type checker
+.pyre/
+
+# pytype static type analyzer
+.pytype/
+
+# Cython debug symbols
+cython_debug/
+
+# PyCharm
+# JetBrains specific template is maintained in a separate JetBrains.gitignore that can
+# be found at https://github.com/github/gitignore/blob/main/Global/JetBrains.gitignore
+# and can be added to the global gitignore or merged into this file. For a more nuclear
+# option (not recommended) you can uncomment the following to ignore the entire idea folder.
+.idea/
+
+Config
\ No newline at end of file
diff --git a/README.md b/README.md
index 7f92204..22163db 100644
--- a/README.md
+++ b/README.md
@@ -1,11 +1,245 @@
-## My Project
+[中文](./README_CN.md)
-TODO: Fill this README out!
+# Bedrock Access Gateway
-Be sure to:
+OpenAI-Compatible RESTful APIs for Amazon Bedrock
-* Change the title in this README
-* Edit your repository description on GitHub
+## Overview
+
+Amazon Bedrock offers a wide range of foundation models (such as Claude 3 Sonnet/Haiku, Llama 2, Mistral/Mixtral, etc.)
+and a broad set of capabilities for you to build generative AI applications.
+Check [Amazon Bedrock](https://aws.amazon.com/bedrock) for more details.
+
+Sometimes, you might have applications developed using OpenAI APIs or SDKs, and you want to experiment with Amazon
+Bedrock without modifying your codebase. Or you may simply wish to evaluate the capabilities of these foundation models
+in tools like AutoGen. Well, this repository allows you to access Amazon Bedrock models seamlessly through OpenAI
+APIs and SDKs, enabling you to test these models without code changes.
+
+If you find this GitHub repository useful, please consider giving it a free star to show your appreciation and support
+for the project.
+
+Features:
+
+- [x] Support streaming response via server-sent events (SSE)
+- [x] Support Model APIs
+- [x] Support Chat Completion APIs
+- [ ] Support Function Call/Tool Call
+- [ ] Support Embedding APIs
+- [ ] Support Image APIs
+
+> NOTE: 1. The legacy [text completion](https://platform.openai.com/docs/api-reference/completions) API is not
+> supported; you should move to the Chat Completion API. 2. Other APIs, such as fine-tuning and the Assistants API,
+> may be supported in the future.
+
+Supported Amazon Bedrock models (Model IDs):
+
+- anthropic.claude-instant-v1
+- anthropic.claude-v2:1
+- anthropic.claude-v2
+- anthropic.claude-3-sonnet-20240229-v1:0
+- anthropic.claude-3-haiku-20240307-v1:0
+- meta.llama2-13b-chat-v1
+- meta.llama2-70b-chat-v1
+- mistral.mistral-7b-instruct-v0:2
+- mistral.mixtral-8x7b-instruct-v0:1
+
+> Note: The default model is set to `anthropic.claude-3-sonnet-20240229-v1:0`. You can change it via Lambda environment
+> variables.
+
+## Get Started
+
+### Prerequisites
+
+Please make sure you have met the prerequisites below:
+
+- Access to Amazon Bedrock foundation models.
+
+If you don't have model access yet, please follow
+the [Set Up](https://docs.aws.amazon.com/bedrock/latest/userguide/model-access.html) guide.
+
+### Architecture
+
+The following diagram illustrates the solution architecture. Note that it also includes a new **VPC** with two public
+subnets only for the Application Load Balancer (ALB).
+
+![Architecture](assets/arch.svg)
+
+### Deployment
+
+Please follow the steps below to deploy the Bedrock Proxy APIs into your AWS account. Only regions where Amazon
+Bedrock is available (such as us-west-2) are supported. The deployment will take approximately 3-5 minutes.
+
+**Step 1: Create your own custom API key (Optional)**
+
+> NOTE: In this step, you use any string (without spaces) you like to create a custom API Key (credential) that will be
+> used to access the proxy API later. This key does not have to match your actual OpenAI key, and you don't even need to
+> have an OpenAI API key. It is recommended that you take this step and ensure that you keep the key safe and private.
+
+1. Open the AWS Management Console and navigate to the Systems Manager service.
+2. In the left-hand navigation pane, click on "Parameter Store".
+3. Click on the "Create parameter" button.
+4. In the "Create parameter" window, select the following options:
+   - Name: Enter a descriptive name for your parameter (e.g., "BedrockProxyAPIKey").
+   - Description: Optionally, provide a description for the parameter.
+   - Tier: Select **Standard**.
+   - Type: Select **SecureString**.
+   - Value: Any string (without spaces).
+5. Click "Create parameter".
+6. Make a note of the parameter name you used (e.g., "BedrockProxyAPIKey"). You'll need this in the next step.
+
+**Step 2: Deploy the CloudFormation stack**
+
+1. Sign in to the AWS Management Console and switch to the region in which you want to deploy the CloudFormation stack.
+2. Click the following button to launch the CloudFormation stack in that region.
+
+   [![Launch Stack](assets/launch-stack.png)](https://console.aws.amazon.com/cloudformation/home#/stacks/create/template?stackName=BedrockProxyAPI&templateURL=https://aws-gcr-solutions.s3.amazonaws.com/bedrock-proxy-api/latest/BedrockProxy.template)
+
+3. Click "Next".
+4. On the "Specify stack details" page, provide the following information:
+   - Stack name: Change the stack name if needed.
+   - ApiKeyParam (if you set up an API key in Step 1): Enter the parameter name you used for storing the API key
+     (e.g., "BedrockProxyAPIKey"). If you did not set up an API key, leave this field blank.
+   Click "Next".
+5. On the "Configure stack options" page, you can leave the default settings or customize them according to your needs.
+6. Click "Next".
+7. On the "Review" page, review the details of the stack you're about to create. Check the "I acknowledge that AWS
+   CloudFormation might create IAM resources" checkbox at the bottom.
+8. Click "Create stack".
+
+That's it! Once deployed, open the CloudFormation stack, go to the **Outputs** tab, and find the API Base URL in
+`APIBaseUrl`; the value should look like `http://xxxx.xxx.elb.amazonaws.com/api/v1`.
+
+### SDK/API Usage
+
+All you need are the API Key and the API Base URL. If you didn't
+set up your own key, then the default API Key `bedrock` will be used.
+
+Now, you can try out the proxy APIs. Let's say you want to test the Claude 3 Sonnet model, then
+use `anthropic.claude-3-sonnet-20240229-v1:0` as the Model ID.
+
+- **Example API Usage**
+
+```bash
+curl https://<API base url>/chat/completions \
+  -H "Content-Type: application/json" \
+  -H "Authorization: Bearer <API key>" \
+  -d '{
+    "model": "anthropic.claude-3-sonnet-20240229-v1:0",
+    "messages": [
+      {
+        "role": "user",
+        "content": "Hello!"
+      }
+    ]
+  }'
+```
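+
+The response follows the OpenAI chat completion response schema. An illustrative example (field values such as
+`id`, `created`, and the token counts below are placeholders, not real output):
+
+```json
+{
+  "id": "chatcmpl-0123abcd",
+  "created": 1711000000,
+  "model": "anthropic.claude-3-sonnet-20240229-v1:0",
+  "system_fingerprint": "fp_e97c09dd4e26",
+  "object": "chat.completion",
+  "choices": [
+    {
+      "index": 0,
+      "message": {"role": "assistant", "content": "Hello! How can I help you today?"},
+      "finish_reason": "stop",
+      "logprobs": null
+    }
+  ],
+  "usage": {"prompt_tokens": 10, "completion_tokens": 9, "total_tokens": 19}
+}
+```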
+
+- **Example SDK Usage**
+
+```bash
+export OPENAI_API_KEY=<API key>
+export OPENAI_API_BASE=<API base url>
+```
+
+```python
+from openai import OpenAI
+
+client = OpenAI()
+completion = client.chat.completions.create(
+    model="anthropic.claude-3-sonnet-20240229-v1:0",
+    messages=[{"role": "user", "content": "Hello!"}],
+)
+
+print(completion.choices[0].message.content)
+```
+
+## Other Examples
+
+### AutoGen
+
+Below is an image of setting up the model in AutoGen studio.
+
+![AutoGen Model](assets/autogen-model.png)
+
+### LangChain
+
+Make sure you use `ChatOpenAI(...)` instead of `OpenAI(...)`.
+
+```python
+# pip install langchain-openai
+from langchain.chains import LLMChain
+from langchain.prompts import PromptTemplate
+from langchain_openai import ChatOpenAI
+
+chat = ChatOpenAI(
+    model="anthropic.claude-3-sonnet-20240229-v1:0",
+    temperature=0,
+    openai_api_key="xxxx",
+    openai_api_base="http://xxx.elb.amazonaws.com/api/v1",
+)
+
+template = """Question: {question}
+
+Answer: Let's think step by step."""
+
+prompt = PromptTemplate.from_template(template)
+llm_chain = LLMChain(prompt=prompt, llm=chat)
+
+question = "What NFL team won the Super Bowl in the year Justin Bieber was born?"
+response = llm_chain.invoke(question)
+print(response)
+```
+
+## FAQs
+
+### About Privacy
+
+This application does not collect any of your data. Furthermore, it does not log any requests or responses by default.
+
+### Why not use API Gateway instead of an Application Load Balancer?
+
+The short answer is that API Gateway does not support server-sent events (SSE), which are required for streaming responses.
+
+### Which regions are supported?
+
+This solution only supports the regions where Amazon Bedrock is available, currently:
+
+- US East (N. Virginia)
+- US West (Oregon)
+- Asia Pacific (Singapore)
+- Asia Pacific (Tokyo)
+- Europe (Frankfurt)
+
+Note that not all models are available in those regions.
+
+### Can I build and use my own ECR image?
+
+Yes, you can clone the repo and build the container image yourself (`src/Dockerfile`) and then push it to your ECR repo.
+
+Replace the repo URL in the CloudFormation template before you deploy.
+
+### Can I run this locally?
+
+Yes, you can run this locally (see the sketch at the end of this section); the API base URL will then look
+like `http://localhost:8000/api/v1`.
+
+### Any performance sacrifice or latency increase by using the proxy APIs?
+
+This has not been benchmarked yet; you should use this solution for PoC purposes only.
+
+### Any plan to support SageMaker models?
+
+Currently, there is no plan to support SageMaker models. This may change if there is customer demand.
+
+### Any plan to support Bedrock custom models?
+
+Fine-tuned models and models with Provisioned Throughput are not supported. You can clone the repo and make the
+customizations if needed.
+
+### How to upgrade?
+
+If there are no changes to the architecture, you can simply deploy the latest image to your Lambda function to pick up
+new features manually, without redeploying the whole CloudFormation stack, for example:
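+
+A minimal sketch with the AWS CLI (the function name is a placeholder — copy the real one from the CloudFormation
+stack's resources; the image URI shown assumes a us-west-2 deployment and is taken from the region mapping in the
+template):
+
+```bash
+aws lambda update-function-code \
+  --function-name <your BedrockProxy Lambda function name> \
+  --image-uri 366590864501.dkr.ecr.us-west-2.amazonaws.com/bedrock-proxy-api:latest
+aws lambda wait function-updated --function-name <your BedrockProxy Lambda function name>
+```
+
+And to run the solution locally (as mentioned in the FAQ above), a minimal sketch, assuming Python 3.12, AWS
+credentials with Bedrock access in your environment, and `boto3` installed alongside `src/requirements.txt`:
+
+```bash
+cd src
+pip install -r requirements.txt boto3
+export AWS_REGION=us-west-2  # a region where you have Bedrock model access
+uvicorn api.app:app --host 0.0.0.0 --port 8000
+```
+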
## Security
diff --git a/README_CN.md b/README_CN.md
new file mode 100644
index 0000000..3d36451
--- /dev/null
+++ b/README_CN.md
@@ -0,0 +1,236 @@
+[English](./README.md)
+
+# Bedrock Access Gateway
+
+使用兼容OpenAI的API访问Amazon Bedrock
+
+## 概述
+
+Amazon Bedrock提供了广泛的基础模型(如Claude 3 Sonnet/Haiku、Llama 2、Mistral/Mixtral等),
+以及构建生成式AI应用程序的多种功能。更多详细信息,请查看[Amazon Bedrock](https://aws.amazon.com/bedrock)。
+
+有时,您可能已经使用OpenAI的API或SDK构建了应用程序,并希望在不修改代码的情况下试用Amazon
+Bedrock的模型。或者,您可能只是希望在AutoGen等工具中评估这些基础模型的功能。好消息是,这里提供了一种方便的途径,让您可以使用
+OpenAI 的 API 或 SDK 无缝集成并试用 Amazon Bedrock 的模型,而无需对现有代码进行修改。
+
+如果您觉得这个项目有用,请考虑给它点一个免费的小星星。
+
+功能列表:
+
+- [x] 支持 server-sent events (SSE) 的流式响应
+- [x] 支持 Model APIs
+- [x] 支持 Chat Completion APIs
+- [ ] 支持 Function Call/Tool Call
+- [ ] 支持 Embedding APIs
+- [ ] 支持 Image APIs
+
+> 注意:1. 不支持旧的 [text completion](https://platform.openai.com/docs/api-reference/completions) API,请更改为使用Chat
+> Completion API。2. 未来可能支持其他API,如Fine-tune、Assistants API等。
+
+支持的Amazon Bedrock模型列表(Model IDs):
+
+- anthropic.claude-instant-v1
+- anthropic.claude-v2:1
+- anthropic.claude-v2
+- anthropic.claude-3-sonnet-20240229-v1:0
+- anthropic.claude-3-haiku-20240307-v1:0
+- meta.llama2-13b-chat-v1
+- meta.llama2-70b-chat-v1
+- mistral.mistral-7b-instruct-v0:2
+- mistral.mixtral-8x7b-instruct-v0:1
+
+> 注意:默认模型为 `anthropic.claude-3-sonnet-20240229-v1:0`,可以通过Lambda环境变量进行更改。
+
+## 使用指南
+
+### 前提条件
+
+请确保您已满足以下先决条件:
+
+- 可以访问Amazon Bedrock基础模型。
+
+如果您还没有获得模型访问权限,请参考[配置](https://docs.aws.amazon.com/bedrock/latest/userguide/model-access.html)指南。
+
+### 架构图
+
+下图展示了本方案的架构。请注意,它还包括一个新的**VPC**,其中只有两个公共子网,用于应用程序负载均衡器(ALB)。
+
+![Architecture](assets/arch.svg)
+
+### 部署
+
+请按以下步骤将Bedrock代理API部署到您的AWS账户中。仅支持Amazon Bedrock可用的区域(如us-west-2)。
+
+**第一步: 自定义您的API Key(可选)**
+
+> 注意:这一步是使用任意字符串(不带空格)创建一个自定义的API Key(凭证),将用于后续访问代理API。此API Key不必与您实际的OpenAI
+> Key一致,您甚至无需拥有OpenAI API Key。建议您执行此步操作,并确保妥善保管好此API Key。
+
+1. 打开AWS管理控制台,导航到Systems Manager服务。
+2. 在左侧导航窗格中,单击"参数存储"。
+3. 单击"创建参数"按钮。
+4. 在"创建参数"窗口中,选择以下选项:
+   - 名称:输入参数的描述性名称(例如"BedrockProxyAPIKey")。
+   - 描述:可选,为参数提供描述。
+   - 层级:选择**标准**。
+   - 类型:选择**SecureString**。
+   - 值:任意字符串(不带空格)。
+5. 单击"创建参数"。
+6. 记录您使用的参数名称(例如"BedrockProxyAPIKey")。您将在下一步中需要它。
+
+**第二步: 部署CloudFormation堆栈**
+
+1. 登录AWS管理控制台,切换到要部署CloudFormation堆栈的区域。
+2. 单击以下按钮在该区域启动CloudFormation堆栈。
+
+   [![Launch Stack](assets/launch-stack.png)](https://console.aws.amazon.com/cloudformation/home#/stacks/create/template?stackName=BedrockProxyAPI&templateURL=https://aws-gcr-solutions.s3.amazonaws.com/bedrock-proxy-api/latest/BedrockProxy.template)
+
+3. 单击"下一步"。
+4. 在"指定堆栈详细信息"页面,提供以下信息:
+   - 堆栈名称:可以根据需要更改名称。
+   - ApiKeyParam(如果在第一步中设置了API Key):输入您用于存储API Key的参数名称(例如"BedrockProxyAPIKey")。
+     如果您没有设置API Key,请将此字段留空。
+   单击"下一步"。
+5. 在"配置堆栈选项"页面,您可以保留默认设置或根据需要进行自定义。
+6. 单击"下一步"。
+7. 在"审核"页面,查看您即将创建的堆栈详细信息。勾选底部的"我确认,AWS CloudFormation 可能创建 IAM 资源。"复选框。
+8. 单击"创建堆栈"。
+
+仅此而已!部署完成后,点击CloudFormation堆栈,进入"输出"选项卡,你可以从`APIBaseUrl`
+中找到API Base URL,它应该类似于`http://xxxx.xxx.elb.amazonaws.com/api/v1`这样的格式。
+
+### SDK/API使用
+
+你只需要API Key和API Base URL。如果你没有设置自己的密钥,那么默认将使用API Key `bedrock`。
+
+现在,你可以尝试使用代理API了。假设你想测试Claude 3 Sonnet模型,那么使用`anthropic.claude-3-sonnet-20240229-v1:0`作为模型ID。
+
+- **API 使用示例**
+
+```bash
+curl https://<API base url>/chat/completions \
+  -H "Content-Type: application/json" \
+  -H "Authorization: Bearer <API key>" \
+  -d '{
+    "model": "anthropic.claude-3-sonnet-20240229-v1:0",
+    "messages": [
+      {
+        "role": "user",
+        "content": "Hello!"
+      }
+    ]
+  }'
+```
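+
+响应遵循OpenAI Chat Completion的响应格式。下面是一个示意性的示例(其中`id`、`created`和token数量等字段值均为占位符,并非真实输出):
+
+```json
+{
+  "id": "chatcmpl-0123abcd",
+  "created": 1711000000,
+  "model": "anthropic.claude-3-sonnet-20240229-v1:0",
+  "system_fingerprint": "fp_e97c09dd4e26",
+  "object": "chat.completion",
+  "choices": [
+    {
+      "index": 0,
+      "message": {"role": "assistant", "content": "Hello! How can I help you today?"},
+      "finish_reason": "stop",
+      "logprobs": null
+    }
+  ],
+  "usage": {"prompt_tokens": 10, "completion_tokens": 9, "total_tokens": 19}
+}
+```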
+
+- **SDK 使用示例**
+
+```bash
+export OPENAI_API_KEY=<API key>
+export OPENAI_API_BASE=<API base url>
+```
+
+```python
+from openai import OpenAI
+
+client = OpenAI()
+completion = client.chat.completions.create(
+    model="anthropic.claude-3-sonnet-20240229-v1:0",
+    messages=[{"role": "user", "content": "Hello!"}],
+)
+
+print(completion.choices[0].message.content)
+```
+
+## 其他例子
+
+### AutoGen
+
+下图是在AutoGen Studio中配置模型的示例。
+
+![AutoGen Model](assets/autogen-model.png)
+
+### LangChain
+
+请确保使用的是`ChatOpenAI(...)`,而不是`OpenAI(...)`。
+
+```python
+# pip install langchain-openai
+from langchain.chains import LLMChain
+from langchain.prompts import PromptTemplate
+from langchain_openai import ChatOpenAI
+
+chat = ChatOpenAI(
+    model="anthropic.claude-3-sonnet-20240229-v1:0",
+    temperature=0,
+    openai_api_key="xxxx",
+    openai_api_base="http://xxx.elb.amazonaws.com/api/v1",
+)
+
+template = """Question: {question}
+
+Answer: Let's think step by step."""
+
+prompt = PromptTemplate.from_template(template)
+llm_chain = LLMChain(prompt=prompt, llm=chat)
+
+question = "What NFL team won the Super Bowl in the year Justin Bieber was born?"
+response = llm_chain.invoke(question)
+print(response)
+```
+
+## FAQs
+
+### 关于隐私
+
+本方案不会收集您的任何数据。而且,它默认情况下也不会记录任何请求或响应。
+
+### 为什么没有使用API Gateway,而是使用了Application Load Balancer?
+
+简单来说,API Gateway不支持用于流式响应的server-sent events (SSE)。
+
+### 支持哪些区域?
+
+只支持Amazon Bedrock可用的区域,即:
+
+- 美国东部(弗吉尼亚北部)
+- 美国西部(俄勒冈州)
+- 亚太地区(新加坡)
+- 亚太地区(东京)
+- 欧洲(法兰克福)
+
+注意,并非所有模型都在上述区域可用。
+
+### 我可以构建并使用自己的ECR镜像吗?
+
+是的,你可以克隆repo并自行构建容器镜像(src/Dockerfile),然后推送到你自己的ECR仓库。
+
+在部署之前,请在CloudFormation模板中替换镜像仓库URL。
+
+### 我可以在本地运行吗?
+
+是的,你可以在本地运行,此时API Base URL类似于`http://localhost:8000/api/v1`。
+
+### 使用代理API会有性能牺牲或延迟增加吗?
+
+这还有待测试。但你应该只将此解决方案用于概念验证。
+
+### 有计划支持SageMaker模型吗?
+
+目前没有支持SageMaker模型的计划。这取决于是否有客户需求。
+
+### 有计划支持Bedrock自定义模型吗?
+
+不支持微调模型和设置了预置吞吐量(Provisioned Throughput)的模型。如有需要,你可以克隆repo并进行自定义。
+
+### 如何升级?
+
+如果架构没有变化,你可以手动将最新镜像部署到Lambda中以使用新功能,而无需重新部署整个CloudFormation堆栈。
+
+## 安全
+
+更多信息,请参阅[CONTRIBUTING](CONTRIBUTING.md#security-issue-notifications)。
+
+## 许可证
+
+本项目根据MIT-0许可证获得许可。请参阅LICENSE文件。
diff --git a/assets/arch.svg b/assets/arch.svg
new file mode 100644
index 0000000..a872ef3
--- /dev/null
+++ b/assets/arch.svg
@@ -0,0 +1,4 @@
+[draw.io architecture diagram: Client / SDK -> Application Load Balancer -> AWS Lambda (Proxy) -> Amazon Bedrock, with an optional Parameter Store (API Key), all inside the AWS Cloud]
\ No newline at end of file diff --git a/assets/autogen-agent.png b/assets/autogen-agent.png new file mode 100644 index 0000000..823e1dc Binary files /dev/null and b/assets/autogen-agent.png differ diff --git a/assets/autogen-model.png b/assets/autogen-model.png new file mode 100644 index 0000000..bbc8f91 Binary files /dev/null and b/assets/autogen-model.png differ diff --git a/assets/launch-stack.png b/assets/launch-stack.png new file mode 100644 index 0000000..2745adf Binary files /dev/null and b/assets/launch-stack.png differ diff --git a/deployment/BedrockProxy.template b/deployment/BedrockProxy.template new file mode 100644 index 0000000..0ec4e23 --- /dev/null +++ b/deployment/BedrockProxy.template @@ -0,0 +1,805 @@ +{ + "Parameters": { + "ApiKeyParam": { + "Type": "String", + "Default": "", + "Description": "The parameter name in System Manager used to store the API Key, leave blank to use a default key" + } + }, + "Resources": { + "VPCB9E5F0B4": { + "Type": "AWS::EC2::VPC", + "Properties": { + "CidrBlock": "10.250.0.0/16", + "EnableDnsHostnames": true, + "EnableDnsSupport": true, + "InstanceTenancy": "default", + "Tags": [ + { + "Key": "Name", + "Value": "BedrockProxy/VPC" + } + ] + }, + "Metadata": { + "aws:cdk:path": "BedrockProxy/VPC/Resource" + } + }, + "VPCPublicSubnet1SubnetB4246D30": { + "Type": "AWS::EC2::Subnet", + "Properties": { + "AvailabilityZone": { + "Fn::Select": [ + 0, + { + "Fn::GetAZs": "" + } + ] + }, + "CidrBlock": "10.250.0.0/24", + "MapPublicIpOnLaunch": true, + "Tags": [ + { + "Key": "aws-cdk:subnet-name", + "Value": "Public" + }, + { + "Key": "aws-cdk:subnet-type", + "Value": "Public" + }, + { + "Key": "Name", + "Value": "BedrockProxy/VPC/PublicSubnet1" + } + ], + "VpcId": { + "Ref": "VPCB9E5F0B4" + } + }, + "Metadata": { + "aws:cdk:path": "BedrockProxy/VPC/PublicSubnet1/Subnet" + } + }, + "VPCPublicSubnet1RouteTableFEE4B781": { + "Type": "AWS::EC2::RouteTable", + "Properties": { + "Tags": [ + { + "Key": "Name", + "Value": "BedrockProxy/VPC/PublicSubnet1" + } + ], + "VpcId": { + "Ref": "VPCB9E5F0B4" + } + }, + "Metadata": { + "aws:cdk:path": "BedrockProxy/VPC/PublicSubnet1/RouteTable" + } + }, + "VPCPublicSubnet1RouteTableAssociation0B0896DC": { + "Type": "AWS::EC2::SubnetRouteTableAssociation", + "Properties": { + "RouteTableId": { + "Ref": "VPCPublicSubnet1RouteTableFEE4B781" + }, + "SubnetId": { + "Ref": "VPCPublicSubnet1SubnetB4246D30" + } + }, + "Metadata": { + "aws:cdk:path": "BedrockProxy/VPC/PublicSubnet1/RouteTableAssociation" + } + }, + "VPCPublicSubnet1DefaultRoute91CEF279": { + "Type": "AWS::EC2::Route", + "Properties": { + "DestinationCidrBlock": "0.0.0.0/0", + "GatewayId": { + "Ref": "VPCIGWB7E252D3" + }, + "RouteTableId": { + "Ref": "VPCPublicSubnet1RouteTableFEE4B781" + } + }, + "DependsOn": [ + "VPCVPCGW99B986DC" + ], + "Metadata": { + "aws:cdk:path": "BedrockProxy/VPC/PublicSubnet1/DefaultRoute" + } + }, + "VPCPublicSubnet2Subnet74179F39": { + "Type": "AWS::EC2::Subnet", + "Properties": { + "AvailabilityZone": { + "Fn::Select": [ + 1, + { + "Fn::GetAZs": "" + } + ] + }, + "CidrBlock": "10.250.1.0/24", + "MapPublicIpOnLaunch": true, + "Tags": [ + { + "Key": "aws-cdk:subnet-name", + "Value": "Public" + }, + { + "Key": "aws-cdk:subnet-type", + "Value": "Public" + }, + { + "Key": "Name", + "Value": "BedrockProxy/VPC/PublicSubnet2" + } + ], + "VpcId": { + "Ref": "VPCB9E5F0B4" + } + }, + "Metadata": { + "aws:cdk:path": "BedrockProxy/VPC/PublicSubnet2/Subnet" + } + }, + "VPCPublicSubnet2RouteTable6F1A15F1": { + "Type": "AWS::EC2::RouteTable", + 
"Properties": { + "Tags": [ + { + "Key": "Name", + "Value": "BedrockProxy/VPC/PublicSubnet2" + } + ], + "VpcId": { + "Ref": "VPCB9E5F0B4" + } + }, + "Metadata": { + "aws:cdk:path": "BedrockProxy/VPC/PublicSubnet2/RouteTable" + } + }, + "VPCPublicSubnet2RouteTableAssociation5A808732": { + "Type": "AWS::EC2::SubnetRouteTableAssociation", + "Properties": { + "RouteTableId": { + "Ref": "VPCPublicSubnet2RouteTable6F1A15F1" + }, + "SubnetId": { + "Ref": "VPCPublicSubnet2Subnet74179F39" + } + }, + "Metadata": { + "aws:cdk:path": "BedrockProxy/VPC/PublicSubnet2/RouteTableAssociation" + } + }, + "VPCPublicSubnet2DefaultRouteB7481BBA": { + "Type": "AWS::EC2::Route", + "Properties": { + "DestinationCidrBlock": "0.0.0.0/0", + "GatewayId": { + "Ref": "VPCIGWB7E252D3" + }, + "RouteTableId": { + "Ref": "VPCPublicSubnet2RouteTable6F1A15F1" + } + }, + "DependsOn": [ + "VPCVPCGW99B986DC" + ], + "Metadata": { + "aws:cdk:path": "BedrockProxy/VPC/PublicSubnet2/DefaultRoute" + } + }, + "VPCIGWB7E252D3": { + "Type": "AWS::EC2::InternetGateway", + "Properties": { + "Tags": [ + { + "Key": "Name", + "Value": "BedrockProxy/VPC" + } + ] + }, + "Metadata": { + "aws:cdk:path": "BedrockProxy/VPC/IGW" + } + }, + "VPCVPCGW99B986DC": { + "Type": "AWS::EC2::VPCGatewayAttachment", + "Properties": { + "InternetGatewayId": { + "Ref": "VPCIGWB7E252D3" + }, + "VpcId": { + "Ref": "VPCB9E5F0B4" + } + }, + "Metadata": { + "aws:cdk:path": "BedrockProxy/VPC/VPCGW" + } + }, + "ProxyApiHandlerServiceRoleBE71BFB1": { + "Type": "AWS::IAM::Role", + "Properties": { + "AssumeRolePolicyDocument": { + "Statement": [ + { + "Action": "sts:AssumeRole", + "Effect": "Allow", + "Principal": { + "Service": "lambda.amazonaws.com" + } + } + ], + "Version": "2012-10-17" + }, + "ManagedPolicyArns": [ + { + "Fn::Join": [ + "", + [ + "arn:", + { + "Ref": "AWS::Partition" + }, + ":iam::aws:policy/service-role/AWSLambdaBasicExecutionRole" + ] + ] + } + ] + }, + "Metadata": { + "aws:cdk:path": "BedrockProxy/Proxy/ApiHandler/ServiceRole/Resource" + } + }, + "ProxyApiHandlerServiceRoleDefaultPolicy86681202": { + "Type": "AWS::IAM::Policy", + "Properties": { + "PolicyDocument": { + "Statement": [ + { + "Action": [ + "bedrock:InvokeModel", + "bedrock:InvokeModelWithResponseStream" + ], + "Effect": "Allow", + "Resource": "arn:aws:bedrock:*::foundation-model/*" + }, + { + "Action": [ + "ssm:DescribeParameters", + "ssm:GetParameters", + "ssm:GetParameter", + "ssm:GetParameterHistory" + ], + "Effect": "Allow", + "Resource": { + "Fn::Join": [ + "", + [ + "arn:", + { + "Ref": "AWS::Partition" + }, + ":ssm:", + { + "Ref": "AWS::Region" + }, + ":", + { + "Ref": "AWS::AccountId" + }, + ":parameter/", + { + "Ref": "ApiKeyParam" + } + ] + ] + } + } + ], + "Version": "2012-10-17" + }, + "PolicyName": "ProxyApiHandlerServiceRoleDefaultPolicy86681202", + "Roles": [ + { + "Ref": "ProxyApiHandlerServiceRoleBE71BFB1" + } + ] + }, + "Metadata": { + "aws:cdk:path": "BedrockProxy/Proxy/ApiHandler/ServiceRole/DefaultPolicy/Resource" + } + }, + "ProxyApiHandlerEC15A492": { + "Type": "AWS::Lambda::Function", + "Properties": { + "Architectures": [ + "arm64" + ], + "Code": { + "ImageUri": { + "Fn::Join": [ + "", + [ + { + "Fn::Select": [ + 4, + { + "Fn::Split": [ + ":", + { + "Fn::FindInMap": [ + "ProxyRegionTable03E5BEB3", + { + "Ref": "AWS::Region" + }, + "repoArn" + ] + } + ] + } + ] + }, + ".dkr.ecr.", + { + "Fn::Select": [ + 3, + { + "Fn::Split": [ + ":", + { + "Fn::FindInMap": [ + "ProxyRegionTable03E5BEB3", + { + "Ref": "AWS::Region" + }, + "repoArn" + ] + } + ] + } + ] + }, + 
".", + { + "Ref": "AWS::URLSuffix" + }, + "/bedrock-proxy-api:latest" + ] + ] + } + }, + "Description": "Bedrock Proxy API Handler", + "Environment": { + "Variables": { + "API_KEY_PARAM_NAME": { + "Ref": "ApiKeyParam" + }, + "DEBUG": "false", + "DEFAULT_MODEL": { + "Fn::FindInMap": [ + "ProxyRegionTable03E5BEB3", + { + "Ref": "AWS::Region" + }, + "model" + ] + } + } + }, + "MemorySize": 1024, + "PackageType": "Image", + "Role": { + "Fn::GetAtt": [ + "ProxyApiHandlerServiceRoleBE71BFB1", + "Arn" + ] + }, + "Timeout": 300 + }, + "DependsOn": [ + "ProxyApiHandlerServiceRoleDefaultPolicy86681202", + "ProxyApiHandlerServiceRoleBE71BFB1" + ], + "Metadata": { + "aws:cdk:path": "BedrockProxy/Proxy/ApiHandler/Resource" + } + }, + "ProxyApiHandlerInvoke2UTWxhlfyqbT5FTn5jvgbLgjFfJwzswGk55DU1HYF6C33779": { + "Type": "AWS::Lambda::Permission", + "Properties": { + "Action": "lambda:InvokeFunction", + "FunctionName": { + "Fn::GetAtt": [ + "ProxyApiHandlerEC15A492", + "Arn" + ] + }, + "Principal": "elasticloadbalancing.amazonaws.com" + }, + "Metadata": { + "aws:cdk:path": "BedrockProxy/Proxy/ApiHandler/Invoke2UTWxhlfyqbT5FTn--5jvgbLgj+FfJwzswGk55DU1H--Y=" + } + }, + "ProxyALB87756780": { + "Type": "AWS::ElasticLoadBalancingV2::LoadBalancer", + "Properties": { + "LoadBalancerAttributes": [ + { + "Key": "deletion_protection.enabled", + "Value": "false" + } + ], + "Scheme": "internet-facing", + "SecurityGroups": [ + { + "Fn::GetAtt": [ + "ProxyALBSecurityGroup0D6CA3DA", + "GroupId" + ] + } + ], + "Subnets": [ + { + "Ref": "VPCPublicSubnet1SubnetB4246D30" + }, + { + "Ref": "VPCPublicSubnet2Subnet74179F39" + } + ], + "Type": "application" + }, + "DependsOn": [ + "VPCPublicSubnet1DefaultRoute91CEF279", + "VPCPublicSubnet1RouteTableAssociation0B0896DC", + "VPCPublicSubnet2DefaultRouteB7481BBA", + "VPCPublicSubnet2RouteTableAssociation5A808732" + ], + "Metadata": { + "aws:cdk:path": "BedrockProxy/Proxy/ALB/Resource" + } + }, + "ProxyALBSecurityGroup0D6CA3DA": { + "Type": "AWS::EC2::SecurityGroup", + "Properties": { + "GroupDescription": "Automatically created Security Group for ELB BedrockProxyALB1CE4CAD1", + "SecurityGroupEgress": [ + { + "CidrIp": "255.255.255.255/32", + "Description": "Disallow all traffic", + "FromPort": 252, + "IpProtocol": "icmp", + "ToPort": 86 + } + ], + "SecurityGroupIngress": [ + { + "CidrIp": "0.0.0.0/0", + "Description": "Allow from anyone on port 80", + "FromPort": 80, + "IpProtocol": "tcp", + "ToPort": 80 + } + ], + "VpcId": { + "Ref": "VPCB9E5F0B4" + } + }, + "Metadata": { + "aws:cdk:path": "BedrockProxy/Proxy/ALB/SecurityGroup/Resource" + } + }, + "ProxyALBListener933E9515": { + "Type": "AWS::ElasticLoadBalancingV2::Listener", + "Properties": { + "DefaultActions": [ + { + "TargetGroupArn": { + "Ref": "ProxyALBListenerTargetsGroup187739FA" + }, + "Type": "forward" + } + ], + "LoadBalancerArn": { + "Ref": "ProxyALB87756780" + }, + "Port": 80, + "Protocol": "HTTP" + }, + "Metadata": { + "aws:cdk:path": "BedrockProxy/Proxy/ALB/Listener/Resource" + } + }, + "ProxyALBListenerTargetsGroup187739FA": { + "Type": "AWS::ElasticLoadBalancingV2::TargetGroup", + "Properties": { + "HealthCheckEnabled": false, + "TargetType": "lambda", + "Targets": [ + { + "Id": { + "Fn::GetAtt": [ + "ProxyApiHandlerEC15A492", + "Arn" + ] + } + } + ] + }, + "DependsOn": [ + "ProxyApiHandlerInvoke2UTWxhlfyqbT5FTn5jvgbLgjFfJwzswGk55DU1HYF6C33779" + ], + "Metadata": { + "aws:cdk:path": "BedrockProxy/Proxy/ALB/Listener/TargetsGroup/Resource" + } + }, + "CDKMetadata": { + "Type": "AWS::CDK::Metadata", + "Properties": 
{ + "Analytics": "v2:deflate64:H4sIAAAAAAAA/1VRXW/CMAz8LbyHDMovAKZNSJtWFcTr5LpeZ0iTKHFAqOp/n1q+uief7y7ynZLp+WKhZxM4xylWx6nhUrdbATyq9Y/NIUBDQkHBOX63hJlu9x57aZ+vVZ5Kw7hNpSXpuScqXBLaQWnoyT+5ZYwOGYSdfZh7sLFCwZK8g9AZLrczt20pAvjbkBW1JUyB5fIeXPLDgTHRKcKgC/IusrhwWUEkZaApK9Dtq8MjhU0DNb0li/cIY5xTaDhGdrZTDI1uC3etMczcGcYh2hV1igxEYTQOqhIMWGRbnzLdLr03jEPLDwfVatAo9E//7WMfRyF789zxSN9BqEketUdr16mCoksBh6if4D3buodfSXy6fsrIsHa2Yhk6WleRPsSXUzbT87meTQ6ReRqSFW5IF9f5B/Z2H8goAgAA" + }, + "Metadata": { + "aws:cdk:path": "BedrockProxy/CDKMetadata/Default" + }, + "Condition": "CDKMetadataAvailable" + } + }, + "Mappings": { + "ProxyRegionTable03E5BEB3": { + "us-east-1": { + "repoArn": "arn:aws:ecr:us-east-1:366590864501:repository/bedrock-proxy-api", + "model": "anthropic.claude-3-sonnet-20240229-v1:0" + }, + "us-west-2": { + "repoArn": "arn:aws:ecr:us-west-2:366590864501:repository/bedrock-proxy-api", + "model": "anthropic.claude-3-sonnet-20240229-v1:0" + }, + "ap-southeast-1": { + "repoArn": "arn:aws:ecr:ap-southeast-1:366590864501:repository/bedrock-proxy-api", + "model": "anthropic.claude-v2" + }, + "ap-northeast-1": { + "repoArn": "arn:aws:ecr:ap-northeast-1:366590864501:repository/bedrock-proxy-api", + "model": "anthropic.claude-v2:1" + }, + "eu-central-1": { + "repoArn": "arn:aws:ecr:eu-central-1:366590864501:repository/bedrock-proxy-api", + "model": "anthropic.claude-v2:1" + } + } + }, + "Outputs": { + "APIBaseUrl": { + "Description": "Proxy API Base URL (OPENAI_API_BASE)", + "Value": { + "Fn::Join": [ + "", + [ + "http://", + { + "Fn::GetAtt": [ + "ProxyALB87756780", + "DNSName" + ] + }, + "/api/v1" + ] + ] + } + } + }, + "Conditions": { + "CDKMetadataAvailable": { + "Fn::Or": [ + { + "Fn::Or": [ + { + "Fn::Equals": [ + { + "Ref": "AWS::Region" + }, + "af-south-1" + ] + }, + { + "Fn::Equals": [ + { + "Ref": "AWS::Region" + }, + "ap-east-1" + ] + }, + { + "Fn::Equals": [ + { + "Ref": "AWS::Region" + }, + "ap-northeast-1" + ] + }, + { + "Fn::Equals": [ + { + "Ref": "AWS::Region" + }, + "ap-northeast-2" + ] + }, + { + "Fn::Equals": [ + { + "Ref": "AWS::Region" + }, + "ap-south-1" + ] + }, + { + "Fn::Equals": [ + { + "Ref": "AWS::Region" + }, + "ap-southeast-1" + ] + }, + { + "Fn::Equals": [ + { + "Ref": "AWS::Region" + }, + "ap-southeast-2" + ] + }, + { + "Fn::Equals": [ + { + "Ref": "AWS::Region" + }, + "ca-central-1" + ] + }, + { + "Fn::Equals": [ + { + "Ref": "AWS::Region" + }, + "cn-north-1" + ] + }, + { + "Fn::Equals": [ + { + "Ref": "AWS::Region" + }, + "cn-northwest-1" + ] + } + ] + }, + { + "Fn::Or": [ + { + "Fn::Equals": [ + { + "Ref": "AWS::Region" + }, + "eu-central-1" + ] + }, + { + "Fn::Equals": [ + { + "Ref": "AWS::Region" + }, + "eu-north-1" + ] + }, + { + "Fn::Equals": [ + { + "Ref": "AWS::Region" + }, + "eu-south-1" + ] + }, + { + "Fn::Equals": [ + { + "Ref": "AWS::Region" + }, + "eu-west-1" + ] + }, + { + "Fn::Equals": [ + { + "Ref": "AWS::Region" + }, + "eu-west-2" + ] + }, + { + "Fn::Equals": [ + { + "Ref": "AWS::Region" + }, + "eu-west-3" + ] + }, + { + "Fn::Equals": [ + { + "Ref": "AWS::Region" + }, + "il-central-1" + ] + }, + { + "Fn::Equals": [ + { + "Ref": "AWS::Region" + }, + "me-central-1" + ] + }, + { + "Fn::Equals": [ + { + "Ref": "AWS::Region" + }, + "me-south-1" + ] + }, + { + "Fn::Equals": [ + { + "Ref": "AWS::Region" + }, + "sa-east-1" + ] + } + ] + }, + { + "Fn::Or": [ + { + "Fn::Equals": [ + { + "Ref": "AWS::Region" + }, + "us-east-1" + ] + }, + { + "Fn::Equals": [ + { + "Ref": "AWS::Region" + }, + "us-east-2" + ] + }, + { + "Fn::Equals": [ + { + "Ref": "AWS::Region" + }, + 
"us-west-1" + ] + }, + { + "Fn::Equals": [ + { + "Ref": "AWS::Region" + }, + "us-west-2" + ] + } + ] + } + ] + } + } +} \ No newline at end of file diff --git a/src/Dockerfile b/src/Dockerfile new file mode 100644 index 0000000..920a01e --- /dev/null +++ b/src/Dockerfile @@ -0,0 +1,9 @@ +FROM public.ecr.aws/lambda/python:3.12 + +COPY ./api ./api + +COPY requirements.txt . + +RUN pip3 install -r requirements.txt -U --no-cache-dir + +CMD [ "api.app.handler" ] \ No newline at end of file diff --git a/src/api/__init__.py b/src/api/__init__.py new file mode 100644 index 0000000..e69de29 diff --git a/src/api/app.py b/src/api/app.py new file mode 100644 index 0000000..cafdf70 --- /dev/null +++ b/src/api/app.py @@ -0,0 +1,52 @@ +import logging + +import uvicorn +from fastapi import FastAPI +from fastapi.exceptions import RequestValidationError +from fastapi.middleware.cors import CORSMiddleware +from fastapi.responses import PlainTextResponse +from mangum import Mangum + +from api.routers import model, chat +from api.setting import API_ROUTE_PREFIX, TITLE, DESCRIPTION, SUMMARY, VERSION + +config = { + "title": TITLE, + "description": DESCRIPTION, + "summary": SUMMARY, + "version": VERSION, +} + +logging.basicConfig( + level=logging.INFO, + format="%(asctime)s [%(levelname)s] %(message)s", +) +app = FastAPI(**config) + +app.add_middleware( + CORSMiddleware, + allow_origins=["*"], + allow_credentials=True, + allow_methods=["*"], + allow_headers=["*"], +) + +app.include_router(model.router, prefix=API_ROUTE_PREFIX) +app.include_router(chat.router, prefix=API_ROUTE_PREFIX) + + +@app.get("/health") +async def health(): + """For health check if needed""" + return {"status": "OK"} + + +@app.exception_handler(RequestValidationError) +async def validation_exception_handler(request, exc): + return PlainTextResponse(str(exc), status_code=400) + + +handler = Mangum(app) + +if __name__ == "__main__": + uvicorn.run("app:app", host="0.0.0.0", port=8000, reload=True) diff --git a/src/api/auth.py b/src/api/auth.py new file mode 100644 index 0000000..1593375 --- /dev/null +++ b/src/api/auth.py @@ -0,0 +1,28 @@ +import os +from typing import Annotated + +import boto3 +from fastapi import Depends, HTTPException, status +from fastapi.security import HTTPBearer, HTTPAuthorizationCredentials + +from api.setting import DEFAULT_API_KEYS + +api_key_param = os.environ.get("API_KEY_PARAM_NAME") +if api_key_param: + ssm = boto3.client("ssm") + api_key = ssm.get_parameter(Name=api_key_param, WithDecryption=True)["Parameter"][ + "Value" + ] +else: + api_key = DEFAULT_API_KEYS + +security = HTTPBearer() + + +def api_key_auth( + credentials: Annotated[HTTPAuthorizationCredentials, Depends(security)] +): + if credentials.credentials != api_key: + raise HTTPException( + status_code=status.HTTP_401_UNAUTHORIZED, detail="Invalid API Key" + ) diff --git a/src/api/models/__init__.py b/src/api/models/__init__.py new file mode 100644 index 0000000..6cb3b00 --- /dev/null +++ b/src/api/models/__init__.py @@ -0,0 +1 @@ +from api.models.bedrock import ClaudeModel, SUPPORTED_BEDROCK_MODELS, get_model diff --git a/src/api/models/bedrock.py b/src/api/models/bedrock.py new file mode 100644 index 0000000..6bdd132 --- /dev/null +++ b/src/api/models/bedrock.py @@ -0,0 +1,391 @@ +import json +import logging +import uuid +from abc import ABC, abstractmethod +from typing import AsyncIterable + +import boto3 + +from api.schema import ( + ChatResponse, + ChatRequest, + ChatRequestMessage, + Choice, + ChatResponseMessage, + Usage, + ChatStreamResponse, + 
ChoiceDelta,
+)
+from api.setting import DEBUG, AWS_REGION
+
+logger = logging.getLogger(__name__)
+
+bedrock_runtime = boto3.client(
+    service_name="bedrock-runtime",
+    region_name=AWS_REGION,
+)
+
+SUPPORTED_BEDROCK_MODELS = {
+    "anthropic.claude-instant-v1": "Claude Instant",
+    "anthropic.claude-v2:1": "Claude",
+    "anthropic.claude-v2": "Claude",
+    "anthropic.claude-3-sonnet-20240229-v1:0": "Claude 3 Sonnet",
+    "anthropic.claude-3-haiku-20240307-v1:0": "Claude 3 Haiku",
+    "meta.llama2-13b-chat-v1": "Llama 2 Chat 13B",
+    "meta.llama2-70b-chat-v1": "Llama 2 Chat 70B",
+    "mistral.mistral-7b-instruct-v0:2": "Mistral 7B Instruct",
+    "mistral.mixtral-8x7b-instruct-v0:1": "Mixtral 8x7B Instruct",
+}
+
+
+class BaseChatModel(ABC):
+    """Represents a basic chat model.
+
+    Currently, only Bedrock models are supported, but this may be extended to SageMaker models if needed.
+    """
+
+    @abstractmethod
+    def chat(self, chat_request: ChatRequest) -> ChatResponse:
+        """Handle a basic chat completion request."""
+        pass
+
+    @abstractmethod
+    def chat_stream(self, chat_request: ChatRequest) -> AsyncIterable[bytes]:
+        """Handle a basic chat completion request with a streamed response."""
+        pass
+
+    def _generate_message_id(self) -> str:
+        return "chatcmpl-" + str(uuid.uuid4())[:8]
+
+    def _stream_response_to_bytes(self, response: ChatStreamResponse) -> bytes:
+        # Frame one chunk as a single server-sent event record.
+        return "data: {}\n\n".format(response.model_dump_json()).encode("utf-8")
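+
+# Wire format note: each streamed chunk above is one SSE record. An illustrative
+# (not verbatim) frame as sent to the client:
+#
+#   data: {"id": "chatcmpl-0123abcd", "created": 1711000000,
+#          "model": "anthropic.claude-3-sonnet-20240229-v1:0",
+#          "system_fingerprint": "fp_e97c09dd4e26",
+#          "choices": [{"index": 0, "finish_reason": null, "logprobs": null,
+#                       "delta": {"role": "assistant", "content": "Hi"}}],
+#          "object": "chat.completion.chunk"}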
+
+
+# https://docs.aws.amazon.com/bedrock/latest/userguide/model-parameters.html
+class BedrockModel(BaseChatModel):
+    accept = "application/json"
+    content_type = "application/json"
+
+    def _invoke_model(self, args: dict, model_id: str, with_stream: bool = False):
+        body = json.dumps(args)
+        if DEBUG:
+            logger.info("Invoke Bedrock Model: " + model_id)
+            logger.info("Bedrock request body: " + body)
+        if with_stream:
+            return bedrock_runtime.invoke_model_with_response_stream(
+                body=body,
+                modelId=model_id,
+                accept=self.accept,
+                contentType=self.content_type,
+            )
+        return bedrock_runtime.invoke_model(
+            body=body,
+            modelId=model_id,
+            accept=self.accept,
+            contentType=self.content_type,
+        )
+
+    def _create_response(
+        self,
+        model: str,
+        message: str,
+        message_id: str,
+        input_tokens: int = 0,
+        output_tokens: int = 0,
+    ) -> ChatResponse:
+        choice = Choice(
+            index=0,
+            message=ChatResponseMessage(
+                role="assistant",
+                content=message,
+            ),
+            finish_reason="stop",
+        )
+        response = ChatResponse(
+            id=message_id,
+            model=model,
+            choices=[choice],
+            usage=Usage(
+                prompt_tokens=input_tokens,
+                completion_tokens=output_tokens,
+                total_tokens=input_tokens + output_tokens,
+            ),
+        )
+        if DEBUG:
+            logger.info("Proxy response: " + response.model_dump_json())
+        return response
+
+    def _create_response_stream(
+        self, model: str, message_id: str, chunk_message: str, finish_reason: str | None
+    ) -> ChatStreamResponse:
+        choice = ChoiceDelta(
+            index=0,
+            delta=ChatResponseMessage(
+                role="assistant",
+                content=chunk_message,
+            ),
+            finish_reason=finish_reason,
+        )
+        response = ChatStreamResponse(
+            id=message_id,
+            model=model,
+            choices=[choice],
+        )
+        if DEBUG:
+            logger.info("Proxy response: " + response.model_dump_json())
+        return response
+
+
+def get_model(model_id: str) -> BedrockModel:
+    model_name = SUPPORTED_BEDROCK_MODELS.get(model_id, "")
+    if DEBUG:
+        logger.info("model name is " + model_name)
+    if model_name in ["Claude Instant", "Claude", "Claude 3 Sonnet", "Claude 3 Haiku"]:
+        return ClaudeModel()
+    elif model_name in ["Llama 2 Chat 13B", "Llama 2 Chat 70B"]:
+        return Llama2Model()
+    elif model_name in ["Mistral 7B Instruct", "Mixtral 8x7B Instruct"]:
+        return MistralModel()
+    else:
+        logger.error("Unsupported model id " + model_id)
+        raise ValueError("Invalid model ID")
+
+
+class ClaudeModel(BedrockModel):
+    anthropic_version = "bedrock-2023-05-31"
+
+    def _parse_args(self, chat_request: ChatRequest) -> dict:
+        args = {
+            "anthropic_version": self.anthropic_version,
+            "max_tokens": chat_request.max_tokens,
+            "top_p": chat_request.top_p,
+            "temperature": chat_request.temperature,
+        }
+        if chat_request.messages[0].role == "system":
+            # The Anthropic Messages API takes the system prompt as a top-level field.
+            args["system"] = chat_request.messages[0].content
+            args["messages"] = [
+                {"role": msg.role, "content": msg.content}
+                for msg in chat_request.messages[1:]
+            ]
+        else:
+            args["messages"] = [
+                {"role": msg.role, "content": msg.content}
+                for msg in chat_request.messages
+            ]
+
+        return args
+
+    def chat(self, chat_request: ChatRequest) -> ChatResponse:
+        response = self._invoke_model(
+            args=self._parse_args(chat_request), model_id=chat_request.model
+        )
+        response_body = json.loads(response.get("body").read())
+        if DEBUG:
+            logger.info("Bedrock response body: " + str(response_body))
+
+        return self._create_response(
+            model=chat_request.model,
+            message=response_body["content"][0]["text"],
+            message_id=response_body["id"],
+            input_tokens=response_body["usage"]["input_tokens"],
+            output_tokens=response_body["usage"]["output_tokens"],
+        )
+
+    def chat_stream(self, chat_request: ChatRequest) -> AsyncIterable[bytes]:
+        response = self._invoke_model(
+            args=self._parse_args(chat_request),
+            model_id=chat_request.model,
+            with_stream=True,
+        )
+        msg_id = ""
+        chunk_id = 0
+        for event in response.get("body"):
+            if DEBUG:
+                logger.info("Bedrock response chunk: " + str(event))
+            chunk = json.loads(event["chunk"]["bytes"])
+            chunk_id += 1
+            if chunk["type"] == "message_start":
+                msg_id = chunk["message"]["id"]
+                continue
+
+            if chunk["type"] == "message_delta":
+                chunk_message = ""
+                finish_reason = "stop"
+
+            elif chunk["type"] == "content_block_delta":
+                chunk_message = chunk["delta"]["text"]
+                finish_reason = None
+            else:
+                continue
+            response = self._create_response_stream(
+                model=chat_request.model,
+                message_id=msg_id,
+                chunk_message=chunk_message,
+                finish_reason=finish_reason,
+            )
+
+            yield self._stream_response_to_bytes(response)
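+
+# An illustrative Bedrock request body produced by ClaudeModel._parse_args for a chat
+# with a system prompt (the numeric values are the schema defaults, not real traffic):
+#
+#   {"anthropic_version": "bedrock-2023-05-31", "max_tokens": 2048, "top_p": 1.0,
+#    "temperature": 1.0, "system": "You are a helpful assistant.",
+#    "messages": [{"role": "user", "content": "Hello!"}]}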
+
+
+class Llama2Model(BedrockModel):
+
+    def _convert_prompt(self, messages: list[ChatRequestMessage]) -> str:
+        """Create a prompt message following the example below:
+
+        <s>[INST] <<SYS>>\n{your_system_message}\n<</SYS>>\n\n{user_message_1} [/INST] {model_reply_1}</s>
+        <s>[INST] {user_message_2} [/INST]
+        """
+        if DEBUG:
+            logger.info("Convert the messages below to a prompt for Llama 2:")
+            for msg in messages:
+                logger.info(msg.model_dump_json())
+        bos_token = "<s>"
+        eos_token = "</s>"
+        prompt = bos_token + "[INST] "
+        start = 0
+        end_turn = False
+        if messages[0].role == "system":
+            prompt += "<<SYS>>\n" + messages[0].content + "\n<</SYS>>\n\n"
+            start = 1
+        # TODO: Add validation
+        for i in range(start, len(messages)):
+            msg = messages[i]
+            if msg.role == "user":
+                if end_turn:
+                    prompt += bos_token + "[INST] "
+                prompt += msg.content + " [/INST] "
+                end_turn = False
+            else:
+                prompt += msg.content + eos_token
+                end_turn = True
+        if DEBUG:
+            logger.info("Converted prompt: " + prompt.replace("\n", "\\n"))
+        return prompt
+
+    def _parse_args(self, chat_request: ChatRequest) -> dict:
+        prompt = self._convert_prompt(chat_request.messages)
+        return {
+            "prompt": prompt,
+            "max_gen_len": chat_request.max_tokens,
+            "temperature": chat_request.temperature,
+            "top_p": chat_request.top_p,
+        }
+
+    def chat(self, chat_request: ChatRequest) -> ChatResponse:
+        response = self._invoke_model(
+            args=self._parse_args(chat_request), model_id=chat_request.model
+        )
+        response_body = json.loads(response.get("body").read())
+        if DEBUG:
+            logger.info("Bedrock response body: " + str(response_body))
+        message_id = self._generate_message_id()
+
+        return self._create_response(
+            model=chat_request.model,
+            message=response_body["generation"],
+            message_id=message_id,
+            input_tokens=response_body["prompt_token_count"],
+            output_tokens=response_body["generation_token_count"],
+        )
+
+    def chat_stream(self, chat_request: ChatRequest) -> AsyncIterable[bytes]:
+        response = self._invoke_model(
+            args=self._parse_args(chat_request),
+            model_id=chat_request.model,
+            with_stream=True,
+        )
+        # Llama 2 chunks carry no message id, so generate one for the whole stream.
+        msg_id = self._generate_message_id()
+        chunk_id = 0
+        for event in response.get("body"):
+            if DEBUG:
+                logger.info("Bedrock response chunk: " + str(event))
+            chunk = json.loads(event["chunk"]["bytes"])
+            chunk_id += 1
+            response = self._create_response_stream(
+                model=chat_request.model,
+                message_id=msg_id,
+                chunk_message=chunk["generation"],
+                finish_reason=chunk["stop_reason"],
+            )
+            yield self._stream_response_to_bytes(response)
+
+
+class MistralModel(BedrockModel):
+    def _convert_prompt(self, messages: list[ChatRequestMessage]) -> str:
+        """Create a prompt message following the example below:
+
+        <s>[INST] {your_system_message}\n{user_message_1} [/INST] {model_reply_1}</s>
+        <s>[INST] {user_message_2} [/INST]
+        """
+        if DEBUG:
+            logger.info("Convert the messages below to a prompt for Mistral:")
+            for msg in messages:
+                logger.info(msg.model_dump_json())
+        bos_token = "<s>"
+        eos_token = "</s>"
+        prompt = bos_token + "[INST] "
+        start = 0
+        end_turn = False
+        if messages[0].role == "system":
+            prompt += messages[0].content + "\n"
+            start = 1
+        # TODO: Add validation
+        for i in range(start, len(messages)):
+            msg = messages[i]
+            if msg.role == "user":
+                if end_turn:
+                    prompt += bos_token + "[INST] "
+                prompt += msg.content + " [/INST] "
+                end_turn = False
+            else:
+                prompt += msg.content + eos_token
+                end_turn = True
+        if DEBUG:
+            logger.info("Converted prompt: " + prompt.replace("\n", "\\n"))
+        return prompt
+
+    def _parse_args(self, chat_request: ChatRequest) -> dict:
+        prompt = self._convert_prompt(chat_request.messages)
+        return {
+            "prompt": prompt,
+            "max_tokens": chat_request.max_tokens,
+            "temperature": chat_request.temperature,
+            "top_p": chat_request.top_p,
+        }
+
+    def chat(self, chat_request: ChatRequest) -> ChatResponse:
+        response = self._invoke_model(
+            args=self._parse_args(chat_request), model_id=chat_request.model
+        )
+        response_body = json.loads(response.get("body").read())
+        if DEBUG:
+            logger.info("Bedrock response body: " + str(response_body))
+        message_id = self._generate_message_id()
+
+        return self._create_response(
+            model=chat_request.model,
+            message=response_body["outputs"][0]["text"],
+            message_id=message_id,
+        )
+
+    def chat_stream(self, chat_request: ChatRequest) -> AsyncIterable[bytes]:
+        response = self._invoke_model(
+            args=self._parse_args(chat_request),
+            model_id=chat_request.model,
+            with_stream=True,
+        )
+        # Mistral chunks carry no message id either, so generate one for the whole stream.
+        msg_id = self._generate_message_id()
+        chunk_id = 0
+        for event in response.get("body"):
+            if DEBUG:
+                logger.info("Bedrock response chunk: " + str(event))
+            chunk = json.loads(event["chunk"]["bytes"])
+            chunk_id += 1
+            response = self._create_response_stream(
+                model=chat_request.model,
+                message_id=msg_id,
+                chunk_message=chunk["outputs"][0]["text"],
+                finish_reason=chunk["outputs"][0]["stop_reason"],
+            )
+            yield self._stream_response_to_bytes(response)
diff --git a/src/api/routers/__init__.py b/src/api/routers/__init__.py
new file mode 100644
index 0000000..e69de29
diff --git a/src/api/routers/chat.py b/src/api/routers/chat.py
new file mode 100644
index 0000000..d9b2fa6
--- /dev/null
+++ b/src/api/routers/chat.py
@@ -0,0 +1,51 @@
+from typing import Annotated
+
+from fastapi import APIRouter, Depends, Body, HTTPException
+from fastapi.responses import StreamingResponse
+
+from api.auth import api_key_auth
+from api.models import get_model, SUPPORTED_BEDROCK_MODELS
+from api.schema import ChatRequest, ChatResponse, ChatStreamResponse
+from api.setting import DEFAULT_MODEL
+
+router = APIRouter(
+    prefix="/chat",
+    tags=["chat"],
+    dependencies=[Depends(api_key_auth)],
+    # responses={404: {"description": "Not found"}},
+)
+
+
+@router.post("/completions", response_model=ChatResponse | ChatStreamResponse)
+async def chat_completions(
+    chat_request: Annotated[
+        ChatRequest,
+        Body(
+            examples=[
+                {
+                    "model": "anthropic.claude-3-sonnet-20240229-v1:0",
+                    "messages": [
+                        {"role": "system", "content": "You are a helpful assistant."},
+                        {"role": "user", "content": "Hello!"},
+                    ],
+                }
+            ],
+        ),
+    ]
+):
+    # Map any OpenAI "gpt-*" model id to the configured default Bedrock model.
+    if chat_request.model.lower().startswith("gpt-"):
+        chat_request.model = DEFAULT_MODEL
+    if chat_request.model not in SUPPORTED_BEDROCK_MODELS:
+        raise HTTPException(status_code=400, detail="Unsupported Model Id " + chat_request.model)
+    try:
+        model = get_model(chat_request.model)
+
+        if chat_request.stream:
+            return StreamingResponse(
+                content=model.chat_stream(chat_request), media_type="text/event-stream"
+            )
+        return model.chat(chat_request)
+    except ValueError as e:
+        raise HTTPException(status_code=400, detail=str(e))
diff --git a/src/api/routers/model.py b/src/api/routers/model.py
new file mode 100644
index 0000000..4d10f98
--- /dev/null
+++ b/src/api/routers/model.py
@@ -0,0 +1,41 @@
+from typing import Annotated
+
+from fastapi import APIRouter, Depends, HTTPException, Path
+
+from api.auth import api_key_auth
+from api.models import SUPPORTED_BEDROCK_MODELS
+from api.schema import Models, Model
+
+router = APIRouter(
+    prefix="/models",
+    tags=["models"],
+    dependencies=[Depends(api_key_auth)],
+    # responses={404: {"description": "Not found"}},
+)
+
+
+async def validate_model_id(model_id: str):
+    if model_id not in SUPPORTED_BEDROCK_MODELS:
+        raise HTTPException(status_code=400, detail="Unsupported Model Id")
+
+
+@router.get("/", response_model=Models)
+async def list_models():
+    model_list = [Model(id=model_id) for model_id in SUPPORTED_BEDROCK_MODELS]
+    return Models(data=model_list)
+
+
+@router.get(
+    "/{model_id}",
+    response_model=Model,
+)
+async def get_model(
+    model_id: Annotated[
+        str,
+        Path(description="Model ID", example="anthropic.claude-3-sonnet-20240229-v1:0"),
+    ]
+):
+    await validate_model_id(model_id)
+    return Model(id=model_id)
diff --git a/src/api/schema.py b/src/api/schema.py
new file mode 100644
index 0000000..53732c8
--- /dev/null
+++ b/src/api/schema.py
@@ -0,0 +1,80 @@
+import time
+from typing import Literal
+
+from pydantic import BaseModel, Field
+
+
+class Model(BaseModel):
+    id: str
+    created: int = Field(default_factory=lambda: int(time.time()))
+    object: str | None = "model"
+    owned_by: str | None = "bedrock"
+
+
+class Models(BaseModel):
+    object: str | None = "list"
+    data: list[Model] = []
+
+
+class 
ChatRequestMessage(BaseModel): + name: str | None = None + role: Literal["user", "assistant", "system"] + content: str + + +class ChatRequest(BaseModel): + messages: list[ChatRequestMessage] + model: str + frequency_penalty: float | None = Field(default=0.0, le=2.0, ge=-2.0) # Not used + presence_penalty: float | None = Field(default=0.0, le=2.0, ge=-2.0) # Not used + stream: bool | None = False + temperature: float | None = Field(default=1.0, le=2.0, ge=0.0) + top_p: float | None = Field(default=1.0, le=1.0, ge=0.0) + user: str | None = None # Not used + max_tokens: int | None = 2048 + n: int | None = 1 # Not used + + +class Usage(BaseModel): + prompt_tokens: int + completion_tokens: int + total_tokens: int + + +class ChatResponseMessage(BaseModel): + # tool_calls + role: Literal["assistant"] | None = None + content: str | None = None + + +class BaseChoice(BaseModel): + index: int + finish_reason: str | None + logprobs: dict | None = None + + +class Choice(BaseChoice): + message: ChatResponseMessage + + +class ChoiceDelta(BaseChoice): + delta: ChatResponseMessage + + +class BaseChatResponse(BaseModel): + # id: str = Field(default_factory=lambda: "chatcmpl-" + str(uuid.uuid4())[:8]) + id: str + created: int = Field(default_factory=lambda: int(time.time())) + model: str + system_fingerprint: str = "fp_e97c09dd4e26" + + +class ChatResponse(BaseChatResponse): + choices: list[Choice] + object: Literal["chat.completion"] = "chat.completion" + usage: Usage + + +class ChatStreamResponse(BaseChatResponse): + choices: list[ChoiceDelta] + object: Literal["chat.completion.chunk"] = "chat.completion.chunk" diff --git a/src/api/setting.py b/src/api/setting.py new file mode 100644 index 0000000..f183aa2 --- /dev/null +++ b/src/api/setting.py @@ -0,0 +1,27 @@ +import os + +DEFAULT_API_KEYS = "bedrock" + +API_ROUTE_PREFIX = "/api/v1" + +TITLE = "Amazon Bedrock Proxy APIs" +SUMMARY = "OpenAI-Compatible RESTful APIs for Amazon Bedrock" +VERSION = "0.1.0" +DESCRIPTION = """ +Use OpenAI-Compatible RESTful APIs for Amazon Bedrock models. + +List of Amazon Bedrock models currently supported: +- anthropic.claude-instant-v1 +- anthropic.claude-v2:1 +- anthropic.claude-v2 +- anthropic.claude-3-sonnet-20240229-v1:0 +- anthropic.claude-3-haiku-20240307-v1:0 +- meta.llama2-13b-chat-v1 +- meta.llama2-70b-chat-v1 +- mistral.mistral-7b-instruct-v0:2 +- mistral.mixtral-8x7b-instruct-v0:1 +""" + +DEBUG = os.environ.get("DEBUG", "false").lower() != "false" +AWS_REGION = os.environ.get("AWS_REGION", "us-west-2") +DEFAULT_MODEL = os.environ.get("DEFAULT_MODEL", "anthropic.claude-3-sonnet-20240229-v1:0") diff --git a/src/requirements.txt b/src/requirements.txt new file mode 100644 index 0000000..fec17d7 --- /dev/null +++ b/src/requirements.txt @@ -0,0 +1,4 @@ +fastapi==0.103.0 +pydantic==2.6.3 +uvicorn==0.27.0.post1 +mangum==0.17.0 \ No newline at end of file