Skip to content

Commit 1ece675

Browse files
massi-angbigadsoleiman
authored and committed
feat(claude_mm): adding multimodal chat for Claude
redesign of the Idefics model interface to accept multiple models via adapters.
1 parent 0545d45 commit 1ece675

File tree

19 files changed

+461
-241
lines changed

19 files changed

+461
-241
lines changed

lib/aws-genai-llm-chatbot-stack.ts

Lines changed: 57 additions & 56 deletions
Original file line numberDiff line numberDiff line change
@@ -53,7 +53,7 @@ export class AwsGenAILLMChatbotStack extends cdk.Stack {
5353
});
5454

5555
// Langchain Interface Construct
56-
// This is the model interface recieving messages from the websocket interface via the message topic
56+
// This is the model interface receiving messages from the websocket interface via the message topic
5757
// and interacting with the model via LangChain library
5858
const langchainModels = models.models.filter(
5959
(model) => model.interface === ModelInterface.LangChain
@@ -100,46 +100,45 @@ export class AwsGenAILLMChatbotStack extends cdk.Stack {
100100
}
101101

102102
// IDEFICS Interface Construct
103-
// This is the model interface recieving messages from the websocket interface via the message topic
103+
// This is the model interface receiving messages from the websocket interface via the message topic
104104
// and interacting with IDEFICS visual language models
105105
const ideficsModels = models.models.filter(
106-
(model) => model.interface === ModelInterface.Idefics
106+
(model) => model.interface === ModelInterface.MultiModal
107107
);
108108

109109
// check if any deployed model requires idefics interface
110-
if (ideficsModels.length > 0) {
111-
const ideficsInterface = new IdeficsInterface(this, "IdeficsInterface", {
112-
shared,
113-
config: props.config,
114-
messagesTopic: chatBotApi.messagesTopic,
115-
sessionsTable: chatBotApi.sessionsTable,
116-
byUserIdIndex: chatBotApi.byUserIdIndex,
117-
chatbotFilesBucket: chatBotApi.filesBucket,
118-
});
119110

120-
// Route all incoming messages targeted to idefics to the idefics model interface queue
121-
chatBotApi.messagesTopic.addSubscription(
122-
new subscriptions.SqsSubscription(ideficsInterface.ingestionQueue, {
123-
filterPolicyWithMessageBody: {
124-
direction: sns.FilterOrPolicy.filter(
125-
sns.SubscriptionFilter.stringFilter({
126-
allowlist: [Direction.In],
127-
})
128-
),
129-
modelInterface: sns.FilterOrPolicy.filter(
130-
sns.SubscriptionFilter.stringFilter({
131-
allowlist: [ModelInterface.Idefics],
132-
})
133-
),
134-
},
135-
})
136-
);
111+
const ideficsInterface = new IdeficsInterface(this, "IdeficsInterface", {
112+
shared,
113+
config: props.config,
114+
messagesTopic: chatBotApi.messagesTopic,
115+
sessionsTable: chatBotApi.sessionsTable,
116+
byUserIdIndex: chatBotApi.byUserIdIndex,
117+
chatbotFilesBucket: chatBotApi.filesBucket,
118+
});
137119

138-
for (const model of models.models) {
139-
// if model name contains idefics then add to idefics interface
140-
if (model.interface === ModelInterface.Idefics) {
141-
ideficsInterface.addSageMakerEndpoint(model);
142-
}
120+
// Route all incoming messages targeted to idefics to the idefics model interface queue
121+
chatBotApi.messagesTopic.addSubscription(
122+
new subscriptions.SqsSubscription(ideficsInterface.ingestionQueue, {
123+
filterPolicyWithMessageBody: {
124+
direction: sns.FilterOrPolicy.filter(
125+
sns.SubscriptionFilter.stringFilter({
126+
allowlist: [Direction.In],
127+
})
128+
),
129+
modelInterface: sns.FilterOrPolicy.filter(
130+
sns.SubscriptionFilter.stringFilter({
131+
allowlist: [ModelInterface.MultiModal],
132+
})
133+
),
134+
},
135+
})
136+
);
137+
138+
for (const model of models.models) {
139+
// if model name contains idefics then add to idefics interface
140+
if (model.interface === ModelInterface.MultiModal) {
141+
ideficsInterface.addSageMakerEndpoint(model);
143142
}
144143
}
145144

@@ -415,38 +414,40 @@ export class AwsGenAILLMChatbotStack extends cdk.Stack {
415414
reason: "Not yet upgraded from Python 3.11 to 3.12.",
416415
},
417416
]);
418-
417+
419418
if (props.config.privateWebsite) {
420419
const paths = [];
421-
for(let index = 0; index < shared.vpc.availabilityZones.length; index++) {
422-
paths.push(`/${this.stackName}/UserInterface/PrivateWebsite/DescribeNetworkInterfaces-${index}/CustomResourcePolicy/Resource`,)
420+
for (
421+
let index = 0;
422+
index < shared.vpc.availabilityZones.length;
423+
index++
424+
) {
425+
paths.push(
426+
`/${this.stackName}/UserInterface/PrivateWebsite/DescribeNetworkInterfaces-${index}/CustomResourcePolicy/Resource`
427+
);
423428
}
424-
paths.push(`/${this.stackName}/UserInterface/PrivateWebsite/describeVpcEndpoints/CustomResourcePolicy/Resource`,)
429+
paths.push(
430+
`/${this.stackName}/UserInterface/PrivateWebsite/describeVpcEndpoints/CustomResourcePolicy/Resource`
431+
);
432+
NagSuppressions.addResourceSuppressionsByPath(this, paths, [
433+
{
434+
id: "AwsSolutions-IAM5",
435+
reason:
436+
"Custom Resource requires permissions to Describe VPC Endpoint Network Interfaces",
437+
},
438+
]);
425439
NagSuppressions.addResourceSuppressionsByPath(
426440
this,
427-
paths,
441+
[
442+
`/${this.stackName}/AWS679f53fac002430cb0da5b7982bd2287/ServiceRole/Resource`,
443+
],
428444
[
429445
{
430-
id: "AwsSolutions-IAM5",
431-
reason:
432-
"Custom Resource requires permissions to Describe VPC Endpoint Network Interfaces",
446+
id: "AwsSolutions-IAM4",
447+
reason: "IAM role implicitly created by CDK.",
433448
},
434449
]
435450
);
436-
NagSuppressions.addResourceSuppressionsByPath(
437-
this,
438-
[
439-
`/${this.stackName}/AWS679f53fac002430cb0da5b7982bd2287/ServiceRole/Resource`
440-
],
441-
[
442-
{
443-
id: "AwsSolutions-IAM4",
444-
reason:
445-
"IAM role implicitly created by CDK.",
446-
},
447-
]
448-
);
449-
450451
}
451452
}
452453
}
Lines changed: 2 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,2 @@
1+
from .idefics import Idefics
2+
from .claude import Claude3
Lines changed: 12 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,12 @@
1+
from abc import abstractmethod
2+
3+
4+
class MultiModalModelBase:
    """Contract shared by all multimodal chat adapters (e.g. IDEFICS, Claude 3).

    Concrete adapters must implement prompt formatting and model invocation;
    `clean_prompt` may be overridden to strip bulky payloads (such as base64
    images) before a prompt is persisted or logged.
    """

    @abstractmethod
    def handle_run(self, prompt: str, model_kwargs: dict) -> str:
        """Invoke the underlying model with a formatted prompt and return its text reply."""

    @abstractmethod
    def format_prompt(self, prompt: str, messages: list, files: list) -> str:
        """Render chat history, the new user prompt, and attachments into the model's wire format."""

    def clean_prompt(self, prompt: str) -> str:
        """Return the prompt unchanged; adapters override to redact heavy content."""
        return prompt
Lines changed: 104 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,104 @@
1+
from .base import MultiModalModelBase
2+
from genai_core.types import ChatbotAction, ChatbotMessageType
3+
from urllib.parse import urljoin
4+
import os
5+
from genai_core.clients import get_bedrock_client
6+
import json
7+
import requests
8+
from base64 import b64encode
9+
from genai_core.registry import registry
10+
11+
12+
def get_image_message(
    file: dict,
):
    """Fetch a chat attachment from the private files API and wrap it as an
    Anthropic Messages-API image content block (base64-encoded).

    `file` is expected to carry the S3 object key under "key"
    — TODO confirm against caller.
    """
    import mimetypes  # local import: only this helper needs it

    img = requests.get(
        f"{urljoin(os.environ['CHATBOT_FILES_PRIVATE_API'], file['key'])}"
    ).content
    # The original hard-coded "image/jpeg" for every attachment; Claude
    # validates media_type against the payload, so non-JPEG uploads would be
    # rejected. Infer from the file key, falling back to jpeg (old behavior)
    # when the key has no recognizable extension.
    media_type = mimetypes.guess_type(file["key"])[0] or "image/jpeg"
    return {
        "type": "image",
        "source": {
            "type": "base64",
            "media_type": media_type,
            "data": str(b64encode(img), "ascii"),
        },
    }
26+
27+
28+
class Claude3(MultiModalModelBase):
    """Adapter for Anthropic Claude 3 multimodal models served via Amazon Bedrock."""

    model_id: str
    # NOTE(review): `any` here is the builtin function, not typing.Any — it is
    # only stored in __annotations__; consider typing.Any for clarity.
    client: any

    def __init__(self, model_id: str):
        self.model_id = model_id
        self.client = get_bedrock_client()

    def format_prompt(self, prompt: str, messages: list, files: list) -> str:
        """Serialize chat history + the new user turn into a Messages-API JSON body.

        Images attached to user turns are inlined as base64 content blocks.
        Returns the JSON string passed later to `handle_run`.
        """
        prompts = []

        # Chat history: replay each turn, attaching any images the user sent.
        for message in messages:
            if message.type.lower() == ChatbotMessageType.Human.value.lower():
                user_msg = {
                    "role": "user",
                    "content": [{"type": "text", "text": message.content}],
                }
                prompts.append(user_msg)
                message_files = message.additional_kwargs.get("files", [])
                for message_file in message_files:
                    user_msg["content"].append(get_image_message(message_file))
            if message.type.lower() == ChatbotMessageType.AI.value.lower():
                prompts.append({"role": "assistant", "content": message.content})

        # Current user prompt plus any newly uploaded files.
        user_msg = {
            "role": "user",
            "content": [{"type": "text", "text": prompt}],
        }
        prompts.append(user_msg)
        for file in files:
            user_msg["content"].append(get_image_message(file))

        return json.dumps(
            {
                "anthropic_version": "bedrock-2023-05-31",
                "max_tokens": 512,
                "messages": prompts,
                "temperature": 0.3,
            }
        )

    def handle_run(self, prompt: str, model_kwargs: dict):
        """Invoke Bedrock with the serialized body, applying caller overrides.

        Recognized model_kwargs: temperature, topP, maxTokens, topK.
        Returns the text of the first content block in the model response.
        """
        print(model_kwargs)  # debug: surface requested overrides in the logs
        body = json.loads(prompt)

        if "temperature" in model_kwargs:
            body["temperature"] = model_kwargs["temperature"]
        if "topP" in model_kwargs:
            body["top_p"] = model_kwargs["topP"]
        if "maxTokens" in model_kwargs:
            body["max_tokens"] = model_kwargs["maxTokens"]
        if "topK" in model_kwargs:
            body["top_k"] = model_kwargs["topK"]

        body_str = json.dumps(body)
        mlm_response = self.client.invoke_model(
            modelId=self.model_id,
            body=body_str,
            accept="application/json",
            contentType="application/json",
        )

        return json.loads(mlm_response["body"].read())["content"][0]["text"]

    def clean_prompt(self, prompt: str) -> str:
        """Blank out base64 image payloads so the stored prompt stays small."""
        p = json.loads(prompt)
        for m in p["messages"]:
            if m["role"] == "user" and isinstance(m["content"], list):
                for c in m["content"]:
                    if c["type"] == "image":
                        # BUG FIX: image bytes live at c["source"]["data"]
                        # (see get_image_message); the original wrote
                        # c["data"]["source"], raising KeyError for any
                        # prompt that contains an image.
                        c["source"]["data"] = ""
        return json.dumps(p)
102+
103+
104+
# Escape the literal dots: unescaped '.' matches any character, so the old
# pattern could match unintended provider/model ids.
registry.register(r"^bedrock\.anthropic\.claude-3.*", Claude3)
Lines changed: 84 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,84 @@
1+
from .base import MultiModalModelBase
2+
from genai_core.types import ChatbotAction, ChatbotMessageType
3+
from urllib.parse import urljoin
4+
import os
5+
from langchain.llms import SagemakerEndpoint
6+
from content_handler import ContentHandler
7+
from genai_core.registry import registry
8+
9+
10+
class Idefics(MultiModalModelBase):
    """Adapter for IDEFICS visual-language models hosted on a SageMaker endpoint."""

    model_id: str

    def __init__(self, model_id: str):
        self.model_id = model_id

    def format_prompt(self, prompt: str, messages: list, files: list) -> str:
        """Render history plus the current turn into IDEFICS dialogue markup.

        User turns with attachments become `User:<text>![](<image-url>)`
        segments (one per file); the string ends with an Assistant cue so the
        model continues the conversation.
        """
        api_base = os.environ["CHATBOT_FILES_PRIVATE_API"]
        human_kind = ChatbotMessageType.Human.value.lower()
        ai_kind = ChatbotMessageType.AI.value.lower()

        segments = []
        for message in messages:
            kind = message.type.lower()
            if kind == human_kind:
                attachments = message.additional_kwargs.get("files", [])
                if not attachments:
                    segments.append(f"User:{message.content}")
                for attachment in attachments:
                    image_url = urljoin(api_base, attachment["key"])
                    segments.append(f"User:{message.content}![]({image_url})")
            if kind == ai_kind:
                segments.append(f"Assistant:{message.content}")

        # Current turn: text-only, or one segment per newly uploaded file.
        if not files:
            segments.append(f"User:{prompt}")
        for file in files:
            image_url = urljoin(api_base, file["key"])
            segments.append(f"User:{prompt}![]({image_url})")

        segments.append("<end_of_utterance>\nAssistant:")

        rendered = "".join(segments)
        print(rendered)  # debug: log the final prompt sent to the endpoint
        return rendered

    def handle_run(self, prompt: str, model_kwargs: dict):
        """Call the SageMaker endpoint; defaults may be overridden via model_kwargs
        (temperature, topP, maxTokens)."""
        print(model_kwargs)  # debug: surface requested overrides in the logs
        params = {
            "do_sample": True,
            "top_p": 0.2,
            "temperature": 0.4,
            "top_k": 50,
            "max_new_tokens": 512,
            "stop": ["User:", "<end_of_utterance>"],
        }
        # Map chatbot-style option names onto the endpoint's parameter names.
        overrides = {
            "temperature": "temperature",
            "topP": "top_p",
            "maxTokens": "max_new_tokens",
        }
        for option, target in overrides.items():
            if option in model_kwargs:
                params[target] = model_kwargs[option]

        endpoint = SagemakerEndpoint(
            endpoint_name=self.model_id,
            region_name=os.environ["AWS_REGION"],
            model_kwargs=params,
            content_handler=ContentHandler(),
        )
        return endpoint.predict(prompt)
82+
83+
84+
# BUG FIX: the original pattern was r"^sagemaker.*idefics*" — the '*' bound to
# the final 's' ("idefic" plus zero-or-more 's'), not to a wildcard suffix.
registry.register(r"^sagemaker.*idefics.*", Idefics)

0 commit comments

Comments
 (0)