Spaces:
Running
on
T4
Running
on
T4
model changed to Haiku 3.5 for query re-write
Browse files
utilities/invoke_models.py
CHANGED
@@ -11,8 +11,6 @@ import streamlit as st
|
|
11 |
#from transformers import VisionEncoderDecoderModel, ViTImageProcessor, AutoTokenizer
|
12 |
#import torch
|
13 |
|
14 |
-
region = 'us-east-1'
|
15 |
-
|
16 |
def get_bedrock_client():
|
17 |
return boto3.client(
|
18 |
'bedrock-runtime',
|
@@ -32,8 +30,8 @@ def invoke_model(input):
|
|
32 |
}),
|
33 |
modelId="amazon.titan-embed-text-v1",
|
34 |
accept="application/json",
|
35 |
-
contentType="application/json"
|
36 |
-
performanceConfigLatency='optimized'
|
37 |
)
|
38 |
|
39 |
response_body = json.loads(response.get("body").read())
|
@@ -54,7 +52,7 @@ def invoke_model_mm(text,img):
|
|
54 |
contentType = "application/json"
|
55 |
|
56 |
response = bedrock_runtime_client.invoke_model(
|
57 |
-
body=body, modelId=modelId, accept=accept, contentType=contentType
|
58 |
)
|
59 |
response_body = json.loads(response.get("body").read())
|
60 |
#print(response_body)
|
@@ -63,7 +61,7 @@ def invoke_model_mm(text,img):
|
|
63 |
def invoke_llm_model(input,is_stream):
|
64 |
if(is_stream == False):
|
65 |
response = bedrock_runtime_client.invoke_model(
|
66 |
-
modelId= "anthropic.claude-3-5-haiku-20241022-v1:0",#"anthropic.claude-3-5-sonnet-20240620-v1:0",,
|
67 |
contentType = "application/json",
|
68 |
accept = "application/json",
|
69 |
performanceConfigLatency='optimized',
|
|
|
11 |
#from transformers import VisionEncoderDecoderModel, ViTImageProcessor, AutoTokenizer
|
12 |
#import torch
|
13 |
|
|
|
|
|
14 |
def get_bedrock_client():
|
15 |
return boto3.client(
|
16 |
'bedrock-runtime',
|
|
|
30 |
}),
|
31 |
modelId="amazon.titan-embed-text-v1",
|
32 |
accept="application/json",
|
33 |
+
contentType="application/json"
|
34 |
+
#,performanceConfigLatency='optimized'
|
35 |
)
|
36 |
|
37 |
response_body = json.loads(response.get("body").read())
|
|
|
52 |
contentType = "application/json"
|
53 |
|
54 |
response = bedrock_runtime_client.invoke_model(
|
55 |
+
body=body, modelId=modelId, accept=accept, contentType=contentType#,performanceConfigLatency='optimized'
|
56 |
)
|
57 |
response_body = json.loads(response.get("body").read())
|
58 |
#print(response_body)
|
|
|
61 |
def invoke_llm_model(input,is_stream):
|
62 |
if(is_stream == False):
|
63 |
response = bedrock_runtime_client.invoke_model(
|
64 |
+
modelId= "us.anthropic.claude-3-5-haiku-20241022-v1:0"#"anthropic.claude-3-5-haiku-20241022-v1:0",#"anthropic.claude-3-5-sonnet-20240620-v1:0",,
|
65 |
contentType = "application/json",
|
66 |
accept = "application/json",
|
67 |
performanceConfigLatency='optimized',
|