prasadnu committed on
Commit
1608ab2
·
1 Parent(s): d1e16b2

model changed to Haiku 3.5 for query rewrite

Browse files
Files changed (1) hide show
  1. utilities/invoke_models.py +3 -1
utilities/invoke_models.py CHANGED
@@ -33,6 +33,7 @@ def invoke_model(input):
33
  modelId="amazon.titan-embed-text-v1",
34
  accept="application/json",
35
  contentType="application/json",
 
36
  )
37
 
38
  response_body = json.loads(response.get("body").read())
@@ -53,7 +54,7 @@ def invoke_model_mm(text,img):
53
  contentType = "application/json"
54
 
55
  response = bedrock_runtime_client.invoke_model(
56
- body=body, modelId=modelId, accept=accept, contentType=contentType
57
  )
58
  response_body = json.loads(response.get("body").read())
59
  #print(response_body)
@@ -65,6 +66,7 @@ def invoke_llm_model(input,is_stream):
65
  modelId= "anthropic.claude-3-5-haiku-20241022-v1:0",#"anthropic.claude-3-5-sonnet-20240620-v1:0",,
66
  contentType = "application/json",
67
  accept = "application/json",
 
68
 
69
  body = json.dumps({
70
  "anthropic_version": "bedrock-2023-05-31",
 
33
  modelId="amazon.titan-embed-text-v1",
34
  accept="application/json",
35
  contentType="application/json",
36
+ performanceConfigLatency='optimized'
37
  )
38
 
39
  response_body = json.loads(response.get("body").read())
 
54
  contentType = "application/json"
55
 
56
  response = bedrock_runtime_client.invoke_model(
57
+ body=body, modelId=modelId, accept=accept, contentType=contentType,performanceConfigLatency='optimized'
58
  )
59
  response_body = json.loads(response.get("body").read())
60
  #print(response_body)
 
66
  modelId= "anthropic.claude-3-5-haiku-20241022-v1:0",#"anthropic.claude-3-5-sonnet-20240620-v1:0",,
67
  contentType = "application/json",
68
  accept = "application/json",
69
+ performanceConfigLatency='optimized'
70
 
71
  body = json.dumps({
72
  "anthropic_version": "bedrock-2023-05-31",