Spaces:
Running
on
CPU Upgrade
Running
on
CPU Upgrade
model changed to Haiku 3.5 for query rewrite
Browse files
utilities/invoke_models.py
CHANGED
@@ -33,6 +33,7 @@ def invoke_model(input):
|
|
33 |
modelId="amazon.titan-embed-text-v1",
|
34 |
accept="application/json",
|
35 |
contentType="application/json",
|
|
|
36 |
)
|
37 |
|
38 |
response_body = json.loads(response.get("body").read())
|
@@ -53,7 +54,7 @@ def invoke_model_mm(text,img):
|
|
53 |
contentType = "application/json"
|
54 |
|
55 |
response = bedrock_runtime_client.invoke_model(
|
56 |
-
body=body, modelId=modelId, accept=accept, contentType=contentType
|
57 |
)
|
58 |
response_body = json.loads(response.get("body").read())
|
59 |
#print(response_body)
|
@@ -65,6 +66,7 @@ def invoke_llm_model(input,is_stream):
|
|
65 |
modelId= "anthropic.claude-3-5-haiku-20241022-v1:0",#"anthropic.claude-3-5-sonnet-20240620-v1:0",,
|
66 |
contentType = "application/json",
|
67 |
accept = "application/json",
|
|
|
68 |
|
69 |
body = json.dumps({
|
70 |
"anthropic_version": "bedrock-2023-05-31",
|
|
|
33 |
modelId="amazon.titan-embed-text-v1",
|
34 |
accept="application/json",
|
35 |
contentType="application/json",
|
36 |
+
performanceConfigLatency='optimized'
|
37 |
)
|
38 |
|
39 |
response_body = json.loads(response.get("body").read())
|
|
|
54 |
contentType = "application/json"
|
55 |
|
56 |
response = bedrock_runtime_client.invoke_model(
|
57 |
+
body=body, modelId=modelId, accept=accept, contentType=contentType,performanceConfigLatency='optimized'
|
58 |
)
|
59 |
response_body = json.loads(response.get("body").read())
|
60 |
#print(response_body)
|
|
|
66 |
modelId= "anthropic.claude-3-5-haiku-20241022-v1:0",#"anthropic.claude-3-5-sonnet-20240620-v1:0",,
|
67 |
contentType = "application/json",
|
68 |
accept = "application/json",
|
69 |
+
performanceConfigLatency='optimized'
|
70 |
|
71 |
body = json.dumps({
|
72 |
"anthropic_version": "bedrock-2023-05-31",
|