Spaces:
Runtime error
Runtime error
Saif Rehman Nasir
committed on
Commit
·
756f286
1
Parent(s):
b861528
Update model
Browse files
app.py
CHANGED
@@ -12,7 +12,7 @@ index = pc.Index("medicine")
|
|
12 |
"""
|
13 |
For more information on `huggingface_hub` Inference API support, please check the docs: https://huggingface.co/docs/huggingface_hub/v0.22.2/en/guides/inference
|
14 |
"""
|
15 |
-
client = InferenceClient("
|
16 |
|
17 |
embedding_model = SentenceTransformer(
|
18 |
"nomic-ai/nomic-embed-text-v1", trust_remote_code=True
|
@@ -55,7 +55,7 @@ def respond(
|
|
55 |
messages.append({"role": "user", "content": retrieved_data})
|
56 |
|
57 |
response = ""
|
58 |
-
|
59 |
for message in client.chat_completion(
|
60 |
messages,
|
61 |
max_tokens=max_tokens,
|
|
|
12 |
"""
|
13 |
For more information on `huggingface_hub` Inference API support, please check the docs: https://huggingface.co/docs/huggingface_hub/v0.22.2/en/guides/inference
|
14 |
"""
|
15 |
+
client = InferenceClient("meta-llama/Meta-Llama-3-8B-Instruct")
|
16 |
|
17 |
embedding_model = SentenceTransformer(
|
18 |
"nomic-ai/nomic-embed-text-v1", trust_remote_code=True
|
|
|
55 |
messages.append({"role": "user", "content": retrieved_data})
|
56 |
|
57 |
response = ""
|
58 |
+
print("Completion request")
|
59 |
for message in client.chat_completion(
|
60 |
messages,
|
61 |
max_tokens=max_tokens,
|