Spaces:
Runtime error
ishaan-mital
committed on
Commit · d1289ae
1 Parent(s): e665513
dsf
app.py CHANGED
@@ -12,63 +12,65 @@ API_URL = "https://api-inference.huggingface.co/models/HuggingFaceH4/zephyr-7b-b
 headers = {"Authorization": f"Bearer {os.environ.get('API_KEY')}"}
 retrieval = Client("https://ishaan-mital-ncert-helper-vector-db.hf.space/--replicas/149bl5mjn/")
 
-embed_model_id = 'sentence-transformers/all-MiniLM-L6-v2'
-# device = f'cuda:{cuda.current_device()}' if cuda.is_available() else 'cpu'
+# embed_model_id = 'sentence-transformers/all-MiniLM-L6-v2'
+# # device = f'cuda:{cuda.current_device()}' if cuda.is_available() else 'cpu'
 
-embed_model = HuggingFaceEmbeddings(
-    model_name=embed_model_id,
-    # model_kwargs={'device': device},
-    # encode_kwargs={'device': device, 'batch_size': 32}
-)
+# embed_model = HuggingFaceEmbeddings(
+#     model_name=embed_model_id,
+#     # model_kwargs={'device': device},
+#     # encode_kwargs={'device': device, 'batch_size': 32}
+# )
 
 
-pinecone.init(
-    api_key=os.environ.get('PINECONE_API_KEY'),
-    environment=os.environ.get('PINECONE_ENVIRONMENT')
-)
+# pinecone.init(
+#     api_key=os.environ.get('PINECONE_API_KEY'),
+#     environment=os.environ.get('PINECONE_ENVIRONMENT')
+# )
 
-index_name = 'llama-rag'
-index = pinecone.Index(index_name)
-text_field = 'text'  # field in metadata that contains text content
-docs = [
-    "this is one document",
-    "and another document"
-]
+# index_name = 'llama-rag'
+# index = pinecone.Index(index_name)
+# text_field = 'text'  # field in metadata that contains text content
+# docs = [
+#     "this is one document",
+#     "and another document"
+# ]
 
-embeddings = embed_model.embed_documents(docs)
-if index_name not in pinecone.list_indexes():
-    pinecone.create_index(
-        index_name,
-        dimension=len(embeddings[0]),
-        metric='cosine'
-    )
-    # wait for index to finish initialization
-    while not pinecone.describe_index(index_name).status['ready']:
-        time.sleep(1)
-vectorstore = Pinecone(
-    index, embed_model.embed_query, text_field
-)
+# embeddings = embed_model.embed_documents(docs)
+# if index_name not in pinecone.list_indexes():
+#     pinecone.create_index(
+#         index_name,
+#         dimension=len(embeddings[0]),
+#         metric='cosine'
+#     )
+#     # wait for index to finish initialization
+#     while not pinecone.describe_index(index_name).status['ready']:
+#         time.sleep(1)
+# vectorstore = Pinecone(
+#     index, embed_model.embed_query, text_field
+# )
 
 def call_llm_api(input_text,context):
+    init_prompt ="## Instruction: You are an AI language model and must return truthful responses as per the information. Do not answer with any information which isn't completely verified and correct. Do not lie. Do not present information where you don't know the answer. Do not include incorrect extra information. Your name is NCERT Helper. You are a helpful and truthful chatbot. \n"
+    info="Information: \n"
     payload = {
-        "inputs":
+        "inputs": init_prompt + info + context + "\nQuestion: " + input_text + "\nAnswer:"
     }
     response = requests.post(API_URL, headers=headers, json=payload)
     return response.json()  # Adjust as needed based on your API response format
 
-rag_pipeline = RetrievalQA.from_chain_type(
-    llm=call_llm_api, chain_type='stuff',
-    retriever=vectorstore.as_retriever()
-)
+# rag_pipeline = RetrievalQA.from_chain_type(
+#     llm=call_llm_api, chain_type='stuff',
+#     retriever=vectorstore.as_retriever()
+# )
 
 
 def main(question):
     # return rag_pipeline(question)
-
-
-
-
-
+    global chatbot
+    context = retrieval.predict(question, api_name = "/predict")
+    answer=call_llm_api(question,context)
+    chatbot = answer
+    return answer
 
 demo = gr.Interface(main, inputs = "text", outputs = "text")
 
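The net effect of this commit: the Space no longer builds embeddings or a Pinecone index in-process. Retrieval is delegated to the separate vector-DB Space via `gradio_client`, and the answer is generated by prompting the Inference API directly instead of going through LangChain's `RetrievalQA`. Below is a minimal sketch of the resulting request flow, not the committed code itself. It assumes the full model id is `HuggingFaceH4/zephyr-7b-beta` (the hunk header truncates it at `zephyr-7b-b`) and that the Inference API returns the usual `[{"generated_text": ...}]` list for text generation; the commit leaves parsing at `response.json()`, so adjust to the actual response shape.

```python
import os
import requests
from gradio_client import Client

# Assumed full model id; the diff's hunk header truncates it at "zephyr-7b-b".
API_URL = "https://api-inference.huggingface.co/models/HuggingFaceH4/zephyr-7b-beta"
headers = {"Authorization": f"Bearer {os.environ.get('API_KEY')}"}

# Retrieval is served by a separate Space instead of a local Pinecone index.
retrieval = Client("https://ishaan-mital-ncert-helper-vector-db.hf.space/--replicas/149bl5mjn/")

def ask(question: str) -> str:
    # 1. Fetch supporting context from the remote vector-DB Space.
    context = retrieval.predict(question, api_name="/predict")
    # 2. Build the prompt by hand, mirroring call_llm_api in the commit
    #    (instruction text abbreviated here).
    prompt = (
        "## Instruction: ... Your name is NCERT Helper. "
        "You are a helpful and truthful chatbot. \n"
        "Information: \n" + context
        + "\nQuestion: " + question + "\nAnswer:"
    )
    # 3. Call the hosted model directly over the Inference API.
    response = requests.post(API_URL, headers=headers, json={"inputs": prompt})
    data = response.json()
    # Assumed text-generation response shape; adjust if the API differs.
    return data[0]["generated_text"] if isinstance(data, list) else str(data)
```

Keeping the index in a dedicated Space means this app only needs `requests` and `gradio_client` at runtime; the commented-out blocks preserve the old in-process embedding and Pinecone pipeline in case it is restored later.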