Spaces:

gufett0
/

chatbot-llamaindex

Sleeping

App Files Community

gufett0 committed on Sep 14, 2024

Commit

8238f47

1 Parent(s): 5c3431a

added text streamer

Browse files

Files changed (1) hide show

backend.py +3 -26

backend.py CHANGED Viewed

@@ -13,9 +13,6 @@ from llama_cpp import Llama
 import spaces
 from huggingface_hub import login
-from transformers import TextIteratorStreamer
-import threading
 huggingface_token = os.getenv("HUGGINGFACE_TOKEN")
 login(huggingface_token)
@@ -72,29 +69,9 @@ def handle_query(query_str, chathistory):
         ("user", qa_prompt_str),
     ]
     text_qa_template = ChatPromptTemplate.from_messages(chat_text_qa_msgs)
-    # Create the query engine
-    query_engine = index.as_query_engine(text_qa_template=text_qa_template)
-    try:
-        # Setup the TextIteratorStreamer for streaming the response
-        streamer = TextIteratorStreamer(tokenizer, skip_special_tokens=True)
-        # Create a thread to run the generation in the background
-        def generate_response():
-            query_engine.query(query_str, streamer=streamer)
-        generation_thread = threading.Thread(target=generate_response)
-        generation_thread.start()
-        # Stream tokens as they are generated
-        for new_text in streamer:
-            yield new_text
-    except Exception as e:
-        yield f"Error processing query: {str(e)}"
-"""    try:
-        result = index.as_query_engine(text_qa_template=text_qa_template).query(query_str)
         response_text = result.response
         # Remove any unwanted tokens like <end_of_turn>
@@ -102,7 +79,7 @@ def handle_query(query_str, chathistory):
         yield cleaned_result
     except Exception as e:
-        yield f"Error processing query: {str(e)}" """

 import spaces
 from huggingface_hub import login
 huggingface_token = os.getenv("HUGGINGFACE_TOKEN")
 login(huggingface_token)
         ("user", qa_prompt_str),
     ]
     text_qa_template = ChatPromptTemplate.from_messages(chat_text_qa_msgs)
+    try:
+        result = index.as_query_engine(text_qa_template=text_qa_template, streaming=True).query(query_str)
         response_text = result.response
         # Remove any unwanted tokens like <end_of_turn>
         yield cleaned_result
     except Exception as e:
+        yield f"Error processing query: {str(e)}"