fix bug in summary generation
appStore/rag.py  CHANGED  +32 -18
@@ -58,26 +58,40 @@ def run_query(context, label, model_sel_name):
     # Initialize the client, pointing it to one of the available models
     client = InferenceClient(model_sel_name, token=hf_token)
 
-    # Instantiate ChatCompletion as a generator object (stream is set to True)
-    chat_completion = client.chat.completions.create(
-        messages=messages,
-        stream=True
-    )
+    # # Instantiate ChatCompletion as a generator object (stream is set to True)
+    # chat_completion = client.chat.completions.create(
+    #     messages=messages,
+    #     stream=True
+    # )
+
+    # # Create an object to store the full chat completion
+    # completion_result = ChatCompletionResult()
+    # res_box = st.empty()
+
+    # # Iterate through the streamed output
+    # for chunk in chat_completion:
+    #     # Extract the object containing the text
+    #     if chunk.choices is not None:
+    #         chunk_message = chunk.choices[0].delta
+    #         if 'content' in chunk_message:
+    #             completion_result.add_content(chunk_message['content']) # Store the message
+    #             # Add the latest text and merge it with all previous
+    #             result = completion_result.get_full_content()
+    #             res_box.success(result) # Output to response text box
+
+
+    # Use streaming text generation
+    response_stream = client.text_generation(prompt, stream=True, max_new_tokens=512)
 
-    # Create an object to store the full chat completion
     completion_result = ChatCompletionResult()
     res_box = st.empty()
 
-    # Iterate through the streamed output
-    for chunk in chat_completion:
-        # Extract the object containing the text
-        if chunk.choices is not None:
-            chunk_message = chunk.choices[0].delta
-            if 'content' in chunk_message:
-                completion_result.add_content(chunk_message['content']) # Store the message
-                # Add the latest text and merge it with all previous
-                result = completion_result.get_full_content()
-                res_box.success(result) # Output to response text box
-
-    # Return the stored chat completion object for later use
+    for chunk in response_stream:
+        completion_result.add_content(chunk)
+        result = completion_result.get_full_content()
+        res_box.success(result)
+
     return completion_result
+
+    # # Return the stored chat completion object for later use
+    # return completion_result