Spaces:

mgbam
/

sythenticdata

Sleeping

App Files Files Community

mgbam committed on Feb 9

Commit

45e7a79

verified ·

1 Parent(s): 945d7f4

Update app.py

Browse files

Files changed (1) hide show

app.py +27 -11

app.py CHANGED Viewed

@@ -7,7 +7,7 @@ import pandas as pd
 import sqlalchemy
 from typing import Any, Dict, List
-# Provider clients – ensure these libraries are installed
 try:
     from openai import OpenAI
 except ImportError:
@@ -34,7 +34,7 @@ class QADataGenerator:
         self._setup_input_handlers()
         self._initialize_session_state()
         # This prompt instructs the LLM to generate a configurable number of Q&A pairs.
-        # Note: Literal curly braces for the example are escaped with double braces.
         self.custom_prompt_template = (
             "You are an expert in extracting question and answer pairs from documents. "
             "Generate {num_pairs} Q&A pairs from the following data, formatted as a JSON list of dictionaries. "
@@ -87,12 +87,13 @@ class QADataGenerator:
                 "provider": "OpenAI",
                 "model": "gpt-4-turbo",
                 "temperature": DEFAULT_TEMPERATURE,
-                "num_pairs": 3,  # Default to 3 Q&A pairs
             },
             "api_key": "",
             "inputs": [],       # List to store input sources
-            "qa_pairs": "",     # Generated Q&A pairs output
             "error_logs": [],   # To store any error messages
         }
         for key, value in defaults.items():
             if key not in st.session_state:
@@ -198,6 +199,7 @@ class QADataGenerator:
             st.write("### Raw API Response")
             st.write(response)
             qa_pairs = self._parse_response(response, provider_name)
             st.write("### Parsed Q&A Pairs")
@@ -245,7 +247,7 @@ class QADataGenerator:
         """
         Parse the LLM response and return a list of Q&A pairs.
         Expects the response to be in a JSON-like format.
-        If JSON parsing fails (e.g. due to single quotes), fall back to ast.literal_eval.
         """
         st.write("Parsing response for provider:", provider)
         try:
@@ -303,8 +305,8 @@ def config_ui(generator: QADataGenerator):
         temperature = st.slider("Temperature", 0.0, 1.0, DEFAULT_TEMPERATURE)
         st.session_state.config["temperature"] = temperature
-        # New: Number of Q&A pairs
-        num_pairs = st.number_input("Number of Q&A Pairs", min_value=1, max_value=20, value=3, step=1)
         st.session_state.config["num_pairs"] = num_pairs
         api_key = st.text_input(f"{provider} API Key", type="password")
@@ -357,13 +359,27 @@ def input_ui(generator: QADataGenerator):
             st.success("Database input added!")
 def output_ui(generator: QADataGenerator):
-    """Display the generated Q&A pairs and provide a download option."""
     st.subheader("Q&A Pairs Output")
     if st.session_state.qa_pairs:
-        st.write("### Generated Q&A Pairs")
-        st.write(st.session_state.qa_pairs)
         st.download_button(
-            "Download Output",
             json.dumps(st.session_state.qa_pairs, indent=2),
             file_name="qa_pairs.json",
             mime="application/json"

 import sqlalchemy
 from typing import Any, Dict, List
+# Provider clients – ensure these libraries are installed if needed.
 try:
     from openai import OpenAI
 except ImportError:
         self._setup_input_handlers()
         self._initialize_session_state()
         # This prompt instructs the LLM to generate a configurable number of Q&A pairs.
+        # Note: Literal curly braces in the example are escaped with double braces.
         self.custom_prompt_template = (
             "You are an expert in extracting question and answer pairs from documents. "
             "Generate {num_pairs} Q&A pairs from the following data, formatted as a JSON list of dictionaries. "
                 "provider": "OpenAI",
                 "model": "gpt-4-turbo",
                 "temperature": DEFAULT_TEMPERATURE,
+                "num_pairs": 3,  # Default number of Q&A pairs; can be increased
             },
             "api_key": "",
             "inputs": [],       # List to store input sources
+            "qa_pairs": [],     # Generated Q&A pairs output
             "error_logs": [],   # To store any error messages
+            "raw_response": "", # Store raw API response (if needed)
         }
         for key, value in defaults.items():
             if key not in st.session_state:
             st.write("### Raw API Response")
             st.write(response)
+            st.session_state.raw_response = response
             qa_pairs = self._parse_response(response, provider_name)
             st.write("### Parsed Q&A Pairs")
         """
         Parse the LLM response and return a list of Q&A pairs.
         Expects the response to be in a JSON-like format.
+        If JSON parsing fails (e.g. due to single quotes), falls back to ast.literal_eval.
         """
         st.write("Parsing response for provider:", provider)
         try:
         temperature = st.slider("Temperature", 0.0, 1.0, DEFAULT_TEMPERATURE)
         st.session_state.config["temperature"] = temperature
+        # New: Number of Q&A pairs (allow up to 50)
+        num_pairs = st.number_input("Number of Q&A Pairs", min_value=1, max_value=50, value=3, step=1)
         st.session_state.config["num_pairs"] = num_pairs
         api_key = st.text_input(f"{provider} API Key", type="password")
             st.success("Database input added!")
 def output_ui(generator: QADataGenerator):
+    """Display the generated Q&A pairs in a readable table and provide download options."""
     st.subheader("Q&A Pairs Output")
     if st.session_state.qa_pairs:
+        st.write("### Generated Q&A Pairs (Table)")
+        try:
+            df = pd.DataFrame(st.session_state.qa_pairs)
+            st.dataframe(df)
+            csv_data = df.to_csv(index=False).encode("utf-8")
+        except Exception as e:
+            st.write("Could not convert output to table format, displaying raw output.")
+            csv_data = json.dumps(st.session_state.qa_pairs, indent=2).encode("utf-8")
+            st.write(st.session_state.qa_pairs)
+        st.download_button(
+            "Download as CSV",
+            csv_data,
+            file_name="qa_pairs.csv",
+            mime="text/csv"
+        )
         st.download_button(
+            "Download as JSON",
             json.dumps(st.session_state.qa_pairs, indent=2),
             file_name="qa_pairs.json",
             mime="application/json"