Spaces:

ramalMr
/

data_gen

Sleeping

ramalMr committed on Apr 1, 2024

Commit

5b06a47

verified ·

1 Parent(s): 17f5007

Update app.py

Files changed (1) hide show

app.py CHANGED Viewed

@@ -58,8 +58,10 @@ def generate(file, temperature, max_new_tokens, top_p, repetition_penalty):
             save_to_csv(sentence, f"Error: {e}")
     # CSV dosyasını okuyup byte olarak döndür
-    with open("synthetic_data.csv", "rb") as file:
-        return file.read()
 gr.Interface(
     fn=generate,
     inputs=[
@@ -69,7 +71,7 @@ gr.Interface(
         gr.Slider(label="Top-p (nucleus sampling)", value=0.95, minimum=0.0, maximum=1, step=0.05, interactive=True, info="Higher values sample more low-probability tokens"),
         gr.Slider(label="Repetition penalty", value=1.0, minimum=1.0, maximum=2.0, step=0.1, interactive=True, info="Penalize repeated tokens"),
     ],
-    outputs=gr.File(label="Download Synthetic Data CSV"),
     title="Synthetic Data Generation",
     description="This tool generates synthetic data from the sentences in your PDF and saves it to a CSV file.",
     allow_flagging="never",

             save_to_csv(sentence, f"Error: {e}")
     # CSV dosyasını okuyup byte olarak döndür
+    with open("synthetic_data.csv", "r", encoding="utf-8") as file:
+        csv_content = file.read()
+    csv_bytes = csv_content.encode()
+    return io.BytesIO(csv_bytes)
 gr.Interface(
     fn=generate,
     inputs=[
         gr.Slider(label="Top-p (nucleus sampling)", value=0.95, minimum=0.0, maximum=1, step=0.05, interactive=True, info="Higher values sample more low-probability tokens"),
         gr.Slider(label="Repetition penalty", value=1.0, minimum=1.0, maximum=2.0, step=0.1, interactive=True, info="Penalize repeated tokens"),
     ],
+    outputs=gr.File(label="Synthetic Data CSV"),
     title="Synthetic Data Generation",
     description="This tool generates synthetic data from the sentences in your PDF and saves it to a CSV file.",
     allow_flagging="never",