gradio-fastapi-static-server_testing

Build error

App Files Files Community

m7n committed on Oct 10, 2024

Commit

1951cf0

verified ·

1 Parent(s): 2261de4

Update app.py

Browse files

Added a sample reduction method dropdown and the logic for it; set the "Run Query" button to the primary variant.

Files changed (1) hide show

app.py +20 -8

app.py CHANGED Viewed

@@ -239,7 +239,7 @@ print(f"Language model is set up: {time.strftime('%Y-%m-%d %H:%M:%S')}")
-def predict(text_input, sample_size_slider, reduce_sample_checkbox, progress=gr.Progress()):
     print('getting data to project')
     progress(0, desc="Starting...")
@@ -259,6 +259,7 @@ def predict(text_input, sample_size_slider, reduce_sample_checkbox, progress=gr.
     records_df = pd.DataFrame(records)
     records_df['abstract'] = [invert_abstract(t) for t in records_df['abstract_inverted_index']]
@@ -271,11 +272,18 @@ def predict(text_input, sample_size_slider, reduce_sample_checkbox, progress=gr.
     if reduce_sample_checkbox:
-        records_df = records_df.sample(sample_size_slider)
     print(records_df)
     progress(0.3, desc="Embedding Data...")
     texts_to_embedd = [title + tokenizer.sep_token + publication + tokenizer.sep_token  + abstract for title, publication, abstract in zip(records_df['title'],records_df['parsed_publication'], records_df['abstract'])]
@@ -422,14 +430,18 @@ with gr.Blocks() as block:
 #    You're a philosopher of science who wonders where the concept of a fitness landscape has appeared...
     with gr.Column():
-        text_input = gr.Textbox(label="OpenAlex Fulltext-Search")
-        sample_size_slider = gr.Slider(label="Sample Size", minimum=10, maximum=20000, step=10, value=1000)
-        reduce_sample_checkbox = gr.Checkbox(label="Reduce Sample Size", value=True)
-        new_btn = gr.Button("Run Query")
         markdown = gr.Markdown(label="")
         html = gr.HTML(label="HTML preview", show_label=True)
-    new_btn.click(fn=predict, inputs=[text_input, sample_size_slider, reduce_sample_checkbox], outputs=[markdown, html])

+def predict(text_input, sample_size_slider, reduce_sample_checkbox,sample_reduction_method, progress=gr.Progress()):
     print('getting data to project')
     progress(0, desc="Starting...")
     records_df = pd.DataFrame(records)
     records_df['abstract'] = [invert_abstract(t) for t in records_df['abstract_inverted_index']]
     if reduce_sample_checkbox:
+        sample_size = min(sample_size_slider, len(records_df))
+        if sample_reduction_method == "Random":
+            records_df = records_df.sample(sample_size)
+        elif sample_reduction_method == "Order of Results":
+            records_df = records_df.iloc[:sample_size]
     print(records_df)
     progress(0.3, desc="Embedding Data...")
     texts_to_embedd = [title + tokenizer.sep_token + publication + tokenizer.sep_token  + abstract for title, publication, abstract in zip(records_df['title'],records_df['parsed_publication'], records_df['abstract'])]
 #    You're a philosopher of science who wonders where the concept of a fitness landscape has appeared...
     with gr.Column():
+        text_input = gr.Textbox(label="OpenAlex-search URL")
+        with gr.Row():
+            reduce_sample_checkbox = gr.Checkbox(label="Reduce Sample Size", value=True, info="Reduce sample size.")
+            sample_size_slider = gr.Slider(label="Sample Size", minimum=10, maximum=20000, step=10, value=1000, info="How many samples to keep.")
+            sample_reduction_method = gr.Dropdown(["Order of Results", "Random"], label="Order of Results", info="How to choose the samples to keep.")
+        new_btn = gr.Button("Run Query",variant='primary')
         markdown = gr.Markdown(label="")
         html = gr.HTML(label="HTML preview", show_label=True)
+    new_btn.click(fn=predict, inputs=[text_input, sample_size_slider, reduce_sample_checkbox,sample_reduction_method], outputs=[markdown, html])