Spaces:

steviel
/

ICML2025

Sleeping

App Files Community

stefanoviel committed on Jul 9

Commit

b1a742b

1 Parent(s): 3c2ac96

removing useless st print

Browse files

Files changed (1) hide show

src/streamlit_app.py +7 -7

src/streamlit_app.py CHANGED Viewed

@@ -33,7 +33,7 @@ def create_and_save_embeddings(model, data_df):
     Generates and saves document embeddings and the dataframe.
     This function is called only once if the files don't exist.
     """
-    st.info("First time setup: Generating and saving embeddings. This may take a moment...")
     # Combine title and abstract for richer embeddings
     data_df['text_to_embed'] = data_df['title'] + ". " + data_df['abstract'].fillna('')
@@ -44,9 +44,9 @@ def create_and_save_embeddings(model, data_df):
     try:
         torch.save(corpus_embeddings.cpu(), EMBEDDINGS_FILE)
         data_df.to_pickle(DATA_FILE)
-        st.success("Embeddings and data saved successfully!")
     except Exception as e:
-        st.warning(f"Could not save embeddings to disk: {e}. Will regenerate on each session.")
     return corpus_embeddings, data_df
@@ -65,19 +65,19 @@ def load_data_and_embeddings():
             data_df = pd.read_pickle(DATA_FILE)
             return model, corpus_embeddings, data_df
         except Exception as e:
-            st.warning(f"Could not load saved embeddings: {e}. Regenerating...")
-    st.info("embeding model path exists: " + str(Path(EMBEDDING_MODEL).exists()))
     # Load the raw data from CSV
     try:
         data_df = pd.read_csv(CSV_FILE)
         corpus_embeddings, data_df = create_and_save_embeddings(model, data_df)
     except FileNotFoundError:
-        st.error(f"CSV file '{CSV_FILE}' not found. Please ensure it's in your repository.")
         st.stop()
     except Exception as e:
-        st.error(f"Error loading data: {e}")
         st.stop()
     return model, corpus_embeddings, data_df

     Generates and saves document embeddings and the dataframe.
     This function is called only once if the files don't exist.
     """
+    print("First time setup: Generating and saving embeddings. This may take a moment...")
     # Combine title and abstract for richer embeddings
     data_df['text_to_embed'] = data_df['title'] + ". " + data_df['abstract'].fillna('')
     try:
         torch.save(corpus_embeddings.cpu(), EMBEDDINGS_FILE)
         data_df.to_pickle(DATA_FILE)
+        print("Embeddings and data saved successfully!")
     except Exception as e:
+        print(f"Could not save embeddings to disk: {e}. Will regenerate on each session.")
     return corpus_embeddings, data_df
             data_df = pd.read_pickle(DATA_FILE)
             return model, corpus_embeddings, data_df
         except Exception as e:
+            print(f"Could not load saved embeddings: {e}. Regenerating...")
+    print("embeding model path exists: " + str(Path(EMBEDDING_MODEL).exists()))
     # Load the raw data from CSV
     try:
         data_df = pd.read_csv(CSV_FILE)
         corpus_embeddings, data_df = create_and_save_embeddings(model, data_df)
     except FileNotFoundError:
+        print(f"CSV file '{CSV_FILE}' not found. Please ensure it's in your repository.")
         st.stop()
     except Exception as e:
+        print(f"Error loading data: {e}")
         st.stop()
     return model, corpus_embeddings, data_df