Standard_Intelligence_Dev

Sleeping

heymenn committed on Apr 12, 2024

Commit

561f923

verified ·

1 Parent(s): 103847d

Update scrape_3gpp.py

Files changed (1) hide show

scrape_3gpp.py CHANGED Viewed

@@ -71,21 +71,17 @@ import gradio as gr
 def scrape(url, excel_file, folder_name, status_list, sorted_files, progress=gr.Progress()):
-    print("ENTERING SCRAPE FUNCTION")
     filenames = []
     status_filenames = []
     df = pd.DataFrame()  # Initialize df to ensure it's always defined
     # Try to process the Excel file if provided and valid
-    print(f"WE ARE TESTING IF OS.PATH.EXISTS WITH THIS FILE : {excel_file}")
     if excel_file and os.path.exists(excel_file):
         try:
             df = pd.read_excel(excel_file)
             print(f"Initial DataFrame size: {len(df)}")
-            print(f"WE ARE TRYING TO LOOK AT status_list : {status_list}")
-            print(f"WE ARE TRYING TO LOOK AT df.columns : {df.columns.tolist()}")
             if 'TDoc Status' in df.columns and status_list:
                 df = df[df['TDoc Status'].isin(status_list)]
                 print(f"Filtered DataFrame size: {len(df)}")

 def scrape(url, excel_file, folder_name, status_list, sorted_files, progress=gr.Progress()):
     filenames = []
     status_filenames = []
     df = pd.DataFrame()  # Initialize df to ensure it's always defined
     # Try to process the Excel file if provided and valid
     if excel_file and os.path.exists(excel_file):
         try:
             df = pd.read_excel(excel_file)
             print(f"Initial DataFrame size: {len(df)}")
             if 'TDoc Status' in df.columns and status_list:
                 df = df[df['TDoc Status'].isin(status_list)]
                 print(f"Filtered DataFrame size: {len(df)}")