Spaces:

EAV123
/

Microbial_Susceptibility_Analyzer

Sleeping

App Files Community

EAV123 committed on May 19

Commit

1af97d1

verified ·

1 Parent(s): 5ae966a

Update app.py

Browse files

Files changed (1) hide show

app.py +109 -13

app.py CHANGED Viewed

@@ -117,11 +117,30 @@ elif page == "Susceptibility Analysis":
 # Data Upload Page
 elif page == "Data Upload":
     st.title("Batch Prediction: Upload CSV")
     uploaded_file = st.file_uploader("Upload your CSV file", type=["csv"])
     if uploaded_file:
         try:
             df = pd.read_csv(uploaded_file)
             st.write("Uploaded Data Preview:", df.head())
             # Validate the required columns
@@ -131,26 +150,103 @@ elif page == "Data Upload":
             if missing_columns:
                 st.error(f"The uploaded CSV is missing the following required columns: {', '.join(missing_columns)}")
             else:
                 # Process predictions
                 if st.button("Predict for Dataset"):
                     with st.spinner("Processing predictions..."):
-                        df["Prediction"] = df.apply(
-                            lambda row: predict_susceptibility(row.to_dict(), model, encoders)["Final Output"], axis=1
-                        )
                     st.success("Predictions complete!")
-                    st.write("Prediction Results:", df)
-                    # Optionally, download the results as a CSV
-                    csv = df.to_csv(index=False)
-                    st.download_button(
-                        label="Download Results as CSV",
-                        data=csv,
-                        file_name="predictions.csv",
-                        mime='text/csv'
-                    )
         except Exception as e:
-            st.error(f"Error reading the uploaded CSV file: {e}")
 # About Page
 elif page == "About":

 # Data Upload Page
 elif page == "Data Upload":
     st.title("Batch Prediction: Upload CSV")
+    # Add sample data download option
+    st.markdown("### Sample Data")
+    sample_data = pd.DataFrame({
+        'organism': ['Escherichia coli', 'Staphylococcus aureus', 'Pseudomonas aeruginosa'],
+        'antibiotic': ['Amoxicillin', 'Vancomycin', 'Ciprofloxacin'],
+        'was_positive': [1, 0, 1]
+    })
+    csv_sample = sample_data.to_csv(index=False)
+    st.download_button(
+        label="Download Sample CSV Template",
+        data=csv_sample,
+        file_name="sample_template.csv",
+        mime='text/csv'
+    )
     uploaded_file = st.file_uploader("Upload your CSV file", type=["csv"])
     if uploaded_file:
         try:
+            # Read the CSV file
             df = pd.read_csv(uploaded_file)
+            # Display preview with column check
             st.write("Uploaded Data Preview:", df.head())
             # Validate the required columns
             if missing_columns:
                 st.error(f"The uploaded CSV is missing the following required columns: {', '.join(missing_columns)}")
             else:
+                # Check data types and convert if necessary
+                if df['was_positive'].dtype != 'int64':
+                    try:
+                        df['was_positive'] = df['was_positive'].astype(int)
+                        st.info("Converted 'was_positive' column to integer type.")
+                    except ValueError:
+                        st.error("The 'was_positive' column must contain only 0 or 1 values.")
+                        st.stop()
+                # Validate organisms and antibiotics against encoders
+                invalid_organisms = [org for org in df['organism'].unique() if org not in encoders['organism']]
+                invalid_antibiotics = [ab for ab in df['antibiotic'].unique() if ab not in encoders['antibiotic']]
+                if invalid_organisms:
+                    st.warning(f"Found {len(invalid_organisms)} organisms not in the training data: {', '.join(invalid_organisms[:5])}{'...' if len(invalid_organisms) > 5 else ''}")
+                if invalid_antibiotics:
+                    st.warning(f"Found {len(invalid_antibiotics)} antibiotics not in the training data: {', '.join(invalid_antibiotics[:5])}{'...' if len(invalid_antibiotics) > 5 else ''}")
                 # Process predictions
                 if st.button("Predict for Dataset"):
                     with st.spinner("Processing predictions..."):
+                        # Create a progress bar
+                        progress_bar = st.progress(0)
+                        total_rows = len(df)
+                        # Initialize results columns
+                        df["Prediction"] = ""
+                        df["Rule Guidance"] = ""
+                        df["Model Prediction"] = ""
+                        df["Decision Reason"] = ""
+                        # Process each row with error handling
+                        for i, (index, row) in enumerate(df.iterrows()):
+                            try:
+                                # Skip rows with invalid data
+                                if (row['organism'] not in encoders['organism'] or
+                                    row['antibiotic'] not in encoders['antibiotic']):
+                                    df.at[index, "Prediction"] = "Invalid data"
+                                    continue
+                                # Get full prediction result
+                                result = predict_susceptibility(row.to_dict(), model, encoders)
+                                # Store all results
+                                if "Error" in result:
+                                    df.at[index, "Prediction"] = "Error: " + result["Error"]
+                                else:
+                                    df.at[index, "Prediction"] = result["Final Output"]
+                                    df.at[index, "Rule Guidance"] = result["Rule Guidance"]
+                                    df.at[index, "Model Prediction"] = result["Model Prediction"]
+                                    df.at[index, "Decision Reason"] = result["Decision Reason"]
+                            except Exception as e:
+                                df.at[index, "Prediction"] = f"Error: {str(e)}"
+                            # Update progress bar
+                            progress_bar.progress((i + 1) / total_rows)
                     st.success("Predictions complete!")
+                    # Display results with tabs for different views
+                    tab1, tab2 = st.tabs(["Basic Results", "Detailed Results"])
+                    with tab1:
+                        st.dataframe(df[['organism', 'antibiotic', 'was_positive', 'Prediction']])
+                    with tab2:
+                        st.dataframe(df)
+                    # Download options
+                    col1, col2 = st.columns(2)
+                    with col1:
+                        # Download basic results
+                        csv_basic = df[['organism', 'antibiotic', 'was_positive', 'Prediction']].to_csv(index=False)
+                        st.download_button(
+                            label="Download Basic Results",
+                            data=csv_basic,
+                            file_name="predictions_basic.csv",
+                            mime='text/csv'
+                        )
+                    with col2:
+                        # Download detailed results
+                        csv_detailed = df.to_csv(index=False)
+                        st.download_button(
+                            label="Download Detailed Results",
+                            data=csv_detailed,
+                            file_name="predictions_detailed.csv",
+                            mime='text/csv'
+                        )
+        except pd.errors.EmptyDataError:
+            st.error("The uploaded file is empty.")
+        except pd.errors.ParserError:
+            st.error("Error parsing the CSV file. Please ensure it's a valid CSV format.")
         except Exception as e:
+            st.error(f"An unexpected error occurred: {str(e)}")
 # About Page
 elif page == "About":