Deploy PyCaret model baseline_dt_20250426_212853.pkl
README.md
CHANGED
@@ -1,10 +1,14 @@
 ---
-title:
-emoji:
-colorFrom:
-colorTo:
-sdk:
+title: my-pycaret-app
+emoji: π
+colorFrom: blue
+colorTo: green
+sdk: streamlit
+app_file: app.py
 pinned: false
 ---
 
-
+# my-pycaret-app
+
+Simple prediction app deployed using Streamlit. Model file: `model.pkl`.
+Check `requirements.txt` for dependencies.
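The frontmatter above selects the Streamlit SDK and points it at `app.py`, so the Space starts the app automatically; locally the equivalent is `streamlit run app.py`. Before deploying, the committed model artifact can be smoke-tested on its own. A minimal sketch, assuming PyCaret 3.x is installed and `model.pkl` sits in the working directory (PyCaret's `load_model` takes the file name without the `.pkl` extension):

```python
# Hypothetical local smoke test; not part of the Space itself.
from pycaret.classification import load_model

model = load_model("model")   # loads ./model.pkl, including any saved preprocessing pipeline
print(type(model))            # confirms the pickled pipeline/estimator deserialized correctly
```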
app.py
ADDED
@@ -0,0 +1,169 @@
import streamlit as st
import pandas as pd
from pycaret.classification import load_model, predict_model
import os
import warnings  # Available to suppress noisy warnings if needed
import logging   # Used for debugging via the Space logs

# Configure simple logging for the Streamlit app.
# Use the Streamlit logger if available, otherwise fall back to basic config.
try:
    # Attempt to get the logger specific to the Streamlit context
    logger = st.logger.get_logger(__name__)
except AttributeError:  # Fallback for older Streamlit versions or other contexts
    logging.basicConfig(level=logging.INFO, format='%(asctime)s - StreamlitApp - %(levelname)s - %(message)s')
    logger = logging.getLogger(__name__)


# --- Configuration ---
MODEL_FILE = "model.pkl"  # Relative path within the Space
APP_TITLE = "my-pycaret-app"

# --- App Layout ---
# set_page_config must be the first Streamlit call in the script,
# so it runs before the cached model loader can render any elements.
st.set_page_config(page_title=APP_TITLE, layout="centered")


# --- Load Model ---
# cache_resource loads the model once and reuses it across reruns and sessions.
@st.cache_resource
def get_model():
    logger.info(f"Attempting to load model from file: {MODEL_FILE}")
    # PyCaret's load_model expects the path without the .pkl extension
    model_load_path = MODEL_FILE.replace('.pkl', '')
    logger.info(f"Calculated PyCaret load path: '{model_load_path}'")

    if not os.path.exists(MODEL_FILE):
        st.error(f"Model file '{MODEL_FILE}' not found in the Space repository.")
        logger.error(f"Model file '{MODEL_FILE}' not found at expected path.")
        return None
    try:
        # Suppress specific warnings during loading if needed:
        # warnings.filterwarnings("ignore", category=UserWarning, message=".*Trying to unpickle estimator.*")
        logger.info(f"Calling PyCaret's load_model('{model_load_path}')...")
        # Ensure PyCaret logging doesn't interfere excessively if needed:
        # from pycaret.utils.generic import enable_colab
        # enable_colab()  # May help manage output/logging in some environments
        model = load_model(model_load_path)
        logger.info("PyCaret's load_model executed successfully.")
        return model
    except FileNotFoundError:
        # load_model itself could not find related files (e.g. the preprocessing pipeline)
        st.error(f"Error loading model components for '{model_load_path}'. PyCaret's load_model failed, possibly due to missing auxiliary files.")
        logger.exception(f"PyCaret load_model failed for '{model_load_path}', likely due to missing components:")
        return None
    except Exception as e:
        # Catch any other error during model loading
        st.error(f"An unexpected error occurred while loading model '{model_load_path}': {e}")
        logger.exception("Unexpected model loading error details:")  # Log full traceback
        return None


model = get_model()

st.title(APP_TITLE)

if model is None:
    st.error("Model could not be loaded. Please check the application logs in the Space settings for details. The application cannot proceed.")
else:
    st.success("Model loaded successfully!")
    st.write("Enter the input features below to get a prediction.")

    # --- Input Widgets ---
    with st.form("prediction_form"):
        st.subheader("Input Features:")
        # Widgets generated from the model's input schema
        input_PassengerId = st.number_input(label='PassengerId', format='%f', key='input_PassengerId')
        input_Pclass = st.number_input(label='Pclass', format='%f', key='input_Pclass')
        input_Name = st.number_input(label='Name', format='%f', key='input_Name')
        input_Sex = st.number_input(label='Sex', format='%f', key='input_Sex')
        input_Age = st.number_input(label='Age', format='%f', key='input_Age')
        input_SibSp = st.number_input(label='SibSp', format='%f', key='input_SibSp')
        input_Parch = st.number_input(label='Parch', format='%f', key='input_Parch')
        input_Ticket = st.number_input(label='Ticket', format='%f', key='input_Ticket')
        input_Fare = st.number_input(label='Fare', format='%f', key='input_Fare')
        input_Cabin = st.number_input(label='Cabin', format='%f', key='input_Cabin')
        input_Embarked = st.number_input(label='Embarked', format='%f', key='input_Embarked')
        input_Survived = st.number_input(label='Survived', format='%f', key='input_Survived')
        submitted = st.form_submit_button("Predict")

    # --- Prediction Logic ---
    if submitted:
        try:
            # Build a one-row DataFrame from the form inputs, keyed by the original feature names
            input_data_dict = {
                'PassengerId': input_PassengerId, 'Pclass': input_Pclass, 'Name': input_Name,
                'Sex': input_Sex, 'Age': input_Age, 'SibSp': input_SibSp, 'Parch': input_Parch,
                'Ticket': input_Ticket, 'Fare': input_Fare, 'Cabin': input_Cabin,
                'Embarked': input_Embarked, 'Survived': input_Survived,
            }
            logger.info(f"Raw input data from form: {input_data_dict}")
            input_data = pd.DataFrame([input_data_dict])

            # Coerce dtypes according to the feature schema before prediction
            logger.info("Applying dtypes based on schema...")
            schema = {
                'PassengerId': 'numerical', 'Pclass': 'numerical', 'Name': 'numerical',
                'Sex': 'numerical', 'Age': 'numerical', 'SibSp': 'numerical',
                'Parch': 'numerical', 'Ticket': 'numerical', 'Fare': 'numerical',
                'Cabin': 'numerical', 'Embarked': 'numerical', 'Survived': 'numerical',
            }
            for feature, f_type in schema.items():
                if feature in input_data.columns:  # Check if the feature exists
                    try:
                        if f_type == 'numerical':
                            # Convert to numeric, coercing errors (users might enter text)
                            input_data[feature] = pd.to_numeric(input_data[feature], errors='coerce')
                        # Add elif branches for 'categorical' or other types if needed, e.g.:
                        # else:
                        #     input_data[feature] = input_data[feature].astype(str)
                    except Exception as type_e:
                        logger.warning(f"Could not convert feature '{feature}' to type '{f_type}'. Error: {type_e}")
                        # Fall back to a missing value if conversion fails
                        input_data[feature] = pd.NA
                else:
                    logger.warning(f"Feature '{feature}' from schema not found in input form data.")

            # Handle potential NaN values from coercion or failed conversion
            if input_data.isnull().values.any():
                st.warning("Some inputs might be invalid or missing. Replacing missing values with 0.")
                logger.warning(f"NaN values found in input data after type conversion/validation. Filling with 0. Data before fill:\n{input_data}")
                # A more robust imputation strategy may be needed depending on the model
                input_data.fillna(0, inplace=True)
                logger.info(f"Data after filling NaN with 0:\n{input_data}")

            st.write("Input Data for Prediction (after processing):")
            st.dataframe(input_data)

            # Make prediction
            logger.info("Calling predict_model...")
            with st.spinner("Predicting..."):
                # Suppress prediction warnings if needed:
                # with warnings.catch_warnings():
                #     warnings.simplefilter("ignore")
                predictions = predict_model(model, data=input_data)
            logger.info("Prediction successful.")

            st.subheader("Prediction Result:")
            logger.info(f"Prediction output columns: {predictions.columns.tolist()}")

            # Display the relevant prediction columns (adjust based on the PyCaret task).
            # Common columns: 'prediction_label', 'prediction_score'
            pred_col_label = 'prediction_label'
            pred_col_score = 'prediction_score'

            if pred_col_label in predictions.columns:
                st.success(f"Predicted Label: **{predictions[pred_col_label].iloc[0]}**")
            elif pred_col_score in predictions.columns:  # Show the score if no label is present (e.g. regression)
                st.success(f"Prediction Score: **{predictions[pred_col_score].iloc[0]:.4f}**")
            else:
                # Fallback: display the last column if the expected ones aren't found
                try:
                    last_col_name = predictions.columns[-1]
                    st.info(f"Prediction Output (Column: '{last_col_name}'): **{predictions[last_col_name].iloc[0]}**")
                    logger.warning(f"Could not find 'prediction_label' or 'prediction_score'. Displaying last column: '{last_col_name}'")
                except IndexError:
                    st.error("Prediction result DataFrame is empty.")
                    logger.error("Prediction result DataFrame is empty.")

            # Optionally show the full prediction output
            with st.expander("See Full Prediction Output DataFrame"):
                st.dataframe(predictions)

        except Exception as e:
            st.error(f"An error occurred during prediction: {e}")
            logger.exception("Prediction error details:")  # Log full traceback
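The display logic above branches on the `prediction_label` and `prediction_score` columns that PyCaret appends to its output. To inspect those columns outside Streamlit, the same model can be queried directly. A minimal sketch, assuming PyCaret 3.x; the feature values are placeholders, since the encoding of fields like `Sex` or `Embarked` depends on how the original training data was prepared:

```python
import pandas as pd
from pycaret.classification import load_model, predict_model

model = load_model("model")  # loads ./model.pkl

# One-row frame using the same feature names the form collects; values are placeholders.
row = pd.DataFrame([{
    'PassengerId': 1.0, 'Pclass': 3.0, 'Name': 0.0, 'Sex': 0.0, 'Age': 22.0,
    'SibSp': 1.0, 'Parch': 0.0, 'Ticket': 0.0, 'Fare': 7.25, 'Cabin': 0.0,
    'Embarked': 0.0, 'Survived': 0.0,
}])

preds = predict_model(model, data=row)
print(preds.columns.tolist())  # PyCaret 3.x classification output typically ends with
                               # 'prediction_label' and 'prediction_score'
print(preds.iloc[0])
```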
model.pkl
ADDED
@@ -0,0 +1,3 @@
version https://git-lfs.github.com/spec/v1
oid sha256:d027abd627a584c17c7db89b3f348f88612ed2dddd9f2e6085f45dab538e777c
size 126186
requirements.txt
ADDED
@@ -0,0 +1,7 @@
streamlit>=1.20.0  # Pin a reasonably recent Streamlit version
pycaret[full]==3.3.2
pandas>=1.5.0  # Pin a reasonably recent pandas version
scikit-learn  # Needed by PyCaret under the hood; keep it compatible with the pinned PyCaret version
python-dotenv  # Only needed if the app reads a .env file itself; typically unnecessary in a deployed Space
# Add any other dependencies your model needs here
# Example: numpy, joblib, etc.