Spaces:

Aliou12
/

streamlit-app

Sleeping

App Files Community

Aliou12 committed on Jan 31

Commit

edbe41b

1 Parent(s): 9747b16

new update

Browse files

Files changed (1) hide show

app.py +7 -6

app.py CHANGED Viewed

@@ -30,6 +30,7 @@ if uploaded_file is not None:
     # ✅ Convertir en catégories
     data['Product_line'] = data['Product_line'].astype('category')
     data['Payment'] = data['Payment'].astype('category')
     # 📌 Afficher un aperçu des données
     st.subheader("📊 Aperçu des Données")
@@ -46,7 +47,7 @@ if uploaded_file is not None:
     residuals = model.resid
     if len(residuals) > 5000:
-        residuals_sample = residuals.sample(5000, random_state=42)
     else:
         residuals_sample = residuals
@@ -72,11 +73,11 @@ if uploaded_file is not None:
     st.subheader("📌 Comparaisons Post-Hoc (Tukey HSD)")
-    if np.issubdtype(data['Rating'].dtype, np.number):
         tukey = pairwise_tukeyhsd(data['Rating'], data['Product_line'])
         st.write(tukey.summary())
     else:
-        st.error("Erreur : La colonne 'Rating' doit être numérique pour le test de Tukey.")
     # ============================
     # 📊 Visualisation des Résultats
@@ -91,7 +92,7 @@ if uploaded_file is not None:
     st.pyplot(fig)
     # 🔹 Heatmap des Moyennes des Évaluations
-    mean_ratings = data.groupby(['Product_line', 'Payment'])['Rating'].mean().unstack()
     fig, ax = plt.subplots(figsize=(8, 5))
     sns.heatmap(mean_ratings, annot=True, cmap='coolwarm', ax=ax)
     st.pyplot(fig)
@@ -117,6 +118,6 @@ if uploaded_file is not None:
     # 🔹 Visualisation du Clustering
     fig, ax = plt.subplots(figsize=(8, 5))
-    sns.scatterplot(x='Product_line', y='Rating', hue=data['Cluster'].astype(str), palette='viridis', data=data, ax=ax)
-    plt.xticks(rotation=45)
     st.pyplot(fig)

     # ✅ Convertir en catégories
     data['Product_line'] = data['Product_line'].astype('category')
     data['Payment'] = data['Payment'].astype('category')
+    data['Rating'] = pd.to_numeric(data['Rating'], errors='coerce')  # Convertir en numérique
     # 📌 Afficher un aperçu des données
     st.subheader("📊 Aperçu des Données")
     residuals = model.resid
     if len(residuals) > 5000:
+        residuals_sample = pd.Series(residuals).sample(5000, random_state=42)
     else:
         residuals_sample = residuals
     st.subheader("📌 Comparaisons Post-Hoc (Tukey HSD)")
+    if data['Rating'].isna().sum() == 0:  # Vérifie qu'il n'y a pas de NaN
         tukey = pairwise_tukeyhsd(data['Rating'], data['Product_line'])
         st.write(tukey.summary())
     else:
+        st.error("Erreur : Des valeurs non numériques ont été détectées dans 'Rating'. Vérifiez votre fichier CSV.")
     # ============================
     # 📊 Visualisation des Résultats
     st.pyplot(fig)
     # 🔹 Heatmap des Moyennes des Évaluations
+    mean_ratings = data.groupby(['Product_line', 'Payment'])['Rating'].mean().unstack().fillna(0)
     fig, ax = plt.subplots(figsize=(8, 5))
     sns.heatmap(mean_ratings, annot=True, cmap='coolwarm', ax=ax)
     st.pyplot(fig)
     # 🔹 Visualisation du Clustering
     fig, ax = plt.subplots(figsize=(8, 5))
+    sns.scatterplot(x='Product_line_encoded', y='Rating', hue=data['Cluster'].astype(str), palette='viridis', data=data, ax=ax)
+    plt.xticks(ticks=range(len(encoder.classes_)), labels=encoder.classes_, rotation=45)
     st.pyplot(fig)