Spaces:

KavinduHansaka
/

Toxic_Comment_Classifier

Sleeping

KavinduHansaka committed on May 15

Commit

4ad87c5

verified ·

1 Parent(s): e00c4c7

Update app.py

Files changed (1) hide show

app.py CHANGED Viewed

@@ -5,23 +5,38 @@ import pandas as pd
 # Load model once
 model = Detoxify('original')
 def classify_multiple(comments):
-    # Split input by newlines and clean
     comment_list = [c.strip() for c in comments.split('\n') if c.strip()]
     if not comment_list:
         return "Please enter at least one valid comment."
-    results = model.predict(comment_list)  # Returns a dict of lists
     df = pd.DataFrame(results, index=comment_list).round(4)
     return df
 iface = gr.Interface(
     fn=classify_multiple,
     inputs=gr.Textbox(lines=8, placeholder="Enter one or more comments, each on a new line..."),
-    outputs=gr.Dataframe(label="Toxicity Predictions"),
-    title="💬 Toxic Comment Classifier (Multi-Comment)",
-    description="Paste one or more comments. Each will be scored for toxicity, severe toxicity, insult, threat, obscene, and identity hate using Detoxify."
 )
 if __name__ == "__main__":

 # Build the Detoxify 'original' model once at module level so classify_multiple reuses the same instance
 model = Detoxify('original')
+# Cut-off used by classify_multiple: a comment is flagged when any of its scores is strictly greater than this
+TOXICITY_THRESHOLD = 0.7
 def classify_multiple(comments):
     """Score each non-empty input line for toxicity and flag risky ones.

     Args:
         comments: Raw text with one comment per line. Blank and
             whitespace-only lines are ignored; ``None`` is treated as empty.

     Returns:
         A pandas DataFrame indexed by comment text, with one title-cased
         column per score returned by ``model.predict`` (rounded to 4
         decimals) plus a "⚠️ Warning" column. When no usable comment is
         supplied, a one-row DataFrame holding the prompt message is
         returned instead of a bare string, because this function feeds a
         ``gr.Dataframe`` output.
     """
     comment_list = [c.strip() for c in (comments or "").split('\n') if c.strip()]
     if not comment_list:
         # Keep the return type tabular so the Dataframe output can render the prompt.
         return pd.DataFrame({"Message": ["Please enter at least one valid comment."]})
     results = model.predict(comment_list)
     df = pd.DataFrame(results, index=comment_list).round(4)
     # e.g. "severe_toxicity" -> "Severe Toxicity"
     df.columns = [col.replace("_", " ").title() for col in df.columns]
     # Computed before the warning column is added, so only score columns are compared.
     high_risk = (df > TOXICITY_THRESHOLD).any(axis=1)
     df["⚠️ Warning"] = high_risk.map({True: "⚠️ High Risk", False: "✅ Safe"})
     return df
+# UI setup
 # Gradio interface: a multi-line textbox in, a table of per-comment scores and warnings out.
 iface = gr.Interface(
     fn=classify_multiple,
     inputs=gr.Textbox(lines=8, placeholder="Enter one or more comments, each on a new line..."),
     outputs=gr.Dataframe(label="Toxicity Predictions with Warnings"),
     title="💬 Toxic Comment Classifier (Multi-Comment, with Warnings)",
     # Interpolate the threshold so the UI text cannot drift from the value actually applied.
     description=(
         "Paste one or more comments. Each comment is scored for toxicity, "
         f"and flagged as ⚠️ if any label exceeds {TOXICITY_THRESHOLD}."
     ),
 )
 if __name__ == "__main__":