Spaces:

CIRCL
/

CWE-PARENT-patch-Vulnerability-Patch-Classification-Roberta-Base

Sleeping

App Files Files Community

elselse committed 10 days ago

Commit

9ba88a4

·

verified ·

1 Parent(s): 1d606fb

Update app.py

Files changed (1) hide show

app.py +23 -9

app.py CHANGED Viewed

@@ -1,36 +1,50 @@
 import gradio as gr
 from transformers import pipeline
-# Load the Hugging Face model for text classification
 # Text-classification pipeline used by predict_cwe; return_all_scores=True
 # requests a score for every label instead of only the best one.
 classifier = pipeline(
     "text-classification",
     model="CIRCL/cwe-parent-vulnerability-classification-roberta-base",
     return_all_scores=True,
 )
 def predict_cwe(commit_message: str):
     """
     Classify a commit message and return its five highest-scoring labels.
     The result maps each label to its score rounded to four decimals,
     ordered from highest to lowest score.
     """
     # The pipeline output is indexed with [0] to get this message's scores.
     label_scores = list(classifier(commit_message)[0])
     label_scores.sort(key=lambda entry: entry["score"], reverse=True)
     top_five = {}
     for entry in label_scores[:5]:
         top_five[entry["label"]] = round(float(entry["score"]), 4)
     return top_five
-# Build the Gradio interface
 # One textbox in, predict_cwe's label/score mapping out (shown via gr.Label).
 demo = gr.Interface(
     title="CWE Prediction from Commit Message",
     description="Type a Git commit message and get the most likely CWE classes predicted by the model.",
     fn=predict_cwe,
     inputs=gr.Textbox(placeholder="Enter your commit message here...", lines=3),
     outputs=gr.Label(num_top_classes=5),
     examples=[
         ["Fixed buffer overflow in input parsing"],
         ["SQL injection possible in user login endpoint"],
     ],
 )
 # Start the app only when this file is executed directly.
 if __name__ == "__main__":
     demo.launch()

 import gradio as gr
+import json
 from transformers import pipeline
+# Load Hugging Face model (text classification)
 classifier = pipeline(
     task="text-classification",
     model="CIRCL/cwe-parent-vulnerability-classification-roberta-base",
     return_all_scores=True
 )
 # Load the child-to-parent CWE mapping consulted by predict_cwe. The path is
 # relative to the working directory the app is started from.
 # JSON is UTF-8 by specification, so read it with an explicit encoding
 # instead of the platform's locale default.
 with open("vulntrain/trainers/child_to_parent_mapping.json", "r", encoding="utf-8") as f:
     child_to_parent = json.load(f)
 def predict_cwe(commit_message: str):
     """
     Predict CWE(s) from a commit message and map them to parent CWEs.
     Returns a dict of up to five distinct "CWE-<id>" labels mapped to scores
     rounded to four decimals, ordered from highest to lowest score. When
     several predicted CWEs share a parent, the parent keeps the highest of
     their scores.
     """
     results = classifier(commit_message)[0]
     sorted_results = sorted(results, key=lambda x: x["score"], reverse=True)
     mapped_results = {}
     for item in sorted_results:
         child_cwe = item["label"].replace("CWE-", "")
         # Default to the child itself when the mapping has no parent for it.
         parent_cwe = child_to_parent.get(child_cwe, child_cwe)
         # Strip any prefix the mapping value may already carry so the label
         # is never doubled ("CWE-CWE-...").
         parent_label = "CWE-" + str(parent_cwe).replace("CWE-", "")
         if parent_label in mapped_results:
             # Scores are visited in descending order, so the stored entry is
             # the higher one; overwriting it would under-report the parent.
             continue
         mapped_results[parent_label] = round(float(item["score"]), 4)
         # Stop once five distinct parents are collected, matching the five
         # classes the output widget is configured to show.
         if len(mapped_results) == 5:
             break
     return mapped_results
+# Gradio UI
 # One textbox in, predict_cwe's label/score mapping out (shown via gr.Label).
 demo = gr.Interface(
     title="CWE Prediction from Commit Message",
     description=(
         "This tool uses a fine-tuned model to predict CWE categories from Git commit messages. "
         "Predicted child CWEs are mapped to their parent CWEs if applicable."
     ),
     fn=predict_cwe,
     inputs=gr.Textbox(placeholder="Enter your commit message here...", lines=3),
     outputs=gr.Label(num_top_classes=5),
     examples=[
         ["Fixed buffer overflow in input parsing"],
         ["SQL injection possible in login flow"],
         ["Improved input validation to prevent XSS"],
         ["Added try/catch to avoid null pointer crash"],
         ["Patched race condition in thread lock logic"],
     ],
 )
 # Start the app only when this file is executed directly.
 if __name__ == "__main__":
     demo.launch()