Spaces:

dtcxzyw
/

llvm-apr-benchmark-leaderboard

Running

App Files Community

dtcxzyw committed on Feb 10

Commit

a311ab2

unverified ·

1 Parent(s): d8484e3

Update

Browse files

Files changed (1) hide show

app.py +8 -4

app.py CHANGED Viewed

@@ -44,6 +44,7 @@ except Exception:
 dataset = load_dataset("dtcxzyw/llvm-apr-benchmark")
 total_issues = dataset.num_rows["test"]
 bug_id_to_time = dict()
 bug_id_by_cat = {
     "crash": [],
     "miscompilation": [],
@@ -52,13 +53,13 @@ bug_id_by_cat = {
 for issue in dataset["test"]:
     bug_id_to_time[issue["bug_id"]] = pd.to_datetime(issue["knowledge_cutoff"])
     bug_id_by_cat[issue["bug_type"]].append(issue["bug_id"])
 timeline_xs = []
 timeline_ys = []
 timeline_cols = []
 timeline_bugids = []
 model_cnt = 0
 for bug_id, time in bug_id_to_time.items():
-    timeline_xs.append(time)
     timeline_ys.append(0)
     timeline_cols.append("All")
     timeline_bugids.append(bug_id)
@@ -66,7 +67,6 @@ cat_cnt = 4
 for cat, bug_ids in bug_id_by_cat.items():
     cat_cnt -= 1
     for bug_id in bug_ids:
-        timeline_xs.append(bug_id_to_time[bug_id])
         timeline_ys.append(cat_cnt)
         timeline_cols.append(str(cat).capitalize())
         timeline_bugids.append(bug_id)
@@ -75,16 +75,20 @@ for row in LEADERBOARD_DF.itertuples():
     print(row)
     model_cnt += 1
     for fix in row.fixed_bug_ids:
-        timeline_xs.append(bug_id_to_time[fix])
         timeline_ys.append(-model_cnt)
         timeline_cols.append(row.method_id)
         timeline_bugids.append(fix)
 timeline_df = pd.DataFrame(
     {
         "time": timeline_xs,
         "model": timeline_ys,
         "method_name": timeline_cols,
         "bug_id": timeline_bugids,
     }
 )
@@ -127,7 +131,7 @@ with demo:
                 y_label="Model",
                 title="Timeline",
                 y_lim=(-model_cnt - 1, 4),
-                tooltip=["bug_id", "method_name", "time"],
             )
         with gr.TabItem("🚀 Submission", elem_id="llm-benchmark-tab-table", id=1):

 dataset = load_dataset("dtcxzyw/llvm-apr-benchmark")
 total_issues = dataset.num_rows["test"]
 bug_id_to_time = dict()
+bug_id_to_type = dict()
 bug_id_by_cat = {
     "crash": [],
     "miscompilation": [],
 for issue in dataset["test"]:
     bug_id_to_time[issue["bug_id"]] = pd.to_datetime(issue["knowledge_cutoff"])
     bug_id_by_cat[issue["bug_type"]].append(issue["bug_id"])
+    bug_id_to_type[issue["bug_id"]] = issue["bug_type"]
 timeline_xs = []
 timeline_ys = []
 timeline_cols = []
 timeline_bugids = []
 model_cnt = 0
 for bug_id, time in bug_id_to_time.items():
     timeline_ys.append(0)
     timeline_cols.append("All")
     timeline_bugids.append(bug_id)
 for cat, bug_ids in bug_id_by_cat.items():
     cat_cnt -= 1
     for bug_id in bug_ids:
         timeline_ys.append(cat_cnt)
         timeline_cols.append(str(cat).capitalize())
         timeline_bugids.append(bug_id)
     print(row)
     model_cnt += 1
     for fix in row.fixed_bug_ids:
         timeline_ys.append(-model_cnt)
         timeline_cols.append(row.method_id)
         timeline_bugids.append(fix)
+timeline_bugtypes = []
+for bug_id in timeline_bugids:
+    timeline_xs.append(bug_id_to_time[bug_id])
+    timeline_bugtypes.append(bug_id_to_type[bug_id])
 timeline_df = pd.DataFrame(
     {
         "time": timeline_xs,
         "model": timeline_ys,
         "method_name": timeline_cols,
         "bug_id": timeline_bugids,
+        "bug_type": timeline_bugtypes,
     }
 )
                 y_label="Model",
                 title="Timeline",
                 y_lim=(-model_cnt - 1, 4),
+                tooltip=["bug_id", "method_name", "time", "bug_type"],
             )
         with gr.TabItem("🚀 Submission", elem_id="llm-benchmark-tab-table", id=1):