dtcxzyw committed on
Commit
7a313bd
·
unverified ·
1 Parent(s): 913f726

show unique bugs

Browse files
Files changed (1) hide show
  1. app.py +13 -0
app.py CHANGED
@@ -77,6 +77,7 @@ for cat, bug_ids in bug_id_by_cat.items():
77
  timeline_bugids.append(bug_id)
78
  LEADERBOARD_DF = get_leaderboard_df(EVAL_REQUESTS_PATH, total_issues)
79
  fixed_bug_ids = set()
 
80
  fixed_bug_ids_fast = set()
81
  for row in LEADERBOARD_DF.itertuples():
82
  print(row)
@@ -86,8 +87,10 @@ for row in LEADERBOARD_DF.itertuples():
86
  timeline_cols.append(row.method_id)
87
  timeline_bugids.append(fix)
88
  fixed_bug_ids.add(fix)
 
89
  for fix in row.fixed_bug_ids_fast:
90
  fixed_bug_ids_fast.add(fix)
 
91
  timeline_bugtypes = []
92
  for bug_id in timeline_bugids:
93
  timeline_xs.append(bug_id_to_time[bug_id])
@@ -148,6 +151,15 @@ fixed_by_comp_df = pd.DataFrame(
148
  }
149
  )
150
  fixed_by_comp_df.sort_values("Total", inplace=True, ascending=False)
 
 
 
 
 
 
 
 
 
151
 
152
 
153
  def init_leaderboard(dataframe):
@@ -192,6 +204,7 @@ with demo:
192
  )
193
  gr.Dataframe(fixed_by_cat_df)
194
  gr.Dataframe(fixed_by_comp_df)
 
195
 
196
  with gr.TabItem("🚀 Submission", elem_id="llm-benchmark-tab-table", id=1):
197
  gr.Markdown(EVALUATION_QUEUE_TEXT, elem_classes="markdown-text")
 
77
  timeline_bugids.append(bug_id)
78
  LEADERBOARD_DF = get_leaderboard_df(EVAL_REQUESTS_PATH, total_issues)
79
  fixed_bug_ids = set()
80
+ fixed_bug_ids_count = dict()
81
  fixed_bug_ids_fast = set()
82
  for row in LEADERBOARD_DF.itertuples():
83
  print(row)
 
87
  timeline_cols.append(row.method_id)
88
  timeline_bugids.append(fix)
89
  fixed_bug_ids.add(fix)
90
+ fixed_bug_ids_count[fix] = fixed_bug_ids_count.get(fix, 0) + 1
91
  for fix in row.fixed_bug_ids_fast:
92
  fixed_bug_ids_fast.add(fix)
93
+ unique_bug_ids = set([bug_id for bug_id, count in fixed_bug_ids_count.items() if count == 1])
94
  timeline_bugtypes = []
95
  for bug_id in timeline_bugids:
96
  timeline_xs.append(bug_id_to_time[bug_id])
 
151
  }
152
  )
153
  fixed_by_comp_df.sort_values("Total", inplace=True, ascending=False)
154
+ unique_bugs_df = pd.DataFrame(
155
+ {
156
+ "Model": [c.method_id for c in LEADERBOARD_DF.itertuples()],
157
+ "Unique Bugs Fixed": [
158
+ len(set(c.fixed_bug_ids).intersection(unique_bug_ids)) for c in LEADERBOARD_DF.itertuples()
159
+ ],
160
+ }
161
+ )
162
+ unique_bugs_df.sort_values("Unique Bugs Fixed", inplace=True, ascending=False)
163
 
164
 
165
  def init_leaderboard(dataframe):
 
204
  )
205
  gr.Dataframe(fixed_by_cat_df)
206
  gr.Dataframe(fixed_by_comp_df)
207
+ gr.Dataframe(unique_bugs_df)
208
 
209
  with gr.TabItem("🚀 Submission", elem_id="llm-benchmark-tab-table", id=1):
210
  gr.Markdown(EVALUATION_QUEUE_TEXT, elem_classes="markdown-text")