Jacqueline Garrahan
committed on
Commit
•
3c7b0e5
1
Parent(s):
0982a7f
Check in updated files
Browse files
- app.py +1 -1
- src/about.py +9 -8
app.py
CHANGED
@@ -82,7 +82,7 @@ def init_leaderboard(dataframe):
|
|
82 |
label="Select the number of parameters (B)",
|
83 |
),
|
84 |
ColumnFilter(
|
85 |
-
AutoEvalColumn.still_on_hub.name, type="boolean", label="
|
86 |
),
|
87 |
],
|
88 |
bool_checkboxgroup_label="Hide models",
|
|
|
82 |
label="Select the number of parameters (B)",
|
83 |
),
|
84 |
ColumnFilter(
|
85 |
+
AutoEvalColumn.still_on_hub.name, type="boolean", label="External Providers", default=False
|
86 |
),
|
87 |
],
|
88 |
bool_checkboxgroup_label="Hide models",
|
src/about.py
CHANGED
@@ -6,20 +6,21 @@ class Task:
|
|
6 |
benchmark: str
|
7 |
metric: str
|
8 |
col_name: str
|
|
|
9 |
|
10 |
|
11 |
# Select your tasks here
|
12 |
# ---------------------------------------------------
|
13 |
class Tasks(Enum):
|
14 |
# task_key in the json file, metric_key in the json file, name to display in the leaderboard
|
15 |
-
task0 = Task("aiera_speaker_assign", "accuracy,none", "
|
16 |
-
task1 = Task("aiera_transcript_sentiment", "accuracy,none","
|
17 |
-
task2 = Task("bbh_zeroshot_causal_judgement", "exact_match,flexible-extract","
|
18 |
-
task3 = Task("flare_ectsum", "recall,none","
|
19 |
-
task4 = Task("flare_edtsum", "rougeLsum,none","
|
20 |
-
task5 = Task("flare_finqa", "exact_match_manual,none","
|
21 |
-
task6 = Task("flare_fiqasa", "accuracy,none","
|
22 |
-
task7 = Task("flare_ner", "accuracy,none","
|
23 |
|
24 |
|
25 |
NUM_FEWSHOT = 0 # Change with your few shot
|
|
|
6 |
benchmark: str
|
7 |
metric: str
|
8 |
col_name: str
|
9 |
+
reference_url: str
|
10 |
|
11 |
|
12 |
# Select your tasks here
|
13 |
# ---------------------------------------------------
|
14 |
class Tasks(Enum):
|
15 |
# task_key in the json file, metric_key in the json file, name to display in the leaderboard
|
16 |
+
task0 = Task("aiera_speaker_assign", "accuracy,none", "Speaker ID")
|
17 |
+
task1 = Task("aiera_transcript_sentiment", "accuracy,none","Speaker Sentiment")
|
18 |
+
task2 = Task("bbh_zeroshot_causal_judgement", "exact_match,flexible-extract","BBH-causal-judgement")
|
19 |
+
task3 = Task("flare_ectsum", "recall,none", "flare-ect-sum")
|
20 |
+
task4 = Task("flare_edtsum", "rougeLsum,none","flare-edt-sum")
|
21 |
+
task5 = Task("flare_finqa", "exact_match_manual,none","finqa")
|
22 |
+
task6 = Task("flare_fiqasa", "accuracy,none","fiqasa")
|
23 |
+
task7 = Task("flare_ner", "accuracy,none","flare-ner")
|
24 |
|
25 |
|
26 |
NUM_FEWSHOT = 0 # Change with your few shot
|