AudioBench-Leaderboard-Extend

Running

App Files Community

binwang committed on Mar 19

Commit

2bd4813

verified ·

1 Parent(s): 7d5f69e

Upload folder using huggingface_hub

Browse files

Files changed (1) hide show

app/pages.py +11 -11

app/pages.py CHANGED Viewed

@@ -282,7 +282,7 @@ def speech_question_answering_singlish():
     with space1:
         tab_section = st.selectbox('Dataset', filters_1_list)
     with space2:
-        metric = st.selectbox('Metric', ['LLAMA3_70B_JUDGE'])
         metric = metric.lower()
     if tab_section:
@@ -310,7 +310,7 @@ def spoken_dialogue_summarization_singlish():
     with space1:
         tab_section = st.selectbox('Dataset', filters_1_list)
     with space2:
-        metric = st.selectbox('Metric', ['LLAMA3_70B_JUDGE'])
         metric = metric.lower()
     if tab_section:
@@ -336,7 +336,7 @@ def speech_instruction():
     with space1:
         tab_section = st.selectbox('Dataset', filters_1_list)
     with space2:
-        metric = st.selectbox('Metric', ['LLAMA3_70B_JUDGE'])
         metric = metric.lower()
     if tab_section:
@@ -360,7 +360,7 @@ def audio_captioning():
     with space1:
         tab_section = st.selectbox('Dataset', dataset_list)
     with space2:
-        metric = st.selectbox('Metric', ['LLAMA3_70B_JUDGE', 'METEOR'])
         metric = metric.lower()
     if tab_section:
@@ -383,7 +383,7 @@ def audio_scene_question_answering():
     with space1:
         tab_section = st.selectbox('Dataset', filters_1_list)
     with space2:
-        metric = st.selectbox('Metric', ['LLAMA3_70B_JUDGE'])
         metric = metric.lower()
     if tab_section:
@@ -413,7 +413,7 @@ def accent_recognition():
     with space1:
         tab_section = st.selectbox('Dataset', filters_1_list)
     with space2:
-        metric = st.selectbox('Metric', ['LLAMA3_70B_JUDGE'])
         metric = metric.lower()
     if tab_section:
@@ -440,7 +440,7 @@ def gender_recognition():
     with space1:
         tab_section = st.selectbox('Dataset', filters_1_list)
     with space2:
-        metric = st.selectbox('Metric', ['LLAMA3_70B_JUDGE'])
         metric = metric.lower()
     if tab_section:
@@ -470,7 +470,7 @@ def emotion_recognition():
     with space1:
         tab_section = st.selectbox('Dataset', filters_1_list)
     with space2:
-        metric = st.selectbox('Metric', ['LLAMA3_70B_JUDGE'])
         metric = metric.lower()
     if tab_section:
@@ -498,7 +498,7 @@ def music_understanding():
     with space1:
         tab_section = st.selectbox('Dataset', filters_1_list)
     with space2:
-        metric = st.selectbox('Metric', ['LLAMA3_70B_JUDGE'])
         metric = metric.lower()
     if tab_section:
@@ -561,7 +561,7 @@ def under_development():
                 'YTB-SDS-Batch1',
                 'YTB-PQA-Batch1',
                 ]:
-            metric = st.selectbox('Metric', ['LLAMA3_70B_JUDGE'])
             metric = metric.lower()
         else:
             raise ValueError('Invalid dataset')
@@ -588,7 +588,7 @@ def mmau_evaluation():
     with space1:
         tab_section = st.selectbox('Dataset', filters_1_list)
     with space2:
-        metric = st.selectbox('Metric', ['LLAMA3_70B_JUDGE', 'STRING_MATCH'])
         metric = metric.lower()
     if tab_section:

     with space1:
         tab_section = st.selectbox('Dataset', filters_1_list)
     with space2:
+        metric = st.selectbox('Metric', ['LLAMA3_70B_JUDGE', 'GPT4O_JUDGE'])
         metric = metric.lower()
     if tab_section:
     with space1:
         tab_section = st.selectbox('Dataset', filters_1_list)
     with space2:
+        metric = st.selectbox('Metric', ['LLAMA3_70B_JUDGE', 'GPT4O_JUDGE'])
         metric = metric.lower()
     if tab_section:
     with space1:
         tab_section = st.selectbox('Dataset', filters_1_list)
     with space2:
+        metric = st.selectbox('Metric', ['LLAMA3_70B_JUDGE', 'GPT4O_JUDGE'])
         metric = metric.lower()
     if tab_section:
     with space1:
         tab_section = st.selectbox('Dataset', dataset_list)
     with space2:
+        metric = st.selectbox('Metric', ['LLAMA3_70B_JUDGE', 'GPT4O_JUDGE', 'METEOR'])
         metric = metric.lower()
     if tab_section:
     with space1:
         tab_section = st.selectbox('Dataset', filters_1_list)
     with space2:
+        metric = st.selectbox('Metric', ['LLAMA3_70B_JUDGE', 'GPT4O_JUDGE'])
         metric = metric.lower()
     if tab_section:
     with space1:
         tab_section = st.selectbox('Dataset', filters_1_list)
     with space2:
+        metric = st.selectbox('Metric', ['LLAMA3_70B_JUDGE', 'GPT4O_JUDGE'])
         metric = metric.lower()
     if tab_section:
     with space1:
         tab_section = st.selectbox('Dataset', filters_1_list)
     with space2:
+        metric = st.selectbox('Metric', ['LLAMA3_70B_JUDGE', 'GPT4O_JUDGE'])
         metric = metric.lower()
     if tab_section:
     with space1:
         tab_section = st.selectbox('Dataset', filters_1_list)
     with space2:
+        metric = st.selectbox('Metric', ['LLAMA3_70B_JUDGE', 'GPT4O_JUDGE'])
         metric = metric.lower()
     if tab_section:
     with space1:
         tab_section = st.selectbox('Dataset', filters_1_list)
     with space2:
+        metric = st.selectbox('Metric', ['LLAMA3_70B_JUDGE', 'GPT4O_JUDGE'])
         metric = metric.lower()
     if tab_section:
                 'YTB-SDS-Batch1',
                 'YTB-PQA-Batch1',
                 ]:
+            metric = st.selectbox('Metric', ['LLAMA3_70B_JUDGE', 'GPT4O_JUDGE'])
             metric = metric.lower()
         else:
             raise ValueError('Invalid dataset')
     with space1:
         tab_section = st.selectbox('Dataset', filters_1_list)
     with space2:
+        metric = st.selectbox('Metric', ['LLAMA3_70B_JUDGE', 'STRING_MATCH', 'GPT4O_JUDGE'])
         metric = metric.lower()
     if tab_section: