Spaces:
Running
Running
update readme
Browse files
- app.py +9 -9
- src/display/about.py +13 -2
app.py
CHANGED
@@ -124,15 +124,15 @@ with demo:
|
|
124 |
|
125 |
with gr.TabItem("📝 About", elem_id="llm-benchmark-tab-table", id=3):
|
126 |
gr.Markdown(LLM_BENCHMARKS_TEXT, elem_classes="markdown-text")
|
127 |
-
|
128 |
-
|
129 |
-
|
130 |
-
|
131 |
-
|
132 |
-
|
133 |
-
|
134 |
-
|
135 |
-
|
136 |
gr.Markdown(CONTACT_TEXT, elem_classes="markdown-text")
|
137 |
|
138 |
demo.launch(share=True)
|
|
|
124 |
|
125 |
with gr.TabItem("📝 About", elem_id="llm-benchmark-tab-table", id=3):
|
126 |
gr.Markdown(LLM_BENCHMARKS_TEXT, elem_classes="markdown-text")
|
127 |
+
with gr.Row():
|
128 |
+
with gr.Accordion("📙 Citation", open=False):
|
129 |
+
citation_button = gr.Textbox(
|
130 |
+
value=CITATION_BUTTON_TEXT,
|
131 |
+
label=CITATION_BUTTON_LABEL,
|
132 |
+
lines=20,
|
133 |
+
elem_id="citation-button",
|
134 |
+
show_copy_button=True,
|
135 |
+
)
|
136 |
gr.Markdown(CONTACT_TEXT, elem_classes="markdown-text")
|
137 |
|
138 |
demo.launch(share=True)
|
src/display/about.py
CHANGED
@@ -36,7 +36,7 @@ This leaderboard evaluates Large Language Models (LLMs) on Southeast Asian (SEA)
|
|
36 |
"""
|
37 |
|
38 |
INTRODUCTION_TEXT = """
|
39 |
-
This leaderboard evaluates Large Language Models (LLMs) on Southeast Asian (SEA) languages through two comprehensive benchmarks - SeaExam and SeaBench:
|
40 |
* **SeaExam** assesses world knowledge and reasoning capabilities through exam-style questions (for both base and chat version models) [[data (public)](https://huggingface.co/datasets/SeaLLMs/SeaExam)] [[eval code](https://github.com/DAMO-NLP-SG/SeaExam)]
|
41 |
* **SeaBench** evaluates instruction-following abilities and multi-turn conversational skills (thus only for chat version models). [[data (public)](https://huggingface.co/datasets/SeaLLMs/SeaBench)] [[eval code](https://github.com/DAMO-NLP-SG/SeaBench?tab=readme-ov-file)]
|
42 |
|
@@ -121,11 +121,22 @@ If everything is done, check you can launch the EleutherAIHarness on your model
|
|
121 |
|
122 |
CITATION_BUTTON_LABEL = "Copy the following snippet to cite these results"
|
123 |
CITATION_BUTTON_TEXT = r"""
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
124 |
}
|
125 |
"""
|
126 |
|
127 |
CONTACT_TEXT = f"""
|
128 |
## Contact
|
129 |
|
130 |
-
If you have any questions or want to include your models in the leaderboard, please contact Chaoqun Liu
|
131 |
"""
|
|
|
36 |
"""
|
37 |
|
38 |
INTRODUCTION_TEXT = """
|
39 |
+
This leaderboard evaluates Large Language Models (LLMs) on Southeast Asian (SEA) languages through two comprehensive benchmarks - SeaExam and SeaBench [[Paper](https://aclanthology.org/2025.findings-naacl.341/)]:
|
40 |
* **SeaExam** assesses world knowledge and reasoning capabilities through exam-style questions (for both base and chat version models) [[data (public)](https://huggingface.co/datasets/SeaLLMs/SeaExam)] [[eval code](https://github.com/DAMO-NLP-SG/SeaExam)]
|
41 |
* **SeaBench** evaluates instruction-following abilities and multi-turn conversational skills (thus only for chat version models). [[data (public)](https://huggingface.co/datasets/SeaLLMs/SeaBench)] [[eval code](https://github.com/DAMO-NLP-SG/SeaBench?tab=readme-ov-file)]
|
42 |
|
|
|
121 |
|
122 |
CITATION_BUTTON_LABEL = "Copy the following snippet to cite these results"
|
123 |
CITATION_BUTTON_TEXT = r"""
|
124 |
+
@inproceedings{liu-etal-2025-seaexam,
|
125 |
+
title = "{S}ea{E}xam and {S}ea{B}ench: Benchmarking {LLM}s with Local Multilingual Questions in {S}outheast {A}sia",
|
126 |
+
author = "Liu, Chaoqun and Zhang, Wenxuan and Ying, Jiahao and Aljunied, Mahani and Luu, Anh Tuan and Bing, Lidong",
|
127 |
+
booktitle = "Findings of the Association for Computational Linguistics: NAACL 2025",
|
128 |
+
month = apr,
|
129 |
+
year = "2025",
|
130 |
+
address = "Albuquerque, New Mexico",
|
131 |
+
publisher = "Association for Computational Linguistics",
|
132 |
+
url = "https://aclanthology.org/2025.findings-naacl.341/",
|
133 |
+
pages = "6119--6136",
|
134 |
+
ISBN = "979-8-89176-195-7"
|
135 |
}
|
136 |
"""
|
137 |
|
138 |
CONTACT_TEXT = f"""
|
139 |
## Contact
|
140 |
|
141 |
+
If you have any questions or want to include your models in the leaderboard, please contact [Chaoqun Liu](https://liuchaoqun.github.io/) and [Wenxuan Zhang](https://isakzhang.github.io/).
|
142 |
"""
|