lukecq committed on
Commit
1c09f6d
·
1 Parent(s): a3e5824

update readme

Browse files
Files changed (2) hide show
  1. app.py +9 -9
  2. src/display/about.py +13 -2
app.py CHANGED
@@ -124,15 +124,15 @@ with demo:
124
 
125
  with gr.TabItem("📝 About", elem_id="llm-benchmark-tab-table", id=3):
126
  gr.Markdown(LLM_BENCHMARKS_TEXT, elem_classes="markdown-text")
127
- # with gr.Row():
128
- # with gr.Accordion("📙 Citation", open=False):
129
- # citation_button = gr.Textbox(
130
- # value=CITATION_BUTTON_TEXT,
131
- # label=CITATION_BUTTON_LABEL,
132
- # lines=20,
133
- # elem_id="citation-button",
134
- # show_copy_button=True,
135
- # )
136
  gr.Markdown(CONTACT_TEXT, elem_classes="markdown-text")
137
 
138
  demo.launch(share=True)
 
124
 
125
  with gr.TabItem("📝 About", elem_id="llm-benchmark-tab-table", id=3):
126
  gr.Markdown(LLM_BENCHMARKS_TEXT, elem_classes="markdown-text")
127
+ with gr.Row():
128
+ with gr.Accordion("📙 Citation", open=False):
129
+ citation_button = gr.Textbox(
130
+ value=CITATION_BUTTON_TEXT,
131
+ label=CITATION_BUTTON_LABEL,
132
+ lines=20,
133
+ elem_id="citation-button",
134
+ show_copy_button=True,
135
+ )
136
  gr.Markdown(CONTACT_TEXT, elem_classes="markdown-text")
137
 
138
  demo.launch(share=True)
src/display/about.py CHANGED
@@ -36,7 +36,7 @@ This leaderboard evaluates Large Language Models (LLMs) on Southeast Asian (SEA)
36
  """
37
 
38
  INTRODUCTION_TEXT = """
39
- This leaderboard evaluates Large Language Models (LLMs) on Southeast Asian (SEA) languages through two comprehensive benchmarks - SeaExam and SeaBench:
40
  * **SeaExam** assesses world knowledge and reasoning capabilities through exam-style questions (for both base and chat version models) [[data (public)](https://huggingface.co/datasets/SeaLLMs/SeaExam)] [[eval code](https://github.com/DAMO-NLP-SG/SeaExam)]
41
  * **SeaBench** evaluates instruction-following abilities and multi-turn conversational skills (thus only for chat version models). [[data (public)](https://huggingface.co/datasets/SeaLLMs/SeaBench)] [[eval code](https://github.com/DAMO-NLP-SG/SeaBench?tab=readme-ov-file)]
42
 
@@ -121,11 +121,22 @@ If everything is done, check you can launch the EleutherAIHarness on your model
121
 
122
  CITATION_BUTTON_LABEL = "Copy the following snippet to cite these results"
123
  CITATION_BUTTON_TEXT = r"""
 
 
 
 
 
 
 
 
 
 
 
124
  }
125
  """
126
 
127
  CONTACT_TEXT = f"""
128
  ## Contact
129
 
130
- If you have any questions or want to include your models in the leaderboard, please contact Chaoqun Liu (<chaoqun.liu@alibaba-inc.com>) and [Wenxuan Zhang](https://isakzhang.github.io/).
131
  """
 
36
  """
37
 
38
  INTRODUCTION_TEXT = """
39
+ This leaderboard evaluates Large Language Models (LLMs) on Southeast Asian (SEA) languages through two comprehensive benchmarks - SeaExam and SeaBench [[Paper](https://aclanthology.org/2025.findings-naacl.341/)]:
40
  * **SeaExam** assesses world knowledge and reasoning capabilities through exam-style questions (for both base and chat version models) [[data (public)](https://huggingface.co/datasets/SeaLLMs/SeaExam)] [[eval code](https://github.com/DAMO-NLP-SG/SeaExam)]
41
  * **SeaBench** evaluates instruction-following abilities and multi-turn conversational skills (thus only for chat version models). [[data (public)](https://huggingface.co/datasets/SeaLLMs/SeaBench)] [[eval code](https://github.com/DAMO-NLP-SG/SeaBench?tab=readme-ov-file)]
42
 
 
121
 
122
  CITATION_BUTTON_LABEL = "Copy the following snippet to cite these results"
123
  CITATION_BUTTON_TEXT = r"""
124
+ @inproceedings{liu-etal-2025-seaexam,
125
+ title = "{S}ea{E}xam and {S}ea{B}ench: Benchmarking {LLM}s with Local Multilingual Questions in {S}outheast {A}sia",
126
+ author = "Liu, Chaoqun and Zhang, Wenxuan and Ying, Jiahao and Aljunied, Mahani and Luu, Anh Tuan and Bing, Lidong",
127
+ booktitle = "Findings of the Association for Computational Linguistics: NAACL 2025",
128
+ month = apr,
129
+ year = "2025",
130
+ address = "Albuquerque, New Mexico",
131
+ publisher = "Association for Computational Linguistics",
132
+ url = "https://aclanthology.org/2025.findings-naacl.341/",
133
+ pages = "6119--6136",
134
+ ISBN = "979-8-89176-195-7"
135
  }
136
  """
137
 
138
  CONTACT_TEXT = f"""
139
  ## Contact
140
 
141
+ If you have any questions or want to include your models in the leaderboard, please contact [Chaoqun Liu](https://liuchaoqun.github.io/) and [Wenxuan Zhang](https://isakzhang.github.io/).
142
  """