Commit
·
64b7cb2
1
Parent(s):
ee07d52
added about section for datasets
Browse files- app.py +14 -0
- src/display/about.py +23 -6
app.py
CHANGED
@@ -357,6 +357,20 @@ with demo:
|
|
357 |
|
358 |
with gr.TabItem("📝 Evaluation Datasets", elem_id="llm-benchmark-tab-table", id=4):
|
359 |
gr.Markdown(LLM_DATASET_TEXT, elem_classes="markdown-text")
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
360 |
|
361 |
scheduler = BackgroundScheduler()
|
362 |
scheduler.add_job(restart_space, "interval", seconds=300)
|
|
|
357 |
|
358 |
with gr.TabItem("📝 Evaluation Datasets", elem_id="llm-benchmark-tab-table", id=4):
|
359 |
gr.Markdown(LLM_DATASET_TEXT, elem_classes="markdown-text")
|
360 |
+
with gr.Row():
|
361 |
+
with gr.Column(scale=1):
|
362 |
+
gr.Image('src/display/kapital.jpg', scale=1,
|
363 |
+
show_label=False,
|
364 |
+
interactive=False,
|
365 |
+
show_share_button=False,
|
366 |
+
show_download_button=False)
|
367 |
+
|
368 |
+
with gr.Column(scale=1, min_width=1):
|
369 |
+
gr.Image('src/display/kapital.jpg', scale=1,
|
370 |
+
show_label=False,
|
371 |
+
interactive=False,
|
372 |
+
show_share_button=False,
|
373 |
+
show_download_button=False)
|
374 |
|
375 |
scheduler = BackgroundScheduler()
|
376 |
scheduler.add_job(restart_space, "interval", seconds=300)
|
src/display/about.py
CHANGED
@@ -48,15 +48,32 @@ If you have a fine-tuned Azerbaijani LLM, submit it for evaluation!
|
|
48 |
"""
|
49 |
|
50 |
LLM_BENCHMARKS_TEXT = f"""
|
51 |
-
##
|
52 |
-
|
53 |
-
|
54 |
"""
|
55 |
|
56 |
LLM_DATASET_TEXT = f"""
|
57 |
-
##
|
58 |
-
|
59 |
-
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
60 |
"""
|
61 |
|
62 |
|
|
|
48 |
"""
|
49 |
|
50 |
LLM_BENCHMARKS_TEXT = f"""
|
51 |
+
## Azerbaijani Open LLM sponsored by Kapital Bank
|
52 |
+
|
53 |
+
This Open leaderboard
|
54 |
"""
|
55 |
|
56 |
LLM_DATASET_TEXT = f"""
|
57 |
+
## Banking_Call_Classification_MC
|
58 |
+
This dataset consists of 192 rows and 4 columns. It is a multiple-choice dataset in which the task is to determine which of the presented categories a client's request to the bank belongs to.
|
59 |
+
|
60 |
+
## Banking_Exam_MCQ
|
61 |
+
A benchmark dataset of 200-300 multiple-choice questions sourced from university exam materials across multiple departments, focused specifically on the banking sector in Azerbaijan.
|
62 |
+
|
63 |
+
## Banking_QA
|
64 |
+
This dataset consists of 97 rows and is a question-answer dataset about banking in the Azerbaijani language.
|
65 |
+
|
66 |
+
## Wiki_CQA
|
67 |
+
This dataset consists of 97 rows in the Azerbaijani language. Each item consists of a context from Wikipedia, questions related to that context, and a created answer.
|
68 |
+
|
69 |
+
## GSM8K
|
70 |
+
A benchmark dataset containing 44 rows of diverse grade school math word problems to measure a model’s ability to solve multi-step mathematical reasoning problems.
|
71 |
+
|
72 |
+
## ARC
|
73 |
+
This benchmark dataset consists of multiple-choice science questions aimed at testing a model's ability to understand and apply elementary scientific knowledge, similar to questions that might appear in standard science exams for students. This version of the dataset is in Azerbaijani, providing an opportunity for models to engage in reasoning and inference in the Azerbaijani language. The dataset is divided into an easy set and a challenge set, with questions requiring reasoning beyond simple fact recall.
|
74 |
+
|
75 |
+
## Informatics_MC, Azerbaijani_Lang_MC, History_MC, Physics_MC, Geography_MC, LLM-Literature_MC, Logic_MC, Azerbaijani_Hist_MC, Chemistry_MC, Biology_MC
|
76 |
+
A comprehensive collection of educational datasets in the Azerbaijani language, covering ten distinct academic disciplines: informatics, Azerbaijani language, world history, physics, geography, literature, logic, Azerbaijani history, chemistry, and biology. Each dataset contains 100 carefully curated multiple-choice questions, designed to assess knowledge and understanding in their respective fields.
|
77 |
"""
|
78 |
|
79 |
|