from dataclasses import dataclass from enum import Enum @dataclass class Task: benchmark: str metric: str col_name: str # Select your tasks here # --------------------------------------------------- class Tasks(Enum): # task_key in the json file, metric_key in the json file, name to display in the leaderboard task0 = Task("eng_natural_vanilla_acc", "acc", "[ENG-N] Vanilla Acc") task1 = Task("eng_natural_vanilla_pa", "pa", "[ENG-N] Vanilla PA") task2 = Task("eng_natural_metrics_reference_acc", "acc", "[ENG-N] Metrics Reference Acc") task3 = Task("eng_natural_metrics_reference_pa", "pa", "[ENG-N] Metrics Reference PA") task4 = Task("eng_natural_swap_acc", "acc", "[ENG-N] Swap Acc") task5 = Task("eng_natural_swap_pa", "pa", "[ENG-N] Swap PA") task6 = Task("eng_natural_swap_cot_acc", "acc", "[ENG-N] Swap COT Acc") task7 = Task("eng_natural_swap_cot_pa", "pa", "[ENG-N] Swap COT PA") task8 = Task("eng_adversarial_manual_vanilla_acc", "acc", "[ENG-A] Vanilla Acc") task9 = Task("eng_adversarial_manual_vanilla_pa", "pa", "[ENG-A] Vanilla PA") task10 = Task("eng_adversarial_manual_metrics_reference_acc", "acc", "[ENG-A] Metrics Reference Acc") task11 = Task("eng_adversarial_manual_metrics_reference_pa", "pa", "[ENG-A] Metrics Reference PA") task12 = Task("eng_adversarial_manual_swap_acc", "acc", "[ENG-A] Swap Acc") task13 = Task("eng_adversarial_manual_swap_pa", "pa", "[ENG-A] Swap PA") task14 = Task("eng_adversarial_manual_swap_cot_acc", "acc", "[ENG-A] Swap COT Acc") task15 = Task("eng_adversarial_manual_swap_cot_pa", "pa", "[ENG-A] Swap COT PA") task16 = Task("pt_natural_vanilla_acc", "acc", "[PT-N] Vanilla Acc") task17 = Task("pt_natural_vanilla_pa", "pa", "[PT-N] Vanilla PA") task18 = Task("pt_natural_metrics_reference_acc", "acc", "[PT-N] Metrics Reference Acc") task19 = Task("pt_natural_metrics_reference_pa", "pa", "[PT-N] Metrics Reference PA") task20 = Task("pt_natural_swap_acc", "acc", "[PT-N] Swap Acc") task21 = Task("pt_natural_swap_pa", "pa", "[PT-N] Swap PA") task22 = Task("pt_natural_swap_cot_acc", "acc", "[PT-N] Swap COT Acc") task23 = Task("pt_natural_swap_cot_pa", "pa", "[PT-N] Swap COT PA") task24 = Task("pt_adversarial_manual_vanilla_acc", "acc", "[PT-A] Vanilla Acc") task25 = Task("pt_adversarial_manual_vanilla_pa", "pa", "[PT-A] Vanilla PA") task26 = Task("pt_adversarial_manual_metrics_reference_acc", "acc", "[PT-A] Metrics Reference Acc") task27 = Task("pt_adversarial_manual_metrics_reference_pa", "pa", "[PT-A] Metrics Reference PA") task28 = Task("pt_adversarial_manual_swap_acc", "acc", "[PT-A] Swap Acc") task29 = Task("pt_adversarial_manual_swap_pa", "pa", "[PT-A] Swap PA") task30 = Task("pt_adversarial_manual_swap_cot_acc", "acc", "[PT-A] Swap COT Acc") task31 = Task("pt_adversarial_manual_swap_cot_pa", "pa", "[PT-A] Swap COT PA") task32 = Task("eng_pba_extraction_avg", "avg", "[ENG-P] Extraction Rate") task33 = Task("eng_pba_positional_avg", "avg", "[ENG-P] Positional Consistency Avg") task34 = Task("eng_pba_positional_std", "std", "[ENG-P] Positional Consistency Std") task35 = Task("eng_pba_preference_avg", "avg", "[ENG-P] Preference Score") task36 = Task("pt_pba_extraction_avg", "avg", "[PT-P] Extraction Rate") task37 = Task("pt_pba_positional_avg", "avg", "[PT-P] Positional Consistency Avg") task38 = Task("pt_pba_positional_std", "std", "[PT-P] Positional Consistency Std") task39 = Task("pt_pba_preference_avg", "avg", "[PT-P] Preference Score") NUM_FEWSHOT = 0 # Change with your few shot # --------------------------------------------------- # Your leaderboard name TITLE = """