Spaces:
AIR-Bench
/
Running on CPU Upgrade

File size: 512 Bytes
0af261c
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
from air_benchmark.tasks import BenchmarkTable

from src.envs import BENCHMARK_VERSION_LIST, DEFAULT_METRIC_QA, DEFAULT_METRIC_LONG_DOC, METRIC_LIST


def test_benchmark_version_list():
    """Check that every leaderboard version is a key of ``BenchmarkTable``.

    Each entry of ``BENCHMARK_VERSION_LIST`` must appear among
    ``BenchmarkTable.keys()``; otherwise the test fails and the assertion
    message lists the entries that are missing.
    """
    leaderboard_versions = frozenset(BENCHMARK_VERSION_LIST)
    available_versions = frozenset(BenchmarkTable.keys())
    # Set difference is empty exactly when leaderboard_versions is a subset
    # of available_versions, and it names the offenders when it is not.
    missing_versions = leaderboard_versions - available_versions
    assert not missing_versions, (
        "BENCHMARK_VERSION_LIST contains versions missing from BenchmarkTable: "
        f"{sorted(map(str, missing_versions))}"
    )


def test_default_metrics():
    """Check that both default metrics are members of ``METRIC_LIST``."""
    # QA default is checked first, then the long-doc default.
    for default_metric in (DEFAULT_METRIC_QA, DEFAULT_METRIC_LONG_DOC):
        assert default_metric in METRIC_LIST