Spaces:
AIR-Bench
/
Restarting on CPU Upgrade

leaderboard / tests /src /test_envs.py
nan's picture
test: add unit tests for envs
0af261c
raw
history blame
512 Bytes
from air_benchmark.tasks import BenchmarkTable
from src.envs import BENCHMARK_VERSION_LIST, DEFAULT_METRIC_QA, DEFAULT_METRIC_LONG_DOC, METRIC_LIST
def test_benchmark_version_list():
    """Check that every leaderboard benchmark version is a ``BenchmarkTable`` key.

    Each entry of ``BENCHMARK_VERSION_LIST`` must appear among the keys of
    ``BenchmarkTable``; on failure the assertion message names the entries
    that are missing.
    """
    leaderboard_versions = frozenset(BENCHMARK_VERSION_LIST)
    # Build the set straight from the keys view; no intermediate list needed.
    available_versions = frozenset(BenchmarkTable.keys())
    # An empty difference is equivalent to the subset check and lets the
    # failure message report exactly which versions are unknown.
    missing_versions = leaderboard_versions - available_versions
    assert not missing_versions, (
        "BENCHMARK_VERSION_LIST entries missing from BenchmarkTable: "
        f"{set(missing_versions)}"
    )
def test_default_metrics():
    """Check that both default metrics are members of ``METRIC_LIST``."""
    # QA default is checked first, then the long-doc default.
    for default_metric in (DEFAULT_METRIC_QA, DEFAULT_METRIC_LONG_DOC):
        assert default_metric in METRIC_LIST