Spaces:
Running
on
CPU Upgrade
Running
on
CPU Upgrade
File size: 512 Bytes
0af261c |
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 |
from air_benchmark.tasks import BenchmarkTable
from src.envs import BENCHMARK_VERSION_LIST, DEFAULT_METRIC_QA, DEFAULT_METRIC_LONG_DOC, METRIC_LIST
def test_benchmark_version_list():
    """Check that every leaderboard version exists in ``BenchmarkTable``.

    Each entry of ``BENCHMARK_VERSION_LIST`` must appear among the keys of
    ``BenchmarkTable``. Any entries that do not are listed in the assertion
    message so a failure points directly at the offending versions.
    """
    leaderboard_versions = frozenset(BENCHMARK_VERSION_LIST)
    available_versions = frozenset(BenchmarkTable.keys())
    # Compute the difference explicitly (rather than a bare issubset check)
    # so the failure message can name what is missing.
    missing_versions = leaderboard_versions - available_versions
    assert not missing_versions, (
        "versions listed in BENCHMARK_VERSION_LIST but absent from "
        f"BenchmarkTable: {sorted(missing_versions, key=str)}"
    )
def test_default_metrics():
    """Check that both default metrics are members of ``METRIC_LIST``."""
    # The QA default is checked first, then the long-doc default.
    for default_metric in (DEFAULT_METRIC_QA, DEFAULT_METRIC_LONG_DOC):
        assert default_metric in METRIC_LIST
|