File size: 518 Bytes
51b9b31
 
d5581cc
52facf3
51b9b31
 
 
 
 
 
 
52facf3
51b9b31
52facf3
51b9b31
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
[
    {
        "agent_name": "GenericAgent-Llama-3.1-405b",
        "study_id": "d93a2398-2b70-41ce-b989-364fed988d73",
        "benchmark": "AssistantBench",
        "score": 3.9,
        "std_err": 1.0,
        "benchmark_specific": "No",
        "benchmark_tuned": "No",
        "followed_evaluation_protocol": "Yes",
        "reproducible": "Yes",
        "comments": "Intersection of finished tasks across agents.",
        "original_or_reproduced": "Original",
        "date_time": "2024-11-28 19:34:58"
    }
]