File size: 1,426 Bytes
ca5fb3d
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
import json
import os

from collections import defaultdict


def _collect_task_logs(input_path, log_file_map):
    """Record the log file name of every task found under *input_path*.

    Each sub-directory of *input_path* is treated as one model. Every file
    inside it is parsed as JSON, and the last "/"-separated component of
    ``result["eval"]["task"]`` is used as the task name.

    Args:
        input_path: Directory containing one sub-directory per model.
        log_file_map: Mapping ``{model_name: {task_name: log_file_name}}``
            that is updated in place. Entries for a model that is already
            present are merged, not replaced.

    Raises:
        FileNotFoundError: If *input_path* does not exist.
        json.JSONDecodeError: If a log file is not valid JSON.
        KeyError: If a log file lacks the ``eval`` / ``task`` keys.
    """
    # os.listdir returns entries in arbitrary order; sorting keeps the output
    # stable between runs and makes the winner deterministic when several
    # logs share a task name (the lexicographically last file name wins).
    for model_name in sorted(os.listdir(input_path)):
        model_dir = os.path.join(input_path, model_name)
        if not os.path.isdir(model_dir):
            # Stray files next to the model directories are not models.
            continue
        # setdefault lets a model that appears in only one of the input
        # directories be registered without raising KeyError.
        model_logs = log_file_map.setdefault(model_name, {})
        for task_log_file in sorted(os.listdir(model_dir)):
            log_path = os.path.join(model_dir, task_log_file)
            with open(log_path, "r", encoding="utf-8") as f:
                result = json.load(f)
            task_name = result["eval"]["task"].split("/")[-1]
            model_logs[task_name] = task_log_file


def main():
    """Build a model -> task -> log-file-name index and write it as JSON.

    Scans ``./base_benchmarking_logs`` and then
    ``./agentic_benchmarking_logs`` (so an agentic log overrides a base log
    with the same model and task name) and writes the combined mapping to
    ``./inspect_log_file_names.json``.
    """
    base_bm_input_path = "./base_benchmarking_logs"
    agentic_bm_input_path = "./agentic_benchmarking_logs"

    log_file_map = {}
    _collect_task_logs(base_bm_input_path, log_file_map)
    _collect_task_logs(agentic_bm_input_path, log_file_map)

    with open("./inspect_log_file_names.json", "w", encoding="utf-8") as f:
        json.dump(log_file_map, f, indent=4)


# Run main() only when this file is executed as a script, not when imported.
if __name__ == "__main__":
    main()