|
import json
from typing import Optional
|
|
|
def get_log_url(model_name: str, log_file_name: Optional[str]) -> Optional[str]:
    """Return the log-viewer URL for a model's benchmark log file.

    Args:
        model_name: Model identifier; inserted as a path segment of the URL.
        log_file_name: Name of the log file. A trailing ``.json`` extension
            is swapped for ``.eval``. ``None`` or ``""`` means that no log
            is available.

    Returns:
        The URL of the log viewer page for the file, or ``None`` when no
        log file name was supplied.
    """
    # Treat None and "" alike: an empty name would otherwise produce a URL
    # with a dangling "log_file=logs/logs/" query.
    if not log_file_name:
        return None

    json_suffix = ".json"
    if log_file_name.endswith(json_suffix):
        # Swap only the trailing extension; str.replace would also rewrite
        # any ".json" that happens to appear earlier in the name.
        log_file_name = log_file_name[: -len(json_suffix)] + ".eval"

    return f"https://storage.googleapis.com/inspect-evals/eval/{model_name}/index.html?log_file=logs/logs/{log_file_name}"
|
|
|
def main():
    """Annotate every task result with a link to its evaluation log.

    Reads ``data/results.json`` and ``data/inspect_log_file_names.json``,
    sets a ``log_url`` key on each task entry found under every model's
    ``"results"`` mapping (``None`` when no log file name is recorded for
    that model/task pair), and writes the merged structure to
    ``data/results_with_logs.json``.

    Raises:
        KeyError: If a model entry in the results file has no ``"results"``
            key.
    """
    # Explicit UTF-8 so that reading the JSON inputs does not depend on the
    # platform's locale encoding.
    with open("data/results.json", "r", encoding="utf-8") as f:
        results = json.load(f)

    with open("data/inspect_log_file_names.json", "r", encoding="utf-8") as f:
        log_files = json.load(f)

    for model_name, model_data in results.items():
        # `or {}` also covers a model whose entry is present but null.
        model_logs = log_files.get(model_name) or {}

        for task_name, task_data in model_data["results"].items():
            log_file_name = model_logs.get(task_name)

            # Missing or empty log file names are recorded as an explicit
            # None so every task entry carries a "log_url" key.
            if log_file_name:
                task_data["log_url"] = get_log_url(model_name, log_file_name)
            else:
                task_data["log_url"] = None

    with open("data/results_with_logs.json", "w", encoding="utf-8") as f:
        json.dump(results, f, indent=4)
|
|
|
# Run the merge only when this file is executed as a script, not when it is
# imported as a module.
if __name__ == "__main__":
    main()