Spaces:

abby101
/

surveyor-0

Sleeping

File size: 4,769 Bytes

a2b5ed5

import json
import logging
import os
import torch

from config import DEFAULT_RES_DIR as RES_DIR

from accelerate import (
    infer_auto_device_map,
    init_empty_weights,
    Accelerator,
    load_checkpoint_and_dispatch,
)
from transformers import AutoTokenizer, AutoModelForCausalLM, AutoConfig


def save_results(
    out_dir_path,
    all_inputs,
    gold_tags,
    predicted_responses,
    predicted_tags,
    metrics,
    runtype,
    append=False,
):
    mode = "a" if append else "w"

    with open(
        os.path.join(RES_DIR, out_dir_path, "prompts.txt"), mode, encoding="utf-8"
    ) as f:
        for input, gold_tag, pred_response, pred_tag in zip(
            all_inputs, gold_tags, predicted_responses, predicted_tags
        ):
            f.write(f"{input}\n")
            f.write(f"True Tag: {gold_tag}\n")
            f.write(f"Predicted Response: {pred_response}\n")
            f.write(f"Predicted Tag: {pred_tag}\n")
            f.write("#" * 50 + "\n")

    with open(
        os.path.join(RES_DIR, out_dir_path, "predicted_responses.txt"),
        mode,
        encoding="utf-8",
    ) as f:
        for response in predicted_responses:
            f.write(f"{response}\n")
            f.write("#" * 50 + "\n")

    if append:
        with open(os.path.join(RES_DIR, out_dir_path, "predictions.json"), "r+") as f:
            data = json.load(f)
            data["predicted_tags"].extend(predicted_tags)
            f.seek(0)
            json.dump(data, f, indent=4)
            f.truncate()
    else:
        with open(os.path.join(RES_DIR, out_dir_path, "predictions.json"), "w") as f:
            json.dump({"predicted_tags": predicted_tags}, f, indent=4)

    if runtype == "eval":
        if append:
            with open(
                os.path.join(RES_DIR, out_dir_path, "ground_truth.json"), "r+"
            ) as f:
                data = json.load(f)
                data["gold_tags"].extend(gold_tag)
                f.seek(0)
                json.dump(data, f, indent=4)
                f.truncate()
        else:
            with open(
                os.path.join(RES_DIR, out_dir_path, "ground_truth.json"), "w"
            ) as f:
                json.dump({"gold_tags": gold_tags}, f, indent=4)

    with open(os.path.join(RES_DIR, out_dir_path, "metrics.json"), "w") as f:
        json.dump({"metrics": metrics, "prompt_file": "prompts.txt"}, f, indent=4)

    logging.info(f"Results saved in: {os.path.join(RES_DIR, out_dir_path)}")


def save_best_config(metrics, config):
    best_config_path = os.path.join(RES_DIR, "best_config.json")
    if os.path.exists(best_config_path):
        with open(best_config_path, "r") as f:
            best_config = json.load(f)
        if metrics["precision"] > best_config["metrics"]["precision"]:
            best_config = {"metrics": metrics, "config": config}
    else:
        best_config = {"metrics": metrics, "config": config}

    with open(best_config_path, "w") as f:
        json.dump(best_config, f, indent=4)


def load_sweep_config(config_path="sweep_config.json"):
    with open(config_path, "r") as f:
        return json.load(f)


# def load_model_and_tokenizer(model_id: str):
#     accelerator = Accelerator()

#     tokenizer = AutoTokenizer.from_pretrained(model_id, padding_side="left")
#     # device_map = infer_auto_device_map(model, max_memory=max_memory)

#     if tokenizer.pad_token_id is None:
#         tokenizer.pad_token_id = tokenizer.eos_token_id

#     model = AutoModelForCausalLM.from_pretrained(
#         model_id,
#         torch_dtype=torch.bfloat16,
#         device_map="auto",
#         token=os.getenv("HF_TOKEN"),
#     )

#     model, tokenizer = accelerator.prepare(model, tokenizer)

#     return model, tokenizer


def clear_cuda_cache():
    if torch.cuda.is_available():
        torch.cuda.empty_cache()
        torch.cuda.memory.reset_max_memory_allocated()
        torch.cuda.memory.reset_max_memory_cached()


def load_model_and_tokenizer(model_id):
    # Set up memory-saving options
    torch.cuda.empty_cache()
    torch.backends.cuda.matmul.allow_tf32 = True
    torch.backends.cudnn.allow_tf32 = True

    # Initialize tokenizer
    tokenizer = AutoTokenizer.from_pretrained(
        model_id, padding_side="left", use_auth_token=os.getenv("HF_TOKEN")
    )
    if tokenizer.pad_token_id is None:
        tokenizer.pad_token_id = tokenizer.eos_token_id

    # Load configuration
    config = AutoConfig.from_pretrained(model_id, use_auth_token=os.getenv("HF_TOKEN"))

    # Load model
    model = AutoModelForCausalLM.from_pretrained(
        model_id,
        config=config,
        torch_dtype=torch.float16,
        use_auth_token=os.getenv("HF_TOKEN"),
        device_map="auto",
    )

    return model, tokenizer