import json
import logging
import os

import torch
from config import DEFAULT_RES_DIR as RES_DIR

# accelerate is only used by the commented-out loader kept below for reference.
from accelerate import (
    infer_auto_device_map,
    init_empty_weights,
    Accelerator,
    load_checkpoint_and_dispatch,
)
from transformers import AutoTokenizer, AutoModelForCausalLM, AutoConfig


def save_results(
    out_dir_path,
    all_inputs,
    gold_tags,
    predicted_responses,
    predicted_tags,
    metrics,
    runtype,
    append=False,
):
    """Write prompts, responses, and predictions under RES_DIR/out_dir_path.

    With append=True, the text files are appended to and the JSON files are
    read, extended, and rewritten in place.
    """
    mode = "a" if append else "w"
    with open(
        os.path.join(RES_DIR, out_dir_path, "prompts.txt"), mode, encoding="utf-8"
    ) as f:
        # `prompt` rather than `input`, to avoid shadowing the built-in.
        for prompt, gold_tag, pred_response, pred_tag in zip(
            all_inputs, gold_tags, predicted_responses, predicted_tags
        ):
            f.write(f"{prompt}\n")
            f.write(f"True Tag: {gold_tag}\n")
            f.write(f"Predicted Response: {pred_response}\n")
            f.write(f"Predicted Tag: {pred_tag}\n")
            f.write("#" * 50 + "\n")
    with open(
        os.path.join(RES_DIR, out_dir_path, "predicted_responses.txt"),
        mode,
        encoding="utf-8",
    ) as f:
        for response in predicted_responses:
            f.write(f"{response}\n")
            f.write("#" * 50 + "\n")
    if append:
        with open(os.path.join(RES_DIR, out_dir_path, "predictions.json"), "r+") as f:
            data = json.load(f)
            data["predicted_tags"].extend(predicted_tags)
            # Rewind and rewrite in place, truncating any leftover bytes.
            f.seek(0)
            json.dump(data, f, indent=4)
            f.truncate()
    else:
        with open(os.path.join(RES_DIR, out_dir_path, "predictions.json"), "w") as f:
            json.dump({"predicted_tags": predicted_tags}, f, indent=4)
    if runtype == "eval":
        if append:
            with open(
                os.path.join(RES_DIR, out_dir_path, "ground_truth.json"), "r+"
            ) as f:
                data = json.load(f)
                data["gold_tags"].extend(gold_tags)
                f.seek(0)
                json.dump(data, f, indent=4)
                f.truncate()
        else:
            with open(
                os.path.join(RES_DIR, out_dir_path, "ground_truth.json"), "w"
            ) as f:
                json.dump({"gold_tags": gold_tags}, f, indent=4)
        with open(os.path.join(RES_DIR, out_dir_path, "metrics.json"), "w") as f:
            json.dump({"metrics": metrics, "prompt_file": "prompts.txt"}, f, indent=4)
    logging.info(f"Results saved in: {os.path.join(RES_DIR, out_dir_path)}")


def save_best_config(metrics, config):
    """Persist the highest-precision run's metrics and config to
    RES_DIR/best_config.json, replacing the stored entry only on improvement."""
    best_config_path = os.path.join(RES_DIR, "best_config.json")
    if os.path.exists(best_config_path):
        with open(best_config_path, "r") as f:
            best_config = json.load(f)
        if metrics["precision"] > best_config["metrics"]["precision"]:
            best_config = {"metrics": metrics, "config": config}
    else:
        best_config = {"metrics": metrics, "config": config}
    with open(best_config_path, "w") as f:
        json.dump(best_config, f, indent=4)
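
# Example call (illustrative values; only the "precision" key is compared):
#     save_best_config({"precision": 0.91, "recall": 0.88}, {"temperature": 0.7})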


def load_sweep_config(config_path="sweep_config.json"):
    with open(config_path, "r") as f:
        return json.load(f)
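
# Illustrative sketch only: the actual keys in sweep_config.json are defined by
# the sweep driver, not by this module. A file of the hypothetical form below
# would round-trip through load_sweep_config():
#
#     {
#         "temperature": [0.2, 0.7, 1.0],
#         "max_new_tokens": [64, 128]
#     }
#
# e.g. sweep = load_sweep_config(), then iterate over the listed values.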


# Earlier accelerate-based loader, kept for reference:
# def load_model_and_tokenizer(model_id: str):
#     accelerator = Accelerator()
#     tokenizer = AutoTokenizer.from_pretrained(model_id, padding_side="left")
#     # device_map = infer_auto_device_map(model, max_memory=max_memory)
#     if tokenizer.pad_token_id is None:
#         tokenizer.pad_token_id = tokenizer.eos_token_id
#     model = AutoModelForCausalLM.from_pretrained(
#         model_id,
#         torch_dtype=torch.bfloat16,
#         device_map="auto",
#         token=os.getenv("HF_TOKEN"),
#     )
#     model, tokenizer = accelerator.prepare(model, tokenizer)
#     return model, tokenizer


def clear_cuda_cache():
    """Release cached CUDA memory and reset peak-memory statistics."""
    if torch.cuda.is_available():
        torch.cuda.empty_cache()
        # reset_max_memory_allocated/reset_max_memory_cached are deprecated
        # aliases; reset_peak_memory_stats covers both counters.
        torch.cuda.reset_peak_memory_stats()


def load_model_and_tokenizer(model_id):
    """Load a causal LM and its tokenizer in fp16, sharded across available
    devices via device_map="auto"."""
    # Memory-saving options: free cached blocks and allow TF32 matmuls.
    torch.cuda.empty_cache()
    torch.backends.cuda.matmul.allow_tf32 = True
    torch.backends.cudnn.allow_tf32 = True
    # Left padding so batched generation aligns prompts at the right edge.
    # `token` replaces the deprecated `use_auth_token` argument.
    tokenizer = AutoTokenizer.from_pretrained(
        model_id, padding_side="left", token=os.getenv("HF_TOKEN")
    )
    if tokenizer.pad_token_id is None:
        tokenizer.pad_token_id = tokenizer.eos_token_id
    # Load configuration
    config = AutoConfig.from_pretrained(model_id, token=os.getenv("HF_TOKEN"))
    # Load model
    model = AutoModelForCausalLM.from_pretrained(
        model_id,
        config=config,
        torch_dtype=torch.float16,
        token=os.getenv("HF_TOKEN"),
        device_map="auto",
    )
    return model, tokenizer
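

# Minimal usage sketch (assumes a real HF model id and that RES_DIR/"demo"
# exists; "gpt2" and the toy tags below are placeholders, not project values):
#
#     model, tokenizer = load_model_and_tokenizer("gpt2")
#     save_results(
#         "demo",
#         all_inputs=["Classify: great movie!"],
#         gold_tags=["positive"],
#         predicted_responses=["positive"],
#         predicted_tags=["positive"],
#         metrics={"precision": 1.0},
#         runtype="eval",
#     )
#     clear_cuda_cache()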