# instructblip/lavis/tasks/multimodal_classification.py
"""
Copyright (c) 2022, salesforce.com, inc.
All rights reserved.
SPDX-License-Identifier: BSD-3-Clause
For full license text, see the LICENSE file in the repo root or https://opensource.org/licenses/BSD-3-Clause
"""
import json
import os
import logging
import inspect
import numpy as np
import torch
from lavis.common.dist_utils import main_process
from lavis.common.registry import registry
from lavis.tasks.base_task import BaseTask


@registry.register_task("multimodal_classification")
class MultimodalClassificationTask(BaseTask):
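    """
    Multimodal classification task: runs model.predict on each evaluation batch
    and reports accuracy over the saved per-instance predictions.
    """
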
    def __init__(self, max_len, min_len, length_penalty, segments):
        super().__init__()

        self.max_len = max_len
        self.min_len = min_len
        self.length_penalty = length_penalty
        self.segments = segments
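
    # setup_task: read the decoding options (max_len, min_len, length_penalty)
    # and the number of prediction segments from cfg.run_cfg, falling back to
    # the defaults below when a key is absent.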
    @classmethod
    def setup_task(cls, cfg):
        run_cfg = cfg.run_cfg

        max_len = run_cfg.get("max_len", 30)
        min_len = run_cfg.get("min_len", 1)
        length_penalty = run_cfg.get("length_penalty", -1.0)
        segments = run_cfg.get("segments", 1)

        return cls(
            max_len=max_len,
            min_len=min_len,
            length_penalty=length_penalty,
            segments=segments,
        )
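
    # valid_step: run model.predict on one batch and collect one result dict per
    # instance ({inst_id_key, "prediction", "target"}); handles both string
    # (generative) and logit (discriminative) prediction outputs.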
    def valid_step(self, model, samples):
        results = []

        argspec = inspect.getfullargspec(model.predict)
        # check if model allows for generation arguments in classification
        if all(k in argspec.args for k in ["max_length", "min_length", "length_penalty"]):
            outputs = model.predict(
                samples,
                max_length=self.max_len,
                min_length=self.min_len,
                length_penalty=self.length_penalty,
            )
        else:
            outputs = model.predict(samples, n_segments=self.segments)

        if outputs is None:  # missing data
            return {}

        predictions = outputs["predictions"]

        if isinstance(predictions[0], str):
            # generated-text predictions: compare directly against string labels
            targets = samples["label"]
            indices = samples[self.inst_id_key]

            for pred, tgt, index in zip(predictions, targets, indices):
                results.append(
                    {
                        self.inst_id_key: index,
                        "prediction": pred,
                        "target": tgt,
                    }
                )
        else:
            # logit predictions: take the argmax class index per sample
            targets = outputs["targets"]

            predictions = predictions.max(1)[1].cpu().numpy()
            targets = targets.cpu().numpy()
            indices = samples[self.inst_id_key]

            for pred, tgt, index in zip(predictions, targets, indices):
                if isinstance(index, torch.Tensor):
                    index = index.item()

                results.append(
                    {
                        self.inst_id_key: index,
                        "prediction": pred.item(),
                        "target": tgt.item(),
                    }
                )

        return results
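
    # after_evaluation: save per-instance results (deduplicated on inst_id_key)
    # to the result directory, then report metrics from the saved file.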
    def after_evaluation(self, val_result, split_name, epoch, **kwargs):
        eval_result_file = self.save_result(
            result=val_result,
            result_dir=registry.get_path("result_dir"),
            filename="{}_epoch{}".format(split_name, epoch),
            remove_duplicate=self.inst_id_key,
        )

        metrics = self._report_metrics(
            eval_result_file=eval_result_file, split_name=split_name
        )

        return metrics
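
    # _report_metrics: accuracy over the saved results; runs on the main process
    # only and appends the per-split metrics to evaluate.txt in the output dir.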
    @main_process
    def _report_metrics(self, eval_result_file, split_name):
        with open(eval_result_file) as f:
            results = json.load(f)

        predictions = np.array([res["prediction"] for res in results])
        targets = np.array([res["target"] for res in results])

        accuracy = (targets == predictions).sum() / targets.shape[0]
        metrics = {"agg_metrics": accuracy, "acc": accuracy}

        log_stats = {split_name: {k: v for k, v in metrics.items()}}

        with open(
            os.path.join(registry.get_path("output_dir"), "evaluate.txt"), "a"
        ) as f:
            f.write(json.dumps(log_stats) + "\n")

        logging.info(metrics)

        return metrics
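

if __name__ == "__main__":
    # Minimal usage sketch, not part of the original LAVIS file: it assumes
    # omegaconf is available (LAVIS uses it for its configs) and simply mirrors
    # the run_cfg keys read in setup_task above, with their default values.
    from omegaconf import OmegaConf

    cfg = OmegaConf.create(
        {"run_cfg": {"max_len": 30, "min_len": 1, "length_penalty": -1.0, "segments": 1}}
    )
    task = MultimodalClassificationTask.setup_task(cfg)
    print(task.max_len, task.min_len, task.length_penalty, task.segments)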