Spaces:

mccaly
/

test

Running

App Files Files Community

test / FoodSeg103 /.dev /gather_models.py

mccaly

Upload 2805 files

985cc7f about 1 year ago

raw

history blame

6.97 kB

	import argparse
	import glob
	import json
	import os
	import os.path as osp
	import shutil
	import subprocess

	import mmcv
	import torch

	# build schedule look-up table to automatically find the final model
	RESULTS_LUT = ['mIoU', 'mAcc', 'aAcc']


	def process_checkpoint(in_file, out_file):
	checkpoint = torch.load(in_file, map_location='cpu')
	# remove optimizer for smaller file size
	if 'optimizer' in checkpoint:
	del checkpoint['optimizer']
	# if it is necessary to remove some sensitive data in checkpoint['meta'],
	# add the code here.
	torch.save(checkpoint, out_file)
	sha = subprocess.check_output(['sha256sum', out_file]).decode()
	final_file = out_file.rstrip('.pth') + '-{}.pth'.format(sha[:8])
	subprocess.Popen(['mv', out_file, final_file])
	return final_file


	def get_final_iter(config):
	iter_num = config.split('_')[-2]
	assert iter_num.endswith('k')
	return int(iter_num[:-1]) * 1000


	def get_final_results(log_json_path, iter_num):
	result_dict = dict()
	with open(log_json_path, 'r') as f:
	for line in f.readlines():
	log_line = json.loads(line)
	if 'mode' not in log_line.keys():
	continue

	if log_line['mode'] == 'train' and log_line['iter'] == iter_num:
	result_dict['memory'] = log_line['memory']

	if log_line['iter'] == iter_num:
	result_dict.update({
	key: log_line[key]
	for key in RESULTS_LUT if key in log_line
	})
	return result_dict


	def parse_args():
	parser = argparse.ArgumentParser(description='Gather benchmarked models')
	parser.add_argument(
	'root',
	type=str,
	help='root path of benchmarked models to be gathered')
	parser.add_argument(
	'config',
	type=str,
	help='root path of benchmarked configs to be gathered')
	parser.add_argument(
	'out_dir',
	type=str,
	help='output path of gathered models to be stored')
	parser.add_argument('out_file', type=str, help='the output json file name')
	parser.add_argument(
	'--filter', type=str, nargs='+', default=[], help='config filter')
	parser.add_argument(
	'--all', action='store_true', help='whether include .py and .log')

	args = parser.parse_args()
	return args


	def main():
	args = parse_args()
	models_root = args.root
	models_out = args.out_dir
	config_name = args.config
	mmcv.mkdir_or_exist(models_out)

	# find all models in the root directory to be gathered
	raw_configs = list(mmcv.scandir(config_name, '.py', recursive=True))

	# filter configs that is not trained in the experiments dir
	used_configs = []
	for raw_config in raw_configs:
	work_dir = osp.splitext(osp.basename(raw_config))[0]
	if osp.exists(osp.join(models_root, work_dir)):
	used_configs.append((work_dir, raw_config))
	print(f'Find {len(used_configs)} models to be gathered')

	# find final_ckpt and log file for trained each config
	# and parse the best performance
	model_infos = []
	for used_config, raw_config in used_configs:
	bypass = True
	for p in args.filter:
	if p in used_config:
	bypass = False
	break
	if bypass:
	continue
	exp_dir = osp.join(models_root, used_config)
	# check whether the exps is finished
	final_iter = get_final_iter(used_config)
	final_model = 'iter_{}.pth'.format(final_iter)
	model_path = osp.join(exp_dir, final_model)

	# skip if the model is still training
	if not osp.exists(model_path):
	print(f'{used_config} train not finished yet')
	continue

	# get logs
	log_json_paths = glob.glob(osp.join(exp_dir, '*.log.json'))
	log_json_path = log_json_paths[0]
	model_performance = None
	for idx, _log_json_path in enumerate(log_json_paths):
	model_performance = get_final_results(_log_json_path, final_iter)
	if model_performance is not None:
	log_json_path = _log_json_path
	break

	if model_performance is None:
	print(f'{used_config} model_performance is None')
	continue

	model_time = osp.split(log_json_path)[-1].split('.')[0]
	model_infos.append(
	dict(
	config=used_config,
	raw_config=raw_config,
	results=model_performance,
	iters=final_iter,
	model_time=model_time,
	log_json_path=osp.split(log_json_path)[-1]))

	# publish model for each checkpoint
	publish_model_infos = []
	for model in model_infos:
	model_publish_dir = osp.join(models_out,
	model['raw_config'].rstrip('.py'))
	model_name = osp.split(model['config'])[-1].split('.')[0]

	publish_model_path = osp.join(model_publish_dir,
	model_name + '_' + model['model_time'])
	trained_model_path = osp.join(models_root, model['config'],
	'iter_{}.pth'.format(model['iters']))
	if osp.exists(model_publish_dir):
	for file in os.listdir(model_publish_dir):
	if file.endswith('.pth'):
	print(f'model {file} found')
	model['model_path'] = osp.abspath(
	osp.join(model_publish_dir, file))
	break
	if 'model_path' not in model:
	print(f'dir {model_publish_dir} exists, no model found')

	else:
	mmcv.mkdir_or_exist(model_publish_dir)

	# convert model
	final_model_path = process_checkpoint(trained_model_path,
	publish_model_path)
	model['model_path'] = final_model_path

	new_json_path = f'{model_name}-{model["log_json_path"]}'
	# copy log
	shutil.copy(
	osp.join(models_root, model['config'], model['log_json_path']),
	osp.join(model_publish_dir, new_json_path))
	if args.all:
	new_txt_path = new_json_path.rstrip('.json')
	shutil.copy(
	osp.join(models_root, model['config'],
	model['log_json_path'].rstrip('.json')),
	osp.join(model_publish_dir, new_txt_path))

	if args.all:
	# copy config to guarantee reproducibility
	raw_config = osp.join(config_name, model['raw_config'])
	mmcv.Config.fromfile(raw_config).dump(
	osp.join(model_publish_dir, osp.basename(raw_config)))

	publish_model_infos.append(model)

	models = dict(models=publish_model_infos)
	mmcv.dump(models, osp.join(models_out, args.out_file))


	if __name__ == '__main__':
	main()