import torch


class MultipleLRSchedulers:
    """A wrapper for multiple learning rate schedulers.

    Every time :meth:`~tianshou.utils.MultipleLRSchedulers.step` is called,
    it calls the step() method of each of the schedulers that it contains.
    Example usage:
    ::

        scheduler1 = ConstantLR(opt1, factor=0.1, total_iters=2)
        scheduler2 = ExponentialLR(opt2, gamma=0.9)
        scheduler = MultipleLRSchedulers(scheduler1, scheduler2)
        policy = PPOPolicy(..., lr_scheduler=scheduler)
    """

    def __init__(self, *args: torch.optim.lr_scheduler.LRScheduler):
        self.schedulers = args

    def step(self) -> None:
        """Take a step in each of the learning rate schedulers."""
        for scheduler in self.schedulers:
            scheduler.step()

    def state_dict(self) -> list[dict]:
        """Get state_dict for each of the learning rate schedulers.

        :return: A list of state_dict of learning rate schedulers.
        """
        return [s.state_dict() for s in self.schedulers]

    def load_state_dict(self, state_dict: list[dict]) -> None:
        """Load states from state_dict.

        :param state_dict: A list of learning rate scheduler
            state_dict, in the same order as the schedulers.
        """
        for s, sd in zip(self.schedulers, state_dict, strict=True):
            s.__dict__.update(sd)
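
# A minimal usage sketch (not part of the wrapper itself): it assumes two
# torch optimizers over dummy linear modules and shows how stepping and the
# state_dict round trip behave. The names net1/net2/opt1/opt2 are
# illustrative, not taken from the module above.
if __name__ == "__main__":
    net1 = torch.nn.Linear(4, 4)
    net2 = torch.nn.Linear(4, 4)
    opt1 = torch.optim.Adam(net1.parameters(), lr=1e-3)
    opt2 = torch.optim.Adam(net2.parameters(), lr=1e-3)
    scheduler1 = torch.optim.lr_scheduler.ConstantLR(opt1, factor=0.1, total_iters=2)
    scheduler2 = torch.optim.lr_scheduler.ExponentialLR(opt2, gamma=0.9)
    schedulers = MultipleLRSchedulers(scheduler1, scheduler2)

    # Each call to step() advances every wrapped scheduler once;
    # the optimizers are stepped first to avoid the torch warning.
    for _ in range(3):
        opt1.step()
        opt2.step()
        schedulers.step()

    # state_dict() returns one dict per scheduler, and load_state_dict()
    # expects them back in the same order as the schedulers were given.
    saved = schedulers.state_dict()
    schedulers.load_state_dict(saved)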