ppo-CarRacing-v0 / wrappers / initial_step_truncate_wrapper.py

PPO playing CarRacing-v0 from https://github.com/sgoodfriend/rl-algo-impls/tree/5598ebc4b03054f16eebe76792486ba7bcacfc5c

0ca6846 over 2 years ago

948 Bytes

	import gym
	import numpy as np

	from gym.wrappers.monitoring.video_recorder import VideoRecorder
	from typing import Any, Dict, Tuple, Union

	ObsType = Union[np.ndarray, dict]
	ActType = Union[int, float, np.ndarray, dict]


	class InitialStepTruncateWrapper(gym.Wrapper):
	    """Report one forced ``done`` after a fixed number of initial steps.

	    The wrapper counts calls to :meth:`step` starting from construction.
	    When the count reaches ``initial_steps_to_truncate`` it overrides the
	    wrapped environment's ``done`` flag with ``True`` exactly once; every
	    later transition is passed through untouched.

	    This class does not override ``reset``, so the step count is not
	    cleared by it and keeps running across any episode boundaries that
	    happen before the forced truncation.

	    NOTE(review): presumably used to de-synchronise episode boundaries
	    across several parallel environments -- confirm against the callers.

	    Args:
	        env: The environment to wrap. It must use the 4-tuple step API
	            ``(obs, reward, done, info)``.
	        initial_steps_to_truncate: Number of steps after which the single
	            forced ``done`` is emitted. Any value ``<= 0`` disables the
	            truncation entirely.
	    """

	    def __init__(self, env: gym.Env, initial_steps_to_truncate: int) -> None:
	        super().__init__(env)
	        self.initial_steps_to_truncate = initial_steps_to_truncate
	        # A non-positive budget leaves nothing to truncate. Testing only for
	        # ``== 0`` would let a negative value force ``done`` on the very
	        # first step, so treat every value <= 0 as "already initialized".
	        self.initialized = initial_steps_to_truncate <= 0
	        # Steps taken so far; only advanced while the truncation is pending.
	        self.steps = 0

	    def step(self, action: ActType) -> Tuple[ObsType, float, bool, Dict[str, Any]]:
	        """Step the wrapped environment, forcing ``done`` once if it is due.

	        Args:
	            action: Action forwarded unchanged to the wrapped environment.

	        Returns:
	            The wrapped environment's ``(obs, reward, done, info)`` tuple.
	            On the step where the initial budget is exhausted, ``done`` is
	            ``True`` and, if the environment had not finished on its own,
	            ``info["TimeLimit.truncated"]`` is set to ``True``.
	        """
	        obs, rew, done, info = self.env.step(action)
	        if self.initialized:
	            # The one-off truncation already happened (or was disabled).
	            return obs, rew, done, info

	        self.steps += 1
	        if self.steps >= self.initial_steps_to_truncate:
	            print(f"Truncation at {self.steps} steps")
	            if not done:
	                # Mark the cut-off as artificial, following the convention
	                # of Gym's TimeLimit wrapper, so consumers can tell it from
	                # a real terminal state. If the environment ended on its
	                # own this step, any existing flag is left untouched.
	                info["TimeLimit.truncated"] = True
	            done = True
	            self.initialized = True
	        return obs, rew, done, info