Added videos of the best model from the most recent run

Files changed (5)

record_video.py CHANGED Viewed

@@ -1,12 +1,12 @@
 import gymnasium as gym
 from stable_baselines3 import DQN
-from stable_baselines3.common.monitor import Monitor
 from stable_baselines3.common.vec_env import VecVideoRecorder, DummyVecEnv, VecEnv
 model_name = "agents/dqn_v2-8/best_model" # path to model, should be an argument
 env_id = "ALE/Pacman-v5"
 video_folder = "videos/"
-video_length = 100000 #steps by hard coding this, I can almost ensure only one episode is recorded...
 vec_env = DummyVecEnv([lambda: gym.make(env_id, render_mode="rgb_array")])
 model = DQN.load(model_name)
@@ -29,11 +29,11 @@ vec_env = VecVideoRecorder(vec_env,
                            video_folder,
                            record_video_trigger=lambda x: x == 0,
                            video_length=video_length,
-                           name_prefix=f"video-{model_name}"
                            )
 #  Once I make the environment, now I need to walk through it...???
 #   I want to act according to the policy that has been trained
-obs = vec_env.reset()
 print(vec_env)
 # for _ in range(video_length + 1):
 #   action, states = model.predict(obs)
@@ -50,4 +50,5 @@ while end == True:
     print("exiting loop")
     end = False
 # # Save the video
 vec_env.close()

 import gymnasium as gym
 from stable_baselines3 import DQN
+# from stable_baselines3.common.monitor import Monitor
 from stable_baselines3.common.vec_env import VecVideoRecorder, DummyVecEnv, VecEnv
 model_name = "agents/dqn_v2-8/best_model" # path to model, should be an argument
 env_id = "ALE/Pacman-v5"
 video_folder = "videos/"
+video_length = 10000 #steps by hard coding this, I can almost ensure only one episode is recorded...
 vec_env = DummyVecEnv([lambda: gym.make(env_id, render_mode="rgb_array")])
 model = DQN.load(model_name)
                            video_folder,
                            record_video_trigger=lambda x: x == 0,
                            video_length=video_length,
+                           name_prefix="one-episode_v2-8_bestmodel"
                            )
 #  Once I make the environment, now I need to walk through it...???
 #   I want to act according to the policy that has been trained
+vec_env.reset()
 print(vec_env)
 # for _ in range(video_length + 1):
 #   action, states = model.predict(obs)
     print("exiting loop")
     end = False
 # # Save the video
 vec_env.close()

videos/one-episode_v2-8_bestmodel-step-0-to-step-10000.meta.json ADDED Viewed

	@@ -0,0 +1 @@


1	+ {"step_id": 0, "content_type": "video/mp4"}

videos/one-episode_v2-8_bestmodel-step-0-to-step-10000.mp4 ADDED Viewed

+version https://git-lfs.github.com/spec/v1
+oid sha256:3884da6b0fbf91b475e9fa9bc9ea1d5a9771c89dba1ca699a22f6ec4cc5de6db
+size 178260

videos/v2-8_bestmodel-step-0-to-step-10000.meta.json ADDED Viewed

	@@ -0,0 +1 @@


1	+ {"step_id": 0, "content_type": "video/mp4"}

videos/v2-8_bestmodel-step-0-to-step-10000.mp4 ADDED Viewed

+version https://git-lfs.github.com/spec/v1
+oid sha256:cf95394d8893382c21a7fa1f03a16ad1393fcb0804de19a076ef7adaaa032819
+size 1458975