Spaces:

acozma
/

CS581-Algos-Demo

Sleeping

Andrei Cozma committed on Apr 25, 2023

Commit

a33a97c

1 Parent(s): 64d4eec

Updates

Files changed (1) hide show

AgentBase.py CHANGED Viewed

@@ -104,8 +104,6 @@ class AgentBase:
         i = 0
         # Generate an episode following the current policy
         while i < max_steps and not solved and not done:
-            # Render the environment if needed
-            rgb_array = self.env.render() if render else None
             # Sample the next action from the policy
             action = self.choose_action(policy, state, **kwargs)
             # Keeping track of the trajectory
@@ -123,6 +121,9 @@ class AgentBase:
             # Generate the output at intermediate steps for the demo
             yield episode_hist, solved, rgb_array
             # For CliffWalking-v0 and Taxi-v3, the episode is solved when it terminates
             if done and self.env_name in ["CliffWalking-v0", "Taxi-v3"]:
                 solved = True

         i = 0
         # Generate an episode following the current policy
         while i < max_steps and not solved and not done:
             # Sample the next action from the policy
             action = self.choose_action(policy, state, **kwargs)
             # Keeping track of the trajectory
             # Generate the output at intermediate steps for the demo
             yield episode_hist, solved, rgb_array
+            # Render the environment if needed
+            rgb_array = self.env.render() if render else None
             # For CliffWalking-v0 and Taxi-v3, the episode is solved when it terminates
             if done and self.env_name in ["CliffWalking-v0", "Taxi-v3"]:
                 solved = True