Spaces:

sabretoothedhugs
/

Distributional-RL-Benchmark-v2

Sleeping

sabretoothedhugs committed on Jul 8, 2024

Commit

2befa79

1 Parent(s): 80a5e58

pong added

Files changed (7) hide show

app.py CHANGED Viewed

@@ -393,7 +393,10 @@ def display_choice(algo, game,slider):
                     mean_scores = test_c51(config_c51)
                 case "Pong" :
-                    return 19
         case "FQF":
           config_fqf["seed"] = slider
@@ -404,7 +407,9 @@ def display_choice(algo, game,slider):
                     mean_scores = test_FQF(config_fqf)
                 case "Pong" :
-                    return 20
         case "FQF-Rainbow":
             config_fqf_r["seed"] = slider
@@ -415,7 +420,9 @@ def display_choice(algo, game,slider):
                     mean_scores = test_fqf_rainbow(config_fqf_r)
                 case "Pong" :
-                    return 21
@@ -429,7 +436,7 @@ def display_choice(algo, game,slider):
 # Define the choices for the radio buttons
 algos = ["C51", "FQF", "FQF-Rainbow"]
 # games = ["Pong", "Space Invaders","Freeway","MsPacman"]
-games = ["Freeway"]
 # Create a Gradio Interface
@@ -440,10 +447,10 @@ demo = gr.Interface(
     title="Distributional RL Algorithms Benchmark",
     description="Select the DRL agent and the game of your choice",
     theme="soft",
-    # examples=[["FQF","Pong",31],
-    #           ["C51","Space Invaders",31],
-    #           ["FQF-Rainbow","Freeway",31]
-    #           ]
 )
 # Launch the Gradio app

                     mean_scores = test_c51(config_c51)
                 case "Pong" :
+                    config_c51["resume_path"] = "models/c51_pong.pth"
+                    config_c51["task"] = "PongNoFrameskip-v4"
+                    mean_scores = test_c51(config_c51)
         case "FQF":
           config_fqf["seed"] = slider
                     mean_scores = test_FQF(config_fqf)
                 case "Pong" :
+                    config_fqf["resume_path"] = "models/fqf_pong.pth"
+                    config_fqf["task"] = "PongNoFrameskip-v4"
+                    mean_scores = test_FQF(config_fqf)
         case "FQF-Rainbow":
             config_fqf_r["seed"] = slider
                     mean_scores = test_fqf_rainbow(config_fqf_r)
                 case "Pong" :
+                    config_fqf_r["resume_path"] = "models/fqf-rainbow_pong.pth"
+                    config_fqf_r["task"] = "PongNoFrameskip-v4"
+                    mean_scores = test_fqf_rainbow(config_fqf_r)
 # Define the choices for the radio buttons
 algos = ["C51", "FQF", "FQF-Rainbow"]
 # games = ["Pong", "Space Invaders","Freeway","MsPacman"]
+games = ["Freeway","Pong"]
 # Create a Gradio Interface
     title="Distributional RL Algorithms Benchmark",
     description="Select the DRL agent and the game of your choice",
     theme="soft",
+    examples=[["FQF","Pong",31],
+              ["C51","Freeway",31],
+              ["FQF-Rainbow","Freeway",31]
+              ]
 )
 # Launch the Gradio app

models/c51_pong.pth ADDED Viewed

+version https://git-lfs.github.com/spec/v1
+oid sha256:eb1c19a7ba5a20837b23f3d35e0887ccb872dcf046272baf234de90afee2079e
+size 14735486

models/fqf-rainbow_pong.pth ADDED Viewed

+version https://git-lfs.github.com/spec/v1
+oid sha256:7f6f5f6f11294aecb49492be954b2cb55c2f1f3f1dfcf0c8b0844dc10c9d5c68
+size 67072998

models/fqf_pong.pth ADDED Viewed

+version https://git-lfs.github.com/spec/v1
+oid sha256:a7b5790f7beec93552a965aa3d877cd381103bf8d8c8132e155c9c8e965ad7d2
+size 15538854

video-app/rl-video-episode-0.mp4 CHANGED Viewed

Binary files a/video-app/rl-video-episode-0.mp4 and b/video-app/rl-video-episode-0.mp4 differ

video-app/rl-video-episode-1.meta.json CHANGED Viewed

	@@ -1 +1 @@
1	- {"step_id": 2044, "episode_id": 1, "content_type": "video/mp4"}


1	+ {"step_id": 1647, "episode_id": 1, "content_type": "video/mp4"}

video-app/rl-video-episode-1.mp4 CHANGED Viewed

Binary files a/video-app/rl-video-episode-1.mp4 and b/video-app/rl-video-episode-1.mp4 differ