pkalkman committed on
Commit
6da49d4
·
verified ·
1 Parent(s): 3a3adf1

Upload folder using huggingface_hub

Browse files
Files changed (3) hide show
  1. README.md +27 -39
  2. ppo_pong.zip +2 -2
  3. results.json +1 -1
README.md CHANGED
@@ -1,41 +1,29 @@
1
-
2
- # **PPO** Agent playing **PongNoFrameskip-v4**
3
-
4
- This is a trained model of a **PPO** agent playing **PongNoFrameskip-v4**.
5
-
6
  ---
7
- {
8
- "tags": [
9
- "PongNoFrameskip-v4",
10
- "ppo",
11
- "reinforcement-learning",
12
- "stable-baselines3",
13
- "deep-rl",
14
- "atari"
15
- ],
16
- "model-index": [
17
- {
18
- "name": "PPO Pong Atari",
19
- "results": [
20
- {
21
- "task": {
22
- "type": "reinforcement-learning",
23
- "name": "Pong"
24
- },
25
- "dataset": {
26
- "name": "PongNoFrameskip-v4",
27
- "type": "atari"
28
- },
29
- "metrics": [
30
- {
31
- "name": "Mean Reward",
32
- "type": "mean_reward",
33
- "value": "21.00 +/- 0.00"
34
- }
35
- ]
36
- }
37
- ]
38
- }
39
- ]
40
- }
41
  ---
 
 
 
 
 
 
 
 
 
 
 
 
 
1
  ---
2
+ tags:
3
+ - PongNoFrameskip-v4
4
+ - ppo
5
+ - reinforcement-learning
6
+ - stable-baselines3
7
+ - deep-rl
8
+ - atari
9
+ model-index:
10
+ - name: PPO Pong Atari
11
+ results:
12
+ - task:
13
+ type: reinforcement-learning
14
+ name: Pong
15
+ dataset:
16
+ name: PongNoFrameskip-v4
17
+ type: atari
18
+ metrics:
19
+ - name: Mean Reward
20
+ type: mean_reward
21
+ value: 21.00 +/- 0.00
 
 
 
 
 
 
 
 
 
 
 
 
 
 
22
  ---
23
+
24
+
25
+ # **PPO** Agent playing **PongNoFrameskip-v4**
26
+
27
+ This is a trained model of a **PPO** agent playing **PongNoFrameskip-v4**.
28
+
29
+ To learn how to use this model and train your own, check out the Deep Reinforcement Learning Course on [Hugging Face](https://huggingface.co/deep-rl-course).
ppo_pong.zip CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:9974534e114b6b7f4f61c4d8093c32a6a162b160fb3ab33b2f5d58edb55c43ae
3
- size 23100241
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1ce60ab54f7a1c69b4c971ea4c419c4cae54bf1bc01663073d460f0d3ccd47ae
3
+ size 23100621
results.json CHANGED
@@ -1 +1 @@
1
- {"env_id": "PongNoFrameskip-v4", "mean_reward": 21.0, "n_evaluation_episodes": 10, "eval_datetime": "2024-10-20T13:50:37.086070"}
 
1
+ {"env_id": "PongNoFrameskip-v4", "mean_reward": 21.0, "n_evaluation_episodes": 10, "eval_datetime": "2024-10-20T13:53:31.793001"}