pmolodo committed on
Commit
1390546
·
1 Parent(s): 7c96119

Initial commit

Browse files
README.md CHANGED
@@ -16,7 +16,7 @@ model-index:
16
  type: SpaceInvadersNoFrameskip-v4
17
  metrics:
18
  - type: mean_reward
19
- value: 137.00 +/- 76.88
20
  name: mean_reward
21
  verified: false
22
  ---
@@ -43,13 +43,13 @@ pip install rl_zoo3
43
 
44
  ```
45
  # Download model and save it into the logs/ folder
46
- python -m rl_zoo3.load_from_hub --algo dqn --env SpaceInvadersNoFrameskip-v4 -orga pmolodo -f logs/
47
  python -m rl_zoo3.enjoy --algo dqn --env SpaceInvadersNoFrameskip-v4 -f logs/
48
  ```
49
 
50
  If you installed the RL Zoo3 via pip (`pip install rl_zoo3`), from anywhere you can do:
51
  ```
52
- python -m rl_zoo3.load_from_hub --algo dqn --env SpaceInvadersNoFrameskip-v4 -orga pmolodo -f logs/
53
  python -m rl_zoo3.enjoy --algo dqn --env SpaceInvadersNoFrameskip-v4 -f logs/
54
  ```
55
 
@@ -57,7 +57,7 @@ python -m rl_zoo3.enjoy --algo dqn --env SpaceInvadersNoFrameskip-v4 -f logs/
57
  ```
58
  python -m rl_zoo3.train --algo dqn --env SpaceInvadersNoFrameskip-v4 -f logs/
59
  # Upload the model and generate video (when possible)
60
- python -m rl_zoo3.push_to_hub --algo dqn --env SpaceInvadersNoFrameskip-v4 -f logs/ -orga pmolodo
61
  ```
62
 
63
  ## Hyperparameters
 
16
  type: SpaceInvadersNoFrameskip-v4
17
  metrics:
18
  - type: mean_reward
19
+ value: 320.00 +/- 86.46
20
  name: mean_reward
21
  verified: false
22
  ---
 
43
 
44
  ```
45
  # Download model and save it into the logs/ folder
46
+ python -m rl_zoo3.load_from_hub --algo dqn --env SpaceInvadersNoFrameskip-v4 -orga PMOLODO -f logs/
47
  python -m rl_zoo3.enjoy --algo dqn --env SpaceInvadersNoFrameskip-v4 -f logs/
48
  ```
49
 
50
  If you installed the RL Zoo3 via pip (`pip install rl_zoo3`), from anywhere you can do:
51
  ```
52
+ python -m rl_zoo3.load_from_hub --algo dqn --env SpaceInvadersNoFrameskip-v4 -orga PMOLODO -f logs/
53
  python -m rl_zoo3.enjoy --algo dqn --env SpaceInvadersNoFrameskip-v4 -f logs/
54
  ```
55
 
 
57
  ```
58
  python -m rl_zoo3.train --algo dqn --env SpaceInvadersNoFrameskip-v4 -f logs/
59
  # Upload the model and generate video (when possible)
60
+ python -m rl_zoo3.push_to_hub --algo dqn --env SpaceInvadersNoFrameskip-v4 -f logs/ -orga PMOLODO
61
  ```
62
 
63
  ## Hyperparameters
args.yml CHANGED
@@ -9,6 +9,8 @@
9
  - SpaceInvadersNoFrameskip-v4
10
  - - env_kwargs
11
  - null
 
 
12
  - - eval_episodes
13
  - 5
14
  - - eval_freq
@@ -54,7 +56,7 @@
54
  - - save_replay_buffer
55
  - false
56
  - - seed
57
- - 225160754
58
  - - storage
59
  - null
60
  - - study_name
 
9
  - SpaceInvadersNoFrameskip-v4
10
  - - env_kwargs
11
  - null
12
+ - - eval_env_kwargs
13
+ - null
14
  - - eval_episodes
15
  - 5
16
  - - eval_freq
 
56
  - - save_replay_buffer
57
  - false
58
  - - seed
59
+ - 1432731666
60
  - - storage
61
  - null
62
  - - study_name
dqn-SpaceInvadersNoFrameskip-v4.zip CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:c7af21b2be18110a0f250f79493c84dd34aa5402dc2302ba595f5933f26becd7
3
- size 27220212
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c03c93dfeeb2247656e9132ec61879f1fe4b822cccce1f88c90d696d8dc64138
3
+ size 27218922
dqn-SpaceInvadersNoFrameskip-v4/data CHANGED
The diff for this file is too large to render. See raw diff
 
dqn-SpaceInvadersNoFrameskip-v4/policy.optimizer.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:e5cebdc1d3829537a93bea496d34261357496c7434322497e928957b0528a630
3
- size 13505852
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2492567e69e1eb38a0bf62d2573af8ec0029e6e71984a799f99a63c218ab196a
3
+ size 13505419
dqn-SpaceInvadersNoFrameskip-v4/policy.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:cb1dbd2b88c171116432f2ada3affeb6dcb1bc95eee2c702e6f1840cc36162e2
3
- size 13505178
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d75453013dd2d878fb3736a8e70d6cb4c27249e301c2b50068623f2778cb02b0
3
+ size 13504745
dqn-SpaceInvadersNoFrameskip-v4/pytorch_variables.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:0c35cea3b2e60fb5e7e162d3592df775cd400e575a31c72f359fb9e654ab00c5
3
- size 864
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d030ad8db708280fcae77d87e973102039acd23a11bdecc3db8eb6c0ac940ee1
3
+ size 431
dqn-SpaceInvadersNoFrameskip-v4/system_info.txt CHANGED
@@ -1,7 +1,7 @@
1
- - OS: Linux-6.1.85+-x86_64-with-glibc2.35 # 1 SMP PREEMPT_DYNAMIC Sun Apr 28 14:29:16 UTC 2024
2
  - Python: 3.10.12
3
  - Stable-Baselines3: 2.3.2
4
- - PyTorch: 2.3.0+cu121
5
  - GPU Enabled: False
6
  - Numpy: 1.25.2
7
  - Cloudpickle: 2.2.1
 
1
+ - OS: Linux-5.10.16.3-microsoft-standard-WSL2-x86_64-with-glibc2.35 # 1 SMP Fri Apr 2 22:23:49 UTC 2021
2
  - Python: 3.10.12
3
  - Stable-Baselines3: 2.3.2
4
+ - PyTorch: 2.0.0.post101
5
  - GPU Enabled: False
6
  - Numpy: 1.25.2
7
  - Cloudpickle: 2.2.1
replay.mp4 CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:caca9ffe7b51a1ac3663454be4ba5a99228c84afc6854edb44ad4300ee957d60
3
- size 261751
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:da78c1893795ae372d2322de97b4d9313a3b37a30e610ea2b75692c186761ea7
3
+ size 236375
results.json CHANGED
@@ -1 +1 @@
1
- {"mean_reward": 137.0, "std_reward": 76.8830280361017, "is_deterministic": false, "n_eval_episodes": 10, "eval_datetime": "2024-05-23T15:53:46.571288"}
 
1
+ {"mean_reward": 320.0, "std_reward": 86.45808232895291, "is_deterministic": false, "n_eval_episodes": 10, "eval_datetime": "2024-05-24T13:29:11.883030"}
train_eval_metrics.zip CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:678f42d8caa4ee6bfab16248659145d345b3aca03e98df879eb6bb68dfadc4aa
3
- size 6261
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6d14c59a8af82eac7b6778d71e06d19fa1a31ac3ae90331d875ab51795bec920
3
+ size 10207