Cesar514 committed on
Commit
2b7f273
·
1 Parent(s): 8428173

Initial commit

Browse files
README.md CHANGED
@@ -16,7 +16,7 @@ model-index:
16
  type: SpaceInvadersNoFrameskip-v4
17
  metrics:
18
  - type: mean_reward
19
- value: 571.50 +/- 182.83
20
  name: mean_reward
21
  verified: false
22
  ---
@@ -58,16 +58,16 @@ python -m rl_zoo3.push_to_hub --algo dqn --env SpaceInvadersNoFrameskip-v4 -f lo
58
  ## Hyperparameters
59
  ```python
60
  OrderedDict([('batch_size', 32),
61
- ('buffer_size', 100000),
62
  ('env_wrapper',
63
  ['stable_baselines3.common.atari_wrappers.AtariWrapper']),
64
  ('exploration_final_eps', 0.01),
65
  ('exploration_fraction', 0.1),
66
  ('frame_stack', 4),
67
  ('gradient_steps', 1),
68
- ('learning_rate', 0.0001),
69
  ('learning_starts', 100000),
70
- ('n_timesteps', 1000000.0),
71
  ('optimize_memory_usage', False),
72
  ('policy', 'CnnPolicy'),
73
  ('target_update_interval', 1000),
 
16
  type: SpaceInvadersNoFrameskip-v4
17
  metrics:
18
  - type: mean_reward
19
+ value: 690.00 +/- 137.15
20
  name: mean_reward
21
  verified: false
22
  ---
 
58
  ## Hyperparameters
59
  ```python
60
  OrderedDict([('batch_size', 32),
61
+ ('buffer_size', 120000),
62
  ('env_wrapper',
63
  ['stable_baselines3.common.atari_wrappers.AtariWrapper']),
64
  ('exploration_final_eps', 0.01),
65
  ('exploration_fraction', 0.1),
66
  ('frame_stack', 4),
67
  ('gradient_steps', 1),
68
+ ('learning_rate', 0.00015),
69
  ('learning_starts', 100000),
70
+ ('n_timesteps', 3000000.0),
71
  ('optimize_memory_usage', False),
72
  ('policy', 'CnnPolicy'),
73
  ('target_update_interval', 1000),
args.yml CHANGED
@@ -18,7 +18,7 @@
18
  - - hyperparams
19
  - null
20
  - - log_folder
21
- - logs/
22
  - - log_interval
23
  - -1
24
  - - max_total_trials
@@ -54,7 +54,7 @@
54
  - - save_replay_buffer
55
  - false
56
  - - seed
57
- - 896005373
58
  - - storage
59
  - null
60
  - - study_name
 
18
  - - hyperparams
19
  - null
20
  - - log_folder
21
+ - content/drive/MyDrive/logs
22
  - - log_interval
23
  - -1
24
  - - max_total_trials
 
54
  - - save_replay_buffer
55
  - false
56
  - - seed
57
+ - 295434025
58
  - - storage
59
  - null
60
  - - study_name
config.yml CHANGED
@@ -2,7 +2,7 @@
2
  - - - batch_size
3
  - 32
4
  - - buffer_size
5
- - 100000
6
  - - env_wrapper
7
  - - stable_baselines3.common.atari_wrappers.AtariWrapper
8
  - - exploration_final_eps
@@ -14,11 +14,11 @@
14
  - - gradient_steps
15
  - 1
16
  - - learning_rate
17
- - 0.0001
18
  - - learning_starts
19
  - 100000
20
  - - n_timesteps
21
- - 1000000.0
22
  - - optimize_memory_usage
23
  - false
24
  - - policy
 
2
  - - - batch_size
3
  - 32
4
  - - buffer_size
5
+ - 120000
6
  - - env_wrapper
7
  - - stable_baselines3.common.atari_wrappers.AtariWrapper
8
  - - exploration_final_eps
 
14
  - - gradient_steps
15
  - 1
16
  - - learning_rate
17
+ - 0.00015
18
  - - learning_starts
19
  - 100000
20
  - - n_timesteps
21
+ - 3000000.0
22
  - - optimize_memory_usage
23
  - false
24
  - - policy
dqn-SpaceInvadersNoFrameskip-v4.zip CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:37bfe913b0a250a807117a693bb9178fd033a94b27065f52673b75ce196c7862
3
- size 27224788
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8ae9ad0217a4a60e3d4be1b77dde9f0834d5d92607fe1ed2c09ae7a1879e9eba
3
+ size 27224794
dqn-SpaceInvadersNoFrameskip-v4/_stable_baselines3_version CHANGED
@@ -1 +1 @@
1
- 1.6.2
 
1
+ 1.7.0a10
dqn-SpaceInvadersNoFrameskip-v4/data CHANGED
The diff for this file is too large to render. See raw diff
 
dqn-SpaceInvadersNoFrameskip-v4/policy.optimizer.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:4390e4ebf1b0f5fb6e228ae073f904d295423f1bce5779cda878bccbc5e98d39
3
  size 13505739
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1502a4590c32e1c137ae4f7e16e8f9dfb2eae1f0a21a5e08497c0ce767f0a1c7
3
  size 13505739
dqn-SpaceInvadersNoFrameskip-v4/policy.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:f7a038fe18dc0d284888c5882883b5f9de6fd859963cb248d5dcc7604d919b6a
3
  size 13504937
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:93a8854450947cd8c4405a35f67770ea5c22e4d52874d121693795ab05af50e5
3
  size 13504937
dqn-SpaceInvadersNoFrameskip-v4/system_info.txt CHANGED
@@ -1,6 +1,6 @@
1
  OS: Linux-5.10.133+-x86_64-with-glibc2.27 #1 SMP Fri Aug 26 08:44:51 UTC 2022
2
  Python: 3.8.16
3
- Stable-Baselines3: 1.6.2
4
  PyTorch: 1.13.0+cu116
5
  GPU Enabled: True
6
  Numpy: 1.21.6
 
1
  OS: Linux-5.10.133+-x86_64-with-glibc2.27 #1 SMP Fri Aug 26 08:44:51 UTC 2022
2
  Python: 3.8.16
3
+ Stable-Baselines3: 1.7.0a10
4
  PyTorch: 1.13.0+cu116
5
  GPU Enabled: True
6
  Numpy: 1.21.6
replay.mp4 CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:86213e6fbab24982dfe0a1602e29dcc8faffb6935df9c0e5c59f3014ad0e7963
3
- size 244536
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:593071b8860d99b8a6de71327cac6033f91ab512a745f742a6a3bed87849c0cb
3
+ size 220610
results.json CHANGED
@@ -1 +1 @@
1
- {"mean_reward": 571.5, "std_reward": 182.8257367002797, "is_deterministic": false, "n_eval_episodes": 10, "eval_datetime": "2022-12-20T14:13:41.785070"}
 
1
+ {"mean_reward": 690.0, "std_reward": 137.14955340794953, "is_deterministic": false, "n_eval_episodes": 10, "eval_datetime": "2022-12-23T17:47:30.715187"}
train_eval_metrics.zip CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:4f7045365a1bcd2357389ae8ea3433ef3c4fb72b780f8f3a3f12a68512c9bbf1
3
- size 37019
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5c665bf32867ac5d7026262c3c96566ad0104ae0b8725460a28f33fde3fabe53
3
+ size 90824