Bishdata committed on
Commit
9b08cba
·
verified ·
1 Parent(s): 8f9378f

Initial commit

Browse files
Files changed (4) hide show
  1. README.md +3 -3
  2. dqn-EnduroNoFrameskip-v4.zip +2 -2
  3. replay.mp4 +2 -2
  4. results.json +1 -1
README.md CHANGED
@@ -16,7 +16,7 @@ model-index:
16
  type: EnduroNoFrameskip-v4
17
  metrics:
18
  - type: mean_reward
19
- value: 3.40 +/- 4.15
20
  name: mean_reward
21
  verified: false
22
  ---
@@ -63,7 +63,7 @@ python -m rl_zoo3.push_to_hub --algo dqn --env EnduroNoFrameskip-v4 -f logs/ -or
63
 
64
  ## Hyperparameters
65
  ```python
66
- OrderedDict([('batch_size', 100),
67
  ('buffer_size', 100000),
68
  ('env_wrapper',
69
  ['stable_baselines3.common.atari_wrappers.AtariWrapper']),
@@ -74,7 +74,7 @@ OrderedDict([('batch_size', 100),
74
  ('gradient_steps', 1),
75
  ('learning_rate', 0.00011447658254850165),
76
  ('learning_starts', 20000),
77
- ('n_timesteps', 100000.0),
78
  ('optimize_memory_usage', False),
79
  ('policy', 'CnnPolicy'),
80
  ('target_update_interval', 1000),
 
16
  type: EnduroNoFrameskip-v4
17
  metrics:
18
  - type: mean_reward
19
+ value: 155.30 +/- 17.60
20
  name: mean_reward
21
  verified: false
22
  ---
 
63
 
64
  ## Hyperparameters
65
  ```python
66
+ OrderedDict([('batch_size', 128),
67
  ('buffer_size', 100000),
68
  ('env_wrapper',
69
  ['stable_baselines3.common.atari_wrappers.AtariWrapper']),
 
74
  ('gradient_steps', 1),
75
  ('learning_rate', 0.00011447658254850165),
76
  ('learning_starts', 20000),
77
+ ('n_timesteps', 1000000.0),
78
  ('optimize_memory_usage', False),
79
  ('policy', 'CnnPolicy'),
80
  ('target_update_interval', 1000),
dqn-EnduroNoFrameskip-v4.zip CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:8dd948a45fbc88dff9d1de0528b2970b062b87795b6069556d6eb29e269c14d6
3
- size 27242497
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e7f7099c6b27e499cdc9940e4019456f78ec9235a0b0e51399066c102cd828d9
3
+ size 27245398
replay.mp4 CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:8c73c922f4d35f4a57a35399ced7c77d1143409b2b4ec751356c1682ea26af2f
3
- size 363896
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:db1fe135baf7c3dfcfc983087716daee0fa1147998b17afec7a56609041a8162
3
+ size 384000
results.json CHANGED
@@ -1 +1 @@
1
- {"mean_reward": 3.4, "std_reward": 4.1521078984053394, "is_deterministic": false, "n_eval_episodes": 10, "eval_datetime": "2024-12-08T11:43:47.026256"}
 
1
+ {"mean_reward": 155.3, "std_reward": 17.595738120351758, "is_deterministic": false, "n_eval_episodes": 10, "eval_datetime": "2024-12-08T14:07:05.057188"}