atorre committed on
Commit
e3b78a9
1 Parent(s): 25301e0

Initial commit

Browse files
README.md CHANGED
@@ -16,7 +16,7 @@ model-index:
16
  type: SpaceInvadersNoFrameskip-v4
17
  metrics:
18
  - type: mean_reward
19
- value: 303.00 +/- 116.69
20
  name: mean_reward
21
  verified: false
22
  ---
@@ -71,8 +71,8 @@ OrderedDict([('batch_size', 32),
71
  ('frame_stack', 4),
72
  ('gradient_steps', 1),
73
  ('learning_rate', 0.0001),
74
- ('learning_starts', 10000),
75
- ('n_timesteps', 500000),
76
  ('optimize_memory_usage', False),
77
  ('policy', 'CnnPolicy'),
78
  ('target_update_interval', 1000),
 
16
  type: SpaceInvadersNoFrameskip-v4
17
  metrics:
18
  - type: mean_reward
19
+ value: 456.00 +/- 81.36
20
  name: mean_reward
21
  verified: false
22
  ---
 
71
  ('frame_stack', 4),
72
  ('gradient_steps', 1),
73
  ('learning_rate', 0.0001),
74
+ ('learning_starts', 100000),
75
+ ('n_timesteps', 1000000),
76
  ('optimize_memory_usage', False),
77
  ('policy', 'CnnPolicy'),
78
  ('target_update_interval', 1000),
args.yml CHANGED
@@ -54,7 +54,7 @@
54
  - - save_replay_buffer
55
  - false
56
  - - seed
57
- - 2988924314
58
  - - storage
59
  - null
60
  - - study_name
 
54
  - - save_replay_buffer
55
  - false
56
  - - seed
57
+ - 3326709419
58
  - - storage
59
  - null
60
  - - study_name
config.yml CHANGED
@@ -16,9 +16,9 @@
16
  - - learning_rate
17
  - 0.0001
18
  - - learning_starts
19
- - 10000
20
  - - n_timesteps
21
- - 500000
22
  - - optimize_memory_usage
23
  - false
24
  - - policy
 
16
  - - learning_rate
17
  - 0.0001
18
  - - learning_starts
19
+ - 100000
20
  - - n_timesteps
21
+ - 1000000
22
  - - optimize_memory_usage
23
  - false
24
  - - policy
dqn-SpaceInvadersNoFrameskip-v4.zip CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:acd4dcf0f363763849ff24272fbf27599c4389de0281adb2157fc9276e78a185
3
- size 27224799
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:bf206eabed56ae460ecae752a170ad1977098c5f567ebb69b78d5691dc59a7af
3
+ size 27224803
dqn-SpaceInvadersNoFrameskip-v4/data CHANGED
The diff for this file is too large to render. See raw diff
 
dqn-SpaceInvadersNoFrameskip-v4/policy.optimizer.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:00ba158e5da48771388dfc21c4d7644614d2f4095749eb0b22df3b6c90bcc065
3
  size 13505739
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b7f13798d1a73f951b12795708346c6a6ec3688e5e5c65fbe80d17926e92dcaf
3
  size 13505739
dqn-SpaceInvadersNoFrameskip-v4/policy.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:11041e6298dcb7a0a44169a82a82eb8df552549bab9e3d7535b07ea73740a0d0
3
  size 13504937
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ff232b43973129b4238aabd8a4eaecaf88f64c8a5eb555150227904a0ea5c4a0
3
  size 13504937
replay.mp4 CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:b09cc7553b32ead61e40e66b8ab1524695053eb100bcc97d95942acaed9db542
3
- size 233359
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:727221a0d972273ec948034a84889609b3a3977ab8efb84c5f524fb5cc584315
3
+ size 239848
results.json CHANGED
@@ -1 +1 @@
1
- {"mean_reward": 303.0, "std_reward": 116.68761716651858, "is_deterministic": false, "n_eval_episodes": 10, "eval_datetime": "2023-01-12T08:49:15.043707"}
 
1
+ {"mean_reward": 456.0, "std_reward": 81.35723692456621, "is_deterministic": false, "n_eval_episodes": 10, "eval_datetime": "2023-01-12T10:22:53.875978"}
train_eval_metrics.zip CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:3f3570630f549696b128148eea25cdf8d09ad25e56dc421f8f9a9ae365997812
3
- size 21283
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:df2c4703d9c285824858df5b2e815c228a617d81954ef2fc55f7441c2ec532ba
3
+ size 36539