sdpkjc committed on
Commit
c4a5ea7
·
verified ·
1 Parent(s): 03a99b5

pushing model

Browse files
.gitattributes CHANGED
@@ -42,3 +42,4 @@ videos/Walker2d-v4__ppo_fix_continuous_action__5__1704458010-eval/rl-video-episo
42
  videos/Walker2d-v4__ppo_fix_continuous_action__5__1704498502-eval/rl-video-episode-8.mp4 filter=lfs diff=lfs merge=lfs -text
43
  videos/Walker2d-v4__ppo_fix_continuous_action__5__1704498502-eval/rl-video-episode-1.mp4 filter=lfs diff=lfs merge=lfs -text
44
  videos/Walker2d-v4__ppo_fix_continuous_action__5__1704498502-eval/rl-video-episode-0.mp4 filter=lfs diff=lfs merge=lfs -text
 
 
42
  videos/Walker2d-v4__ppo_fix_continuous_action__5__1704498502-eval/rl-video-episode-8.mp4 filter=lfs diff=lfs merge=lfs -text
43
  videos/Walker2d-v4__ppo_fix_continuous_action__5__1704498502-eval/rl-video-episode-1.mp4 filter=lfs diff=lfs merge=lfs -text
44
  videos/Walker2d-v4__ppo_fix_continuous_action__5__1704498502-eval/rl-video-episode-0.mp4 filter=lfs diff=lfs merge=lfs -text
45
+ videos/Walker2d-v4__ppo_fix_continuous_action__5__1705721020-eval/rl-video-episode-0.mp4 filter=lfs diff=lfs merge=lfs -text
README.md CHANGED
@@ -16,7 +16,7 @@ model-index:
16
  type: Walker2d-v4
17
  metrics:
18
  - type: mean_reward
19
- value: 4924.31 +/- 1237.76
20
  name: mean_reward
21
  verified: false
22
  ---
@@ -46,7 +46,7 @@ curl -OL https://huggingface.co/sdpkjc/Walker2d-v4-ppo_fix_continuous_action-see
46
  curl -OL https://huggingface.co/sdpkjc/Walker2d-v4-ppo_fix_continuous_action-seed5/raw/main/pyproject.toml
47
  curl -OL https://huggingface.co/sdpkjc/Walker2d-v4-ppo_fix_continuous_action-seed5/raw/main/poetry.lock
48
  poetry install --all-extras
49
- python ppo_fix_continuous_action.py --save-model --upload-model --hf-entity sdpkjc --env-id Walker2d-v4 --seed 5 --track
50
  ```
51
 
52
  # Hyperparameters
@@ -56,7 +56,7 @@ python ppo_fix_continuous_action.py --save-model --upload-model --hf-entity sdpk
56
  'capture_video': False,
57
  'clip_coef': 0.2,
58
  'clip_vloss': True,
59
- 'cuda': True,
60
  'ent_coef': 0.0,
61
  'env_id': 'Walker2d-v4',
62
  'exp_name': 'ppo_fix_continuous_action',
 
16
  type: Walker2d-v4
17
  metrics:
18
  - type: mean_reward
19
+ value: 1457.49 +/- 811.87
20
  name: mean_reward
21
  verified: false
22
  ---
 
46
  curl -OL https://huggingface.co/sdpkjc/Walker2d-v4-ppo_fix_continuous_action-seed5/raw/main/pyproject.toml
47
  curl -OL https://huggingface.co/sdpkjc/Walker2d-v4-ppo_fix_continuous_action-seed5/raw/main/poetry.lock
48
  poetry install --all-extras
49
+ python ppo_fix_continuous_action.py --save-model --upload-model --hf-entity sdpkjc --env-id Walker2d-v4 --seed 5 --track --cuda False
50
  ```
51
 
52
  # Hyperparameters
 
56
  'capture_video': False,
57
  'clip_coef': 0.2,
58
  'clip_vloss': True,
59
+ 'cuda': False,
60
  'ent_coef': 0.0,
61
  'env_id': 'Walker2d-v4',
62
  'exp_name': 'ppo_fix_continuous_action',
events.out.tfevents.1704498509.4090-171.326604.0 → events.out.tfevents.1705721030.3090-172.2802263.0 RENAMED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:bf8dfc6862d55e236cdfdea7ee7b32ffb04e004e10f4f14bd13785b4d2f25ecc
3
- size 573863
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6279a7e79abe1861119b9dd2611ab27766decc58ba4c1098c0a8b49a29c29239
3
+ size 791356
ppo_fix_continuous_action.cleanrl_model CHANGED
Binary files a/ppo_fix_continuous_action.cleanrl_model and b/ppo_fix_continuous_action.cleanrl_model differ
 
ppo_fix_continuous_action.py CHANGED
@@ -198,7 +198,7 @@ class NormalizeReward(gym.core.Wrapper, gym.utils.RecordConstructorArgs):
198
  return obs, rews, terminateds, truncateds, infos
199
 
200
  def reset(self, **kwargs):
201
- self.returns = np.zeros(self.num_envs)
202
  return self.env.reset(**kwargs)
203
 
204
  def normalize(self, rews):
 
198
  return obs, rews, terminateds, truncateds, infos
199
 
200
  def reset(self, **kwargs):
201
+ # self.returns = np.zeros(self.num_envs)
202
  return self.env.reset(**kwargs)
203
 
204
  def normalize(self, rews):
replay.mp4 CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:6c538c3c9d4183120e0678895787edb25663ab5d14c8b2e3593fc9853735c5d9
3
- size 1334268
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8925ae3b805d55df0e466a055ad06056ffcbbe556795b353340370247e6fb683
3
+ size 279554
videos/Walker2d-v4__ppo_fix_continuous_action__5__1704498502-eval/rl-video-episode-1.mp4 DELETED
@@ -1,3 +0,0 @@
1
- version https://git-lfs.github.com/spec/v1
2
- oid sha256:20ed525788b193b6b795e5a60660b590d6e6ee388767822566aee42260186f8f
3
- size 1335012
 
 
 
 
videos/Walker2d-v4__ppo_fix_continuous_action__5__1704498502-eval/rl-video-episode-8.mp4 DELETED
@@ -1,3 +0,0 @@
1
- version https://git-lfs.github.com/spec/v1
2
- oid sha256:6c538c3c9d4183120e0678895787edb25663ab5d14c8b2e3593fc9853735c5d9
3
- size 1334268
 
 
 
 
videos/{Walker2d-v4__ppo_fix_continuous_action__5__1704498502-eval → Walker2d-v4__ppo_fix_continuous_action__5__1705721020-eval}/rl-video-episode-0.mp4 RENAMED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:7a6e6bae41f224bb8f45d64aa9675adb7d0348bb55897e7db23297c65ca03627
3
- size 1312361
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:690cb6a7c92c13cc9bd6b6c4934e39e0fb024837609dfa6ea9ca0c7b73cd40f4
3
+ size 1325646
videos/Walker2d-v4__ppo_fix_continuous_action__5__1705721020-eval/rl-video-episode-1.mp4 ADDED
Binary file (665 kB). View file
 
videos/Walker2d-v4__ppo_fix_continuous_action__5__1705721020-eval/rl-video-episode-8.mp4 ADDED
Binary file (280 kB). View file