pableitorr
committed on
Update hyperparameters.json
Browse files - hyperparameters.json +2 -9
hyperparameters.json
CHANGED
@@ -1,26 +1,19 @@
|
|
1 |
-
{"exp_name": "ppo",
|
2 |
-
"
|
3 |
"wandb_project_name": "cleanRL",
|
4 |
-
"wandb_entity": None,
|
5 |
-
"capture_video": False,
|
6 |
"env_id": "LunarLander-v2",
|
7 |
"total_timesteps": 2000000,
|
8 |
"learning_rate": 0.00035,
|
9 |
"num_envs": 4,
|
10 |
"num_steps": 1024,
|
11 |
-
"anneal_lr": True,
|
12 |
-
"gae": True,
|
13 |
"gamma": 0.999,
|
14 |
"gae_lambda": 0.98,
|
15 |
"num_minibatches": 4,
|
16 |
"update_epochs": 4,
|
17 |
-
"norm_adv": True,
|
18 |
"clip_coef": 0.2,
|
19 |
-
"clip_vloss": True,
|
20 |
"ent_coef": 0.01,
|
21 |
"vf_coef": 0.5,
|
22 |
"max_grad_norm": 0.5,
|
23 |
-
"target_kl": None,
|
24 |
"repo_id": "pableitorr/LunarLander-v2-UNIT8",
|
25 |
"batch_size": 4096,
|
26 |
"minibatch_size": 1024}
|
|
|
1 |
+
{"exp_name": "ppo",
|
2 |
+
"seed": 1,
|
3 |
"wandb_project_name": "cleanRL",
|
|
|
|
|
4 |
"env_id": "LunarLander-v2",
|
5 |
"total_timesteps": 2000000,
|
6 |
"learning_rate": 0.00035,
|
7 |
"num_envs": 4,
|
8 |
"num_steps": 1024,
|
|
|
|
|
9 |
"gamma": 0.999,
|
10 |
"gae_lambda": 0.98,
|
11 |
"num_minibatches": 4,
|
12 |
"update_epochs": 4,
|
|
|
13 |
"clip_coef": 0.2,
|
|
|
14 |
"ent_coef": 0.01,
|
15 |
"vf_coef": 0.5,
|
16 |
"max_grad_norm": 0.5,
|
|
|
17 |
"repo_id": "pableitorr/LunarLander-v2-UNIT8",
|
18 |
"batch_size": 4096,
|
19 |
"minibatch_size": 1024}
|