knight9114 committed on
Commit
22ca058
1 Parent(s): f87c44b

Upload config.json with huggingface_hub

Browse files
Files changed (1) hide show
  1. config.json +32 -19
config.json CHANGED
@@ -6,7 +6,7 @@
6
  "train_dir": "/home/knight/github/huggingface-deep-rl-course/unit8/train_dir",
7
  "restart_behavior": "resume",
8
  "device": "gpu",
9
- "seed": null,
10
  "num_policies": 1,
11
  "async_rl": true,
12
  "serial_mode": false,
@@ -17,7 +17,7 @@
17
  "max_policy_lag": 1000,
18
  "num_workers": 8,
19
  "num_envs_per_worker": 4,
20
- "batch_size": 1024,
21
  "num_batches_per_epoch": 1,
22
  "num_epochs": 1,
23
  "rollout": 32,
@@ -42,7 +42,7 @@
42
  "adam_eps": 1e-06,
43
  "adam_beta1": 0.9,
44
  "adam_beta2": 0.999,
45
- "max_grad_norm": 4.0,
46
  "learning_rate": 0.0001,
47
  "lr_schedule": "constant",
48
  "lr_schedule_kl_threshold": 0.008,
@@ -50,7 +50,7 @@
50
  "obs_scale": 255.0,
51
  "normalize_input": true,
52
  "normalize_input_keys": null,
53
- "decorrelate_experience_max_seconds": 0,
54
  "decorrelate_envs_on_one_worker": true,
55
  "actor_worker_gpus": [],
56
  "set_workers_cpu_affinity": true,
@@ -61,10 +61,10 @@
61
  "flush_summaries_interval": 30,
62
  "stats_avg": 100,
63
  "summaries_use_frameskip": true,
64
- "heartbeat_interval": 20,
65
- "heartbeat_reporting_interval": 600,
66
- "train_for_env_steps": 4000000,
67
- "train_for_seconds": 10000000000,
68
  "save_every_sec": 120,
69
  "keep_checkpoints": 2,
70
  "load_checkpoint_kind": "latest",
@@ -83,10 +83,10 @@
83
  ],
84
  "use_rnn": true,
85
  "rnn_size": 512,
86
- "rnn_type": "gru",
87
  "rnn_num_layers": 1,
88
  "decoder_mlp_layers": [],
89
- "nonlinearity": "elu",
90
  "policy_initialization": "orthogonal",
91
  "policy_init_gain": 1.0,
92
  "actor_critic_share_weights": true,
@@ -95,7 +95,6 @@
95
  "initial_stddev": 1.0,
96
  "use_env_info_cache": false,
97
  "env_gpu_actions": false,
98
- "env_gpu_observations": true,
99
  "env_frameskip": 4,
100
  "env_framestack": 1,
101
  "pixel_format": "CHW",
@@ -128,14 +127,28 @@
128
  "wide_aspect_ratio": false,
129
  "eval_env_frameskip": 1,
130
  "fps": 35,
131
- "command_line": "--env=doom_health_gathering_supreme --num_workers=8 --num_envs_per_worker=4 --train_for_env_steps=4000000",
132
  "cli_args": {
 
133
  "env": "doom_health_gathering_supreme",
 
 
 
 
134
  "num_workers": 8,
135
- "num_envs_per_worker": 4,
136
- "train_for_env_steps": 4000000
137
- },
138
- "git_hash": "unknown",
139
- "git_repo_name": "not a git repository",
140
- "train_script": ".home.knight.github.huggingface-deep-rl-course.unit8.venv.lib.python3.10.site-packages.ipykernel_launcher"
141
- }
 
 
 
 
 
 
 
 
 
 
6
  "train_dir": "/home/knight/github/huggingface-deep-rl-course/unit8/train_dir",
7
  "restart_behavior": "resume",
8
  "device": "gpu",
9
+ "seed": 2222,
10
  "num_policies": 1,
11
  "async_rl": true,
12
  "serial_mode": false,
 
17
  "max_policy_lag": 1000,
18
  "num_workers": 8,
19
  "num_envs_per_worker": 4,
20
+ "batch_size": 2048,
21
  "num_batches_per_epoch": 1,
22
  "num_epochs": 1,
23
  "rollout": 32,
 
42
  "adam_eps": 1e-06,
43
  "adam_beta1": 0.9,
44
  "adam_beta2": 0.999,
45
+ "max_grad_norm": 0.0,
46
  "learning_rate": 0.0001,
47
  "lr_schedule": "constant",
48
  "lr_schedule_kl_threshold": 0.008,
 
50
  "obs_scale": 255.0,
51
  "normalize_input": true,
52
  "normalize_input_keys": null,
53
+ "decorrelate_experience_max_seconds": 1,
54
  "decorrelate_envs_on_one_worker": true,
55
  "actor_worker_gpus": [],
56
  "set_workers_cpu_affinity": true,
 
61
  "flush_summaries_interval": 30,
62
  "stats_avg": 100,
63
  "summaries_use_frameskip": true,
64
+ "heartbeat_interval": 10,
65
+ "heartbeat_reporting_interval": 300,
66
+ "train_for_env_steps": 10000000000,
67
+ "train_for_seconds": 3600000,
68
  "save_every_sec": 120,
69
  "keep_checkpoints": 2,
70
  "load_checkpoint_kind": "latest",
 
83
  ],
84
  "use_rnn": true,
85
  "rnn_size": 512,
86
+ "rnn_type": "lstm",
87
  "rnn_num_layers": 1,
88
  "decoder_mlp_layers": [],
89
+ "nonlinearity": "relu",
90
  "policy_initialization": "orthogonal",
91
  "policy_init_gain": 1.0,
92
  "actor_critic_share_weights": true,
 
95
  "initial_stddev": 1.0,
96
  "use_env_info_cache": false,
97
  "env_gpu_actions": false,
 
98
  "env_frameskip": 4,
99
  "env_framestack": 1,
100
  "pixel_format": "CHW",
 
127
  "wide_aspect_ratio": false,
128
  "eval_env_frameskip": 1,
129
  "fps": 35,
130
+ "command_line": "--train_for_seconds=3600000 --algo=APPO --gamma=0.99 --use_rnn=True --num_workers=8 --num_envs_per_worker=12 --num_epochs=1 --rollout=32 --recurrence=32 --batch_size=2048 --benchmark=False --max_grad_norm=0.0 --decorrelate_experience_max_seconds=1 --nonlinearity=relu --rnn_type=lstm --num_policies=1 --heartbeat_reporting_interval=300 --train_dir=/home/knight/github/huggingface-deep-rl-course/unit8/train_dir --seed=2222 --experiment=default_experiment --env=doom_health_gathering_supreme",
131
  "cli_args": {
132
+ "algo": "APPO",
133
  "env": "doom_health_gathering_supreme",
134
+ "experiment": "default_experiment",
135
+ "train_dir": "/home/knight/github/huggingface-deep-rl-course/unit8/train_dir",
136
+ "seed": 2222,
137
+ "num_policies": 1,
138
  "num_workers": 8,
139
+ "num_envs_per_worker": 12,
140
+ "batch_size": 2048,
141
+ "num_epochs": 1,
142
+ "rollout": 32,
143
+ "recurrence": 32,
144
+ "gamma": 0.99,
145
+ "max_grad_norm": 0.0,
146
+ "decorrelate_experience_max_seconds": 1,
147
+ "heartbeat_reporting_interval": 300,
148
+ "train_for_seconds": 3600000,
149
+ "benchmark": false,
150
+ "use_rnn": true,
151
+ "rnn_type": "lstm",
152
+ "nonlinearity": "relu"
153
+ }
154
+ }