monti-python committed on
Commit
6cf71e3
1 Parent(s): 1aa339a

First training for SnowballTarget

Browse files
SnowballTarget/events.out.tfevents.1721473267.Montana.27072.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f7c3475beff39aea916c9ac6e5e319dcde1f712dd9f2f4c624dc02f06a6aa32f
3
+ size 1114
config.json CHANGED
@@ -1 +1 @@
1
- {"default_settings": null, "behaviors": {"SnowballTarget": {"trainer_type": "ppo", "hyperparameters": {"batch_size": 128, "buffer_size": 2048, "learning_rate": 0.0003, "beta": 0.005, "epsilon": 0.2, "lambd": 0.95, "num_epoch": 3, "shared_critic": false, "learning_rate_schedule": "linear", "beta_schedule": "linear", "epsilon_schedule": "linear"}, "checkpoint_interval": 50000, "network_settings": {"normalize": false, "hidden_units": 256, "num_layers": 2, "vis_encode_type": "simple", "memory": null, "goal_conditioning_type": "hyper", "deterministic": false}, "reward_signals": {"extrinsic": {"gamma": 0.99, "strength": 1.0, "network_settings": {"normalize": false, "hidden_units": 128, "num_layers": 2, "vis_encode_type": "simple", "memory": null, "goal_conditioning_type": "hyper", "deterministic": false}}}, "init_path": null, "keep_checkpoints": 10, "even_checkpoints": false, "max_steps": 200000, "time_horizon": 64, "summary_freq": 10000, "threaded": true, "self_play": null, "behavioral_cloning": null}}, "env_settings": {"env_path": "./training-envs-executables/linux/SnowballTarget/SnowballTarget.x86_64", "env_args": null, "base_port": 5005, "num_envs": 1, "num_areas": 1, "timeout_wait": 60, "seed": -1, "max_lifetime_restarts": 10, "restarts_rate_limit_n": 1, "restarts_rate_limit_period_s": 60}, "engine_settings": {"width": 84, "height": 84, "quality_level": 5, "time_scale": 20, "target_frame_rate": -1, "capture_frame_rate": 60, "no_graphics": true}, "environment_parameters": null, "checkpoint_settings": {"run_id": "SnowballTarget1", "initialize_from": null, "load_model": false, "resume": false, "force": true, "train_model": false, "inference": false, "results_dir": "results"}, "torch_settings": {"device": null}, "debug": false}
 
1
+ {"default_settings": null, "behaviors": {"SnowballTarget": {"trainer_type": "ppo", "hyperparameters": {"batch_size": 128, "buffer_size": 2048, "learning_rate": 0.0003, "beta": 0.005, "epsilon": 0.2, "lambd": 0.95, "num_epoch": 3, "shared_critic": false, "learning_rate_schedule": "linear", "beta_schedule": "linear", "epsilon_schedule": "linear"}, "checkpoint_interval": 50000, "network_settings": {"normalize": false, "hidden_units": 256, "num_layers": 2, "vis_encode_type": "simple", "memory": null, "goal_conditioning_type": "hyper", "deterministic": false}, "reward_signals": {"extrinsic": {"gamma": 0.99, "strength": 1.0, "network_settings": {"normalize": false, "hidden_units": 128, "num_layers": 2, "vis_encode_type": "simple", "memory": null, "goal_conditioning_type": "hyper", "deterministic": false}}}, "init_path": null, "keep_checkpoints": 10, "even_checkpoints": false, "max_steps": 200000, "time_horizon": 64, "summary_freq": 10000, "threaded": true, "self_play": null, "behavioral_cloning": null}}, "env_settings": {"env_path": "./training-envs-executables/linux/SnowballTarget/SnowballTarget.x86_64", "env_args": null, "base_port": 5005, "num_envs": 1, "num_areas": 1, "timeout_wait": 60, "seed": -1, "max_lifetime_restarts": 10, "restarts_rate_limit_n": 1, "restarts_rate_limit_period_s": 60}, "engine_settings": {"width": 84, "height": 84, "quality_level": 5, "time_scale": 20, "target_frame_rate": -1, "capture_frame_rate": 60, "no_graphics": true}, "environment_parameters": null, "checkpoint_settings": {"run_id": "SnowballTarget1", "initialize_from": null, "load_model": false, "resume": true, "force": false, "train_model": false, "inference": false, "results_dir": "results"}, "torch_settings": {"device": null}, "debug": false}
configuration.yaml CHANGED
@@ -68,8 +68,8 @@ checkpoint_settings:
68
  run_id: SnowballTarget1
69
  initialize_from: null
70
  load_model: false
71
- resume: false
72
- force: true
73
  train_model: false
74
  inference: false
75
  results_dir: results
 
68
  run_id: SnowballTarget1
69
  initialize_from: null
70
  load_model: false
71
+ resume: true
72
+ force: false
73
  train_model: false
74
  inference: false
75
  results_dir: results
run_logs/Player-0.log CHANGED
@@ -22,7 +22,7 @@ ERROR: Shader Standard shader is not supported on this GPU (none of subshaders/f
22
  WARNING: Shader Unsupported: 'Standard' - All subshaders removed
23
  WARNING: Shader Did you use #pragma only_renderers and omit this platform?
24
  WARNING: Shader If subshaders removal was intentional, you may have forgotten turning Fallback off?
25
- UnloadTime: 0.378228 ms
26
  ERROR: Shader UI/Default shader is not supported on this GPU (none of subshaders/fallbacks are suitable)
27
  requesting resize 84 x 84
28
  Setting up 4 worker threads for Enlighten.
@@ -30,7 +30,7 @@ Memory Statistics:
30
  [ALLOC_TEMP_TLS] TLS Allocator
31
  StackAllocators :
32
  [ALLOC_TEMP_MAIN]
33
- Peak usage frame count: [8.0 KB-16.0 KB]: 5371 frames, [16.0 KB-32.0 KB]: 91 frames, [2.0 MB-4.0 MB]: 1 frames
34
  Initial Block Size 4.0 MB
35
  Current Block Size 4.0 MB
36
  Peak Allocated Bytes 2.0 MB
@@ -53,12 +53,12 @@ Memory Statistics:
53
  [ALLOC_TEMP_Job.Worker 6]
54
  Initial Block Size 256.0 KB
55
  Current Block Size 256.0 KB
56
- Peak Allocated Bytes 3.6 KB
57
  Overflow Count 0
58
  [ALLOC_TEMP_Job.Worker 0]
59
  Initial Block Size 256.0 KB
60
  Current Block Size 256.0 KB
61
- Peak Allocated Bytes 3.6 KB
62
  Overflow Count 0
63
  [ALLOC_TEMP_Background Job.Worker 10]
64
  Initial Block Size 32.0 KB
@@ -73,7 +73,7 @@ Memory Statistics:
73
  [ALLOC_TEMP_Job.Worker 5]
74
  Initial Block Size 256.0 KB
75
  Current Block Size 256.0 KB
76
- Peak Allocated Bytes 3.6 KB
77
  Overflow Count 0
78
  [ALLOC_TEMP_Background Job.Worker 14]
79
  Initial Block Size 32.0 KB
@@ -88,12 +88,12 @@ Memory Statistics:
88
  [ALLOC_TEMP_Job.Worker 4]
89
  Initial Block Size 256.0 KB
90
  Current Block Size 256.0 KB
91
- Peak Allocated Bytes 3.6 KB
92
  Overflow Count 0
93
  [ALLOC_TEMP_Job.Worker 3]
94
  Initial Block Size 256.0 KB
95
  Current Block Size 256.0 KB
96
- Peak Allocated Bytes 3.6 KB
97
  Overflow Count 0
98
  [ALLOC_TEMP_Background Job.Worker 12]
99
  Initial Block Size 32.0 KB
@@ -143,12 +143,12 @@ Memory Statistics:
143
  [ALLOC_TEMP_Job.Worker 1]
144
  Initial Block Size 256.0 KB
145
  Current Block Size 256.0 KB
146
- Peak Allocated Bytes 3.6 KB
147
  Overflow Count 0
148
  [ALLOC_TEMP_Job.Worker 2]
149
  Initial Block Size 256.0 KB
150
  Current Block Size 256.0 KB
151
- Peak Allocated Bytes 3.6 KB
152
  Overflow Count 0
153
  [ALLOC_TEMP_Background Job.Worker 3]
154
  Initial Block Size 32.0 KB
@@ -176,22 +176,22 @@ Memory Statistics:
176
  Peak Allocated Bytes 0 B
177
  Overflow Count 0
178
  [ALLOC_DEFAULT] Dual Thread Allocator
179
- Peak main deferred allocation count 40
180
  [ALLOC_BUCKET]
181
  Large Block size 4.0 MB
182
  Used Block count 1
183
  Peak Allocated bytes 1.0 MB
184
  [ALLOC_DEFAULT_MAIN]
185
- Peak usage frame count: [4.0 MB-8.0 MB]: 5463 frames
186
  Requested Block Size 16.0 MB
187
  Peak Block count 1
188
- Peak Allocated memory 6.8 MB
189
  Peak Large allocation bytes 0 B
190
  [ALLOC_DEFAULT_THREAD]
191
- Peak usage frame count: [16.0 MB-32.0 MB]: 5463 frames
192
  Requested Block Size 16.0 MB
193
  Peak Block count 1
194
- Peak Allocated memory 17.7 MB
195
  Peak Large allocation bytes 16.0 MB
196
  [ALLOC_TEMP_JOB_1_FRAME]
197
  Initial Block Size 2.0 MB
@@ -205,7 +205,7 @@ Memory Statistics:
205
  Overflow Count (full) 0
206
  [ALLOC_TEMP_JOB_4_FRAMES (JobTemp)]
207
  Initial Block Size 2.0 MB
208
- Used Block Count 2
209
  Overflow Count (too large) 0
210
  Overflow Count (full) 0
211
  [ALLOC_TEMP_JOB_ASYNC (Background)]
@@ -220,13 +220,13 @@ Memory Statistics:
220
  Used Block count 1
221
  Peak Allocated bytes 1.0 MB
222
  [ALLOC_GFX_MAIN]
223
- Peak usage frame count: [32.0 KB-64.0 KB]: 4951 frames, [64.0 KB-128.0 KB]: 512 frames
224
  Requested Block Size 16.0 MB
225
  Peak Block count 1
226
- Peak Allocated memory 66.4 KB
227
  Peak Large allocation bytes 0 B
228
  [ALLOC_GFX_THREAD]
229
- Peak usage frame count: [32.0 KB-64.0 KB]: 5463 frames
230
  Requested Block Size 16.0 MB
231
  Peak Block count 1
232
  Peak Allocated memory 39.6 KB
@@ -238,13 +238,13 @@ Memory Statistics:
238
  Used Block count 1
239
  Peak Allocated bytes 1.0 MB
240
  [ALLOC_CACHEOBJECTS_MAIN]
241
- Peak usage frame count: [0.5 MB-1.0 MB]: 5463 frames
242
  Requested Block Size 4.0 MB
243
  Peak Block count 1
244
- Peak Allocated memory 0.6 MB
245
  Peak Large allocation bytes 0 B
246
  [ALLOC_CACHEOBJECTS_THREAD]
247
- Peak usage frame count: [0.5 MB-1.0 MB]: 5462 frames, [2.0 MB-4.0 MB]: 1 frames
248
  Requested Block Size 4.0 MB
249
  Peak Block count 1
250
  Peak Allocated memory 2.2 MB
@@ -256,13 +256,13 @@ Memory Statistics:
256
  Used Block count 1
257
  Peak Allocated bytes 1.0 MB
258
  [ALLOC_TYPETREE_MAIN]
259
- Peak usage frame count: [0-1.0 KB]: 5463 frames
260
  Requested Block Size 2.0 MB
261
  Peak Block count 1
262
  Peak Allocated memory 1.0 KB
263
  Peak Large allocation bytes 0 B
264
  [ALLOC_TYPETREE_THREAD]
265
- Peak usage frame count: [1.0 KB-2.0 KB]: 5463 frames
266
  Requested Block Size 2.0 MB
267
  Peak Block count 1
268
  Peak Allocated memory 1.7 KB
 
22
  WARNING: Shader Unsupported: 'Standard' - All subshaders removed
23
  WARNING: Shader Did you use #pragma only_renderers and omit this platform?
24
  WARNING: Shader If subshaders removal was intentional, you may have forgotten turning Fallback off?
25
+ UnloadTime: 0.474486 ms
26
  ERROR: Shader UI/Default shader is not supported on this GPU (none of subshaders/fallbacks are suitable)
27
  requesting resize 84 x 84
28
  Setting up 4 worker threads for Enlighten.
 
30
  [ALLOC_TEMP_TLS] TLS Allocator
31
  StackAllocators :
32
  [ALLOC_TEMP_MAIN]
33
+ Peak usage frame count: [2.0 MB-4.0 MB]: 1 frames
34
  Initial Block Size 4.0 MB
35
  Current Block Size 4.0 MB
36
  Peak Allocated Bytes 2.0 MB
 
53
  [ALLOC_TEMP_Job.Worker 6]
54
  Initial Block Size 256.0 KB
55
  Current Block Size 256.0 KB
56
+ Peak Allocated Bytes 2.8 KB
57
  Overflow Count 0
58
  [ALLOC_TEMP_Job.Worker 0]
59
  Initial Block Size 256.0 KB
60
  Current Block Size 256.0 KB
61
+ Peak Allocated Bytes 0 B
62
  Overflow Count 0
63
  [ALLOC_TEMP_Background Job.Worker 10]
64
  Initial Block Size 32.0 KB
 
73
  [ALLOC_TEMP_Job.Worker 5]
74
  Initial Block Size 256.0 KB
75
  Current Block Size 256.0 KB
76
+ Peak Allocated Bytes 0 B
77
  Overflow Count 0
78
  [ALLOC_TEMP_Background Job.Worker 14]
79
  Initial Block Size 32.0 KB
 
88
  [ALLOC_TEMP_Job.Worker 4]
89
  Initial Block Size 256.0 KB
90
  Current Block Size 256.0 KB
91
+ Peak Allocated Bytes 2.8 KB
92
  Overflow Count 0
93
  [ALLOC_TEMP_Job.Worker 3]
94
  Initial Block Size 256.0 KB
95
  Current Block Size 256.0 KB
96
+ Peak Allocated Bytes 0 B
97
  Overflow Count 0
98
  [ALLOC_TEMP_Background Job.Worker 12]
99
  Initial Block Size 32.0 KB
 
143
  [ALLOC_TEMP_Job.Worker 1]
144
  Initial Block Size 256.0 KB
145
  Current Block Size 256.0 KB
146
+ Peak Allocated Bytes 2.8 KB
147
  Overflow Count 0
148
  [ALLOC_TEMP_Job.Worker 2]
149
  Initial Block Size 256.0 KB
150
  Current Block Size 256.0 KB
151
+ Peak Allocated Bytes 2.8 KB
152
  Overflow Count 0
153
  [ALLOC_TEMP_Background Job.Worker 3]
154
  Initial Block Size 32.0 KB
 
176
  Peak Allocated Bytes 0 B
177
  Overflow Count 0
178
  [ALLOC_DEFAULT] Dual Thread Allocator
179
+ Peak main deferred allocation count 2
180
  [ALLOC_BUCKET]
181
  Large Block size 4.0 MB
182
  Used Block count 1
183
  Peak Allocated bytes 1.0 MB
184
  [ALLOC_DEFAULT_MAIN]
185
+ Peak usage frame count: [4.0 MB-8.0 MB]: 1 frames
186
  Requested Block Size 16.0 MB
187
  Peak Block count 1
188
+ Peak Allocated memory 4.9 MB
189
  Peak Large allocation bytes 0 B
190
  [ALLOC_DEFAULT_THREAD]
191
+ Peak usage frame count: [16.0 MB-32.0 MB]: 1 frames
192
  Requested Block Size 16.0 MB
193
  Peak Block count 1
194
+ Peak Allocated memory 17.4 MB
195
  Peak Large allocation bytes 16.0 MB
196
  [ALLOC_TEMP_JOB_1_FRAME]
197
  Initial Block Size 2.0 MB
 
205
  Overflow Count (full) 0
206
  [ALLOC_TEMP_JOB_4_FRAMES (JobTemp)]
207
  Initial Block Size 2.0 MB
208
+ Used Block Count 1
209
  Overflow Count (too large) 0
210
  Overflow Count (full) 0
211
  [ALLOC_TEMP_JOB_ASYNC (Background)]
 
220
  Used Block count 1
221
  Peak Allocated bytes 1.0 MB
222
  [ALLOC_GFX_MAIN]
223
+ Peak usage frame count: [64.0 KB-128.0 KB]: 1 frames
224
  Requested Block Size 16.0 MB
225
  Peak Block count 1
226
+ Peak Allocated memory 65.6 KB
227
  Peak Large allocation bytes 0 B
228
  [ALLOC_GFX_THREAD]
229
+ Peak usage frame count: [32.0 KB-64.0 KB]: 1 frames
230
  Requested Block Size 16.0 MB
231
  Peak Block count 1
232
  Peak Allocated memory 39.6 KB
 
238
  Used Block count 1
239
  Peak Allocated bytes 1.0 MB
240
  [ALLOC_CACHEOBJECTS_MAIN]
241
+ Peak usage frame count: [0.5 MB-1.0 MB]: 1 frames
242
  Requested Block Size 4.0 MB
243
  Peak Block count 1
244
+ Peak Allocated memory 0.5 MB
245
  Peak Large allocation bytes 0 B
246
  [ALLOC_CACHEOBJECTS_THREAD]
247
+ Peak usage frame count: [2.0 MB-4.0 MB]: 1 frames
248
  Requested Block Size 4.0 MB
249
  Peak Block count 1
250
  Peak Allocated memory 2.2 MB
 
256
  Used Block count 1
257
  Peak Allocated bytes 1.0 MB
258
  [ALLOC_TYPETREE_MAIN]
259
+ Peak usage frame count: [0-1.0 KB]: 1 frames
260
  Requested Block Size 2.0 MB
261
  Peak Block count 1
262
  Peak Allocated memory 1.0 KB
263
  Peak Large allocation bytes 0 B
264
  [ALLOC_TYPETREE_THREAD]
265
+ Peak usage frame count: [1.0 KB-2.0 KB]: 1 frames
266
  Requested Block Size 2.0 MB
267
  Peak Block count 1
268
  Peak Allocated memory 1.7 KB
run_logs/timers.json CHANGED
@@ -1,317 +1,40 @@
1
  {
2
  "name": "root",
3
- "gauges": {
4
- "SnowballTarget.Policy.Entropy.mean": {
5
- "value": 0.9319132566452026,
6
- "min": 0.9319132566452026,
7
- "max": 2.870424747467041,
8
- "count": 20
9
- },
10
- "SnowballTarget.Policy.Entropy.sum": {
11
- "value": 8938.912109375,
12
- "min": 8938.912109375,
13
- "max": 29522.318359375,
14
- "count": 20
15
- },
16
- "SnowballTarget.Step.mean": {
17
- "value": 199984.0,
18
- "min": 9952.0,
19
- "max": 199984.0,
20
- "count": 20
21
- },
22
- "SnowballTarget.Step.sum": {
23
- "value": 199984.0,
24
- "min": 9952.0,
25
- "max": 199984.0,
26
- "count": 20
27
- },
28
- "SnowballTarget.Policy.ExtrinsicValueEstimate.mean": {
29
- "value": 12.874151229858398,
30
- "min": 0.39834508299827576,
31
- "max": 12.874151229858398,
32
- "count": 20
33
- },
34
- "SnowballTarget.Policy.ExtrinsicValueEstimate.sum": {
35
- "value": 2510.45947265625,
36
- "min": 77.27894592285156,
37
- "max": 2602.755126953125,
38
- "count": 20
39
- },
40
- "SnowballTarget.Environment.EpisodeLength.mean": {
41
- "value": 199.0,
42
- "min": 199.0,
43
- "max": 199.0,
44
- "count": 20
45
- },
46
- "SnowballTarget.Environment.EpisodeLength.sum": {
47
- "value": 10945.0,
48
- "min": 8756.0,
49
- "max": 10945.0,
50
- "count": 20
51
- },
52
- "SnowballTarget.Losses.PolicyLoss.mean": {
53
- "value": 0.06857709564963657,
54
- "min": 0.057933525650250714,
55
- "max": 0.07610024299595833,
56
- "count": 20
57
- },
58
- "SnowballTarget.Losses.PolicyLoss.sum": {
59
- "value": 0.2743083825985463,
60
- "min": 0.23173410260100286,
61
- "max": 0.38050121497979167,
62
- "count": 20
63
- },
64
- "SnowballTarget.Losses.ValueLoss.mean": {
65
- "value": 0.17977972606233525,
66
- "min": 0.10100476959761343,
67
- "max": 0.28556475897922234,
68
- "count": 20
69
- },
70
- "SnowballTarget.Losses.ValueLoss.sum": {
71
- "value": 0.719118904249341,
72
- "min": 0.4040190783904537,
73
- "max": 1.408571179006614,
74
- "count": 20
75
- },
76
- "SnowballTarget.Policy.LearningRate.mean": {
77
- "value": 8.082097306000005e-06,
78
- "min": 8.082097306000005e-06,
79
- "max": 0.000291882002706,
80
- "count": 20
81
- },
82
- "SnowballTarget.Policy.LearningRate.sum": {
83
- "value": 3.232838922400002e-05,
84
- "min": 3.232838922400002e-05,
85
- "max": 0.00138516003828,
86
- "count": 20
87
- },
88
- "SnowballTarget.Policy.Epsilon.mean": {
89
- "value": 0.10269400000000001,
90
- "min": 0.10269400000000001,
91
- "max": 0.19729400000000002,
92
- "count": 20
93
- },
94
- "SnowballTarget.Policy.Epsilon.sum": {
95
- "value": 0.41077600000000003,
96
- "min": 0.41077600000000003,
97
- "max": 0.96172,
98
- "count": 20
99
- },
100
- "SnowballTarget.Policy.Beta.mean": {
101
- "value": 0.0001444306000000001,
102
- "min": 0.0001444306000000001,
103
- "max": 0.0048649706,
104
- "count": 20
105
- },
106
- "SnowballTarget.Policy.Beta.sum": {
107
- "value": 0.0005777224000000004,
108
- "min": 0.0005777224000000004,
109
- "max": 0.023089828,
110
- "count": 20
111
- },
112
- "SnowballTarget.Environment.CumulativeReward.mean": {
113
- "value": 25.363636363636363,
114
- "min": 3.1136363636363638,
115
- "max": 25.418181818181818,
116
- "count": 20
117
- },
118
- "SnowballTarget.Environment.CumulativeReward.sum": {
119
- "value": 1116.0,
120
- "min": 137.0,
121
- "max": 1398.0,
122
- "count": 20
123
- },
124
- "SnowballTarget.Policy.ExtrinsicReward.mean": {
125
- "value": 25.363636363636363,
126
- "min": 3.1136363636363638,
127
- "max": 25.418181818181818,
128
- "count": 20
129
- },
130
- "SnowballTarget.Policy.ExtrinsicReward.sum": {
131
- "value": 1116.0,
132
- "min": 137.0,
133
- "max": 1398.0,
134
- "count": 20
135
- },
136
- "SnowballTarget.IsTraining.mean": {
137
- "value": 1.0,
138
- "min": 1.0,
139
- "max": 1.0,
140
- "count": 20
141
- },
142
- "SnowballTarget.IsTraining.sum": {
143
- "value": 1.0,
144
- "min": 1.0,
145
- "max": 1.0,
146
- "count": 20
147
- }
148
- },
149
  "metadata": {
150
  "timer_format_version": "0.1.0",
151
- "start_time_seconds": "1721472628",
152
  "python_version": "3.10.12 (main, Jul 5 2023, 18:54:27) [GCC 11.2.0]",
153
- "command_line_arguments": "/home/montana/miniconda3/envs/huggy/bin/mlagents-learn ./config/ppo/SnowballTarget.yaml --env=./training-envs-executables/linux/SnowballTarget/SnowballTarget.x86_64 --run-id=SnowballTarget1 --no-graphics --force",
154
  "mlagents_version": "1.0.0",
155
  "mlagents_envs_version": "1.0.0",
156
  "communication_protocol_version": "1.5.0",
157
  "pytorch_version": "2.3.0+cu121",
158
  "numpy_version": "1.21.2",
159
- "end_time_seconds": "1721473081"
160
  },
161
- "total": 453.7232466909918,
162
  "count": 1,
163
- "self": 0.2725397319882177,
164
  "children": {
165
  "run_training.setup": {
166
- "total": 0.013106368016451597,
167
  "count": 1,
168
- "self": 0.013106368016451597
169
  },
170
  "TrainerController.start_learning": {
171
- "total": 453.43760059098713,
172
  "count": 1,
173
- "self": 0.4767339399259072,
174
  "children": {
175
  "TrainerController._reset_env": {
176
- "total": 2.856478811998386,
177
  "count": 1,
178
- "self": 2.856478811998386
179
- },
180
- "TrainerController.advance": {
181
- "total": 450.0170217230916,
182
- "count": 18207,
183
- "self": 0.2265568540606182,
184
- "children": {
185
- "env_step": {
186
- "total": 449.790464869031,
187
- "count": 18207,
188
- "self": 262.4828545647615,
189
- "children": {
190
- "SubprocessEnvManager._take_step": {
191
- "total": 187.07232962345006,
192
- "count": 18207,
193
- "self": 1.2606316194287501,
194
- "children": {
195
- "TorchPolicy.evaluate": {
196
- "total": 185.8116980040213,
197
- "count": 18207,
198
- "self": 185.8116980040213
199
- }
200
- }
201
- },
202
- "workers": {
203
- "total": 0.23528068081941456,
204
- "count": 18207,
205
- "self": 0.0,
206
- "children": {
207
- "worker_root": {
208
- "total": 452.63578140575555,
209
- "count": 18207,
210
- "is_parallel": true,
211
- "self": 268.31014963949565,
212
- "children": {
213
- "run_training.setup": {
214
- "total": 0.0,
215
- "count": 0,
216
- "is_parallel": true,
217
- "self": 0.0,
218
- "children": {
219
- "steps_from_proto": {
220
- "total": 0.0011406879930291325,
221
- "count": 1,
222
- "is_parallel": true,
223
- "self": 0.0003602970391511917,
224
- "children": {
225
- "_process_rank_one_or_two_observation": {
226
- "total": 0.0007803909538779408,
227
- "count": 10,
228
- "is_parallel": true,
229
- "self": 0.0007803909538779408
230
- }
231
- }
232
- },
233
- "UnityEnvironment.step": {
234
- "total": 0.035801211022771895,
235
- "count": 1,
236
- "is_parallel": true,
237
- "self": 0.00043541903141885996,
238
- "children": {
239
- "UnityEnvironment._generate_step_input": {
240
- "total": 0.0012463539896998554,
241
- "count": 1,
242
- "is_parallel": true,
243
- "self": 0.0012463539896998554
244
- },
245
- "communicator.exchange": {
246
- "total": 0.032584517990471795,
247
- "count": 1,
248
- "is_parallel": true,
249
- "self": 0.032584517990471795
250
- },
251
- "steps_from_proto": {
252
- "total": 0.0015349200111813843,
253
- "count": 1,
254
- "is_parallel": true,
255
- "self": 0.00049385498277843,
256
- "children": {
257
- "_process_rank_one_or_two_observation": {
258
- "total": 0.0010410650284029543,
259
- "count": 10,
260
- "is_parallel": true,
261
- "self": 0.0010410650284029543
262
- }
263
- }
264
- }
265
- }
266
- }
267
- }
268
- },
269
- "UnityEnvironment.step": {
270
- "total": 184.3256317662599,
271
- "count": 18206,
272
- "is_parallel": true,
273
- "self": 4.547100880125072,
274
- "children": {
275
- "UnityEnvironment._generate_step_input": {
276
- "total": 2.7601509311934933,
277
- "count": 18206,
278
- "is_parallel": true,
279
- "self": 2.7601509311934933
280
- },
281
- "communicator.exchange": {
282
- "total": 162.79889808109147,
283
- "count": 18206,
284
- "is_parallel": true,
285
- "self": 162.79889808109147
286
- },
287
- "steps_from_proto": {
288
- "total": 14.219481873849872,
289
- "count": 18206,
290
- "is_parallel": true,
291
- "self": 3.3427517008967698,
292
- "children": {
293
- "_process_rank_one_or_two_observation": {
294
- "total": 10.876730172953103,
295
- "count": 182060,
296
- "is_parallel": true,
297
- "self": 10.876730172953103
298
- }
299
- }
300
- }
301
- }
302
- }
303
- }
304
- }
305
- }
306
- }
307
- }
308
- }
309
- }
310
  },
311
  "trainer_threads": {
312
- "total": 0.0001153459888882935,
313
  "count": 1,
314
- "self": 0.0001153459888882935,
315
  "children": {
316
  "thread_root": {
317
  "total": 0.0,
@@ -320,38 +43,16 @@
320
  "self": 0.0,
321
  "children": {
322
  "trainer_advance": {
323
- "total": 448.1581348279433,
324
- "count": 372741,
325
  "is_parallel": true,
326
- "self": 5.601814194989856,
327
  "children": {
328
  "process_trajectory": {
329
- "total": 245.7939493758895,
330
- "count": 372741,
331
- "is_parallel": true,
332
- "self": 245.11395980493398,
333
- "children": {
334
- "RLTrainer._checkpoint": {
335
- "total": 0.679989570955513,
336
- "count": 4,
337
- "is_parallel": true,
338
- "self": 0.679989570955513
339
- }
340
- }
341
- },
342
- "_update_policy": {
343
- "total": 196.76237125706393,
344
- "count": 90,
345
  "is_parallel": true,
346
- "self": 30.571620423404966,
347
- "children": {
348
- "TorchPPOOptimizer.update": {
349
- "total": 166.19075083365897,
350
- "count": 4587,
351
- "is_parallel": true,
352
- "self": 166.19075083365897
353
- }
354
- }
355
  }
356
  }
357
  }
@@ -360,14 +61,14 @@
360
  }
361
  },
362
  "TrainerController._save_models": {
363
- "total": 0.08725076998234726,
364
  "count": 1,
365
- "self": 0.0015113929694052786,
366
  "children": {
367
  "RLTrainer._checkpoint": {
368
- "total": 0.08573937701294199,
369
  "count": 1,
370
- "self": 0.08573937701294199
371
  }
372
  }
373
  }
 
1
  {
2
  "name": "root",
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
3
  "metadata": {
4
  "timer_format_version": "0.1.0",
5
+ "start_time_seconds": "1721473267",
6
  "python_version": "3.10.12 (main, Jul 5 2023, 18:54:27) [GCC 11.2.0]",
7
+ "command_line_arguments": "/home/montana/miniconda3/envs/huggy/bin/mlagents-learn ./config/ppo/SnowballTarget.yaml --env=./training-envs-executables/linux/SnowballTarget/SnowballTarget.x86_64 --run-id=SnowballTarget1 --no-graphics --resume",
8
  "mlagents_version": "1.0.0",
9
  "mlagents_envs_version": "1.0.0",
10
  "communication_protocol_version": "1.5.0",
11
  "pytorch_version": "2.3.0+cu121",
12
  "numpy_version": "1.21.2",
13
+ "end_time_seconds": "1721473271"
14
  },
15
+ "total": 4.123133318993496,
16
  "count": 1,
17
+ "self": 0.27164047601399943,
18
  "children": {
19
  "run_training.setup": {
20
+ "total": 0.016180282982531935,
21
  "count": 1,
22
+ "self": 0.016180282982531935
23
  },
24
  "TrainerController.start_learning": {
25
+ "total": 3.8353125599969644,
26
  "count": 1,
27
+ "self": 0.0002827090211212635,
28
  "children": {
29
  "TrainerController._reset_env": {
30
+ "total": 2.398862707981607,
31
  "count": 1,
32
+ "self": 2.398862707981607
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
33
  },
34
  "trainer_threads": {
35
+ "total": 1.2222997611388564e-05,
36
  "count": 1,
37
+ "self": 1.2222997611388564e-05,
38
  "children": {
39
  "thread_root": {
40
  "total": 0.0,
 
43
  "self": 0.0,
44
  "children": {
45
  "trainer_advance": {
46
+ "total": 0.0002568429918028414,
47
+ "count": 1,
48
  "is_parallel": true,
49
+ "self": 1.4424003893509507e-05,
50
  "children": {
51
  "process_trajectory": {
52
+ "total": 0.00024241898790933192,
53
+ "count": 1,
 
 
 
 
 
 
 
 
 
 
 
 
 
 
54
  "is_parallel": true,
55
+ "self": 0.00024241898790933192
 
 
 
 
 
 
 
 
56
  }
57
  }
58
  }
 
61
  }
62
  },
63
  "TrainerController._save_models": {
64
+ "total": 1.4361549199966248,
65
  "count": 1,
66
+ "self": 0.0006549700046889484,
67
  "children": {
68
  "RLTrainer._checkpoint": {
69
+ "total": 1.4354999499919359,
70
  "count": 1,
71
+ "self": 1.4354999499919359
72
  }
73
  }
74
  }
run_logs/training_status.json CHANGED
@@ -45,13 +45,22 @@
45
  "auxillary_file_paths": [
46
  "results/SnowballTarget1/SnowballTarget/SnowballTarget-200112.pt"
47
  ]
 
 
 
 
 
 
 
 
 
48
  }
49
  ],
50
  "final_checkpoint": {
51
  "steps": 200112,
52
  "file_path": "results/SnowballTarget1/SnowballTarget.onnx",
53
- "reward": 25.454545454545453,
54
- "creation_time": 1721473081.5591972,
55
  "auxillary_file_paths": [
56
  "results/SnowballTarget1/SnowballTarget/SnowballTarget-200112.pt"
57
  ]
 
45
  "auxillary_file_paths": [
46
  "results/SnowballTarget1/SnowballTarget/SnowballTarget-200112.pt"
47
  ]
48
+ },
49
+ {
50
+ "steps": 200112,
51
+ "file_path": "results/SnowballTarget1/SnowballTarget/SnowballTarget-200112.onnx",
52
+ "reward": null,
53
+ "creation_time": 1721473271.0107923,
54
+ "auxillary_file_paths": [
55
+ "results/SnowballTarget1/SnowballTarget/SnowballTarget-200112.pt"
56
+ ]
57
  }
58
  ],
59
  "final_checkpoint": {
60
  "steps": 200112,
61
  "file_path": "results/SnowballTarget1/SnowballTarget.onnx",
62
+ "reward": null,
63
+ "creation_time": 1721473271.0107923,
64
  "auxillary_file_paths": [
65
  "results/SnowballTarget1/SnowballTarget/SnowballTarget-200112.pt"
66
  ]