Seventh Push

Browse files

Files changed (11) hide show

SoccerTwos.onnx +1 -1
SoccerTwos/SoccerTwos-32499941.onnx +3 -0
SoccerTwos/SoccerTwos-32499941.pt +3 -0
SoccerTwos/checkpoint.pt +1 -1
SoccerTwos/events.out.tfevents.1725639265.Bretts-MacBook-Pro.local.55651.0 +2 -2
SoccerTwos/events.out.tfevents.1725741373.Bretts-MacBook-Pro.local.57198.0 +3 -0
config.json +1 -1
configuration.yaml +1 -1
run_logs/Player-0.log +2 -2
run_logs/timers.json +382 -61
run_logs/training_status.json +8 -8

SoccerTwos.onnx CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:8310f421d4a705039d63cbe9bc3d579c90750570a9296b0f42eb6b2a7f44b6b7
 size 2351062

 version https://git-lfs.github.com/spec/v1
+oid sha256:ad5e42ffb14033363e95c48e20ea11212cf53e6b917d8f5d64f9916e59b9f24a
 size 2351062

SoccerTwos/SoccerTwos-32499941.onnx ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:f95c440705145507bffabafa0a86080d9a1227e68029c5f3bfac64618a1e8dd9
+size 2351062

SoccerTwos/SoccerTwos-32499941.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:142f7de35a6a8c907c49c79d725f4a524117540d8f0de4caff367a5374f7a4da
+size 36303154

SoccerTwos/checkpoint.pt CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:94a3b101cf7c8db717bd805a14c3a2aa885485c424e1ac8714fcd2bd87a93781
 size 36301318

 version https://git-lfs.github.com/spec/v1
+oid sha256:bb99e03d8d1496bfffcf9fa933bef55f12e098b38c01731441fab8126e9b2ebd
 size 36301318

SoccerTwos/events.out.tfevents.1725639265.Bretts-MacBook-Pro.local.55651.0 CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:5f952e5b983a9fe03dbadfbae99f9e339ae4d629adf958b2208d76516ddad8ec
-size 740049

 version https://git-lfs.github.com/spec/v1
+oid sha256:deb15b8fc9deffc7b288f005a81b904742b64f7de964afc36987ac9f5138eff2
+size 2417737

SoccerTwos/events.out.tfevents.1725741373.Bretts-MacBook-Pro.local.57198.0 ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:0dffce8bdecae174dc92a44c9618b9282f32401478c297757966b567386f0265
+size 1732159

config.json CHANGED Viewed

@@ -1 +1 @@

- {"default_settings": null, "behaviors": {"SoccerTwos": {"trainer_type": "poca", "hyperparameters": {"batch_size": 40960, "buffer_size": 163840, "learning_rate": 0.0003, "beta": 0.01, "epsilon": 0.2, "lambd": 0.9, "num_epoch": 3, "learning_rate_schedule": "constant", "beta_schedule": "linear", "epsilon_schedule": "constant"}, "checkpoint_interval": 500000, "network_settings": {"normalize": true, "hidden_units": 512, "num_layers": 2, "vis_encode_type": "simple", "memory": {"sequence_length": 16, "memory_size": 128}, "goal_conditioning_type": "hyper", "deterministic": false}, "reward_signals": {"extrinsic": {"gamma": 0.995, "strength": 1.0, "network_settings": {"normalize": false, "hidden_units": 128, "num_layers": 2, "vis_encode_type": "simple", "memory": null, "goal_conditioning_type": "hyper", "deterministic": false}}, "curiosity": {"gamma": 0.9, "strength": 1e-06, "network_settings": {"normalize": false, "hidden_units": 512, "num_layers": 2, "vis_encode_type": "simple", "memory": null, "goal_conditioning_type": "hyper", "deterministic": false}, "learning_rate": 0.0003, "encoding_size": 512}, "rnd": {"gamma": 0.9, "strength": 1e-06, "network_settings": {"normalize": false, "hidden_units": 128, "num_layers": 2, "vis_encode_type": "simple", "memory": null, "goal_conditioning_type": "hyper", "deterministic": false}, "learning_rate": 0.0001, "encoding_size": null}}, "init_path": null, "keep_checkpoints": 1, "even_checkpoints": false, "max_steps": 80000000, "time_horizon": 1000, "summary_freq": 10000, "threaded": false, "self_play": {"save_steps": 100000, "team_change": 400000, "swap_steps": 2000, "window": 30, "play_against_latest_model_ratio": 0.5, "initial_elo": 1.0}, "behavioral_cloning": null}}, "env_settings": {"env_path": "./SoccerTwos/SoccerTwos.app", "env_args": null, "base_port": 5005, "num_envs": 1, "num_areas": 1, "timeout_wait": 60, "seed": -1, "max_lifetime_restarts": 10, "restarts_rate_limit_n": 1, "restarts_rate_limit_period_s": 60}, "engine_settings": {"width": 84, "height": 84, "quality_level": 5, "time_scale": 20, "target_frame_rate": -1, "capture_frame_rate": 60, "no_graphics": true, "no_graphics_monitor": false}, "environment_parameters": null, "checkpoint_settings": {"run_id": "sept-run-01", "initialize_from": null, "load_model": false, "resume": true, "force": false, "train_model": false, "inference": false, "results_dir": "results"}, "torch_settings": {"device": null}, "debug": false}

+ {"default_settings": null, "behaviors": {"SoccerTwos": {"trainer_type": "poca", "hyperparameters": {"batch_size": 40960, "buffer_size": 163840, "learning_rate": 0.0003, "beta": 0.01, "epsilon": 0.2, "lambd": 0.9, "num_epoch": 3, "learning_rate_schedule": "constant", "beta_schedule": "linear", "epsilon_schedule": "constant"}, "checkpoint_interval": 500000, "network_settings": {"normalize": true, "hidden_units": 512, "num_layers": 2, "vis_encode_type": "simple", "memory": {"sequence_length": 16, "memory_size": 128}, "goal_conditioning_type": "hyper", "deterministic": false}, "reward_signals": {"extrinsic": {"gamma": 0.995, "strength": 1.0, "network_settings": {"normalize": false, "hidden_units": 128, "num_layers": 2, "vis_encode_type": "simple", "memory": null, "goal_conditioning_type": "hyper", "deterministic": false}}, "curiosity": {"gamma": 0.9, "strength": 1e-06, "network_settings": {"normalize": false, "hidden_units": 512, "num_layers": 2, "vis_encode_type": "simple", "memory": null, "goal_conditioning_type": "hyper", "deterministic": false}, "learning_rate": 0.0003, "encoding_size": 512}, "rnd": {"gamma": 0.9, "strength": 1e-06, "network_settings": {"normalize": false, "hidden_units": 128, "num_layers": 2, "vis_encode_type": "simple", "memory": null, "goal_conditioning_type": "hyper", "deterministic": false}, "learning_rate": 0.0001, "encoding_size": null}}, "init_path": null, "keep_checkpoints": 1, "even_checkpoints": false, "max_steps": 80000000, "time_horizon": 1000, "summary_freq": 10000, "threaded": false, "self_play": {"save_steps": 100000, "team_change": 400000, "swap_steps": 2000, "window": 30, "play_against_latest_model_ratio": 0.9, "initial_elo": 1.0}, "behavioral_cloning": null}}, "env_settings": {"env_path": "./SoccerTwos/SoccerTwos.app", "env_args": null, "base_port": 5005, "num_envs": 1, "num_areas": 1, "timeout_wait": 60, "seed": -1, "max_lifetime_restarts": 10, "restarts_rate_limit_n": 1, "restarts_rate_limit_period_s": 60}, "engine_settings": {"width": 84, "height": 84, "quality_level": 5, "time_scale": 20, "target_frame_rate": -1, "capture_frame_rate": 60, "no_graphics": true, "no_graphics_monitor": false}, "environment_parameters": null, "checkpoint_settings": {"run_id": "sept-run-01", "initialize_from": null, "load_model": false, "resume": true, "force": false, "train_model": false, "inference": false, "results_dir": "results"}, "torch_settings": {"device": null}, "debug": false}

configuration.yaml CHANGED Viewed

@@ -74,7 +74,7 @@ behaviors:
       team_change: 400000
       swap_steps: 2000
       window: 30
-      play_against_latest_model_ratio: 0.5
       initial_elo: 1.0
     behavioral_cloning: null
 env_settings:

       team_change: 400000
       swap_steps: 2000
       window: 30
+      play_against_latest_model_ratio: 0.9
       initial_elo: 1.0
     behavioral_cloning: null
 env_settings:

run_logs/Player-0.log CHANGED Viewed

@@ -10,7 +10,7 @@ NullGfxDevice:
     Renderer: Null Device
     Vendor:   Unity Technologies
 Begin MonoManager ReloadAssembly
-- Completed reload, in  0.036 seconds
 ERROR: Shader Sprites/Default shader is not supported on this GPU (none of subshaders/fallbacks are suitable)
 ERROR: Shader Sprites/Mask shader is not supported on this GPU (none of subshaders/fallbacks are suitable)
 ERROR: Shader Legacy Shaders/VertexLit shader is not supported on this GPU (none of subshaders/fallbacks are suitable)
@@ -35,6 +35,6 @@ ERROR: Shader Standard shader is not supported on this GPU (none of subshaders/f
 WARNING: Shader Unsupported: 'Standard' - All subshaders removed
 WARNING: Shader Did you use #pragma only_renderers and omit this platform?
 WARNING: Shader If subshaders removal was intentional, you may have forgotten turning Fallback off?
-UnloadTime: 0.223000 ms
 Registered Communicator in Agent.
 ERROR: Shader UI/Default shader is not supported on this GPU (none of subshaders/fallbacks are suitable)

     Renderer: Null Device
     Vendor:   Unity Technologies
 Begin MonoManager ReloadAssembly
+- Completed reload, in  0.048 seconds
 ERROR: Shader Sprites/Default shader is not supported on this GPU (none of subshaders/fallbacks are suitable)
 ERROR: Shader Sprites/Mask shader is not supported on this GPU (none of subshaders/fallbacks are suitable)
 ERROR: Shader Legacy Shaders/VertexLit shader is not supported on this GPU (none of subshaders/fallbacks are suitable)
 WARNING: Shader Unsupported: 'Standard' - All subshaders removed
 WARNING: Shader Did you use #pragma only_renderers and omit this platform?
 WARNING: Shader If subshaders removal was intentional, you may have forgotten turning Fallback off?
+UnloadTime: 0.230292 ms
 Registered Communicator in Agent.
 ERROR: Shader UI/Default shader is not supported on this GPU (none of subshaders/fallbacks are suitable)

run_logs/timers.json CHANGED Viewed

@@ -1,8 +1,310 @@
 {
     "name": "root",
     "metadata": {
         "timer_format_version": "0.1.0",
-        "start_time_seconds": "1725639228",
         "python_version": "3.10.12 (main, Aug 23 2024, 16:29:11) [Clang 15.0.0 (clang-1500.3.9.4)]",
         "command_line_arguments": "/Users/brettgohre/Desktop/huggingface/ml-agents/games/bin/mlagents-learn ./config/poca/sept/three.yaml --env=./SoccerTwos/SoccerTwos.app --run-id=sept-run-01 --resume --no-graphics",
         "mlagents_version": "1.1.0.dev0",
@@ -10,103 +312,103 @@
         "communication_protocol_version": "1.5.0",
         "pytorch_version": "2.4.0",
         "numpy_version": "1.23.5",
-        "end_time_seconds": "1725639244"
     },
-    "total": 15.882768709008815,
     "count": 1,
-    "self": 0.05988275000709109,
     "children": {
         "run_training.setup": {
-            "total": 0.019645958993351087,
             "count": 1,
-            "self": 0.019645958993351087
         },
         "TrainerController.start_learning": {
-            "total": 15.803240000008373,
             "count": 1,
-            "self": 0.0026913749461527914,
             "children": {
                 "TrainerController._reset_env": {
-                    "total": 3.5253060839895625,
-                    "count": 2,
-                    "self": 3.5253060839895625
                 },
                 "TrainerController.advance": {
-                    "total": 12.153929750085808,
-                    "count": 287,
-                    "self": 0.002460731368046254,
                     "children": {
                         "env_step": {
-                            "total": 11.317403695225948,
-                            "count": 287,
-                            "self": 10.868867997516645,
                             "children": {
                                 "SubprocessEnvManager._take_step": {
-                                    "total": 0.4469113309751265,
-                                    "count": 287,
-                                    "self": 0.0130690521618817,
                                     "children": {
                                         "TorchPolicy.evaluate": {
-                                            "total": 0.4338422788132448,
-                                            "count": 506,
-                                            "self": 0.4338422788132448
                                         }
                                     }
                                 },
                                 "workers": {
-                                    "total": 0.0016243667341768742,
-                                    "count": 286,
                                     "self": 0.0,
                                     "children": {
                                         "worker_root": {
-                                            "total": 12.562684869160876,
-                                            "count": 286,
                                             "is_parallel": true,
-                                            "self": 2.0004065242537763,
                                             "children": {
                                                 "steps_from_proto": {
-                                                    "total": 0.0027742499951273203,
-                                                    "count": 4,
                                                     "is_parallel": true,
-                                                    "self": 0.00039266597013920546,
                                                     "children": {
                                                         "_process_rank_one_or_two_observation": {
-                                                            "total": 0.002381584024988115,
-                                                            "count": 16,
                                                             "is_parallel": true,
-                                                            "self": 0.002381584024988115
                                                         }
                                                     }
                                                 },
                                                 "UnityEnvironment.step": {
-                                                    "total": 10.559504094911972,
-                                                    "count": 286,
                                                     "is_parallel": true,
-                                                    "self": 0.027175818424439058,
                                                     "children": {
                                                         "UnityEnvironment._generate_step_input": {
-                                                            "total": 0.18330224978853948,
-                                                            "count": 286,
                                                             "is_parallel": true,
-                                                            "self": 0.18330224978853948
                                                         },
                                                         "communicator.exchange": {
-                                                            "total": 10.00545607091044,
-                                                            "count": 286,
                                                             "is_parallel": true,
-                                                            "self": 10.00545607091044
                                                         },
                                                         "steps_from_proto": {
-                                                            "total": 0.34356995578855276,
-                                                            "count": 572,
                                                             "is_parallel": true,
-                                                            "self": 0.04205756550072692,
                                                             "children": {
                                                                 "_process_rank_one_or_two_observation": {
-                                                                    "total": 0.30151239028782584,
-                                                                    "count": 2288,
                                                                     "is_parallel": true,
-                                                                    "self": 0.30151239028782584
                                                                 }
                                                             }
                                                         }
@@ -119,33 +421,52 @@
                             }
                         },
                         "trainer_advance": {
-                            "total": 0.8340653234918136,
-                            "count": 286,
-                            "self": 0.01612685641157441,
                             "children": {
                                 "process_trajectory": {
-                                    "total": 0.8179384670802392,
-                                    "count": 286,
-                                    "self": 0.8179384670802392
                                 }
                             }
                         }
                     }
                 },
                 "trainer_threads": {
-                    "total": 5.00003807246685e-07,
                     "count": 1,
-                    "self": 5.00003807246685e-07
                 },
                 "TrainerController._save_models": {
-                    "total": 0.12131229098304175,
                     "count": 1,
-                    "self": 0.0006150819826871157,
                     "children": {
                         "RLTrainer._checkpoint": {
-                            "total": 0.12069720900035463,
                             "count": 1,
-                            "self": 0.12069720900035463
                         }
                     }
                 }

 {
     "name": "root",
+    "gauges": {
+        "SoccerTwos.Policy.Entropy.mean": {
+            "value": 2.1416494846343994,
+            "min": 2.0137786865234375,
+            "max": 2.151839017868042,
+            "count": 229
+        },
+        "SoccerTwos.Policy.Entropy.sum": {
+            "value": 41599.3984375,
+            "min": 27844.923828125,
+            "max": 47085.4375,
+            "count": 229
+        },
+        "SoccerTwos.Environment.EpisodeLength.mean": {
+            "value": 70.91304347826087,
+            "min": 50.824742268041234,
+            "max": 86.2280701754386,
+            "count": 229
+        },
+        "SoccerTwos.Environment.EpisodeLength.sum": {
+            "value": 19572.0,
+            "min": 11252.0,
+            "max": 21360.0,
+            "count": 229
+        },
+        "SoccerTwos.Self-play.ELO.mean": {
+            "value": 90.32114998486692,
+            "min": 67.98246219987821,
+            "max": 106.5567773055241,
+            "count": 229
+        },
+        "SoccerTwos.Self-play.ELO.sum": {
+            "value": 12464.318697911634,
+            "min": 7314.330712543377,
+            "max": 19099.755722564205,
+            "count": 229
+        },
+        "SoccerTwos.Step.mean": {
+            "value": 30899950.0,
+            "min": 28619966.0,
+            "max": 30899950.0,
+            "count": 229
+        },
+        "SoccerTwos.Step.sum": {
+            "value": 30899950.0,
+            "min": 28619966.0,
+            "max": 30899950.0,
+            "count": 229
+        },
+        "SoccerTwos.Policy.ExtrinsicBaselineEstimate.mean": {
+            "value": -0.04198051616549492,
+            "min": -0.12825024127960205,
+            "max": 0.05813853442668915,
+            "count": 229
+        },
+        "SoccerTwos.Policy.ExtrinsicBaselineEstimate.sum": {
+            "value": -5.79331111907959,
+            "min": -16.676513671875,
+            "max": 8.662641525268555,
+            "count": 229
+        },
+        "SoccerTwos.Policy.ExtrinsicValueEstimate.mean": {
+            "value": -0.04343034699559212,
+            "min": -0.12868726253509521,
+            "max": 0.057454075664281845,
+            "count": 229
+        },
+        "SoccerTwos.Policy.ExtrinsicValueEstimate.sum": {
+            "value": -5.993387699127197,
+            "min": -16.638057708740234,
+            "max": 8.560657501220703,
+            "count": 229
+        },
+        "SoccerTwos.Policy.CuriosityBaselineEstimate.mean": {
+            "value": 0.0024543115869164467,
+            "min": 0.00020709412638098001,
+            "max": 0.24234014749526978,
+            "count": 229
+        },
+        "SoccerTwos.Policy.CuriosityBaselineEstimate.sum": {
+            "value": 0.3386949896812439,
+            "min": 0.03044283762574196,
+            "max": 44.54613494873047,
+            "count": 229
+        },
+        "SoccerTwos.Policy.CuriosityValueEstimate.mean": {
+            "value": 0.002094687195494771,
+            "min": 0.0002014237834373489,
+            "max": 0.2422645092010498,
+            "count": 229
+        },
+        "SoccerTwos.Policy.CuriosityValueEstimate.sum": {
+            "value": 0.2890668213367462,
+            "min": 0.031623534858226776,
+            "max": 44.569114685058594,
+            "count": 229
+        },
+        "SoccerTwos.Policy.RndBaselineEstimate.mean": {
+            "value": 0.00014870119048282504,
+            "min": -0.00018489075591787696,
+            "max": 0.00017628517525736243,
+            "count": 229
+        },
+        "SoccerTwos.Policy.RndBaselineEstimate.sum": {
+            "value": 0.020520763471722603,
+            "min": -0.029478061944246292,
+            "max": 0.029439624398946762,
+            "count": 229
+        },
+        "SoccerTwos.Policy.RndValueEstimate.mean": {
+            "value": 0.00015831700875423849,
+            "min": -0.00018485976033844054,
+            "max": 0.0001771982351783663,
+            "count": 229
+        },
+        "SoccerTwos.Policy.RndValueEstimate.sum": {
+            "value": 0.021847747266292572,
+            "min": -0.029127497225999832,
+            "max": 0.029592106118798256,
+            "count": 229
+        },
+        "SoccerTwos.Environment.CumulativeReward.mean": {
+            "value": 0.0,
+            "min": 0.0,
+            "max": 0.0,
+            "count": 229
+        },
+        "SoccerTwos.Environment.CumulativeReward.sum": {
+            "value": 0.0,
+            "min": 0.0,
+            "max": 0.0,
+            "count": 229
+        },
+        "SoccerTwos.Policy.ExtrinsicReward.mean": {
+            "value": -0.04998840801957725,
+            "min": -0.4002886958744215,
+            "max": 0.2771585784720246,
+            "count": 229
+        },
+        "SoccerTwos.Policy.ExtrinsicReward.sum": {
+            "value": -6.89840030670166,
+            "min": -50.038799941539764,
+            "max": 46.839799761772156,
+            "count": 229
+        },
+        "SoccerTwos.Policy.CuriosityReward.mean": {
+            "value": 3.3735505580296747e-06,
+            "min": 0.0,
+            "max": 5.779475230838216e-06,
+            "count": 229
+        },
+        "SoccerTwos.Policy.CuriosityReward.sum": {
+            "value": 0.0004655499770080951,
+            "min": 0.0,
+            "max": 0.0008388239721170976,
+            "count": 229
+        },
+        "SoccerTwos.Policy.RndReward.mean": {
+            "value": 1.553490576139646e-06,
+            "min": 1.0619012450802476e-06,
+            "max": 1.9177394476529395e-06,
+            "count": 229
+        },
+        "SoccerTwos.Policy.RndReward.sum": {
+            "value": 0.00021438169950727115,
+            "min": 0.00013151309185133186,
+            "max": 0.00022558096927838278,
+            "count": 229
+        },
+        "SoccerTwos.Environment.GroupCumulativeReward.mean": {
+            "value": -0.04998840801957725,
+            "min": -0.4002886958744215,
+            "max": 0.2771585784720246,
+            "count": 229
+        },
+        "SoccerTwos.Environment.GroupCumulativeReward.sum": {
+            "value": -6.89840030670166,
+            "min": -50.038799941539764,
+            "max": 46.839799761772156,
+            "count": 229
+        },
+        "SoccerTwos.IsTraining.mean": {
+            "value": 1.0,
+            "min": 1.0,
+            "max": 1.0,
+            "count": 229
+        },
+        "SoccerTwos.IsTraining.sum": {
+            "value": 1.0,
+            "min": 1.0,
+            "max": 1.0,
+            "count": 229
+        },
+        "SoccerTwos.Losses.PolicyLoss.mean": {
+            "value": 0.011783653045616424,
+            "min": 0.0072254263698899495,
+            "max": 0.0510992972801129,
+            "count": 15
+        },
+        "SoccerTwos.Losses.PolicyLoss.sum": {
+            "value": 0.011783653045616424,
+            "min": 0.0072254263698899495,
+            "max": 0.0510992972801129,
+            "count": 15
+        },
+        "SoccerTwos.Losses.ValueLoss.mean": {
+            "value": 0.02236808432886998,
+            "min": 0.02193430345505476,
+            "max": 0.025202005325506132,
+            "count": 15
+        },
+        "SoccerTwos.Losses.ValueLoss.sum": {
+            "value": 0.02236808432886998,
+            "min": 0.02193430345505476,
+            "max": 0.025202005325506132,
+            "count": 15
+        },
+        "SoccerTwos.Losses.BaselineLoss.mean": {
+            "value": 0.02246675391991933,
+            "min": 0.02218010788783431,
+            "max": 0.025417460439105827,
+            "count": 15
+        },
+        "SoccerTwos.Losses.BaselineLoss.sum": {
+            "value": 0.02246675391991933,
+            "min": 0.02218010788783431,
+            "max": 0.025417460439105827,
+            "count": 15
+        },
+        "SoccerTwos.Policy.LearningRate.mean": {
+            "value": 0.0003,
+            "min": 0.0003,
+            "max": 0.0003,
+            "count": 15
+        },
+        "SoccerTwos.Policy.LearningRate.sum": {
+            "value": 0.0003,
+            "min": 0.0003,
+            "max": 0.0003,
+            "count": 15
+        },
+        "SoccerTwos.Policy.Epsilon.mean": {
+            "value": 0.20000000000000004,
+            "min": 0.20000000000000004,
+            "max": 0.20000000000000004,
+            "count": 15
+        },
+        "SoccerTwos.Policy.Epsilon.sum": {
+            "value": 0.20000000000000004,
+            "min": 0.20000000000000004,
+            "max": 0.20000000000000004,
+            "count": 15
+        },
+        "SoccerTwos.Policy.Beta.mean": {
+            "value": 0.006152085766,
+            "min": 0.006152085766,
+            "max": 0.00640850284225,
+            "count": 15
+        },
+        "SoccerTwos.Policy.Beta.sum": {
+            "value": 0.006152085766,
+            "min": 0.006152085766,
+            "max": 0.00640850284225,
+            "count": 15
+        },
+        "SoccerTwos.Losses.CuriosityForwardLoss.mean": {
+            "value": 0.044924141528705754,
+            "min": 0.044924141528705754,
+            "max": 0.12874181816975275,
+            "count": 15
+        },
+        "SoccerTwos.Losses.CuriosityForwardLoss.sum": {
+            "value": 0.044924141528705754,
+            "min": 0.044924141528705754,
+            "max": 0.12874181816975275,
+            "count": 15
+        },
+        "SoccerTwos.Losses.CuriosityInverseLoss.mean": {
+            "value": 1.5999893347422283,
+            "min": 1.5462068021297455,
+            "max": 1.7163931628068287,
+            "count": 15
+        },
+        "SoccerTwos.Losses.CuriosityInverseLoss.sum": {
+            "value": 1.5999893347422283,
+            "min": 1.5462068021297455,
+            "max": 1.7163931628068287,
+            "count": 15
+        },
+        "SoccerTwos.Losses.RNDLoss.mean": {
+            "value": 0.018670696765184402,
+            "min": 0.018668334931135178,
+            "max": 0.02088502235710621,
+            "count": 15
+        },
+        "SoccerTwos.Losses.RNDLoss.sum": {
+            "value": 0.018670696765184402,
+            "min": 0.018668334931135178,
+            "max": 0.02088502235710621,
+            "count": 15
+        }
+    },
     "metadata": {
         "timer_format_version": "0.1.0",
+        "start_time_seconds": "1725639262",
         "python_version": "3.10.12 (main, Aug 23 2024, 16:29:11) [Clang 15.0.0 (clang-1500.3.9.4)]",
         "command_line_arguments": "/Users/brettgohre/Desktop/huggingface/ml-agents/games/bin/mlagents-learn ./config/poca/sept/three.yaml --env=./SoccerTwos/SoccerTwos.app --run-id=sept-run-01 --resume --no-graphics",
         "mlagents_version": "1.1.0.dev0",
         "communication_protocol_version": "1.5.0",
         "pytorch_version": "2.4.0",
         "numpy_version": "1.23.5",
+        "end_time_seconds": "1725648389"
     },
+    "total": 9127.100674749992,
     "count": 1,
+    "self": 0.15175625000847504,
     "children": {
         "run_training.setup": {
+            "total": 0.017048291978426278,
             "count": 1,
+            "self": 0.017048291978426278
         },
         "TrainerController.start_learning": {
+            "total": 9126.931870208005,
             "count": 1,
+            "self": 1.415727891610004,
             "children": {
                 "TrainerController._reset_env": {
+                    "total": 3.5643327069701627,
+                    "count": 7,
+                    "self": 3.5643327069701627
                 },
                 "TrainerController.advance": {
+                    "total": 9121.758065358445,
+                    "count": 158196,
+                    "self": 1.3677141138759907,
                     "children": {
                         "env_step": {
+                            "total": 6411.4115795473335,
+                            "count": 158196,
+                            "self": 6185.67660572668,
                             "children": {
                                 "SubprocessEnvManager._take_step": {
+                                    "total": 224.9005823341431,
+                                    "count": 158196,
+                                    "self": 8.746982502460014,
                                     "children": {
                                         "TorchPolicy.evaluate": {
+                                            "total": 216.1535998316831,
+                                            "count": 287128,
+                                            "self": 216.1535998316831
                                         }
                                     }
                                 },
                                 "workers": {
+                                    "total": 0.8343914865108673,
+                                    "count": 158195,
                                     "self": 0.0,
                                     "children": {
                                         "worker_root": {
+                                            "total": 9121.446049298218,
+                                            "count": 158195,
                                             "is_parallel": true,
+                                            "self": 3101.727182136703,
                                             "children": {
                                                 "steps_from_proto": {
+                                                    "total": 0.009650043997680768,
+                                                    "count": 14,
                                                     "is_parallel": true,
+                                                    "self": 0.0012721649545710534,
                                                     "children": {
                                                         "_process_rank_one_or_two_observation": {
+                                                            "total": 0.008377879043109715,
+                                                            "count": 56,
                                                             "is_parallel": true,
+                                                            "self": 0.008377879043109715
                                                         }
                                                     }
                                                 },
                                                 "UnityEnvironment.step": {
+                                                    "total": 6019.709217117517,
+                                                    "count": 158195,
                                                     "is_parallel": true,
+                                                    "self": 15.64049137730035,
                                                     "children": {
                                                         "UnityEnvironment._generate_step_input": {
+                                                            "total": 118.73067298045498,
+                                                            "count": 158195,
                                                             "is_parallel": true,
+                                                            "self": 118.73067298045498
                                                         },
                                                         "communicator.exchange": {
+                                                            "total": 5690.6334428538685,
+                                                            "count": 158195,
                                                             "is_parallel": true,
+                                                            "self": 5690.6334428538685
                                                         },
                                                         "steps_from_proto": {
+                                                            "total": 194.70460990589345,
+                                                            "count": 316390,
                                                             "is_parallel": true,
+                                                            "self": 23.100591495400295,
                                                             "children": {
                                                                 "_process_rank_one_or_two_observation": {
+                                                                    "total": 171.60401841049315,
+                                                                    "count": 1265560,
                                                                     "is_parallel": true,
+                                                                    "self": 171.60401841049315
                                                                 }
                                                             }
                                                         }
                             }
                         },
                         "trainer_advance": {
+                            "total": 2708.978771697235,
+                            "count": 158195,
+                            "self": 11.918968971876893,
                             "children": {
                                 "process_trajectory": {
+                                    "total": 517.3845484333578,
+                                    "count": 158195,
+                                    "self": 516.6691328503366,
+                                    "children": {
+                                        "RLTrainer._checkpoint": {
+                                            "total": 0.7154155830212403,
+                                            "count": 4,
+                                            "self": 0.7154155830212403
+                                        }
+                                    }
+                                },
+                                "_update_policy": {
+                                    "total": 2179.6752542920003,
+                                    "count": 15,
+                                    "self": 212.8977203327231,
+                                    "children": {
+                                        "TorchPOCAOptimizer.update": {
+                                            "total": 1966.7775339592772,
+                                            "count": 180,
+                                            "self": 1966.7775339592772
+                                        }
+                                    }
                                 }
                             }
                         }
                     }
                 },
                 "trainer_threads": {
+                    "total": 4.5899651013314724e-07,
                     "count": 1,
+                    "self": 4.5899651013314724e-07
                 },
                 "TrainerController._save_models": {
+                    "total": 0.19374379198416136,
                     "count": 1,
+                    "self": 0.0005647509824484587,
                     "children": {
                         "RLTrainer._checkpoint": {
+                            "total": 0.1931790410017129,
                             "count": 1,
+                            "self": 0.1931790410017129
                         }
                     }
                 }

run_logs/training_status.json CHANGED Viewed

@@ -1,24 +1,24 @@
 {
     "SoccerTwos": {
-        "elo": 78.23583539049073,
         "checkpoints": [
             {
-                "steps": 28614312,
-                "file_path": "results/sept-run-01/SoccerTwos/SoccerTwos-28614312.onnx",
                 "reward": 0.0,
-                "creation_time": 1725639244.512409,
                 "auxillary_file_paths": [
-                    "results/sept-run-01/SoccerTwos/SoccerTwos-28614312.pt"
                 ]
             }
         ],
         "final_checkpoint": {
-            "steps": 28614312,
             "file_path": "results/sept-run-01/SoccerTwos.onnx",
             "reward": 0.0,
-            "creation_time": 1725639244.512409,
             "auxillary_file_paths": [
-                "results/sept-run-01/SoccerTwos/SoccerTwos-28614312.pt"
             ]
         }
     },

 {
     "SoccerTwos": {
+        "elo": 90.32114998486692,
         "checkpoints": [
             {
+                "steps": 30907162,
+                "file_path": "results/sept-run-01/SoccerTwos/SoccerTwos-30907162.onnx",
                 "reward": 0.0,
+                "creation_time": 1725648389.335208,
                 "auxillary_file_paths": [
+                    "results/sept-run-01/SoccerTwos/SoccerTwos-30907162.pt"
                 ]
             }
         ],
         "final_checkpoint": {
+            "steps": 30907162,
             "file_path": "results/sept-run-01/SoccerTwos.onnx",
             "reward": 0.0,
+            "creation_time": 1725648389.335208,
             "auxillary_file_paths": [
+                "results/sept-run-01/SoccerTwos/SoccerTwos-30907162.pt"
             ]
         }
     },